outside.go 12 KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241242243244245246247248249250251252253254255256257258259260261262263264265266267268269270271272273274275276277278279280281282283284285286287288289290291292293294295296297298299300301302303304305306307308309310311312313314315316317318319320321322323324325326327328329330331332333334335336337338339340341342343344345346347348349350351352353354355356357358359360361362363364365366367368369370371372373374375376377378379380381382383384385386387388389390391392393394395396397398399400401402403404405406407408409410
  1. package nebula
  2. import (
  3. "encoding/binary"
  4. "github.com/flynn/noise"
  5. "github.com/golang/protobuf/proto"
  6. "github.com/sirupsen/logrus"
  7. "github.com/slackhq/nebula/cert"
  8. // "github.com/google/gopacket"
  9. // "github.com/google/gopacket/layers"
  10. // "encoding/binary"
  11. "errors"
  12. "fmt"
  13. "time"
  14. "golang.org/x/net/ipv4"
  15. )
  16. const (
  17. minFwPacketLen = 4
  18. )
  19. func (f *Interface) readOutsidePackets(addr *udpAddr, out []byte, packet []byte, header *Header, fwPacket *FirewallPacket, nb []byte) {
  20. err := header.Parse(packet)
  21. if err != nil {
  22. // TODO: best if we return this and let caller log
  23. // TODO: Might be better to send the literal []byte("holepunch") packet and ignore that?
  24. // Hole punch packets are 0 or 1 byte big, so lets ignore printing those errors
  25. if len(packet) > 1 {
  26. l.WithField("packet", packet).Infof("Error while parsing inbound packet from %s: %s", addr, err)
  27. }
  28. return
  29. }
  30. //l.Error("in packet ", header, packet[HeaderLen:])
  31. // verify if we've seen this index before, otherwise respond to the handshake initiation
  32. hostinfo, err := f.hostMap.QueryIndex(header.RemoteIndex)
  33. var ci *ConnectionState
  34. if err == nil {
  35. ci = hostinfo.ConnectionState
  36. }
  37. switch header.Type {
  38. case message:
  39. if !f.handleEncrypted(ci, addr, header) {
  40. return
  41. }
  42. f.decryptToTun(hostinfo, header.MessageCounter, out, packet, fwPacket, nb)
  43. // Fallthrough to the bottom to record incoming traffic
  44. case lightHouse:
  45. if !f.handleEncrypted(ci, addr, header) {
  46. return
  47. }
  48. d, err := f.decrypt(hostinfo, header.MessageCounter, out, packet, header, nb)
  49. if err != nil {
  50. l.WithError(err).WithField("udpAddr", addr).WithField("vpnIp", IntIp(hostinfo.hostId)).
  51. WithField("packet", packet).
  52. Error("Failed to decrypt lighthouse packet")
  53. //TODO: maybe after build 64 is out? 06/14/2018 - NB
  54. //f.sendRecvError(net.Addr(addr), header.RemoteIndex)
  55. return
  56. }
  57. f.lightHouse.HandleRequest(addr, hostinfo.hostId, d, hostinfo.GetCert(), f)
  58. // Fallthrough to the bottom to record incoming traffic
  59. case test:
  60. if !f.handleEncrypted(ci, addr, header) {
  61. return
  62. }
  63. d, err := f.decrypt(hostinfo, header.MessageCounter, out, packet, header, nb)
  64. if err != nil {
  65. l.WithError(err).WithField("udpAddr", addr).WithField("vpnIp", IntIp(hostinfo.hostId)).
  66. WithField("packet", packet).
  67. Error("Failed to decrypt test packet")
  68. //TODO: maybe after build 64 is out? 06/14/2018 - NB
  69. //f.sendRecvError(net.Addr(addr), header.RemoteIndex)
  70. return
  71. }
  72. if header.Subtype == testRequest {
  73. // This testRequest might be from TryPromoteBest, so we should roam
  74. // to the new IP address before responding
  75. f.handleHostRoaming(hostinfo, addr)
  76. f.send(test, testReply, ci, hostinfo, hostinfo.remote, d, nb, out)
  77. }
  78. // Fallthrough to the bottom to record incoming traffic
  79. // Non encrypted messages below here, they should not fall through to avoid tracking incoming traffic since they
  80. // are unauthenticated
  81. case handshake:
  82. HandleIncomingHandshake(f, addr, packet, header, hostinfo)
  83. return
  84. case recvError:
  85. // TODO: Remove this with recv_error deprecation
  86. f.handleRecvError(addr, header)
  87. return
  88. case closeTunnel:
  89. if !f.handleEncrypted(ci, addr, header) {
  90. return
  91. }
  92. l.WithField("vpnIp", IntIp(hostinfo.hostId)).WithField("udpAddr", addr).
  93. Info("Close tunnel received, tearing down.")
  94. f.closeTunnel(hostinfo)
  95. return
  96. default:
  97. l.Debugf("Unexpected packet received from %s", addr)
  98. return
  99. }
  100. f.handleHostRoaming(hostinfo, addr)
  101. f.connectionManager.In(hostinfo.hostId)
  102. }
  103. func (f *Interface) closeTunnel(hostInfo *HostInfo) {
  104. //TODO: this would be better as a single function in ConnectionManager that handled locks appropriately
  105. f.connectionManager.ClearIP(hostInfo.hostId)
  106. f.connectionManager.ClearPendingDeletion(hostInfo.hostId)
  107. f.lightHouse.DeleteVpnIP(hostInfo.hostId)
  108. f.hostMap.DeleteVpnIP(hostInfo.hostId)
  109. f.hostMap.DeleteIndex(hostInfo.localIndexId)
  110. }
  111. func (f *Interface) handleHostRoaming(hostinfo *HostInfo, addr *udpAddr) {
  112. if hostDidRoam(hostinfo.remote, addr) {
  113. if !hostinfo.lastRoam.IsZero() && addr.Equals(hostinfo.lastRoamRemote) && time.Since(hostinfo.lastRoam) < RoamingSupressSeconds*time.Second {
  114. if l.Level >= logrus.DebugLevel {
  115. l.WithField("vpnIp", IntIp(hostinfo.hostId)).WithField("udpAddr", hostinfo.remote).WithField("newAddr", addr).
  116. Debugf("Supressing roam back to previous remote for %d seconds", RoamingSupressSeconds)
  117. }
  118. return
  119. }
  120. l.WithField("vpnIp", IntIp(hostinfo.hostId)).WithField("udpAddr", hostinfo.remote).WithField("newAddr", addr).
  121. Info("Host roamed to new udp ip/port.")
  122. hostinfo.lastRoam = time.Now()
  123. remoteCopy := *hostinfo.remote
  124. hostinfo.lastRoamRemote = &remoteCopy
  125. hostinfo.SetRemote(*addr)
  126. if f.lightHouse.amLighthouse {
  127. f.lightHouse.AddRemote(hostinfo.hostId, addr, false)
  128. }
  129. }
  130. }
  131. func (f *Interface) handleEncrypted(ci *ConnectionState, addr *udpAddr, header *Header) bool {
  132. // If connectionstate exists and the replay protector allows, process packet
  133. // Else, send recv errors for 300 seconds after a restart to allow fast reconnection.
  134. if ci == nil || !ci.window.Check(header.MessageCounter) {
  135. f.sendRecvError(addr, header.RemoteIndex)
  136. return false
  137. }
  138. return true
  139. }
  140. // newPacket validates and parses the interesting bits for the firewall out of the ip and sub protocol headers
  141. func newPacket(data []byte, incoming bool, fp *FirewallPacket) error {
  142. // Do we at least have an ipv4 header worth of data?
  143. if len(data) < ipv4.HeaderLen {
  144. return fmt.Errorf("packet is less than %v bytes", ipv4.HeaderLen)
  145. }
  146. // Is it an ipv4 packet?
  147. if int((data[0]>>4)&0x0f) != 4 {
  148. return fmt.Errorf("packet is not ipv4, type: %v", int((data[0]>>4)&0x0f))
  149. }
  150. // Adjust our start position based on the advertised ip header length
  151. ihl := int(data[0]&0x0f) << 2
  152. // Well formed ip header length?
  153. if ihl < ipv4.HeaderLen {
  154. return fmt.Errorf("packet had an invalid header length: %v", ihl)
  155. }
  156. // Check if this is the second or further fragment of a fragmented packet.
  157. flagsfrags := binary.BigEndian.Uint16(data[6:8])
  158. fp.Fragment = (flagsfrags & 0x1FFF) != 0
  159. // Firewall handles protocol checks
  160. fp.Protocol = data[9]
  161. // Accounting for a variable header length, do we have enough data for our src/dst tuples?
  162. minLen := ihl
  163. if !fp.Fragment && fp.Protocol != fwProtoICMP {
  164. minLen += minFwPacketLen
  165. }
  166. if len(data) < minLen {
  167. return fmt.Errorf("packet is less than %v bytes, ip header len: %v", minLen, ihl)
  168. }
  169. // Firewall packets are locally oriented
  170. if incoming {
  171. fp.RemoteIP = binary.BigEndian.Uint32(data[12:16])
  172. fp.LocalIP = binary.BigEndian.Uint32(data[16:20])
  173. if fp.Fragment || fp.Protocol == fwProtoICMP {
  174. fp.RemotePort = 0
  175. fp.LocalPort = 0
  176. } else {
  177. fp.RemotePort = binary.BigEndian.Uint16(data[ihl : ihl+2])
  178. fp.LocalPort = binary.BigEndian.Uint16(data[ihl+2 : ihl+4])
  179. }
  180. } else {
  181. fp.LocalIP = binary.BigEndian.Uint32(data[12:16])
  182. fp.RemoteIP = binary.BigEndian.Uint32(data[16:20])
  183. if fp.Fragment || fp.Protocol == fwProtoICMP {
  184. fp.RemotePort = 0
  185. fp.LocalPort = 0
  186. } else {
  187. fp.LocalPort = binary.BigEndian.Uint16(data[ihl : ihl+2])
  188. fp.RemotePort = binary.BigEndian.Uint16(data[ihl+2 : ihl+4])
  189. }
  190. }
  191. return nil
  192. }
  193. func (f *Interface) decrypt(hostinfo *HostInfo, mc uint64, out []byte, packet []byte, header *Header, nb []byte) ([]byte, error) {
  194. var err error
  195. out, err = hostinfo.ConnectionState.dKey.DecryptDanger(out, packet[:HeaderLen], packet[HeaderLen:], mc, nb)
  196. if err != nil {
  197. return nil, err
  198. }
  199. if !hostinfo.ConnectionState.window.Update(mc) {
  200. l.WithField("vpnIp", IntIp(hostinfo.hostId)).WithField("header", header).
  201. Debugln("dropping out of window packet")
  202. return nil, errors.New("out of window packet")
  203. }
  204. return out, nil
  205. }
  206. func (f *Interface) decryptToTun(hostinfo *HostInfo, messageCounter uint64, out []byte, packet []byte, fwPacket *FirewallPacket, nb []byte) {
  207. var err error
  208. // TODO: This breaks subnet routing and needs to also check range of ip subnet
  209. /*
  210. if len(res) > 16 && binary.BigEndian.Uint32(res[12:16]) != ip2int(ci.peerCert.Details.Ips[0].IP) {
  211. l.Debugf("Host %s tried to spoof packet as %s.", ci.peerCert.Details.Ips[0].IP, IntIp(binary.BigEndian.Uint32(res[12:16])))
  212. }
  213. */
  214. out, err = hostinfo.ConnectionState.dKey.DecryptDanger(out, packet[:HeaderLen], packet[HeaderLen:], messageCounter, nb)
  215. if err != nil {
  216. l.WithError(err).WithField("vpnIp", IntIp(hostinfo.hostId)).Error("Failed to decrypt packet")
  217. //TODO: maybe after build 64 is out? 06/14/2018 - NB
  218. //f.sendRecvError(hostinfo.remote, header.RemoteIndex)
  219. return
  220. }
  221. err = newPacket(out, true, fwPacket)
  222. if err != nil {
  223. l.WithError(err).WithField("packet", out).WithField("hostInfo", IntIp(hostinfo.hostId)).
  224. Warnf("Error while validating inbound packet")
  225. return
  226. }
  227. if !hostinfo.ConnectionState.window.Update(messageCounter) {
  228. l.WithField("vpnIp", IntIp(hostinfo.hostId)).WithField("fwPacket", fwPacket).
  229. Debugln("dropping out of window packet")
  230. return
  231. }
  232. if f.firewall.Drop(out, *fwPacket, true, hostinfo.ConnectionState.peerCert, trustedCAs) {
  233. l.WithField("vpnIp", IntIp(hostinfo.hostId)).WithField("fwPacket", fwPacket).
  234. Debugln("dropping inbound packet")
  235. return
  236. }
  237. f.connectionManager.In(hostinfo.hostId)
  238. err = f.inside.WriteRaw(out)
  239. if err != nil {
  240. l.WithError(err).Error("Failed to write to tun")
  241. }
  242. }
  243. func (f *Interface) sendRecvError(endpoint *udpAddr, index uint32) {
  244. f.metricTxRecvError.Inc(1)
  245. //TODO: this should be a signed message so we can trust that we should drop the index
  246. b := HeaderEncode(make([]byte, HeaderLen), Version, uint8(recvError), 0, index, 0)
  247. f.outside.WriteTo(b, endpoint)
  248. if l.Level >= logrus.DebugLevel {
  249. l.WithField("index", index).
  250. WithField("udpAddr", endpoint).
  251. Debug("Recv error sent")
  252. }
  253. }
  254. func (f *Interface) handleRecvError(addr *udpAddr, h *Header) {
  255. f.metricRxRecvError.Inc(1)
  256. // This flag is to stop caring about recv_error from old versions
  257. // This should go away when the old version is gone from prod
  258. if l.Level >= logrus.DebugLevel {
  259. l.WithField("index", h.RemoteIndex).
  260. WithField("udpAddr", addr).
  261. Debug("Recv error received")
  262. }
  263. hostinfo, err := f.hostMap.QueryReverseIndex(h.RemoteIndex)
  264. if err != nil {
  265. l.Debugln(err, ": ", h.RemoteIndex)
  266. return
  267. }
  268. if !hostinfo.RecvErrorExceeded() {
  269. return
  270. }
  271. if hostinfo.remote != nil && hostinfo.remote.String() != addr.String() {
  272. l.Infoln("Someone spoofing recv_errors? ", addr, hostinfo.remote)
  273. return
  274. }
  275. id := hostinfo.localIndexId
  276. host := hostinfo.hostId
  277. // We delete this host from the main hostmap
  278. f.hostMap.DeleteIndex(id)
  279. f.hostMap.DeleteVpnIP(host)
  280. // We also delete it from pending to allow for
  281. // fast reconnect. We must null the connectionstate
  282. // or a counter reuse may happen
  283. hostinfo.ConnectionState = nil
  284. f.handshakeManager.DeleteIndex(id)
  285. f.handshakeManager.DeleteVpnIP(host)
  286. }
  287. /*
  288. func (f *Interface) sendMeta(ci *ConnectionState, endpoint *net.UDPAddr, meta *NebulaMeta) {
  289. if ci.eKey != nil {
  290. //TODO: log error?
  291. return
  292. }
  293. msg, err := proto.Marshal(meta)
  294. if err != nil {
  295. l.Debugln("failed to encode header")
  296. }
  297. c := ci.messageCounter
  298. b := HeaderEncode(nil, Version, uint8(metadata), 0, hostinfo.remoteIndexId, c)
  299. ci.messageCounter++
  300. msg := ci.eKey.EncryptDanger(b, nil, msg, c)
  301. //msg := ci.eKey.EncryptDanger(b, nil, []byte(fmt.Sprintf("%d", counter)), c)
  302. f.outside.WriteTo(msg, endpoint)
  303. }
  304. */
  305. func RecombineCertAndValidate(h *noise.HandshakeState, rawCertBytes []byte) (*cert.NebulaCertificate, error) {
  306. pk := h.PeerStatic()
  307. if pk == nil {
  308. return nil, errors.New("no peer static key was present")
  309. }
  310. if rawCertBytes == nil {
  311. return nil, errors.New("provided payload was empty")
  312. }
  313. r := &cert.RawNebulaCertificate{}
  314. err := proto.Unmarshal(rawCertBytes, r)
  315. if err != nil {
  316. return nil, fmt.Errorf("error unmarshaling cert: %s", err)
  317. }
  318. // If the Details are nil, just exit to avoid crashing
  319. if r.Details == nil {
  320. return nil, fmt.Errorf("certificate did not contain any details")
  321. }
  322. r.Details.PublicKey = pk
  323. recombined, err := proto.Marshal(r)
  324. if err != nil {
  325. return nil, fmt.Errorf("error while recombining certificate: %s", err)
  326. }
  327. c, _ := cert.UnmarshalNebulaCertificate(recombined)
  328. isValid, err := c.Verify(time.Now(), trustedCAs)
  329. if err != nil {
  330. return c, fmt.Errorf("certificate validation failed: %s", err)
  331. } else if !isValid {
  332. // This case should never happen but here's to defensive programming!
  333. return c, errors.New("certificate validation failed but did not return an error")
  334. }
  335. return c, nil
  336. }