eth.c 14 KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241242243244245246247248249250251252253254255256257258259260261262263264265266267268269270271272273274275276277278279280281282283284285286287288289290291292293294295296297298299300301302303304305306307308309310311312313314315316317318319320321322323324325326327328329330331332333334335336337338339340341342343344345346347348349350351352353354355356357358359360361362363364365366367368369370371372373374375376377378379380381382383384385386387388389390391392393394395396397398399400401402403404405406407408409410411412413414415416417418419420421422423424425426427428429430431432433434435436437438439440441442443444445446447448449450451452453454455456457458459460461462463464465466467468469470471472473474475476477478479480481482483484485486487488489490491492493494495496497498499500501502503504505506507508509510511512513514515516517518519520521522523524525526527528529530531532533534535536537538539540541542543544545546547548549550551552553554555556
  1. /*
  2. * INET An implementation of the TCP/IP protocol suite for the LINUX
  3. * operating system. INET is implemented using the BSD Socket
  4. * interface as the means of communication with the user level.
  5. *
  6. * Ethernet-type device handling.
  7. *
  8. * Version: @(#)eth.c 1.0.7 05/25/93
  9. *
  10. * Authors: Ross Biro
  11. * Fred N. van Kempen, <waltje@uWalt.NL.Mugnet.ORG>
  12. * Mark Evans, <evansmp@uhura.aston.ac.uk>
  13. * Florian La Roche, <rzsfl@rz.uni-sb.de>
  14. * Alan Cox, <gw4pts@gw4pts.ampr.org>
  15. *
  16. * Fixes:
  17. * Mr Linux : Arp problems
  18. * Alan Cox : Generic queue tidyup (very tiny here)
  19. * Alan Cox : eth_header ntohs should be htons
  20. * Alan Cox : eth_rebuild_header missing an htons and
  21. * minor other things.
  22. * Tegge : Arp bug fixes.
  23. * Florian : Removed many unnecessary functions, code cleanup
  24. * and changes for new arp and skbuff.
  25. * Alan Cox : Redid header building to reflect new format.
  26. * Alan Cox : ARP only when compiled with CONFIG_INET
  27. * Greg Page : 802.2 and SNAP stuff.
  28. * Alan Cox : MAC layer pointers/new format.
  29. * Paul Gortmaker : eth_copy_and_sum shouldn't csum padding.
  30. * Alan Cox : Protect against forwarding explosions with
  31. * older network drivers and IFF_ALLMULTI.
  32. * Christer Weinigel : Better rebuild header message.
  33. * Andrew Morton : 26Feb01: kill ether_setup() - use netdev_boot_setup().
  34. *
  35. * This program is free software; you can redistribute it and/or
  36. * modify it under the terms of the GNU General Public License
  37. * as published by the Free Software Foundation; either version
  38. * 2 of the License, or (at your option) any later version.
  39. */
  40. #include <linux/module.h>
  41. #include <linux/types.h>
  42. #include <linux/kernel.h>
  43. #include <linux/string.h>
  44. #include <linux/mm.h>
  45. #include <linux/socket.h>
  46. #include <linux/in.h>
  47. #include <linux/inet.h>
  48. #include <linux/ip.h>
  49. #include <linux/netdevice.h>
  50. #include <linux/etherdevice.h>
  51. #include <linux/skbuff.h>
  52. #include <linux/errno.h>
  53. #include <linux/init.h>
  54. #include <linux/if_ether.h>
  55. #include <linux/of_net.h>
  56. #include <linux/pci.h>
  57. #include <net/dst.h>
  58. #include <net/arp.h>
  59. #include <net/sock.h>
  60. #include <net/ipv6.h>
  61. #include <net/ip.h>
  62. #include <net/dsa.h>
  63. #include <net/flow_dissector.h>
  64. #include <linux/uaccess.h>
  65. #include <net/pkt_sched.h>
  /* Hook the "ether=" boot option up to netdev_boot_setup(). */
  66. __setup("ether=", netdev_boot_setup);
  67. /**
  68. * eth_header - create the Ethernet header
  69. * @skb: buffer to alter
  70. * @dev: source device
  71. * @type: Ethernet type field
  72. * @daddr: destination address (NULL leave destination address)
  73. * @saddr: source address (NULL use device source address)
  74. * @len: packet length (<= skb->len)
  75. *
  76. *
  77. * Set the protocol type. For a packet of type ETH_P_802_3/2 we put the length
  78. * in here instead.
  79. */
  80. int eth_header(struct sk_buff *skb, struct net_device *dev,
  81. unsigned short type,
  82. const void *daddr, const void *saddr, unsigned int len)
  83. {
  84. struct ethhdr *eth = skb_push(skb, ETH_HLEN);
  85. if (type != ETH_P_802_3 && type != ETH_P_802_2)
  86. eth->h_proto = htons(type);
  87. else
  88. eth->h_proto = htons(len);
  89. /*
  90. * Set the source hardware address.
  91. */
  92. if (!saddr)
  93. saddr = dev->dev_addr;
  94. memcpy(eth->h_source, saddr, ETH_ALEN);
  95. if (daddr) {
  96. memcpy(eth->h_dest, daddr, ETH_ALEN);
  97. return ETH_HLEN;
  98. }
  99. /*
  100. * Anyway, the loopback-device should never use this function...
  101. */
  102. if (dev->flags & (IFF_LOOPBACK | IFF_NOARP)) {
  103. eth_zero_addr(eth->h_dest);
  104. return ETH_HLEN;
  105. }
  106. return -ETH_HLEN;
  107. }
  108. EXPORT_SYMBOL(eth_header);
  109. /**
  110. * eth_get_headlen - determine the length of header for an ethernet frame
  111. * @data: pointer to start of frame
  112. * @len: total length of frame
  113. *
  114. * Make a best effort attempt to pull the length for all of the headers for
  115. * a given frame in a linear buffer.
  116. */
  117. u32 eth_get_headlen(void *data, unsigned int len)
  118. {
  119. const unsigned int flags = FLOW_DISSECTOR_F_PARSE_1ST_FRAG;
  120. const struct ethhdr *eth = (const struct ethhdr *)data;
  121. struct flow_keys_basic keys;
  122. /* this should never happen, but better safe than sorry */
  123. if (unlikely(len < sizeof(*eth)))
  124. return len;
  125. /* parse any remaining L2/L3 headers, check for L4 */
  126. if (!skb_flow_dissect_flow_keys_basic(NULL, &keys, data, eth->h_proto,
  127. sizeof(*eth), len, flags))
  128. return max_t(u32, keys.control.thoff, sizeof(*eth));
  129. /* parse for any L4 headers */
  130. return min_t(u32, __skb_get_poff(NULL, data, &keys, len), len);
  131. }
  132. EXPORT_SYMBOL(eth_get_headlen);
  133. /**
  134. * eth_type_trans - determine the packet's protocol ID.
  135. * @skb: received socket data
  136. * @dev: receiving network device
  137. *
  138. * The rule here is that we
  139. * assume 802.3 if the type field is short enough to be a length.
  140. * This is normal practice and works for any 'now in use' protocol.
  141. */
  142. __be16 eth_type_trans(struct sk_buff *skb, struct net_device *dev)
  143. {
  144. unsigned short _service_access_point;
  145. const unsigned short *sap;
  146. const struct ethhdr *eth;
  147. skb->dev = dev;
  148. skb_reset_mac_header(skb);
  149. eth = (struct ethhdr *)skb->data;
  150. skb_pull_inline(skb, ETH_HLEN);
  151. if (unlikely(is_multicast_ether_addr_64bits(eth->h_dest))) {
  152. if (ether_addr_equal_64bits(eth->h_dest, dev->broadcast))
  153. skb->pkt_type = PACKET_BROADCAST;
  154. else
  155. skb->pkt_type = PACKET_MULTICAST;
  156. }
  157. else if (unlikely(!ether_addr_equal_64bits(eth->h_dest,
  158. dev->dev_addr)))
  159. skb->pkt_type = PACKET_OTHERHOST;
  160. /*
  161. * Some variants of DSA tagging don't have an ethertype field
  162. * at all, so we check here whether one of those tagging
  163. * variants has been configured on the receiving interface,
  164. * and if so, set skb->protocol without looking at the packet.
  165. */
  166. if (unlikely(netdev_uses_dsa(dev)))
  167. return htons(ETH_P_XDSA);
  168. if (likely(eth_proto_is_802_3(eth->h_proto)))
  169. return eth->h_proto;
  170. /*
  171. * This is a magic hack to spot IPX packets. Older Novell breaks
  172. * the protocol design and runs IPX over 802.3 without an 802.2 LLC
  173. * layer. We look for FFFF which isn't a used 802.2 SSAP/DSAP. This
  174. * won't work for fault tolerant netware but does for the rest.
  175. */
  176. sap = skb_header_pointer(skb, 0, sizeof(*sap), &_service_access_point);
  177. if (sap && *sap == 0xFFFF)
  178. return htons(ETH_P_802_3);
  179. /*
  180. * Real 802.2 LLC
  181. */
  182. return htons(ETH_P_802_2);
  183. }
  184. EXPORT_SYMBOL(eth_type_trans);
  185. /**
  186. * eth_header_parse - extract hardware address from packet
  187. * @skb: packet to extract header from
  188. * @haddr: destination buffer
  189. */
  190. int eth_header_parse(const struct sk_buff *skb, unsigned char *haddr)
  191. {
  192. const struct ethhdr *eth = eth_hdr(skb);
  193. memcpy(haddr, eth->h_source, ETH_ALEN);
  194. return ETH_ALEN;
  195. }
  196. EXPORT_SYMBOL(eth_header_parse);
  197. /**
  198. * eth_header_cache - fill cache entry from neighbour
  199. * @neigh: source neighbour
  200. * @hh: destination cache entry
  201. * @type: Ethernet type field
  202. *
  203. * Create an Ethernet header template from the neighbour.
  204. */
  205. int eth_header_cache(const struct neighbour *neigh, struct hh_cache *hh, __be16 type)
  206. {
  207. struct ethhdr *eth;
  208. const struct net_device *dev = neigh->dev;
  209. eth = (struct ethhdr *)
  210. (((u8 *) hh->hh_data) + (HH_DATA_OFF(sizeof(*eth))));
  211. if (type == htons(ETH_P_802_3))
  212. return -1;
  213. eth->h_proto = type;
  214. memcpy(eth->h_source, dev->dev_addr, ETH_ALEN);
  215. memcpy(eth->h_dest, neigh->ha, ETH_ALEN);
  216. /* Pairs with READ_ONCE() in neigh_resolve_output(),
  217. * neigh_hh_output() and neigh_update_hhs().
  218. */
  219. smp_store_release(&hh->hh_len, ETH_HLEN);
  220. return 0;
  221. }
  222. EXPORT_SYMBOL(eth_header_cache);
  223. /**
  224. * eth_header_cache_update - update cache entry
  225. * @hh: destination cache entry
  226. * @dev: network device
  227. * @haddr: new hardware address
  228. *
  229. * Called by Address Resolution module to notify changes in address.
  230. */
  231. void eth_header_cache_update(struct hh_cache *hh,
  232. const struct net_device *dev,
  233. const unsigned char *haddr)
  234. {
  235. memcpy(((u8 *) hh->hh_data) + HH_DATA_OFF(sizeof(struct ethhdr)),
  236. haddr, ETH_ALEN);
  237. }
  238. EXPORT_SYMBOL(eth_header_cache_update);
  239. /**
  240. * eth_prepare_mac_addr_change - prepare for mac change
  241. * @dev: network device
  242. * @p: socket address
  243. */
  244. int eth_prepare_mac_addr_change(struct net_device *dev, void *p)
  245. {
  246. struct sockaddr *addr = p;
  247. if (!(dev->priv_flags & IFF_LIVE_ADDR_CHANGE) && netif_running(dev))
  248. return -EBUSY;
  249. if (!is_valid_ether_addr(addr->sa_data))
  250. return -EADDRNOTAVAIL;
  251. return 0;
  252. }
  253. EXPORT_SYMBOL(eth_prepare_mac_addr_change);
  254. /**
  255. * eth_commit_mac_addr_change - commit mac change
  256. * @dev: network device
  257. * @p: socket address
  258. */
  259. void eth_commit_mac_addr_change(struct net_device *dev, void *p)
  260. {
  261. struct sockaddr *addr = p;
  262. memcpy(dev->dev_addr, addr->sa_data, ETH_ALEN);
  263. }
  264. EXPORT_SYMBOL(eth_commit_mac_addr_change);
  /**
   * eth_mac_addr - set a new Ethernet hardware address
   * @dev: network device
   * @p: socket address
   *
   * Validates the request with eth_prepare_mac_addr_change() and, if that
   * succeeds, stores the address with eth_commit_mac_addr_change().
   *
   * This does not change hardware matching, so most real devices need to
   * override it.
   *
   * Return: 0 on success, or the negative error from the prepare step.
   */
  int eth_mac_addr(struct net_device *dev, void *p)
  {
      const int err = eth_prepare_mac_addr_change(dev, p);

      if (err >= 0) {
          eth_commit_mac_addr_change(dev, p);
          return 0;
      }

      return err;
  }
  EXPORT_SYMBOL(eth_mac_addr);
  285. /**
  286. * eth_change_mtu - set new MTU size
  287. * @dev: network device
  288. * @new_mtu: new Maximum Transfer Unit
  289. *
  290. * Allow changing MTU size. Needs to be overridden for devices
  291. * supporting jumbo frames.
  292. */
  293. int eth_change_mtu(struct net_device *dev, int new_mtu)
  294. {
  295. netdev_warn(dev, "%s is deprecated\n", __func__);
  296. dev->mtu = new_mtu;
  297. return 0;
  298. }
  299. EXPORT_SYMBOL(eth_change_mtu);
  300. int eth_validate_addr(struct net_device *dev)
  301. {
  302. if (!is_valid_ether_addr(dev->dev_addr))
  303. return -EADDRNOTAVAIL;
  304. return 0;
  305. }
  306. EXPORT_SYMBOL(eth_validate_addr);
  307. const struct header_ops eth_header_ops ____cacheline_aligned = {
  308. .create = eth_header,
  309. .parse = eth_header_parse,
  310. .cache = eth_header_cache,
  311. .cache_update = eth_header_cache_update,
  312. };
  313. /**
  314. * ether_setup - setup Ethernet network device
  315. * @dev: network device
  316. *
  317. * Fill in the fields of the device structure with Ethernet-generic values.
  318. */
  319. void ether_setup(struct net_device *dev)
  320. {
  321. dev->header_ops = &eth_header_ops;
  322. dev->type = ARPHRD_ETHER;
  323. dev->hard_header_len = ETH_HLEN;
  324. dev->min_header_len = ETH_HLEN;
  325. dev->mtu = ETH_DATA_LEN;
  326. dev->min_mtu = ETH_MIN_MTU;
  327. dev->max_mtu = ETH_DATA_LEN;
  328. dev->addr_len = ETH_ALEN;
  329. dev->tx_queue_len = DEFAULT_TX_QUEUE_LEN;
  330. dev->flags = IFF_BROADCAST|IFF_MULTICAST;
  331. dev->priv_flags |= IFF_TX_SKB_SHARING;
  332. eth_broadcast_addr(dev->broadcast);
  333. }
  334. EXPORT_SYMBOL(ether_setup);
  335. /**
  336. * alloc_etherdev_mqs - Allocates and sets up an Ethernet device
  337. * @sizeof_priv: Size of additional driver-private structure to be allocated
  338. * for this Ethernet device
  339. * @txqs: The number of TX queues this device has.
  340. * @rxqs: The number of RX queues this device has.
  341. *
  342. * Fill in the fields of the device structure with Ethernet-generic
  343. * values. Basically does everything except registering the device.
  344. *
  345. * Constructs a new net device, complete with a private data area of
  346. * size (sizeof_priv). A 32-byte (not bit) alignment is enforced for
  347. * this private data area.
  348. */
  349. struct net_device *alloc_etherdev_mqs(int sizeof_priv, unsigned int txqs,
  350. unsigned int rxqs)
  351. {
  352. return alloc_netdev_mqs(sizeof_priv, "eth%d", NET_NAME_UNKNOWN,
  353. ether_setup, txqs, rxqs);
  354. }
  355. EXPORT_SYMBOL(alloc_etherdev_mqs);
  /*
   * devres release callback: @res holds a pointer to the net device that
   * was allocated by devm_alloc_etherdev_mqs(); free that device.
   */
  static void devm_free_netdev(struct device *dev, void *res)
  {
      struct net_device **slot = res;

      free_netdev(*slot);
  }
  360. struct net_device *devm_alloc_etherdev_mqs(struct device *dev, int sizeof_priv,
  361. unsigned int txqs, unsigned int rxqs)
  362. {
  363. struct net_device **dr;
  364. struct net_device *netdev;
  365. dr = devres_alloc(devm_free_netdev, sizeof(*dr), GFP_KERNEL);
  366. if (!dr)
  367. return NULL;
  368. netdev = alloc_etherdev_mqs(sizeof_priv, txqs, rxqs);
  369. if (!netdev) {
  370. devres_free(dr);
  371. return NULL;
  372. }
  373. *dr = netdev;
  374. devres_add(dev, dr);
  375. return netdev;
  376. }
  377. EXPORT_SYMBOL(devm_alloc_etherdev_mqs);
  378. ssize_t sysfs_format_mac(char *buf, const unsigned char *addr, int len)
  379. {
  380. return scnprintf(buf, PAGE_SIZE, "%*phC\n", len, addr);
  381. }
  382. EXPORT_SYMBOL(sysfs_format_mac);
  383. struct sk_buff *eth_gro_receive(struct list_head *head, struct sk_buff *skb)
  384. {
  385. const struct packet_offload *ptype;
  386. unsigned int hlen, off_eth;
  387. struct sk_buff *pp = NULL;
  388. struct ethhdr *eh, *eh2;
  389. struct sk_buff *p;
  390. __be16 type;
  391. int flush = 1;
  392. off_eth = skb_gro_offset(skb);
  393. hlen = off_eth + sizeof(*eh);
  394. eh = skb_gro_header_fast(skb, off_eth);
  395. if (skb_gro_header_hard(skb, hlen)) {
  396. eh = skb_gro_header_slow(skb, hlen, off_eth);
  397. if (unlikely(!eh))
  398. goto out;
  399. }
  400. flush = 0;
  401. list_for_each_entry(p, head, list) {
  402. if (!NAPI_GRO_CB(p)->same_flow)
  403. continue;
  404. eh2 = (struct ethhdr *)(p->data + off_eth);
  405. if (compare_ether_header(eh, eh2)) {
  406. NAPI_GRO_CB(p)->same_flow = 0;
  407. continue;
  408. }
  409. }
  410. type = eh->h_proto;
  411. rcu_read_lock();
  412. ptype = gro_find_receive_by_type(type);
  413. if (ptype == NULL) {
  414. flush = 1;
  415. goto out_unlock;
  416. }
  417. skb_gro_pull(skb, sizeof(*eh));
  418. skb_gro_postpull_rcsum(skb, eh, sizeof(*eh));
  419. pp = call_gro_receive(ptype->callbacks.gro_receive, head, skb);
  420. out_unlock:
  421. rcu_read_unlock();
  422. out:
  423. skb_gro_flush_final(skb, pp, flush);
  424. return pp;
  425. }
  426. EXPORT_SYMBOL(eth_gro_receive);
  427. int eth_gro_complete(struct sk_buff *skb, int nhoff)
  428. {
  429. struct ethhdr *eh = (struct ethhdr *)(skb->data + nhoff);
  430. __be16 type = eh->h_proto;
  431. struct packet_offload *ptype;
  432. int err = -ENOSYS;
  433. if (skb->encapsulation)
  434. skb_set_inner_mac_header(skb, nhoff);
  435. rcu_read_lock();
  436. ptype = gro_find_complete_by_type(type);
  437. if (ptype != NULL)
  438. err = ptype->callbacks.gro_complete(skb, nhoff +
  439. sizeof(struct ethhdr));
  440. rcu_read_unlock();
  441. return err;
  442. }
  443. EXPORT_SYMBOL(eth_gro_complete);
  444. static struct packet_offload eth_packet_offload __read_mostly = {
  445. .type = cpu_to_be16(ETH_P_TEB),
  446. .priority = 10,
  447. .callbacks = {
  448. .gro_receive = eth_gro_receive,
  449. .gro_complete = eth_gro_complete,
  450. },
  451. };
  452. static int __init eth_offload_init(void)
  453. {
  454. dev_add_offload(&eth_packet_offload);
  455. return 0;
  456. }
  457. fs_initcall(eth_offload_init);
  458. unsigned char * __weak arch_get_platform_mac_address(void)
  459. {
  460. return NULL;
  461. }
  462. int eth_platform_get_mac_address(struct device *dev, u8 *mac_addr)
  463. {
  464. const unsigned char *addr;
  465. struct device_node *dp;
  466. if (dev_is_pci(dev))
  467. dp = pci_device_to_OF_node(to_pci_dev(dev));
  468. else
  469. dp = dev->of_node;
  470. addr = NULL;
  471. if (dp)
  472. addr = of_get_mac_address(dp);
  473. if (!addr)
  474. addr = arch_get_platform_mac_address();
  475. if (!addr)
  476. return -ENODEV;
  477. ether_addr_copy(mac_addr, addr);
  478. return 0;
  479. }
  480. EXPORT_SYMBOL(eth_platform_get_mac_address);