ibmveth.c 52 KB

12345678910111213141516171819202122232425262728293031323334353637383940414243444546474849505152535455565758596061626364656667686970717273747576777879808182838485868788899091929394959697989910010110210310410510610710810911011111211311411511611711811912012112212312412512612712812913013113213313413513613713813914014114214314414514614714814915015115215315415515615715815916016116216316416516616716816917017117217317417517617717817918018118218318418518618718818919019119219319419519619719819920020120220320420520620720820921021121221321421521621721821922022122222322422522622722822923023123223323423523623723823924024124224324424524624724824925025125225325425525625725825926026126226326426526626726826927027127227327427527627727827928028128228328428528628728828929029129229329429529629729829930030130230330430530630730830931031131231331431531631731831932032132232332432532632732832933033133233333433533633733833934034134234334434534634734834935035135235335435535635735835936036136236336436536636736836937037137237337437537637737837938038138238338438538638738838939039139239339439539639739839940040140240340440540640740840941041141241341441541641741841942042142242342442542642742842943043143243343443543643743843944044144244344444544644744844945045145245345445545645745845946046146246346446546646746846947047147247347447547647747847948048148248348448548648748848949049149249349449549649749849950050150250350450550650750850951051151251351451551651751851952052152252352452552652752852953053153253353453553653753853954054154254354454554654754854955055155255355455555655755855956056156256356456556656756856957057157257357457557657757857958058158258358458558658758858959059159259359459559659759859960060160260360460560660760860961061161261361461561661761861962062162262362462562662762862963063163263363463563663763863964064164264364464564664764864965065165265365465565665765865966066166266366466566666766866967067167267367467567667767867968068168268368468568668768868969069169269369469569669769869970070170270370470570670770870971071171271371471571671771871972072172272372472572672772872973073173273373473573673773873974074174274374474574674774874975075175275375475575675775875976076176276376476576676776876977077177277377477577677777877978078178278378478578678778878979079179279379479579679779879980080180280380480580680780880981081181281381481581681781881982082182282382482582682782882983083183283383483583683783883984084184284384484584684784884985085185285385485585685785885986086186286386486586686786886987087187287387487587687787887988088188288388488588688788888989089189289389489589689789889990090190290390490590690790890991091191291391491591691791891992092192292392492592692792892993093193293393493593693793893994094194294394494594694794894995095195295395495595695795895996096196296396496596696796896997097197297397497597697797897998098198298398498598698798898999099199299399499599699799899910001001100210031004100510061007100810091010101110121013101410151016101710181019102010211022102310241025102610271028102910301031103210331034103510361037103810391040104110421043104410451046104710481049105010511052105310541055105610571058105910601061106210631064106510661067106810691070107110721073107410751076107710781079108010811082108310841085108610871088108910901091109210931094109510961097109810991100110111021103110411051106110711081109111011111112111311141115111611171118111911201121112211231124112511261127112811291130113111321133113411351136113711381139114011411142114311441145114611471148114911501151115211531154115511561157115811591160116111621163116411651166116711681169117011711172117311741175117611771178117911801181118211831184118511861187118811891190119111921193119411951196119711981199120012011202120312041205120612071208120912101211121212131214121512161217121812191220122112221223122412251226122712281229123012311232123312341235123612371238123912401241124212431244124512461247124812491250125112521253125412551256125712581259126012611262126312641265126612671268126912701271127212731274127512761277127812791280128112821283128412851286128712881289129012911292129312941295129612971298129913001301130213031304130513061307130813091310131113121313131413151316131713181319132013211322132313241325132613271328132913301331133213331334133513361337133813391340134113421343134413451346134713481349135013511352135313541355135613571358135913601361136213631364136513661367136813691370137113721373137413751376137713781379138013811382138313841385138613871388138913901391139213931394139513961397139813991400140114021403140414051406140714081409141014111412141314141415141614171418141914201421142214231424142514261427142814291430143114321433143414351436143714381439144014411442144314441445144614471448144914501451145214531454145514561457145814591460146114621463146414651466146714681469147014711472147314741475147614771478147914801481148214831484148514861487148814891490149114921493149414951496149714981499150015011502150315041505150615071508150915101511151215131514151515161517151815191520152115221523152415251526152715281529153015311532153315341535153615371538153915401541154215431544154515461547154815491550155115521553155415551556155715581559156015611562156315641565156615671568156915701571157215731574157515761577157815791580158115821583158415851586158715881589159015911592159315941595159615971598159916001601160216031604160516061607160816091610161116121613161416151616161716181619162016211622162316241625162616271628162916301631163216331634163516361637163816391640164116421643164416451646164716481649165016511652165316541655165616571658165916601661166216631664166516661667166816691670167116721673167416751676167716781679168016811682168316841685168616871688168916901691169216931694169516961697169816991700170117021703170417051706170717081709171017111712171317141715171617171718171917201721172217231724172517261727172817291730173117321733173417351736173717381739174017411742174317441745174617471748174917501751175217531754175517561757175817591760176117621763176417651766176717681769177017711772177317741775177617771778177917801781178217831784178517861787178817891790179117921793179417951796179717981799180018011802180318041805180618071808180918101811181218131814181518161817181818191820182118221823182418251826182718281829183018311832183318341835183618371838183918401841184218431844184518461847184818491850185118521853185418551856185718581859186018611862186318641865186618671868186918701871187218731874187518761877187818791880188118821883188418851886188718881889189018911892189318941895189618971898189919001901190219031904190519061907190819091910191119121913191419151916191719181919192019211922192319241925192619271928192919301931193219331934193519361937
  1. /*
  2. * IBM Power Virtual Ethernet Device Driver
  3. *
  4. * This program is free software; you can redistribute it and/or modify
  5. * it under the terms of the GNU General Public License as published by
  6. * the Free Software Foundation; either version 2 of the License, or
  7. * (at your option) any later version.
  8. *
  9. * This program is distributed in the hope that it will be useful,
  10. * but WITHOUT ANY WARRANTY; without even the implied warranty of
  11. * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
  12. * GNU General Public License for more details.
  13. *
  14. * You should have received a copy of the GNU General Public License
  15. * along with this program; if not, see <http://www.gnu.org/licenses/>.
  16. *
  17. * Copyright (C) IBM Corporation, 2003, 2010
  18. *
  19. * Authors: Dave Larson <larson1@us.ibm.com>
  20. * Santiago Leon <santil@linux.vnet.ibm.com>
  21. * Brian King <brking@linux.vnet.ibm.com>
  22. * Robert Jennings <rcj@linux.vnet.ibm.com>
  23. * Anton Blanchard <anton@au.ibm.com>
  24. */
  25. #include <linux/module.h>
  26. #include <linux/moduleparam.h>
  27. #include <linux/types.h>
  28. #include <linux/errno.h>
  29. #include <linux/dma-mapping.h>
  30. #include <linux/kernel.h>
  31. #include <linux/netdevice.h>
  32. #include <linux/etherdevice.h>
  33. #include <linux/skbuff.h>
  34. #include <linux/init.h>
  35. #include <linux/interrupt.h>
  36. #include <linux/mm.h>
  37. #include <linux/pm.h>
  38. #include <linux/ethtool.h>
  39. #include <linux/in.h>
  40. #include <linux/ip.h>
  41. #include <linux/ipv6.h>
  42. #include <linux/slab.h>
  43. #include <asm/hvcall.h>
  44. #include <linux/atomic.h>
  45. #include <asm/vio.h>
  46. #include <asm/iommu.h>
  47. #include <asm/firmware.h>
  48. #include <net/tcp.h>
  49. #include <net/ip6_checksum.h>
  50. #include "ibmveth.h"
  51. static irqreturn_t ibmveth_interrupt(int irq, void *dev_instance);
  52. static void ibmveth_rxq_harvest_buffer(struct ibmveth_adapter *adapter);
  53. static unsigned long ibmveth_get_desired_dma(struct vio_dev *vdev);
  54. static struct kobj_type ktype_veth_pool;
  55. static const char ibmveth_driver_name[] = "ibmveth";
  56. static const char ibmveth_driver_string[] = "IBM Power Virtual Ethernet Driver";
  57. #define ibmveth_driver_version "1.06"
  58. MODULE_AUTHOR("Santiago Leon <santil@linux.vnet.ibm.com>");
  59. MODULE_DESCRIPTION("IBM Power Virtual Ethernet Driver");
  60. MODULE_LICENSE("GPL");
  61. MODULE_VERSION(ibmveth_driver_version);
  62. static unsigned int tx_copybreak __read_mostly = 128;
  63. module_param(tx_copybreak, uint, 0644);
  64. MODULE_PARM_DESC(tx_copybreak,
  65. "Maximum size of packet that is copied to a new buffer on transmit");
  66. static unsigned int rx_copybreak __read_mostly = 128;
  67. module_param(rx_copybreak, uint, 0644);
  68. MODULE_PARM_DESC(rx_copybreak,
  69. "Maximum size of packet that is copied to a new buffer on receive");
  70. static unsigned int rx_flush __read_mostly = 0;
  71. module_param(rx_flush, uint, 0644);
  72. MODULE_PARM_DESC(rx_flush, "Flush receive buffers before use");
  73. static bool old_large_send __read_mostly;
  74. module_param(old_large_send, bool, 0444);
  75. MODULE_PARM_DESC(old_large_send,
  76. "Use old large send method on firmware that supports the new method");
  77. struct ibmveth_stat {
  78. char name[ETH_GSTRING_LEN];
  79. int offset;
  80. };
  81. #define IBMVETH_STAT_OFF(stat) offsetof(struct ibmveth_adapter, stat)
  82. #define IBMVETH_GET_STAT(a, off) *((u64 *)(((unsigned long)(a)) + off))
  83. struct ibmveth_stat ibmveth_stats[] = {
  84. { "replenish_task_cycles", IBMVETH_STAT_OFF(replenish_task_cycles) },
  85. { "replenish_no_mem", IBMVETH_STAT_OFF(replenish_no_mem) },
  86. { "replenish_add_buff_failure",
  87. IBMVETH_STAT_OFF(replenish_add_buff_failure) },
  88. { "replenish_add_buff_success",
  89. IBMVETH_STAT_OFF(replenish_add_buff_success) },
  90. { "rx_invalid_buffer", IBMVETH_STAT_OFF(rx_invalid_buffer) },
  91. { "rx_no_buffer", IBMVETH_STAT_OFF(rx_no_buffer) },
  92. { "tx_map_failed", IBMVETH_STAT_OFF(tx_map_failed) },
  93. { "tx_send_failed", IBMVETH_STAT_OFF(tx_send_failed) },
  94. { "fw_enabled_ipv4_csum", IBMVETH_STAT_OFF(fw_ipv4_csum_support) },
  95. { "fw_enabled_ipv6_csum", IBMVETH_STAT_OFF(fw_ipv6_csum_support) },
  96. { "tx_large_packets", IBMVETH_STAT_OFF(tx_large_packets) },
  97. { "rx_large_packets", IBMVETH_STAT_OFF(rx_large_packets) },
  98. { "fw_enabled_large_send", IBMVETH_STAT_OFF(fw_large_send_support) }
  99. };
  100. /* simple methods of getting data from the current rxq entry */
  101. static inline u32 ibmveth_rxq_flags(struct ibmveth_adapter *adapter)
  102. {
  103. return be32_to_cpu(adapter->rx_queue.queue_addr[adapter->rx_queue.index].flags_off);
  104. }
  105. static inline int ibmveth_rxq_toggle(struct ibmveth_adapter *adapter)
  106. {
  107. return (ibmveth_rxq_flags(adapter) & IBMVETH_RXQ_TOGGLE) >>
  108. IBMVETH_RXQ_TOGGLE_SHIFT;
  109. }
  110. static inline int ibmveth_rxq_pending_buffer(struct ibmveth_adapter *adapter)
  111. {
  112. return ibmveth_rxq_toggle(adapter) == adapter->rx_queue.toggle;
  113. }
  114. static inline int ibmveth_rxq_buffer_valid(struct ibmveth_adapter *adapter)
  115. {
  116. return ibmveth_rxq_flags(adapter) & IBMVETH_RXQ_VALID;
  117. }
  118. static inline int ibmveth_rxq_frame_offset(struct ibmveth_adapter *adapter)
  119. {
  120. return ibmveth_rxq_flags(adapter) & IBMVETH_RXQ_OFF_MASK;
  121. }
  122. static inline int ibmveth_rxq_large_packet(struct ibmveth_adapter *adapter)
  123. {
  124. return ibmveth_rxq_flags(adapter) & IBMVETH_RXQ_LRG_PKT;
  125. }
  126. static inline int ibmveth_rxq_frame_length(struct ibmveth_adapter *adapter)
  127. {
  128. return be32_to_cpu(adapter->rx_queue.queue_addr[adapter->rx_queue.index].length);
  129. }
  130. static inline int ibmveth_rxq_csum_good(struct ibmveth_adapter *adapter)
  131. {
  132. return ibmveth_rxq_flags(adapter) & IBMVETH_RXQ_CSUM_GOOD;
  133. }
  134. /* setup the initial settings for a buffer pool */
  135. static void ibmveth_init_buffer_pool(struct ibmveth_buff_pool *pool,
  136. u32 pool_index, u32 pool_size,
  137. u32 buff_size, u32 pool_active)
  138. {
  139. pool->size = pool_size;
  140. pool->index = pool_index;
  141. pool->buff_size = buff_size;
  142. pool->threshold = pool_size * 7 / 8;
  143. pool->active = pool_active;
  144. }
  145. /* allocate and setup an buffer pool - called during open */
  146. static int ibmveth_alloc_buffer_pool(struct ibmveth_buff_pool *pool)
  147. {
  148. int i;
  149. pool->free_map = kmalloc_array(pool->size, sizeof(u16), GFP_KERNEL);
  150. if (!pool->free_map)
  151. return -1;
  152. pool->dma_addr = kcalloc(pool->size, sizeof(dma_addr_t), GFP_KERNEL);
  153. if (!pool->dma_addr) {
  154. kfree(pool->free_map);
  155. pool->free_map = NULL;
  156. return -1;
  157. }
  158. pool->skbuff = kcalloc(pool->size, sizeof(void *), GFP_KERNEL);
  159. if (!pool->skbuff) {
  160. kfree(pool->dma_addr);
  161. pool->dma_addr = NULL;
  162. kfree(pool->free_map);
  163. pool->free_map = NULL;
  164. return -1;
  165. }
  166. for (i = 0; i < pool->size; ++i)
  167. pool->free_map[i] = i;
  168. atomic_set(&pool->available, 0);
  169. pool->producer_index = 0;
  170. pool->consumer_index = 0;
  171. return 0;
  172. }
  173. static inline void ibmveth_flush_buffer(void *addr, unsigned long length)
  174. {
  175. unsigned long offset;
  176. for (offset = 0; offset < length; offset += SMP_CACHE_BYTES)
  177. asm("dcbfl %0,%1" :: "b" (addr), "r" (offset));
  178. }
  179. /* replenish the buffers for a pool. note that we don't need to
  180. * skb_reserve these since they are used for incoming...
  181. */
  182. static void ibmveth_replenish_buffer_pool(struct ibmveth_adapter *adapter,
  183. struct ibmveth_buff_pool *pool)
  184. {
  185. u32 i;
  186. u32 count = pool->size - atomic_read(&pool->available);
  187. u32 buffers_added = 0;
  188. struct sk_buff *skb;
  189. unsigned int free_index, index;
  190. u64 correlator;
  191. unsigned long lpar_rc;
  192. dma_addr_t dma_addr;
  193. mb();
  194. for (i = 0; i < count; ++i) {
  195. union ibmveth_buf_desc desc;
  196. skb = netdev_alloc_skb(adapter->netdev, pool->buff_size);
  197. if (!skb) {
  198. netdev_dbg(adapter->netdev,
  199. "replenish: unable to allocate skb\n");
  200. adapter->replenish_no_mem++;
  201. break;
  202. }
  203. free_index = pool->consumer_index;
  204. pool->consumer_index++;
  205. if (pool->consumer_index >= pool->size)
  206. pool->consumer_index = 0;
  207. index = pool->free_map[free_index];
  208. BUG_ON(index == IBM_VETH_INVALID_MAP);
  209. BUG_ON(pool->skbuff[index] != NULL);
  210. dma_addr = dma_map_single(&adapter->vdev->dev, skb->data,
  211. pool->buff_size, DMA_FROM_DEVICE);
  212. if (dma_mapping_error(&adapter->vdev->dev, dma_addr))
  213. goto failure;
  214. pool->free_map[free_index] = IBM_VETH_INVALID_MAP;
  215. pool->dma_addr[index] = dma_addr;
  216. pool->skbuff[index] = skb;
  217. correlator = ((u64)pool->index << 32) | index;
  218. *(u64 *)skb->data = correlator;
  219. desc.fields.flags_len = IBMVETH_BUF_VALID | pool->buff_size;
  220. desc.fields.address = dma_addr;
  221. if (rx_flush) {
  222. unsigned int len = min(pool->buff_size,
  223. adapter->netdev->mtu +
  224. IBMVETH_BUFF_OH);
  225. ibmveth_flush_buffer(skb->data, len);
  226. }
  227. lpar_rc = h_add_logical_lan_buffer(adapter->vdev->unit_address,
  228. desc.desc);
  229. if (lpar_rc != H_SUCCESS) {
  230. goto failure;
  231. } else {
  232. buffers_added++;
  233. adapter->replenish_add_buff_success++;
  234. }
  235. }
  236. mb();
  237. atomic_add(buffers_added, &(pool->available));
  238. return;
  239. failure:
  240. pool->free_map[free_index] = index;
  241. pool->skbuff[index] = NULL;
  242. if (pool->consumer_index == 0)
  243. pool->consumer_index = pool->size - 1;
  244. else
  245. pool->consumer_index--;
  246. if (!dma_mapping_error(&adapter->vdev->dev, dma_addr))
  247. dma_unmap_single(&adapter->vdev->dev,
  248. pool->dma_addr[index], pool->buff_size,
  249. DMA_FROM_DEVICE);
  250. dev_kfree_skb_any(skb);
  251. adapter->replenish_add_buff_failure++;
  252. mb();
  253. atomic_add(buffers_added, &(pool->available));
  254. }
  255. /*
  256. * The final 8 bytes of the buffer list is a counter of frames dropped
  257. * because there was not a buffer in the buffer list capable of holding
  258. * the frame.
  259. */
  260. static void ibmveth_update_rx_no_buffer(struct ibmveth_adapter *adapter)
  261. {
  262. __be64 *p = adapter->buffer_list_addr + 4096 - 8;
  263. adapter->rx_no_buffer = be64_to_cpup(p);
  264. }
  265. /* replenish routine */
  266. static void ibmveth_replenish_task(struct ibmveth_adapter *adapter)
  267. {
  268. int i;
  269. adapter->replenish_task_cycles++;
  270. for (i = (IBMVETH_NUM_BUFF_POOLS - 1); i >= 0; i--) {
  271. struct ibmveth_buff_pool *pool = &adapter->rx_buff_pool[i];
  272. if (pool->active &&
  273. (atomic_read(&pool->available) < pool->threshold))
  274. ibmveth_replenish_buffer_pool(adapter, pool);
  275. }
  276. ibmveth_update_rx_no_buffer(adapter);
  277. }
  278. /* empty and free ana buffer pool - also used to do cleanup in error paths */
  279. static void ibmveth_free_buffer_pool(struct ibmveth_adapter *adapter,
  280. struct ibmveth_buff_pool *pool)
  281. {
  282. int i;
  283. kfree(pool->free_map);
  284. pool->free_map = NULL;
  285. if (pool->skbuff && pool->dma_addr) {
  286. for (i = 0; i < pool->size; ++i) {
  287. struct sk_buff *skb = pool->skbuff[i];
  288. if (skb) {
  289. dma_unmap_single(&adapter->vdev->dev,
  290. pool->dma_addr[i],
  291. pool->buff_size,
  292. DMA_FROM_DEVICE);
  293. dev_kfree_skb_any(skb);
  294. pool->skbuff[i] = NULL;
  295. }
  296. }
  297. }
  298. if (pool->dma_addr) {
  299. kfree(pool->dma_addr);
  300. pool->dma_addr = NULL;
  301. }
  302. if (pool->skbuff) {
  303. kfree(pool->skbuff);
  304. pool->skbuff = NULL;
  305. }
  306. }
  307. /* remove a buffer from a pool */
  308. static void ibmveth_remove_buffer_from_pool(struct ibmveth_adapter *adapter,
  309. u64 correlator)
  310. {
  311. unsigned int pool = correlator >> 32;
  312. unsigned int index = correlator & 0xffffffffUL;
  313. unsigned int free_index;
  314. struct sk_buff *skb;
  315. BUG_ON(pool >= IBMVETH_NUM_BUFF_POOLS);
  316. BUG_ON(index >= adapter->rx_buff_pool[pool].size);
  317. skb = adapter->rx_buff_pool[pool].skbuff[index];
  318. BUG_ON(skb == NULL);
  319. adapter->rx_buff_pool[pool].skbuff[index] = NULL;
  320. dma_unmap_single(&adapter->vdev->dev,
  321. adapter->rx_buff_pool[pool].dma_addr[index],
  322. adapter->rx_buff_pool[pool].buff_size,
  323. DMA_FROM_DEVICE);
  324. free_index = adapter->rx_buff_pool[pool].producer_index;
  325. adapter->rx_buff_pool[pool].producer_index++;
  326. if (adapter->rx_buff_pool[pool].producer_index >=
  327. adapter->rx_buff_pool[pool].size)
  328. adapter->rx_buff_pool[pool].producer_index = 0;
  329. adapter->rx_buff_pool[pool].free_map[free_index] = index;
  330. mb();
  331. atomic_dec(&(adapter->rx_buff_pool[pool].available));
  332. }
  333. /* get the current buffer on the rx queue */
  334. static inline struct sk_buff *ibmveth_rxq_get_buffer(struct ibmveth_adapter *adapter)
  335. {
  336. u64 correlator = adapter->rx_queue.queue_addr[adapter->rx_queue.index].correlator;
  337. unsigned int pool = correlator >> 32;
  338. unsigned int index = correlator & 0xffffffffUL;
  339. BUG_ON(pool >= IBMVETH_NUM_BUFF_POOLS);
  340. BUG_ON(index >= adapter->rx_buff_pool[pool].size);
  341. return adapter->rx_buff_pool[pool].skbuff[index];
  342. }
  343. /* recycle the current buffer on the rx queue */
  344. static int ibmveth_rxq_recycle_buffer(struct ibmveth_adapter *adapter)
  345. {
  346. u32 q_index = adapter->rx_queue.index;
  347. u64 correlator = adapter->rx_queue.queue_addr[q_index].correlator;
  348. unsigned int pool = correlator >> 32;
  349. unsigned int index = correlator & 0xffffffffUL;
  350. union ibmveth_buf_desc desc;
  351. unsigned long lpar_rc;
  352. int ret = 1;
  353. BUG_ON(pool >= IBMVETH_NUM_BUFF_POOLS);
  354. BUG_ON(index >= adapter->rx_buff_pool[pool].size);
  355. if (!adapter->rx_buff_pool[pool].active) {
  356. ibmveth_rxq_harvest_buffer(adapter);
  357. ibmveth_free_buffer_pool(adapter, &adapter->rx_buff_pool[pool]);
  358. goto out;
  359. }
  360. desc.fields.flags_len = IBMVETH_BUF_VALID |
  361. adapter->rx_buff_pool[pool].buff_size;
  362. desc.fields.address = adapter->rx_buff_pool[pool].dma_addr[index];
  363. lpar_rc = h_add_logical_lan_buffer(adapter->vdev->unit_address, desc.desc);
  364. if (lpar_rc != H_SUCCESS) {
  365. netdev_dbg(adapter->netdev, "h_add_logical_lan_buffer failed "
  366. "during recycle rc=%ld", lpar_rc);
  367. ibmveth_remove_buffer_from_pool(adapter, adapter->rx_queue.queue_addr[adapter->rx_queue.index].correlator);
  368. ret = 0;
  369. }
  370. if (++adapter->rx_queue.index == adapter->rx_queue.num_slots) {
  371. adapter->rx_queue.index = 0;
  372. adapter->rx_queue.toggle = !adapter->rx_queue.toggle;
  373. }
  374. out:
  375. return ret;
  376. }
  377. static void ibmveth_rxq_harvest_buffer(struct ibmveth_adapter *adapter)
  378. {
  379. ibmveth_remove_buffer_from_pool(adapter, adapter->rx_queue.queue_addr[adapter->rx_queue.index].correlator);
  380. if (++adapter->rx_queue.index == adapter->rx_queue.num_slots) {
  381. adapter->rx_queue.index = 0;
  382. adapter->rx_queue.toggle = !adapter->rx_queue.toggle;
  383. }
  384. }
  385. static int ibmveth_register_logical_lan(struct ibmveth_adapter *adapter,
  386. union ibmveth_buf_desc rxq_desc, u64 mac_address)
  387. {
  388. int rc, try_again = 1;
  389. /*
  390. * After a kexec the adapter will still be open, so our attempt to
  391. * open it will fail. So if we get a failure we free the adapter and
  392. * try again, but only once.
  393. */
  394. retry:
  395. rc = h_register_logical_lan(adapter->vdev->unit_address,
  396. adapter->buffer_list_dma, rxq_desc.desc,
  397. adapter->filter_list_dma, mac_address);
  398. if (rc != H_SUCCESS && try_again) {
  399. do {
  400. rc = h_free_logical_lan(adapter->vdev->unit_address);
  401. } while (H_IS_LONG_BUSY(rc) || (rc == H_BUSY));
  402. try_again = 0;
  403. goto retry;
  404. }
  405. return rc;
  406. }
  407. static u64 ibmveth_encode_mac_addr(u8 *mac)
  408. {
  409. int i;
  410. u64 encoded = 0;
  411. for (i = 0; i < ETH_ALEN; i++)
  412. encoded = (encoded << 8) | mac[i];
  413. return encoded;
  414. }
  415. static int ibmveth_open(struct net_device *netdev)
  416. {
  417. struct ibmveth_adapter *adapter = netdev_priv(netdev);
  418. u64 mac_address;
  419. int rxq_entries = 1;
  420. unsigned long lpar_rc;
  421. int rc;
  422. union ibmveth_buf_desc rxq_desc;
  423. int i;
  424. struct device *dev;
  425. netdev_dbg(netdev, "open starting\n");
  426. napi_enable(&adapter->napi);
  427. for(i = 0; i < IBMVETH_NUM_BUFF_POOLS; i++)
  428. rxq_entries += adapter->rx_buff_pool[i].size;
  429. rc = -ENOMEM;
  430. adapter->buffer_list_addr = (void*) get_zeroed_page(GFP_KERNEL);
  431. if (!adapter->buffer_list_addr) {
  432. netdev_err(netdev, "unable to allocate list pages\n");
  433. goto out;
  434. }
  435. adapter->filter_list_addr = (void*) get_zeroed_page(GFP_KERNEL);
  436. if (!adapter->filter_list_addr) {
  437. netdev_err(netdev, "unable to allocate filter pages\n");
  438. goto out_free_buffer_list;
  439. }
  440. dev = &adapter->vdev->dev;
  441. adapter->rx_queue.queue_len = sizeof(struct ibmveth_rx_q_entry) *
  442. rxq_entries;
  443. adapter->rx_queue.queue_addr =
  444. dma_alloc_coherent(dev, adapter->rx_queue.queue_len,
  445. &adapter->rx_queue.queue_dma, GFP_KERNEL);
  446. if (!adapter->rx_queue.queue_addr)
  447. goto out_free_filter_list;
  448. adapter->buffer_list_dma = dma_map_single(dev,
  449. adapter->buffer_list_addr, 4096, DMA_BIDIRECTIONAL);
  450. if (dma_mapping_error(dev, adapter->buffer_list_dma)) {
  451. netdev_err(netdev, "unable to map buffer list pages\n");
  452. goto out_free_queue_mem;
  453. }
  454. adapter->filter_list_dma = dma_map_single(dev,
  455. adapter->filter_list_addr, 4096, DMA_BIDIRECTIONAL);
  456. if (dma_mapping_error(dev, adapter->filter_list_dma)) {
  457. netdev_err(netdev, "unable to map filter list pages\n");
  458. goto out_unmap_buffer_list;
  459. }
  460. adapter->rx_queue.index = 0;
  461. adapter->rx_queue.num_slots = rxq_entries;
  462. adapter->rx_queue.toggle = 1;
  463. mac_address = ibmveth_encode_mac_addr(netdev->dev_addr);
  464. rxq_desc.fields.flags_len = IBMVETH_BUF_VALID |
  465. adapter->rx_queue.queue_len;
  466. rxq_desc.fields.address = adapter->rx_queue.queue_dma;
  467. netdev_dbg(netdev, "buffer list @ 0x%p\n", adapter->buffer_list_addr);
  468. netdev_dbg(netdev, "filter list @ 0x%p\n", adapter->filter_list_addr);
  469. netdev_dbg(netdev, "receive q @ 0x%p\n", adapter->rx_queue.queue_addr);
  470. h_vio_signal(adapter->vdev->unit_address, VIO_IRQ_DISABLE);
  471. lpar_rc = ibmveth_register_logical_lan(adapter, rxq_desc, mac_address);
  472. if (lpar_rc != H_SUCCESS) {
  473. netdev_err(netdev, "h_register_logical_lan failed with %ld\n",
  474. lpar_rc);
  475. netdev_err(netdev, "buffer TCE:0x%llx filter TCE:0x%llx rxq "
  476. "desc:0x%llx MAC:0x%llx\n",
  477. adapter->buffer_list_dma,
  478. adapter->filter_list_dma,
  479. rxq_desc.desc,
  480. mac_address);
  481. rc = -ENONET;
  482. goto out_unmap_filter_list;
  483. }
  484. for (i = 0; i < IBMVETH_NUM_BUFF_POOLS; i++) {
  485. if (!adapter->rx_buff_pool[i].active)
  486. continue;
  487. if (ibmveth_alloc_buffer_pool(&adapter->rx_buff_pool[i])) {
  488. netdev_err(netdev, "unable to alloc pool\n");
  489. adapter->rx_buff_pool[i].active = 0;
  490. rc = -ENOMEM;
  491. goto out_free_buffer_pools;
  492. }
  493. }
  494. netdev_dbg(netdev, "registering irq 0x%x\n", netdev->irq);
  495. rc = request_irq(netdev->irq, ibmveth_interrupt, 0, netdev->name,
  496. netdev);
  497. if (rc != 0) {
  498. netdev_err(netdev, "unable to request irq 0x%x, rc %d\n",
  499. netdev->irq, rc);
  500. do {
  501. lpar_rc = h_free_logical_lan(adapter->vdev->unit_address);
  502. } while (H_IS_LONG_BUSY(lpar_rc) || (lpar_rc == H_BUSY));
  503. goto out_free_buffer_pools;
  504. }
  505. rc = -ENOMEM;
  506. adapter->bounce_buffer =
  507. kmalloc(netdev->mtu + IBMVETH_BUFF_OH, GFP_KERNEL);
  508. if (!adapter->bounce_buffer)
  509. goto out_free_irq;
  510. adapter->bounce_buffer_dma =
  511. dma_map_single(&adapter->vdev->dev, adapter->bounce_buffer,
  512. netdev->mtu + IBMVETH_BUFF_OH, DMA_BIDIRECTIONAL);
  513. if (dma_mapping_error(dev, adapter->bounce_buffer_dma)) {
  514. netdev_err(netdev, "unable to map bounce buffer\n");
  515. goto out_free_bounce_buffer;
  516. }
  517. netdev_dbg(netdev, "initial replenish cycle\n");
  518. ibmveth_interrupt(netdev->irq, netdev);
  519. netif_start_queue(netdev);
  520. netdev_dbg(netdev, "open complete\n");
  521. return 0;
  522. out_free_bounce_buffer:
  523. kfree(adapter->bounce_buffer);
  524. out_free_irq:
  525. free_irq(netdev->irq, netdev);
  526. out_free_buffer_pools:
  527. while (--i >= 0) {
  528. if (adapter->rx_buff_pool[i].active)
  529. ibmveth_free_buffer_pool(adapter,
  530. &adapter->rx_buff_pool[i]);
  531. }
  532. out_unmap_filter_list:
  533. dma_unmap_single(dev, adapter->filter_list_dma, 4096,
  534. DMA_BIDIRECTIONAL);
  535. out_unmap_buffer_list:
  536. dma_unmap_single(dev, adapter->buffer_list_dma, 4096,
  537. DMA_BIDIRECTIONAL);
  538. out_free_queue_mem:
  539. dma_free_coherent(dev, adapter->rx_queue.queue_len,
  540. adapter->rx_queue.queue_addr,
  541. adapter->rx_queue.queue_dma);
  542. out_free_filter_list:
  543. free_page((unsigned long)adapter->filter_list_addr);
  544. out_free_buffer_list:
  545. free_page((unsigned long)adapter->buffer_list_addr);
  546. out:
  547. napi_disable(&adapter->napi);
  548. return rc;
  549. }
  550. static int ibmveth_close(struct net_device *netdev)
  551. {
  552. struct ibmveth_adapter *adapter = netdev_priv(netdev);
  553. struct device *dev = &adapter->vdev->dev;
  554. long lpar_rc;
  555. int i;
  556. netdev_dbg(netdev, "close starting\n");
  557. napi_disable(&adapter->napi);
  558. if (!adapter->pool_config)
  559. netif_stop_queue(netdev);
  560. h_vio_signal(adapter->vdev->unit_address, VIO_IRQ_DISABLE);
  561. do {
  562. lpar_rc = h_free_logical_lan(adapter->vdev->unit_address);
  563. } while (H_IS_LONG_BUSY(lpar_rc) || (lpar_rc == H_BUSY));
  564. if (lpar_rc != H_SUCCESS) {
  565. netdev_err(netdev, "h_free_logical_lan failed with %lx, "
  566. "continuing with close\n", lpar_rc);
  567. }
  568. free_irq(netdev->irq, netdev);
  569. ibmveth_update_rx_no_buffer(adapter);
  570. dma_unmap_single(dev, adapter->buffer_list_dma, 4096,
  571. DMA_BIDIRECTIONAL);
  572. free_page((unsigned long)adapter->buffer_list_addr);
  573. dma_unmap_single(dev, adapter->filter_list_dma, 4096,
  574. DMA_BIDIRECTIONAL);
  575. free_page((unsigned long)adapter->filter_list_addr);
  576. dma_free_coherent(dev, adapter->rx_queue.queue_len,
  577. adapter->rx_queue.queue_addr,
  578. adapter->rx_queue.queue_dma);
  579. for (i = 0; i < IBMVETH_NUM_BUFF_POOLS; i++)
  580. if (adapter->rx_buff_pool[i].active)
  581. ibmveth_free_buffer_pool(adapter,
  582. &adapter->rx_buff_pool[i]);
  583. dma_unmap_single(&adapter->vdev->dev, adapter->bounce_buffer_dma,
  584. adapter->netdev->mtu + IBMVETH_BUFF_OH,
  585. DMA_BIDIRECTIONAL);
  586. kfree(adapter->bounce_buffer);
  587. netdev_dbg(netdev, "close complete\n");
  588. return 0;
  589. }
  590. static int netdev_get_link_ksettings(struct net_device *dev,
  591. struct ethtool_link_ksettings *cmd)
  592. {
  593. u32 supported, advertising;
  594. supported = (SUPPORTED_1000baseT_Full | SUPPORTED_Autoneg |
  595. SUPPORTED_FIBRE);
  596. advertising = (ADVERTISED_1000baseT_Full | ADVERTISED_Autoneg |
  597. ADVERTISED_FIBRE);
  598. cmd->base.speed = SPEED_1000;
  599. cmd->base.duplex = DUPLEX_FULL;
  600. cmd->base.port = PORT_FIBRE;
  601. cmd->base.phy_address = 0;
  602. cmd->base.autoneg = AUTONEG_ENABLE;
  603. ethtool_convert_legacy_u32_to_link_mode(cmd->link_modes.supported,
  604. supported);
  605. ethtool_convert_legacy_u32_to_link_mode(cmd->link_modes.advertising,
  606. advertising);
  607. return 0;
  608. }
  609. static void netdev_get_drvinfo(struct net_device *dev,
  610. struct ethtool_drvinfo *info)
  611. {
  612. strlcpy(info->driver, ibmveth_driver_name, sizeof(info->driver));
  613. strlcpy(info->version, ibmveth_driver_version, sizeof(info->version));
  614. }
  615. static netdev_features_t ibmveth_fix_features(struct net_device *dev,
  616. netdev_features_t features)
  617. {
  618. /*
  619. * Since the ibmveth firmware interface does not have the
  620. * concept of separate tx/rx checksum offload enable, if rx
  621. * checksum is disabled we also have to disable tx checksum
  622. * offload. Once we disable rx checksum offload, we are no
  623. * longer allowed to send tx buffers that are not properly
  624. * checksummed.
  625. */
  626. if (!(features & NETIF_F_RXCSUM))
  627. features &= ~NETIF_F_CSUM_MASK;
  628. return features;
  629. }
  630. static int ibmveth_set_csum_offload(struct net_device *dev, u32 data)
  631. {
  632. struct ibmveth_adapter *adapter = netdev_priv(dev);
  633. unsigned long set_attr, clr_attr, ret_attr;
  634. unsigned long set_attr6, clr_attr6;
  635. long ret, ret4, ret6;
  636. int rc1 = 0, rc2 = 0;
  637. int restart = 0;
  638. if (netif_running(dev)) {
  639. restart = 1;
  640. adapter->pool_config = 1;
  641. ibmveth_close(dev);
  642. adapter->pool_config = 0;
  643. }
  644. set_attr = 0;
  645. clr_attr = 0;
  646. set_attr6 = 0;
  647. clr_attr6 = 0;
  648. if (data) {
  649. set_attr = IBMVETH_ILLAN_IPV4_TCP_CSUM;
  650. set_attr6 = IBMVETH_ILLAN_IPV6_TCP_CSUM;
  651. } else {
  652. clr_attr = IBMVETH_ILLAN_IPV4_TCP_CSUM;
  653. clr_attr6 = IBMVETH_ILLAN_IPV6_TCP_CSUM;
  654. }
  655. ret = h_illan_attributes(adapter->vdev->unit_address, 0, 0, &ret_attr);
  656. if (ret == H_SUCCESS &&
  657. (ret_attr & IBMVETH_ILLAN_PADDED_PKT_CSUM)) {
  658. ret4 = h_illan_attributes(adapter->vdev->unit_address, clr_attr,
  659. set_attr, &ret_attr);
  660. if (ret4 != H_SUCCESS) {
  661. netdev_err(dev, "unable to change IPv4 checksum "
  662. "offload settings. %d rc=%ld\n",
  663. data, ret4);
  664. h_illan_attributes(adapter->vdev->unit_address,
  665. set_attr, clr_attr, &ret_attr);
  666. if (data == 1)
  667. dev->features &= ~NETIF_F_IP_CSUM;
  668. } else {
  669. adapter->fw_ipv4_csum_support = data;
  670. }
  671. ret6 = h_illan_attributes(adapter->vdev->unit_address,
  672. clr_attr6, set_attr6, &ret_attr);
  673. if (ret6 != H_SUCCESS) {
  674. netdev_err(dev, "unable to change IPv6 checksum "
  675. "offload settings. %d rc=%ld\n",
  676. data, ret6);
  677. h_illan_attributes(adapter->vdev->unit_address,
  678. set_attr6, clr_attr6, &ret_attr);
  679. if (data == 1)
  680. dev->features &= ~NETIF_F_IPV6_CSUM;
  681. } else
  682. adapter->fw_ipv6_csum_support = data;
  683. if (ret4 == H_SUCCESS || ret6 == H_SUCCESS)
  684. adapter->rx_csum = data;
  685. else
  686. rc1 = -EIO;
  687. } else {
  688. rc1 = -EIO;
  689. netdev_err(dev, "unable to change checksum offload settings."
  690. " %d rc=%ld ret_attr=%lx\n", data, ret,
  691. ret_attr);
  692. }
  693. if (restart)
  694. rc2 = ibmveth_open(dev);
  695. return rc1 ? rc1 : rc2;
  696. }
  697. static int ibmveth_set_tso(struct net_device *dev, u32 data)
  698. {
  699. struct ibmveth_adapter *adapter = netdev_priv(dev);
  700. unsigned long set_attr, clr_attr, ret_attr;
  701. long ret1, ret2;
  702. int rc1 = 0, rc2 = 0;
  703. int restart = 0;
  704. if (netif_running(dev)) {
  705. restart = 1;
  706. adapter->pool_config = 1;
  707. ibmveth_close(dev);
  708. adapter->pool_config = 0;
  709. }
  710. set_attr = 0;
  711. clr_attr = 0;
  712. if (data)
  713. set_attr = IBMVETH_ILLAN_LRG_SR_ENABLED;
  714. else
  715. clr_attr = IBMVETH_ILLAN_LRG_SR_ENABLED;
  716. ret1 = h_illan_attributes(adapter->vdev->unit_address, 0, 0, &ret_attr);
  717. if (ret1 == H_SUCCESS && (ret_attr & IBMVETH_ILLAN_LRG_SND_SUPPORT) &&
  718. !old_large_send) {
  719. ret2 = h_illan_attributes(adapter->vdev->unit_address, clr_attr,
  720. set_attr, &ret_attr);
  721. if (ret2 != H_SUCCESS) {
  722. netdev_err(dev, "unable to change tso settings. %d rc=%ld\n",
  723. data, ret2);
  724. h_illan_attributes(adapter->vdev->unit_address,
  725. set_attr, clr_attr, &ret_attr);
  726. if (data == 1)
  727. dev->features &= ~(NETIF_F_TSO | NETIF_F_TSO6);
  728. rc1 = -EIO;
  729. } else {
  730. adapter->fw_large_send_support = data;
  731. adapter->large_send = data;
  732. }
  733. } else {
  734. /* Older firmware version of large send offload does not
  735. * support tcp6/ipv6
  736. */
  737. if (data == 1) {
  738. dev->features &= ~NETIF_F_TSO6;
  739. netdev_info(dev, "TSO feature requires all partitions to have updated driver");
  740. }
  741. adapter->large_send = data;
  742. }
  743. if (restart)
  744. rc2 = ibmveth_open(dev);
  745. return rc1 ? rc1 : rc2;
  746. }
  747. static int ibmveth_set_features(struct net_device *dev,
  748. netdev_features_t features)
  749. {
  750. struct ibmveth_adapter *adapter = netdev_priv(dev);
  751. int rx_csum = !!(features & NETIF_F_RXCSUM);
  752. int large_send = !!(features & (NETIF_F_TSO | NETIF_F_TSO6));
  753. int rc1 = 0, rc2 = 0;
  754. if (rx_csum != adapter->rx_csum) {
  755. rc1 = ibmveth_set_csum_offload(dev, rx_csum);
  756. if (rc1 && !adapter->rx_csum)
  757. dev->features =
  758. features & ~(NETIF_F_CSUM_MASK |
  759. NETIF_F_RXCSUM);
  760. }
  761. if (large_send != adapter->large_send) {
  762. rc2 = ibmveth_set_tso(dev, large_send);
  763. if (rc2 && !adapter->large_send)
  764. dev->features =
  765. features & ~(NETIF_F_TSO | NETIF_F_TSO6);
  766. }
  767. return rc1 ? rc1 : rc2;
  768. }
  769. static void ibmveth_get_strings(struct net_device *dev, u32 stringset, u8 *data)
  770. {
  771. int i;
  772. if (stringset != ETH_SS_STATS)
  773. return;
  774. for (i = 0; i < ARRAY_SIZE(ibmveth_stats); i++, data += ETH_GSTRING_LEN)
  775. memcpy(data, ibmveth_stats[i].name, ETH_GSTRING_LEN);
  776. }
  777. static int ibmveth_get_sset_count(struct net_device *dev, int sset)
  778. {
  779. switch (sset) {
  780. case ETH_SS_STATS:
  781. return ARRAY_SIZE(ibmveth_stats);
  782. default:
  783. return -EOPNOTSUPP;
  784. }
  785. }
  786. static void ibmveth_get_ethtool_stats(struct net_device *dev,
  787. struct ethtool_stats *stats, u64 *data)
  788. {
  789. int i;
  790. struct ibmveth_adapter *adapter = netdev_priv(dev);
  791. for (i = 0; i < ARRAY_SIZE(ibmveth_stats); i++)
  792. data[i] = IBMVETH_GET_STAT(adapter, ibmveth_stats[i].offset);
  793. }
  794. static const struct ethtool_ops netdev_ethtool_ops = {
  795. .get_drvinfo = netdev_get_drvinfo,
  796. .get_link = ethtool_op_get_link,
  797. .get_strings = ibmveth_get_strings,
  798. .get_sset_count = ibmveth_get_sset_count,
  799. .get_ethtool_stats = ibmveth_get_ethtool_stats,
  800. .get_link_ksettings = netdev_get_link_ksettings,
  801. };
  802. static int ibmveth_ioctl(struct net_device *dev, struct ifreq *ifr, int cmd)
  803. {
  804. return -EOPNOTSUPP;
  805. }
  806. #define page_offset(v) ((unsigned long)(v) & ((1 << 12) - 1))
  807. static int ibmveth_send(struct ibmveth_adapter *adapter,
  808. union ibmveth_buf_desc *descs, unsigned long mss)
  809. {
  810. unsigned long correlator;
  811. unsigned int retry_count;
  812. unsigned long ret;
  813. /*
  814. * The retry count sets a maximum for the number of broadcast and
  815. * multicast destinations within the system.
  816. */
  817. retry_count = 1024;
  818. correlator = 0;
  819. do {
  820. ret = h_send_logical_lan(adapter->vdev->unit_address,
  821. descs[0].desc, descs[1].desc,
  822. descs[2].desc, descs[3].desc,
  823. descs[4].desc, descs[5].desc,
  824. correlator, &correlator, mss,
  825. adapter->fw_large_send_support);
  826. } while ((ret == H_BUSY) && (retry_count--));
  827. if (ret != H_SUCCESS && ret != H_DROPPED) {
  828. netdev_err(adapter->netdev, "tx: h_send_logical_lan failed "
  829. "with rc=%ld\n", ret);
  830. return 1;
  831. }
  832. return 0;
  833. }
  834. static netdev_tx_t ibmveth_start_xmit(struct sk_buff *skb,
  835. struct net_device *netdev)
  836. {
  837. struct ibmveth_adapter *adapter = netdev_priv(netdev);
  838. unsigned int desc_flags;
  839. union ibmveth_buf_desc descs[6];
  840. int last, i;
  841. int force_bounce = 0;
  842. dma_addr_t dma_addr;
  843. unsigned long mss = 0;
  844. /* veth doesn't handle frag_list, so linearize the skb.
  845. * When GRO is enabled SKB's can have frag_list.
  846. */
  847. if (adapter->is_active_trunk &&
  848. skb_has_frag_list(skb) && __skb_linearize(skb)) {
  849. netdev->stats.tx_dropped++;
  850. goto out;
  851. }
  852. /*
  853. * veth handles a maximum of 6 segments including the header, so
  854. * we have to linearize the skb if there are more than this.
  855. */
  856. if (skb_shinfo(skb)->nr_frags > 5 && __skb_linearize(skb)) {
  857. netdev->stats.tx_dropped++;
  858. goto out;
  859. }
  860. /* veth can't checksum offload UDP */
  861. if (skb->ip_summed == CHECKSUM_PARTIAL &&
  862. ((skb->protocol == htons(ETH_P_IP) &&
  863. ip_hdr(skb)->protocol != IPPROTO_TCP) ||
  864. (skb->protocol == htons(ETH_P_IPV6) &&
  865. ipv6_hdr(skb)->nexthdr != IPPROTO_TCP)) &&
  866. skb_checksum_help(skb)) {
  867. netdev_err(netdev, "tx: failed to checksum packet\n");
  868. netdev->stats.tx_dropped++;
  869. goto out;
  870. }
  871. desc_flags = IBMVETH_BUF_VALID;
  872. if (skb->ip_summed == CHECKSUM_PARTIAL) {
  873. unsigned char *buf = skb_transport_header(skb) +
  874. skb->csum_offset;
  875. desc_flags |= (IBMVETH_BUF_NO_CSUM | IBMVETH_BUF_CSUM_GOOD);
  876. /* Need to zero out the checksum */
  877. buf[0] = 0;
  878. buf[1] = 0;
  879. if (skb_is_gso(skb) && adapter->fw_large_send_support)
  880. desc_flags |= IBMVETH_BUF_LRG_SND;
  881. }
  882. retry_bounce:
  883. memset(descs, 0, sizeof(descs));
  884. /*
  885. * If a linear packet is below the rx threshold then
  886. * copy it into the static bounce buffer. This avoids the
  887. * cost of a TCE insert and remove.
  888. */
  889. if (force_bounce || (!skb_is_nonlinear(skb) &&
  890. (skb->len < tx_copybreak))) {
  891. skb_copy_from_linear_data(skb, adapter->bounce_buffer,
  892. skb->len);
  893. descs[0].fields.flags_len = desc_flags | skb->len;
  894. descs[0].fields.address = adapter->bounce_buffer_dma;
  895. if (ibmveth_send(adapter, descs, 0)) {
  896. adapter->tx_send_failed++;
  897. netdev->stats.tx_dropped++;
  898. } else {
  899. netdev->stats.tx_packets++;
  900. netdev->stats.tx_bytes += skb->len;
  901. }
  902. goto out;
  903. }
  904. /* Map the header */
  905. dma_addr = dma_map_single(&adapter->vdev->dev, skb->data,
  906. skb_headlen(skb), DMA_TO_DEVICE);
  907. if (dma_mapping_error(&adapter->vdev->dev, dma_addr))
  908. goto map_failed;
  909. descs[0].fields.flags_len = desc_flags | skb_headlen(skb);
  910. descs[0].fields.address = dma_addr;
  911. /* Map the frags */
  912. for (i = 0; i < skb_shinfo(skb)->nr_frags; i++) {
  913. const skb_frag_t *frag = &skb_shinfo(skb)->frags[i];
  914. dma_addr = skb_frag_dma_map(&adapter->vdev->dev, frag, 0,
  915. skb_frag_size(frag), DMA_TO_DEVICE);
  916. if (dma_mapping_error(&adapter->vdev->dev, dma_addr))
  917. goto map_failed_frags;
  918. descs[i+1].fields.flags_len = desc_flags | skb_frag_size(frag);
  919. descs[i+1].fields.address = dma_addr;
  920. }
  921. if (skb->ip_summed == CHECKSUM_PARTIAL && skb_is_gso(skb)) {
  922. if (adapter->fw_large_send_support) {
  923. mss = (unsigned long)skb_shinfo(skb)->gso_size;
  924. adapter->tx_large_packets++;
  925. } else if (!skb_is_gso_v6(skb)) {
  926. /* Put -1 in the IP checksum to tell phyp it
  927. * is a largesend packet. Put the mss in
  928. * the TCP checksum.
  929. */
  930. ip_hdr(skb)->check = 0xffff;
  931. tcp_hdr(skb)->check =
  932. cpu_to_be16(skb_shinfo(skb)->gso_size);
  933. adapter->tx_large_packets++;
  934. }
  935. }
  936. if (ibmveth_send(adapter, descs, mss)) {
  937. adapter->tx_send_failed++;
  938. netdev->stats.tx_dropped++;
  939. } else {
  940. netdev->stats.tx_packets++;
  941. netdev->stats.tx_bytes += skb->len;
  942. }
  943. dma_unmap_single(&adapter->vdev->dev,
  944. descs[0].fields.address,
  945. descs[0].fields.flags_len & IBMVETH_BUF_LEN_MASK,
  946. DMA_TO_DEVICE);
  947. for (i = 1; i < skb_shinfo(skb)->nr_frags + 1; i++)
  948. dma_unmap_page(&adapter->vdev->dev, descs[i].fields.address,
  949. descs[i].fields.flags_len & IBMVETH_BUF_LEN_MASK,
  950. DMA_TO_DEVICE);
  951. out:
  952. dev_consume_skb_any(skb);
  953. return NETDEV_TX_OK;
  954. map_failed_frags:
  955. last = i+1;
  956. for (i = 1; i < last; i++)
  957. dma_unmap_page(&adapter->vdev->dev, descs[i].fields.address,
  958. descs[i].fields.flags_len & IBMVETH_BUF_LEN_MASK,
  959. DMA_TO_DEVICE);
  960. dma_unmap_single(&adapter->vdev->dev,
  961. descs[0].fields.address,
  962. descs[0].fields.flags_len & IBMVETH_BUF_LEN_MASK,
  963. DMA_TO_DEVICE);
  964. map_failed:
  965. if (!firmware_has_feature(FW_FEATURE_CMO))
  966. netdev_err(netdev, "tx: unable to map xmit buffer\n");
  967. adapter->tx_map_failed++;
  968. if (skb_linearize(skb)) {
  969. netdev->stats.tx_dropped++;
  970. goto out;
  971. }
  972. force_bounce = 1;
  973. goto retry_bounce;
  974. }
  975. static void ibmveth_rx_mss_helper(struct sk_buff *skb, u16 mss, int lrg_pkt)
  976. {
  977. struct tcphdr *tcph;
  978. int offset = 0;
  979. int hdr_len;
  980. /* only TCP packets will be aggregated */
  981. if (skb->protocol == htons(ETH_P_IP)) {
  982. struct iphdr *iph = (struct iphdr *)skb->data;
  983. if (iph->protocol == IPPROTO_TCP) {
  984. offset = iph->ihl * 4;
  985. skb_shinfo(skb)->gso_type = SKB_GSO_TCPV4;
  986. } else {
  987. return;
  988. }
  989. } else if (skb->protocol == htons(ETH_P_IPV6)) {
  990. struct ipv6hdr *iph6 = (struct ipv6hdr *)skb->data;
  991. if (iph6->nexthdr == IPPROTO_TCP) {
  992. offset = sizeof(struct ipv6hdr);
  993. skb_shinfo(skb)->gso_type = SKB_GSO_TCPV6;
  994. } else {
  995. return;
  996. }
  997. } else {
  998. return;
  999. }
  1000. /* if mss is not set through Large Packet bit/mss in rx buffer,
  1001. * expect that the mss will be written to the tcp header checksum.
  1002. */
  1003. tcph = (struct tcphdr *)(skb->data + offset);
  1004. if (lrg_pkt) {
  1005. skb_shinfo(skb)->gso_size = mss;
  1006. } else if (offset) {
  1007. skb_shinfo(skb)->gso_size = ntohs(tcph->check);
  1008. tcph->check = 0;
  1009. }
  1010. if (skb_shinfo(skb)->gso_size) {
  1011. hdr_len = offset + tcph->doff * 4;
  1012. skb_shinfo(skb)->gso_segs =
  1013. DIV_ROUND_UP(skb->len - hdr_len,
  1014. skb_shinfo(skb)->gso_size);
  1015. }
  1016. }
  1017. static void ibmveth_rx_csum_helper(struct sk_buff *skb,
  1018. struct ibmveth_adapter *adapter)
  1019. {
  1020. struct iphdr *iph = NULL;
  1021. struct ipv6hdr *iph6 = NULL;
  1022. __be16 skb_proto = 0;
  1023. u16 iphlen = 0;
  1024. u16 iph_proto = 0;
  1025. u16 tcphdrlen = 0;
  1026. skb_proto = be16_to_cpu(skb->protocol);
  1027. if (skb_proto == ETH_P_IP) {
  1028. iph = (struct iphdr *)skb->data;
  1029. /* If the IP checksum is not offloaded and if the packet
  1030. * is large send, the checksum must be rebuilt.
  1031. */
  1032. if (iph->check == 0xffff) {
  1033. iph->check = 0;
  1034. iph->check = ip_fast_csum((unsigned char *)iph,
  1035. iph->ihl);
  1036. }
  1037. iphlen = iph->ihl * 4;
  1038. iph_proto = iph->protocol;
  1039. } else if (skb_proto == ETH_P_IPV6) {
  1040. iph6 = (struct ipv6hdr *)skb->data;
  1041. iphlen = sizeof(struct ipv6hdr);
  1042. iph_proto = iph6->nexthdr;
  1043. }
  1044. /* In OVS environment, when a flow is not cached, specifically for a
  1045. * new TCP connection, the first packet information is passed up
  1046. * the user space for finding a flow. During this process, OVS computes
  1047. * checksum on the first packet when CHECKSUM_PARTIAL flag is set.
  1048. *
  1049. * Given that we zeroed out TCP checksum field in transmit path
  1050. * (refer ibmveth_start_xmit routine) as we set "no checksum bit",
  1051. * OVS computed checksum will be incorrect w/o TCP pseudo checksum
  1052. * in the packet. This leads to OVS dropping the packet and hence
  1053. * TCP retransmissions are seen.
  1054. *
  1055. * So, re-compute TCP pseudo header checksum.
  1056. */
  1057. if (iph_proto == IPPROTO_TCP && adapter->is_active_trunk) {
  1058. struct tcphdr *tcph = (struct tcphdr *)(skb->data + iphlen);
  1059. tcphdrlen = skb->len - iphlen;
  1060. /* Recompute TCP pseudo header checksum */
  1061. if (skb_proto == ETH_P_IP)
  1062. tcph->check = ~csum_tcpudp_magic(iph->saddr,
  1063. iph->daddr, tcphdrlen, iph_proto, 0);
  1064. else if (skb_proto == ETH_P_IPV6)
  1065. tcph->check = ~csum_ipv6_magic(&iph6->saddr,
  1066. &iph6->daddr, tcphdrlen, iph_proto, 0);
  1067. /* Setup SKB fields for checksum offload */
  1068. skb_partial_csum_set(skb, iphlen,
  1069. offsetof(struct tcphdr, check));
  1070. skb_reset_network_header(skb);
  1071. }
  1072. }
  1073. static int ibmveth_poll(struct napi_struct *napi, int budget)
  1074. {
  1075. struct ibmveth_adapter *adapter =
  1076. container_of(napi, struct ibmveth_adapter, napi);
  1077. struct net_device *netdev = adapter->netdev;
  1078. int frames_processed = 0;
  1079. unsigned long lpar_rc;
  1080. u16 mss = 0;
  1081. while (frames_processed < budget) {
  1082. if (!ibmveth_rxq_pending_buffer(adapter))
  1083. break;
  1084. smp_rmb();
  1085. if (!ibmveth_rxq_buffer_valid(adapter)) {
  1086. wmb(); /* suggested by larson1 */
  1087. adapter->rx_invalid_buffer++;
  1088. netdev_dbg(netdev, "recycling invalid buffer\n");
  1089. ibmveth_rxq_recycle_buffer(adapter);
  1090. } else {
  1091. struct sk_buff *skb, *new_skb;
  1092. int length = ibmveth_rxq_frame_length(adapter);
  1093. int offset = ibmveth_rxq_frame_offset(adapter);
  1094. int csum_good = ibmveth_rxq_csum_good(adapter);
  1095. int lrg_pkt = ibmveth_rxq_large_packet(adapter);
  1096. skb = ibmveth_rxq_get_buffer(adapter);
  1097. /* if the large packet bit is set in the rx queue
  1098. * descriptor, the mss will be written by PHYP eight
  1099. * bytes from the start of the rx buffer, which is
  1100. * skb->data at this stage
  1101. */
  1102. if (lrg_pkt) {
  1103. __be64 *rxmss = (__be64 *)(skb->data + 8);
  1104. mss = (u16)be64_to_cpu(*rxmss);
  1105. }
  1106. new_skb = NULL;
  1107. if (length < rx_copybreak)
  1108. new_skb = netdev_alloc_skb(netdev, length);
  1109. if (new_skb) {
  1110. skb_copy_to_linear_data(new_skb,
  1111. skb->data + offset,
  1112. length);
  1113. if (rx_flush)
  1114. ibmveth_flush_buffer(skb->data,
  1115. length + offset);
  1116. if (!ibmveth_rxq_recycle_buffer(adapter))
  1117. kfree_skb(skb);
  1118. skb = new_skb;
  1119. } else {
  1120. ibmveth_rxq_harvest_buffer(adapter);
  1121. skb_reserve(skb, offset);
  1122. }
  1123. skb_put(skb, length);
  1124. skb->protocol = eth_type_trans(skb, netdev);
  1125. if (csum_good) {
  1126. skb->ip_summed = CHECKSUM_UNNECESSARY;
  1127. ibmveth_rx_csum_helper(skb, adapter);
  1128. }
  1129. if (length > netdev->mtu + ETH_HLEN) {
  1130. ibmveth_rx_mss_helper(skb, mss, lrg_pkt);
  1131. adapter->rx_large_packets++;
  1132. }
  1133. napi_gro_receive(napi, skb); /* send it up */
  1134. netdev->stats.rx_packets++;
  1135. netdev->stats.rx_bytes += length;
  1136. frames_processed++;
  1137. }
  1138. }
  1139. ibmveth_replenish_task(adapter);
  1140. if (frames_processed < budget) {
  1141. napi_complete_done(napi, frames_processed);
  1142. /* We think we are done - reenable interrupts,
  1143. * then check once more to make sure we are done.
  1144. */
  1145. lpar_rc = h_vio_signal(adapter->vdev->unit_address,
  1146. VIO_IRQ_ENABLE);
  1147. BUG_ON(lpar_rc != H_SUCCESS);
  1148. if (ibmveth_rxq_pending_buffer(adapter) &&
  1149. napi_reschedule(napi)) {
  1150. lpar_rc = h_vio_signal(adapter->vdev->unit_address,
  1151. VIO_IRQ_DISABLE);
  1152. }
  1153. }
  1154. return frames_processed;
  1155. }
  1156. static irqreturn_t ibmveth_interrupt(int irq, void *dev_instance)
  1157. {
  1158. struct net_device *netdev = dev_instance;
  1159. struct ibmveth_adapter *adapter = netdev_priv(netdev);
  1160. unsigned long lpar_rc;
  1161. if (napi_schedule_prep(&adapter->napi)) {
  1162. lpar_rc = h_vio_signal(adapter->vdev->unit_address,
  1163. VIO_IRQ_DISABLE);
  1164. BUG_ON(lpar_rc != H_SUCCESS);
  1165. __napi_schedule(&adapter->napi);
  1166. }
  1167. return IRQ_HANDLED;
  1168. }
  1169. static void ibmveth_set_multicast_list(struct net_device *netdev)
  1170. {
  1171. struct ibmveth_adapter *adapter = netdev_priv(netdev);
  1172. unsigned long lpar_rc;
  1173. if ((netdev->flags & IFF_PROMISC) ||
  1174. (netdev_mc_count(netdev) > adapter->mcastFilterSize)) {
  1175. lpar_rc = h_multicast_ctrl(adapter->vdev->unit_address,
  1176. IbmVethMcastEnableRecv |
  1177. IbmVethMcastDisableFiltering,
  1178. 0);
  1179. if (lpar_rc != H_SUCCESS) {
  1180. netdev_err(netdev, "h_multicast_ctrl rc=%ld when "
  1181. "entering promisc mode\n", lpar_rc);
  1182. }
  1183. } else {
  1184. struct netdev_hw_addr *ha;
  1185. /* clear the filter table & disable filtering */
  1186. lpar_rc = h_multicast_ctrl(adapter->vdev->unit_address,
  1187. IbmVethMcastEnableRecv |
  1188. IbmVethMcastDisableFiltering |
  1189. IbmVethMcastClearFilterTable,
  1190. 0);
  1191. if (lpar_rc != H_SUCCESS) {
  1192. netdev_err(netdev, "h_multicast_ctrl rc=%ld when "
  1193. "attempting to clear filter table\n",
  1194. lpar_rc);
  1195. }
  1196. /* add the addresses to the filter table */
  1197. netdev_for_each_mc_addr(ha, netdev) {
  1198. /* add the multicast address to the filter table */
  1199. u64 mcast_addr;
  1200. mcast_addr = ibmveth_encode_mac_addr(ha->addr);
  1201. lpar_rc = h_multicast_ctrl(adapter->vdev->unit_address,
  1202. IbmVethMcastAddFilter,
  1203. mcast_addr);
  1204. if (lpar_rc != H_SUCCESS) {
  1205. netdev_err(netdev, "h_multicast_ctrl rc=%ld "
  1206. "when adding an entry to the filter "
  1207. "table\n", lpar_rc);
  1208. }
  1209. }
  1210. /* re-enable filtering */
  1211. lpar_rc = h_multicast_ctrl(adapter->vdev->unit_address,
  1212. IbmVethMcastEnableFiltering,
  1213. 0);
  1214. if (lpar_rc != H_SUCCESS) {
  1215. netdev_err(netdev, "h_multicast_ctrl rc=%ld when "
  1216. "enabling filtering\n", lpar_rc);
  1217. }
  1218. }
  1219. }
  1220. static int ibmveth_change_mtu(struct net_device *dev, int new_mtu)
  1221. {
  1222. struct ibmveth_adapter *adapter = netdev_priv(dev);
  1223. struct vio_dev *viodev = adapter->vdev;
  1224. int new_mtu_oh = new_mtu + IBMVETH_BUFF_OH;
  1225. int i, rc;
  1226. int need_restart = 0;
  1227. for (i = 0; i < IBMVETH_NUM_BUFF_POOLS; i++)
  1228. if (new_mtu_oh <= adapter->rx_buff_pool[i].buff_size)
  1229. break;
  1230. if (i == IBMVETH_NUM_BUFF_POOLS)
  1231. return -EINVAL;
  1232. /* Deactivate all the buffer pools so that the next loop can activate
  1233. only the buffer pools necessary to hold the new MTU */
  1234. if (netif_running(adapter->netdev)) {
  1235. need_restart = 1;
  1236. adapter->pool_config = 1;
  1237. ibmveth_close(adapter->netdev);
  1238. adapter->pool_config = 0;
  1239. }
  1240. /* Look for an active buffer pool that can hold the new MTU */
  1241. for (i = 0; i < IBMVETH_NUM_BUFF_POOLS; i++) {
  1242. adapter->rx_buff_pool[i].active = 1;
  1243. if (new_mtu_oh <= adapter->rx_buff_pool[i].buff_size) {
  1244. dev->mtu = new_mtu;
  1245. vio_cmo_set_dev_desired(viodev,
  1246. ibmveth_get_desired_dma
  1247. (viodev));
  1248. if (need_restart) {
  1249. return ibmveth_open(adapter->netdev);
  1250. }
  1251. return 0;
  1252. }
  1253. }
  1254. if (need_restart && (rc = ibmveth_open(adapter->netdev)))
  1255. return rc;
  1256. return -EINVAL;
  1257. }
  1258. #ifdef CONFIG_NET_POLL_CONTROLLER
  1259. static void ibmveth_poll_controller(struct net_device *dev)
  1260. {
  1261. ibmveth_replenish_task(netdev_priv(dev));
  1262. ibmveth_interrupt(dev->irq, dev);
  1263. }
  1264. #endif
  1265. /**
  1266. * ibmveth_get_desired_dma - Calculate IO memory desired by the driver
  1267. *
  1268. * @vdev: struct vio_dev for the device whose desired IO mem is to be returned
  1269. *
  1270. * Return value:
  1271. * Number of bytes of IO data the driver will need to perform well.
  1272. */
  1273. static unsigned long ibmveth_get_desired_dma(struct vio_dev *vdev)
  1274. {
  1275. struct net_device *netdev = dev_get_drvdata(&vdev->dev);
  1276. struct ibmveth_adapter *adapter;
  1277. struct iommu_table *tbl;
  1278. unsigned long ret;
  1279. int i;
  1280. int rxqentries = 1;
  1281. tbl = get_iommu_table_base(&vdev->dev);
  1282. /* netdev inits at probe time along with the structures we need below*/
  1283. if (netdev == NULL)
  1284. return IOMMU_PAGE_ALIGN(IBMVETH_IO_ENTITLEMENT_DEFAULT, tbl);
  1285. adapter = netdev_priv(netdev);
  1286. ret = IBMVETH_BUFF_LIST_SIZE + IBMVETH_FILT_LIST_SIZE;
  1287. ret += IOMMU_PAGE_ALIGN(netdev->mtu, tbl);
  1288. for (i = 0; i < IBMVETH_NUM_BUFF_POOLS; i++) {
  1289. /* add the size of the active receive buffers */
  1290. if (adapter->rx_buff_pool[i].active)
  1291. ret +=
  1292. adapter->rx_buff_pool[i].size *
  1293. IOMMU_PAGE_ALIGN(adapter->rx_buff_pool[i].
  1294. buff_size, tbl);
  1295. rxqentries += adapter->rx_buff_pool[i].size;
  1296. }
  1297. /* add the size of the receive queue entries */
  1298. ret += IOMMU_PAGE_ALIGN(
  1299. rxqentries * sizeof(struct ibmveth_rx_q_entry), tbl);
  1300. return ret;
  1301. }
  1302. static int ibmveth_set_mac_addr(struct net_device *dev, void *p)
  1303. {
  1304. struct ibmveth_adapter *adapter = netdev_priv(dev);
  1305. struct sockaddr *addr = p;
  1306. u64 mac_address;
  1307. int rc;
  1308. if (!is_valid_ether_addr(addr->sa_data))
  1309. return -EADDRNOTAVAIL;
  1310. mac_address = ibmveth_encode_mac_addr(addr->sa_data);
  1311. rc = h_change_logical_lan_mac(adapter->vdev->unit_address, mac_address);
  1312. if (rc) {
  1313. netdev_err(adapter->netdev, "h_change_logical_lan_mac failed with rc=%d\n", rc);
  1314. return rc;
  1315. }
  1316. ether_addr_copy(dev->dev_addr, addr->sa_data);
  1317. return 0;
  1318. }
  1319. static const struct net_device_ops ibmveth_netdev_ops = {
  1320. .ndo_open = ibmveth_open,
  1321. .ndo_stop = ibmveth_close,
  1322. .ndo_start_xmit = ibmveth_start_xmit,
  1323. .ndo_set_rx_mode = ibmveth_set_multicast_list,
  1324. .ndo_do_ioctl = ibmveth_ioctl,
  1325. .ndo_change_mtu = ibmveth_change_mtu,
  1326. .ndo_fix_features = ibmveth_fix_features,
  1327. .ndo_set_features = ibmveth_set_features,
  1328. .ndo_validate_addr = eth_validate_addr,
  1329. .ndo_set_mac_address = ibmveth_set_mac_addr,
  1330. #ifdef CONFIG_NET_POLL_CONTROLLER
  1331. .ndo_poll_controller = ibmveth_poll_controller,
  1332. #endif
  1333. };
  1334. static int ibmveth_probe(struct vio_dev *dev, const struct vio_device_id *id)
  1335. {
  1336. int rc, i, mac_len;
  1337. struct net_device *netdev;
  1338. struct ibmveth_adapter *adapter;
  1339. unsigned char *mac_addr_p;
  1340. __be32 *mcastFilterSize_p;
  1341. long ret;
  1342. unsigned long ret_attr;
  1343. dev_dbg(&dev->dev, "entering ibmveth_probe for UA 0x%x\n",
  1344. dev->unit_address);
  1345. mac_addr_p = (unsigned char *)vio_get_attribute(dev, VETH_MAC_ADDR,
  1346. &mac_len);
  1347. if (!mac_addr_p) {
  1348. dev_err(&dev->dev, "Can't find VETH_MAC_ADDR attribute\n");
  1349. return -EINVAL;
  1350. }
  1351. /* Workaround for old/broken pHyp */
  1352. if (mac_len == 8)
  1353. mac_addr_p += 2;
  1354. else if (mac_len != 6) {
  1355. dev_err(&dev->dev, "VETH_MAC_ADDR attribute wrong len %d\n",
  1356. mac_len);
  1357. return -EINVAL;
  1358. }
  1359. mcastFilterSize_p = (__be32 *)vio_get_attribute(dev,
  1360. VETH_MCAST_FILTER_SIZE,
  1361. NULL);
  1362. if (!mcastFilterSize_p) {
  1363. dev_err(&dev->dev, "Can't find VETH_MCAST_FILTER_SIZE "
  1364. "attribute\n");
  1365. return -EINVAL;
  1366. }
  1367. netdev = alloc_etherdev(sizeof(struct ibmveth_adapter));
  1368. if (!netdev)
  1369. return -ENOMEM;
  1370. adapter = netdev_priv(netdev);
  1371. dev_set_drvdata(&dev->dev, netdev);
  1372. adapter->vdev = dev;
  1373. adapter->netdev = netdev;
  1374. adapter->mcastFilterSize = be32_to_cpu(*mcastFilterSize_p);
  1375. adapter->pool_config = 0;
  1376. netif_napi_add(netdev, &adapter->napi, ibmveth_poll, 16);
  1377. netdev->irq = dev->irq;
  1378. netdev->netdev_ops = &ibmveth_netdev_ops;
  1379. netdev->ethtool_ops = &netdev_ethtool_ops;
  1380. SET_NETDEV_DEV(netdev, &dev->dev);
  1381. netdev->hw_features = NETIF_F_SG;
  1382. if (vio_get_attribute(dev, "ibm,illan-options", NULL) != NULL) {
  1383. netdev->hw_features |= NETIF_F_IP_CSUM | NETIF_F_IPV6_CSUM |
  1384. NETIF_F_RXCSUM;
  1385. }
  1386. netdev->features |= netdev->hw_features;
  1387. ret = h_illan_attributes(adapter->vdev->unit_address, 0, 0, &ret_attr);
  1388. /* If running older firmware, TSO should not be enabled by default */
  1389. if (ret == H_SUCCESS && (ret_attr & IBMVETH_ILLAN_LRG_SND_SUPPORT) &&
  1390. !old_large_send) {
  1391. netdev->hw_features |= NETIF_F_TSO | NETIF_F_TSO6;
  1392. netdev->features |= netdev->hw_features;
  1393. } else {
  1394. netdev->hw_features |= NETIF_F_TSO;
  1395. }
  1396. adapter->is_active_trunk = false;
  1397. if (ret == H_SUCCESS && (ret_attr & IBMVETH_ILLAN_ACTIVE_TRUNK)) {
  1398. adapter->is_active_trunk = true;
  1399. netdev->hw_features |= NETIF_F_FRAGLIST;
  1400. netdev->features |= NETIF_F_FRAGLIST;
  1401. }
  1402. netdev->min_mtu = IBMVETH_MIN_MTU;
  1403. netdev->max_mtu = ETH_MAX_MTU;
  1404. memcpy(netdev->dev_addr, mac_addr_p, ETH_ALEN);
  1405. if (firmware_has_feature(FW_FEATURE_CMO))
  1406. memcpy(pool_count, pool_count_cmo, sizeof(pool_count));
  1407. for (i = 0; i < IBMVETH_NUM_BUFF_POOLS; i++) {
  1408. struct kobject *kobj = &adapter->rx_buff_pool[i].kobj;
  1409. int error;
  1410. ibmveth_init_buffer_pool(&adapter->rx_buff_pool[i], i,
  1411. pool_count[i], pool_size[i],
  1412. pool_active[i]);
  1413. error = kobject_init_and_add(kobj, &ktype_veth_pool,
  1414. &dev->dev.kobj, "pool%d", i);
  1415. if (!error)
  1416. kobject_uevent(kobj, KOBJ_ADD);
  1417. }
  1418. netdev_dbg(netdev, "adapter @ 0x%p\n", adapter);
  1419. netdev_dbg(netdev, "registering netdev...\n");
  1420. ibmveth_set_features(netdev, netdev->features);
  1421. rc = register_netdev(netdev);
  1422. if (rc) {
  1423. netdev_dbg(netdev, "failed to register netdev rc=%d\n", rc);
  1424. free_netdev(netdev);
  1425. return rc;
  1426. }
  1427. netdev_dbg(netdev, "registered\n");
  1428. return 0;
  1429. }
  1430. static int ibmveth_remove(struct vio_dev *dev)
  1431. {
  1432. struct net_device *netdev = dev_get_drvdata(&dev->dev);
  1433. struct ibmveth_adapter *adapter = netdev_priv(netdev);
  1434. int i;
  1435. for (i = 0; i < IBMVETH_NUM_BUFF_POOLS; i++)
  1436. kobject_put(&adapter->rx_buff_pool[i].kobj);
  1437. unregister_netdev(netdev);
  1438. free_netdev(netdev);
  1439. dev_set_drvdata(&dev->dev, NULL);
  1440. return 0;
  1441. }
  1442. static struct attribute veth_active_attr;
  1443. static struct attribute veth_num_attr;
  1444. static struct attribute veth_size_attr;
  1445. static ssize_t veth_pool_show(struct kobject *kobj,
  1446. struct attribute *attr, char *buf)
  1447. {
  1448. struct ibmveth_buff_pool *pool = container_of(kobj,
  1449. struct ibmveth_buff_pool,
  1450. kobj);
  1451. if (attr == &veth_active_attr)
  1452. return sprintf(buf, "%d\n", pool->active);
  1453. else if (attr == &veth_num_attr)
  1454. return sprintf(buf, "%d\n", pool->size);
  1455. else if (attr == &veth_size_attr)
  1456. return sprintf(buf, "%d\n", pool->buff_size);
  1457. return 0;
  1458. }
  1459. static ssize_t veth_pool_store(struct kobject *kobj, struct attribute *attr,
  1460. const char *buf, size_t count)
  1461. {
  1462. struct ibmveth_buff_pool *pool = container_of(kobj,
  1463. struct ibmveth_buff_pool,
  1464. kobj);
  1465. struct net_device *netdev = dev_get_drvdata(
  1466. container_of(kobj->parent, struct device, kobj));
  1467. struct ibmveth_adapter *adapter = netdev_priv(netdev);
  1468. long value = simple_strtol(buf, NULL, 10);
  1469. long rc;
  1470. if (attr == &veth_active_attr) {
  1471. if (value && !pool->active) {
  1472. if (netif_running(netdev)) {
  1473. if (ibmveth_alloc_buffer_pool(pool)) {
  1474. netdev_err(netdev,
  1475. "unable to alloc pool\n");
  1476. return -ENOMEM;
  1477. }
  1478. pool->active = 1;
  1479. adapter->pool_config = 1;
  1480. ibmveth_close(netdev);
  1481. adapter->pool_config = 0;
  1482. if ((rc = ibmveth_open(netdev)))
  1483. return rc;
  1484. } else {
  1485. pool->active = 1;
  1486. }
  1487. } else if (!value && pool->active) {
  1488. int mtu = netdev->mtu + IBMVETH_BUFF_OH;
  1489. int i;
  1490. /* Make sure there is a buffer pool with buffers that
  1491. can hold a packet of the size of the MTU */
  1492. for (i = 0; i < IBMVETH_NUM_BUFF_POOLS; i++) {
  1493. if (pool == &adapter->rx_buff_pool[i])
  1494. continue;
  1495. if (!adapter->rx_buff_pool[i].active)
  1496. continue;
  1497. if (mtu <= adapter->rx_buff_pool[i].buff_size)
  1498. break;
  1499. }
  1500. if (i == IBMVETH_NUM_BUFF_POOLS) {
  1501. netdev_err(netdev, "no active pool >= MTU\n");
  1502. return -EPERM;
  1503. }
  1504. if (netif_running(netdev)) {
  1505. adapter->pool_config = 1;
  1506. ibmveth_close(netdev);
  1507. pool->active = 0;
  1508. adapter->pool_config = 0;
  1509. if ((rc = ibmveth_open(netdev)))
  1510. return rc;
  1511. }
  1512. pool->active = 0;
  1513. }
  1514. } else if (attr == &veth_num_attr) {
  1515. if (value <= 0 || value > IBMVETH_MAX_POOL_COUNT) {
  1516. return -EINVAL;
  1517. } else {
  1518. if (netif_running(netdev)) {
  1519. adapter->pool_config = 1;
  1520. ibmveth_close(netdev);
  1521. adapter->pool_config = 0;
  1522. pool->size = value;
  1523. if ((rc = ibmveth_open(netdev)))
  1524. return rc;
  1525. } else {
  1526. pool->size = value;
  1527. }
  1528. }
  1529. } else if (attr == &veth_size_attr) {
  1530. if (value <= IBMVETH_BUFF_OH || value > IBMVETH_MAX_BUF_SIZE) {
  1531. return -EINVAL;
  1532. } else {
  1533. if (netif_running(netdev)) {
  1534. adapter->pool_config = 1;
  1535. ibmveth_close(netdev);
  1536. adapter->pool_config = 0;
  1537. pool->buff_size = value;
  1538. if ((rc = ibmveth_open(netdev)))
  1539. return rc;
  1540. } else {
  1541. pool->buff_size = value;
  1542. }
  1543. }
  1544. }
  1545. /* kick the interrupt handler to allocate/deallocate pools */
  1546. ibmveth_interrupt(netdev->irq, netdev);
  1547. return count;
  1548. }
  1549. #define ATTR(_name, _mode) \
  1550. struct attribute veth_##_name##_attr = { \
  1551. .name = __stringify(_name), .mode = _mode, \
  1552. };
  1553. static ATTR(active, 0644);
  1554. static ATTR(num, 0644);
  1555. static ATTR(size, 0644);
  1556. static struct attribute *veth_pool_attrs[] = {
  1557. &veth_active_attr,
  1558. &veth_num_attr,
  1559. &veth_size_attr,
  1560. NULL,
  1561. };
  1562. static const struct sysfs_ops veth_pool_ops = {
  1563. .show = veth_pool_show,
  1564. .store = veth_pool_store,
  1565. };
  1566. static struct kobj_type ktype_veth_pool = {
  1567. .release = NULL,
  1568. .sysfs_ops = &veth_pool_ops,
  1569. .default_attrs = veth_pool_attrs,
  1570. };
  1571. static int ibmveth_resume(struct device *dev)
  1572. {
  1573. struct net_device *netdev = dev_get_drvdata(dev);
  1574. ibmveth_interrupt(netdev->irq, netdev);
  1575. return 0;
  1576. }
  1577. static const struct vio_device_id ibmveth_device_table[] = {
  1578. { "network", "IBM,l-lan"},
  1579. { "", "" }
  1580. };
  1581. MODULE_DEVICE_TABLE(vio, ibmveth_device_table);
  1582. static const struct dev_pm_ops ibmveth_pm_ops = {
  1583. .resume = ibmveth_resume
  1584. };
  1585. static struct vio_driver ibmveth_driver = {
  1586. .id_table = ibmveth_device_table,
  1587. .probe = ibmveth_probe,
  1588. .remove = ibmveth_remove,
  1589. .get_desired_dma = ibmveth_get_desired_dma,
  1590. .name = ibmveth_driver_name,
  1591. .pm = &ibmveth_pm_ops,
  1592. };
  1593. static int __init ibmveth_module_init(void)
  1594. {
  1595. printk(KERN_DEBUG "%s: %s %s\n", ibmveth_driver_name,
  1596. ibmveth_driver_string, ibmveth_driver_version);
  1597. return vio_register_driver(&ibmveth_driver);
  1598. }
  1599. static void __exit ibmveth_module_exit(void)
  1600. {
  1601. vio_unregister_driver(&ibmveth_driver);
  1602. }
  1603. module_init(ibmveth_module_init);
  1604. module_exit(ibmveth_module_exit);