ibmveth.c 61 KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241242243244245246247248249250251252253254255256257258259260261262263264265266267268269270271272273274275276277278279280281282283284285286287288289290291292293294295296297298299300301302303304305306307308309310311312313314315316317318319320321322323324325326327328329330331332333334335336337338339340341342343344345346347348349350351352353354355356357358359360361362363364365366367368369370371372373374375376377378379380381382383384385386387388389390391392393394395396397398399400401402403404405406407408409410411412413414415416417418419420421422423424425426427428429430431432433434435436437438439440441442443444445446447448449450451452453454455456457458459460461462463464465466467468469470471472473474475476477478479480481482483484485486487488489490491492493494495496497498499500501502503504505506507508509510511512513514515516517518519520521522523524525526527528529530531532533534535536537538539540541542543544545546547548549550551552553554555556557558559560561562563564565566567568569570571572573574575576577578579580581582583584585586587588589590591592593594595596597598599600601602603604605606607608609610611612613614615616617618619620621622623624625626627628629630631632633634635636637638639640641642643644645646647648649650651652653654655656657658659660661662663664665666667668669670671672673674675676677678679680681682683684685686687688689690691692693694695696697698699700701702703704705706707708709710711712713714715716717718719720721722723724725726727728729730731732733734735736737738739740741742743744745746747748749750751752753754755756757758759760761762763764765766767768769770771772773774775776777778779780781782783784785786787788789790791792793794795796797798799800801802803804805806807808809810811812813814815816817818819820821822823824825826827828829830831832833834835836837838839840841842843844845846847848849850851852853854855856857858859860861862863864865866867868869870871872873874875876877878879880881882883884885886887888889890891892893894895896897898899900901902903904905906907908909910911912913914915916917918919920921922923924925926927928929930931932933934935936937938939940941942943944945946947948949950951952953954955956957958959960961962963964965966967968969970971972973974975976977978979980981982983984985986987988989990991992993994995996997998999100010011002100310041005100610071008100910101011101210131014101510161017101810191020102110221023102410251026102710281029103010311032103310341035103610371038103910401041104210431044104510461047104810491050105110521053105410551056105710581059106010611062106310641065106610671068106910701071107210731074107510761077107810791080108110821083108410851086108710881089109010911092109310941095109610971098109911001101110211031104110511061107110811091110111111121113111411151116111711181119112011211122112311241125112611271128112911301131113211331134113511361137113811391140114111421143114411451146114711481149115011511152115311541155115611571158115911601161116211631164116511661167116811691170117111721173117411751176117711781179118011811182118311841185118611871188118911901191119211931194119511961197119811991200120112021203120412051206120712081209121012111212121312141215121612171218121912201221122212231224122512261227122812291230123112321233123412351236123712381239124012411242124312441245124612471248124912501251125212531254125512561257125812591260126112621263126412651266126712681269127012711272127312741275127612771278127912801281128212831284128512861287128812891290129112921293129412951296129712981299130013011302130313041305130613071308130913101311131213131314131513161317131813191320132113221323132413251326132713281329133013311332133313341335133613371338133913401341134213431344134513461347134813491350135113521353135413551356135713581359136013611362136313641365136613671368136913701371137213731374137513761377137813791380138113821383138413851386138713881389139013911392139313941395139613971398139914001401140214031404140514061407140814091410141114121413141414151416141714181419142014211422142314241425142614271428142914301431143214331434143514361437143814391440144114421443144414451446144714481449145014511452145314541455145614571458145914601461146214631464146514661467146814691470147114721473147414751476147714781479148014811482148314841485148614871488148914901491149214931494149514961497149814991500150115021503150415051506150715081509151015111512151315141515151615171518151915201521152215231524152515261527152815291530153115321533153415351536153715381539154015411542154315441545154615471548154915501551155215531554155515561557155815591560156115621563156415651566156715681569157015711572157315741575157615771578157915801581158215831584158515861587158815891590159115921593159415951596159715981599160016011602160316041605160616071608160916101611161216131614161516161617161816191620162116221623162416251626162716281629163016311632163316341635163616371638163916401641164216431644164516461647164816491650165116521653165416551656165716581659166016611662166316641665166616671668166916701671167216731674167516761677167816791680168116821683168416851686168716881689169016911692169316941695169616971698169917001701170217031704170517061707170817091710171117121713171417151716171717181719172017211722172317241725172617271728172917301731173217331734173517361737173817391740174117421743174417451746174717481749175017511752175317541755175617571758175917601761176217631764176517661767176817691770177117721773177417751776177717781779178017811782178317841785178617871788178917901791179217931794179517961797179817991800180118021803180418051806180718081809181018111812181318141815181618171818181918201821182218231824182518261827182818291830183118321833183418351836183718381839184018411842184318441845184618471848184918501851185218531854185518561857185818591860186118621863186418651866186718681869187018711872187318741875187618771878187918801881188218831884188518861887188818891890189118921893189418951896189718981899190019011902190319041905190619071908190919101911191219131914191519161917191819191920192119221923192419251926192719281929193019311932193319341935193619371938193919401941194219431944194519461947194819491950195119521953195419551956195719581959196019611962196319641965196619671968196919701971197219731974197519761977197819791980198119821983198419851986198719881989199019911992199319941995199619971998199920002001200220032004200520062007200820092010201120122013201420152016201720182019202020212022202320242025202620272028202920302031203220332034203520362037203820392040204120422043204420452046204720482049205020512052205320542055205620572058205920602061206220632064206520662067206820692070207120722073207420752076207720782079208020812082208320842085208620872088208920902091209220932094209520962097209820992100210121022103210421052106210721082109211021112112211321142115211621172118211921202121212221232124212521262127212821292130213121322133213421352136213721382139214021412142214321442145214621472148214921502151215221532154215521562157215821592160216121622163216421652166216721682169217021712172217321742175217621772178217921802181218221832184218521862187218821892190219121922193219421952196219721982199220022012202220322042205220622072208220922102211221222132214221522162217221822192220222122222223222422252226222722282229223022312232223322342235223622372238223922402241224222432244224522462247224822492250225122522253225422552256225722582259226022612262226322642265226622672268226922702271227222732274227522762277227822792280
  1. // SPDX-License-Identifier: GPL-2.0-or-later
  2. /*
  3. * IBM Power Virtual Ethernet Device Driver
  4. *
  5. * Copyright (C) IBM Corporation, 2003, 2010
  6. *
  7. * Authors: Dave Larson <larson1@us.ibm.com>
  8. * Santiago Leon <santil@linux.vnet.ibm.com>
  9. * Brian King <brking@linux.vnet.ibm.com>
  10. * Robert Jennings <rcj@linux.vnet.ibm.com>
  11. * Anton Blanchard <anton@au.ibm.com>
  12. */
  13. #include <linux/module.h>
  14. #include <linux/types.h>
  15. #include <linux/errno.h>
  16. #include <linux/dma-mapping.h>
  17. #include <linux/kernel.h>
  18. #include <linux/netdevice.h>
  19. #include <linux/etherdevice.h>
  20. #include <linux/skbuff.h>
  21. #include <linux/init.h>
  22. #include <linux/interrupt.h>
  23. #include <linux/mm.h>
  24. #include <linux/pm.h>
  25. #include <linux/ethtool.h>
  26. #include <linux/in.h>
  27. #include <linux/ip.h>
  28. #include <linux/ipv6.h>
  29. #include <linux/slab.h>
  30. #include <asm/hvcall.h>
  31. #include <linux/atomic.h>
  32. #include <asm/vio.h>
  33. #include <asm/iommu.h>
  34. #include <asm/firmware.h>
  35. #include <net/tcp.h>
  36. #include <net/ip6_checksum.h>
  37. #include "ibmveth.h"
  38. static irqreturn_t ibmveth_interrupt(int irq, void *dev_instance);
  39. static unsigned long ibmveth_get_desired_dma(struct vio_dev *vdev);
  40. static struct kobj_type ktype_veth_pool;
  41. static const char ibmveth_driver_name[] = "ibmveth";
  42. static const char ibmveth_driver_string[] = "IBM Power Virtual Ethernet Driver";
  43. #define ibmveth_driver_version "1.06"
  44. MODULE_AUTHOR("Santiago Leon <santil@linux.vnet.ibm.com>");
  45. MODULE_DESCRIPTION("IBM Power Virtual Ethernet Driver");
  46. MODULE_LICENSE("GPL");
  47. MODULE_VERSION(ibmveth_driver_version);
  48. static unsigned int tx_copybreak __read_mostly = 128;
  49. module_param(tx_copybreak, uint, 0644);
  50. MODULE_PARM_DESC(tx_copybreak,
  51. "Maximum size of packet that is copied to a new buffer on transmit");
  52. static unsigned int rx_copybreak __read_mostly = 128;
  53. module_param(rx_copybreak, uint, 0644);
  54. MODULE_PARM_DESC(rx_copybreak,
  55. "Maximum size of packet that is copied to a new buffer on receive");
  56. static unsigned int rx_flush __read_mostly = 0;
  57. module_param(rx_flush, uint, 0644);
  58. MODULE_PARM_DESC(rx_flush, "Flush receive buffers before use");
  59. static bool old_large_send __read_mostly;
  60. module_param(old_large_send, bool, 0444);
  61. MODULE_PARM_DESC(old_large_send,
  62. "Use old large send method on firmware that supports the new method");
  63. struct ibmveth_stat {
  64. char name[ETH_GSTRING_LEN];
  65. int offset;
  66. };
  67. #define IBMVETH_STAT_OFF(stat) offsetof(struct ibmveth_adapter, stat)
  68. #define IBMVETH_GET_STAT(a, off) *((u64 *)(((unsigned long)(a)) + off))
  69. static struct ibmveth_stat ibmveth_stats[] = {
  70. { "replenish_task_cycles", IBMVETH_STAT_OFF(replenish_task_cycles) },
  71. { "replenish_no_mem", IBMVETH_STAT_OFF(replenish_no_mem) },
  72. { "replenish_add_buff_failure",
  73. IBMVETH_STAT_OFF(replenish_add_buff_failure) },
  74. { "replenish_add_buff_success",
  75. IBMVETH_STAT_OFF(replenish_add_buff_success) },
  76. { "rx_invalid_buffer", IBMVETH_STAT_OFF(rx_invalid_buffer) },
  77. { "rx_no_buffer", IBMVETH_STAT_OFF(rx_no_buffer) },
  78. { "tx_map_failed", IBMVETH_STAT_OFF(tx_map_failed) },
  79. { "tx_send_failed", IBMVETH_STAT_OFF(tx_send_failed) },
  80. { "fw_enabled_ipv4_csum", IBMVETH_STAT_OFF(fw_ipv4_csum_support) },
  81. { "fw_enabled_ipv6_csum", IBMVETH_STAT_OFF(fw_ipv6_csum_support) },
  82. { "tx_large_packets", IBMVETH_STAT_OFF(tx_large_packets) },
  83. { "rx_large_packets", IBMVETH_STAT_OFF(rx_large_packets) },
  84. { "fw_enabled_large_send", IBMVETH_STAT_OFF(fw_large_send_support) }
  85. };
  86. /* simple methods of getting data from the current rxq entry */
  87. static inline u32 ibmveth_rxq_flags(struct ibmveth_adapter *adapter)
  88. {
  89. return be32_to_cpu(adapter->rx_queue.queue_addr[adapter->rx_queue.index].flags_off);
  90. }
  91. static inline int ibmveth_rxq_toggle(struct ibmveth_adapter *adapter)
  92. {
  93. return (ibmveth_rxq_flags(adapter) & IBMVETH_RXQ_TOGGLE) >>
  94. IBMVETH_RXQ_TOGGLE_SHIFT;
  95. }
  96. static inline int ibmveth_rxq_pending_buffer(struct ibmveth_adapter *adapter)
  97. {
  98. return ibmveth_rxq_toggle(adapter) == adapter->rx_queue.toggle;
  99. }
  100. static inline int ibmveth_rxq_buffer_valid(struct ibmveth_adapter *adapter)
  101. {
  102. return ibmveth_rxq_flags(adapter) & IBMVETH_RXQ_VALID;
  103. }
  104. static inline int ibmveth_rxq_frame_offset(struct ibmveth_adapter *adapter)
  105. {
  106. return ibmveth_rxq_flags(adapter) & IBMVETH_RXQ_OFF_MASK;
  107. }
  108. static inline int ibmveth_rxq_large_packet(struct ibmveth_adapter *adapter)
  109. {
  110. return ibmveth_rxq_flags(adapter) & IBMVETH_RXQ_LRG_PKT;
  111. }
  112. static inline int ibmveth_rxq_frame_length(struct ibmveth_adapter *adapter)
  113. {
  114. return be32_to_cpu(adapter->rx_queue.queue_addr[adapter->rx_queue.index].length);
  115. }
  116. static inline int ibmveth_rxq_csum_good(struct ibmveth_adapter *adapter)
  117. {
  118. return ibmveth_rxq_flags(adapter) & IBMVETH_RXQ_CSUM_GOOD;
  119. }
  120. static unsigned int ibmveth_real_max_tx_queues(void)
  121. {
  122. unsigned int n_cpu = num_online_cpus();
  123. return min(n_cpu, IBMVETH_MAX_QUEUES);
  124. }
  125. /* setup the initial settings for a buffer pool */
  126. static void ibmveth_init_buffer_pool(struct ibmveth_buff_pool *pool,
  127. u32 pool_index, u32 pool_size,
  128. u32 buff_size, u32 pool_active)
  129. {
  130. pool->size = pool_size;
  131. pool->index = pool_index;
  132. pool->buff_size = buff_size;
  133. pool->threshold = pool_size * 7 / 8;
  134. pool->active = pool_active;
  135. }
  136. /* allocate and setup an buffer pool - called during open */
  137. static int ibmveth_alloc_buffer_pool(struct ibmveth_buff_pool *pool)
  138. {
  139. int i;
  140. pool->free_map = kmalloc_array(pool->size, sizeof(u16), GFP_KERNEL);
  141. if (!pool->free_map)
  142. return -1;
  143. pool->dma_addr = kzalloc_objs(dma_addr_t, pool->size);
  144. if (!pool->dma_addr) {
  145. kfree(pool->free_map);
  146. pool->free_map = NULL;
  147. return -1;
  148. }
  149. pool->skbuff = kcalloc(pool->size, sizeof(void *), GFP_KERNEL);
  150. if (!pool->skbuff) {
  151. kfree(pool->dma_addr);
  152. pool->dma_addr = NULL;
  153. kfree(pool->free_map);
  154. pool->free_map = NULL;
  155. return -1;
  156. }
  157. for (i = 0; i < pool->size; ++i)
  158. pool->free_map[i] = i;
  159. atomic_set(&pool->available, 0);
  160. pool->producer_index = 0;
  161. pool->consumer_index = 0;
  162. return 0;
  163. }
  164. static inline void ibmveth_flush_buffer(void *addr, unsigned long length)
  165. {
  166. unsigned long offset;
  167. for (offset = 0; offset < length; offset += SMP_CACHE_BYTES)
  168. asm("dcbf %0,%1,1" :: "b" (addr), "r" (offset));
  169. }
  170. /* replenish the buffers for a pool. note that we don't need to
  171. * skb_reserve these since they are used for incoming...
  172. */
  173. static void ibmveth_replenish_buffer_pool(struct ibmveth_adapter *adapter,
  174. struct ibmveth_buff_pool *pool)
  175. {
  176. union ibmveth_buf_desc descs[IBMVETH_MAX_RX_PER_HCALL] = {0};
  177. u32 remaining = pool->size - atomic_read(&pool->available);
  178. u64 correlators[IBMVETH_MAX_RX_PER_HCALL] = {0};
  179. unsigned long lpar_rc;
  180. u32 buffers_added = 0;
  181. u32 i, filled, batch;
  182. struct vio_dev *vdev;
  183. dma_addr_t dma_addr;
  184. struct device *dev;
  185. u32 index;
  186. vdev = adapter->vdev;
  187. dev = &vdev->dev;
  188. mb();
  189. batch = adapter->rx_buffers_per_hcall;
  190. while (remaining > 0) {
  191. unsigned int free_index = pool->consumer_index;
  192. /* Fill a batch of descriptors */
  193. for (filled = 0; filled < min(remaining, batch); filled++) {
  194. index = pool->free_map[free_index];
  195. if (WARN_ON(index == IBM_VETH_INVALID_MAP)) {
  196. adapter->replenish_add_buff_failure++;
  197. netdev_info(adapter->netdev,
  198. "Invalid map index %u, reset\n",
  199. index);
  200. schedule_work(&adapter->work);
  201. break;
  202. }
  203. if (!pool->skbuff[index]) {
  204. struct sk_buff *skb = NULL;
  205. skb = netdev_alloc_skb(adapter->netdev,
  206. pool->buff_size);
  207. if (!skb) {
  208. adapter->replenish_no_mem++;
  209. adapter->replenish_add_buff_failure++;
  210. break;
  211. }
  212. dma_addr = dma_map_single(dev, skb->data,
  213. pool->buff_size,
  214. DMA_FROM_DEVICE);
  215. if (dma_mapping_error(dev, dma_addr)) {
  216. dev_kfree_skb_any(skb);
  217. adapter->replenish_add_buff_failure++;
  218. break;
  219. }
  220. pool->dma_addr[index] = dma_addr;
  221. pool->skbuff[index] = skb;
  222. } else {
  223. /* re-use case */
  224. dma_addr = pool->dma_addr[index];
  225. }
  226. if (rx_flush) {
  227. unsigned int len;
  228. len = adapter->netdev->mtu + IBMVETH_BUFF_OH;
  229. len = min(pool->buff_size, len);
  230. ibmveth_flush_buffer(pool->skbuff[index]->data,
  231. len);
  232. }
  233. descs[filled].fields.flags_len = IBMVETH_BUF_VALID |
  234. pool->buff_size;
  235. descs[filled].fields.address = dma_addr;
  236. correlators[filled] = ((u64)pool->index << 32) | index;
  237. *(u64 *)pool->skbuff[index]->data = correlators[filled];
  238. free_index++;
  239. if (free_index >= pool->size)
  240. free_index = 0;
  241. }
  242. if (!filled)
  243. break;
  244. /* single buffer case*/
  245. if (filled == 1)
  246. lpar_rc = h_add_logical_lan_buffer(vdev->unit_address,
  247. descs[0].desc);
  248. else
  249. /* Multi-buffer hcall */
  250. lpar_rc = h_add_logical_lan_buffers(vdev->unit_address,
  251. descs[0].desc,
  252. descs[1].desc,
  253. descs[2].desc,
  254. descs[3].desc,
  255. descs[4].desc,
  256. descs[5].desc,
  257. descs[6].desc,
  258. descs[7].desc);
  259. if (lpar_rc != H_SUCCESS) {
  260. dev_warn_ratelimited(dev,
  261. "RX h_add_logical_lan failed: filled=%u, rc=%lu, batch=%u\n",
  262. filled, lpar_rc, batch);
  263. goto hcall_failure;
  264. }
  265. /* Only update pool state after hcall succeeds */
  266. for (i = 0; i < filled; i++) {
  267. free_index = pool->consumer_index;
  268. pool->free_map[free_index] = IBM_VETH_INVALID_MAP;
  269. pool->consumer_index++;
  270. if (pool->consumer_index >= pool->size)
  271. pool->consumer_index = 0;
  272. }
  273. buffers_added += filled;
  274. adapter->replenish_add_buff_success += filled;
  275. remaining -= filled;
  276. memset(&descs, 0, sizeof(descs));
  277. memset(&correlators, 0, sizeof(correlators));
  278. continue;
  279. hcall_failure:
  280. for (i = 0; i < filled; i++) {
  281. index = correlators[i] & 0xffffffffUL;
  282. dma_addr = pool->dma_addr[index];
  283. if (pool->skbuff[index]) {
  284. if (dma_addr &&
  285. !dma_mapping_error(dev, dma_addr))
  286. dma_unmap_single(dev, dma_addr,
  287. pool->buff_size,
  288. DMA_FROM_DEVICE);
  289. dev_kfree_skb_any(pool->skbuff[index]);
  290. pool->skbuff[index] = NULL;
  291. }
  292. }
  293. adapter->replenish_add_buff_failure += filled;
  294. /*
  295. * If multi rx buffers hcall is no longer supported by FW
  296. * e.g. in the case of Live Parttion Migration
  297. */
  298. if (batch > 1 && lpar_rc == H_FUNCTION) {
  299. /*
  300. * Instead of retry submit single buffer individually
  301. * here just set the max rx buffer per hcall to 1
  302. * buffers will be respleshed next time
  303. * when ibmveth_replenish_buffer_pool() is called again
  304. * with single-buffer case
  305. */
  306. netdev_info(adapter->netdev,
  307. "RX Multi buffers not supported by FW, rc=%lu\n",
  308. lpar_rc);
  309. adapter->rx_buffers_per_hcall = 1;
  310. netdev_info(adapter->netdev,
  311. "Next rx replesh will fall back to single-buffer hcall\n");
  312. }
  313. break;
  314. }
  315. mb();
  316. atomic_add(buffers_added, &(pool->available));
  317. }
  318. /*
  319. * The final 8 bytes of the buffer list is a counter of frames dropped
  320. * because there was not a buffer in the buffer list capable of holding
  321. * the frame.
  322. */
  323. static void ibmveth_update_rx_no_buffer(struct ibmveth_adapter *adapter)
  324. {
  325. __be64 *p = adapter->buffer_list_addr + 4096 - 8;
  326. adapter->rx_no_buffer = be64_to_cpup(p);
  327. }
  328. /* replenish routine */
  329. static void ibmveth_replenish_task(struct ibmveth_adapter *adapter)
  330. {
  331. int i;
  332. adapter->replenish_task_cycles++;
  333. for (i = (IBMVETH_NUM_BUFF_POOLS - 1); i >= 0; i--) {
  334. struct ibmveth_buff_pool *pool = &adapter->rx_buff_pool[i];
  335. if (pool->active &&
  336. (atomic_read(&pool->available) < pool->threshold))
  337. ibmveth_replenish_buffer_pool(adapter, pool);
  338. }
  339. ibmveth_update_rx_no_buffer(adapter);
  340. }
  341. /* empty and free ana buffer pool - also used to do cleanup in error paths */
  342. static void ibmveth_free_buffer_pool(struct ibmveth_adapter *adapter,
  343. struct ibmveth_buff_pool *pool)
  344. {
  345. int i;
  346. kfree(pool->free_map);
  347. pool->free_map = NULL;
  348. if (pool->skbuff && pool->dma_addr) {
  349. for (i = 0; i < pool->size; ++i) {
  350. struct sk_buff *skb = pool->skbuff[i];
  351. if (skb) {
  352. dma_unmap_single(&adapter->vdev->dev,
  353. pool->dma_addr[i],
  354. pool->buff_size,
  355. DMA_FROM_DEVICE);
  356. dev_kfree_skb_any(skb);
  357. pool->skbuff[i] = NULL;
  358. }
  359. }
  360. }
  361. if (pool->dma_addr) {
  362. kfree(pool->dma_addr);
  363. pool->dma_addr = NULL;
  364. }
  365. if (pool->skbuff) {
  366. kfree(pool->skbuff);
  367. pool->skbuff = NULL;
  368. }
  369. }
  370. /**
  371. * ibmveth_remove_buffer_from_pool - remove a buffer from a pool
  372. * @adapter: adapter instance
  373. * @correlator: identifies pool and index
  374. * @reuse: whether to reuse buffer
  375. *
  376. * Return:
  377. * * %0 - success
  378. * * %-EINVAL - correlator maps to pool or index out of range
  379. * * %-EFAULT - pool and index map to null skb
  380. */
  381. static int ibmveth_remove_buffer_from_pool(struct ibmveth_adapter *adapter,
  382. u64 correlator, bool reuse)
  383. {
  384. unsigned int pool = correlator >> 32;
  385. unsigned int index = correlator & 0xffffffffUL;
  386. unsigned int free_index;
  387. struct sk_buff *skb;
  388. if (WARN_ON(pool >= IBMVETH_NUM_BUFF_POOLS) ||
  389. WARN_ON(index >= adapter->rx_buff_pool[pool].size)) {
  390. schedule_work(&adapter->work);
  391. return -EINVAL;
  392. }
  393. skb = adapter->rx_buff_pool[pool].skbuff[index];
  394. if (WARN_ON(!skb)) {
  395. schedule_work(&adapter->work);
  396. return -EFAULT;
  397. }
  398. /* if we are going to reuse the buffer then keep the pointers around
  399. * but mark index as available. replenish will see the skb pointer and
  400. * assume it is to be recycled.
  401. */
  402. if (!reuse) {
  403. /* remove the skb pointer to mark free. actual freeing is done
  404. * by upper level networking after gro_recieve
  405. */
  406. adapter->rx_buff_pool[pool].skbuff[index] = NULL;
  407. dma_unmap_single(&adapter->vdev->dev,
  408. adapter->rx_buff_pool[pool].dma_addr[index],
  409. adapter->rx_buff_pool[pool].buff_size,
  410. DMA_FROM_DEVICE);
  411. }
  412. free_index = adapter->rx_buff_pool[pool].producer_index;
  413. adapter->rx_buff_pool[pool].producer_index++;
  414. if (adapter->rx_buff_pool[pool].producer_index >=
  415. adapter->rx_buff_pool[pool].size)
  416. adapter->rx_buff_pool[pool].producer_index = 0;
  417. adapter->rx_buff_pool[pool].free_map[free_index] = index;
  418. mb();
  419. atomic_dec(&(adapter->rx_buff_pool[pool].available));
  420. return 0;
  421. }
  422. /* get the current buffer on the rx queue */
  423. static inline struct sk_buff *ibmveth_rxq_get_buffer(struct ibmveth_adapter *adapter)
  424. {
  425. u64 correlator = adapter->rx_queue.queue_addr[adapter->rx_queue.index].correlator;
  426. unsigned int pool = correlator >> 32;
  427. unsigned int index = correlator & 0xffffffffUL;
  428. if (WARN_ON(pool >= IBMVETH_NUM_BUFF_POOLS) ||
  429. WARN_ON(index >= adapter->rx_buff_pool[pool].size)) {
  430. schedule_work(&adapter->work);
  431. return NULL;
  432. }
  433. return adapter->rx_buff_pool[pool].skbuff[index];
  434. }
  435. /**
  436. * ibmveth_rxq_harvest_buffer - Harvest buffer from pool
  437. *
  438. * @adapter: pointer to adapter
  439. * @reuse: whether to reuse buffer
  440. *
  441. * Context: called from ibmveth_poll
  442. *
  443. * Return:
  444. * * %0 - success
  445. * * other - non-zero return from ibmveth_remove_buffer_from_pool
  446. */
  447. static int ibmveth_rxq_harvest_buffer(struct ibmveth_adapter *adapter,
  448. bool reuse)
  449. {
  450. u64 cor;
  451. int rc;
  452. cor = adapter->rx_queue.queue_addr[adapter->rx_queue.index].correlator;
  453. rc = ibmveth_remove_buffer_from_pool(adapter, cor, reuse);
  454. if (unlikely(rc))
  455. return rc;
  456. if (++adapter->rx_queue.index == adapter->rx_queue.num_slots) {
  457. adapter->rx_queue.index = 0;
  458. adapter->rx_queue.toggle = !adapter->rx_queue.toggle;
  459. }
  460. return 0;
  461. }
  462. static void ibmveth_free_tx_ltb(struct ibmveth_adapter *adapter, int idx)
  463. {
  464. dma_unmap_single(&adapter->vdev->dev, adapter->tx_ltb_dma[idx],
  465. adapter->tx_ltb_size, DMA_TO_DEVICE);
  466. kfree(adapter->tx_ltb_ptr[idx]);
  467. adapter->tx_ltb_ptr[idx] = NULL;
  468. }
  469. static int ibmveth_allocate_tx_ltb(struct ibmveth_adapter *adapter, int idx)
  470. {
  471. adapter->tx_ltb_ptr[idx] = kzalloc(adapter->tx_ltb_size,
  472. GFP_KERNEL);
  473. if (!adapter->tx_ltb_ptr[idx]) {
  474. netdev_err(adapter->netdev,
  475. "unable to allocate tx long term buffer\n");
  476. return -ENOMEM;
  477. }
  478. adapter->tx_ltb_dma[idx] = dma_map_single(&adapter->vdev->dev,
  479. adapter->tx_ltb_ptr[idx],
  480. adapter->tx_ltb_size,
  481. DMA_TO_DEVICE);
  482. if (dma_mapping_error(&adapter->vdev->dev, adapter->tx_ltb_dma[idx])) {
  483. netdev_err(adapter->netdev,
  484. "unable to DMA map tx long term buffer\n");
  485. kfree(adapter->tx_ltb_ptr[idx]);
  486. adapter->tx_ltb_ptr[idx] = NULL;
  487. return -ENOMEM;
  488. }
  489. return 0;
  490. }
  491. static int ibmveth_register_logical_lan(struct ibmveth_adapter *adapter,
  492. union ibmveth_buf_desc rxq_desc, u64 mac_address)
  493. {
  494. int rc, try_again = 1;
  495. /*
  496. * After a kexec the adapter will still be open, so our attempt to
  497. * open it will fail. So if we get a failure we free the adapter and
  498. * try again, but only once.
  499. */
  500. retry:
  501. rc = h_register_logical_lan(adapter->vdev->unit_address,
  502. adapter->buffer_list_dma, rxq_desc.desc,
  503. adapter->filter_list_dma, mac_address);
  504. if (rc != H_SUCCESS && try_again) {
  505. do {
  506. rc = h_free_logical_lan(adapter->vdev->unit_address);
  507. } while (H_IS_LONG_BUSY(rc) || (rc == H_BUSY));
  508. try_again = 0;
  509. goto retry;
  510. }
  511. return rc;
  512. }
  513. static int ibmveth_open(struct net_device *netdev)
  514. {
  515. struct ibmveth_adapter *adapter = netdev_priv(netdev);
  516. u64 mac_address;
  517. int rxq_entries = 1;
  518. unsigned long lpar_rc;
  519. int rc;
  520. union ibmveth_buf_desc rxq_desc;
  521. int i;
  522. struct device *dev;
  523. netdev_dbg(netdev, "open starting\n");
  524. napi_enable(&adapter->napi);
  525. for(i = 0; i < IBMVETH_NUM_BUFF_POOLS; i++)
  526. rxq_entries += adapter->rx_buff_pool[i].size;
  527. rc = -ENOMEM;
  528. adapter->buffer_list_addr = (void*) get_zeroed_page(GFP_KERNEL);
  529. if (!adapter->buffer_list_addr) {
  530. netdev_err(netdev, "unable to allocate list pages\n");
  531. goto out;
  532. }
  533. adapter->filter_list_addr = (void*) get_zeroed_page(GFP_KERNEL);
  534. if (!adapter->filter_list_addr) {
  535. netdev_err(netdev, "unable to allocate filter pages\n");
  536. goto out_free_buffer_list;
  537. }
  538. dev = &adapter->vdev->dev;
  539. adapter->rx_queue.queue_len = sizeof(struct ibmveth_rx_q_entry) *
  540. rxq_entries;
  541. adapter->rx_queue.queue_addr =
  542. dma_alloc_coherent(dev, adapter->rx_queue.queue_len,
  543. &adapter->rx_queue.queue_dma, GFP_KERNEL);
  544. if (!adapter->rx_queue.queue_addr)
  545. goto out_free_filter_list;
  546. adapter->buffer_list_dma = dma_map_single(dev,
  547. adapter->buffer_list_addr, 4096, DMA_BIDIRECTIONAL);
  548. if (dma_mapping_error(dev, adapter->buffer_list_dma)) {
  549. netdev_err(netdev, "unable to map buffer list pages\n");
  550. goto out_free_queue_mem;
  551. }
  552. adapter->filter_list_dma = dma_map_single(dev,
  553. adapter->filter_list_addr, 4096, DMA_BIDIRECTIONAL);
  554. if (dma_mapping_error(dev, adapter->filter_list_dma)) {
  555. netdev_err(netdev, "unable to map filter list pages\n");
  556. goto out_unmap_buffer_list;
  557. }
  558. for (i = 0; i < netdev->real_num_tx_queues; i++) {
  559. if (ibmveth_allocate_tx_ltb(adapter, i))
  560. goto out_free_tx_ltb;
  561. }
  562. adapter->rx_queue.index = 0;
  563. adapter->rx_queue.num_slots = rxq_entries;
  564. adapter->rx_queue.toggle = 1;
  565. mac_address = ether_addr_to_u64(netdev->dev_addr);
  566. rxq_desc.fields.flags_len = IBMVETH_BUF_VALID |
  567. adapter->rx_queue.queue_len;
  568. rxq_desc.fields.address = adapter->rx_queue.queue_dma;
  569. netdev_dbg(netdev, "buffer list @ 0x%p\n", adapter->buffer_list_addr);
  570. netdev_dbg(netdev, "filter list @ 0x%p\n", adapter->filter_list_addr);
  571. netdev_dbg(netdev, "receive q @ 0x%p\n", adapter->rx_queue.queue_addr);
  572. h_vio_signal(adapter->vdev->unit_address, VIO_IRQ_DISABLE);
  573. lpar_rc = ibmveth_register_logical_lan(adapter, rxq_desc, mac_address);
  574. if (lpar_rc != H_SUCCESS) {
  575. netdev_err(netdev, "h_register_logical_lan failed with %ld\n",
  576. lpar_rc);
  577. netdev_err(netdev, "buffer TCE:0x%llx filter TCE:0x%llx rxq "
  578. "desc:0x%llx MAC:0x%llx\n",
  579. adapter->buffer_list_dma,
  580. adapter->filter_list_dma,
  581. rxq_desc.desc,
  582. mac_address);
  583. rc = -ENONET;
  584. goto out_unmap_filter_list;
  585. }
  586. for (i = 0; i < IBMVETH_NUM_BUFF_POOLS; i++) {
  587. if (!adapter->rx_buff_pool[i].active)
  588. continue;
  589. if (ibmveth_alloc_buffer_pool(&adapter->rx_buff_pool[i])) {
  590. netdev_err(netdev, "unable to alloc pool\n");
  591. adapter->rx_buff_pool[i].active = 0;
  592. rc = -ENOMEM;
  593. goto out_free_buffer_pools;
  594. }
  595. }
  596. netdev_dbg(netdev, "registering irq 0x%x\n", netdev->irq);
  597. rc = request_irq(netdev->irq, ibmveth_interrupt, 0, netdev->name,
  598. netdev);
  599. if (rc != 0) {
  600. netdev_err(netdev, "unable to request irq 0x%x, rc %d\n",
  601. netdev->irq, rc);
  602. do {
  603. lpar_rc = h_free_logical_lan(adapter->vdev->unit_address);
  604. } while (H_IS_LONG_BUSY(lpar_rc) || (lpar_rc == H_BUSY));
  605. goto out_free_buffer_pools;
  606. }
  607. rc = -ENOMEM;
  608. netdev_dbg(netdev, "initial replenish cycle\n");
  609. ibmveth_interrupt(netdev->irq, netdev);
  610. netif_tx_start_all_queues(netdev);
  611. netdev_dbg(netdev, "open complete\n");
  612. return 0;
  613. out_free_buffer_pools:
  614. while (--i >= 0) {
  615. if (adapter->rx_buff_pool[i].active)
  616. ibmveth_free_buffer_pool(adapter,
  617. &adapter->rx_buff_pool[i]);
  618. }
  619. out_unmap_filter_list:
  620. dma_unmap_single(dev, adapter->filter_list_dma, 4096,
  621. DMA_BIDIRECTIONAL);
  622. out_free_tx_ltb:
  623. while (--i >= 0) {
  624. ibmveth_free_tx_ltb(adapter, i);
  625. }
  626. out_unmap_buffer_list:
  627. dma_unmap_single(dev, adapter->buffer_list_dma, 4096,
  628. DMA_BIDIRECTIONAL);
  629. out_free_queue_mem:
  630. dma_free_coherent(dev, adapter->rx_queue.queue_len,
  631. adapter->rx_queue.queue_addr,
  632. adapter->rx_queue.queue_dma);
  633. out_free_filter_list:
  634. free_page((unsigned long)adapter->filter_list_addr);
  635. out_free_buffer_list:
  636. free_page((unsigned long)adapter->buffer_list_addr);
  637. out:
  638. napi_disable(&adapter->napi);
  639. return rc;
  640. }
  641. static int ibmveth_close(struct net_device *netdev)
  642. {
  643. struct ibmveth_adapter *adapter = netdev_priv(netdev);
  644. struct device *dev = &adapter->vdev->dev;
  645. long lpar_rc;
  646. int i;
  647. netdev_dbg(netdev, "close starting\n");
  648. napi_disable(&adapter->napi);
  649. netif_tx_stop_all_queues(netdev);
  650. h_vio_signal(adapter->vdev->unit_address, VIO_IRQ_DISABLE);
  651. do {
  652. lpar_rc = h_free_logical_lan(adapter->vdev->unit_address);
  653. } while (H_IS_LONG_BUSY(lpar_rc) || (lpar_rc == H_BUSY));
  654. if (lpar_rc != H_SUCCESS) {
  655. netdev_err(netdev, "h_free_logical_lan failed with %lx, "
  656. "continuing with close\n", lpar_rc);
  657. }
  658. free_irq(netdev->irq, netdev);
  659. ibmveth_update_rx_no_buffer(adapter);
  660. dma_unmap_single(dev, adapter->buffer_list_dma, 4096,
  661. DMA_BIDIRECTIONAL);
  662. free_page((unsigned long)adapter->buffer_list_addr);
  663. dma_unmap_single(dev, adapter->filter_list_dma, 4096,
  664. DMA_BIDIRECTIONAL);
  665. free_page((unsigned long)adapter->filter_list_addr);
  666. dma_free_coherent(dev, adapter->rx_queue.queue_len,
  667. adapter->rx_queue.queue_addr,
  668. adapter->rx_queue.queue_dma);
  669. for (i = 0; i < IBMVETH_NUM_BUFF_POOLS; i++)
  670. if (adapter->rx_buff_pool[i].active)
  671. ibmveth_free_buffer_pool(adapter,
  672. &adapter->rx_buff_pool[i]);
  673. for (i = 0; i < netdev->real_num_tx_queues; i++)
  674. ibmveth_free_tx_ltb(adapter, i);
  675. netdev_dbg(netdev, "close complete\n");
  676. return 0;
  677. }
  678. /**
  679. * ibmveth_reset - Handle scheduled reset work
  680. *
  681. * @w: pointer to work_struct embedded in adapter structure
  682. *
  683. * Context: This routine acquires rtnl_mutex and disables its NAPI through
  684. * ibmveth_close. It can't be called directly in a context that has
  685. * already acquired rtnl_mutex or disabled its NAPI, or directly from
  686. * a poll routine.
  687. *
  688. * Return: void
  689. */
  690. static void ibmveth_reset(struct work_struct *w)
  691. {
  692. struct ibmveth_adapter *adapter = container_of(w, struct ibmveth_adapter, work);
  693. struct net_device *netdev = adapter->netdev;
  694. netdev_dbg(netdev, "reset starting\n");
  695. rtnl_lock();
  696. dev_close(adapter->netdev);
  697. dev_open(adapter->netdev, NULL);
  698. rtnl_unlock();
  699. netdev_dbg(netdev, "reset complete\n");
  700. }
  701. static int ibmveth_set_link_ksettings(struct net_device *dev,
  702. const struct ethtool_link_ksettings *cmd)
  703. {
  704. struct ibmveth_adapter *adapter = netdev_priv(dev);
  705. return ethtool_virtdev_set_link_ksettings(dev, cmd,
  706. &adapter->speed,
  707. &adapter->duplex);
  708. }
  709. static int ibmveth_get_link_ksettings(struct net_device *dev,
  710. struct ethtool_link_ksettings *cmd)
  711. {
  712. struct ibmveth_adapter *adapter = netdev_priv(dev);
  713. cmd->base.speed = adapter->speed;
  714. cmd->base.duplex = adapter->duplex;
  715. cmd->base.port = PORT_OTHER;
  716. return 0;
  717. }
  718. static void ibmveth_init_link_settings(struct net_device *dev)
  719. {
  720. struct ibmveth_adapter *adapter = netdev_priv(dev);
  721. adapter->speed = SPEED_1000;
  722. adapter->duplex = DUPLEX_FULL;
  723. }
  724. static void netdev_get_drvinfo(struct net_device *dev,
  725. struct ethtool_drvinfo *info)
  726. {
  727. strscpy(info->driver, ibmveth_driver_name, sizeof(info->driver));
  728. strscpy(info->version, ibmveth_driver_version, sizeof(info->version));
  729. }
  730. static netdev_features_t ibmveth_fix_features(struct net_device *dev,
  731. netdev_features_t features)
  732. {
  733. /*
  734. * Since the ibmveth firmware interface does not have the
  735. * concept of separate tx/rx checksum offload enable, if rx
  736. * checksum is disabled we also have to disable tx checksum
  737. * offload. Once we disable rx checksum offload, we are no
  738. * longer allowed to send tx buffers that are not properly
  739. * checksummed.
  740. */
  741. if (!(features & NETIF_F_RXCSUM))
  742. features &= ~NETIF_F_CSUM_MASK;
  743. return features;
  744. }
  745. static int ibmveth_set_csum_offload(struct net_device *dev, u32 data)
  746. {
  747. struct ibmveth_adapter *adapter = netdev_priv(dev);
  748. unsigned long set_attr, clr_attr, ret_attr;
  749. unsigned long set_attr6, clr_attr6;
  750. long ret, ret4, ret6;
  751. int rc1 = 0, rc2 = 0;
  752. int restart = 0;
  753. if (netif_running(dev)) {
  754. restart = 1;
  755. ibmveth_close(dev);
  756. }
  757. set_attr = 0;
  758. clr_attr = 0;
  759. set_attr6 = 0;
  760. clr_attr6 = 0;
  761. if (data) {
  762. set_attr = IBMVETH_ILLAN_IPV4_TCP_CSUM;
  763. set_attr6 = IBMVETH_ILLAN_IPV6_TCP_CSUM;
  764. } else {
  765. clr_attr = IBMVETH_ILLAN_IPV4_TCP_CSUM;
  766. clr_attr6 = IBMVETH_ILLAN_IPV6_TCP_CSUM;
  767. }
  768. ret = h_illan_attributes(adapter->vdev->unit_address, 0, 0, &ret_attr);
  769. if (ret == H_SUCCESS &&
  770. (ret_attr & IBMVETH_ILLAN_PADDED_PKT_CSUM)) {
  771. ret4 = h_illan_attributes(adapter->vdev->unit_address, clr_attr,
  772. set_attr, &ret_attr);
  773. if (ret4 != H_SUCCESS) {
  774. netdev_err(dev, "unable to change IPv4 checksum "
  775. "offload settings. %d rc=%ld\n",
  776. data, ret4);
  777. h_illan_attributes(adapter->vdev->unit_address,
  778. set_attr, clr_attr, &ret_attr);
  779. if (data == 1)
  780. dev->features &= ~NETIF_F_IP_CSUM;
  781. } else {
  782. adapter->fw_ipv4_csum_support = data;
  783. }
  784. ret6 = h_illan_attributes(adapter->vdev->unit_address,
  785. clr_attr6, set_attr6, &ret_attr);
  786. if (ret6 != H_SUCCESS) {
  787. netdev_err(dev, "unable to change IPv6 checksum "
  788. "offload settings. %d rc=%ld\n",
  789. data, ret6);
  790. h_illan_attributes(adapter->vdev->unit_address,
  791. set_attr6, clr_attr6, &ret_attr);
  792. if (data == 1)
  793. dev->features &= ~NETIF_F_IPV6_CSUM;
  794. } else
  795. adapter->fw_ipv6_csum_support = data;
  796. if (ret4 == H_SUCCESS || ret6 == H_SUCCESS)
  797. adapter->rx_csum = data;
  798. else
  799. rc1 = -EIO;
  800. } else {
  801. rc1 = -EIO;
  802. netdev_err(dev, "unable to change checksum offload settings."
  803. " %d rc=%ld ret_attr=%lx\n", data, ret,
  804. ret_attr);
  805. }
  806. if (restart)
  807. rc2 = ibmveth_open(dev);
  808. return rc1 ? rc1 : rc2;
  809. }
  810. static int ibmveth_set_tso(struct net_device *dev, u32 data)
  811. {
  812. struct ibmveth_adapter *adapter = netdev_priv(dev);
  813. unsigned long set_attr, clr_attr, ret_attr;
  814. long ret1, ret2;
  815. int rc1 = 0, rc2 = 0;
  816. int restart = 0;
  817. if (netif_running(dev)) {
  818. restart = 1;
  819. ibmveth_close(dev);
  820. }
  821. set_attr = 0;
  822. clr_attr = 0;
  823. if (data)
  824. set_attr = IBMVETH_ILLAN_LRG_SR_ENABLED;
  825. else
  826. clr_attr = IBMVETH_ILLAN_LRG_SR_ENABLED;
  827. ret1 = h_illan_attributes(adapter->vdev->unit_address, 0, 0, &ret_attr);
  828. if (ret1 == H_SUCCESS && (ret_attr & IBMVETH_ILLAN_LRG_SND_SUPPORT) &&
  829. !old_large_send) {
  830. ret2 = h_illan_attributes(adapter->vdev->unit_address, clr_attr,
  831. set_attr, &ret_attr);
  832. if (ret2 != H_SUCCESS) {
  833. netdev_err(dev, "unable to change tso settings. %d rc=%ld\n",
  834. data, ret2);
  835. h_illan_attributes(adapter->vdev->unit_address,
  836. set_attr, clr_attr, &ret_attr);
  837. if (data == 1)
  838. dev->features &= ~(NETIF_F_TSO | NETIF_F_TSO6);
  839. rc1 = -EIO;
  840. } else {
  841. adapter->fw_large_send_support = data;
  842. adapter->large_send = data;
  843. }
  844. } else {
  845. /* Older firmware version of large send offload does not
  846. * support tcp6/ipv6
  847. */
  848. if (data == 1) {
  849. dev->features &= ~NETIF_F_TSO6;
  850. netdev_info(dev, "TSO feature requires all partitions to have updated driver");
  851. }
  852. adapter->large_send = data;
  853. }
  854. if (restart)
  855. rc2 = ibmveth_open(dev);
  856. return rc1 ? rc1 : rc2;
  857. }
  858. static int ibmveth_set_features(struct net_device *dev,
  859. netdev_features_t features)
  860. {
  861. struct ibmveth_adapter *adapter = netdev_priv(dev);
  862. int rx_csum = !!(features & NETIF_F_RXCSUM);
  863. int large_send = !!(features & (NETIF_F_TSO | NETIF_F_TSO6));
  864. int rc1 = 0, rc2 = 0;
  865. if (rx_csum != adapter->rx_csum) {
  866. rc1 = ibmveth_set_csum_offload(dev, rx_csum);
  867. if (rc1 && !adapter->rx_csum)
  868. dev->features =
  869. features & ~(NETIF_F_CSUM_MASK |
  870. NETIF_F_RXCSUM);
  871. }
  872. if (large_send != adapter->large_send) {
  873. rc2 = ibmveth_set_tso(dev, large_send);
  874. if (rc2 && !adapter->large_send)
  875. dev->features =
  876. features & ~(NETIF_F_TSO | NETIF_F_TSO6);
  877. }
  878. return rc1 ? rc1 : rc2;
  879. }
  880. static void ibmveth_get_strings(struct net_device *dev, u32 stringset, u8 *data)
  881. {
  882. int i;
  883. if (stringset != ETH_SS_STATS)
  884. return;
  885. for (i = 0; i < ARRAY_SIZE(ibmveth_stats); i++, data += ETH_GSTRING_LEN)
  886. memcpy(data, ibmveth_stats[i].name, ETH_GSTRING_LEN);
  887. }
  888. static int ibmveth_get_sset_count(struct net_device *dev, int sset)
  889. {
  890. switch (sset) {
  891. case ETH_SS_STATS:
  892. return ARRAY_SIZE(ibmveth_stats);
  893. default:
  894. return -EOPNOTSUPP;
  895. }
  896. }
  897. static void ibmveth_get_ethtool_stats(struct net_device *dev,
  898. struct ethtool_stats *stats, u64 *data)
  899. {
  900. int i;
  901. struct ibmveth_adapter *adapter = netdev_priv(dev);
  902. for (i = 0; i < ARRAY_SIZE(ibmveth_stats); i++)
  903. data[i] = IBMVETH_GET_STAT(adapter, ibmveth_stats[i].offset);
  904. }
  905. static void ibmveth_get_channels(struct net_device *netdev,
  906. struct ethtool_channels *channels)
  907. {
  908. channels->max_tx = ibmveth_real_max_tx_queues();
  909. channels->tx_count = netdev->real_num_tx_queues;
  910. channels->max_rx = netdev->real_num_rx_queues;
  911. channels->rx_count = netdev->real_num_rx_queues;
  912. }
  913. static int ibmveth_set_channels(struct net_device *netdev,
  914. struct ethtool_channels *channels)
  915. {
  916. struct ibmveth_adapter *adapter = netdev_priv(netdev);
  917. unsigned int old = netdev->real_num_tx_queues,
  918. goal = channels->tx_count;
  919. int rc, i;
  920. /* If ndo_open has not been called yet then don't allocate, just set
  921. * desired netdev_queue's and return
  922. */
  923. if (!(netdev->flags & IFF_UP))
  924. return netif_set_real_num_tx_queues(netdev, goal);
  925. /* We have IBMVETH_MAX_QUEUES netdev_queue's allocated
  926. * but we may need to alloc/free the ltb's.
  927. */
  928. netif_tx_stop_all_queues(netdev);
  929. /* Allocate any queue that we need */
  930. for (i = old; i < goal; i++) {
  931. if (adapter->tx_ltb_ptr[i])
  932. continue;
  933. rc = ibmveth_allocate_tx_ltb(adapter, i);
  934. if (!rc)
  935. continue;
  936. /* if something goes wrong, free everything we just allocated */
  937. netdev_err(netdev, "Failed to allocate more tx queues, returning to %d queues\n",
  938. old);
  939. goal = old;
  940. old = i;
  941. break;
  942. }
  943. rc = netif_set_real_num_tx_queues(netdev, goal);
  944. if (rc) {
  945. netdev_err(netdev, "Failed to set real tx queues, returning to %d queues\n",
  946. old);
  947. goal = old;
  948. old = i;
  949. }
  950. /* Free any that are no longer needed */
  951. for (i = old; i > goal; i--) {
  952. if (adapter->tx_ltb_ptr[i - 1])
  953. ibmveth_free_tx_ltb(adapter, i - 1);
  954. }
  955. netif_tx_wake_all_queues(netdev);
  956. return rc;
  957. }
  958. static const struct ethtool_ops netdev_ethtool_ops = {
  959. .get_drvinfo = netdev_get_drvinfo,
  960. .get_link = ethtool_op_get_link,
  961. .get_strings = ibmveth_get_strings,
  962. .get_sset_count = ibmveth_get_sset_count,
  963. .get_ethtool_stats = ibmveth_get_ethtool_stats,
  964. .get_link_ksettings = ibmveth_get_link_ksettings,
  965. .set_link_ksettings = ibmveth_set_link_ksettings,
  966. .get_channels = ibmveth_get_channels,
  967. .set_channels = ibmveth_set_channels
  968. };
  969. static int ibmveth_ioctl(struct net_device *dev, struct ifreq *ifr, int cmd)
  970. {
  971. return -EOPNOTSUPP;
  972. }
  973. static int ibmveth_send(struct ibmveth_adapter *adapter,
  974. unsigned long desc, unsigned long mss)
  975. {
  976. unsigned long correlator;
  977. unsigned int retry_count;
  978. unsigned long ret;
  979. /*
  980. * The retry count sets a maximum for the number of broadcast and
  981. * multicast destinations within the system.
  982. */
  983. retry_count = 1024;
  984. correlator = 0;
  985. do {
  986. ret = h_send_logical_lan(adapter->vdev->unit_address, desc,
  987. correlator, &correlator, mss,
  988. adapter->fw_large_send_support);
  989. } while ((ret == H_BUSY) && (retry_count--));
  990. if (ret != H_SUCCESS && ret != H_DROPPED) {
  991. netdev_err(adapter->netdev, "tx: h_send_logical_lan failed "
  992. "with rc=%ld\n", ret);
  993. return 1;
  994. }
  995. return 0;
  996. }
  997. static int ibmveth_is_packet_unsupported(struct sk_buff *skb,
  998. struct net_device *netdev)
  999. {
  1000. struct ethhdr *ether_header;
  1001. int ret = 0;
  1002. ether_header = eth_hdr(skb);
  1003. if (ether_addr_equal(ether_header->h_dest, netdev->dev_addr)) {
  1004. netdev_dbg(netdev, "veth doesn't support loopback packets, dropping packet.\n");
  1005. netdev->stats.tx_dropped++;
  1006. ret = -EOPNOTSUPP;
  1007. }
  1008. return ret;
  1009. }
  1010. static netdev_tx_t ibmveth_start_xmit(struct sk_buff *skb,
  1011. struct net_device *netdev)
  1012. {
  1013. struct ibmveth_adapter *adapter = netdev_priv(netdev);
  1014. unsigned int desc_flags, total_bytes;
  1015. union ibmveth_buf_desc desc;
  1016. int i, queue_num = skb_get_queue_mapping(skb);
  1017. unsigned long mss = 0;
  1018. if (ibmveth_is_packet_unsupported(skb, netdev))
  1019. goto out;
  1020. /* veth can't checksum offload UDP */
  1021. if (skb->ip_summed == CHECKSUM_PARTIAL &&
  1022. ((skb->protocol == htons(ETH_P_IP) &&
  1023. ip_hdr(skb)->protocol != IPPROTO_TCP) ||
  1024. (skb->protocol == htons(ETH_P_IPV6) &&
  1025. ipv6_hdr(skb)->nexthdr != IPPROTO_TCP)) &&
  1026. skb_checksum_help(skb)) {
  1027. netdev_err(netdev, "tx: failed to checksum packet\n");
  1028. netdev->stats.tx_dropped++;
  1029. goto out;
  1030. }
  1031. desc_flags = IBMVETH_BUF_VALID;
  1032. if (skb->ip_summed == CHECKSUM_PARTIAL) {
  1033. unsigned char *buf = skb_transport_header(skb) +
  1034. skb->csum_offset;
  1035. desc_flags |= (IBMVETH_BUF_NO_CSUM | IBMVETH_BUF_CSUM_GOOD);
  1036. /* Need to zero out the checksum */
  1037. buf[0] = 0;
  1038. buf[1] = 0;
  1039. if (skb_is_gso(skb) && adapter->fw_large_send_support)
  1040. desc_flags |= IBMVETH_BUF_LRG_SND;
  1041. }
  1042. if (skb->ip_summed == CHECKSUM_PARTIAL && skb_is_gso(skb)) {
  1043. if (adapter->fw_large_send_support) {
  1044. mss = (unsigned long)skb_shinfo(skb)->gso_size;
  1045. adapter->tx_large_packets++;
  1046. } else if (!skb_is_gso_v6(skb)) {
  1047. /* Put -1 in the IP checksum to tell phyp it
  1048. * is a largesend packet. Put the mss in
  1049. * the TCP checksum.
  1050. */
  1051. ip_hdr(skb)->check = 0xffff;
  1052. tcp_hdr(skb)->check =
  1053. cpu_to_be16(skb_shinfo(skb)->gso_size);
  1054. adapter->tx_large_packets++;
  1055. }
  1056. }
  1057. /* Copy header into mapped buffer */
  1058. if (unlikely(skb->len > adapter->tx_ltb_size)) {
  1059. netdev_err(adapter->netdev, "tx: packet size (%u) exceeds ltb (%u)\n",
  1060. skb->len, adapter->tx_ltb_size);
  1061. netdev->stats.tx_dropped++;
  1062. goto out;
  1063. }
  1064. memcpy(adapter->tx_ltb_ptr[queue_num], skb->data, skb_headlen(skb));
  1065. total_bytes = skb_headlen(skb);
  1066. /* Copy frags into mapped buffers */
  1067. for (i = 0; i < skb_shinfo(skb)->nr_frags; i++) {
  1068. const skb_frag_t *frag = &skb_shinfo(skb)->frags[i];
  1069. memcpy(adapter->tx_ltb_ptr[queue_num] + total_bytes,
  1070. skb_frag_address_safe(frag), skb_frag_size(frag));
  1071. total_bytes += skb_frag_size(frag);
  1072. }
  1073. if (unlikely(total_bytes != skb->len)) {
  1074. netdev_err(adapter->netdev, "tx: incorrect packet len copied into ltb (%u != %u)\n",
  1075. skb->len, total_bytes);
  1076. netdev->stats.tx_dropped++;
  1077. goto out;
  1078. }
  1079. desc.fields.flags_len = desc_flags | skb->len;
  1080. desc.fields.address = adapter->tx_ltb_dma[queue_num];
  1081. /* finish writing to long_term_buff before VIOS accessing it */
  1082. dma_wmb();
  1083. if (ibmveth_send(adapter, desc.desc, mss)) {
  1084. adapter->tx_send_failed++;
  1085. netdev->stats.tx_dropped++;
  1086. } else {
  1087. netdev->stats.tx_packets++;
  1088. netdev->stats.tx_bytes += skb->len;
  1089. }
  1090. out:
  1091. dev_consume_skb_any(skb);
  1092. return NETDEV_TX_OK;
  1093. }
  1094. static void ibmveth_rx_mss_helper(struct sk_buff *skb, u16 mss, int lrg_pkt)
  1095. {
  1096. struct tcphdr *tcph;
  1097. int offset = 0;
  1098. int hdr_len;
  1099. /* only TCP packets will be aggregated */
  1100. if (skb->protocol == htons(ETH_P_IP)) {
  1101. struct iphdr *iph = (struct iphdr *)skb->data;
  1102. if (iph->protocol == IPPROTO_TCP) {
  1103. offset = iph->ihl * 4;
  1104. skb_shinfo(skb)->gso_type = SKB_GSO_TCPV4;
  1105. } else {
  1106. return;
  1107. }
  1108. } else if (skb->protocol == htons(ETH_P_IPV6)) {
  1109. struct ipv6hdr *iph6 = (struct ipv6hdr *)skb->data;
  1110. if (iph6->nexthdr == IPPROTO_TCP) {
  1111. offset = sizeof(struct ipv6hdr);
  1112. skb_shinfo(skb)->gso_type = SKB_GSO_TCPV6;
  1113. } else {
  1114. return;
  1115. }
  1116. } else {
  1117. return;
  1118. }
  1119. /* if mss is not set through Large Packet bit/mss in rx buffer,
  1120. * expect that the mss will be written to the tcp header checksum.
  1121. */
  1122. tcph = (struct tcphdr *)(skb->data + offset);
  1123. if (lrg_pkt) {
  1124. skb_shinfo(skb)->gso_size = mss;
  1125. } else if (offset) {
  1126. skb_shinfo(skb)->gso_size = ntohs(tcph->check);
  1127. tcph->check = 0;
  1128. }
  1129. if (skb_shinfo(skb)->gso_size) {
  1130. hdr_len = offset + tcph->doff * 4;
  1131. skb_shinfo(skb)->gso_segs =
  1132. DIV_ROUND_UP(skb->len - hdr_len,
  1133. skb_shinfo(skb)->gso_size);
  1134. }
  1135. }
  1136. static void ibmveth_rx_csum_helper(struct sk_buff *skb,
  1137. struct ibmveth_adapter *adapter)
  1138. {
  1139. struct iphdr *iph = NULL;
  1140. struct ipv6hdr *iph6 = NULL;
  1141. __be16 skb_proto = 0;
  1142. u16 iphlen = 0;
  1143. u16 iph_proto = 0;
  1144. u16 tcphdrlen = 0;
  1145. skb_proto = be16_to_cpu(skb->protocol);
  1146. if (skb_proto == ETH_P_IP) {
  1147. iph = (struct iphdr *)skb->data;
  1148. /* If the IP checksum is not offloaded and if the packet
  1149. * is large send, the checksum must be rebuilt.
  1150. */
  1151. if (iph->check == 0xffff) {
  1152. iph->check = 0;
  1153. iph->check = ip_fast_csum((unsigned char *)iph,
  1154. iph->ihl);
  1155. }
  1156. iphlen = iph->ihl * 4;
  1157. iph_proto = iph->protocol;
  1158. } else if (skb_proto == ETH_P_IPV6) {
  1159. iph6 = (struct ipv6hdr *)skb->data;
  1160. iphlen = sizeof(struct ipv6hdr);
  1161. iph_proto = iph6->nexthdr;
  1162. }
  1163. /* When CSO is enabled the TCP checksum may have be set to NULL by
  1164. * the sender given that we zeroed out TCP checksum field in
  1165. * transmit path (refer ibmveth_start_xmit routine). In this case set
  1166. * up CHECKSUM_PARTIAL. If the packet is forwarded, the checksum will
  1167. * then be recalculated by the destination NIC (CSO must be enabled
  1168. * on the destination NIC).
  1169. *
  1170. * In an OVS environment, when a flow is not cached, specifically for a
  1171. * new TCP connection, the first packet information is passed up to
  1172. * the user space for finding a flow. During this process, OVS computes
  1173. * checksum on the first packet when CHECKSUM_PARTIAL flag is set.
  1174. *
  1175. * So, re-compute TCP pseudo header checksum.
  1176. */
  1177. if (iph_proto == IPPROTO_TCP) {
  1178. struct tcphdr *tcph = (struct tcphdr *)(skb->data + iphlen);
  1179. if (tcph->check == 0x0000) {
  1180. /* Recompute TCP pseudo header checksum */
  1181. tcphdrlen = skb->len - iphlen;
  1182. if (skb_proto == ETH_P_IP)
  1183. tcph->check =
  1184. ~csum_tcpudp_magic(iph->saddr,
  1185. iph->daddr, tcphdrlen, iph_proto, 0);
  1186. else if (skb_proto == ETH_P_IPV6)
  1187. tcph->check =
  1188. ~csum_ipv6_magic(&iph6->saddr,
  1189. &iph6->daddr, tcphdrlen, iph_proto, 0);
  1190. /* Setup SKB fields for checksum offload */
  1191. skb_partial_csum_set(skb, iphlen,
  1192. offsetof(struct tcphdr, check));
  1193. skb_reset_network_header(skb);
  1194. }
  1195. }
  1196. }
  1197. static int ibmveth_poll(struct napi_struct *napi, int budget)
  1198. {
  1199. struct ibmveth_adapter *adapter =
  1200. container_of(napi, struct ibmveth_adapter, napi);
  1201. struct net_device *netdev = adapter->netdev;
  1202. int frames_processed = 0;
  1203. unsigned long lpar_rc;
  1204. u16 mss = 0;
  1205. restart_poll:
  1206. while (frames_processed < budget) {
  1207. if (!ibmveth_rxq_pending_buffer(adapter))
  1208. break;
  1209. smp_rmb();
  1210. if (!ibmveth_rxq_buffer_valid(adapter)) {
  1211. wmb(); /* suggested by larson1 */
  1212. adapter->rx_invalid_buffer++;
  1213. netdev_dbg(netdev, "recycling invalid buffer\n");
  1214. if (unlikely(ibmveth_rxq_harvest_buffer(adapter, true)))
  1215. break;
  1216. } else {
  1217. struct sk_buff *skb, *new_skb;
  1218. int length = ibmveth_rxq_frame_length(adapter);
  1219. int offset = ibmveth_rxq_frame_offset(adapter);
  1220. int csum_good = ibmveth_rxq_csum_good(adapter);
  1221. int lrg_pkt = ibmveth_rxq_large_packet(adapter);
  1222. __sum16 iph_check = 0;
  1223. skb = ibmveth_rxq_get_buffer(adapter);
  1224. if (unlikely(!skb))
  1225. break;
  1226. /* if the large packet bit is set in the rx queue
  1227. * descriptor, the mss will be written by PHYP eight
  1228. * bytes from the start of the rx buffer, which is
  1229. * skb->data at this stage
  1230. */
  1231. if (lrg_pkt) {
  1232. __be64 *rxmss = (__be64 *)(skb->data + 8);
  1233. mss = (u16)be64_to_cpu(*rxmss);
  1234. }
  1235. new_skb = NULL;
  1236. if (length < rx_copybreak)
  1237. new_skb = netdev_alloc_skb(netdev, length);
  1238. if (new_skb) {
  1239. skb_copy_to_linear_data(new_skb,
  1240. skb->data + offset,
  1241. length);
  1242. if (rx_flush)
  1243. ibmveth_flush_buffer(skb->data,
  1244. length + offset);
  1245. if (unlikely(ibmveth_rxq_harvest_buffer(adapter, true)))
  1246. break;
  1247. skb = new_skb;
  1248. } else {
  1249. if (unlikely(ibmveth_rxq_harvest_buffer(adapter, false)))
  1250. break;
  1251. skb_reserve(skb, offset);
  1252. }
  1253. skb_put(skb, length);
  1254. skb->protocol = eth_type_trans(skb, netdev);
  1255. /* PHYP without PLSO support places a -1 in the ip
  1256. * checksum for large send frames.
  1257. */
  1258. if (skb->protocol == cpu_to_be16(ETH_P_IP)) {
  1259. struct iphdr *iph = (struct iphdr *)skb->data;
  1260. iph_check = iph->check;
  1261. }
  1262. if ((length > netdev->mtu + ETH_HLEN) ||
  1263. lrg_pkt || iph_check == 0xffff) {
  1264. ibmveth_rx_mss_helper(skb, mss, lrg_pkt);
  1265. adapter->rx_large_packets++;
  1266. }
  1267. if (csum_good) {
  1268. skb->ip_summed = CHECKSUM_UNNECESSARY;
  1269. ibmveth_rx_csum_helper(skb, adapter);
  1270. }
  1271. napi_gro_receive(napi, skb); /* send it up */
  1272. netdev->stats.rx_packets++;
  1273. netdev->stats.rx_bytes += length;
  1274. frames_processed++;
  1275. }
  1276. }
  1277. ibmveth_replenish_task(adapter);
  1278. if (frames_processed == budget)
  1279. goto out;
  1280. if (!napi_complete_done(napi, frames_processed))
  1281. goto out;
  1282. /* We think we are done - reenable interrupts,
  1283. * then check once more to make sure we are done.
  1284. */
  1285. lpar_rc = h_vio_signal(adapter->vdev->unit_address, VIO_IRQ_ENABLE);
  1286. if (WARN_ON(lpar_rc != H_SUCCESS)) {
  1287. schedule_work(&adapter->work);
  1288. goto out;
  1289. }
  1290. if (ibmveth_rxq_pending_buffer(adapter) && napi_schedule(napi)) {
  1291. lpar_rc = h_vio_signal(adapter->vdev->unit_address,
  1292. VIO_IRQ_DISABLE);
  1293. goto restart_poll;
  1294. }
  1295. out:
  1296. return frames_processed;
  1297. }
  1298. static irqreturn_t ibmveth_interrupt(int irq, void *dev_instance)
  1299. {
  1300. struct net_device *netdev = dev_instance;
  1301. struct ibmveth_adapter *adapter = netdev_priv(netdev);
  1302. unsigned long lpar_rc;
  1303. if (napi_schedule_prep(&adapter->napi)) {
  1304. lpar_rc = h_vio_signal(adapter->vdev->unit_address,
  1305. VIO_IRQ_DISABLE);
  1306. WARN_ON(lpar_rc != H_SUCCESS);
  1307. __napi_schedule(&adapter->napi);
  1308. }
  1309. return IRQ_HANDLED;
  1310. }
  1311. static void ibmveth_set_multicast_list(struct net_device *netdev)
  1312. {
  1313. struct ibmveth_adapter *adapter = netdev_priv(netdev);
  1314. unsigned long lpar_rc;
  1315. if ((netdev->flags & IFF_PROMISC) ||
  1316. (netdev_mc_count(netdev) > adapter->mcastFilterSize)) {
  1317. lpar_rc = h_multicast_ctrl(adapter->vdev->unit_address,
  1318. IbmVethMcastEnableRecv |
  1319. IbmVethMcastDisableFiltering,
  1320. 0);
  1321. if (lpar_rc != H_SUCCESS) {
  1322. netdev_err(netdev, "h_multicast_ctrl rc=%ld when "
  1323. "entering promisc mode\n", lpar_rc);
  1324. }
  1325. } else {
  1326. struct netdev_hw_addr *ha;
  1327. /* clear the filter table & disable filtering */
  1328. lpar_rc = h_multicast_ctrl(adapter->vdev->unit_address,
  1329. IbmVethMcastEnableRecv |
  1330. IbmVethMcastDisableFiltering |
  1331. IbmVethMcastClearFilterTable,
  1332. 0);
  1333. if (lpar_rc != H_SUCCESS) {
  1334. netdev_err(netdev, "h_multicast_ctrl rc=%ld when "
  1335. "attempting to clear filter table\n",
  1336. lpar_rc);
  1337. }
  1338. /* add the addresses to the filter table */
  1339. netdev_for_each_mc_addr(ha, netdev) {
  1340. /* add the multicast address to the filter table */
  1341. u64 mcast_addr;
  1342. mcast_addr = ether_addr_to_u64(ha->addr);
  1343. lpar_rc = h_multicast_ctrl(adapter->vdev->unit_address,
  1344. IbmVethMcastAddFilter,
  1345. mcast_addr);
  1346. if (lpar_rc != H_SUCCESS) {
  1347. netdev_err(netdev, "h_multicast_ctrl rc=%ld "
  1348. "when adding an entry to the filter "
  1349. "table\n", lpar_rc);
  1350. }
  1351. }
  1352. /* re-enable filtering */
  1353. lpar_rc = h_multicast_ctrl(adapter->vdev->unit_address,
  1354. IbmVethMcastEnableFiltering,
  1355. 0);
  1356. if (lpar_rc != H_SUCCESS) {
  1357. netdev_err(netdev, "h_multicast_ctrl rc=%ld when "
  1358. "enabling filtering\n", lpar_rc);
  1359. }
  1360. }
  1361. }
  1362. static int ibmveth_change_mtu(struct net_device *dev, int new_mtu)
  1363. {
  1364. struct ibmveth_adapter *adapter = netdev_priv(dev);
  1365. struct vio_dev *viodev = adapter->vdev;
  1366. int new_mtu_oh = new_mtu + IBMVETH_BUFF_OH;
  1367. int i, rc;
  1368. int need_restart = 0;
  1369. for (i = 0; i < IBMVETH_NUM_BUFF_POOLS; i++)
  1370. if (new_mtu_oh <= adapter->rx_buff_pool[i].buff_size)
  1371. break;
  1372. if (i == IBMVETH_NUM_BUFF_POOLS)
  1373. return -EINVAL;
  1374. /* Deactivate all the buffer pools so that the next loop can activate
  1375. only the buffer pools necessary to hold the new MTU */
  1376. if (netif_running(adapter->netdev)) {
  1377. need_restart = 1;
  1378. ibmveth_close(adapter->netdev);
  1379. }
  1380. /* Look for an active buffer pool that can hold the new MTU */
  1381. for (i = 0; i < IBMVETH_NUM_BUFF_POOLS; i++) {
  1382. adapter->rx_buff_pool[i].active = 1;
  1383. if (new_mtu_oh <= adapter->rx_buff_pool[i].buff_size) {
  1384. WRITE_ONCE(dev->mtu, new_mtu);
  1385. vio_cmo_set_dev_desired(viodev,
  1386. ibmveth_get_desired_dma
  1387. (viodev));
  1388. if (need_restart) {
  1389. return ibmveth_open(adapter->netdev);
  1390. }
  1391. return 0;
  1392. }
  1393. }
  1394. if (need_restart && (rc = ibmveth_open(adapter->netdev)))
  1395. return rc;
  1396. return -EINVAL;
  1397. }
  1398. #ifdef CONFIG_NET_POLL_CONTROLLER
  1399. static void ibmveth_poll_controller(struct net_device *dev)
  1400. {
  1401. ibmveth_replenish_task(netdev_priv(dev));
  1402. ibmveth_interrupt(dev->irq, dev);
  1403. }
  1404. #endif
  1405. /**
  1406. * ibmveth_get_desired_dma - Calculate IO memory desired by the driver
  1407. *
  1408. * @vdev: struct vio_dev for the device whose desired IO mem is to be returned
  1409. *
  1410. * Return value:
  1411. * Number of bytes of IO data the driver will need to perform well.
  1412. */
  1413. static unsigned long ibmveth_get_desired_dma(struct vio_dev *vdev)
  1414. {
  1415. struct net_device *netdev = dev_get_drvdata(&vdev->dev);
  1416. struct ibmveth_adapter *adapter;
  1417. struct iommu_table *tbl;
  1418. unsigned long ret;
  1419. int i;
  1420. int rxqentries = 1;
  1421. tbl = get_iommu_table_base(&vdev->dev);
  1422. /* netdev inits at probe time along with the structures we need below*/
  1423. if (netdev == NULL)
  1424. return IOMMU_PAGE_ALIGN(IBMVETH_IO_ENTITLEMENT_DEFAULT, tbl);
  1425. adapter = netdev_priv(netdev);
  1426. ret = IBMVETH_BUFF_LIST_SIZE + IBMVETH_FILT_LIST_SIZE;
  1427. ret += IOMMU_PAGE_ALIGN(netdev->mtu, tbl);
  1428. /* add size of mapped tx buffers */
  1429. ret += IOMMU_PAGE_ALIGN(IBMVETH_MAX_TX_BUF_SIZE, tbl);
  1430. for (i = 0; i < IBMVETH_NUM_BUFF_POOLS; i++) {
  1431. /* add the size of the active receive buffers */
  1432. if (adapter->rx_buff_pool[i].active)
  1433. ret +=
  1434. adapter->rx_buff_pool[i].size *
  1435. IOMMU_PAGE_ALIGN(adapter->rx_buff_pool[i].
  1436. buff_size, tbl);
  1437. rxqentries += adapter->rx_buff_pool[i].size;
  1438. }
  1439. /* add the size of the receive queue entries */
  1440. ret += IOMMU_PAGE_ALIGN(
  1441. rxqentries * sizeof(struct ibmveth_rx_q_entry), tbl);
  1442. return ret;
  1443. }
  1444. static int ibmveth_set_mac_addr(struct net_device *dev, void *p)
  1445. {
  1446. struct ibmveth_adapter *adapter = netdev_priv(dev);
  1447. struct sockaddr *addr = p;
  1448. u64 mac_address;
  1449. int rc;
  1450. if (!is_valid_ether_addr(addr->sa_data))
  1451. return -EADDRNOTAVAIL;
  1452. mac_address = ether_addr_to_u64(addr->sa_data);
  1453. rc = h_change_logical_lan_mac(adapter->vdev->unit_address, mac_address);
  1454. if (rc) {
  1455. netdev_err(adapter->netdev, "h_change_logical_lan_mac failed with rc=%d\n", rc);
  1456. return rc;
  1457. }
  1458. eth_hw_addr_set(dev, addr->sa_data);
  1459. return 0;
  1460. }
  1461. static const struct net_device_ops ibmveth_netdev_ops = {
  1462. .ndo_open = ibmveth_open,
  1463. .ndo_stop = ibmveth_close,
  1464. .ndo_start_xmit = ibmveth_start_xmit,
  1465. .ndo_set_rx_mode = ibmveth_set_multicast_list,
  1466. .ndo_eth_ioctl = ibmveth_ioctl,
  1467. .ndo_change_mtu = ibmveth_change_mtu,
  1468. .ndo_fix_features = ibmveth_fix_features,
  1469. .ndo_set_features = ibmveth_set_features,
  1470. .ndo_validate_addr = eth_validate_addr,
  1471. .ndo_set_mac_address = ibmveth_set_mac_addr,
  1472. #ifdef CONFIG_NET_POLL_CONTROLLER
  1473. .ndo_poll_controller = ibmveth_poll_controller,
  1474. #endif
  1475. };
  1476. static int ibmveth_probe(struct vio_dev *dev, const struct vio_device_id *id)
  1477. {
  1478. int rc, i, mac_len;
  1479. struct net_device *netdev;
  1480. struct ibmveth_adapter *adapter;
  1481. unsigned char *mac_addr_p;
  1482. __be32 *mcastFilterSize_p;
  1483. long ret;
  1484. unsigned long ret_attr;
  1485. dev_dbg(&dev->dev, "entering ibmveth_probe for UA 0x%x\n",
  1486. dev->unit_address);
  1487. mac_addr_p = (unsigned char *)vio_get_attribute(dev, VETH_MAC_ADDR,
  1488. &mac_len);
  1489. if (!mac_addr_p) {
  1490. dev_err(&dev->dev, "Can't find VETH_MAC_ADDR attribute\n");
  1491. return -EINVAL;
  1492. }
  1493. /* Workaround for old/broken pHyp */
  1494. if (mac_len == 8)
  1495. mac_addr_p += 2;
  1496. else if (mac_len != 6) {
  1497. dev_err(&dev->dev, "VETH_MAC_ADDR attribute wrong len %d\n",
  1498. mac_len);
  1499. return -EINVAL;
  1500. }
  1501. mcastFilterSize_p = (__be32 *)vio_get_attribute(dev,
  1502. VETH_MCAST_FILTER_SIZE,
  1503. NULL);
  1504. if (!mcastFilterSize_p) {
  1505. dev_err(&dev->dev, "Can't find VETH_MCAST_FILTER_SIZE "
  1506. "attribute\n");
  1507. return -EINVAL;
  1508. }
  1509. netdev = alloc_etherdev_mqs(sizeof(struct ibmveth_adapter), IBMVETH_MAX_QUEUES, 1);
  1510. if (!netdev)
  1511. return -ENOMEM;
  1512. adapter = netdev_priv(netdev);
  1513. dev_set_drvdata(&dev->dev, netdev);
  1514. adapter->vdev = dev;
  1515. adapter->netdev = netdev;
  1516. INIT_WORK(&adapter->work, ibmveth_reset);
  1517. adapter->mcastFilterSize = be32_to_cpu(*mcastFilterSize_p);
  1518. ibmveth_init_link_settings(netdev);
  1519. netif_napi_add_weight(netdev, &adapter->napi, ibmveth_poll, 16);
  1520. netdev->irq = dev->irq;
  1521. netdev->netdev_ops = &ibmveth_netdev_ops;
  1522. netdev->ethtool_ops = &netdev_ethtool_ops;
  1523. SET_NETDEV_DEV(netdev, &dev->dev);
  1524. netdev->hw_features = NETIF_F_SG;
  1525. if (vio_get_attribute(dev, "ibm,illan-options", NULL) != NULL) {
  1526. netdev->hw_features |= NETIF_F_IP_CSUM | NETIF_F_IPV6_CSUM |
  1527. NETIF_F_RXCSUM;
  1528. }
  1529. netdev->features |= netdev->hw_features;
  1530. ret = h_illan_attributes(adapter->vdev->unit_address, 0, 0, &ret_attr);
  1531. /* If running older firmware, TSO should not be enabled by default */
  1532. if (ret == H_SUCCESS && (ret_attr & IBMVETH_ILLAN_LRG_SND_SUPPORT) &&
  1533. !old_large_send) {
  1534. netdev->hw_features |= NETIF_F_TSO | NETIF_F_TSO6;
  1535. netdev->features |= netdev->hw_features;
  1536. } else {
  1537. netdev->hw_features |= NETIF_F_TSO;
  1538. }
  1539. adapter->is_active_trunk = false;
  1540. if (ret == H_SUCCESS && (ret_attr & IBMVETH_ILLAN_ACTIVE_TRUNK)) {
  1541. adapter->is_active_trunk = true;
  1542. netdev->hw_features |= NETIF_F_FRAGLIST;
  1543. netdev->features |= NETIF_F_FRAGLIST;
  1544. }
  1545. if (ret == H_SUCCESS &&
  1546. (ret_attr & IBMVETH_ILLAN_RX_MULTI_BUFF_SUPPORT)) {
  1547. adapter->rx_buffers_per_hcall = IBMVETH_MAX_RX_PER_HCALL;
  1548. netdev_dbg(netdev,
  1549. "RX Multi-buffer hcall supported by FW, batch set to %u\n",
  1550. adapter->rx_buffers_per_hcall);
  1551. } else {
  1552. adapter->rx_buffers_per_hcall = 1;
  1553. netdev_dbg(netdev,
  1554. "RX Single-buffer hcall mode, batch set to %u\n",
  1555. adapter->rx_buffers_per_hcall);
  1556. }
  1557. netdev->min_mtu = IBMVETH_MIN_MTU;
  1558. netdev->max_mtu = ETH_MAX_MTU - IBMVETH_BUFF_OH;
  1559. eth_hw_addr_set(netdev, mac_addr_p);
  1560. if (firmware_has_feature(FW_FEATURE_CMO))
  1561. memcpy(pool_count, pool_count_cmo, sizeof(pool_count));
  1562. for (i = 0; i < IBMVETH_NUM_BUFF_POOLS; i++) {
  1563. struct kobject *kobj = &adapter->rx_buff_pool[i].kobj;
  1564. int error;
  1565. ibmveth_init_buffer_pool(&adapter->rx_buff_pool[i], i,
  1566. pool_count[i], pool_size[i],
  1567. pool_active[i]);
  1568. error = kobject_init_and_add(kobj, &ktype_veth_pool,
  1569. &dev->dev.kobj, "pool%d", i);
  1570. if (!error)
  1571. kobject_uevent(kobj, KOBJ_ADD);
  1572. }
  1573. rc = netif_set_real_num_tx_queues(netdev, min(num_online_cpus(),
  1574. IBMVETH_DEFAULT_QUEUES));
  1575. if (rc) {
  1576. netdev_dbg(netdev, "failed to set number of tx queues rc=%d\n",
  1577. rc);
  1578. free_netdev(netdev);
  1579. return rc;
  1580. }
  1581. adapter->tx_ltb_size = PAGE_ALIGN(IBMVETH_MAX_TX_BUF_SIZE);
  1582. for (i = 0; i < IBMVETH_MAX_QUEUES; i++)
  1583. adapter->tx_ltb_ptr[i] = NULL;
  1584. netdev_dbg(netdev, "adapter @ 0x%p\n", adapter);
  1585. netdev_dbg(netdev, "registering netdev...\n");
  1586. ibmveth_set_features(netdev, netdev->features);
  1587. rc = register_netdev(netdev);
  1588. if (rc) {
  1589. netdev_dbg(netdev, "failed to register netdev rc=%d\n", rc);
  1590. free_netdev(netdev);
  1591. return rc;
  1592. }
  1593. netdev_dbg(netdev, "registered\n");
  1594. return 0;
  1595. }
  1596. static void ibmveth_remove(struct vio_dev *dev)
  1597. {
  1598. struct net_device *netdev = dev_get_drvdata(&dev->dev);
  1599. struct ibmveth_adapter *adapter = netdev_priv(netdev);
  1600. int i;
  1601. cancel_work_sync(&adapter->work);
  1602. for (i = 0; i < IBMVETH_NUM_BUFF_POOLS; i++)
  1603. kobject_put(&adapter->rx_buff_pool[i].kobj);
  1604. unregister_netdev(netdev);
  1605. free_netdev(netdev);
  1606. dev_set_drvdata(&dev->dev, NULL);
  1607. }
  1608. static struct attribute veth_active_attr;
  1609. static struct attribute veth_num_attr;
  1610. static struct attribute veth_size_attr;
  1611. static ssize_t veth_pool_show(struct kobject *kobj,
  1612. struct attribute *attr, char *buf)
  1613. {
  1614. struct ibmveth_buff_pool *pool = container_of(kobj,
  1615. struct ibmveth_buff_pool,
  1616. kobj);
  1617. if (attr == &veth_active_attr)
  1618. return sprintf(buf, "%d\n", pool->active);
  1619. else if (attr == &veth_num_attr)
  1620. return sprintf(buf, "%d\n", pool->size);
  1621. else if (attr == &veth_size_attr)
  1622. return sprintf(buf, "%d\n", pool->buff_size);
  1623. return 0;
  1624. }
  1625. /**
  1626. * veth_pool_store - sysfs store handler for pool attributes
  1627. * @kobj: kobject embedded in pool
  1628. * @attr: attribute being changed
  1629. * @buf: value being stored
  1630. * @count: length of @buf in bytes
  1631. *
  1632. * Stores new value in pool attribute. Verifies the range of the new value for
  1633. * size and buff_size. Verifies that at least one pool remains available to
  1634. * receive MTU-sized packets.
  1635. *
  1636. * Context: Process context.
  1637. * Takes and releases rtnl_mutex to ensure correct ordering of close
  1638. * and open calls.
  1639. * Return:
  1640. * * %-EPERM - Not allowed to disabled all MTU-sized buffer pools
  1641. * * %-EINVAL - New pool size or buffer size is out of range
  1642. * * count - Return count for success
  1643. * * other - Return value from a failed ibmveth_open call
  1644. */
  1645. static ssize_t veth_pool_store(struct kobject *kobj, struct attribute *attr,
  1646. const char *buf, size_t count)
  1647. {
  1648. struct ibmveth_buff_pool *pool = container_of(kobj,
  1649. struct ibmveth_buff_pool,
  1650. kobj);
  1651. struct net_device *netdev = dev_get_drvdata(kobj_to_dev(kobj->parent));
  1652. struct ibmveth_adapter *adapter = netdev_priv(netdev);
  1653. long value = simple_strtol(buf, NULL, 10);
  1654. bool change = false;
  1655. u32 newbuff_size;
  1656. u32 oldbuff_size;
  1657. int newactive;
  1658. int oldactive;
  1659. u32 newsize;
  1660. u32 oldsize;
  1661. long rc;
  1662. rtnl_lock();
  1663. oldbuff_size = pool->buff_size;
  1664. oldactive = pool->active;
  1665. oldsize = pool->size;
  1666. newbuff_size = oldbuff_size;
  1667. newactive = oldactive;
  1668. newsize = oldsize;
  1669. if (attr == &veth_active_attr) {
  1670. if (value && !oldactive) {
  1671. newactive = 1;
  1672. change = true;
  1673. } else if (!value && oldactive) {
  1674. int mtu = netdev->mtu + IBMVETH_BUFF_OH;
  1675. int i;
  1676. /* Make sure there is a buffer pool with buffers that
  1677. can hold a packet of the size of the MTU */
  1678. for (i = 0; i < IBMVETH_NUM_BUFF_POOLS; i++) {
  1679. if (pool == &adapter->rx_buff_pool[i])
  1680. continue;
  1681. if (!adapter->rx_buff_pool[i].active)
  1682. continue;
  1683. if (mtu <= adapter->rx_buff_pool[i].buff_size)
  1684. break;
  1685. }
  1686. if (i == IBMVETH_NUM_BUFF_POOLS) {
  1687. netdev_err(netdev, "no active pool >= MTU\n");
  1688. rc = -EPERM;
  1689. goto unlock_err;
  1690. }
  1691. newactive = 0;
  1692. change = true;
  1693. }
  1694. } else if (attr == &veth_num_attr) {
  1695. if (value <= 0 || value > IBMVETH_MAX_POOL_COUNT) {
  1696. rc = -EINVAL;
  1697. goto unlock_err;
  1698. }
  1699. if (value != oldsize) {
  1700. newsize = value;
  1701. change = true;
  1702. }
  1703. } else if (attr == &veth_size_attr) {
  1704. if (value <= IBMVETH_BUFF_OH || value > IBMVETH_MAX_BUF_SIZE) {
  1705. rc = -EINVAL;
  1706. goto unlock_err;
  1707. }
  1708. if (value != oldbuff_size) {
  1709. newbuff_size = value;
  1710. change = true;
  1711. }
  1712. }
  1713. if (change) {
  1714. if (netif_running(netdev))
  1715. ibmveth_close(netdev);
  1716. pool->active = newactive;
  1717. pool->buff_size = newbuff_size;
  1718. pool->size = newsize;
  1719. if (netif_running(netdev)) {
  1720. rc = ibmveth_open(netdev);
  1721. if (rc) {
  1722. pool->active = oldactive;
  1723. pool->buff_size = oldbuff_size;
  1724. pool->size = oldsize;
  1725. goto unlock_err;
  1726. }
  1727. }
  1728. }
  1729. rtnl_unlock();
  1730. /* kick the interrupt handler to allocate/deallocate pools */
  1731. ibmveth_interrupt(netdev->irq, netdev);
  1732. return count;
  1733. unlock_err:
  1734. rtnl_unlock();
  1735. return rc;
  1736. }
  1737. #define ATTR(_name, _mode) \
  1738. struct attribute veth_##_name##_attr = { \
  1739. .name = __stringify(_name), .mode = _mode, \
  1740. };
  1741. static ATTR(active, 0644);
  1742. static ATTR(num, 0644);
  1743. static ATTR(size, 0644);
  1744. static struct attribute *veth_pool_attrs[] = {
  1745. &veth_active_attr,
  1746. &veth_num_attr,
  1747. &veth_size_attr,
  1748. NULL,
  1749. };
  1750. ATTRIBUTE_GROUPS(veth_pool);
  1751. static const struct sysfs_ops veth_pool_ops = {
  1752. .show = veth_pool_show,
  1753. .store = veth_pool_store,
  1754. };
  1755. static struct kobj_type ktype_veth_pool = {
  1756. .release = NULL,
  1757. .sysfs_ops = &veth_pool_ops,
  1758. .default_groups = veth_pool_groups,
  1759. };
  1760. static int ibmveth_resume(struct device *dev)
  1761. {
  1762. struct net_device *netdev = dev_get_drvdata(dev);
  1763. ibmveth_interrupt(netdev->irq, netdev);
  1764. return 0;
  1765. }
  1766. static const struct vio_device_id ibmveth_device_table[] = {
  1767. { "network", "IBM,l-lan"},
  1768. { "", "" }
  1769. };
  1770. MODULE_DEVICE_TABLE(vio, ibmveth_device_table);
  1771. static const struct dev_pm_ops ibmveth_pm_ops = {
  1772. .resume = ibmveth_resume
  1773. };
  1774. static struct vio_driver ibmveth_driver = {
  1775. .id_table = ibmveth_device_table,
  1776. .probe = ibmveth_probe,
  1777. .remove = ibmveth_remove,
  1778. .get_desired_dma = ibmveth_get_desired_dma,
  1779. .name = ibmveth_driver_name,
  1780. .pm = &ibmveth_pm_ops,
  1781. };
  1782. static int __init ibmveth_module_init(void)
  1783. {
  1784. printk(KERN_DEBUG "%s: %s %s\n", ibmveth_driver_name,
  1785. ibmveth_driver_string, ibmveth_driver_version);
  1786. return vio_register_driver(&ibmveth_driver);
  1787. }
  1788. static void __exit ibmveth_module_exit(void)
  1789. {
  1790. vio_unregister_driver(&ibmveth_driver);
  1791. }
  1792. module_init(ibmveth_module_init);
  1793. module_exit(ibmveth_module_exit);
  1794. #ifdef CONFIG_IBMVETH_KUNIT_TEST
  1795. #include <kunit/test.h>
  1796. /**
  1797. * ibmveth_reset_kunit - reset routine for running in KUnit environment
  1798. *
  1799. * @w: pointer to work_struct embedded in adapter structure
  1800. *
  1801. * Context: Called in the KUnit environment. Does nothing.
  1802. *
  1803. * Return: void
  1804. */
  1805. static void ibmveth_reset_kunit(struct work_struct *w)
  1806. {
  1807. netdev_dbg(NULL, "reset_kunit starting\n");
  1808. netdev_dbg(NULL, "reset_kunit complete\n");
  1809. }
  1810. /**
  1811. * ibmveth_remove_buffer_from_pool_test - unit test for some of
  1812. * ibmveth_remove_buffer_from_pool
  1813. * @test: pointer to kunit structure
  1814. *
  1815. * Tests the error returns from ibmveth_remove_buffer_from_pool.
  1816. * ibmveth_remove_buffer_from_pool also calls WARN_ON, so dmesg should be
  1817. * checked to see that these warnings happened.
  1818. *
  1819. * Return: void
  1820. */
  1821. static void ibmveth_remove_buffer_from_pool_test(struct kunit *test)
  1822. {
  1823. struct ibmveth_adapter *adapter = kunit_kzalloc(test, sizeof(*adapter), GFP_KERNEL);
  1824. struct ibmveth_buff_pool *pool;
  1825. u64 correlator;
  1826. KUNIT_ASSERT_NOT_ERR_OR_NULL(test, adapter);
  1827. INIT_WORK(&adapter->work, ibmveth_reset_kunit);
  1828. /* Set sane values for buffer pools */
  1829. for (int i = 0; i < IBMVETH_NUM_BUFF_POOLS; i++)
  1830. ibmveth_init_buffer_pool(&adapter->rx_buff_pool[i], i,
  1831. pool_count[i], pool_size[i],
  1832. pool_active[i]);
  1833. pool = &adapter->rx_buff_pool[0];
  1834. pool->skbuff = kunit_kcalloc(test, pool->size, sizeof(void *), GFP_KERNEL);
  1835. KUNIT_ASSERT_NOT_ERR_OR_NULL(test, pool->skbuff);
  1836. correlator = ((u64)IBMVETH_NUM_BUFF_POOLS << 32) | 0;
  1837. KUNIT_EXPECT_EQ(test, -EINVAL, ibmveth_remove_buffer_from_pool(adapter, correlator, false));
  1838. KUNIT_EXPECT_EQ(test, -EINVAL, ibmveth_remove_buffer_from_pool(adapter, correlator, true));
  1839. correlator = ((u64)0 << 32) | adapter->rx_buff_pool[0].size;
  1840. KUNIT_EXPECT_EQ(test, -EINVAL, ibmveth_remove_buffer_from_pool(adapter, correlator, false));
  1841. KUNIT_EXPECT_EQ(test, -EINVAL, ibmveth_remove_buffer_from_pool(adapter, correlator, true));
  1842. correlator = (u64)0 | 0;
  1843. pool->skbuff[0] = NULL;
  1844. KUNIT_EXPECT_EQ(test, -EFAULT, ibmveth_remove_buffer_from_pool(adapter, correlator, false));
  1845. KUNIT_EXPECT_EQ(test, -EFAULT, ibmveth_remove_buffer_from_pool(adapter, correlator, true));
  1846. flush_work(&adapter->work);
  1847. }
  1848. /**
  1849. * ibmveth_rxq_get_buffer_test - unit test for ibmveth_rxq_get_buffer
  1850. * @test: pointer to kunit structure
  1851. *
  1852. * Tests ibmveth_rxq_get_buffer. ibmveth_rxq_get_buffer also calls WARN_ON for
  1853. * the NULL returns, so dmesg should be checked to see that these warnings
  1854. * happened.
  1855. *
  1856. * Return: void
  1857. */
  1858. static void ibmveth_rxq_get_buffer_test(struct kunit *test)
  1859. {
  1860. struct ibmveth_adapter *adapter = kunit_kzalloc(test, sizeof(*adapter), GFP_KERNEL);
  1861. struct sk_buff *skb = kunit_kzalloc(test, sizeof(*skb), GFP_KERNEL);
  1862. struct ibmveth_buff_pool *pool;
  1863. KUNIT_ASSERT_NOT_ERR_OR_NULL(test, adapter);
  1864. KUNIT_ASSERT_NOT_ERR_OR_NULL(test, skb);
  1865. INIT_WORK(&adapter->work, ibmveth_reset_kunit);
  1866. adapter->rx_queue.queue_len = 1;
  1867. adapter->rx_queue.index = 0;
  1868. adapter->rx_queue.queue_addr = kunit_kzalloc(test, sizeof(struct ibmveth_rx_q_entry),
  1869. GFP_KERNEL);
  1870. KUNIT_ASSERT_NOT_ERR_OR_NULL(test, adapter->rx_queue.queue_addr);
  1871. /* Set sane values for buffer pools */
  1872. for (int i = 0; i < IBMVETH_NUM_BUFF_POOLS; i++)
  1873. ibmveth_init_buffer_pool(&adapter->rx_buff_pool[i], i,
  1874. pool_count[i], pool_size[i],
  1875. pool_active[i]);
  1876. pool = &adapter->rx_buff_pool[0];
  1877. pool->skbuff = kunit_kcalloc(test, pool->size, sizeof(void *), GFP_KERNEL);
  1878. KUNIT_ASSERT_NOT_ERR_OR_NULL(test, pool->skbuff);
  1879. adapter->rx_queue.queue_addr[0].correlator = (u64)IBMVETH_NUM_BUFF_POOLS << 32 | 0;
  1880. KUNIT_EXPECT_PTR_EQ(test, NULL, ibmveth_rxq_get_buffer(adapter));
  1881. adapter->rx_queue.queue_addr[0].correlator = (u64)0 << 32 | adapter->rx_buff_pool[0].size;
  1882. KUNIT_EXPECT_PTR_EQ(test, NULL, ibmveth_rxq_get_buffer(adapter));
  1883. pool->skbuff[0] = skb;
  1884. adapter->rx_queue.queue_addr[0].correlator = (u64)0 << 32 | 0;
  1885. KUNIT_EXPECT_PTR_EQ(test, skb, ibmveth_rxq_get_buffer(adapter));
  1886. flush_work(&adapter->work);
  1887. }
  1888. static struct kunit_case ibmveth_test_cases[] = {
  1889. KUNIT_CASE(ibmveth_remove_buffer_from_pool_test),
  1890. KUNIT_CASE(ibmveth_rxq_get_buffer_test),
  1891. {}
  1892. };
  1893. static struct kunit_suite ibmveth_test_suite = {
  1894. .name = "ibmveth-kunit-test",
  1895. .test_cases = ibmveth_test_cases,
  1896. };
  1897. kunit_test_suite(ibmveth_test_suite);
  1898. #endif