ibmveth.c 45 KB

12345678910111213141516171819202122232425262728293031323334353637383940414243444546474849505152535455565758596061626364656667686970717273747576777879808182838485868788899091929394959697989910010110210310410510610710810911011111211311411511611711811912012112212312412512612712812913013113213313413513613713813914014114214314414514614714814915015115215315415515615715815916016116216316416516616716816917017117217317417517617717817918018118218318418518618718818919019119219319419519619719819920020120220320420520620720820921021121221321421521621721821922022122222322422522622722822923023123223323423523623723823924024124224324424524624724824925025125225325425525625725825926026126226326426526626726826927027127227327427527627727827928028128228328428528628728828929029129229329429529629729829930030130230330430530630730830931031131231331431531631731831932032132232332432532632732832933033133233333433533633733833934034134234334434534634734834935035135235335435535635735835936036136236336436536636736836937037137237337437537637737837938038138238338438538638738838939039139239339439539639739839940040140240340440540640740840941041141241341441541641741841942042142242342442542642742842943043143243343443543643743843944044144244344444544644744844945045145245345445545645745845946046146246346446546646746846947047147247347447547647747847948048148248348448548648748848949049149249349449549649749849950050150250350450550650750850951051151251351451551651751851952052152252352452552652752852953053153253353453553653753853954054154254354454554654754854955055155255355455555655755855956056156256356456556656756856957057157257357457557657757857958058158258358458558658758858959059159259359459559659759859960060160260360460560660760860961061161261361461561661761861962062162262362462562662762862963063163263363463563663763863964064164264364464564664764864965065165265365465565665765865966066166266366466566666766866967067167267367467567667767867968068168268368468568668768868969069169269369469569669769869970070170270370470570670770870971071171271371471571671771871972072172272372472572672772872973073173273373473573673773873974074174274374474574674774874975075175275375475575675775875976076176276376476576676776876977077177277377477577677777877978078178278378478578678778878979079179279379479579679779879980080180280380480580680780880981081181281381481581681781881982082182282382482582682782882983083183283383483583683783883984084184284384484584684784884985085185285385485585685785885986086186286386486586686786886987087187287387487587687787887988088188288388488588688788888989089189289389489589689789889990090190290390490590690790890991091191291391491591691791891992092192292392492592692792892993093193293393493593693793893994094194294394494594694794894995095195295395495595695795895996096196296396496596696796896997097197297397497597697797897998098198298398498598698798898999099199299399499599699799899910001001100210031004100510061007100810091010101110121013101410151016101710181019102010211022102310241025102610271028102910301031103210331034103510361037103810391040104110421043104410451046104710481049105010511052105310541055105610571058105910601061106210631064106510661067106810691070107110721073107410751076107710781079108010811082108310841085108610871088108910901091109210931094109510961097109810991100110111021103110411051106110711081109111011111112111311141115111611171118111911201121112211231124112511261127112811291130113111321133113411351136113711381139114011411142114311441145114611471148114911501151115211531154115511561157115811591160116111621163116411651166116711681169117011711172117311741175117611771178117911801181118211831184118511861187118811891190119111921193119411951196119711981199120012011202120312041205120612071208120912101211121212131214121512161217121812191220122112221223122412251226122712281229123012311232123312341235123612371238123912401241124212431244124512461247124812491250125112521253125412551256125712581259126012611262126312641265126612671268126912701271127212731274127512761277127812791280128112821283128412851286128712881289129012911292129312941295129612971298129913001301130213031304130513061307130813091310131113121313131413151316131713181319132013211322132313241325132613271328132913301331133213331334133513361337133813391340134113421343134413451346134713481349135013511352135313541355135613571358135913601361136213631364136513661367136813691370137113721373137413751376137713781379138013811382138313841385138613871388138913901391139213931394139513961397139813991400140114021403140414051406140714081409141014111412141314141415141614171418141914201421142214231424142514261427142814291430143114321433143414351436143714381439144014411442144314441445144614471448144914501451145214531454145514561457145814591460146114621463146414651466146714681469147014711472147314741475147614771478147914801481148214831484148514861487148814891490149114921493149414951496149714981499150015011502150315041505150615071508150915101511151215131514151515161517151815191520152115221523152415251526152715281529153015311532153315341535153615371538153915401541154215431544154515461547154815491550155115521553155415551556155715581559156015611562156315641565156615671568156915701571157215731574157515761577157815791580158115821583158415851586158715881589159015911592159315941595159615971598159916001601160216031604160516061607160816091610161116121613161416151616161716181619162016211622162316241625162616271628162916301631163216331634163516361637163816391640164116421643164416451646164716481649165016511652165316541655165616571658165916601661166216631664166516661667
  1. /*
  2. * IBM eServer i/pSeries Virtual Ethernet Device Driver
  3. * Copyright (C) 2003 IBM Corp.
  4. * Originally written by Dave Larson (larson1@us.ibm.com)
  5. * Maintained by Santiago Leon (santil@us.ibm.com)
  6. *
  7. * This program is free software; you can redistribute it and/or modify
  8. * it under the terms of the GNU General Public License as published by
  9. * the Free Software Foundation; either version 2 of the License, or
  10. * (at your option) any later version.
  11. *
  12. * This program is distributed in the hope that it will be useful,
  13. * but WITHOUT ANY WARRANTY; without even the implied warranty of
  14. * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
  15. * GNU General Public License for more details.
  16. *
  17. * You should have received a copy of the GNU General Public License
  18. * along with this program; if not, write to the Free Software
  19. * Foundation, Inc., 59 Temple Place, Suite 330, Boston, MA 02111-1307
  20. * USA
  21. *
  22. * This module contains the implementation of a virtual ethernet device
  23. * for use with IBM i/pSeries LPAR Linux. It utilizes the logical LAN
  24. * option of the RS/6000 Platform Architechture to interface with virtual
  25. * ethernet NICs that are presented to the partition by the hypervisor.
  26. */
  27. #include <linux/module.h>
  28. #include <linux/moduleparam.h>
  29. #include <linux/types.h>
  30. #include <linux/errno.h>
  31. #include <linux/dma-mapping.h>
  32. #include <linux/kernel.h>
  33. #include <linux/netdevice.h>
  34. #include <linux/etherdevice.h>
  35. #include <linux/skbuff.h>
  36. #include <linux/init.h>
  37. #include <linux/mm.h>
  38. #include <linux/pm.h>
  39. #include <linux/ethtool.h>
  40. #include <linux/in.h>
  41. #include <linux/ip.h>
  42. #include <linux/ipv6.h>
  43. #include <linux/slab.h>
  44. #include <asm/hvcall.h>
  45. #include <asm/atomic.h>
  46. #include <asm/vio.h>
  47. #include <asm/iommu.h>
  48. #include <asm/firmware.h>
  49. #include "ibmveth.h"
  50. static irqreturn_t ibmveth_interrupt(int irq, void *dev_instance);
  51. static void ibmveth_rxq_harvest_buffer(struct ibmveth_adapter *adapter);
  52. static unsigned long ibmveth_get_desired_dma(struct vio_dev *vdev);
  53. static struct kobj_type ktype_veth_pool;
  54. static const char ibmveth_driver_name[] = "ibmveth";
  55. static const char ibmveth_driver_string[] = "IBM i/pSeries Virtual Ethernet "
  56. "Driver";
  57. #define ibmveth_driver_version "1.03"
  58. MODULE_AUTHOR("Santiago Leon <santil@us.ibm.com>");
  59. MODULE_DESCRIPTION("IBM i/pSeries Virtual Ethernet Driver");
  60. MODULE_LICENSE("GPL");
  61. MODULE_VERSION(ibmveth_driver_version);
  62. static unsigned int tx_copybreak __read_mostly = 128;
  63. module_param(tx_copybreak, uint, 0644);
  64. MODULE_PARM_DESC(tx_copybreak,
  65. "Maximum size of packet that is copied to a new buffer on transmit");
  66. static unsigned int rx_copybreak __read_mostly = 128;
  67. module_param(rx_copybreak, uint, 0644);
  68. MODULE_PARM_DESC(rx_copybreak,
  69. "Maximum size of packet that is copied to a new buffer on receive");
  70. static unsigned int rx_flush __read_mostly = 0;
  71. module_param(rx_flush, uint, 0644);
  72. MODULE_PARM_DESC(rx_flush, "Flush receive buffers before use");
  73. struct ibmveth_stat {
  74. char name[ETH_GSTRING_LEN];
  75. int offset;
  76. };
  77. #define IBMVETH_STAT_OFF(stat) offsetof(struct ibmveth_adapter, stat)
  78. #define IBMVETH_GET_STAT(a, off) *((u64 *)(((unsigned long)(a)) + off))
  79. struct ibmveth_stat ibmveth_stats[] = {
  80. { "replenish_task_cycles", IBMVETH_STAT_OFF(replenish_task_cycles) },
  81. { "replenish_no_mem", IBMVETH_STAT_OFF(replenish_no_mem) },
  82. { "replenish_add_buff_failure",
  83. IBMVETH_STAT_OFF(replenish_add_buff_failure) },
  84. { "replenish_add_buff_success",
  85. IBMVETH_STAT_OFF(replenish_add_buff_success) },
  86. { "rx_invalid_buffer", IBMVETH_STAT_OFF(rx_invalid_buffer) },
  87. { "rx_no_buffer", IBMVETH_STAT_OFF(rx_no_buffer) },
  88. { "tx_map_failed", IBMVETH_STAT_OFF(tx_map_failed) },
  89. { "tx_send_failed", IBMVETH_STAT_OFF(tx_send_failed) },
  90. { "fw_enabled_ipv4_csum", IBMVETH_STAT_OFF(fw_ipv4_csum_support) },
  91. { "fw_enabled_ipv6_csum", IBMVETH_STAT_OFF(fw_ipv6_csum_support) },
  92. };
  93. /* simple methods of getting data from the current rxq entry */
  94. static inline u32 ibmveth_rxq_flags(struct ibmveth_adapter *adapter)
  95. {
  96. return adapter->rx_queue.queue_addr[adapter->rx_queue.index].flags_off;
  97. }
  98. static inline int ibmveth_rxq_toggle(struct ibmveth_adapter *adapter)
  99. {
  100. return (ibmveth_rxq_flags(adapter) & IBMVETH_RXQ_TOGGLE) >>
  101. IBMVETH_RXQ_TOGGLE_SHIFT;
  102. }
  103. static inline int ibmveth_rxq_pending_buffer(struct ibmveth_adapter *adapter)
  104. {
  105. return ibmveth_rxq_toggle(adapter) == adapter->rx_queue.toggle;
  106. }
  107. static inline int ibmveth_rxq_buffer_valid(struct ibmveth_adapter *adapter)
  108. {
  109. return ibmveth_rxq_flags(adapter) & IBMVETH_RXQ_VALID;
  110. }
  111. static inline int ibmveth_rxq_frame_offset(struct ibmveth_adapter *adapter)
  112. {
  113. return ibmveth_rxq_flags(adapter) & IBMVETH_RXQ_OFF_MASK;
  114. }
  115. static inline int ibmveth_rxq_frame_length(struct ibmveth_adapter *adapter)
  116. {
  117. return adapter->rx_queue.queue_addr[adapter->rx_queue.index].length;
  118. }
  119. static inline int ibmveth_rxq_csum_good(struct ibmveth_adapter *adapter)
  120. {
  121. return ibmveth_rxq_flags(adapter) & IBMVETH_RXQ_CSUM_GOOD;
  122. }
  123. /* setup the initial settings for a buffer pool */
  124. static void ibmveth_init_buffer_pool(struct ibmveth_buff_pool *pool,
  125. u32 pool_index, u32 pool_size,
  126. u32 buff_size, u32 pool_active)
  127. {
  128. pool->size = pool_size;
  129. pool->index = pool_index;
  130. pool->buff_size = buff_size;
  131. pool->threshold = pool_size * 7 / 8;
  132. pool->active = pool_active;
  133. }
  134. /* allocate and setup an buffer pool - called during open */
  135. static int ibmveth_alloc_buffer_pool(struct ibmveth_buff_pool *pool)
  136. {
  137. int i;
  138. pool->free_map = kmalloc(sizeof(u16) * pool->size, GFP_KERNEL);
  139. if (!pool->free_map)
  140. return -1;
  141. pool->dma_addr = kmalloc(sizeof(dma_addr_t) * pool->size, GFP_KERNEL);
  142. if (!pool->dma_addr) {
  143. kfree(pool->free_map);
  144. pool->free_map = NULL;
  145. return -1;
  146. }
  147. pool->skbuff = kcalloc(pool->size, sizeof(void *), GFP_KERNEL);
  148. if (!pool->skbuff) {
  149. kfree(pool->dma_addr);
  150. pool->dma_addr = NULL;
  151. kfree(pool->free_map);
  152. pool->free_map = NULL;
  153. return -1;
  154. }
  155. memset(pool->dma_addr, 0, sizeof(dma_addr_t) * pool->size);
  156. for (i = 0; i < pool->size; ++i)
  157. pool->free_map[i] = i;
  158. atomic_set(&pool->available, 0);
  159. pool->producer_index = 0;
  160. pool->consumer_index = 0;
  161. return 0;
  162. }
  163. static inline void ibmveth_flush_buffer(void *addr, unsigned long length)
  164. {
  165. unsigned long offset;
  166. for (offset = 0; offset < length; offset += SMP_CACHE_BYTES)
  167. asm("dcbfl %0,%1" :: "b" (addr), "r" (offset));
  168. }
  169. /* replenish the buffers for a pool. note that we don't need to
  170. * skb_reserve these since they are used for incoming...
  171. */
  172. static void ibmveth_replenish_buffer_pool(struct ibmveth_adapter *adapter,
  173. struct ibmveth_buff_pool *pool)
  174. {
  175. u32 i;
  176. u32 count = pool->size - atomic_read(&pool->available);
  177. u32 buffers_added = 0;
  178. struct sk_buff *skb;
  179. unsigned int free_index, index;
  180. u64 correlator;
  181. unsigned long lpar_rc;
  182. dma_addr_t dma_addr;
  183. mb();
  184. for (i = 0; i < count; ++i) {
  185. union ibmveth_buf_desc desc;
  186. skb = netdev_alloc_skb(adapter->netdev, pool->buff_size);
  187. if (!skb) {
  188. netdev_dbg(adapter->netdev,
  189. "replenish: unable to allocate skb\n");
  190. adapter->replenish_no_mem++;
  191. break;
  192. }
  193. free_index = pool->consumer_index;
  194. pool->consumer_index++;
  195. if (pool->consumer_index >= pool->size)
  196. pool->consumer_index = 0;
  197. index = pool->free_map[free_index];
  198. BUG_ON(index == IBM_VETH_INVALID_MAP);
  199. BUG_ON(pool->skbuff[index] != NULL);
  200. dma_addr = dma_map_single(&adapter->vdev->dev, skb->data,
  201. pool->buff_size, DMA_FROM_DEVICE);
  202. if (dma_mapping_error(&adapter->vdev->dev, dma_addr))
  203. goto failure;
  204. pool->free_map[free_index] = IBM_VETH_INVALID_MAP;
  205. pool->dma_addr[index] = dma_addr;
  206. pool->skbuff[index] = skb;
  207. correlator = ((u64)pool->index << 32) | index;
  208. *(u64 *)skb->data = correlator;
  209. desc.fields.flags_len = IBMVETH_BUF_VALID | pool->buff_size;
  210. desc.fields.address = dma_addr;
  211. if (rx_flush) {
  212. unsigned int len = min(pool->buff_size,
  213. adapter->netdev->mtu +
  214. IBMVETH_BUFF_OH);
  215. ibmveth_flush_buffer(skb->data, len);
  216. }
  217. lpar_rc = h_add_logical_lan_buffer(adapter->vdev->unit_address,
  218. desc.desc);
  219. if (lpar_rc != H_SUCCESS) {
  220. goto failure;
  221. } else {
  222. buffers_added++;
  223. adapter->replenish_add_buff_success++;
  224. }
  225. }
  226. mb();
  227. atomic_add(buffers_added, &(pool->available));
  228. return;
  229. failure:
  230. pool->free_map[free_index] = index;
  231. pool->skbuff[index] = NULL;
  232. if (pool->consumer_index == 0)
  233. pool->consumer_index = pool->size - 1;
  234. else
  235. pool->consumer_index--;
  236. if (!dma_mapping_error(&adapter->vdev->dev, dma_addr))
  237. dma_unmap_single(&adapter->vdev->dev,
  238. pool->dma_addr[index], pool->buff_size,
  239. DMA_FROM_DEVICE);
  240. dev_kfree_skb_any(skb);
  241. adapter->replenish_add_buff_failure++;
  242. mb();
  243. atomic_add(buffers_added, &(pool->available));
  244. }
  245. /* replenish routine */
  246. static void ibmveth_replenish_task(struct ibmveth_adapter *adapter)
  247. {
  248. int i;
  249. adapter->replenish_task_cycles++;
  250. for (i = (IBMVETH_NUM_BUFF_POOLS - 1); i >= 0; i--) {
  251. struct ibmveth_buff_pool *pool = &adapter->rx_buff_pool[i];
  252. if (pool->active &&
  253. (atomic_read(&pool->available) < pool->threshold))
  254. ibmveth_replenish_buffer_pool(adapter, pool);
  255. }
  256. adapter->rx_no_buffer = *(u64 *)(((char*)adapter->buffer_list_addr) +
  257. 4096 - 8);
  258. }
  259. /* empty and free ana buffer pool - also used to do cleanup in error paths */
  260. static void ibmveth_free_buffer_pool(struct ibmveth_adapter *adapter,
  261. struct ibmveth_buff_pool *pool)
  262. {
  263. int i;
  264. kfree(pool->free_map);
  265. pool->free_map = NULL;
  266. if (pool->skbuff && pool->dma_addr) {
  267. for (i = 0; i < pool->size; ++i) {
  268. struct sk_buff *skb = pool->skbuff[i];
  269. if (skb) {
  270. dma_unmap_single(&adapter->vdev->dev,
  271. pool->dma_addr[i],
  272. pool->buff_size,
  273. DMA_FROM_DEVICE);
  274. dev_kfree_skb_any(skb);
  275. pool->skbuff[i] = NULL;
  276. }
  277. }
  278. }
  279. if (pool->dma_addr) {
  280. kfree(pool->dma_addr);
  281. pool->dma_addr = NULL;
  282. }
  283. if (pool->skbuff) {
  284. kfree(pool->skbuff);
  285. pool->skbuff = NULL;
  286. }
  287. }
  288. /* remove a buffer from a pool */
  289. static void ibmveth_remove_buffer_from_pool(struct ibmveth_adapter *adapter,
  290. u64 correlator)
  291. {
  292. unsigned int pool = correlator >> 32;
  293. unsigned int index = correlator & 0xffffffffUL;
  294. unsigned int free_index;
  295. struct sk_buff *skb;
  296. BUG_ON(pool >= IBMVETH_NUM_BUFF_POOLS);
  297. BUG_ON(index >= adapter->rx_buff_pool[pool].size);
  298. skb = adapter->rx_buff_pool[pool].skbuff[index];
  299. BUG_ON(skb == NULL);
  300. adapter->rx_buff_pool[pool].skbuff[index] = NULL;
  301. dma_unmap_single(&adapter->vdev->dev,
  302. adapter->rx_buff_pool[pool].dma_addr[index],
  303. adapter->rx_buff_pool[pool].buff_size,
  304. DMA_FROM_DEVICE);
  305. free_index = adapter->rx_buff_pool[pool].producer_index;
  306. adapter->rx_buff_pool[pool].producer_index++;
  307. if (adapter->rx_buff_pool[pool].producer_index >=
  308. adapter->rx_buff_pool[pool].size)
  309. adapter->rx_buff_pool[pool].producer_index = 0;
  310. adapter->rx_buff_pool[pool].free_map[free_index] = index;
  311. mb();
  312. atomic_dec(&(adapter->rx_buff_pool[pool].available));
  313. }
  314. /* get the current buffer on the rx queue */
  315. static inline struct sk_buff *ibmveth_rxq_get_buffer(struct ibmveth_adapter *adapter)
  316. {
  317. u64 correlator = adapter->rx_queue.queue_addr[adapter->rx_queue.index].correlator;
  318. unsigned int pool = correlator >> 32;
  319. unsigned int index = correlator & 0xffffffffUL;
  320. BUG_ON(pool >= IBMVETH_NUM_BUFF_POOLS);
  321. BUG_ON(index >= adapter->rx_buff_pool[pool].size);
  322. return adapter->rx_buff_pool[pool].skbuff[index];
  323. }
  324. /* recycle the current buffer on the rx queue */
  325. static void ibmveth_rxq_recycle_buffer(struct ibmveth_adapter *adapter)
  326. {
  327. u32 q_index = adapter->rx_queue.index;
  328. u64 correlator = adapter->rx_queue.queue_addr[q_index].correlator;
  329. unsigned int pool = correlator >> 32;
  330. unsigned int index = correlator & 0xffffffffUL;
  331. union ibmveth_buf_desc desc;
  332. unsigned long lpar_rc;
  333. BUG_ON(pool >= IBMVETH_NUM_BUFF_POOLS);
  334. BUG_ON(index >= adapter->rx_buff_pool[pool].size);
  335. if (!adapter->rx_buff_pool[pool].active) {
  336. ibmveth_rxq_harvest_buffer(adapter);
  337. ibmveth_free_buffer_pool(adapter, &adapter->rx_buff_pool[pool]);
  338. return;
  339. }
  340. desc.fields.flags_len = IBMVETH_BUF_VALID |
  341. adapter->rx_buff_pool[pool].buff_size;
  342. desc.fields.address = adapter->rx_buff_pool[pool].dma_addr[index];
  343. lpar_rc = h_add_logical_lan_buffer(adapter->vdev->unit_address, desc.desc);
  344. if (lpar_rc != H_SUCCESS) {
  345. netdev_dbg(adapter->netdev, "h_add_logical_lan_buffer failed "
  346. "during recycle rc=%ld", lpar_rc);
  347. ibmveth_remove_buffer_from_pool(adapter, adapter->rx_queue.queue_addr[adapter->rx_queue.index].correlator);
  348. }
  349. if (++adapter->rx_queue.index == adapter->rx_queue.num_slots) {
  350. adapter->rx_queue.index = 0;
  351. adapter->rx_queue.toggle = !adapter->rx_queue.toggle;
  352. }
  353. }
  354. static void ibmveth_rxq_harvest_buffer(struct ibmveth_adapter *adapter)
  355. {
  356. ibmveth_remove_buffer_from_pool(adapter, adapter->rx_queue.queue_addr[adapter->rx_queue.index].correlator);
  357. if (++adapter->rx_queue.index == adapter->rx_queue.num_slots) {
  358. adapter->rx_queue.index = 0;
  359. adapter->rx_queue.toggle = !adapter->rx_queue.toggle;
  360. }
  361. }
  362. static void ibmveth_cleanup(struct ibmveth_adapter *adapter)
  363. {
  364. int i;
  365. struct device *dev = &adapter->vdev->dev;
  366. if (adapter->buffer_list_addr != NULL) {
  367. if (!dma_mapping_error(dev, adapter->buffer_list_dma)) {
  368. dma_unmap_single(dev, adapter->buffer_list_dma, 4096,
  369. DMA_BIDIRECTIONAL);
  370. adapter->buffer_list_dma = DMA_ERROR_CODE;
  371. }
  372. free_page((unsigned long)adapter->buffer_list_addr);
  373. adapter->buffer_list_addr = NULL;
  374. }
  375. if (adapter->filter_list_addr != NULL) {
  376. if (!dma_mapping_error(dev, adapter->filter_list_dma)) {
  377. dma_unmap_single(dev, adapter->filter_list_dma, 4096,
  378. DMA_BIDIRECTIONAL);
  379. adapter->filter_list_dma = DMA_ERROR_CODE;
  380. }
  381. free_page((unsigned long)adapter->filter_list_addr);
  382. adapter->filter_list_addr = NULL;
  383. }
  384. if (adapter->rx_queue.queue_addr != NULL) {
  385. if (!dma_mapping_error(dev, adapter->rx_queue.queue_dma)) {
  386. dma_unmap_single(dev,
  387. adapter->rx_queue.queue_dma,
  388. adapter->rx_queue.queue_len,
  389. DMA_BIDIRECTIONAL);
  390. adapter->rx_queue.queue_dma = DMA_ERROR_CODE;
  391. }
  392. kfree(adapter->rx_queue.queue_addr);
  393. adapter->rx_queue.queue_addr = NULL;
  394. }
  395. for (i = 0; i < IBMVETH_NUM_BUFF_POOLS; i++)
  396. if (adapter->rx_buff_pool[i].active)
  397. ibmveth_free_buffer_pool(adapter,
  398. &adapter->rx_buff_pool[i]);
  399. if (adapter->bounce_buffer != NULL) {
  400. if (!dma_mapping_error(dev, adapter->bounce_buffer_dma)) {
  401. dma_unmap_single(&adapter->vdev->dev,
  402. adapter->bounce_buffer_dma,
  403. adapter->netdev->mtu + IBMVETH_BUFF_OH,
  404. DMA_BIDIRECTIONAL);
  405. adapter->bounce_buffer_dma = DMA_ERROR_CODE;
  406. }
  407. kfree(adapter->bounce_buffer);
  408. adapter->bounce_buffer = NULL;
  409. }
  410. }
  411. static int ibmveth_register_logical_lan(struct ibmveth_adapter *adapter,
  412. union ibmveth_buf_desc rxq_desc, u64 mac_address)
  413. {
  414. int rc, try_again = 1;
  415. /*
  416. * After a kexec the adapter will still be open, so our attempt to
  417. * open it will fail. So if we get a failure we free the adapter and
  418. * try again, but only once.
  419. */
  420. retry:
  421. rc = h_register_logical_lan(adapter->vdev->unit_address,
  422. adapter->buffer_list_dma, rxq_desc.desc,
  423. adapter->filter_list_dma, mac_address);
  424. if (rc != H_SUCCESS && try_again) {
  425. do {
  426. rc = h_free_logical_lan(adapter->vdev->unit_address);
  427. } while (H_IS_LONG_BUSY(rc) || (rc == H_BUSY));
  428. try_again = 0;
  429. goto retry;
  430. }
  431. return rc;
  432. }
  433. static int ibmveth_open(struct net_device *netdev)
  434. {
  435. struct ibmveth_adapter *adapter = netdev_priv(netdev);
  436. u64 mac_address = 0;
  437. int rxq_entries = 1;
  438. unsigned long lpar_rc;
  439. int rc;
  440. union ibmveth_buf_desc rxq_desc;
  441. int i;
  442. struct device *dev;
  443. netdev_dbg(netdev, "open starting\n");
  444. napi_enable(&adapter->napi);
  445. for(i = 0; i < IBMVETH_NUM_BUFF_POOLS; i++)
  446. rxq_entries += adapter->rx_buff_pool[i].size;
  447. adapter->buffer_list_addr = (void*) get_zeroed_page(GFP_KERNEL);
  448. adapter->filter_list_addr = (void*) get_zeroed_page(GFP_KERNEL);
  449. if (!adapter->buffer_list_addr || !adapter->filter_list_addr) {
  450. netdev_err(netdev, "unable to allocate filter or buffer list "
  451. "pages\n");
  452. ibmveth_cleanup(adapter);
  453. napi_disable(&adapter->napi);
  454. return -ENOMEM;
  455. }
  456. adapter->rx_queue.queue_len = sizeof(struct ibmveth_rx_q_entry) *
  457. rxq_entries;
  458. adapter->rx_queue.queue_addr = kmalloc(adapter->rx_queue.queue_len,
  459. GFP_KERNEL);
  460. if (!adapter->rx_queue.queue_addr) {
  461. netdev_err(netdev, "unable to allocate rx queue pages\n");
  462. ibmveth_cleanup(adapter);
  463. napi_disable(&adapter->napi);
  464. return -ENOMEM;
  465. }
  466. dev = &adapter->vdev->dev;
  467. adapter->buffer_list_dma = dma_map_single(dev,
  468. adapter->buffer_list_addr, 4096, DMA_BIDIRECTIONAL);
  469. adapter->filter_list_dma = dma_map_single(dev,
  470. adapter->filter_list_addr, 4096, DMA_BIDIRECTIONAL);
  471. adapter->rx_queue.queue_dma = dma_map_single(dev,
  472. adapter->rx_queue.queue_addr,
  473. adapter->rx_queue.queue_len, DMA_BIDIRECTIONAL);
  474. if ((dma_mapping_error(dev, adapter->buffer_list_dma)) ||
  475. (dma_mapping_error(dev, adapter->filter_list_dma)) ||
  476. (dma_mapping_error(dev, adapter->rx_queue.queue_dma))) {
  477. netdev_err(netdev, "unable to map filter or buffer list "
  478. "pages\n");
  479. ibmveth_cleanup(adapter);
  480. napi_disable(&adapter->napi);
  481. return -ENOMEM;
  482. }
  483. adapter->rx_queue.index = 0;
  484. adapter->rx_queue.num_slots = rxq_entries;
  485. adapter->rx_queue.toggle = 1;
  486. memcpy(&mac_address, netdev->dev_addr, netdev->addr_len);
  487. mac_address = mac_address >> 16;
  488. rxq_desc.fields.flags_len = IBMVETH_BUF_VALID |
  489. adapter->rx_queue.queue_len;
  490. rxq_desc.fields.address = adapter->rx_queue.queue_dma;
  491. netdev_dbg(netdev, "buffer list @ 0x%p\n", adapter->buffer_list_addr);
  492. netdev_dbg(netdev, "filter list @ 0x%p\n", adapter->filter_list_addr);
  493. netdev_dbg(netdev, "receive q @ 0x%p\n", adapter->rx_queue.queue_addr);
  494. h_vio_signal(adapter->vdev->unit_address, VIO_IRQ_DISABLE);
  495. lpar_rc = ibmveth_register_logical_lan(adapter, rxq_desc, mac_address);
  496. if (lpar_rc != H_SUCCESS) {
  497. netdev_err(netdev, "h_register_logical_lan failed with %ld\n",
  498. lpar_rc);
  499. netdev_err(netdev, "buffer TCE:0x%llx filter TCE:0x%llx rxq "
  500. "desc:0x%llx MAC:0x%llx\n",
  501. adapter->buffer_list_dma,
  502. adapter->filter_list_dma,
  503. rxq_desc.desc,
  504. mac_address);
  505. ibmveth_cleanup(adapter);
  506. napi_disable(&adapter->napi);
  507. return -ENONET;
  508. }
  509. for (i = 0; i < IBMVETH_NUM_BUFF_POOLS; i++) {
  510. if (!adapter->rx_buff_pool[i].active)
  511. continue;
  512. if (ibmveth_alloc_buffer_pool(&adapter->rx_buff_pool[i])) {
  513. netdev_err(netdev, "unable to alloc pool\n");
  514. adapter->rx_buff_pool[i].active = 0;
  515. ibmveth_cleanup(adapter);
  516. napi_disable(&adapter->napi);
  517. return -ENOMEM ;
  518. }
  519. }
  520. netdev_dbg(netdev, "registering irq 0x%x\n", netdev->irq);
  521. rc = request_irq(netdev->irq, ibmveth_interrupt, 0, netdev->name,
  522. netdev);
  523. if (rc != 0) {
  524. netdev_err(netdev, "unable to request irq 0x%x, rc %d\n",
  525. netdev->irq, rc);
  526. do {
  527. rc = h_free_logical_lan(adapter->vdev->unit_address);
  528. } while (H_IS_LONG_BUSY(rc) || (rc == H_BUSY));
  529. ibmveth_cleanup(adapter);
  530. napi_disable(&adapter->napi);
  531. return rc;
  532. }
  533. adapter->bounce_buffer =
  534. kmalloc(netdev->mtu + IBMVETH_BUFF_OH, GFP_KERNEL);
  535. if (!adapter->bounce_buffer) {
  536. netdev_err(netdev, "unable to allocate bounce buffer\n");
  537. ibmveth_cleanup(adapter);
  538. napi_disable(&adapter->napi);
  539. return -ENOMEM;
  540. }
  541. adapter->bounce_buffer_dma =
  542. dma_map_single(&adapter->vdev->dev, adapter->bounce_buffer,
  543. netdev->mtu + IBMVETH_BUFF_OH, DMA_BIDIRECTIONAL);
  544. if (dma_mapping_error(dev, adapter->bounce_buffer_dma)) {
  545. netdev_err(netdev, "unable to map bounce buffer\n");
  546. ibmveth_cleanup(adapter);
  547. napi_disable(&adapter->napi);
  548. return -ENOMEM;
  549. }
  550. netdev_dbg(netdev, "initial replenish cycle\n");
  551. ibmveth_interrupt(netdev->irq, netdev);
  552. netif_start_queue(netdev);
  553. netdev_dbg(netdev, "open complete\n");
  554. return 0;
  555. }
  556. static int ibmveth_close(struct net_device *netdev)
  557. {
  558. struct ibmveth_adapter *adapter = netdev_priv(netdev);
  559. long lpar_rc;
  560. netdev_dbg(netdev, "close starting\n");
  561. napi_disable(&adapter->napi);
  562. if (!adapter->pool_config)
  563. netif_stop_queue(netdev);
  564. h_vio_signal(adapter->vdev->unit_address, VIO_IRQ_DISABLE);
  565. do {
  566. lpar_rc = h_free_logical_lan(adapter->vdev->unit_address);
  567. } while (H_IS_LONG_BUSY(lpar_rc) || (lpar_rc == H_BUSY));
  568. if (lpar_rc != H_SUCCESS) {
  569. netdev_err(netdev, "h_free_logical_lan failed with %lx, "
  570. "continuing with close\n", lpar_rc);
  571. }
  572. free_irq(netdev->irq, netdev);
  573. adapter->rx_no_buffer = *(u64 *)(((char *)adapter->buffer_list_addr) +
  574. 4096 - 8);
  575. ibmveth_cleanup(adapter);
  576. netdev_dbg(netdev, "close complete\n");
  577. return 0;
  578. }
  579. static int netdev_get_settings(struct net_device *dev, struct ethtool_cmd *cmd)
  580. {
  581. cmd->supported = (SUPPORTED_1000baseT_Full | SUPPORTED_Autoneg |
  582. SUPPORTED_FIBRE);
  583. cmd->advertising = (ADVERTISED_1000baseT_Full | ADVERTISED_Autoneg |
  584. ADVERTISED_FIBRE);
  585. cmd->speed = SPEED_1000;
  586. cmd->duplex = DUPLEX_FULL;
  587. cmd->port = PORT_FIBRE;
  588. cmd->phy_address = 0;
  589. cmd->transceiver = XCVR_INTERNAL;
  590. cmd->autoneg = AUTONEG_ENABLE;
  591. cmd->maxtxpkt = 0;
  592. cmd->maxrxpkt = 1;
  593. return 0;
  594. }
  595. static void netdev_get_drvinfo(struct net_device *dev,
  596. struct ethtool_drvinfo *info)
  597. {
  598. strncpy(info->driver, ibmveth_driver_name, sizeof(info->driver) - 1);
  599. strncpy(info->version, ibmveth_driver_version,
  600. sizeof(info->version) - 1);
  601. }
  602. static u32 netdev_get_link(struct net_device *dev)
  603. {
  604. return 1;
  605. }
  606. static void ibmveth_set_rx_csum_flags(struct net_device *dev, u32 data)
  607. {
  608. struct ibmveth_adapter *adapter = netdev_priv(dev);
  609. if (data) {
  610. adapter->rx_csum = 1;
  611. } else {
  612. /*
  613. * Since the ibmveth firmware interface does not have the
  614. * concept of separate tx/rx checksum offload enable, if rx
  615. * checksum is disabled we also have to disable tx checksum
  616. * offload. Once we disable rx checksum offload, we are no
  617. * longer allowed to send tx buffers that are not properly
  618. * checksummed.
  619. */
  620. adapter->rx_csum = 0;
  621. dev->features &= ~NETIF_F_IP_CSUM;
  622. dev->features &= ~NETIF_F_IPV6_CSUM;
  623. }
  624. }
  625. static void ibmveth_set_tx_csum_flags(struct net_device *dev, u32 data)
  626. {
  627. struct ibmveth_adapter *adapter = netdev_priv(dev);
  628. if (data) {
  629. if (adapter->fw_ipv4_csum_support)
  630. dev->features |= NETIF_F_IP_CSUM;
  631. if (adapter->fw_ipv6_csum_support)
  632. dev->features |= NETIF_F_IPV6_CSUM;
  633. adapter->rx_csum = 1;
  634. } else {
  635. dev->features &= ~NETIF_F_IP_CSUM;
  636. dev->features &= ~NETIF_F_IPV6_CSUM;
  637. }
  638. }
  639. static int ibmveth_set_csum_offload(struct net_device *dev, u32 data,
  640. void (*done) (struct net_device *, u32))
  641. {
  642. struct ibmveth_adapter *adapter = netdev_priv(dev);
  643. unsigned long set_attr, clr_attr, ret_attr;
  644. unsigned long set_attr6, clr_attr6;
  645. long ret, ret6;
  646. int rc1 = 0, rc2 = 0;
  647. int restart = 0;
  648. if (netif_running(dev)) {
  649. restart = 1;
  650. adapter->pool_config = 1;
  651. ibmveth_close(dev);
  652. adapter->pool_config = 0;
  653. }
  654. set_attr = 0;
  655. clr_attr = 0;
  656. if (data) {
  657. set_attr = IBMVETH_ILLAN_IPV4_TCP_CSUM;
  658. set_attr6 = IBMVETH_ILLAN_IPV6_TCP_CSUM;
  659. } else {
  660. clr_attr = IBMVETH_ILLAN_IPV4_TCP_CSUM;
  661. clr_attr6 = IBMVETH_ILLAN_IPV6_TCP_CSUM;
  662. }
  663. ret = h_illan_attributes(adapter->vdev->unit_address, 0, 0, &ret_attr);
  664. if (ret == H_SUCCESS && !(ret_attr & IBMVETH_ILLAN_ACTIVE_TRUNK) &&
  665. !(ret_attr & IBMVETH_ILLAN_TRUNK_PRI_MASK) &&
  666. (ret_attr & IBMVETH_ILLAN_PADDED_PKT_CSUM)) {
  667. ret = h_illan_attributes(adapter->vdev->unit_address, clr_attr,
  668. set_attr, &ret_attr);
  669. if (ret != H_SUCCESS) {
  670. netdev_err(dev, "unable to change IPv4 checksum "
  671. "offload settings. %d rc=%ld\n",
  672. data, ret);
  673. ret = h_illan_attributes(adapter->vdev->unit_address,
  674. set_attr, clr_attr, &ret_attr);
  675. } else {
  676. adapter->fw_ipv4_csum_support = data;
  677. }
  678. ret6 = h_illan_attributes(adapter->vdev->unit_address,
  679. clr_attr6, set_attr6, &ret_attr);
  680. if (ret6 != H_SUCCESS) {
  681. netdev_err(dev, "unable to change IPv6 checksum "
  682. "offload settings. %d rc=%ld\n",
  683. data, ret);
  684. ret = h_illan_attributes(adapter->vdev->unit_address,
  685. set_attr6, clr_attr6,
  686. &ret_attr);
  687. } else
  688. adapter->fw_ipv6_csum_support = data;
  689. if (ret == H_SUCCESS || ret6 == H_SUCCESS)
  690. done(dev, data);
  691. else
  692. rc1 = -EIO;
  693. } else {
  694. rc1 = -EIO;
  695. netdev_err(dev, "unable to change checksum offload settings."
  696. " %d rc=%ld ret_attr=%lx\n", data, ret,
  697. ret_attr);
  698. }
  699. if (restart)
  700. rc2 = ibmveth_open(dev);
  701. return rc1 ? rc1 : rc2;
  702. }
  703. static int ibmveth_set_rx_csum(struct net_device *dev, u32 data)
  704. {
  705. struct ibmveth_adapter *adapter = netdev_priv(dev);
  706. if ((data && adapter->rx_csum) || (!data && !adapter->rx_csum))
  707. return 0;
  708. return ibmveth_set_csum_offload(dev, data, ibmveth_set_rx_csum_flags);
  709. }
  710. static int ibmveth_set_tx_csum(struct net_device *dev, u32 data)
  711. {
  712. struct ibmveth_adapter *adapter = netdev_priv(dev);
  713. int rc = 0;
  714. if (data && (dev->features & (NETIF_F_IP_CSUM | NETIF_F_IPV6_CSUM)))
  715. return 0;
  716. if (!data && !(dev->features & (NETIF_F_IP_CSUM | NETIF_F_IPV6_CSUM)))
  717. return 0;
  718. if (data && !adapter->rx_csum)
  719. rc = ibmveth_set_csum_offload(dev, data,
  720. ibmveth_set_tx_csum_flags);
  721. else
  722. ibmveth_set_tx_csum_flags(dev, data);
  723. return rc;
  724. }
  725. static u32 ibmveth_get_rx_csum(struct net_device *dev)
  726. {
  727. struct ibmveth_adapter *adapter = netdev_priv(dev);
  728. return adapter->rx_csum;
  729. }
  730. static void ibmveth_get_strings(struct net_device *dev, u32 stringset, u8 *data)
  731. {
  732. int i;
  733. if (stringset != ETH_SS_STATS)
  734. return;
  735. for (i = 0; i < ARRAY_SIZE(ibmveth_stats); i++, data += ETH_GSTRING_LEN)
  736. memcpy(data, ibmveth_stats[i].name, ETH_GSTRING_LEN);
  737. }
  738. static int ibmveth_get_sset_count(struct net_device *dev, int sset)
  739. {
  740. switch (sset) {
  741. case ETH_SS_STATS:
  742. return ARRAY_SIZE(ibmveth_stats);
  743. default:
  744. return -EOPNOTSUPP;
  745. }
  746. }
  747. static void ibmveth_get_ethtool_stats(struct net_device *dev,
  748. struct ethtool_stats *stats, u64 *data)
  749. {
  750. int i;
  751. struct ibmveth_adapter *adapter = netdev_priv(dev);
  752. for (i = 0; i < ARRAY_SIZE(ibmveth_stats); i++)
  753. data[i] = IBMVETH_GET_STAT(adapter, ibmveth_stats[i].offset);
  754. }
  755. static const struct ethtool_ops netdev_ethtool_ops = {
  756. .get_drvinfo = netdev_get_drvinfo,
  757. .get_settings = netdev_get_settings,
  758. .get_link = netdev_get_link,
  759. .set_tx_csum = ibmveth_set_tx_csum,
  760. .get_rx_csum = ibmveth_get_rx_csum,
  761. .set_rx_csum = ibmveth_set_rx_csum,
  762. .get_strings = ibmveth_get_strings,
  763. .get_sset_count = ibmveth_get_sset_count,
  764. .get_ethtool_stats = ibmveth_get_ethtool_stats,
  765. .set_sg = ethtool_op_set_sg,
  766. };
  767. static int ibmveth_ioctl(struct net_device *dev, struct ifreq *ifr, int cmd)
  768. {
  769. return -EOPNOTSUPP;
  770. }
  771. #define page_offset(v) ((unsigned long)(v) & ((1 << 12) - 1))
  772. static int ibmveth_send(struct ibmveth_adapter *adapter,
  773. union ibmveth_buf_desc *descs)
  774. {
  775. unsigned long correlator;
  776. unsigned int retry_count;
  777. unsigned long ret;
  778. /*
  779. * The retry count sets a maximum for the number of broadcast and
  780. * multicast destinations within the system.
  781. */
  782. retry_count = 1024;
  783. correlator = 0;
  784. do {
  785. ret = h_send_logical_lan(adapter->vdev->unit_address,
  786. descs[0].desc, descs[1].desc,
  787. descs[2].desc, descs[3].desc,
  788. descs[4].desc, descs[5].desc,
  789. correlator, &correlator);
  790. } while ((ret == H_BUSY) && (retry_count--));
  791. if (ret != H_SUCCESS && ret != H_DROPPED) {
  792. netdev_err(adapter->netdev, "tx: h_send_logical_lan failed "
  793. "with rc=%ld\n", ret);
  794. return 1;
  795. }
  796. return 0;
  797. }
  798. static netdev_tx_t ibmveth_start_xmit(struct sk_buff *skb,
  799. struct net_device *netdev)
  800. {
  801. struct ibmveth_adapter *adapter = netdev_priv(netdev);
  802. unsigned int desc_flags;
  803. union ibmveth_buf_desc descs[6];
  804. int last, i;
  805. int force_bounce = 0;
  806. /*
  807. * veth handles a maximum of 6 segments including the header, so
  808. * we have to linearize the skb if there are more than this.
  809. */
  810. if (skb_shinfo(skb)->nr_frags > 5 && __skb_linearize(skb)) {
  811. netdev->stats.tx_dropped++;
  812. goto out;
  813. }
  814. /* veth can't checksum offload UDP */
  815. if (skb->ip_summed == CHECKSUM_PARTIAL &&
  816. ((skb->protocol == htons(ETH_P_IP) &&
  817. ip_hdr(skb)->protocol != IPPROTO_TCP) ||
  818. (skb->protocol == htons(ETH_P_IPV6) &&
  819. ipv6_hdr(skb)->nexthdr != IPPROTO_TCP)) &&
  820. skb_checksum_help(skb)) {
  821. netdev_err(netdev, "tx: failed to checksum packet\n");
  822. netdev->stats.tx_dropped++;
  823. goto out;
  824. }
  825. desc_flags = IBMVETH_BUF_VALID;
  826. if (skb->ip_summed == CHECKSUM_PARTIAL) {
  827. unsigned char *buf = skb_transport_header(skb) +
  828. skb->csum_offset;
  829. desc_flags |= (IBMVETH_BUF_NO_CSUM | IBMVETH_BUF_CSUM_GOOD);
  830. /* Need to zero out the checksum */
  831. buf[0] = 0;
  832. buf[1] = 0;
  833. }
  834. retry_bounce:
  835. memset(descs, 0, sizeof(descs));
  836. /*
  837. * If a linear packet is below the rx threshold then
  838. * copy it into the static bounce buffer. This avoids the
  839. * cost of a TCE insert and remove.
  840. */
  841. if (force_bounce || (!skb_is_nonlinear(skb) &&
  842. (skb->len < tx_copybreak))) {
  843. skb_copy_from_linear_data(skb, adapter->bounce_buffer,
  844. skb->len);
  845. descs[0].fields.flags_len = desc_flags | skb->len;
  846. descs[0].fields.address = adapter->bounce_buffer_dma;
  847. if (ibmveth_send(adapter, descs)) {
  848. adapter->tx_send_failed++;
  849. netdev->stats.tx_dropped++;
  850. } else {
  851. netdev->stats.tx_packets++;
  852. netdev->stats.tx_bytes += skb->len;
  853. }
  854. goto out;
  855. }
  856. /* Map the header */
  857. descs[0].fields.address = dma_map_single(&adapter->vdev->dev, skb->data,
  858. skb_headlen(skb),
  859. DMA_TO_DEVICE);
  860. if (dma_mapping_error(&adapter->vdev->dev, descs[0].fields.address))
  861. goto map_failed;
  862. descs[0].fields.flags_len = desc_flags | skb_headlen(skb);
  863. /* Map the frags */
  864. for (i = 0; i < skb_shinfo(skb)->nr_frags; i++) {
  865. unsigned long dma_addr;
  866. skb_frag_t *frag = &skb_shinfo(skb)->frags[i];
  867. dma_addr = dma_map_page(&adapter->vdev->dev, frag->page,
  868. frag->page_offset, frag->size,
  869. DMA_TO_DEVICE);
  870. if (dma_mapping_error(&adapter->vdev->dev, dma_addr))
  871. goto map_failed_frags;
  872. descs[i+1].fields.flags_len = desc_flags | frag->size;
  873. descs[i+1].fields.address = dma_addr;
  874. }
  875. if (ibmveth_send(adapter, descs)) {
  876. adapter->tx_send_failed++;
  877. netdev->stats.tx_dropped++;
  878. } else {
  879. netdev->stats.tx_packets++;
  880. netdev->stats.tx_bytes += skb->len;
  881. }
  882. for (i = 0; i < skb_shinfo(skb)->nr_frags + 1; i++)
  883. dma_unmap_page(&adapter->vdev->dev, descs[i].fields.address,
  884. descs[i].fields.flags_len & IBMVETH_BUF_LEN_MASK,
  885. DMA_TO_DEVICE);
  886. out:
  887. dev_kfree_skb(skb);
  888. return NETDEV_TX_OK;
  889. map_failed_frags:
  890. last = i+1;
  891. for (i = 0; i < last; i++)
  892. dma_unmap_page(&adapter->vdev->dev, descs[i].fields.address,
  893. descs[i].fields.flags_len & IBMVETH_BUF_LEN_MASK,
  894. DMA_TO_DEVICE);
  895. map_failed:
  896. if (!firmware_has_feature(FW_FEATURE_CMO))
  897. netdev_err(netdev, "tx: unable to map xmit buffer\n");
  898. adapter->tx_map_failed++;
  899. skb_linearize(skb);
  900. force_bounce = 1;
  901. goto retry_bounce;
  902. }
  903. static int ibmveth_poll(struct napi_struct *napi, int budget)
  904. {
  905. struct ibmveth_adapter *adapter =
  906. container_of(napi, struct ibmveth_adapter, napi);
  907. struct net_device *netdev = adapter->netdev;
  908. int frames_processed = 0;
  909. unsigned long lpar_rc;
  910. restart_poll:
  911. do {
  912. if (!ibmveth_rxq_pending_buffer(adapter))
  913. break;
  914. smp_rmb();
  915. if (!ibmveth_rxq_buffer_valid(adapter)) {
  916. wmb(); /* suggested by larson1 */
  917. adapter->rx_invalid_buffer++;
  918. netdev_dbg(netdev, "recycling invalid buffer\n");
  919. ibmveth_rxq_recycle_buffer(adapter);
  920. } else {
  921. struct sk_buff *skb, *new_skb;
  922. int length = ibmveth_rxq_frame_length(adapter);
  923. int offset = ibmveth_rxq_frame_offset(adapter);
  924. int csum_good = ibmveth_rxq_csum_good(adapter);
  925. skb = ibmveth_rxq_get_buffer(adapter);
  926. new_skb = NULL;
  927. if (length < rx_copybreak)
  928. new_skb = netdev_alloc_skb(netdev, length);
  929. if (new_skb) {
  930. skb_copy_to_linear_data(new_skb,
  931. skb->data + offset,
  932. length);
  933. if (rx_flush)
  934. ibmveth_flush_buffer(skb->data,
  935. length + offset);
  936. skb = new_skb;
  937. ibmveth_rxq_recycle_buffer(adapter);
  938. } else {
  939. ibmveth_rxq_harvest_buffer(adapter);
  940. skb_reserve(skb, offset);
  941. }
  942. skb_put(skb, length);
  943. skb->protocol = eth_type_trans(skb, netdev);
  944. if (csum_good)
  945. skb->ip_summed = CHECKSUM_UNNECESSARY;
  946. netif_receive_skb(skb); /* send it up */
  947. netdev->stats.rx_packets++;
  948. netdev->stats.rx_bytes += length;
  949. frames_processed++;
  950. }
  951. } while (frames_processed < budget);
  952. ibmveth_replenish_task(adapter);
  953. if (frames_processed < budget) {
  954. /* We think we are done - reenable interrupts,
  955. * then check once more to make sure we are done.
  956. */
  957. lpar_rc = h_vio_signal(adapter->vdev->unit_address,
  958. VIO_IRQ_ENABLE);
  959. BUG_ON(lpar_rc != H_SUCCESS);
  960. napi_complete(napi);
  961. if (ibmveth_rxq_pending_buffer(adapter) &&
  962. napi_reschedule(napi)) {
  963. lpar_rc = h_vio_signal(adapter->vdev->unit_address,
  964. VIO_IRQ_DISABLE);
  965. goto restart_poll;
  966. }
  967. }
  968. return frames_processed;
  969. }
  970. static irqreturn_t ibmveth_interrupt(int irq, void *dev_instance)
  971. {
  972. struct net_device *netdev = dev_instance;
  973. struct ibmveth_adapter *adapter = netdev_priv(netdev);
  974. unsigned long lpar_rc;
  975. if (napi_schedule_prep(&adapter->napi)) {
  976. lpar_rc = h_vio_signal(adapter->vdev->unit_address,
  977. VIO_IRQ_DISABLE);
  978. BUG_ON(lpar_rc != H_SUCCESS);
  979. __napi_schedule(&adapter->napi);
  980. }
  981. return IRQ_HANDLED;
  982. }
  983. static void ibmveth_set_multicast_list(struct net_device *netdev)
  984. {
  985. struct ibmveth_adapter *adapter = netdev_priv(netdev);
  986. unsigned long lpar_rc;
  987. if ((netdev->flags & IFF_PROMISC) ||
  988. (netdev_mc_count(netdev) > adapter->mcastFilterSize)) {
  989. lpar_rc = h_multicast_ctrl(adapter->vdev->unit_address,
  990. IbmVethMcastEnableRecv |
  991. IbmVethMcastDisableFiltering,
  992. 0);
  993. if (lpar_rc != H_SUCCESS) {
  994. netdev_err(netdev, "h_multicast_ctrl rc=%ld when "
  995. "entering promisc mode\n", lpar_rc);
  996. }
  997. } else {
  998. struct netdev_hw_addr *ha;
  999. /* clear the filter table & disable filtering */
  1000. lpar_rc = h_multicast_ctrl(adapter->vdev->unit_address,
  1001. IbmVethMcastEnableRecv |
  1002. IbmVethMcastDisableFiltering |
  1003. IbmVethMcastClearFilterTable,
  1004. 0);
  1005. if (lpar_rc != H_SUCCESS) {
  1006. netdev_err(netdev, "h_multicast_ctrl rc=%ld when "
  1007. "attempting to clear filter table\n",
  1008. lpar_rc);
  1009. }
  1010. /* add the addresses to the filter table */
  1011. netdev_for_each_mc_addr(ha, netdev) {
  1012. /* add the multicast address to the filter table */
  1013. unsigned long mcast_addr = 0;
  1014. memcpy(((char *)&mcast_addr)+2, ha->addr, 6);
  1015. lpar_rc = h_multicast_ctrl(adapter->vdev->unit_address,
  1016. IbmVethMcastAddFilter,
  1017. mcast_addr);
  1018. if (lpar_rc != H_SUCCESS) {
  1019. netdev_err(netdev, "h_multicast_ctrl rc=%ld "
  1020. "when adding an entry to the filter "
  1021. "table\n", lpar_rc);
  1022. }
  1023. }
  1024. /* re-enable filtering */
  1025. lpar_rc = h_multicast_ctrl(adapter->vdev->unit_address,
  1026. IbmVethMcastEnableFiltering,
  1027. 0);
  1028. if (lpar_rc != H_SUCCESS) {
  1029. netdev_err(netdev, "h_multicast_ctrl rc=%ld when "
  1030. "enabling filtering\n", lpar_rc);
  1031. }
  1032. }
  1033. }
  1034. static int ibmveth_change_mtu(struct net_device *dev, int new_mtu)
  1035. {
  1036. struct ibmveth_adapter *adapter = netdev_priv(dev);
  1037. struct vio_dev *viodev = adapter->vdev;
  1038. int new_mtu_oh = new_mtu + IBMVETH_BUFF_OH;
  1039. int i, rc;
  1040. int need_restart = 0;
  1041. if (new_mtu < IBMVETH_MIN_MTU)
  1042. return -EINVAL;
  1043. for (i = 0; i < IBMVETH_NUM_BUFF_POOLS; i++)
  1044. if (new_mtu_oh < adapter->rx_buff_pool[i].buff_size)
  1045. break;
  1046. if (i == IBMVETH_NUM_BUFF_POOLS)
  1047. return -EINVAL;
  1048. /* Deactivate all the buffer pools so that the next loop can activate
  1049. only the buffer pools necessary to hold the new MTU */
  1050. if (netif_running(adapter->netdev)) {
  1051. need_restart = 1;
  1052. adapter->pool_config = 1;
  1053. ibmveth_close(adapter->netdev);
  1054. adapter->pool_config = 0;
  1055. }
  1056. /* Look for an active buffer pool that can hold the new MTU */
  1057. for (i = 0; i < IBMVETH_NUM_BUFF_POOLS; i++) {
  1058. adapter->rx_buff_pool[i].active = 1;
  1059. if (new_mtu_oh < adapter->rx_buff_pool[i].buff_size) {
  1060. dev->mtu = new_mtu;
  1061. vio_cmo_set_dev_desired(viodev,
  1062. ibmveth_get_desired_dma
  1063. (viodev));
  1064. if (need_restart) {
  1065. return ibmveth_open(adapter->netdev);
  1066. }
  1067. return 0;
  1068. }
  1069. }
  1070. if (need_restart && (rc = ibmveth_open(adapter->netdev)))
  1071. return rc;
  1072. return -EINVAL;
  1073. }
  1074. #ifdef CONFIG_NET_POLL_CONTROLLER
  1075. static void ibmveth_poll_controller(struct net_device *dev)
  1076. {
  1077. ibmveth_replenish_task(netdev_priv(dev));
  1078. ibmveth_interrupt(dev->irq, dev);
  1079. }
  1080. #endif
  1081. /**
  1082. * ibmveth_get_desired_dma - Calculate IO memory desired by the driver
  1083. *
  1084. * @vdev: struct vio_dev for the device whose desired IO mem is to be returned
  1085. *
  1086. * Return value:
  1087. * Number of bytes of IO data the driver will need to perform well.
  1088. */
  1089. static unsigned long ibmveth_get_desired_dma(struct vio_dev *vdev)
  1090. {
  1091. struct net_device *netdev = dev_get_drvdata(&vdev->dev);
  1092. struct ibmveth_adapter *adapter;
  1093. unsigned long ret;
  1094. int i;
  1095. int rxqentries = 1;
  1096. /* netdev inits at probe time along with the structures we need below*/
  1097. if (netdev == NULL)
  1098. return IOMMU_PAGE_ALIGN(IBMVETH_IO_ENTITLEMENT_DEFAULT);
  1099. adapter = netdev_priv(netdev);
  1100. ret = IBMVETH_BUFF_LIST_SIZE + IBMVETH_FILT_LIST_SIZE;
  1101. ret += IOMMU_PAGE_ALIGN(netdev->mtu);
  1102. for (i = 0; i < IBMVETH_NUM_BUFF_POOLS; i++) {
  1103. /* add the size of the active receive buffers */
  1104. if (adapter->rx_buff_pool[i].active)
  1105. ret +=
  1106. adapter->rx_buff_pool[i].size *
  1107. IOMMU_PAGE_ALIGN(adapter->rx_buff_pool[i].
  1108. buff_size);
  1109. rxqentries += adapter->rx_buff_pool[i].size;
  1110. }
  1111. /* add the size of the receive queue entries */
  1112. ret += IOMMU_PAGE_ALIGN(rxqentries * sizeof(struct ibmveth_rx_q_entry));
  1113. return ret;
  1114. }
  1115. static const struct net_device_ops ibmveth_netdev_ops = {
  1116. .ndo_open = ibmveth_open,
  1117. .ndo_stop = ibmveth_close,
  1118. .ndo_start_xmit = ibmveth_start_xmit,
  1119. .ndo_set_multicast_list = ibmveth_set_multicast_list,
  1120. .ndo_do_ioctl = ibmveth_ioctl,
  1121. .ndo_change_mtu = ibmveth_change_mtu,
  1122. .ndo_validate_addr = eth_validate_addr,
  1123. .ndo_set_mac_address = eth_mac_addr,
  1124. #ifdef CONFIG_NET_POLL_CONTROLLER
  1125. .ndo_poll_controller = ibmveth_poll_controller,
  1126. #endif
  1127. };
  1128. static int __devinit ibmveth_probe(struct vio_dev *dev,
  1129. const struct vio_device_id *id)
  1130. {
  1131. int rc, i;
  1132. struct net_device *netdev;
  1133. struct ibmveth_adapter *adapter;
  1134. unsigned char *mac_addr_p;
  1135. unsigned int *mcastFilterSize_p;
  1136. dev_dbg(&dev->dev, "entering ibmveth_probe for UA 0x%x\n",
  1137. dev->unit_address);
  1138. mac_addr_p = (unsigned char *)vio_get_attribute(dev, VETH_MAC_ADDR,
  1139. NULL);
  1140. if (!mac_addr_p) {
  1141. dev_err(&dev->dev, "Can't find VETH_MAC_ADDR attribute\n");
  1142. return -EINVAL;
  1143. }
  1144. mcastFilterSize_p = (unsigned int *)vio_get_attribute(dev,
  1145. VETH_MCAST_FILTER_SIZE, NULL);
  1146. if (!mcastFilterSize_p) {
  1147. dev_err(&dev->dev, "Can't find VETH_MCAST_FILTER_SIZE "
  1148. "attribute\n");
  1149. return -EINVAL;
  1150. }
  1151. netdev = alloc_etherdev(sizeof(struct ibmveth_adapter));
  1152. if (!netdev)
  1153. return -ENOMEM;
  1154. adapter = netdev_priv(netdev);
  1155. dev_set_drvdata(&dev->dev, netdev);
  1156. adapter->vdev = dev;
  1157. adapter->netdev = netdev;
  1158. adapter->mcastFilterSize = *mcastFilterSize_p;
  1159. adapter->pool_config = 0;
  1160. netif_napi_add(netdev, &adapter->napi, ibmveth_poll, 16);
  1161. /*
  1162. * Some older boxes running PHYP non-natively have an OF that returns
  1163. * a 8-byte local-mac-address field (and the first 2 bytes have to be
  1164. * ignored) while newer boxes' OF return a 6-byte field. Note that
  1165. * IEEE 1275 specifies that local-mac-address must be a 6-byte field.
  1166. * The RPA doc specifies that the first byte must be 10b, so we'll
  1167. * just look for it to solve this 8 vs. 6 byte field issue
  1168. */
  1169. if ((*mac_addr_p & 0x3) != 0x02)
  1170. mac_addr_p += 2;
  1171. adapter->mac_addr = 0;
  1172. memcpy(&adapter->mac_addr, mac_addr_p, 6);
  1173. netdev->irq = dev->irq;
  1174. netdev->netdev_ops = &ibmveth_netdev_ops;
  1175. netdev->ethtool_ops = &netdev_ethtool_ops;
  1176. SET_NETDEV_DEV(netdev, &dev->dev);
  1177. netdev->features |= NETIF_F_SG;
  1178. memcpy(netdev->dev_addr, &adapter->mac_addr, netdev->addr_len);
  1179. for (i = 0; i < IBMVETH_NUM_BUFF_POOLS; i++) {
  1180. struct kobject *kobj = &adapter->rx_buff_pool[i].kobj;
  1181. int error;
  1182. ibmveth_init_buffer_pool(&adapter->rx_buff_pool[i], i,
  1183. pool_count[i], pool_size[i],
  1184. pool_active[i]);
  1185. error = kobject_init_and_add(kobj, &ktype_veth_pool,
  1186. &dev->dev.kobj, "pool%d", i);
  1187. if (!error)
  1188. kobject_uevent(kobj, KOBJ_ADD);
  1189. }
  1190. netdev_dbg(netdev, "adapter @ 0x%p\n", adapter);
  1191. adapter->buffer_list_dma = DMA_ERROR_CODE;
  1192. adapter->filter_list_dma = DMA_ERROR_CODE;
  1193. adapter->rx_queue.queue_dma = DMA_ERROR_CODE;
  1194. netdev_dbg(netdev, "registering netdev...\n");
  1195. ibmveth_set_csum_offload(netdev, 1, ibmveth_set_tx_csum_flags);
  1196. rc = register_netdev(netdev);
  1197. if (rc) {
  1198. netdev_dbg(netdev, "failed to register netdev rc=%d\n", rc);
  1199. free_netdev(netdev);
  1200. return rc;
  1201. }
  1202. netdev_dbg(netdev, "registered\n");
  1203. return 0;
  1204. }
  1205. static int __devexit ibmveth_remove(struct vio_dev *dev)
  1206. {
  1207. struct net_device *netdev = dev_get_drvdata(&dev->dev);
  1208. struct ibmveth_adapter *adapter = netdev_priv(netdev);
  1209. int i;
  1210. for (i = 0; i < IBMVETH_NUM_BUFF_POOLS; i++)
  1211. kobject_put(&adapter->rx_buff_pool[i].kobj);
  1212. unregister_netdev(netdev);
  1213. free_netdev(netdev);
  1214. dev_set_drvdata(&dev->dev, NULL);
  1215. return 0;
  1216. }
  1217. static struct attribute veth_active_attr;
  1218. static struct attribute veth_num_attr;
  1219. static struct attribute veth_size_attr;
  1220. static ssize_t veth_pool_show(struct kobject *kobj,
  1221. struct attribute *attr, char *buf)
  1222. {
  1223. struct ibmveth_buff_pool *pool = container_of(kobj,
  1224. struct ibmveth_buff_pool,
  1225. kobj);
  1226. if (attr == &veth_active_attr)
  1227. return sprintf(buf, "%d\n", pool->active);
  1228. else if (attr == &veth_num_attr)
  1229. return sprintf(buf, "%d\n", pool->size);
  1230. else if (attr == &veth_size_attr)
  1231. return sprintf(buf, "%d\n", pool->buff_size);
  1232. return 0;
  1233. }
  1234. static ssize_t veth_pool_store(struct kobject *kobj, struct attribute *attr,
  1235. const char *buf, size_t count)
  1236. {
  1237. struct ibmveth_buff_pool *pool = container_of(kobj,
  1238. struct ibmveth_buff_pool,
  1239. kobj);
  1240. struct net_device *netdev = dev_get_drvdata(
  1241. container_of(kobj->parent, struct device, kobj));
  1242. struct ibmveth_adapter *adapter = netdev_priv(netdev);
  1243. long value = simple_strtol(buf, NULL, 10);
  1244. long rc;
  1245. if (attr == &veth_active_attr) {
  1246. if (value && !pool->active) {
  1247. if (netif_running(netdev)) {
  1248. if (ibmveth_alloc_buffer_pool(pool)) {
  1249. netdev_err(netdev,
  1250. "unable to alloc pool\n");
  1251. return -ENOMEM;
  1252. }
  1253. pool->active = 1;
  1254. adapter->pool_config = 1;
  1255. ibmveth_close(netdev);
  1256. adapter->pool_config = 0;
  1257. if ((rc = ibmveth_open(netdev)))
  1258. return rc;
  1259. } else {
  1260. pool->active = 1;
  1261. }
  1262. } else if (!value && pool->active) {
  1263. int mtu = netdev->mtu + IBMVETH_BUFF_OH;
  1264. int i;
  1265. /* Make sure there is a buffer pool with buffers that
  1266. can hold a packet of the size of the MTU */
  1267. for (i = 0; i < IBMVETH_NUM_BUFF_POOLS; i++) {
  1268. if (pool == &adapter->rx_buff_pool[i])
  1269. continue;
  1270. if (!adapter->rx_buff_pool[i].active)
  1271. continue;
  1272. if (mtu <= adapter->rx_buff_pool[i].buff_size)
  1273. break;
  1274. }
  1275. if (i == IBMVETH_NUM_BUFF_POOLS) {
  1276. netdev_err(netdev, "no active pool >= MTU\n");
  1277. return -EPERM;
  1278. }
  1279. if (netif_running(netdev)) {
  1280. adapter->pool_config = 1;
  1281. ibmveth_close(netdev);
  1282. pool->active = 0;
  1283. adapter->pool_config = 0;
  1284. if ((rc = ibmveth_open(netdev)))
  1285. return rc;
  1286. }
  1287. pool->active = 0;
  1288. }
  1289. } else if (attr == &veth_num_attr) {
  1290. if (value <= 0 || value > IBMVETH_MAX_POOL_COUNT) {
  1291. return -EINVAL;
  1292. } else {
  1293. if (netif_running(netdev)) {
  1294. adapter->pool_config = 1;
  1295. ibmveth_close(netdev);
  1296. adapter->pool_config = 0;
  1297. pool->size = value;
  1298. if ((rc = ibmveth_open(netdev)))
  1299. return rc;
  1300. } else {
  1301. pool->size = value;
  1302. }
  1303. }
  1304. } else if (attr == &veth_size_attr) {
  1305. if (value <= IBMVETH_BUFF_OH || value > IBMVETH_MAX_BUF_SIZE) {
  1306. return -EINVAL;
  1307. } else {
  1308. if (netif_running(netdev)) {
  1309. adapter->pool_config = 1;
  1310. ibmveth_close(netdev);
  1311. adapter->pool_config = 0;
  1312. pool->buff_size = value;
  1313. if ((rc = ibmveth_open(netdev)))
  1314. return rc;
  1315. } else {
  1316. pool->buff_size = value;
  1317. }
  1318. }
  1319. }
  1320. /* kick the interrupt handler to allocate/deallocate pools */
  1321. ibmveth_interrupt(netdev->irq, netdev);
  1322. return count;
  1323. }
  1324. #define ATTR(_name, _mode) \
  1325. struct attribute veth_##_name##_attr = { \
  1326. .name = __stringify(_name), .mode = _mode, \
  1327. };
  1328. static ATTR(active, 0644);
  1329. static ATTR(num, 0644);
  1330. static ATTR(size, 0644);
  1331. static struct attribute *veth_pool_attrs[] = {
  1332. &veth_active_attr,
  1333. &veth_num_attr,
  1334. &veth_size_attr,
  1335. NULL,
  1336. };
  1337. static const struct sysfs_ops veth_pool_ops = {
  1338. .show = veth_pool_show,
  1339. .store = veth_pool_store,
  1340. };
  1341. static struct kobj_type ktype_veth_pool = {
  1342. .release = NULL,
  1343. .sysfs_ops = &veth_pool_ops,
  1344. .default_attrs = veth_pool_attrs,
  1345. };
  1346. static int ibmveth_resume(struct device *dev)
  1347. {
  1348. struct net_device *netdev = dev_get_drvdata(dev);
  1349. ibmveth_interrupt(netdev->irq, netdev);
  1350. return 0;
  1351. }
  1352. static struct vio_device_id ibmveth_device_table[] __devinitdata = {
  1353. { "network", "IBM,l-lan"},
  1354. { "", "" }
  1355. };
  1356. MODULE_DEVICE_TABLE(vio, ibmveth_device_table);
  1357. static struct dev_pm_ops ibmveth_pm_ops = {
  1358. .resume = ibmveth_resume
  1359. };
  1360. static struct vio_driver ibmveth_driver = {
  1361. .id_table = ibmveth_device_table,
  1362. .probe = ibmveth_probe,
  1363. .remove = ibmveth_remove,
  1364. .get_desired_dma = ibmveth_get_desired_dma,
  1365. .driver = {
  1366. .name = ibmveth_driver_name,
  1367. .owner = THIS_MODULE,
  1368. .pm = &ibmveth_pm_ops,
  1369. }
  1370. };
  1371. static int __init ibmveth_module_init(void)
  1372. {
  1373. printk(KERN_DEBUG "%s: %s %s\n", ibmveth_driver_name,
  1374. ibmveth_driver_string, ibmveth_driver_version);
  1375. return vio_register_driver(&ibmveth_driver);
  1376. }
  1377. static void __exit ibmveth_module_exit(void)
  1378. {
  1379. vio_unregister_driver(&ibmveth_driver);
  1380. }
  1381. module_init(ibmveth_module_init);
  1382. module_exit(ibmveth_module_exit);