patch-2_6_7-vs1_9_1_12
[linux-2.6.git] / drivers / net / ibmveth.c
1 /**************************************************************************/
2 /*                                                                        */
3 /* IBM eServer i/pSeries Virtual Ethernet Device Driver                   */
4 /* Copyright (C) 2003 IBM Corp.                                           */
5 /*  Dave Larson (larson1@us.ibm.com)                                      */
6 /*  Santiago Leon (santil@us.ibm.com)                                     */
7 /*                                                                        */
8 /*  This program is free software; you can redistribute it and/or modify  */
9 /*  it under the terms of the GNU General Public License as published by  */
10 /*  the Free Software Foundation; either version 2 of the License, or     */
11 /*  (at your option) any later version.                                   */
12 /*                                                                        */
13 /*  This program is distributed in the hope that it will be useful,       */
14 /*  but WITHOUT ANY WARRANTY; without even the implied warranty of        */
15 /*  MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the         */
16 /*  GNU General Public License for more details.                          */
17 /*                                                                        */
18 /*  You should have received a copy of the GNU General Public License     */
19 /*  along with this program; if not, write to the Free Software           */
20 /*  Foundation, Inc., 59 Temple Place, Suite 330, Boston, MA  02111-1307  */
21 /*                                                                   USA  */
22 /*                                                                        */
23 /* This module contains the implementation of a virtual ethernet device   */
24 /* for use with IBM i/pSeries LPAR Linux.  It utilizes the logical LAN    */
25 /* option of the RS/6000 Platform Architecture to interface with virtual  */
26 /* ethernet NICs that are presented to the partition by the hypervisor.   */
27 /*                                                                        */ 
28 /**************************************************************************/
29 /*
30   TODO:
31   - remove frag processing code - no longer needed
32   - add support for sysfs
33   - possibly remove procfs support
34 */
35
36 #include <linux/config.h>
37 #include <linux/module.h>
38 #include <linux/version.h>
39 #include <linux/types.h>
40 #include <linux/errno.h>
41 #include <linux/ioport.h>
42 #include <linux/dma-mapping.h>
43 #include <linux/kernel.h>
44 #include <linux/netdevice.h>
45 #include <linux/etherdevice.h>
46 #include <linux/skbuff.h>
47 #include <linux/init.h>
48 #include <linux/delay.h>
49 #include <linux/mm.h>
50 #include <linux/ethtool.h>
51 #include <linux/proc_fs.h>
52 #include <asm/semaphore.h>
53 #include <asm/hvcall.h>
54 #include <asm/atomic.h>
55 #include <asm/iommu.h>
56 #include <asm/vio.h>
57 #include <asm/uaccess.h>
58 #include <linux/seq_file.h>
59
60 #include "ibmveth.h"
61
/* When DEBUG is defined the debug-print and assertion macros below expand to
 * real code; otherwise they expand to nothing. */
#define DEBUG 1

/* Informational message prefixed with the source file name. */
#define ibmveth_printk(fmt, args...) \
  printk(KERN_INFO "%s: " fmt, __FILE__, ## args)

/* Error message tagged with file, line and the adapter's unit address.
 * Requires a variable named `adapter` in scope at the call site. */
#define ibmveth_error_printk(fmt, args...) \
  printk(KERN_ERR "(%s:%3.3d ua:%x) ERROR: " fmt, __FILE__, __LINE__ , adapter->vdev->unit_address, ## args)

#ifdef DEBUG
/* Debug message for contexts where no `adapter` variable is available. */
#define ibmveth_debug_printk_no_adapter(fmt, args...) \
  printk(KERN_DEBUG "(%s:%3.3d): " fmt, __FILE__, __LINE__ , ## args)
/* Debug message tagged with the unit address; needs `adapter` in scope. */
#define ibmveth_debug_printk(fmt, args...) \
  printk(KERN_DEBUG "(%s:%3.3d ua:%x): " fmt, __FILE__, __LINE__ , adapter->vdev->unit_address, ## args)
/* Log the failed expression and BUG().  Needs `adapter` in scope.
 * Wrapped in do { } while (0) so the macro behaves as a single statement:
 * a bare `if { }` expansion breaks (or silently re-binds the `else`) when
 * the assertion is used as the body of an if/else. */
#define ibmveth_assert(expr) \
  do {                                            \
    if(!(expr)) {                                 \
      printk(KERN_DEBUG "assertion failed (%s:%3.3d ua:%x): %s\n", __FILE__, __LINE__, adapter->vdev->unit_address, #expr); \
      BUG(); \
    } \
  } while (0)
#else
#define ibmveth_debug_printk_no_adapter(fmt, args...)
#define ibmveth_debug_printk(fmt, args...)
#define ibmveth_assert(expr) do { } while (0)
#endif
85
86 static int ibmveth_open(struct net_device *dev);
87 static int ibmveth_close(struct net_device *dev);
88 static int ibmveth_ioctl(struct net_device *dev, struct ifreq *ifr, int cmd);
89 static int ibmveth_poll(struct net_device *dev, int *budget);
90 static int ibmveth_start_xmit(struct sk_buff *skb, struct net_device *dev);
91 static struct net_device_stats *ibmveth_get_stats(struct net_device *dev);
92 static void ibmveth_set_multicast_list(struct net_device *dev);
93 static int ibmveth_change_mtu(struct net_device *dev, int new_mtu);
94 static void ibmveth_proc_register_driver(void);
95 static void ibmveth_proc_unregister_driver(void);
96 static void ibmveth_proc_register_adapter(struct ibmveth_adapter *adapter);
97 static void ibmveth_proc_unregister_adapter(struct ibmveth_adapter *adapter);
98 static irqreturn_t ibmveth_interrupt(int irq, void *dev_instance, struct pt_regs *regs);
99
100 #ifdef CONFIG_PROC_FS
101 #define IBMVETH_PROC_DIR "ibmveth"
102 static struct proc_dir_entry *ibmveth_proc_dir;
103 #endif
104
105 static const char ibmveth_driver_name[] = "ibmveth";
106 static const char ibmveth_driver_string[] = "IBM i/pSeries Virtual Ethernet Driver";
107 static const char ibmveth_driver_version[] = "1.0";
108
109 MODULE_AUTHOR("Dave Larson <larson1@us.ibm.com>");
110 MODULE_DESCRIPTION("IBM i/pSeries Virtual Ethernet Driver");
111 MODULE_LICENSE("GPL");
112
113 /* simple methods of getting data from the current rxq entry */
114 static inline int ibmveth_rxq_pending_buffer(struct ibmveth_adapter *adapter)
115 {
116         return (adapter->rx_queue.queue_addr[adapter->rx_queue.index].toggle == adapter->rx_queue.toggle);
117 }
118
119 static inline int ibmveth_rxq_buffer_valid(struct ibmveth_adapter *adapter)
120 {
121         return (adapter->rx_queue.queue_addr[adapter->rx_queue.index].valid);
122 }
123
124 static inline int ibmveth_rxq_frame_offset(struct ibmveth_adapter *adapter)
125 {
126         return (adapter->rx_queue.queue_addr[adapter->rx_queue.index].offset);
127 }
128
129 static inline int ibmveth_rxq_frame_length(struct ibmveth_adapter *adapter)
130 {
131         return (adapter->rx_queue.queue_addr[adapter->rx_queue.index].length);
132 }
133
134 /* setup the initial settings for a buffer pool */
135 static void ibmveth_init_buffer_pool(struct ibmveth_buff_pool *pool, u32 pool_index, u32 pool_size, u32 buff_size)
136 {
137         pool->size = pool_size;
138         pool->index = pool_index;
139         pool->buff_size = buff_size;
140         pool->threshold = pool_size / 2;
141 }
142
143 /* allocate and setup an buffer pool - called during open */
144 static int ibmveth_alloc_buffer_pool(struct ibmveth_buff_pool *pool)
145 {
146         int i;
147
148         pool->free_map = kmalloc(sizeof(u16) * pool->size, GFP_KERNEL); 
149
150         if(!pool->free_map) {
151                 return -1;
152         }
153
154         pool->dma_addr = kmalloc(sizeof(dma_addr_t) * pool->size, GFP_KERNEL); 
155         if(!pool->dma_addr) {
156                 kfree(pool->free_map);
157                 pool->free_map = NULL;
158                 return -1;
159         }
160
161         pool->skbuff = kmalloc(sizeof(void*) * pool->size, GFP_KERNEL);
162
163         if(!pool->skbuff) {
164                 kfree(pool->dma_addr);
165                 pool->dma_addr = NULL;
166
167                 kfree(pool->free_map);
168                 pool->free_map = NULL;
169                 return -1;
170         }
171
172         memset(pool->skbuff, 0, sizeof(void*) * pool->size);
173         memset(pool->dma_addr, 0, sizeof(dma_addr_t) * pool->size);
174
175         for(i = 0; i < pool->size; ++i) {
176                 pool->free_map[i] = i;
177         }
178
179         atomic_set(&pool->available, 0);
180         pool->producer_index = 0;
181         pool->consumer_index = 0;
182
183         return 0;
184 }
185
186 /* replenish the buffers for a pool.  note that we don't need to
187  * skb_reserve these since they are used for incoming...
188  */
189 static void ibmveth_replenish_buffer_pool(struct ibmveth_adapter *adapter, struct ibmveth_buff_pool *pool)
190 {
191         u32 i;
192         u32 count = pool->size - atomic_read(&pool->available);
193         u32 buffers_added = 0;
194
195         mb();
196
197         for(i = 0; i < count; ++i) {
198                 struct sk_buff *skb;
199                 unsigned int free_index, index;
200                 u64 correlator;
201                 union ibmveth_buf_desc desc;
202                 unsigned long lpar_rc;
203                 dma_addr_t dma_addr;
204
205                 skb = alloc_skb(pool->buff_size, GFP_ATOMIC);
206
207                 if(!skb) {
208                         ibmveth_debug_printk("replenish: unable to allocate skb\n");
209                         adapter->replenish_no_mem++;
210                         break;
211                 }
212
213                 free_index = pool->consumer_index++ % pool->size;
214                 index = pool->free_map[free_index];
215         
216                 ibmveth_assert(index != 0xffff);
217                 ibmveth_assert(pool->skbuff[index] == NULL);
218
219                 dma_addr = vio_map_single(adapter->vdev, skb->data, pool->buff_size, DMA_FROM_DEVICE);
220
221                 pool->dma_addr[index] = dma_addr;
222                 pool->skbuff[index] = skb;
223
224                 correlator = ((u64)pool->index << 32) | index;
225                 *(u64*)skb->data = correlator;
226
227                 desc.desc = 0;
228                 desc.fields.valid = 1;
229                 desc.fields.length = pool->buff_size;
230                 desc.fields.address = dma_addr; 
231
232                 lpar_rc = h_add_logical_lan_buffer(adapter->vdev->unit_address, desc.desc);
233                     
234                 if(lpar_rc != H_Success) {
235                         pool->skbuff[index] = NULL;
236                         pool->consumer_index--;
237                         vio_unmap_single(adapter->vdev, pool->dma_addr[index], pool->buff_size, DMA_FROM_DEVICE);
238                         dev_kfree_skb_any(skb);
239                         adapter->replenish_add_buff_failure++;
240                         break;
241                 } else {
242                         pool->free_map[free_index] = 0xffff;
243                         buffers_added++;
244                         adapter->replenish_add_buff_success++;
245                 }
246         }
247     
248         mb();
249         atomic_add(buffers_added, &(pool->available));
250 }
251
252 /* check if replenishing is needed.  */
253 static inline int ibmveth_is_replenishing_needed(struct ibmveth_adapter *adapter)
254 {
255         return ((atomic_read(&adapter->rx_buff_pool[0].available) < adapter->rx_buff_pool[0].threshold) ||
256                 (atomic_read(&adapter->rx_buff_pool[1].available) < adapter->rx_buff_pool[1].threshold) ||
257                 (atomic_read(&adapter->rx_buff_pool[2].available) < adapter->rx_buff_pool[2].threshold));
258 }
259
260 /* replenish tasklet routine */
261 static void ibmveth_replenish_task(struct ibmveth_adapter *adapter) 
262 {
263         adapter->replenish_task_cycles++;
264
265         ibmveth_replenish_buffer_pool(adapter, &adapter->rx_buff_pool[0]);
266         ibmveth_replenish_buffer_pool(adapter, &adapter->rx_buff_pool[1]);
267         ibmveth_replenish_buffer_pool(adapter, &adapter->rx_buff_pool[2]);
268
269         adapter->rx_no_buffer = *(u64*)(((char*)adapter->buffer_list_addr) + 4096 - 8);
270
271         atomic_inc(&adapter->not_replenishing);
272         ibmveth_assert(atomic_read(&adapter->not_replenishing) == 1);
273 }
274
275 /* kick the replenish tasklet if we need replenishing and it isn't already running */
276 static inline void ibmveth_schedule_replenishing(struct ibmveth_adapter *adapter)
277 {
278         if(ibmveth_is_replenishing_needed(adapter) && 
279            (atomic_dec_if_positive(&adapter->not_replenishing) == 0)) { 
280                 schedule_work(&adapter->replenish_task);
281         }
282 }
283
284 /* empty and free ana buffer pool - also used to do cleanup in error paths */
285 static void ibmveth_free_buffer_pool(struct ibmveth_adapter *adapter, struct ibmveth_buff_pool *pool)
286 {
287         int i;
288
289         if(pool->free_map) {
290                 kfree(pool->free_map);
291                 pool->free_map  = NULL;
292         }
293
294         if(pool->skbuff && pool->dma_addr) {
295                 for(i = 0; i < pool->size; ++i) {
296                         struct sk_buff *skb = pool->skbuff[i];
297                         if(skb) {
298                                 vio_unmap_single(adapter->vdev,
299                                                  pool->dma_addr[i],
300                                                  pool->buff_size,
301                                                  DMA_FROM_DEVICE);
302                                 dev_kfree_skb_any(skb);
303                                 pool->skbuff[i] = NULL;
304                         }
305                 }
306         }
307
308         if(pool->dma_addr) {
309                 kfree(pool->dma_addr);
310                 pool->dma_addr = NULL;
311         }
312
313         if(pool->skbuff) {
314                 kfree(pool->skbuff);
315                 pool->skbuff = NULL;
316         }
317 }
318
319 /* remove a buffer from a pool */
320 static void ibmveth_remove_buffer_from_pool(struct ibmveth_adapter *adapter, u64 correlator)
321 {
322         unsigned int pool  = correlator >> 32;
323         unsigned int index = correlator & 0xffffffffUL;
324         unsigned int free_index;
325         struct sk_buff *skb;
326
327         ibmveth_assert(pool < IbmVethNumBufferPools);
328         ibmveth_assert(index < adapter->rx_buff_pool[pool].size);
329
330         skb = adapter->rx_buff_pool[pool].skbuff[index];
331
332         ibmveth_assert(skb != NULL);
333
334         adapter->rx_buff_pool[pool].skbuff[index] = NULL;
335
336         vio_unmap_single(adapter->vdev,
337                          adapter->rx_buff_pool[pool].dma_addr[index],
338                          adapter->rx_buff_pool[pool].buff_size,
339                          DMA_FROM_DEVICE);
340
341         free_index = adapter->rx_buff_pool[pool].producer_index++ % adapter->rx_buff_pool[pool].size;
342         adapter->rx_buff_pool[pool].free_map[free_index] = index;
343
344         mb();
345
346         atomic_dec(&(adapter->rx_buff_pool[pool].available));
347 }
348
349 /* get the current buffer on the rx queue */
350 static inline struct sk_buff *ibmveth_rxq_get_buffer(struct ibmveth_adapter *adapter)
351 {
352         u64 correlator = adapter->rx_queue.queue_addr[adapter->rx_queue.index].correlator;
353         unsigned int pool = correlator >> 32;
354         unsigned int index = correlator & 0xffffffffUL;
355
356         ibmveth_assert(pool < IbmVethNumBufferPools);
357         ibmveth_assert(index < adapter->rx_buff_pool[pool].size);
358
359         return adapter->rx_buff_pool[pool].skbuff[index];
360 }
361
362 /* recycle the current buffer on the rx queue */
363 static void ibmveth_rxq_recycle_buffer(struct ibmveth_adapter *adapter)
364 {
365         u32 q_index = adapter->rx_queue.index;
366         u64 correlator = adapter->rx_queue.queue_addr[q_index].correlator;
367         unsigned int pool = correlator >> 32;
368         unsigned int index = correlator & 0xffffffffUL;
369         union ibmveth_buf_desc desc;
370         unsigned long lpar_rc;
371
372         ibmveth_assert(pool < IbmVethNumBufferPools);
373         ibmveth_assert(index < adapter->rx_buff_pool[pool].size);
374
375         desc.desc = 0;
376         desc.fields.valid = 1;
377         desc.fields.length = adapter->rx_buff_pool[pool].buff_size;
378         desc.fields.address = adapter->rx_buff_pool[pool].dma_addr[index];
379
380         lpar_rc = h_add_logical_lan_buffer(adapter->vdev->unit_address, desc.desc);
381                     
382         if(lpar_rc != H_Success) {
383                 ibmveth_debug_printk("h_add_logical_lan_buffer failed during recycle rc=%ld", lpar_rc);
384                 ibmveth_remove_buffer_from_pool(adapter, adapter->rx_queue.queue_addr[adapter->rx_queue.index].correlator);
385         }
386
387         if(++adapter->rx_queue.index == adapter->rx_queue.num_slots) {
388                 adapter->rx_queue.index = 0;
389                 adapter->rx_queue.toggle = !adapter->rx_queue.toggle;
390         }
391 }
392
393 static inline void ibmveth_rxq_harvest_buffer(struct ibmveth_adapter *adapter)
394 {
395         ibmveth_remove_buffer_from_pool(adapter, adapter->rx_queue.queue_addr[adapter->rx_queue.index].correlator);
396
397         if(++adapter->rx_queue.index == adapter->rx_queue.num_slots) {
398                 adapter->rx_queue.index = 0;
399                 adapter->rx_queue.toggle = !adapter->rx_queue.toggle;
400         }
401 }
402
403 static void ibmveth_cleanup(struct ibmveth_adapter *adapter)
404 {
405         if(adapter->buffer_list_addr != NULL) {
406                 if(!dma_mapping_error(adapter->buffer_list_dma)) {
407                         vio_unmap_single(adapter->vdev, adapter->buffer_list_dma, 4096, DMA_BIDIRECTIONAL);
408                         adapter->buffer_list_dma = DMA_ERROR_CODE;
409                 }
410                 free_page((unsigned long)adapter->buffer_list_addr);
411                 adapter->buffer_list_addr = NULL;
412         } 
413
414         if(adapter->filter_list_addr != NULL) {
415                 if(!dma_mapping_error(adapter->filter_list_dma)) {
416                         vio_unmap_single(adapter->vdev, adapter->filter_list_dma, 4096, DMA_BIDIRECTIONAL);
417                         adapter->filter_list_dma = DMA_ERROR_CODE;
418                 }
419                 free_page((unsigned long)adapter->filter_list_addr);
420                 adapter->filter_list_addr = NULL;
421         }
422
423         if(adapter->rx_queue.queue_addr != NULL) {
424                 if(!dma_mapping_error(adapter->rx_queue.queue_dma)) {
425                         vio_unmap_single(adapter->vdev, adapter->rx_queue.queue_dma, adapter->rx_queue.queue_len, DMA_BIDIRECTIONAL);
426                         adapter->rx_queue.queue_dma = DMA_ERROR_CODE;
427                 }
428                 kfree(adapter->rx_queue.queue_addr);
429                 adapter->rx_queue.queue_addr = NULL;
430         }
431
432         ibmveth_free_buffer_pool(adapter, &adapter->rx_buff_pool[0]);
433         ibmveth_free_buffer_pool(adapter, &adapter->rx_buff_pool[1]);
434         ibmveth_free_buffer_pool(adapter, &adapter->rx_buff_pool[2]);
435 }
436
437 static int ibmveth_open(struct net_device *netdev)
438 {
439         struct ibmveth_adapter *adapter = netdev->priv;
440         u64 mac_address = 0;
441         int rxq_entries;
442         unsigned long lpar_rc;
443         int rc;
444         union ibmveth_buf_desc rxq_desc;
445
446         ibmveth_debug_printk("open starting\n");
447
448         rxq_entries =
449                 adapter->rx_buff_pool[0].size +
450                 adapter->rx_buff_pool[1].size +
451                 adapter->rx_buff_pool[2].size + 1;
452     
453         adapter->buffer_list_addr = (void*) get_zeroed_page(GFP_KERNEL);
454         adapter->filter_list_addr = (void*) get_zeroed_page(GFP_KERNEL);
455  
456         if(!adapter->buffer_list_addr || !adapter->filter_list_addr) {
457                 ibmveth_error_printk("unable to allocate filter or buffer list pages\n");
458                 ibmveth_cleanup(adapter);
459                 return -ENOMEM;
460         }
461
462         adapter->rx_queue.queue_len = sizeof(struct ibmveth_rx_q_entry) * rxq_entries;
463         adapter->rx_queue.queue_addr = kmalloc(adapter->rx_queue.queue_len, GFP_KERNEL);
464
465         if(!adapter->rx_queue.queue_addr) {
466                 ibmveth_error_printk("unable to allocate rx queue pages\n");
467                 ibmveth_cleanup(adapter);
468                 return -ENOMEM;
469         }
470
471         adapter->buffer_list_dma = vio_map_single(adapter->vdev, adapter->buffer_list_addr, 4096, DMA_BIDIRECTIONAL);
472         adapter->filter_list_dma = vio_map_single(adapter->vdev, adapter->filter_list_addr, 4096, DMA_BIDIRECTIONAL);
473         adapter->rx_queue.queue_dma = vio_map_single(adapter->vdev, adapter->rx_queue.queue_addr, adapter->rx_queue.queue_len, DMA_BIDIRECTIONAL);
474
475         if((dma_mapping_error(adapter->buffer_list_dma) ) ||
476            (dma_mapping_error(adapter->filter_list_dma)) ||
477            (dma_mapping_error(adapter->rx_queue.queue_dma))) {
478                 ibmveth_error_printk("unable to map filter or buffer list pages\n");
479                 ibmveth_cleanup(adapter);
480                 return -ENOMEM;
481         }
482
483         adapter->rx_queue.index = 0;
484         adapter->rx_queue.num_slots = rxq_entries;
485         adapter->rx_queue.toggle = 1;
486
487         if(ibmveth_alloc_buffer_pool(&adapter->rx_buff_pool[0]) ||
488            ibmveth_alloc_buffer_pool(&adapter->rx_buff_pool[1]) ||
489            ibmveth_alloc_buffer_pool(&adapter->rx_buff_pool[2]))
490         {
491                 ibmveth_error_printk("unable to allocate buffer pools\n");
492                 ibmveth_cleanup(adapter);
493                 return -ENOMEM;
494         }
495
496         memcpy(&mac_address, netdev->dev_addr, netdev->addr_len);
497         mac_address = mac_address >> 16;
498
499         rxq_desc.desc = 0;
500         rxq_desc.fields.valid = 1;
501         rxq_desc.fields.length = adapter->rx_queue.queue_len;
502         rxq_desc.fields.address = adapter->rx_queue.queue_dma;
503
504         ibmveth_debug_printk("buffer list @ 0x%p\n", adapter->buffer_list_addr);
505         ibmveth_debug_printk("filter list @ 0x%p\n", adapter->filter_list_addr);
506         ibmveth_debug_printk("receive q   @ 0x%p\n", adapter->rx_queue.queue_addr);
507
508     
509         lpar_rc = h_register_logical_lan(adapter->vdev->unit_address,
510                                          adapter->buffer_list_dma,
511                                          rxq_desc.desc,
512                                          adapter->filter_list_dma,
513                                          mac_address);
514
515         if(lpar_rc != H_Success) {
516                 ibmveth_error_printk("h_register_logical_lan failed with %ld\n", lpar_rc);
517                 ibmveth_error_printk("buffer TCE:0x%x filter TCE:0x%x rxq desc:0x%lx MAC:0x%lx\n",
518                                      adapter->buffer_list_dma,
519                                      adapter->filter_list_dma,
520                                      rxq_desc.desc,
521                                      mac_address);
522                 ibmveth_cleanup(adapter);
523                 return -ENONET; 
524         }
525
526         ibmveth_debug_printk("registering irq 0x%x\n", netdev->irq);
527         if((rc = request_irq(netdev->irq, &ibmveth_interrupt, 0, netdev->name, netdev)) != 0) {
528                 ibmveth_error_printk("unable to request irq 0x%x, rc %d\n", netdev->irq, rc);
529                 do {
530                         rc = h_free_logical_lan(adapter->vdev->unit_address);
531                 } while H_isLongBusy(rc);
532
533                 ibmveth_cleanup(adapter);
534                 return rc;
535         }
536
537         netif_start_queue(netdev);
538
539         ibmveth_debug_printk("scheduling initial replenish cycle\n");
540         ibmveth_schedule_replenishing(adapter);
541
542         ibmveth_debug_printk("open complete\n");
543
544         return 0;
545 }
546
547 static int ibmveth_close(struct net_device *netdev)
548 {
549         struct ibmveth_adapter *adapter = netdev->priv;
550         long lpar_rc;
551     
552         ibmveth_debug_printk("close starting\n");
553
554         netif_stop_queue(netdev);
555
556         free_irq(netdev->irq, netdev);
557
558         cancel_delayed_work(&adapter->replenish_task);
559         flush_scheduled_work();
560
561         do {
562                 lpar_rc = h_free_logical_lan(adapter->vdev->unit_address);
563         } while H_isLongBusy(lpar_rc);
564
565         if(lpar_rc != H_Success)
566         {
567                 ibmveth_error_printk("h_free_logical_lan failed with %lx, continuing with close\n",
568                                      lpar_rc);
569         }
570
571         adapter->rx_no_buffer = *(u64*)(((char*)adapter->buffer_list_addr) + 4096 - 8);
572
573         ibmveth_cleanup(adapter);
574
575         ibmveth_debug_printk("close complete\n");
576
577         return 0;
578 }
579
580 static int netdev_get_settings(struct net_device *dev, struct ethtool_cmd *cmd) {
581         cmd->supported = (SUPPORTED_1000baseT_Full | SUPPORTED_Autoneg | SUPPORTED_FIBRE);
582         cmd->advertising = (ADVERTISED_1000baseT_Full | ADVERTISED_Autoneg | ADVERTISED_FIBRE);
583         cmd->speed = SPEED_1000;
584         cmd->duplex = DUPLEX_FULL;
585         cmd->port = PORT_FIBRE;
586         cmd->phy_address = 0;
587         cmd->transceiver = XCVR_INTERNAL;
588         cmd->autoneg = AUTONEG_ENABLE;
589         cmd->maxtxpkt = 0;
590         cmd->maxrxpkt = 1;
591         return 0;
592 }
593
594 static void netdev_get_drvinfo (struct net_device *dev, struct ethtool_drvinfo *info) {
595         strncpy(info->driver, ibmveth_driver_name, sizeof(info->driver) - 1);
596         strncpy(info->version, ibmveth_driver_version, sizeof(info->version) - 1);
597 }
598
599 static u32 netdev_get_link(struct net_device *dev) {
600         return 0;
601 }
602
603 static struct ethtool_ops netdev_ethtool_ops = {
604         .get_drvinfo            = netdev_get_drvinfo,
605         .get_settings           = netdev_get_settings,
606         .get_link               = netdev_get_link,
607         .get_sg                 = ethtool_op_get_sg,
608         .get_tx_csum            = ethtool_op_get_tx_csum,
609 };
610
611 static int ibmveth_ioctl(struct net_device *dev, struct ifreq *ifr, int cmd)
612 {
613         return -EOPNOTSUPP;
614 }
615
/* Offset of address v within its 4096-byte page (the low 12 bits of v). */
#define page_offset(v) (((unsigned long)(v)) & 0xfffUL)
617
618 static int ibmveth_start_xmit(struct sk_buff *skb, struct net_device *netdev)
619 {
620         struct ibmveth_adapter *adapter = netdev->priv;
621         union ibmveth_buf_desc desc[IbmVethMaxSendFrags];
622         unsigned long lpar_rc;
623         int nfrags = 0, curfrag;
624         unsigned long correlator;
625         unsigned int retry_count;
626
627         if ((skb_shinfo(skb)->nr_frags + 1) > IbmVethMaxSendFrags) {
628                 adapter->stats.tx_dropped++;
629                 dev_kfree_skb(skb);
630                 return 0;
631         }
632
633         memset(&desc, 0, sizeof(desc));
634
635         /* nfrags = number of frags after the initial fragment */
636         nfrags = skb_shinfo(skb)->nr_frags;
637
638         if(nfrags)
639                 adapter->tx_multidesc_send++;
640
641         /* map the initial fragment */
642         desc[0].fields.length  = nfrags ? skb->len - skb->data_len : skb->len;
643         desc[0].fields.address = vio_map_single(adapter->vdev, skb->data,
644                                         desc[0].fields.length, DMA_TO_DEVICE);
645         desc[0].fields.valid   = 1;
646
647         if(dma_mapping_error(desc[0].fields.address)) {
648                 ibmveth_error_printk("tx: unable to map initial fragment\n");
649                 adapter->tx_map_failed++;
650                 adapter->stats.tx_dropped++;
651                 dev_kfree_skb(skb);
652                 return 0;
653         }
654
655         curfrag = nfrags;
656
657         /* map fragments past the initial portion if there are any */
658         while(curfrag--) {
659                 skb_frag_t *frag = &skb_shinfo(skb)->frags[curfrag];
660                 desc[curfrag+1].fields.address
661                         = vio_map_single(adapter->vdev,
662                                 page_address(frag->page) + frag->page_offset,
663                                 frag->size, DMA_TO_DEVICE);
664                 desc[curfrag+1].fields.length = frag->size;
665                 desc[curfrag+1].fields.valid  = 1;
666
667                 if(dma_mapping_error(desc[curfrag+1].fields.address)) {
668                         ibmveth_error_printk("tx: unable to map fragment %d\n", curfrag);
669                         adapter->tx_map_failed++;
670                         adapter->stats.tx_dropped++;
671                         /* Free all the mappings we just created */
672                         while(curfrag < nfrags) {
673                                 vio_unmap_single(adapter->vdev,
674                                                  desc[curfrag+1].fields.address,
675                                                  desc[curfrag+1].fields.length,
676                                                  DMA_TO_DEVICE);
677                                 curfrag++;
678                         }
679                         dev_kfree_skb(skb);
680                         return 0;
681                 }
682         }
683
684         /* send the frame. Arbitrarily set retrycount to 1024 */
685         correlator = 0;
686         retry_count = 1024;
687         do {
688                 lpar_rc = h_send_logical_lan(adapter->vdev->unit_address,
689                                              desc[0].desc,
690                                              desc[1].desc,
691                                              desc[2].desc,
692                                              desc[3].desc,
693                                              desc[4].desc,
694                                              desc[5].desc,
695                                              correlator);
696         } while ((lpar_rc == H_Busy) && (retry_count--));
697     
698         if(lpar_rc != H_Success && lpar_rc != H_Dropped) {
699                 int i;
700                 ibmveth_error_printk("tx: h_send_logical_lan failed with rc=%ld\n", lpar_rc);
701                 for(i = 0; i < 6; i++) {
702                         ibmveth_error_printk("tx: desc[%i] valid=%d, len=%d, address=0x%d\n", i,
703                                              desc[i].fields.valid, desc[i].fields.length, desc[i].fields.address);
704                 }
705                 adapter->tx_send_failed++;
706                 adapter->stats.tx_dropped++;
707         } else {
708                 adapter->stats.tx_packets++;
709                 adapter->stats.tx_bytes += skb->len;
710         }
711
712         do {
713                 vio_unmap_single(adapter->vdev, desc[nfrags].fields.address, desc[nfrags].fields.length, DMA_TO_DEVICE);
714         } while(--nfrags >= 0);
715
716         dev_kfree_skb(skb);
717         return 0;
718 }
719
720 static int ibmveth_poll(struct net_device *netdev, int *budget)
721 {
722         struct ibmveth_adapter *adapter = netdev->priv;
723         int max_frames_to_process = netdev->quota;
724         int frames_processed = 0;
725         int more_work = 1;
726         unsigned long lpar_rc;
727
728  restart_poll:
729         do {
730                 struct net_device *netdev = adapter->netdev;
731
732                 if(ibmveth_rxq_pending_buffer(adapter)) {
733                         struct sk_buff *skb;
734
735                         if(!ibmveth_rxq_buffer_valid(adapter)) {
736                                 wmb(); /* suggested by larson1 */
737                                 adapter->rx_invalid_buffer++;
738                                 ibmveth_debug_printk("recycling invalid buffer\n");
739                                 ibmveth_rxq_recycle_buffer(adapter);
740                         } else {
741                                 int length = ibmveth_rxq_frame_length(adapter);
742                                 int offset = ibmveth_rxq_frame_offset(adapter);
743                                 skb = ibmveth_rxq_get_buffer(adapter);
744
745                                 ibmveth_rxq_harvest_buffer(adapter);
746
747                                 skb_reserve(skb, offset);
748                                 skb_put(skb, length);
749                                 skb->dev = netdev;
750                                 skb->protocol = eth_type_trans(skb, netdev);
751
752                                 netif_receive_skb(skb); /* send it up */
753
754                                 adapter->stats.rx_packets++;
755                                 adapter->stats.rx_bytes += length;
756                                 frames_processed++;
757                         }
758                 } else {
759                         more_work = 0;
760                 }
761         } while(more_work && (frames_processed < max_frames_to_process));
762
763         ibmveth_schedule_replenishing(adapter);
764
765         if(more_work) {
766                 /* more work to do - return that we are not done yet */
767                 netdev->quota -= frames_processed;
768                 *budget -= frames_processed;
769                 return 1; 
770         }
771
772         /* we think we are done - reenable interrupts, then check once more to make sure we are done */
773         lpar_rc = h_vio_signal(adapter->vdev->unit_address, VIO_IRQ_ENABLE);
774
775         ibmveth_assert(lpar_rc == H_Success);
776
777         netif_rx_complete(netdev);
778
779         if(ibmveth_rxq_pending_buffer(adapter) && netif_rx_reschedule(netdev, frames_processed))
780         {
781                 lpar_rc = h_vio_signal(adapter->vdev->unit_address, VIO_IRQ_DISABLE);
782                 ibmveth_assert(lpar_rc == H_Success);
783                 more_work = 1;
784                 goto restart_poll;
785         }
786
787         netdev->quota -= frames_processed;
788         *budget -= frames_processed;
789
790         /* we really are done */
791         return 0;
792 }
793
794 static irqreturn_t ibmveth_interrupt(int irq, void *dev_instance, struct pt_regs *regs)
795 {   
796         struct net_device *netdev = dev_instance;
797         struct ibmveth_adapter *adapter = netdev->priv;
798         unsigned long lpar_rc;
799
800         if(netif_rx_schedule_prep(netdev)) {
801                 lpar_rc = h_vio_signal(adapter->vdev->unit_address, VIO_IRQ_DISABLE);
802                 ibmveth_assert(lpar_rc == H_Success);
803                 __netif_rx_schedule(netdev);
804         }
805         return IRQ_HANDLED;
806 }
807
808 static struct net_device_stats *ibmveth_get_stats(struct net_device *dev)
809 {
810         struct ibmveth_adapter *adapter = dev->priv;
811         return &adapter->stats;
812 }
813
814 static void ibmveth_set_multicast_list(struct net_device *netdev)
815 {
816         struct ibmveth_adapter *adapter = netdev->priv;
817         unsigned long lpar_rc;
818
819         if((netdev->flags & IFF_PROMISC) || (netdev->mc_count > adapter->mcastFilterSize)) {
820                 lpar_rc = h_multicast_ctrl(adapter->vdev->unit_address,
821                                            IbmVethMcastEnableRecv |
822                                            IbmVethMcastDisableFiltering,
823                                            0);
824                 if(lpar_rc != H_Success) {
825                         ibmveth_error_printk("h_multicast_ctrl rc=%ld when entering promisc mode\n", lpar_rc);
826                 }
827         } else {
828                 struct dev_mc_list *mclist = netdev->mc_list;
829                 int i;
830                 /* clear the filter table & disable filtering */
831                 lpar_rc = h_multicast_ctrl(adapter->vdev->unit_address,
832                                            IbmVethMcastEnableRecv |
833                                            IbmVethMcastDisableFiltering |
834                                            IbmVethMcastClearFilterTable,
835                                            0);
836                 if(lpar_rc != H_Success) {
837                         ibmveth_error_printk("h_multicast_ctrl rc=%ld when attempting to clear filter table\n", lpar_rc);
838                 }
839                 /* add the addresses to the filter table */
840                 for(i = 0; i < netdev->mc_count; ++i, mclist = mclist->next) {
841                         // add the multicast address to the filter table
842                         unsigned long mcast_addr = 0;
843                         memcpy(((char *)&mcast_addr)+2, mclist->dmi_addr, 6);
844                         lpar_rc = h_multicast_ctrl(adapter->vdev->unit_address,
845                                                    IbmVethMcastAddFilter,
846                                                    mcast_addr);
847                         if(lpar_rc != H_Success) {
848                                 ibmveth_error_printk("h_multicast_ctrl rc=%ld when adding an entry to the filter table\n", lpar_rc);
849                         }
850                 }
851         
852                 /* re-enable filtering */
853                 lpar_rc = h_multicast_ctrl(adapter->vdev->unit_address,
854                                            IbmVethMcastEnableFiltering,
855                                            0);
856                 if(lpar_rc != H_Success) {
857                         ibmveth_error_printk("h_multicast_ctrl rc=%ld when enabling filtering\n", lpar_rc);
858                 }
859         }
860 }
861
862 static int ibmveth_change_mtu(struct net_device *dev, int new_mtu)
863 {
864         if ((new_mtu < 68) || (new_mtu > (1<<20)))
865                 return -EINVAL;
866         dev->mtu = new_mtu;
867         return 0;       
868 }
869
870 static int __devinit ibmveth_probe(struct vio_dev *dev, const struct vio_device_id *id)
871 {
872         int rc;
873         struct net_device *netdev;
874         struct ibmveth_adapter *adapter;
875
876         unsigned char *mac_addr_p;
877         unsigned int *mcastFilterSize_p;
878
879
880         ibmveth_debug_printk_no_adapter("entering ibmveth_probe for UA 0x%x\n", 
881                                         dev->unit_address);
882
883         mac_addr_p = (unsigned char *) vio_get_attribute(dev, VETH_MAC_ADDR, 0);
884         if(!mac_addr_p) {
885                 ibmveth_error_printk("Can't find VETH_MAC_ADDR attribute\n");
886                 return 0;
887         }
888         
889         mcastFilterSize_p= (unsigned int *) vio_get_attribute(dev, VETH_MCAST_FILTER_SIZE, 0);
890         if(!mcastFilterSize_p) {
891                 ibmveth_error_printk("Can't find VETH_MCAST_FILTER_SIZE attribute\n");
892                 return 0;
893         }
894         
895         netdev = alloc_etherdev(sizeof(struct ibmveth_adapter));
896
897         if(!netdev)
898                 return -ENOMEM;
899
900         SET_MODULE_OWNER(netdev);
901
902         adapter = netdev->priv;
903         memset(adapter, 0, sizeof(adapter));
904         dev->dev.driver_data = netdev;
905
906         adapter->vdev = dev;
907         adapter->netdev = netdev;
908         adapter->mcastFilterSize= *mcastFilterSize_p;
909         
910         /*      Some older boxes running PHYP non-natively have an OF that
911                 returns a 8-byte local-mac-address field (and the first 
912                 2 bytes have to be ignored) while newer boxes' OF return
913                 a 6-byte field. Note that IEEE 1275 specifies that 
914                 local-mac-address must be a 6-byte field.
915                 The RPA doc specifies that the first byte must be 10b, so 
916                 we'll just look for it to solve this 8 vs. 6 byte field issue */
917
918         if ((*mac_addr_p & 0x3) != 0x02)
919                 mac_addr_p += 2;
920
921         adapter->mac_addr = 0;
922         memcpy(&adapter->mac_addr, mac_addr_p, 6);
923
924         adapter->liobn = dev->iommu_table->it_index;
925         
926         netdev->irq = dev->irq;
927         netdev->open               = ibmveth_open;
928         netdev->poll               = ibmveth_poll;
929         netdev->weight             = 16;
930         netdev->stop               = ibmveth_close;
931         netdev->hard_start_xmit    = ibmveth_start_xmit;
932         netdev->get_stats          = ibmveth_get_stats;
933         netdev->set_multicast_list = ibmveth_set_multicast_list;
934         netdev->do_ioctl           = ibmveth_ioctl;
935         netdev->ethtool_ops           = &netdev_ethtool_ops;
936         netdev->change_mtu         = ibmveth_change_mtu;
937         SET_NETDEV_DEV(netdev, &dev->dev);
938
939         memcpy(&netdev->dev_addr, &adapter->mac_addr, netdev->addr_len);
940
941         ibmveth_init_buffer_pool(&adapter->rx_buff_pool[0], 0, IbmVethPool0DftCnt, IbmVethPool0DftSize);
942         ibmveth_init_buffer_pool(&adapter->rx_buff_pool[1], 1, IbmVethPool1DftCnt, IbmVethPool1DftSize);
943         ibmveth_init_buffer_pool(&adapter->rx_buff_pool[2], 2, IbmVethPool2DftCnt, IbmVethPool2DftSize);
944
945         ibmveth_debug_printk("adapter @ 0x%p\n", adapter);
946
947         INIT_WORK(&adapter->replenish_task, (void*)ibmveth_replenish_task, (void*)adapter);
948
949         adapter->buffer_list_dma = DMA_ERROR_CODE;
950         adapter->filter_list_dma = DMA_ERROR_CODE;
951         adapter->rx_queue.queue_dma = DMA_ERROR_CODE;
952
953         atomic_set(&adapter->not_replenishing, 1);
954
955         ibmveth_debug_printk("registering netdev...\n");
956
957         rc = register_netdev(netdev);
958
959         if(rc) {
960                 ibmveth_debug_printk("failed to register netdev rc=%d\n", rc);
961                 free_netdev(netdev);
962                 return rc;
963         }
964
965         ibmveth_debug_printk("registered\n");
966
967         ibmveth_proc_register_adapter(adapter);
968
969         return 0;
970 }
971
972 static int __devexit ibmveth_remove(struct vio_dev *dev)
973 {
974         struct net_device *netdev = dev->dev.driver_data;
975         struct ibmveth_adapter *adapter = netdev->priv;
976
977         unregister_netdev(netdev);
978
979         ibmveth_proc_unregister_adapter(adapter);
980
981         free_netdev(netdev);
982         return 0;
983 }
984
985 #ifdef CONFIG_PROC_FS
986 static void ibmveth_proc_register_driver(void)
987 {
988         ibmveth_proc_dir = create_proc_entry(IBMVETH_PROC_DIR, S_IFDIR, proc_net);
989         if (ibmveth_proc_dir) {
990                 SET_MODULE_OWNER(ibmveth_proc_dir);
991         }
992 }
993
994 static void ibmveth_proc_unregister_driver(void)
995 {
996         remove_proc_entry(IBMVETH_PROC_DIR, proc_net);
997 }
998
999 static void *ibmveth_seq_start(struct seq_file *seq, loff_t *pos) 
1000 {
1001         if (*pos == 0) {
1002                 return (void *)1;
1003         } else {
1004                 return NULL;
1005         }
1006 }
1007
1008 static void *ibmveth_seq_next(struct seq_file *seq, void *v, loff_t *pos)
1009 {
1010         ++*pos;
1011         return NULL;
1012 }
1013
1014 static void ibmveth_seq_stop(struct seq_file *seq, void *v) 
1015 {
1016 }
1017
1018 static int ibmveth_seq_show(struct seq_file *seq, void *v) 
1019 {
1020         struct ibmveth_adapter *adapter = seq->private;
1021         char *current_mac = ((char*) &adapter->netdev->dev_addr);
1022         char *firmware_mac = ((char*) &adapter->mac_addr) ;
1023
1024         seq_printf(seq, "%s %s\n\n", ibmveth_driver_string, ibmveth_driver_version);
1025         
1026         seq_printf(seq, "Unit Address:    0x%x\n", adapter->vdev->unit_address);
1027         seq_printf(seq, "LIOBN:           0x%lx\n", adapter->liobn);
1028         seq_printf(seq, "Current MAC:     %02X:%02X:%02X:%02X:%02X:%02X\n",
1029                    current_mac[0], current_mac[1], current_mac[2],
1030                    current_mac[3], current_mac[4], current_mac[5]);
1031         seq_printf(seq, "Firmware MAC:    %02X:%02X:%02X:%02X:%02X:%02X\n",
1032                    firmware_mac[0], firmware_mac[1], firmware_mac[2],
1033                    firmware_mac[3], firmware_mac[4], firmware_mac[5]);
1034         
1035         seq_printf(seq, "\nAdapter Statistics:\n");
1036         seq_printf(seq, "  TX:  skbuffs linearized:          %ld\n", adapter->tx_linearized);
1037         seq_printf(seq, "       multi-descriptor sends:      %ld\n", adapter->tx_multidesc_send);
1038         seq_printf(seq, "       skb_linearize failures:      %ld\n", adapter->tx_linearize_failed);
1039         seq_printf(seq, "       vio_map_single failres:      %ld\n", adapter->tx_map_failed);
1040         seq_printf(seq, "       send failures:               %ld\n", adapter->tx_send_failed);
1041         seq_printf(seq, "  RX:  replenish task cycles:       %ld\n", adapter->replenish_task_cycles);
1042         seq_printf(seq, "       alloc_skb_failures:          %ld\n", adapter->replenish_no_mem);
1043         seq_printf(seq, "       add buffer failures:         %ld\n", adapter->replenish_add_buff_failure);
1044         seq_printf(seq, "       invalid buffers:             %ld\n", adapter->rx_invalid_buffer);
1045         seq_printf(seq, "       no buffers:                  %ld\n", adapter->rx_no_buffer);
1046         
1047         return 0;
1048 }
1049 static struct seq_operations ibmveth_seq_ops = {
1050         .start = ibmveth_seq_start,
1051         .next  = ibmveth_seq_next,
1052         .stop  = ibmveth_seq_stop,
1053         .show  = ibmveth_seq_show,
1054 };
1055
1056 static int ibmveth_proc_open(struct inode *inode, struct file *file)
1057 {
1058         struct seq_file *seq;
1059         struct proc_dir_entry *proc;
1060         int rc;
1061
1062         rc = seq_open(file, &ibmveth_seq_ops);
1063         if (!rc) {
1064                 /* recover the pointer buried in proc_dir_entry data */
1065                 seq = file->private_data;
1066                 proc = PDE(inode);
1067                 seq->private = proc->data;
1068         }
1069         return rc;
1070 }
1071
1072 static struct file_operations ibmveth_proc_fops = {
1073         .owner   = THIS_MODULE,
1074         .open    = ibmveth_proc_open,
1075         .read    = seq_read,
1076         .llseek  = seq_lseek,
1077         .release = seq_release,
1078 };
1079
1080 static void ibmveth_proc_register_adapter(struct ibmveth_adapter *adapter)
1081 {
1082         struct proc_dir_entry *entry;
1083         if (ibmveth_proc_dir) {
1084                 entry = create_proc_entry(adapter->netdev->name, S_IFREG, ibmveth_proc_dir);
1085                 if (!entry) {
1086                         ibmveth_error_printk("Cannot create adapter proc entry");
1087                 } else {
1088                         entry->data = (void *) adapter;
1089                         entry->proc_fops = &ibmveth_proc_fops;
1090                         SET_MODULE_OWNER(entry);
1091                 }
1092         }
1093         return;
1094 }
1095
1096 static void ibmveth_proc_unregister_adapter(struct ibmveth_adapter *adapter)
1097 {
1098         if (ibmveth_proc_dir) {
1099                 remove_proc_entry(adapter->netdev->name, ibmveth_proc_dir);
1100         }
1101 }
1102
1103 #else /* CONFIG_PROC_FS */
1104 static void ibmveth_proc_register_adapter(struct ibmveth_adapter *adapter) 
1105 {
1106 }
1107
1108 static void ibmveth_proc_unregister_adapter(struct ibmveth_adapter *adapter) 
1109 {
1110 }
1111 static void ibmveth_proc_register_driver(void)
1112 {
1113 }
1114
1115 static void ibmveth_proc_unregister_driver(void)
1116 {
1117 }
1118 #endif /* CONFIG_PROC_FS */
1119
1120 static struct vio_device_id ibmveth_device_table[] __devinitdata= {
1121         { "network", "IBM,l-lan"},
1122         { 0,}
1123 };
1124
1125 MODULE_DEVICE_TABLE(vio, ibmveth_device_table);
1126
1127 static struct vio_driver ibmveth_driver = {
1128         .name        = (char *)ibmveth_driver_name,
1129         .id_table    = ibmveth_device_table,
1130         .probe       = ibmveth_probe,
1131         .remove      = ibmveth_remove
1132 };
1133
1134 static int __init ibmveth_module_init(void)
1135 {
1136         ibmveth_printk("%s: %s %s\n", ibmveth_driver_name, ibmveth_driver_string, ibmveth_driver_version);
1137
1138         ibmveth_proc_register_driver();
1139
1140         return vio_register_driver(&ibmveth_driver);
1141 }
1142
1143 static void __exit ibmveth_module_exit(void)
1144 {
1145         vio_unregister_driver(&ibmveth_driver);
1146         ibmveth_proc_unregister_driver();
1147 }       
1148
1149 module_init(ibmveth_module_init);
1150 module_exit(ibmveth_module_exit);