2 * Copyright © 1997-2007 Alacritech, Inc. All rights reserved
4 * $Id: sxghif.h,v 1.5 2008/07/24 19:18:22 chris Exp $
8 * This file contains structures and definitions for the
9 * Alacritech Sahara host interface
12 /*******************************************************************************
14 *******************************************************************************/
15 struct SXG_UCODE_REGS {
16 // Address 0 - 0x3F = Command codes 0-15 for TCB 0. Excode 0
17 u32 Icr; // Code = 0 (extended), ExCode = 0 - Int control
18 u32 RsvdReg1; // Code = 1 - TOE -NA
19 u32 RsvdReg2; // Code = 2 - TOE -NA
20 u32 RsvdReg3; // Code = 3 - TOE -NA
21 u32 RsvdReg4; // Code = 4 - TOE -NA
22 u32 RsvdReg5; // Code = 5 - TOE -NA
23 u32 CardUp; // Code = 6 - Microcode initialized when 1
24 u32 RsvdReg7; // Code = 7 - TOE -NA
25 u32 CodeNotUsed[8]; // Codes 8-15 not used. ExCode = 0
26 // This brings us to ExCode 1 at address 0x40 = Interrupt status pointer
27 u32 Isp; // Code = 0 (extended), ExCode = 1
28 u32 PadEx1[15]; // Codes 1-15 not used with extended codes
29 // ExCode 2 = Interrupt Status Register
30 u32 Isr; // Code = 0 (extended), ExCode = 2
32 // ExCode 3 = Event base register. Location of event rings
33 u32 EventBase; // Code = 0 (extended), ExCode = 3
35 // ExCode 4 = Event ring size
36 u32 EventSize; // Code = 0 (extended), ExCode = 4
38 // ExCode 5 = TCB Buffers base address
39 u32 TcbBase; // Code = 0 (extended), ExCode = 5
41 // ExCode 6 = TCB Composite Buffers base address
42 u32 TcbCompBase; // Code = 0 (extended), ExCode = 6
44 // ExCode 7 = Transmit ring base address
45 u32 XmtBase; // Code = 0 (extended), ExCode = 7
47 // ExCode 8 = Transmit ring size
48 u32 XmtSize; // Code = 0 (extended), ExCode = 8
50 // ExCode 9 = Receive ring base address
51 u32 RcvBase; // Code = 0 (extended), ExCode = 9
53 // ExCode 10 = Receive ring size
54 u32 RcvSize; // Code = 0 (extended), ExCode = 10
56 // ExCode 11 = Read EEPROM Config
57 u32 Config; // Code = 0 (extended), ExCode = 11
59 // ExCode 12 = Multicast bits 31:0
60 u32 McastLow; // Code = 0 (extended), ExCode = 12
62 // ExCode 13 = Multicast bits 63:32
63 u32 McastHigh; // Code = 0 (extended), ExCode = 13
66 u32 Ping; // Code = 0 (extended), ExCode = 14
68 // ExCode 15 = Link MTU
69 u32 LinkMtu; // Code = 0 (extended), ExCode = 15
71 // ExCode 16 = Download synchronization
72 u32 LoadSync; // Code = 0 (extended), ExCode = 16
74 // ExCode 17 = Upper DRAM address bits on 32-bit systems
75 u32 Upper; // Code = 0 (extended), ExCode = 17
77 // ExCode 18 = Slowpath Send Index Address
78 u32 SPSendIndex; // Code = 0 (extended), ExCode = 18
80 u32 RsvdXF; // Code = 0 (extended), ExCode = 19
82 // ExCode 20 = Aggregation
83 u32 Aggregation; // Code = 0 (extended), ExCode = 20
85 // ExCode 21 = Receive MDL push timer
86 u32 PushTicks; // Code = 0 (extended), ExCode = 21
89 u32 AckFrequency; // Code = 0 (extended), ExCode = 22
98 u32 RsvdReg25; // Code = 0 (extended), ExCode = 25
100 // ExCode 26 = Receive checksum requirements
101 u32 ReceiveChecksum; // Code = 0 (extended), ExCode = 26
103 // ExCode 27 = RSS Requirements
104 u32 Rss; // Code = 0 (extended), ExCode = 27
106 // ExCode 28 = RSS Table
107 u32 RssTable; // Code = 0 (extended), ExCode = 28
109 // ExCode 29 = Event ring release entries
110 u32 EventRelease; // Code = 0 (extended), ExCode = 29
112 // ExCode 30 = Number of receive bufferlist commands on ring 0
113 u32 RcvCmd; // Code = 0 (extended), ExCode = 30
115 // ExCode 31 = slowpath transmit command - Data[31:0] = 1
116 u32 XmtCmd; // Code = 0 (extended), ExCode = 31
118 // ExCode 32 = Dump command
119 u32 DumpCmd; // Code = 0 (extended), ExCode = 32
121 // ExCode 33 = Debug command
122 u32 DebugCmd; // Code = 0 (extended), ExCode = 33
124 // There are 128 possible extended commands - each of account for 16
125 // words (including the non-relevent base command codes 1-15).
126 // Pad for the remainder of these here to bring us to the next CPU
127 // base. As extended codes are added, reduce the first array value in
128 // the following field
129 u32 PadToNextCpu[94][16]; // 94 = 128 - 34 (34 = Excodes 0 - 33)
132 // Interrupt control register (0) values
133 #define SXG_ICR_DISABLE 0x00000000
134 #define SXG_ICR_ENABLE 0x00000001
135 #define SXG_ICR_MASK 0x00000002
136 #define SXG_ICR_MSGID_MASK 0xFFFF0000
137 #define SXG_ICR_MSGID_SHIFT 16
138 #define SXG_ICR(_MessageId, _Data) \
139 ((((_MessageId) << SXG_ICR_MSGID_SHIFT) & \
140 SXG_ICR_MSGID_MASK) | (_Data))
142 // The Microcode supports up to 16 RSS queues
143 #define SXG_MAX_RSS 16
144 #define SXG_MAX_RSS_TABLE_SIZE 256 // 256-byte max
146 #define SXG_RSS_TCP6 0x00000001 // RSS TCP over IPv6
147 #define SXG_RSS_TCP4 0x00000002 // RSS TCP over IPv4
148 #define SXG_RSS_LEGACY 0x00000004 // Line-base interrupts
149 #define SXG_RSS_TABLE_SIZE 0x0000FF00 // Table size mask
150 #define SXG_RSS_TABLE_SHIFT 8
151 #define SXG_RSS_BASE_CPU 0x00FF0000 // Base CPU (not used)
152 #define SXG_RSS_BASE_SHIFT 16
154 #define SXG_RCV_IP_CSUM_ENABLED 0x00000001 // ExCode 26 (ReceiveChecksum)
155 #define SXG_RCV_TCP_CSUM_ENABLED 0x00000002 // ExCode 26 (ReceiveChecksum)
157 #define SXG_XMT_CPUID_SHIFT 16
160 #define SXG_CHECK_FOR_HANG_TIME 3000
162 #define SXG_CHECK_FOR_HANG_TIME 5
166 * TCB registers - This is really the same register memory area as UCODE_REGS
167 * above, but defined differently. Bits 17:06 of the address define the TCB,
168 * which means each TCB area occupies 0x40 (64) bytes, or 16 u32S. What really
169 * is happening is that these registers occupy the "PadEx[15]" areas in the
170 * SXG_UCODE_REGS definition above
172 struct SXG_TCB_REGS {
173 u32 ExCode; /* Extended codes - see SXG_UCODE_REGS */
174 u32 Xmt; /* Code = 1 - # of Xmt descriptors added to ring */
175 u32 Rcv; /* Code = 2 - # of Rcv descriptors added to ring */
176 u32 Rsvd1; /* Code = 3 - TOE NA */
177 u32 Rsvd2; /* Code = 4 - TOE NA */
178 u32 Rsvd3; /* Code = 5 - TOE NA */
179 u32 Invalid; /* Code = 6 - Reserved for "CardUp" see above */
180 u32 Rsvd4; /* Code = 7 - TOE NA */
181 u32 Rsvd5; /* Code = 8 - TOE NA */
182 u32 Pad[7]; /* Codes 8-15 - Not used. */
185 /***************************************************************************
188 * _______________________________________
190 * |____|____|____|____|____|____|____|____|
191 * ^^^^ ^^^^ ^^^^ ^^^^ \ /
192 * ERR --|||| |||| |||| |||| -----------------
193 * EVENT ---||| |||| |||| |||| |
194 * ----|| |||| |||| |||| |-- Crash Address
195 * UPC -----| |||| |||| ||||
196 * LEVENT -------|||| |||| ||||
197 * PDQF --------||| |||| ||||
198 * RMISS ---------|| |||| ||||
199 * BREAK ----------| |||| ||||
200 * HBEATOK ------------|||| ||||
201 * NOHBEAT -------------||| ||||
202 * ERFULL --------------|| ||||
203 * XDROP ---------------| ||||
204 * -----------------||||
205 * -----------------||||--\
206 * ||---|-CpuId of crash
208 ***************************************************************************/
209 #define SXG_ISR_ERR 0x80000000 // Error
210 #define SXG_ISR_EVENT 0x40000000 // Event ring event
211 #define SXG_ISR_NONE1 0x20000000 // Not used
212 #define SXG_ISR_UPC 0x10000000 // Dump/debug command complete
213 #define SXG_ISR_LINK 0x08000000 // Link event
214 #define SXG_ISR_PDQF 0x04000000 // Processed data queue full
215 #define SXG_ISR_RMISS 0x02000000 // Drop - no host buf
216 #define SXG_ISR_BREAK 0x01000000 // Breakpoint hit
217 #define SXG_ISR_PING 0x00800000 // Heartbeat response
218 #define SXG_ISR_DEAD 0x00400000 // Card crash
219 #define SXG_ISR_ERFULL 0x00200000 // Event ring full
220 #define SXG_ISR_XDROP 0x00100000 // XMT Drop - no DRAM bufs or XMT err
221 #define SXG_ISR_SPSEND 0x00080000 // Slow send complete
222 #define SXG_ISR_CPU 0x00070000 // Dead CPU mask
223 #define SXG_ISR_CPU_SHIFT 16 // Dead CPU shift
224 #define SXG_ISR_CRASH 0x0000FFFF // Crash address mask
226 /***************************************************************************
230 ***************************************************************************/
233 * .___________________.___________________.
234 * |<------------ Pad 0 ------------>|
235 * |_________|_________|_________|_________|0 0x00
236 * |<------------ Pad 1 ------------>|
237 * |_________|_________|_________|_________|4 0x04
238 * |<------------ Pad 2 ------------>|
239 * |_________|_________|_________|_________|8 0x08
240 * |<----------- Event Word 0 ------------>|
241 * |_________|_________|_________|_________|12 0x0c
242 * |<----------- Event Word 1 ------------>|
243 * |_________|_________|_________|_________|16 0x10
244 * |<------------- Toeplitz ------------>|
245 * |_________|_________|_________|_________|20 0x14
246 * |<----- Length ---->|<------ TCB Id --->|
247 * |_________|_________|_________|_________|24 0x18
248 * |<----- Status ---->|Evnt Code|Flsh Code|
249 * |_________|_________|_________|_________|28 0x1c
251 * |- VALID |||| ||||- RBUFC
261 * _______________________________________
262 * |<----- Status ---->|Evnt Code|Flsh Code|
263 * |_________|Cmd Index|_________|_________|28 0x1c
274 #pragma pack(push, 1)
276 u32 Pad[1]; // not used
277 u32 SndUna; // SndUna value
278 u32 Resid; // receive MDL resid
280 void *HostHandle; // Receive host handle
287 u32 Toeplitz; // RSS Toeplitz hash
289 ushort Rsvd3; // TOE NA
290 ushort HdrOffset; // Slowpath
293 unsigned char Rsvd4; // TOE NA
294 unsigned char Code; // Event code
295 unsigned char CommandIndex; // New ring index
296 unsigned char Status; // Event status
300 // Event code definitions
301 #define EVENT_CODE_BUFFERS 0x01 // Receive buffer list command (ring 0)
302 #define EVENT_CODE_SLOWRCV 0x02 // Slowpath receive
303 #define EVENT_CODE_UNUSED 0x04 // Was slowpath commands complete
306 #define EVENT_STATUS_VALID 0x80 // Entry valid
309 #define EVENT_STATUS_ERROR 0x40 // Completed with error. Index in next byte
310 #define EVENT_STATUS_TCPIP4 0x20 // TCPIPv4 frame
311 #define EVENT_STATUS_TCPBAD 0x10 // Bad TCP checksum
312 #define EVENT_STATUS_IPBAD 0x08 // Bad IP checksum
313 #define EVENT_STATUS_RCVERR 0x04 // Slowpath receive error
314 #define EVENT_STATUS_IPONLY 0x02 // IP frame
315 #define EVENT_STATUS_TCPIP6 0x01 // TCPIPv6 frame
316 #define EVENT_STATUS_TCPIP 0x21 // Combination of v4 and v6
319 // Size must be power of 2, between 128 and 16k
320 #define EVENT_RING_SIZE 4096 // ??
321 #define EVENT_RING_BATCH 16 // Hand entries back 16 at a time.
322 #define EVENT_BATCH_LIMIT 256 // Stop processing events after 256 (16 * 16)
324 struct SXG_EVENT_RING {
325 struct SXG_EVENT Ring[EVENT_RING_SIZE];
328 /***************************************************************************
332 ***************************************************************************/
333 // Maximum number of TCBS supported by hardware/microcode
334 #define SXG_MAX_TCB 4096
335 // Minimum TCBs before we fail initialization
336 #define SXG_MIN_TCB 512
338 // The bucket is determined by bits 11:4 of the toeplitz if we support 4k
339 // offloaded connections, 10:4 if we support 2k and so on.
340 #define SXG_TCB_BUCKET_SHIFT 4
341 #define SXG_TCB_PER_BUCKET 16
342 #define SXG_TCB_BUCKET_MASK 0xFF0 // Bucket portion of TCB ID
343 #define SXG_TCB_ELEMENT_MASK 0x00F // Element within bucket
344 #define SXG_TCB_BUCKETS 256 // 256 * 16 = 4k
346 #define SXG_TCB_BUFFER_SIZE 512 // ASSERT format is correct
348 #define SXG_TCB_RCVQ_SIZE 736
350 #define SXG_TCB_COMPOSITE_BUFFER_SIZE 1024
352 #define SXG_LOCATE_TCP_FRAME_HDR(_TcpObject, _IPv6) \
353 (((_TcpObject)->VlanId) ? \
354 ((_IPv6) ? /* Vlan frame header = yes */ \
355 &(_TcpObject)->CompBuffer->Frame.HasVlan.TcpIp6.SxgTcp : \
356 &(_TcpObject)->CompBuffer->Frame.HasVlan.TcpIp.SxgTcp) : \
357 ((_IPv6) ? /* Vlan frame header = No */ \
358 &(_TcpObject)->CompBuffer->Frame.NoVlan.TcpIp6.SxgTcp : \
359 &(_TcpObject)->CompBuffer->Frame.NoVlan.TcpIp.SxgTcp))
361 #define SXG_LOCATE_IP_FRAME_HDR(_TcpObject) \
362 (_TcpObject)->VlanId ? \
363 &(_TcpObject)->CompBuffer->Frame.HasVlan.TcpIp.Ip : \
364 &(_TcpObject)->CompBuffer->Frame.NoVlan.TcpIp.Ip
366 #define SXG_LOCATE_IP6_FRAME_HDR(_TcpObject) \
367 (_TcpObject)->VlanId ? \
368 &(_TcpObject)->CompBuffer->Frame.HasVlan.TcpIp6.Ip : \
369 &(_TcpObject)->CompBuffer->Frame.NoVlan.TcpIp6.Ip
372 // Horrible kludge to distinguish dumb-nic, slowpath, and
373 // fastpath traffic. Decrement the HopLimit by one
374 // for slowpath, two for fastpath. This assumes the limit is measurably
375 // greater than two, which I think is reasonable.
376 // Obviously this is DBG only. Maybe remove later, or #if 0 so we
377 // can set it when needed
378 #define SXG_DBG_HOP_LIMIT(_TcpObject, _FastPath) { \
379 PIPV6_HDR _Ip6FrameHdr; \
380 if((_TcpObject)->IPv6) { \
381 _Ip6FrameHdr = SXG_LOCATE_IP6_FRAME_HDR((_TcpObject)); \
383 _Ip6FrameHdr->HopLimit = (_TcpObject)->Cached.TtlOrHopLimit - 2; \
385 _Ip6FrameHdr->HopLimit = (_TcpObject)->Cached.TtlOrHopLimit - 1; \
390 // Do nothing with free build
391 #define SXG_DBG_HOP_LIMIT(_TcpObject, _FastPath)
394 /***************************************************************************
395 * Receive and transmit rings
396 ***************************************************************************/
397 #define SXG_MAX_RING_SIZE 256
398 #define SXG_XMT_RING_SIZE 128 // Start with 128
399 #define SXG_RCV_RING_SIZE 128 // Start with 128
400 #define SXG_MAX_ENTRIES 4096
402 // Structure and macros to manage a ring
403 struct SXG_RING_INFO {
404 unsigned char Head; // Where we add entries - Note unsigned char:RING_SIZE
405 unsigned char Tail; // Where we pull off completed entries
406 ushort Size; // Ring size - Must be multiple of 2
407 void *Context[SXG_MAX_RING_SIZE]; // Shadow ring
410 #define SXG_INITIALIZE_RING(_ring, _size) { \
413 (_ring).Size = (_size); \
415 #define SXG_ADVANCE_INDEX(_index, _size) ((_index) = ((_index) + 1) & ((_size) - 1))
416 #define SXG_PREVIOUS_INDEX(_index, _size) (((_index) - 1) &((_size) - 1))
417 #define SXG_RING_EMPTY(_ring) ((_ring)->Head == (_ring)->Tail)
418 #define SXG_RING_FULL(_ring) ((((_ring)->Head + 1) & ((_ring)->Size - 1)) == (_ring)->Tail)
419 #define SXG_RING_ADVANCE_HEAD(_ring) SXG_ADVANCE_INDEX((_ring)->Head, ((_ring)->Size))
420 #define SXG_RING_RETREAT_HEAD(_ring) ((_ring)->Head = \
421 SXG_PREVIOUS_INDEX((_ring)->Head, (_ring)->Size))
422 #define SXG_RING_ADVANCE_TAIL(_ring) { \
423 ASSERT((_ring)->Tail != (_ring)->Head); \
424 SXG_ADVANCE_INDEX((_ring)->Tail, ((_ring)->Size)); \
426 // Set cmd to the next available ring entry, set the shadow context
427 // entry and advance the ring.
428 // The appropriate lock must be held when calling this macro
429 #define SXG_GET_CMD(_ring, _ringinfo, _cmd, _context) { \
430 if(SXG_RING_FULL(_ringinfo)) { \
433 (_cmd) = &(_ring)->Descriptors[(_ringinfo)->Head]; \
434 (_ringinfo)->Context[(_ringinfo)->Head] = (void *)(_context);\
435 SXG_RING_ADVANCE_HEAD(_ringinfo); \
439 // Abort the previously allocated command by retreating the head.
440 // NOTE - The appopriate lock MUST NOT BE DROPPED between the SXG_GET_CMD
441 // and SXG_ABORT_CMD calls.
442 #define SXG_ABORT_CMD(_ringinfo) { \
443 ASSERT(!(SXG_RING_EMPTY(_ringinfo))); \
444 SXG_RING_RETREAT_HEAD(_ringinfo); \
445 (_ringinfo)->Context[(_ringinfo)->Head] = NULL; \
448 // For the given ring, return a pointer to the tail cmd and context,
449 // clear the context and advance the tail
450 #define SXG_RETURN_CMD(_ring, _ringinfo, _cmd, _context) { \
451 (_cmd) = &(_ring)->Descriptors[(_ringinfo)->Tail]; \
452 (_context) = (_ringinfo)->Context[(_ringinfo)->Tail]; \
453 (_ringinfo)->Context[(_ringinfo)->Tail] = NULL; \
454 SXG_RING_ADVANCE_TAIL(_ringinfo); \
457 /***************************************************************************
459 * Host Command Buffer - commands to INIC via the Cmd Rings
461 ***************************************************************************/
464 * .___________________.___________________.
465 * |<-------------- Sgl Low -------------->|
466 * |_________|_________|_________|_________|0 0x00
467 * |<-------------- Sgl High ------------->|
468 * |_________|_________|_________|_________|4 0x04
469 * |<------------- Sge 0 Low ----------->|
470 * |_________|_________|_________|_________|8 0x08
471 * |<------------- Sge 0 High ----------->|
472 * |_________|_________|_________|_________|12 0x0c
473 * |<------------ Sge 0 Length ---------->|
474 * |_________|_________|_________|_________|16 0x10
475 * |<----------- Window Update ----------->|
476 * |<-------- SP 1st SGE offset ---------->|
477 * |_________|_________|_________|_________|20 0x14
478 * |<----------- Total Length ------------>|
479 * |_________|_________|_________|_________|24 0x18
480 * |<----- LCnt ------>|<----- Flags ----->|
481 * |_________|_________|_________|_________|28 0x1c
483 #pragma pack(push, 1)
485 dma_addr_t Sgl; // Physical address of SGL
488 dma64_addr_t FirstSgeAddress; // Address of first SGE
489 u32 FirstSgeLength; // Length of first SGE
492 u32 SgeOffset; // Slowpath - 2nd SGE offset
493 u32 Resid; // MDL completion - clobbers update
496 u32 TotalLength; // Total transfer length
503 unsigned char Flags:4; // slowpath flags
504 unsigned char IpHl:4; // Ip header length (>>2)
505 unsigned char MacLen; // Mac header len
508 ushort Flags:4; // slowpath flags
509 ushort TcpHdrOff:7; // TCP
510 ushort MacLen:5; // Mac header len
512 ushort Flags; // flags
515 ushort SgEntries; // SG entry count including first sge
517 unsigned char Status; // Copied from event status
518 unsigned char NotUsed;
524 #pragma pack(push, 1)
537 * /.--- TCP Large segment send
542 * .___________________.____________vvvv.
544 * | LCnt |hlen|hdroff|Flgs|
545 * |___________________|||||||||||||____|
552 * //.--- Checksum TCP
553 * ///.--- Checksum IP
554 * 3 1 //// No bits - normal send
556 * .___________________._______________vvvv.
557 * | | Offload | IP | |
558 * | LCnt |MAC hlen |Hlen|Flgs|
559 * |___________________|____|____|____|____|
562 // Slowpath CMD flags
563 #define SXG_SLOWCMD_CSUM_IP 0x01 // Checksum IP
564 #define SXG_SLOWCMD_CSUM_TCP 0x02 // Checksum TCP
565 #define SXG_SLOWCMD_LSO 0x04 // Large segment send
567 struct SXG_XMT_RING {
568 struct SXG_CMD Descriptors[SXG_XMT_RING_SIZE];
571 struct SXG_RCV_RING {
572 struct SXG_CMD Descriptors[SXG_RCV_RING_SIZE];
575 /***************************************************************************
576 * Share memory buffer types - Used to identify asynchronous
577 * shared memory allocation
578 ***************************************************************************/
579 enum SXG_BUFFER_TYPE {
580 SXG_BUFFER_TYPE_RCV, // Receive buffer
581 SXG_BUFFER_TYPE_SGL // SGL buffer
584 // State for SXG buffers
585 #define SXG_BUFFER_FREE 0x01
586 #define SXG_BUFFER_BUSY 0x02
587 #define SXG_BUFFER_ONCARD 0x04
588 #define SXG_BUFFER_UPSTREAM 0x08
590 /***************************************************************************
591 * Receive data buffers
593 * Receive data buffers are given to the Sahara card 128 at a time.
594 * This is accomplished by filling in a "receive descriptor block"
595 * with 128 "receive descriptors". Each descriptor consists of
596 * a physical address, which the card uses as the address to
597 * DMA data into, and a virtual address, which is given back
598 * to the host in the "HostHandle" portion of an event.
599 * The receive descriptor data structure is defined below
600 * as SXG_RCV_DATA_DESCRIPTOR, and the corresponding block
601 * is defined as SXG_RCV_DESCRIPTOR_BLOCK.
603 * This receive descriptor block is given to the card by filling
604 * in the Sgl field of a SXG_CMD entry from pAdapt->RcvRings[0]
605 * with the physical address of the receive descriptor block.
607 * Both the receive buffers and the receive descriptor blocks
608 * require additional data structures to maintain them
609 * on a free queue and contain other information associated with them.
610 * Those data structures are defined as the SXG_RCV_DATA_BUFFER_HDR
611 * and SXG_RCV_DESCRIPTOR_BLOCK_HDR respectively.
613 * Since both the receive buffers and the receive descriptor block
614 * must be accessible by the card, both must be allocated out of
615 * shared memory. To ensure that we always have a descriptor
616 * block available for every 128 buffers, we allocate all of
617 * these resources together in a single block. This entire
618 * block is managed by a SXG_RCV_BLOCK_HDR, who's sole purpose
619 * is to maintain address information so that the entire block
622 * Further complicating matters is the fact that the receive
623 * buffers must be variable in length in order to accomodate
624 * jumbo frame configurations. We configure the buffer
625 * length so that the buffer and it's corresponding SXG_RCV_DATA_BUFFER_HDR
626 * structure add up to an even boundary. Then we place the
627 * remaining data structures after 128 of them as shown in
628 * the following diagram:
630 * _________________________________________
632 * | Variable length receive buffer #1 |
633 * |_________________________________________|
635 * | SXG_RCV_DATA_BUFFER_HDR #1 |
636 * |_________________________________________| <== Even 2k or 10k boundary
638 * | ... repeat 2-128 .. |
639 * |_________________________________________|
641 * | SXG_RCV_DESCRIPTOR_BLOCK |
642 * | Contains SXG_RCV_DATA_DESCRIPTOR * 128 |
643 * |_________________________________________|
645 * | SXG_RCV_DESCRIPTOR_BLOCK_HDR |
646 * |_________________________________________|
648 * | SXG_RCV_BLOCK_HDR |
649 * |_________________________________________|
651 * Memory consumption:
653 * Buffers and SXG_RCV_DATA_BUFFER_HDR = 2k * 128 = 256k
654 * + SXG_RCV_DESCRIPTOR_BLOCK = 2k
655 * + SXG_RCV_DESCRIPTOR_BLOCK_HDR = ~32
656 * + SXG_RCV_BLOCK_HDR = ~32
657 * => Total = ~258k/block
660 * Buffers and SXG_RCV_DATA_BUFFER_HDR = 10k * 128 = 1280k
661 * + SXG_RCV_DESCRIPTOR_BLOCK = 2k
662 * + SXG_RCV_DESCRIPTOR_BLOCK_HDR = ~32
663 * + SXG_RCV_BLOCK_HDR = ~32
664 * => Total = ~1282k/block
666 ***************************************************************************/
667 #define SXG_RCV_DATA_BUFFERS 4096 // Amount to give to the card
668 #define SXG_INITIAL_RCV_DATA_BUFFERS 8192 // Initial pool of buffers
669 #define SXG_MIN_RCV_DATA_BUFFERS 2048 // Minimum amount and when to get more
670 #define SXG_MAX_RCV_BLOCKS 128 // = 16384 receive buffers
672 // Receive buffer header
673 struct SXG_RCV_DATA_BUFFER_HDR {
674 dma_addr_t PhysicalAddress; // Buffer physical address
675 // Note - DO NOT USE the VirtualAddress field to locate data.
676 // Use the sxg.h:SXG_RECEIVE_DATA_LOCATION macro instead.
677 void *VirtualAddress; // Start of buffer
678 struct LIST_ENTRY FreeList; // Free queue of buffers
679 struct SXG_RCV_DATA_BUFFER_HDR *Next; // Fastpath data buffer queue
680 u32 Size; // Buffer size
681 u32 ByteOffset; // See SXG_RESTORE_MDL_OFFSET
682 unsigned char State; // See SXG_BUFFER state above
683 unsigned char Status; // Event status (to log PUSH)
684 struct sk_buff *skb; // Double mapped (nbl and pkt)
687 // SxgSlowReceive uses the PACKET (skb) contained
688 // in the SXG_RCV_DATA_BUFFER_HDR when indicating dumb-nic data
689 #define SxgDumbRcvPacket skb
691 #define SXG_RCV_DATA_HDR_SIZE 256 // Space for SXG_RCV_DATA_BUFFER_HDR
692 #define SXG_RCV_DATA_BUFFER_SIZE 2048 // Non jumbo = 2k including HDR
693 #define SXG_RCV_JUMBO_BUFFER_SIZE 10240 // jumbo = 10k including HDR
695 // Receive data descriptor
696 struct SXG_RCV_DATA_DESCRIPTOR {
698 struct sk_buff *VirtualAddress; // Host handle
699 u64 ForceTo8Bytes; // Force x86 to 8-byte boundary
701 dma_addr_t PhysicalAddress;
704 // Receive descriptor block
705 #define SXG_RCV_DESCRIPTORS_PER_BLOCK 128
706 #define SXG_RCV_DESCRIPTOR_BLOCK_SIZE 2048 // For sanity check
708 struct SXG_RCV_DESCRIPTOR_BLOCK {
709 struct SXG_RCV_DATA_DESCRIPTOR Descriptors[SXG_RCV_DESCRIPTORS_PER_BLOCK];
712 // Receive descriptor block header
713 struct SXG_RCV_DESCRIPTOR_BLOCK_HDR {
714 void *VirtualAddress; // Start of 2k buffer
715 dma_addr_t PhysicalAddress; // ..and it's physical address
716 struct LIST_ENTRY FreeList; // Free queue of descriptor blocks
717 unsigned char State; // See SXG_BUFFER state above
720 // Receive block header
721 struct SXG_RCV_BLOCK_HDR {
722 void *VirtualAddress; // Start of virtual memory
723 dma_addr_t PhysicalAddress; // ..and it's physical address
724 struct LIST_ENTRY AllList; // Queue of all SXG_RCV_BLOCKS
727 // Macros to determine data structure offsets into receive block
728 #define SXG_RCV_BLOCK_SIZE(_Buffersize) \
729 (((_Buffersize) * SXG_RCV_DESCRIPTORS_PER_BLOCK) + \
730 (sizeof(struct SXG_RCV_DESCRIPTOR_BLOCK)) + \
731 (sizeof(struct SXG_RCV_DESCRIPTOR_BLOCK_HDR)) + \
732 (sizeof(struct SXG_RCV_BLOCK_HDR)))
733 #define SXG_RCV_BUFFER_DATA_SIZE(_Buffersize) \
734 ((_Buffersize) - SXG_RCV_DATA_HDR_SIZE)
735 #define SXG_RCV_DATA_BUFFER_HDR_OFFSET(_Buffersize) \
736 ((_Buffersize) - SXG_RCV_DATA_HDR_SIZE)
737 #define SXG_RCV_DESCRIPTOR_BLOCK_OFFSET(_Buffersize) \
738 ((_Buffersize) * SXG_RCV_DESCRIPTORS_PER_BLOCK)
739 #define SXG_RCV_DESCRIPTOR_BLOCK_HDR_OFFSET(_Buffersize) \
740 (((_Buffersize) * SXG_RCV_DESCRIPTORS_PER_BLOCK) + \
741 (sizeof(struct SXG_RCV_DESCRIPTOR_BLOCK)))
742 #define SXG_RCV_BLOCK_HDR_OFFSET(_Buffersize) \
743 (((_Buffersize) * SXG_RCV_DESCRIPTORS_PER_BLOCK) + \
744 (sizeof(struct SXG_RCV_DESCRIPTOR_BLOCK)) + \
745 (sizeof(struct SXG_RCV_DESCRIPTOR_BLOCK_HDR)))
747 // Use the miniport reserved portion of the NBL to locate
748 // our SXG_RCV_DATA_BUFFER_HDR structure.
749 struct SXG_RCV_NBL_RESERVED {
750 struct SXG_RCV_DATA_BUFFER_HDR *RcvDataBufferHdr;
754 #define SXG_RCV_NBL_BUFFER_HDR(_NBL) (((PSXG_RCV_NBL_RESERVED)NET_BUFFER_LIST_MINIPORT_RESERVED(_NBL))->RcvDataBufferHdr)
756 /***************************************************************************
757 * Scatter gather list buffer
758 ***************************************************************************/
759 #define SXG_INITIAL_SGL_BUFFERS 8192 // Initial pool of SGL buffers
760 #define SXG_MIN_SGL_BUFFERS 2048 // Minimum amount and when to get more
761 #define SXG_MAX_SGL_BUFFERS 16384 // Maximum to allocate (note ADAPT:ushort)
763 // Self identifying structure type
765 SXG_SGL_DUMB, // Dumb NIC SGL
766 SXG_SGL_SLOW, // Slowpath protocol header - see below
767 SXG_SGL_CHIMNEY // Chimney offload SGL
770 // Note - the description below is Microsoft specific
772 // The following definition specifies the amount of shared memory to allocate
773 // for the SCATTER_GATHER_LIST portion of the SXG_SCATTER_GATHER data structure.
774 // The following considerations apply when setting this value:
775 // - First, the Sahara card is designed to read the Microsoft SGL structure
776 // straight out of host memory. This means that the SGL must reside in
777 // shared memory. If the length here is smaller than the SGL for the
778 // NET_BUFFER, then NDIS will allocate its own buffer. The buffer
779 // that NDIS allocates is not in shared memory, so when this happens,
780 // the SGL will need to be copied to a set of SXG_SCATTER_GATHER buffers.
781 // In other words.. we don't want this value to be too small.
782 // - On the other hand.. we're allocating up to 16k of these things. If
783 // we make this too big, we start to consume a ton of memory..
784 // At the moment, I'm going to limit the number of SG entries to 150.
785 // If each entry maps roughly 4k, then this should cover roughly 600kB
786 // NET_BUFFERs. Furthermore, since each entry is 24 bytes, the total
787 // SGE portion of the structure consumes 3600 bytes, which should allow
788 // the entire SXG_SCATTER_GATHER structure to reside comfortably within
789 // a 4k block, providing the remaining fields stay under 500 bytes.
791 // So with 150 entries, the SXG_SCATTER_GATHER structure becomes roughly
792 // 4k. At 16k of them, that amounts to 64M of shared memory. A ton, but
794 #define SXG_SGL_ENTRIES 150
796 // The ucode expects an NDIS SGL structure that
797 // is formatted for an x64 system. When running
798 // on an x64 system, we can simply hand the NDIS SGL
799 // to the card directly. For x86 systems we must reconstruct
800 // the SGL. The following structure defines an x64
801 // formatted SGL entry
803 dma64_addr_t Address; // same as wdm.h
804 u32 Length; // same as wdm.h
805 u32 CompilerPad; // The compiler pads to 8-bytes
806 u64 Reserved; // u32 * in wdm.h. Force to 8 bytes
809 struct SCATTER_GATHER_ELEMENT {
810 dma64_addr_t Address; // same as wdm.h
811 u32 Length; // same as wdm.h
812 u32 CompilerPad; // The compiler pads to 8-bytes
813 u64 Reserved; // u32 * in wdm.h. Force to 8 bytes
816 struct SCATTER_GATHER_LIST {
817 u32 NumberOfElements;
819 struct SCATTER_GATHER_ELEMENT Elements[];
822 // The card doesn't care about anything except elements, so
823 // we can leave the u32 * reserved field alone in the following
824 // SGL structure. But redefine from wdm.h:SCATTER_GATHER_LIST so
825 // we can specify SXG_X64_SGE and define a fixed number of elements
827 u32 NumberOfElements;
829 struct SXG_X64_SGE Elements[SXG_SGL_ENTRIES];
832 struct SXG_SCATTER_GATHER {
833 enum SXG_SGL_TYPE Type; // FIRST! Dumb-nic or offload
834 void *adapter; // Back pointer to adapter
835 struct LIST_ENTRY FreeList; // Free SXG_SCATTER_GATHER blocks
836 struct LIST_ENTRY AllList; // All SXG_SCATTER_GATHER blocks
837 dma_addr_t PhysicalAddress; // physical address
838 unsigned char State; // See SXG_BUFFER state above
839 unsigned char CmdIndex; // Command ring index
840 struct sk_buff *DumbPacket; // Associated Packet
841 u32 Direction; // For asynchronous completions
842 u32 CurOffset; // Current SGL offset
843 u32 SglRef; // SGL reference count
844 struct VLAN_HDR VlanTag; // VLAN tag to be inserted into SGL
845 struct SCATTER_GATHER_LIST *pSgl; // SGL Addr. Possibly &Sgl
846 struct SXG_X64_SGL Sgl; // SGL handed to card
849 #if defined(CONFIG_X86_64)
850 #define SXG_SGL_BUFFER(_SxgSgl) (&_SxgSgl->Sgl)
851 #define SXG_SGL_BUF_SIZE sizeof(struct SXG_X64_SGL)
852 #elif defined(CONFIG_X86)
853 // Force NDIS to give us it's own buffer so we can reformat to our own
854 #define SXG_SGL_BUFFER(_SxgSgl) NULL
855 #define SXG_SGL_BUF_SIZE 0
857 #error staging: sxg: driver is for X86 only!