source: trunk/kernel/devices/dev_nic.h @ 669

Last change on this file since 669 was 668, checked in by alain, 4 years ago

typos...

File size: 18.2 KB
RevLine 
[1]1/*
2 * dev_nic.h - NIC (Network Controler) generic device API definition.
3 *
[657]4 * Author  Alain Greiner    (2016,2017,2018,2019,2020)
[1]5 *
6 * Copyright (c) UPMC Sorbonne Universites
7 *
8 * This file is part of ALMOS-MKH
9 *
10 * ALMOS-MKH is free software; you can redistribute it and/or modify it
11 * under the terms of the GNU General Public License as published by
12 * the Free Software Foundation; version 2.0 of the License.
13 *
14 * ALMOS-MKH is distributed in the hope that it will be useful, but
15 * WITHOUT ANY WARRANTY; without even the implied warranty of
16 * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the GNU
17 * General Public License for more details.
18 *
19 * You should have received a copy of the GNU General Public License
20 * along with ALMOS-kernel; if not, write to the Free Software Foundation,
21 * Inc., 51 Franklin St, Fifth Floor, Boston, MA 02110-1301 USA
22 */
23
24#ifndef _DEV_NIC_H
25#define _DEV_NIC_H
26
[14]27#include <kernel_config.h>
[457]28#include <hal_kernel_types.h>
[657]29#include <remote_busylock.h>
30#include <remote_buf.h>
31#include <xlist.h>
[1]32
[657]33/****  Forward declarations  ****/
34
35struct chdev_s;
36
[1]37/*****************************************************************************************
38 *     Generic Network Interface Controler definition
39 *
[657]40 * This device provides access to a generic Gigabit Ethernet network controler.
41 * It assumes that the NIC hardware peripheral handles two packets queues for sent (TX)
42 * and received (RX) packets.
43 *
44 * The supported protocols stack is : Ethernet / IPV4 / TCP or UDP
[1]45 *
[657]46 * 1) hardware assumptions
47 *
48 * The NIC device is handling two (infinite) streams of packets to or from the network.
[1]49 * It is the driver responsibility to move the RX packets from the NIC to the RX queue,
50 * and the TX packets from the TX queue to the NIC.
51 *
[657]52 * AS the RX and TX queues are independant, there is one NIC_RX device descriptor
53 * to handle RX packets, and another NIC_TX device descriptor to handle TX packets.
[1]54 *
[657]55 * In order to improve throughput, the NIC controller can implement multiple (N) channels.
56 * In this case, the channel index is defined by an hash function computed from the remote
57 * IP address and port. This index is computed by the hardware for an RX packet, and is
[663]58 * computed by the kernel for a TX packet, using a specific driver function.
[657]59 * The 2*N chdevs, and the associated server threads implementing the protocols stack,
60 * are distributed in 2*N different clusters.
[1]61 *
[657]62 * 2) User API
63 *
64 * On the user side, ALMOS-MKH implements the POSIX socket API.
[663]65 * The following kernel functions implement the socket related syscalls :
66 * - socket_build()     : create a local socket registered in process fd_array[].
67 * - socket_bind()      : attach a local IP address and port to a local socket.
68 * - socket_listen()    : local server makes a passive open.
69 * - socket_connect()   : local client makes an active open to a remote server.
70 * - socket_accept()    : local server accept a new remote client.
71 * - socket_send()      : send data on a connected socket.
72 * - socket_recv()      : receive data on a connected socket.
73 * - socket_sendto()    : send a packet to a remote (IP address/port).
74 * - socket_recvfrom()  : receive a paket from a remote (IP address/port).
[1]75 *
[663]76 * 3) NIC TX and NIC_RX server threads
[657]77 *
[663]78 * The dev_nic_tx_server() & dev_nic_rx_server() functions defined below execute
79 * the user commands stored in the sockets to implement the [ETH / IP / TCP or UDP]
80 * protocols stack, as defined in the <ksocket.c> and <ksocket.h> files.
[657]81 *
[663]82 * 4) NIC driver API
[657]83 *
[663]84 * The generic NIC device "driver" API defines the following commands, used by the
85 * NIC_TX and NIC_RX server threads, running in the cluster containing the relevant chdev,
86 * to access the NIC_TX and NIC_RX packets queues:
[657]87 *
[663]88 * - READ     : consume one packet from the NIC_RX queue.
89 * - WRITE    : produce one packet to the NIC_TX queue.
[657]90 *
[1]91 * All RX or TX paquets are sent or received in standard 2 Kbytes kernel buffers,
[657]92 * that are dynamically allocated by the protocols stack.
[1]93 * The actual TX an RX queues structures depends on the hardware NIC implementation,
[657]94 * and are defined in the HAL specific driver code.
95 *
[663]96 * Moreover, the generic NIC device "driver" API defines the following commands,
97 * used directly by a client thread running in any cluster, to access the NIC device
98 * configuration or status registers:
99 *
100 * - GET_KEY      : get channel index from remote IP address and port
101 * - SET_RUN      : activate/desactivate one channel
102 * - GET_INSTRU   : get one instrumentation counter value
103 * - CLEAR_INSTRU : reset all instrumentation counters
104 *
[657]105 * WARNING: the WTI mailboxes used by the driver ro receive events from the hardware
106 * (available RX packet, or available free TX slot, for a given channel), must be
107 * statically allocated during the kernel initialisation phase, and must be
108 * routed to the cluster containing the associated TX/RX chdev and server thread.
109 *
[1]110 *****************************************************************************************/
111
112/****  Forward declarations  ****/
113
[3]114struct chdev_s;
[1]115
[663]116/*****************************************************************************************
117 *   Various constants used by the protocols stack
118 ****************************************************************************************/
[1]119
[663]120#define SRC_MAC_5              0x66         // This is a temporary short-cut for debug
121#define SRC_MAC_4              0x55
122#define SRC_MAC_3              0x44
123#define SRC_MAC_2              0x33
124#define SRC_MAC_1              0x22
125#define SRC_MAC_0              0x11
[657]126
[663]127#define DST_MAC_5              0x66         // This is a temporary short-cut for debug
128#define DST_MAC_4              0x55
129#define DST_MAC_3              0x44
130#define DST_MAC_2              0x33
131#define DST_MAC_1              0x22
132#define DST_MAC_0              0x11
133
[657]134#define TCP_HEAD_LEN           20
135#define UDP_HEAD_LEN           8
136#define IP_HEAD_LEN            20
137#define ETH_HEAD_LEN           14
138
139#define PROTOCOL_UDP           0x11
140#define PROTOCOL_TCP           0x06
141
[663]142#define TCP_ISS_CLIENT         0x10000      // initial sequence number for TCP client
143#define TCP_ISS_SERVER         0x20000      // initial sequence number for TCP server
144#define TCP_MAX_WINDOW         0xFFFFF      // initial TCP send window
[657]145
[663]146#define PAYLOAD_MAX_LEN        1500         // max length for an UDP packet / TCP segment
[657]147
148#define TCP_FLAG_FIN           0x01
149#define TCP_FLAG_SYN           0x02
150#define TCP_FLAG_RST           0x04
151#define TCP_FLAG_PSH           0x08
152#define TCP_FLAG_ACK           0x10
153#define TCP_FLAG_URG           0x20
154
155#define NIC_RX_BUF_SIZE        0x100000     // 1 Mbytes
156#define NIC_R2T_QUEUE_SIZE     0x64         // smallest KCM size
[663]157#define NIC_CRQ_QUEUE_SIZE     0x8          // actual size is 8 * sizeof(sockaddr_t)
158#define NIC_KERNEL_BUF_SIZE    0x800        // 2 Kbytes for one ETH/IP/TCP packet
[657]159
[668]160#define CMD_
161
[657]162/*****************************************************************************************
[663]163 * This structure defines the specific chdev extension for NIC device:
164 * - queue : local pointer on the memory mapped queue of TX or RX packets, used
165 *   by the NIC driver to move packets to/from the NIC hardware. The actual descriptor
166 *   depends on the NIC implementation.
167 * - root  : root of an xlist of sockets that are in the LISTEN state, waiting one or
168 *   several TCP connection requests from remote processes. It is only used by the
169 *   NIC_RX server thread attached to a NIC_RX chdev.
170 * - lock  : lock protecting concurrent access to the litening sockets list.
[657]171 ****************************************************************************************/
172
[1]173typedef struct nic_extend_s
174{
[663]175    void            * queue;    /*! pointer on NIC packets queue descriptor (RX or TX)  */
176    xlist_entry_t     root;     /*! root of listening sockets list (only used in RX[0]) */
177    remote_busylock_t lock;     /*! lock protecting this list  (only used in RX[0]      */
[1]178}
179nic_extend_t;
180
[657]181/*****************************************************************************************
[1]182 * This enum defines the various implementations of the generic NIC peripheral.
183 * This array must be kept consistent with the define in the arch_info.h file.
[657]184 ****************************************************************************************/
[1]185
[657]186typedef enum nic_impl_e
[1]187{
[407]188    IMPL_NIC_CBF =   0,     
[1]189    IMPL_NIC_I86 =   1,
190}
191nic_impl_t;
192
[657]193/****************************************************************************************
194 * This defines the (implementation independant) commands to access the NIC hardware.
[663]195 * There is two types of commands
196 * - The first 2 commands are used by the NIC_TX and NIC_RX server threads, and stored
197 *   in the server thread descriptor, to access the NIC_RX & NIC_TX packet queues.
198 *   The buffer is always a 2K bytes kernel buffer, containing an Ethernet packet.
199 * - The next 4 synchronous commands are used by the client th, and stored in the
200 *   client thread descriptor, to directly access the NIC registers.
[657]201 ****************************************************************************************/
[1]202
203typedef enum nic_cmd_e
204{
[663]205    NIC_CMD_WRITE        = 10,  /*! put one (given length) packet to TX queue           */
206    NIC_CMD_READ         = 11,  /*! get one (any length) packet from RX queue           */
207
208    NIC_CMD_GET_KEY      = 20,  /*! return channel index from IP address and port       */ 
209    NIC_CMD_SET_RUN      = 21,  /*! enable/disable one NIC channel                      */
210    NIC_CMD_GET_INSTRU   = 22,  /*! return one intrumentation register value            */
211    NIC_CMD_CLEAR_INSTRU = 23,  /*! reset all instrumentation registers                 */
[1]212}
213nic_cmd_t;
214
215typedef struct nic_command_s
216{
[657]217    xptr_t      dev_xp;       /*! extended pointer on NIC chdev descriptor              */
218    nic_cmd_t   type;         /*! command type                                          */
[663]219    uint8_t   * buffer;       /*! local pointer on kernel buffer                        */ 
[657]220    uint32_t    length;       /*! number of bytes in buffer                             */
221    uint32_t    status;       /*! return value (depends on command type)                */
222    uint32_t    error;        /*! return an error from the hardware (0 if no error)     */
[1]223}
224nic_command_t;
225
226/******************************************************************************************
[3]227 * This function completes the NIC-RX and NIC-TX chdev descriptors initialisation.
228 * namely the link with the implementation specific driver.
229 * The func, impl, channel, is_rx, base fields have been previously initialised.
230 * It calls the specific driver initialisation function, to initialise the hardware
231 * device and the specific data structures when required.
232 * It creates the associated server thread and allocates a WTI from local ICU.
[663]233 * For a TX_NIC chedv, it allocates and initializes the R2T queue used by the
234 * NIC_RX[channel] server to send direct requests to the NIC_TX[channel] server,
235 * and the CRQ queue used to register connection requests.
[3]236 * It must de executed by a local thread.
[663]237 * For NIC_TX and NIC_RX chdevs, the "wait_root" field is actually a list of sockets.
[1]238 ******************************************************************************************
[3]239 * @ chdev    : local pointer on NIC chdev descriptor.
[1]240 *****************************************************************************************/
[3]241void dev_nic_init( struct chdev_s * chdev );
[1]242
[663]243/* Functions directly called by a client thread in any cluster */
244 
245/******************************************************************************************
246 * This function compute a channel index in range [0,nic_channels[ from the remote IP
247 * address <addr> and <port>, by calling the relevant driver command.
248 ******************************************************************************************
249 * @ addr     : [in] IP address.
250 * @ port     : [in] TCP/UDP port.
251 * @ return the selected channel index
252 *****************************************************************************************/
253uint32_t dev_nic_get_key( uint32_t addr,
254                          uint16_t port );
[657]255
[663]256/******************************************************************************************
257 * This function activate / de-activate a NIC channel DMA engine identified by the
258 * <channel> argument, as defined by the <run> argument.
259 ******************************************************************************************
260 * @ channel  : [in] NIC channel index.
261 * @ run      : [in] activate if non-zero / desactivate if zero.
262 * @ return 0 if success / return -1 if error.
263 *****************************************************************************************/
264error_t dev_nic_set_run( uint32_t channel,
265                         uint32_t run );
[657]266
[1]267/******************************************************************************************
[657]268 * This instrumentation function displays on the TXT0 kernel terminal the content
269 * of the instrumentation registers contained in the NIC device.
[663]270 ******************************************************************************************
271 * @ return 0 if success / return -1 if error.
[1]272 *****************************************************************************************/
[663]273error_t dev_nic_get_instru( void );
[1]274
275/******************************************************************************************
[657]276 * This instrumentation function reset all instrumentation registers contained
277 * in the NIC device.
[663]278 ******************************************************************************************
279 * @ return 0 if success / return -1 if error.
[657]280 *****************************************************************************************/
[663]281error_t dev_nic_clear_instru( void );
[657]282
283/* Functions executed by the TX and RX server threads */ 
284 
285/******************************************************************************************
286 * This function is executed by the server thread associated to a NIC_TX[channel] chdev.
287 * This TX server thread is created by the dev_nic_init() function.
288 * It build and send UDP packets or TCP segments for all clients threads registered in
289 * the NIC_TX[channel] chdev. The command types are (CONNECT / SEND / CLOSE), and the
290 * priority between clients is round-robin. It takes into account the request registered
291 * by the RX server thread in the R2T queue associated to the involved socket.
292 * When a command is completed, it unblocks the client thread. For a SEND command, the
293 * last byte must have been sent for an UDP socket, and it must have been acknowledged
294 * for a TCP socket.
295 * When the TX client threads queue is empty, it blocks on THREAD_BLOCKED_CLIENT
296 * condition and deschedules. It is re-activated by a client thread registering a command.
[663]297 * When the NIC_TX packet queue is full, it blocks on the THREAD_BLOCKED_ISR condition
298 * and deschedules. It is reactivated by the NIC_TX DMA engine.
[1]299 ******************************************************************************************
[657]300 * Implementation note:
301 * It execute an infinite loop in which it takes the lock protecting the clients list
302 * to build a "kleenex" list of currently registered clients.
303 * For each client registered in this "kleenex" list, it takes the lock protecting the
304 * socket state, build one packet/segment in a local 2K bytes kernel buffer, calls the
305 * transport layer to add the UDP/TCP header, calls the IP layer to add the IP header,
306 * calls the ETH layer to add the ETH header, and moves the packet to the NIC_TX_QUEUE.
307 * Finally, it updates the socket state, and release the socket lock.
308 ******************************************************************************************
309 * @ chdev    : [in] local pointer on one local NIC_TX[channel] chdev descriptor.
[1]310 *****************************************************************************************/
[657]311void dev_nic_tx_server( struct chdev_s * chdev );
[1]312
313
314/******************************************************************************************
[657]315 * This function is executed by the server thread associated to a NIC_RX[channel] chdev.
316 * This RX server thread is created by the dev_nic_init() function.
317 * It handles all UDP packets or TCP segments received by the sockets attached to
318 * the NIC_RX[channel] chdev. It writes the received data in the socket rcv_buf, and
319 * unblocks the client thread waiting on a RECV command.
320 * To implement the three steps handshahke required by a TCP connection, it posts direct
321 * requests to the TX server, using the R2T queue attached to the involved socket.
322 * It blocks on the THREAD_BLOCKED_ISR condition and deschedules when the NIC_RX_QUEUE
[663]323 * is empty, and is re-activated by the NIC_RX_ISR, when the queue becomes non empty.
[1]324 ******************************************************************************************
[657]325 * Implementation note:
326 * It executes an infinite loop in which it extracts one packet from the NIC_RX_QUEUE
327 * of received packets, copies this packet in a local 2 kbytes kernel buffer, checks
328 * the Ethernet header, checks the IP header, calls the relevant (TCP or UDP) transport
329 * protocol that search a matching socket for the received packet. It copies the payload
330 * to the relevant socket rcv_buf when the packet is acceptable, and unblocks the client
331 * thread. It discard the packet if no socket found.
332 ******************************************************************************************
333 * @ chdev    : [in] local pointer on one local NIC_RX[channel] chdev descriptor.
[1]334 *****************************************************************************************/
[657]335void dev_nic_rx_server( struct chdev_s * chdev );
[1]336
[663]337/******************************************************************************************
338 * This function displays all the fields of an ETH/IP/TCP segment or ETH/IP/UDP packet.
339 ******************************************************************************************
340 * @ is_tx   : [in] sent packet if true / received packet if false.
341 * @ pid     : [in] process identifier.
342 * @ trdid   : [in] thread identifier.
343 * @ cycle   : [in] date (number of cycles).
344 * @ buf     : [in] local pointer on kernel buffer containing the packet.
345 *****************************************************************************************/
346void dev_nic_packet_display( bool_t    is_tx,
347                             pid_t     pid,
348                             trdid_t   trdid,
349                             uint32_t  cycle,
350                             uint8_t * buf );
351
[1]352#endif  /* _DEV_NIC_H */
Note: See TracBrowser for help on using the repository browser.