123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241242243244245246247248249250251252253254255256257258259260261262263264265266267268269270271272273274275276277278279280281282283284285286287288289290291292293294295296297298299300301302303304305306307308309310311312313314315316317318319320321322323324325326327328329330331332333334335336337338339340341342343344345346347348349350351352353354355356357358359360361362363364365366367368369370371372373374375376377378379380381382383384385386387388389390391392393394395396397398399400401402403404405406407408409410411412413414415416417418419420421422423424425426427428429430431432433434435436437438439440441442443444445446447448449450451452453454455456457458459460461462463464465466467468469470471472473474475476477478479480481482483484485486487488489490491492493494495496497498499500501502503504505506507508509510511512513514515516517518519520521 |
- #include <string.h>
- #include <stdint.h>
- #include <errno.h>
- #include <byteswap.h>
- #include <malloc.h>
- #include <vsprintf.h>
- #include <gpxe/list.h>
- #include <gpxe/in.h>
- #include <gpxe/arp.h>
- #include <gpxe/if_ether.h>
- #include <gpxe/pkbuff.h>
- #include <gpxe/netdevice.h>
- #include "uip/uip.h"
- #include <gpxe/ip.h>
- #include <gpxe/tcpip.h>
-
- /** @file
- *
- * IPv4 protocol
- *
- * The gPXE IP stack is currently implemented on top of the uIP
- * protocol stack. This file provides wrappers around uIP so that
- * higher-level protocol implementations do not need to talk directly
- * to uIP (which has a somewhat baroque API).
- *
- */
-
- /* Unique IP datagram identification number */
- static uint16_t next_ident = 0;
-
- struct net_protocol ipv4_protocol;
-
- /** An IPv4 address/routing table entry */
- struct ipv4_miniroute {
- /** List of miniroutes */
- struct list_head list;
- /** Network device */
- struct net_device *netdev;
- /** IPv4 address */
- struct in_addr address;
- /** Subnet mask */
- struct in_addr netmask;
- /** Gateway address */
- struct in_addr gateway;
- };
-
/** Fragment reassembly buffers currently in progress */
static LIST_HEAD ( frag_buffers );

/** IPv4 miniroutes (address/routing table) */
static LIST_HEAD ( miniroutes );
-
- /**
- * Add IPv4 interface
- *
- * @v netdev Network device
- * @v address IPv4 address
- * @v netmask Subnet mask
- * @v gateway Gateway address (or @c INADDR_NONE for no gateway)
- * @ret rc Return status code
- *
- */
- int add_ipv4_address ( struct net_device *netdev, struct in_addr address,
- struct in_addr netmask, struct in_addr gateway ) {
- struct ipv4_miniroute *miniroute;
-
- /* Allocate and populate miniroute structure */
- miniroute = malloc ( sizeof ( *miniroute ) );
- if ( ! miniroute )
- return -ENOMEM;
- miniroute->netdev = netdev;
- miniroute->address = address;
- miniroute->netmask = netmask;
- miniroute->gateway = gateway;
-
- /* Add to end of list if we have a gateway, otherwise to start
- * of list.
- */
- if ( gateway.s_addr != INADDR_NONE ) {
- list_add_tail ( &miniroute->list, &miniroutes );
- } else {
- list_add ( &miniroute->list, &miniroutes );
- }
- return 0;
- }
-
- /**
- * Remove IPv4 interface
- *
- * @v netdev Network device
- */
- void del_ipv4_address ( struct net_device *netdev ) {
- struct ipv4_miniroute *miniroute;
-
- list_for_each_entry ( miniroute, &miniroutes, list ) {
- if ( miniroute->netdev == netdev ) {
- list_del ( &miniroute->list );
- break;
- }
- }
- }
-
- /**
- * Dump IPv4 packet header
- *
- * @v iphdr IPv4 header
- */
- static void ipv4_dump ( struct iphdr *iphdr __unused ) {
-
- DBG ( "IP4 %p transmitting %p+%d ident %d protocol %d header-csum %x\n",
- &ipv4_protocol, iphdr, ntohs ( iphdr->len ), ntohs ( iphdr->ident ),
- iphdr->protocol, ntohs ( iphdr->chksum ) );
- DBG ( "src %s, dest %s\n", inet_ntoa ( iphdr->src ), inet_ntoa ( iphdr->dest ) );
- }
-
- /**
- * Fragment reassembly counter timeout
- *
- * @v timer Retry timer
- * @v over If asserted, the timer is greater than @c MAX_TIMEOUT
- */
- static void ipv4_frag_expired ( struct retry_timer *timer __unused,
- int over ) {
- if ( over ) {
- DBG ( "Fragment reassembly timeout" );
- /* Free the fragment buffer */
- }
- }
-
/**
 * Free fragment buffer
 *
 * @v fragbuf	Fragment buffer (may be NULL)
 *
 * Releases only the fragment buffer descriptor itself.  The
 * descriptor is obtained from malloc() in ipv4_reassemble(), so it
 * must be returned with free() rather than free_dma().  The caller
 * remains responsible for the reassembly packet buffer, the list
 * linkage and the reassembly timer.
 */
static void free_fragbuf ( struct frag_buffer *fragbuf ) {
	/* NOTE(review): assumes free() accepts NULL as in ISO C; the
	 * explicit guard is kept in case this environment differs.
	 */
	if ( fragbuf ) {
		free ( fragbuf );
	}
}
-
- /**
- * Fragment reassembler
- *
- * @v pkb Packet buffer, fragment of the datagram
- * @ret frag_pkb Reassembled packet, or NULL
- */
- static struct pk_buff * ipv4_reassemble ( struct pk_buff * pkb ) {
- struct iphdr *iphdr = pkb->data;
- struct frag_buffer *fragbuf;
-
- /**
- * Check if the fragment belongs to any fragment series
- */
- list_for_each_entry ( fragbuf, &frag_buffers, list ) {
- if ( fragbuf->ident == iphdr->ident &&
- fragbuf->src.s_addr == iphdr->src.s_addr ) {
- /**
- * Check if the packet is the expected fragment
- *
- * The offset of the new packet must be equal to the
- * length of the data accumulated so far (the length of
- * the reassembled packet buffer
- */
- if ( pkb_len ( fragbuf->frag_pkb ) ==
- ( iphdr->frags & IP_MASK_OFFSET ) ) {
- /**
- * Append the contents of the fragment to the
- * reassembled packet buffer
- */
- pkb_pull ( pkb, sizeof ( *iphdr ) );
- memcpy ( pkb_put ( fragbuf->frag_pkb,
- pkb_len ( pkb ) ),
- pkb->data, pkb_len ( pkb ) );
- free_pkb ( pkb );
-
- /** Check if the fragment series is over */
- if ( !iphdr->frags & IP_MASK_MOREFRAGS ) {
- pkb = fragbuf->frag_pkb;
- free_fragbuf ( fragbuf );
- return pkb;
- }
-
- } else {
- /* Discard the fragment series */
- free_fragbuf ( fragbuf );
- free_pkb ( pkb );
- }
- return NULL;
- }
- }
-
- /** Check if the fragment is the first in the fragment series */
- if ( iphdr->frags & IP_MASK_MOREFRAGS &&
- ( ( iphdr->frags & IP_MASK_OFFSET ) == 0 ) ) {
-
- /** Create a new fragment buffer */
- fragbuf = ( struct frag_buffer* ) malloc ( sizeof( *fragbuf ) );
- fragbuf->ident = iphdr->ident;
- fragbuf->src = iphdr->src;
-
- /* Set up the reassembly packet buffer */
- fragbuf->frag_pkb = alloc_pkb ( IP_FRAG_PKB_SIZE );
- pkb_pull ( pkb, sizeof ( *iphdr ) );
- memcpy ( pkb_put ( fragbuf->frag_pkb, pkb_len ( pkb ) ),
- pkb->data, pkb_len ( pkb ) );
- free_pkb ( pkb );
-
- /* Set the reassembly timer */
- fragbuf->frag_timer.timeout = IP_FRAG_TIMEOUT;
- fragbuf->frag_timer.expired = ipv4_frag_expired;
- start_timer ( &fragbuf->frag_timer );
-
- /* Add the fragment buffer to the list of fragment buffers */
- list_add ( &fragbuf->list, &frag_buffers );
- }
-
- return NULL;
- }
-
-
- /**
- * Complete the transport-layer checksum
- *
- * @v pkb Packet buffer
- * @v tcpip Transport-layer protocol
- *
- * This function calculates the tcpip
- */
- static void ipv4_tx_csum ( struct pk_buff *pkb,
- struct tcpip_protocol *tcpip ) {
- struct iphdr *iphdr = pkb->data;
- struct ipv4_pseudo_header pshdr;
- uint16_t *csum = ( ( ( void * ) iphdr ) + sizeof ( *iphdr )
- + tcpip->csum_offset );
-
- /* Calculate pseudo header */
- pshdr.src = iphdr->src;
- pshdr.dest = iphdr->dest;
- pshdr.zero_padding = 0x00;
- pshdr.protocol = iphdr->protocol;
- /* This is only valid when IPv4 does not have options */
- pshdr.len = htons ( pkb_len ( pkb ) - sizeof ( *iphdr ) );
-
- /* Update the checksum value */
- *csum = tcpip_continue_chksum ( *csum, &pshdr, sizeof ( pshdr ) );
- }
-
- /**
- * Calculate the transport-layer checksum while processing packets
- */
- static uint16_t ipv4_rx_csum ( struct pk_buff *pkb __unused,
- uint8_t trans_proto __unused ) {
- /**
- * This function needs to be implemented. Until then, it will return
- * 0xffffffff every time
- */
- return 0xffff;
- }
-
- /**
- * Transmit IP packet
- *
- * @v pkb Packet buffer
- * @v tcpip Transport-layer protocol
- * @v st_dest Destination network-layer address
- * @ret rc Status
- *
- * This function expects a transport-layer segment and prepends the IP header
- */
- static int ipv4_tx ( struct pk_buff *pkb,
- struct tcpip_protocol *tcpip_protocol,
- struct sockaddr_tcpip *st_dest ) {
- struct iphdr *iphdr = pkb_push ( pkb, sizeof ( *iphdr ) );
- struct sockaddr_in *sin_dest = ( ( struct sockaddr_in * ) st_dest );
- struct ipv4_miniroute *miniroute;
- struct net_device *netdev = NULL;
- struct in_addr next_hop;
- uint8_t ll_dest_buf[MAX_LL_ADDR_LEN];
- const uint8_t *ll_dest = ll_dest_buf;
- int rc;
-
- /* Fill up the IP header, except source address */
- iphdr->verhdrlen = ( IP_VER << 4 ) | ( sizeof ( *iphdr ) / 4 );
- iphdr->service = IP_TOS;
- iphdr->len = htons ( pkb_len ( pkb ) );
- iphdr->ident = htons ( next_ident++ );
- iphdr->frags = 0;
- iphdr->ttl = IP_TTL;
- iphdr->protocol = tcpip_protocol->tcpip_proto;
-
- /* Copy destination address */
- iphdr->dest = sin_dest->sin_addr;
-
- /**
- * All fields in the IP header filled in except the source network
- * address (which requires routing) and the header checksum (which
- * requires the source network address). As the pseudo header requires
- * the source address as well and the transport-layer checksum is
- * updated after routing.
- */
-
- /* Use routing table to identify next hop and transmitting netdev */
- next_hop = iphdr->dest;
- list_for_each_entry ( miniroute, &miniroutes, list ) {
- int local, has_gw;
-
- local = ( ( ( iphdr->dest.s_addr ^ miniroute->address.s_addr )
- & miniroute->netmask.s_addr ) == 0 );
- has_gw = ( miniroute->gateway.s_addr != INADDR_NONE );
- if ( local || has_gw ) {
- netdev = miniroute->netdev;
- iphdr->src = miniroute->address;
- if ( ! local )
- next_hop = miniroute->gateway;
- break;
- }
- }
- /* Abort if no network device identified */
- if ( ! netdev ) {
- DBG ( "No route to %s\n", inet_ntoa ( iphdr->dest ) );
- rc = -EHOSTUNREACH;
- goto err;
- }
-
- /* Calculate the transport layer checksum */
- if ( tcpip_protocol->csum_offset > 0 ) {
- ipv4_tx_csum ( pkb, tcpip_protocol );
- }
-
- /* Calculate header checksum, in network byte order */
- iphdr->chksum = 0;
- iphdr->chksum = tcpip_chksum ( iphdr, sizeof ( *iphdr ) );
-
- /* Print IP4 header for debugging */
- ipv4_dump ( iphdr );
-
- /* Determine link-layer destination address */
- if ( next_hop.s_addr == INADDR_BROADCAST ) {
- /* Broadcast address */
- ll_dest = netdev->ll_protocol->ll_broadcast;
- } else if ( IN_MULTICAST ( next_hop.s_addr ) ) {
- /* Special case: IPv4 multicast over Ethernet. This
- * code may need to be generalised once we find out
- * what happens for other link layers.
- */
- uint8_t *next_hop_bytes = ( uint8_t * ) &next_hop;
- ll_dest_buf[0] = 0x01;
- ll_dest_buf[0] = 0x00;
- ll_dest_buf[0] = 0x5e;
- ll_dest_buf[3] = next_hop_bytes[1] & 0x7f;
- ll_dest_buf[4] = next_hop_bytes[2];
- ll_dest_buf[5] = next_hop_bytes[3];
- } else {
- /* Unicast address: resolve via ARP */
- if ( ( rc = arp_resolve ( netdev, &ipv4_protocol, &next_hop,
- &iphdr->src, ll_dest_buf ) ) != 0 ) {
- DBG ( "No ARP entry for %s\n",
- inet_ntoa ( iphdr->dest ) );
- goto err;
- }
- }
-
- /* Hand off to link layer */
- return net_tx ( pkb, netdev, &ipv4_protocol, ll_dest );
-
- err:
- free_pkb ( pkb );
- return rc;
- }
-
- /**
- * Process incoming packets
- *
- * @v pkb Packet buffer
- * @v netdev Network device
- * @v ll_source Link-layer destination source
- *
- * This function expects an IP4 network datagram. It processes the headers
- * and sends it to the transport layer.
- */
- static int ipv4_rx ( struct pk_buff *pkb, struct net_device *netdev __unused,
- const void *ll_source __unused ) {
- struct iphdr *iphdr = pkb->data;
- union {
- struct sockaddr_in sin;
- struct sockaddr_tcpip st;
- } src, dest;
- uint16_t chksum;
-
- /* Sanity check */
- if ( pkb_len ( pkb ) < sizeof ( *iphdr ) ) {
- DBG ( "IP datagram too short (%d bytes)\n", pkb_len ( pkb ) );
- goto err;
- }
-
- /* Print IP4 header for debugging */
- ipv4_dump ( iphdr );
-
- /* Validate version and header length */
- if ( iphdr->verhdrlen != 0x45 ) {
- DBG ( "Bad version and header length %x\n", iphdr->verhdrlen );
- goto err;
- }
-
- /* Validate length of IP packet */
- if ( ntohs ( iphdr->len ) > pkb_len ( pkb ) ) {
- DBG ( "Inconsistent packet length %d\n",
- ntohs ( iphdr->len ) );
- goto err;
- }
-
- /* Verify the checksum */
- if ( ( chksum = ipv4_rx_csum ( pkb, iphdr->protocol ) ) != 0xffff ) {
- DBG ( "Bad checksum %x\n", chksum );
- }
- /* Fragment reassembly */
- if ( iphdr->frags & IP_MASK_MOREFRAGS ||
- ( !iphdr->frags & IP_MASK_MOREFRAGS &&
- iphdr->frags & IP_MASK_OFFSET != 0 ) ) {
- /* Pass the fragment to the reassembler ipv4_ressable() which
- * either returns a fully reassembled packet buffer or NULL.
- */
- pkb = ipv4_reassemble ( pkb );
- if ( !pkb ) {
- return 0;
- }
- }
-
- /* To reduce code size, the following functions are not implemented:
- * 1. Check the destination address
- * 2. Check the TTL field
- * 3. Check the service field
- */
-
- /* Construct socket addresses */
- memset ( &src, 0, sizeof ( src ) );
- src.sin.sin_family = AF_INET;
- src.sin.sin_addr = iphdr->src;
- memset ( &dest, 0, sizeof ( dest ) );
- dest.sin.sin_family = AF_INET;
- dest.sin.sin_addr = iphdr->dest;
-
- /* Strip header */
- pkb_unput ( pkb, pkb_len ( pkb ) - ntohs ( iphdr->len ) );
- pkb_pull ( pkb, sizeof ( *iphdr ) );
-
- /* Send it to the transport layer */
- return tcpip_rx ( pkb, iphdr->protocol, &src.st, &dest.st );
-
- err:
- free_pkb ( pkb );
- return -EINVAL;
- }
-
- /**
- * Check existence of IPv4 address for ARP
- *
- * @v netdev Network device
- * @v net_addr Network-layer address
- * @ret rc Return status code
- */
- static int ipv4_arp_check ( struct net_device *netdev, const void *net_addr ) {
- const struct in_addr *address = net_addr;
- struct ipv4_miniroute *miniroute;
-
- list_for_each_entry ( miniroute, &miniroutes, list ) {
- if ( ( miniroute->netdev == netdev ) &&
- ( miniroute->address.s_addr == address->s_addr ) ) {
- /* Found matching address */
- return 0;
- }
- }
- return -ENOENT;
- }
-
/**
 * Convert IPv4 address to dotted-quad notation
 *
 * @v in	IP address
 * @ret string	IP address in dotted-quad notation
 *
 * The four bytes of @c in are printed in memory order.  The result is
 * written to a single static buffer that is overwritten by the next
 * call, so the returned string must be consumed (or copied) before
 * inet_ntoa() is called again.
 */
char * inet_ntoa ( struct in_addr in ) {
	static char buf[16]; /* "xxx.xxx.xxx.xxx" */
	uint8_t *bytes = ( uint8_t * ) &in;

	sprintf ( buf, "%d.%d.%d.%d", bytes[0], bytes[1], bytes[2], bytes[3] );
	return buf;
}
-
- /**
- * Transcribe IP address
- *
- * @v net_addr IP address
- * @ret string IP address in dotted-quad notation
- *
- */
- static const char * ipv4_ntoa ( const void *net_addr ) {
- return inet_ntoa ( * ( ( struct in_addr * ) net_addr ) );
- }
-
- /** IPv4 protocol */
- struct net_protocol ipv4_protocol __net_protocol = {
- .name = "IP",
- .net_proto = htons ( ETH_P_IP ),
- .net_addr_len = sizeof ( struct in_addr ),
- .rx = ipv4_rx,
- .ntoa = ipv4_ntoa,
- };
-
- /** IPv4 TCPIP net protocol */
- struct tcpip_net_protocol ipv4_tcpip_protocol __tcpip_net_protocol = {
- .name = "IPv4",
- .sa_family = AF_INET,
- .tx = ipv4_tx,
- };
-
- /** IPv4 ARP protocol */
- struct arp_net_protocol ipv4_arp_protocol __arp_net_protocol = {
- .net_protocol = &ipv4_protocol,
- .check = ipv4_arp_check,
- };
|