You can not select more than 25 topics Topics must start with a letter or number, can include dashes ('-') and can be up to 35 characters long.

netdevice.c 34KB

12345678910111213141516171819202122232425262728293031323334353637383940414243444546474849505152535455565758596061626364656667686970717273747576777879808182838485868788899091929394959697989910010110210310410510610710810911011111211311411511611711811912012112212312412512612712812913013113213313413513613713813914014114214314414514614714814915015115215315415515615715815916016116216316416516616716816917017117217317417517617717817918018118218318418518618718818919019119219319419519619719819920020120220320420520620720820921021121221321421521621721821922022122222322422522622722822923023123223323423523623723823924024124224324424524624724824925025125225325425525625725825926026126226326426526626726826927027127227327427527627727827928028128228328428528628728828929029129229329429529629729829930030130230330430530630730830931031131231331431531631731831932032132232332432532632732832933033133233333433533633733833934034134234334434534634734834935035135235335435535635735835936036136236336436536636736836937037137237337437537637737837938038138238338438538638738838939039139239339439539639739839940040140240340440540640740840941041141241341441541641741841942042142242342442542642742842943043143243343443543643743843944044144244344444544644744844945045145245345445545645745845946046146246346446546646746846947047147247347447547647747847948048148248348448548648748848949049149249349449549649749849950050150250350450550650750850951051151251351451551651751851952052152252352452552652752852953053153253353453553653753853954054154254354454554654754854955055155255355455555655755855956056156256356456556656756856957057157257357457557657757857958058158258358458558658758858959059159259359459559659759859960060160260360460560660760860961061161261361461561661761861962062162262362462562662762862963063163263363463563663763863964064164264364464564664764864965065165265365465565665765865966066166266366466566666766866967067167267367467567667767867968068168268368468568668768868969069169269369469569669769869970070170270
37047057067077087097107117127137147157167177187197207217227237247257267277287297307317327337347357367377387397407417427437447457467477487497507517527537547557567577587597607617627637647657667677687697707717727737747757767777787797807817827837847857867877887897907917927937947957967977987998008018028038048058068078088098108118128138148158168178188198208218228238248258268278288298308318328338348358368378388398408418428438448458468478488498508518528538548558568578588598608618628638648658668678688698708718728738748758768778788798808818828838848858868878888898908918928938948958968978988999009019029039049059069079089099109119129139149159169179189199209219229239249259269279289299309319329339349359369379389399409419429439449459469479489499509519529539549559569579589599609619629639649659669679689699709719729739749759769779789799809819829839849859869879889899909919929939949959969979989991000100110021003100410051006100710081009101010111012101310141015101610171018101910201021102210231024102510261027102810291030103110321033103410351036103710381039104010411042104310441045104610471048104910501051105210531054105510561057105810591060106110621063106410651066106710681069107010711072107310741075107610771078107910801081108210831084108510861087108810891090109110921093109410951096109710981099110011011102110311041105110611071108110911101111111211131114111511161117111811191120112111221123112411251126112711281129113011311132113311341135113611371138113911401141114211431144114511461147114811491150115111521153115411551156115711581159116011611162116311641165116611671168116911701171117211731174117511761177117811791180118111821183118411851186118711881189119011911192119311941195119611971198119912001201120212031204120512061207120812091210121112121213121412151216121712181219122012211222122312241225122612271228122912301231123212331234123512361237123812391240124112421243124412451246124712481249125012511252125312541255125612571258125912601261126212631264126512661267126812691270127112721273127412751276127
712781279128012811282128312841285128612871288
  1. /*
  2. * Copyright (C) 2006 Michael Brown <mbrown@fensystems.co.uk>.
  3. *
  4. * This program is free software; you can redistribute it and/or
  5. * modify it under the terms of the GNU General Public License as
  6. * published by the Free Software Foundation; either version 2 of the
  7. * License, or any later version.
  8. *
  9. * This program is distributed in the hope that it will be useful, but
  10. * WITHOUT ANY WARRANTY; without even the implied warranty of
  11. * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU
  12. * General Public License for more details.
  13. *
  14. * You should have received a copy of the GNU General Public License
  15. * along with this program; if not, write to the Free Software
  16. * Foundation, Inc., 51 Franklin Street, Fifth Floor, Boston, MA
  17. * 02110-1301, USA.
  18. *
  19. * You can also choose to distribute this program under the terms of
  20. * the Unmodified Binary Distribution Licence (as given in the file
  21. * COPYING.UBDL), provided that you have satisfied its requirements.
  22. */
  23. FILE_LICENCE ( GPL2_OR_LATER_OR_UBDL );
  24. #include <stdint.h>
  25. #include <stdlib.h>
  26. #include <stdio.h>
  27. #include <byteswap.h>
  28. #include <string.h>
  29. #include <errno.h>
  30. #include <config/general.h>
  31. #include <ipxe/if_ether.h>
  32. #include <ipxe/iobuf.h>
  33. #include <ipxe/tables.h>
  34. #include <ipxe/process.h>
  35. #include <ipxe/init.h>
  36. #include <ipxe/malloc.h>
  37. #include <ipxe/device.h>
  38. #include <ipxe/errortab.h>
  39. #include <ipxe/profile.h>
  40. #include <ipxe/fault.h>
  41. #include <ipxe/vlan.h>
  42. #include <ipxe/netdevice.h>
  43. /** @file
  44. *
  45. * Network device management
  46. *
  47. */
  48. /** List of network devices */
  49. struct list_head net_devices = LIST_HEAD_INIT ( net_devices );
  50. /** List of open network devices, in reverse order of opening */
  51. static struct list_head open_net_devices = LIST_HEAD_INIT ( open_net_devices );
  52. /** Network device index */
  53. static unsigned int netdev_index = 0;
  54. /** Network polling profiler */
  55. static struct profiler net_poll_profiler __profiler = { .name = "net.poll" };
  56. /** Network receive profiler */
  57. static struct profiler net_rx_profiler __profiler = { .name = "net.rx" };
  58. /** Network transmit profiler */
  59. static struct profiler net_tx_profiler __profiler = { .name = "net.tx" };
  60. /** Default unknown link status code */
  61. #define EUNKNOWN_LINK_STATUS __einfo_error ( EINFO_EUNKNOWN_LINK_STATUS )
  62. #define EINFO_EUNKNOWN_LINK_STATUS \
  63. __einfo_uniqify ( EINFO_EINPROGRESS, 0x01, "Unknown" )
  64. /** Default not-yet-attempted-configuration status code */
  65. #define EUNUSED_CONFIG __einfo_error ( EINFO_EUNUSED_CONFIG )
  66. #define EINFO_EUNUSED_CONFIG \
  67. __einfo_uniqify ( EINFO_EINPROGRESS, 0x02, "Unused" )
  68. /** Default configuration-in-progress status code */
  69. #define EINPROGRESS_CONFIG __einfo_error ( EINFO_EINPROGRESS_CONFIG )
  70. #define EINFO_EINPROGRESS_CONFIG \
  71. __einfo_uniqify ( EINFO_EINPROGRESS, 0x03, "Incomplete" )
  72. /** Default link-down status code */
  73. #define ENOTCONN_LINK_DOWN __einfo_error ( EINFO_ENOTCONN_LINK_DOWN )
  74. #define EINFO_ENOTCONN_LINK_DOWN \
  75. __einfo_uniqify ( EINFO_ENOTCONN, 0x01, "Down" )
  76. /** Human-readable message for the default link statuses */
  77. struct errortab netdev_errors[] __errortab = {
  78. __einfo_errortab ( EINFO_EUNKNOWN_LINK_STATUS ),
  79. __einfo_errortab ( EINFO_ENOTCONN_LINK_DOWN ),
  80. __einfo_errortab ( EINFO_EUNUSED_CONFIG ),
  81. __einfo_errortab ( EINFO_EINPROGRESS_CONFIG ),
  82. };
  83. /**
  84. * Check whether or not network device has a link-layer address
  85. *
  86. * @v netdev Network device
  87. * @ret has_ll_addr Network device has a link-layer address
  88. */
  89. static int netdev_has_ll_addr ( struct net_device *netdev ) {
  90. uint8_t *ll_addr = netdev->ll_addr;
  91. size_t remaining = sizeof ( netdev->ll_addr );
  92. while ( remaining-- ) {
  93. if ( *(ll_addr++) != 0 )
  94. return 1;
  95. }
  96. return 0;
  97. }
  98. /**
  99. * Notify drivers of network device or link state change
  100. *
  101. * @v netdev Network device
  102. */
  103. static void netdev_notify ( struct net_device *netdev ) {
  104. struct net_driver *driver;
  105. for_each_table_entry ( driver, NET_DRIVERS ) {
  106. if ( driver->notify )
  107. driver->notify ( netdev );
  108. }
  109. }
  110. /**
  111. * Freeze network device receive queue processing
  112. *
  113. * @v netdev Network device
  114. */
  115. void netdev_rx_freeze ( struct net_device *netdev ) {
  116. /* Mark receive queue processing as frozen */
  117. netdev->state |= NETDEV_RX_FROZEN;
  118. /* Notify drivers of change */
  119. netdev_notify ( netdev );
  120. }
  121. /**
  122. * Unfreeze network device receive queue processing
  123. *
  124. * @v netdev Network device
  125. */
  126. void netdev_rx_unfreeze ( struct net_device *netdev ) {
  127. /* Mark receive queue processing as not frozen */
  128. netdev->state &= ~NETDEV_RX_FROZEN;
  129. /* Notify drivers of change */
  130. netdev_notify ( netdev );
  131. }
  132. /**
  133. * Mark network device as having a specific link state
  134. *
  135. * @v netdev Network device
  136. * @v rc Link status code
  137. */
  138. void netdev_link_err ( struct net_device *netdev, int rc ) {
  139. /* Stop link block timer */
  140. stop_timer ( &netdev->link_block );
  141. /* Record link state */
  142. netdev->link_rc = rc;
  143. if ( netdev->link_rc == 0 ) {
  144. DBGC ( netdev, "NETDEV %s link is up\n", netdev->name );
  145. } else {
  146. DBGC ( netdev, "NETDEV %s link is down: %s\n",
  147. netdev->name, strerror ( netdev->link_rc ) );
  148. }
  149. /* Notify drivers of link state change */
  150. netdev_notify ( netdev );
  151. }
  152. /**
  153. * Mark network device as having link down
  154. *
  155. * @v netdev Network device
  156. */
  157. void netdev_link_down ( struct net_device *netdev ) {
  158. /* Avoid clobbering a more detailed link status code, if one
  159. * is already set.
  160. */
  161. if ( ( netdev->link_rc == 0 ) ||
  162. ( netdev->link_rc == -EUNKNOWN_LINK_STATUS ) ) {
  163. netdev_link_err ( netdev, -ENOTCONN_LINK_DOWN );
  164. }
  165. }
  166. /**
  167. * Mark network device link as being blocked
  168. *
  169. * @v netdev Network device
  170. * @v timeout Timeout (in ticks)
  171. */
  172. void netdev_link_block ( struct net_device *netdev, unsigned long timeout ) {
  173. /* Start link block timer */
  174. if ( ! netdev_link_blocked ( netdev ) ) {
  175. DBGC ( netdev, "NETDEV %s link blocked for %ld ticks\n",
  176. netdev->name, timeout );
  177. }
  178. start_timer_fixed ( &netdev->link_block, timeout );
  179. }
  180. /**
  181. * Mark network device link as being unblocked
  182. *
  183. * @v netdev Network device
  184. */
  185. void netdev_link_unblock ( struct net_device *netdev ) {
  186. /* Stop link block timer */
  187. if ( netdev_link_blocked ( netdev ) )
  188. DBGC ( netdev, "NETDEV %s link unblocked\n", netdev->name );
  189. stop_timer ( &netdev->link_block );
  190. }
  191. /**
  192. * Handle network device link block timer expiry
  193. *
  194. * @v timer Link block timer
  195. * @v fail Failure indicator
  196. */
  197. static void netdev_link_block_expired ( struct retry_timer *timer,
  198. int fail __unused ) {
  199. struct net_device *netdev =
  200. container_of ( timer, struct net_device, link_block );
  201. /* Assume link is no longer blocked */
  202. DBGC ( netdev, "NETDEV %s link block expired\n", netdev->name );
  203. }
  204. /**
  205. * Record network device statistic
  206. *
  207. * @v stats Network device statistics
  208. * @v rc Status code
  209. */
  210. static void netdev_record_stat ( struct net_device_stats *stats, int rc ) {
  211. struct net_device_error *error;
  212. struct net_device_error *least_common_error;
  213. unsigned int i;
  214. /* If this is not an error, just update the good counter */
  215. if ( rc == 0 ) {
  216. stats->good++;
  217. return;
  218. }
  219. /* Update the bad counter */
  220. stats->bad++;
  221. /* Locate the appropriate error record */
  222. least_common_error = &stats->errors[0];
  223. for ( i = 0 ; i < ( sizeof ( stats->errors ) /
  224. sizeof ( stats->errors[0] ) ) ; i++ ) {
  225. error = &stats->errors[i];
  226. /* Update matching record, if found */
  227. if ( error->rc == rc ) {
  228. error->count++;
  229. return;
  230. }
  231. if ( error->count < least_common_error->count )
  232. least_common_error = error;
  233. }
  234. /* Overwrite the least common error record */
  235. least_common_error->rc = rc;
  236. least_common_error->count = 1;
  237. }
  238. /**
  239. * Transmit raw packet via network device
  240. *
  241. * @v netdev Network device
  242. * @v iobuf I/O buffer
  243. * @ret rc Return status code
  244. *
  245. * Transmits the packet via the specified network device. This
  246. * function takes ownership of the I/O buffer.
  247. */
  248. int netdev_tx ( struct net_device *netdev, struct io_buffer *iobuf ) {
  249. int rc;
  250. DBGC2 ( netdev, "NETDEV %s transmitting %p (%p+%zx)\n",
  251. netdev->name, iobuf, iobuf->data, iob_len ( iobuf ) );
  252. profile_start ( &net_tx_profiler );
  253. /* Enqueue packet */
  254. list_add_tail ( &iobuf->list, &netdev->tx_queue );
  255. /* Avoid calling transmit() on unopened network devices */
  256. if ( ! netdev_is_open ( netdev ) ) {
  257. rc = -ENETUNREACH;
  258. goto err;
  259. }
  260. /* Discard packet (for test purposes) if applicable */
  261. if ( ( rc = inject_fault ( NETDEV_DISCARD_RATE ) ) != 0 )
  262. goto err;
  263. /* Transmit packet */
  264. if ( ( rc = netdev->op->transmit ( netdev, iobuf ) ) != 0 )
  265. goto err;
  266. profile_stop ( &net_tx_profiler );
  267. return 0;
  268. err:
  269. netdev_tx_complete_err ( netdev, iobuf, rc );
  270. return rc;
  271. }
  272. /**
  273. * Defer transmitted packet
  274. *
  275. * @v netdev Network device
  276. * @v iobuf I/O buffer
  277. *
  278. * Drivers may call netdev_tx_defer() if there is insufficient space
  279. * in the transmit descriptor ring. Any packets deferred in this way
  280. * will be automatically retransmitted as soon as space becomes
  281. * available (i.e. as soon as the driver calls netdev_tx_complete()).
  282. *
  283. * The packet must currently be in the network device's TX queue.
  284. *
  285. * Drivers utilising netdev_tx_defer() must ensure that space in the
  286. * transmit descriptor ring is freed up @b before calling
  287. * netdev_tx_complete(). For example, if the ring is modelled using a
  288. * producer counter and a consumer counter, then the consumer counter
  289. * must be incremented before the call to netdev_tx_complete().
  290. * Failure to do this will cause the retransmitted packet to be
  291. * immediately redeferred (which will result in out-of-order
  292. * transmissions and other nastiness).
  293. */
  294. void netdev_tx_defer ( struct net_device *netdev, struct io_buffer *iobuf ) {
  295. /* Catch data corruption as early as possible */
  296. list_check_contains_entry ( iobuf, &netdev->tx_queue, list );
  297. /* Remove from transmit queue */
  298. list_del ( &iobuf->list );
  299. /* Add to deferred transmit queue */
  300. list_add_tail ( &iobuf->list, &netdev->tx_deferred );
  301. /* Record "out of space" statistic */
  302. netdev_tx_err ( netdev, NULL, -ENOBUFS );
  303. }
  304. /**
  305. * Discard transmitted packet
  306. *
  307. * @v netdev Network device
  308. * @v iobuf I/O buffer, or NULL
  309. * @v rc Packet status code
  310. *
  311. * The packet is discarded and a TX error is recorded. This function
  312. * takes ownership of the I/O buffer.
  313. */
  314. void netdev_tx_err ( struct net_device *netdev,
  315. struct io_buffer *iobuf, int rc ) {
  316. /* Update statistics counter */
  317. netdev_record_stat ( &netdev->tx_stats, rc );
  318. if ( rc == 0 ) {
  319. DBGC2 ( netdev, "NETDEV %s transmission %p complete\n",
  320. netdev->name, iobuf );
  321. } else {
  322. DBGC ( netdev, "NETDEV %s transmission %p failed: %s\n",
  323. netdev->name, iobuf, strerror ( rc ) );
  324. }
  325. /* Discard packet */
  326. free_iob ( iobuf );
  327. }
  328. /**
  329. * Complete network transmission
  330. *
  331. * @v netdev Network device
  332. * @v iobuf I/O buffer
  333. * @v rc Packet status code
  334. *
  335. * The packet must currently be in the network device's TX queue.
  336. */
  337. void netdev_tx_complete_err ( struct net_device *netdev,
  338. struct io_buffer *iobuf, int rc ) {
  339. /* Catch data corruption as early as possible */
  340. list_check_contains_entry ( iobuf, &netdev->tx_queue, list );
  341. /* Dequeue and free I/O buffer */
  342. list_del ( &iobuf->list );
  343. netdev_tx_err ( netdev, iobuf, rc );
  344. /* Transmit first pending packet, if any */
  345. if ( ( iobuf = list_first_entry ( &netdev->tx_deferred,
  346. struct io_buffer, list ) ) != NULL ) {
  347. list_del ( &iobuf->list );
  348. netdev_tx ( netdev, iobuf );
  349. }
  350. }
  351. /**
  352. * Complete network transmission
  353. *
  354. * @v netdev Network device
  355. * @v rc Packet status code
  356. *
  357. * Completes the oldest outstanding packet in the TX queue.
  358. */
  359. void netdev_tx_complete_next_err ( struct net_device *netdev, int rc ) {
  360. struct io_buffer *iobuf;
  361. if ( ( iobuf = list_first_entry ( &netdev->tx_queue, struct io_buffer,
  362. list ) ) != NULL ) {
  363. netdev_tx_complete_err ( netdev, iobuf, rc );
  364. }
  365. }
  366. /**
  367. * Flush device's transmit queue
  368. *
  369. * @v netdev Network device
  370. */
  371. static void netdev_tx_flush ( struct net_device *netdev ) {
  372. /* Discard any packets in the TX queue. This will also cause
  373. * any packets in the deferred TX queue to be discarded
  374. * automatically.
  375. */
  376. while ( ! list_empty ( &netdev->tx_queue ) ) {
  377. netdev_tx_complete_next_err ( netdev, -ECANCELED );
  378. }
  379. assert ( list_empty ( &netdev->tx_queue ) );
  380. assert ( list_empty ( &netdev->tx_deferred ) );
  381. }
  382. /**
  383. * Add packet to receive queue
  384. *
  385. * @v netdev Network device
  386. * @v iobuf I/O buffer, or NULL
  387. *
  388. * The packet is added to the network device's RX queue. This
  389. * function takes ownership of the I/O buffer.
  390. */
  391. void netdev_rx ( struct net_device *netdev, struct io_buffer *iobuf ) {
  392. int rc;
  393. DBGC2 ( netdev, "NETDEV %s received %p (%p+%zx)\n",
  394. netdev->name, iobuf, iobuf->data, iob_len ( iobuf ) );
  395. /* Discard packet (for test purposes) if applicable */
  396. if ( ( rc = inject_fault ( NETDEV_DISCARD_RATE ) ) != 0 ) {
  397. netdev_rx_err ( netdev, iobuf, rc );
  398. return;
  399. }
  400. /* Enqueue packet */
  401. list_add_tail ( &iobuf->list, &netdev->rx_queue );
  402. /* Update statistics counter */
  403. netdev_record_stat ( &netdev->rx_stats, 0 );
  404. }
  405. /**
  406. * Discard received packet
  407. *
  408. * @v netdev Network device
  409. * @v iobuf I/O buffer, or NULL
  410. * @v rc Packet status code
  411. *
  412. * The packet is discarded and an RX error is recorded. This function
  413. * takes ownership of the I/O buffer. @c iobuf may be NULL if, for
  414. * example, the net device wishes to report an error due to being
  415. * unable to allocate an I/O buffer.
  416. */
  417. void netdev_rx_err ( struct net_device *netdev,
  418. struct io_buffer *iobuf, int rc ) {
  419. DBGC ( netdev, "NETDEV %s failed to receive %p: %s\n",
  420. netdev->name, iobuf, strerror ( rc ) );
  421. /* Discard packet */
  422. free_iob ( iobuf );
  423. /* Update statistics counter */
  424. netdev_record_stat ( &netdev->rx_stats, rc );
  425. }
  426. /**
  427. * Poll for completed and received packets on network device
  428. *
  429. * @v netdev Network device
  430. *
  431. * Polls the network device for completed transmissions and received
  432. * packets. Any received packets will be added to the RX packet queue
  433. * via netdev_rx().
  434. */
  435. void netdev_poll ( struct net_device *netdev ) {
  436. if ( netdev_is_open ( netdev ) )
  437. netdev->op->poll ( netdev );
  438. }
  439. /**
  440. * Remove packet from device's receive queue
  441. *
  442. * @v netdev Network device
  443. * @ret iobuf I/O buffer, or NULL
  444. *
  445. * Removes the first packet from the device's RX queue and returns it.
  446. * Ownership of the packet is transferred to the caller.
  447. */
  448. struct io_buffer * netdev_rx_dequeue ( struct net_device *netdev ) {
  449. struct io_buffer *iobuf;
  450. iobuf = list_first_entry ( &netdev->rx_queue, struct io_buffer, list );
  451. if ( ! iobuf )
  452. return NULL;
  453. list_del ( &iobuf->list );
  454. return iobuf;
  455. }
  456. /**
  457. * Flush device's receive queue
  458. *
  459. * @v netdev Network device
  460. */
  461. static void netdev_rx_flush ( struct net_device *netdev ) {
  462. struct io_buffer *iobuf;
  463. /* Discard any packets in the RX queue */
  464. while ( ( iobuf = netdev_rx_dequeue ( netdev ) ) ) {
  465. netdev_rx_err ( netdev, iobuf, -ECANCELED );
  466. }
  467. }
  468. /**
  469. * Finish network device configuration
  470. *
  471. * @v config Network device configuration
  472. * @v rc Reason for completion
  473. */
  474. static void netdev_config_close ( struct net_device_configuration *config,
  475. int rc ) {
  476. struct net_device_configurator *configurator = config->configurator;
  477. struct net_device *netdev = config->netdev;
  478. /* Restart interface */
  479. intf_restart ( &config->job, rc );
  480. /* Record configuration result */
  481. config->rc = rc;
  482. if ( rc == 0 ) {
  483. DBGC ( netdev, "NETDEV %s configured via %s\n",
  484. netdev->name, configurator->name );
  485. } else {
  486. DBGC ( netdev, "NETDEV %s configuration via %s failed: %s\n",
  487. netdev->name, configurator->name, strerror ( rc ) );
  488. }
  489. }
  490. /** Network device configuration interface operations */
  491. static struct interface_operation netdev_config_ops[] = {
  492. INTF_OP ( intf_close, struct net_device_configuration *,
  493. netdev_config_close ),
  494. };
  495. /** Network device configuration interface descriptor */
  496. static struct interface_descriptor netdev_config_desc =
  497. INTF_DESC ( struct net_device_configuration, job, netdev_config_ops );
  498. /**
  499. * Free network device
  500. *
  501. * @v refcnt Network device reference counter
  502. */
  503. static void free_netdev ( struct refcnt *refcnt ) {
  504. struct net_device *netdev =
  505. container_of ( refcnt, struct net_device, refcnt );
  506. stop_timer ( &netdev->link_block );
  507. netdev_tx_flush ( netdev );
  508. netdev_rx_flush ( netdev );
  509. clear_settings ( netdev_settings ( netdev ) );
  510. free ( netdev );
  511. }
  512. /**
  513. * Allocate network device
  514. *
  515. * @v priv_len Length of private data area (net_device::priv)
  516. * @ret netdev Network device, or NULL
  517. *
  518. * Allocates space for a network device and its private data area.
  519. */
  520. struct net_device * alloc_netdev ( size_t priv_len ) {
  521. struct net_device *netdev;
  522. struct net_device_configurator *configurator;
  523. struct net_device_configuration *config;
  524. unsigned int num_configs;
  525. size_t confs_len;
  526. size_t total_len;
  527. num_configs = table_num_entries ( NET_DEVICE_CONFIGURATORS );
  528. confs_len = ( num_configs * sizeof ( netdev->configs[0] ) );
  529. total_len = ( sizeof ( *netdev ) + confs_len + priv_len );
  530. netdev = zalloc ( total_len );
  531. if ( netdev ) {
  532. ref_init ( &netdev->refcnt, free_netdev );
  533. netdev->link_rc = -EUNKNOWN_LINK_STATUS;
  534. timer_init ( &netdev->link_block, netdev_link_block_expired,
  535. &netdev->refcnt );
  536. INIT_LIST_HEAD ( &netdev->tx_queue );
  537. INIT_LIST_HEAD ( &netdev->tx_deferred );
  538. INIT_LIST_HEAD ( &netdev->rx_queue );
  539. netdev_settings_init ( netdev );
  540. config = netdev->configs;
  541. for_each_table_entry ( configurator, NET_DEVICE_CONFIGURATORS ){
  542. config->netdev = netdev;
  543. config->configurator = configurator;
  544. config->rc = -EUNUSED_CONFIG;
  545. intf_init ( &config->job, &netdev_config_desc,
  546. &netdev->refcnt );
  547. config++;
  548. }
  549. netdev->priv = ( ( ( void * ) netdev ) + sizeof ( *netdev ) +
  550. confs_len );
  551. }
  552. return netdev;
  553. }
  554. /**
  555. * Register network device
  556. *
  557. * @v netdev Network device
  558. * @ret rc Return status code
  559. *
  560. * Gives the network device a name and adds it to the list of network
  561. * devices.
  562. */
  563. int register_netdev ( struct net_device *netdev ) {
  564. struct ll_protocol *ll_protocol = netdev->ll_protocol;
  565. struct net_driver *driver;
  566. struct net_device *duplicate;
  567. uint32_t seed;
  568. int rc;
  569. /* Set initial link-layer address, if not already set */
  570. if ( ! netdev_has_ll_addr ( netdev ) ) {
  571. ll_protocol->init_addr ( netdev->hw_addr, netdev->ll_addr );
  572. }
  573. /* Set MTU, if not already set */
  574. if ( ! netdev->mtu ) {
  575. netdev->mtu = ( netdev->max_pkt_len -
  576. ll_protocol->ll_header_len );
  577. }
  578. /* Reject network devices that are already available via a
  579. * different hardware device.
  580. */
  581. duplicate = find_netdev_by_ll_addr ( ll_protocol, netdev->ll_addr );
  582. if ( duplicate && ( duplicate->dev != netdev->dev ) ) {
  583. DBGC ( netdev, "NETDEV rejecting duplicate (phys %s) of %s "
  584. "(phys %s)\n", netdev->dev->name, duplicate->name,
  585. duplicate->dev->name );
  586. rc = -EEXIST;
  587. goto err_duplicate;
  588. }
  589. /* Reject named network devices that already exist */
  590. if ( netdev->name[0] && ( duplicate = find_netdev ( netdev->name ) ) ) {
  591. DBGC ( netdev, "NETDEV rejecting duplicate name %s\n",
  592. duplicate->name );
  593. rc = -EEXIST;
  594. goto err_duplicate;
  595. }
  596. /* Record device index and create device name */
  597. if ( netdev->name[0] == '\0' ) {
  598. snprintf ( netdev->name, sizeof ( netdev->name ), "net%d",
  599. netdev_index );
  600. }
  601. netdev->index = ++netdev_index;
  602. /* Use least significant bits of the link-layer address to
  603. * improve the randomness of the (non-cryptographic) random
  604. * number generator.
  605. */
  606. memcpy ( &seed, ( netdev->ll_addr + ll_protocol->ll_addr_len
  607. - sizeof ( seed ) ), sizeof ( seed ) );
  608. srand ( rand() ^ seed );
  609. /* Add to device list */
  610. netdev_get ( netdev );
  611. list_add_tail ( &netdev->list, &net_devices );
  612. DBGC ( netdev, "NETDEV %s registered (phys %s hwaddr %s)\n",
  613. netdev->name, netdev->dev->name,
  614. netdev_addr ( netdev ) );
  615. /* Register per-netdev configuration settings */
  616. if ( ( rc = register_settings ( netdev_settings ( netdev ),
  617. NULL, netdev->name ) ) != 0 ) {
  618. DBGC ( netdev, "NETDEV %s could not register settings: %s\n",
  619. netdev->name, strerror ( rc ) );
  620. goto err_register_settings;
  621. }
  622. /* Probe device */
  623. for_each_table_entry ( driver, NET_DRIVERS ) {
  624. if ( driver->probe && ( rc = driver->probe ( netdev ) ) != 0 ) {
  625. DBGC ( netdev, "NETDEV %s could not add %s device: "
  626. "%s\n", netdev->name, driver->name,
  627. strerror ( rc ) );
  628. goto err_probe;
  629. }
  630. }
  631. return 0;
  632. err_probe:
  633. for_each_table_entry_continue_reverse ( driver, NET_DRIVERS ) {
  634. if ( driver->remove )
  635. driver->remove ( netdev );
  636. }
  637. clear_settings ( netdev_settings ( netdev ) );
  638. unregister_settings ( netdev_settings ( netdev ) );
  639. err_register_settings:
  640. list_del ( &netdev->list );
  641. netdev_put ( netdev );
  642. err_duplicate:
  643. return rc;
  644. }
  645. /**
  646. * Open network device
  647. *
  648. * @v netdev Network device
  649. * @ret rc Return status code
  650. */
  651. int netdev_open ( struct net_device *netdev ) {
  652. int rc;
  653. /* Do nothing if device is already open */
  654. if ( netdev->state & NETDEV_OPEN )
  655. return 0;
  656. DBGC ( netdev, "NETDEV %s opening\n", netdev->name );
  657. /* Mark as opened */
  658. netdev->state |= NETDEV_OPEN;
  659. /* Open the device */
  660. if ( ( rc = netdev->op->open ( netdev ) ) != 0 )
  661. goto err;
  662. /* Add to head of open devices list */
  663. list_add ( &netdev->open_list, &open_net_devices );
  664. /* Notify drivers of device state change */
  665. netdev_notify ( netdev );
  666. return 0;
  667. err:
  668. netdev->state &= ~NETDEV_OPEN;
  669. return rc;
  670. }
  671. /**
  672. * Close network device
  673. *
  674. * @v netdev Network device
  675. */
  676. void netdev_close ( struct net_device *netdev ) {
  677. unsigned int num_configs;
  678. unsigned int i;
  679. /* Do nothing if device is already closed */
  680. if ( ! ( netdev->state & NETDEV_OPEN ) )
  681. return;
  682. DBGC ( netdev, "NETDEV %s closing\n", netdev->name );
  683. /* Terminate any ongoing configurations. Use intf_close()
  684. * rather than intf_restart() to allow the cancellation to be
  685. * reported back to us if a configuration is actually in
  686. * progress.
  687. */
  688. num_configs = table_num_entries ( NET_DEVICE_CONFIGURATORS );
  689. for ( i = 0 ; i < num_configs ; i++ )
  690. intf_close ( &netdev->configs[i].job, -ECANCELED );
  691. /* Remove from open devices list */
  692. list_del ( &netdev->open_list );
  693. /* Mark as closed */
  694. netdev->state &= ~NETDEV_OPEN;
  695. /* Notify drivers of device state change */
  696. netdev_notify ( netdev );
  697. /* Close the device */
  698. netdev->op->close ( netdev );
  699. /* Flush TX and RX queues */
  700. netdev_tx_flush ( netdev );
  701. netdev_rx_flush ( netdev );
  702. }
  703. /**
  704. * Unregister network device
  705. *
  706. * @v netdev Network device
  707. *
  708. * Removes the network device from the list of network devices.
  709. */
  710. void unregister_netdev ( struct net_device *netdev ) {
  711. struct net_driver *driver;
  712. /* Ensure device is closed */
  713. netdev_close ( netdev );
  714. /* Remove device */
  715. for_each_table_entry_reverse ( driver, NET_DRIVERS ) {
  716. if ( driver->remove )
  717. driver->remove ( netdev );
  718. }
  719. /* Unregister per-netdev configuration settings */
  720. clear_settings ( netdev_settings ( netdev ) );
  721. unregister_settings ( netdev_settings ( netdev ) );
  722. /* Remove from device list */
  723. DBGC ( netdev, "NETDEV %s unregistered\n", netdev->name );
  724. list_del ( &netdev->list );
  725. netdev_put ( netdev );
  726. /* Reset network device index if no devices remain */
  727. if ( list_empty ( &net_devices ) )
  728. netdev_index = 0;
  729. }
  730. /** Enable or disable interrupts
  731. *
  732. * @v netdev Network device
  733. * @v enable Interrupts should be enabled
  734. */
  735. void netdev_irq ( struct net_device *netdev, int enable ) {
  736. /* Do nothing if device does not support interrupts */
  737. if ( ! netdev_irq_supported ( netdev ) )
  738. return;
  739. /* Enable or disable device interrupts */
  740. netdev->op->irq ( netdev, enable );
  741. /* Record interrupt enabled state */
  742. netdev->state &= ~NETDEV_IRQ_ENABLED;
  743. if ( enable )
  744. netdev->state |= NETDEV_IRQ_ENABLED;
  745. }
  746. /**
  747. * Get network device by name
  748. *
  749. * @v name Network device name
  750. * @ret netdev Network device, or NULL
  751. */
  752. struct net_device * find_netdev ( const char *name ) {
  753. struct net_device *netdev;
  754. /* Allow "netX" shortcut */
  755. if ( strcmp ( name, "netX" ) == 0 )
  756. return last_opened_netdev();
  757. /* Identify network device by name */
  758. list_for_each_entry ( netdev, &net_devices, list ) {
  759. if ( strcmp ( netdev->name, name ) == 0 )
  760. return netdev;
  761. }
  762. return NULL;
  763. }
  764. /**
  765. * Get network device by index
  766. *
  767. * @v index Network device index
  768. * @ret netdev Network device, or NULL
  769. */
  770. struct net_device * find_netdev_by_index ( unsigned int index ) {
  771. struct net_device *netdev;
  772. /* Identify network device by index */
  773. list_for_each_entry ( netdev, &net_devices, list ) {
  774. if ( netdev->index == index )
  775. return netdev;
  776. }
  777. return NULL;
  778. }
  779. /**
  780. * Get network device by PCI bus:dev.fn address
  781. *
  782. * @v bus_type Bus type
  783. * @v location Bus location
  784. * @ret netdev Network device, or NULL
  785. */
  786. struct net_device * find_netdev_by_location ( unsigned int bus_type,
  787. unsigned int location ) {
  788. struct net_device *netdev;
  789. list_for_each_entry ( netdev, &net_devices, list ) {
  790. if ( ( netdev->dev->desc.bus_type == bus_type ) &&
  791. ( netdev->dev->desc.location == location ) )
  792. return netdev;
  793. }
  794. return NULL;
  795. }
  796. /**
  797. * Get network device by link-layer address
  798. *
  799. * @v ll_protocol Link-layer protocol
  800. * @v ll_addr Link-layer address
  801. * @ret netdev Network device, or NULL
  802. */
  803. struct net_device * find_netdev_by_ll_addr ( struct ll_protocol *ll_protocol,
  804. const void *ll_addr ) {
  805. struct net_device *netdev;
  806. list_for_each_entry ( netdev, &net_devices, list ) {
  807. if ( ( netdev->ll_protocol == ll_protocol ) &&
  808. ( memcmp ( netdev->ll_addr, ll_addr,
  809. ll_protocol->ll_addr_len ) == 0 ) )
  810. return netdev;
  811. }
  812. return NULL;
  813. }
  814. /**
  815. * Get most recently opened network device
  816. *
  817. * @ret netdev Most recently opened network device, or NULL
  818. */
  819. struct net_device * last_opened_netdev ( void ) {
  820. struct net_device *netdev;
  821. netdev = list_first_entry ( &open_net_devices, struct net_device,
  822. open_list );
  823. if ( ! netdev )
  824. return NULL;
  825. assert ( netdev_is_open ( netdev ) );
  826. return netdev;
  827. }
  828. /**
  829. * Transmit network-layer packet
  830. *
  831. * @v iobuf I/O buffer
  832. * @v netdev Network device
  833. * @v net_protocol Network-layer protocol
  834. * @v ll_dest Destination link-layer address
  835. * @v ll_source Source link-layer address
  836. * @ret rc Return status code
  837. *
  838. * Prepends link-layer headers to the I/O buffer and transmits the
  839. * packet via the specified network device. This function takes
  840. * ownership of the I/O buffer.
  841. */
  842. int net_tx ( struct io_buffer *iobuf, struct net_device *netdev,
  843. struct net_protocol *net_protocol, const void *ll_dest,
  844. const void *ll_source ) {
  845. struct ll_protocol *ll_protocol = netdev->ll_protocol;
  846. int rc;
  847. /* Add link-layer header */
  848. if ( ( rc = ll_protocol->push ( netdev, iobuf, ll_dest, ll_source,
  849. net_protocol->net_proto ) ) != 0 ) {
  850. /* Record error for diagnosis */
  851. netdev_tx_err ( netdev, iobuf, rc );
  852. return rc;
  853. }
  854. /* Transmit packet */
  855. return netdev_tx ( netdev, iobuf );
  856. }
  857. /**
  858. * Process received network-layer packet
  859. *
  860. * @v iobuf I/O buffer
  861. * @v netdev Network device
  862. * @v net_proto Network-layer protocol, in network-byte order
  863. * @v ll_dest Destination link-layer address
  864. * @v ll_source Source link-layer address
  865. * @v flags Packet flags
  866. * @ret rc Return status code
  867. */
  868. int net_rx ( struct io_buffer *iobuf, struct net_device *netdev,
  869. uint16_t net_proto, const void *ll_dest, const void *ll_source,
  870. unsigned int flags ) {
  871. struct net_protocol *net_protocol;
  872. /* Hand off to network-layer protocol, if any */
  873. for_each_table_entry ( net_protocol, NET_PROTOCOLS ) {
  874. if ( net_protocol->net_proto == net_proto )
  875. return net_protocol->rx ( iobuf, netdev, ll_dest,
  876. ll_source, flags );
  877. }
  878. DBGC ( netdev, "NETDEV %s unknown network protocol %04x\n",
  879. netdev->name, ntohs ( net_proto ) );
  880. free_iob ( iobuf );
  881. return -ENOTSUP;
  882. }
  883. /**
  884. * Poll the network stack
  885. *
  886. * This polls all interfaces for received packets, and processes
  887. * packets from the RX queue.
  888. */
  889. void net_poll ( void ) {
  890. struct net_device *netdev;
  891. struct io_buffer *iobuf;
  892. struct ll_protocol *ll_protocol;
  893. const void *ll_dest;
  894. const void *ll_source;
  895. uint16_t net_proto;
  896. unsigned int flags;
  897. int rc;
  898. /* Poll and process each network device */
  899. list_for_each_entry ( netdev, &net_devices, list ) {
  900. /* Poll for new packets */
  901. profile_start ( &net_poll_profiler );
  902. netdev_poll ( netdev );
  903. profile_stop ( &net_poll_profiler );
  904. /* Leave received packets on the queue if receive
  905. * queue processing is currently frozen. This will
  906. * happen when the raw packets are to be manually
  907. * dequeued using netdev_rx_dequeue(), rather than
  908. * processed via the usual networking stack.
  909. */
  910. if ( netdev_rx_frozen ( netdev ) )
  911. continue;
  912. /* Process all received packets */
  913. while ( ( iobuf = netdev_rx_dequeue ( netdev ) ) ) {
  914. DBGC2 ( netdev, "NETDEV %s processing %p (%p+%zx)\n",
  915. netdev->name, iobuf, iobuf->data,
  916. iob_len ( iobuf ) );
  917. profile_start ( &net_rx_profiler );
  918. /* Remove link-layer header */
  919. ll_protocol = netdev->ll_protocol;
  920. if ( ( rc = ll_protocol->pull ( netdev, iobuf,
  921. &ll_dest, &ll_source,
  922. &net_proto,
  923. &flags ) ) != 0 ) {
  924. free_iob ( iobuf );
  925. continue;
  926. }
  927. /* Hand packet to network layer */
  928. if ( ( rc = net_rx ( iob_disown ( iobuf ), netdev,
  929. net_proto, ll_dest,
  930. ll_source, flags ) ) != 0 ) {
  931. /* Record error for diagnosis */
  932. netdev_rx_err ( netdev, NULL, rc );
  933. }
  934. profile_stop ( &net_rx_profiler );
  935. }
  936. }
  937. }
  938. /**
  939. * Single-step the network stack
  940. *
  941. * @v process Network stack process
  942. */
  943. static void net_step ( struct process *process __unused ) {
  944. net_poll();
  945. }
  946. /**
  947. * Get the VLAN tag (when VLAN support is not present)
  948. *
  949. * @v netdev Network device
  950. * @ret tag 0, indicating that device is not a VLAN device
  951. */
  952. __weak unsigned int vlan_tag ( struct net_device *netdev __unused ) {
  953. return 0;
  954. }
  955. /**
  956. * Identify VLAN device (when VLAN support is not present)
  957. *
  958. * @v trunk Trunk network device
  959. * @v tag VLAN tag
  960. * @ret netdev VLAN device, if any
  961. */
  962. __weak struct net_device * vlan_find ( struct net_device *trunk __unused,
  963. unsigned int tag __unused ) {
  964. return NULL;
  965. }
  /** Networking stack process
   *
   * Registers net_step() as the step function of a permanent process
   * named net_process.
   */
  PERMANENT_PROCESS ( net_process, net_step );
  968. /**
  969. * Discard some cached network device data
  970. *
  971. * @ret discarded Number of cached items discarded
  972. */
  973. static unsigned int net_discard ( void ) {
  974. struct net_device *netdev;
  975. struct io_buffer *iobuf;
  976. unsigned int discarded = 0;
  977. /* Try to drop one deferred TX packet from each network device */
  978. for_each_netdev ( netdev ) {
  979. if ( ( iobuf = list_first_entry ( &netdev->tx_deferred,
  980. struct io_buffer,
  981. list ) ) != NULL ) {
  982. /* Discard first deferred packet */
  983. list_del ( &iobuf->list );
  984. free_iob ( iobuf );
  985. /* Report discard */
  986. discarded++;
  987. }
  988. }
  989. return discarded;
  990. }
  991. /** Network device cache discarder */
  992. struct cache_discarder net_discarder __cache_discarder ( CACHE_NORMAL ) = {
  993. .discard = net_discard,
  994. };
  995. /**
  996. * Find network device configurator
  997. *
  998. * @v name Name
  999. * @ret configurator Network device configurator, or NULL
  1000. */
  1001. struct net_device_configurator * find_netdev_configurator ( const char *name ) {
  1002. struct net_device_configurator *configurator;
  1003. for_each_table_entry ( configurator, NET_DEVICE_CONFIGURATORS ) {
  1004. if ( strcmp ( configurator->name, name ) == 0 )
  1005. return configurator;
  1006. }
  1007. return NULL;
  1008. }
  1009. /**
  1010. * Start network device configuration
  1011. *
  1012. * @v netdev Network device
  1013. * @v configurator Network device configurator
  1014. * @ret rc Return status code
  1015. */
  1016. int netdev_configure ( struct net_device *netdev,
  1017. struct net_device_configurator *configurator ) {
  1018. struct net_device_configuration *config =
  1019. netdev_configuration ( netdev, configurator );
  1020. int rc;
  1021. /* Check applicability of configurator */
  1022. if ( ! netdev_configurator_applies ( netdev, configurator ) ) {
  1023. DBGC ( netdev, "NETDEV %s does not support configuration via "
  1024. "%s\n", netdev->name, configurator->name );
  1025. return -ENOTSUP;
  1026. }
  1027. /* Terminate any ongoing configuration */
  1028. intf_restart ( &config->job, -ECANCELED );
  1029. /* Mark configuration as being in progress */
  1030. config->rc = -EINPROGRESS_CONFIG;
  1031. DBGC ( netdev, "NETDEV %s starting configuration via %s\n",
  1032. netdev->name, configurator->name );
  1033. /* Start configuration */
  1034. if ( ( rc = configurator->start ( &config->job, netdev ) ) != 0 ) {
  1035. DBGC ( netdev, "NETDEV %s could not start configuration via "
  1036. "%s: %s\n", netdev->name, configurator->name,
  1037. strerror ( rc ) );
  1038. config->rc = rc;
  1039. return rc;
  1040. }
  1041. return 0;
  1042. }
  1043. /**
  1044. * Start network device configuration via all supported configurators
  1045. *
  1046. * @v netdev Network device
  1047. * @ret rc Return status code
  1048. */
  1049. int netdev_configure_all ( struct net_device *netdev ) {
  1050. struct net_device_configurator *configurator;
  1051. int rc;
  1052. /* Start configuration for each configurator */
  1053. for_each_table_entry ( configurator, NET_DEVICE_CONFIGURATORS ) {
  1054. /* Skip any inapplicable configurators */
  1055. if ( ! netdev_configurator_applies ( netdev, configurator ) )
  1056. continue;
  1057. /* Start configuration */
  1058. if ( ( rc = netdev_configure ( netdev, configurator ) ) != 0 )
  1059. return rc;
  1060. }
  1061. return 0;
  1062. }
  1063. /**
  1064. * Check if network device has a configuration with a specified status code
  1065. *
  1066. * @v netdev Network device
  1067. * @v rc Status code
  1068. * @ret has_rc Network device has a configuration with this status code
  1069. */
  1070. static int netdev_has_configuration_rc ( struct net_device *netdev, int rc ) {
  1071. unsigned int num_configs;
  1072. unsigned int i;
  1073. num_configs = table_num_entries ( NET_DEVICE_CONFIGURATORS );
  1074. for ( i = 0 ; i < num_configs ; i++ ) {
  1075. if ( netdev->configs[i].rc == rc )
  1076. return 1;
  1077. }
  1078. return 0;
  1079. }
  1080. /**
  1081. * Check if network device configuration is in progress
  1082. *
  1083. * @v netdev Network device
  1084. * @ret is_in_progress Network device configuration is in progress
  1085. */
  1086. int netdev_configuration_in_progress ( struct net_device *netdev ) {
  1087. return netdev_has_configuration_rc ( netdev, -EINPROGRESS_CONFIG );
  1088. }
  /**
   * Check if network device has at least one successful configuration
   *
   * @v netdev		Network device
   * @ret is_ok		Network device has at least one successful configuration
   *
   * True when at least one of the device's configurations currently
   * holds the status code 0.
   */
  int netdev_configuration_ok ( struct net_device *netdev ) {
      int is_ok;

      /* A status code of zero marks a successful configuration */
      is_ok = netdev_has_configuration_rc ( netdev, 0 );
      return is_ok;
  }