You cannot select more than 25 topics. Topics must start with a letter or number, can include dashes ('-'), and can be up to 35 characters long.

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241242243244245246247248249250251252253254255256257258259260261262263264265266267268269
  1. /*
  2. * Copyright (C) 2012 Michael Brown <mbrown@fensystems.co.uk>.
  3. *
  4. * This program is free software; you can redistribute it and/or
  5. * modify it under the terms of the GNU General Public License as
  6. * published by the Free Software Foundation; either version 2 of the
  7. * License, or (at your option) any later version.
  8. *
  9. * This program is distributed in the hope that it will be useful, but
  10. * WITHOUT ANY WARRANTY; without even the implied warranty of
  11. * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU
  12. * General Public License for more details.
  13. *
  14. * You should have received a copy of the GNU General Public License
  15. * along with this program; if not, write to the Free Software
  16. * Foundation, Inc., 51 Franklin Street, Fifth Floor, Boston, MA
  17. * 02110-1301, USA.
  18. */
  19. FILE_LICENCE ( GPL2_OR_LATER );
  20. /** @file
  21. *
  22. * memcpy() self-tests
  23. *
  24. */
  25. /* Forcibly enable assertions */
  26. #undef NDEBUG
  27. #include <stdint.h>
  28. #include <stdlib.h>
  29. #include <string.h>
  30. #include <ipxe/test.h>
  31. #include <ipxe/profile.h>
  /** How many timed memcpy() calls are sampled in each profiling run */
  #define PROFILE_COUNT 16
  /*
   * Emit one global wrapper per constant copy length from 0 to 31 bytes,
   * so that the code generated for each fixed-length memcpy() can be
   * inspected.  MEMCPY_FIXED ( n ) defines memcpy_n ( dest, src ).
   */
  #define MEMCPY_FIXED( length )                                          \
      void memcpy_ ## length ( void *dest, void *src ) {                  \
          memcpy ( dest, src, length );                                   \
      }
  MEMCPY_FIXED ( 0 )
  MEMCPY_FIXED ( 1 )
  MEMCPY_FIXED ( 2 )
  MEMCPY_FIXED ( 3 )
  MEMCPY_FIXED ( 4 )
  MEMCPY_FIXED ( 5 )
  MEMCPY_FIXED ( 6 )
  MEMCPY_FIXED ( 7 )
  MEMCPY_FIXED ( 8 )
  MEMCPY_FIXED ( 9 )
  MEMCPY_FIXED ( 10 )
  MEMCPY_FIXED ( 11 )
  MEMCPY_FIXED ( 12 )
  MEMCPY_FIXED ( 13 )
  MEMCPY_FIXED ( 14 )
  MEMCPY_FIXED ( 15 )
  MEMCPY_FIXED ( 16 )
  MEMCPY_FIXED ( 17 )
  MEMCPY_FIXED ( 18 )
  MEMCPY_FIXED ( 19 )
  MEMCPY_FIXED ( 20 )
  MEMCPY_FIXED ( 21 )
  MEMCPY_FIXED ( 22 )
  MEMCPY_FIXED ( 23 )
  MEMCPY_FIXED ( 24 )
  MEMCPY_FIXED ( 25 )
  MEMCPY_FIXED ( 26 )
  MEMCPY_FIXED ( 27 )
  MEMCPY_FIXED ( 28 )
  MEMCPY_FIXED ( 29 )
  MEMCPY_FIXED ( 30 )
  MEMCPY_FIXED ( 31 )
  #undef MEMCPY_FIXED
  /**
   * Copy data through the variable-length memcpy() code path
   *
   * The function is marked noinline, so a constant length at the call
   * site is not propagated into the memcpy() call made here.
   *
   * @v dest		Destination address
   * @v src		Source address
   * @v len		Length of data
   * @ret dest		Destination address
   */
  __attribute__ (( noinline )) void * memcpy_var ( void *dest, const void *src,
                                                  size_t len ) {
      void *copied;

      copied = memcpy ( dest, src, len );
      return copied;
  }
  /**
   * Check a fixed block of data through both memcpy() code paths
   *
   * The data is copied once with memcpy() directly and once via
   * memcpy_var().  Each destination buffer carries one guard byte on
   * either side of the copied region; the guards and the copied data
   * are verified after each copy.
   *
   * @v ...		Data to copy
   */
  #define MEMCPY_TEST_CONSTANT( ... ) do {                                \
      static const uint8_t src[] = { __VA_ARGS__ };                       \
      uint8_t dest_const[ 1 + sizeof ( src ) + 1 ];                       \
      uint8_t dest_var[ 1 + sizeof ( src ) + 1 ];                         \
                                                                          \
      /* Direct memcpy() call, bracketed by guard bytes */                \
      dest_const[0] = 0x33;                                               \
      dest_const[ sizeof ( dest_const ) - 1 ] = 0x44;                     \
      memcpy ( &dest_const[1], src, sizeof ( src ) );                     \
      ok ( dest_const[0] == 0x33 );                                       \
      ok ( dest_const[ sizeof ( dest_const ) - 1 ] == 0x44 );             \
      ok ( memcmp ( ( dest_const + 1 ), src,                              \
                    ( sizeof ( dest_const ) - 2 ) ) == 0 );               \
                                                                          \
      /* Same data via memcpy_var(), bracketed by guard bytes */          \
      dest_var[0] = 0x55;                                                 \
      dest_var[ sizeof ( dest_var ) - 1 ] = 0x66;                         \
      memcpy_var ( &dest_var[1], src, sizeof ( src ) );                   \
      ok ( dest_var[0] == 0x55 );                                         \
      ok ( dest_var[ sizeof ( dest_var ) - 1 ] == 0x66 );                 \
      ok ( memcmp ( ( dest_var + 1 ), src,                                \
                    ( sizeof ( dest_var ) - 2 ) ) == 0 );                 \
  } while ( 0 )
  107. /**
  108. * Test memcpy() speed
  109. *
  110. * @v dest_offset Destination alignment offset
  111. * @v src_offset Source alignment offset
  112. * @v len Length of data to copy
  113. */
  114. static void memcpy_test_speed ( unsigned int dest_offset,
  115. unsigned int src_offset, size_t len ) {
  116. struct profiler profiler;
  117. uint8_t *dest;
  118. uint8_t *src;
  119. unsigned int i;
  120. /* Allocate blocks */
  121. dest = malloc ( len + dest_offset );
  122. assert ( dest != NULL );
  123. src = malloc ( len + src_offset );
  124. assert ( src != NULL );
  125. /* Generate random source data */
  126. for ( i = 0 ; i < len ; i++ )
  127. src[ src_offset + i ] = random();
  128. /* Check correctness of copied data */
  129. memcpy ( ( dest + dest_offset ), ( src + src_offset ), len );
  130. ok ( memcmp ( ( dest + dest_offset ), ( src + src_offset ),
  131. len ) == 0 );
  132. /* Profile memcpy() */
  133. memset ( &profiler, 0, sizeof ( profiler ) );
  134. for ( i = 0 ; i < PROFILE_COUNT ; i++ ) {
  135. profile_start ( &profiler );
  136. memcpy ( ( dest + dest_offset ), ( src + src_offset ), len );
  137. profile_stop ( &profiler );
  138. }
  139. /* Free blocks */
  140. free ( dest );
  141. free ( src );
  142. DBG ( "MEMCPY copied %zd bytes (+%d => +%d) in %ld +/- %ld ticks\n",
  143. len, src_offset, dest_offset, profile_mean ( &profiler ),
  144. profile_stddev ( &profiler ) );
  145. }
  /**
   * Run the memcpy() self-tests
   *
   * Exercises constant-length copies for a series of fixed data
   * blocks, then runs the speed tests: three lengths at zero offsets,
   * followed by a 4096-byte copy for every pairing of destination and
   * source offsets from 0 to 3.
   */
  static void memcpy_test_exec ( void ) {
      static const size_t aligned_lens[] = { 64, 128, 256 };
      unsigned int dest_offset;
      unsigned int src_offset;
      unsigned int combo;
      unsigned int i;

      /* Constant-length tests */
      MEMCPY_TEST_CONSTANT ( );
      MEMCPY_TEST_CONSTANT ( 0x86 );
      MEMCPY_TEST_CONSTANT ( 0x8c, 0xd3 );
      MEMCPY_TEST_CONSTANT ( 0x4e, 0x08, 0xed );
      MEMCPY_TEST_CONSTANT ( 0xcc, 0x61, 0x8f, 0x70 );
      MEMCPY_TEST_CONSTANT ( 0x6d, 0x28, 0xe0, 0x9e, 0x6d );
      MEMCPY_TEST_CONSTANT ( 0x7d, 0x13, 0x4f, 0xef, 0x17, 0xb3 );
      MEMCPY_TEST_CONSTANT ( 0x38, 0xa7, 0xd4, 0x8d, 0x44, 0x01, 0xfd );
      MEMCPY_TEST_CONSTANT ( 0x45, 0x9f, 0xf4, 0xf9, 0xf3, 0x0f, 0x99, 0x43 );
      MEMCPY_TEST_CONSTANT ( 0x69, 0x8c, 0xf6, 0x12, 0x79, 0x70, 0xd8, 0x1e,
                             0x9d );
      MEMCPY_TEST_CONSTANT ( 0xbe, 0x53, 0xb4, 0xb7, 0xdd, 0xe6, 0x35, 0x10,
                             0x3c, 0xe7 );
      MEMCPY_TEST_CONSTANT ( 0xaf, 0x41, 0x8a, 0x88, 0xb1, 0x4e, 0x52, 0xd4,
                             0xe6, 0xc3, 0x76 );
      MEMCPY_TEST_CONSTANT ( 0xdf, 0x43, 0xe4, 0x5d, 0xad, 0x17, 0x35, 0x38,
                             0x1a, 0x1d, 0x57, 0x58 );
      MEMCPY_TEST_CONSTANT ( 0x20, 0x52, 0x83, 0x92, 0xb9, 0x85, 0xa4, 0x06,
                             0x94, 0xe0, 0x3d, 0x57, 0xd4 );
      MEMCPY_TEST_CONSTANT ( 0xf1, 0x67, 0x31, 0x9e, 0x32, 0x98, 0x27, 0xe9,
                             0x8e, 0x62, 0xb4, 0x82, 0x7e, 0x02 );
      MEMCPY_TEST_CONSTANT ( 0x93, 0xc1, 0x55, 0xe3, 0x60, 0xce, 0xac, 0x1e,
                             0xae, 0x9d, 0xca, 0xec, 0x92, 0xb3, 0x38 );
      MEMCPY_TEST_CONSTANT ( 0xb3, 0xc1, 0xfa, 0xe7, 0x8a, 0x1c, 0xe4, 0xce,
                             0x85, 0xe6, 0x3c, 0xab, 0x1c, 0xa2, 0xaf, 0x7a );
      MEMCPY_TEST_CONSTANT ( 0x9b, 0x6e, 0x1c, 0x48, 0x82, 0xd3, 0x6e, 0x58,
                             0xa7, 0xb0, 0xe6, 0xea, 0x6d, 0xee, 0xc8, 0xf8,
                             0xaf );
      MEMCPY_TEST_CONSTANT ( 0x86, 0x6d, 0xb0, 0xf5, 0xf2, 0xc9, 0xcd, 0xfe,
                             0xfb, 0x38, 0x67, 0xbc, 0x51, 0x9d, 0x25, 0xbc,
                             0x09, 0x88 );
      MEMCPY_TEST_CONSTANT ( 0x58, 0xa4, 0x96, 0x9e, 0x98, 0x36, 0xdb, 0xae,
                             0x8a, 0x08, 0x7c, 0x64, 0xf9, 0xfb, 0x25, 0xb4,
                             0x8e, 0xf3, 0xed );
      MEMCPY_TEST_CONSTANT ( 0xc6, 0x3b, 0x84, 0x3c, 0x76, 0x24, 0x8e, 0x42,
                             0x11, 0x1f, 0x09, 0x2e, 0x24, 0xbb, 0x67, 0x71,
                             0x3a, 0xca, 0x60, 0xdd );
      MEMCPY_TEST_CONSTANT ( 0x8e, 0x2d, 0xa9, 0x58, 0x87, 0xe2, 0xac, 0x4b,
                             0xc8, 0xbf, 0xa2, 0x4e, 0xee, 0x3a, 0xa6, 0x71,
                             0x76, 0xee, 0x42, 0x05, 0x6e );
      MEMCPY_TEST_CONSTANT ( 0x8a, 0xda, 0xdf, 0x7b, 0x55, 0x41, 0x8c, 0xcd,
                             0x42, 0x40, 0x18, 0xe2, 0x60, 0xc4, 0x7d, 0x64,
                             0x00, 0xd5, 0xef, 0xa1, 0x7b, 0x31 );
      MEMCPY_TEST_CONSTANT ( 0xd9, 0x25, 0xcb, 0xbb, 0x9c, 0x1d, 0xdd, 0xcd,
                             0xde, 0x96, 0xd9, 0x74, 0x13, 0x95, 0xfe, 0x68,
                             0x0b, 0x3d, 0x30, 0x8d, 0x0c, 0x1e, 0x6d );
      MEMCPY_TEST_CONSTANT ( 0x2d, 0x0d, 0x02, 0x33, 0xd6, 0xbe, 0x6c, 0xa6,
                             0x0a, 0xab, 0xe5, 0xda, 0xe2, 0xab, 0x78, 0x3c,
                             0xd3, 0xdd, 0xea, 0xfa, 0x1a, 0xe4, 0xf4, 0xb3 );
      MEMCPY_TEST_CONSTANT ( 0x6a, 0x34, 0x39, 0xea, 0x29, 0x5f, 0xa6, 0x18,
                             0xc1, 0x53, 0x39, 0x78, 0xdb, 0x40, 0xf2, 0x98,
                             0x78, 0xcf, 0xee, 0xfd, 0xcd, 0xf8, 0x56, 0xf8,
                             0x30 );
      MEMCPY_TEST_CONSTANT ( 0xe4, 0xe5, 0x5a, 0x8d, 0xcf, 0x04, 0x29, 0x7c,
                             0xa7, 0xd8, 0x43, 0xbf, 0x0b, 0xbf, 0xe7, 0x68,
                             0xf7, 0x8c, 0x81, 0xf9, 0x3f, 0xad, 0xa4, 0x40,
                             0x38, 0x82 );
      MEMCPY_TEST_CONSTANT ( 0x71, 0xcd, 0x3d, 0x26, 0xde, 0x11, 0x23, 0xd5,
                             0x42, 0x6e, 0x63, 0x72, 0x53, 0xfc, 0x28, 0x06,
                             0x4b, 0xe0, 0x2c, 0x07, 0x6b, 0xe8, 0xd9, 0x5f,
                             0xf8, 0x74, 0xed );
      MEMCPY_TEST_CONSTANT ( 0x05, 0xb2, 0xae, 0x81, 0x91, 0xc9, 0xa2, 0x5f,
                             0xa9, 0x1b, 0x25, 0x7f, 0x32, 0x0c, 0x04, 0x00,
                             0xf1, 0x46, 0xab, 0x77, 0x1e, 0x12, 0x27, 0xe7,
                             0xf6, 0x1e, 0x0c, 0x29 );
      MEMCPY_TEST_CONSTANT ( 0x0e, 0xca, 0xa5, 0x56, 0x3d, 0x99, 0x99, 0xf9,
                             0x6e, 0xdd, 0x93, 0x98, 0xec, 0x8b, 0x5c, 0x71,
                             0x0c, 0xb0, 0xe6, 0x12, 0xf2, 0x10, 0x1a, 0xbe,
                             0x4a, 0xe0, 0xe3, 0x00, 0xf8 );
      MEMCPY_TEST_CONSTANT ( 0x40, 0xa8, 0x28, 0x5b, 0x12, 0x0d, 0x80, 0x8e,
                             0x8a, 0xd9, 0x92, 0x7a, 0x6e, 0x48, 0x8d, 0x14,
                             0x4b, 0xc6, 0xce, 0x21, 0x2f, 0x0e, 0x47, 0xbd,
                             0xf1, 0xca, 0x0e, 0x1f, 0x65, 0xc4 );
      MEMCPY_TEST_CONSTANT ( 0x84, 0x83, 0x44, 0xe8, 0x1c, 0xbf, 0x23, 0x05,
                             0xdf, 0xed, 0x3b, 0xb7, 0x0b, 0x4a, 0x05, 0xec,
                             0xb7, 0x6f, 0x1c, 0xfe, 0x05, 0x05, 0x4e, 0xd1,
                             0x50, 0x88, 0x81, 0x87, 0x68, 0xf6, 0x66 );
      MEMCPY_TEST_CONSTANT ( 0x0d, 0x1d, 0xcf, 0x3e, 0x7c, 0xf8, 0x12, 0x1b,
                             0x96, 0x7f, 0xff, 0x27, 0xca, 0xfe, 0xd3, 0x8b,
                             0x10, 0xb9, 0x5d, 0x05, 0xad, 0x50, 0xed, 0x35,
                             0x32, 0x9c, 0xe6, 0x3b, 0x73, 0xe0, 0x7d );

      /* Speed tests at zero offsets for a few short lengths */
      for ( i = 0 ;
            i < ( sizeof ( aligned_lens ) / sizeof ( aligned_lens[0] ) ) ;
            i++ ) {
          memcpy_test_speed ( 0, 0, aligned_lens[i] );
      }

      /* Speed tests over every destination/source offset pairing;
       * the destination offset varies slowest.
       */
      for ( combo = 0 ; combo < ( 4 * 4 ) ; combo++ ) {
          dest_offset = ( combo / 4 );
          src_offset = ( combo % 4 );
          memcpy_test_speed ( dest_offset, src_offset, 4096 );
      }
  }
  245. /** memcpy() self-test */
  246. struct self_test memcpy_test __self_test = {
  247. .name = "memcpy",
  248. .exec = memcpy_test_exec,
  249. };