You cannot select more than 25 topics. Topics must start with a letter or number, can include dashes ('-'), and can be up to 35 characters long.

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106
  1. /*
  2. * Copyright (C) 2007 Michael Brown <mbrown@fensystems.co.uk>.
  3. *
  4. * This program is free software; you can redistribute it and/or
  5. * modify it under the terms of the GNU General Public License as
  6. * published by the Free Software Foundation; either version 2 of the
  7. * License, or any later version.
  8. *
  9. * This program is distributed in the hope that it will be useful, but
  10. * WITHOUT ANY WARRANTY; without even the implied warranty of
  11. * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU
  12. * General Public License for more details.
  13. *
  14. * You should have received a copy of the GNU General Public License
  15. * along with this program; if not, write to the Free Software
  16. * Foundation, Inc., 51 Franklin Street, Fifth Floor, Boston, MA
  17. * 02110-1301, USA.
  18. */
  19. /** @file
  20. *
  21. * Optimised string operations
  22. *
  23. */
  24. FILE_LICENCE ( GPL2_OR_LATER );
  25. #include <string.h>
  /**
   * Copy memory area
   *
   * Copies the first ( len / 4 ) dwords with "rep movsl" and then the
   * remaining ( len % 4 ) bytes with "rep movsb".  The second copy
   * continues from the addresses at which the first one stopped.
   *
   * NOTE(review): both string instructions are issued without touching
   * the direction flag, so this presumably relies on the flag being
   * clear (ascending addresses) on entry -- confirm against callers.
   *
   * @v dest		Destination address
   * @v src		Source address
   * @v len		Length
   * @ret dest		Destination address
   */
  void * __attribute__ (( noinline )) __memcpy ( void *dest, const void *src,
                                                 size_t len ) {
      void *edi = dest;
      const void *esi = src;
      /* Receives the final count register value, which is never
       * used.  Declared as size_t so that this output has the same
       * width as the size_t input operand that is tied to it.
       */
      size_t discard_ecx;

      /* We often do large dword-aligned and dword-length block
       * moves.  Using movsl rather than movsb speeds these up by
       * around 32%.
       */
      __asm__ __volatile__ ( "rep movsl"
                             : "=&D" ( edi ), "=&S" ( esi ),
                               "=&c" ( discard_ecx )
                             : "0" ( edi ), "1" ( esi ), "2" ( len >> 2 )
                             : "memory" );

      /* Copy the trailing 0-3 bytes.  edi and esi were updated by
       * the dword copy above, so they already point just past the
       * data that has been copied.
       */
      __asm__ __volatile__ ( "rep movsb"
                             : "=&D" ( edi ), "=&S" ( esi ),
                               "=&c" ( discard_ecx )
                             : "0" ( edi ), "1" ( esi ), "2" ( len & 3 )
                             : "memory" );

      return dest;
  }
  /**
   * Copy memory area backwards
   *
   * Copies one byte at a time, starting at the last byte of each area
   * and working towards the first.  The direction flag is set for the
   * duration of the copy and cleared again afterwards.
   *
   * @v dest		Destination address
   * @v src		Source address
   * @v len		Length
   * @ret dest		Destination address
   */
  void * __attribute__ (( noinline )) __memcpy_reverse ( void *dest,
                                                         const void *src,
                                                         size_t len ) {
      /* Start from the final byte of each area */
      void *edi = ( dest + len - 1 );
      const void *esi = ( src + len - 1 );
      /* Receives the final count register value, which is never
       * used.  Declared as size_t so that this output has the same
       * width as the size_t input operand that is tied to it.
       */
      size_t discard_ecx;

      /* Assume memmove() is not performance-critical, and perform a
       * bytewise copy for simplicity.
       */
      __asm__ __volatile__ ( "std\n\t"
                             "rep movsb\n\t"
                             "cld\n\t"
                             : "=&D" ( edi ), "=&S" ( esi ),
                               "=&c" ( discard_ecx )
                             : "0" ( edi ), "1" ( esi ),
                               "2" ( len )
                             : "memory" );

      return dest;
  }
  /**
   * Copy (possibly overlapping) memory area
   *
   * Chooses the copy direction from the relative position of the two
   * areas: a destination at or below the source is copied forwards via
   * __memcpy(), and a destination above the source is copied backwards
   * via __memcpy_reverse().
   *
   * @v dest		Destination address
   * @v src		Source address
   * @v len		Length
   * @ret dest		Destination address
   */
  void * __memmove ( void *dest, const void *src, size_t len ) {

      if ( dest <= src ) {
          /* Destination does not lie above the source: copy forwards */
          return __memcpy ( dest, src, len );
      } else {
          /* Destination lies above the source: copy backwards */
          return __memcpy_reverse ( dest, src, len );
      }
  }