|
|
b9ba6d |
2011-03-20 H.J. Lu <hongjiu.lu@intel.com>
|
|
|
b9ba6d |
|
|
|
b9ba6d |
[BZ #12597]
|
|
|
b9ba6d |
* string/test-strncmp.c (do_page_test): New function.
|
|
|
b9ba6d |
(check2): Likewise.
|
|
|
b9ba6d |
(test_main): Call check2.
|
|
|
b9ba6d |
* sysdeps/x86_64/multiarch/strcmp.S: Properly cross page boundary.
|
|
|
b9ba6d |
|
|
|
b9ba6d |
Index: glibc-2.12-2-gc4ccff1/string/test-strncmp.c
|
|
|
b9ba6d |
===================================================================
|
|
|
b9ba6d |
--- glibc-2.12-2-gc4ccff1.orig/string/test-strncmp.c
|
|
|
b9ba6d |
+++ glibc-2.12-2-gc4ccff1/string/test-strncmp.c
|
|
|
b9ba6d |
@@ -200,6 +200,27 @@ do_test (size_t align1, size_t align2, s
|
|
|
b9ba6d |
}
|
|
|
b9ba6d |
|
|
|
b9ba6d |
static void
|
|
|
b9ba6d |
+do_page_test (size_t offset1, size_t offset2, char *s2)
|
|
|
b9ba6d |
+{
|
|
|
b9ba6d |
+ char *s1;
|
|
|
b9ba6d |
+ int exp_result;
|
|
|
b9ba6d |
+
|
|
|
b9ba6d |
+ if (offset1 >= page_size || offset2 >= page_size)
|
|
|
b9ba6d |
+ return;
|
|
|
b9ba6d |
+
|
|
|
b9ba6d |
+ s1 = (char *) (buf1 + offset1);
|
|
|
b9ba6d |
+ s2 += offset2;
|
|
|
b9ba6d |
+
|
|
|
b9ba6d |
+ exp_result= *s1;
|
|
|
b9ba6d |
+
|
|
|
b9ba6d |
+ FOR_EACH_IMPL (impl, 0)
|
|
|
b9ba6d |
+ {
|
|
|
b9ba6d |
+ check_result (impl, s1, s2, page_size, -exp_result);
|
|
|
b9ba6d |
+ check_result (impl, s2, s1, page_size, exp_result);
|
|
|
b9ba6d |
+ }
|
|
|
b9ba6d |
+}
|
|
|
b9ba6d |
+
|
|
|
b9ba6d |
+static void
|
|
|
b9ba6d |
do_random_tests (void)
|
|
|
b9ba6d |
{
|
|
|
b9ba6d |
size_t i, j, n, align1, align2, pos, len1, len2, size;
|
|
|
b9ba6d |
@@ -312,6 +333,25 @@ check1 (void)
|
|
|
b9ba6d |
}
|
|
|
b9ba6d |
}
|
|
|
b9ba6d |
|
|
|
b9ba6d |
+static void
|
|
|
b9ba6d |
+check2 (void)
|
|
|
b9ba6d |
+{
|
|
|
b9ba6d |
+ size_t i;
|
|
|
b9ba6d |
+ char *s1, *s2;
|
|
|
b9ba6d |
+
|
|
|
b9ba6d |
+ s1 = (char *) buf1;
|
|
|
b9ba6d |
+ for (i = 0; i < page_size - 1; i++)
|
|
|
b9ba6d |
+ s1[i] = 23;
|
|
|
b9ba6d |
+ s1[i] = 0;
|
|
|
b9ba6d |
+
|
|
|
b9ba6d |
+ s2 = strdup (s1);
|
|
|
b9ba6d |
+
|
|
|
b9ba6d |
+ for (i = 0; i < 64; ++i)
|
|
|
b9ba6d |
+ do_page_test (3990 + i, 2635, s2);
|
|
|
b9ba6d |
+
|
|
|
b9ba6d |
+ free (s2);
|
|
|
b9ba6d |
+}
|
|
|
b9ba6d |
+
|
|
|
b9ba6d |
int
|
|
|
b9ba6d |
test_main (void)
|
|
|
b9ba6d |
{
|
|
|
b9ba6d |
@@ -320,6 +360,7 @@ test_main (void)
|
|
|
b9ba6d |
test_init ();
|
|
|
b9ba6d |
|
|
|
b9ba6d |
check1 ();
|
|
|
b9ba6d |
+ check2 ();
|
|
|
b9ba6d |
|
|
|
b9ba6d |
printf ("%23s", "");
|
|
|
b9ba6d |
FOR_EACH_IMPL (impl, 0)
|
|
|
b9ba6d |
Index: glibc-2.12-2-gc4ccff1/sysdeps/x86_64/multiarch/strcmp.S
|
|
|
b9ba6d |
===================================================================
|
|
|
b9ba6d |
--- glibc-2.12-2-gc4ccff1.orig/sysdeps/x86_64/multiarch/strcmp.S
|
|
|
b9ba6d |
+++ glibc-2.12-2-gc4ccff1/sysdeps/x86_64/multiarch/strcmp.S
|
|
|
b9ba6d |
@@ -452,6 +452,7 @@ LABEL(loop_ashr_1_use_sse4_2):
|
|
|
b9ba6d |
add $16, %r10
|
|
|
b9ba6d |
jg LABEL(nibble_ashr_1_use_sse4_2)
|
|
|
b9ba6d |
|
|
|
b9ba6d |
+LABEL(nibble_ashr_1_use_sse4_2_restart):
|
|
|
b9ba6d |
movdqa (%rdi, %rdx), %xmm0
|
|
|
b9ba6d |
palignr $1, -16(%rdi, %rdx), %xmm0
|
|
|
b9ba6d |
# if !defined USE_AS_STRCASECMP_L && !defined USE_AS_STRNCASECMP_L
|
|
|
b9ba6d |
@@ -499,7 +500,7 @@ LABEL(nibble_ashr_1_use_sse4_2):
|
|
|
b9ba6d |
jae LABEL(nibble_ashr_use_sse4_2_exit)
|
|
|
b9ba6d |
# endif
|
|
|
b9ba6d |
cmp $14, %ecx
|
|
|
b9ba6d |
- ja LABEL(loop_ashr_1_use_sse4_2)
|
|
|
b9ba6d |
+ ja LABEL(nibble_ashr_1_use_sse4_2_restart)
|
|
|
b9ba6d |
|
|
|
b9ba6d |
jmp LABEL(nibble_ashr_use_sse4_2_exit)
|
|
|
b9ba6d |
|
|
|
b9ba6d |
@@ -544,6 +545,7 @@ LABEL(loop_ashr_2_use_sse4_2):
|
|
|
b9ba6d |
add $16, %r10
|
|
|
b9ba6d |
jg LABEL(nibble_ashr_2_use_sse4_2)
|
|
|
b9ba6d |
|
|
|
b9ba6d |
+LABEL(nibble_ashr_2_use_sse4_2_restart):
|
|
|
b9ba6d |
movdqa (%rdi, %rdx), %xmm0
|
|
|
b9ba6d |
palignr $2, -16(%rdi, %rdx), %xmm0
|
|
|
b9ba6d |
# if !defined USE_AS_STRCASECMP_L && !defined USE_AS_STRNCASECMP_L
|
|
|
b9ba6d |
@@ -591,7 +593,7 @@ LABEL(nibble_ashr_2_use_sse4_2):
|
|
|
b9ba6d |
jae LABEL(nibble_ashr_use_sse4_2_exit)
|
|
|
b9ba6d |
# endif
|
|
|
b9ba6d |
cmp $13, %ecx
|
|
|
b9ba6d |
- ja LABEL(loop_ashr_2_use_sse4_2)
|
|
|
b9ba6d |
+ ja LABEL(nibble_ashr_2_use_sse4_2_restart)
|
|
|
b9ba6d |
|
|
|
b9ba6d |
jmp LABEL(nibble_ashr_use_sse4_2_exit)
|
|
|
b9ba6d |
|
|
|
b9ba6d |
@@ -636,6 +638,7 @@ LABEL(loop_ashr_3_use_sse4_2):
|
|
|
b9ba6d |
add $16, %r10
|
|
|
b9ba6d |
jg LABEL(nibble_ashr_3_use_sse4_2)
|
|
|
b9ba6d |
|
|
|
b9ba6d |
+LABEL(nibble_ashr_3_use_sse4_2_restart):
|
|
|
b9ba6d |
movdqa (%rdi, %rdx), %xmm0
|
|
|
b9ba6d |
palignr $3, -16(%rdi, %rdx), %xmm0
|
|
|
b9ba6d |
# if !defined USE_AS_STRCASECMP_L && !defined USE_AS_STRNCASECMP_L
|
|
|
b9ba6d |
@@ -683,7 +686,7 @@ LABEL(nibble_ashr_3_use_sse4_2):
|
|
|
b9ba6d |
jae LABEL(nibble_ashr_use_sse4_2_exit)
|
|
|
b9ba6d |
# endif
|
|
|
b9ba6d |
cmp $12, %ecx
|
|
|
b9ba6d |
- ja LABEL(loop_ashr_3_use_sse4_2)
|
|
|
b9ba6d |
+ ja LABEL(nibble_ashr_3_use_sse4_2_restart)
|
|
|
b9ba6d |
|
|
|
b9ba6d |
jmp LABEL(nibble_ashr_use_sse4_2_exit)
|
|
|
b9ba6d |
|
|
|
b9ba6d |
@@ -729,6 +732,7 @@ LABEL(loop_ashr_4_use_sse4_2):
|
|
|
b9ba6d |
add $16, %r10
|
|
|
b9ba6d |
jg LABEL(nibble_ashr_4_use_sse4_2)
|
|
|
b9ba6d |
|
|
|
b9ba6d |
+LABEL(nibble_ashr_4_use_sse4_2_restart):
|
|
|
b9ba6d |
movdqa (%rdi, %rdx), %xmm0
|
|
|
b9ba6d |
palignr $4, -16(%rdi, %rdx), %xmm0
|
|
|
b9ba6d |
# if !defined USE_AS_STRCASECMP_L && !defined USE_AS_STRNCASECMP_L
|
|
|
b9ba6d |
@@ -776,7 +780,7 @@ LABEL(nibble_ashr_4_use_sse4_2):
|
|
|
b9ba6d |
jae LABEL(nibble_ashr_use_sse4_2_exit)
|
|
|
b9ba6d |
# endif
|
|
|
b9ba6d |
cmp $11, %ecx
|
|
|
b9ba6d |
- ja LABEL(loop_ashr_4_use_sse4_2)
|
|
|
b9ba6d |
+ ja LABEL(nibble_ashr_4_use_sse4_2_restart)
|
|
|
b9ba6d |
|
|
|
b9ba6d |
jmp LABEL(nibble_ashr_use_sse4_2_exit)
|
|
|
b9ba6d |
|
|
|
b9ba6d |
@@ -822,6 +826,7 @@ LABEL(loop_ashr_5_use_sse4_2):
|
|
|
b9ba6d |
add $16, %r10
|
|
|
b9ba6d |
jg LABEL(nibble_ashr_5_use_sse4_2)
|
|
|
b9ba6d |
|
|
|
b9ba6d |
+LABEL(nibble_ashr_5_use_sse4_2_restart):
|
|
|
b9ba6d |
movdqa (%rdi, %rdx), %xmm0
|
|
|
b9ba6d |
palignr $5, -16(%rdi, %rdx), %xmm0
|
|
|
b9ba6d |
# if !defined USE_AS_STRCASECMP_L && !defined USE_AS_STRNCASECMP_L
|
|
|
b9ba6d |
@@ -870,7 +875,7 @@ LABEL(nibble_ashr_5_use_sse4_2):
|
|
|
b9ba6d |
jae LABEL(nibble_ashr_use_sse4_2_exit)
|
|
|
b9ba6d |
# endif
|
|
|
b9ba6d |
cmp $10, %ecx
|
|
|
b9ba6d |
- ja LABEL(loop_ashr_5_use_sse4_2)
|
|
|
b9ba6d |
+ ja LABEL(nibble_ashr_5_use_sse4_2_restart)
|
|
|
b9ba6d |
|
|
|
b9ba6d |
jmp LABEL(nibble_ashr_use_sse4_2_exit)
|
|
|
b9ba6d |
|
|
|
b9ba6d |
@@ -916,6 +921,7 @@ LABEL(loop_ashr_6_use_sse4_2):
|
|
|
b9ba6d |
add $16, %r10
|
|
|
b9ba6d |
jg LABEL(nibble_ashr_6_use_sse4_2)
|
|
|
b9ba6d |
|
|
|
b9ba6d |
+LABEL(nibble_ashr_6_use_sse4_2_restart):
|
|
|
b9ba6d |
movdqa (%rdi, %rdx), %xmm0
|
|
|
b9ba6d |
palignr $6, -16(%rdi, %rdx), %xmm0
|
|
|
b9ba6d |
# if !defined USE_AS_STRCASECMP_L && !defined USE_AS_STRNCASECMP_L
|
|
|
b9ba6d |
@@ -963,7 +969,7 @@ LABEL(nibble_ashr_6_use_sse4_2):
|
|
|
b9ba6d |
jae LABEL(nibble_ashr_use_sse4_2_exit)
|
|
|
b9ba6d |
# endif
|
|
|
b9ba6d |
cmp $9, %ecx
|
|
|
b9ba6d |
- ja LABEL(loop_ashr_6_use_sse4_2)
|
|
|
b9ba6d |
+ ja LABEL(nibble_ashr_6_use_sse4_2_restart)
|
|
|
b9ba6d |
|
|
|
b9ba6d |
jmp LABEL(nibble_ashr_use_sse4_2_exit)
|
|
|
b9ba6d |
|
|
|
b9ba6d |
@@ -1009,6 +1015,7 @@ LABEL(loop_ashr_7_use_sse4_2):
|
|
|
b9ba6d |
add $16, %r10
|
|
|
b9ba6d |
jg LABEL(nibble_ashr_7_use_sse4_2)
|
|
|
b9ba6d |
|
|
|
b9ba6d |
+LABEL(nibble_ashr_7_use_sse4_2_restart):
|
|
|
b9ba6d |
movdqa (%rdi, %rdx), %xmm0
|
|
|
b9ba6d |
palignr $7, -16(%rdi, %rdx), %xmm0
|
|
|
b9ba6d |
# if !defined USE_AS_STRCASECMP_L && !defined USE_AS_STRNCASECMP_L
|
|
|
b9ba6d |
@@ -1056,7 +1063,7 @@ LABEL(nibble_ashr_7_use_sse4_2):
|
|
|
b9ba6d |
jae LABEL(nibble_ashr_use_sse4_2_exit)
|
|
|
b9ba6d |
# endif
|
|
|
b9ba6d |
cmp $8, %ecx
|
|
|
b9ba6d |
- ja LABEL(loop_ashr_7_use_sse4_2)
|
|
|
b9ba6d |
+ ja LABEL(nibble_ashr_7_use_sse4_2_restart)
|
|
|
b9ba6d |
|
|
|
b9ba6d |
jmp LABEL(nibble_ashr_use_sse4_2_exit)
|
|
|
b9ba6d |
|
|
|
b9ba6d |
@@ -1102,6 +1109,7 @@ LABEL(loop_ashr_8_use_sse4_2):
|
|
|
b9ba6d |
add $16, %r10
|
|
|
b9ba6d |
jg LABEL(nibble_ashr_8_use_sse4_2)
|
|
|
b9ba6d |
|
|
|
b9ba6d |
+LABEL(nibble_ashr_8_use_sse4_2_restart):
|
|
|
b9ba6d |
movdqa (%rdi, %rdx), %xmm0
|
|
|
b9ba6d |
palignr $8, -16(%rdi, %rdx), %xmm0
|
|
|
b9ba6d |
# if !defined USE_AS_STRCASECMP_L && !defined USE_AS_STRNCASECMP_L
|
|
|
b9ba6d |
@@ -1149,7 +1157,7 @@ LABEL(nibble_ashr_8_use_sse4_2):
|
|
|
b9ba6d |
jae LABEL(nibble_ashr_use_sse4_2_exit)
|
|
|
b9ba6d |
# endif
|
|
|
b9ba6d |
cmp $7, %ecx
|
|
|
b9ba6d |
- ja LABEL(loop_ashr_8_use_sse4_2)
|
|
|
b9ba6d |
+ ja LABEL(nibble_ashr_8_use_sse4_2_restart)
|
|
|
b9ba6d |
|
|
|
b9ba6d |
jmp LABEL(nibble_ashr_use_sse4_2_exit)
|
|
|
b9ba6d |
|
|
|
b9ba6d |
@@ -1195,6 +1203,7 @@ LABEL(loop_ashr_9_use_sse4_2):
|
|
|
b9ba6d |
add $16, %r10
|
|
|
b9ba6d |
jg LABEL(nibble_ashr_9_use_sse4_2)
|
|
|
b9ba6d |
|
|
|
b9ba6d |
+LABEL(nibble_ashr_9_use_sse4_2_restart):
|
|
|
b9ba6d |
movdqa (%rdi, %rdx), %xmm0
|
|
|
b9ba6d |
|
|
|
b9ba6d |
palignr $9, -16(%rdi, %rdx), %xmm0
|
|
|
b9ba6d |
@@ -1243,7 +1252,7 @@ LABEL(nibble_ashr_9_use_sse4_2):
|
|
|
b9ba6d |
jae LABEL(nibble_ashr_use_sse4_2_exit)
|
|
|
b9ba6d |
# endif
|
|
|
b9ba6d |
cmp $6, %ecx
|
|
|
b9ba6d |
- ja LABEL(loop_ashr_9_use_sse4_2)
|
|
|
b9ba6d |
+ ja LABEL(nibble_ashr_9_use_sse4_2_restart)
|
|
|
b9ba6d |
|
|
|
b9ba6d |
jmp LABEL(nibble_ashr_use_sse4_2_exit)
|
|
|
b9ba6d |
|
|
|
b9ba6d |
@@ -1289,6 +1298,7 @@ LABEL(loop_ashr_10_use_sse4_2):
|
|
|
b9ba6d |
add $16, %r10
|
|
|
b9ba6d |
jg LABEL(nibble_ashr_10_use_sse4_2)
|
|
|
b9ba6d |
|
|
|
b9ba6d |
+LABEL(nibble_ashr_10_use_sse4_2_restart):
|
|
|
b9ba6d |
movdqa (%rdi, %rdx), %xmm0
|
|
|
b9ba6d |
palignr $10, -16(%rdi, %rdx), %xmm0
|
|
|
b9ba6d |
# if !defined USE_AS_STRCASECMP_L && !defined USE_AS_STRNCASECMP_L
|
|
|
b9ba6d |
@@ -1336,7 +1346,7 @@ LABEL(nibble_ashr_10_use_sse4_2):
|
|
|
b9ba6d |
jae LABEL(nibble_ashr_use_sse4_2_exit)
|
|
|
b9ba6d |
# endif
|
|
|
b9ba6d |
cmp $5, %ecx
|
|
|
b9ba6d |
- ja LABEL(loop_ashr_10_use_sse4_2)
|
|
|
b9ba6d |
+ ja LABEL(nibble_ashr_10_use_sse4_2_restart)
|
|
|
b9ba6d |
|
|
|
b9ba6d |
jmp LABEL(nibble_ashr_use_sse4_2_exit)
|
|
|
b9ba6d |
|
|
|
b9ba6d |
@@ -1382,6 +1392,7 @@ LABEL(loop_ashr_11_use_sse4_2):
|
|
|
b9ba6d |
add $16, %r10
|
|
|
b9ba6d |
jg LABEL(nibble_ashr_11_use_sse4_2)
|
|
|
b9ba6d |
|
|
|
b9ba6d |
+LABEL(nibble_ashr_11_use_sse4_2_restart):
|
|
|
b9ba6d |
movdqa (%rdi, %rdx), %xmm0
|
|
|
b9ba6d |
palignr $11, -16(%rdi, %rdx), %xmm0
|
|
|
b9ba6d |
# if !defined USE_AS_STRCASECMP_L && !defined USE_AS_STRNCASECMP_L
|
|
|
b9ba6d |
@@ -1429,7 +1440,7 @@ LABEL(nibble_ashr_11_use_sse4_2):
|
|
|
b9ba6d |
jae LABEL(nibble_ashr_use_sse4_2_exit)
|
|
|
b9ba6d |
# endif
|
|
|
b9ba6d |
cmp $4, %ecx
|
|
|
b9ba6d |
- ja LABEL(loop_ashr_11_use_sse4_2)
|
|
|
b9ba6d |
+ ja LABEL(nibble_ashr_11_use_sse4_2_restart)
|
|
|
b9ba6d |
|
|
|
b9ba6d |
jmp LABEL(nibble_ashr_use_sse4_2_exit)
|
|
|
b9ba6d |
|
|
|
b9ba6d |
@@ -1475,6 +1486,7 @@ LABEL(loop_ashr_12_use_sse4_2):
|
|
|
b9ba6d |
add $16, %r10
|
|
|
b9ba6d |
jg LABEL(nibble_ashr_12_use_sse4_2)
|
|
|
b9ba6d |
|
|
|
b9ba6d |
+LABEL(nibble_ashr_12_use_sse4_2_restart):
|
|
|
b9ba6d |
movdqa (%rdi, %rdx), %xmm0
|
|
|
b9ba6d |
palignr $12, -16(%rdi, %rdx), %xmm0
|
|
|
b9ba6d |
# if !defined USE_AS_STRCASECMP_L && !defined USE_AS_STRNCASECMP_L
|
|
|
b9ba6d |
@@ -1522,7 +1534,7 @@ LABEL(nibble_ashr_12_use_sse4_2):
|
|
|
b9ba6d |
jae LABEL(nibble_ashr_use_sse4_2_exit)
|
|
|
b9ba6d |
# endif
|
|
|
b9ba6d |
cmp $3, %ecx
|
|
|
b9ba6d |
- ja LABEL(loop_ashr_12_use_sse4_2)
|
|
|
b9ba6d |
+ ja LABEL(nibble_ashr_12_use_sse4_2_restart)
|
|
|
b9ba6d |
|
|
|
b9ba6d |
jmp LABEL(nibble_ashr_use_sse4_2_exit)
|
|
|
b9ba6d |
|
|
|
b9ba6d |
@@ -1569,6 +1581,7 @@ LABEL(loop_ashr_13_use_sse4_2):
|
|
|
b9ba6d |
add $16, %r10
|
|
|
b9ba6d |
jg LABEL(nibble_ashr_13_use_sse4_2)
|
|
|
b9ba6d |
|
|
|
b9ba6d |
+LABEL(nibble_ashr_13_use_sse4_2_restart):
|
|
|
b9ba6d |
movdqa (%rdi, %rdx), %xmm0
|
|
|
b9ba6d |
palignr $13, -16(%rdi, %rdx), %xmm0
|
|
|
b9ba6d |
# if !defined USE_AS_STRCASECMP_L && !defined USE_AS_STRNCASECMP_L
|
|
|
b9ba6d |
@@ -1616,7 +1629,7 @@ LABEL(nibble_ashr_13_use_sse4_2):
|
|
|
b9ba6d |
jae LABEL(nibble_ashr_use_sse4_2_exit)
|
|
|
b9ba6d |
# endif
|
|
|
b9ba6d |
cmp $2, %ecx
|
|
|
b9ba6d |
- ja LABEL(loop_ashr_13_use_sse4_2)
|
|
|
b9ba6d |
+ ja LABEL(nibble_ashr_13_use_sse4_2_restart)
|
|
|
b9ba6d |
|
|
|
b9ba6d |
jmp LABEL(nibble_ashr_use_sse4_2_exit)
|
|
|
b9ba6d |
|
|
|
b9ba6d |
@@ -1663,6 +1676,7 @@ LABEL(loop_ashr_14_use_sse4_2):
|
|
|
b9ba6d |
add $16, %r10
|
|
|
b9ba6d |
jg LABEL(nibble_ashr_14_use_sse4_2)
|
|
|
b9ba6d |
|
|
|
b9ba6d |
+LABEL(nibble_ashr_14_use_sse4_2_restart):
|
|
|
b9ba6d |
movdqa (%rdi, %rdx), %xmm0
|
|
|
b9ba6d |
palignr $14, -16(%rdi, %rdx), %xmm0
|
|
|
b9ba6d |
# if !defined USE_AS_STRCASECMP_L && !defined USE_AS_STRNCASECMP_L
|
|
|
b9ba6d |
@@ -1710,7 +1724,7 @@ LABEL(nibble_ashr_14_use_sse4_2):
|
|
|
b9ba6d |
jae LABEL(nibble_ashr_use_sse4_2_exit)
|
|
|
b9ba6d |
# endif
|
|
|
b9ba6d |
cmp $1, %ecx
|
|
|
b9ba6d |
- ja LABEL(loop_ashr_14_use_sse4_2)
|
|
|
b9ba6d |
+ ja LABEL(nibble_ashr_14_use_sse4_2_restart)
|
|
|
b9ba6d |
|
|
|
b9ba6d |
jmp LABEL(nibble_ashr_use_sse4_2_exit)
|
|
|
b9ba6d |
|
|
|
b9ba6d |
@@ -1759,6 +1773,7 @@ LABEL(loop_ashr_15_use_sse4_2):
|
|
|
b9ba6d |
add $16, %r10
|
|
|
b9ba6d |
jg LABEL(nibble_ashr_15_use_sse4_2)
|
|
|
b9ba6d |
|
|
|
b9ba6d |
+LABEL(nibble_ashr_15_use_sse4_2_restart):
|
|
|
b9ba6d |
movdqa (%rdi, %rdx), %xmm0
|
|
|
b9ba6d |
palignr $15, -16(%rdi, %rdx), %xmm0
|
|
|
b9ba6d |
# if !defined USE_AS_STRCASECMP_L && !defined USE_AS_STRNCASECMP_L
|
|
|
b9ba6d |
@@ -1806,7 +1821,7 @@ LABEL(nibble_ashr_15_use_sse4_2):
|
|
|
b9ba6d |
jae LABEL(nibble_ashr_use_sse4_2_exit)
|
|
|
b9ba6d |
# endif
|
|
|
b9ba6d |
cmp $0, %ecx
|
|
|
b9ba6d |
- ja LABEL(loop_ashr_15_use_sse4_2)
|
|
|
b9ba6d |
+ ja LABEL(nibble_ashr_15_use_sse4_2_restart)
|
|
|
b9ba6d |
|
|
|
b9ba6d |
LABEL(nibble_ashr_use_sse4_2_exit):
|
|
|
b9ba6d |
# if !defined USE_AS_STRCASECMP_L && !defined USE_AS_STRNCASECMP_L
|