forked from rpms/glibc
8618 lines
235 KiB
Diff
8618 lines
235 KiB
Diff
--- glibc-2.11-175-gb34e12e/ChangeLog
|
|
+++ glibc-2.11.90-11/ChangeLog
|
|
@@ -237,68 +237,6 @@
|
|
|
|
* posix/sched.h: Define time_t and pid_t for XPG7.
|
|
|
|
-2010-01-12 H.J. Lu <hongjiu.lu@intel.com>
|
|
-
|
|
- * sysdeps/i386/i686/bcopy.S: New file.
|
|
-
|
|
- * sysdeps/i386/i686/cacheinfo.c (__x86_64_data_cache_size): Define.
|
|
-
|
|
- * sysdeps/i386/i686/memcpy.S (__memcpy_chk): Use ENTRY_CHK
|
|
- and END_CHK.
|
|
- * sysdeps/i386/i686/memmove.S (__memmove_chk): Likewise.
|
|
- * sysdeps/i386/i686/mempcpy.S (__mempcpy_chk): Likewise.
|
|
- * sysdeps/i386/i686/memset.S (__memset_chk): Likewise.
|
|
-
|
|
- * sysdeps/i386/i686/memmove.S: Support USE_AS_BCOPY.
|
|
-
|
|
- * sysdeps/i386/i686/multiarch/Makefile (sysdep_routines): Add
|
|
- bzero-sse2 memset-sse2 memcpy-ssse3 mempcpy-ssse3 memmove-ssse3
|
|
- memcpy-ssse3-rep mempcpy-ssse3-rep memmove-ssse3-rep
|
|
- bcopy-ssse3 bcopy-ssse3-rep memset-sse2-rep bzero-sse2-rep
|
|
- * sysdeps/i386/i686/multiarch/bcopy-ssse3-rep.S: New file.
|
|
- * sysdeps/i386/i686/multiarch/bcopy-ssse3.S: New file.
|
|
- * sysdeps/i386/i686/multiarch/bcopy.S: New file.
|
|
- * sysdeps/i386/i686/multiarch/bzero-sse2-rep.S: New file.
|
|
- * sysdeps/i386/i686/multiarch/bzero-sse2.S: New file.
|
|
- * sysdeps/i386/i686/multiarch/bzero.S: New file.
|
|
- * sysdeps/i386/i686/multiarch/memcpy-ssse3-rep.S: New file.
|
|
- * sysdeps/i386/i686/multiarch/memcpy-ssse3.S: New file.
|
|
- * sysdeps/i386/i686/multiarch/memcpy.S: New file.
|
|
- * sysdeps/i386/i686/multiarch/memcpy_chk.S: New file.
|
|
- * sysdeps/i386/i686/multiarch/memmove-ssse3-rep.S: New file.
|
|
- * sysdeps/i386/i686/multiarch/memmove-ssse3.S: New file.
|
|
- * sysdeps/i386/i686/multiarch/memmove.S: New file.
|
|
- * sysdeps/i386/i686/multiarch/memmove_chk.S: New file.
|
|
- * sysdeps/i386/i686/multiarch/mempcpy-ssse3-rep.S: New file.
|
|
- * sysdeps/i386/i686/multiarch/mempcpy-ssse3.S: New file.
|
|
- * sysdeps/i386/i686/multiarch/mempcpy.S: New file.
|
|
- * sysdeps/i386/i686/multiarch/mempcpy_chk.S: New file.
|
|
- * sysdeps/i386/i686/multiarch/memset-sse2-rep.S: New file.
|
|
- * sysdeps/i386/i686/multiarch/memset-sse2.S: New file.
|
|
- * sysdeps/i386/i686/multiarch/memset.S: New file.
|
|
- * sysdeps/i386/i686/multiarch/memset_chk.S: New file.
|
|
-
|
|
- * sysdeps/i386/sysdep.h (ENTRY_CHK): New.
|
|
- (END_CHK): Likewise.
|
|
-
|
|
- * sysdeps/i386/i686/multiarch/ifunc-defines.sym: Add
|
|
- FEATURE_OFFSET, FEATURE_SIZE and FEATURE_INDEX_1.
|
|
- * sysdeps/x86_64/multiarch/ifunc-defines.sym: Likewise.
|
|
-
|
|
- * sysdeps/x86_64/cacheinfo.c (intel_02_cache_info): Add entries
|
|
- for 0x0e and 0x80.
|
|
- (__x86_64_data_cache_size): New.
|
|
- (init_cacheinfo): Set __x86_64_data_cache_size.
|
|
-
|
|
- * sysdeps/x86_64/multiarch/init-arch.c (__init_cpu_features): Turn
|
|
- on bit_Fast_Rep_String for Intel Core i7.
|
|
-
|
|
- * sysdeps/x86_64/multiarch/init-arch.h (bit_Fast_Rep_String): New.
|
|
- (index_Fast_Rep_String): Likewise.
|
|
- (FEATURE_INDEX_1): Likewise.
|
|
- (FEATURE_INDEX_MAX): Likewise.
|
|
- (cpu_features): Add feature.
|
|
-
|
|
2010-01-12 Ulrich Drepper <drepper@redhat.com>
|
|
|
|
* conform/data/sys/select.h-data: Fix up for XPG7.
|
|
@@ -1903,6 +1841,11 @@ d2009-10-30 Ulrich Drepper <drepper@redhat.com>
|
|
* sysdeps/generic/ldsodefs.h (struct rtld_global): The map element in
|
|
the unique symbol hash table should not be const.
|
|
|
|
+2009-07-22 Jakub Jelinek <jakub@redhat.com>
|
|
+
|
|
+ * Makeconfig (ASFLAGS): Append $(sysdep-ASFLAGS).
|
|
+ * sysdeps/i386/Makefile (sysdep-ASFLAGS): Add -U__i686.
|
|
+
|
|
2009-07-21 Ulrich Drepper <drepper@redhat.com>
|
|
|
|
* sysdeps/x86_64/multiarch/strstr.c: Minor cleanups. Remove
|
|
@@ -2168,6 +2111,11 @@ d2009-10-30 Ulrich Drepper <drepper@redhat.com>
|
|
out common code into new function get_common_indeces. Determine
|
|
extended family and model for Intel processors.
|
|
|
|
+2009-06-26 Andreas Schwab <aschwab@redhat.com>
|
|
+
|
|
+ * timezone/zic.c (stringzone): Don't try to generate a POSIX TZ
|
|
+ string when the timezone ends in DST.
|
|
+
|
|
2009-06-26 Ulrich Drepper <drepper@redhat.com>
|
|
|
|
* resolv/resolv.h: Define RES_SNGLKUPREOP.
|
|
@@ -10861,6 +10809,10 @@ d2009-10-30 Ulrich Drepper <drepper@redhat.com>
|
|
[BZ #4368]
|
|
* stdlib/stdlib.h: Remove obsolete part of comment for realpath.
|
|
|
|
+2007-04-16 Jakub Jelinek <jakub@redhat.com>
|
|
+
|
|
+ * locale/programs/locarchive.c (add_alias, insert_name): Remove static.
|
|
+
|
|
2007-04-16 Ulrich Drepper <drepper@redhat.com>
|
|
|
|
[BZ #4364]
|
|
@@ -12118,6 +12070,15 @@ d2009-10-30 Ulrich Drepper <drepper@redhat.com>
|
|
separators also if no non-zero digits found.
|
|
* stdlib/Makefile (tests): Add tst-strtod3.
|
|
|
|
+2006-12-10 Jakub Jelinek <jakub@redhat.com>
|
|
+
|
|
+ * sysdeps/unix/sysv/linux/netlinkaccess.h: Include linux/if_addr.h
|
|
+ if IFA_MAX is not defined.
|
|
+ (IFA_RTA, IFA_PAYLOAD, IFLA_RTA, IFLA_PAYLOAD): Define if not
|
|
+ defined.
|
|
+ * sysdeps/unix/sysv/linux/check_pf.c: Include netlinkaccess.h
|
|
+ instead of asm/types.h, linux/netlink.h and linux/rtnetlink.h.
|
|
+
|
|
2006-12-09 Ulrich Drepper <drepper@redhat.com>
|
|
|
|
[BZ #3632]
|
|
--- glibc-2.11-175-gb34e12e/ChangeLog.15
|
|
+++ glibc-2.11.90-11/ChangeLog.15
|
|
@@ -477,6 +477,14 @@
|
|
|
|
2004-11-26 Jakub Jelinek <jakub@redhat.com>
|
|
|
|
+ * posix/Makefile (generated): Add getconf.speclist.
|
|
+ ($(inst_libexecdir)/getconf): Use getconf.speclist instead of
|
|
+ getconf output.
|
|
+ ($(objpfx)getconf.speclist): New rule.
|
|
+ * posix/getconf.speclist.h: New file.
|
|
+
|
|
+2004-11-26 Jakub Jelinek <jakub@redhat.com>
|
|
+
|
|
* sysdeps/generic/unsecvars.h (UNSECURE_ENVVARS): Add GETCONF_DIR.
|
|
|
|
2004-11-26 Kaz Kojima <kkojima@rr.iij4u.or.jp>
|
|
@@ -1103,6 +1111,13 @@
|
|
* sysdeps/generic/tempname.c (__path_search): Add missing argument
|
|
TRY_TMPDIR.
|
|
|
|
+2004-11-02 Jakub Jelinek <jakub@redhat.com>
|
|
+
|
|
+ * include/features.h (__USE_FORTIFY_LEVEL): Also set for Red Hat
|
|
+ GCC 3.4.x-RH >= 3.4.2-8.
|
|
+ * debug/tst-chk1.c (do_test): Deal with GCC 3.4.x-RH not
|
|
+ being able to recognize subobjects.
|
|
+
|
|
2004-10-31 Mariusz Mazur <mmazur@kernel.pl>
|
|
|
|
* sysdeps/unix/sysv/linux/alpha/setregid.c: New file.
|
|
@@ -1443,6 +1458,11 @@
|
|
* sysdeps/generic/readonly-area.c (__readonly_str): Renamed to ...
|
|
(__readonly_area): ... this.
|
|
|
|
+2004-10-19 Jakub Jelinek <jakub@redhat.com>
|
|
+
|
|
+ * include/features.h (__USE_FORTIFY_LEVEL): Enable even with
|
|
+ Red Hat gcc4 4.0.0 and above.
|
|
+
|
|
2004-10-18 Jakub Jelinek <jakub@redhat.com>
|
|
|
|
* sysdeps/generic/strcpy_chk.c (__strcpy_chk): Speed up by checking
|
|
@@ -3182,6 +3202,23 @@
|
|
before return type.
|
|
* locale/localename.c (__current_locale_name): Likewise.
|
|
|
|
+2004-08-31 Jakub Jelinek <jakub@redhat.com>
|
|
+
|
|
+ * elf/ldconfig.c (parse_conf): Add prefix argument, prepend it
|
|
+ before arguments to add_dir and pass to parse_conf_include.
|
|
+ (parse_conf_include): Add prefix argument, pass it down to
|
|
+ parse_conf.
|
|
+ (main): Call arch_startup. Adjust parse_conf caller.
|
|
+ Call add_arch_dirs.
|
|
+ * sysdeps/generic/dl-cache.h (arch_startup, add_arch_dirs): Define.
|
|
+ * sysdeps/unix/sysv/linux/i386/dl-cache.h: New file.
|
|
+ * sysdeps/unix/sysv/linux/ia64/dl-cache.h (EMUL_HACK, arch_startup,
|
|
+ add_arch_dirs): Define.
|
|
+ * sysdeps/unix/sysv/linux/ia64/ldd-rewrite.sed: Prepend
|
|
+ /emul/ia32-linux before the 32-bit ld.so pathname.
|
|
+ * sysdeps/unix/sysv/linux/ia64/dl-procinfo.c: New file.
|
|
+ * sysdeps/unix/sysv/linux/ia64/dl-procinfo.h: New file.
|
|
+
|
|
2004-08-30 Roland McGrath <roland@frob.com>
|
|
|
|
* scripts/extract-abilist.awk: If `lastversion' variable defined, omit
|
|
--- glibc-2.11-175-gb34e12e/ChangeLog.16
|
|
+++ glibc-2.11.90-11/ChangeLog.16
|
|
@@ -2042,6 +2042,9 @@
|
|
(__MATHDECL_2): Use __REDIRECT_NTH instead of __REDIRECT
|
|
followed by __THROW.
|
|
|
|
+ * sysdeps/unix/sysv/linux/futimesat.c (futimesat): If
|
|
+ file == NULL, use __futimes unconditionally.
|
|
+
|
|
2006-02-02 Ulrich Drepper <drepper@redhat.com>
|
|
|
|
* sysdeps/unix/sysv/linux/futimesat.c [__NR_futimesat]
|
|
@@ -2101,6 +2104,11 @@
|
|
* sysdeps/ieee754/ldbl-128/s_llrintl.c (__llrintl): Fix a typo.
|
|
* sysdeps/s390/fpu/libm-test-ulps: Remove llrint ulps.
|
|
|
|
+2006-01-30 Jakub Jelinek <jakub@redhat.com>
|
|
+
|
|
+ * include/bits/stdlib-ldbl.h: New file.
|
|
+ * include/bits/wchar-ldbl.h: New file.
|
|
+
|
|
2006-01-19 Thomas Schwinge <tschwinge@gnu.org>
|
|
|
|
* libio/genops.c: Include <stdbool.h>.
|
|
@@ -8922,6 +8930,12 @@
|
|
* argp/argp-help.c (__argp_error): __asprintf -> vasprintf.
|
|
(__argp_failure): Likewise.
|
|
|
|
+2005-08-08 Jakub Jelinek <jakub@redhat.com>
|
|
+
|
|
+ * sysdeps/unix/sysv/linux/dl-osinfo.h (_dl_setup_stack_chk_guard):
|
|
+ Shift marked &errno down on big-endian instead of up.
|
|
+ * elf/tst-stackguard1.c (do_test): Fix a typo.
|
|
+
|
|
2005-08-08 Ulrich Drepper <drepper@redhat.com>
|
|
|
|
* nscd/cache.c (cache_add): Commit hash table and header to disk.
|
|
@@ -9046,6 +9060,17 @@
|
|
__syslog_chk.
|
|
* misc/Versions: Export __syslog_chk and __vsyslog_chk.
|
|
|
|
+2005-07-29 Jakub Jelinek <jakub@redhat.com>
|
|
+
|
|
+ * sysdeps/unix/sysv/linux/dl-osinfo.h: Include errno.h, hp-timing.h,
|
|
+ endian.h.
|
|
+ (_dl_setup_stack_chk_guard): Even without
|
|
+ --enable-stackguard-randomization attempt to do some guard
|
|
+ randomization using hp-timing (if available) and kernel stack and
|
|
+ mmap randomization.
|
|
+ * elf/tst-stackguard1.c (do_test): Don't fail if the poor man's
|
|
+ randomization doesn't work well enough.
|
|
+
|
|
2005-07-28 Thomas Schwinge <schwinge@nic-nac-project.de>
|
|
|
|
[BZ #1137]
|
|
--- glibc-2.11-175-gb34e12e/Makeconfig
|
|
+++ glibc-2.11.90-11/Makeconfig
|
|
@@ -780,12 +780,12 @@ endif
|
|
# The assembler can generate debug information too.
|
|
ifndef ASFLAGS
|
|
ifeq ($(have-cpp-asm-debuginfo),yes)
|
|
-ASFLAGS := $(filter -g%,$(CFLAGS))
|
|
+ASFLAGS = $(filter -g%,$(CFLAGS))
|
|
else
|
|
-ASFLAGS :=
|
|
+ASFLAGS =
|
|
endif
|
|
endif
|
|
-ASFLAGS += $(ASFLAGS-config) $(asflags-cpu)
|
|
+ASFLAGS += $(ASFLAGS-config) $(asflags-cpu) $(sysdep-ASFLAGS)
|
|
|
|
ifndef BUILD_CC
|
|
BUILD_CC = $(CC)
|
|
--- glibc-2.11-175-gb34e12e/csu/Makefile
|
|
+++ glibc-2.11.90-11/csu/Makefile
|
|
@@ -93,7 +93,8 @@ omit-deps += $(crtstuff)
|
|
$(crtstuff:%=$(objpfx)%.o): %.o: %.S $(objpfx)defs.h
|
|
$(compile.S) -g0 $(ASFLAGS-.os) -o $@
|
|
|
|
-CFLAGS-initfini.s = -g0 -fPIC -fno-inline-functions $(fno-unit-at-a-time)
|
|
+CFLAGS-initfini.s = -g0 -fPIC -fno-inline-functions $(fno-unit-at-a-time) \
|
|
+ -fno-asynchronous-unwind-tables
|
|
|
|
vpath initfini.c $(sysdirs)
|
|
|
|
--- glibc-2.11-175-gb34e12e/csu/elf-init.c
|
|
+++ glibc-2.11.90-11/csu/elf-init.c
|
|
@@ -63,6 +63,23 @@ extern void (*__init_array_end []) (int, char **, char **)
|
|
extern void (*__fini_array_start []) (void) attribute_hidden;
|
|
extern void (*__fini_array_end []) (void) attribute_hidden;
|
|
|
|
+#if defined HAVE_VISIBILITY_ATTRIBUTE \
|
|
+ && (defined SHARED || defined LIBC_NONSHARED)
|
|
+# define hidden_undef_2(x) #x
|
|
+# define hidden_undef_1(x) hidden_undef_2 (x)
|
|
+# define hidden_undef(x) \
|
|
+ __asm (hidden_undef_1 (ASM_GLOBAL_DIRECTIVE) " " #x); \
|
|
+ __asm (".hidden " #x);
|
|
+#else
|
|
+# define hidden_undef(x)
|
|
+#endif
|
|
+
|
|
+hidden_undef (__preinit_array_start)
|
|
+hidden_undef (__preinit_array_end)
|
|
+hidden_undef (__init_array_start)
|
|
+hidden_undef (__init_array_end)
|
|
+hidden_undef (__fini_array_start)
|
|
+hidden_undef (__fini_array_end)
|
|
|
|
/* These function symbols are provided for the .init/.fini section entry
|
|
points automagically by the linker. */
|
|
--- glibc-2.11-175-gb34e12e/debug/tst-chk1.c
|
|
+++ glibc-2.11.90-11/debug/tst-chk1.c
|
|
@@ -17,6 +17,9 @@
|
|
Software Foundation, Inc., 59 Temple Place, Suite 330, Boston, MA
|
|
02111-1307 USA. */
|
|
|
|
+/* Hack: make sure GCC doesn't know __chk_fail () will not return. */
|
|
+#define __noreturn__
|
|
+
|
|
#include <assert.h>
|
|
#include <fcntl.h>
|
|
#include <locale.h>
|
|
@@ -242,7 +245,7 @@ do_test (void)
|
|
if (memcmp (a.buf1, "aabcdabcjj", 10))
|
|
FAIL ();
|
|
|
|
-#if __USE_FORTIFY_LEVEL < 2
|
|
+#if __USE_FORTIFY_LEVEL < 2 || !__GNUC_PREREQ (4, 0)
|
|
/* The following tests are supposed to crash with -D_FORTIFY_SOURCE=2
|
|
and sufficient GCC support, as the string operations overflow
|
|
from a.buf1 into a.buf2. */
|
|
@@ -357,7 +360,7 @@ do_test (void)
|
|
memset (a.buf1 + 9, 'j', l0 + 2);
|
|
CHK_FAIL_END
|
|
|
|
-# if __USE_FORTIFY_LEVEL >= 2
|
|
+# if __USE_FORTIFY_LEVEL >= 2 && __GNUC_PREREQ (4, 0)
|
|
# define O 0
|
|
# else
|
|
# define O 1
|
|
--- glibc-2.11-175-gb34e12e/elf/ldconfig.c
|
|
+++ glibc-2.11.90-11/elf/ldconfig.c
|
|
@@ -1020,17 +1020,19 @@ search_dirs (void)
|
|
|
|
|
|
static void parse_conf_include (const char *config_file, unsigned int lineno,
|
|
- bool do_chroot, const char *pattern);
|
|
+ const char *prefix, bool do_chroot,
|
|
+ const char *pattern);
|
|
|
|
/* Parse configuration file. */
|
|
static void
|
|
-parse_conf (const char *filename, bool do_chroot)
|
|
+parse_conf (const char *filename, const char *prefix, bool do_chroot)
|
|
{
|
|
FILE *file = NULL;
|
|
char *line = NULL;
|
|
const char *canon;
|
|
size_t len = 0;
|
|
unsigned int lineno;
|
|
+ size_t prefix_len = prefix ? strlen (prefix) : 0;
|
|
|
|
if (do_chroot && opt_chroot)
|
|
{
|
|
@@ -1091,7 +1093,14 @@ parse_conf (const char *filename, bool do_chroot)
|
|
cp += 8;
|
|
while ((dir = strsep (&cp, " \t")) != NULL)
|
|
if (dir[0] != '\0')
|
|
- parse_conf_include (filename, lineno, do_chroot, dir);
|
|
+ parse_conf_include (filename, lineno, prefix, do_chroot, dir);
|
|
+ }
|
|
+ else if (prefix != NULL)
|
|
+ {
|
|
+ size_t cp_len = strlen (cp);
|
|
+ char new_cp [prefix_len + cp_len + 1];
|
|
+ memcpy (mempcpy (new_cp, prefix, prefix_len), cp, cp_len + 1);
|
|
+ add_dir (new_cp);
|
|
}
|
|
else if (!strncasecmp (cp, "hwcap", 5) && isblank (cp[5]))
|
|
{
|
|
@@ -1154,7 +1163,7 @@ parse_conf (const char *filename, bool do_chroot)
|
|
config files to read. */
|
|
static void
|
|
parse_conf_include (const char *config_file, unsigned int lineno,
|
|
- bool do_chroot, const char *pattern)
|
|
+ const char *prefix, bool do_chroot, const char *pattern)
|
|
{
|
|
if (opt_chroot && pattern[0] != '/')
|
|
error (EXIT_FAILURE, 0,
|
|
@@ -1184,7 +1193,7 @@ parse_conf_include (const char *config_file, unsigned int lineno,
|
|
{
|
|
case 0:
|
|
for (size_t i = 0; i < gl.gl_pathc; ++i)
|
|
- parse_conf (gl.gl_pathv[i], false);
|
|
+ parse_conf (gl.gl_pathv[i], prefix, false);
|
|
globfree64 (&gl);
|
|
break;
|
|
|
|
@@ -1227,6 +1236,8 @@ main (int argc, char **argv)
|
|
/* Set the text message domain. */
|
|
textdomain (_libc_intl_domainname);
|
|
|
|
+ arch_startup (argc, argv);
|
|
+
|
|
/* Parse and process arguments. */
|
|
int remaining;
|
|
argp_parse (&argp, argc, argv, 0, &remaining, NULL);
|
|
@@ -1338,12 +1349,14 @@ main (int argc, char **argv)
|
|
|
|
if (!opt_only_cline)
|
|
{
|
|
- parse_conf (config_file, true);
|
|
+ parse_conf (config_file, NULL, true);
|
|
|
|
/* Always add the standard search paths. */
|
|
add_system_dir (SLIBDIR);
|
|
if (strcmp (SLIBDIR, LIBDIR))
|
|
add_system_dir (LIBDIR);
|
|
+
|
|
+ add_arch_dirs (config_file);
|
|
}
|
|
|
|
if (! opt_ignore_aux_cache)
|
|
--- glibc-2.11-175-gb34e12e/elf/tst-stackguard1.c
|
|
+++ glibc-2.11.90-11/elf/tst-stackguard1.c
|
|
@@ -160,17 +160,21 @@ do_test (void)
|
|
the 16 runs, something is very wrong. */
|
|
int ndifferences = 0;
|
|
int ndefaults = 0;
|
|
+ int npartlyrandomized = 0;
|
|
for (i = 0; i < N; ++i)
|
|
{
|
|
if (child_stack_chk_guards[i] != child_stack_chk_guards[i+1])
|
|
ndifferences++;
|
|
else if (child_stack_chk_guards[i] == default_guard)
|
|
ndefaults++;
|
|
+ else if (*(char *) &child_stack_chk_guards[i] == 0)
|
|
+ npartlyrandomized++;
|
|
}
|
|
|
|
- printf ("differences %d defaults %d\n", ndifferences, ndefaults);
|
|
+ printf ("differences %d defaults %d partly randomized %d\n",
|
|
+ ndifferences, ndefaults, npartlyrandomized);
|
|
|
|
- if (ndifferences < N / 2 && ndefaults < N / 2)
|
|
+ if ((ndifferences + ndefaults + npartlyrandomized) < 3 * N / 4)
|
|
{
|
|
puts ("stack guard canaries are not randomized enough");
|
|
puts ("nor equal to the default canary value");
|
|
--- glibc-2.11-175-gb34e12e/include/bits/stdlib-ldbl.h
|
|
+++ glibc-2.11.90-11/include/bits/stdlib-ldbl.h
|
|
@@ -0,0 +1 @@
|
|
+#include <stdlib/bits/stdlib-ldbl.h>
|
|
--- glibc-2.11-175-gb34e12e/include/bits/wchar-ldbl.h
|
|
+++ glibc-2.11.90-11/include/bits/wchar-ldbl.h
|
|
@@ -0,0 +1 @@
|
|
+#include <wcsmbs/bits/wchar-ldbl.h>
|
|
--- glibc-2.11-175-gb34e12e/include/features.h
|
|
+++ glibc-2.11.90-11/include/features.h
|
|
@@ -308,8 +308,13 @@
|
|
#endif
|
|
|
|
#if defined _FORTIFY_SOURCE && _FORTIFY_SOURCE > 0 \
|
|
- && __GNUC_PREREQ (4, 1) && defined __OPTIMIZE__ && __OPTIMIZE__ > 0
|
|
-# if _FORTIFY_SOURCE > 1
|
|
+ && defined __OPTIMIZE__ && __OPTIMIZE__ > 0
|
|
+# if !__GNUC_PREREQ (4, 1)
|
|
+# ifdef __GNUC_RH_RELEASE__
|
|
+# warning _FORTIFY_SOURCE supported only with GCC 4.1 and later
|
|
+# endif
|
|
+# define __USE_FORTIFY_LEVEL 0
|
|
+# elif _FORTIFY_SOURCE > 1
|
|
# define __USE_FORTIFY_LEVEL 2
|
|
# else
|
|
# define __USE_FORTIFY_LEVEL 1
|
|
--- glibc-2.11-175-gb34e12e/intl/locale.alias
|
|
+++ glibc-2.11.90-11/intl/locale.alias
|
|
@@ -57,8 +57,6 @@ korean ko_KR.eucKR
|
|
korean.euc ko_KR.eucKR
|
|
ko_KR ko_KR.eucKR
|
|
lithuanian lt_LT.ISO-8859-13
|
|
-no_NO nb_NO.ISO-8859-1
|
|
-no_NO.ISO-8859-1 nb_NO.ISO-8859-1
|
|
norwegian nb_NO.ISO-8859-1
|
|
nynorsk nn_NO.ISO-8859-1
|
|
polish pl_PL.ISO-8859-2
|
|
--- glibc-2.11-175-gb34e12e/libio/stdio.h
|
|
+++ glibc-2.11.90-11/libio/stdio.h
|
|
@@ -165,10 +165,12 @@ typedef _G_fpos64_t fpos64_t;
|
|
extern struct _IO_FILE *stdin; /* Standard input stream. */
|
|
extern struct _IO_FILE *stdout; /* Standard output stream. */
|
|
extern struct _IO_FILE *stderr; /* Standard error output stream. */
|
|
+#ifdef __STDC__
|
|
/* C89/C99 say they're macros. Make them happy. */
|
|
#define stdin stdin
|
|
#define stdout stdout
|
|
#define stderr stderr
|
|
+#endif
|
|
|
|
__BEGIN_NAMESPACE_STD
|
|
/* Remove file FILENAME. */
|
|
--- glibc-2.11-175-gb34e12e/locale/iso-4217.def
|
|
+++ glibc-2.11.90-11/locale/iso-4217.def
|
|
@@ -8,6 +8,7 @@
|
|
*
|
|
* !!! The list has to be sorted !!!
|
|
*/
|
|
+DEFINE_INT_CURR("ADP") /* Andorran Peseta -> EUR */
|
|
DEFINE_INT_CURR("AED") /* United Arab Emirates Dirham */
|
|
DEFINE_INT_CURR("AFN") /* Afghanistan Afgani */
|
|
DEFINE_INT_CURR("ALL") /* Albanian Lek */
|
|
@@ -15,12 +16,14 @@ DEFINE_INT_CURR("AMD") /* Armenia Dram */
|
|
DEFINE_INT_CURR("ANG") /* Netherlands Antilles */
|
|
DEFINE_INT_CURR("AOA") /* Angolan Kwanza */
|
|
DEFINE_INT_CURR("ARS") /* Argentine Peso */
|
|
+DEFINE_INT_CURR("ATS") /* Austrian Schilling -> EUR */
|
|
DEFINE_INT_CURR("AUD") /* Australian Dollar */
|
|
DEFINE_INT_CURR("AWG") /* Aruba Guilder */
|
|
DEFINE_INT_CURR("AZM") /* Azerbaijan Manat */
|
|
DEFINE_INT_CURR("BAM") /* Bosnian and Herzegovina Convertible Mark */
|
|
DEFINE_INT_CURR("BBD") /* Barbados Dollar */
|
|
DEFINE_INT_CURR("BDT") /* Bangladesh Taka */
|
|
+DEFINE_INT_CURR("BEF") /* Belgian Franc -> EUR */
|
|
DEFINE_INT_CURR("BGN") /* Bulgarian Lev */
|
|
DEFINE_INT_CURR("BHD") /* Bahraini Dinar */
|
|
DEFINE_INT_CURR("BIF") /* Burundi Franc */
|
|
@@ -44,6 +47,7 @@ DEFINE_INT_CURR("CUP") /* Cuban Peso */
|
|
DEFINE_INT_CURR("CVE") /* Cape Verde Escudo */
|
|
DEFINE_INT_CURR("CYP") /* Cypriot Pound */
|
|
DEFINE_INT_CURR("CZK") /* Czech Koruna */
|
|
+DEFINE_INT_CURR("DEM") /* German Mark -> EUR */
|
|
DEFINE_INT_CURR("DJF") /* Djibouti Franc */
|
|
DEFINE_INT_CURR("DKK") /* Danish Krone (Faroe Islands, Greenland) */
|
|
DEFINE_INT_CURR("DOP") /* Dominican Republic */
|
|
@@ -51,16 +55,20 @@ DEFINE_INT_CURR("DZD") /* Algerian Dinar */
|
|
DEFINE_INT_CURR("EEK") /* Estonian Kroon */
|
|
DEFINE_INT_CURR("EGP") /* Egyptian Pound */
|
|
DEFINE_INT_CURR("ERN") /* Eritrean Nakfa */
|
|
+DEFINE_INT_CURR("ESP") /* Spanish Peseta -> EUR */
|
|
DEFINE_INT_CURR("ETB") /* Ethiopian Birr */
|
|
DEFINE_INT_CURR("EUR") /* European Union Euro */
|
|
+DEFINE_INT_CURR("FIM") /* Finnish Markka -> EUR */
|
|
DEFINE_INT_CURR("FJD") /* Fiji Dollar */
|
|
DEFINE_INT_CURR("FKP") /* Falkland Islands Pound (Malvinas) */
|
|
+DEFINE_INT_CURR("FRF") /* French Franc -> EUR */
|
|
DEFINE_INT_CURR("GBP") /* British Pound */
|
|
DEFINE_INT_CURR("GEL") /* Georgia Lari */
|
|
DEFINE_INT_CURR("GHC") /* Ghana Cedi */
|
|
DEFINE_INT_CURR("GIP") /* Gibraltar Pound */
|
|
DEFINE_INT_CURR("GMD") /* Gambian Dalasi */
|
|
DEFINE_INT_CURR("GNF") /* Guinea Franc */
|
|
+DEFINE_INT_CURR("GRD") /* Greek Drachma -> EUR */
|
|
DEFINE_INT_CURR("GTQ") /* Guatemala Quetzal */
|
|
DEFINE_INT_CURR("GYD") /* Guyana Dollar */
|
|
DEFINE_INT_CURR("HKD") /* Hong Kong Dollar */
|
|
@@ -69,12 +77,14 @@ DEFINE_INT_CURR("HRK") /* Croatia Kuna */
|
|
DEFINE_INT_CURR("HTG") /* Haiti Gourde */
|
|
DEFINE_INT_CURR("HUF") /* Hungarian Forint */
|
|
DEFINE_INT_CURR("IDR") /* Indonesia Rupiah */
|
|
+DEFINE_INT_CURR("IEP") /* Irish Pound -> EUR */
|
|
DEFINE_INT_CURR("ILS") /* Israeli Shekel */
|
|
DEFINE_INT_CURR("IMP") /* Isle of Man Pounds */
|
|
DEFINE_INT_CURR("INR") /* Indian Rupee (Bhutan) */
|
|
DEFINE_INT_CURR("IQD") /* Iraqi Dinar */
|
|
DEFINE_INT_CURR("IRR") /* Iranian Rial */
|
|
DEFINE_INT_CURR("ISK") /* Iceland Krona */
|
|
+DEFINE_INT_CURR("ITL") /* Italian Lira -> EUR */
|
|
DEFINE_INT_CURR("JEP") /* Jersey Pound */
|
|
DEFINE_INT_CURR("JMD") /* Jamaican Dollar */
|
|
DEFINE_INT_CURR("JOD") /* Jordanian Dinar */
|
|
@@ -94,6 +104,7 @@ DEFINE_INT_CURR("LKR") /* Sri Lankan Rupee */
|
|
DEFINE_INT_CURR("LRD") /* Liberian Dollar */
|
|
DEFINE_INT_CURR("LSL") /* Lesotho Maloti */
|
|
DEFINE_INT_CURR("LTL") /* Lithuanian Litas */
|
|
+DEFINE_INT_CURR("LUF") /* Luxembourg Franc -> EUR */
|
|
DEFINE_INT_CURR("LVL") /* Latvia Lat */
|
|
DEFINE_INT_CURR("LYD") /* Libyan Arab Jamahiriya Dinar */
|
|
DEFINE_INT_CURR("MAD") /* Moroccan Dirham */
|
|
@@ -114,6 +125,7 @@ DEFINE_INT_CURR("MZM") /* Mozambique Metical */
|
|
DEFINE_INT_CURR("NAD") /* Namibia Dollar */
|
|
DEFINE_INT_CURR("NGN") /* Nigeria Naira */
|
|
DEFINE_INT_CURR("NIO") /* Nicaragua Cordoba Oro */
|
|
+DEFINE_INT_CURR("NLG") /* Netherlands Guilder -> EUR */
|
|
DEFINE_INT_CURR("NOK") /* Norwegian Krone */
|
|
DEFINE_INT_CURR("NPR") /* Nepalese Rupee */
|
|
DEFINE_INT_CURR("NZD") /* New Zealand Dollar */
|
|
@@ -124,6 +136,7 @@ DEFINE_INT_CURR("PGK") /* Papau New Guinea Kina */
|
|
DEFINE_INT_CURR("PHP") /* Philippines Peso */
|
|
DEFINE_INT_CURR("PKR") /* Pakistan Rupee */
|
|
DEFINE_INT_CURR("PLN") /* Polish Zloty */
|
|
+DEFINE_INT_CURR("PTE") /* Portuguese Escudo -> EUR */
|
|
DEFINE_INT_CURR("PYG") /* Paraguay Guarani */
|
|
DEFINE_INT_CURR("QAR") /* Qatar Rial */
|
|
DEFINE_INT_CURR("ROL") /* Romanian Leu */
|
|
--- glibc-2.11-175-gb34e12e/locale/programs/locarchive.c
|
|
+++ glibc-2.11.90-11/locale/programs/locarchive.c
|
|
@@ -241,9 +241,9 @@ oldlocrecentcmp (const void *a, const void *b)
|
|
/* forward decls for below */
|
|
static uint32_t add_locale (struct locarhandle *ah, const char *name,
|
|
locale_data_t data, bool replace);
|
|
-static void add_alias (struct locarhandle *ah, const char *alias,
|
|
- bool replace, const char *oldname,
|
|
- uint32_t *locrec_offset_p);
|
|
+void add_alias (struct locarhandle *ah, const char *alias,
|
|
+ bool replace, const char *oldname,
|
|
+ uint32_t *locrec_offset_p);
|
|
|
|
|
|
static bool
|
|
@@ -649,7 +649,7 @@ close_archive (struct locarhandle *ah)
|
|
#include "../../intl/explodename.c"
|
|
#include "../../intl/l10nflist.c"
|
|
|
|
-static struct namehashent *
|
|
+struct namehashent *
|
|
insert_name (struct locarhandle *ah,
|
|
const char *name, size_t name_len, bool replace)
|
|
{
|
|
@@ -707,7 +707,7 @@ insert_name (struct locarhandle *ah,
|
|
return &namehashtab[idx];
|
|
}
|
|
|
|
-static void
|
|
+void
|
|
add_alias (struct locarhandle *ah, const char *alias, bool replace,
|
|
const char *oldname, uint32_t *locrec_offset_p)
|
|
{
|
|
--- glibc-2.11-175-gb34e12e/localedata/Makefile
|
|
+++ glibc-2.11.90-11/localedata/Makefile
|
|
@@ -225,6 +225,7 @@ $(INSTALL-SUPPORTED-LOCALES): install-locales-dir
|
|
echo -n '...'; \
|
|
input=`echo $$locale | sed 's/\([^.]*\)[^@]*\(.*\)/\1\2/'`; \
|
|
$(LOCALEDEF) --alias-file=../intl/locale.alias \
|
|
+ --no-archive \
|
|
-i locales/$$input -c -f charmaps/$$charset \
|
|
$(addprefix --prefix=,$(install_root)) $$locale; \
|
|
echo ' done'; \
|
|
--- glibc-2.11-175-gb34e12e/localedata/SUPPORTED
|
|
+++ glibc-2.11.90-11/localedata/SUPPORTED
|
|
@@ -84,6 +84,7 @@ cy_GB.UTF-8/UTF-8 \
|
|
cy_GB/ISO-8859-14 \
|
|
da_DK.UTF-8/UTF-8 \
|
|
da_DK/ISO-8859-1 \
|
|
+da_DK.ISO-8859-15/ISO-8859-15 \
|
|
de_AT.UTF-8/UTF-8 \
|
|
de_AT/ISO-8859-1 \
|
|
de_AT@euro/ISO-8859-15 \
|
|
@@ -115,6 +116,7 @@ en_DK.UTF-8/UTF-8 \
|
|
en_DK/ISO-8859-1 \
|
|
en_GB.UTF-8/UTF-8 \
|
|
en_GB/ISO-8859-1 \
|
|
+en_GB.ISO-8859-15/ISO-8859-15 \
|
|
en_HK.UTF-8/UTF-8 \
|
|
en_HK/ISO-8859-1 \
|
|
en_IE.UTF-8/UTF-8 \
|
|
@@ -130,6 +132,7 @@ en_SG.UTF-8/UTF-8 \
|
|
en_SG/ISO-8859-1 \
|
|
en_US.UTF-8/UTF-8 \
|
|
en_US/ISO-8859-1 \
|
|
+en_US.ISO-8859-15/ISO-8859-15 \
|
|
en_ZA.UTF-8/UTF-8 \
|
|
en_ZA/ISO-8859-1 \
|
|
en_ZW.UTF-8/UTF-8 \
|
|
@@ -305,6 +308,8 @@ nl_NL/ISO-8859-1 \
|
|
nl_NL@euro/ISO-8859-15 \
|
|
nn_NO.UTF-8/UTF-8 \
|
|
nn_NO/ISO-8859-1 \
|
|
+no_NO.UTF-8/UTF-8 \
|
|
+no_NO/ISO-8859-1 \
|
|
nr_ZA/UTF-8 \
|
|
nso_ZA/UTF-8 \
|
|
oc_FR.UTF-8/UTF-8 \
|
|
@@ -364,6 +369,7 @@ sv_FI/ISO-8859-1 \
|
|
sv_FI@euro/ISO-8859-15 \
|
|
sv_SE.UTF-8/UTF-8 \
|
|
sv_SE/ISO-8859-1 \
|
|
+sv_SE.ISO-8859-15/ISO-8859-15 \
|
|
ta_IN/UTF-8 \
|
|
te_IN/UTF-8 \
|
|
tg_TJ.UTF-8/UTF-8 \
|
|
--- glibc-2.11-175-gb34e12e/localedata/locales/cy_GB
|
|
+++ glibc-2.11.90-11/localedata/locales/cy_GB
|
|
@@ -248,8 +248,11 @@ mon "<U0049><U006F><U006E><U0061><U0077><U0072>";/
|
|
d_t_fmt "<U0044><U0079><U0064><U0064><U0020><U0025><U0041><U0020><U0025><U0064><U0020><U006d><U0069><U0073><U0020><U0025><U0042><U0020><U0025><U0059><U0020><U0025><U0054><U0020><U0025><U005A>"
|
|
d_fmt "<U0025><U0064><U002E><U0025><U006D><U002E><U0025><U0079>"
|
|
t_fmt "<U0025><U0054>"
|
|
-am_pm "";""
|
|
-t_fmt_ampm ""
|
|
+am_pm "<U0041><U004D>";"<U0050><U004D>"
|
|
+t_fmt_ampm "<U0025><U006C><U003A><U0025><U004D><U003A><U0025><U0053><U0020><U0025><U0050><U0020><U0025><U005A>"
|
|
+date_fmt "<U0025><U0061><U0020><U0025><U0062><U0020><U0025><U0065>/
|
|
+<U0020><U0025><U0048><U003A><U0025><U004D><U003A><U0025><U0053><U0020>/
|
|
+<U0025><U005A><U0020><U0025><U0059>"
|
|
END LC_TIME
|
|
|
|
LC_MESSAGES
|
|
--- glibc-2.11-175-gb34e12e/localedata/locales/en_GB
|
|
+++ glibc-2.11.90-11/localedata/locales/en_GB
|
|
@@ -116,8 +116,8 @@ mon "<U004A><U0061><U006E><U0075><U0061><U0072><U0079>";/
|
|
d_t_fmt "<U0025><U0061><U0020><U0025><U0064><U0020><U0025><U0062><U0020><U0025><U0059><U0020><U0025><U0054><U0020><U0025><U005A>"
|
|
d_fmt "<U0025><U0064><U002F><U0025><U006D><U002F><U0025><U0079>"
|
|
t_fmt "<U0025><U0054>"
|
|
-am_pm "";""
|
|
-t_fmt_ampm ""
|
|
+am_pm "<U0041><U004D>";"<U0050><U004D>"
|
|
+t_fmt_ampm "<U0025><U006C><U003A><U0025><U004D><U003A><U0025><U0053><U0020><U0025><U0050><U0020><U0025><U005A>"
|
|
date_fmt "<U0025><U0061><U0020><U0025><U0062><U0020><U0025><U0065>/
|
|
<U0020><U0025><U0048><U003A><U0025><U004D><U003A><U0025><U0053><U0020>/
|
|
<U0025><U005A><U0020><U0025><U0059>"
|
|
--- glibc-2.11-175-gb34e12e/localedata/locales/no_NO
|
|
+++ glibc-2.11.90-11/localedata/locales/no_NO
|
|
@@ -0,0 +1,69 @@
|
|
+escape_char /
|
|
+comment_char %
|
|
+
|
|
+% Norwegian language locale for Norway
|
|
+% Source: Norsk Standardiseringsforbund
|
|
+% Address: University Library,
|
|
+% Drammensveien 41, N-9242 Oslo, Norge
|
|
+% Contact: Kolbjoern Aamboe
|
|
+% Tel: +47 - 22859109
|
|
+% Fax: +47 - 22434497
|
|
+% Email: kolbjorn.aambo@usit.uio.no
|
|
+% Language: no
|
|
+% Territory: NO
|
|
+% Revision: 4.3
|
|
+% Date: 1996-10-15
|
|
+% Application: general
|
|
+% Users: general
|
|
+% Repertoiremap: mnemonic.ds
|
|
+% Charset: ISO-8859-1
|
|
+% Distribution and use is free, also
|
|
+% for commercial purposes.
|
|
+
|
|
+LC_IDENTIFICATION
|
|
+copy "nb_NO"
|
|
+END LC_IDENTIFICATION
|
|
+
|
|
+LC_COLLATE
|
|
+copy "nb_NO"
|
|
+END LC_COLLATE
|
|
+
|
|
+LC_CTYPE
|
|
+copy "nb_NO"
|
|
+END LC_CTYPE
|
|
+
|
|
+LC_MONETARY
|
|
+copy "nb_NO"
|
|
+END LC_MONETARY
|
|
+
|
|
+LC_NUMERIC
|
|
+copy "nb_NO"
|
|
+END LC_NUMERIC
|
|
+
|
|
+LC_TIME
|
|
+copy "nb_NO"
|
|
+END LC_TIME
|
|
+
|
|
+LC_MESSAGES
|
|
+copy "nb_NO"
|
|
+END LC_MESSAGES
|
|
+
|
|
+LC_PAPER
|
|
+copy "nb_NO"
|
|
+END LC_PAPER
|
|
+
|
|
+LC_TELEPHONE
|
|
+copy "nb_NO"
|
|
+END LC_TELEPHONE
|
|
+
|
|
+LC_MEASUREMENT
|
|
+copy "nb_NO"
|
|
+END LC_MEASUREMENT
|
|
+
|
|
+LC_NAME
|
|
+copy "nb_NO"
|
|
+END LC_NAME
|
|
+
|
|
+LC_ADDRESS
|
|
+copy "nb_NO"
|
|
+END LC_ADDRESS
|
|
--- glibc-2.11-175-gb34e12e/localedata/locales/zh_TW
|
|
+++ glibc-2.11.90-11/localedata/locales/zh_TW
|
|
@@ -1,7 +1,7 @@
|
|
comment_char %
|
|
escape_char /
|
|
%
|
|
-% Chinese language locale for Taiwan R.O.C.
|
|
+% Chinese language locale for Taiwan
|
|
% charmap: BIG5-CP950
|
|
%
|
|
% Original Author:
|
|
@@ -17,7 +17,7 @@ escape_char /
|
|
% Reference: http://wwwold.dkuug.dk/JTC1/SC22/WG20/docs/n690.pdf
|
|
|
|
LC_IDENTIFICATION
|
|
-title "Chinese locale for Taiwan R.O.C."
|
|
+title "Chinese locale for Taiwan"
|
|
source ""
|
|
address ""
|
|
contact ""
|
|
@@ -25,7 +25,7 @@ email "bug-glibc-locales@gnu.org"
|
|
tel ""
|
|
fax ""
|
|
language "Chinese"
|
|
-territory "Taiwan R.O.C."
|
|
+territory "Taiwan"
|
|
revision "0.2"
|
|
date "2000-08-02"
|
|
%
|
|
--- glibc-2.11-175-gb34e12e/malloc/mcheck.c
|
|
+++ glibc-2.11.90-11/malloc/mcheck.c
|
|
@@ -24,9 +24,25 @@
|
|
# include <mcheck.h>
|
|
# include <stdint.h>
|
|
# include <stdio.h>
|
|
+# include <stdlib.h>
|
|
# include <libintl.h>
|
|
#endif
|
|
|
|
+#ifdef _LIBC
|
|
+extern __typeof (malloc) __libc_malloc;
|
|
+extern __typeof (free) __libc_free;
|
|
+extern __typeof (realloc) __libc_realloc;
|
|
+libc_hidden_proto (__libc_malloc)
|
|
+libc_hidden_proto (__libc_realloc)
|
|
+libc_hidden_proto (__libc_free)
|
|
+libc_hidden_proto (__libc_memalign)
|
|
+#else
|
|
+# define __libc_malloc(sz) malloc (sz)
|
|
+# define __libc_free(ptr) free (ptr)
|
|
+# define __libc_realloc(ptr, sz) realloc (ptr, sz)
|
|
+# define __libc_memalign(al, sz) memalign (al, sz)
|
|
+#endif
|
|
+
|
|
/* Old hook values. */
|
|
static void (*old_free_hook) (__ptr_t ptr, __const __ptr_t);
|
|
static __ptr_t (*old_malloc_hook) (__malloc_size_t size, const __ptr_t);
|
|
@@ -197,7 +213,7 @@ freehook (__ptr_t ptr, const __ptr_t caller)
|
|
if (old_free_hook != NULL)
|
|
(*old_free_hook) (ptr, caller);
|
|
else
|
|
- free (ptr);
|
|
+ __libc_free (ptr);
|
|
__free_hook = freehook;
|
|
}
|
|
|
|
@@ -214,7 +230,7 @@ mallochook (__malloc_size_t size, const __ptr_t caller)
|
|
hdr = (struct hdr *) (*old_malloc_hook) (sizeof (struct hdr) + size + 1,
|
|
caller);
|
|
else
|
|
- hdr = (struct hdr *) malloc (sizeof (struct hdr) + size + 1);
|
|
+ hdr = (struct hdr *) __libc_malloc (sizeof (struct hdr) + size + 1);
|
|
__malloc_hook = mallochook;
|
|
if (hdr == NULL)
|
|
return NULL;
|
|
@@ -245,7 +261,7 @@ memalignhook (__malloc_size_t alignment, __malloc_size_t size,
|
|
if (old_memalign_hook != NULL)
|
|
block = (*old_memalign_hook) (alignment, slop + size + 1, caller);
|
|
else
|
|
- block = memalign (alignment, slop + size + 1);
|
|
+ block = __libc_memalign (alignment, slop + size + 1);
|
|
__memalign_hook = memalignhook;
|
|
if (block == NULL)
|
|
return NULL;
|
|
@@ -300,8 +316,8 @@ reallochook (__ptr_t ptr, __malloc_size_t size, const __ptr_t caller)
|
|
sizeof (struct hdr) + size + 1,
|
|
caller);
|
|
else
|
|
- hdr = (struct hdr *) realloc ((__ptr_t) hdr,
|
|
- sizeof (struct hdr) + size + 1);
|
|
+ hdr = (struct hdr *) __libc_realloc ((__ptr_t) hdr,
|
|
+ sizeof (struct hdr) + size + 1);
|
|
__free_hook = freehook;
|
|
__malloc_hook = mallochook;
|
|
__memalign_hook = memalignhook;
|
|
@@ -361,8 +377,8 @@ mcheck (func)
|
|
if (__malloc_initialized <= 0 && !mcheck_used)
|
|
{
|
|
/* We call malloc() once here to ensure it is initialized. */
|
|
- void *p = malloc (0);
|
|
- free (p);
|
|
+ void *p = __libc_malloc (0);
|
|
+ __libc_free (p);
|
|
|
|
old_free_hook = __free_hook;
|
|
__free_hook = freehook;
|
|
--- glibc-2.11-175-gb34e12e/manual/libc.texinfo
|
|
+++ glibc-2.11.90-11/manual/libc.texinfo
|
|
@@ -5,7 +5,7 @@
|
|
@c setchapternewpage odd
|
|
|
|
@comment Tell install-info what to do.
|
|
-@dircategory Software libraries
|
|
+@dircategory Libraries
|
|
@direntry
|
|
* Libc: (libc). C library.
|
|
@end direntry
|
|
--- glibc-2.11-175-gb34e12e/misc/sys/cdefs.h
|
|
+++ glibc-2.11.90-11/misc/sys/cdefs.h
|
|
@@ -132,7 +132,10 @@
|
|
#define __bos(ptr) __builtin_object_size (ptr, __USE_FORTIFY_LEVEL > 1)
|
|
#define __bos0(ptr) __builtin_object_size (ptr, 0)
|
|
|
|
-#if __GNUC_PREREQ (4,3)
|
|
+#if __GNUC_PREREQ (4,3) \
|
|
+ || (defined __GNUC_RH_RELEASE__ && __GNUC__ == 4 \
|
|
+ && __GNUC_MINOR__ == 1 && __GNUC_PATCHLEVEL__ == 2 \
|
|
+ && __GNUC_RH_RELEASE__ >= 31)
|
|
# define __warndecl(name, msg) \
|
|
extern void name (void) __attribute__((__warning__ (msg)))
|
|
# define __warnattr(msg) __attribute__((__warning__ (msg)))
|
|
@@ -291,10 +294,16 @@
|
|
|
|
/* GCC 4.3 and above with -std=c99 or -std=gnu99 implements ISO C99
|
|
inline semantics, unless -fgnu89-inline is used. */
|
|
-#if !defined __cplusplus || __GNUC_PREREQ (4,3)
|
|
+#if !defined __cplusplus || __GNUC_PREREQ (4,3) \
|
|
+ || (defined __GNUC_RH_RELEASE__ && __GNUC__ == 4 \
|
|
+ && __GNUC_MINOR__ == 1 && __GNUC_PATCHLEVEL__ == 2 \
|
|
+ && __GNUC_RH_RELEASE__ >= 31)
|
|
# if defined __GNUC_STDC_INLINE__ || defined __cplusplus
|
|
# define __extern_inline extern __inline __attribute__ ((__gnu_inline__))
|
|
-# if __GNUC_PREREQ (4,3)
|
|
+# if __GNUC_PREREQ (4,3) \
|
|
+ || (defined __GNUC_RH_RELEASE__ && __GNUC__ == 4 \
|
|
+ && __GNUC_MINOR__ == 1 && __GNUC_PATCHLEVEL__ == 2 \
|
|
+ && __GNUC_RH_RELEASE__ >= 31)
|
|
# define __extern_always_inline \
|
|
extern __always_inline __attribute__ ((__gnu_inline__, __artificial__))
|
|
# else
|
|
@@ -314,7 +323,10 @@
|
|
|
|
/* GCC 4.3 and above allow passing all anonymous arguments of an
|
|
__extern_always_inline function to some other vararg function. */
|
|
-#if __GNUC_PREREQ (4,3)
|
|
+#if __GNUC_PREREQ (4,3) \
|
|
+ || (defined __GNUC_RH_RELEASE__ && __GNUC__ == 4 \
|
|
+ && __GNUC_MINOR__ == 1 && __GNUC_PATCHLEVEL__ == 2 \
|
|
+ && __GNUC_RH_RELEASE__ >= 31)
|
|
# define __va_arg_pack() __builtin_va_arg_pack ()
|
|
# define __va_arg_pack_len() __builtin_va_arg_pack_len ()
|
|
#endif
|
|
--- glibc-2.11-175-gb34e12e/nis/nss
|
|
+++ glibc-2.11.90-11/nis/nss
|
|
@@ -25,4 +25,4 @@
|
|
# memory with every getXXent() call. Otherwise each getXXent() call
|
|
# might result into a network communication with the server to get
|
|
# the next entry.
|
|
-#SETENT_BATCH_READ=TRUE
|
|
+SETENT_BATCH_READ=TRUE
|
|
--- glibc-2.11-175-gb34e12e/nptl/ChangeLog
|
|
+++ glibc-2.11.90-11/nptl/ChangeLog
|
|
@@ -3834,6 +3834,15 @@
|
|
Use __sigfillset. Document that sigfillset does the right thing wrt
|
|
to SIGSETXID.
|
|
|
|
+2005-08-08 Jakub Jelinek <jakub@redhat.com>
|
|
+
|
|
+ * tst-stackguard1.c (do_test): Likewise.
|
|
+
|
|
+2005-07-29 Jakub Jelinek <jakub@redhat.com>
|
|
+
|
|
+ * tst-stackguard1.c (do_test): Don't fail if the poor man's
|
|
+ randomization doesn't work well enough.
|
|
+
|
|
2005-07-11 Jakub Jelinek <jakub@redhat.com>
|
|
|
|
[BZ #1102]
|
|
@@ -4570,6 +4579,11 @@
|
|
Move definition inside libpthread, libc, librt check. Provide
|
|
definition for rtld.
|
|
|
|
+2004-09-02 Jakub Jelinek <jakub@redhat.com>
|
|
+
|
|
+ * pthread_cond_destroy.c (__pthread_cond_destroy): If there are
|
|
+ waiters, awake all waiters on the associated mutex.
|
|
+
|
|
2004-09-02 Ulrich Drepper <drepper@redhat.com>
|
|
|
|
* sysdeps/alpha/jmpbuf-unwind.h: Define __libc_unwind_longjmp.
|
|
@@ -6644,6 +6658,11 @@
|
|
|
|
* Makefile [$(build-shared) = yes] (tests): Depend on $(test-modules).
|
|
|
|
+2003-07-22 Jakub Jelinek <jakub@redhat.com>
|
|
+
|
|
+ * descr.h: Don't include lowlevellock.h, pthreaddef.h and dl-sysdep.h
|
|
+ if __need_struct_pthread_size, instead define lll_lock_t.
|
|
+
|
|
2003-07-25 Jakub Jelinek <jakub@redhat.com>
|
|
|
|
* tst-cancel17.c (do_test): Check if aio_cancel failed.
|
|
--- glibc-2.11-175-gb34e12e/nptl/Makefile
|
|
+++ glibc-2.11.90-11/nptl/Makefile
|
|
@@ -339,7 +339,8 @@ endif
|
|
extra-objs += $(crti-objs) $(crtn-objs)
|
|
omit-deps += crti crtn
|
|
|
|
-CFLAGS-pt-initfini.s = -g0 -fPIC -fno-inline-functions $(fno-unit-at-a-time)
|
|
+CFLAGS-pt-initfini.s = -g0 -fPIC -fno-inline-functions $(fno-unit-at-a-time) \
|
|
+ -fno-asynchronous-unwind-tables
|
|
endif
|
|
|
|
CFLAGS-flockfile.c = -D_IO_MTSAFE_IO
|
|
@@ -525,15 +526,19 @@ $(addprefix $(objpfx), \
|
|
$(tests) $(xtests) $(test-srcs))): $(objpfx)libpthread.so \
|
|
$(objpfx)libpthread_nonshared.a
|
|
$(objpfx)tst-unload: $(common-objpfx)dlfcn/libdl.so
|
|
-# $(objpfx)../libc.so is used instead of $(common-objpfx)libc.so,
|
|
+# $(objpfx)linklibc.so is used instead of $(common-objpfx)libc.so,
|
|
# since otherwise libpthread.so comes before libc.so when linking.
|
|
$(addprefix $(objpfx), $(tests-reverse)): \
|
|
- $(objpfx)../libc.so $(objpfx)libpthread.so \
|
|
+ $(objpfx)linklibc.so $(objpfx)libpthread.so \
|
|
$(objpfx)libpthread_nonshared.a
|
|
$(objpfx)../libc.so: $(common-objpfx)libc.so ;
|
|
$(addprefix $(objpfx),$(tests-static) $(xtests-static)): $(objpfx)libpthread.a
|
|
|
|
$(objpfx)tst-atfork2.out: $(objpfx)tst-atfork2mod.so
|
|
+
|
|
+$(objpfx)linklibc.so: $(common-objpfx)libc.so
|
|
+ ln -s ../libc.so $@
|
|
+generated += linklibc.so
|
|
else
|
|
$(addprefix $(objpfx),$(tests) $(test-srcs)): $(objpfx)libpthread.a
|
|
endif
|
|
--- glibc-2.11-175-gb34e12e/nptl/sysdeps/unix/sysv/linux/bits/posix_opt.h
|
|
+++ glibc-2.11.90-11/nptl/sysdeps/unix/sysv/linux/bits/posix_opt.h
|
|
@@ -189,4 +189,7 @@
|
|
/* Typed memory objects are not available. */
|
|
#define _POSIX_TYPED_MEMORY_OBJECTS -1
|
|
|
|
+/* Streams are not available. */
|
|
+#define _XOPEN_STREAMS -1
|
|
+
|
|
#endif /* bits/posix_opt.h */
|
|
--- glibc-2.11-175-gb34e12e/nptl/sysdeps/unix/sysv/linux/kernel-features.h
|
|
+++ glibc-2.11.90-11/nptl/sysdeps/unix/sysv/linux/kernel-features.h
|
|
@@ -0,0 +1,6 @@
|
|
+#include_next <kernel-features.h>
|
|
+
|
|
+/* NPTL can always assume all clone thread flags work. */
|
|
+#ifndef __ASSUME_CLONE_THREAD_FLAGS
|
|
+# define __ASSUME_CLONE_THREAD_FLAGS 1
|
|
+#endif
|
|
--- glibc-2.11-175-gb34e12e/nptl/tst-stackguard1.c
|
|
+++ glibc-2.11.90-11/nptl/tst-stackguard1.c
|
|
@@ -190,17 +190,21 @@ do_test (void)
|
|
the 16 runs, something is very wrong. */
|
|
int ndifferences = 0;
|
|
int ndefaults = 0;
|
|
+ int npartlyrandomized = 0;
|
|
for (i = 0; i < N; ++i)
|
|
{
|
|
if (child_stack_chk_guards[i] != child_stack_chk_guards[i+1])
|
|
ndifferences++;
|
|
else if (child_stack_chk_guards[i] == default_guard)
|
|
ndefaults++;
|
|
+ else if (*(char *) &child_stack_chk_guards[i] == 0)
|
|
+ npartlyrandomized++;
|
|
}
|
|
|
|
- printf ("differences %d defaults %d\n", ndifferences, ndefaults);
|
|
+ printf ("differences %d defaults %d partly randomized %d\n",
|
|
+ ndifferences, ndefaults, npartlyrandomized);
|
|
|
|
- if (ndifferences < N / 2 && ndefaults < N / 2)
|
|
+ if ((ndifferences + ndefaults + npartlyrandomized) < 3 * N / 4)
|
|
{
|
|
puts ("stack guard canaries are not randomized enough");
|
|
puts ("nor equal to the default canary value");
|
|
--- glibc-2.11-175-gb34e12e/nscd/nscd.conf
|
|
+++ glibc-2.11.90-11/nscd/nscd.conf
|
|
@@ -33,7 +33,7 @@
|
|
# logfile /var/log/nscd.log
|
|
# threads 4
|
|
# max-threads 32
|
|
-# server-user nobody
|
|
+ server-user nscd
|
|
# stat-user somebody
|
|
debug-level 0
|
|
# reload-count 5
|
|
--- glibc-2.11-175-gb34e12e/nscd/nscd.init
|
|
+++ glibc-2.11.90-11/nscd/nscd.init
|
|
@@ -9,6 +9,7 @@
|
|
# slow naming services like NIS, NIS+, LDAP, or hesiod.
|
|
# processname: /usr/sbin/nscd
|
|
# config: /etc/nscd.conf
|
|
+# config: /etc/sysconfig/nscd
|
|
#
|
|
### BEGIN INIT INFO
|
|
# Provides: nscd
|
|
@@ -28,20 +29,8 @@
|
|
# Source function library.
|
|
. /etc/init.d/functions
|
|
|
|
-# nscd does not run on any kernel lower than 2.2.0 because of threading
|
|
-# problems, so we require that in first place.
|
|
-case $(uname -r) in
|
|
- 2.[2-9].*)
|
|
- # this is okay
|
|
- ;;
|
|
- [3-9]*)
|
|
- # these are of course also okay
|
|
- ;;
|
|
- *)
|
|
- #this is not
|
|
- exit 1
|
|
- ;;
|
|
-esac
|
|
+# Source an auxiliary options file if we have one, and pick up NSCD_OPTIONS.
|
|
+[ -r /etc/sysconfig/nscd ] && . /etc/sysconfig/nscd
|
|
|
|
RETVAL=0
|
|
prog=nscd
|
|
@@ -50,7 +39,7 @@ start () {
|
|
[ -d /var/run/nscd ] || mkdir /var/run/nscd
|
|
[ -d /var/db/nscd ] || mkdir /var/db/nscd
|
|
echo -n $"Starting $prog: "
|
|
- daemon /usr/sbin/nscd
|
|
+ daemon /usr/sbin/nscd $NSCD_OPTIONS
|
|
RETVAL=$?
|
|
echo
|
|
[ $RETVAL -eq 0 ] && touch /var/lock/subsys/nscd
|
|
@@ -83,7 +72,7 @@ restart() {
|
|
# See how we were called.
|
|
case "$1" in
|
|
start)
|
|
- start
|
|
+ [ -e /var/lock/subsys/nscd ] || start
|
|
RETVAL=$?
|
|
;;
|
|
stop)
|
|
@@ -99,14 +88,17 @@ case "$1" in
|
|
RETVAL=$?
|
|
;;
|
|
try-restart | condrestart)
|
|
- [ -e /var/lock/subsys/nscd ] && restart
|
|
+ [ ! -e /var/lock/subsys/nscd ] || restart
|
|
RETVAL=$?
|
|
;;
|
|
force-reload | reload)
|
|
echo -n $"Reloading $prog: "
|
|
- killproc /usr/sbin/nscd -HUP
|
|
- RETVAL=$?
|
|
- echo
|
|
+ RETVAL=0
|
|
+ /usr/sbin/nscd -i passwd || RETVAL=$?
|
|
+ /usr/sbin/nscd -i group || RETVAL=$?
|
|
+ /usr/sbin/nscd -i hosts || RETVAL=$?
|
|
+ /usr/sbin/nscd -i services || RETVAL=$?
|
|
+ echo
|
|
;;
|
|
*)
|
|
echo $"Usage: $0 {start|stop|status|restart|reload|condrestart}"
|
|
--- glibc-2.11-175-gb34e12e/posix/Makefile
|
|
+++ glibc-2.11.90-11/posix/Makefile
|
|
@@ -303,15 +303,8 @@ $(inst_libexecdir)/getconf: $(inst_bindir)/getconf \
|
|
mv -f $@/$$spec.new $@/$$spec; \
|
|
done < $(objpfx)getconf.speclist
|
|
|
|
-$(objpfx)getconf.speclist: $(objpfx)getconf
|
|
-ifeq (no,$(cross-compiling))
|
|
- LC_ALL=C GETCONF_DIR=/dev/null \
|
|
- $(run-program-prefix) $< _POSIX_V7_WIDTH_RESTRICTED_ENVS > $@.new
|
|
- LC_ALL=C GETCONF_DIR=/dev/null \
|
|
- $(run-program-prefix) $< _POSIX_V6_WIDTH_RESTRICTED_ENVS >> $@.new
|
|
- LC_ALL=C GETCONF_DIR=/dev/null \
|
|
- $(run-program-prefix) $< _XBS5_WIDTH_RESTRICTED_ENVS >> $@.new
|
|
-else
|
|
- > $@.new
|
|
-endif
|
|
+$(objpfx)getconf.speclist: getconf.speclist.h
|
|
+ $(CC) -E $(CFLAGS) $(CPPFLAGS) $< \
|
|
+ | sed -n -e '/START_OF_STRINGS/,$${/\(POSIX_V[67]\|XBS5\)_/{s/^[^"]*"//;s/".*$$//;p}}' \
|
|
+ > $@.new
|
|
mv -f $@.new $@
|
|
--- glibc-2.11-175-gb34e12e/posix/getconf.speclist.h
|
|
+++ glibc-2.11.90-11/posix/getconf.speclist.h
|
|
@@ -0,0 +1,39 @@
|
|
+#include <unistd.h>
|
|
+const char *START_OF_STRINGS =
|
|
+#if _POSIX_V7_ILP32_OFF32 == 1
|
|
+"POSIX_V7_ILP32_OFF32"
|
|
+#endif
|
|
+#if _POSIX_V7_ILP32_OFFBIG == 1
|
|
+"POSIX_V7_ILP32_OFFBIG"
|
|
+#endif
|
|
+#if _POSIX_V7_LP64_OFF64 == 1
|
|
+"POSIX_V7_LP64_OFF64"
|
|
+#endif
|
|
+#if _POSIX_V7_LPBIG_OFFBIG == 1
|
|
+"POSIX_V7_LPBIG_OFFBIG"
|
|
+#endif
|
|
+#if _POSIX_V6_ILP32_OFF32 == 1
|
|
+"POSIX_V6_ILP32_OFF32"
|
|
+#endif
|
|
+#if _POSIX_V6_ILP32_OFFBIG == 1
|
|
+"POSIX_V6_ILP32_OFFBIG"
|
|
+#endif
|
|
+#if _POSIX_V6_LP64_OFF64 == 1
|
|
+"POSIX_V6_LP64_OFF64"
|
|
+#endif
|
|
+#if _POSIX_V6_LPBIG_OFFBIG == 1
|
|
+"POSIX_V6_LPBIG_OFFBIG"
|
|
+#endif
|
|
+#if _XBS5_ILP32_OFF32 == 1
|
|
+"XBS5_ILP32_OFF32"
|
|
+#endif
|
|
+#if _XBS5_ILP32_OFFBIG == 1
|
|
+"XBS5_ILP32_OFFBIG"
|
|
+#endif
|
|
+#if _XBS5_LP64_OFF64 == 1
|
|
+"XBS5_LP64_OFF64"
|
|
+#endif
|
|
+#if _XBS5_LPBIG_OFFBIG == 1
|
|
+"XBS5_LPBIG_OFFBIG"
|
|
+#endif
|
|
+"";
|
|
--- glibc-2.11-175-gb34e12e/streams/Makefile
|
|
+++ glibc-2.11.90-11/streams/Makefile
|
|
@@ -21,7 +21,7 @@
|
|
#
|
|
subdir := streams
|
|
|
|
-headers = stropts.h sys/stropts.h bits/stropts.h bits/xtitypes.h
|
|
+#headers = stropts.h sys/stropts.h bits/stropts.h bits/xtitypes.h
|
|
routines = isastream getmsg getpmsg putmsg putpmsg fattach fdetach
|
|
|
|
include ../Rules
|
|
--- glibc-2.11-175-gb34e12e/sysdeps/generic/dl-cache.h
|
|
+++ glibc-2.11.90-11/sysdeps/generic/dl-cache.h
|
|
@@ -36,6 +36,14 @@
|
|
# define add_system_dir(dir) add_dir (dir)
|
|
#endif
|
|
|
|
+#ifndef arch_startup
|
|
+# define arch_startup(argc, argv) do { } while (0)
|
|
+#endif
|
|
+
|
|
+#ifndef add_arch_dirs
|
|
+# define add_arch_dirs(config_file) do { } while (0)
|
|
+#endif
|
|
+
|
|
#define CACHEMAGIC "ld.so-1.7.0"
|
|
|
|
/* libc5 and glibc 2.0/2.1 use the same format. For glibc 2.2 another
|
|
--- glibc-2.11-175-gb34e12e/sysdeps/i386/Makefile
|
|
+++ glibc-2.11.90-11/sysdeps/i386/Makefile
|
|
@@ -2,6 +2,8 @@
|
|
# Every i386 port in use uses gas syntax (I think).
|
|
asm-CPPFLAGS += -DGAS_SYNTAX
|
|
|
|
+sysdep-ASFLAGS += -U__i686
|
|
+
|
|
# The i386 `long double' is a distinct type we support.
|
|
long-double-fcts = yes
|
|
|
|
@@ -64,6 +66,14 @@ endif
|
|
|
|
ifneq (,$(filter -mno-tls-direct-seg-refs,$(CFLAGS)))
|
|
defines += -DNO_TLS_DIRECT_SEG_REFS
|
|
+else
|
|
+# .a libraries are not performance critical and so we
|
|
+# build them without direct TLS segment references
|
|
+# always.
|
|
+CPPFLAGS-.o += -DNO_TLS_DIRECT_SEG_REFS
|
|
+CFLAGS-.o += -mno-tls-direct-seg-refs
|
|
+CPPFLAGS-.oS += -DNO_TLS_DIRECT_SEG_REFS
|
|
+CFLAGS-.oS += -mno-tls-direct-seg-refs
|
|
endif
|
|
|
|
ifeq ($(subdir),elf)
|
|
--- glibc-2.11-175-gb34e12e/sysdeps/i386/i686/bcopy.S
|
|
+++ glibc-2.11.90-11//dev/null
|
|
@@ -1,3 +0,0 @@
|
|
-#define USE_AS_BCOPY
|
|
-#define memmove bcopy
|
|
-#include <sysdeps/i386/i686/memmove.S>
|
|
--- glibc-2.11-175-gb34e12e/sysdeps/i386/i686/cacheinfo.c
|
|
+++ glibc-2.11.90-11/sysdeps/i386/i686/cacheinfo.c
|
|
@@ -1,4 +1,3 @@
|
|
-#define __x86_64_data_cache_size __x86_data_cache_size
|
|
#define __x86_64_data_cache_size_half __x86_data_cache_size_half
|
|
#define __x86_64_shared_cache_size __x86_shared_cache_size
|
|
#define __x86_64_shared_cache_size_half __x86_shared_cache_size_half
|
|
--- glibc-2.11-175-gb34e12e/sysdeps/i386/i686/memcpy.S
|
|
+++ glibc-2.11.90-11/sysdeps/i386/i686/memcpy.S
|
|
@@ -32,11 +32,11 @@
|
|
|
|
.text
|
|
#if defined PIC && !defined NOT_IN_libc
|
|
-ENTRY_CHK (__memcpy_chk)
|
|
+ENTRY (__memcpy_chk)
|
|
movl 12(%esp), %eax
|
|
cmpl %eax, 16(%esp)
|
|
jb HIDDEN_JUMPTARGET (__chk_fail)
|
|
-END_CHK (__memcpy_chk)
|
|
+END (__memcpy_chk)
|
|
#endif
|
|
ENTRY (BP_SYM (memcpy))
|
|
ENTER
|
|
--- glibc-2.11-175-gb34e12e/sysdeps/i386/i686/memmove.S
|
|
+++ glibc-2.11.90-11/sysdeps/i386/i686/memmove.S
|
|
@@ -26,27 +26,18 @@
|
|
|
|
#define PARMS LINKAGE+4 /* one spilled register */
|
|
#define RTN PARMS
|
|
+#define DEST RTN+RTN_SIZE
|
|
+#define SRC DEST+PTR_SIZE
|
|
+#define LEN SRC+PTR_SIZE
|
|
|
|
.text
|
|
-
|
|
-#ifdef USE_AS_BCOPY
|
|
-# define SRC RTN+RTN_SIZE
|
|
-# define DEST SRC+PTR_SIZE
|
|
-# define LEN DEST+PTR_SIZE
|
|
-#else
|
|
-# define DEST RTN+RTN_SIZE
|
|
-# define SRC DEST+PTR_SIZE
|
|
-# define LEN SRC+PTR_SIZE
|
|
-
|
|
-# if defined PIC && !defined NOT_IN_libc
|
|
-ENTRY_CHK (__memmove_chk)
|
|
+#if defined PIC && !defined NOT_IN_libc
|
|
+ENTRY (__memmove_chk)
|
|
movl 12(%esp), %eax
|
|
cmpl %eax, 16(%esp)
|
|
jb HIDDEN_JUMPTARGET (__chk_fail)
|
|
-END_CHK (__memmove_chk)
|
|
-# endif
|
|
+END (__memmove_chk)
|
|
#endif
|
|
-
|
|
ENTRY (BP_SYM (memmove))
|
|
ENTER
|
|
|
|
@@ -78,10 +69,8 @@ ENTRY (BP_SYM (memmove))
|
|
movsl
|
|
movl %edx, %esi
|
|
cfi_restore (esi)
|
|
-#ifndef USE_AS_BCOPY
|
|
movl DEST(%esp), %eax
|
|
RETURN_BOUNDED_POINTER (DEST(%esp))
|
|
-#endif
|
|
|
|
popl %edi
|
|
cfi_adjust_cfa_offset (-4)
|
|
@@ -112,10 +101,8 @@ ENTRY (BP_SYM (memmove))
|
|
movsl
|
|
movl %edx, %esi
|
|
cfi_restore (esi)
|
|
-#ifndef USE_AS_BCOPY
|
|
movl DEST(%esp), %eax
|
|
RETURN_BOUNDED_POINTER (DEST(%esp))
|
|
-#endif
|
|
|
|
cld
|
|
popl %edi
|
|
@@ -125,6 +112,4 @@ ENTRY (BP_SYM (memmove))
|
|
LEAVE
|
|
RET_PTR
|
|
END (BP_SYM (memmove))
|
|
-#ifndef USE_AS_BCOPY
|
|
libc_hidden_builtin_def (memmove)
|
|
-#endif
|
|
--- glibc-2.11-175-gb34e12e/sysdeps/i386/i686/mempcpy.S
|
|
+++ glibc-2.11.90-11/sysdeps/i386/i686/mempcpy.S
|
|
@@ -32,11 +32,11 @@
|
|
|
|
.text
|
|
#if defined PIC && !defined NOT_IN_libc
|
|
-ENTRY_CHK (__mempcpy_chk)
|
|
+ENTRY (__mempcpy_chk)
|
|
movl 12(%esp), %eax
|
|
cmpl %eax, 16(%esp)
|
|
jb HIDDEN_JUMPTARGET (__chk_fail)
|
|
-END_CHK (__mempcpy_chk)
|
|
+END (__mempcpy_chk)
|
|
#endif
|
|
ENTRY (BP_SYM (__mempcpy))
|
|
ENTER
|
|
--- glibc-2.11-175-gb34e12e/sysdeps/i386/i686/memset.S
|
|
+++ glibc-2.11.90-11/sysdeps/i386/i686/memset.S
|
|
@@ -40,11 +40,11 @@
|
|
|
|
.text
|
|
#if defined PIC && !defined NOT_IN_libc && !BZERO_P
|
|
-ENTRY_CHK (__memset_chk)
|
|
+ENTRY (__memset_chk)
|
|
movl 12(%esp), %eax
|
|
cmpl %eax, 16(%esp)
|
|
jb HIDDEN_JUMPTARGET (__chk_fail)
|
|
-END_CHK (__memset_chk)
|
|
+END (__memset_chk)
|
|
#endif
|
|
ENTRY (BP_SYM (memset))
|
|
ENTER
|
|
--- glibc-2.11-175-gb34e12e/sysdeps/i386/i686/multiarch/Makefile
|
|
+++ glibc-2.11.90-11/sysdeps/i386/i686/multiarch/Makefile
|
|
@@ -4,10 +4,6 @@ gen-as-const-headers += ifunc-defines.sym
|
|
endif
|
|
|
|
ifeq ($(subdir),string)
|
|
-sysdep_routines += bzero-sse2 memset-sse2 memcpy-ssse3 mempcpy-ssse3 \
|
|
- memmove-ssse3 memcpy-ssse3-rep mempcpy-ssse3-rep \
|
|
- memmove-ssse3-rep bcopy-ssse3 bcopy-ssse3-rep \
|
|
- memset-sse2-rep bzero-sse2-rep
|
|
ifeq (yes,$(config-cflags-sse4))
|
|
sysdep_routines += strcspn-c strpbrk-c strspn-c strstr-c strcasestr-c
|
|
CFLAGS-strcspn-c.c += -msse4
|
|
--- glibc-2.11-175-gb34e12e/sysdeps/i386/i686/multiarch/bcopy-ssse3-rep.S
|
|
+++ glibc-2.11.90-11//dev/null
|
|
@@ -1,4 +0,0 @@
|
|
-#define USE_AS_MEMMOVE
|
|
-#define USE_AS_BCOPY
|
|
-#define MEMCPY __bcopy_ssse3_rep
|
|
-#include "memcpy-ssse3-rep.S"
|
|
--- glibc-2.11-175-gb34e12e/sysdeps/i386/i686/multiarch/bcopy-ssse3.S
|
|
+++ glibc-2.11.90-11//dev/null
|
|
@@ -1,4 +0,0 @@
|
|
-#define USE_AS_MEMMOVE
|
|
-#define USE_AS_BCOPY
|
|
-#define MEMCPY __bcopy_ssse3
|
|
-#include "memcpy-ssse3.S"
|
|
--- glibc-2.11-175-gb34e12e/sysdeps/i386/i686/multiarch/bcopy.S
|
|
+++ glibc-2.11.90-11//dev/null
|
|
@@ -1,89 +0,0 @@
|
|
-/* Multiple versions of bcopy
|
|
- Copyright (C) 2010 Free Software Foundation, Inc.
|
|
- Contributed by Intel Corporation.
|
|
- This file is part of the GNU C Library.
|
|
-
|
|
- The GNU C Library is free software; you can redistribute it and/or
|
|
- modify it under the terms of the GNU Lesser General Public
|
|
- License as published by the Free Software Foundation; either
|
|
- version 2.1 of the License, or (at your option) any later version.
|
|
-
|
|
- The GNU C Library is distributed in the hope that it will be useful,
|
|
- but WITHOUT ANY WARRANTY; without even the implied warranty of
|
|
- MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU
|
|
- Lesser General Public License for more details.
|
|
-
|
|
- You should have received a copy of the GNU Lesser General Public
|
|
- License along with the GNU C Library; if not, write to the Free
|
|
- Software Foundation, Inc., 59 Temple Place, Suite 330, Boston, MA
|
|
- 02111-1307 USA. */
|
|
-
|
|
-#include <sysdep.h>
|
|
-#include <init-arch.h>
|
|
-
|
|
-/* Define multiple versions only for the definition in lib. */
|
|
-#ifndef NOT_IN_libc
|
|
-# ifdef SHARED
|
|
- .section .gnu.linkonce.t.__i686.get_pc_thunk.bx,"ax",@progbits
|
|
- .globl __i686.get_pc_thunk.bx
|
|
- .hidden __i686.get_pc_thunk.bx
|
|
- .p2align 4
|
|
- .type __i686.get_pc_thunk.bx,@function
|
|
-__i686.get_pc_thunk.bx:
|
|
- movl (%esp), %ebx
|
|
- ret
|
|
-
|
|
- .text
|
|
-ENTRY(bcopy)
|
|
- .type bcopy, @gnu_indirect_function
|
|
- pushl %ebx
|
|
- cfi_adjust_cfa_offset (4)
|
|
- cfi_rel_offset (ebx, 0)
|
|
- call __i686.get_pc_thunk.bx
|
|
- addl $_GLOBAL_OFFSET_TABLE_, %ebx
|
|
- cmpl $0, KIND_OFFSET+__cpu_features@GOTOFF(%ebx)
|
|
- jne 1f
|
|
- call __init_cpu_features
|
|
-1: leal __bcopy_ia32@GOTOFF(%ebx), %eax
|
|
- testl $bit_SSSE3, CPUID_OFFSET+index_SSSE3+__cpu_features@GOTOFF(%ebx)
|
|
- jz 2f
|
|
- leal __bcopy_ssse3@GOTOFF(%ebx), %eax
|
|
- testl $bit_Fast_Rep_String, FEATURE_OFFSET+index_Fast_Rep_String+__cpu_features@GOTOFF(%ebx)
|
|
- jz 2f
|
|
- leal __bcopy_ssse3_rep@GOTOFF(%ebx), %eax
|
|
-2: popl %ebx
|
|
- cfi_adjust_cfa_offset (-4)
|
|
- cfi_restore (ebx)
|
|
- ret
|
|
-END(bcopy)
|
|
-# else
|
|
- .text
|
|
-ENTRY(bcopy)
|
|
- .type bcopy, @gnu_indirect_function
|
|
- cmpl $0, KIND_OFFSET+__cpu_features
|
|
- jne 1f
|
|
- call __init_cpu_features
|
|
-1: leal __bcopy_ia32, %eax
|
|
- testl $bit_SSSE3, CPUID_OFFSET+index_SSSE3+__cpu_features
|
|
- jz 2f
|
|
- leal __bcopy_ssse3, %eax
|
|
- testl $bit_Fast_Rep_String, FEATURE_OFFSET+index_Fast_Rep_String+__cpu_features
|
|
- jz 2f
|
|
- leal __bcopy_ssse3_rep, %eax
|
|
-2: ret
|
|
-END(bcopy)
|
|
-# endif
|
|
-
|
|
-# undef ENTRY
|
|
-# define ENTRY(name) \
|
|
- .type __bcopy_ia32, @function; \
|
|
- .p2align 4; \
|
|
- __bcopy_ia32: cfi_startproc; \
|
|
- CALL_MCOUNT
|
|
-# undef END
|
|
-# define END(name) \
|
|
- cfi_endproc; .size __bcopy_ia32, .-__bcopy_ia32
|
|
-
|
|
-#endif
|
|
-
|
|
-#include "../bcopy.S"
|
|
--- glibc-2.11-175-gb34e12e/sysdeps/i386/i686/multiarch/bzero-sse2-rep.S
|
|
+++ glibc-2.11.90-11//dev/null
|
|
@@ -1,3 +0,0 @@
|
|
-#define USE_AS_BZERO
|
|
-#define __memset_sse2_rep __bzero_sse2_rep
|
|
-#include "memset-sse2-rep.S"
|
|
--- glibc-2.11-175-gb34e12e/sysdeps/i386/i686/multiarch/bzero-sse2.S
|
|
+++ glibc-2.11.90-11//dev/null
|
|
@@ -1,3 +0,0 @@
|
|
-#define USE_AS_BZERO
|
|
-#define __memset_sse2 __bzero_sse2
|
|
-#include "memset-sse2.S"
|
|
--- glibc-2.11-175-gb34e12e/sysdeps/i386/i686/multiarch/bzero.S
|
|
+++ glibc-2.11.90-11//dev/null
|
|
@@ -1,97 +0,0 @@
|
|
-/* Multiple versions of bzero
|
|
- Copyright (C) 2010 Free Software Foundation, Inc.
|
|
- Contributed by Intel Corporation.
|
|
- This file is part of the GNU C Library.
|
|
-
|
|
- The GNU C Library is free software; you can redistribute it and/or
|
|
- modify it under the terms of the GNU Lesser General Public
|
|
- License as published by the Free Software Foundation; either
|
|
- version 2.1 of the License, or (at your option) any later version.
|
|
-
|
|
- The GNU C Library is distributed in the hope that it will be useful,
|
|
- but WITHOUT ANY WARRANTY; without even the implied warranty of
|
|
- MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU
|
|
- Lesser General Public License for more details.
|
|
-
|
|
- You should have received a copy of the GNU Lesser General Public
|
|
- License along with the GNU C Library; if not, write to the Free
|
|
- Software Foundation, Inc., 59 Temple Place, Suite 330, Boston, MA
|
|
- 02111-1307 USA. */
|
|
-
|
|
-#include <sysdep.h>
|
|
-#include <init-arch.h>
|
|
-
|
|
-/* Define multiple versions only for the definition in lib. */
|
|
-#ifndef NOT_IN_libc
|
|
-# ifdef SHARED
|
|
- .section .gnu.linkonce.t.__i686.get_pc_thunk.bx,"ax",@progbits
|
|
- .globl __i686.get_pc_thunk.bx
|
|
- .hidden __i686.get_pc_thunk.bx
|
|
- .p2align 4
|
|
- .type __i686.get_pc_thunk.bx,@function
|
|
-__i686.get_pc_thunk.bx:
|
|
- movl (%esp), %ebx
|
|
- ret
|
|
-
|
|
- .text
|
|
-ENTRY(__bzero)
|
|
- .type __bzero, @gnu_indirect_function
|
|
- pushl %ebx
|
|
- cfi_adjust_cfa_offset (4)
|
|
- cfi_rel_offset (ebx, 0)
|
|
- call __i686.get_pc_thunk.bx
|
|
- addl $_GLOBAL_OFFSET_TABLE_, %ebx
|
|
- cmpl $0, KIND_OFFSET+__cpu_features@GOTOFF(%ebx)
|
|
- jne 1f
|
|
- call __init_cpu_features
|
|
-1: leal __bzero_ia32@GOTOFF(%ebx), %eax
|
|
- testl $bit_SSE2, CPUID_OFFSET+index_SSE2+__cpu_features@GOTOFF(%ebx)
|
|
- jz 2f
|
|
- leal __bzero_sse2@GOTOFF(%ebx), %eax
|
|
- testl $bit_Fast_Rep_String, FEATURE_OFFSET+index_Fast_Rep_String+__cpu_features@GOTOFF(%ebx)
|
|
- jz 2f
|
|
- leal __bzero_sse2_rep@GOTOFF(%ebx), %eax
|
|
-2: popl %ebx
|
|
- cfi_adjust_cfa_offset (-4)
|
|
- cfi_restore (ebx)
|
|
- ret
|
|
-END(__bzero)
|
|
-# else
|
|
- .text
|
|
-ENTRY(__bzero)
|
|
- .type __bzero, @gnu_indirect_function
|
|
- cmpl $0, KIND_OFFSET+__cpu_features
|
|
- jne 1f
|
|
- call __init_cpu_features
|
|
-1: leal __bzero_ia32, %eax
|
|
- testl $bit_SSE2, CPUID_OFFSET+index_SSE2+__cpu_features
|
|
- jz 2f
|
|
- leal __bzero_sse2, %eax
|
|
- testl $bit_Fast_Rep_String, FEATURE_OFFSET+index_Fast_Rep_String+__cpu_features
|
|
- jz 2f
|
|
- leal __bzero_sse2_rep, %eax
|
|
-2: ret
|
|
-END(__bzero)
|
|
-# endif
|
|
-
|
|
-# undef ENTRY
|
|
-# define ENTRY(name) \
|
|
- .type __bzero_ia32, @function; \
|
|
- .p2align 4; \
|
|
- __bzero_ia32: cfi_startproc; \
|
|
- CALL_MCOUNT
|
|
-# undef END
|
|
-# define END(name) \
|
|
- cfi_endproc; .size __bzero_ia32, .-__bzero_ia32
|
|
-
|
|
-# ifdef SHARED
|
|
-# undef libc_hidden_builtin_def
|
|
-/* IFUNC doesn't work with the hidden functions in shared library since
|
|
- they will be called without setting up EBX needed for PLT which is
|
|
- used by IFUNC. */
|
|
-# define libc_hidden_builtin_def(name) \
|
|
- .globl __GI___bzero; __GI___bzero = __bzero_ia32
|
|
-# endif
|
|
-#endif
|
|
-
|
|
-#include "../bzero.S"
|
|
--- glibc-2.11-175-gb34e12e/sysdeps/i386/i686/multiarch/ifunc-defines.sym
|
|
+++ glibc-2.11.90-11/sysdeps/i386/i686/multiarch/ifunc-defines.sym
|
|
@@ -13,8 +13,5 @@ CPUID_ECX_OFFSET offsetof (struct cpuid_registers, ecx)
|
|
CPUID_EDX_OFFSET offsetof (struct cpuid_registers, edx)
|
|
FAMILY_OFFSET offsetof (struct cpu_features, family)
|
|
MODEL_OFFSET offsetof (struct cpu_features, model)
|
|
-FEATURE_OFFSET offsetof (struct cpu_features, feature)
|
|
-FEATURE_SIZE sizeof (unsigned int)
|
|
|
|
COMMON_CPUID_INDEX_1
|
|
-FEATURE_INDEX_1
|
|
--- glibc-2.11-175-gb34e12e/sysdeps/i386/i686/multiarch/memcpy-ssse3-rep.S
|
|
+++ glibc-2.11.90-11//dev/null
|
|
@@ -1,1785 +0,0 @@
|
|
-/* memcpy with SSSE3 and REP string.
|
|
- Copyright (C) 2010 Free Software Foundation, Inc.
|
|
- Contributed by Intel Corporation.
|
|
- This file is part of the GNU C Library.
|
|
-
|
|
- The GNU C Library is free software; you can redistribute it and/or
|
|
- modify it under the terms of the GNU Lesser General Public
|
|
- License as published by the Free Software Foundation; either
|
|
- version 2.1 of the License, or (at your option) any later version.
|
|
-
|
|
- The GNU C Library is distributed in the hope that it will be useful,
|
|
- but WITHOUT ANY WARRANTY; without even the implied warranty of
|
|
- MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU
|
|
- Lesser General Public License for more details.
|
|
-
|
|
- You should have received a copy of the GNU Lesser General Public
|
|
- License along with the GNU C Library; if not, write to the Free
|
|
- Software Foundation, Inc., 59 Temple Place, Suite 330, Boston, MA
|
|
- 02111-1307 USA. */
|
|
-
|
|
-#include <sysdep.h>
|
|
-
|
|
-#if !defined NOT_IN_libc \
|
|
- && (defined SHARED \
|
|
- || defined USE_AS_MEMMOVE \
|
|
- || !defined USE_MULTIARCH)
|
|
-
|
|
-#include "asm-syntax.h"
|
|
-
|
|
-#ifndef MEMCPY
|
|
-# define MEMCPY __memcpy_ssse3_rep
|
|
-# define MEMCPY_CHK __memcpy_chk_ssse3_rep
|
|
-#endif
|
|
-
|
|
-#ifdef USE_AS_BCOPY
|
|
-# define SRC PARMS
|
|
-# define DEST SRC+4
|
|
-# define LEN DEST+4
|
|
-#else
|
|
-# define DEST PARMS
|
|
-# define SRC DEST+4
|
|
-# define LEN SRC+4
|
|
-#endif
|
|
-
|
|
-#define CFI_PUSH(REG) \
|
|
- cfi_adjust_cfa_offset (4); \
|
|
- cfi_rel_offset (REG, 0)
|
|
-
|
|
-#define CFI_POP(REG) \
|
|
- cfi_adjust_cfa_offset (-4); \
|
|
- cfi_restore (REG)
|
|
-
|
|
-#define PUSH(REG) pushl REG; CFI_PUSH (REG)
|
|
-#define POP(REG) popl REG; CFI_POP (REG)
|
|
-
|
|
-#ifdef SHARED
|
|
-# define PARMS 8 /* Preserve EBX. */
|
|
-# define ENTRANCE PUSH (%ebx);
|
|
-# define RETURN_END POP (%ebx); ret
|
|
-# define RETURN RETURN_END; CFI_PUSH (%ebx)
|
|
-# define JMPTBL(I, B) I - B
|
|
-
|
|
-/* Load an entry in a jump table into EBX and branch to it. TABLE is a
|
|
- jump table with relative offsets. INDEX is a register contains the
|
|
- index into the jump table. SCALE is the scale of INDEX. */
|
|
-# define BRANCH_TO_JMPTBL_ENTRY(TABLE, INDEX, SCALE) \
|
|
- /* We first load PC into EBX. */ \
|
|
- call __i686.get_pc_thunk.bx; \
|
|
- /* Get the address of the jump table. */ \
|
|
- addl $(TABLE - .), %ebx; \
|
|
- /* Get the entry and convert the relative offset to the \
|
|
- absolute address. */ \
|
|
- addl (%ebx,INDEX,SCALE), %ebx; \
|
|
- /* We loaded the jump table. Go. */ \
|
|
- jmp *%ebx
|
|
-
|
|
-# define BRANCH_TO_JMPTBL_ENTRY_VALUE(TABLE) \
|
|
- addl $(TABLE - .), %ebx
|
|
-
|
|
-# define BRANCH_TO_JMPTBL_ENTRY_TAIL(TABLE, INDEX, SCALE) \
|
|
- addl (%ebx,INDEX,SCALE), %ebx; \
|
|
- /* We loaded the jump table. Go. */ \
|
|
- jmp *%ebx
|
|
-
|
|
- .section .gnu.linkonce.t.__i686.get_pc_thunk.bx,"ax",@progbits
|
|
- .globl __i686.get_pc_thunk.bx
|
|
- .hidden __i686.get_pc_thunk.bx
|
|
- ALIGN (4)
|
|
- .type __i686.get_pc_thunk.bx,@function
|
|
-__i686.get_pc_thunk.bx:
|
|
- movl (%esp), %ebx
|
|
- ret
|
|
-#else
|
|
-# define PARMS 4
|
|
-# define ENTRANCE
|
|
-# define RETURN_END ret
|
|
-# define RETURN RETURN_END
|
|
-# define JMPTBL(I, B) I
|
|
-
|
|
-/* Branch to an entry in a jump table. TABLE is a jump table with
|
|
- absolute offsets. INDEX is a register contains the index into the
|
|
- jump table. SCALE is the scale of INDEX. */
|
|
-# define BRANCH_TO_JMPTBL_ENTRY(TABLE, INDEX, SCALE) \
|
|
- jmp *TABLE(,INDEX,SCALE)
|
|
-
|
|
-# define BRANCH_TO_JMPTBL_ENTRY_VALUE(TABLE)
|
|
-
|
|
-# define BRANCH_TO_JMPTBL_ENTRY_TAIL(TABLE, INDEX, SCALE) \
|
|
- jmp *TABLE(,INDEX,SCALE)
|
|
-#endif
|
|
-
|
|
- .section .text.ssse3,"ax",@progbits
|
|
-#if defined SHARED && !defined NOT_IN_libc && !defined USE_AS_BCOPY
|
|
-ENTRY (MEMCPY_CHK)
|
|
- movl 12(%esp), %eax
|
|
- cmpl %eax, 16(%esp)
|
|
- jb HIDDEN_JUMPTARGET (__chk_fail)
|
|
-END (MEMCPY_CHK)
|
|
-#endif
|
|
-ENTRY (MEMCPY)
|
|
- ENTRANCE
|
|
- movl LEN(%esp), %ecx
|
|
- movl SRC(%esp), %eax
|
|
- movl DEST(%esp), %edx
|
|
-
|
|
-#ifdef USE_AS_MEMMOVE
|
|
- cmp %eax, %edx
|
|
- jb L(copy_forward)
|
|
- je L(fwd_write_0bytes)
|
|
- cmp $32, %ecx
|
|
- jge L(memmove_bwd)
|
|
- jmp L(bk_write_less32bytes_2)
|
|
-L(memmove_bwd):
|
|
- add %ecx, %eax
|
|
- cmp %eax, %edx
|
|
- movl SRC(%esp), %eax
|
|
- jb L(copy_backward)
|
|
-
|
|
-L(copy_forward):
|
|
-#endif
|
|
- cmp $48, %ecx
|
|
- jge L(48bytesormore)
|
|
-
|
|
-L(fwd_write_less32bytes):
|
|
-#ifndef USE_AS_MEMMOVE
|
|
- cmp %dl, %al
|
|
- jl L(bk_write)
|
|
-#endif
|
|
- add %ecx, %edx
|
|
- add %ecx, %eax
|
|
- BRANCH_TO_JMPTBL_ENTRY (L(table_48bytes_fwd), %ecx, 4)
|
|
-#ifndef USE_AS_MEMMOVE
|
|
-L(bk_write):
|
|
- BRANCH_TO_JMPTBL_ENTRY (L(table_48_bytes_bwd), %ecx, 4)
|
|
-#endif
|
|
-
|
|
- ALIGN (4)
|
|
-/* ECX > 32 and EDX is 4 byte aligned. */
|
|
-L(48bytesormore):
|
|
- movdqu (%eax), %xmm0
|
|
- PUSH (%edi)
|
|
- movl %edx, %edi
|
|
- and $-16, %edx
|
|
- PUSH (%esi)
|
|
- add $16, %edx
|
|
- movl %edi, %esi
|
|
- sub %edx, %edi
|
|
- add %edi, %ecx
|
|
- sub %edi, %eax
|
|
-
|
|
-#ifdef SHARED_CACHE_SIZE_HALF
|
|
- cmp $SHARED_CACHE_SIZE_HALF, %ecx
|
|
-#else
|
|
-# ifdef SHARED
|
|
- call __i686.get_pc_thunk.bx
|
|
- add $_GLOBAL_OFFSET_TABLE_, %ebx
|
|
- cmp __x86_shared_cache_size_half@GOTOFF(%ebx), %ecx
|
|
-# else
|
|
- cmp __x86_shared_cache_size_half, %ecx
|
|
-# endif
|
|
-#endif
|
|
-
|
|
- mov %eax, %edi
|
|
- jge L(large_page)
|
|
- and $0xf, %edi
|
|
- jz L(shl_0)
|
|
-
|
|
- BRANCH_TO_JMPTBL_ENTRY (L(shl_table), %edi, 4)
|
|
-
|
|
- ALIGN (4)
|
|
-L(shl_0):
|
|
- movdqu %xmm0, (%esi)
|
|
- xor %edi, %edi
|
|
- cmp $127, %ecx
|
|
- ja L(shl_0_gobble)
|
|
- lea -32(%ecx), %ecx
|
|
-L(shl_0_loop):
|
|
- movdqa (%eax, %edi), %xmm0
|
|
- movdqa 16(%eax, %edi), %xmm1
|
|
- sub $32, %ecx
|
|
- movdqa %xmm0, (%edx, %edi)
|
|
- movdqa %xmm1, 16(%edx, %edi)
|
|
- lea 32(%edi), %edi
|
|
- jl L(shl_0_end)
|
|
-
|
|
- movdqa (%eax, %edi), %xmm0
|
|
- movdqa 16(%eax, %edi), %xmm1
|
|
- sub $32, %ecx
|
|
- movdqa %xmm0, (%edx, %edi)
|
|
- movdqa %xmm1, 16(%edx, %edi)
|
|
- lea 32(%edi), %edi
|
|
- jl L(shl_0_end)
|
|
-
|
|
- movdqa (%eax, %edi), %xmm0
|
|
- movdqa 16(%eax, %edi), %xmm1
|
|
- sub $32, %ecx
|
|
- movdqa %xmm0, (%edx, %edi)
|
|
- movdqa %xmm1, 16(%edx, %edi)
|
|
- lea 32(%edi), %edi
|
|
- jl L(shl_0_end)
|
|
-
|
|
- movdqa (%eax, %edi), %xmm0
|
|
- movdqa 16(%eax, %edi), %xmm1
|
|
- sub $32, %ecx
|
|
- movdqa %xmm0, (%edx, %edi)
|
|
- movdqa %xmm1, 16(%edx, %edi)
|
|
- lea 32(%edi), %edi
|
|
-L(shl_0_end):
|
|
- lea 32(%ecx), %ecx
|
|
- add %ecx, %edi
|
|
- add %edi, %edx
|
|
- add %edi, %eax
|
|
- POP (%esi)
|
|
- POP (%edi)
|
|
- BRANCH_TO_JMPTBL_ENTRY (L(table_48bytes_fwd), %ecx, 4)
|
|
-
|
|
-L(shl_0_gobble):
|
|
-
|
|
-#ifdef DATA_CACHE_SIZE_HALF
|
|
- cmp $DATA_CACHE_SIZE_HALF, %ecx
|
|
-#else
|
|
-# ifdef SHARED
|
|
- call __i686.get_pc_thunk.bx
|
|
- add $_GLOBAL_OFFSET_TABLE_, %ebx
|
|
- mov __x86_data_cache_size_half@GOTOFF(%ebx), %edi
|
|
-# else
|
|
- mov __x86_data_cache_size_half, %edi
|
|
-# endif
|
|
-#endif
|
|
- mov %edi, %esi
|
|
- shr $3, %esi
|
|
- sub %esi, %edi
|
|
- cmp %edi, %ecx
|
|
- jge L(shl_0_gobble_mem_start)
|
|
- lea -128(%ecx), %ecx
|
|
- ALIGN (4)
|
|
-L(shl_0_gobble_cache_loop):
|
|
- movdqa (%eax), %xmm0
|
|
- movaps 0x10(%eax), %xmm1
|
|
- movaps 0x20(%eax), %xmm2
|
|
- movaps 0x30(%eax), %xmm3
|
|
- movaps 0x40(%eax), %xmm4
|
|
- movaps 0x50(%eax), %xmm5
|
|
- movaps 0x60(%eax), %xmm6
|
|
- movaps 0x70(%eax), %xmm7
|
|
- lea 0x80(%eax), %eax
|
|
- sub $128, %ecx
|
|
- movdqa %xmm0, (%edx)
|
|
- movaps %xmm1, 0x10(%edx)
|
|
- movaps %xmm2, 0x20(%edx)
|
|
- movaps %xmm3, 0x30(%edx)
|
|
- movaps %xmm4, 0x40(%edx)
|
|
- movaps %xmm5, 0x50(%edx)
|
|
- movaps %xmm6, 0x60(%edx)
|
|
- movaps %xmm7, 0x70(%edx)
|
|
- lea 0x80(%edx), %edx
|
|
-
|
|
- jge L(shl_0_gobble_cache_loop)
|
|
-L(shl_0_gobble_cache_loop_tail):
|
|
- cmp $-0x40, %ecx
|
|
- lea 0x80(%ecx), %ecx
|
|
- jl L(shl_0_cache_less_64bytes)
|
|
-
|
|
- movdqa (%eax), %xmm0
|
|
- sub $0x40, %ecx
|
|
- movdqa 0x10(%eax), %xmm1
|
|
-
|
|
- movdqa %xmm0, (%edx)
|
|
- movdqa %xmm1, 0x10(%edx)
|
|
-
|
|
- movdqa 0x20(%eax), %xmm0
|
|
- movdqa 0x30(%eax), %xmm1
|
|
- add $0x40, %eax
|
|
-
|
|
- movdqa %xmm0, 0x20(%edx)
|
|
- movdqa %xmm1, 0x30(%edx)
|
|
- add $0x40, %edx
|
|
-L(shl_0_cache_less_64bytes):
|
|
- cmp $0x20, %ecx
|
|
- jl L(shl_0_cache_less_32bytes)
|
|
- movdqa (%eax), %xmm0
|
|
- sub $0x20, %ecx
|
|
- movdqa 0x10(%eax), %xmm1
|
|
- add $0x20, %eax
|
|
- movdqa %xmm0, (%edx)
|
|
- movdqa %xmm1, 0x10(%edx)
|
|
- add $0x20, %edx
|
|
-L(shl_0_cache_less_32bytes):
|
|
- cmp $0x10, %ecx
|
|
- jl L(shl_0_cache_less_16bytes)
|
|
- sub $0x10, %ecx
|
|
- movdqa (%eax), %xmm0
|
|
- add $0x10, %eax
|
|
- movdqa %xmm0, (%edx)
|
|
- add $0x10, %edx
|
|
-L(shl_0_cache_less_16bytes):
|
|
- add %ecx, %edx
|
|
- add %ecx, %eax
|
|
- POP (%esi)
|
|
- POP (%edi)
|
|
- BRANCH_TO_JMPTBL_ENTRY (L(table_48bytes_fwd), %ecx, 4)
|
|
-
|
|
-
|
|
- ALIGN (4)
|
|
-L(shl_0_gobble_mem_start):
|
|
- cmp %al, %dl
|
|
- je L(copy_page_by_rep)
|
|
- lea -128(%ecx), %ecx
|
|
-L(shl_0_gobble_mem_loop):
|
|
- prefetchnta 0x1c0(%eax)
|
|
- prefetchnta 0x280(%eax)
|
|
- prefetchnta 0x1c0(%edx)
|
|
- prefetchnta 0x280(%edx)
|
|
-
|
|
- movdqa (%eax), %xmm0
|
|
- movaps 0x10(%eax), %xmm1
|
|
- movaps 0x20(%eax), %xmm2
|
|
- movaps 0x30(%eax), %xmm3
|
|
- movaps 0x40(%eax), %xmm4
|
|
- movaps 0x50(%eax), %xmm5
|
|
- movaps 0x60(%eax), %xmm6
|
|
- movaps 0x70(%eax), %xmm7
|
|
- lea 0x80(%eax), %eax
|
|
- sub $0x80, %ecx
|
|
- movdqa %xmm0, (%edx)
|
|
- movaps %xmm1, 0x10(%edx)
|
|
- movaps %xmm2, 0x20(%edx)
|
|
- movaps %xmm3, 0x30(%edx)
|
|
- movaps %xmm4, 0x40(%edx)
|
|
- movaps %xmm5, 0x50(%edx)
|
|
- movaps %xmm6, 0x60(%edx)
|
|
- movaps %xmm7, 0x70(%edx)
|
|
- lea 0x80(%edx), %edx
|
|
-
|
|
- jge L(shl_0_gobble_mem_loop)
|
|
- cmp $-0x40, %ecx
|
|
- lea 0x80(%ecx), %ecx
|
|
- jl L(shl_0_mem_less_64bytes)
|
|
-
|
|
- movdqa (%eax), %xmm0
|
|
- sub $0x40, %ecx
|
|
- movdqa 0x10(%eax), %xmm1
|
|
-
|
|
- movdqa %xmm0, (%edx)
|
|
- movdqa %xmm1, 0x10(%edx)
|
|
-
|
|
- movdqa 0x20(%eax), %xmm0
|
|
- movdqa 0x30(%eax), %xmm1
|
|
- add $0x40, %eax
|
|
-
|
|
- movdqa %xmm0, 0x20(%edx)
|
|
- movdqa %xmm1, 0x30(%edx)
|
|
- add $0x40, %edx
|
|
-L(shl_0_mem_less_64bytes):
|
|
- cmp $0x20, %ecx
|
|
- jl L(shl_0_mem_less_32bytes)
|
|
- movdqa (%eax), %xmm0
|
|
- sub $0x20, %ecx
|
|
- movdqa 0x10(%eax), %xmm1
|
|
- add $0x20, %eax
|
|
- movdqa %xmm0, (%edx)
|
|
- movdqa %xmm1, 0x10(%edx)
|
|
- add $0x20, %edx
|
|
-L(shl_0_mem_less_32bytes):
|
|
- cmp $0x10, %ecx
|
|
- jl L(shl_0_mem_less_16bytes)
|
|
- sub $0x10, %ecx
|
|
- movdqa (%eax), %xmm0
|
|
- add $0x10, %eax
|
|
- movdqa %xmm0, (%edx)
|
|
- add $0x10, %edx
|
|
-L(shl_0_mem_less_16bytes):
|
|
- add %ecx, %edx
|
|
- add %ecx, %eax
|
|
- POP (%esi)
|
|
- POP (%edi)
|
|
- BRANCH_TO_JMPTBL_ENTRY (L(table_48bytes_fwd), %ecx, 4)
|
|
-
|
|
-
|
|
- ALIGN (4)
|
|
-L(shl_1):
|
|
- BRANCH_TO_JMPTBL_ENTRY_VALUE(L(table_48bytes_fwd))
|
|
- lea -1(%eax), %eax
|
|
- movaps (%eax), %xmm1
|
|
- xor %edi, %edi
|
|
- lea -32(%ecx), %ecx
|
|
- movdqu %xmm0, (%esi)
|
|
- POP (%esi)
|
|
-L(shl_1_loop):
|
|
-
|
|
- movdqa 16(%eax, %edi), %xmm2
|
|
- sub $32, %ecx
|
|
- movdqa 32(%eax, %edi), %xmm3
|
|
- movdqa %xmm3, %xmm4
|
|
- palignr $1, %xmm2, %xmm3
|
|
- palignr $1, %xmm1, %xmm2
|
|
- lea 32(%edi), %edi
|
|
- movdqa %xmm2, -32(%edx, %edi)
|
|
- movdqa %xmm3, -16(%edx, %edi)
|
|
-
|
|
- jl L(shl_1_end)
|
|
-
|
|
- movdqa 16(%eax, %edi), %xmm2
|
|
- sub $32, %ecx
|
|
- movdqa 32(%eax, %edi), %xmm3
|
|
- movdqa %xmm3, %xmm1
|
|
- palignr $1, %xmm2, %xmm3
|
|
- palignr $1, %xmm4, %xmm2
|
|
- lea 32(%edi), %edi
|
|
- movdqa %xmm2, -32(%edx, %edi)
|
|
- movdqa %xmm3, -16(%edx, %edi)
|
|
-
|
|
- jae L(shl_1_loop)
|
|
-
|
|
-L(shl_1_end):
|
|
- lea 32(%ecx), %ecx
|
|
- add %ecx, %edi
|
|
- add %edi, %edx
|
|
- lea 1(%edi, %eax), %eax
|
|
- POP (%edi)
|
|
- BRANCH_TO_JMPTBL_ENTRY_TAIL(L(table_48bytes_fwd), %ecx, 4)
|
|
-
|
|
- ALIGN (4)
|
|
-L(shl_2):
|
|
- BRANCH_TO_JMPTBL_ENTRY_VALUE(L(table_48bytes_fwd))
|
|
- lea -2(%eax), %eax
|
|
- movaps (%eax), %xmm1
|
|
- xor %edi, %edi
|
|
- lea -32(%ecx), %ecx
|
|
- movdqu %xmm0, (%esi)
|
|
- POP (%esi)
|
|
-L(shl_2_loop):
|
|
-
|
|
- movdqa 16(%eax, %edi), %xmm2
|
|
- sub $32, %ecx
|
|
- movdqa 32(%eax, %edi), %xmm3
|
|
- movdqa %xmm3, %xmm4
|
|
- palignr $2, %xmm2, %xmm3
|
|
- palignr $2, %xmm1, %xmm2
|
|
- lea 32(%edi), %edi
|
|
- movdqa %xmm2, -32(%edx, %edi)
|
|
- movdqa %xmm3, -16(%edx, %edi)
|
|
-
|
|
- jl L(shl_2_end)
|
|
-
|
|
- movdqa 16(%eax, %edi), %xmm2
|
|
- sub $32, %ecx
|
|
- movdqa 32(%eax, %edi), %xmm3
|
|
- movdqa %xmm3, %xmm1
|
|
- palignr $2, %xmm2, %xmm3
|
|
- palignr $2, %xmm4, %xmm2
|
|
- lea 32(%edi), %edi
|
|
- movdqa %xmm2, -32(%edx, %edi)
|
|
- movdqa %xmm3, -16(%edx, %edi)
|
|
-
|
|
- jae L(shl_2_loop)
|
|
-
|
|
-L(shl_2_end):
|
|
- lea 32(%ecx), %ecx
|
|
- add %ecx, %edi
|
|
- add %edi, %edx
|
|
- lea 2(%edi, %eax), %eax
|
|
- POP (%edi)
|
|
- BRANCH_TO_JMPTBL_ENTRY_TAIL(L(table_48bytes_fwd), %ecx, 4)
|
|
-
|
|
- ALIGN (4)
|
|
-L(shl_3):
|
|
- BRANCH_TO_JMPTBL_ENTRY_VALUE(L(table_48bytes_fwd))
|
|
- lea -3(%eax), %eax
|
|
- movaps (%eax), %xmm1
|
|
- xor %edi, %edi
|
|
- lea -32(%ecx), %ecx
|
|
- movdqu %xmm0, (%esi)
|
|
- POP (%esi)
|
|
-L(shl_3_loop):
|
|
-
|
|
- movdqa 16(%eax, %edi), %xmm2
|
|
- sub $32, %ecx
|
|
- movdqa 32(%eax, %edi), %xmm3
|
|
- movdqa %xmm3, %xmm4
|
|
- palignr $3, %xmm2, %xmm3
|
|
- palignr $3, %xmm1, %xmm2
|
|
- lea 32(%edi), %edi
|
|
- movdqa %xmm2, -32(%edx, %edi)
|
|
- movdqa %xmm3, -16(%edx, %edi)
|
|
-
|
|
- jl L(shl_3_end)
|
|
-
|
|
- movdqa 16(%eax, %edi), %xmm2
|
|
- sub $32, %ecx
|
|
- movdqa 32(%eax, %edi), %xmm3
|
|
- movdqa %xmm3, %xmm1
|
|
- palignr $3, %xmm2, %xmm3
|
|
- palignr $3, %xmm4, %xmm2
|
|
- lea 32(%edi), %edi
|
|
- movdqa %xmm2, -32(%edx, %edi)
|
|
- movdqa %xmm3, -16(%edx, %edi)
|
|
-
|
|
- jae L(shl_3_loop)
|
|
-
|
|
-L(shl_3_end):
|
|
- lea 32(%ecx), %ecx
|
|
- add %ecx, %edi
|
|
- add %edi, %edx
|
|
- lea 3(%edi, %eax), %eax
|
|
- POP (%edi)
|
|
- BRANCH_TO_JMPTBL_ENTRY_TAIL(L(table_48bytes_fwd), %ecx, 4)
|
|
-
|
|
- ALIGN (4)
|
|
-L(shl_4):
|
|
- BRANCH_TO_JMPTBL_ENTRY_VALUE(L(table_48bytes_fwd))
|
|
- lea -4(%eax), %eax
|
|
- movaps (%eax), %xmm1
|
|
- xor %edi, %edi
|
|
- lea -32(%ecx), %ecx
|
|
- movdqu %xmm0, (%esi)
|
|
- POP (%esi)
|
|
-L(shl_4_loop):
|
|
-
|
|
- movdqa 16(%eax, %edi), %xmm2
|
|
- sub $32, %ecx
|
|
- movdqa 32(%eax, %edi), %xmm3
|
|
- movdqa %xmm3, %xmm4
|
|
- palignr $4, %xmm2, %xmm3
|
|
- palignr $4, %xmm1, %xmm2
|
|
- lea 32(%edi), %edi
|
|
- movdqa %xmm2, -32(%edx, %edi)
|
|
- movdqa %xmm3, -16(%edx, %edi)
|
|
-
|
|
- jl L(shl_4_end)
|
|
-
|
|
- movdqa 16(%eax, %edi), %xmm2
|
|
- sub $32, %ecx
|
|
- movdqa 32(%eax, %edi), %xmm3
|
|
- movdqa %xmm3, %xmm1
|
|
- palignr $4, %xmm2, %xmm3
|
|
- palignr $4, %xmm4, %xmm2
|
|
- lea 32(%edi), %edi
|
|
- movdqa %xmm2, -32(%edx, %edi)
|
|
- movdqa %xmm3, -16(%edx, %edi)
|
|
-
|
|
- jae L(shl_4_loop)
|
|
-
|
|
-L(shl_4_end):
|
|
- lea 32(%ecx), %ecx
|
|
- add %ecx, %edi
|
|
- add %edi, %edx
|
|
- lea 4(%edi, %eax), %eax
|
|
- POP (%edi)
|
|
- BRANCH_TO_JMPTBL_ENTRY_TAIL(L(table_48bytes_fwd), %ecx, 4)
|
|
-
|
|
- ALIGN (4)
|
|
-L(shl_5):
|
|
- BRANCH_TO_JMPTBL_ENTRY_VALUE(L(table_48bytes_fwd))
|
|
- lea -5(%eax), %eax
|
|
- movaps (%eax), %xmm1
|
|
- xor %edi, %edi
|
|
- lea -32(%ecx), %ecx
|
|
- movdqu %xmm0, (%esi)
|
|
- POP (%esi)
|
|
-L(shl_5_loop):
|
|
-
|
|
- movdqa 16(%eax, %edi), %xmm2
|
|
- sub $32, %ecx
|
|
- movdqa 32(%eax, %edi), %xmm3
|
|
- movdqa %xmm3, %xmm4
|
|
- palignr $5, %xmm2, %xmm3
|
|
- palignr $5, %xmm1, %xmm2
|
|
- lea 32(%edi), %edi
|
|
- movdqa %xmm2, -32(%edx, %edi)
|
|
- movdqa %xmm3, -16(%edx, %edi)
|
|
-
|
|
- jl L(shl_5_end)
|
|
-
|
|
- movdqa 16(%eax, %edi), %xmm2
|
|
- sub $32, %ecx
|
|
- movdqa 32(%eax, %edi), %xmm3
|
|
- movdqa %xmm3, %xmm1
|
|
- palignr $5, %xmm2, %xmm3
|
|
- palignr $5, %xmm4, %xmm2
|
|
- lea 32(%edi), %edi
|
|
- movdqa %xmm2, -32(%edx, %edi)
|
|
- movdqa %xmm3, -16(%edx, %edi)
|
|
-
|
|
- jae L(shl_5_loop)
|
|
-
|
|
-L(shl_5_end):
|
|
- lea 32(%ecx), %ecx
|
|
- add %ecx, %edi
|
|
- add %edi, %edx
|
|
- lea 5(%edi, %eax), %eax
|
|
- POP (%edi)
|
|
- BRANCH_TO_JMPTBL_ENTRY_TAIL(L(table_48bytes_fwd), %ecx, 4)
|
|
-
|
|
-
|
|
- ALIGN (4)
|
|
-L(shl_6):
|
|
- BRANCH_TO_JMPTBL_ENTRY_VALUE(L(table_48bytes_fwd))
|
|
- lea -6(%eax), %eax
|
|
- movaps (%eax), %xmm1
|
|
- xor %edi, %edi
|
|
- lea -32(%ecx), %ecx
|
|
- movdqu %xmm0, (%esi)
|
|
- POP (%esi)
|
|
-L(shl_6_loop):
|
|
-
|
|
- movdqa 16(%eax, %edi), %xmm2
|
|
- sub $32, %ecx
|
|
- movdqa 32(%eax, %edi), %xmm3
|
|
- movdqa %xmm3, %xmm4
|
|
- palignr $6, %xmm2, %xmm3
|
|
- palignr $6, %xmm1, %xmm2
|
|
- lea 32(%edi), %edi
|
|
- movdqa %xmm2, -32(%edx, %edi)
|
|
- movdqa %xmm3, -16(%edx, %edi)
|
|
-
|
|
- jl L(shl_6_end)
|
|
-
|
|
- movdqa 16(%eax, %edi), %xmm2
|
|
- sub $32, %ecx
|
|
- movdqa 32(%eax, %edi), %xmm3
|
|
- movdqa %xmm3, %xmm1
|
|
- palignr $6, %xmm2, %xmm3
|
|
- palignr $6, %xmm4, %xmm2
|
|
- lea 32(%edi), %edi
|
|
- movdqa %xmm2, -32(%edx, %edi)
|
|
- movdqa %xmm3, -16(%edx, %edi)
|
|
-
|
|
- jae L(shl_6_loop)
|
|
-
|
|
-L(shl_6_end):
|
|
- lea 32(%ecx), %ecx
|
|
- add %ecx, %edi
|
|
- add %edi, %edx
|
|
- lea 6(%edi, %eax), %eax
|
|
- POP (%edi)
|
|
- BRANCH_TO_JMPTBL_ENTRY_TAIL(L(table_48bytes_fwd), %ecx, 4)
|
|
-
|
|
- ALIGN (4)
|
|
-L(shl_7):
|
|
- BRANCH_TO_JMPTBL_ENTRY_VALUE(L(table_48bytes_fwd))
|
|
- lea -7(%eax), %eax
|
|
- movaps (%eax), %xmm1
|
|
- xor %edi, %edi
|
|
- lea -32(%ecx), %ecx
|
|
- movdqu %xmm0, (%esi)
|
|
- POP (%esi)
|
|
-L(shl_7_loop):
|
|
-
|
|
- movdqa 16(%eax, %edi), %xmm2
|
|
- sub $32, %ecx
|
|
- movdqa 32(%eax, %edi), %xmm3
|
|
- movdqa %xmm3, %xmm4
|
|
- palignr $7, %xmm2, %xmm3
|
|
- palignr $7, %xmm1, %xmm2
|
|
- lea 32(%edi), %edi
|
|
- movdqa %xmm2, -32(%edx, %edi)
|
|
- movdqa %xmm3, -16(%edx, %edi)
|
|
-
|
|
- jl L(shl_7_end)
|
|
-
|
|
- movdqa 16(%eax, %edi), %xmm2
|
|
- sub $32, %ecx
|
|
- movdqa 32(%eax, %edi), %xmm3
|
|
- movdqa %xmm3, %xmm1
|
|
- palignr $7, %xmm2, %xmm3
|
|
- palignr $7, %xmm4, %xmm2
|
|
- lea 32(%edi), %edi
|
|
- movdqa %xmm2, -32(%edx, %edi)
|
|
- movdqa %xmm3, -16(%edx, %edi)
|
|
-
|
|
- jae L(shl_7_loop)
|
|
-
|
|
-L(shl_7_end):
|
|
- lea 32(%ecx), %ecx
|
|
- add %ecx, %edi
|
|
- add %edi, %edx
|
|
- lea 7(%edi, %eax), %eax
|
|
- POP (%edi)
|
|
- BRANCH_TO_JMPTBL_ENTRY_TAIL(L(table_48bytes_fwd), %ecx, 4)
|
|
-
|
|
- ALIGN (4)
|
|
-L(shl_8):
|
|
- BRANCH_TO_JMPTBL_ENTRY_VALUE(L(table_48bytes_fwd))
|
|
- lea -8(%eax), %eax
|
|
- movaps (%eax), %xmm1
|
|
- xor %edi, %edi
|
|
- lea -32(%ecx), %ecx
|
|
- movdqu %xmm0, (%esi)
|
|
- POP (%esi)
|
|
-L(shl_8_loop):
|
|
-
|
|
- movdqa 16(%eax, %edi), %xmm2
|
|
- sub $32, %ecx
|
|
- movdqa 32(%eax, %edi), %xmm3
|
|
- movdqa %xmm3, %xmm4
|
|
- palignr $8, %xmm2, %xmm3
|
|
- palignr $8, %xmm1, %xmm2
|
|
- lea 32(%edi), %edi
|
|
- movdqa %xmm2, -32(%edx, %edi)
|
|
- movdqa %xmm3, -16(%edx, %edi)
|
|
-
|
|
- jl L(shl_8_end)
|
|
-
|
|
- movdqa 16(%eax, %edi), %xmm2
|
|
- sub $32, %ecx
|
|
- movdqa 32(%eax, %edi), %xmm3
|
|
- movdqa %xmm3, %xmm1
|
|
- palignr $8, %xmm2, %xmm3
|
|
- palignr $8, %xmm4, %xmm2
|
|
- lea 32(%edi), %edi
|
|
- movdqa %xmm2, -32(%edx, %edi)
|
|
- movdqa %xmm3, -16(%edx, %edi)
|
|
-
|
|
- jae L(shl_8_loop)
|
|
-
|
|
-L(shl_8_end):
|
|
- lea 32(%ecx), %ecx
|
|
- add %ecx, %edi
|
|
- add %edi, %edx
|
|
- lea 8(%edi, %eax), %eax
|
|
- POP (%edi)
|
|
- BRANCH_TO_JMPTBL_ENTRY_TAIL(L(table_48bytes_fwd), %ecx, 4)
|
|
-
|
|
- ALIGN (4)
|
|
-L(shl_9):
|
|
- BRANCH_TO_JMPTBL_ENTRY_VALUE(L(table_48bytes_fwd))
|
|
- lea -9(%eax), %eax
|
|
- movaps (%eax), %xmm1
|
|
- xor %edi, %edi
|
|
- lea -32(%ecx), %ecx
|
|
- movdqu %xmm0, (%esi)
|
|
- POP (%esi)
|
|
-L(shl_9_loop):
|
|
-
|
|
- movdqa 16(%eax, %edi), %xmm2
|
|
- sub $32, %ecx
|
|
- movdqa 32(%eax, %edi), %xmm3
|
|
- movdqa %xmm3, %xmm4
|
|
- palignr $9, %xmm2, %xmm3
|
|
- palignr $9, %xmm1, %xmm2
|
|
- lea 32(%edi), %edi
|
|
- movdqa %xmm2, -32(%edx, %edi)
|
|
- movdqa %xmm3, -16(%edx, %edi)
|
|
-
|
|
- jl L(shl_9_end)
|
|
-
|
|
- movdqa 16(%eax, %edi), %xmm2
|
|
- sub $32, %ecx
|
|
- movdqa 32(%eax, %edi), %xmm3
|
|
- movdqa %xmm3, %xmm1
|
|
- palignr $9, %xmm2, %xmm3
|
|
- palignr $9, %xmm4, %xmm2
|
|
- lea 32(%edi), %edi
|
|
- movdqa %xmm2, -32(%edx, %edi)
|
|
- movdqa %xmm3, -16(%edx, %edi)
|
|
-
|
|
- jae L(shl_9_loop)
|
|
-
|
|
-L(shl_9_end):
|
|
- lea 32(%ecx), %ecx
|
|
- add %ecx, %edi
|
|
- add %edi, %edx
|
|
- lea 9(%edi, %eax), %eax
|
|
- POP (%edi)
|
|
- BRANCH_TO_JMPTBL_ENTRY_TAIL(L(table_48bytes_fwd), %ecx, 4)
|
|
-
|
|
- ALIGN (4)
|
|
-L(shl_10):
|
|
- BRANCH_TO_JMPTBL_ENTRY_VALUE(L(table_48bytes_fwd))
|
|
- lea -10(%eax), %eax
|
|
- movaps (%eax), %xmm1
|
|
- xor %edi, %edi
|
|
- lea -32(%ecx), %ecx
|
|
- movdqu %xmm0, (%esi)
|
|
- POP (%esi)
|
|
-L(shl_10_loop):
|
|
-
|
|
- movdqa 16(%eax, %edi), %xmm2
|
|
- sub $32, %ecx
|
|
- movdqa 32(%eax, %edi), %xmm3
|
|
- movdqa %xmm3, %xmm4
|
|
- palignr $10, %xmm2, %xmm3
|
|
- palignr $10, %xmm1, %xmm2
|
|
- lea 32(%edi), %edi
|
|
- movdqa %xmm2, -32(%edx, %edi)
|
|
- movdqa %xmm3, -16(%edx, %edi)
|
|
-
|
|
- jl L(shl_10_end)
|
|
-
|
|
- movdqa 16(%eax, %edi), %xmm2
|
|
- sub $32, %ecx
|
|
- movdqa 32(%eax, %edi), %xmm3
|
|
- movdqa %xmm3, %xmm1
|
|
- palignr $10, %xmm2, %xmm3
|
|
- palignr $10, %xmm4, %xmm2
|
|
- lea 32(%edi), %edi
|
|
- movdqa %xmm2, -32(%edx, %edi)
|
|
- movdqa %xmm3, -16(%edx, %edi)
|
|
-
|
|
- jae L(shl_10_loop)
|
|
-
|
|
-L(shl_10_end):
|
|
- lea 32(%ecx), %ecx
|
|
- add %ecx, %edi
|
|
- add %edi, %edx
|
|
- lea 10(%edi, %eax), %eax
|
|
- POP (%edi)
|
|
- BRANCH_TO_JMPTBL_ENTRY_TAIL(L(table_48bytes_fwd), %ecx, 4)
|
|
-
|
|
- ALIGN (4)
|
|
-L(shl_11):
|
|
- BRANCH_TO_JMPTBL_ENTRY_VALUE(L(table_48bytes_fwd))
|
|
- lea -11(%eax), %eax
|
|
- movaps (%eax), %xmm1
|
|
- xor %edi, %edi
|
|
- lea -32(%ecx), %ecx
|
|
- movdqu %xmm0, (%esi)
|
|
- POP (%esi)
|
|
-L(shl_11_loop):
|
|
-
|
|
- movdqa 16(%eax, %edi), %xmm2
|
|
- sub $32, %ecx
|
|
- movdqa 32(%eax, %edi), %xmm3
|
|
- movdqa %xmm3, %xmm4
|
|
- palignr $11, %xmm2, %xmm3
|
|
- palignr $11, %xmm1, %xmm2
|
|
- lea 32(%edi), %edi
|
|
- movdqa %xmm2, -32(%edx, %edi)
|
|
- movdqa %xmm3, -16(%edx, %edi)
|
|
-
|
|
- jl L(shl_11_end)
|
|
-
|
|
- movdqa 16(%eax, %edi), %xmm2
|
|
- sub $32, %ecx
|
|
- movdqa 32(%eax, %edi), %xmm3
|
|
- movdqa %xmm3, %xmm1
|
|
- palignr $11, %xmm2, %xmm3
|
|
- palignr $11, %xmm4, %xmm2
|
|
- lea 32(%edi), %edi
|
|
- movdqa %xmm2, -32(%edx, %edi)
|
|
- movdqa %xmm3, -16(%edx, %edi)
|
|
-
|
|
- jae L(shl_11_loop)
|
|
-
|
|
-L(shl_11_end):
|
|
- lea 32(%ecx), %ecx
|
|
- add %ecx, %edi
|
|
- add %edi, %edx
|
|
- lea 11(%edi, %eax), %eax
|
|
- POP (%edi)
|
|
- BRANCH_TO_JMPTBL_ENTRY_TAIL(L(table_48bytes_fwd), %ecx, 4)
|
|
-
|
|
- ALIGN (4)
|
|
-L(shl_12):
|
|
- BRANCH_TO_JMPTBL_ENTRY_VALUE(L(table_48bytes_fwd))
|
|
- lea -12(%eax), %eax
|
|
- movaps (%eax), %xmm1
|
|
- xor %edi, %edi
|
|
- lea -32(%ecx), %ecx
|
|
- movdqu %xmm0, (%esi)
|
|
- POP (%esi)
|
|
-L(shl_12_loop):
|
|
-
|
|
- movdqa 16(%eax, %edi), %xmm2
|
|
- sub $32, %ecx
|
|
- movdqa 32(%eax, %edi), %xmm3
|
|
- movdqa %xmm3, %xmm4
|
|
- palignr $12, %xmm2, %xmm3
|
|
- palignr $12, %xmm1, %xmm2
|
|
- lea 32(%edi), %edi
|
|
- movdqa %xmm2, -32(%edx, %edi)
|
|
- movdqa %xmm3, -16(%edx, %edi)
|
|
-
|
|
- jl L(shl_12_end)
|
|
-
|
|
- movdqa 16(%eax, %edi), %xmm2
|
|
- sub $32, %ecx
|
|
- movdqa 32(%eax, %edi), %xmm3
|
|
- movdqa %xmm3, %xmm1
|
|
- palignr $12, %xmm2, %xmm3
|
|
- palignr $12, %xmm4, %xmm2
|
|
- lea 32(%edi), %edi
|
|
- movdqa %xmm2, -32(%edx, %edi)
|
|
- movdqa %xmm3, -16(%edx, %edi)
|
|
-
|
|
- jae L(shl_12_loop)
|
|
-
|
|
-L(shl_12_end):
|
|
- lea 32(%ecx), %ecx
|
|
- add %ecx, %edi
|
|
- add %edi, %edx
|
|
- lea 12(%edi, %eax), %eax
|
|
- POP (%edi)
|
|
- BRANCH_TO_JMPTBL_ENTRY_TAIL(L(table_48bytes_fwd), %ecx, 4)
|
|
-
|
|
- ALIGN (4)
|
|
-L(shl_13):
|
|
- BRANCH_TO_JMPTBL_ENTRY_VALUE(L(table_48bytes_fwd))
|
|
- lea -13(%eax), %eax
|
|
- movaps (%eax), %xmm1
|
|
- xor %edi, %edi
|
|
- lea -32(%ecx), %ecx
|
|
- movdqu %xmm0, (%esi)
|
|
- POP (%esi)
|
|
-L(shl_13_loop):
|
|
-
|
|
- movdqa 16(%eax, %edi), %xmm2
|
|
- sub $32, %ecx
|
|
- movdqa 32(%eax, %edi), %xmm3
|
|
- movdqa %xmm3, %xmm4
|
|
- palignr $13, %xmm2, %xmm3
|
|
- palignr $13, %xmm1, %xmm2
|
|
- lea 32(%edi), %edi
|
|
- movdqa %xmm2, -32(%edx, %edi)
|
|
- movdqa %xmm3, -16(%edx, %edi)
|
|
-
|
|
- jl L(shl_13_end)
|
|
-
|
|
- movdqa 16(%eax, %edi), %xmm2
|
|
- sub $32, %ecx
|
|
- movdqa 32(%eax, %edi), %xmm3
|
|
- movdqa %xmm3, %xmm1
|
|
- palignr $13, %xmm2, %xmm3
|
|
- palignr $13, %xmm4, %xmm2
|
|
- lea 32(%edi), %edi
|
|
- movdqa %xmm2, -32(%edx, %edi)
|
|
- movdqa %xmm3, -16(%edx, %edi)
|
|
-
|
|
- jae L(shl_13_loop)
|
|
-
|
|
-L(shl_13_end):
|
|
- lea 32(%ecx), %ecx
|
|
- add %ecx, %edi
|
|
- add %edi, %edx
|
|
- lea 13(%edi, %eax), %eax
|
|
- POP (%edi)
|
|
- BRANCH_TO_JMPTBL_ENTRY_TAIL(L(table_48bytes_fwd), %ecx, 4)
|
|
-
|
|
- ALIGN (4)
|
|
-L(shl_14):
|
|
- BRANCH_TO_JMPTBL_ENTRY_VALUE(L(table_48bytes_fwd))
|
|
- lea -14(%eax), %eax
|
|
- movaps (%eax), %xmm1
|
|
- xor %edi, %edi
|
|
- lea -32(%ecx), %ecx
|
|
- movdqu %xmm0, (%esi)
|
|
- POP (%esi)
|
|
-L(shl_14_loop):
|
|
-
|
|
- movdqa 16(%eax, %edi), %xmm2
|
|
- sub $32, %ecx
|
|
- movdqa 32(%eax, %edi), %xmm3
|
|
- movdqa %xmm3, %xmm4
|
|
- palignr $14, %xmm2, %xmm3
|
|
- palignr $14, %xmm1, %xmm2
|
|
- lea 32(%edi), %edi
|
|
- movdqa %xmm2, -32(%edx, %edi)
|
|
- movdqa %xmm3, -16(%edx, %edi)
|
|
-
|
|
- jl L(shl_14_end)
|
|
-
|
|
- movdqa 16(%eax, %edi), %xmm2
|
|
- sub $32, %ecx
|
|
- movdqa 32(%eax, %edi), %xmm3
|
|
- movdqa %xmm3, %xmm1
|
|
- palignr $14, %xmm2, %xmm3
|
|
- palignr $14, %xmm4, %xmm2
|
|
- lea 32(%edi), %edi
|
|
- movdqa %xmm2, -32(%edx, %edi)
|
|
- movdqa %xmm3, -16(%edx, %edi)
|
|
-
|
|
- jae L(shl_14_loop)
|
|
-
|
|
-L(shl_14_end):
|
|
- lea 32(%ecx), %ecx
|
|
- add %ecx, %edi
|
|
- add %edi, %edx
|
|
- lea 14(%edi, %eax), %eax
|
|
- POP (%edi)
|
|
- BRANCH_TO_JMPTBL_ENTRY_TAIL(L(table_48bytes_fwd), %ecx, 4)
|
|
-
|
|
-
|
|
- ALIGN (4)
|
|
-L(shl_15):
|
|
- BRANCH_TO_JMPTBL_ENTRY_VALUE(L(table_48bytes_fwd))
|
|
- lea -15(%eax), %eax
|
|
- movaps (%eax), %xmm1
|
|
- xor %edi, %edi
|
|
- lea -32(%ecx), %ecx
|
|
- movdqu %xmm0, (%esi)
|
|
- POP (%esi)
|
|
-L(shl_15_loop):
|
|
-
|
|
- movdqa 16(%eax, %edi), %xmm2
|
|
- sub $32, %ecx
|
|
- movdqa 32(%eax, %edi), %xmm3
|
|
- movdqa %xmm3, %xmm4
|
|
- palignr $15, %xmm2, %xmm3
|
|
- palignr $15, %xmm1, %xmm2
|
|
- lea 32(%edi), %edi
|
|
- movdqa %xmm2, -32(%edx, %edi)
|
|
- movdqa %xmm3, -16(%edx, %edi)
|
|
-
|
|
- jl L(shl_15_end)
|
|
-
|
|
- movdqa 16(%eax, %edi), %xmm2
|
|
- sub $32, %ecx
|
|
- movdqa 32(%eax, %edi), %xmm3
|
|
- movdqa %xmm3, %xmm1
|
|
- palignr $15, %xmm2, %xmm3
|
|
- palignr $15, %xmm4, %xmm2
|
|
- lea 32(%edi), %edi
|
|
- movdqa %xmm2, -32(%edx, %edi)
|
|
- movdqa %xmm3, -16(%edx, %edi)
|
|
-
|
|
- jae L(shl_15_loop)
|
|
-
|
|
-L(shl_15_end):
|
|
- lea 32(%ecx), %ecx
|
|
- add %ecx, %edi
|
|
- add %edi, %edx
|
|
- lea 15(%edi, %eax), %eax
|
|
- POP (%edi)
|
|
- BRANCH_TO_JMPTBL_ENTRY_TAIL(L(table_48bytes_fwd), %ecx, 4)
|
|
-
|
|
-
|
|
- ALIGN (4)
|
|
-L(fwd_write_44bytes):
|
|
- movl -44(%eax), %ecx
|
|
- movl %ecx, -44(%edx)
|
|
-L(fwd_write_40bytes):
|
|
- movl -40(%eax), %ecx
|
|
- movl %ecx, -40(%edx)
|
|
-L(fwd_write_36bytes):
|
|
- movl -36(%eax), %ecx
|
|
- movl %ecx, -36(%edx)
|
|
-L(fwd_write_32bytes):
|
|
- movl -32(%eax), %ecx
|
|
- movl %ecx, -32(%edx)
|
|
-L(fwd_write_28bytes):
|
|
- movl -28(%eax), %ecx
|
|
- movl %ecx, -28(%edx)
|
|
-L(fwd_write_24bytes):
|
|
- movl -24(%eax), %ecx
|
|
- movl %ecx, -24(%edx)
|
|
-L(fwd_write_20bytes):
|
|
- movl -20(%eax), %ecx
|
|
- movl %ecx, -20(%edx)
|
|
-L(fwd_write_16bytes):
|
|
- movl -16(%eax), %ecx
|
|
- movl %ecx, -16(%edx)
|
|
-L(fwd_write_12bytes):
|
|
- movl -12(%eax), %ecx
|
|
- movl %ecx, -12(%edx)
|
|
-L(fwd_write_8bytes):
|
|
- movl -8(%eax), %ecx
|
|
- movl %ecx, -8(%edx)
|
|
-L(fwd_write_4bytes):
|
|
- movl -4(%eax), %ecx
|
|
- movl %ecx, -4(%edx)
|
|
-L(fwd_write_0bytes):
|
|
-#ifndef USE_AS_BCOPY
|
|
-# ifdef USE_AS_MEMPCPY
|
|
- movl %edx, %eax
|
|
-# else
|
|
- movl DEST(%esp), %eax
|
|
-# endif
|
|
-#endif
|
|
- RETURN
|
|
-
|
|
- ALIGN (4)
|
|
-L(fwd_write_5bytes):
|
|
- movl -5(%eax), %ecx
|
|
- movl -4(%eax), %eax
|
|
- movl %ecx, -5(%edx)
|
|
- movl %eax, -4(%edx)
|
|
-#ifndef USE_AS_BCOPY
|
|
-# ifdef USE_AS_MEMPCPY
|
|
- movl %edx, %eax
|
|
-# else
|
|
- movl DEST(%esp), %eax
|
|
-# endif
|
|
-#endif
|
|
- RETURN
|
|
-
|
|
- ALIGN (4)
|
|
-L(fwd_write_45bytes):
|
|
- movl -45(%eax), %ecx
|
|
- movl %ecx, -45(%edx)
|
|
-L(fwd_write_41bytes):
|
|
- movl -41(%eax), %ecx
|
|
- movl %ecx, -41(%edx)
|
|
-L(fwd_write_37bytes):
|
|
- movl -37(%eax), %ecx
|
|
- movl %ecx, -37(%edx)
|
|
-L(fwd_write_33bytes):
|
|
- movl -33(%eax), %ecx
|
|
- movl %ecx, -33(%edx)
|
|
-L(fwd_write_29bytes):
|
|
- movl -29(%eax), %ecx
|
|
- movl %ecx, -29(%edx)
|
|
-L(fwd_write_25bytes):
|
|
- movl -25(%eax), %ecx
|
|
- movl %ecx, -25(%edx)
|
|
-L(fwd_write_21bytes):
|
|
- movl -21(%eax), %ecx
|
|
- movl %ecx, -21(%edx)
|
|
-L(fwd_write_17bytes):
|
|
- movl -17(%eax), %ecx
|
|
- movl %ecx, -17(%edx)
|
|
-L(fwd_write_13bytes):
|
|
- movl -13(%eax), %ecx
|
|
- movl %ecx, -13(%edx)
|
|
-L(fwd_write_9bytes):
|
|
- movl -9(%eax), %ecx
|
|
- movl %ecx, -9(%edx)
|
|
- movl -5(%eax), %ecx
|
|
- movl %ecx, -5(%edx)
|
|
-L(fwd_write_1bytes):
|
|
- movzbl -1(%eax), %ecx
|
|
- movb %cl, -1(%edx)
|
|
-#ifndef USE_AS_BCOPY
|
|
-# ifdef USE_AS_MEMPCPY
|
|
- movl %edx, %eax
|
|
-# else
|
|
- movl DEST(%esp), %eax
|
|
-# endif
|
|
-#endif
|
|
- RETURN
|
|
-
|
|
- ALIGN (4)
|
|
-L(fwd_write_46bytes):
|
|
- movl -46(%eax), %ecx
|
|
- movl %ecx, -46(%edx)
|
|
-L(fwd_write_42bytes):
|
|
- movl -42(%eax), %ecx
|
|
- movl %ecx, -42(%edx)
|
|
-L(fwd_write_38bytes):
|
|
- movl -38(%eax), %ecx
|
|
- movl %ecx, -38(%edx)
|
|
-L(fwd_write_34bytes):
|
|
- movl -34(%eax), %ecx
|
|
- movl %ecx, -34(%edx)
|
|
-L(fwd_write_30bytes):
|
|
- movl -30(%eax), %ecx
|
|
- movl %ecx, -30(%edx)
|
|
-L(fwd_write_26bytes):
|
|
- movl -26(%eax), %ecx
|
|
- movl %ecx, -26(%edx)
|
|
-L(fwd_write_22bytes):
|
|
- movl -22(%eax), %ecx
|
|
- movl %ecx, -22(%edx)
|
|
-L(fwd_write_18bytes):
|
|
- movl -18(%eax), %ecx
|
|
- movl %ecx, -18(%edx)
|
|
-L(fwd_write_14bytes):
|
|
- movl -14(%eax), %ecx
|
|
- movl %ecx, -14(%edx)
|
|
-L(fwd_write_10bytes):
|
|
- movl -10(%eax), %ecx
|
|
- movl %ecx, -10(%edx)
|
|
-L(fwd_write_6bytes):
|
|
- movl -6(%eax), %ecx
|
|
- movl %ecx, -6(%edx)
|
|
-L(fwd_write_2bytes):
|
|
- movzwl -2(%eax), %ecx
|
|
- movw %cx, -2(%edx)
|
|
-#ifndef USE_AS_BCOPY
|
|
-# ifdef USE_AS_MEMPCPY
|
|
- movl %edx, %eax
|
|
-# else
|
|
- movl DEST(%esp), %eax
|
|
-# endif
|
|
-#endif
|
|
- RETURN
|
|
-
|
|
- ALIGN (4)
|
|
-L(fwd_write_47bytes):
|
|
- movl -47(%eax), %ecx
|
|
- movl %ecx, -47(%edx)
|
|
-L(fwd_write_43bytes):
|
|
- movl -43(%eax), %ecx
|
|
- movl %ecx, -43(%edx)
|
|
-L(fwd_write_39bytes):
|
|
- movl -39(%eax), %ecx
|
|
- movl %ecx, -39(%edx)
|
|
-L(fwd_write_35bytes):
|
|
- movl -35(%eax), %ecx
|
|
- movl %ecx, -35(%edx)
|
|
-L(fwd_write_31bytes):
|
|
- movl -31(%eax), %ecx
|
|
- movl %ecx, -31(%edx)
|
|
-L(fwd_write_27bytes):
|
|
- movl -27(%eax), %ecx
|
|
- movl %ecx, -27(%edx)
|
|
-L(fwd_write_23bytes):
|
|
- movl -23(%eax), %ecx
|
|
- movl %ecx, -23(%edx)
|
|
-L(fwd_write_19bytes):
|
|
- movl -19(%eax), %ecx
|
|
- movl %ecx, -19(%edx)
|
|
-L(fwd_write_15bytes):
|
|
- movl -15(%eax), %ecx
|
|
- movl %ecx, -15(%edx)
|
|
-L(fwd_write_11bytes):
|
|
- movl -11(%eax), %ecx
|
|
- movl %ecx, -11(%edx)
|
|
-L(fwd_write_7bytes):
|
|
- movl -7(%eax), %ecx
|
|
- movl %ecx, -7(%edx)
|
|
-L(fwd_write_3bytes):
|
|
- movzwl -3(%eax), %ecx
|
|
- movzbl -1(%eax), %eax
|
|
- movw %cx, -3(%edx)
|
|
- movb %al, -1(%edx)
|
|
-#ifndef USE_AS_BCOPY
|
|
-# ifdef USE_AS_MEMPCPY
|
|
- movl %edx, %eax
|
|
-# else
|
|
- movl DEST(%esp), %eax
|
|
-# endif
|
|
-#endif
|
|
- RETURN
|
|
-
|
|
- ALIGN (4)
|
|
-L(large_page):
|
|
- movdqu (%eax), %xmm1
|
|
- lea 16(%eax), %eax
|
|
- movdqu %xmm0, (%esi)
|
|
- movntdq %xmm1, (%edx)
|
|
- lea 16(%edx), %edx
|
|
- cmp %al, %dl
|
|
- je L(copy_page_by_rep)
|
|
-L(large_page_loop_init):
|
|
- POP (%esi)
|
|
- lea -0x90(%ecx), %ecx
|
|
- POP (%edi)
|
|
-L(large_page_loop):
|
|
- prefetchnta 0x1c0(%eax)
|
|
- prefetchnta 0x280(%eax)
|
|
- movdqu (%eax), %xmm0
|
|
- movdqu 0x10(%eax), %xmm1
|
|
- movdqu 0x20(%eax), %xmm2
|
|
- movdqu 0x30(%eax), %xmm3
|
|
- movdqu 0x40(%eax), %xmm4
|
|
- movdqu 0x50(%eax), %xmm5
|
|
- movdqu 0x60(%eax), %xmm6
|
|
- movdqu 0x70(%eax), %xmm7
|
|
- lea 0x80(%eax), %eax
|
|
- lfence
|
|
- sub $0x80, %ecx
|
|
- movntdq %xmm0, (%edx)
|
|
- movntdq %xmm1, 0x10(%edx)
|
|
- movntdq %xmm2, 0x20(%edx)
|
|
- movntdq %xmm3, 0x30(%edx)
|
|
- movntdq %xmm4, 0x40(%edx)
|
|
- movntdq %xmm5, 0x50(%edx)
|
|
- movntdq %xmm6, 0x60(%edx)
|
|
- movntdq %xmm7, 0x70(%edx)
|
|
- lea 0x80(%edx), %edx
|
|
- jae L(large_page_loop)
|
|
- cmp $-0x40, %ecx
|
|
- lea 0x80(%ecx), %ecx
|
|
- jl L(large_page_less_64bytes)
|
|
-
|
|
- movdqu (%eax), %xmm0
|
|
- movdqu 0x10(%eax), %xmm1
|
|
- movdqu 0x20(%eax), %xmm2
|
|
- movdqu 0x30(%eax), %xmm3
|
|
- lea 0x40(%eax), %eax
|
|
-
|
|
- movntdq %xmm0, (%edx)
|
|
- movntdq %xmm1, 0x10(%edx)
|
|
- movntdq %xmm2, 0x20(%edx)
|
|
- movntdq %xmm3, 0x30(%edx)
|
|
- lea 0x40(%edx), %edx
|
|
- sub $0x40, %ecx
|
|
-L(large_page_less_64bytes):
|
|
- cmp $32, %ecx
|
|
- jl L(large_page_less_32bytes)
|
|
- movdqu (%eax), %xmm0
|
|
- movdqu 0x10(%eax), %xmm1
|
|
- lea 0x20(%eax), %eax
|
|
- movntdq %xmm0, (%edx)
|
|
- movntdq %xmm1, 0x10(%edx)
|
|
- lea 0x20(%edx), %edx
|
|
- sub $0x20, %ecx
|
|
-L(large_page_less_32bytes):
|
|
- add %ecx, %edx
|
|
- add %ecx, %eax
|
|
- sfence
|
|
- BRANCH_TO_JMPTBL_ENTRY (L(table_48bytes_fwd), %ecx, 4)
|
|
-
|
|
- ALIGN (4)
|
|
-L(copy_page_by_rep):
|
|
- mov %eax, %esi
|
|
- mov %edx, %edi
|
|
- mov %ecx, %edx
|
|
- shr $2, %ecx
|
|
- and $3, %edx
|
|
- rep movsl
|
|
- jz L(copy_page_by_rep_exit)
|
|
- cmp $2, %edx
|
|
- jb L(copy_page_by_rep_left_1)
|
|
- movzwl (%esi), %eax
|
|
- movw %ax, (%edi)
|
|
- add $2, %esi
|
|
- add $2, %edi
|
|
- sub $2, %edx
|
|
- jz L(copy_page_by_rep_exit)
|
|
-L(copy_page_by_rep_left_1):
|
|
- movzbl (%esi), %eax
|
|
- movb %al, (%edi)
|
|
-L(copy_page_by_rep_exit):
|
|
- POP (%esi)
|
|
- POP (%edi)
|
|
-#ifndef USE_AS_BCOPY
|
|
- movl DEST(%esp), %eax
|
|
-# ifdef USE_AS_MEMPCPY
|
|
- movl LEN(%esp), %ecx
|
|
- add %ecx, %eax
|
|
-# endif
|
|
-#endif
|
|
- RETURN
|
|
-
|
|
- ALIGN (4)
|
|
-L(bk_write_44bytes):
|
|
- movl 40(%eax), %ecx
|
|
- movl %ecx, 40(%edx)
|
|
-L(bk_write_40bytes):
|
|
- movl 36(%eax), %ecx
|
|
- movl %ecx, 36(%edx)
|
|
-L(bk_write_36bytes):
|
|
- movl 32(%eax), %ecx
|
|
- movl %ecx, 32(%edx)
|
|
-L(bk_write_32bytes):
|
|
- movl 28(%eax), %ecx
|
|
- movl %ecx, 28(%edx)
|
|
-L(bk_write_28bytes):
|
|
- movl 24(%eax), %ecx
|
|
- movl %ecx, 24(%edx)
|
|
-L(bk_write_24bytes):
|
|
- movl 20(%eax), %ecx
|
|
- movl %ecx, 20(%edx)
|
|
-L(bk_write_20bytes):
|
|
- movl 16(%eax), %ecx
|
|
- movl %ecx, 16(%edx)
|
|
-L(bk_write_16bytes):
|
|
- movl 12(%eax), %ecx
|
|
- movl %ecx, 12(%edx)
|
|
-L(bk_write_12bytes):
|
|
- movl 8(%eax), %ecx
|
|
- movl %ecx, 8(%edx)
|
|
-L(bk_write_8bytes):
|
|
- movl 4(%eax), %ecx
|
|
- movl %ecx, 4(%edx)
|
|
-L(bk_write_4bytes):
|
|
- movl (%eax), %ecx
|
|
- movl %ecx, (%edx)
|
|
-L(bk_write_0bytes):
|
|
-#ifndef USE_AS_BCOPY
|
|
- movl DEST(%esp), %eax
|
|
-# ifdef USE_AS_MEMPCPY
|
|
- movl LEN(%esp), %ecx
|
|
- add %ecx, %eax
|
|
-# endif
|
|
-#endif
|
|
- RETURN
|
|
-
|
|
- ALIGN (4)
|
|
-L(bk_write_45bytes):
|
|
- movl 41(%eax), %ecx
|
|
- movl %ecx, 41(%edx)
|
|
-L(bk_write_41bytes):
|
|
- movl 37(%eax), %ecx
|
|
- movl %ecx, 37(%edx)
|
|
-L(bk_write_37bytes):
|
|
- movl 33(%eax), %ecx
|
|
- movl %ecx, 33(%edx)
|
|
-L(bk_write_33bytes):
|
|
- movl 29(%eax), %ecx
|
|
- movl %ecx, 29(%edx)
|
|
-L(bk_write_29bytes):
|
|
- movl 25(%eax), %ecx
|
|
- movl %ecx, 25(%edx)
|
|
-L(bk_write_25bytes):
|
|
- movl 21(%eax), %ecx
|
|
- movl %ecx, 21(%edx)
|
|
-L(bk_write_21bytes):
|
|
- movl 17(%eax), %ecx
|
|
- movl %ecx, 17(%edx)
|
|
-L(bk_write_17bytes):
|
|
- movl 13(%eax), %ecx
|
|
- movl %ecx, 13(%edx)
|
|
-L(bk_write_13bytes):
|
|
- movl 9(%eax), %ecx
|
|
- movl %ecx, 9(%edx)
|
|
-L(bk_write_9bytes):
|
|
- movl 5(%eax), %ecx
|
|
- movl %ecx, 5(%edx)
|
|
-L(bk_write_5bytes):
|
|
- movl 1(%eax), %ecx
|
|
- movl %ecx, 1(%edx)
|
|
-L(bk_write_1bytes):
|
|
- movzbl (%eax), %ecx
|
|
- movb %cl, (%edx)
|
|
-#ifndef USE_AS_BCOPY
|
|
- movl DEST(%esp), %eax
|
|
-# ifdef USE_AS_MEMPCPY
|
|
- movl LEN(%esp), %ecx
|
|
- add %ecx, %eax
|
|
-# endif
|
|
-#endif
|
|
- RETURN
|
|
-
|
|
- ALIGN (4)
|
|
-L(bk_write_46bytes):
|
|
- movl 42(%eax), %ecx
|
|
- movl %ecx, 42(%edx)
|
|
-L(bk_write_42bytes):
|
|
- movl 38(%eax), %ecx
|
|
- movl %ecx, 38(%edx)
|
|
-L(bk_write_38bytes):
|
|
- movl 34(%eax), %ecx
|
|
- movl %ecx, 34(%edx)
|
|
-L(bk_write_34bytes):
|
|
- movl 30(%eax), %ecx
|
|
- movl %ecx, 30(%edx)
|
|
-L(bk_write_30bytes):
|
|
- movl 26(%eax), %ecx
|
|
- movl %ecx, 26(%edx)
|
|
-L(bk_write_26bytes):
|
|
- movl 22(%eax), %ecx
|
|
- movl %ecx, 22(%edx)
|
|
-L(bk_write_22bytes):
|
|
- movl 18(%eax), %ecx
|
|
- movl %ecx, 18(%edx)
|
|
-L(bk_write_18bytes):
|
|
- movl 14(%eax), %ecx
|
|
- movl %ecx, 14(%edx)
|
|
-L(bk_write_14bytes):
|
|
- movl 10(%eax), %ecx
|
|
- movl %ecx, 10(%edx)
|
|
-L(bk_write_10bytes):
|
|
- movl 6(%eax), %ecx
|
|
- movl %ecx, 6(%edx)
|
|
-L(bk_write_6bytes):
|
|
- movl 2(%eax), %ecx
|
|
- movl %ecx, 2(%edx)
|
|
-L(bk_write_2bytes):
|
|
- movzwl (%eax), %ecx
|
|
- movw %cx, (%edx)
|
|
-#ifndef USE_AS_BCOPY
|
|
- movl DEST(%esp), %eax
|
|
-# ifdef USE_AS_MEMPCPY
|
|
- movl LEN(%esp), %ecx
|
|
- add %ecx, %eax
|
|
-# endif
|
|
-#endif
|
|
- RETURN
|
|
-
|
|
- ALIGN (4)
|
|
-L(bk_write_47bytes):
|
|
- movl 43(%eax), %ecx
|
|
- movl %ecx, 43(%edx)
|
|
-L(bk_write_43bytes):
|
|
- movl 39(%eax), %ecx
|
|
- movl %ecx, 39(%edx)
|
|
-L(bk_write_39bytes):
|
|
- movl 35(%eax), %ecx
|
|
- movl %ecx, 35(%edx)
|
|
-L(bk_write_35bytes):
|
|
- movl 31(%eax), %ecx
|
|
- movl %ecx, 31(%edx)
|
|
-L(bk_write_31bytes):
|
|
- movl 27(%eax), %ecx
|
|
- movl %ecx, 27(%edx)
|
|
-L(bk_write_27bytes):
|
|
- movl 23(%eax), %ecx
|
|
- movl %ecx, 23(%edx)
|
|
-L(bk_write_23bytes):
|
|
- movl 19(%eax), %ecx
|
|
- movl %ecx, 19(%edx)
|
|
-L(bk_write_19bytes):
|
|
- movl 15(%eax), %ecx
|
|
- movl %ecx, 15(%edx)
|
|
-L(bk_write_15bytes):
|
|
- movl 11(%eax), %ecx
|
|
- movl %ecx, 11(%edx)
|
|
-L(bk_write_11bytes):
|
|
- movl 7(%eax), %ecx
|
|
- movl %ecx, 7(%edx)
|
|
-L(bk_write_7bytes):
|
|
- movl 3(%eax), %ecx
|
|
- movl %ecx, 3(%edx)
|
|
-L(bk_write_3bytes):
|
|
- movzwl 1(%eax), %ecx
|
|
- movw %cx, 1(%edx)
|
|
- movzbl (%eax), %eax
|
|
- movb %al, (%edx)
|
|
-#ifndef USE_AS_BCOPY
|
|
- movl DEST(%esp), %eax
|
|
-# ifdef USE_AS_MEMPCPY
|
|
- movl LEN(%esp), %ecx
|
|
- add %ecx, %eax
|
|
-# endif
|
|
-#endif
|
|
- RETURN_END
|
|
-
|
|
-
|
|
- .pushsection .rodata.ssse3,"a",@progbits
|
|
- ALIGN (2)
|
|
-L(table_48bytes_fwd):
|
|
- .int JMPTBL (L(fwd_write_0bytes), L(table_48bytes_fwd))
|
|
- .int JMPTBL (L(fwd_write_1bytes), L(table_48bytes_fwd))
|
|
- .int JMPTBL (L(fwd_write_2bytes), L(table_48bytes_fwd))
|
|
- .int JMPTBL (L(fwd_write_3bytes), L(table_48bytes_fwd))
|
|
- .int JMPTBL (L(fwd_write_4bytes), L(table_48bytes_fwd))
|
|
- .int JMPTBL (L(fwd_write_5bytes), L(table_48bytes_fwd))
|
|
- .int JMPTBL (L(fwd_write_6bytes), L(table_48bytes_fwd))
|
|
- .int JMPTBL (L(fwd_write_7bytes), L(table_48bytes_fwd))
|
|
- .int JMPTBL (L(fwd_write_8bytes), L(table_48bytes_fwd))
|
|
- .int JMPTBL (L(fwd_write_9bytes), L(table_48bytes_fwd))
|
|
- .int JMPTBL (L(fwd_write_10bytes), L(table_48bytes_fwd))
|
|
- .int JMPTBL (L(fwd_write_11bytes), L(table_48bytes_fwd))
|
|
- .int JMPTBL (L(fwd_write_12bytes), L(table_48bytes_fwd))
|
|
- .int JMPTBL (L(fwd_write_13bytes), L(table_48bytes_fwd))
|
|
- .int JMPTBL (L(fwd_write_14bytes), L(table_48bytes_fwd))
|
|
- .int JMPTBL (L(fwd_write_15bytes), L(table_48bytes_fwd))
|
|
- .int JMPTBL (L(fwd_write_16bytes), L(table_48bytes_fwd))
|
|
- .int JMPTBL (L(fwd_write_17bytes), L(table_48bytes_fwd))
|
|
- .int JMPTBL (L(fwd_write_18bytes), L(table_48bytes_fwd))
|
|
- .int JMPTBL (L(fwd_write_19bytes), L(table_48bytes_fwd))
|
|
- .int JMPTBL (L(fwd_write_20bytes), L(table_48bytes_fwd))
|
|
- .int JMPTBL (L(fwd_write_21bytes), L(table_48bytes_fwd))
|
|
- .int JMPTBL (L(fwd_write_22bytes), L(table_48bytes_fwd))
|
|
- .int JMPTBL (L(fwd_write_23bytes), L(table_48bytes_fwd))
|
|
- .int JMPTBL (L(fwd_write_24bytes), L(table_48bytes_fwd))
|
|
- .int JMPTBL (L(fwd_write_25bytes), L(table_48bytes_fwd))
|
|
- .int JMPTBL (L(fwd_write_26bytes), L(table_48bytes_fwd))
|
|
- .int JMPTBL (L(fwd_write_27bytes), L(table_48bytes_fwd))
|
|
- .int JMPTBL (L(fwd_write_28bytes), L(table_48bytes_fwd))
|
|
- .int JMPTBL (L(fwd_write_29bytes), L(table_48bytes_fwd))
|
|
- .int JMPTBL (L(fwd_write_30bytes), L(table_48bytes_fwd))
|
|
- .int JMPTBL (L(fwd_write_31bytes), L(table_48bytes_fwd))
|
|
- .int JMPTBL (L(fwd_write_32bytes), L(table_48bytes_fwd))
|
|
- .int JMPTBL (L(fwd_write_33bytes), L(table_48bytes_fwd))
|
|
- .int JMPTBL (L(fwd_write_34bytes), L(table_48bytes_fwd))
|
|
- .int JMPTBL (L(fwd_write_35bytes), L(table_48bytes_fwd))
|
|
- .int JMPTBL (L(fwd_write_36bytes), L(table_48bytes_fwd))
|
|
- .int JMPTBL (L(fwd_write_37bytes), L(table_48bytes_fwd))
|
|
- .int JMPTBL (L(fwd_write_38bytes), L(table_48bytes_fwd))
|
|
- .int JMPTBL (L(fwd_write_39bytes), L(table_48bytes_fwd))
|
|
- .int JMPTBL (L(fwd_write_40bytes), L(table_48bytes_fwd))
|
|
- .int JMPTBL (L(fwd_write_41bytes), L(table_48bytes_fwd))
|
|
- .int JMPTBL (L(fwd_write_42bytes), L(table_48bytes_fwd))
|
|
- .int JMPTBL (L(fwd_write_43bytes), L(table_48bytes_fwd))
|
|
- .int JMPTBL (L(fwd_write_44bytes), L(table_48bytes_fwd))
|
|
- .int JMPTBL (L(fwd_write_45bytes), L(table_48bytes_fwd))
|
|
- .int JMPTBL (L(fwd_write_46bytes), L(table_48bytes_fwd))
|
|
- .int JMPTBL (L(fwd_write_47bytes), L(table_48bytes_fwd))
|
|
-
|
|
- ALIGN (2)
|
|
-L(shl_table):
|
|
- .int JMPTBL (L(shl_0), L(shl_table))
|
|
- .int JMPTBL (L(shl_1), L(shl_table))
|
|
- .int JMPTBL (L(shl_2), L(shl_table))
|
|
- .int JMPTBL (L(shl_3), L(shl_table))
|
|
- .int JMPTBL (L(shl_4), L(shl_table))
|
|
- .int JMPTBL (L(shl_5), L(shl_table))
|
|
- .int JMPTBL (L(shl_6), L(shl_table))
|
|
- .int JMPTBL (L(shl_7), L(shl_table))
|
|
- .int JMPTBL (L(shl_8), L(shl_table))
|
|
- .int JMPTBL (L(shl_9), L(shl_table))
|
|
- .int JMPTBL (L(shl_10), L(shl_table))
|
|
- .int JMPTBL (L(shl_11), L(shl_table))
|
|
- .int JMPTBL (L(shl_12), L(shl_table))
|
|
- .int JMPTBL (L(shl_13), L(shl_table))
|
|
- .int JMPTBL (L(shl_14), L(shl_table))
|
|
- .int JMPTBL (L(shl_15), L(shl_table))
|
|
-
|
|
- ALIGN (2)
|
|
-L(table_48_bytes_bwd):
|
|
- .int JMPTBL (L(bk_write_0bytes), L(table_48_bytes_bwd))
|
|
- .int JMPTBL (L(bk_write_1bytes), L(table_48_bytes_bwd))
|
|
- .int JMPTBL (L(bk_write_2bytes), L(table_48_bytes_bwd))
|
|
- .int JMPTBL (L(bk_write_3bytes), L(table_48_bytes_bwd))
|
|
- .int JMPTBL (L(bk_write_4bytes), L(table_48_bytes_bwd))
|
|
- .int JMPTBL (L(bk_write_5bytes), L(table_48_bytes_bwd))
|
|
- .int JMPTBL (L(bk_write_6bytes), L(table_48_bytes_bwd))
|
|
- .int JMPTBL (L(bk_write_7bytes), L(table_48_bytes_bwd))
|
|
- .int JMPTBL (L(bk_write_8bytes), L(table_48_bytes_bwd))
|
|
- .int JMPTBL (L(bk_write_9bytes), L(table_48_bytes_bwd))
|
|
- .int JMPTBL (L(bk_write_10bytes), L(table_48_bytes_bwd))
|
|
- .int JMPTBL (L(bk_write_11bytes), L(table_48_bytes_bwd))
|
|
- .int JMPTBL (L(bk_write_12bytes), L(table_48_bytes_bwd))
|
|
- .int JMPTBL (L(bk_write_13bytes), L(table_48_bytes_bwd))
|
|
- .int JMPTBL (L(bk_write_14bytes), L(table_48_bytes_bwd))
|
|
- .int JMPTBL (L(bk_write_15bytes), L(table_48_bytes_bwd))
|
|
- .int JMPTBL (L(bk_write_16bytes), L(table_48_bytes_bwd))
|
|
- .int JMPTBL (L(bk_write_17bytes), L(table_48_bytes_bwd))
|
|
- .int JMPTBL (L(bk_write_18bytes), L(table_48_bytes_bwd))
|
|
- .int JMPTBL (L(bk_write_19bytes), L(table_48_bytes_bwd))
|
|
- .int JMPTBL (L(bk_write_20bytes), L(table_48_bytes_bwd))
|
|
- .int JMPTBL (L(bk_write_21bytes), L(table_48_bytes_bwd))
|
|
- .int JMPTBL (L(bk_write_22bytes), L(table_48_bytes_bwd))
|
|
- .int JMPTBL (L(bk_write_23bytes), L(table_48_bytes_bwd))
|
|
- .int JMPTBL (L(bk_write_24bytes), L(table_48_bytes_bwd))
|
|
- .int JMPTBL (L(bk_write_25bytes), L(table_48_bytes_bwd))
|
|
- .int JMPTBL (L(bk_write_26bytes), L(table_48_bytes_bwd))
|
|
- .int JMPTBL (L(bk_write_27bytes), L(table_48_bytes_bwd))
|
|
- .int JMPTBL (L(bk_write_28bytes), L(table_48_bytes_bwd))
|
|
- .int JMPTBL (L(bk_write_29bytes), L(table_48_bytes_bwd))
|
|
- .int JMPTBL (L(bk_write_30bytes), L(table_48_bytes_bwd))
|
|
- .int JMPTBL (L(bk_write_31bytes), L(table_48_bytes_bwd))
|
|
- .int JMPTBL (L(bk_write_32bytes), L(table_48_bytes_bwd))
|
|
- .int JMPTBL (L(bk_write_33bytes), L(table_48_bytes_bwd))
|
|
- .int JMPTBL (L(bk_write_34bytes), L(table_48_bytes_bwd))
|
|
- .int JMPTBL (L(bk_write_35bytes), L(table_48_bytes_bwd))
|
|
- .int JMPTBL (L(bk_write_36bytes), L(table_48_bytes_bwd))
|
|
- .int JMPTBL (L(bk_write_37bytes), L(table_48_bytes_bwd))
|
|
- .int JMPTBL (L(bk_write_38bytes), L(table_48_bytes_bwd))
|
|
- .int JMPTBL (L(bk_write_39bytes), L(table_48_bytes_bwd))
|
|
- .int JMPTBL (L(bk_write_40bytes), L(table_48_bytes_bwd))
|
|
- .int JMPTBL (L(bk_write_41bytes), L(table_48_bytes_bwd))
|
|
- .int JMPTBL (L(bk_write_42bytes), L(table_48_bytes_bwd))
|
|
- .int JMPTBL (L(bk_write_43bytes), L(table_48_bytes_bwd))
|
|
- .int JMPTBL (L(bk_write_44bytes), L(table_48_bytes_bwd))
|
|
- .int JMPTBL (L(bk_write_45bytes), L(table_48_bytes_bwd))
|
|
- .int JMPTBL (L(bk_write_46bytes), L(table_48_bytes_bwd))
|
|
- .int JMPTBL (L(bk_write_47bytes), L(table_48_bytes_bwd))
|
|
-
|
|
- .popsection
|
|
-
|
|
-#ifdef USE_AS_MEMMOVE
|
|
- ALIGN (4)
|
|
-L(copy_backward):
|
|
- PUSH (%esi)
|
|
- movl %eax, %esi
|
|
- lea (%ecx,%edx,1),%edx
|
|
- lea (%ecx,%esi,1),%esi
|
|
- testl $0x3, %edx
|
|
- jnz L(bk_align)
|
|
-
|
|
-L(bk_aligned_4):
|
|
- cmp $64, %ecx
|
|
- jge L(bk_write_more64bytes)
|
|
-
|
|
-L(bk_write_64bytesless):
|
|
- cmp $32, %ecx
|
|
- jl L(bk_write_less32bytes)
|
|
-
|
|
-L(bk_write_more32bytes):
|
|
- /* Copy 32 bytes at a time. */
|
|
- sub $32, %ecx
|
|
- movl -4(%esi), %eax
|
|
- movl %eax, -4(%edx)
|
|
- movl -8(%esi), %eax
|
|
- movl %eax, -8(%edx)
|
|
- movl -12(%esi), %eax
|
|
- movl %eax, -12(%edx)
|
|
- movl -16(%esi), %eax
|
|
- movl %eax, -16(%edx)
|
|
- movl -20(%esi), %eax
|
|
- movl %eax, -20(%edx)
|
|
- movl -24(%esi), %eax
|
|
- movl %eax, -24(%edx)
|
|
- movl -28(%esi), %eax
|
|
- movl %eax, -28(%edx)
|
|
- movl -32(%esi), %eax
|
|
- movl %eax, -32(%edx)
|
|
- sub $32, %edx
|
|
- sub $32, %esi
|
|
-
|
|
-L(bk_write_less32bytes):
|
|
- movl %esi, %eax
|
|
- sub %ecx, %edx
|
|
- sub %ecx, %eax
|
|
- POP (%esi)
|
|
-L(bk_write_less32bytes_2):
|
|
- BRANCH_TO_JMPTBL_ENTRY (L(table_48_bytes_bwd), %ecx, 4)
|
|
-
|
|
- ALIGN (4)
|
|
-L(bk_align):
|
|
- cmp $8, %ecx
|
|
- jle L(bk_write_less32bytes)
|
|
- testl $1, %edx
|
|
- /* We get here only if (EDX & 3 ) != 0 so if (EDX & 1) ==0,
|
|
- then (EDX & 2) must be != 0. */
|
|
- jz L(bk_got2)
|
|
- sub $1, %esi
|
|
- sub $1, %ecx
|
|
- sub $1, %edx
|
|
- movzbl (%esi), %eax
|
|
- movb %al, (%edx)
|
|
-
|
|
- testl $2, %edx
|
|
- jz L(bk_aligned_4)
|
|
-
|
|
-L(bk_got2):
|
|
- sub $2, %esi
|
|
- sub $2, %ecx
|
|
- sub $2, %edx
|
|
- movzwl (%esi), %eax
|
|
- movw %ax, (%edx)
|
|
- jmp L(bk_aligned_4)
|
|
-
|
|
- ALIGN (4)
|
|
-L(bk_write_more64bytes):
|
|
- /* Check alignment of last byte. */
|
|
- testl $15, %edx
|
|
- jz L(bk_ssse3_cpy_pre)
|
|
-
|
|
-/* EDX is aligned 4 bytes, but not 16 bytes. */
|
|
-L(bk_ssse3_align):
|
|
- sub $4, %esi
|
|
- sub $4, %ecx
|
|
- sub $4, %edx
|
|
- movl (%esi), %eax
|
|
- movl %eax, (%edx)
|
|
-
|
|
- testl $15, %edx
|
|
- jz L(bk_ssse3_cpy_pre)
|
|
-
|
|
- sub $4, %esi
|
|
- sub $4, %ecx
|
|
- sub $4, %edx
|
|
- movl (%esi), %eax
|
|
- movl %eax, (%edx)
|
|
-
|
|
- testl $15, %edx
|
|
- jz L(bk_ssse3_cpy_pre)
|
|
-
|
|
- sub $4, %esi
|
|
- sub $4, %ecx
|
|
- sub $4, %edx
|
|
- movl (%esi), %eax
|
|
- movl %eax, (%edx)
|
|
-
|
|
-L(bk_ssse3_cpy_pre):
|
|
- cmp $64, %ecx
|
|
- jl L(bk_write_more32bytes)
|
|
-
|
|
-L(bk_ssse3_cpy):
|
|
- sub $64, %esi
|
|
- sub $64, %ecx
|
|
- sub $64, %edx
|
|
- movdqu 0x30(%esi), %xmm3
|
|
- movdqa %xmm3, 0x30(%edx)
|
|
- movdqu 0x20(%esi), %xmm2
|
|
- movdqa %xmm2, 0x20(%edx)
|
|
- movdqu 0x10(%esi), %xmm1
|
|
- movdqa %xmm1, 0x10(%edx)
|
|
- movdqu (%esi), %xmm0
|
|
- movdqa %xmm0, (%edx)
|
|
- cmp $64, %ecx
|
|
- jge L(bk_ssse3_cpy)
|
|
- jmp L(bk_write_64bytesless)
|
|
-
|
|
-#endif
|
|
-
|
|
-END (MEMCPY)
|
|
-
|
|
-#endif
|
|
--- glibc-2.11-175-gb34e12e/sysdeps/i386/i686/multiarch/memcpy-ssse3.S
|
|
+++ glibc-2.11.90-11//dev/null
|
|
@@ -1,1737 +0,0 @@
|
|
-/* memcpy with SSSE3
|
|
- Copyright (C) 2010 Free Software Foundation, Inc.
|
|
- Contributed by Intel Corporation.
|
|
- This file is part of the GNU C Library.
|
|
-
|
|
- The GNU C Library is free software; you can redistribute it and/or
|
|
- modify it under the terms of the GNU Lesser General Public
|
|
- License as published by the Free Software Foundation; either
|
|
- version 2.1 of the License, or (at your option) any later version.
|
|
-
|
|
- The GNU C Library is distributed in the hope that it will be useful,
|
|
- but WITHOUT ANY WARRANTY; without even the implied warranty of
|
|
- MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU
|
|
- Lesser General Public License for more details.
|
|
-
|
|
- You should have received a copy of the GNU Lesser General Public
|
|
- License along with the GNU C Library; if not, write to the Free
|
|
- Software Foundation, Inc., 59 Temple Place, Suite 330, Boston, MA
|
|
- 02111-1307 USA. */
|
|
-
|
|
-#include <sysdep.h>
|
|
-
|
|
-#if !defined NOT_IN_libc \
|
|
- && (defined SHARED \
|
|
- || defined USE_AS_MEMMOVE \
|
|
- || !defined USE_MULTIARCH)
|
|
-
|
|
-#include "asm-syntax.h"
|
|
-
|
|
-#ifndef MEMCPY
|
|
-# define MEMCPY __memcpy_ssse3
|
|
-# define MEMCPY_CHK __memcpy_chk_ssse3
|
|
-#endif
|
|
-
|
|
-#ifdef USE_AS_BCOPY
|
|
-# define SRC PARMS
|
|
-# define DEST SRC+4
|
|
-# define LEN DEST+4
|
|
-#else
|
|
-# define DEST PARMS
|
|
-# define SRC DEST+4
|
|
-# define LEN SRC+4
|
|
-#endif
|
|
-
|
|
-#define CFI_PUSH(REG) \
|
|
- cfi_adjust_cfa_offset (4); \
|
|
- cfi_rel_offset (REG, 0)
|
|
-
|
|
-#define CFI_POP(REG) \
|
|
- cfi_adjust_cfa_offset (-4); \
|
|
- cfi_restore (REG)
|
|
-
|
|
-#define PUSH(REG) pushl REG; CFI_PUSH (REG)
|
|
-#define POP(REG) popl REG; CFI_POP (REG)
|
|
-
|
|
-#ifdef SHARED
|
|
-# define PARMS 8 /* Preserve EBX. */
|
|
-# define ENTRANCE PUSH (%ebx);
|
|
-# define RETURN_END POP (%ebx); ret
|
|
-# define RETURN RETURN_END; CFI_PUSH (%ebx)
|
|
-# define JMPTBL(I, B) I - B
|
|
-
|
|
-/* Load an entry in a jump table into EBX and branch to it. TABLE is a
|
|
- jump table with relative offsets. INDEX is a register contains the
|
|
- index into the jump table. SCALE is the scale of INDEX. */
|
|
-# define BRANCH_TO_JMPTBL_ENTRY(TABLE, INDEX, SCALE) \
|
|
- /* We first load PC into EBX. */ \
|
|
- call __i686.get_pc_thunk.bx; \
|
|
- /* Get the address of the jump table. */ \
|
|
- addl $(TABLE - .), %ebx; \
|
|
- /* Get the entry and convert the relative offset to the \
|
|
- absolute address. */ \
|
|
- addl (%ebx,INDEX,SCALE), %ebx; \
|
|
- /* We loaded the jump table. Go. */ \
|
|
- jmp *%ebx
|
|
-
|
|
-# define BRANCH_TO_JMPTBL_ENTRY_VALUE(TABLE) \
|
|
- addl $(TABLE - .), %ebx
|
|
-
|
|
-# define BRANCH_TO_JMPTBL_ENTRY_TAIL(TABLE, INDEX, SCALE) \
|
|
- addl (%ebx,INDEX,SCALE), %ebx; \
|
|
- /* We loaded the jump table. Go. */ \
|
|
- jmp *%ebx
|
|
-
|
|
- .section .gnu.linkonce.t.__i686.get_pc_thunk.bx,"ax",@progbits
|
|
- .globl __i686.get_pc_thunk.bx
|
|
- .hidden __i686.get_pc_thunk.bx
|
|
- ALIGN (4)
|
|
- .type __i686.get_pc_thunk.bx,@function
|
|
-__i686.get_pc_thunk.bx:
|
|
- movl (%esp), %ebx
|
|
- ret
|
|
-#else
|
|
-# define PARMS 4
|
|
-# define ENTRANCE
|
|
-# define RETURN_END ret
|
|
-# define RETURN RETURN_END
|
|
-# define JMPTBL(I, B) I
|
|
-
|
|
-/* Branch to an entry in a jump table. TABLE is a jump table with
|
|
- absolute offsets. INDEX is a register contains the index into the
|
|
- jump table. SCALE is the scale of INDEX. */
|
|
-# define BRANCH_TO_JMPTBL_ENTRY(TABLE, INDEX, SCALE) \
|
|
- jmp *TABLE(,INDEX,SCALE)
|
|
-
|
|
-# define BRANCH_TO_JMPTBL_ENTRY_VALUE(TABLE)
|
|
-
|
|
-# define BRANCH_TO_JMPTBL_ENTRY_TAIL(TABLE, INDEX, SCALE) \
|
|
- jmp *TABLE(,INDEX,SCALE)
|
|
-#endif
|
|
-
|
|
- .section .text.ssse3,"ax",@progbits
|
|
-#if defined SHARED && !defined NOT_IN_libc && !defined USE_AS_BCOPY
|
|
-ENTRY (MEMCPY_CHK)
|
|
- movl 12(%esp), %eax
|
|
- cmpl %eax, 16(%esp)
|
|
- jb HIDDEN_JUMPTARGET (__chk_fail)
|
|
-END (MEMCPY_CHK)
|
|
-#endif
|
|
-ENTRY (MEMCPY)
|
|
- ENTRANCE
|
|
- movl LEN(%esp), %ecx
|
|
- movl SRC(%esp), %eax
|
|
- movl DEST(%esp), %edx
|
|
-
|
|
-#ifdef USE_AS_MEMMOVE
|
|
- cmp %eax, %edx
|
|
- jb L(copy_forward)
|
|
- je L(fwd_write_0bytes)
|
|
- cmp $32, %ecx
|
|
- jge L(memmove_bwd)
|
|
- jmp L(bk_write_less32bytes_2)
|
|
-L(memmove_bwd):
|
|
- add %ecx, %eax
|
|
- cmp %eax, %edx
|
|
- movl SRC(%esp), %eax
|
|
- jb L(copy_backward)
|
|
-
|
|
-L(copy_forward):
|
|
-#endif
|
|
- cmp $48, %ecx
|
|
- jge L(48bytesormore)
|
|
-
|
|
-L(fwd_write_less32bytes):
|
|
-#ifndef USE_AS_MEMMOVE
|
|
- cmp %dl, %al
|
|
- jl L(bk_write)
|
|
-#endif
|
|
- add %ecx, %edx
|
|
- add %ecx, %eax
|
|
- BRANCH_TO_JMPTBL_ENTRY (L(table_48bytes_fwd), %ecx, 4)
|
|
-#ifndef USE_AS_MEMMOVE
|
|
-L(bk_write):
|
|
- BRANCH_TO_JMPTBL_ENTRY (L(table_48_bytes_bwd), %ecx, 4)
|
|
-#endif
|
|
-
|
|
- ALIGN (4)
|
|
-/* ECX > 32 and EDX is 4 byte aligned. */
|
|
-L(48bytesormore):
|
|
- movdqu (%eax), %xmm0
|
|
- PUSH (%edi)
|
|
- movl %edx, %edi
|
|
- and $-16, %edx
|
|
- PUSH (%esi)
|
|
- add $16, %edx
|
|
- movl %edi, %esi
|
|
- sub %edx, %edi
|
|
- add %edi, %ecx
|
|
- sub %edi, %eax
|
|
-
|
|
-#ifdef SHARED_CACHE_SIZE_HALF
|
|
- cmp $SHARED_CACHE_SIZE_HALF, %ecx
|
|
-#else
|
|
-# ifdef SHARED
|
|
- call __i686.get_pc_thunk.bx
|
|
- add $_GLOBAL_OFFSET_TABLE_, %ebx
|
|
- cmp __x86_shared_cache_size_half@GOTOFF(%ebx), %ecx
|
|
-# else
|
|
- cmp __x86_shared_cache_size_half, %ecx
|
|
-# endif
|
|
-#endif
|
|
-
|
|
- mov %eax, %edi
|
|
- jge L(large_page)
|
|
- and $0xf, %edi
|
|
- jz L(shl_0)
|
|
-
|
|
- BRANCH_TO_JMPTBL_ENTRY (L(shl_table), %edi, 4)
|
|
-
|
|
- ALIGN (4)
|
|
-L(shl_0):
|
|
- movdqu %xmm0, (%esi)
|
|
- xor %edi, %edi
|
|
- POP (%esi)
|
|
- cmp $127, %ecx
|
|
- ja L(shl_0_gobble)
|
|
- lea -32(%ecx), %ecx
|
|
-L(shl_0_loop):
|
|
- movdqa (%eax, %edi), %xmm0
|
|
- movdqa 16(%eax, %edi), %xmm1
|
|
- sub $32, %ecx
|
|
- movdqa %xmm0, (%edx, %edi)
|
|
- movdqa %xmm1, 16(%edx, %edi)
|
|
- lea 32(%edi), %edi
|
|
- jl L(shl_0_end)
|
|
-
|
|
- movdqa (%eax, %edi), %xmm0
|
|
- movdqa 16(%eax, %edi), %xmm1
|
|
- sub $32, %ecx
|
|
- movdqa %xmm0, (%edx, %edi)
|
|
- movdqa %xmm1, 16(%edx, %edi)
|
|
- lea 32(%edi), %edi
|
|
- jl L(shl_0_end)
|
|
-
|
|
- movdqa (%eax, %edi), %xmm0
|
|
- movdqa 16(%eax, %edi), %xmm1
|
|
- sub $32, %ecx
|
|
- movdqa %xmm0, (%edx, %edi)
|
|
- movdqa %xmm1, 16(%edx, %edi)
|
|
- lea 32(%edi), %edi
|
|
- jl L(shl_0_end)
|
|
-
|
|
- movdqa (%eax, %edi), %xmm0
|
|
- movdqa 16(%eax, %edi), %xmm1
|
|
- sub $32, %ecx
|
|
- movdqa %xmm0, (%edx, %edi)
|
|
- movdqa %xmm1, 16(%edx, %edi)
|
|
- lea 32(%edi), %edi
|
|
-L(shl_0_end):
|
|
- lea 32(%ecx), %ecx
|
|
- add %ecx, %edi
|
|
- add %edi, %edx
|
|
- add %edi, %eax
|
|
- POP (%edi)
|
|
- BRANCH_TO_JMPTBL_ENTRY (L(table_48bytes_fwd), %ecx, 4)
|
|
-
|
|
-L(shl_0_gobble):
|
|
-
|
|
-#ifdef DATA_CACHE_SIZE_HALF
|
|
- cmp $DATA_CACHE_SIZE_HALF, %ecx
|
|
-#else
|
|
-# ifdef SHARED
|
|
- call __i686.get_pc_thunk.bx
|
|
- add $_GLOBAL_OFFSET_TABLE_, %ebx
|
|
- cmp __x86_data_cache_size_half@GOTOFF(%ebx), %ecx
|
|
-# else
|
|
- cmp __x86_data_cache_size_half, %ecx
|
|
-# endif
|
|
-#endif
|
|
-
|
|
- POP (%edi)
|
|
- lea -128(%ecx), %ecx
|
|
- jge L(shl_0_gobble_mem_loop)
|
|
-L(shl_0_gobble_cache_loop):
|
|
- movdqa (%eax), %xmm0
|
|
- movdqa 0x10(%eax), %xmm1
|
|
- movdqa 0x20(%eax), %xmm2
|
|
- movdqa 0x30(%eax), %xmm3
|
|
- movdqa 0x40(%eax), %xmm4
|
|
- movdqa 0x50(%eax), %xmm5
|
|
- movdqa 0x60(%eax), %xmm6
|
|
- movdqa 0x70(%eax), %xmm7
|
|
- lea 0x80(%eax), %eax
|
|
- sub $128, %ecx
|
|
- movdqa %xmm0, (%edx)
|
|
- movdqa %xmm1, 0x10(%edx)
|
|
- movdqa %xmm2, 0x20(%edx)
|
|
- movdqa %xmm3, 0x30(%edx)
|
|
- movdqa %xmm4, 0x40(%edx)
|
|
- movdqa %xmm5, 0x50(%edx)
|
|
- movdqa %xmm6, 0x60(%edx)
|
|
- movdqa %xmm7, 0x70(%edx)
|
|
- lea 0x80(%edx), %edx
|
|
-
|
|
- jge L(shl_0_gobble_cache_loop)
|
|
-L(shl_0_gobble_cache_loop_tail):
|
|
- cmp $-0x40, %ecx
|
|
- lea 0x80(%ecx), %ecx
|
|
- jl L(shl_0_cache_less_64bytes)
|
|
-
|
|
- movdqa (%eax), %xmm0
|
|
- sub $0x40, %ecx
|
|
- movdqa 0x10(%eax), %xmm1
|
|
-
|
|
- movdqa %xmm0, (%edx)
|
|
- movdqa %xmm1, 0x10(%edx)
|
|
-
|
|
- movdqa 0x20(%eax), %xmm0
|
|
- movdqa 0x30(%eax), %xmm1
|
|
- add $0x40, %eax
|
|
-
|
|
- movdqa %xmm0, 0x20(%edx)
|
|
- movdqa %xmm1, 0x30(%edx)
|
|
- add $0x40, %edx
|
|
-L(shl_0_cache_less_64bytes):
|
|
- cmp $0x20, %ecx
|
|
- jl L(shl_0_cache_less_32bytes)
|
|
- movdqa (%eax), %xmm0
|
|
- sub $0x20, %ecx
|
|
- movdqa 0x10(%eax), %xmm1
|
|
- add $0x20, %eax
|
|
- movdqa %xmm0, (%edx)
|
|
- movdqa %xmm1, 0x10(%edx)
|
|
- add $0x20, %edx
|
|
-L(shl_0_cache_less_32bytes):
|
|
- cmp $0x10, %ecx
|
|
- jl L(shl_0_cache_less_16bytes)
|
|
- sub $0x10, %ecx
|
|
- movdqa (%eax), %xmm0
|
|
- add $0x10, %eax
|
|
- movdqa %xmm0, (%edx)
|
|
- add $0x10, %edx
|
|
-L(shl_0_cache_less_16bytes):
|
|
- add %ecx, %edx
|
|
- add %ecx, %eax
|
|
- BRANCH_TO_JMPTBL_ENTRY (L(table_48bytes_fwd), %ecx, 4)
|
|
-
|
|
-
|
|
- ALIGN (4)
|
|
-L(shl_0_gobble_mem_loop):
|
|
- prefetcht0 0x1c0(%eax)
|
|
- prefetcht0 0x280(%eax)
|
|
- prefetcht0 0x1c0(%edx)
|
|
-
|
|
- movdqa (%eax), %xmm0
|
|
- movdqa 0x10(%eax), %xmm1
|
|
- movdqa 0x20(%eax), %xmm2
|
|
- movdqa 0x30(%eax), %xmm3
|
|
- movdqa 0x40(%eax), %xmm4
|
|
- movdqa 0x50(%eax), %xmm5
|
|
- movdqa 0x60(%eax), %xmm6
|
|
- movdqa 0x70(%eax), %xmm7
|
|
- lea 0x80(%eax), %eax
|
|
- sub $0x80, %ecx
|
|
- movdqa %xmm0, (%edx)
|
|
- movdqa %xmm1, 0x10(%edx)
|
|
- movdqa %xmm2, 0x20(%edx)
|
|
- movdqa %xmm3, 0x30(%edx)
|
|
- movdqa %xmm4, 0x40(%edx)
|
|
- movdqa %xmm5, 0x50(%edx)
|
|
- movdqa %xmm6, 0x60(%edx)
|
|
- movdqa %xmm7, 0x70(%edx)
|
|
- lea 0x80(%edx), %edx
|
|
-
|
|
- jge L(shl_0_gobble_mem_loop)
|
|
- cmp $-0x40, %ecx
|
|
- lea 0x80(%ecx), %ecx
|
|
- jl L(shl_0_mem_less_64bytes)
|
|
-
|
|
- movdqa (%eax), %xmm0
|
|
- sub $0x40, %ecx
|
|
- movdqa 0x10(%eax), %xmm1
|
|
-
|
|
- movdqa %xmm0, (%edx)
|
|
- movdqa %xmm1, 0x10(%edx)
|
|
-
|
|
- movdqa 0x20(%eax), %xmm0
|
|
- movdqa 0x30(%eax), %xmm1
|
|
- add $0x40, %eax
|
|
-
|
|
- movdqa %xmm0, 0x20(%edx)
|
|
- movdqa %xmm1, 0x30(%edx)
|
|
- add $0x40, %edx
|
|
-L(shl_0_mem_less_64bytes):
|
|
- cmp $0x20, %ecx
|
|
- jl L(shl_0_mem_less_32bytes)
|
|
- movdqa (%eax), %xmm0
|
|
- sub $0x20, %ecx
|
|
- movdqa 0x10(%eax), %xmm1
|
|
- add $0x20, %eax
|
|
- movdqa %xmm0, (%edx)
|
|
- movdqa %xmm1, 0x10(%edx)
|
|
- add $0x20, %edx
|
|
-L(shl_0_mem_less_32bytes):
|
|
- cmp $0x10, %ecx
|
|
- jl L(shl_0_mem_less_16bytes)
|
|
- sub $0x10, %ecx
|
|
- movdqa (%eax), %xmm0
|
|
- add $0x10, %eax
|
|
- movdqa %xmm0, (%edx)
|
|
- add $0x10, %edx
|
|
-L(shl_0_mem_less_16bytes):
|
|
- add %ecx, %edx
|
|
- add %ecx, %eax
|
|
- BRANCH_TO_JMPTBL_ENTRY (L(table_48bytes_fwd), %ecx, 4)
|
|
-
|
|
-
|
|
- ALIGN (4)
|
|
-L(shl_1):
|
|
- BRANCH_TO_JMPTBL_ENTRY_VALUE(L(table_48bytes_fwd))
|
|
- lea -1(%eax), %eax
|
|
- movaps (%eax), %xmm1
|
|
- xor %edi, %edi
|
|
- lea -32(%ecx), %ecx
|
|
- movdqu %xmm0, (%esi)
|
|
- POP (%esi)
|
|
-L(shl_1_loop):
|
|
-
|
|
- movdqa 16(%eax, %edi), %xmm2
|
|
- sub $32, %ecx
|
|
- movdqa 32(%eax, %edi), %xmm3
|
|
- movdqa %xmm3, %xmm4
|
|
- palignr $1, %xmm2, %xmm3
|
|
- palignr $1, %xmm1, %xmm2
|
|
- lea 32(%edi), %edi
|
|
- movdqa %xmm2, -32(%edx, %edi)
|
|
- movdqa %xmm3, -16(%edx, %edi)
|
|
-
|
|
- jl L(shl_1_end)
|
|
-
|
|
- movdqa 16(%eax, %edi), %xmm2
|
|
- sub $32, %ecx
|
|
- movdqa 32(%eax, %edi), %xmm3
|
|
- movdqa %xmm3, %xmm1
|
|
- palignr $1, %xmm2, %xmm3
|
|
- palignr $1, %xmm4, %xmm2
|
|
- lea 32(%edi), %edi
|
|
- movdqa %xmm2, -32(%edx, %edi)
|
|
- movdqa %xmm3, -16(%edx, %edi)
|
|
-
|
|
- jae L(shl_1_loop)
|
|
-
|
|
-L(shl_1_end):
|
|
- lea 32(%ecx), %ecx
|
|
- add %ecx, %edi
|
|
- add %edi, %edx
|
|
- lea 1(%edi, %eax), %eax
|
|
- POP (%edi)
|
|
- BRANCH_TO_JMPTBL_ENTRY_TAIL(L(table_48bytes_fwd), %ecx, 4)
|
|
-
|
|
- ALIGN (4)
|
|
-L(shl_2):
|
|
- BRANCH_TO_JMPTBL_ENTRY_VALUE(L(table_48bytes_fwd))
|
|
- lea -2(%eax), %eax
|
|
- movaps (%eax), %xmm1
|
|
- xor %edi, %edi
|
|
- lea -32(%ecx), %ecx
|
|
- movdqu %xmm0, (%esi)
|
|
- POP (%esi)
|
|
-L(shl_2_loop):
|
|
-
|
|
- movdqa 16(%eax, %edi), %xmm2
|
|
- sub $32, %ecx
|
|
- movdqa 32(%eax, %edi), %xmm3
|
|
- movdqa %xmm3, %xmm4
|
|
- palignr $2, %xmm2, %xmm3
|
|
- palignr $2, %xmm1, %xmm2
|
|
- lea 32(%edi), %edi
|
|
- movdqa %xmm2, -32(%edx, %edi)
|
|
- movdqa %xmm3, -16(%edx, %edi)
|
|
-
|
|
- jl L(shl_2_end)
|
|
-
|
|
- movdqa 16(%eax, %edi), %xmm2
|
|
- sub $32, %ecx
|
|
- movdqa 32(%eax, %edi), %xmm3
|
|
- movdqa %xmm3, %xmm1
|
|
- palignr $2, %xmm2, %xmm3
|
|
- palignr $2, %xmm4, %xmm2
|
|
- lea 32(%edi), %edi
|
|
- movdqa %xmm2, -32(%edx, %edi)
|
|
- movdqa %xmm3, -16(%edx, %edi)
|
|
-
|
|
- jae L(shl_2_loop)
|
|
-
|
|
-L(shl_2_end):
|
|
- lea 32(%ecx), %ecx
|
|
- add %ecx, %edi
|
|
- add %edi, %edx
|
|
- lea 2(%edi, %eax), %eax
|
|
- POP (%edi)
|
|
- BRANCH_TO_JMPTBL_ENTRY_TAIL(L(table_48bytes_fwd), %ecx, 4)
|
|
-
|
|
- ALIGN (4)
|
|
-L(shl_3):
|
|
- BRANCH_TO_JMPTBL_ENTRY_VALUE(L(table_48bytes_fwd))
|
|
- lea -3(%eax), %eax
|
|
- movaps (%eax), %xmm1
|
|
- xor %edi, %edi
|
|
- lea -32(%ecx), %ecx
|
|
- movdqu %xmm0, (%esi)
|
|
- POP (%esi)
|
|
-L(shl_3_loop):
|
|
-
|
|
- movdqa 16(%eax, %edi), %xmm2
|
|
- sub $32, %ecx
|
|
- movdqa 32(%eax, %edi), %xmm3
|
|
- movdqa %xmm3, %xmm4
|
|
- palignr $3, %xmm2, %xmm3
|
|
- palignr $3, %xmm1, %xmm2
|
|
- lea 32(%edi), %edi
|
|
- movdqa %xmm2, -32(%edx, %edi)
|
|
- movdqa %xmm3, -16(%edx, %edi)
|
|
-
|
|
- jl L(shl_3_end)
|
|
-
|
|
- movdqa 16(%eax, %edi), %xmm2
|
|
- sub $32, %ecx
|
|
- movdqa 32(%eax, %edi), %xmm3
|
|
- movdqa %xmm3, %xmm1
|
|
- palignr $3, %xmm2, %xmm3
|
|
- palignr $3, %xmm4, %xmm2
|
|
- lea 32(%edi), %edi
|
|
- movdqa %xmm2, -32(%edx, %edi)
|
|
- movdqa %xmm3, -16(%edx, %edi)
|
|
-
|
|
- jae L(shl_3_loop)
|
|
-
|
|
-L(shl_3_end):
|
|
- lea 32(%ecx), %ecx
|
|
- add %ecx, %edi
|
|
- add %edi, %edx
|
|
- lea 3(%edi, %eax), %eax
|
|
- POP (%edi)
|
|
- BRANCH_TO_JMPTBL_ENTRY_TAIL(L(table_48bytes_fwd), %ecx, 4)
|
|
-
|
|
- ALIGN (4)
|
|
-L(shl_4):
|
|
- BRANCH_TO_JMPTBL_ENTRY_VALUE(L(table_48bytes_fwd))
|
|
- lea -4(%eax), %eax
|
|
- movaps (%eax), %xmm1
|
|
- xor %edi, %edi
|
|
- lea -32(%ecx), %ecx
|
|
- movdqu %xmm0, (%esi)
|
|
- POP (%esi)
|
|
-L(shl_4_loop):
|
|
-
|
|
- movdqa 16(%eax, %edi), %xmm2
|
|
- sub $32, %ecx
|
|
- movdqa 32(%eax, %edi), %xmm3
|
|
- movdqa %xmm3, %xmm4
|
|
- palignr $4, %xmm2, %xmm3
|
|
- palignr $4, %xmm1, %xmm2
|
|
- lea 32(%edi), %edi
|
|
- movdqa %xmm2, -32(%edx, %edi)
|
|
- movdqa %xmm3, -16(%edx, %edi)
|
|
-
|
|
- jl L(shl_4_end)
|
|
-
|
|
- movdqa 16(%eax, %edi), %xmm2
|
|
- sub $32, %ecx
|
|
- movdqa 32(%eax, %edi), %xmm3
|
|
- movdqa %xmm3, %xmm1
|
|
- palignr $4, %xmm2, %xmm3
|
|
- palignr $4, %xmm4, %xmm2
|
|
- lea 32(%edi), %edi
|
|
- movdqa %xmm2, -32(%edx, %edi)
|
|
- movdqa %xmm3, -16(%edx, %edi)
|
|
-
|
|
- jae L(shl_4_loop)
|
|
-
|
|
-L(shl_4_end):
|
|
- lea 32(%ecx), %ecx
|
|
- add %ecx, %edi
|
|
- add %edi, %edx
|
|
- lea 4(%edi, %eax), %eax
|
|
- POP (%edi)
|
|
- BRANCH_TO_JMPTBL_ENTRY_TAIL(L(table_48bytes_fwd), %ecx, 4)
|
|
-
|
|
- ALIGN (4)
|
|
-L(shl_5):
|
|
- BRANCH_TO_JMPTBL_ENTRY_VALUE(L(table_48bytes_fwd))
|
|
- lea -5(%eax), %eax
|
|
- movaps (%eax), %xmm1
|
|
- xor %edi, %edi
|
|
- lea -32(%ecx), %ecx
|
|
- movdqu %xmm0, (%esi)
|
|
- POP (%esi)
|
|
-L(shl_5_loop):
|
|
-
|
|
- movdqa 16(%eax, %edi), %xmm2
|
|
- sub $32, %ecx
|
|
- movdqa 32(%eax, %edi), %xmm3
|
|
- movdqa %xmm3, %xmm4
|
|
- palignr $5, %xmm2, %xmm3
|
|
- palignr $5, %xmm1, %xmm2
|
|
- lea 32(%edi), %edi
|
|
- movdqa %xmm2, -32(%edx, %edi)
|
|
- movdqa %xmm3, -16(%edx, %edi)
|
|
-
|
|
- jl L(shl_5_end)
|
|
-
|
|
- movdqa 16(%eax, %edi), %xmm2
|
|
- sub $32, %ecx
|
|
- movdqa 32(%eax, %edi), %xmm3
|
|
- movdqa %xmm3, %xmm1
|
|
- palignr $5, %xmm2, %xmm3
|
|
- palignr $5, %xmm4, %xmm2
|
|
- lea 32(%edi), %edi
|
|
- movdqa %xmm2, -32(%edx, %edi)
|
|
- movdqa %xmm3, -16(%edx, %edi)
|
|
-
|
|
- jae L(shl_5_loop)
|
|
-
|
|
-L(shl_5_end):
|
|
- lea 32(%ecx), %ecx
|
|
- add %ecx, %edi
|
|
- add %edi, %edx
|
|
- lea 5(%edi, %eax), %eax
|
|
- POP (%edi)
|
|
- BRANCH_TO_JMPTBL_ENTRY_TAIL(L(table_48bytes_fwd), %ecx, 4)
|
|
-
|
|
-
|
|
- ALIGN (4)
|
|
-L(shl_6):
|
|
- BRANCH_TO_JMPTBL_ENTRY_VALUE(L(table_48bytes_fwd))
|
|
- lea -6(%eax), %eax
|
|
- movaps (%eax), %xmm1
|
|
- xor %edi, %edi
|
|
- lea -32(%ecx), %ecx
|
|
- movdqu %xmm0, (%esi)
|
|
- POP (%esi)
|
|
-L(shl_6_loop):
|
|
-
|
|
- movdqa 16(%eax, %edi), %xmm2
|
|
- sub $32, %ecx
|
|
- movdqa 32(%eax, %edi), %xmm3
|
|
- movdqa %xmm3, %xmm4
|
|
- palignr $6, %xmm2, %xmm3
|
|
- palignr $6, %xmm1, %xmm2
|
|
- lea 32(%edi), %edi
|
|
- movdqa %xmm2, -32(%edx, %edi)
|
|
- movdqa %xmm3, -16(%edx, %edi)
|
|
-
|
|
- jl L(shl_6_end)
|
|
-
|
|
- movdqa 16(%eax, %edi), %xmm2
|
|
- sub $32, %ecx
|
|
- movdqa 32(%eax, %edi), %xmm3
|
|
- movdqa %xmm3, %xmm1
|
|
- palignr $6, %xmm2, %xmm3
|
|
- palignr $6, %xmm4, %xmm2
|
|
- lea 32(%edi), %edi
|
|
- movdqa %xmm2, -32(%edx, %edi)
|
|
- movdqa %xmm3, -16(%edx, %edi)
|
|
-
|
|
- jae L(shl_6_loop)
|
|
-
|
|
-L(shl_6_end):
|
|
- lea 32(%ecx), %ecx
|
|
- add %ecx, %edi
|
|
- add %edi, %edx
|
|
- lea 6(%edi, %eax), %eax
|
|
- POP (%edi)
|
|
- BRANCH_TO_JMPTBL_ENTRY_TAIL(L(table_48bytes_fwd), %ecx, 4)
|
|
-
|
|
- ALIGN (4)
|
|
-L(shl_7):
|
|
- BRANCH_TO_JMPTBL_ENTRY_VALUE(L(table_48bytes_fwd))
|
|
- lea -7(%eax), %eax
|
|
- movaps (%eax), %xmm1
|
|
- xor %edi, %edi
|
|
- lea -32(%ecx), %ecx
|
|
- movdqu %xmm0, (%esi)
|
|
- POP (%esi)
|
|
-L(shl_7_loop):
|
|
-
|
|
- movdqa 16(%eax, %edi), %xmm2
|
|
- sub $32, %ecx
|
|
- movdqa 32(%eax, %edi), %xmm3
|
|
- movdqa %xmm3, %xmm4
|
|
- palignr $7, %xmm2, %xmm3
|
|
- palignr $7, %xmm1, %xmm2
|
|
- lea 32(%edi), %edi
|
|
- movdqa %xmm2, -32(%edx, %edi)
|
|
- movdqa %xmm3, -16(%edx, %edi)
|
|
-
|
|
- jl L(shl_7_end)
|
|
-
|
|
- movdqa 16(%eax, %edi), %xmm2
|
|
- sub $32, %ecx
|
|
- movdqa 32(%eax, %edi), %xmm3
|
|
- movdqa %xmm3, %xmm1
|
|
- palignr $7, %xmm2, %xmm3
|
|
- palignr $7, %xmm4, %xmm2
|
|
- lea 32(%edi), %edi
|
|
- movdqa %xmm2, -32(%edx, %edi)
|
|
- movdqa %xmm3, -16(%edx, %edi)
|
|
-
|
|
- jae L(shl_7_loop)
|
|
-
|
|
-L(shl_7_end):
|
|
- lea 32(%ecx), %ecx
|
|
- add %ecx, %edi
|
|
- add %edi, %edx
|
|
- lea 7(%edi, %eax), %eax
|
|
- POP (%edi)
|
|
- BRANCH_TO_JMPTBL_ENTRY_TAIL(L(table_48bytes_fwd), %ecx, 4)
|
|
-
|
|
- ALIGN (4)
|
|
-L(shl_8):
|
|
- BRANCH_TO_JMPTBL_ENTRY_VALUE(L(table_48bytes_fwd))
|
|
- lea -8(%eax), %eax
|
|
- movaps (%eax), %xmm1
|
|
- xor %edi, %edi
|
|
- lea -32(%ecx), %ecx
|
|
- movdqu %xmm0, (%esi)
|
|
- POP (%esi)
|
|
-L(shl_8_loop):
|
|
-
|
|
- movdqa 16(%eax, %edi), %xmm2
|
|
- sub $32, %ecx
|
|
- movdqa 32(%eax, %edi), %xmm3
|
|
- movdqa %xmm3, %xmm4
|
|
- palignr $8, %xmm2, %xmm3
|
|
- palignr $8, %xmm1, %xmm2
|
|
- lea 32(%edi), %edi
|
|
- movdqa %xmm2, -32(%edx, %edi)
|
|
- movdqa %xmm3, -16(%edx, %edi)
|
|
-
|
|
- jl L(shl_8_end)
|
|
-
|
|
- movdqa 16(%eax, %edi), %xmm2
|
|
- sub $32, %ecx
|
|
- movdqa 32(%eax, %edi), %xmm3
|
|
- movdqa %xmm3, %xmm1
|
|
- palignr $8, %xmm2, %xmm3
|
|
- palignr $8, %xmm4, %xmm2
|
|
- lea 32(%edi), %edi
|
|
- movdqa %xmm2, -32(%edx, %edi)
|
|
- movdqa %xmm3, -16(%edx, %edi)
|
|
-
|
|
- jae L(shl_8_loop)
|
|
-
|
|
-L(shl_8_end):
|
|
- lea 32(%ecx), %ecx
|
|
- add %ecx, %edi
|
|
- add %edi, %edx
|
|
- lea 8(%edi, %eax), %eax
|
|
- POP (%edi)
|
|
- BRANCH_TO_JMPTBL_ENTRY_TAIL(L(table_48bytes_fwd), %ecx, 4)
|
|
-
|
|
- ALIGN (4)
|
|
-L(shl_9):
|
|
- BRANCH_TO_JMPTBL_ENTRY_VALUE(L(table_48bytes_fwd))
|
|
- lea -9(%eax), %eax
|
|
- movaps (%eax), %xmm1
|
|
- xor %edi, %edi
|
|
- lea -32(%ecx), %ecx
|
|
- movdqu %xmm0, (%esi)
|
|
- POP (%esi)
|
|
-L(shl_9_loop):
|
|
-
|
|
- movdqa 16(%eax, %edi), %xmm2
|
|
- sub $32, %ecx
|
|
- movdqa 32(%eax, %edi), %xmm3
|
|
- movdqa %xmm3, %xmm4
|
|
- palignr $9, %xmm2, %xmm3
|
|
- palignr $9, %xmm1, %xmm2
|
|
- lea 32(%edi), %edi
|
|
- movdqa %xmm2, -32(%edx, %edi)
|
|
- movdqa %xmm3, -16(%edx, %edi)
|
|
-
|
|
- jl L(shl_9_end)
|
|
-
|
|
- movdqa 16(%eax, %edi), %xmm2
|
|
- sub $32, %ecx
|
|
- movdqa 32(%eax, %edi), %xmm3
|
|
- movdqa %xmm3, %xmm1
|
|
- palignr $9, %xmm2, %xmm3
|
|
- palignr $9, %xmm4, %xmm2
|
|
- lea 32(%edi), %edi
|
|
- movdqa %xmm2, -32(%edx, %edi)
|
|
- movdqa %xmm3, -16(%edx, %edi)
|
|
-
|
|
- jae L(shl_9_loop)
|
|
-
|
|
-L(shl_9_end):
|
|
- lea 32(%ecx), %ecx
|
|
- add %ecx, %edi
|
|
- add %edi, %edx
|
|
- lea 9(%edi, %eax), %eax
|
|
- POP (%edi)
|
|
- BRANCH_TO_JMPTBL_ENTRY_TAIL(L(table_48bytes_fwd), %ecx, 4)
|
|
-
|
|
- ALIGN (4)
|
|
-L(shl_10):
|
|
- BRANCH_TO_JMPTBL_ENTRY_VALUE(L(table_48bytes_fwd))
|
|
- lea -10(%eax), %eax
|
|
- movaps (%eax), %xmm1
|
|
- xor %edi, %edi
|
|
- lea -32(%ecx), %ecx
|
|
- movdqu %xmm0, (%esi)
|
|
- POP (%esi)
|
|
-L(shl_10_loop):
|
|
-
|
|
- movdqa 16(%eax, %edi), %xmm2
|
|
- sub $32, %ecx
|
|
- movdqa 32(%eax, %edi), %xmm3
|
|
- movdqa %xmm3, %xmm4
|
|
- palignr $10, %xmm2, %xmm3
|
|
- palignr $10, %xmm1, %xmm2
|
|
- lea 32(%edi), %edi
|
|
- movdqa %xmm2, -32(%edx, %edi)
|
|
- movdqa %xmm3, -16(%edx, %edi)
|
|
-
|
|
- jl L(shl_10_end)
|
|
-
|
|
- movdqa 16(%eax, %edi), %xmm2
|
|
- sub $32, %ecx
|
|
- movdqa 32(%eax, %edi), %xmm3
|
|
- movdqa %xmm3, %xmm1
|
|
- palignr $10, %xmm2, %xmm3
|
|
- palignr $10, %xmm4, %xmm2
|
|
- lea 32(%edi), %edi
|
|
- movdqa %xmm2, -32(%edx, %edi)
|
|
- movdqa %xmm3, -16(%edx, %edi)
|
|
-
|
|
- jae L(shl_10_loop)
|
|
-
|
|
-L(shl_10_end):
|
|
- lea 32(%ecx), %ecx
|
|
- add %ecx, %edi
|
|
- add %edi, %edx
|
|
- lea 10(%edi, %eax), %eax
|
|
- POP (%edi)
|
|
- BRANCH_TO_JMPTBL_ENTRY_TAIL(L(table_48bytes_fwd), %ecx, 4)
|
|
-
|
|
- ALIGN (4)
|
|
-L(shl_11):
|
|
- BRANCH_TO_JMPTBL_ENTRY_VALUE(L(table_48bytes_fwd))
|
|
- lea -11(%eax), %eax
|
|
- movaps (%eax), %xmm1
|
|
- xor %edi, %edi
|
|
- lea -32(%ecx), %ecx
|
|
- movdqu %xmm0, (%esi)
|
|
- POP (%esi)
|
|
-L(shl_11_loop):
|
|
-
|
|
- movdqa 16(%eax, %edi), %xmm2
|
|
- sub $32, %ecx
|
|
- movdqa 32(%eax, %edi), %xmm3
|
|
- movdqa %xmm3, %xmm4
|
|
- palignr $11, %xmm2, %xmm3
|
|
- palignr $11, %xmm1, %xmm2
|
|
- lea 32(%edi), %edi
|
|
- movdqa %xmm2, -32(%edx, %edi)
|
|
- movdqa %xmm3, -16(%edx, %edi)
|
|
-
|
|
- jl L(shl_11_end)
|
|
-
|
|
- movdqa 16(%eax, %edi), %xmm2
|
|
- sub $32, %ecx
|
|
- movdqa 32(%eax, %edi), %xmm3
|
|
- movdqa %xmm3, %xmm1
|
|
- palignr $11, %xmm2, %xmm3
|
|
- palignr $11, %xmm4, %xmm2
|
|
- lea 32(%edi), %edi
|
|
- movdqa %xmm2, -32(%edx, %edi)
|
|
- movdqa %xmm3, -16(%edx, %edi)
|
|
-
|
|
- jae L(shl_11_loop)
|
|
-
|
|
-L(shl_11_end):
|
|
- lea 32(%ecx), %ecx
|
|
- add %ecx, %edi
|
|
- add %edi, %edx
|
|
- lea 11(%edi, %eax), %eax
|
|
- POP (%edi)
|
|
- BRANCH_TO_JMPTBL_ENTRY_TAIL(L(table_48bytes_fwd), %ecx, 4)
|
|
-
|
|
- ALIGN (4)
|
|
-L(shl_12):
|
|
- BRANCH_TO_JMPTBL_ENTRY_VALUE(L(table_48bytes_fwd))
|
|
- lea -12(%eax), %eax
|
|
- movaps (%eax), %xmm1
|
|
- xor %edi, %edi
|
|
- lea -32(%ecx), %ecx
|
|
- movdqu %xmm0, (%esi)
|
|
- POP (%esi)
|
|
-L(shl_12_loop):
|
|
-
|
|
- movdqa 16(%eax, %edi), %xmm2
|
|
- sub $32, %ecx
|
|
- movdqa 32(%eax, %edi), %xmm3
|
|
- movdqa %xmm3, %xmm4
|
|
- palignr $12, %xmm2, %xmm3
|
|
- palignr $12, %xmm1, %xmm2
|
|
- lea 32(%edi), %edi
|
|
- movdqa %xmm2, -32(%edx, %edi)
|
|
- movdqa %xmm3, -16(%edx, %edi)
|
|
-
|
|
- jl L(shl_12_end)
|
|
-
|
|
- movdqa 16(%eax, %edi), %xmm2
|
|
- sub $32, %ecx
|
|
- movdqa 32(%eax, %edi), %xmm3
|
|
- movdqa %xmm3, %xmm1
|
|
- palignr $12, %xmm2, %xmm3
|
|
- palignr $12, %xmm4, %xmm2
|
|
- lea 32(%edi), %edi
|
|
- movdqa %xmm2, -32(%edx, %edi)
|
|
- movdqa %xmm3, -16(%edx, %edi)
|
|
-
|
|
- jae L(shl_12_loop)
|
|
-
|
|
-L(shl_12_end):
|
|
- lea 32(%ecx), %ecx
|
|
- add %ecx, %edi
|
|
- add %edi, %edx
|
|
- lea 12(%edi, %eax), %eax
|
|
- POP (%edi)
|
|
- BRANCH_TO_JMPTBL_ENTRY_TAIL(L(table_48bytes_fwd), %ecx, 4)
|
|
-
|
|
- ALIGN (4)
|
|
-L(shl_13):
|
|
- BRANCH_TO_JMPTBL_ENTRY_VALUE(L(table_48bytes_fwd))
|
|
- lea -13(%eax), %eax
|
|
- movaps (%eax), %xmm1
|
|
- xor %edi, %edi
|
|
- lea -32(%ecx), %ecx
|
|
- movdqu %xmm0, (%esi)
|
|
- POP (%esi)
|
|
-L(shl_13_loop):
|
|
-
|
|
- movdqa 16(%eax, %edi), %xmm2
|
|
- sub $32, %ecx
|
|
- movdqa 32(%eax, %edi), %xmm3
|
|
- movdqa %xmm3, %xmm4
|
|
- palignr $13, %xmm2, %xmm3
|
|
- palignr $13, %xmm1, %xmm2
|
|
- lea 32(%edi), %edi
|
|
- movdqa %xmm2, -32(%edx, %edi)
|
|
- movdqa %xmm3, -16(%edx, %edi)
|
|
-
|
|
- jl L(shl_13_end)
|
|
-
|
|
- movdqa 16(%eax, %edi), %xmm2
|
|
- sub $32, %ecx
|
|
- movdqa 32(%eax, %edi), %xmm3
|
|
- movdqa %xmm3, %xmm1
|
|
- palignr $13, %xmm2, %xmm3
|
|
- palignr $13, %xmm4, %xmm2
|
|
- lea 32(%edi), %edi
|
|
- movdqa %xmm2, -32(%edx, %edi)
|
|
- movdqa %xmm3, -16(%edx, %edi)
|
|
-
|
|
- jae L(shl_13_loop)
|
|
-
|
|
-L(shl_13_end):
|
|
- lea 32(%ecx), %ecx
|
|
- add %ecx, %edi
|
|
- add %edi, %edx
|
|
- lea 13(%edi, %eax), %eax
|
|
- POP (%edi)
|
|
- BRANCH_TO_JMPTBL_ENTRY_TAIL(L(table_48bytes_fwd), %ecx, 4)
|
|
-
|
|
- ALIGN (4)
|
|
-L(shl_14):
|
|
- BRANCH_TO_JMPTBL_ENTRY_VALUE(L(table_48bytes_fwd))
|
|
- lea -14(%eax), %eax
|
|
- movaps (%eax), %xmm1
|
|
- xor %edi, %edi
|
|
- lea -32(%ecx), %ecx
|
|
- movdqu %xmm0, (%esi)
|
|
- POP (%esi)
|
|
-L(shl_14_loop):
|
|
-
|
|
- movdqa 16(%eax, %edi), %xmm2
|
|
- sub $32, %ecx
|
|
- movdqa 32(%eax, %edi), %xmm3
|
|
- movdqa %xmm3, %xmm4
|
|
- palignr $14, %xmm2, %xmm3
|
|
- palignr $14, %xmm1, %xmm2
|
|
- lea 32(%edi), %edi
|
|
- movdqa %xmm2, -32(%edx, %edi)
|
|
- movdqa %xmm3, -16(%edx, %edi)
|
|
-
|
|
- jl L(shl_14_end)
|
|
-
|
|
- movdqa 16(%eax, %edi), %xmm2
|
|
- sub $32, %ecx
|
|
- movdqa 32(%eax, %edi), %xmm3
|
|
- movdqa %xmm3, %xmm1
|
|
- palignr $14, %xmm2, %xmm3
|
|
- palignr $14, %xmm4, %xmm2
|
|
- lea 32(%edi), %edi
|
|
- movdqa %xmm2, -32(%edx, %edi)
|
|
- movdqa %xmm3, -16(%edx, %edi)
|
|
-
|
|
- jae L(shl_14_loop)
|
|
-
|
|
-L(shl_14_end):
|
|
- lea 32(%ecx), %ecx
|
|
- add %ecx, %edi
|
|
- add %edi, %edx
|
|
- lea 14(%edi, %eax), %eax
|
|
- POP (%edi)
|
|
- BRANCH_TO_JMPTBL_ENTRY_TAIL(L(table_48bytes_fwd), %ecx, 4)
|
|
-
|
|
-
|
|
- ALIGN (4)
|
|
-L(shl_15):
|
|
- BRANCH_TO_JMPTBL_ENTRY_VALUE(L(table_48bytes_fwd))
|
|
- lea -15(%eax), %eax
|
|
- movaps (%eax), %xmm1
|
|
- xor %edi, %edi
|
|
- lea -32(%ecx), %ecx
|
|
- movdqu %xmm0, (%esi)
|
|
- POP (%esi)
|
|
-L(shl_15_loop):
|
|
-
|
|
- movdqa 16(%eax, %edi), %xmm2
|
|
- sub $32, %ecx
|
|
- movdqa 32(%eax, %edi), %xmm3
|
|
- movdqa %xmm3, %xmm4
|
|
- palignr $15, %xmm2, %xmm3
|
|
- palignr $15, %xmm1, %xmm2
|
|
- lea 32(%edi), %edi
|
|
- movdqa %xmm2, -32(%edx, %edi)
|
|
- movdqa %xmm3, -16(%edx, %edi)
|
|
-
|
|
- jl L(shl_15_end)
|
|
-
|
|
- movdqa 16(%eax, %edi), %xmm2
|
|
- sub $32, %ecx
|
|
- movdqa 32(%eax, %edi), %xmm3
|
|
- movdqa %xmm3, %xmm1
|
|
- palignr $15, %xmm2, %xmm3
|
|
- palignr $15, %xmm4, %xmm2
|
|
- lea 32(%edi), %edi
|
|
- movdqa %xmm2, -32(%edx, %edi)
|
|
- movdqa %xmm3, -16(%edx, %edi)
|
|
-
|
|
- jae L(shl_15_loop)
|
|
-
|
|
-L(shl_15_end):
|
|
- lea 32(%ecx), %ecx
|
|
- add %ecx, %edi
|
|
- add %edi, %edx
|
|
- lea 15(%edi, %eax), %eax
|
|
- POP (%edi)
|
|
- BRANCH_TO_JMPTBL_ENTRY_TAIL(L(table_48bytes_fwd), %ecx, 4)
|
|
-
|
|
-
|
|
- ALIGN (4)
|
|
-L(fwd_write_44bytes):
|
|
- movl -44(%eax), %ecx
|
|
- movl %ecx, -44(%edx)
|
|
-L(fwd_write_40bytes):
|
|
- movl -40(%eax), %ecx
|
|
- movl %ecx, -40(%edx)
|
|
-L(fwd_write_36bytes):
|
|
- movl -36(%eax), %ecx
|
|
- movl %ecx, -36(%edx)
|
|
-L(fwd_write_32bytes):
|
|
- movl -32(%eax), %ecx
|
|
- movl %ecx, -32(%edx)
|
|
-L(fwd_write_28bytes):
|
|
- movl -28(%eax), %ecx
|
|
- movl %ecx, -28(%edx)
|
|
-L(fwd_write_24bytes):
|
|
- movl -24(%eax), %ecx
|
|
- movl %ecx, -24(%edx)
|
|
-L(fwd_write_20bytes):
|
|
- movl -20(%eax), %ecx
|
|
- movl %ecx, -20(%edx)
|
|
-L(fwd_write_16bytes):
|
|
- movl -16(%eax), %ecx
|
|
- movl %ecx, -16(%edx)
|
|
-L(fwd_write_12bytes):
|
|
- movl -12(%eax), %ecx
|
|
- movl %ecx, -12(%edx)
|
|
-L(fwd_write_8bytes):
|
|
- movl -8(%eax), %ecx
|
|
- movl %ecx, -8(%edx)
|
|
-L(fwd_write_4bytes):
|
|
- movl -4(%eax), %ecx
|
|
- movl %ecx, -4(%edx)
|
|
-L(fwd_write_0bytes):
|
|
-#ifndef USE_AS_BCOPY
|
|
-# ifdef USE_AS_MEMPCPY
|
|
- movl %edx, %eax
|
|
-# else
|
|
- movl DEST(%esp), %eax
|
|
-# endif
|
|
-#endif
|
|
- RETURN
|
|
-
|
|
- ALIGN (4)
|
|
-L(fwd_write_5bytes):
|
|
- movl -5(%eax), %ecx
|
|
- movl -4(%eax), %eax
|
|
- movl %ecx, -5(%edx)
|
|
- movl %eax, -4(%edx)
|
|
-#ifndef USE_AS_BCOPY
|
|
-# ifdef USE_AS_MEMPCPY
|
|
- movl %edx, %eax
|
|
-# else
|
|
- movl DEST(%esp), %eax
|
|
-# endif
|
|
-#endif
|
|
- RETURN
|
|
-
|
|
- ALIGN (4)
|
|
-L(fwd_write_45bytes):
|
|
- movl -45(%eax), %ecx
|
|
- movl %ecx, -45(%edx)
|
|
-L(fwd_write_41bytes):
|
|
- movl -41(%eax), %ecx
|
|
- movl %ecx, -41(%edx)
|
|
-L(fwd_write_37bytes):
|
|
- movl -37(%eax), %ecx
|
|
- movl %ecx, -37(%edx)
|
|
-L(fwd_write_33bytes):
|
|
- movl -33(%eax), %ecx
|
|
- movl %ecx, -33(%edx)
|
|
-L(fwd_write_29bytes):
|
|
- movl -29(%eax), %ecx
|
|
- movl %ecx, -29(%edx)
|
|
-L(fwd_write_25bytes):
|
|
- movl -25(%eax), %ecx
|
|
- movl %ecx, -25(%edx)
|
|
-L(fwd_write_21bytes):
|
|
- movl -21(%eax), %ecx
|
|
- movl %ecx, -21(%edx)
|
|
-L(fwd_write_17bytes):
|
|
- movl -17(%eax), %ecx
|
|
- movl %ecx, -17(%edx)
|
|
-L(fwd_write_13bytes):
|
|
- movl -13(%eax), %ecx
|
|
- movl %ecx, -13(%edx)
|
|
-L(fwd_write_9bytes):
|
|
- movl -9(%eax), %ecx
|
|
- movl %ecx, -9(%edx)
|
|
- movl -5(%eax), %ecx
|
|
- movl %ecx, -5(%edx)
|
|
-L(fwd_write_1bytes):
|
|
- movzbl -1(%eax), %ecx
|
|
- movb %cl, -1(%edx)
|
|
-#ifndef USE_AS_BCOPY
|
|
-# ifdef USE_AS_MEMPCPY
|
|
- movl %edx, %eax
|
|
-# else
|
|
- movl DEST(%esp), %eax
|
|
-# endif
|
|
-#endif
|
|
- RETURN
|
|
-
|
|
- ALIGN (4)
|
|
-L(fwd_write_46bytes):
|
|
- movl -46(%eax), %ecx
|
|
- movl %ecx, -46(%edx)
|
|
-L(fwd_write_42bytes):
|
|
- movl -42(%eax), %ecx
|
|
- movl %ecx, -42(%edx)
|
|
-L(fwd_write_38bytes):
|
|
- movl -38(%eax), %ecx
|
|
- movl %ecx, -38(%edx)
|
|
-L(fwd_write_34bytes):
|
|
- movl -34(%eax), %ecx
|
|
- movl %ecx, -34(%edx)
|
|
-L(fwd_write_30bytes):
|
|
- movl -30(%eax), %ecx
|
|
- movl %ecx, -30(%edx)
|
|
-L(fwd_write_26bytes):
|
|
- movl -26(%eax), %ecx
|
|
- movl %ecx, -26(%edx)
|
|
-L(fwd_write_22bytes):
|
|
- movl -22(%eax), %ecx
|
|
- movl %ecx, -22(%edx)
|
|
-L(fwd_write_18bytes):
|
|
- movl -18(%eax), %ecx
|
|
- movl %ecx, -18(%edx)
|
|
-L(fwd_write_14bytes):
|
|
- movl -14(%eax), %ecx
|
|
- movl %ecx, -14(%edx)
|
|
-L(fwd_write_10bytes):
|
|
- movl -10(%eax), %ecx
|
|
- movl %ecx, -10(%edx)
|
|
-L(fwd_write_6bytes):
|
|
- movl -6(%eax), %ecx
|
|
- movl %ecx, -6(%edx)
|
|
-L(fwd_write_2bytes):
|
|
- movzwl -2(%eax), %ecx
|
|
- movw %cx, -2(%edx)
|
|
-#ifndef USE_AS_BCOPY
|
|
-# ifdef USE_AS_MEMPCPY
|
|
- movl %edx, %eax
|
|
-# else
|
|
- movl DEST(%esp), %eax
|
|
-# endif
|
|
-#endif
|
|
- RETURN
|
|
-
|
|
- ALIGN (4)
|
|
-L(fwd_write_47bytes):
|
|
- movl -47(%eax), %ecx
|
|
- movl %ecx, -47(%edx)
|
|
-L(fwd_write_43bytes):
|
|
- movl -43(%eax), %ecx
|
|
- movl %ecx, -43(%edx)
|
|
-L(fwd_write_39bytes):
|
|
- movl -39(%eax), %ecx
|
|
- movl %ecx, -39(%edx)
|
|
-L(fwd_write_35bytes):
|
|
- movl -35(%eax), %ecx
|
|
- movl %ecx, -35(%edx)
|
|
-L(fwd_write_31bytes):
|
|
- movl -31(%eax), %ecx
|
|
- movl %ecx, -31(%edx)
|
|
-L(fwd_write_27bytes):
|
|
- movl -27(%eax), %ecx
|
|
- movl %ecx, -27(%edx)
|
|
-L(fwd_write_23bytes):
|
|
- movl -23(%eax), %ecx
|
|
- movl %ecx, -23(%edx)
|
|
-L(fwd_write_19bytes):
|
|
- movl -19(%eax), %ecx
|
|
- movl %ecx, -19(%edx)
|
|
-L(fwd_write_15bytes):
|
|
- movl -15(%eax), %ecx
|
|
- movl %ecx, -15(%edx)
|
|
-L(fwd_write_11bytes):
|
|
- movl -11(%eax), %ecx
|
|
- movl %ecx, -11(%edx)
|
|
-L(fwd_write_7bytes):
|
|
- movl -7(%eax), %ecx
|
|
- movl %ecx, -7(%edx)
|
|
-L(fwd_write_3bytes):
|
|
- movzwl -3(%eax), %ecx
|
|
- movzbl -1(%eax), %eax
|
|
- movw %cx, -3(%edx)
|
|
- movb %al, -1(%edx)
|
|
-#ifndef USE_AS_BCOPY
|
|
-# ifdef USE_AS_MEMPCPY
|
|
- movl %edx, %eax
|
|
-# else
|
|
- movl DEST(%esp), %eax
|
|
-# endif
|
|
-#endif
|
|
- RETURN
|
|
-
|
|
- ALIGN (4)
|
|
-L(large_page):
|
|
- movdqu (%eax), %xmm1
|
|
- lea 16(%eax), %eax
|
|
- movdqu %xmm0, (%esi)
|
|
- movntdq %xmm1, (%edx)
|
|
- lea 16(%edx), %edx
|
|
- POP (%esi)
|
|
- lea -0x90(%ecx), %ecx
|
|
- POP (%edi)
|
|
-L(large_page_loop):
|
|
- movdqu (%eax), %xmm0
|
|
- movdqu 0x10(%eax), %xmm1
|
|
- movdqu 0x20(%eax), %xmm2
|
|
- movdqu 0x30(%eax), %xmm3
|
|
- movdqu 0x40(%eax), %xmm4
|
|
- movdqu 0x50(%eax), %xmm5
|
|
- movdqu 0x60(%eax), %xmm6
|
|
- movdqu 0x70(%eax), %xmm7
|
|
- lea 0x80(%eax), %eax
|
|
-
|
|
- sub $0x80, %ecx
|
|
- movntdq %xmm0, (%edx)
|
|
- movntdq %xmm1, 0x10(%edx)
|
|
- movntdq %xmm2, 0x20(%edx)
|
|
- movntdq %xmm3, 0x30(%edx)
|
|
- movntdq %xmm4, 0x40(%edx)
|
|
- movntdq %xmm5, 0x50(%edx)
|
|
- movntdq %xmm6, 0x60(%edx)
|
|
- movntdq %xmm7, 0x70(%edx)
|
|
- lea 0x80(%edx), %edx
|
|
- jae L(large_page_loop)
|
|
- cmp $-0x40, %ecx
|
|
- lea 0x80(%ecx), %ecx
|
|
- jl L(large_page_less_64bytes)
|
|
-
|
|
- movdqu (%eax), %xmm0
|
|
- movdqu 0x10(%eax), %xmm1
|
|
- movdqu 0x20(%eax), %xmm2
|
|
- movdqu 0x30(%eax), %xmm3
|
|
- lea 0x40(%eax), %eax
|
|
-
|
|
- movntdq %xmm0, (%edx)
|
|
- movntdq %xmm1, 0x10(%edx)
|
|
- movntdq %xmm2, 0x20(%edx)
|
|
- movntdq %xmm3, 0x30(%edx)
|
|
- lea 0x40(%edx), %edx
|
|
- sub $0x40, %ecx
|
|
-L(large_page_less_64bytes):
|
|
- cmp $32, %ecx
|
|
- jl L(large_page_less_32bytes)
|
|
- movdqu (%eax), %xmm0
|
|
- movdqu 0x10(%eax), %xmm1
|
|
- lea 0x20(%eax), %eax
|
|
- movntdq %xmm0, (%edx)
|
|
- movntdq %xmm1, 0x10(%edx)
|
|
- lea 0x20(%edx), %edx
|
|
- sub $0x20, %ecx
|
|
-L(large_page_less_32bytes):
|
|
- add %ecx, %edx
|
|
- add %ecx, %eax
|
|
- sfence
|
|
- BRANCH_TO_JMPTBL_ENTRY (L(table_48bytes_fwd), %ecx, 4)
|
|
-
|
|
-
|
|
- ALIGN (4)
|
|
-L(bk_write_44bytes):
|
|
- movl 40(%eax), %ecx
|
|
- movl %ecx, 40(%edx)
|
|
-L(bk_write_40bytes):
|
|
- movl 36(%eax), %ecx
|
|
- movl %ecx, 36(%edx)
|
|
-L(bk_write_36bytes):
|
|
- movl 32(%eax), %ecx
|
|
- movl %ecx, 32(%edx)
|
|
-L(bk_write_32bytes):
|
|
- movl 28(%eax), %ecx
|
|
- movl %ecx, 28(%edx)
|
|
-L(bk_write_28bytes):
|
|
- movl 24(%eax), %ecx
|
|
- movl %ecx, 24(%edx)
|
|
-L(bk_write_24bytes):
|
|
- movl 20(%eax), %ecx
|
|
- movl %ecx, 20(%edx)
|
|
-L(bk_write_20bytes):
|
|
- movl 16(%eax), %ecx
|
|
- movl %ecx, 16(%edx)
|
|
-L(bk_write_16bytes):
|
|
- movl 12(%eax), %ecx
|
|
- movl %ecx, 12(%edx)
|
|
-L(bk_write_12bytes):
|
|
- movl 8(%eax), %ecx
|
|
- movl %ecx, 8(%edx)
|
|
-L(bk_write_8bytes):
|
|
- movl 4(%eax), %ecx
|
|
- movl %ecx, 4(%edx)
|
|
-L(bk_write_4bytes):
|
|
- movl (%eax), %ecx
|
|
- movl %ecx, (%edx)
|
|
-L(bk_write_0bytes):
|
|
-#ifndef USE_AS_BCOPY
|
|
- movl DEST(%esp), %eax
|
|
-# ifdef USE_AS_MEMPCPY
|
|
- movl LEN(%esp), %ecx
|
|
- add %ecx, %eax
|
|
-# endif
|
|
-#endif
|
|
- RETURN
|
|
-
|
|
- ALIGN (4)
|
|
-L(bk_write_45bytes):
|
|
- movl 41(%eax), %ecx
|
|
- movl %ecx, 41(%edx)
|
|
-L(bk_write_41bytes):
|
|
- movl 37(%eax), %ecx
|
|
- movl %ecx, 37(%edx)
|
|
-L(bk_write_37bytes):
|
|
- movl 33(%eax), %ecx
|
|
- movl %ecx, 33(%edx)
|
|
-L(bk_write_33bytes):
|
|
- movl 29(%eax), %ecx
|
|
- movl %ecx, 29(%edx)
|
|
-L(bk_write_29bytes):
|
|
- movl 25(%eax), %ecx
|
|
- movl %ecx, 25(%edx)
|
|
-L(bk_write_25bytes):
|
|
- movl 21(%eax), %ecx
|
|
- movl %ecx, 21(%edx)
|
|
-L(bk_write_21bytes):
|
|
- movl 17(%eax), %ecx
|
|
- movl %ecx, 17(%edx)
|
|
-L(bk_write_17bytes):
|
|
- movl 13(%eax), %ecx
|
|
- movl %ecx, 13(%edx)
|
|
-L(bk_write_13bytes):
|
|
- movl 9(%eax), %ecx
|
|
- movl %ecx, 9(%edx)
|
|
-L(bk_write_9bytes):
|
|
- movl 5(%eax), %ecx
|
|
- movl %ecx, 5(%edx)
|
|
-L(bk_write_5bytes):
|
|
- movl 1(%eax), %ecx
|
|
- movl %ecx, 1(%edx)
|
|
-L(bk_write_1bytes):
|
|
- movzbl (%eax), %ecx
|
|
- movb %cl, (%edx)
|
|
-#ifndef USE_AS_BCOPY
|
|
- movl DEST(%esp), %eax
|
|
-# ifdef USE_AS_MEMPCPY
|
|
- movl LEN(%esp), %ecx
|
|
- add %ecx, %eax
|
|
-# endif
|
|
-#endif
|
|
- RETURN
|
|
-
|
|
- ALIGN (4)
|
|
-L(bk_write_46bytes):
|
|
- movl 42(%eax), %ecx
|
|
- movl %ecx, 42(%edx)
|
|
-L(bk_write_42bytes):
|
|
- movl 38(%eax), %ecx
|
|
- movl %ecx, 38(%edx)
|
|
-L(bk_write_38bytes):
|
|
- movl 34(%eax), %ecx
|
|
- movl %ecx, 34(%edx)
|
|
-L(bk_write_34bytes):
|
|
- movl 30(%eax), %ecx
|
|
- movl %ecx, 30(%edx)
|
|
-L(bk_write_30bytes):
|
|
- movl 26(%eax), %ecx
|
|
- movl %ecx, 26(%edx)
|
|
-L(bk_write_26bytes):
|
|
- movl 22(%eax), %ecx
|
|
- movl %ecx, 22(%edx)
|
|
-L(bk_write_22bytes):
|
|
- movl 18(%eax), %ecx
|
|
- movl %ecx, 18(%edx)
|
|
-L(bk_write_18bytes):
|
|
- movl 14(%eax), %ecx
|
|
- movl %ecx, 14(%edx)
|
|
-L(bk_write_14bytes):
|
|
- movl 10(%eax), %ecx
|
|
- movl %ecx, 10(%edx)
|
|
-L(bk_write_10bytes):
|
|
- movl 6(%eax), %ecx
|
|
- movl %ecx, 6(%edx)
|
|
-L(bk_write_6bytes):
|
|
- movl 2(%eax), %ecx
|
|
- movl %ecx, 2(%edx)
|
|
-L(bk_write_2bytes):
|
|
- movzwl (%eax), %ecx
|
|
- movw %cx, (%edx)
|
|
-#ifndef USE_AS_BCOPY
|
|
- movl DEST(%esp), %eax
|
|
-# ifdef USE_AS_MEMPCPY
|
|
- movl LEN(%esp), %ecx
|
|
- add %ecx, %eax
|
|
-# endif
|
|
-#endif
|
|
- RETURN
|
|
-
|
|
- ALIGN (4)
|
|
-L(bk_write_47bytes):
|
|
- movl 43(%eax), %ecx
|
|
- movl %ecx, 43(%edx)
|
|
-L(bk_write_43bytes):
|
|
- movl 39(%eax), %ecx
|
|
- movl %ecx, 39(%edx)
|
|
-L(bk_write_39bytes):
|
|
- movl 35(%eax), %ecx
|
|
- movl %ecx, 35(%edx)
|
|
-L(bk_write_35bytes):
|
|
- movl 31(%eax), %ecx
|
|
- movl %ecx, 31(%edx)
|
|
-L(bk_write_31bytes):
|
|
- movl 27(%eax), %ecx
|
|
- movl %ecx, 27(%edx)
|
|
-L(bk_write_27bytes):
|
|
- movl 23(%eax), %ecx
|
|
- movl %ecx, 23(%edx)
|
|
-L(bk_write_23bytes):
|
|
- movl 19(%eax), %ecx
|
|
- movl %ecx, 19(%edx)
|
|
-L(bk_write_19bytes):
|
|
- movl 15(%eax), %ecx
|
|
- movl %ecx, 15(%edx)
|
|
-L(bk_write_15bytes):
|
|
- movl 11(%eax), %ecx
|
|
- movl %ecx, 11(%edx)
|
|
-L(bk_write_11bytes):
|
|
- movl 7(%eax), %ecx
|
|
- movl %ecx, 7(%edx)
|
|
-L(bk_write_7bytes):
|
|
- movl 3(%eax), %ecx
|
|
- movl %ecx, 3(%edx)
|
|
-L(bk_write_3bytes):
|
|
- movzwl 1(%eax), %ecx
|
|
- movw %cx, 1(%edx)
|
|
- movzbl (%eax), %eax
|
|
- movb %al, (%edx)
|
|
-#ifndef USE_AS_BCOPY
|
|
- movl DEST(%esp), %eax
|
|
-# ifdef USE_AS_MEMPCPY
|
|
- movl LEN(%esp), %ecx
|
|
- add %ecx, %eax
|
|
-# endif
|
|
-#endif
|
|
- RETURN_END
|
|
-
|
|
-
|
|
- .pushsection .rodata.ssse3,"a",@progbits
|
|
- ALIGN (2)
|
|
-L(table_48bytes_fwd):
|
|
- .int JMPTBL (L(fwd_write_0bytes), L(table_48bytes_fwd))
|
|
- .int JMPTBL (L(fwd_write_1bytes), L(table_48bytes_fwd))
|
|
- .int JMPTBL (L(fwd_write_2bytes), L(table_48bytes_fwd))
|
|
- .int JMPTBL (L(fwd_write_3bytes), L(table_48bytes_fwd))
|
|
- .int JMPTBL (L(fwd_write_4bytes), L(table_48bytes_fwd))
|
|
- .int JMPTBL (L(fwd_write_5bytes), L(table_48bytes_fwd))
|
|
- .int JMPTBL (L(fwd_write_6bytes), L(table_48bytes_fwd))
|
|
- .int JMPTBL (L(fwd_write_7bytes), L(table_48bytes_fwd))
|
|
- .int JMPTBL (L(fwd_write_8bytes), L(table_48bytes_fwd))
|
|
- .int JMPTBL (L(fwd_write_9bytes), L(table_48bytes_fwd))
|
|
- .int JMPTBL (L(fwd_write_10bytes), L(table_48bytes_fwd))
|
|
- .int JMPTBL (L(fwd_write_11bytes), L(table_48bytes_fwd))
|
|
- .int JMPTBL (L(fwd_write_12bytes), L(table_48bytes_fwd))
|
|
- .int JMPTBL (L(fwd_write_13bytes), L(table_48bytes_fwd))
|
|
- .int JMPTBL (L(fwd_write_14bytes), L(table_48bytes_fwd))
|
|
- .int JMPTBL (L(fwd_write_15bytes), L(table_48bytes_fwd))
|
|
- .int JMPTBL (L(fwd_write_16bytes), L(table_48bytes_fwd))
|
|
- .int JMPTBL (L(fwd_write_17bytes), L(table_48bytes_fwd))
|
|
- .int JMPTBL (L(fwd_write_18bytes), L(table_48bytes_fwd))
|
|
- .int JMPTBL (L(fwd_write_19bytes), L(table_48bytes_fwd))
|
|
- .int JMPTBL (L(fwd_write_20bytes), L(table_48bytes_fwd))
|
|
- .int JMPTBL (L(fwd_write_21bytes), L(table_48bytes_fwd))
|
|
- .int JMPTBL (L(fwd_write_22bytes), L(table_48bytes_fwd))
|
|
- .int JMPTBL (L(fwd_write_23bytes), L(table_48bytes_fwd))
|
|
- .int JMPTBL (L(fwd_write_24bytes), L(table_48bytes_fwd))
|
|
- .int JMPTBL (L(fwd_write_25bytes), L(table_48bytes_fwd))
|
|
- .int JMPTBL (L(fwd_write_26bytes), L(table_48bytes_fwd))
|
|
- .int JMPTBL (L(fwd_write_27bytes), L(table_48bytes_fwd))
|
|
- .int JMPTBL (L(fwd_write_28bytes), L(table_48bytes_fwd))
|
|
- .int JMPTBL (L(fwd_write_29bytes), L(table_48bytes_fwd))
|
|
- .int JMPTBL (L(fwd_write_30bytes), L(table_48bytes_fwd))
|
|
- .int JMPTBL (L(fwd_write_31bytes), L(table_48bytes_fwd))
|
|
- .int JMPTBL (L(fwd_write_32bytes), L(table_48bytes_fwd))
|
|
- .int JMPTBL (L(fwd_write_33bytes), L(table_48bytes_fwd))
|
|
- .int JMPTBL (L(fwd_write_34bytes), L(table_48bytes_fwd))
|
|
- .int JMPTBL (L(fwd_write_35bytes), L(table_48bytes_fwd))
|
|
- .int JMPTBL (L(fwd_write_36bytes), L(table_48bytes_fwd))
|
|
- .int JMPTBL (L(fwd_write_37bytes), L(table_48bytes_fwd))
|
|
- .int JMPTBL (L(fwd_write_38bytes), L(table_48bytes_fwd))
|
|
- .int JMPTBL (L(fwd_write_39bytes), L(table_48bytes_fwd))
|
|
- .int JMPTBL (L(fwd_write_40bytes), L(table_48bytes_fwd))
|
|
- .int JMPTBL (L(fwd_write_41bytes), L(table_48bytes_fwd))
|
|
- .int JMPTBL (L(fwd_write_42bytes), L(table_48bytes_fwd))
|
|
- .int JMPTBL (L(fwd_write_43bytes), L(table_48bytes_fwd))
|
|
- .int JMPTBL (L(fwd_write_44bytes), L(table_48bytes_fwd))
|
|
- .int JMPTBL (L(fwd_write_45bytes), L(table_48bytes_fwd))
|
|
- .int JMPTBL (L(fwd_write_46bytes), L(table_48bytes_fwd))
|
|
- .int JMPTBL (L(fwd_write_47bytes), L(table_48bytes_fwd))
|
|
-
|
|
- ALIGN (2)
|
|
-L(shl_table):
|
|
- .int JMPTBL (L(shl_0), L(shl_table))
|
|
- .int JMPTBL (L(shl_1), L(shl_table))
|
|
- .int JMPTBL (L(shl_2), L(shl_table))
|
|
- .int JMPTBL (L(shl_3), L(shl_table))
|
|
- .int JMPTBL (L(shl_4), L(shl_table))
|
|
- .int JMPTBL (L(shl_5), L(shl_table))
|
|
- .int JMPTBL (L(shl_6), L(shl_table))
|
|
- .int JMPTBL (L(shl_7), L(shl_table))
|
|
- .int JMPTBL (L(shl_8), L(shl_table))
|
|
- .int JMPTBL (L(shl_9), L(shl_table))
|
|
- .int JMPTBL (L(shl_10), L(shl_table))
|
|
- .int JMPTBL (L(shl_11), L(shl_table))
|
|
- .int JMPTBL (L(shl_12), L(shl_table))
|
|
- .int JMPTBL (L(shl_13), L(shl_table))
|
|
- .int JMPTBL (L(shl_14), L(shl_table))
|
|
- .int JMPTBL (L(shl_15), L(shl_table))
|
|
-
|
|
- ALIGN (2)
|
|
-L(table_48_bytes_bwd):
|
|
- .int JMPTBL (L(bk_write_0bytes), L(table_48_bytes_bwd))
|
|
- .int JMPTBL (L(bk_write_1bytes), L(table_48_bytes_bwd))
|
|
- .int JMPTBL (L(bk_write_2bytes), L(table_48_bytes_bwd))
|
|
- .int JMPTBL (L(bk_write_3bytes), L(table_48_bytes_bwd))
|
|
- .int JMPTBL (L(bk_write_4bytes), L(table_48_bytes_bwd))
|
|
- .int JMPTBL (L(bk_write_5bytes), L(table_48_bytes_bwd))
|
|
- .int JMPTBL (L(bk_write_6bytes), L(table_48_bytes_bwd))
|
|
- .int JMPTBL (L(bk_write_7bytes), L(table_48_bytes_bwd))
|
|
- .int JMPTBL (L(bk_write_8bytes), L(table_48_bytes_bwd))
|
|
- .int JMPTBL (L(bk_write_9bytes), L(table_48_bytes_bwd))
|
|
- .int JMPTBL (L(bk_write_10bytes), L(table_48_bytes_bwd))
|
|
- .int JMPTBL (L(bk_write_11bytes), L(table_48_bytes_bwd))
|
|
- .int JMPTBL (L(bk_write_12bytes), L(table_48_bytes_bwd))
|
|
- .int JMPTBL (L(bk_write_13bytes), L(table_48_bytes_bwd))
|
|
- .int JMPTBL (L(bk_write_14bytes), L(table_48_bytes_bwd))
|
|
- .int JMPTBL (L(bk_write_15bytes), L(table_48_bytes_bwd))
|
|
- .int JMPTBL (L(bk_write_16bytes), L(table_48_bytes_bwd))
|
|
- .int JMPTBL (L(bk_write_17bytes), L(table_48_bytes_bwd))
|
|
- .int JMPTBL (L(bk_write_18bytes), L(table_48_bytes_bwd))
|
|
- .int JMPTBL (L(bk_write_19bytes), L(table_48_bytes_bwd))
|
|
- .int JMPTBL (L(bk_write_20bytes), L(table_48_bytes_bwd))
|
|
- .int JMPTBL (L(bk_write_21bytes), L(table_48_bytes_bwd))
|
|
- .int JMPTBL (L(bk_write_22bytes), L(table_48_bytes_bwd))
|
|
- .int JMPTBL (L(bk_write_23bytes), L(table_48_bytes_bwd))
|
|
- .int JMPTBL (L(bk_write_24bytes), L(table_48_bytes_bwd))
|
|
- .int JMPTBL (L(bk_write_25bytes), L(table_48_bytes_bwd))
|
|
- .int JMPTBL (L(bk_write_26bytes), L(table_48_bytes_bwd))
|
|
- .int JMPTBL (L(bk_write_27bytes), L(table_48_bytes_bwd))
|
|
- .int JMPTBL (L(bk_write_28bytes), L(table_48_bytes_bwd))
|
|
- .int JMPTBL (L(bk_write_29bytes), L(table_48_bytes_bwd))
|
|
- .int JMPTBL (L(bk_write_30bytes), L(table_48_bytes_bwd))
|
|
- .int JMPTBL (L(bk_write_31bytes), L(table_48_bytes_bwd))
|
|
- .int JMPTBL (L(bk_write_32bytes), L(table_48_bytes_bwd))
|
|
- .int JMPTBL (L(bk_write_33bytes), L(table_48_bytes_bwd))
|
|
- .int JMPTBL (L(bk_write_34bytes), L(table_48_bytes_bwd))
|
|
- .int JMPTBL (L(bk_write_35bytes), L(table_48_bytes_bwd))
|
|
- .int JMPTBL (L(bk_write_36bytes), L(table_48_bytes_bwd))
|
|
- .int JMPTBL (L(bk_write_37bytes), L(table_48_bytes_bwd))
|
|
- .int JMPTBL (L(bk_write_38bytes), L(table_48_bytes_bwd))
|
|
- .int JMPTBL (L(bk_write_39bytes), L(table_48_bytes_bwd))
|
|
- .int JMPTBL (L(bk_write_40bytes), L(table_48_bytes_bwd))
|
|
- .int JMPTBL (L(bk_write_41bytes), L(table_48_bytes_bwd))
|
|
- .int JMPTBL (L(bk_write_42bytes), L(table_48_bytes_bwd))
|
|
- .int JMPTBL (L(bk_write_43bytes), L(table_48_bytes_bwd))
|
|
- .int JMPTBL (L(bk_write_44bytes), L(table_48_bytes_bwd))
|
|
- .int JMPTBL (L(bk_write_45bytes), L(table_48_bytes_bwd))
|
|
- .int JMPTBL (L(bk_write_46bytes), L(table_48_bytes_bwd))
|
|
- .int JMPTBL (L(bk_write_47bytes), L(table_48_bytes_bwd))
|
|
-
|
|
- .popsection
|
|
-
|
|
-#ifdef USE_AS_MEMMOVE
|
|
- ALIGN (4)
|
|
-L(copy_backward):
|
|
- PUSH (%esi)
|
|
- movl %eax, %esi
|
|
- lea (%ecx,%edx,1),%edx
|
|
- lea (%ecx,%esi,1),%esi
|
|
- testl $0x3, %edx
|
|
- jnz L(bk_align)
|
|
-
|
|
-L(bk_aligned_4):
|
|
- cmp $64, %ecx
|
|
- jge L(bk_write_more64bytes)
|
|
-
|
|
-L(bk_write_64bytesless):
|
|
- cmp $32, %ecx
|
|
- jl L(bk_write_less32bytes)
|
|
-
|
|
-L(bk_write_more32bytes):
|
|
- /* Copy 32 bytes at a time. */
|
|
- sub $32, %ecx
|
|
- movl -4(%esi), %eax
|
|
- movl %eax, -4(%edx)
|
|
- movl -8(%esi), %eax
|
|
- movl %eax, -8(%edx)
|
|
- movl -12(%esi), %eax
|
|
- movl %eax, -12(%edx)
|
|
- movl -16(%esi), %eax
|
|
- movl %eax, -16(%edx)
|
|
- movl -20(%esi), %eax
|
|
- movl %eax, -20(%edx)
|
|
- movl -24(%esi), %eax
|
|
- movl %eax, -24(%edx)
|
|
- movl -28(%esi), %eax
|
|
- movl %eax, -28(%edx)
|
|
- movl -32(%esi), %eax
|
|
- movl %eax, -32(%edx)
|
|
- sub $32, %edx
|
|
- sub $32, %esi
|
|
-
|
|
-L(bk_write_less32bytes):
|
|
- movl %esi, %eax
|
|
- sub %ecx, %edx
|
|
- sub %ecx, %eax
|
|
- POP (%esi)
|
|
-L(bk_write_less32bytes_2):
|
|
- BRANCH_TO_JMPTBL_ENTRY (L(table_48_bytes_bwd), %ecx, 4)
|
|
-
|
|
- ALIGN (4)
|
|
-L(bk_align):
|
|
- cmp $8, %ecx
|
|
- jle L(bk_write_less32bytes)
|
|
- testl $1, %edx
|
|
- /* We get here only if (EDX & 3 ) != 0 so if (EDX & 1) ==0,
|
|
- then (EDX & 2) must be != 0. */
|
|
- jz L(bk_got2)
|
|
- sub $1, %esi
|
|
- sub $1, %ecx
|
|
- sub $1, %edx
|
|
- movzbl (%esi), %eax
|
|
- movb %al, (%edx)
|
|
-
|
|
- testl $2, %edx
|
|
- jz L(bk_aligned_4)
|
|
-
|
|
-L(bk_got2):
|
|
- sub $2, %esi
|
|
- sub $2, %ecx
|
|
- sub $2, %edx
|
|
- movzwl (%esi), %eax
|
|
- movw %ax, (%edx)
|
|
- jmp L(bk_aligned_4)
|
|
-
|
|
- ALIGN (4)
|
|
-L(bk_write_more64bytes):
|
|
- /* Check alignment of last byte. */
|
|
- testl $15, %edx
|
|
- jz L(bk_ssse3_cpy_pre)
|
|
-
|
|
-/* EDX is aligned 4 bytes, but not 16 bytes. */
|
|
-L(bk_ssse3_align):
|
|
- sub $4, %esi
|
|
- sub $4, %ecx
|
|
- sub $4, %edx
|
|
- movl (%esi), %eax
|
|
- movl %eax, (%edx)
|
|
-
|
|
- testl $15, %edx
|
|
- jz L(bk_ssse3_cpy_pre)
|
|
-
|
|
- sub $4, %esi
|
|
- sub $4, %ecx
|
|
- sub $4, %edx
|
|
- movl (%esi), %eax
|
|
- movl %eax, (%edx)
|
|
-
|
|
- testl $15, %edx
|
|
- jz L(bk_ssse3_cpy_pre)
|
|
-
|
|
- sub $4, %esi
|
|
- sub $4, %ecx
|
|
- sub $4, %edx
|
|
- movl (%esi), %eax
|
|
- movl %eax, (%edx)
|
|
-
|
|
-L(bk_ssse3_cpy_pre):
|
|
- cmp $64, %ecx
|
|
- jl L(bk_write_more32bytes)
|
|
-
|
|
-L(bk_ssse3_cpy):
|
|
- sub $64, %esi
|
|
- sub $64, %ecx
|
|
- sub $64, %edx
|
|
- movdqu 0x30(%esi), %xmm3
|
|
- movdqa %xmm3, 0x30(%edx)
|
|
- movdqu 0x20(%esi), %xmm2
|
|
- movdqa %xmm2, 0x20(%edx)
|
|
- movdqu 0x10(%esi), %xmm1
|
|
- movdqa %xmm1, 0x10(%edx)
|
|
- movdqu (%esi), %xmm0
|
|
- movdqa %xmm0, (%edx)
|
|
- cmp $64, %ecx
|
|
- jge L(bk_ssse3_cpy)
|
|
- jmp L(bk_write_64bytesless)
|
|
-
|
|
-#endif
|
|
-
|
|
-END (MEMCPY)
|
|
-
|
|
-#endif
|
|
--- glibc-2.11-175-gb34e12e/sysdeps/i386/i686/multiarch/memcpy.S
|
|
+++ glibc-2.11.90-11//dev/null
|
|
@@ -1,90 +0,0 @@
|
|
-/* Multiple versions of memcpy
|
|
- Copyright (C) 2010 Free Software Foundation, Inc.
|
|
- Contributed by Intel Corporation.
|
|
- This file is part of the GNU C Library.
|
|
-
|
|
- The GNU C Library is free software; you can redistribute it and/or
|
|
- modify it under the terms of the GNU Lesser General Public
|
|
- License as published by the Free Software Foundation; either
|
|
- version 2.1 of the License, or (at your option) any later version.
|
|
-
|
|
- The GNU C Library is distributed in the hope that it will be useful,
|
|
- but WITHOUT ANY WARRANTY; without even the implied warranty of
|
|
- MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU
|
|
- Lesser General Public License for more details.
|
|
-
|
|
- You should have received a copy of the GNU Lesser General Public
|
|
- License along with the GNU C Library; if not, write to the Free
|
|
- Software Foundation, Inc., 59 Temple Place, Suite 330, Boston, MA
|
|
- 02111-1307 USA. */
|
|
-
|
|
-#include <sysdep.h>
|
|
-#include <init-arch.h>
|
|
-
|
|
-/* Define multiple versions only for the definition in lib and for
|
|
- DSO. In static binaries we need memcpy before the initialization
|
|
- happened. */
|
|
-#if defined SHARED && !defined NOT_IN_libc
|
|
- .section .gnu.linkonce.t.__i686.get_pc_thunk.bx,"ax",@progbits
|
|
- .globl __i686.get_pc_thunk.bx
|
|
- .hidden __i686.get_pc_thunk.bx
|
|
- .p2align 4
|
|
- .type __i686.get_pc_thunk.bx,@function
|
|
-__i686.get_pc_thunk.bx:
|
|
- movl (%esp), %ebx
|
|
- ret
|
|
-
|
|
- .text
|
|
-ENTRY(memcpy)
|
|
- .type memcpy, @gnu_indirect_function
|
|
- pushl %ebx
|
|
- cfi_adjust_cfa_offset (4)
|
|
- cfi_rel_offset (ebx, 0)
|
|
- call __i686.get_pc_thunk.bx
|
|
- addl $_GLOBAL_OFFSET_TABLE_, %ebx
|
|
- cmpl $0, KIND_OFFSET+__cpu_features@GOTOFF(%ebx)
|
|
- jne 1f
|
|
- call __init_cpu_features
|
|
-1: leal __memcpy_ia32@GOTOFF(%ebx), %eax
|
|
- testl $bit_SSSE3, CPUID_OFFSET+index_SSSE3+__cpu_features@GOTOFF(%ebx)
|
|
- jz 2f
|
|
- leal __memcpy_ssse3@GOTOFF(%ebx), %eax
|
|
- testl $bit_Fast_Rep_String, FEATURE_OFFSET+index_Fast_Rep_String+__cpu_features@GOTOFF(%ebx)
|
|
- jz 2f
|
|
- leal __memcpy_ssse3_rep@GOTOFF(%ebx), %eax
|
|
-2: popl %ebx
|
|
- cfi_adjust_cfa_offset (-4)
|
|
- cfi_restore (ebx)
|
|
- ret
|
|
-END(memcpy)
|
|
-
|
|
-# undef ENTRY
|
|
-# define ENTRY(name) \
|
|
- .type __memcpy_ia32, @function; \
|
|
- .p2align 4; \
|
|
- __memcpy_ia32: cfi_startproc; \
|
|
- CALL_MCOUNT
|
|
-# undef END
|
|
-# define END(name) \
|
|
- cfi_endproc; .size __memcpy_ia32, .-__memcpy_ia32
|
|
-
|
|
-# undef ENTRY_CHK
|
|
-# define ENTRY_CHK(name) \
|
|
- .type __memcpy_chk_ia32, @function; \
|
|
- .globl __memcpy_chk_ia32; \
|
|
- .p2align 4; \
|
|
- __memcpy_chk_ia32: cfi_startproc; \
|
|
- CALL_MCOUNT
|
|
-# undef END_CHK
|
|
-# define END_CHK(name) \
|
|
- cfi_endproc; .size __memcpy_chk_ia32, .-__memcpy_chk_ia32
|
|
-
|
|
-# undef libc_hidden_builtin_def
|
|
-/* IFUNC doesn't work with the hidden functions in shared library since
|
|
- they will be called without setting up EBX needed for PLT which is
|
|
- used by IFUNC. */
|
|
-# define libc_hidden_builtin_def(name) \
|
|
- .globl __GI_memcpy; __GI_memcpy = __memcpy_ia32
|
|
-#endif
|
|
-
|
|
-#include "../memcpy.S"
|
|
--- glibc-2.11-175-gb34e12e/sysdeps/i386/i686/multiarch/memcpy_chk.S
|
|
+++ glibc-2.11.90-11//dev/null
|
|
@@ -1,64 +0,0 @@
|
|
-/* Multiple versions of __memcpy_chk
|
|
- Copyright (C) 2010 Free Software Foundation, Inc.
|
|
- Contributed by Intel Corporation.
|
|
- This file is part of the GNU C Library.
|
|
-
|
|
- The GNU C Library is free software; you can redistribute it and/or
|
|
- modify it under the terms of the GNU Lesser General Public
|
|
- License as published by the Free Software Foundation; either
|
|
- version 2.1 of the License, or (at your option) any later version.
|
|
-
|
|
- The GNU C Library is distributed in the hope that it will be useful,
|
|
- but WITHOUT ANY WARRANTY; without even the implied warranty of
|
|
- MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU
|
|
- Lesser General Public License for more details.
|
|
-
|
|
- You should have received a copy of the GNU Lesser General Public
|
|
- License along with the GNU C Library; if not, write to the Free
|
|
- Software Foundation, Inc., 59 Temple Place, Suite 330, Boston, MA
|
|
- 02111-1307 USA. */
|
|
-
|
|
-#include <sysdep.h>
|
|
-#include <init-arch.h>
|
|
-
|
|
-/* Define multiple versions only for the definition in lib and for
|
|
- DSO. There are no multiarch memcpy functions for static binaries.
|
|
- */
|
|
-#ifndef NOT_IN_libc
|
|
-# ifdef SHARED
|
|
- .section .gnu.linkonce.t.__i686.get_pc_thunk.bx,"ax",@progbits
|
|
- .globl __i686.get_pc_thunk.bx
|
|
- .hidden __i686.get_pc_thunk.bx
|
|
- .p2align 4
|
|
- .type __i686.get_pc_thunk.bx,@function
|
|
-__i686.get_pc_thunk.bx:
|
|
- movl (%esp), %ebx
|
|
- ret
|
|
-
|
|
- .text
|
|
-ENTRY(__memcpy_chk)
|
|
- .type __memcpy_chk, @gnu_indirect_function
|
|
- pushl %ebx
|
|
- cfi_adjust_cfa_offset (4)
|
|
- cfi_rel_offset (ebx, 0)
|
|
- call __i686.get_pc_thunk.bx
|
|
- addl $_GLOBAL_OFFSET_TABLE_, %ebx
|
|
- cmpl $0, KIND_OFFSET+__cpu_features@GOTOFF(%ebx)
|
|
- jne 1f
|
|
- call __init_cpu_features
|
|
-1: leal __memcpy_chk_ia32@GOTOFF(%ebx), %eax
|
|
- testl $bit_SSSE3, CPUID_OFFSET+index_SSSE3+__cpu_features@GOTOFF(%ebx)
|
|
- jz 2f
|
|
- leal __memcpy_chk_ssse3@GOTOFF(%ebx), %eax
|
|
- testl $bit_Fast_Rep_String, FEATURE_OFFSET+index_Fast_Rep_String+__cpu_features@GOTOFF(%ebx)
|
|
- jz 2f
|
|
- leal __memcpy_chk_ssse3_rep@GOTOFF(%ebx), %eax
|
|
-2: popl %ebx
|
|
- cfi_adjust_cfa_offset (-4)
|
|
- cfi_restore (ebx)
|
|
- ret
|
|
-END(__memcpy_chk)
|
|
-# else
|
|
-# include "../memcpy_chk.S"
|
|
-# endif
|
|
-#endif
|
|
--- glibc-2.11-175-gb34e12e/sysdeps/i386/i686/multiarch/memmove-ssse3-rep.S
|
|
+++ glibc-2.11.90-11//dev/null
|
|
@@ -1,4 +0,0 @@
|
|
-#define USE_AS_MEMMOVE
|
|
-#define MEMCPY __memmove_ssse3_rep
|
|
-#define MEMCPY_CHK __memmove_chk_ssse3_rep
|
|
-#include "memcpy-ssse3-rep.S"
|
|
--- glibc-2.11-175-gb34e12e/sysdeps/i386/i686/multiarch/memmove-ssse3.S
|
|
+++ glibc-2.11.90-11//dev/null
|
|
@@ -1,4 +0,0 @@
|
|
-#define USE_AS_MEMMOVE
|
|
-#define MEMCPY __memmove_ssse3
|
|
-#define MEMCPY_CHK __memmove_chk_ssse3
|
|
-#include "memcpy-ssse3.S"
|
|
--- glibc-2.11-175-gb34e12e/sysdeps/i386/i686/multiarch/memmove.S
|
|
+++ glibc-2.11.90-11//dev/null
|
|
@@ -1,117 +0,0 @@
|
|
-/* Multiple versions of memmove
|
|
- Copyright (C) 2010 Free Software Foundation, Inc.
|
|
- Contributed by Intel Corporation.
|
|
- This file is part of the GNU C Library.
|
|
-
|
|
- The GNU C Library is free software; you can redistribute it and/or
|
|
- modify it under the terms of the GNU Lesser General Public
|
|
- License as published by the Free Software Foundation; either
|
|
- version 2.1 of the License, or (at your option) any later version.
|
|
-
|
|
- The GNU C Library is distributed in the hope that it will be useful,
|
|
- but WITHOUT ANY WARRANTY; without even the implied warranty of
|
|
- MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU
|
|
- Lesser General Public License for more details.
|
|
-
|
|
- You should have received a copy of the GNU Lesser General Public
|
|
- License along with the GNU C Library; if not, write to the Free
|
|
- Software Foundation, Inc., 59 Temple Place, Suite 330, Boston, MA
|
|
- 02111-1307 USA. */
|
|
-
|
|
-#include <sysdep.h>
|
|
-#include <init-arch.h>
|
|
-
|
|
-/* Define multiple versions only for the definition in lib. */
|
|
-#ifndef NOT_IN_libc
|
|
-# ifdef SHARED
|
|
- .section .gnu.linkonce.t.__i686.get_pc_thunk.bx,"ax",@progbits
|
|
- .globl __i686.get_pc_thunk.bx
|
|
- .hidden __i686.get_pc_thunk.bx
|
|
- .p2align 4
|
|
- .type __i686.get_pc_thunk.bx,@function
|
|
-__i686.get_pc_thunk.bx:
|
|
- movl (%esp), %ebx
|
|
- ret
|
|
-
|
|
- .text
|
|
-ENTRY(memmove)
|
|
- .type memmove, @gnu_indirect_function
|
|
- pushl %ebx
|
|
- cfi_adjust_cfa_offset (4)
|
|
- cfi_rel_offset (ebx, 0)
|
|
- call __i686.get_pc_thunk.bx
|
|
- addl $_GLOBAL_OFFSET_TABLE_, %ebx
|
|
- cmpl $0, KIND_OFFSET+__cpu_features@GOTOFF(%ebx)
|
|
- jne 1f
|
|
- call __init_cpu_features
|
|
-1: leal __memmove_ia32@GOTOFF(%ebx), %eax
|
|
- testl $bit_SSSE3, CPUID_OFFSET+index_SSSE3+__cpu_features@GOTOFF(%ebx)
|
|
- jz 2f
|
|
- leal __memmove_ssse3@GOTOFF(%ebx), %eax
|
|
- testl $bit_Fast_Rep_String, FEATURE_OFFSET+index_Fast_Rep_String+__cpu_features@GOTOFF(%ebx)
|
|
- jz 2f
|
|
- leal __memmove_ssse3_rep@GOTOFF(%ebx), %eax
|
|
-2: popl %ebx
|
|
- cfi_adjust_cfa_offset (-4)
|
|
- cfi_restore (ebx)
|
|
- ret
|
|
-END(memmove)
|
|
-
|
|
-# undef ENTRY
|
|
-# define ENTRY(name) \
|
|
- .type __memmove_ia32, @function; \
|
|
- .p2align 4; \
|
|
- __memmove_ia32: cfi_startproc; \
|
|
- CALL_MCOUNT
|
|
-# else
|
|
- .text
|
|
-ENTRY(memmove)
|
|
- .type memmove, @gnu_indirect_function
|
|
- cmpl $0, KIND_OFFSET+__cpu_features
|
|
- jne 1f
|
|
- call __init_cpu_features
|
|
-1: leal __memmove_ia32, %eax
|
|
- testl $bit_SSSE3, CPUID_OFFSET+index_SSSE3+__cpu_features
|
|
- jz 2f
|
|
- leal __memmove_ssse3, %eax
|
|
- testl $bit_Fast_Rep_String, FEATURE_OFFSET+index_Fast_Rep_String+__cpu_features
|
|
- jz 2f
|
|
- leal __memmove_ssse3_rep, %eax
|
|
-2: ret
|
|
-END(memmove)
|
|
-
|
|
-# undef ENTRY
|
|
-# define ENTRY(name) \
|
|
- .type __memmove_ia32, @function; \
|
|
- .globl __memmove_ia32; \
|
|
- .p2align 4; \
|
|
- __memmove_ia32: cfi_startproc; \
|
|
- CALL_MCOUNT
|
|
-# endif
|
|
-
|
|
-# undef END
|
|
-# define END(name) \
|
|
- cfi_endproc; .size __memmove_ia32, .-__memmove_ia32
|
|
-
|
|
-# undef ENTRY_CHK
|
|
-# define ENTRY_CHK(name) \
|
|
- .type __memmove_chk_ia32, @function; \
|
|
- .globl __memmove_chk_ia32; \
|
|
- .p2align 4; \
|
|
- __memmove_chk_ia32: cfi_startproc; \
|
|
- CALL_MCOUNT
|
|
-# undef END_CHK
|
|
-# define END_CHK(name) \
|
|
- cfi_endproc; .size __memmove_chk_ia32, .-__memmove_chk_ia32
|
|
-
|
|
-# ifdef SHARED
|
|
-# undef libc_hidden_builtin_def
|
|
-/* IFUNC doesn't work with the hidden functions in shared library since
|
|
- they will be called without setting up EBX needed for PLT which is
|
|
- used by IFUNC. */
|
|
-# define libc_hidden_builtin_def(name) \
|
|
- .globl __GI_memmove; __GI_memmove = __memmove_ia32
|
|
-# endif
|
|
-#endif
|
|
-
|
|
-#include "../memmove.S"
|
|
--- glibc-2.11-175-gb34e12e/sysdeps/i386/i686/multiarch/memmove_chk.S
|
|
+++ glibc-2.11.90-11//dev/null
|
|
@@ -1,112 +0,0 @@
|
|
-/* Multiple versions of __memmove_chk
|
|
- Copyright (C) 2010 Free Software Foundation, Inc.
|
|
- Contributed by Intel Corporation.
|
|
- This file is part of the GNU C Library.
|
|
-
|
|
- The GNU C Library is free software; you can redistribute it and/or
|
|
- modify it under the terms of the GNU Lesser General Public
|
|
- License as published by the Free Software Foundation; either
|
|
- version 2.1 of the License, or (at your option) any later version.
|
|
-
|
|
- The GNU C Library is distributed in the hope that it will be useful,
|
|
- but WITHOUT ANY WARRANTY; without even the implied warranty of
|
|
- MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU
|
|
- Lesser General Public License for more details.
|
|
-
|
|
- You should have received a copy of the GNU Lesser General Public
|
|
- License along with the GNU C Library; if not, write to the Free
|
|
- Software Foundation, Inc., 59 Temple Place, Suite 330, Boston, MA
|
|
- 02111-1307 USA. */
|
|
-
|
|
-#include <sysdep.h>
|
|
-#include <init-arch.h>
|
|
-
|
|
-/* Define multiple versions only for the definition in lib. */
|
|
-#ifndef NOT_IN_libc
|
|
-# ifdef SHARED
|
|
- .section .gnu.linkonce.t.__i686.get_pc_thunk.bx,"ax",@progbits
|
|
- .globl __i686.get_pc_thunk.bx
|
|
- .hidden __i686.get_pc_thunk.bx
|
|
- .p2align 4
|
|
- .type __i686.get_pc_thunk.bx,@function
|
|
-__i686.get_pc_thunk.bx:
|
|
- movl (%esp), %ebx
|
|
- ret
|
|
-
|
|
- .text
|
|
-ENTRY(__memmove_chk)
|
|
- .type __memmove_chk, @gnu_indirect_function
|
|
- pushl %ebx
|
|
- cfi_adjust_cfa_offset (4)
|
|
- cfi_rel_offset (ebx, 0)
|
|
- call __i686.get_pc_thunk.bx
|
|
- addl $_GLOBAL_OFFSET_TABLE_, %ebx
|
|
- cmpl $0, KIND_OFFSET+__cpu_features@GOTOFF(%ebx)
|
|
- jne 1f
|
|
- call __init_cpu_features
|
|
-1: leal __memmove_chk_ia32@GOTOFF(%ebx), %eax
|
|
- testl $bit_SSSE3, CPUID_OFFSET+index_SSSE3+__cpu_features@GOTOFF(%ebx)
|
|
- jz 2f
|
|
- leal __memmove_chk_ssse3@GOTOFF(%ebx), %eax
|
|
- testl $bit_Fast_Rep_String, FEATURE_OFFSET+index_Fast_Rep_String+__cpu_features@GOTOFF(%ebx)
|
|
- jz 2f
|
|
- leal __memmove_chk_ssse3_rep@GOTOFF(%ebx), %eax
|
|
-2: popl %ebx
|
|
- cfi_adjust_cfa_offset (-4)
|
|
- cfi_restore (ebx)
|
|
- ret
|
|
-END(__memmove_chk)
|
|
-# else
|
|
- .text
|
|
-ENTRY(__memmove_chk)
|
|
- .type __memmove_chk, @gnu_indirect_function
|
|
- cmpl $0, KIND_OFFSET+__cpu_features
|
|
- jne 1f
|
|
- call __init_cpu_features
|
|
-1: leal __memmove_chk_ia32, %eax
|
|
- testl $bit_SSSE3, CPUID_OFFSET+index_SSSE3+__cpu_features
|
|
- jz 2f
|
|
- leal __memmove_chk_ssse3, %eax
|
|
- testl $bit_Fast_Rep_String, FEATURE_OFFSET+index_Fast_Rep_String+__cpu_features
|
|
- jz 2f
|
|
- leal __memmove_chk_ssse3_rep, %eax
|
|
-2: ret
|
|
-END(__memmove_chk)
|
|
-
|
|
- .type __memmove_chk_ssse3, @function
|
|
- .p2align 4;
|
|
-__memmove_chk_ssse3:
|
|
- cfi_startproc
|
|
- CALL_MCOUNT
|
|
- movl 12(%esp), %eax
|
|
- cmpl %eax, 16(%esp)
|
|
- jb __chk_fail
|
|
- jmp __memmove_ssse3
|
|
- cfi_endproc
|
|
- .size __memmove_chk_ssse3, .-__memmove_chk_ssse3
|
|
-
|
|
- .type __memmove_chk_ssse3_rep, @function
|
|
- .p2align 4;
|
|
-__memmove_chk_ssse3_rep:
|
|
- cfi_startproc
|
|
- CALL_MCOUNT
|
|
- movl 12(%esp), %eax
|
|
- cmpl %eax, 16(%esp)
|
|
- jb __chk_fail
|
|
- jmp __memmove_ssse3_rep
|
|
- cfi_endproc
|
|
- .size __memmove_chk_ssse3_rep, .-__memmove_chk_ssse3_rep
|
|
-
|
|
- .type __memmove_chk_ia32, @function
|
|
- .p2align 4;
|
|
-__memmove_chk_ia32:
|
|
- cfi_startproc
|
|
- CALL_MCOUNT
|
|
- movl 12(%esp), %eax
|
|
- cmpl %eax, 16(%esp)
|
|
- jb __chk_fail
|
|
- jmp __memmove_ia32
|
|
- cfi_endproc
|
|
- .size __memmove_chk_ia32, .-__memmove_chk_ia32
|
|
-# endif
|
|
-#endif
|
|
--- glibc-2.11-175-gb34e12e/sysdeps/i386/i686/multiarch/mempcpy-ssse3-rep.S
|
|
+++ glibc-2.11.90-11//dev/null
|
|
@@ -1,4 +0,0 @@
|
|
-#define USE_AS_MEMPCPY
|
|
-#define MEMCPY __mempcpy_ssse3_rep
|
|
-#define MEMCPY_CHK __mempcpy_chk_ssse3_rep
|
|
-#include "memcpy-ssse3-rep.S"
|
|
--- glibc-2.11-175-gb34e12e/sysdeps/i386/i686/multiarch/mempcpy-ssse3.S
|
|
+++ glibc-2.11.90-11//dev/null
|
|
@@ -1,4 +0,0 @@
|
|
-#define USE_AS_MEMPCPY
|
|
-#define MEMCPY __mempcpy_ssse3
|
|
-#define MEMCPY_CHK __mempcpy_chk_ssse3
|
|
-#include "memcpy-ssse3.S"
|
|
--- glibc-2.11-175-gb34e12e/sysdeps/i386/i686/multiarch/mempcpy.S
|
|
+++ glibc-2.11.90-11//dev/null
|
|
@@ -1,93 +0,0 @@
|
|
-/* Multiple versions of mempcpy
|
|
- Copyright (C) 2010 Free Software Foundation, Inc.
|
|
- Contributed by Intel Corporation.
|
|
- This file is part of the GNU C Library.
|
|
-
|
|
- The GNU C Library is free software; you can redistribute it and/or
|
|
- modify it under the terms of the GNU Lesser General Public
|
|
- License as published by the Free Software Foundation; either
|
|
- version 2.1 of the License, or (at your option) any later version.
|
|
-
|
|
- The GNU C Library is distributed in the hope that it will be useful,
|
|
- but WITHOUT ANY WARRANTY; without even the implied warranty of
|
|
- MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU
|
|
- Lesser General Public License for more details.
|
|
-
|
|
- You should have received a copy of the GNU Lesser General Public
|
|
- License along with the GNU C Library; if not, write to the Free
|
|
- Software Foundation, Inc., 59 Temple Place, Suite 330, Boston, MA
|
|
- 02111-1307 USA. */
|
|
-
|
|
-#include <sysdep.h>
|
|
-#include <init-arch.h>
|
|
-
|
|
-/* Define multiple versions only for the definition in lib and for
|
|
- DSO. In static binaries we need mempcpy before the initialization
|
|
- happened. */
|
|
-#if defined SHARED && !defined NOT_IN_libc
|
|
- .section .gnu.linkonce.t.__i686.get_pc_thunk.bx,"ax",@progbits
|
|
- .globl __i686.get_pc_thunk.bx
|
|
- .hidden __i686.get_pc_thunk.bx
|
|
- .p2align 4
|
|
- .type __i686.get_pc_thunk.bx,@function
|
|
-__i686.get_pc_thunk.bx:
|
|
- movl (%esp), %ebx
|
|
- ret
|
|
-
|
|
- .text
|
|
-ENTRY(__mempcpy)
|
|
- .type __mempcpy, @gnu_indirect_function
|
|
- pushl %ebx
|
|
- cfi_adjust_cfa_offset (4)
|
|
- cfi_rel_offset (ebx, 0)
|
|
- call __i686.get_pc_thunk.bx
|
|
- addl $_GLOBAL_OFFSET_TABLE_, %ebx
|
|
- cmpl $0, KIND_OFFSET+__cpu_features@GOTOFF(%ebx)
|
|
- jne 1f
|
|
- call __init_cpu_features
|
|
-1: leal __mempcpy_ia32@GOTOFF(%ebx), %eax
|
|
- testl $bit_SSSE3, CPUID_OFFSET+index_SSSE3+__cpu_features@GOTOFF(%ebx)
|
|
- jz 2f
|
|
- leal __mempcpy_ssse3@GOTOFF(%ebx), %eax
|
|
- testl $bit_Fast_Rep_String, FEATURE_OFFSET+index_Fast_Rep_String+__cpu_features@GOTOFF(%ebx)
|
|
- jz 2f
|
|
- leal __mempcpy_ssse3_rep@GOTOFF(%ebx), %eax
|
|
-2: popl %ebx
|
|
- cfi_adjust_cfa_offset (-4)
|
|
- cfi_restore (ebx)
|
|
- ret
|
|
-END(__mempcpy)
|
|
-
|
|
-# undef ENTRY
|
|
-# define ENTRY(name) \
|
|
- .type __mempcpy_ia32, @function; \
|
|
- .p2align 4; \
|
|
- __mempcpy_ia32: cfi_startproc; \
|
|
- CALL_MCOUNT
|
|
-# undef END
|
|
-# define END(name) \
|
|
- cfi_endproc; .size __mempcpy_ia32, .-__mempcpy_ia32
|
|
-
|
|
-# undef ENTRY_CHK
|
|
-# define ENTRY_CHK(name) \
|
|
- .type __mempcpy_chk_ia32, @function; \
|
|
- .globl __mempcpy_chk_ia32; \
|
|
- .p2align 4; \
|
|
- __mempcpy_chk_ia32: cfi_startproc; \
|
|
- CALL_MCOUNT
|
|
-# undef END_CHK
|
|
-# define END_CHK(name) \
|
|
- cfi_endproc; .size __mempcpy_chk_ia32, .-__mempcpy_chk_ia32
|
|
-
|
|
-# undef libc_hidden_def
|
|
-# undef libc_hidden_builtin_def
|
|
-/* IFUNC doesn't work with the hidden functions in shared library since
|
|
- they will be called without setting up EBX needed for PLT which is
|
|
- used by IFUNC. */
|
|
-# define libc_hidden_def(name) \
|
|
- .globl __GI_mempcpy; __GI_mempcpy = __mempcpy_ia32
|
|
-# define libc_hidden_builtin_def(name) \
|
|
- .globl __GI___mempcpy; __GI___mempcpy = __mempcpy_ia32
|
|
-#endif
|
|
-
|
|
-#include "../mempcpy.S"
|
|
--- glibc-2.11-175-gb34e12e/sysdeps/i386/i686/multiarch/mempcpy_chk.S
|
|
+++ glibc-2.11.90-11//dev/null
|
|
@@ -1,64 +0,0 @@
|
|
-/* Multiple versions of __mempcpy_chk
|
|
- Copyright (C) 2010 Free Software Foundation, Inc.
|
|
- Contributed by Intel Corporation.
|
|
- This file is part of the GNU C Library.
|
|
-
|
|
- The GNU C Library is free software; you can redistribute it and/or
|
|
- modify it under the terms of the GNU Lesser General Public
|
|
- License as published by the Free Software Foundation; either
|
|
- version 2.1 of the License, or (at your option) any later version.
|
|
-
|
|
- The GNU C Library is distributed in the hope that it will be useful,
|
|
- but WITHOUT ANY WARRANTY; without even the implied warranty of
|
|
- MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU
|
|
- Lesser General Public License for more details.
|
|
-
|
|
- You should have received a copy of the GNU Lesser General Public
|
|
- License along with the GNU C Library; if not, write to the Free
|
|
- Software Foundation, Inc., 59 Temple Place, Suite 330, Boston, MA
|
|
- 02111-1307 USA. */
|
|
-
|
|
-#include <sysdep.h>
|
|
-#include <init-arch.h>
|
|
-
|
|
-/* Define multiple versions only for the definition in lib and for
|
|
- DSO. There are no multiarch mempcpy functions for static binaries.
|
|
- */
|
|
-#ifndef NOT_IN_libc
|
|
-# ifdef SHARED
|
|
- .section .gnu.linkonce.t.__i686.get_pc_thunk.bx,"ax",@progbits
|
|
- .globl __i686.get_pc_thunk.bx
|
|
- .hidden __i686.get_pc_thunk.bx
|
|
- .p2align 4
|
|
- .type __i686.get_pc_thunk.bx,@function
|
|
-__i686.get_pc_thunk.bx:
|
|
- movl (%esp), %ebx
|
|
- ret
|
|
-
|
|
- .text
|
|
-ENTRY(__mempcpy_chk)
|
|
- .type __mempcpy_chk, @gnu_indirect_function
|
|
- pushl %ebx
|
|
- cfi_adjust_cfa_offset (4)
|
|
- cfi_rel_offset (ebx, 0)
|
|
- call __i686.get_pc_thunk.bx
|
|
- addl $_GLOBAL_OFFSET_TABLE_, %ebx
|
|
- cmpl $0, KIND_OFFSET+__cpu_features@GOTOFF(%ebx)
|
|
- jne 1f
|
|
- call __init_cpu_features
|
|
-1: leal __mempcpy_chk_ia32@GOTOFF(%ebx), %eax
|
|
- testl $bit_SSSE3, CPUID_OFFSET+index_SSSE3+__cpu_features@GOTOFF(%ebx)
|
|
- jz 2f
|
|
- leal __mempcpy_chk_ssse3@GOTOFF(%ebx), %eax
|
|
- testl $bit_Fast_Rep_String, FEATURE_OFFSET+index_Fast_Rep_String+__cpu_features@GOTOFF(%ebx)
|
|
- jz 2f
|
|
- leal __mempcpy_chk_ssse3_rep@GOTOFF(%ebx), %eax
|
|
-2: popl %ebx
|
|
- cfi_adjust_cfa_offset (-4)
|
|
- cfi_restore (ebx)
|
|
- ret
|
|
-END(__mempcpy_chk)
|
|
-# else
|
|
-# include "../mempcpy_chk.S"
|
|
-# endif
|
|
-#endif
|
|
--- glibc-2.11-175-gb34e12e/sysdeps/i386/i686/multiarch/memset-sse2-rep.S
|
|
+++ glibc-2.11.90-11//dev/null
|
|
@@ -1,821 +0,0 @@
|
|
-/* memset with SSE2 and REP string.
|
|
- Copyright (C) 2010 Free Software Foundation, Inc.
|
|
- Contributed by Intel Corporation.
|
|
- This file is part of the GNU C Library.
|
|
-
|
|
- The GNU C Library is free software; you can redistribute it and/or
|
|
- modify it under the terms of the GNU Lesser General Public
|
|
- License as published by the Free Software Foundation; either
|
|
- version 2.1 of the License, or (at your option) any later version.
|
|
-
|
|
- The GNU C Library is distributed in the hope that it will be useful,
|
|
- but WITHOUT ANY WARRANTY; without even the implied warranty of
|
|
- MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU
|
|
- Lesser General Public License for more details.
|
|
-
|
|
- You should have received a copy of the GNU Lesser General Public
|
|
- License along with the GNU C Library; if not, write to the Free
|
|
- Software Foundation, Inc., 59 Temple Place, Suite 330, Boston, MA
|
|
- 02111-1307 USA. */
|
|
-
|
|
-#ifndef NOT_IN_libc
|
|
-
|
|
-#include <sysdep.h>
|
|
-#include "asm-syntax.h"
|
|
-
|
|
-#define CFI_PUSH(REG) \
|
|
- cfi_adjust_cfa_offset (4); \
|
|
- cfi_rel_offset (REG, 0)
|
|
-
|
|
-#define CFI_POP(REG) \
|
|
- cfi_adjust_cfa_offset (-4); \
|
|
- cfi_restore (REG)
|
|
-
|
|
-#define PUSH(REG) pushl REG; CFI_PUSH (REG)
|
|
-#define POP(REG) popl REG; CFI_POP (REG)
|
|
-
|
|
-#ifdef USE_AS_BZERO
|
|
-# define DEST PARMS
|
|
-# define LEN DEST+4
|
|
-# define SETRTNVAL
|
|
-#else
|
|
-# define DEST PARMS
|
|
-# define CHR DEST+4
|
|
-# define LEN CHR+4
|
|
-# define SETRTNVAL movl DEST(%esp), %eax
|
|
-#endif
|
|
-
|
|
-#ifdef SHARED
|
|
-# define ENTRANCE PUSH (%ebx);
|
|
-# define RETURN_END POP (%ebx); ret
|
|
-# define RETURN RETURN_END; CFI_PUSH (%ebx)
|
|
-# define PARMS 8 /* Preserve EBX. */
|
|
-# define JMPTBL(I, B) I - B
|
|
-
|
|
-/* Load an entry in a jump table into EBX and branch to it. TABLE is a
|
|
- jump table with relative offsets. */
|
|
-# define BRANCH_TO_JMPTBL_ENTRY(TABLE) \
|
|
- /* We first load PC into EBX. */ \
|
|
- call __i686.get_pc_thunk.bx; \
|
|
- /* Get the address of the jump table. */ \
|
|
- add $(TABLE - .), %ebx; \
|
|
- /* Get the entry and convert the relative offset to the \
|
|
- absolute address. */ \
|
|
- add (%ebx,%ecx,4), %ebx; \
|
|
- add %ecx, %edx; \
|
|
- /* We loaded the jump table and adjuested EDX. Go. */ \
|
|
- jmp *%ebx
|
|
-
|
|
- .section .gnu.linkonce.t.__i686.get_pc_thunk.bx,"ax",@progbits
|
|
- .globl __i686.get_pc_thunk.bx
|
|
- .hidden __i686.get_pc_thunk.bx
|
|
- ALIGN (4)
|
|
- .type __i686.get_pc_thunk.bx,@function
|
|
-__i686.get_pc_thunk.bx:
|
|
- movl (%esp), %ebx
|
|
- ret
|
|
-#else
|
|
-# define ENTRANCE
|
|
-# define RETURN_END ret
|
|
-# define RETURN RETURN_END
|
|
-# define PARMS 4
|
|
-# define JMPTBL(I, B) I
|
|
-
|
|
-/* Branch to an entry in a jump table. TABLE is a jump table with
|
|
- absolute offsets. */
|
|
-# define BRANCH_TO_JMPTBL_ENTRY(TABLE) \
|
|
- add %ecx, %edx; \
|
|
- jmp *TABLE(,%ecx,4)
|
|
-#endif
|
|
-
|
|
- .section .text.sse2,"ax",@progbits
|
|
-#if defined SHARED && !defined NOT_IN_libc && !defined USE_AS_BZERO
|
|
-ENTRY (__memset_chk_sse2_rep)
|
|
- movl 12(%esp), %eax
|
|
- cmpl %eax, 16(%esp)
|
|
- jb HIDDEN_JUMPTARGET (__chk_fail)
|
|
-END (__memset_chk_sse2_rep)
|
|
-#endif
|
|
-ENTRY (__memset_sse2_rep)
|
|
- ENTRANCE
|
|
-
|
|
- movl LEN(%esp), %ecx
|
|
-#ifdef USE_AS_BZERO
|
|
- xor %eax, %eax
|
|
-#else
|
|
- movzbl CHR(%esp), %eax
|
|
- movb %al, %ah
|
|
- /* Fill the whole EAX with pattern. */
|
|
- movl %eax, %edx
|
|
- shl $16, %eax
|
|
- or %edx, %eax
|
|
-#endif
|
|
- movl DEST(%esp), %edx
|
|
- cmp $32, %ecx
|
|
- jae L(32bytesormore)
|
|
-
|
|
-L(write_less32bytes):
|
|
- BRANCH_TO_JMPTBL_ENTRY (L(table_less_32bytes))
|
|
-
|
|
-
|
|
- .pushsection .rodata.sse2,"a",@progbits
|
|
- ALIGN (2)
|
|
-L(table_less_32bytes):
|
|
- .int JMPTBL (L(write_0bytes), L(table_less_32bytes))
|
|
- .int JMPTBL (L(write_1bytes), L(table_less_32bytes))
|
|
- .int JMPTBL (L(write_2bytes), L(table_less_32bytes))
|
|
- .int JMPTBL (L(write_3bytes), L(table_less_32bytes))
|
|
- .int JMPTBL (L(write_4bytes), L(table_less_32bytes))
|
|
- .int JMPTBL (L(write_5bytes), L(table_less_32bytes))
|
|
- .int JMPTBL (L(write_6bytes), L(table_less_32bytes))
|
|
- .int JMPTBL (L(write_7bytes), L(table_less_32bytes))
|
|
- .int JMPTBL (L(write_8bytes), L(table_less_32bytes))
|
|
- .int JMPTBL (L(write_9bytes), L(table_less_32bytes))
|
|
- .int JMPTBL (L(write_10bytes), L(table_less_32bytes))
|
|
- .int JMPTBL (L(write_11bytes), L(table_less_32bytes))
|
|
- .int JMPTBL (L(write_12bytes), L(table_less_32bytes))
|
|
- .int JMPTBL (L(write_13bytes), L(table_less_32bytes))
|
|
- .int JMPTBL (L(write_14bytes), L(table_less_32bytes))
|
|
- .int JMPTBL (L(write_15bytes), L(table_less_32bytes))
|
|
- .int JMPTBL (L(write_16bytes), L(table_less_32bytes))
|
|
- .int JMPTBL (L(write_17bytes), L(table_less_32bytes))
|
|
- .int JMPTBL (L(write_18bytes), L(table_less_32bytes))
|
|
- .int JMPTBL (L(write_19bytes), L(table_less_32bytes))
|
|
- .int JMPTBL (L(write_20bytes), L(table_less_32bytes))
|
|
- .int JMPTBL (L(write_21bytes), L(table_less_32bytes))
|
|
- .int JMPTBL (L(write_22bytes), L(table_less_32bytes))
|
|
- .int JMPTBL (L(write_23bytes), L(table_less_32bytes))
|
|
- .int JMPTBL (L(write_24bytes), L(table_less_32bytes))
|
|
- .int JMPTBL (L(write_25bytes), L(table_less_32bytes))
|
|
- .int JMPTBL (L(write_26bytes), L(table_less_32bytes))
|
|
- .int JMPTBL (L(write_27bytes), L(table_less_32bytes))
|
|
- .int JMPTBL (L(write_28bytes), L(table_less_32bytes))
|
|
- .int JMPTBL (L(write_29bytes), L(table_less_32bytes))
|
|
- .int JMPTBL (L(write_30bytes), L(table_less_32bytes))
|
|
- .int JMPTBL (L(write_31bytes), L(table_less_32bytes))
|
|
- .popsection
|
|
-
|
|
- ALIGN (4)
|
|
-L(write_28bytes):
|
|
- movl %eax, -28(%edx)
|
|
-L(write_24bytes):
|
|
- movl %eax, -24(%edx)
|
|
-L(write_20bytes):
|
|
- movl %eax, -20(%edx)
|
|
-L(write_16bytes):
|
|
- movl %eax, -16(%edx)
|
|
-L(write_12bytes):
|
|
- movl %eax, -12(%edx)
|
|
-L(write_8bytes):
|
|
- movl %eax, -8(%edx)
|
|
-L(write_4bytes):
|
|
- movl %eax, -4(%edx)
|
|
-L(write_0bytes):
|
|
- SETRTNVAL
|
|
- RETURN
|
|
-
|
|
- ALIGN (4)
|
|
-L(write_29bytes):
|
|
- movl %eax, -29(%edx)
|
|
-L(write_25bytes):
|
|
- movl %eax, -25(%edx)
|
|
-L(write_21bytes):
|
|
- movl %eax, -21(%edx)
|
|
-L(write_17bytes):
|
|
- movl %eax, -17(%edx)
|
|
-L(write_13bytes):
|
|
- movl %eax, -13(%edx)
|
|
-L(write_9bytes):
|
|
- movl %eax, -9(%edx)
|
|
-L(write_5bytes):
|
|
- movl %eax, -5(%edx)
|
|
-L(write_1bytes):
|
|
- movb %al, -1(%edx)
|
|
- SETRTNVAL
|
|
- RETURN
|
|
-
|
|
- ALIGN (4)
|
|
-L(write_30bytes):
|
|
- movl %eax, -30(%edx)
|
|
-L(write_26bytes):
|
|
- movl %eax, -26(%edx)
|
|
-L(write_22bytes):
|
|
- movl %eax, -22(%edx)
|
|
-L(write_18bytes):
|
|
- movl %eax, -18(%edx)
|
|
-L(write_14bytes):
|
|
- movl %eax, -14(%edx)
|
|
-L(write_10bytes):
|
|
- movl %eax, -10(%edx)
|
|
-L(write_6bytes):
|
|
- movl %eax, -6(%edx)
|
|
-L(write_2bytes):
|
|
- movw %ax, -2(%edx)
|
|
- SETRTNVAL
|
|
- RETURN
|
|
-
|
|
- ALIGN (4)
|
|
-L(write_31bytes):
|
|
- movl %eax, -31(%edx)
|
|
-L(write_27bytes):
|
|
- movl %eax, -27(%edx)
|
|
-L(write_23bytes):
|
|
- movl %eax, -23(%edx)
|
|
-L(write_19bytes):
|
|
- movl %eax, -19(%edx)
|
|
-L(write_15bytes):
|
|
- movl %eax, -15(%edx)
|
|
-L(write_11bytes):
|
|
- movl %eax, -11(%edx)
|
|
-L(write_7bytes):
|
|
- movl %eax, -7(%edx)
|
|
-L(write_3bytes):
|
|
- movw %ax, -3(%edx)
|
|
- movb %al, -1(%edx)
|
|
- SETRTNVAL
|
|
- RETURN
|
|
-
|
|
- ALIGN (4)
|
|
-/* ECX > 32 and EDX is 4 byte aligned. */
|
|
-L(32bytesormore):
|
|
- /* Fill xmm0 with the pattern. */
|
|
-#ifdef USE_AS_BZERO
|
|
- pxor %xmm0, %xmm0
|
|
-#else
|
|
- movd %eax, %xmm0
|
|
- punpcklbw %xmm0, %xmm0
|
|
- pshufd $0, %xmm0, %xmm0
|
|
-#endif
|
|
- testl $0xf, %edx
|
|
- jz L(aligned_16)
|
|
-/* ECX > 32 and EDX is not 16 byte aligned. */
|
|
-L(not_aligned_16):
|
|
- movdqu %xmm0, (%edx)
|
|
- movl %edx, %eax
|
|
- and $-16, %edx
|
|
- add $16, %edx
|
|
- sub %edx, %eax
|
|
- add %eax, %ecx
|
|
- movd %xmm0, %eax
|
|
-
|
|
- ALIGN (4)
|
|
-L(aligned_16):
|
|
- cmp $128, %ecx
|
|
- jge L(128bytesormore)
|
|
-
|
|
-L(aligned_16_less128bytes):
|
|
- BRANCH_TO_JMPTBL_ENTRY (L(table_16_128bytes))
|
|
-
|
|
- ALIGN (4)
|
|
-L(128bytesormore):
|
|
- PUSH (%edi)
|
|
-#ifdef DATA_CACHE_SIZE
|
|
- PUSH (%ebx)
|
|
- mov $DATA_CACHE_SIZE, %ebx
|
|
-#else
|
|
-# ifdef SHARED
|
|
- call __i686.get_pc_thunk.bx
|
|
- add $_GLOBAL_OFFSET_TABLE_, %ebx
|
|
- mov __x86_data_cache_size@GOTOFF(%ebx), %ebx
|
|
-# else
|
|
- PUSH (%ebx)
|
|
- mov __x86_data_cache_size, %ebx
|
|
-# endif
|
|
-#endif
|
|
- mov %ebx, %edi
|
|
- shr $4, %ebx
|
|
- sub %ebx, %edi
|
|
-#if defined DATA_CACHE_SIZE || !defined SHARED
|
|
- POP (%ebx)
|
|
-#endif
|
|
-/*
|
|
- * When data size approximate the end of L1 cache,
|
|
- * fast string will prefetch and combine data efficiently.
|
|
- */
|
|
- cmp %edi, %ecx
|
|
- jae L(128bytesormore_nt)
|
|
- subl $128, %ecx
|
|
-L(128bytesormore_normal):
|
|
- sub $128, %ecx
|
|
- movdqa %xmm0, (%edx)
|
|
- movdqa %xmm0, 0x10(%edx)
|
|
- movdqa %xmm0, 0x20(%edx)
|
|
- movdqa %xmm0, 0x30(%edx)
|
|
- movdqa %xmm0, 0x40(%edx)
|
|
- movdqa %xmm0, 0x50(%edx)
|
|
- movdqa %xmm0, 0x60(%edx)
|
|
- movdqa %xmm0, 0x70(%edx)
|
|
- lea 128(%edx), %edx
|
|
- jl L(128bytesless_normal)
|
|
-
|
|
-
|
|
- sub $128, %ecx
|
|
- movdqa %xmm0, (%edx)
|
|
- movdqa %xmm0, 0x10(%edx)
|
|
- movdqa %xmm0, 0x20(%edx)
|
|
- movdqa %xmm0, 0x30(%edx)
|
|
- movdqa %xmm0, 0x40(%edx)
|
|
- movdqa %xmm0, 0x50(%edx)
|
|
- movdqa %xmm0, 0x60(%edx)
|
|
- movdqa %xmm0, 0x70(%edx)
|
|
- lea 128(%edx), %edx
|
|
- jge L(128bytesormore_normal)
|
|
-
|
|
-L(128bytesless_normal):
|
|
- POP (%edi)
|
|
- lea 128(%ecx), %ecx
|
|
- BRANCH_TO_JMPTBL_ENTRY (L(table_16_128bytes))
|
|
-
|
|
- ALIGN (4)
|
|
-L(128bytesormore_nt):
|
|
- mov %edx, %edi
|
|
- mov %ecx, %edx
|
|
- shr $2, %ecx
|
|
- and $3, %edx
|
|
- rep stosl
|
|
- jz L(copy_page_by_rep_exit)
|
|
- cmp $2, %edx
|
|
- jb L(copy_page_by_rep_left_1)
|
|
- movw %ax, (%edi)
|
|
- add $2, %edi
|
|
- sub $2, %edx
|
|
- jz L(copy_page_by_rep_exit)
|
|
-L(copy_page_by_rep_left_1):
|
|
- movb %al, (%edi)
|
|
-L(copy_page_by_rep_exit):
|
|
- POP (%edi)
|
|
- SETRTNVAL
|
|
- RETURN
|
|
-
|
|
- .pushsection .rodata.sse2,"a",@progbits
|
|
- ALIGN (2)
|
|
-L(table_16_128bytes):
|
|
- .int JMPTBL (L(aligned_16_0bytes), L(table_16_128bytes))
|
|
- .int JMPTBL (L(aligned_16_1bytes), L(table_16_128bytes))
|
|
- .int JMPTBL (L(aligned_16_2bytes), L(table_16_128bytes))
|
|
- .int JMPTBL (L(aligned_16_3bytes), L(table_16_128bytes))
|
|
- .int JMPTBL (L(aligned_16_4bytes), L(table_16_128bytes))
|
|
- .int JMPTBL (L(aligned_16_5bytes), L(table_16_128bytes))
|
|
- .int JMPTBL (L(aligned_16_6bytes), L(table_16_128bytes))
|
|
- .int JMPTBL (L(aligned_16_7bytes), L(table_16_128bytes))
|
|
- .int JMPTBL (L(aligned_16_8bytes), L(table_16_128bytes))
|
|
- .int JMPTBL (L(aligned_16_9bytes), L(table_16_128bytes))
|
|
- .int JMPTBL (L(aligned_16_10bytes), L(table_16_128bytes))
|
|
- .int JMPTBL (L(aligned_16_11bytes), L(table_16_128bytes))
|
|
- .int JMPTBL (L(aligned_16_12bytes), L(table_16_128bytes))
|
|
- .int JMPTBL (L(aligned_16_13bytes), L(table_16_128bytes))
|
|
- .int JMPTBL (L(aligned_16_14bytes), L(table_16_128bytes))
|
|
- .int JMPTBL (L(aligned_16_15bytes), L(table_16_128bytes))
|
|
- .int JMPTBL (L(aligned_16_16bytes), L(table_16_128bytes))
|
|
- .int JMPTBL (L(aligned_16_17bytes), L(table_16_128bytes))
|
|
- .int JMPTBL (L(aligned_16_18bytes), L(table_16_128bytes))
|
|
- .int JMPTBL (L(aligned_16_19bytes), L(table_16_128bytes))
|
|
- .int JMPTBL (L(aligned_16_20bytes), L(table_16_128bytes))
|
|
- .int JMPTBL (L(aligned_16_21bytes), L(table_16_128bytes))
|
|
- .int JMPTBL (L(aligned_16_22bytes), L(table_16_128bytes))
|
|
- .int JMPTBL (L(aligned_16_23bytes), L(table_16_128bytes))
|
|
- .int JMPTBL (L(aligned_16_24bytes), L(table_16_128bytes))
|
|
- .int JMPTBL (L(aligned_16_25bytes), L(table_16_128bytes))
|
|
- .int JMPTBL (L(aligned_16_26bytes), L(table_16_128bytes))
|
|
- .int JMPTBL (L(aligned_16_27bytes), L(table_16_128bytes))
|
|
- .int JMPTBL (L(aligned_16_28bytes), L(table_16_128bytes))
|
|
- .int JMPTBL (L(aligned_16_29bytes), L(table_16_128bytes))
|
|
- .int JMPTBL (L(aligned_16_30bytes), L(table_16_128bytes))
|
|
- .int JMPTBL (L(aligned_16_31bytes), L(table_16_128bytes))
|
|
- .int JMPTBL (L(aligned_16_32bytes), L(table_16_128bytes))
|
|
- .int JMPTBL (L(aligned_16_33bytes), L(table_16_128bytes))
|
|
- .int JMPTBL (L(aligned_16_34bytes), L(table_16_128bytes))
|
|
- .int JMPTBL (L(aligned_16_35bytes), L(table_16_128bytes))
|
|
- .int JMPTBL (L(aligned_16_36bytes), L(table_16_128bytes))
|
|
- .int JMPTBL (L(aligned_16_37bytes), L(table_16_128bytes))
|
|
- .int JMPTBL (L(aligned_16_38bytes), L(table_16_128bytes))
|
|
- .int JMPTBL (L(aligned_16_39bytes), L(table_16_128bytes))
|
|
- .int JMPTBL (L(aligned_16_40bytes), L(table_16_128bytes))
|
|
- .int JMPTBL (L(aligned_16_41bytes), L(table_16_128bytes))
|
|
- .int JMPTBL (L(aligned_16_42bytes), L(table_16_128bytes))
|
|
- .int JMPTBL (L(aligned_16_43bytes), L(table_16_128bytes))
|
|
- .int JMPTBL (L(aligned_16_44bytes), L(table_16_128bytes))
|
|
- .int JMPTBL (L(aligned_16_45bytes), L(table_16_128bytes))
|
|
- .int JMPTBL (L(aligned_16_46bytes), L(table_16_128bytes))
|
|
- .int JMPTBL (L(aligned_16_47bytes), L(table_16_128bytes))
|
|
- .int JMPTBL (L(aligned_16_48bytes), L(table_16_128bytes))
|
|
- .int JMPTBL (L(aligned_16_49bytes), L(table_16_128bytes))
|
|
- .int JMPTBL (L(aligned_16_50bytes), L(table_16_128bytes))
|
|
- .int JMPTBL (L(aligned_16_51bytes), L(table_16_128bytes))
|
|
- .int JMPTBL (L(aligned_16_52bytes), L(table_16_128bytes))
|
|
- .int JMPTBL (L(aligned_16_53bytes), L(table_16_128bytes))
|
|
- .int JMPTBL (L(aligned_16_54bytes), L(table_16_128bytes))
|
|
- .int JMPTBL (L(aligned_16_55bytes), L(table_16_128bytes))
|
|
- .int JMPTBL (L(aligned_16_56bytes), L(table_16_128bytes))
|
|
- .int JMPTBL (L(aligned_16_57bytes), L(table_16_128bytes))
|
|
- .int JMPTBL (L(aligned_16_58bytes), L(table_16_128bytes))
|
|
- .int JMPTBL (L(aligned_16_59bytes), L(table_16_128bytes))
|
|
- .int JMPTBL (L(aligned_16_60bytes), L(table_16_128bytes))
|
|
- .int JMPTBL (L(aligned_16_61bytes), L(table_16_128bytes))
|
|
- .int JMPTBL (L(aligned_16_62bytes), L(table_16_128bytes))
|
|
- .int JMPTBL (L(aligned_16_63bytes), L(table_16_128bytes))
|
|
- .int JMPTBL (L(aligned_16_64bytes), L(table_16_128bytes))
|
|
- .int JMPTBL (L(aligned_16_65bytes), L(table_16_128bytes))
|
|
- .int JMPTBL (L(aligned_16_66bytes), L(table_16_128bytes))
|
|
- .int JMPTBL (L(aligned_16_67bytes), L(table_16_128bytes))
|
|
- .int JMPTBL (L(aligned_16_68bytes), L(table_16_128bytes))
|
|
- .int JMPTBL (L(aligned_16_69bytes), L(table_16_128bytes))
|
|
- .int JMPTBL (L(aligned_16_70bytes), L(table_16_128bytes))
|
|
- .int JMPTBL (L(aligned_16_71bytes), L(table_16_128bytes))
|
|
- .int JMPTBL (L(aligned_16_72bytes), L(table_16_128bytes))
|
|
- .int JMPTBL (L(aligned_16_73bytes), L(table_16_128bytes))
|
|
- .int JMPTBL (L(aligned_16_74bytes), L(table_16_128bytes))
|
|
- .int JMPTBL (L(aligned_16_75bytes), L(table_16_128bytes))
|
|
- .int JMPTBL (L(aligned_16_76bytes), L(table_16_128bytes))
|
|
- .int JMPTBL (L(aligned_16_77bytes), L(table_16_128bytes))
|
|
- .int JMPTBL (L(aligned_16_78bytes), L(table_16_128bytes))
|
|
- .int JMPTBL (L(aligned_16_79bytes), L(table_16_128bytes))
|
|
- .int JMPTBL (L(aligned_16_80bytes), L(table_16_128bytes))
|
|
- .int JMPTBL (L(aligned_16_81bytes), L(table_16_128bytes))
|
|
- .int JMPTBL (L(aligned_16_82bytes), L(table_16_128bytes))
|
|
- .int JMPTBL (L(aligned_16_83bytes), L(table_16_128bytes))
|
|
- .int JMPTBL (L(aligned_16_84bytes), L(table_16_128bytes))
|
|
- .int JMPTBL (L(aligned_16_85bytes), L(table_16_128bytes))
|
|
- .int JMPTBL (L(aligned_16_86bytes), L(table_16_128bytes))
|
|
- .int JMPTBL (L(aligned_16_87bytes), L(table_16_128bytes))
|
|
- .int JMPTBL (L(aligned_16_88bytes), L(table_16_128bytes))
|
|
- .int JMPTBL (L(aligned_16_89bytes), L(table_16_128bytes))
|
|
- .int JMPTBL (L(aligned_16_90bytes), L(table_16_128bytes))
|
|
- .int JMPTBL (L(aligned_16_91bytes), L(table_16_128bytes))
|
|
- .int JMPTBL (L(aligned_16_92bytes), L(table_16_128bytes))
|
|
- .int JMPTBL (L(aligned_16_93bytes), L(table_16_128bytes))
|
|
- .int JMPTBL (L(aligned_16_94bytes), L(table_16_128bytes))
|
|
- .int JMPTBL (L(aligned_16_95bytes), L(table_16_128bytes))
|
|
- .int JMPTBL (L(aligned_16_96bytes), L(table_16_128bytes))
|
|
- .int JMPTBL (L(aligned_16_97bytes), L(table_16_128bytes))
|
|
- .int JMPTBL (L(aligned_16_98bytes), L(table_16_128bytes))
|
|
- .int JMPTBL (L(aligned_16_99bytes), L(table_16_128bytes))
|
|
- .int JMPTBL (L(aligned_16_100bytes), L(table_16_128bytes))
|
|
- .int JMPTBL (L(aligned_16_101bytes), L(table_16_128bytes))
|
|
- .int JMPTBL (L(aligned_16_102bytes), L(table_16_128bytes))
|
|
- .int JMPTBL (L(aligned_16_103bytes), L(table_16_128bytes))
|
|
- .int JMPTBL (L(aligned_16_104bytes), L(table_16_128bytes))
|
|
- .int JMPTBL (L(aligned_16_105bytes), L(table_16_128bytes))
|
|
- .int JMPTBL (L(aligned_16_106bytes), L(table_16_128bytes))
|
|
- .int JMPTBL (L(aligned_16_107bytes), L(table_16_128bytes))
|
|
- .int JMPTBL (L(aligned_16_108bytes), L(table_16_128bytes))
|
|
- .int JMPTBL (L(aligned_16_109bytes), L(table_16_128bytes))
|
|
- .int JMPTBL (L(aligned_16_110bytes), L(table_16_128bytes))
|
|
- .int JMPTBL (L(aligned_16_111bytes), L(table_16_128bytes))
|
|
- .int JMPTBL (L(aligned_16_112bytes), L(table_16_128bytes))
|
|
- .int JMPTBL (L(aligned_16_113bytes), L(table_16_128bytes))
|
|
- .int JMPTBL (L(aligned_16_114bytes), L(table_16_128bytes))
|
|
- .int JMPTBL (L(aligned_16_115bytes), L(table_16_128bytes))
|
|
- .int JMPTBL (L(aligned_16_116bytes), L(table_16_128bytes))
|
|
- .int JMPTBL (L(aligned_16_117bytes), L(table_16_128bytes))
|
|
- .int JMPTBL (L(aligned_16_118bytes), L(table_16_128bytes))
|
|
- .int JMPTBL (L(aligned_16_119bytes), L(table_16_128bytes))
|
|
- .int JMPTBL (L(aligned_16_120bytes), L(table_16_128bytes))
|
|
- .int JMPTBL (L(aligned_16_121bytes), L(table_16_128bytes))
|
|
- .int JMPTBL (L(aligned_16_122bytes), L(table_16_128bytes))
|
|
- .int JMPTBL (L(aligned_16_123bytes), L(table_16_128bytes))
|
|
- .int JMPTBL (L(aligned_16_124bytes), L(table_16_128bytes))
|
|
- .int JMPTBL (L(aligned_16_125bytes), L(table_16_128bytes))
|
|
- .int JMPTBL (L(aligned_16_126bytes), L(table_16_128bytes))
|
|
- .int JMPTBL (L(aligned_16_127bytes), L(table_16_128bytes))
|
|
- .popsection
|
|
-
|
|
- ALIGN (4)
|
|
-L(aligned_16_112bytes):
|
|
- movdqa %xmm0, -112(%edx)
|
|
-L(aligned_16_96bytes):
|
|
- movdqa %xmm0, -96(%edx)
|
|
-L(aligned_16_80bytes):
|
|
- movdqa %xmm0, -80(%edx)
|
|
-L(aligned_16_64bytes):
|
|
- movdqa %xmm0, -64(%edx)
|
|
-L(aligned_16_48bytes):
|
|
- movdqa %xmm0, -48(%edx)
|
|
-L(aligned_16_32bytes):
|
|
- movdqa %xmm0, -32(%edx)
|
|
-L(aligned_16_16bytes):
|
|
- movdqa %xmm0, -16(%edx)
|
|
-L(aligned_16_0bytes):
|
|
- SETRTNVAL
|
|
- RETURN
|
|
-
|
|
- ALIGN (4)
|
|
-L(aligned_16_113bytes):
|
|
- movdqa %xmm0, -113(%edx)
|
|
-L(aligned_16_97bytes):
|
|
- movdqa %xmm0, -97(%edx)
|
|
-L(aligned_16_81bytes):
|
|
- movdqa %xmm0, -81(%edx)
|
|
-L(aligned_16_65bytes):
|
|
- movdqa %xmm0, -65(%edx)
|
|
-L(aligned_16_49bytes):
|
|
- movdqa %xmm0, -49(%edx)
|
|
-L(aligned_16_33bytes):
|
|
- movdqa %xmm0, -33(%edx)
|
|
-L(aligned_16_17bytes):
|
|
- movdqa %xmm0, -17(%edx)
|
|
-L(aligned_16_1bytes):
|
|
- movb %al, -1(%edx)
|
|
- SETRTNVAL
|
|
- RETURN
|
|
-
|
|
- ALIGN (4)
|
|
-L(aligned_16_114bytes):
|
|
- movdqa %xmm0, -114(%edx)
|
|
-L(aligned_16_98bytes):
|
|
- movdqa %xmm0, -98(%edx)
|
|
-L(aligned_16_82bytes):
|
|
- movdqa %xmm0, -82(%edx)
|
|
-L(aligned_16_66bytes):
|
|
- movdqa %xmm0, -66(%edx)
|
|
-L(aligned_16_50bytes):
|
|
- movdqa %xmm0, -50(%edx)
|
|
-L(aligned_16_34bytes):
|
|
- movdqa %xmm0, -34(%edx)
|
|
-L(aligned_16_18bytes):
|
|
- movdqa %xmm0, -18(%edx)
|
|
-L(aligned_16_2bytes):
|
|
- movw %ax, -2(%edx)
|
|
- SETRTNVAL
|
|
- RETURN
|
|
-
|
|
- ALIGN (4)
|
|
-L(aligned_16_115bytes):
|
|
- movdqa %xmm0, -115(%edx)
|
|
-L(aligned_16_99bytes):
|
|
- movdqa %xmm0, -99(%edx)
|
|
-L(aligned_16_83bytes):
|
|
- movdqa %xmm0, -83(%edx)
|
|
-L(aligned_16_67bytes):
|
|
- movdqa %xmm0, -67(%edx)
|
|
-L(aligned_16_51bytes):
|
|
- movdqa %xmm0, -51(%edx)
|
|
-L(aligned_16_35bytes):
|
|
- movdqa %xmm0, -35(%edx)
|
|
-L(aligned_16_19bytes):
|
|
- movdqa %xmm0, -19(%edx)
|
|
-L(aligned_16_3bytes):
|
|
- movw %ax, -3(%edx)
|
|
- movb %al, -1(%edx)
|
|
- SETRTNVAL
|
|
- RETURN
|
|
-
|
|
- ALIGN (4)
|
|
-L(aligned_16_116bytes):
|
|
- movdqa %xmm0, -116(%edx)
|
|
-L(aligned_16_100bytes):
|
|
- movdqa %xmm0, -100(%edx)
|
|
-L(aligned_16_84bytes):
|
|
- movdqa %xmm0, -84(%edx)
|
|
-L(aligned_16_68bytes):
|
|
- movdqa %xmm0, -68(%edx)
|
|
-L(aligned_16_52bytes):
|
|
- movdqa %xmm0, -52(%edx)
|
|
-L(aligned_16_36bytes):
|
|
- movdqa %xmm0, -36(%edx)
|
|
-L(aligned_16_20bytes):
|
|
- movdqa %xmm0, -20(%edx)
|
|
-L(aligned_16_4bytes):
|
|
- movl %eax, -4(%edx)
|
|
- SETRTNVAL
|
|
- RETURN
|
|
-
|
|
- ALIGN (4)
|
|
-L(aligned_16_117bytes):
|
|
- movdqa %xmm0, -117(%edx)
|
|
-L(aligned_16_101bytes):
|
|
- movdqa %xmm0, -101(%edx)
|
|
-L(aligned_16_85bytes):
|
|
- movdqa %xmm0, -85(%edx)
|
|
-L(aligned_16_69bytes):
|
|
- movdqa %xmm0, -69(%edx)
|
|
-L(aligned_16_53bytes):
|
|
- movdqa %xmm0, -53(%edx)
|
|
-L(aligned_16_37bytes):
|
|
- movdqa %xmm0, -37(%edx)
|
|
-L(aligned_16_21bytes):
|
|
- movdqa %xmm0, -21(%edx)
|
|
-L(aligned_16_5bytes):
|
|
- movl %eax, -5(%edx)
|
|
- movb %al, -1(%edx)
|
|
- SETRTNVAL
|
|
- RETURN
|
|
-
|
|
- ALIGN (4)
|
|
-L(aligned_16_118bytes):
|
|
- movdqa %xmm0, -118(%edx)
|
|
-L(aligned_16_102bytes):
|
|
- movdqa %xmm0, -102(%edx)
|
|
-L(aligned_16_86bytes):
|
|
- movdqa %xmm0, -86(%edx)
|
|
-L(aligned_16_70bytes):
|
|
- movdqa %xmm0, -70(%edx)
|
|
-L(aligned_16_54bytes):
|
|
- movdqa %xmm0, -54(%edx)
|
|
-L(aligned_16_38bytes):
|
|
- movdqa %xmm0, -38(%edx)
|
|
-L(aligned_16_22bytes):
|
|
- movdqa %xmm0, -22(%edx)
|
|
-L(aligned_16_6bytes):
|
|
- movl %eax, -6(%edx)
|
|
- movw %ax, -2(%edx)
|
|
- SETRTNVAL
|
|
- RETURN
|
|
-
|
|
- ALIGN (4)
|
|
-L(aligned_16_119bytes):
|
|
- movdqa %xmm0, -119(%edx)
|
|
-L(aligned_16_103bytes):
|
|
- movdqa %xmm0, -103(%edx)
|
|
-L(aligned_16_87bytes):
|
|
- movdqa %xmm0, -87(%edx)
|
|
-L(aligned_16_71bytes):
|
|
- movdqa %xmm0, -71(%edx)
|
|
-L(aligned_16_55bytes):
|
|
- movdqa %xmm0, -55(%edx)
|
|
-L(aligned_16_39bytes):
|
|
- movdqa %xmm0, -39(%edx)
|
|
-L(aligned_16_23bytes):
|
|
- movdqa %xmm0, -23(%edx)
|
|
-L(aligned_16_7bytes):
|
|
- movl %eax, -7(%edx)
|
|
- movw %ax, -3(%edx)
|
|
- movb %al, -1(%edx)
|
|
- SETRTNVAL
|
|
- RETURN
|
|
-
|
|
- ALIGN (4)
|
|
-L(aligned_16_120bytes):
|
|
- movdqa %xmm0, -120(%edx)
|
|
-L(aligned_16_104bytes):
|
|
- movdqa %xmm0, -104(%edx)
|
|
-L(aligned_16_88bytes):
|
|
- movdqa %xmm0, -88(%edx)
|
|
-L(aligned_16_72bytes):
|
|
- movdqa %xmm0, -72(%edx)
|
|
-L(aligned_16_56bytes):
|
|
- movdqa %xmm0, -56(%edx)
|
|
-L(aligned_16_40bytes):
|
|
- movdqa %xmm0, -40(%edx)
|
|
-L(aligned_16_24bytes):
|
|
- movdqa %xmm0, -24(%edx)
|
|
-L(aligned_16_8bytes):
|
|
- movq %xmm0, -8(%edx)
|
|
- SETRTNVAL
|
|
- RETURN
|
|
-
|
|
- ALIGN (4)
|
|
-L(aligned_16_121bytes):
|
|
- movdqa %xmm0, -121(%edx)
|
|
-L(aligned_16_105bytes):
|
|
- movdqa %xmm0, -105(%edx)
|
|
-L(aligned_16_89bytes):
|
|
- movdqa %xmm0, -89(%edx)
|
|
-L(aligned_16_73bytes):
|
|
- movdqa %xmm0, -73(%edx)
|
|
-L(aligned_16_57bytes):
|
|
- movdqa %xmm0, -57(%edx)
|
|
-L(aligned_16_41bytes):
|
|
- movdqa %xmm0, -41(%edx)
|
|
-L(aligned_16_25bytes):
|
|
- movdqa %xmm0, -25(%edx)
|
|
-L(aligned_16_9bytes):
|
|
- movq %xmm0, -9(%edx)
|
|
- movb %al, -1(%edx)
|
|
- SETRTNVAL
|
|
- RETURN
|
|
-
|
|
- ALIGN (4)
|
|
-L(aligned_16_122bytes):
|
|
- movdqa %xmm0, -122(%edx)
|
|
-L(aligned_16_106bytes):
|
|
- movdqa %xmm0, -106(%edx)
|
|
-L(aligned_16_90bytes):
|
|
- movdqa %xmm0, -90(%edx)
|
|
-L(aligned_16_74bytes):
|
|
- movdqa %xmm0, -74(%edx)
|
|
-L(aligned_16_58bytes):
|
|
- movdqa %xmm0, -58(%edx)
|
|
-L(aligned_16_42bytes):
|
|
- movdqa %xmm0, -42(%edx)
|
|
-L(aligned_16_26bytes):
|
|
- movdqa %xmm0, -26(%edx)
|
|
-L(aligned_16_10bytes):
|
|
- movq %xmm0, -10(%edx)
|
|
- movw %ax, -2(%edx)
|
|
- SETRTNVAL
|
|
- RETURN
|
|
-
|
|
- ALIGN (4)
|
|
-L(aligned_16_123bytes):
|
|
- movdqa %xmm0, -123(%edx)
|
|
-L(aligned_16_107bytes):
|
|
- movdqa %xmm0, -107(%edx)
|
|
-L(aligned_16_91bytes):
|
|
- movdqa %xmm0, -91(%edx)
|
|
-L(aligned_16_75bytes):
|
|
- movdqa %xmm0, -75(%edx)
|
|
-L(aligned_16_59bytes):
|
|
- movdqa %xmm0, -59(%edx)
|
|
-L(aligned_16_43bytes):
|
|
- movdqa %xmm0, -43(%edx)
|
|
-L(aligned_16_27bytes):
|
|
- movdqa %xmm0, -27(%edx)
|
|
-L(aligned_16_11bytes):
|
|
- movq %xmm0, -11(%edx)
|
|
- movw %ax, -3(%edx)
|
|
- movb %al, -1(%edx)
|
|
- SETRTNVAL
|
|
- RETURN
|
|
-
|
|
- ALIGN (4)
|
|
-L(aligned_16_124bytes):
|
|
- movdqa %xmm0, -124(%edx)
|
|
-L(aligned_16_108bytes):
|
|
- movdqa %xmm0, -108(%edx)
|
|
-L(aligned_16_92bytes):
|
|
- movdqa %xmm0, -92(%edx)
|
|
-L(aligned_16_76bytes):
|
|
- movdqa %xmm0, -76(%edx)
|
|
-L(aligned_16_60bytes):
|
|
- movdqa %xmm0, -60(%edx)
|
|
-L(aligned_16_44bytes):
|
|
- movdqa %xmm0, -44(%edx)
|
|
-L(aligned_16_28bytes):
|
|
- movdqa %xmm0, -28(%edx)
|
|
-L(aligned_16_12bytes):
|
|
- movq %xmm0, -12(%edx)
|
|
- movl %eax, -4(%edx)
|
|
- SETRTNVAL
|
|
- RETURN
|
|
-
|
|
- ALIGN (4)
|
|
-L(aligned_16_125bytes):
|
|
- movdqa %xmm0, -125(%edx)
|
|
-L(aligned_16_109bytes):
|
|
- movdqa %xmm0, -109(%edx)
|
|
-L(aligned_16_93bytes):
|
|
- movdqa %xmm0, -93(%edx)
|
|
-L(aligned_16_77bytes):
|
|
- movdqa %xmm0, -77(%edx)
|
|
-L(aligned_16_61bytes):
|
|
- movdqa %xmm0, -61(%edx)
|
|
-L(aligned_16_45bytes):
|
|
- movdqa %xmm0, -45(%edx)
|
|
-L(aligned_16_29bytes):
|
|
- movdqa %xmm0, -29(%edx)
|
|
-L(aligned_16_13bytes):
|
|
- movq %xmm0, -13(%edx)
|
|
- movl %eax, -5(%edx)
|
|
- movb %al, -1(%edx)
|
|
- SETRTNVAL
|
|
- RETURN
|
|
-
|
|
- ALIGN (4)
|
|
-L(aligned_16_126bytes):
|
|
- movdqa %xmm0, -126(%edx)
|
|
-L(aligned_16_110bytes):
|
|
- movdqa %xmm0, -110(%edx)
|
|
-L(aligned_16_94bytes):
|
|
- movdqa %xmm0, -94(%edx)
|
|
-L(aligned_16_78bytes):
|
|
- movdqa %xmm0, -78(%edx)
|
|
-L(aligned_16_62bytes):
|
|
- movdqa %xmm0, -62(%edx)
|
|
-L(aligned_16_46bytes):
|
|
- movdqa %xmm0, -46(%edx)
|
|
-L(aligned_16_30bytes):
|
|
- movdqa %xmm0, -30(%edx)
|
|
-L(aligned_16_14bytes):
|
|
- movq %xmm0, -14(%edx)
|
|
- movl %eax, -6(%edx)
|
|
- movw %ax, -2(%edx)
|
|
- SETRTNVAL
|
|
- RETURN
|
|
-
|
|
- ALIGN (4)
|
|
-L(aligned_16_127bytes):
|
|
- movdqa %xmm0, -127(%edx)
|
|
-L(aligned_16_111bytes):
|
|
- movdqa %xmm0, -111(%edx)
|
|
-L(aligned_16_95bytes):
|
|
- movdqa %xmm0, -95(%edx)
|
|
-L(aligned_16_79bytes):
|
|
- movdqa %xmm0, -79(%edx)
|
|
-L(aligned_16_63bytes):
|
|
- movdqa %xmm0, -63(%edx)
|
|
-L(aligned_16_47bytes):
|
|
- movdqa %xmm0, -47(%edx)
|
|
-L(aligned_16_31bytes):
|
|
- movdqa %xmm0, -31(%edx)
|
|
-L(aligned_16_15bytes):
|
|
- movq %xmm0, -15(%edx)
|
|
- movl %eax, -7(%edx)
|
|
- movw %ax, -3(%edx)
|
|
- movb %al, -1(%edx)
|
|
- SETRTNVAL
|
|
- RETURN_END
|
|
-
|
|
-END (__memset_sse2_rep)
|
|
-
|
|
-#endif
|
|
--- glibc-2.11-175-gb34e12e/sysdeps/i386/i686/multiarch/memset-sse2.S
|
|
+++ glibc-2.11.90-11//dev/null
|
|
@@ -1,867 +0,0 @@
|
|
-/* memset with SSE2
|
|
- Copyright (C) 2010 Free Software Foundation, Inc.
|
|
- Contributed by Intel Corporation.
|
|
- This file is part of the GNU C Library.
|
|
-
|
|
- The GNU C Library is free software; you can redistribute it and/or
|
|
- modify it under the terms of the GNU Lesser General Public
|
|
- License as published by the Free Software Foundation; either
|
|
- version 2.1 of the License, or (at your option) any later version.
|
|
-
|
|
- The GNU C Library is distributed in the hope that it will be useful,
|
|
- but WITHOUT ANY WARRANTY; without even the implied warranty of
|
|
- MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU
|
|
- Lesser General Public License for more details.
|
|
-
|
|
- You should have received a copy of the GNU Lesser General Public
|
|
- License along with the GNU C Library; if not, write to the Free
|
|
- Software Foundation, Inc., 59 Temple Place, Suite 330, Boston, MA
|
|
- 02111-1307 USA. */
|
|
-
|
|
-#ifndef NOT_IN_libc
|
|
-
|
|
-#include <sysdep.h>
|
|
-#include "asm-syntax.h"
|
|
-
|
|
-#define CFI_PUSH(REG) \
|
|
- cfi_adjust_cfa_offset (4); \
|
|
- cfi_rel_offset (REG, 0)
|
|
-
|
|
-#define CFI_POP(REG) \
|
|
- cfi_adjust_cfa_offset (-4); \
|
|
- cfi_restore (REG)
|
|
-
|
|
-#define PUSH(REG) pushl REG; CFI_PUSH (REG)
|
|
-#define POP(REG) popl REG; CFI_POP (REG)
|
|
-
|
|
-#ifdef USE_AS_BZERO
|
|
-# define DEST PARMS
|
|
-# define LEN DEST+4
|
|
-# define SETRTNVAL
|
|
-#else
|
|
-# define DEST PARMS
|
|
-# define CHR DEST+4
|
|
-# define LEN CHR+4
|
|
-# define SETRTNVAL movl DEST(%esp), %eax
|
|
-#endif
|
|
-
|
|
-#ifdef SHARED
|
|
-# define ENTRANCE PUSH (%ebx);
|
|
-# define RETURN_END POP (%ebx); ret
|
|
-# define RETURN RETURN_END; CFI_PUSH (%ebx)
|
|
-# define PARMS 8 /* Preserve EBX. */
|
|
-# define JMPTBL(I, B) I - B
|
|
-
|
|
-/* Load an entry in a jump table into EBX and branch to it. TABLE is a
|
|
- jump table with relative offsets. */
|
|
-# define BRANCH_TO_JMPTBL_ENTRY(TABLE) \
|
|
- /* We first load PC into EBX. */ \
|
|
- call __i686.get_pc_thunk.bx; \
|
|
- /* Get the address of the jump table. */ \
|
|
- add $(TABLE - .), %ebx; \
|
|
- /* Get the entry and convert the relative offset to the \
|
|
- absolute address. */ \
|
|
- add (%ebx,%ecx,4), %ebx; \
|
|
- add %ecx, %edx; \
|
|
- /* We loaded the jump table and adjuested EDX. Go. */ \
|
|
- jmp *%ebx
|
|
-
|
|
- .section .gnu.linkonce.t.__i686.get_pc_thunk.bx,"ax",@progbits
|
|
- .globl __i686.get_pc_thunk.bx
|
|
- .hidden __i686.get_pc_thunk.bx
|
|
- ALIGN (4)
|
|
- .type __i686.get_pc_thunk.bx,@function
|
|
-__i686.get_pc_thunk.bx:
|
|
- movl (%esp), %ebx
|
|
- ret
|
|
-#else
|
|
-# define ENTRANCE
|
|
-# define RETURN_END ret
|
|
-# define RETURN RETURN_END
|
|
-# define PARMS 4
|
|
-# define JMPTBL(I, B) I
|
|
-
|
|
-/* Branch to an entry in a jump table. TABLE is a jump table with
|
|
- absolute offsets. */
|
|
-# define BRANCH_TO_JMPTBL_ENTRY(TABLE) \
|
|
- add %ecx, %edx; \
|
|
- jmp *TABLE(,%ecx,4)
|
|
-#endif
|
|
-
|
|
- .section .text.sse2,"ax",@progbits
|
|
-#if defined SHARED && !defined NOT_IN_libc && !defined USE_AS_BZERO
|
|
-ENTRY (__memset_chk_sse2)
|
|
- movl 12(%esp), %eax
|
|
- cmpl %eax, 16(%esp)
|
|
- jb HIDDEN_JUMPTARGET (__chk_fail)
|
|
-END (__memset_chk_sse2)
|
|
-#endif
|
|
-ENTRY (__memset_sse2)
|
|
- ENTRANCE
|
|
-
|
|
- movl LEN(%esp), %ecx
|
|
-#ifdef USE_AS_BZERO
|
|
- xor %eax, %eax
|
|
-#else
|
|
- movzbl CHR(%esp), %eax
|
|
- movb %al, %ah
|
|
- /* Fill the whole EAX with pattern. */
|
|
- movl %eax, %edx
|
|
- shl $16, %eax
|
|
- or %edx, %eax
|
|
-#endif
|
|
- movl DEST(%esp), %edx
|
|
- cmp $32, %ecx
|
|
- jae L(32bytesormore)
|
|
-
|
|
-L(write_less32bytes):
|
|
- BRANCH_TO_JMPTBL_ENTRY (L(table_less_32bytes))
|
|
-
|
|
-
|
|
- .pushsection .rodata.sse2,"a",@progbits
|
|
- ALIGN (2)
|
|
-L(table_less_32bytes):
|
|
- .int JMPTBL (L(write_0bytes), L(table_less_32bytes))
|
|
- .int JMPTBL (L(write_1bytes), L(table_less_32bytes))
|
|
- .int JMPTBL (L(write_2bytes), L(table_less_32bytes))
|
|
- .int JMPTBL (L(write_3bytes), L(table_less_32bytes))
|
|
- .int JMPTBL (L(write_4bytes), L(table_less_32bytes))
|
|
- .int JMPTBL (L(write_5bytes), L(table_less_32bytes))
|
|
- .int JMPTBL (L(write_6bytes), L(table_less_32bytes))
|
|
- .int JMPTBL (L(write_7bytes), L(table_less_32bytes))
|
|
- .int JMPTBL (L(write_8bytes), L(table_less_32bytes))
|
|
- .int JMPTBL (L(write_9bytes), L(table_less_32bytes))
|
|
- .int JMPTBL (L(write_10bytes), L(table_less_32bytes))
|
|
- .int JMPTBL (L(write_11bytes), L(table_less_32bytes))
|
|
- .int JMPTBL (L(write_12bytes), L(table_less_32bytes))
|
|
- .int JMPTBL (L(write_13bytes), L(table_less_32bytes))
|
|
- .int JMPTBL (L(write_14bytes), L(table_less_32bytes))
|
|
- .int JMPTBL (L(write_15bytes), L(table_less_32bytes))
|
|
- .int JMPTBL (L(write_16bytes), L(table_less_32bytes))
|
|
- .int JMPTBL (L(write_17bytes), L(table_less_32bytes))
|
|
- .int JMPTBL (L(write_18bytes), L(table_less_32bytes))
|
|
- .int JMPTBL (L(write_19bytes), L(table_less_32bytes))
|
|
- .int JMPTBL (L(write_20bytes), L(table_less_32bytes))
|
|
- .int JMPTBL (L(write_21bytes), L(table_less_32bytes))
|
|
- .int JMPTBL (L(write_22bytes), L(table_less_32bytes))
|
|
- .int JMPTBL (L(write_23bytes), L(table_less_32bytes))
|
|
- .int JMPTBL (L(write_24bytes), L(table_less_32bytes))
|
|
- .int JMPTBL (L(write_25bytes), L(table_less_32bytes))
|
|
- .int JMPTBL (L(write_26bytes), L(table_less_32bytes))
|
|
- .int JMPTBL (L(write_27bytes), L(table_less_32bytes))
|
|
- .int JMPTBL (L(write_28bytes), L(table_less_32bytes))
|
|
- .int JMPTBL (L(write_29bytes), L(table_less_32bytes))
|
|
- .int JMPTBL (L(write_30bytes), L(table_less_32bytes))
|
|
- .int JMPTBL (L(write_31bytes), L(table_less_32bytes))
|
|
- .popsection
|
|
-
|
|
- ALIGN (4)
|
|
-L(write_28bytes):
|
|
- movl %eax, -28(%edx)
|
|
-L(write_24bytes):
|
|
- movl %eax, -24(%edx)
|
|
-L(write_20bytes):
|
|
- movl %eax, -20(%edx)
|
|
-L(write_16bytes):
|
|
- movl %eax, -16(%edx)
|
|
-L(write_12bytes):
|
|
- movl %eax, -12(%edx)
|
|
-L(write_8bytes):
|
|
- movl %eax, -8(%edx)
|
|
-L(write_4bytes):
|
|
- movl %eax, -4(%edx)
|
|
-L(write_0bytes):
|
|
- SETRTNVAL
|
|
- RETURN
|
|
-
|
|
- ALIGN (4)
|
|
-L(write_29bytes):
|
|
- movl %eax, -29(%edx)
|
|
-L(write_25bytes):
|
|
- movl %eax, -25(%edx)
|
|
-L(write_21bytes):
|
|
- movl %eax, -21(%edx)
|
|
-L(write_17bytes):
|
|
- movl %eax, -17(%edx)
|
|
-L(write_13bytes):
|
|
- movl %eax, -13(%edx)
|
|
-L(write_9bytes):
|
|
- movl %eax, -9(%edx)
|
|
-L(write_5bytes):
|
|
- movl %eax, -5(%edx)
|
|
-L(write_1bytes):
|
|
- movb %al, -1(%edx)
|
|
- SETRTNVAL
|
|
- RETURN
|
|
-
|
|
- ALIGN (4)
|
|
-L(write_30bytes):
|
|
- movl %eax, -30(%edx)
|
|
-L(write_26bytes):
|
|
- movl %eax, -26(%edx)
|
|
-L(write_22bytes):
|
|
- movl %eax, -22(%edx)
|
|
-L(write_18bytes):
|
|
- movl %eax, -18(%edx)
|
|
-L(write_14bytes):
|
|
- movl %eax, -14(%edx)
|
|
-L(write_10bytes):
|
|
- movl %eax, -10(%edx)
|
|
-L(write_6bytes):
|
|
- movl %eax, -6(%edx)
|
|
-L(write_2bytes):
|
|
- movw %ax, -2(%edx)
|
|
- SETRTNVAL
|
|
- RETURN
|
|
-
|
|
- ALIGN (4)
|
|
-L(write_31bytes):
|
|
- movl %eax, -31(%edx)
|
|
-L(write_27bytes):
|
|
- movl %eax, -27(%edx)
|
|
-L(write_23bytes):
|
|
- movl %eax, -23(%edx)
|
|
-L(write_19bytes):
|
|
- movl %eax, -19(%edx)
|
|
-L(write_15bytes):
|
|
- movl %eax, -15(%edx)
|
|
-L(write_11bytes):
|
|
- movl %eax, -11(%edx)
|
|
-L(write_7bytes):
|
|
- movl %eax, -7(%edx)
|
|
-L(write_3bytes):
|
|
- movw %ax, -3(%edx)
|
|
- movb %al, -1(%edx)
|
|
- SETRTNVAL
|
|
- RETURN
|
|
-
|
|
- ALIGN (4)
|
|
-/* ECX > 32 and EDX is 4 byte aligned. */
|
|
-L(32bytesormore):
|
|
- /* Fill xmm0 with the pattern. */
|
|
-#ifdef USE_AS_BZERO
|
|
- pxor %xmm0, %xmm0
|
|
-#else
|
|
- movd %eax, %xmm0
|
|
- punpcklbw %xmm0, %xmm0
|
|
- pshufd $0, %xmm0, %xmm0
|
|
-#endif
|
|
- testl $0xf, %edx
|
|
- jz L(aligned_16)
|
|
-/* ECX > 32 and EDX is not 16 byte aligned. */
|
|
-L(not_aligned_16):
|
|
- movdqu %xmm0, (%edx)
|
|
- movl %edx, %eax
|
|
- and $-16, %edx
|
|
- add $16, %edx
|
|
- sub %edx, %eax
|
|
- add %eax, %ecx
|
|
- movd %xmm0, %eax
|
|
-
|
|
- ALIGN (4)
|
|
-L(aligned_16):
|
|
- cmp $128, %ecx
|
|
- jge L(128bytesormore)
|
|
-
|
|
-L(aligned_16_less128bytes):
|
|
- BRANCH_TO_JMPTBL_ENTRY (L(table_16_128bytes))
|
|
-
|
|
- ALIGN (4)
|
|
-L(128bytesormore):
|
|
-#ifdef SHARED_CACHE_SIZE
|
|
- PUSH (%ebx)
|
|
- mov $SHARED_CACHE_SIZE, %ebx
|
|
-#else
|
|
-# ifdef SHARED
|
|
- call __i686.get_pc_thunk.bx
|
|
- add $_GLOBAL_OFFSET_TABLE_, %ebx
|
|
- mov __x86_shared_cache_size@GOTOFF(%ebx), %ebx
|
|
-# else
|
|
- PUSH (%ebx)
|
|
- mov __x86_shared_cache_size, %ebx
|
|
-# endif
|
|
-#endif
|
|
- cmp %ebx, %ecx
|
|
- jae L(128bytesormore_nt_start)
|
|
-
|
|
-
|
|
-#ifdef DATA_CACHE_SIZE
|
|
- POP (%ebx)
|
|
- cmp $DATA_CACHE_SIZE, %ecx
|
|
-#else
|
|
-# ifdef SHARED
|
|
- call __i686.get_pc_thunk.bx
|
|
- add $_GLOBAL_OFFSET_TABLE_, %ebx
|
|
- cmp __x86_data_cache_size@GOTOFF(%ebx), %ecx
|
|
-# else
|
|
- POP (%ebx)
|
|
- cmp __x86_data_cache_size, %ecx
|
|
-# endif
|
|
-#endif
|
|
-
|
|
- jae L(128bytes_L2_normal)
|
|
- subl $128, %ecx
|
|
-L(128bytesormore_normal):
|
|
- sub $128, %ecx
|
|
- movdqa %xmm0, (%edx)
|
|
- movdqa %xmm0, 0x10(%edx)
|
|
- movdqa %xmm0, 0x20(%edx)
|
|
- movdqa %xmm0, 0x30(%edx)
|
|
- movdqa %xmm0, 0x40(%edx)
|
|
- movdqa %xmm0, 0x50(%edx)
|
|
- movdqa %xmm0, 0x60(%edx)
|
|
- movdqa %xmm0, 0x70(%edx)
|
|
- lea 128(%edx), %edx
|
|
- jl L(128bytesless_normal)
|
|
-
|
|
-
|
|
- sub $128, %ecx
|
|
- movdqa %xmm0, (%edx)
|
|
- movdqa %xmm0, 0x10(%edx)
|
|
- movdqa %xmm0, 0x20(%edx)
|
|
- movdqa %xmm0, 0x30(%edx)
|
|
- movdqa %xmm0, 0x40(%edx)
|
|
- movdqa %xmm0, 0x50(%edx)
|
|
- movdqa %xmm0, 0x60(%edx)
|
|
- movdqa %xmm0, 0x70(%edx)
|
|
- lea 128(%edx), %edx
|
|
- jge L(128bytesormore_normal)
|
|
-
|
|
-L(128bytesless_normal):
|
|
- lea 128(%ecx), %ecx
|
|
- BRANCH_TO_JMPTBL_ENTRY (L(table_16_128bytes))
|
|
-
|
|
- ALIGN (4)
|
|
-L(128bytes_L2_normal):
|
|
- prefetcht0 0x380(%edx)
|
|
- prefetcht0 0x3c0(%edx)
|
|
- sub $128, %ecx
|
|
- movdqa %xmm0, (%edx)
|
|
- movaps %xmm0, 0x10(%edx)
|
|
- movaps %xmm0, 0x20(%edx)
|
|
- movaps %xmm0, 0x30(%edx)
|
|
- movaps %xmm0, 0x40(%edx)
|
|
- movaps %xmm0, 0x50(%edx)
|
|
- movaps %xmm0, 0x60(%edx)
|
|
- movaps %xmm0, 0x70(%edx)
|
|
- add $128, %edx
|
|
- cmp $128, %ecx
|
|
- jge L(128bytes_L2_normal)
|
|
-
|
|
-L(128bytesless_L2_normal):
|
|
- BRANCH_TO_JMPTBL_ENTRY (L(table_16_128bytes))
|
|
-
|
|
-L(128bytesormore_nt_start):
|
|
- sub %ebx, %ecx
|
|
- ALIGN (4)
|
|
-L(128bytesormore_shared_cache_loop):
|
|
- prefetcht0 0x3c0(%edx)
|
|
- prefetcht0 0x380(%edx)
|
|
- sub $0x80, %ebx
|
|
- movdqa %xmm0, (%edx)
|
|
- movdqa %xmm0, 0x10(%edx)
|
|
- movdqa %xmm0, 0x20(%edx)
|
|
- movdqa %xmm0, 0x30(%edx)
|
|
- movdqa %xmm0, 0x40(%edx)
|
|
- movdqa %xmm0, 0x50(%edx)
|
|
- movdqa %xmm0, 0x60(%edx)
|
|
- movdqa %xmm0, 0x70(%edx)
|
|
- add $0x80, %edx
|
|
- cmp $0x80, %ebx
|
|
- jge L(128bytesormore_shared_cache_loop)
|
|
- cmp $0x80, %ecx
|
|
- jb L(shared_cache_loop_end)
|
|
- ALIGN (4)
|
|
-L(128bytesormore_nt):
|
|
- sub $0x80, %ecx
|
|
- movntdq %xmm0, (%edx)
|
|
- movntdq %xmm0, 0x10(%edx)
|
|
- movntdq %xmm0, 0x20(%edx)
|
|
- movntdq %xmm0, 0x30(%edx)
|
|
- movntdq %xmm0, 0x40(%edx)
|
|
- movntdq %xmm0, 0x50(%edx)
|
|
- movntdq %xmm0, 0x60(%edx)
|
|
- movntdq %xmm0, 0x70(%edx)
|
|
- add $0x80, %edx
|
|
- cmp $0x80, %ecx
|
|
- jge L(128bytesormore_nt)
|
|
- sfence
|
|
-L(shared_cache_loop_end):
|
|
-#if defined DATA_CACHE_SIZE || !defined SHARED
|
|
- POP (%ebx)
|
|
-#endif
|
|
- BRANCH_TO_JMPTBL_ENTRY (L(table_16_128bytes))
|
|
-
|
|
-
|
|
- .pushsection .rodata.sse2,"a",@progbits
|
|
- ALIGN (2)
|
|
-L(table_16_128bytes):
|
|
- .int JMPTBL (L(aligned_16_0bytes), L(table_16_128bytes))
|
|
- .int JMPTBL (L(aligned_16_1bytes), L(table_16_128bytes))
|
|
- .int JMPTBL (L(aligned_16_2bytes), L(table_16_128bytes))
|
|
- .int JMPTBL (L(aligned_16_3bytes), L(table_16_128bytes))
|
|
- .int JMPTBL (L(aligned_16_4bytes), L(table_16_128bytes))
|
|
- .int JMPTBL (L(aligned_16_5bytes), L(table_16_128bytes))
|
|
- .int JMPTBL (L(aligned_16_6bytes), L(table_16_128bytes))
|
|
- .int JMPTBL (L(aligned_16_7bytes), L(table_16_128bytes))
|
|
- .int JMPTBL (L(aligned_16_8bytes), L(table_16_128bytes))
|
|
- .int JMPTBL (L(aligned_16_9bytes), L(table_16_128bytes))
|
|
- .int JMPTBL (L(aligned_16_10bytes), L(table_16_128bytes))
|
|
- .int JMPTBL (L(aligned_16_11bytes), L(table_16_128bytes))
|
|
- .int JMPTBL (L(aligned_16_12bytes), L(table_16_128bytes))
|
|
- .int JMPTBL (L(aligned_16_13bytes), L(table_16_128bytes))
|
|
- .int JMPTBL (L(aligned_16_14bytes), L(table_16_128bytes))
|
|
- .int JMPTBL (L(aligned_16_15bytes), L(table_16_128bytes))
|
|
- .int JMPTBL (L(aligned_16_16bytes), L(table_16_128bytes))
|
|
- .int JMPTBL (L(aligned_16_17bytes), L(table_16_128bytes))
|
|
- .int JMPTBL (L(aligned_16_18bytes), L(table_16_128bytes))
|
|
- .int JMPTBL (L(aligned_16_19bytes), L(table_16_128bytes))
|
|
- .int JMPTBL (L(aligned_16_20bytes), L(table_16_128bytes))
|
|
- .int JMPTBL (L(aligned_16_21bytes), L(table_16_128bytes))
|
|
- .int JMPTBL (L(aligned_16_22bytes), L(table_16_128bytes))
|
|
- .int JMPTBL (L(aligned_16_23bytes), L(table_16_128bytes))
|
|
- .int JMPTBL (L(aligned_16_24bytes), L(table_16_128bytes))
|
|
- .int JMPTBL (L(aligned_16_25bytes), L(table_16_128bytes))
|
|
- .int JMPTBL (L(aligned_16_26bytes), L(table_16_128bytes))
|
|
- .int JMPTBL (L(aligned_16_27bytes), L(table_16_128bytes))
|
|
- .int JMPTBL (L(aligned_16_28bytes), L(table_16_128bytes))
|
|
- .int JMPTBL (L(aligned_16_29bytes), L(table_16_128bytes))
|
|
- .int JMPTBL (L(aligned_16_30bytes), L(table_16_128bytes))
|
|
- .int JMPTBL (L(aligned_16_31bytes), L(table_16_128bytes))
|
|
- .int JMPTBL (L(aligned_16_32bytes), L(table_16_128bytes))
|
|
- .int JMPTBL (L(aligned_16_33bytes), L(table_16_128bytes))
|
|
- .int JMPTBL (L(aligned_16_34bytes), L(table_16_128bytes))
|
|
- .int JMPTBL (L(aligned_16_35bytes), L(table_16_128bytes))
|
|
- .int JMPTBL (L(aligned_16_36bytes), L(table_16_128bytes))
|
|
- .int JMPTBL (L(aligned_16_37bytes), L(table_16_128bytes))
|
|
- .int JMPTBL (L(aligned_16_38bytes), L(table_16_128bytes))
|
|
- .int JMPTBL (L(aligned_16_39bytes), L(table_16_128bytes))
|
|
- .int JMPTBL (L(aligned_16_40bytes), L(table_16_128bytes))
|
|
- .int JMPTBL (L(aligned_16_41bytes), L(table_16_128bytes))
|
|
- .int JMPTBL (L(aligned_16_42bytes), L(table_16_128bytes))
|
|
- .int JMPTBL (L(aligned_16_43bytes), L(table_16_128bytes))
|
|
- .int JMPTBL (L(aligned_16_44bytes), L(table_16_128bytes))
|
|
- .int JMPTBL (L(aligned_16_45bytes), L(table_16_128bytes))
|
|
- .int JMPTBL (L(aligned_16_46bytes), L(table_16_128bytes))
|
|
- .int JMPTBL (L(aligned_16_47bytes), L(table_16_128bytes))
|
|
- .int JMPTBL (L(aligned_16_48bytes), L(table_16_128bytes))
|
|
- .int JMPTBL (L(aligned_16_49bytes), L(table_16_128bytes))
|
|
- .int JMPTBL (L(aligned_16_50bytes), L(table_16_128bytes))
|
|
- .int JMPTBL (L(aligned_16_51bytes), L(table_16_128bytes))
|
|
- .int JMPTBL (L(aligned_16_52bytes), L(table_16_128bytes))
|
|
- .int JMPTBL (L(aligned_16_53bytes), L(table_16_128bytes))
|
|
- .int JMPTBL (L(aligned_16_54bytes), L(table_16_128bytes))
|
|
- .int JMPTBL (L(aligned_16_55bytes), L(table_16_128bytes))
|
|
- .int JMPTBL (L(aligned_16_56bytes), L(table_16_128bytes))
|
|
- .int JMPTBL (L(aligned_16_57bytes), L(table_16_128bytes))
|
|
- .int JMPTBL (L(aligned_16_58bytes), L(table_16_128bytes))
|
|
- .int JMPTBL (L(aligned_16_59bytes), L(table_16_128bytes))
|
|
- .int JMPTBL (L(aligned_16_60bytes), L(table_16_128bytes))
|
|
- .int JMPTBL (L(aligned_16_61bytes), L(table_16_128bytes))
|
|
- .int JMPTBL (L(aligned_16_62bytes), L(table_16_128bytes))
|
|
- .int JMPTBL (L(aligned_16_63bytes), L(table_16_128bytes))
|
|
- .int JMPTBL (L(aligned_16_64bytes), L(table_16_128bytes))
|
|
- .int JMPTBL (L(aligned_16_65bytes), L(table_16_128bytes))
|
|
- .int JMPTBL (L(aligned_16_66bytes), L(table_16_128bytes))
|
|
- .int JMPTBL (L(aligned_16_67bytes), L(table_16_128bytes))
|
|
- .int JMPTBL (L(aligned_16_68bytes), L(table_16_128bytes))
|
|
- .int JMPTBL (L(aligned_16_69bytes), L(table_16_128bytes))
|
|
- .int JMPTBL (L(aligned_16_70bytes), L(table_16_128bytes))
|
|
- .int JMPTBL (L(aligned_16_71bytes), L(table_16_128bytes))
|
|
- .int JMPTBL (L(aligned_16_72bytes), L(table_16_128bytes))
|
|
- .int JMPTBL (L(aligned_16_73bytes), L(table_16_128bytes))
|
|
- .int JMPTBL (L(aligned_16_74bytes), L(table_16_128bytes))
|
|
- .int JMPTBL (L(aligned_16_75bytes), L(table_16_128bytes))
|
|
- .int JMPTBL (L(aligned_16_76bytes), L(table_16_128bytes))
|
|
- .int JMPTBL (L(aligned_16_77bytes), L(table_16_128bytes))
|
|
- .int JMPTBL (L(aligned_16_78bytes), L(table_16_128bytes))
|
|
- .int JMPTBL (L(aligned_16_79bytes), L(table_16_128bytes))
|
|
- .int JMPTBL (L(aligned_16_80bytes), L(table_16_128bytes))
|
|
- .int JMPTBL (L(aligned_16_81bytes), L(table_16_128bytes))
|
|
- .int JMPTBL (L(aligned_16_82bytes), L(table_16_128bytes))
|
|
- .int JMPTBL (L(aligned_16_83bytes), L(table_16_128bytes))
|
|
- .int JMPTBL (L(aligned_16_84bytes), L(table_16_128bytes))
|
|
- .int JMPTBL (L(aligned_16_85bytes), L(table_16_128bytes))
|
|
- .int JMPTBL (L(aligned_16_86bytes), L(table_16_128bytes))
|
|
- .int JMPTBL (L(aligned_16_87bytes), L(table_16_128bytes))
|
|
- .int JMPTBL (L(aligned_16_88bytes), L(table_16_128bytes))
|
|
- .int JMPTBL (L(aligned_16_89bytes), L(table_16_128bytes))
|
|
- .int JMPTBL (L(aligned_16_90bytes), L(table_16_128bytes))
|
|
- .int JMPTBL (L(aligned_16_91bytes), L(table_16_128bytes))
|
|
- .int JMPTBL (L(aligned_16_92bytes), L(table_16_128bytes))
|
|
- .int JMPTBL (L(aligned_16_93bytes), L(table_16_128bytes))
|
|
- .int JMPTBL (L(aligned_16_94bytes), L(table_16_128bytes))
|
|
- .int JMPTBL (L(aligned_16_95bytes), L(table_16_128bytes))
|
|
- .int JMPTBL (L(aligned_16_96bytes), L(table_16_128bytes))
|
|
- .int JMPTBL (L(aligned_16_97bytes), L(table_16_128bytes))
|
|
- .int JMPTBL (L(aligned_16_98bytes), L(table_16_128bytes))
|
|
- .int JMPTBL (L(aligned_16_99bytes), L(table_16_128bytes))
|
|
- .int JMPTBL (L(aligned_16_100bytes), L(table_16_128bytes))
|
|
- .int JMPTBL (L(aligned_16_101bytes), L(table_16_128bytes))
|
|
- .int JMPTBL (L(aligned_16_102bytes), L(table_16_128bytes))
|
|
- .int JMPTBL (L(aligned_16_103bytes), L(table_16_128bytes))
|
|
- .int JMPTBL (L(aligned_16_104bytes), L(table_16_128bytes))
|
|
- .int JMPTBL (L(aligned_16_105bytes), L(table_16_128bytes))
|
|
- .int JMPTBL (L(aligned_16_106bytes), L(table_16_128bytes))
|
|
- .int JMPTBL (L(aligned_16_107bytes), L(table_16_128bytes))
|
|
- .int JMPTBL (L(aligned_16_108bytes), L(table_16_128bytes))
|
|
- .int JMPTBL (L(aligned_16_109bytes), L(table_16_128bytes))
|
|
- .int JMPTBL (L(aligned_16_110bytes), L(table_16_128bytes))
|
|
- .int JMPTBL (L(aligned_16_111bytes), L(table_16_128bytes))
|
|
- .int JMPTBL (L(aligned_16_112bytes), L(table_16_128bytes))
|
|
- .int JMPTBL (L(aligned_16_113bytes), L(table_16_128bytes))
|
|
- .int JMPTBL (L(aligned_16_114bytes), L(table_16_128bytes))
|
|
- .int JMPTBL (L(aligned_16_115bytes), L(table_16_128bytes))
|
|
- .int JMPTBL (L(aligned_16_116bytes), L(table_16_128bytes))
|
|
- .int JMPTBL (L(aligned_16_117bytes), L(table_16_128bytes))
|
|
- .int JMPTBL (L(aligned_16_118bytes), L(table_16_128bytes))
|
|
- .int JMPTBL (L(aligned_16_119bytes), L(table_16_128bytes))
|
|
- .int JMPTBL (L(aligned_16_120bytes), L(table_16_128bytes))
|
|
- .int JMPTBL (L(aligned_16_121bytes), L(table_16_128bytes))
|
|
- .int JMPTBL (L(aligned_16_122bytes), L(table_16_128bytes))
|
|
- .int JMPTBL (L(aligned_16_123bytes), L(table_16_128bytes))
|
|
- .int JMPTBL (L(aligned_16_124bytes), L(table_16_128bytes))
|
|
- .int JMPTBL (L(aligned_16_125bytes), L(table_16_128bytes))
|
|
- .int JMPTBL (L(aligned_16_126bytes), L(table_16_128bytes))
|
|
- .int JMPTBL (L(aligned_16_127bytes), L(table_16_128bytes))
|
|
- .popsection
|
|
-
|
|
- ALIGN (4)
|
|
-L(aligned_16_112bytes):
|
|
- movdqa %xmm0, -112(%edx)
|
|
-L(aligned_16_96bytes):
|
|
- movdqa %xmm0, -96(%edx)
|
|
-L(aligned_16_80bytes):
|
|
- movdqa %xmm0, -80(%edx)
|
|
-L(aligned_16_64bytes):
|
|
- movdqa %xmm0, -64(%edx)
|
|
-L(aligned_16_48bytes):
|
|
- movdqa %xmm0, -48(%edx)
|
|
-L(aligned_16_32bytes):
|
|
- movdqa %xmm0, -32(%edx)
|
|
-L(aligned_16_16bytes):
|
|
- movdqa %xmm0, -16(%edx)
|
|
-L(aligned_16_0bytes):
|
|
- SETRTNVAL
|
|
- RETURN
|
|
-
|
|
- ALIGN (4)
|
|
-L(aligned_16_113bytes):
|
|
- movdqa %xmm0, -113(%edx)
|
|
-L(aligned_16_97bytes):
|
|
- movdqa %xmm0, -97(%edx)
|
|
-L(aligned_16_81bytes):
|
|
- movdqa %xmm0, -81(%edx)
|
|
-L(aligned_16_65bytes):
|
|
- movdqa %xmm0, -65(%edx)
|
|
-L(aligned_16_49bytes):
|
|
- movdqa %xmm0, -49(%edx)
|
|
-L(aligned_16_33bytes):
|
|
- movdqa %xmm0, -33(%edx)
|
|
-L(aligned_16_17bytes):
|
|
- movdqa %xmm0, -17(%edx)
|
|
-L(aligned_16_1bytes):
|
|
- movb %al, -1(%edx)
|
|
- SETRTNVAL
|
|
- RETURN
|
|
-
|
|
- ALIGN (4)
|
|
-L(aligned_16_114bytes):
|
|
- movdqa %xmm0, -114(%edx)
|
|
-L(aligned_16_98bytes):
|
|
- movdqa %xmm0, -98(%edx)
|
|
-L(aligned_16_82bytes):
|
|
- movdqa %xmm0, -82(%edx)
|
|
-L(aligned_16_66bytes):
|
|
- movdqa %xmm0, -66(%edx)
|
|
-L(aligned_16_50bytes):
|
|
- movdqa %xmm0, -50(%edx)
|
|
-L(aligned_16_34bytes):
|
|
- movdqa %xmm0, -34(%edx)
|
|
-L(aligned_16_18bytes):
|
|
- movdqa %xmm0, -18(%edx)
|
|
-L(aligned_16_2bytes):
|
|
- movw %ax, -2(%edx)
|
|
- SETRTNVAL
|
|
- RETURN
|
|
-
|
|
- ALIGN (4)
|
|
-L(aligned_16_115bytes):
|
|
- movdqa %xmm0, -115(%edx)
|
|
-L(aligned_16_99bytes):
|
|
- movdqa %xmm0, -99(%edx)
|
|
-L(aligned_16_83bytes):
|
|
- movdqa %xmm0, -83(%edx)
|
|
-L(aligned_16_67bytes):
|
|
- movdqa %xmm0, -67(%edx)
|
|
-L(aligned_16_51bytes):
|
|
- movdqa %xmm0, -51(%edx)
|
|
-L(aligned_16_35bytes):
|
|
- movdqa %xmm0, -35(%edx)
|
|
-L(aligned_16_19bytes):
|
|
- movdqa %xmm0, -19(%edx)
|
|
-L(aligned_16_3bytes):
|
|
- movw %ax, -3(%edx)
|
|
- movb %al, -1(%edx)
|
|
- SETRTNVAL
|
|
- RETURN
|
|
-
|
|
- ALIGN (4)
|
|
-L(aligned_16_116bytes):
|
|
- movdqa %xmm0, -116(%edx)
|
|
-L(aligned_16_100bytes):
|
|
- movdqa %xmm0, -100(%edx)
|
|
-L(aligned_16_84bytes):
|
|
- movdqa %xmm0, -84(%edx)
|
|
-L(aligned_16_68bytes):
|
|
- movdqa %xmm0, -68(%edx)
|
|
-L(aligned_16_52bytes):
|
|
- movdqa %xmm0, -52(%edx)
|
|
-L(aligned_16_36bytes):
|
|
- movdqa %xmm0, -36(%edx)
|
|
-L(aligned_16_20bytes):
|
|
- movdqa %xmm0, -20(%edx)
|
|
-L(aligned_16_4bytes):
|
|
- movl %eax, -4(%edx)
|
|
- SETRTNVAL
|
|
- RETURN
|
|
-
|
|
- ALIGN (4)
|
|
-L(aligned_16_117bytes):
|
|
- movdqa %xmm0, -117(%edx)
|
|
-L(aligned_16_101bytes):
|
|
- movdqa %xmm0, -101(%edx)
|
|
-L(aligned_16_85bytes):
|
|
- movdqa %xmm0, -85(%edx)
|
|
-L(aligned_16_69bytes):
|
|
- movdqa %xmm0, -69(%edx)
|
|
-L(aligned_16_53bytes):
|
|
- movdqa %xmm0, -53(%edx)
|
|
-L(aligned_16_37bytes):
|
|
- movdqa %xmm0, -37(%edx)
|
|
-L(aligned_16_21bytes):
|
|
- movdqa %xmm0, -21(%edx)
|
|
-L(aligned_16_5bytes):
|
|
- movl %eax, -5(%edx)
|
|
- movb %al, -1(%edx)
|
|
- SETRTNVAL
|
|
- RETURN
|
|
-
|
|
- ALIGN (4)
|
|
-L(aligned_16_118bytes):
|
|
- movdqa %xmm0, -118(%edx)
|
|
-L(aligned_16_102bytes):
|
|
- movdqa %xmm0, -102(%edx)
|
|
-L(aligned_16_86bytes):
|
|
- movdqa %xmm0, -86(%edx)
|
|
-L(aligned_16_70bytes):
|
|
- movdqa %xmm0, -70(%edx)
|
|
-L(aligned_16_54bytes):
|
|
- movdqa %xmm0, -54(%edx)
|
|
-L(aligned_16_38bytes):
|
|
- movdqa %xmm0, -38(%edx)
|
|
-L(aligned_16_22bytes):
|
|
- movdqa %xmm0, -22(%edx)
|
|
-L(aligned_16_6bytes):
|
|
- movl %eax, -6(%edx)
|
|
- movw %ax, -2(%edx)
|
|
- SETRTNVAL
|
|
- RETURN
|
|
-
|
|
- ALIGN (4)
|
|
-L(aligned_16_119bytes):
|
|
- movdqa %xmm0, -119(%edx)
|
|
-L(aligned_16_103bytes):
|
|
- movdqa %xmm0, -103(%edx)
|
|
-L(aligned_16_87bytes):
|
|
- movdqa %xmm0, -87(%edx)
|
|
-L(aligned_16_71bytes):
|
|
- movdqa %xmm0, -71(%edx)
|
|
-L(aligned_16_55bytes):
|
|
- movdqa %xmm0, -55(%edx)
|
|
-L(aligned_16_39bytes):
|
|
- movdqa %xmm0, -39(%edx)
|
|
-L(aligned_16_23bytes):
|
|
- movdqa %xmm0, -23(%edx)
|
|
-L(aligned_16_7bytes):
|
|
- movl %eax, -7(%edx)
|
|
- movw %ax, -3(%edx)
|
|
- movb %al, -1(%edx)
|
|
- SETRTNVAL
|
|
- RETURN
|
|
-
|
|
- ALIGN (4)
|
|
-L(aligned_16_120bytes):
|
|
- movdqa %xmm0, -120(%edx)
|
|
-L(aligned_16_104bytes):
|
|
- movdqa %xmm0, -104(%edx)
|
|
-L(aligned_16_88bytes):
|
|
- movdqa %xmm0, -88(%edx)
|
|
-L(aligned_16_72bytes):
|
|
- movdqa %xmm0, -72(%edx)
|
|
-L(aligned_16_56bytes):
|
|
- movdqa %xmm0, -56(%edx)
|
|
-L(aligned_16_40bytes):
|
|
- movdqa %xmm0, -40(%edx)
|
|
-L(aligned_16_24bytes):
|
|
- movdqa %xmm0, -24(%edx)
|
|
-L(aligned_16_8bytes):
|
|
- movq %xmm0, -8(%edx)
|
|
- SETRTNVAL
|
|
- RETURN
|
|
-
|
|
- ALIGN (4)
|
|
-L(aligned_16_121bytes):
|
|
- movdqa %xmm0, -121(%edx)
|
|
-L(aligned_16_105bytes):
|
|
- movdqa %xmm0, -105(%edx)
|
|
-L(aligned_16_89bytes):
|
|
- movdqa %xmm0, -89(%edx)
|
|
-L(aligned_16_73bytes):
|
|
- movdqa %xmm0, -73(%edx)
|
|
-L(aligned_16_57bytes):
|
|
- movdqa %xmm0, -57(%edx)
|
|
-L(aligned_16_41bytes):
|
|
- movdqa %xmm0, -41(%edx)
|
|
-L(aligned_16_25bytes):
|
|
- movdqa %xmm0, -25(%edx)
|
|
-L(aligned_16_9bytes):
|
|
- movq %xmm0, -9(%edx)
|
|
- movb %al, -1(%edx)
|
|
- SETRTNVAL
|
|
- RETURN
|
|
-
|
|
- ALIGN (4)
|
|
-L(aligned_16_122bytes):
|
|
- movdqa %xmm0, -122(%edx)
|
|
-L(aligned_16_106bytes):
|
|
- movdqa %xmm0, -106(%edx)
|
|
-L(aligned_16_90bytes):
|
|
- movdqa %xmm0, -90(%edx)
|
|
-L(aligned_16_74bytes):
|
|
- movdqa %xmm0, -74(%edx)
|
|
-L(aligned_16_58bytes):
|
|
- movdqa %xmm0, -58(%edx)
|
|
-L(aligned_16_42bytes):
|
|
- movdqa %xmm0, -42(%edx)
|
|
-L(aligned_16_26bytes):
|
|
- movdqa %xmm0, -26(%edx)
|
|
-L(aligned_16_10bytes):
|
|
- movq %xmm0, -10(%edx)
|
|
- movw %ax, -2(%edx)
|
|
- SETRTNVAL
|
|
- RETURN
|
|
-
|
|
- ALIGN (4)
|
|
-L(aligned_16_123bytes):
|
|
- movdqa %xmm0, -123(%edx)
|
|
-L(aligned_16_107bytes):
|
|
- movdqa %xmm0, -107(%edx)
|
|
-L(aligned_16_91bytes):
|
|
- movdqa %xmm0, -91(%edx)
|
|
-L(aligned_16_75bytes):
|
|
- movdqa %xmm0, -75(%edx)
|
|
-L(aligned_16_59bytes):
|
|
- movdqa %xmm0, -59(%edx)
|
|
-L(aligned_16_43bytes):
|
|
- movdqa %xmm0, -43(%edx)
|
|
-L(aligned_16_27bytes):
|
|
- movdqa %xmm0, -27(%edx)
|
|
-L(aligned_16_11bytes):
|
|
- movq %xmm0, -11(%edx)
|
|
- movw %ax, -3(%edx)
|
|
- movb %al, -1(%edx)
|
|
- SETRTNVAL
|
|
- RETURN
|
|
-
|
|
- ALIGN (4)
|
|
-L(aligned_16_124bytes):
|
|
- movdqa %xmm0, -124(%edx)
|
|
-L(aligned_16_108bytes):
|
|
- movdqa %xmm0, -108(%edx)
|
|
-L(aligned_16_92bytes):
|
|
- movdqa %xmm0, -92(%edx)
|
|
-L(aligned_16_76bytes):
|
|
- movdqa %xmm0, -76(%edx)
|
|
-L(aligned_16_60bytes):
|
|
- movdqa %xmm0, -60(%edx)
|
|
-L(aligned_16_44bytes):
|
|
- movdqa %xmm0, -44(%edx)
|
|
-L(aligned_16_28bytes):
|
|
- movdqa %xmm0, -28(%edx)
|
|
-L(aligned_16_12bytes):
|
|
- movq %xmm0, -12(%edx)
|
|
- movl %eax, -4(%edx)
|
|
- SETRTNVAL
|
|
- RETURN
|
|
-
|
|
- ALIGN (4)
|
|
-L(aligned_16_125bytes):
|
|
- movdqa %xmm0, -125(%edx)
|
|
-L(aligned_16_109bytes):
|
|
- movdqa %xmm0, -109(%edx)
|
|
-L(aligned_16_93bytes):
|
|
- movdqa %xmm0, -93(%edx)
|
|
-L(aligned_16_77bytes):
|
|
- movdqa %xmm0, -77(%edx)
|
|
-L(aligned_16_61bytes):
|
|
- movdqa %xmm0, -61(%edx)
|
|
-L(aligned_16_45bytes):
|
|
- movdqa %xmm0, -45(%edx)
|
|
-L(aligned_16_29bytes):
|
|
- movdqa %xmm0, -29(%edx)
|
|
-L(aligned_16_13bytes):
|
|
- movq %xmm0, -13(%edx)
|
|
- movl %eax, -5(%edx)
|
|
- movb %al, -1(%edx)
|
|
- SETRTNVAL
|
|
- RETURN
|
|
-
|
|
- ALIGN (4)
|
|
-L(aligned_16_126bytes):
|
|
- movdqa %xmm0, -126(%edx)
|
|
-L(aligned_16_110bytes):
|
|
- movdqa %xmm0, -110(%edx)
|
|
-L(aligned_16_94bytes):
|
|
- movdqa %xmm0, -94(%edx)
|
|
-L(aligned_16_78bytes):
|
|
- movdqa %xmm0, -78(%edx)
|
|
-L(aligned_16_62bytes):
|
|
- movdqa %xmm0, -62(%edx)
|
|
-L(aligned_16_46bytes):
|
|
- movdqa %xmm0, -46(%edx)
|
|
-L(aligned_16_30bytes):
|
|
- movdqa %xmm0, -30(%edx)
|
|
-L(aligned_16_14bytes):
|
|
- movq %xmm0, -14(%edx)
|
|
- movl %eax, -6(%edx)
|
|
- movw %ax, -2(%edx)
|
|
- SETRTNVAL
|
|
- RETURN
|
|
-
|
|
- ALIGN (4)
|
|
-L(aligned_16_127bytes):
|
|
- movdqa %xmm0, -127(%edx)
|
|
-L(aligned_16_111bytes):
|
|
- movdqa %xmm0, -111(%edx)
|
|
-L(aligned_16_95bytes):
|
|
- movdqa %xmm0, -95(%edx)
|
|
-L(aligned_16_79bytes):
|
|
- movdqa %xmm0, -79(%edx)
|
|
-L(aligned_16_63bytes):
|
|
- movdqa %xmm0, -63(%edx)
|
|
-L(aligned_16_47bytes):
|
|
- movdqa %xmm0, -47(%edx)
|
|
-L(aligned_16_31bytes):
|
|
- movdqa %xmm0, -31(%edx)
|
|
-L(aligned_16_15bytes):
|
|
- movq %xmm0, -15(%edx)
|
|
- movl %eax, -7(%edx)
|
|
- movw %ax, -3(%edx)
|
|
- movb %al, -1(%edx)
|
|
- SETRTNVAL
|
|
- RETURN_END
|
|
-
|
|
-END (__memset_sse2)
|
|
-
|
|
-#endif
|
|
--- glibc-2.11-175-gb34e12e/sysdeps/i386/i686/multiarch/memset.S
|
|
+++ glibc-2.11.90-11//dev/null
|
|
@@ -1,112 +0,0 @@
|
|
-/* Multiple versions of memset
|
|
- Copyright (C) 2010 Free Software Foundation, Inc.
|
|
- Contributed by Intel Corporation.
|
|
- This file is part of the GNU C Library.
|
|
-
|
|
- The GNU C Library is free software; you can redistribute it and/or
|
|
- modify it under the terms of the GNU Lesser General Public
|
|
- License as published by the Free Software Foundation; either
|
|
- version 2.1 of the License, or (at your option) any later version.
|
|
-
|
|
- The GNU C Library is distributed in the hope that it will be useful,
|
|
- but WITHOUT ANY WARRANTY; without even the implied warranty of
|
|
- MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU
|
|
- Lesser General Public License for more details.
|
|
-
|
|
- You should have received a copy of the GNU Lesser General Public
|
|
- License along with the GNU C Library; if not, write to the Free
|
|
- Software Foundation, Inc., 59 Temple Place, Suite 330, Boston, MA
|
|
- 02111-1307 USA. */
|
|
-
|
|
-#include <sysdep.h>
|
|
-#include <init-arch.h>
|
|
-
|
|
-/* Define multiple versions only for the definition in lib. */
|
|
-#ifndef NOT_IN_libc
|
|
-# ifdef SHARED
|
|
- .section .gnu.linkonce.t.__i686.get_pc_thunk.bx,"ax",@progbits
|
|
- .globl __i686.get_pc_thunk.bx
|
|
- .hidden __i686.get_pc_thunk.bx
|
|
- .p2align 4
|
|
- .type __i686.get_pc_thunk.bx,@function
|
|
-__i686.get_pc_thunk.bx:
|
|
- movl (%esp), %ebx
|
|
- ret
|
|
-
|
|
- .text
|
|
-ENTRY(memset)
|
|
- .type memset, @gnu_indirect_function
|
|
- pushl %ebx
|
|
- cfi_adjust_cfa_offset (4)
|
|
- cfi_rel_offset (ebx, 0)
|
|
- call __i686.get_pc_thunk.bx
|
|
- addl $_GLOBAL_OFFSET_TABLE_, %ebx
|
|
- cmpl $0, KIND_OFFSET+__cpu_features@GOTOFF(%ebx)
|
|
- jne 1f
|
|
- call __init_cpu_features
|
|
-1: leal __memset_ia32@GOTOFF(%ebx), %eax
|
|
- testl $bit_SSE2, CPUID_OFFSET+index_SSE2+__cpu_features@GOTOFF(%ebx)
|
|
- jz 2f
|
|
- leal __memset_sse2@GOTOFF(%ebx), %eax
|
|
- testl $bit_Fast_Rep_String, FEATURE_OFFSET+index_Fast_Rep_String+__cpu_features@GOTOFF(%ebx)
|
|
- jz 2f
|
|
- leal __memset_sse2_rep@GOTOFF(%ebx), %eax
|
|
-2: popl %ebx
|
|
- cfi_adjust_cfa_offset (-4)
|
|
- cfi_restore (ebx)
|
|
- ret
|
|
-END(memset)
|
|
-# else
|
|
- .text
|
|
-ENTRY(memset)
|
|
- .type memset, @gnu_indirect_function
|
|
- cmpl $0, KIND_OFFSET+__cpu_features
|
|
- jne 1f
|
|
- call __init_cpu_features
|
|
-1: leal __memset_ia32, %eax
|
|
- testl $bit_SSE2, CPUID_OFFSET+index_SSE2+__cpu_features
|
|
- jz 2f
|
|
- leal __memset_sse2, %eax
|
|
- testl $bit_Fast_Rep_String, FEATURE_OFFSET+index_Fast_Rep_String+__cpu_features
|
|
- jz 2f
|
|
- leal __memset_sse2_rep, %eax
|
|
-2: ret
|
|
-END(memset)
|
|
-# endif
|
|
-
|
|
-# undef ENTRY
|
|
-# define ENTRY(name) \
|
|
- .type __memset_ia32, @function; \
|
|
- .globl __memset_ia32; \
|
|
- .p2align 4; \
|
|
- __memset_ia32: cfi_startproc; \
|
|
- CALL_MCOUNT
|
|
-# undef END
|
|
-# define END(name) \
|
|
- cfi_endproc; .size __memset_ia32, .-__memset_ia32
|
|
-
|
|
-# undef ENTRY_CHK
|
|
-# define ENTRY_CHK(name) \
|
|
- .type __memset_chk_ia32, @function; \
|
|
- .globl __memset_chk_ia32; \
|
|
- .p2align 4; \
|
|
- __memset_chk_ia32: cfi_startproc; \
|
|
- CALL_MCOUNT
|
|
-# undef END_CHK
|
|
-# define END_CHK(name) \
|
|
- cfi_endproc; .size __memset_chk_ia32, .-__memset_chk_ia32
|
|
-
|
|
-# ifdef SHARED
|
|
-# undef libc_hidden_builtin_def
|
|
-/* IFUNC doesn't work with the hidden functions in shared library since
|
|
- they will be called without setting up EBX needed for PLT which is
|
|
- used by IFUNC. */
|
|
-# define libc_hidden_builtin_def(name) \
|
|
- .globl __GI_memset; __GI_memset = __memset_ia32
|
|
-# endif
|
|
-
|
|
-# undef strong_alias
|
|
-# define strong_alias(original, alias)
|
|
-#endif
|
|
-
|
|
-#include "../memset.S"
|
|
--- glibc-2.11-175-gb34e12e/sysdeps/i386/i686/multiarch/memset_chk.S
|
|
+++ glibc-2.11.90-11//dev/null
|
|
@@ -1,116 +0,0 @@
|
|
-/* Multiple versions of __memset_chk
|
|
- Copyright (C) 2010 Free Software Foundation, Inc.
|
|
- Contributed by Intel Corporation.
|
|
- This file is part of the GNU C Library.
|
|
-
|
|
- The GNU C Library is free software; you can redistribute it and/or
|
|
- modify it under the terms of the GNU Lesser General Public
|
|
- License as published by the Free Software Foundation; either
|
|
- version 2.1 of the License, or (at your option) any later version.
|
|
-
|
|
- The GNU C Library is distributed in the hope that it will be useful,
|
|
- but WITHOUT ANY WARRANTY; without even the implied warranty of
|
|
- MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU
|
|
- Lesser General Public License for more details.
|
|
-
|
|
- You should have received a copy of the GNU Lesser General Public
|
|
- License along with the GNU C Library; if not, write to the Free
|
|
- Software Foundation, Inc., 59 Temple Place, Suite 330, Boston, MA
|
|
- 02111-1307 USA. */
|
|
-
|
|
-#include <sysdep.h>
|
|
-#include <init-arch.h>
|
|
-
|
|
-/* Define multiple versions only for the definition in lib. */
|
|
-#ifndef NOT_IN_libc
|
|
-# ifdef SHARED
|
|
- .section .gnu.linkonce.t.__i686.get_pc_thunk.bx,"ax",@progbits
|
|
- .globl __i686.get_pc_thunk.bx
|
|
- .hidden __i686.get_pc_thunk.bx
|
|
- .p2align 4
|
|
- .type __i686.get_pc_thunk.bx,@function
|
|
-__i686.get_pc_thunk.bx:
|
|
- movl (%esp), %ebx
|
|
- ret
|
|
-
|
|
- .text
|
|
-ENTRY(__memset_chk)
|
|
- .type __memset_chk, @gnu_indirect_function
|
|
- pushl %ebx
|
|
- cfi_adjust_cfa_offset (4)
|
|
- cfi_rel_offset (ebx, 0)
|
|
- call __i686.get_pc_thunk.bx
|
|
- addl $_GLOBAL_OFFSET_TABLE_, %ebx
|
|
- cmpl $0, KIND_OFFSET+__cpu_features@GOTOFF(%ebx)
|
|
- jne 1f
|
|
- call __init_cpu_features
|
|
-1: leal __memset_chk_ia32@GOTOFF(%ebx), %eax
|
|
- testl $bit_SSE2, CPUID_OFFSET+index_SSE2+__cpu_features@GOTOFF(%ebx)
|
|
- jz 2f
|
|
- leal __memset_chk_sse2@GOTOFF(%ebx), %eax
|
|
- testl $bit_Fast_Rep_String, FEATURE_OFFSET+index_Fast_Rep_String+__cpu_features@GOTOFF(%ebx)
|
|
- jz 2f
|
|
- leal __memset_chk_sse2_rep@GOTOFF(%ebx), %eax
|
|
-2: popl %ebx
|
|
- cfi_adjust_cfa_offset (-4)
|
|
- cfi_restore (ebx)
|
|
- ret
|
|
-END(__memset_chk)
|
|
-
|
|
-strong_alias (__memset_chk, __memset_zero_constant_len_parameter)
|
|
- .section .gnu.warning.__memset_zero_constant_len_parameter
|
|
- .string "memset used with constant zero length parameter; this could be due to transposed parameters"
|
|
-# else
|
|
- .text
|
|
-ENTRY(__memset_chk)
|
|
- .type __memset_chk, @gnu_indirect_function
|
|
- cmpl $0, KIND_OFFSET+__cpu_features
|
|
- jne 1f
|
|
- call __init_cpu_features
|
|
-1: leal __memset_chk_ia32, %eax
|
|
- testl $bit_SSE2, CPUID_OFFSET+index_SSE2+__cpu_features
|
|
- jz 2f
|
|
- leal __memset_chk_sse2, %eax
|
|
- testl $bit_Fast_Rep_String, FEATURE_OFFSET+index_Fast_Rep_String+__cpu_features
|
|
- jz 2f
|
|
- leal __memset_chk_sse2_rep, %eax
|
|
-2: ret
|
|
-END(__memset_chk)
|
|
-
|
|
- .type __memset_chk_sse2, @function
|
|
- .p2align 4;
|
|
-__memset_chk_sse2:
|
|
- cfi_startproc
|
|
- CALL_MCOUNT
|
|
- movl 12(%esp), %eax
|
|
- cmpl %eax, 16(%esp)
|
|
- jb __chk_fail
|
|
- jmp __memset_sse2
|
|
- cfi_endproc
|
|
- .size __memset_chk_sse2, .-__memset_chk_sse2
|
|
-
|
|
- .type __memset_chk_sse2_rep, @function
|
|
- .p2align 4;
|
|
-__memset_chk_sse2_rep:
|
|
- cfi_startproc
|
|
- CALL_MCOUNT
|
|
- movl 12(%esp), %eax
|
|
- cmpl %eax, 16(%esp)
|
|
- jb __chk_fail
|
|
- jmp __memset_sse2_rep
|
|
- cfi_endproc
|
|
- .size __memset_chk_sse2_rep, .-__memset_chk_sse2_rep
|
|
-
|
|
- .type __memset_chk_ia32, @function
|
|
- .p2align 4;
|
|
-__memset_chk_ia32:
|
|
- cfi_startproc
|
|
- CALL_MCOUNT
|
|
- movl 12(%esp), %eax
|
|
- cmpl %eax, 16(%esp)
|
|
- jb __chk_fail
|
|
- jmp __memset_ia32
|
|
- cfi_endproc
|
|
- .size __memset_chk_ia32, .-__memset_chk_ia32
|
|
-# endif
|
|
-#endif
|
|
--- glibc-2.11-175-gb34e12e/sysdeps/i386/sysdep.h
|
|
+++ glibc-2.11.90-11/sysdeps/i386/sysdep.h
|
|
@@ -67,9 +67,6 @@
|
|
ASM_SIZE_DIRECTIVE(name) \
|
|
STABS_FUN_END(name)
|
|
|
|
-#define ENTRY_CHK(name) ENTRY (name)
|
|
-#define END_CHK(name) END (name)
|
|
-
|
|
#ifdef HAVE_CPP_ASM_DEBUGINFO
|
|
/* Disable that goop, because we just pass -g through to the assembler
|
|
and it generates proper line number information directly. */
|
|
--- glibc-2.11-175-gb34e12e/sysdeps/ia64/Makefile
|
|
+++ glibc-2.11.90-11/sysdeps/ia64/Makefile
|
|
@@ -12,8 +12,8 @@ elide-routines.os += hp-timing
|
|
|
|
ifeq (yes,$(build-shared))
|
|
# Compatibility
|
|
-sysdep_routines += ia64libgcc
|
|
-shared-only-routines += ia64libgcc
|
|
+sysdep_routines += libgcc-compat
|
|
+shared-only-routines += libgcc-compat
|
|
endif
|
|
endif
|
|
|
|
--- glibc-2.11-175-gb34e12e/sysdeps/ia64/ia64libgcc.S
|
|
+++ glibc-2.11.90-11/sysdeps/ia64/ia64libgcc.S
|
|
@@ -1,350 +0,0 @@
|
|
-/* From the Intel IA-64 Optimization Guide, choose the minimum latency
|
|
- alternative. */
|
|
-
|
|
-#include <sysdep.h>
|
|
-#undef ret
|
|
-
|
|
-#include <shlib-compat.h>
|
|
-
|
|
-#if SHLIB_COMPAT(libc, GLIBC_2_2, GLIBC_2_2_6)
|
|
-
|
|
-/* __divtf3
|
|
- Compute a 80-bit IEEE double-extended quotient.
|
|
- farg0 holds the dividend. farg1 holds the divisor. */
|
|
-
|
|
-ENTRY(___divtf3)
|
|
- cmp.eq p7, p0 = r0, r0
|
|
- frcpa.s0 f10, p6 = farg0, farg1
|
|
- ;;
|
|
-(p6) cmp.ne p7, p0 = r0, r0
|
|
- .pred.rel.mutex p6, p7
|
|
-(p6) fnma.s1 f11 = farg1, f10, f1
|
|
-(p6) fma.s1 f12 = farg0, f10, f0
|
|
- ;;
|
|
-(p6) fma.s1 f13 = f11, f11, f0
|
|
-(p6) fma.s1 f14 = f11, f11, f11
|
|
- ;;
|
|
-(p6) fma.s1 f11 = f13, f13, f11
|
|
-(p6) fma.s1 f13 = f14, f10, f10
|
|
- ;;
|
|
-(p6) fma.s1 f10 = f13, f11, f10
|
|
-(p6) fnma.s1 f11 = farg1, f12, farg0
|
|
- ;;
|
|
-(p6) fma.s1 f11 = f11, f10, f12
|
|
-(p6) fnma.s1 f12 = farg1, f10, f1
|
|
- ;;
|
|
-(p6) fma.s1 f10 = f12, f10, f10
|
|
-(p6) fnma.s1 f12 = farg1, f11, farg0
|
|
- ;;
|
|
-(p6) fma.s0 fret0 = f12, f10, f11
|
|
-(p7) mov fret0 = f10
|
|
- br.ret.sptk rp
|
|
-END(___divtf3)
|
|
- .symver ___divtf3, __divtf3@GLIBC_2.2
|
|
-
|
|
-/* __divdf3
|
|
- Compute a 64-bit IEEE double quotient.
|
|
- farg0 holds the dividend. farg1 holds the divisor. */
|
|
-
|
|
-ENTRY(___divdf3)
|
|
- cmp.eq p7, p0 = r0, r0
|
|
- frcpa.s0 f10, p6 = farg0, farg1
|
|
- ;;
|
|
-(p6) cmp.ne p7, p0 = r0, r0
|
|
- .pred.rel.mutex p6, p7
|
|
-(p6) fmpy.s1 f11 = farg0, f10
|
|
-(p6) fnma.s1 f12 = farg1, f10, f1
|
|
- ;;
|
|
-(p6) fma.s1 f11 = f12, f11, f11
|
|
-(p6) fmpy.s1 f13 = f12, f12
|
|
- ;;
|
|
-(p6) fma.s1 f10 = f12, f10, f10
|
|
-(p6) fma.s1 f11 = f13, f11, f11
|
|
- ;;
|
|
-(p6) fmpy.s1 f12 = f13, f13
|
|
-(p6) fma.s1 f10 = f13, f10, f10
|
|
- ;;
|
|
-(p6) fma.d.s1 f11 = f12, f11, f11
|
|
-(p6) fma.s1 f10 = f12, f10, f10
|
|
- ;;
|
|
-(p6) fnma.d.s1 f8 = farg1, f11, farg0
|
|
- ;;
|
|
-(p6) fma.d fret0 = f8, f10, f11
|
|
-(p7) mov fret0 = f10
|
|
- br.ret.sptk rp
|
|
- ;;
|
|
-END(___divdf3)
|
|
- .symver ___divdf3, __divdf3@GLIBC_2.2
|
|
-
|
|
-/* __divsf3
|
|
- Compute a 32-bit IEEE float quotient.
|
|
- farg0 holds the dividend. farg1 holds the divisor. */
|
|
-
|
|
-ENTRY(___divsf3)
|
|
- cmp.eq p7, p0 = r0, r0
|
|
- frcpa.s0 f10, p6 = farg0, farg1
|
|
- ;;
|
|
-(p6) cmp.ne p7, p0 = r0, r0
|
|
- .pred.rel.mutex p6, p7
|
|
-(p6) fmpy.s1 f8 = farg0, f10
|
|
-(p6) fnma.s1 f9 = farg1, f10, f1
|
|
- ;;
|
|
-(p6) fma.s1 f8 = f9, f8, f8
|
|
-(p6) fmpy.s1 f9 = f9, f9
|
|
- ;;
|
|
-(p6) fma.s1 f8 = f9, f8, f8
|
|
-(p6) fmpy.s1 f9 = f9, f9
|
|
- ;;
|
|
-(p6) fma.d.s1 f10 = f9, f8, f8
|
|
- ;;
|
|
-(p6) fnorm.s.s0 fret0 = f10
|
|
-(p7) mov fret0 = f10
|
|
- br.ret.sptk rp
|
|
- ;;
|
|
-END(___divsf3)
|
|
- .symver ___divsf3, __divsf3@GLIBC_2.2
|
|
-
|
|
-/* __divdi3
|
|
- Compute a 64-bit integer quotient.
|
|
- in0 holds the dividend. in1 holds the divisor. */
|
|
-
|
|
-ENTRY(___divdi3)
|
|
- .regstk 2,0,0,0
|
|
- /* Transfer inputs to FP registers. */
|
|
- setf.sig f8 = in0
|
|
- setf.sig f9 = in1
|
|
- ;;
|
|
- /* Convert the inputs to FP, so that they won't be treated as
|
|
- unsigned. */
|
|
- fcvt.xf f8 = f8
|
|
- fcvt.xf f9 = f9
|
|
- ;;
|
|
- /* Compute the reciprocal approximation. */
|
|
- frcpa.s1 f10, p6 = f8, f9
|
|
- ;;
|
|
- /* 3 Newton-Raphson iterations. */
|
|
-(p6) fnma.s1 f11 = f9, f10, f1
|
|
-(p6) fmpy.s1 f12 = f8, f10
|
|
- ;;
|
|
-(p6) fmpy.s1 f13 = f11, f11
|
|
-(p6) fma.s1 f12 = f11, f12, f12
|
|
- ;;
|
|
-(p6) fma.s1 f10 = f11, f10, f10
|
|
-(p6) fma.s1 f11 = f13, f12, f12
|
|
- ;;
|
|
-(p6) fma.s1 f10 = f13, f10, f10
|
|
-(p6) fnma.s1 f12 = f9, f11, f8
|
|
- ;;
|
|
-(p6) fma.s1 f10 = f12, f10, f11
|
|
- ;;
|
|
- /* Round quotient to an integer. */
|
|
- fcvt.fx.trunc.s1 f10 = f10
|
|
- ;;
|
|
- /* Transfer result to GP registers. */
|
|
- getf.sig ret0 = f10
|
|
- br.ret.sptk rp
|
|
- ;;
|
|
-END(___divdi3)
|
|
- .symver ___divdi3, __divdi3@GLIBC_2.2
|
|
-
|
|
-/* __moddi3
|
|
- Compute a 64-bit integer modulus.
|
|
- in0 holds the dividend (a). in1 holds the divisor (b). */
|
|
-
|
|
-ENTRY(___moddi3)
|
|
- .regstk 2,0,0,0
|
|
- /* Transfer inputs to FP registers. */
|
|
- setf.sig f14 = in0
|
|
- setf.sig f9 = in1
|
|
- ;;
|
|
- /* Convert the inputs to FP, so that they won't be treated as
|
|
- unsigned. */
|
|
- fcvt.xf f8 = f14
|
|
- fcvt.xf f9 = f9
|
|
- ;;
|
|
- /* Compute the reciprocal approximation. */
|
|
- frcpa.s1 f10, p6 = f8, f9
|
|
- ;;
|
|
- /* 3 Newton-Raphson iterations. */
|
|
-(p6) fmpy.s1 f12 = f8, f10
|
|
-(p6) fnma.s1 f11 = f9, f10, f1
|
|
- ;;
|
|
-(p6) fma.s1 f12 = f11, f12, f12
|
|
-(p6) fmpy.s1 f13 = f11, f11
|
|
- ;;
|
|
-(p6) fma.s1 f10 = f11, f10, f10
|
|
-(p6) fma.s1 f11 = f13, f12, f12
|
|
- ;;
|
|
- sub in1 = r0, in1
|
|
-(p6) fma.s1 f10 = f13, f10, f10
|
|
-(p6) fnma.s1 f12 = f9, f11, f8
|
|
- ;;
|
|
- setf.sig f9 = in1
|
|
-(p6) fma.s1 f10 = f12, f10, f11
|
|
- ;;
|
|
- fcvt.fx.trunc.s1 f10 = f10
|
|
- ;;
|
|
- /* r = q * (-b) + a */
|
|
- xma.l f10 = f10, f9, f14
|
|
- ;;
|
|
- /* Transfer result to GP registers. */
|
|
- getf.sig ret0 = f10
|
|
- br.ret.sptk rp
|
|
- ;;
|
|
-END(___moddi3)
|
|
- .symver ___moddi3, __moddi3@GLIBC_2.2
|
|
-
|
|
-/* __udivdi3
|
|
- Compute a 64-bit unsigned integer quotient.
|
|
- in0 holds the dividend. in1 holds the divisor. */
|
|
-
|
|
-ENTRY(___udivdi3)
|
|
- .regstk 2,0,0,0
|
|
- /* Transfer inputs to FP registers. */
|
|
- setf.sig f8 = in0
|
|
- setf.sig f9 = in1
|
|
- ;;
|
|
- /* Convert the inputs to FP, to avoid FP software-assist faults. */
|
|
- fcvt.xuf.s1 f8 = f8
|
|
- fcvt.xuf.s1 f9 = f9
|
|
- ;;
|
|
- /* Compute the reciprocal approximation. */
|
|
- frcpa.s1 f10, p6 = f8, f9
|
|
- ;;
|
|
- /* 3 Newton-Raphson iterations. */
|
|
-(p6) fnma.s1 f11 = f9, f10, f1
|
|
-(p6) fmpy.s1 f12 = f8, f10
|
|
- ;;
|
|
-(p6) fmpy.s1 f13 = f11, f11
|
|
-(p6) fma.s1 f12 = f11, f12, f12
|
|
- ;;
|
|
-(p6) fma.s1 f10 = f11, f10, f10
|
|
-(p6) fma.s1 f11 = f13, f12, f12
|
|
- ;;
|
|
-(p6) fma.s1 f10 = f13, f10, f10
|
|
-(p6) fnma.s1 f12 = f9, f11, f8
|
|
- ;;
|
|
-(p6) fma.s1 f10 = f12, f10, f11
|
|
- ;;
|
|
- /* Round quotient to an unsigned integer. */
|
|
- fcvt.fxu.trunc.s1 f10 = f10
|
|
- ;;
|
|
- /* Transfer result to GP registers. */
|
|
- getf.sig ret0 = f10
|
|
- br.ret.sptk rp
|
|
- ;;
|
|
-END(___udivdi3)
|
|
- .symver ___udivdi3, __udivdi3@GLIBC_2.2
|
|
-
|
|
-/* __umoddi3
|
|
- Compute a 64-bit unsigned integer modulus.
|
|
- in0 holds the dividend (a). in1 holds the divisor (b). */
|
|
-
|
|
-ENTRY(___umoddi3)
|
|
- .regstk 2,0,0,0
|
|
- /* Transfer inputs to FP registers. */
|
|
- setf.sig f14 = in0
|
|
- setf.sig f9 = in1
|
|
- ;;
|
|
- /* Convert the inputs to FP, to avoid FP software assist faults. */
|
|
- fcvt.xuf.s1 f8 = f14
|
|
- fcvt.xuf.s1 f9 = f9
|
|
- ;;
|
|
- /* Compute the reciprocal approximation. */
|
|
- frcpa.s1 f10, p6 = f8, f9
|
|
- ;;
|
|
- /* 3 Newton-Raphson iterations. */
|
|
-(p6) fmpy.s1 f12 = f8, f10
|
|
-(p6) fnma.s1 f11 = f9, f10, f1
|
|
- ;;
|
|
-(p6) fma.s1 f12 = f11, f12, f12
|
|
-(p6) fmpy.s1 f13 = f11, f11
|
|
- ;;
|
|
-(p6) fma.s1 f10 = f11, f10, f10
|
|
-(p6) fma.s1 f11 = f13, f12, f12
|
|
- ;;
|
|
- sub in1 = r0, in1
|
|
-(p6) fma.s1 f10 = f13, f10, f10
|
|
-(p6) fnma.s1 f12 = f9, f11, f8
|
|
- ;;
|
|
- setf.sig f9 = in1
|
|
-(p6) fma.s1 f10 = f12, f10, f11
|
|
- ;;
|
|
- /* Round quotient to an unsigned integer. */
|
|
- fcvt.fxu.trunc.s1 f10 = f10
|
|
- ;;
|
|
- /* r = q * (-b) + a */
|
|
- xma.l f10 = f10, f9, f14
|
|
- ;;
|
|
- /* Transfer result to GP registers. */
|
|
- getf.sig ret0 = f10
|
|
- br.ret.sptk rp
|
|
- ;;
|
|
-END(___umoddi3)
|
|
- .symver ___umoddi3, __umoddi3@GLIBC_2.2
|
|
-
|
|
-/* __multi3
|
|
- Compute a 128-bit multiply of 128-bit multiplicands.
|
|
- in0/in1 holds one multiplicand (a), in2/in3 holds the other one (b). */
|
|
-
|
|
-ENTRY(___multi3)
|
|
- .regstk 4,0,0,0
|
|
- setf.sig f6 = in1
|
|
- movl r19 = 0xffffffff
|
|
- setf.sig f7 = in2
|
|
- ;;
|
|
- and r14 = r19, in0
|
|
- ;;
|
|
- setf.sig f10 = r14
|
|
- and r14 = r19, in2
|
|
- xmpy.l f9 = f6, f7
|
|
- ;;
|
|
- setf.sig f6 = r14
|
|
- shr.u r14 = in0, 32
|
|
- ;;
|
|
- setf.sig f7 = r14
|
|
- shr.u r14 = in2, 32
|
|
- ;;
|
|
- setf.sig f8 = r14
|
|
- xmpy.l f11 = f10, f6
|
|
- xmpy.l f6 = f7, f6
|
|
- ;;
|
|
- getf.sig r16 = f11
|
|
- xmpy.l f7 = f7, f8
|
|
- ;;
|
|
- shr.u r14 = r16, 32
|
|
- and r16 = r19, r16
|
|
- getf.sig r17 = f6
|
|
- setf.sig f6 = in0
|
|
- ;;
|
|
- setf.sig f11 = r14
|
|
- getf.sig r21 = f7
|
|
- setf.sig f7 = in3
|
|
- ;;
|
|
- xma.l f11 = f10, f8, f11
|
|
- xma.l f6 = f6, f7, f9
|
|
- ;;
|
|
- getf.sig r18 = f11
|
|
- ;;
|
|
- add r18 = r18, r17
|
|
- ;;
|
|
- and r15 = r19, r18
|
|
- cmp.ltu p7, p6 = r18, r17
|
|
- ;;
|
|
- getf.sig r22 = f6
|
|
-(p7) adds r14 = 1, r19
|
|
- ;;
|
|
-(p7) add r21 = r21, r14
|
|
- shr.u r14 = r18, 32
|
|
- shl r15 = r15, 32
|
|
- ;;
|
|
- add r20 = r21, r14
|
|
- ;;
|
|
- add ret0 = r15, r16
|
|
- add ret1 = r22, r20
|
|
- br.ret.sptk rp
|
|
- ;;
|
|
-END(___multi3)
|
|
- .symver ___multi3, __multi3@GLIBC_2.2
|
|
-
|
|
-#endif
|
|
--- glibc-2.11-175-gb34e12e/sysdeps/ia64/libgcc-compat.c
|
|
+++ glibc-2.11.90-11/sysdeps/ia64/libgcc-compat.c
|
|
@@ -0,0 +1,84 @@
|
|
+/* pre-.hidden libgcc compatibility
|
|
+ Copyright (C) 2002 Free Software Foundation, Inc.
|
|
+ This file is part of the GNU C Library.
|
|
+
|
|
+ The GNU C Library is free software; you can redistribute it and/or
|
|
+ modify it under the terms of the GNU Lesser General Public
|
|
+ License as published by the Free Software Foundation; either
|
|
+ version 2.1 of the License, or (at your option) any later version.
|
|
+
|
|
+ The GNU C Library is distributed in the hope that it will be useful,
|
|
+ but WITHOUT ANY WARRANTY; without even the implied warranty of
|
|
+ MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU
|
|
+ Lesser General Public License for more details.
|
|
+
|
|
+ You should have received a copy of the GNU Lesser General Public
|
|
+ License along with the GNU C Library; if not, write to the Free
|
|
+ Software Foundation, Inc., 59 Temple Place, Suite 330, Boston, MA
|
|
+ 02111-1307 USA. */
|
|
+
|
|
+
|
|
+#include <stdint.h>
|
|
+#include <shlib-compat.h>
|
|
+
|
|
+#if SHLIB_COMPAT(libc, GLIBC_2_2, GLIBC_2_2_6)
|
|
+
|
|
+typedef int int128_t __attribute__((__mode__(TI)));
|
|
+
|
|
+extern long double __divtf3 (long double, long double) attribute_hidden;
|
|
+long double INTUSE (__divtf3) (long double x, long double y)
|
|
+{
|
|
+ return __divtf3 (x, y);
|
|
+}
|
|
+symbol_version (INTUSE (__divtf3), __divtf3, GLIBC_2.2);
|
|
+
|
|
+extern double __divdf3 (double, double) attribute_hidden;
|
|
+double INTUSE (__divdf3) (double x, double y)
|
|
+{
|
|
+ return __divdf3 (x, y);
|
|
+}
|
|
+symbol_version (INTUSE (__divdf3), __divdf3, GLIBC_2.2);
|
|
+
|
|
+extern float __divsf3 (float, float) attribute_hidden;
|
|
+float INTUSE (__divsf3) (float x, float y)
|
|
+{
|
|
+ return __divsf3 (x, y);
|
|
+}
|
|
+symbol_version (INTUSE (__divsf3), __divsf3, GLIBC_2.2);
|
|
+
|
|
+extern int64_t __divdi3 (int64_t, int64_t) attribute_hidden;
|
|
+int64_t INTUSE (__divdi3) (int64_t x, int64_t y)
|
|
+{
|
|
+ return __divdi3 (x, y);
|
|
+}
|
|
+symbol_version (INTUSE (__divdi3), __divdi3, GLIBC_2.2);
|
|
+
|
|
+extern int64_t __moddi3 (int64_t, int64_t) attribute_hidden;
|
|
+int64_t INTUSE (__moddi3) (int64_t x, int64_t y)
|
|
+{
|
|
+ return __moddi3 (x, y);
|
|
+}
|
|
+symbol_version (INTUSE (__moddi3), __moddi3, GLIBC_2.2);
|
|
+
|
|
+extern uint64_t __udivdi3 (uint64_t, uint64_t) attribute_hidden;
|
|
+uint64_t INTUSE (__udivdi3) (uint64_t x, uint64_t y)
|
|
+{
|
|
+ return __udivdi3 (x, y);
|
|
+}
|
|
+symbol_version (INTUSE (__udivdi3), __udivdi3, GLIBC_2.2);
|
|
+
|
|
+extern uint64_t __umoddi3 (uint64_t, uint64_t) attribute_hidden;
|
|
+uint64_t INTUSE (__umoddi3) (uint64_t x, uint64_t y)
|
|
+{
|
|
+ return __umoddi3 (x, y);
|
|
+}
|
|
+symbol_version (INTUSE (__umoddi3), __umoddi3, GLIBC_2.2);
|
|
+
|
|
+extern int128_t __multi3 (int128_t, int128_t) attribute_hidden;
|
|
+int128_t INTUSE (__multi3) (int128_t x, int128_t y)
|
|
+{
|
|
+ return __multi3 (x, y);
|
|
+}
|
|
+symbol_version (INTUSE (__multi3), __multi3, GLIBC_2.2);
|
|
+
|
|
+#endif
|
|
--- glibc-2.11-175-gb34e12e/sysdeps/powerpc/powerpc64/Makefile
|
|
+++ glibc-2.11.90-11/sysdeps/powerpc/powerpc64/Makefile
|
|
@@ -30,6 +30,7 @@ ifneq ($(elf),no)
|
|
# we use -fpic instead which is much better.
|
|
CFLAGS-initfini.s += -fpic -O1
|
|
endif
|
|
+CFLAGS-libc-start.c += -fno-asynchronous-unwind-tables
|
|
endif
|
|
|
|
ifeq ($(subdir),elf)
|
|
--- glibc-2.11-175-gb34e12e/sysdeps/unix/nice.c
|
|
+++ glibc-2.11.90-11/sysdeps/unix/nice.c
|
|
@@ -42,7 +42,12 @@ nice (int incr)
|
|
__set_errno (save);
|
|
}
|
|
|
|
- result = setpriority (PRIO_PROCESS, 0, prio + incr);
|
|
+ prio += incr;
|
|
+ if (prio < PRIO_MIN)
|
|
+ prio = PRIO_MIN;
|
|
+ else if (prio >= PRIO_MAX)
|
|
+ prio = PRIO_MAX - 1;
|
|
+ result = setpriority (PRIO_PROCESS, 0, prio);
|
|
if (result == -1)
|
|
{
|
|
if (errno == EACCES)
|
|
--- glibc-2.11-175-gb34e12e/sysdeps/unix/sysv/linux/check_pf.c
|
|
+++ glibc-2.11.90-11/sysdeps/unix/sysv/linux/check_pf.c
|
|
@@ -27,13 +27,10 @@
|
|
#include <unistd.h>
|
|
#include <sys/socket.h>
|
|
|
|
-#include <asm/types.h>
|
|
-#include <linux/netlink.h>
|
|
-#include <linux/rtnetlink.h>
|
|
-
|
|
#include <not-cancel.h>
|
|
#include <kernel-features.h>
|
|
|
|
+#include "netlinkaccess.h"
|
|
|
|
#ifndef IFA_F_HOMEADDRESS
|
|
# define IFA_F_HOMEADDRESS 0
|
|
--- glibc-2.11-175-gb34e12e/sysdeps/unix/sysv/linux/dl-osinfo.h
|
|
+++ glibc-2.11.90-11/sysdeps/unix/sysv/linux/dl-osinfo.h
|
|
@@ -17,10 +17,13 @@
|
|
Software Foundation, Inc., 59 Temple Place, Suite 330, Boston, MA
|
|
02111-1307 USA. */
|
|
|
|
+#include <errno.h>
|
|
#include <kernel-features.h>
|
|
#include <dl-sysdep.h>
|
|
#include <fcntl.h>
|
|
#include <stdint.h>
|
|
+#include <hp-timing.h>
|
|
+#include <endian.h>
|
|
|
|
#ifndef MIN
|
|
# define MIN(a,b) (((a)<(b))?(a):(b))
|
|
@@ -80,6 +83,32 @@ _dl_setup_stack_chk_guard (void *dl_random)
|
|
unsigned char *p = (unsigned char *) &ret;
|
|
p[sizeof (ret) - 1] = 255;
|
|
p[sizeof (ret) - 2] = '\n';
|
|
+#ifdef HP_TIMING_NOW
|
|
+ hp_timing_t hpt;
|
|
+ HP_TIMING_NOW (hpt);
|
|
+ hpt = (hpt & 0xffff) << 8;
|
|
+ ret ^= hpt;
|
|
+#endif
|
|
+ uintptr_t stk;
|
|
+ /* Avoid GCC being too smart. */
|
|
+ asm ("" : "=r" (stk) : "r" (p));
|
|
+ stk &= 0x7ffff0;
|
|
+#if __BYTE_ORDER == __LITTLE_ENDIAN
|
|
+ stk <<= (__WORDSIZE - 23);
|
|
+#elif __WORDSIZE == 64
|
|
+ stk <<= 31;
|
|
+#endif
|
|
+ ret ^= stk;
|
|
+ /* Avoid GCC being too smart. */
|
|
+ p = (unsigned char *) &errno;
|
|
+ asm ("" : "=r" (stk) : "r" (p));
|
|
+ stk &= 0x7fff00;
|
|
+#if __BYTE_ORDER == __LITTLE_ENDIAN
|
|
+ stk <<= (__WORDSIZE - 29);
|
|
+#else
|
|
+ stk >>= 8;
|
|
+#endif
|
|
+ ret ^= stk;
|
|
}
|
|
else
|
|
#endif
|
|
--- glibc-2.11-175-gb34e12e/sysdeps/unix/sysv/linux/futimesat.c
|
|
+++ glibc-2.11.90-11/sysdeps/unix/sysv/linux/futimesat.c
|
|
@@ -37,14 +37,14 @@ futimesat (fd, file, tvp)
|
|
{
|
|
int result;
|
|
|
|
+ if (file == NULL)
|
|
+ return __futimes (fd, tvp);
|
|
+
|
|
#ifdef __NR_futimesat
|
|
# ifndef __ASSUME_ATFCTS
|
|
if (__have_atfcts >= 0)
|
|
# endif
|
|
{
|
|
- if (file == NULL)
|
|
- return __futimes (fd, tvp);
|
|
-
|
|
result = INLINE_SYSCALL (futimesat, 3, fd, file, tvp);
|
|
# ifndef __ASSUME_ATFCTS
|
|
if (result == -1 && errno == ENOSYS)
|
|
@@ -58,22 +58,7 @@ futimesat (fd, file, tvp)
|
|
#ifndef __ASSUME_ATFCTS
|
|
char *buf = NULL;
|
|
|
|
- if (file == NULL)
|
|
- {
|
|
- static const char procfd[] = "/proc/self/fd/%d";
|
|
- /* Buffer for the path name we are going to use. It consists of
|
|
- - the string /proc/self/fd/
|
|
- - the file descriptor number.
|
|
- The final NUL is included in the sizeof. A bit of overhead
|
|
- due to the format elements compensates for possible negative
|
|
- numbers. */
|
|
- size_t buflen = sizeof (procfd) + sizeof (int) * 3;
|
|
- buf = alloca (buflen);
|
|
-
|
|
- __snprintf (buf, buflen, procfd, fd);
|
|
- file = buf;
|
|
- }
|
|
- else if (fd != AT_FDCWD && file[0] != '/')
|
|
+ if (fd != AT_FDCWD && file[0] != '/')
|
|
{
|
|
size_t filelen = strlen (file);
|
|
if (__builtin_expect (filelen == 0, 0))
|
|
--- glibc-2.11-175-gb34e12e/sysdeps/unix/sysv/linux/i386/dl-cache.h
|
|
+++ glibc-2.11.90-11/sysdeps/unix/sysv/linux/i386/dl-cache.h
|
|
@@ -0,0 +1,59 @@
|
|
+/* Support for reading /etc/ld.so.cache files written by Linux ldconfig.
|
|
+ Copyright (C) 2004 Free Software Foundation, Inc.
|
|
+ This file is part of the GNU C Library.
|
|
+
|
|
+ The GNU C Library is free software; you can redistribute it and/or
|
|
+ modify it under the terms of the GNU Lesser General Public
|
|
+ License as published by the Free Software Foundation; either
|
|
+ version 2.1 of the License, or (at your option) any later version.
|
|
+
|
|
+ The GNU C Library is distributed in the hope that it will be useful,
|
|
+ but WITHOUT ANY WARRANTY; without even the implied warranty of
|
|
+ MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU
|
|
+ Lesser General Public License for more details.
|
|
+
|
|
+ You should have received a copy of the GNU Lesser General Public
|
|
+ License along with the GNU C Library; if not, write to the Free
|
|
+ Software Foundation, Inc., 59 Temple Place, Suite 330, Boston, MA
|
|
+ 02111-1307 USA. */
|
|
+
|
|
+static inline int
|
|
+is_ia64 (void)
|
|
+{
|
|
+ unsigned int fl1, fl2;
|
|
+
|
|
+ /* See if we can use cpuid. */
|
|
+ __asm__ ("pushfl; pushfl; popl %0; movl %0,%1; xorl %2,%0;"
|
|
+ "pushl %0; popfl; pushfl; popl %0; popfl"
|
|
+ : "=&r" (fl1), "=&r" (fl2)
|
|
+ : "i" (0x00200000));
|
|
+ if (((fl1 ^ fl2) & 0x00200000) == 0)
|
|
+ return 0;
|
|
+
|
|
+ /* Host supports cpuid. See if cpuid gives capabilities, try
|
|
+ CPUID(0). Preserve %ebx and %ecx; cpuid insn clobbers these, we
|
|
+ don't need their CPUID values here, and %ebx may be the PIC
|
|
+ register. */
|
|
+ __asm__ ("pushl %%ecx; pushl %%ebx; cpuid; popl %%ebx; popl %%ecx"
|
|
+ : "=a" (fl1) : "0" (0) : "edx", "cc");
|
|
+ if (fl1 == 0)
|
|
+ return 0;
|
|
+
|
|
+ /* Invoke CPUID(1) and report whether bit 30 of %edx is set; a
|
|
+ nonzero result makes arch_startup exec the 64-bit ldconfig. */
|
|
+ __asm__ ("pushl %%ecx; pushl %%ebx; cpuid; popl %%ebx; popl %%ecx"
|
|
+ : "=d" (fl2), "=a" (fl1) : "1" (1) : "cc");
|
|
+ return (fl2 & (1 << 30)) != 0;
|
|
+}
|
|
+
|
|
+#define arch_startup(argc, argv) \
|
|
+ do { \
|
|
+ /* On IA-64, try to execute 64-bit ldconfig if possible. \
|
|
+ This is because the badly designed /emul/ia32-linux hack \
|
|
+ will cause 32-bit ldconfig to do all sorts of weird things. */ \
|
|
+ if (is_ia64 ()) \
|
|
+ execv ("/emul/ia32-linux/../../sbin/ldconfig", \
|
|
+ (char *const *) argv); \
|
|
+ } while (0)
|
|
+
|
|
+#include_next <dl-cache.h>
|
|
--- glibc-2.11-175-gb34e12e/sysdeps/unix/sysv/linux/ia64/dl-cache.h
|
|
+++ glibc-2.11.90-11/sysdeps/unix/sysv/linux/ia64/dl-cache.h
|
|
@@ -22,4 +22,31 @@
|
|
#define _dl_cache_check_flags(flags) \
|
|
((flags) == _DL_CACHE_DEFAULT_ID)
|
|
|
|
+#define EMUL_HACK "/emul/ia32-linux"
|
|
+
|
|
+#define arch_startup(argc, argv) unlink (EMUL_HACK LD_SO_CACHE)
|
|
+
|
|
+#define add_arch_dirs(config_file) \
|
|
+ do { \
|
|
+ int save_verbose = opt_verbose; \
|
|
+ opt_verbose = 0; \
|
|
+ \
|
|
+ parse_conf (config_file, EMUL_HACK, true); \
|
|
+ \
|
|
+ /* Always add the standard search paths. */ \
|
|
+ add_system_dir (EMUL_HACK SLIBDIR); \
|
|
+ if (strcmp (SLIBDIR, LIBDIR)) \
|
|
+ add_system_dir (EMUL_HACK LIBDIR); \
|
|
+ \
|
|
+ char emul_config_file[strlen (config_file) \
|
|
+ + sizeof EMUL_HACK]; \
|
|
+ strcpy (mempcpy (emul_config_file, EMUL_HACK, \
|
|
+ strlen (EMUL_HACK)), config_file); \
|
|
+ \
|
|
+ if (! access (emul_config_file, R_OK)) \
|
|
+ parse_conf (emul_config_file, EMUL_HACK, true); \
|
|
+ \
|
|
+ opt_verbose = save_verbose; \
|
|
+ } while (0)
|
|
+
|
|
#include_next <dl-cache.h>
|
|
--- glibc-2.11-175-gb34e12e/sysdeps/unix/sysv/linux/ia64/dl-procinfo.c
|
|
+++ glibc-2.11.90-11/sysdeps/unix/sysv/linux/ia64/dl-procinfo.c
|
|
@@ -0,0 +1,5 @@
|
|
+#ifdef IS_IN_ldconfig
|
|
+#include <sysdeps/i386/dl-procinfo.c>
|
|
+#else
|
|
+#include <sysdeps/generic/dl-procinfo.c>
|
|
+#endif
|
|
--- glibc-2.11-175-gb34e12e/sysdeps/unix/sysv/linux/ia64/dl-procinfo.h
|
|
+++ glibc-2.11.90-11/sysdeps/unix/sysv/linux/ia64/dl-procinfo.h
|
|
@@ -0,0 +1,5 @@
|
|
+#ifdef IS_IN_ldconfig
|
|
+#include <sysdeps/unix/sysv/linux/i386/dl-procinfo.h>
|
|
+#else
|
|
+#include <sysdeps/generic/dl-procinfo.h>
|
|
+#endif
|
|
--- glibc-2.11-175-gb34e12e/sysdeps/unix/sysv/linux/ia64/ldd-rewrite.sed
|
|
+++ glibc-2.11.90-11/sysdeps/unix/sysv/linux/ia64/ldd-rewrite.sed
|
|
@@ -1 +1 @@
|
|
-s_^\(RTLDLIST=\)\([^ ]*\)-ia64\(\.so\.[0-9.]*\)[ ]*$_\1"\2-ia64\3 \2\3"_
|
|
+s_^\(RTLDLIST=\)\([^ ]*\)-ia64\(\.so\.[0-9.]*\)[ ]*$_\1"\2-ia64\3 /emul/ia32-linux\2\3"_
|
|
--- glibc-2.11-175-gb34e12e/sysdeps/unix/sysv/linux/netlinkaccess.h
|
|
+++ glibc-2.11.90-11/sysdeps/unix/sysv/linux/netlinkaccess.h
|
|
@@ -25,6 +25,24 @@
|
|
|
|
#include <kernel-features.h>
|
|
|
|
+#ifndef IFA_MAX
|
|
+/* 2.6.19 kernel headers helpfully removed some macros and
|
|
+ moved lots of stuff into new headers, some of which aren't
|
|
+ included by linux/rtnetlink.h. */
|
|
+#include <linux/if_addr.h>
|
|
+#endif
|
|
+
|
|
+#ifndef IFA_RTA
|
|
+# define IFA_RTA(r) \
|
|
+ ((struct rtattr*) ((char*)(r) + NLMSG_ALIGN (sizeof (struct ifaddrmsg))))
|
|
+# define IFA_PAYLOAD(n) NLMSG_PAYLOAD (n, sizeof (struct ifaddrmsg))
|
|
+#endif
|
|
+
|
|
+#ifndef IFLA_RTA
|
|
+# define IFLA_RTA(r) \
|
|
+ ((struct rtattr*) ((char*)(r) + NLMSG_ALIGN (sizeof (struct ifinfomsg))))
|
|
+# define IFLA_PAYLOAD(n) NLMSG_PAYLOAD (n, sizeof (struct ifinfomsg))
|
|
+#endif
|
|
|
|
struct netlink_res
|
|
{
|
|
--- glibc-2.11-175-gb34e12e/sysdeps/unix/sysv/linux/paths.h
|
|
+++ glibc-2.11.90-11/sysdeps/unix/sysv/linux/paths.h
|
|
@@ -62,7 +62,7 @@
|
|
#define _PATH_TTY "/dev/tty"
|
|
#define _PATH_UNIX "/boot/vmlinux"
|
|
#define _PATH_UTMP "/var/run/utmp"
|
|
-#define _PATH_VI "/usr/bin/vi"
|
|
+#define _PATH_VI "/bin/vi"
|
|
#define _PATH_WTMP "/var/log/wtmp"
|
|
|
|
/* Provide trailing slash, since mostly used for building pathnames. */
|
|
--- glibc-2.11-175-gb34e12e/sysdeps/unix/sysv/linux/tcsetattr.c
|
|
+++ glibc-2.11.90-11/sysdeps/unix/sysv/linux/tcsetattr.c
|
|
@@ -49,6 +49,7 @@ tcsetattr (fd, optional_actions, termios_p)
|
|
{
|
|
struct __kernel_termios k_termios;
|
|
unsigned long int cmd;
|
|
+ int retval;
|
|
|
|
switch (optional_actions)
|
|
{
|
|
@@ -80,6 +81,35 @@ tcsetattr (fd, optional_actions, termios_p)
|
|
memcpy (&k_termios.c_cc[0], &termios_p->c_cc[0],
|
|
__KERNEL_NCCS * sizeof (cc_t));
|
|
|
|
- return INLINE_SYSCALL (ioctl, 3, fd, cmd, &k_termios);
|
|
+ retval = INLINE_SYSCALL (ioctl, 3, fd, cmd, &k_termios);
|
|
+
|
|
+ if (retval == 0 && cmd == TCSETS)
|
|
+ {
|
|
+ /* The Linux kernel has a bug which silently ignores the invalid
|
|
+ c_cflag on pty. We have to check it here. */
|
|
+ int save = errno;
|
|
+ retval = INLINE_SYSCALL (ioctl, 3, fd, TCGETS, &k_termios);
|
|
+ if (retval)
|
|
+ {
|
|
+ /* We cannot verify if the setting is ok. We don't return
|
|
+ an error (?). */
|
|
+ __set_errno (save);
|
|
+ retval = 0;
|
|
+ }
|
|
+ else if ((termios_p->c_cflag & (PARENB | CREAD))
|
|
+ != (k_termios.c_cflag & (PARENB | CREAD))
|
|
+ || ((termios_p->c_cflag & CSIZE)
|
|
+ && ((termios_p->c_cflag & CSIZE)
|
|
+ != (k_termios.c_cflag & CSIZE))))
|
|
+ {
|
|
+ /* It looks like the Linux kernel silently changed the
|
|
+ PARENB/CREAD/CSIZE bits in c_cflag. Report it as an
|
|
+ error. */
|
|
+ __set_errno (EINVAL);
|
|
+ retval = -1;
|
|
+ }
|
|
+ }
|
|
+
|
|
+ return retval;
|
|
}
|
|
libc_hidden_def (tcsetattr)
|
|
--- glibc-2.11-175-gb34e12e/sysdeps/x86_64/cacheinfo.c
|
|
+++ glibc-2.11.90-11/sysdeps/x86_64/cacheinfo.c
|
|
@@ -74,7 +74,6 @@ static const struct intel_02_cache_info
|
|
{ 0x0a, 2, 32, M(_SC_LEVEL1_DCACHE_SIZE), 8192 },
|
|
{ 0x0c, 4, 32, M(_SC_LEVEL1_DCACHE_SIZE), 16384 },
|
|
{ 0x0d, 4, 64, M(_SC_LEVEL1_DCACHE_SIZE), 16384 },
|
|
- { 0x0e, 6, 64, M(_SC_LEVEL1_DCACHE_SIZE), 24576 },
|
|
{ 0x21, 8, 64, M(_SC_LEVEL2_CACHE_SIZE), 262144 },
|
|
{ 0x22, 4, 64, M(_SC_LEVEL3_CACHE_SIZE), 524288 },
|
|
{ 0x23, 8, 64, M(_SC_LEVEL3_CACHE_SIZE), 1048576 },
|
|
@@ -114,7 +113,6 @@ static const struct intel_02_cache_info
|
|
{ 0x7c, 8, 64, M(_SC_LEVEL2_CACHE_SIZE), 1048576 },
|
|
{ 0x7d, 8, 64, M(_SC_LEVEL2_CACHE_SIZE), 2097152 },
|
|
{ 0x7f, 2, 64, M(_SC_LEVEL2_CACHE_SIZE), 524288 },
|
|
- { 0x80, 8, 64, M(_SC_LEVEL2_CACHE_SIZE), 524288 },
|
|
{ 0x82, 8, 32, M(_SC_LEVEL2_CACHE_SIZE), 262144 },
|
|
{ 0x83, 8, 32, M(_SC_LEVEL2_CACHE_SIZE), 524288 },
|
|
{ 0x84, 8, 32, M(_SC_LEVEL2_CACHE_SIZE), 1048576 },
|
|
@@ -454,10 +452,9 @@ __cache_sysconf (int name)
|
|
}
|
|
|
|
|
|
-/* Data cache size for use in memory and string routines, typically
|
|
+/* Half the data cache size for use in memory and string routines, typically
|
|
L1 size. */
|
|
long int __x86_64_data_cache_size_half attribute_hidden = 32 * 1024 / 2;
|
|
-long int __x86_64_data_cache_size attribute_hidden = 32 * 1024;
|
|
/* Shared cache size for use in memory and string routines, typically
|
|
L2 or L3 size. */
|
|
long int __x86_64_shared_cache_size_half attribute_hidden = 1024 * 1024 / 2;
|
|
@@ -660,10 +657,7 @@ init_cacheinfo (void)
|
|
}
|
|
|
|
if (data > 0)
|
|
- {
|
|
- __x86_64_data_cache_size_half = data / 2;
|
|
- __x86_64_data_cache_size = data;
|
|
- }
|
|
+ __x86_64_data_cache_size_half = data / 2;
|
|
|
|
if (shared > 0)
|
|
{
|
|
--- glibc-2.11-175-gb34e12e/sysdeps/x86_64/multiarch/ifunc-defines.sym
|
|
+++ glibc-2.11.90-11/sysdeps/x86_64/multiarch/ifunc-defines.sym
|
|
@@ -13,8 +13,5 @@ CPUID_ECX_OFFSET offsetof (struct cpuid_registers, ecx)
|
|
CPUID_EDX_OFFSET offsetof (struct cpuid_registers, edx)
|
|
FAMILY_OFFSET offsetof (struct cpu_features, family)
|
|
MODEL_OFFSET offsetof (struct cpu_features, model)
|
|
-FEATURE_OFFSET offsetof (struct cpu_features, feature)
|
|
-FEATURE_SIZE sizeof (unsigned int)
|
|
|
|
COMMON_CPUID_INDEX_1
|
|
-FEATURE_INDEX_1
|
|
--- glibc-2.11-175-gb34e12e/sysdeps/x86_64/multiarch/init-arch.c
|
|
+++ glibc-2.11.90-11/sysdeps/x86_64/multiarch/init-arch.c
|
|
@@ -64,23 +64,7 @@ __init_cpu_features (void)
|
|
__cpu_features.model += extended_model;
|
|
}
|
|
else if (__cpu_features.family == 0x06)
|
|
- {
|
|
- __cpu_features.model += extended_model;
|
|
- switch (__cpu_features.model)
|
|
- {
|
|
- case 0x1a:
|
|
- case 0x1e:
|
|
- case 0x1f:
|
|
- case 0x25:
|
|
- case 0x2e:
|
|
- case 0x2f:
|
|
- /* Rep string instructions are fast on Intel Core i3, i5
|
|
- and i7. */
|
|
- __cpu_features.feature[index_Fast_Rep_String]
|
|
- |= bit_Fast_Rep_String;
|
|
- break;
|
|
- }
|
|
- }
|
|
+ __cpu_features.model += extended_model;
|
|
}
|
|
/* This spells out "AuthenticAMD". */
|
|
else if (ebx == 0x68747541 && ecx == 0x444d4163 && edx == 0x69746e65)
|
|
--- glibc-2.11-175-gb34e12e/sysdeps/x86_64/multiarch/init-arch.h
|
|
+++ glibc-2.11.90-11/sysdeps/x86_64/multiarch/init-arch.h
|
|
@@ -16,8 +16,6 @@
|
|
Software Foundation, Inc., 59 Temple Place, Suite 330, Boston, MA
|
|
02111-1307 USA. */
|
|
|
|
-#define bit_Fast_Rep_String (1 << 0)
|
|
-
|
|
#ifdef __ASSEMBLER__
|
|
|
|
#include <ifunc-defines.h>
|
|
@@ -30,8 +28,6 @@
|
|
#define index_SSSE3 COMMON_CPUID_INDEX_1*CPUID_SIZE+CPUID_ECX_OFFSET
|
|
#define index_SSE4_2 COMMON_CPUID_INDEX_1*CPUID_SIZE+CPUID_ECX_OFFSET
|
|
|
|
-#define index_Fast_Rep_String FEATURE_INDEX_1*FEATURE_SIZE
|
|
-
|
|
#else /* __ASSEMBLER__ */
|
|
|
|
#include <sys/param.h>
|
|
@@ -43,13 +39,6 @@ enum
|
|
COMMON_CPUID_INDEX_MAX
|
|
};
|
|
|
|
-enum
|
|
- {
|
|
- FEATURE_INDEX_1 = 0,
|
|
- /* Keep the following line at the end. */
|
|
- FEATURE_INDEX_MAX
|
|
- };
|
|
-
|
|
extern struct cpu_features
|
|
{
|
|
enum
|
|
@@ -69,7 +58,6 @@ extern struct cpu_features
|
|
} cpuid[COMMON_CPUID_INDEX_MAX];
|
|
unsigned int family;
|
|
unsigned int model;
|
|
- unsigned int feature[FEATURE_INDEX_MAX];
|
|
} __cpu_features attribute_hidden;
|
|
|
|
|
|
@@ -98,6 +86,4 @@ extern const struct cpu_features *__get_cpu_features (void)
|
|
#define HAS_SSE4_2 HAS_CPU_FEATURE (COMMON_CPUID_INDEX_1, ecx, 20)
|
|
#define HAS_FMA HAS_CPU_FEATURE (COMMON_CPUID_INDEX_1, ecx, 12)
|
|
|
|
-#define index_Fast_Rep_String FEATURE_INDEX_1
|
|
-
|
|
#endif /* __ASSEMBLER__ */
|
|
--- glibc-2.11-175-gb34e12e/timezone/zic.c
|
|
+++ glibc-2.11.90-11/timezone/zic.c
|
|
@@ -1921,7 +1921,7 @@ const int zonecount;
|
|
if (stdrp != NULL && stdrp->r_hiyear == 2037)
|
|
return;
|
|
}
|
|
- if (stdrp == NULL && zp->z_nrules != 0)
|
|
+ if (stdrp == NULL && (zp->z_nrules != 0 || zp->z_stdoff != 0))
|
|
return;
|
|
abbrvar = (stdrp == NULL) ? "" : stdrp->r_abbrvar;
|
|
doabbr(result, zp->z_format, abbrvar, FALSE, TRUE);
|