glibc/SOURCES/power6emul.c

/* Emulate power6 mf[tf]gpr and fri[zpmn] instructions.
   Copyright (C) 2006 Red Hat, Inc.
   Contributed by Jakub Jelinek <jakub@redhat.com>, 2006.

   This library is free software; you can redistribute it and/or
   modify it under the terms of the GNU Lesser General Public
   License as published by the Free Software Foundation; either
   version 2.1 of the License, or (at your option) any later version.

   It is distributed in the hope that it will be useful,
   but WITHOUT ANY WARRANTY; without even the implied warranty of
   MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the GNU
   Lesser General Public License for more details.

   You should have received a copy of the GNU Lesser General Public
   License along with the GNU C Library; if not, write to the Free
   Software Foundation, Inc., 59 Temple Place, Suite 330, Boston, MA
   02111-1307 USA.  */

#include <signal.h>
#include <stdio.h>

/* Software versions of the POWER6 round-to-integer instructions, written
   as top-level assembly.  Each routine takes its operand in f1 and leaves
   the result in f1; the symbols are global but hidden.

   All four share one scheme: values whose magnitude is not below 2^52
   (including NaNs, which fail the "less than" test) are returned
   unchanged; otherwise 2^52 is added and subtracted again under a
   temporarily selected rounding mode, the sign of the operand is forced
   back onto the result, and the FPSCR field that holds the rounding mode
   is restored from the copy saved on entry.
   NOTE(review): the rounding-mode values passed to mtfsfi (1 = toward
   zero, 2 = toward +infinity, 3 = toward -infinity) follow the Power ISA
   FPSCR[RN] encoding -- confirm against the ISA manual.  */
extern double frip (double), friz (double), frin (double), frim (double);
asm (".globl frip, friz, frin, frim\n.hidden frip, friz, frin, frim\n\t"
/* Shared constants: local label 8 is 2^52 and local label 9 is 0.5.  They
   are doubles in the TOC on 64-bit and single-precision words in .rodata
   on 32-bit.  */
#ifdef __powerpc64__
	".section \".toc\",\"aw\"\n"
"8:"	".tc FD_43300000_0[TC],0x4330000000000000\n"
"9:"	".tc FD_3fe00000_0[TC],0x3fe0000000000000\n\t"
	".previous\n\t"
#else
	".rodata\n\t"
	".align 2\n"
"8:"	".long 0x59800000\n"
"9:"	".long 0x3f000000\n\t"
	".previous\n\t"
#endif
	"# frip == ceil\n"
/* f11 keeps the FPSCR as it was on entry.  */
"frip:"	"mffs    11\n\t"
#ifdef __powerpc64__
	"lfd     13,8b@toc(2)\n\t"
#else
/* 32-bit: find the constant PC-relatively.  LR is parked in r11 (a GPR,
   distinct from f11 above) around the bcl and put back afterwards.  */
	"mflr    11\n\t"
	"bcl     20,31,1f\n"
"1:"	"mflr    9\n\t"
	"addis   9,9,8b-1b@ha\n\t"
	"lfs     13,8b-1b@l(9)\n\t"
	"mtlr    11\n\t"
#endif
/* f0 = |x|, f12 = 0.0; cr7 compares |x| with 2^52, cr6 compares x with 0.  */
	"fabs    0,1\n\t"
	"fsub    12,13,13\n\t"
	"fcmpu   7,0,13\n\t"
	"fcmpu   6,1,12\n\t"
/* Return x untouched unless |x| < 2^52.  */
	"bnllr-  7\n\t"
	"mtfsfi  7,2\n\t"
	"ble-    6,2f\n\t"
/* x > 0: (x + 2^52) - 2^52, result forced non-negative.  */
	"fadd    1,1,13\n\t"
	"fsub    1,1,13\n\t"
	"fabs    1,1\n\t"
	"mtfsf   0x01,11\n\t"
	"blr\n"
/* x <= 0: a zero skips straight to the exit; a negative x gets
   (x - 2^52) + 2^52 with the result forced negative.  */
"2:"	"bge-    6,3f\n\t"
	"fsub    1,1,13\n\t"
	"fadd    1,1,13\n\t"
	"fnabs   1,1\n"
"3:"	"mtfsf   0x01,11\n\t"
	"blr\n\t"
	"# friz == trunc\n"
/* Same sequence as frip, but with rounding mode 1.  */
"friz:"	"mffs    11\n\t"
#ifdef __powerpc64__
	"lfd     13,8b@toc(2)\n\t"
#else
	"mflr    11\n\t"
	"bcl     20,31,1f\n"
"1:"	"mflr    9\n\t"
	"addis   9,9,8b-1b@ha\n\t"
	"lfs     13,8b-1b@l(9)\n\t"
	"mtlr    11\n\t"
#endif
	"fabs    0,1\n\t"
	"fsub    12,13,13\n\t"
	"fcmpu   7,0,13\n\t"
	"fcmpu   6,1,12\n\t"
	"bnllr-  7\n\t"
	"mtfsfi  7,1\n\t"
	"ble-    6,2f\n\t"
	"fadd    1,1,13\n\t"
	"fsub    1,1,13\n\t"
	"fabs    1,1\n\t"
	"mtfsf   0x01,11\n\t"
	"blr\n"
"2:"	"bge-    6,3f\n\t"
	"fsub    1,1,13\n\t"
	"fadd    1,1,13\n\t"
	"fnabs   1,1\n"
"3:"	"mtfsf   0x01,11\n\t"
	"blr\n\t"
	"# frin == round\n"
/* Like friz (rounding mode 1), except that 0.5 (loaded into f10) is first
   added to a positive operand or subtracted from a negative one.  On
   32-bit, r9 is left pointing at label 8 so that label 9 can be reached at
   offset 9b-8b.  */
"frin:"	"mffs    11\n\t"
#ifdef __powerpc64__
	"lfd     13,8b@toc(2)\n\t"
#else
	"mflr    11\n\t"
	"bcl     20,31,1f\n"
"1:"	"mflr    9\n\t"
	"addis   9,9,8b-1b@ha\n\t"
	"addi    9,9,8b-1b@l\n\t"
	"mtlr    11\n\t"
	"lfs     13,0(9)\n\t"
#endif
	"fabs    0,1\n\t"
	"fsub    12,13,13\n\t"
	"fcmpu   7,0,13\n\t"
	"fcmpu   6,1,12\n\t"
	"bnllr-  7\n\t"
	"mtfsfi  7,1\n\t"
#ifdef __powerpc64__
	"lfd     10,9b@toc(2)\n\t"
#else
	"lfs     10,9b-8b(9)\n\t"
#endif
	"ble-    6,2f\n\t"
	"fadd    1,1,10\n\t"
	"fadd    1,1,13\n\t"
	"fsub    1,1,13\n\t"
	"fabs    1,1\n\t"
	"mtfsf   0x01,11\n\t"
	"blr\n"
/* f9 = x - 0.5 is computed before the zero test; it is only used on the
   negative path, so a zero operand is still returned unchanged.  */
"2:"	"fsub    9,1,10\n\t"
	"bge-    6,3f\n\t"
	"fsub    1,9,13\n\t"
	"fadd    1,1,13\n\t"
	"fnabs   1,1\n"
"3:"	"mtfsf   0x01,11\n\t"
	"blr\n\t"
	"# frim == floor\n"
/* Same sequence as frip, but with rounding mode 3.  */
"frim:"	"mffs    11\n\t"
#ifdef __powerpc64__
	"lfd     13,8b@toc(2)\n\t"
#else
	"mflr    11\n\t"
	"bcl     20,31,1f\n"
"1:"	"mflr    9\n\t"
	"addis   9,9,8b-1b@ha\n\t"
	"lfs     13,8b-1b@l(9)\n\t"
	"mtlr    11\n\t"
#endif
	"fabs    0,1\n\t"
	"fsub    12,13,13\n\t"
	"fcmpu   7,0,13\n\t"
	"fcmpu   6,1,12\n\t"
	"bnllr-  7\n\t"
	"mtfsfi  7,3\n\t"
	"ble-    6,2f\n\t"
	"fadd    1,1,13\n\t"
	"fsub    1,1,13\n\t"
	"fabs    1,1\n\t"
	"mtfsf   0x01,11\n\t"
	"blr\n"
"2:"	"bge-    6,3f\n\t"
	"fsub    1,1,13\n\t"
	"fadd    1,1,13\n\t"
	"fnabs   1,1\n"
"3:"	"mtfsf   0x01,11\n\t"
	"blr\n");

/* Bit masks for the per-byte population count below: alternating single
   bits, bit pairs and nibbles, at the width selected by the target.  */
#ifdef __powerpc64__
#define m1 0x5555555555555555L
#define m2 0x3333333333333333L
#define m3 0x0f0f0f0f0f0f0f0fL
#else
#define m1 0x55555555
#define m2 0x33333333
#define m3 0x0f0f0f0f
#endif

/* Software equivalent of the popcntb instruction: every byte of the
   return value holds the number of set bits found in the byte at the
   same position in N.  */
static inline unsigned long
popcntb (unsigned long n)
{
  /* Counts per 2-bit group.  */
  unsigned long pairs = n - ((n >> 1) & m1);
  /* Counts per 4-bit group.  */
  unsigned long quads = (pairs & m2) + ((pairs >> 2) & m2);
  /* Fold neighbouring nibbles so each byte carries its own total.  */
  return (quads + (quads >> 4)) & m3;
}

/* SIGILL handler that emulates a few POWER6 instructions in software.

   SIGNAL is the number of the signal being handled and CTX is the
   interrupted context handed to the handler.  The instruction word at
   ctx->regs->nip is decoded; if it is mftgpr or mffgpr (64-bit builds
   only), one of fri[npzm], or popcntb, its effect is applied to the saved
   register image and nip is advanced by 4 so that execution resumes
   after the emulated instruction.  For any other instruction the default
   disposition of SIGNAL is reinstated and the signal is raised again.

   NOTE(review): the register accesses treat the memory at ctx->regs as
   an array of register-sized slots in which FPR n lives 0x30 slots (GPR
   sized) past the start, followed by 32 eight-byte FPRs and then the
   FPSCR image -- confirm against the kernel's signal frame layout.  */
static void
catch_sigill (int signal, struct sigcontext *ctx)
{
  /* The instruction that caused the trap.  */
  unsigned int insn = *(unsigned int *) (ctx->regs->nip);
#ifdef __powerpc64__
  if ((insn & 0xfc1f07ff) == 0x7c0005be) /* mftgpr */
    {
      /* Copy the raw 64-bit image of an FPR into a GPR.  */
      unsigned long *regs = (unsigned long *) ctx->regs;
      unsigned fpr = (insn >> 11) & 0x1f;
      unsigned gpr = (insn >> 21) & 0x1f;
      regs[gpr] = regs[fpr + 0x30];
      ctx->regs->nip += 4;
      return;
    }
  if ((insn & 0xfc1f07ff) == 0x7c0004be) /* mffgpr */
    {
      /* Copy the raw 64-bit image of a GPR into an FPR.  */
      unsigned long *regs = (unsigned long *) ctx->regs;
      unsigned fpr = (insn >> 21) & 0x1f;
      unsigned gpr = (insn >> 11) & 0x1f;
      regs[fpr + 0x30] = regs[gpr];
      ctx->regs->nip += 4;
      return;
    }
#endif
  if ((insn & 0xfc1f073f) == 0xfc000310) /* fri[pznm] */
    {
      /* REGS addresses the saved FPRs as doubles; FPSCR addresses the
	 second 32-bit word of the slot that follows them.  */
#ifdef __powerpc64__
      double *regs = (double *) (((char *) ctx->regs) + 0x30 * 8);
      unsigned int *fpscr = (unsigned int *) (((char *) ctx->regs) + 0x50 * 8 + 4);
#else
      double *regs = (double *) (((char *) ctx->regs) + 0x30 * 4);
      unsigned int *fpscr = (unsigned int *) (((char *) ctx->regs) + 0x30 * 4 + 0x20 * 8 + 4);
#endif
      unsigned dest = (insn >> 21) & 0x1f;
      unsigned src = (insn >> 11) & 0x1f;
      /* Bits 0xc0 of the opcode select the rounding variant; all four
	 possible values are handled.  */
      switch (insn & 0xc0)
	{
	case 0:
	  regs[dest] = frin (regs[src]);
	  break;
	case 0x40:
	  regs[dest] = friz (regs[src]);
	  break;
	case 0x80:
	  regs[dest] = frip (regs[src]);
	  break;
	case 0xc0:
	  regs[dest] = frim (regs[src]);
	  break;
	}
      /* Update raised exceptions: read the live FPSCR, keep only its top
	 15 bits and OR them into the saved copy.
	 NOTE(review): taking u.i[1] as the word that holds the FPSCR
	 assumes big-endian word order -- confirm.  */
      union { unsigned int i[2]; double d; } u;
      asm volatile ("mffs %0" : "=f" (u.d));
      u.i[1] &= 0xfffe0000; /* Is this correct?  */
      *fpscr |= u.i[1];
      ctx->regs->nip += 4;
      return;
    }
  if ((insn & 0xfc00ffff) == 0x7c0000f4) /* popcntb */
    {
      /* The destination index comes from bits 16-20 of the instruction
	 word and the source index from bits 21-25.  */
      unsigned long *regs = (unsigned long *) ctx->regs;
      unsigned dest = (insn >> 16) & 0x1f;
      unsigned src = (insn >> 21) & 0x1f;

      regs[dest] = popcntb (regs[src]);
      ctx->regs->nip += 4;
      return;
    }

  /* Not an instruction we emulate: put the default action back and
     re-raise the signal.  */
  struct sigaction sa;
  sa.sa_handler = SIG_DFL;
  sigemptyset (&sa.sa_mask);
  sa.sa_flags = 0;
  sigaction (signal, &sa, NULL);
  raise (signal);
}

static void
__attribute__ ((constructor))
install_handler (void)
{
  struct sigaction sa;
  sa.sa_handler = (void *) catch_sigill;
  sigemptyset (&sa.sa_mask);
  sa.sa_flags = SA_RESTART;
  sigaction (SIGILL, &sa, NULL);
}
import glibc-2.28-158.el8 2021-04-23 04:11:25 +00:00			`/* Emulate power6 mf[tf]gpr and fri[zpmn] instructions.`
			`Copyright (C) 2006 Red Hat, Inc.`
			`Contributed by Jakub Jelinek <jakub@redhat.com>, 2006.`

			`This library is free software; you can redistribute it and/or`
			`modify it under the terms of the GNU Lesser General Public`
			`License as published by the Free Software Foundation; either`
			`version 2.1 of the License, or (at your option) any later version.`

			`It is distributed in the hope that it will be useful,`
			`but WITHOUT ANY WARRANTY; without even the implied warranty of`
			`MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU`
			`Lesser General Public License for more details.`

			`You should have received a copy of the GNU Lesser General Public`
			`License along with the GNU C Library; if not, write to the Free`
			`Software Foundation, Inc., 59 Temple Place, Suite 330, Boston, MA`
			`02111-1307 USA. */`

			`#include <signal.h>`
			`#include <stdio.h>`

			`extern double frip (double), friz (double), frin (double), frim (double);`
			`asm (".globl frip, friz, frin, frim\n.hidden frip, friz, frin, frim\n\t"`
			`#ifdef __powerpc64__`
			`".section \".toc\",\"aw\"\n"`
			`"8:" ".tc FD_43300000_0[TC],0x4330000000000000\n"`
			`"9:" ".tc FD_3fe00000_0[TC],0x3fe0000000000000\n\t"`
			`".previous\n\t"`
			`#else`
			`".rodata\n\t"`
			`".align 2\n"`
			`"8:" ".long 0x59800000\n"`
			`"9:" ".long 0x3f000000\n\t"`
			`".previous\n\t"`
			`#endif`
			`"# frip == ceil\n"`
			`"frip:" "mffs 11\n\t"`
			`#ifdef __powerpc64__`
			`"lfd 13,8b@toc(2)\n\t"`
			`#else`
			`"mflr 11\n\t"`
			`"bcl 20,31,1f\n"`
			`"1:" "mflr 9\n\t"`
			`"addis 9,9,8b-1b@ha\n\t"`
			`"lfs 13,8b-1b@l(9)\n\t"`
			`"mtlr 11\n\t"`
			`#endif`
			`"fabs 0,1\n\t"`
			`"fsub 12,13,13\n\t"`
			`"fcmpu 7,0,13\n\t"`
			`"fcmpu 6,1,12\n\t"`
			`"bnllr- 7\n\t"`
			`"mtfsfi 7,2\n\t"`
			`"ble- 6,2f\n\t"`
			`"fadd 1,1,13\n\t"`
			`"fsub 1,1,13\n\t"`
			`"fabs 1,1\n\t"`
			`"mtfsf 0x01,11\n\t"`
			`"blr\n"`
			`"2:" "bge- 6,3f\n\t"`
			`"fsub 1,1,13\n\t"`
			`"fadd 1,1,13\n\t"`
			`"fnabs 1,1\n"`
			`"3:" "mtfsf 0x01,11\n\t"`
			`"blr\n\t"`
			`"# friz == trunc\n"`
			`"friz:" "mffs 11\n\t"`
			`#ifdef __powerpc64__`
			`"lfd 13,8b@toc(2)\n\t"`
			`#else`
			`"mflr 11\n\t"`
			`"bcl 20,31,1f\n"`
			`"1:" "mflr 9\n\t"`
			`"addis 9,9,8b-1b@ha\n\t"`
			`"lfs 13,8b-1b@l(9)\n\t"`
			`"mtlr 11\n\t"`
			`#endif`
			`"fabs 0,1\n\t"`
			`"fsub 12,13,13\n\t"`
			`"fcmpu 7,0,13\n\t"`
			`"fcmpu 6,1,12\n\t"`
			`"bnllr- 7\n\t"`
			`"mtfsfi 7,1\n\t"`
			`"ble- 6,2f\n\t"`
			`"fadd 1,1,13\n\t"`
			`"fsub 1,1,13\n\t"`
			`"fabs 1,1\n\t"`
			`"mtfsf 0x01,11\n\t"`
			`"blr\n"`
			`"2:" "bge- 6,3f\n\t"`
			`"fsub 1,1,13\n\t"`
			`"fadd 1,1,13\n\t"`
			`"fnabs 1,1\n"`
			`"3:" "mtfsf 0x01,11\n\t"`
			`"blr\n\t"`
			`"# frin == round\n"`
			`"frin:" "mffs 11\n\t"`
			`#ifdef __powerpc64__`
			`"lfd 13,8b@toc(2)\n\t"`
			`#else`
			`"mflr 11\n\t"`
			`"bcl 20,31,1f\n"`
			`"1:" "mflr 9\n\t"`
			`"addis 9,9,8b-1b@ha\n\t"`
			`"addi 9,9,8b-1b@l\n\t"`
			`"mtlr 11\n\t"`
			`"lfs 13,0(9)\n\t"`
			`#endif`
			`"fabs 0,1\n\t"`
			`"fsub 12,13,13\n\t"`
			`"fcmpu 7,0,13\n\t"`
			`"fcmpu 6,1,12\n\t"`
			`"bnllr- 7\n\t"`
			`"mtfsfi 7,1\n\t"`
			`#ifdef __powerpc64__`
			`"lfd 10,9b@toc(2)\n\t"`
			`#else`
			`"lfs 10,9b-8b(9)\n\t"`
			`#endif`
			`"ble- 6,2f\n\t"`
			`"fadd 1,1,10\n\t"`
			`"fadd 1,1,13\n\t"`
			`"fsub 1,1,13\n\t"`
			`"fabs 1,1\n\t"`
			`"mtfsf 0x01,11\n\t"`
			`"blr\n"`
			`"2:" "fsub 9,1,10\n\t"`
			`"bge- 6,3f\n\t"`
			`"fsub 1,9,13\n\t"`
			`"fadd 1,1,13\n\t"`
			`"fnabs 1,1\n"`
			`"3:" "mtfsf 0x01,11\n\t"`
			`"blr\n\t"`
			`"# frim == floor\n"`
			`"frim:" "mffs 11\n\t"`
			`#ifdef __powerpc64__`
			`"lfd 13,8b@toc(2)\n\t"`
			`#else`
			`"mflr 11\n\t"`
			`"bcl 20,31,1f\n"`
			`"1:" "mflr 9\n\t"`
			`"addis 9,9,8b-1b@ha\n\t"`
			`"lfs 13,8b-1b@l(9)\n\t"`
			`"mtlr 11\n\t"`
			`#endif`
			`"fabs 0,1\n\t"`
			`"fsub 12,13,13\n\t"`
			`"fcmpu 7,0,13\n\t"`
			`"fcmpu 6,1,12\n\t"`
			`"bnllr- 7\n\t"`
			`"mtfsfi 7,3\n\t"`
			`"ble- 6,2f\n\t"`
			`"fadd 1,1,13\n\t"`
			`"fsub 1,1,13\n\t"`
			`"fabs 1,1\n\t"`
			`"mtfsf 0x01,11\n\t"`
			`"blr\n"`
			`"2:" "bge- 6,3f\n\t"`
			`"fsub 1,1,13\n\t"`
			`"fadd 1,1,13\n\t"`
			`"fnabs 1,1\n"`
			`"3:" "mtfsf 0x01,11\n\t"`
			`"blr\n");`

			`#ifdef __powerpc64__`
			`#define m1 0x5555555555555555L`
			`#define m2 0x3333333333333333L`
			`#define m3 0x0f0f0f0f0f0f0f0fL`
			`#else`
			`#define m1 0x55555555`
			`#define m2 0x33333333`
			`#define m3 0x0f0f0f0f`
			`#endif`

			`static inline unsigned long`
			`popcntb (unsigned long n)`
			`{`
			`n -= (n >> 1) & m1;`
			`n = (n & m2) + ((n >> 2) & m2);`
			`n = (n + (n >> 4)) & m3;`
			`return n;`
			`}`

			`static void`
			`catch_sigill (int signal, struct sigcontext *ctx)`
			`{`
			`unsigned int insn = *(unsigned int *) (ctx->regs->nip);`
			`#ifdef __powerpc64__`
			`if ((insn & 0xfc1f07ff) == 0x7c0005be) /* mftgpr */`
			`{`
			`unsigned long *regs = (unsigned long *) ctx->regs;`
			`unsigned fpr = (insn >> 11) & 0x1f;`
			`unsigned gpr = (insn >> 21) & 0x1f;`
			`regs[gpr] = regs[fpr + 0x30];`
			`ctx->regs->nip += 4;`
			`return;`
			`}`
			`if ((insn & 0xfc1f07ff) == 0x7c0004be) /*mffgpr */`
			`{`
			`unsigned long *regs = (unsigned long *) ctx->regs;`
			`unsigned fpr = (insn >> 21) & 0x1f;`
			`unsigned gpr = (insn >> 11) & 0x1f;`
			`regs[fpr + 0x30] = regs[gpr];`
			`ctx->regs->nip += 4;`
			`return;`
			`}`
			`#endif`
			`if ((insn & 0xfc1f073f) == 0xfc000310) /* fri[pznm] */`
			`{`
			`#ifdef __powerpc64__`
			`double *regs = (double *) (((char *) ctx->regs) + 0x30 * 8);`
			`unsigned int *fpscr = (unsigned int *) (((char *) ctx->regs) + 0x50 * 8 + 4);`
			`#else`
			`double *regs = (double *) (((char *) ctx->regs) + 0x30 * 4);`
			`unsigned int *fpscr = (unsigned int *) (((char *) ctx->regs) + 0x30 * 4 + 0x20 * 8 + 4);`
			`#endif`
			`unsigned dest = (insn >> 21) & 0x1f;`
			`unsigned src = (insn >> 11) & 0x1f;`
			`switch (insn & 0xc0)`
			`{`
			`case 0:`
			`regs[dest] = frin (regs[src]);`
			`break;`
			`case 0x40:`
			`regs[dest] = friz (regs[src]);`
			`break;`
			`case 0x80:`
			`regs[dest] = frip (regs[src]);`
			`break;`
			`case 0xc0:`
			`regs[dest] = frim (regs[src]);`
			`break;`
			`}`
			`/* Update raised exceptions. */`
			`union { unsigned int i[2]; double d; } u;`
			`asm volatile ("mffs %0" : "=f" (u.d));`
			`u.i[1] &= 0xfffe0000; /* Is this correct? */`
			`*fpscr \|= u.i[1];`
			`ctx->regs->nip += 4;`
			`return;`
			`}`
			`if ((insn & 0xfc00ffff) == 0x7c0000f4) /* popcntb */`
			`{`
			`unsigned long *regs = (unsigned long *) ctx->regs;`
			`unsigned dest = (insn >> 16) & 0x1f;`
			`unsigned src = (insn >> 21) & 0x1f;`
			`unsigned long res = 0;`
			`int i;`

			`regs[dest] = popcntb (regs[src]);`
			`ctx->regs->nip += 4;`
			`return;`
			`}`

			`struct sigaction sa;`
			`sa.sa_handler = SIG_DFL;`
			`sigemptyset (&sa.sa_mask);`
			`sa.sa_flags = 0;`
			`sigaction (signal, &sa, NULL);`
			`raise (signal);`
			`}`

			`static void`
			`__attribute__ ((constructor))`
			`install_handler (void)`
			`{`
			`struct sigaction sa;`
			`sa.sa_handler = (void *) catch_sigill;`
			`sigemptyset (&sa.sa_mask);`
			`sa.sa_flags = SA_RESTART;`
			`sigaction (SIGILL, &sa, NULL);`
			`}`