SPARCv9 assembler pack: refine CPU detection on Linux, fix for "unaligned
[openssl.git] / crypto / sparcv9cap.c
index 7012f78604b294fd8dcc202b86058d312282e5d8..1d820f4c0ab41356ac0fec4c77f4a9769adb3dba 100644 (file)
@@ -1,6 +1,8 @@
 #include <stdio.h>
 #include <stdlib.h>
 #include <string.h>
+#include <setjmp.h>
+#include <signal.h>
 #include <sys/time.h>
 #include <openssl/bn.h>
 
@@ -9,6 +11,7 @@
 #define SPARCV9_VIS1           (1<<2)
 #define SPARCV9_VIS2           (1<<3)  /* reserved */
 #define SPARCV9_FMADD          (1<<4)  /* reserved for SPARC64 V */
+
 static int OPENSSL_sparcv9cap_P=SPARCV9_TICK_PRIVILEGED;
 
 int bn_mul_mont(BN_ULONG *rp, const BN_ULONG *ap, const BN_ULONG *bp, const BN_ULONG *np,const BN_ULONG *n0, int num)
@@ -16,17 +19,19 @@ int bn_mul_mont(BN_ULONG *rp, const BN_ULONG *ap, const BN_ULONG *bp, const BN_U
        int bn_mul_mont_fpu(BN_ULONG *rp, const BN_ULONG *ap, const BN_ULONG *bp, const BN_ULONG *np,const BN_ULONG *n0, int num);
        int bn_mul_mont_int(BN_ULONG *rp, const BN_ULONG *ap, const BN_ULONG *bp, const BN_ULONG *np,const BN_ULONG *n0, int num);
 
-       if (OPENSSL_sparcv9cap_P&(SPARCV9_PREFER_FPU|SPARCV9_VIS1) ==
+       if ((OPENSSL_sparcv9cap_P&(SPARCV9_PREFER_FPU|SPARCV9_VIS1)) ==
                (SPARCV9_PREFER_FPU|SPARCV9_VIS1))
                return bn_mul_mont_fpu(rp,ap,bp,np,n0,num);
        else
                return bn_mul_mont_int(rp,ap,bp,np,n0,num);
        }
 
+unsigned long  _sparcv9_rdtick(void);
+unsigned long  _sparcv9_rdwrasi(unsigned long);
+void           _sparcv9_vis1_probe(void);
+
 unsigned long OPENSSL_rdtsc(void)
        {
-       unsigned long OPENSSL_rdtick(void);
-
        if (OPENSSL_sparcv9cap_P&SPARCV9_TICK_PRIVILEGED)
 #if defined(__sun) && defined(__SVR4)
                return gethrtime();
@@ -34,13 +39,14 @@ unsigned long OPENSSL_rdtsc(void)
                return 0;
 #endif
        else
-               return OPENSSL_rdtick();
+               return _sparcv9_rdtick();
        }
 
 #if defined(__sun) && defined(__SVR4)
 
 #include <dlfcn.h>
 #include <libdevinfo.h>
+#include <sys/systeminfo.h>
 
 typedef di_node_t (*di_init_t)(const char *,uint_t);
 typedef void      (*di_fini_t)(di_node_t);
@@ -55,21 +61,22 @@ static int walk_nodename(di_node_t node, di_node_name_t di_node_name)
 
        /* This is expected to catch all UltraSPARC flavors prior T1 */
        if (!strcmp (name,"SUNW,UltraSPARC") ||
-           !strncmp(name,"SUNW,UltraSPARC-I",17))
+           !strncmp(name,"SUNW,UltraSPARC-I",17))  /* covers II,III,IV */
                {
                OPENSSL_sparcv9cap_P |= SPARCV9_PREFER_FPU|SPARCV9_VIS1;
 
-               /* %tick is privileged only on UltraSPARC-I/II */
+               /* %tick is privileged on UltraSPARC-I and -II only; IIe and later are not affected */
                if (name[14]!='\0' && name[17]!='\0' && name[18]!='\0')
                        OPENSSL_sparcv9cap_P &= ~SPARCV9_TICK_PRIVILEGED;
 
                return DI_WALK_TERMINATE;
                }
-       /* This is expected to catch remaining UltraSPARC T1 */
+       /* This is expected to catch remaining UltraSPARCs, such as T1 */
        else if (!strncmp(name,"SUNW,UltraSPARC",15))
                {
-               OPENSSL_sparcv9cap_P |= SPARCV9_VIS1;
                OPENSSL_sparcv9cap_P &= ~SPARCV9_TICK_PRIVILEGED;
+
+               return DI_WALK_TERMINATE;
                }
 
        return DI_WALK_CONTINUE;
@@ -78,15 +85,38 @@ static int walk_nodename(di_node_t node, di_node_name_t di_node_name)
 void OPENSSL_cpuid_setup(void)
        {
        void *h;
-       char *e;
+       char *e,si[256];
+       static int trigger=0;
+
+       if (trigger) return;
+       trigger=1;
 
-       if (e=getenv("OPENSSL_sparcv9cap"))
+       if ((e=getenv("OPENSSL_sparcv9cap")))
                {
                OPENSSL_sparcv9cap_P=strtoul(e,NULL,0);
                return;
                }
 
-       if (h = dlopen("libdevinfo.so.1",RTLD_LAZY)) do
+       if (sysinfo(SI_MACHINE,si,sizeof(si))>0)
+               {
+               if (strcmp(si,"sun4v"))
+                       /* FPU is preferred on all CPUs except sun4v ones, i.e. US-T1/2 */
+                       OPENSSL_sparcv9cap_P |= SPARCV9_PREFER_FPU;
+               }
+
+       if (sysinfo(SI_ISALIST,si,sizeof(si))>0)
+               {
+               if (strstr(si,"+vis"))
+                       OPENSSL_sparcv9cap_P |= SPARCV9_VIS1;
+               if (strstr(si,"+vis2"))
+                       {
+                       OPENSSL_sparcv9cap_P |= SPARCV9_VIS2;
+                       OPENSSL_sparcv9cap_P &= ~SPARCV9_TICK_PRIVILEGED;
+                       return;
+                       }
+               }
+
+       if ((h = dlopen("libdevinfo.so.1",RTLD_LAZY))) do
                {
                di_init_t       di_init;
                di_fini_t       di_fini;
@@ -110,24 +140,76 @@ void OPENSSL_cpuid_setup(void)
        if (h) dlclose(h);
        }
 
-#elif defined(__linux)
+#else
+
+static sigjmp_buf common_jmp;
+static void common_handler(int sig) { siglongjmp(common_jmp,sig); }
 
 void OPENSSL_cpuid_setup(void)
        {
        char *e;
+       struct sigaction        common_act,ill_oact,bus_oact;
+       sigset_t                all_masked,oset;
+       unsigned long           oasi;
+       int                     sig;
  
-       if (e=getenv("OPENSSL_sparcv9cap"))
+       if ((e=getenv("OPENSSL_sparcv9cap")))
                {
-               OPENSSL_sparcv9cap_P=strtoul(env,NULL,0);
+               OPENSSL_sparcv9cap_P=strtoul(e,NULL,0);
                return;
                }
 
-       /* Linux apparently supports UltraSPARC-I/II/III only */
+       /* For now we assume that the remaining (non-Solaris) systems support UltraSPARC-I* only */
        OPENSSL_sparcv9cap_P |= SPARCV9_PREFER_FPU|SPARCV9_VIS1;
-       }
 
-#else
+       sigfillset(&all_masked);
+       sigdelset(&all_masked,SIGILL);
+       sigdelset(&all_masked,SIGTRAP);
+#ifdef SIGEMT
+       sigdelset(&all_masked,SIGEMT);
+#endif
+       sigdelset(&all_masked,SIGFPE);
+       sigdelset(&all_masked,SIGBUS);
+       sigdelset(&all_masked,SIGSEGV);
+       sigprocmask(SIG_SETMASK,&all_masked,&oset);
+
+       memset(&common_act,0,sizeof(common_act));
+       common_act.sa_handler = common_handler;
+       common_act.sa_mask    = all_masked;
+
+       sigaction(SIGILL,&common_act,&ill_oact);
+       sigaction(SIGBUS,&common_act,&bus_oact);/* T1 fails 16-bit ldda */
+       oasi = _sparcv9_rdwrasi(0xD2);          /* ASI_FL16_P */
+       if ((sig=sigsetjmp(common_jmp,0)) == 0)
+               {
+               _sparcv9_vis1_probe();
+               OPENSSL_sparcv9cap_P |= SPARCV9_VIS1;
+               }
+       else if (sig == SIGBUS)                 /* T1 fails 16-bit ldda */
+               {
+               OPENSSL_sparcv9cap_P &= ~SPARCV9_PREFER_FPU;
+               }
+       else
+               {
+               OPENSSL_sparcv9cap_P &= ~SPARCV9_VIS1;
+               }
+       _sparcv9_rdwrasi(oasi);
+       sigaction(SIGBUS,&bus_oact,NULL);
+       sigaction(SIGILL,&ill_oact,NULL);
 
-void OPENSSL_cpuid_setup(void) {}
+       sigaction(SIGILL,&common_act,&ill_oact);
+       if (sigsetjmp(common_jmp,0) == 0)
+               {
+               _sparcv9_rdtick();
+               OPENSSL_sparcv9cap_P &= ~SPARCV9_TICK_PRIVILEGED;
+               }
+       else
+               {
+               OPENSSL_sparcv9cap_P |= SPARCV9_TICK_PRIVILEGED;
+               }
+       sigaction(SIGILL,&ill_oact,NULL);
+
+       sigprocmask(SIG_SETMASK,&oset,NULL);
+       }
 
 #endif