diff --git a/src/arch/helperavx.h b/src/arch/helperavx.h
index 4e4f9960..4d2b9788 100644
--- a/src/arch/helperavx.h
+++ b/src/arch/helperavx.h
@@ -345,9 +345,11 @@ static INLINE vfloat vmin_vf_vf_vf(vfloat x, vfloat y) { return _mm256_min_ps(x,
 #if CONFIG == 1
 static INLINE vfloat vmla_vf_vf_vf_vf(vfloat x, vfloat y, vfloat z) { return vadd_vf_vf_vf(vmul_vf_vf_vf(x, y), z); }
 static INLINE vfloat vmlanp_vf_vf_vf_vf(vfloat x, vfloat y, vfloat z) { return vsub_vf_vf_vf(z, vmul_vf_vf_vf(x, y)); }
+static INLINE vfloat vmlapn_vf_vf_vf_vf(vfloat x, vfloat y, vfloat z) { vfloat xy = vmul_vf_vf_vf(x, y); return vsub_vf_vf_vf(xy, z); } // x*y - z as a separate multiply and subtract
 #else
 static INLINE vfloat vmla_vf_vf_vf_vf(vfloat x, vfloat y, vfloat z) { return _mm256_macc_ps(x, y, z); }
 static INLINE vfloat vmlanp_vf_vf_vf_vf(vfloat x, vfloat y, vfloat z) { return _mm256_nmacc_ps(x, y, z); }
+static INLINE vfloat vmlapn_vf_vf_vf_vf(vfloat x, vfloat y, vfloat z) { return _mm256_msub_ps(x, y, z); } // x*y - z through one multiply-subtract intrinsic (same call as vfmapn below)
 static INLINE vfloat vfma_vf_vf_vf_vf(vfloat x, vfloat y, vfloat z) { return _mm256_macc_ps(x, y, z); }
 static INLINE vfloat vfmapp_vf_vf_vf_vf(vfloat x, vfloat y, vfloat z) { return _mm256_macc_ps(x, y, z); }
 static INLINE vfloat vfmapn_vf_vf_vf_vf(vfloat x, vfloat y, vfloat z) { return _mm256_msub_ps(x, y, z); }
diff --git a/src/arch/helperavx512f.h b/src/arch/helperavx512f.h
index 3577b1df..7778d6b6 100644
--- a/src/arch/helperavx512f.h
+++ b/src/arch/helperavx512f.h
@@ -369,6 +369,7 @@ static INLINE vfloat vmlanp_vf_vf_vf_vf(vfloat x, vfloat y, vfloat z) { return _
 #else
 static INLINE vfloat vmla_vf_vf_vf_vf(vfloat x, vfloat y, vfloat z) { return vadd_vf_vf_vf(vmul_vf_vf_vf(x, y), z); }
 static INLINE vfloat vmlanp_vf_vf_vf_vf(vfloat x, vfloat y, vfloat z) { return vsub_vf_vf_vf(z, vmul_vf_vf_vf(x, y)); }
+static INLINE vfloat vmlapn_vf_vf_vf_vf(vfloat x, vfloat y, vfloat z) { vfloat xy = vmul_vf_vf_vf(x, y); return vsub_vf_vf_vf(xy, z); } // x*y - z as a separate multiply and subtract
 #endif
 
 static INLINE vfloat vfma_vf_vf_vf_vf(vfloat x, vfloat y, vfloat z) { return _mm512_fmadd_ps(x, y, z); }
diff --git a/src/arch/helperpurec_scalar.h b/src/arch/helperpurec_scalar.h
index 948fdaf7..4612396d 100644
--- a/src/arch/helperpurec_scalar.h
+++ b/src/arch/helperpurec_scalar.h
@@ -303,6 +303,7 @@ static INLINE vfloat vmin_vf_vf_vf(vfloat x, vfloat y) { return x < y ? x : y; }
 #ifndef ENABLE_FMA_SP
 static INLINE vfloat vmla_vf_vf_vf_vf  (vfloat x, vfloat y, vfloat z) { return x * y + z; }
 static INLINE vfloat vmlanp_vf_vf_vf_vf(vfloat x, vfloat y, vfloat z) { return - x * y + z; }
+static INLINE vfloat vmlapn_vf_vf_vf_vf(vfloat x, vfloat y, vfloat z) { return x * y - z; } // plain-C x*y - z; the ENABLE_FMA_SP branch uses FMAF(x, y, -z) instead
 #else
 static INLINE vfloat vmla_vf_vf_vf_vf(vfloat x, vfloat y, vfloat z) { return FMAF(x, y, z); }
 static INLINE vfloat vmlapn_vf_vf_vf_vf(vfloat x, vfloat y, vfloat z) { return FMAF(x, y, -z); }
diff --git a/src/arch/helpersse2.h b/src/arch/helpersse2.h
index 95a27c76..2fd78511 100644
--- a/src/arch/helpersse2.h
+++ b/src/arch/helpersse2.h
@@ -308,6 +308,7 @@ static INLINE vfloat vsqrt_vf_vf(vfloat x) { return _mm_sqrt_ps(x); }
 static INLINE vfloat vabs_vf_vf(vfloat f) { return vreinterpret_vf_vm(vandnot_vm_vm_vm(vreinterpret_vm_vf(vcast_vf_f(-0.0f)), vreinterpret_vm_vf(f))); }
 static INLINE vfloat vneg_vf_vf(vfloat d) { return vreinterpret_vf_vm(vxor_vm_vm_vm(vreinterpret_vm_vf(vcast_vf_f(-0.0f)), vreinterpret_vm_vf(d))); }
 static INLINE vfloat vmla_vf_vf_vf_vf(vfloat x, vfloat y, vfloat z) { return vadd_vf_vf_vf(vmul_vf_vf_vf(x, y), z); }
+static INLINE vfloat vmlapn_vf_vf_vf_vf(vfloat x, vfloat y, vfloat z) { vfloat xy = vmul_vf_vf_vf(x, y); return vsub_vf_vf_vf(xy, z); } // x*y - z as a separate multiply and subtract
 static INLINE vfloat vmlanp_vf_vf_vf_vf(vfloat x, vfloat y, vfloat z) { return vsub_vf_vf_vf(z, vmul_vf_vf_vf(x, y)); }
 static INLINE vfloat vmax_vf_vf_vf(vfloat x, vfloat y) { return _mm_max_ps(x, y); }
 static INLINE vfloat vmin_vf_vf_vf(vfloat x, vfloat y) { return _mm_min_ps(x, y); }
diff --git a/src/libm-tester/iut.c b/src/libm-tester/iut.c
index cbb9c3d1..1f9f94c2 100644
--- a/src/libm-tester/iut.c
+++ b/src/libm-tester/iut.c
@@ -569,6 +569,16 @@ int main(int argc, char **argv) {
       sscanf(buf, "cospif_u05 %x", &u);
       u = f2u(xcospif_u05(u2f(u)));
       printf("%x\n", u);
+    } else if (startsWith(buf, "fastsinf_u100000 ")) {
+      uint32_t u;
+      sscanf(buf, "fastsinf_u100000 %x", &u);
+      u = f2u(xfastsinf_u100000(u2f(u)));
+      printf("%x\n", u);
+    } else if (startsWith(buf, "fastcosf_u100000 ")) {
+      uint32_t u;
+      sscanf(buf, "fastcosf_u100000 %x", &u);
+      u = f2u(xfastcosf_u100000(u2f(u)));
+      printf("%x\n", u);
     } else if (startsWith(buf, "tanf_u1 ")) {
       uint32_t u;
       sscanf(buf, "tanf_u1 %x", &u);
diff --git a/src/libm-tester/iutsimd.c b/src/libm-tester/iutsimd.c
index 41a7cc90..a1f73e1a 100644
--- a/src/libm-tester/iutsimd.c
+++ b/src/libm-tester/iutsimd.c
@@ -570,6 +570,11 @@ int do_test(int argc, char **argv) {
     func_f_f("atanf_u1", xatanf_u1);
     func_f_f("logf_u1", xlogf_u1);
 
+    func_f_f("fastsinf_u100000", xfastsinf_u100000);
+    func_f_f("fastcosf_u100000", xfastcosf_u100000);
+    func_f_f("fastsinf_u35", xfastsinf_u35);
+    func_f_f("fastcosf_u35", xfastcosf_u35);
+
     func_f_f("exp2f", xexp2f);
     func_f_f("exp10f", xexp10f);
     func_f_f("expm1f", xexpm1f);
diff --git a/src/libm-tester/tester.c b/src/libm-tester/tester.c
index dcc2b170..821fd955 100644
--- a/src/libm-tester/tester.c
+++ b/src/libm-tester/tester.c
@@ -289,6 +289,11 @@ float child_cbrtf_u1(float x) { child_f_f("cbrtf_u1", x); }
 float child_atan2f_u1(float y, float x) { child_f_f_f("atan2f_u1", y, x); }
 Sleef_float2 child_sincosf_u1(float x) { child_f2_f("sincosf_u1", x); }
 
+float child_fastsinf_u100000(float x) { child_f_f("fastsinf_u100000", x); } // passes the command name and x to child_f_f (defined outside this hunk; presumably it supplies the return value)
+float child_fastcosf_u100000(float x) { child_f_f("fastcosf_u100000", x); } // same pattern, command "fastcosf_u100000"
+float child_fastsinf_u35(float x) { child_f_f("fastsinf_u35", x); } // same pattern, command "fastsinf_u35"
+float child_fastcosf_u35(float x) { child_f_f("fastcosf_u35", x); } // same pattern, command "fastcosf_u35"
+
 float child_powf(float x, float y) { child_f_f_f("powf", x, y); }
 float child_sqrtf(float x) { child_f_f("sqrtf", x); }
 float child_sqrtf_u05(float x) { child_f_f("sqrtf_u05", x); }
@@ -4122,6 +4127,19 @@ void do_test() {
       break;								\
     }									\
   } while(0)
+
+#define checkAccuracy2_f(mpfrFunc, childFunc, argx, bound, abound) do {	\
+    mpfr_set_d(frx, (float)flushToZero(argx), GMP_RNDN);		\
+    mpfrFunc(frc, frx, GMP_RNDN);					\
+    double t = childFunc((float)flushToZero(argx)), c = mpfr_get_d(frc, GMP_RNDN); /* child queried once */ \
+    double ulp = countULPsp(t, frc), ae = fabs(c - t);			\
+    if (ulp > bound && ae > abound) { /* fail only when BOTH the ULP and the absolute bound are exceeded */ \
+      fprintf(stderr, "\narg = %.20g, test = %.20g, correct = %.20g, ULP = %lf, abserror = %g\n", \
+	      (float)flushToZero(argx), t, c, ulp, ae); /* print exactly the values that were checked */ \
+      success = 0;							\
+      break;								\
+    }									\
+  } while(0)
   
   //
 
@@ -4469,6 +4487,16 @@ void do_test() {
 
     mpfr_set_default_prec(53);
   
+    //
+  
+    fprintf(stderr, "fastsinf_u100000 : ");
+    for(d = -9;d < 9 && success;d += 0.001) checkAccuracy2_f(mpfr_sin, child_fastsinf_u100000, d, 100000, 1e-6);
+    showResult(success);
+
+    fprintf(stderr, "fastcosf_u100000 : ");
+    for(d = -9;d < 9 && success;d += 0.001) checkAccuracy2_f(mpfr_cos, child_fastcosf_u100000, d, 100000, 1e-6);
+    showResult(success);
+
     //
 
     fprintf(stderr, "tanf : ");
diff --git a/src/libm/funcproto.h b/src/libm/funcproto.h
index 3639ba62..de9f5645 100644
--- a/src/libm/funcproto.h
+++ b/src/libm/funcproto.h
@@ -20,6 +20,7 @@ typedef struct {
   2 : "_u05"
   3 : "_u35"
   4 : "_u15"
+  5 : "_u100000"
 
   funcType:
   0 : vdouble func(vdouble);
@@ -34,6 +35,7 @@ typedef struct {
 
   flags:
   1 : No GNUABI
+  2 : No double-precision function (single precision only)
  */
 
 funcSpec funcList[] = {
@@ -66,6 +68,11 @@ funcSpec funcList[] = {
   { "cosh", 35, 3, 0, 0 },
   { "tanh", 35, 3, 0, 0 },
 
+  { "fastsin", 100000, 5, 0, 2 },
+  { "fastcos", 100000, 5, 0, 2 },
+  { "fastsin", 35, 3, 0, 2 },
+  { "fastcos", 35, 3, 0, 2 },
+
   { "asinh", 10, 0, 0, 0 },
   { "acosh", 10, 0, 0, 0 },
   { "atanh", 10, 0, 0, 0 },
diff --git a/src/libm/mkalias.c b/src/libm/mkalias.c
index 97c12b23..4b40aa30 100644
--- a/src/libm/mkalias.c
+++ b/src/libm/mkalias.c
@@ -36,7 +36,7 @@ int main(int argc, char **argv) {
   };
   static char *typeSpecS[] = { "", "f" };
   static char *typeSpec[] = { "d", "f" };
-  static char *ulpSuffixStr[] = { "", "_u1", "_u05", "_u35", "_u15" };
+  static char *ulpSuffixStr[] = { "", "_u1", "_u05", "_u35", "_u15", "_u100000" };
   static char *vparameterStr[7] = { "v", "vv", "", "vv", "v", "vvv", "" };
 
   static char returnType[9][1000];
@@ -84,6 +84,7 @@ int main(int argc, char **argv) {
 
   if (argc == 6) {
     for(int i=0;funcList[i].name != NULL;i++) {
+      if ((funcList[i].flags & 2) != 0) continue;
       if (funcList[i].ulp >= 0) {
 	printf("EXPORT CONST %s Sleef_%s%s%d_u%02d(%s) __attribute__((alias(\"Sleef_%s%s%d_u%02d%s\"))) %s;\n",
 	       returnType[funcList[i].funcType],
diff --git a/src/libm/mkdisp.c b/src/libm/mkdisp.c
index 131d0770..54cc65ca 100644
--- a/src/libm/mkdisp.c
+++ b/src/libm/mkdisp.c
@@ -30,13 +30,15 @@ int main(int argc, char **argv) {
 
     switch(funcList[i].funcType) {
     case 0:
-      printf("DISPATCH_vf_vf(%s, Sleef_%sd%d%s, pnt_%sd%d%s, disp_%sd%d%s",
-	     vdoublename,
-	     funcList[i].name, wdp, ulpSuffix0,
-	     funcList[i].name, wdp, ulpSuffix0,
-	     funcList[i].name, wdp, ulpSuffix0);
-      for(int j=0;j<nisa;j++) printf(", Sleef_%sd%d%s%s", funcList[i].name, wdp, ulpSuffix1, argv[isastart + j]);
-      printf(")\n");
+      if ((funcList[i].flags & 2) == 0) {
+	printf("DISPATCH_vf_vf(%s, Sleef_%sd%d%s, pnt_%sd%d%s, disp_%sd%d%s",
+	       vdoublename,
+	       funcList[i].name, wdp, ulpSuffix0,
+	       funcList[i].name, wdp, ulpSuffix0,
+	       funcList[i].name, wdp, ulpSuffix0);
+	for(int j=0;j<nisa;j++) printf(", Sleef_%sd%d%s%s", funcList[i].name, wdp, ulpSuffix1, argv[isastart + j]);
+	printf(")\n");
+      }
 
       printf("DISPATCH_vf_vf(%s, Sleef_%sf%d%s, pnt_%sf%d%s, disp_%sf%d%s",
 	     vfloatname,
@@ -48,13 +50,15 @@ int main(int argc, char **argv) {
 
       break;
     case 1:
-      printf("DISPATCH_vf_vf_vf(%s, Sleef_%sd%d%s, pnt_%sd%d%s, disp_%sd%d%s",
-	     vdoublename,
-	     funcList[i].name, wdp, ulpSuffix0,
-	     funcList[i].name, wdp, ulpSuffix0,
-	     funcList[i].name, wdp, ulpSuffix0);
-      for(int j=0;j<nisa;j++) printf(", Sleef_%sd%d%s%s", funcList[i].name, wdp, ulpSuffix1, argv[isastart + j]);
-      printf(")\n");
+      if ((funcList[i].flags & 2) == 0) {
+	printf("DISPATCH_vf_vf_vf(%s, Sleef_%sd%d%s, pnt_%sd%d%s, disp_%sd%d%s",
+	       vdoublename,
+	       funcList[i].name, wdp, ulpSuffix0,
+	       funcList[i].name, wdp, ulpSuffix0,
+	       funcList[i].name, wdp, ulpSuffix0);
+	for(int j=0;j<nisa;j++) printf(", Sleef_%sd%d%s%s", funcList[i].name, wdp, ulpSuffix1, argv[isastart + j]);
+	printf(")\n");
+      }
 
       printf("DISPATCH_vf_vf_vf(%s, Sleef_%sf%d%s, pnt_%sf%d%s, disp_%sf%d%s",
 	     vfloatname,
@@ -67,13 +71,15 @@ int main(int argc, char **argv) {
       break;
     case 2:
     case 6:
-      printf("DISPATCH_vf2_vf(%s, Sleef_%s_2, Sleef_%sd%d%s, pnt_%sd%d%s, disp_%sd%d%s",
-	     vdoublename, vdoublename,
-	     funcList[i].name, wdp, ulpSuffix0,
-	     funcList[i].name, wdp, ulpSuffix0,
-	     funcList[i].name, wdp, ulpSuffix0);
-      for(int j=0;j<nisa;j++) printf(", Sleef_%sd%d%s%s", funcList[i].name, wdp, ulpSuffix1, argv[isastart + j]);
-      printf(")\n");
+      if ((funcList[i].flags & 2) == 0) {
+	printf("DISPATCH_vf2_vf(%s, Sleef_%s_2, Sleef_%sd%d%s, pnt_%sd%d%s, disp_%sd%d%s",
+	       vdoublename, vdoublename,
+	       funcList[i].name, wdp, ulpSuffix0,
+	       funcList[i].name, wdp, ulpSuffix0,
+	       funcList[i].name, wdp, ulpSuffix0);
+	for(int j=0;j<nisa;j++) printf(", Sleef_%sd%d%s%s", funcList[i].name, wdp, ulpSuffix1, argv[isastart + j]);
+	printf(")\n");
+      }
 
       printf("DISPATCH_vf2_vf(%s, Sleef_%s_2, Sleef_%sf%d%s, pnt_%sf%d%s, disp_%sf%d%s",
 	     vfloatname, vfloatname, 
@@ -85,31 +91,37 @@ int main(int argc, char **argv) {
 
       break;
     case 3:
-      printf("DISPATCH_vf_vf_vi(%s, %s, Sleef_%sd%d%s, pnt_%sd%d%s, disp_%sd%d%s",
-	     vdoublename, vintname,
-	     funcList[i].name, wdp, ulpSuffix0,
-	     funcList[i].name, wdp, ulpSuffix0,
-	     funcList[i].name, wdp, ulpSuffix0);
-      for(int j=0;j<nisa;j++) printf(", Sleef_%sd%d%s%s", funcList[i].name, wdp, ulpSuffix1, argv[isastart + j]);
-      printf(")\n");
+      if ((funcList[i].flags & 2) == 0) {
+	printf("DISPATCH_vf_vf_vi(%s, %s, Sleef_%sd%d%s, pnt_%sd%d%s, disp_%sd%d%s",
+	       vdoublename, vintname,
+	       funcList[i].name, wdp, ulpSuffix0,
+	       funcList[i].name, wdp, ulpSuffix0,
+	       funcList[i].name, wdp, ulpSuffix0);
+	for(int j=0;j<nisa;j++) printf(", Sleef_%sd%d%s%s", funcList[i].name, wdp, ulpSuffix1, argv[isastart + j]);
+	printf(")\n");
+      }
       break;
     case 4:
-      printf("DISPATCH_vi_vf(%s, %s, Sleef_%sd%d%s, pnt_%sd%d%s, disp_%sd%d%s",
-	     vdoublename, vintname,
-	     funcList[i].name, wdp, ulpSuffix0,
-	     funcList[i].name, wdp, ulpSuffix0,
-	     funcList[i].name, wdp, ulpSuffix0);
-      for(int j=0;j<nisa;j++) printf(", Sleef_%sd%d%s%s", funcList[i].name, wdp, ulpSuffix1, argv[isastart + j]);
-      printf(")\n");
+      if ((funcList[i].flags & 2) == 0) {
+	printf("DISPATCH_vi_vf(%s, %s, Sleef_%sd%d%s, pnt_%sd%d%s, disp_%sd%d%s",
+	       vdoublename, vintname,
+	       funcList[i].name, wdp, ulpSuffix0,
+	       funcList[i].name, wdp, ulpSuffix0,
+	       funcList[i].name, wdp, ulpSuffix0);
+	for(int j=0;j<nisa;j++) printf(", Sleef_%sd%d%s%s", funcList[i].name, wdp, ulpSuffix1, argv[isastart + j]);
+	printf(")\n");
+      }
       break;
     case 5:
-      printf("DISPATCH_vf_vf_vf_vf(%s, Sleef_%sd%d%s, pnt_%sd%d%s, disp_%sd%d%s",
-	     vdoublename,
-	     funcList[i].name, wdp, ulpSuffix0,
-	     funcList[i].name, wdp, ulpSuffix0,
-	     funcList[i].name, wdp, ulpSuffix0);
-      for(int j=0;j<nisa;j++) printf(", Sleef_%sd%d%s%s", funcList[i].name, wdp, ulpSuffix1, argv[isastart + j]);
-      printf(")\n");
+      if ((funcList[i].flags & 2) == 0) {
+	printf("DISPATCH_vf_vf_vf_vf(%s, Sleef_%sd%d%s, pnt_%sd%d%s, disp_%sd%d%s",
+	       vdoublename,
+	       funcList[i].name, wdp, ulpSuffix0,
+	       funcList[i].name, wdp, ulpSuffix0,
+	       funcList[i].name, wdp, ulpSuffix0);
+	for(int j=0;j<nisa;j++) printf(", Sleef_%sd%d%s%s", funcList[i].name, wdp, ulpSuffix1, argv[isastart + j]);
+	printf(")\n");
+      }
 
       printf("DISPATCH_vf_vf_vf_vf(%s, Sleef_%sf%d%s, pnt_%sf%d%s, disp_%sf%d%s",
 	     vfloatname,
@@ -128,12 +140,14 @@ int main(int argc, char **argv) {
       for(int j=0;j<nisa;j++) printf(", Sleef_%sf%d_%s", funcList[i].name, wsp, argv[isastart + j]);
       printf(")\n");
 
-      printf("DISPATCH_i_i(Sleef_%sd%d, pnt_%sd%d, disp_%sd%d",
-	     funcList[i].name, wdp,
-	     funcList[i].name, wdp,
-	     funcList[i].name, wdp);
-      for(int j=0;j<nisa;j++) printf(", Sleef_%sd%d_%s", funcList[i].name, wdp, argv[isastart + j]);
-      printf(")\n");
+      if ((funcList[i].flags & 2) == 0) {
+	printf("DISPATCH_i_i(Sleef_%sd%d, pnt_%sd%d, disp_%sd%d",
+	       funcList[i].name, wdp,
+	       funcList[i].name, wdp,
+	       funcList[i].name, wdp);
+	for(int j=0;j<nisa;j++) printf(", Sleef_%sd%d_%s", funcList[i].name, wdp, argv[isastart + j]);
+	printf(")\n");
+      }
       break;
     case 8:
       printf("DISPATCH_p_i(Sleef_%sf%d, pnt_%sf%d, disp_%sf%d",
@@ -143,12 +157,14 @@ int main(int argc, char **argv) {
       for(int j=0;j<nisa;j++) printf(", Sleef_%sf%d_%s", funcList[i].name, wsp, argv[isastart + j]);
       printf(")\n");
 
-      printf("DISPATCH_p_i(Sleef_%sd%d, pnt_%sd%d, disp_%sd%d",
-	     funcList[i].name, wdp,
-	     funcList[i].name, wdp,
-	     funcList[i].name, wdp);
-      for(int j=0;j<nisa;j++) printf(", Sleef_%sd%d_%s", funcList[i].name, wdp, argv[isastart + j]);
-      printf(")\n");
+      if ((funcList[i].flags & 2) == 0) {
+	printf("DISPATCH_p_i(Sleef_%sd%d, pnt_%sd%d, disp_%sd%d",
+	       funcList[i].name, wdp,
+	       funcList[i].name, wdp,
+	       funcList[i].name, wdp);
+	for(int j=0;j<nisa;j++) printf(", Sleef_%sd%d_%s", funcList[i].name, wdp, argv[isastart + j]);
+	printf(")\n");
+      }
       break;
     }
   }
diff --git a/src/libm/mkmasked_gnuabi.c b/src/libm/mkmasked_gnuabi.c
index 44dde0ff..8b451cbe 100644
--- a/src/libm/mkmasked_gnuabi.c
+++ b/src/libm/mkmasked_gnuabi.c
@@ -44,7 +44,7 @@ int main(int argc, char **argv) {
   static char *vintname[] = { "vint", "vint2" };
   static int sizeoffp[] = { 8, 4 };
   
-  static char *ulpSuffixStr[] = { "", "_u1", "_u05", "_u35", "_u15" };
+  static char *ulpSuffixStr[] = { "", "_u1", "_u05", "_u35", "_u15", "_u100000" };
   static char vparameterStr[7][LEN] = { "v", "vv", "vl8l8", "vv", "v", "vvv", "vl8" };
   static char *typeSpecS[] = { "", "f" };
   static char *typeSpec[] = { "d", "f" };
@@ -57,6 +57,7 @@ int main(int argc, char **argv) {
   
   for(int i=0;funcList[i].name != NULL;i++) {
     if ((funcList[i].flags & 1) != 0) continue;
+    if (fptype == 0 && (funcList[i].flags & 2) != 0) continue;
     if (funcList[i].ulp < 20) {
       snprintf(funcname[0], LEN, "_ZGV%sN%s%s_%s%s",
 	       mangledisa, cvw, vparameterStr[funcList[i].funcType], funcList[i].name, typeSpecS[fptype]);
diff --git a/src/libm/mkrename.c b/src/libm/mkrename.c
index 08fdf012..11acd7cc 100644
--- a/src/libm/mkrename.c
+++ b/src/libm/mkrename.c
@@ -32,7 +32,7 @@ int main(int argc, char **argv) {
     exit(-1);
   }
 
-  static char *ulpSuffixStr[] = { "", "_u1", "_u05", "_u35", "_u15" };
+  static char *ulpSuffixStr[] = { "", "_u1", "_u05", "_u35", "_u15", "_u100000" };
   
   if (argc == 4 || argc == 5) {
     char *atrPrefix = strcmp(argv[1], "-") == 0 ? "" : argv[1];
diff --git a/src/libm/mkrename_gnuabi.c b/src/libm/mkrename_gnuabi.c
index a68c274b..3f55c375 100644
--- a/src/libm/mkrename_gnuabi.c
+++ b/src/libm/mkrename_gnuabi.c
@@ -25,12 +25,13 @@ int main(int argc, char **argv) {
   if (strcmp(isaname, "sve") == 0)
     wdp = wsp = "x";
 
-  static char *ulpSuffixStr[] = { "", "_u1", "_u05", "_u35", "_u15" };
+  static char *ulpSuffixStr[] = { "", "_u1", "_u05", "_u35", "_u15", "_u100000" };
   static char *vparameterStrDP[] = { "v", "vv", "vl8l8", "vv", "v", "vvv", "vl8" };
   static char *vparameterStrSP[] = { "v", "vv", "vl4l4", "vv", "v", "vvv", "vl4" };
   
   for(int i=0;funcList[i].name != NULL;i++) {
     if ((funcList[i].flags & 1) != 0) continue;
+    if ((funcList[i].flags & 2) != 0) continue;
     if (funcList[i].ulp < 0) {
       printf("#define x%s _ZGV%sN%s%s_%s\n", funcList[i].name,
 	     mangledisa, wdp, vparameterStrDP[funcList[i].funcType], funcList[i].name);
diff --git a/src/libm/rename.h b/src/libm/rename.h
index 258275e4..0031ab5d 100644
--- a/src/libm/rename.h
+++ b/src/libm/rename.h
@@ -104,6 +104,12 @@
 #define xlogf_u1 Sleef_logf_u10
 #define xcbrtf_u1 Sleef_cbrtf_u10
 
+// Fast sin/cos variants: listed with the "no double func" flag in funcproto.h
+#define xfastsinf_u100000 Sleef_fastsinf_u100000
+#define xfastcosf_u100000 Sleef_fastcosf_u100000
+#define xfastsinf_u35 Sleef_fastsinf_u35
+#define xfastcosf_u35 Sleef_fastcosf_u35
+
 #define xexpf Sleef_expf_u10
 #define xpowf Sleef_powf_u10
 #define xsinhf Sleef_sinhf_u10
diff --git a/src/libm/sleeflibm_header.h.org b/src/libm/sleeflibm_header.h.org
index 25af696b..65bc396e 100644
--- a/src/libm/sleeflibm_header.h.org
+++ b/src/libm/sleeflibm_header.h.org
@@ -195,6 +195,8 @@ IMPORT CONST float Sleef_cbrtf_u35(float);
 IMPORT CONST float Sleef_sinf_u10(float);
 IMPORT CONST float Sleef_cosf_u10(float);
 IMPORT CONST Sleef_float2 Sleef_sincosf_u10(float);
+IMPORT CONST float Sleef_fastsinf_u100000(float);
+IMPORT CONST float Sleef_fastcosf_u100000(float);
 IMPORT CONST float Sleef_tanf_u10(float);
 IMPORT CONST float Sleef_asinf_u10(float);
 IMPORT CONST float Sleef_acosf_u10(float);
diff --git a/src/libm/sleefsimdsp.c b/src/libm/sleefsimdsp.c
index f4cb68d3..1f063015 100644
--- a/src/libm/sleefsimdsp.c
+++ b/src/libm/sleefsimdsp.c
@@ -894,6 +894,57 @@ EXPORT CONST VECTOR_CC vfloat xcosf_u1(vfloat d) {
 #endif // #if !defined(DETERMINISTIC)
 }
 
+EXPORT CONST VECTOR_CC vfloat xfastsinf_u100000(vfloat d) {
+  // Low-accuracy sine: scale d by 1/pi, subtract the rounded value, evaluate a
+  // short polynomial in the remainder and flip the sign where the rounded value is odd.
+  vint2 q;
+  vfloat u, s;
+
+  d = vmul_vf_vf_vf(d, vcast_vf_f((float)M_1_PI));
+  u = vrint_vf_vf(d);
+  q = vrint_vi2_vf(d);
+  d = vsub_vf_vf_vf(d, u);
+  s = vmul_vf_vf_vf(d, d);
+
+  u = vcast_vf_f(+0.2324385881e+1f);
+  u = vmla_vf_vf_vf_vf(u, s, vcast_vf_f(-0.5145016193e+1f));
+  u = vmla_vf_vf_vf_vf(u, s, vcast_vf_f(+0.3141218185e+1f));
+
+  // XOR the sign bit (-0.0f) into d in lanes where (q & 1) == 1.
+  d = vreinterpret_vf_vm(vxor_vm_vm_vm(vand_vm_vo32_vm(veq_vo_vi2_vi2(vand_vi2_vi2_vi2(q, vcast_vi2_i(1)), vcast_vi2_i(1)), vreinterpret_vm_vf(vcast_vf_f(-0.0f))), vreinterpret_vm_vf(d)));
+  u = vmul_vf_vf_vf(u, d);
+  return u;
+}
+
+EXPORT CONST VECTOR_CC vfloat xfastsinf_u35(vfloat d) {
+  return xsinf(d); // no dedicated vector kernel yet: delegate to xsinf (the scalar xfastsinf_u35 fallback) rather than return a constant 0
+}
+
+EXPORT CONST VECTOR_CC vfloat xfastcosf_u100000(vfloat d) {
+  // Low-accuracy cosine: dq = rint(d/pi - 0.5); the polynomial argument is the
+  // offset d/pi - (dq + 0.5); the sign is chosen from bit 1 of q = 2*dq + 1.
+  vint2 q;
+  vfloat u, s, dq;
+
+  dq = vrint_vf_vf(vmla_vf_vf_vf_vf(d, vcast_vf_f((float)M_1_PI), vcast_vf_f(-0.5f)));
+  d = vmlapn_vf_vf_vf_vf(d, vcast_vf_f((float)M_1_PI), vadd_vf_vf_vf(dq, vcast_vf_f(0.5f)));
+  q = vrint_vi2_vf(vmla_vf_vf_vf_vf(vcast_vf_f(2.0f), dq, vcast_vf_f(1.0f)));
+  s = vmul_vf_vf_vf(d, d);
+
+  u = vcast_vf_f(+0.2324385881e+1f);
+  u = vmla_vf_vf_vf_vf(u, s, vcast_vf_f(-0.5145016193e+1f));
+  u = vmla_vf_vf_vf_vf(u, s, vcast_vf_f(+0.3141218185e+1f));
+
+  // XOR the sign bit (-0.0f) into d in lanes where (q & 2) == 0.
+  d = vreinterpret_vf_vm(vxor_vm_vm_vm(vand_vm_vo32_vm(veq_vo_vi2_vi2(vand_vi2_vi2_vi2(q, vcast_vi2_i(2)), vcast_vi2_i(0)), vreinterpret_vm_vf(vcast_vf_f(-0.0f))), vreinterpret_vm_vf(d)));
+  u = vmul_vf_vf_vf(u, d);
+  return u;
+}
+
+EXPORT CONST VECTOR_CC vfloat xfastcosf_u35(vfloat d) {
+  return xcosf(d); // no dedicated vector kernel yet: delegate to xcosf (the scalar xfastcosf_u35 fallback) rather than return a constant 0
+}
+
 #ifdef ENABLE_GNUABI
 #define TYPE2_FUNCATR static INLINE CONST 
 #define TYPE6_FUNCATR static INLINE CONST 
diff --git a/src/libm/sleefsp.c b/src/libm/sleefsp.c
index e150c5e0..0894df5b 100644
--- a/src/libm/sleefsp.c
+++ b/src/libm/sleefsp.c
@@ -620,6 +620,98 @@ EXPORT CONST float xcosf_u1(float d) {
   return u;
 }
 
+EXPORT CONST float xfastsinf_u100000(float d) {
+  // Low-accuracy sine: scale d by 1/pi, subtract the rounded value q, evaluate a
+  // short polynomial in the remainder (assuming mlaf(a, b, c) is a*b + c) and flip the sign for odd q.
+  int q;
+  float u, s;
+
+  d *= (float)M_1_PI;
+  q = (int)rintfk(d);
+  d -= q;
+  s = d * d;
+
+  if ((q & 1) != 0) d = -d;
+
+  u = +0.2324385881e+1f;
+  u = mlaf(u, s, -0.5145016193e+1f);
+  u = mlaf(u, s, +0.3141218185e+1f);
+
+  u *= d;
+  return u;
+}
+
+EXPORT CONST float xfastsinf_u35(float d) {
+  // Fast sine for |d| <= 9: same reduction as xfastsinf_u100000 with a longer
+  // polynomial. Arguments with |d| > 9 are handed to xsinf.
+  int q;
+  float u, s;
+
+  // Test the range first so large or infinite inputs never reach the float->int conversion.
+  if (UNLIKELY(fabsfk(d) > 9.0f)) return xsinf(d);
+
+  d *= (float)M_1_PI;
+  q = (int)rintfk(d);
+  d -= q;
+  s = d * d;
+
+  if ((q & 1) != 0) d = -d;
+
+  u = +0.7737486064e-1f;
+  u = mlaf(u, s, -0.5981476903e+0f);
+  u = mlaf(u, s, +0.2550054789e+1f);
+  u = mlaf(u, s, -0.5167709351e+1f);
+  u = mlaf(u, s, +0.3141592741e+1f);
+  u *= d;
+  return u;
+}
+
+EXPORT CONST float xfastcosf_u100000(float d) {
+  // Low-accuracy cosine: dq = rintfk(d/pi - 0.5); the polynomial argument is
+  // d/pi - dq - 0.5; the sign is chosen from bit 1 of q = 2*dq + 1.
+  int q;
+  float u, s, dq;
+
+  dq = rintfk(mlaf(d, (float)M_1_PI, - 0.5f));
+  d = mlaf(d, (float)M_1_PI, -dq - 0.5f);
+  q = (int)mlaf(2, dq, 1);
+  s = d * d;
+
+  if ((q & 2) == 0) d = -d;
+
+  u = +0.2324385881e+1f;
+  u = mlaf(u, s, -0.5145016193e+1f);
+  u = mlaf(u, s, +0.3141218185e+1f);
+
+  u *= d;
+  return u;
+}
+
+EXPORT CONST float xfastcosf_u35(float d) {
+  // Fast cosine for |d| <= 9: same reduction as xfastcosf_u100000 with a longer
+  // polynomial. Arguments with |d| > 9 are handed to xcosf.
+  int q;
+  float u, s, dq;
+
+  // Test the range first so large or infinite inputs never reach the float->int conversion.
+  if (UNLIKELY(fabsfk(d) > 9.0f)) return xcosf(d);
+
+  dq = rintfk(mlaf(d, (float)M_1_PI, - 0.5f));
+  d = mlaf(d, (float)M_1_PI, -dq - 0.5f);
+  q = (int)mlaf(2, dq, 1);
+  s = d * d;
+
+  if ((q & 2) == 0) d = -d;
+
+  u = +0.7737486064e-1f;
+  u = mlaf(u, s, -0.5981476903e+0f);
+  u = mlaf(u, s, +0.2550054789e+1f);
+  u = mlaf(u, s, -0.5167709351e+1f);
+  u = mlaf(u, s, +0.3141592741e+1f);
+  u *= d;
+  return u;
+}
+
 EXPORT CONST Sleef_float2 xsincosf(float d) {
   int q;
   float u, s, t;