shithub: mc

Download patch

ref: 31356a321f79afc2dd2cc5a6b7c9c72f77cf3394
parent: c79e884fc2aedd7695d73b1f0e5fe8059cb451d3
author: S. Gilles <[email protected]>
date: Thu Mar 22 06:27:26 EDT 2018

Do not use packed SIMD instructions for only one argument

--- a/lib/math/fpmath-trunc-impl+posixy-x64-sse4.s
+++ b/lib/math/fpmath-trunc-impl+posixy-x64-sse4.s
@@ -2,7 +2,7 @@
 .globl math$_trunc32
 math$trunc32:
 math$_trunc32:
-	roundps $0x03, %xmm0, %xmm0
+	roundss $0x03, %xmm0, %xmm0
 	ret
 
 .globl math$floor32
@@ -9,7 +9,7 @@
 .globl math$_floor32
 math$floor32:
 math$_floor32:
-	roundps $0x01, %xmm0, %xmm0
+	roundss $0x01, %xmm0, %xmm0
 	ret
 
 .globl math$ceil32
@@ -16,7 +16,7 @@
 .globl math$_ceil32
 math$ceil32:
 math$_ceil32:
-	roundps $0x02, %xmm0, %xmm0
+	roundss $0x02, %xmm0, %xmm0
 	ret
 
 .globl math$trunc64
@@ -23,7 +23,7 @@
 .globl math$_trunc64
 math$trunc64:
 math$_trunc64:
-	roundpd $0x03, %xmm0, %xmm0
+	roundsd $0x03, %xmm0, %xmm0
 	ret
 
 .globl math$floor64
@@ -30,7 +30,7 @@
 .globl math$_floor64
 math$floor64:
 math$_floor64:
-	roundpd $0x01, %xmm0, %xmm0
+	roundsd $0x01, %xmm0, %xmm0
 	ret
 
 .globl math$ceil64
@@ -37,5 +37,5 @@
 .globl math$_ceil64
 math$ceil64:
 math$_ceil64:
-	roundpd $0x02, %xmm0, %xmm0
+	roundsd $0x02, %xmm0, %xmm0
 	ret