shithub: dav1d

Download patch

ref: 4a2ea99d3dc6b6bbb43e4680392584dcf4c8882f
parent: 79e4a5f7c126b7b655f3bb0c4bd4a537705e37b3
author: Martin Storsjö <[email protected]>
date: Thu Jun 20 08:17:51 EDT 2019

arm64: Consistently name macro arguments tX for temporaries in transposes

--- a/src/arm/64/util.S
+++ b/src/arm/64/util.S
@@ -59,9 +59,9 @@
 #endif
 .endm
 
-.macro transpose_8x8b r0, r1, r2, r3, r4, r5, r6, r7, r8, r9
-        trn1            \r8\().8b,  \r0\().8b,  \r1\().8b
-        trn2            \r9\().8b,  \r0\().8b,  \r1\().8b
+.macro transpose_8x8b r0, r1, r2, r3, r4, r5, r6, r7, t8, t9
+        trn1            \t8\().8b,  \r0\().8b,  \r1\().8b
+        trn2            \t9\().8b,  \r0\().8b,  \r1\().8b
         trn1            \r1\().8b,  \r2\().8b,  \r3\().8b
         trn2            \r3\().8b,  \r2\().8b,  \r3\().8b
         trn1            \r0\().8b,  \r4\().8b,  \r5\().8b
@@ -73,24 +73,24 @@
         trn2            \r2\().4h,  \r0\().4h,  \r2\().4h
         trn1            \r6\().4h,  \r5\().4h,  \r7\().4h
         trn2            \r7\().4h,  \r5\().4h,  \r7\().4h
-        trn1            \r5\().4h,  \r9\().4h,  \r3\().4h
-        trn2            \r9\().4h,  \r9\().4h,  \r3\().4h
-        trn1            \r3\().4h,  \r8\().4h,  \r1\().4h
-        trn2            \r8\().4h,  \r8\().4h,  \r1\().4h
+        trn1            \r5\().4h,  \t9\().4h,  \r3\().4h
+        trn2            \t9\().4h,  \t9\().4h,  \r3\().4h
+        trn1            \r3\().4h,  \t8\().4h,  \r1\().4h
+        trn2            \t8\().4h,  \t8\().4h,  \r1\().4h
 
         trn1            \r0\().2s,  \r3\().2s,  \r4\().2s
         trn2            \r4\().2s,  \r3\().2s,  \r4\().2s
         trn1            \r1\().2s,  \r5\().2s,  \r6\().2s
         trn2            \r5\().2s,  \r5\().2s,  \r6\().2s
-        trn2            \r6\().2s,  \r8\().2s,  \r2\().2s
-        trn1            \r2\().2s,  \r8\().2s,  \r2\().2s
-        trn1            \r3\().2s,  \r9\().2s,  \r7\().2s
-        trn2            \r7\().2s,  \r9\().2s,  \r7\().2s
+        trn2            \r6\().2s,  \t8\().2s,  \r2\().2s
+        trn1            \r2\().2s,  \t8\().2s,  \r2\().2s
+        trn1            \r3\().2s,  \t9\().2s,  \r7\().2s
+        trn2            \r7\().2s,  \t9\().2s,  \r7\().2s
 .endm
 
-.macro transpose_8x16b r0, r1, r2, r3, r4, r5, r6, r7, r8, r9
-        trn1            \r8\().16b, \r0\().16b, \r1\().16b
-        trn2            \r9\().16b, \r0\().16b, \r1\().16b
+.macro transpose_8x16b r0, r1, r2, r3, r4, r5, r6, r7, t8, t9
+        trn1            \t8\().16b, \r0\().16b, \r1\().16b
+        trn2            \t9\().16b, \r0\().16b, \r1\().16b
         trn1            \r1\().16b, \r2\().16b, \r3\().16b
         trn2            \r3\().16b, \r2\().16b, \r3\().16b
         trn1            \r0\().16b, \r4\().16b, \r5\().16b
@@ -102,19 +102,19 @@
         trn2            \r2\().8h,  \r0\().8h,  \r2\().8h
         trn1            \r6\().8h,  \r5\().8h,  \r7\().8h
         trn2            \r7\().8h,  \r5\().8h,  \r7\().8h
-        trn1            \r5\().8h,  \r9\().8h,  \r3\().8h
-        trn2            \r9\().8h,  \r9\().8h,  \r3\().8h
-        trn1            \r3\().8h,  \r8\().8h,  \r1\().8h
-        trn2            \r8\().8h,  \r8\().8h,  \r1\().8h
+        trn1            \r5\().8h,  \t9\().8h,  \r3\().8h
+        trn2            \t9\().8h,  \t9\().8h,  \r3\().8h
+        trn1            \r3\().8h,  \t8\().8h,  \r1\().8h
+        trn2            \t8\().8h,  \t8\().8h,  \r1\().8h
 
         trn1            \r0\().4s,  \r3\().4s,  \r4\().4s
         trn2            \r4\().4s,  \r3\().4s,  \r4\().4s
         trn1            \r1\().4s,  \r5\().4s,  \r6\().4s
         trn2            \r5\().4s,  \r5\().4s,  \r6\().4s
-        trn2            \r6\().4s,  \r8\().4s,  \r2\().4s
-        trn1            \r2\().4s,  \r8\().4s,  \r2\().4s
-        trn1            \r3\().4s,  \r9\().4s,  \r7\().4s
-        trn2            \r7\().4s,  \r9\().4s,  \r7\().4s
+        trn2            \r6\().4s,  \t8\().4s,  \r2\().4s
+        trn1            \r2\().4s,  \t8\().4s,  \r2\().4s
+        trn1            \r3\().4s,  \t9\().4s,  \r7\().4s
+        trn2            \r7\().4s,  \t9\().4s,  \r7\().4s
 .endm
 
 .macro  transpose_4x16b r0, r1, r2, r3, t4, t5, t6, t7