Than Ngo 13262e
From: Michel Normand <normand@linux.vnet.ibm.com>
Than Ngo 13262e
Subject: atlas.3.10.2 ppc64le do not use files with lvx
Than Ngo 13262e
Date: Tue, 12 Aug 2014 16:07:06 +0200
Than Ngo 13262e
Than Ngo 13262e
ppc64le do not use files with lvx
Than Ngo 13262e
This is a temporary patch, needed until the related files
Than Ngo 13262e
have been ported to ppc64 little-endian.
Than Ngo 13262e
Than Ngo 13262e
Warning: this patch must be applied only for the ppc64le architecture,
Than Ngo 13262e
and it also requires atlas-new_archdef_for_ppc64le.patch
Than Ngo 13262e
Than Ngo 13262e
Signed-off-by: Michel Normand <normand@linux.vnet.ibm.com>
Than Ngo 13262e
---
Than Ngo 13262e
 tune/blas/gemm/CASES/ccases.flg |    6 +-----
Than Ngo 13262e
 tune/blas/gemm/CASES/dcases.flg |    8 +-------
Than Ngo 13262e
 tune/blas/gemm/CASES/dcases.vnb |    4 ----
Than Ngo 13262e
 tune/blas/gemm/CASES/scases.flg |    9 +--------
Than Ngo 13262e
 tune/blas/gemm/CASES/scases.vnb |    3 ---
Than Ngo 13262e
 tune/blas/gemm/CASES/zcases.flg |    8 +-------
Than Ngo 13262e
 6 files changed, 4 insertions(+), 34 deletions(-)
Than Ngo 13262e
Than Ngo 13262e
Index: ATLAS/tune/blas/gemm/CASES/ccases.flg
Than Ngo 13262e
===================================================================
Than Ngo 13262e
--- ATLAS.orig/tune/blas/gemm/CASES/ccases.flg
Than Ngo 13262e
+++ ATLAS/tune/blas/gemm/CASES/ccases.flg
Than Ngo 13262e
@@ -1,5 +1,5 @@
Than Ngo 13262e
 <ID> <flag> <mb> <nb> <kb> <muladd> <lat> <mu> <nu> <ku> <rout> "<Contributer>"
Than Ngo 13262e
-24
Than Ngo 13262e
+22
Than Ngo 13262e
 304 192 4 3 8 0 4 4 3 8 ATL_mm4x3x8p.c     "R. Clint Whaley" \
Than Ngo 13262e
 gcc
Than Ngo 13262e
 -mcpu=ultrasparc -mtune=ultrasparc -fomit-frame-pointer -O
Than Ngo 13262e
@@ -48,13 +48,9 @@ gcc
Than Ngo 13262e
 328 480 8 8 2 1 1 8 8 2 ATL_mm8x8x2.c  "R. Clint Whaley" \
Than Ngo 13262e
 gcc
Than Ngo 13262e
 -fomit-frame-pointer -O2 -fno-tree-loop-optimize
Than Ngo 13262e
-329 192 4 4 4 1 16 4 4 4 ATL_cmm4x4x128_av.c "R. Clint Whaley" \
Than Ngo 13262e
-gcc
Than Ngo 13262e
--x assembler-with-cpp
Than Ngo 13262e
 331 192 4 4 1 1 1 4 4 1 ATL_smm4x4xURx_mips.c  "R. Clint Whaley" \
Than Ngo 13262e
 gcc
Than Ngo 13262e
 -x assembler-with-cpp -mips4
Than Ngo 13262e
-332 192 8 2 4 1 0 8 2 4 ATL_smm8x2x4_av.c  "IBM"
Than Ngo 13262e
 333 448 4 4 2 1 1 4 4 2 ATL_smm4x4x2pf_arm.c "R. Clint Whaley" \
Than Ngo 13262e
 gcc
Than Ngo 13262e
 -x assembler-with-cpp -mfpu=vfpv3
Than Ngo 13262e
Index: ATLAS/tune/blas/gemm/CASES/scases.flg
Than Ngo 13262e
===================================================================
Than Ngo 13262e
--- ATLAS.orig/tune/blas/gemm/CASES/scases.flg
Than Ngo 13262e
+++ ATLAS/tune/blas/gemm/CASES/scases.flg
Than Ngo 13262e
@@ -1,5 +1,5 @@
Than Ngo 13262e
 <ID> <flag> <mb> <nb> <kb> <muladd> <lat> <mu> <nu> <ku> <rout> "<Contributer>"
Than Ngo 13262e
-25
Than Ngo 13262e
+22
Than Ngo 13262e
 304 192 4 3 8 0 4 4 3 8 ATL_mm4x3x8p.c     "R. Clint Whaley" \
Than Ngo 13262e
 gcc
Than Ngo 13262e
 -mcpu=ultrasparc -mtune=ultrasparc -fomit-frame-pointer -O
Than Ngo 13262e
@@ -48,16 +48,9 @@ gcc
Than Ngo 13262e
 328 480 8 8 2 1 1 8 8 2 ATL_mm8x8x2.c  "R. Clint Whaley" \
Than Ngo 13262e
 gcc
Than Ngo 13262e
 -fomit-frame-pointer -O2 -fno-tree-loop-optimize
Than Ngo 13262e
-329 192 4 4 4 1 16 4 4 4 ATL_smm4x4x128_av.c "R. Clint Whaley" \
Than Ngo 13262e
-gcc
Than Ngo 13262e
--x assembler-with-cpp
Than Ngo 13262e
-330 200 92 92 92 1 16 92 92 92 ATL_smm4x4x128_av.c "R. Clint Whaley" \
Than Ngo 13262e
-gcc
Than Ngo 13262e
--x assembler-with-cpp
Than Ngo 13262e
 331 192 4 4 1 1 1 4 4 1 ATL_smm4x4xURx_mips.c  "R. Clint Whaley" \
Than Ngo 13262e
 gcc
Than Ngo 13262e
 -x assembler-with-cpp -mips4
Than Ngo 13262e
-332 192 8 2 4 1 0 8 2 4 ATL_smm8x2x4_av.c  "IBM"
Than Ngo 13262e
 333 448 4 4 2 1 1 4 4 2 ATL_smm4x4x2pf_arm.c "R. Clint Whaley" \
Than Ngo 13262e
 gcc
Than Ngo 13262e
 -x assembler-with-cpp -mfpu=vfpv3
Than Ngo 13262e
Index: ATLAS/tune/blas/gemm/CASES/scases.vnb
Than Ngo 13262e
===================================================================
Than Ngo 13262e
--- ATLAS.orig/tune/blas/gemm/CASES/scases.vnb
Than Ngo 13262e
+++ ATLAS/tune/blas/gemm/CASES/scases.vnb
Than Ngo 13262e
@@ -31,9 +31,6 @@
Than Ngo 13262e
 # Defaults: TA='t', TB='n', SSE=0, X87=0, LDBOT=1, RTKU=0, AOUTER=0,
Than Ngo 13262e
 #           KBMAX=KU, KBMIN=KU, BETAN1=0, RTMN=1
Than Ngo 13262e
 #
Than Ngo 13262e
-ID=1  ROUT='ATL_smm4x4x128_av.c' AUTH='R. Clint Whaley' MU=4 NU=4 KU=4 \
Than Ngo 13262e
-      LDKB=1 LDBOT=1 KBMIN=4 KBMAX=128 ASM=GAS_PPC \
Than Ngo 13262e
-      COMP='gcc' FLAGS='-x assembler-with-cpp'
Than Ngo 13262e
 ID=2  ROUT='ATL_smm4x4x16_av.c' AUTH='R. Clint Whaley' MU=4 NU=4 KU=16 \
Than Ngo 13262e
       LDKB=1 LDBOT=0 KBMIN=16 KBMAX=2048 ASM=GAS_SPARC \
Than Ngo 13262e
       COMP='gcc' FLAGS='-x assembler-with-cpp'
Than Ngo 13262e
Index: ATLAS/tune/blas/gemm/CASES/dcases.flg
Than Ngo 13262e
===================================================================
Than Ngo 13262e
--- ATLAS.orig/tune/blas/gemm/CASES/dcases.flg
Than Ngo 13262e
+++ ATLAS/tune/blas/gemm/CASES/dcases.flg
Than Ngo 13262e
@@ -1,5 +1,5 @@
Than Ngo 13262e
 <ID> <flag> <mb> <nb> <kb> <muladd> <lat> <mu> <nu> <ku> <rout> "<Contributer>"
Than Ngo 13262e
-32
Than Ngo 13262e
+30
Than Ngo 13262e
 306 192 4 3 8 0 4 4 3 8 ATL_mm4x3x8p.c     "R. Clint Whaley" \
Than Ngo 13262e
 gcc
Than Ngo 13262e
 -mcpu=ultrasparc -mtune=ultrasparc -fomit-frame-pointer -O -fno-schedule-insns -fno-schedule-insns2
Than Ngo 13262e
@@ -79,12 +79,6 @@ gcc
Than Ngo 13262e
 336 192 4 4 1 1 1 4 4 1 ATL_dmm4x4xURx_mips.c  "R. Clint Whaley" \
Than Ngo 13262e
 gcc
Than Ngo 13262e
 -x assembler-with-cpp -mips4
Than Ngo 13262e
-337 192 4 4 1 1 16 4 4 1 ATL_dmm4x4x80_ppc.c "Whaley & Castaldo" \
Than Ngo 13262e
-gcc
Than Ngo 13262e
--x assembler-with-cpp
Than Ngo 13262e
-338 192 8 4 2 1 0 8 4 2  ATL_dmm8x4x2_vsx.c  "IBM" \
Than Ngo 13262e
-gcc
Than Ngo 13262e
--O3 -mvsx
Than Ngo 13262e
 339 448 4 4 2 1 1 4 4 2 ATL_dmm4x4x2pf_arm.c "R. Clint Whaley" \
Than Ngo 13262e
 gcc
Than Ngo 13262e
 -x assembler-with-cpp -mfpu=vfpv3
Than Ngo 13262e
Index: ATLAS/tune/blas/gemm/CASES/dcases.vnb
Than Ngo 13262e
===================================================================
Than Ngo 13262e
--- ATLAS.orig/tune/blas/gemm/CASES/dcases.vnb
Than Ngo 13262e
+++ ATLAS/tune/blas/gemm/CASES/dcases.vnb
Than Ngo 13262e
@@ -53,10 +53,6 @@ ID=6  ROUT='ATL_dmm4x1x90_x87.c' AUTH='R
Than Ngo 13262e
 ID=7  ROUT='ATL_dmm8x1x120_sse2.c' AUTH='R. Clint Whaley' \
Than Ngo 13262e
       MU=8 NU=1 KU=1 KBMAX=512 ASM=GAS_x8664 BETAN1=1 \
Than Ngo 13262e
       COMP='gcc' FLAGS='-m64 -x assembler-with-cpp'
Than Ngo 13262e
-ID=70 ROUT='ATL_dmm4x4x80_ppc.c' AUTH='R. Clint Whaley' TA='T', TB='N' \
Than Ngo 13262e
-      MU=4 NU=4 KU=1 KBMIN=1 KBMAX=80 ASM=GAS_PPC BETAN1=0 LDBOT=0 \
Than Ngo 13262e
-      LDAB=0 LDISKB=1 RTN=1 RTM=1 RTK=0 \
Than Ngo 13262e
-      COMP='gcc' FLAGS='-x assembler-with-cpp'
Than Ngo 13262e
 ID=80 ROUT='ATL_dmm4x4x16r8_US.c' AUTH='R. Clint Whaley' TA='T', TB='N' \
Than Ngo 13262e
       MU=4 NU=4 KU=24 KBMIN=24 KBMAX=512 ASM=GAS_SPARC BETAN1=0 \
Than Ngo 13262e
       LDAB=0 RTK=1 RTN=1 RTM=1 LDBOT=0 LDISKB=1 LDAB=1 \
Than Ngo 13262e
Index: ATLAS/tune/blas/gemm/CASES/zcases.flg
Than Ngo 13262e
===================================================================
Than Ngo 13262e
--- ATLAS.orig/tune/blas/gemm/CASES/zcases.flg
Than Ngo 13262e
+++ ATLAS/tune/blas/gemm/CASES/zcases.flg
Than Ngo 13262e
@@ -1,5 +1,5 @@
Than Ngo 13262e
 <ID> <flag> <mb> <nb> <kb> <muladd> <lat> <mu> <nu> <ku> <rout> "<Contributer>"
Than Ngo 13262e
-31
Than Ngo 13262e
+29
Than Ngo 13262e
 306 192 4 3 8 0 4 4 3 8 ATL_mm4x3x8p.c     "R. Clint Whaley" \
Than Ngo 13262e
 gcc
Than Ngo 13262e
 -mcpu=ultrasparc -mtune=ultrasparc -fomit-frame-pointer -O -fno-schedule-insns -fno-schedule-insns2
Than Ngo 13262e
@@ -76,12 +76,6 @@ gcc
Than Ngo 13262e
 336 192 4 4 1 1 1 4 4 1 ATL_dmm4x4xURx_mips.c  "R. Clint Whaley" \
Than Ngo 13262e
 gcc
Than Ngo 13262e
 -x assembler-with-cpp -mips4
Than Ngo 13262e
-337 192 4 4 1 1 16 4 4 1 ATL_dmm4x4x80_ppc.c "Whaley & Castaldo" \
Than Ngo 13262e
-gcc
Than Ngo 13262e
--x assembler-with-cpp
Than Ngo 13262e
-338 192 8 4 2 1 0 8 4 2  ATL_dmm8x4x2_vsx.c  "IBM" \
Than Ngo 13262e
-gcc
Than Ngo 13262e
--O3 -mvsx
Than Ngo 13262e
 339 448 4 4 2 1 1 4 4 2 ATL_dmm4x4x2pf_arm.c "R. Clint Whaley" \
Than Ngo 13262e
 gcc
Than Ngo 13262e
 -x assembler-with-cpp -mfpu=vfpv3