[Math-atlas-commits] CVS: AtlasBase/Clint/misc/ARCHDEF/Core264SSE3/kern/gcc cMVNK.sum, 1.7, 1.8 cM
Brought to you by:
rwhaley,
tonyc040457
From: R. C. W. <rw...@us...> - 2010-10-30 01:20:51
|
Update of /cvsroot/math-atlas/AtlasBase/Clint/misc/ARCHDEF/Core264SSE3/kern/gcc In directory sfp-cvsdas-4.v30.ch3.sourceforge.com:/tmp/cvs-serv9219 Modified Files: cMVNK.sum cMVTK.sum cR1K.sum cR2K.sum dMVNK.sum dMVTK.sum dR1K.sum dR2K.sum sMVNK.sum sMVTK.sum sR1K.sum sR2K.sum zMVNK.sum zMVTK.sum zR1K.sum zR2K.sum Log Message: Index: cMVNK.sum =================================================================== RCS file: /cvsroot/math-atlas/AtlasBase/Clint/misc/ARCHDEF/Core264SSE3/kern/gcc/cMVNK.sum,v retrieving revision 1.7 retrieving revision 1.8 diff -C2 -d -r1.7 -r1.8 *** cMVNK.sum 29 Oct 2010 23:33:52 -0000 1.7 --- cMVNK.sum 30 Oct 2010 01:20:39 -0000 1.8 *************** *** 1,48 **** ID=900002 ROUT='cmvn_sse.c' AUTH='R. Clint Whaley' TA='N' KNAME='ATL_cmvnk__900002' \ ! rankR=0 CacheElts=10240 SSE=3 alignA=0 alignY=16 alignX=16 minM=8 minN=1 \ ! NU=1 MU=8 LDAMUL=0 PFTUNABLE=1 ALIGNX2A=0 ADDCFLAGS=0 GEMMBASED=0 AXPYBASED=1 \ ALLALIGNXY=0 LDYTOP=0 FNU=1 X87=0 \ ! MFLOP=-2.598008e+03,-3.138177e+03 ASM=GAS_x8664 \ ! CFLAGS='-x assembler-with-cpp -DPFIA=prefetchnta -DPFIX=prefetcht1 -DPFIY=prefetcht2 -DPFADIST=1024 -DPFXDIST=128 -DPFYDIST=128' \ COMP='gcc' ID=900007 ROUT='cmvn_sse.c' AUTH='R. Clint Whaley' TA='N' KNAME='ATL_cmvnk__900007' \ ! rankR=2 CacheElts=10240 SSE=3 alignA=16 alignY=16 alignX=16 minM=8 minN=6 \ NU=6 MU=8 LDAMUL=16 PFTUNABLE=1 ALIGNX2A=0 ADDCFLAGS=0 GEMMBASED=0 AXPYBASED=1 \ ALLALIGNXY=0 LDYTOP=0 FNU=1 X87=0 \ ! MFLOP=-2.152557e+03,-2.299547e+03,0.000000e+00,-1.396562e+04,-1.418841e+04 \ ! ASM=GAS_x8664 CFLAGS='-x assembler-with-cpp' COMP='gcc' ! ID=2 ROUT='ATL_cgemvN_8x4_sse3.c' AUTH='R. Clint Whaley' TA='N' KNAME='ATL_cmvnk__2' \ ! rankR=1 CacheElts=10240 SSE=3 alignA=8 alignY=0 alignX=16 minM=0 minN=0 \ ! NU=4 MU=8 LDAMUL=16 PFTUNABLE=1 ALIGNX2A=1 ADDCFLAGS=0 GEMMBASED=0 AXPYBASED=1 \ ! ALLALIGNXY=0 LDYTOP=0 FNU=1 X87=0 \ ! MFLOP=-2.317547e+03,-2.472250e+03,0.000000e+00,-1.385181e+04,-1.441761e+04 \ ! CFLAGS='-x assembler-with-cpp' COMP='gcc' ID=900006 ROUT='cmvn_sse.c' AUTH='R. Clint Whaley' TA='N' KNAME='ATL_cmvnk__900006' \ ! rankR=0 CacheElts=10240 SSE=3 alignA=0 alignY=16 alignX=16 minM=8 minN=6 \ NU=6 MU=8 LDAMUL=0 PFTUNABLE=1 ALIGNX2A=0 ADDCFLAGS=0 GEMMBASED=0 AXPYBASED=1 \ ALLALIGNXY=0 LDYTOP=0 FNU=1 X87=0 \ ! MFLOP=0.000000e+00,0.000000e+00,0.000000e+00,-4.623044e+03,-4.681861e+03 \ ASM=GAS_x8664 \ ! CFLAGS='-x assembler-with-cpp -DPFIA=prefetchnta -DPFADIST=128 -DPFXDIST=384 -DPFYDIST=0' \ COMP='gcc' ! ID=2 ROUT='ATL_cgemvN_8x4_sse3.c' AUTH='R. Clint Whaley' TA='N' KNAME='ATL_cmvnk__2' \ ! rankR=1 CacheElts=3440 SSE=3 alignA=8 alignY=0 alignX=16 minM=0 minN=0 \ ! NU=4 MU=8 LDAMUL=16 PFTUNABLE=1 ALIGNX2A=1 ADDCFLAGS=0 GEMMBASED=0 AXPYBASED=1 \ ALLALIGNXY=0 LDYTOP=0 FNU=1 X87=0 \ ! MFLOP=-2.317547e+03,-2.472250e+03,0.000000e+00,0.000000e+00,-1.427433e+04 \ ! CFLAGS='-x assembler-with-cpp -DPFADIST=0' COMP='gcc' ID=900004 ROUT='cmvn_sse.c' AUTH='R. Clint Whaley' TA='N' KNAME='ATL_cmvnk__900004' \ ! rankR=0 CacheElts=3440 SSE=3 alignA=0 alignY=16 alignX=16 minM=8 minN=4 \ ! NU=4 MU=8 LDAMUL=0 PFTUNABLE=1 ALIGNX2A=0 ADDCFLAGS=0 GEMMBASED=0 AXPYBASED=1 \ ALLALIGNXY=0 LDYTOP=0 FNU=1 X87=0 \ ! MFLOP=0.000000e+00,0.000000e+00,0.000000e+00,0.000000e+00,-5.022432e+03 \ ! ASM=GAS_x8664 \ ! CFLAGS='-x assembler-with-cpp -DPFIA=prefetchnta -DPFIX=prefetchnta -DPFADIST=256 -DPFXDIST=896' \ COMP='gcc' ID=900002 ROUT='cmvn_sse.c' AUTH='R. Clint Whaley' TA='N' KNAME='ATL_cmvnk__900002' \ ! rankR=0 CacheElts=3440 SSE=3 alignA=0 alignY=16 alignX=16 minM=8 minN=1 \ ! NU=1 MU=8 LDAMUL=0 PFTUNABLE=1 ALIGNX2A=0 ADDCFLAGS=0 GEMMBASED=0 AXPYBASED=1 \ ALLALIGNXY=0 LDYTOP=0 FNU=1 X87=0 \ ! MFLOP=-2.626235e+03,-3.019014e+03 ASM=GAS_x8664 \ ! CFLAGS='-x assembler-with-cpp -DPFADIST=256 -DPFXDIST=0 -DPFYDIST=192' \ COMP='gcc' --- 1,43 ---- ID=900002 ROUT='cmvn_sse.c' AUTH='R. Clint Whaley' TA='N' KNAME='ATL_cmvnk__900002' \ ! rankR=0 CacheElts=16384 SSE=3 alignA=0 alignY=16 alignX=16 minM=16 minN=2 \ ! NU=2 MU=16 LDAMUL=0 PFTUNABLE=1 ALIGNX2A=0 ADDCFLAGS=0 GEMMBASED=0 AXPYBASED=1 \ ALLALIGNXY=0 LDYTOP=0 FNU=1 X87=0 \ ! MFLOP=-7.476866e+03,-9.433726e+03 ASM=GAS_x8664 \ ! CFLAGS='-x assembler-with-cpp -DPFIA=prefetcht0 -DPFADIST=512 -DPFXDIST=1088 -DPFYDIST=256' \ COMP='gcc' ID=900007 ROUT='cmvn_sse.c' AUTH='R. Clint Whaley' TA='N' KNAME='ATL_cmvnk__900007' \ ! rankR=1 CacheElts=16384 SSE=3 alignA=16 alignY=16 alignX=16 minM=8 minN=6 \ NU=6 MU=8 LDAMUL=16 PFTUNABLE=1 ALIGNX2A=0 ADDCFLAGS=0 GEMMBASED=0 AXPYBASED=1 \ ALLALIGNXY=0 LDYTOP=0 FNU=1 X87=0 \ ! MFLOP=-8.228465e+03,-8.387789e+03,0.000000e+00,-1.836017e+04,-1.871202e+04 \ ! ASM=GAS_x8664 \ ! CFLAGS='-x assembler-with-cpp -DPFIA=prefetcht0 -DPFIX=prefetcht0 -DPFIY=prefetchnta -DPFADIST=0 -DPFYDIST=192' \ ! COMP='gcc' ID=900006 ROUT='cmvn_sse.c' AUTH='R. Clint Whaley' TA='N' KNAME='ATL_cmvnk__900006' \ ! rankR=0 CacheElts=16384 SSE=3 alignA=0 alignY=16 alignX=16 minM=8 minN=6 \ NU=6 MU=8 LDAMUL=0 PFTUNABLE=1 ALIGNX2A=0 ADDCFLAGS=0 GEMMBASED=0 AXPYBASED=1 \ ALLALIGNXY=0 LDYTOP=0 FNU=1 X87=0 \ ! MFLOP=0.000000e+00,0.000000e+00,0.000000e+00,-1.654752e+04,-1.701679e+04 \ ASM=GAS_x8664 \ ! CFLAGS='-x assembler-with-cpp -DPFIY=prefetchnta -DPFADIST=0 -DPFXDIST=256 -DPFYDIST=128' \ COMP='gcc' ! ID=900007 ROUT='cmvn_sse.c' AUTH='R. Clint Whaley' TA='N' KNAME='ATL_cmvnk__900007' \ ! rankR=1 CacheElts=3522 SSE=3 alignA=16 alignY=16 alignX=16 minM=8 minN=6 \ ! NU=6 MU=8 LDAMUL=16 PFTUNABLE=1 ALIGNX2A=0 ADDCFLAGS=0 GEMMBASED=0 AXPYBASED=1 \ ALLALIGNXY=0 LDYTOP=0 FNU=1 X87=0 \ ! MFLOP=-8.228465e+03,-8.387789e+03,0.000000e+00,-1.607123e+04,-1.871202e+04 \ ! ASM=GAS_x8664 CFLAGS='-x assembler-with-cpp' COMP='gcc' ID=900004 ROUT='cmvn_sse.c' AUTH='R. Clint Whaley' TA='N' KNAME='ATL_cmvnk__900004' \ ! rankR=0 CacheElts=3522 SSE=3 alignA=0 alignY=16 alignX=16 minM=32 minN=6 \ ! NU=6 MU=32 LDAMUL=0 PFTUNABLE=1 ALIGNX2A=0 ADDCFLAGS=0 GEMMBASED=0 AXPYBASED=1 \ ALLALIGNXY=0 LDYTOP=0 FNU=1 X87=0 \ ! MFLOP=0.000000e+00,0.000000e+00,0.000000e+00,0.000000e+00,-1.794583e+04 \ ! ASM=GAS_x8664 CFLAGS='-x assembler-with-cpp -DPFIX=prefetcht1 -DPFADIST=0' \ COMP='gcc' ID=900002 ROUT='cmvn_sse.c' AUTH='R. Clint Whaley' TA='N' KNAME='ATL_cmvnk__900002' \ ! rankR=0 CacheElts=3522 SSE=3 alignA=0 alignY=16 alignX=16 minM=16 minN=2 \ ! NU=2 MU=16 LDAMUL=0 PFTUNABLE=1 ALIGNX2A=0 ADDCFLAGS=0 GEMMBASED=0 AXPYBASED=1 \ ALLALIGNXY=0 LDYTOP=0 FNU=1 X87=0 \ ! MFLOP=-7.766099e+03,-8.807003e+03 ASM=GAS_x8664 \ ! CFLAGS='-x assembler-with-cpp -DPFADIST=320 -DPFXDIST=192 -DPFYDIST=128' \ COMP='gcc' Index: cMVTK.sum =================================================================== RCS file: /cvsroot/math-atlas/AtlasBase/Clint/misc/ARCHDEF/Core264SSE3/kern/gcc/cMVTK.sum,v retrieving revision 1.7 retrieving revision 1.8 diff -C2 -d -r1.7 -r1.8 *** cMVTK.sum 29 Oct 2010 23:33:52 -0000 1.7 --- cMVTK.sum 30 Oct 2010 01:20:39 -0000 1.8 *************** *** 1,70 **** ID=900002 ROUT='cmvt_sse.c' AUTH='R. Clint Whaley' TA='T' KNAME='ATL_cmvtk__900002' \ ! rankR=0 CacheElts=14336 SSE=3 alignA=0 alignY=16 alignX=16 minM=8 minN=1 \ ! NU=1 MU=8 LDAMUL=0 PFTUNABLE=1 ALIGNX2A=0 ADDCFLAGS=0 GEMMBASED=0 AXPYBASED=0 \ ALLALIGNXY=0 LDYTOP=0 FNU=1 X87=0 \ ! MFLOP=-2.652535e+03,-3.179747e+03 ASM=GAS_x8664 \ ! CFLAGS='-x assembler-with-cpp -DPFIA=prefetchnta -DPFADIST=1472 -DPFXDIST=128' \ COMP='gcc' ID=900005 ROUT='cmvt_sse.c' AUTH='R. Clint Whaley' TA='T' KNAME='ATL_cmvtk__900005' \ ! rankR=3 CacheElts=14336 SSE=3 alignA=16 alignY=16 alignX=16 minM=8 minN=4 \ ! NU=4 MU=8 LDAMUL=16 PFTUNABLE=1 ALIGNX2A=0 ADDCFLAGS=0 GEMMBASED=0 AXPYBASED=0 \ ! ALLALIGNXY=0 LDYTOP=0 FNU=1 X87=0 \ ! MFLOP=-2.211972e+03,-2.464977e+03,0.000000e+00,-1.712460e+04,-1.784040e+04 \ ASM=GAS_x8664 \ ! CFLAGS='-x assembler-with-cpp -DPFADIST=0 -DPFXDIST=448 -DPFYDIST=128' \ COMP='gcc' - ID=2 ROUT='ATL_cgemvT_8x4_sse3.c' AUTH='R. Clint Whaley' TA='T' KNAME='ATL_cmvtk__2' \ - rankR=2 CacheElts=14336 SSE=3 alignA=8 alignY=16 alignX=0 minM=9 minN=4 \ - NU=4 MU=8 LDAMUL=16 PFTUNABLE=1 ALIGNX2A=1 ADDCFLAGS=0 GEMMBASED=0 AXPYBASED=0 \ - ALLALIGNXY=0 LDYTOP=0 FNU=1 X87=0 \ - MFLOP=-2.309995e+03,-2.576584e+03,0.000000e+00,-1.561544e+04,-1.774476e+04 \ - CFLAGS='-x assembler-with-cpp' COMP='gcc' - ID=900003 ROUT='cmvt_sse.c' AUTH='R. Clint Whaley' TA='T' KNAME='ATL_cmvtk__900003' \ - rankR=1 CacheElts=14336 SSE=3 alignA=16 alignY=16 alignX=16 minM=8 minN=1 \ - NU=1 MU=8 LDAMUL=16 PFTUNABLE=1 ALIGNX2A=0 ADDCFLAGS=0 GEMMBASED=0 AXPYBASED=0 \ - ALLALIGNXY=0 LDYTOP=0 FNU=1 X87=0 \ - MFLOP=-2.727078e+03,-3.142616e+03,0.000000e+00,-1.148059e+04,-1.169355e+04 \ - ASM=GAS_x8664 CFLAGS='-x assembler-with-cpp' COMP='gcc' ID=900004 ROUT='cmvt_sse.c' AUTH='R. Clint Whaley' TA='T' KNAME='ATL_cmvtk__900004' \ ! rankR=0 CacheElts=14336 SSE=3 alignA=0 alignY=16 alignX=16 minM=8 minN=4 \ ! NU=4 MU=8 LDAMUL=0 PFTUNABLE=1 ALIGNX2A=0 ADDCFLAGS=0 GEMMBASED=0 AXPYBASED=0 \ ! ALLALIGNXY=0 LDYTOP=0 FNU=1 X87=0 \ ! MFLOP=0.000000e+00,0.000000e+00,0.000000e+00,-5.148432e+03,-5.237358e+03 \ ! ASM=GAS_x8664 \ ! CFLAGS='-x assembler-with-cpp -DPFIA=prefetchnta -DPFIX=prefetcht2 -DPFIY=prefetchnta -DPFADIST=0 -DPFYDIST=0' \ ! COMP='gcc' ! ID=2 ROUT='ATL_cgemvT_8x4_sse3.c' AUTH='R. Clint Whaley' TA='T' KNAME='ATL_cmvtk__2' \ ! rankR=3 CacheElts=3440 SSE=3 alignA=8 alignY=16 alignX=0 minM=9 minN=4 \ ! NU=4 MU=8 LDAMUL=16 PFTUNABLE=1 ALIGNX2A=1 ADDCFLAGS=0 GEMMBASED=0 AXPYBASED=0 \ ! ALLALIGNXY=0 LDYTOP=0 FNU=1 X87=0 \ ! MFLOP=-2.309995e+03,-2.576584e+03,0.000000e+00,0.000000e+00,-1.774476e+04 \ ! CFLAGS='-x assembler-with-cpp' COMP='gcc' ! ID=900005 ROUT='cmvt_sse.c' AUTH='R. Clint Whaley' TA='T' KNAME='ATL_cmvtk__900005' \ ! rankR=2 CacheElts=3440 SSE=3 alignA=16 alignY=16 alignX=16 minM=8 minN=4 \ ! NU=4 MU=8 LDAMUL=16 PFTUNABLE=1 ALIGNX2A=0 ADDCFLAGS=0 GEMMBASED=0 AXPYBASED=0 \ ALLALIGNXY=0 LDYTOP=0 FNU=1 X87=0 \ ! MFLOP=-2.211972e+03,-2.464977e+03,0.000000e+00,0.000000e+00,-1.726190e+04 \ ASM=GAS_x8664 \ ! CFLAGS='-x assembler-with-cpp -DPFADIST=0 -DPFXDIST=0 -DPFYDIST=256' \ COMP='gcc' - ID=900003 ROUT='cmvt_sse.c' AUTH='R. Clint Whaley' TA='T' KNAME='ATL_cmvtk__900003' \ - rankR=1 CacheElts=3440 SSE=3 alignA=16 alignY=16 alignX=16 minM=8 minN=1 \ - NU=1 MU=8 LDAMUL=16 PFTUNABLE=1 ALIGNX2A=0 ADDCFLAGS=0 GEMMBASED=0 AXPYBASED=0 \ - ALLALIGNXY=0 LDYTOP=0 FNU=1 X87=0 \ - MFLOP=-2.727078e+03,-3.142616e+03,0.000000e+00,0.000000e+00,-1.169355e+04 \ - ASM=GAS_x8664 CFLAGS='-x assembler-with-cpp' COMP='gcc' ID=900004 ROUT='cmvt_sse.c' AUTH='R. Clint Whaley' TA='T' KNAME='ATL_cmvtk__900004' \ ! rankR=0 CacheElts=3440 SSE=3 alignA=0 alignY=16 alignX=16 minM=8 minN=4 \ ! NU=4 MU=8 LDAMUL=0 PFTUNABLE=1 ALIGNX2A=0 ADDCFLAGS=0 GEMMBASED=0 AXPYBASED=0 \ ALLALIGNXY=0 LDYTOP=0 FNU=1 X87=0 \ ! MFLOP=0.000000e+00,0.000000e+00,0.000000e+00,0.000000e+00,-5.297495e+03 \ ASM=GAS_x8664 \ ! CFLAGS='-x assembler-with-cpp -DPFIA=prefetcht1 -DPFIX=prefetcht0 -DPFIY=prefetchnta -DPFADIST=0 -DPFXDIST=192 -DPFYDIST=128' \ COMP='gcc' ID=900002 ROUT='cmvt_sse.c' AUTH='R. Clint Whaley' TA='T' KNAME='ATL_cmvtk__900002' \ ! rankR=0 CacheElts=3440 SSE=3 alignA=0 alignY=16 alignX=16 minM=8 minN=1 \ ! NU=1 MU=8 LDAMUL=0 PFTUNABLE=1 ALIGNX2A=0 ADDCFLAGS=0 GEMMBASED=0 AXPYBASED=0 \ ALLALIGNXY=0 LDYTOP=0 FNU=1 X87=0 \ ! MFLOP=-2.654228e+03,-3.041274e+03 ASM=GAS_x8664 \ ! CFLAGS='-x assembler-with-cpp -DPFADIST=256 -DPFXDIST=128 -DPFYDIST=0' \ COMP='gcc' --- 1,38 ---- ID=900002 ROUT='cmvt_sse.c' AUTH='R. Clint Whaley' TA='T' KNAME='ATL_cmvtk__900002' \ ! rankR=0 CacheElts=16384 SSE=3 alignA=0 alignY=16 alignX=16 minM=8 minN=2 \ ! NU=2 MU=8 LDAMUL=0 PFTUNABLE=1 ALIGNX2A=0 ADDCFLAGS=0 GEMMBASED=0 AXPYBASED=0 \ ALLALIGNXY=0 LDYTOP=0 FNU=1 X87=0 \ ! MFLOP=-7.796398e+03,-9.941270e+03 ASM=GAS_x8664 \ ! CFLAGS='-x assembler-with-cpp -DPFIA=prefetcht0 -DPFIY=prefetcht1 -DPFADIST=576 -DPFXDIST=0 -DPFYDIST=128' \ COMP='gcc' ID=900005 ROUT='cmvt_sse.c' AUTH='R. Clint Whaley' TA='T' KNAME='ATL_cmvtk__900005' \ ! rankR=1 CacheElts=16384 SSE=3 alignA=16 alignY=16 alignX=16 minM=16 \ ! minN=4 NU=4 MU=16 LDAMUL=16 PFTUNABLE=1 ALIGNX2A=0 ADDCFLAGS=0 GEMMBASED=0 \ ! AXPYBASED=0 ALLALIGNXY=0 LDYTOP=0 FNU=1 X87=0 \ ! MFLOP=-8.007692e+03,-8.507624e+03,0.000000e+00,-1.841561e+04,-1.787195e+04 \ ASM=GAS_x8664 \ ! CFLAGS='-x assembler-with-cpp -DPFIA=prefetchnta -DPFIX=prefetcht1 -DPFIY=prefetchnta -DPFADIST=0 -DPFXDIST=128 -DPFYDIST=640' \ COMP='gcc' ID=900004 ROUT='cmvt_sse.c' AUTH='R. Clint Whaley' TA='T' KNAME='ATL_cmvtk__900004' \ ! rankR=0 CacheElts=16384 SSE=3 alignA=0 alignY=16 alignX=16 minM=16 minN=4 \ ! NU=4 MU=16 LDAMUL=0 PFTUNABLE=1 ALIGNX2A=0 ADDCFLAGS=0 GEMMBASED=0 AXPYBASED=0 \ ALLALIGNXY=0 LDYTOP=0 FNU=1 X87=0 \ ! MFLOP=0.000000e+00,0.000000e+00,0.000000e+00,-1.682707e+04,-1.687659e+04 \ ASM=GAS_x8664 \ ! CFLAGS='-x assembler-with-cpp -DPFIX=prefetcht2 -DPFIY=prefetcht1 -DPFADIST=0 -DPFXDIST=0 -DPFYDIST=192' \ COMP='gcc' ID=900004 ROUT='cmvt_sse.c' AUTH='R. Clint Whaley' TA='T' KNAME='ATL_cmvtk__900004' \ ! rankR=0 CacheElts=4096 SSE=3 alignA=0 alignY=16 alignX=16 minM=16 minN=4 \ ! NU=4 MU=16 LDAMUL=0 PFTUNABLE=1 ALIGNX2A=0 ADDCFLAGS=0 GEMMBASED=0 AXPYBASED=0 \ ALLALIGNXY=0 LDYTOP=0 FNU=1 X87=0 \ ! MFLOP=0.000000e+00,0.000000e+00,0.000000e+00,0.000000e+00,-1.753242e+04 \ ASM=GAS_x8664 \ ! CFLAGS='-x assembler-with-cpp -DPFIA=prefetcht0 -DPFIX=prefetcht1 -DPFADIST=0 -DPFXDIST=704 -DPFYDIST=256' \ COMP='gcc' ID=900002 ROUT='cmvt_sse.c' AUTH='R. Clint Whaley' TA='T' KNAME='ATL_cmvtk__900002' \ ! rankR=0 CacheElts=4096 SSE=3 alignA=0 alignY=16 alignX=16 minM=8 minN=2 \ ! NU=2 MU=8 LDAMUL=0 PFTUNABLE=1 ALIGNX2A=0 ADDCFLAGS=0 GEMMBASED=0 AXPYBASED=0 \ ALLALIGNXY=0 LDYTOP=0 FNU=1 X87=0 \ ! MFLOP=-8.095427e+03,-9.372292e+03 ASM=GAS_x8664 \ ! CFLAGS='-x assembler-with-cpp -DPFADIST=384 -DPFXDIST=0 -DPFYDIST=128' \ COMP='gcc' Index: cR1K.sum =================================================================== RCS file: /cvsroot/math-atlas/AtlasBase/Clint/misc/ARCHDEF/Core264SSE3/kern/gcc/cR1K.sum,v retrieving revision 1.9 retrieving revision 1.10 diff -C2 -d -r1.9 -r1.10 *** cR1K.sum 29 Oct 2010 23:33:52 -0000 1.9 --- cR1K.sum 30 Oct 2010 01:20:39 -0000 1.10 *************** *** 1,48 **** ! ID=2 ROUT='ATL_cgerk_2x1p.c' AUTH='R. Clint Whaley' KNAME='ATL_cgerk__2' \ ! rankR=0 CacheElts=16384 SSE=0 alignA=0 alignY=0 alignX=0 minM=0 minN=0 \ ! NU=1 MU=2 LDAMUL=0 PFTUNABLE=0 ALIGNX2A=0 ADDCFLAGS=0 FNU=0 INCYISONE=0 \ ! X87=0 \ ! MFLOP=-2.168394e+03,-2.199754e+03 ! ID=3 ROUT='ATL_cgerk_8x4_sse3.c' AUTH='R. Clint Whaley' KNAME='ATL_cgerk__3' \ ! rankR=2 CacheElts=16384 SSE=3 alignA=8 alignY=8 alignX=0 minM=9 minN=4 \ ! NU=4 MU=8 LDAMUL=16 PFTUNABLE=1 ALIGNX2A=1 ADDCFLAGS=0 FNU=1 INCYISONE=0 \ X87=0 \ ! MFLOP=-1.885814e+03,-2.016748e+03,0.000000e+00,-1.301613e+04,-1.339619e+04 \ ! CFLAGS='-x assembler-with-cpp -DPFIA=prefetcht0 -DPFIX=prefetcht0 -DPFIY=prefetcht0 -DPFADIST=0 -DPFXDIST=192' \ COMP='gcc' ! ID=900003 ROUT='cr1_sse.c' AUTH='R. Clint Whaley' KNAME='ATL_cgerk__900003' \ ! rankR=1 CacheElts=16384 SSE=3 alignA=16 alignY=16 alignX=16 minM=16 \ ! minN=2 NU=2 MU=16 LDAMUL=16 PFTUNABLE=1 ALIGNX2A=0 ADDCFLAGS=0 FNU=1 \ ! INCYISONE=1 X87=0 \ ! MFLOP=-1.941797e+03,-2.245314e+03,0.000000e+00,-9.989941e+03,-1.191511e+04 \ ! ASM=GAS_x8664 CFLAGS='-x assembler-with-cpp' COMP='gcc' ! ID=900001 ROUT='cr1_C.c' AUTH='R. Clint Whaley' KNAME='ATL_cgerk__900001' \ ! rankR=0 CacheElts=16384 SSE=0 alignA=0 alignY=0 alignX=0 minM=4 minN=1 \ ! NU=1 MU=4 LDAMUL=0 PFTUNABLE=1 ALIGNX2A=0 ADDCFLAGS=0 FNU=1 INCYISONE=1 \ ! X87=0 \ ! MFLOP=-1.956773e+03,-2.152571e+03,0.000000e+00,-3.821897e+03,-3.485880e+03 \ ! CFLAGS='-fomit-frame-pointer -mfpmath=sse -msse3 -O2 -m64 -DPFIA=prefetchnta -DPFIX=prefetcht2 -DPFIY=prefetcht2 -DPFADIST=0 -DPFXDIST=128' ! ID=900006 ROUT='cr1_sse.c' AUTH='R. Clint Whaley' KNAME='ATL_cgerk__900006' \ ! rankR=2 CacheElts=3276 SSE=3 alignA=16 alignY=16 alignX=16 minM=48 minN=4 \ ! NU=4 MU=48 LDAMUL=16 PFTUNABLE=1 ALIGNX2A=0 ADDCFLAGS=0 FNU=1 INCYISONE=1 \ ! X87=0 \ ! MFLOP=-1.847503e+03,-2.059639e+03,0.000000e+00,0.000000e+00,-1.223120e+04 \ ! ASM=GAS_x8664 CFLAGS='-x assembler-with-cpp' COMP='gcc' ! ID=3 ROUT='ATL_cgerk_8x4_sse3.c' AUTH='R. Clint Whaley' KNAME='ATL_cgerk__3' \ ! rankR=1 CacheElts=3276 SSE=3 alignA=8 alignY=8 alignX=0 minM=9 minN=4 \ ! NU=4 MU=8 LDAMUL=16 PFTUNABLE=1 ALIGNX2A=1 ADDCFLAGS=0 FNU=1 INCYISONE=0 \ X87=0 \ ! MFLOP=-1.885814e+03,-2.016748e+03,0.000000e+00,0.000000e+00,-1.355002e+04 \ ! CFLAGS='-x assembler-with-cpp -DPFADIST=0 -DPFXDIST=256 -DPFYDIST=192' \ COMP='gcc' ! ID=900004 ROUT='cr1_C.c' AUTH='R. Clint Whaley' KNAME='ATL_cgerk__900004' \ ! rankR=0 CacheElts=3276 SSE=0 alignA=0 alignY=0 alignX=0 minM=2 minN=1 \ ! NU=1 MU=2 LDAMUL=0 PFTUNABLE=1 ALIGNX2A=0 ADDCFLAGS=0 FNU=1 INCYISONE=1 \ X87=0 \ ! MFLOP=0.000000e+00,0.000000e+00,0.000000e+00,0.000000e+00,-3.850238e+03 \ ! CFLAGS='-fomit-frame-pointer -mfpmath=sse -msse3 -O2 -m64 -DPFIA=prefetcht2 -DPFIX=prefetcht1 -DPFADIST=0 -DPFXDIST=0' ! ID=1 ROUT='ATL_cgerk_axpy.c' AUTH='R. Clint Whaley' KNAME='ATL_cgerk__1' \ ! rankR=0 CacheElts=3276 SSE=0 alignA=0 alignY=0 alignX=0 minM=0 minN=0 \ ! NU=1 MU=16 LDAMUL=0 PFTUNABLE=0 ALIGNX2A=0 ADDCFLAGS=0 FNU=0 INCYISONE=0 \ X87=0 \ ! MFLOP=-1.982382e+03 --- 1,30 ---- ! ID=900002 ROUT='cr1_sse.c' AUTH='R. Clint Whaley' KNAME='ATL_cgerk__900002' \ ! rankR=0 CacheElts=16384 SSE=3 alignA=0 alignY=16 alignX=16 minM=40 minN=2 \ ! NU=2 MU=40 LDAMUL=0 PFTUNABLE=1 ALIGNX2A=0 ADDCFLAGS=0 FNU=1 INCYISONE=1 \ X87=0 \ ! MFLOP=-7.111933e+03,-7.139371e+03 ASM=GAS_x8664 \ ! CFLAGS='-x assembler-with-cpp -DPFIA=prefetcht0 -DPFIX=prefetcht0 -DPFIY=prefetchnta -DPFADIST=512 -DPFXDIST=192' \ COMP='gcc' ! ID=900005 ROUT='cr1_sse.c' AUTH='R. Clint Whaley' KNAME='ATL_cgerk__900005' \ ! rankR=0 CacheElts=16384 SSE=3 alignA=0 alignY=16 alignX=16 minM=8 minN=3 \ ! NU=3 MU=8 LDAMUL=0 PFTUNABLE=1 ALIGNX2A=0 ADDCFLAGS=0 FNU=1 INCYISONE=1 \ X87=0 \ ! MFLOP=0.000000e+00,0.000000e+00,0.000000e+00,-1.239298e+04,-1.233288e+04 \ ! ASM=GAS_x8664 \ ! CFLAGS='-x assembler-with-cpp -DPFIA=prefetchnta -DPFIX=prefetcht0 -DPFIY=prefetchnta -DPFADIST=256 -DPFXDIST=128 -DPFYDIST=0' \ COMP='gcc' ! ID=900005 ROUT='cr1_sse.c' AUTH='R. Clint Whaley' KNAME='ATL_cgerk__900005' \ ! rankR=0 CacheElts=4014 SSE=3 alignA=0 alignY=16 alignX=16 minM=8 minN=3 \ ! NU=3 MU=8 LDAMUL=0 PFTUNABLE=1 ALIGNX2A=0 ADDCFLAGS=0 FNU=1 INCYISONE=1 \ X87=0 \ ! MFLOP=0.000000e+00,0.000000e+00,0.000000e+00,0.000000e+00,-1.230014e+04 \ ! ASM=GAS_x8664 \ ! CFLAGS='-x assembler-with-cpp -DPFIA=prefetchnta -DPFADIST=384 -DPFXDIST=448' \ ! COMP='gcc' ! ID=900002 ROUT='cr1_sse.c' AUTH='R. Clint Whaley' KNAME='ATL_cgerk__900002' \ ! rankR=0 CacheElts=4014 SSE=3 alignA=0 alignY=16 alignX=16 minM=40 minN=2 \ ! NU=2 MU=40 LDAMUL=0 PFTUNABLE=1 ALIGNX2A=0 ADDCFLAGS=0 FNU=1 INCYISONE=1 \ X87=0 \ ! MFLOP=-6.079332e+03,-7.102213e+03 ASM=GAS_x8664 \ ! CFLAGS='-x assembler-with-cpp -DPFADIST=384 -DPFXDIST=320 -DPFYDIST=1152' \ ! COMP='gcc' Index: cR2K.sum =================================================================== RCS file: /cvsroot/math-atlas/AtlasBase/Clint/misc/ARCHDEF/Core264SSE3/kern/gcc/cR2K.sum,v retrieving revision 1.6 retrieving revision 1.7 diff -C2 -d -r1.6 -r1.7 *** cR2K.sum 29 Oct 2010 23:33:52 -0000 1.6 --- cR2K.sum 30 Oct 2010 01:20:39 -0000 1.7 *************** *** 1,45 **** ! ID=900007 ROUT='cr2_sse.c' AUTH='R. Clint Whaley' KNAME='ATL_cger2k__900007' \ ! rankR=1 CacheElts=28672 SSE=3 alignA=16 alignY=16 alignX=16 minM=16 \ ! minN=2 NU=2 MU=16 LDAMUL=16 PFTUNABLE=1 ALIGNX2A=0 ADDCFLAGS=0 FNU=1 \ ! INCYISONE=1 X87=0 \ ! MFLOP=0.000000e+00,-4.498280e+03,0.000000e+00,-3.492476e+03 \ ASM=GAS_x8664 \ ! CFLAGS='-x assembler-with-cpp -DPFIA=prefetcht2 -DPFIX=prefetcht0 -DPFIY=prefetchnta -DPFADIST=576 -DPFXDIST=256 -DPFYDIST=128' \ COMP='gcc' ! ID=1 ROUT='ATL_cger2k_1x1_1.c' AUTH='R. Clint Whaley' KNAME='ATL_cger2k__1' \ ! rankR=0 CacheElts=28672 SSE=0 alignA=0 alignY=0 alignX=0 minM=0 minN=0 \ ! NU=1 MU=1 LDAMUL=0 PFTUNABLE=0 ALIGNX2A=0 ADDCFLAGS=0 FNU=0 INCYISONE=0 \ X87=0 \ ! MFLOP=-3.071484e+03,-3.456404e+03 ! ID=900007 ROUT='cr2_sse.c' AUTH='R. Clint Whaley' KNAME='ATL_cger2k__900007' \ ! rankR=1 CacheElts=28672 SSE=3 alignA=16 alignY=16 alignX=16 minM=16 \ ! minN=2 NU=2 MU=16 LDAMUL=16 PFTUNABLE=1 ALIGNX2A=0 ADDCFLAGS=0 FNU=1 \ ! INCYISONE=1 X87=0 \ ! MFLOP=-3.743625e+03,-4.482379e+03,0.000000e+00,-1.203084e+04,-1.260319e+04 \ ! ASM=GAS_x8664 CFLAGS='-x assembler-with-cpp -DPFADIST=0 -DPFXDIST=0' \ COMP='gcc' ! ID=900001 ROUT='cr2_C.c' AUTH='R. Clint Whaley' KNAME='ATL_cger2k__900001' \ ! rankR=0 CacheElts=28672 SSE=0 alignA=0 alignY=0 alignX=0 minM=2 minN=1 \ ! NU=1 MU=2 LDAMUL=0 PFTUNABLE=1 ALIGNX2A=0 ADDCFLAGS=0 FNU=1 INCYISONE=1 \ X87=0 \ ! MFLOP=-2.930797e+03,-3.198091e+03,0.000000e+00,-3.970006e+03,-3.774158e+03 \ ! CFLAGS='-fomit-frame-pointer -mfpmath=sse -msse3 -O2 -m64 -DPFIA=prefetchnta -DPFIX=prefetcht1 -DPFIY=prefetcht2 -DPFADIST=0 -DPFXDIST=0 -DPFYDIST=128' ! ID=900007 ROUT='cr2_sse.c' AUTH='R. Clint Whaley' KNAME='ATL_cger2k__900007' \ ! rankR=1 CacheElts=3768 SSE=3 alignA=16 alignY=16 alignX=16 minM=16 minN=2 \ ! NU=2 MU=16 LDAMUL=16 PFTUNABLE=1 ALIGNX2A=0 ADDCFLAGS=0 FNU=1 INCYISONE=1 \ X87=0 \ ! MFLOP=-3.743625e+03,-4.482379e+03,0.000000e+00,-3.492476e+03,-1.224626e+04 \ ! ASM=GAS_x8664 CFLAGS='-x assembler-with-cpp -DPFADIST=128 -DPFYDIST=128' \ COMP='gcc' ! ID=900001 ROUT='cr2_C.c' AUTH='R. Clint Whaley' KNAME='ATL_cger2k__900001' \ ! rankR=0 CacheElts=3768 SSE=0 alignA=0 alignY=0 alignX=0 minM=2 minN=1 \ ! NU=1 MU=2 LDAMUL=0 PFTUNABLE=1 ALIGNX2A=0 ADDCFLAGS=0 FNU=1 INCYISONE=1 \ X87=0 \ ! MFLOP=-2.930797e+03,-3.198091e+03,0.000000e+00,0.000000e+00,-4.014994e+03 \ ! CFLAGS='-fomit-frame-pointer -mfpmath=sse -msse3 -O2 -m64 -DPFADIST=0 -DPFXDIST=0 -DPFYDIST=256' ! ID=900001 ROUT='cr2_C.c' AUTH='R. Clint Whaley' KNAME='ATL_cger2k__900001' \ ! rankR=0 CacheElts=3768 SSE=0 alignA=0 alignY=0 alignX=0 minM=2 minN=1 \ ! NU=1 MU=2 LDAMUL=0 PFTUNABLE=1 ALIGNX2A=0 ADDCFLAGS=0 FNU=1 INCYISONE=1 \ X87=0 \ ! MFLOP=-3.250529e+03,-3.250333e+03 \ ! CFLAGS='-fomit-frame-pointer -mfpmath=sse -msse3 -O2 -m64 -DPFADIST=0 -DPFXDIST=0 -DPFYDIST=512' --- 1,45 ---- ! ID=900005 ROUT='cr2_sse.c' AUTH='R. Clint Whaley' KNAME='ATL_cger2k__900005' \ ! rankR=1 CacheElts=30720 SSE=3 alignA=16 alignY=16 alignX=16 minM=8 minN=2 \ ! NU=2 MU=8 LDAMUL=16 PFTUNABLE=1 ALIGNX2A=0 ADDCFLAGS=0 FNU=1 INCYISONE=1 \ ! X87=0 \ ! MFLOP=0.000000e+00,-1.359440e+04,0.000000e+00,0.000000e+00,-1.504063e+04 \ ASM=GAS_x8664 \ ! CFLAGS='-x assembler-with-cpp -DPFIA=prefetcht0 -DPFIX=prefetcht1 -DPFIY=prefetcht1 -DPFADIST=512 -DPFYDIST=192' \ COMP='gcc' ! ID=900002 ROUT='cr2_sse.c' AUTH='R. Clint Whaley' KNAME='ATL_cger2k__900002' \ ! rankR=0 CacheElts=30720 SSE=3 alignA=0 alignY=16 alignX=16 minM=16 minN=2 \ ! NU=2 MU=16 LDAMUL=0 PFTUNABLE=1 ALIGNX2A=0 ADDCFLAGS=0 FNU=1 INCYISONE=1 \ X87=0 \ ! MFLOP=-1.035700e+04,-1.288474e+04 ASM=GAS_x8664 \ ! CFLAGS='-x assembler-with-cpp -DPFADIST=320 -DPFXDIST=256 -DPFYDIST=384' \ COMP='gcc' ! ID=900005 ROUT='cr2_sse.c' AUTH='R. Clint Whaley' KNAME='ATL_cger2k__900005' \ ! rankR=1 CacheElts=30720 SSE=3 alignA=16 alignY=16 alignX=16 minM=8 minN=2 \ ! NU=2 MU=8 LDAMUL=16 PFTUNABLE=1 ALIGNX2A=0 ADDCFLAGS=0 FNU=1 INCYISONE=1 \ X87=0 \ ! MFLOP=-1.113886e+04,-1.338699e+04,0.000000e+00,-1.593345e+04,-1.419003e+04 \ ! ASM=GAS_x8664 \ ! CFLAGS='-x assembler-with-cpp -DPFIX=prefetchnta -DPFADIST=192 -DPFXDIST=256' \ ! COMP='gcc' ! ID=900006 ROUT='cr2_sse.c' AUTH='R. Clint Whaley' KNAME='ATL_cger2k__900006' \ ! rankR=0 CacheElts=30720 SSE=3 alignA=0 alignY=16 alignX=16 minM=16 minN=1 \ ! NU=1 MU=16 LDAMUL=0 PFTUNABLE=1 ALIGNX2A=0 ADDCFLAGS=0 FNU=1 INCYISONE=1 \ X87=0 \ ! MFLOP=0.000000e+00,0.000000e+00,0.000000e+00,-1.451876e+04,-1.408775e+04 \ ! ASM=GAS_x8664 \ ! CFLAGS='-x assembler-with-cpp -DPFIX=prefetcht2 -DPFADIST=0 -DPFXDIST=128 -DPFYDIST=0' \ COMP='gcc' ! ID=900004 ROUT='cr2_sse.c' AUTH='R. Clint Whaley' KNAME='ATL_cger2k__900004' \ ! rankR=0 CacheElts=2375 SSE=3 alignA=0 alignY=16 alignX=16 minM=8 minN=2 \ ! NU=2 MU=8 LDAMUL=0 PFTUNABLE=1 ALIGNX2A=0 ADDCFLAGS=0 FNU=1 INCYISONE=1 \ X87=0 \ ! MFLOP=0.000000e+00,0.000000e+00,0.000000e+00,0.000000e+00,-1.510179e+04 \ ! ASM=GAS_x8664 \ ! CFLAGS='-x assembler-with-cpp -DPFIA=prefetcht1 -DPFIX=prefetchnta -DPFADIST=128 -DPFXDIST=128 -DPFYDIST=448' \ ! COMP='gcc' ! ID=900002 ROUT='cr2_sse.c' AUTH='R. Clint Whaley' KNAME='ATL_cger2k__900002' \ ! rankR=0 CacheElts=2375 SSE=3 alignA=0 alignY=16 alignX=16 minM=16 minN=2 \ ! NU=2 MU=16 LDAMUL=0 PFTUNABLE=1 ALIGNX2A=0 ADDCFLAGS=0 FNU=1 INCYISONE=1 \ X87=0 \ ! MFLOP=-1.051983e+04,-1.198884e+04 ASM=GAS_x8664 \ ! CFLAGS='-x assembler-with-cpp -DPFADIST=256 -DPFXDIST=0' COMP='gcc' Index: dMVNK.sum =================================================================== RCS file: /cvsroot/math-atlas/AtlasBase/Clint/misc/ARCHDEF/Core264SSE3/kern/gcc/dMVNK.sum,v retrieving revision 1.5 retrieving revision 1.6 diff -C2 -d -r1.5 -r1.6 *** dMVNK.sum 29 Oct 2010 23:33:52 -0000 1.5 --- dMVNK.sum 30 Oct 2010 01:20:39 -0000 1.6 *************** *** 1,50 **** ID=900002 ROUT='dmvn_sse.c' AUTH='R. Clint Whaley' TA='N' KNAME='ATL_dmvnk__900002' \ ! rankR=0 CacheElts=18432 SSE=3 alignA=0 alignY=16 alignX=16 minM=8 minN=1 \ ! NU=1 MU=8 LDAMUL=0 PFTUNABLE=1 ALIGNX2A=0 ADDCFLAGS=0 GEMMBASED=0 AXPYBASED=1 \ ALLALIGNXY=0 LDYTOP=0 FNU=1 X87=0 \ ! MFLOP=-6.941766e+02,-7.783074e+02 ASM=GAS_x8664 \ ! CFLAGS='-x assembler-with-cpp -DPFIA=prefetchnta -DPFIY=prefetcht0 -DPFADIST=128 -DPFXDIST=128 -DPFYDIST=256' \ ! COMP='gcc' ! ID=900009 ROUT='dmvn_sse.c' AUTH='R. Clint Whaley' TA='N' KNAME='ATL_dmvnk__900009' \ ! rankR=1 CacheElts=18432 SSE=3 alignA=16 alignY=16 alignX=16 minM=8 minN=10 \ ! NU=10 MU=8 LDAMUL=16 PFTUNABLE=1 ALIGNX2A=0 ADDCFLAGS=0 GEMMBASED=0 \ ! AXPYBASED=1 ALLALIGNXY=0 LDYTOP=0 FNU=1 X87=0 \ ! MFLOP=-6.045484e+02,-6.494537e+02,0.000000e+00,-4.941867e+03,-4.281697e+03 \ ! ASM=GAS_x8664 CFLAGS='-x assembler-with-cpp -DPFIX=prefetchnta -DPFADIST=0' \ COMP='gcc' ! ID=900008 ROUT='dmvn_sse.c' AUTH='R. Clint Whaley' TA='N' KNAME='ATL_dmvnk__900008' \ ! rankR=0 CacheElts=18432 SSE=3 alignA=0 alignY=16 alignX=16 minM=8 minN=10 \ ! NU=10 MU=8 LDAMUL=0 PFTUNABLE=1 ALIGNX2A=0 ADDCFLAGS=0 GEMMBASED=0 AXPYBASED=1 \ ALLALIGNXY=0 LDYTOP=0 FNU=1 X87=0 \ ! MFLOP=0.000000e+00,0.000000e+00,0.000000e+00,-3.503359e+03,-3.718705e+03 \ ASM=GAS_x8664 \ ! CFLAGS='-x assembler-with-cpp -DPFIA=prefetchnta -DPFIY=prefetcht2 -DPFADIST=0 -DPFXDIST=192' \ ! COMP='gcc' ! ID=900006 ROUT='dmvn_sse.c' AUTH='R. Clint Whaley' TA='N' KNAME='ATL_dmvnk__900006' \ ! rankR=2 CacheElts=4014 SSE=3 alignA=16 alignY=16 alignX=16 minM=16 minN=8 \ ! NU=8 MU=16 LDAMUL=16 PFTUNABLE=1 ALIGNX2A=0 ADDCFLAGS=0 GEMMBASED=0 \ ! AXPYBASED=1 ALLALIGNXY=0 LDYTOP=0 FNU=1 X87=0 \ ! MFLOP=-6.037738e+02,-6.537777e+02,0.000000e+00,0.000000e+00,-4.814453e+03 \ ! ASM=GAS_x8664 CFLAGS='-x assembler-with-cpp -DPFADIST=0 -DPFXDIST=0' \ COMP='gcc' ! ID=900003 ROUT='dmvn_sse.c' AUTH='R. Clint Whaley' TA='N' KNAME='ATL_dmvnk__900003' \ ! rankR=1 CacheElts=4014 SSE=3 alignA=16 alignY=16 alignX=16 minM=8 minN=1 \ ! NU=1 MU=8 LDAMUL=16 PFTUNABLE=1 ALIGNX2A=0 ADDCFLAGS=0 GEMMBASED=0 AXPYBASED=1 \ ALLALIGNXY=0 LDYTOP=0 FNU=1 X87=0 \ ! MFLOP=-6.988671e+02,-7.615770e+02,0.000000e+00,0.000000e+00,-4.394462e+03 \ ! ASM=GAS_x8664 CFLAGS='-x assembler-with-cpp' COMP='gcc' ! ID=900005 ROUT='dmvn_sse.c' AUTH='R. Clint Whaley' TA='N' KNAME='ATL_dmvnk__900005' \ ! rankR=0 CacheElts=4014 SSE=3 alignA=0 alignY=16 alignX=16 minM=16 minN=8 \ ! NU=8 MU=16 LDAMUL=0 PFTUNABLE=1 ALIGNX2A=0 ADDCFLAGS=0 GEMMBASED=0 AXPYBASED=1 \ ALLALIGNXY=0 LDYTOP=0 FNU=1 X87=0 \ ! MFLOP=0.000000e+00,0.000000e+00,0.000000e+00,0.000000e+00,-4.034810e+03 \ ASM=GAS_x8664 \ ! CFLAGS='-x assembler-with-cpp -DPFIA=prefetchnta -DPFADIST=0 -DPFXDIST=448 -DPFYDIST=0' \ COMP='gcc' ID=900002 ROUT='dmvn_sse.c' AUTH='R. Clint Whaley' TA='N' KNAME='ATL_dmvnk__900002' \ ! rankR=0 CacheElts=4014 SSE=3 alignA=0 alignY=16 alignX=16 minM=8 minN=1 \ ! NU=1 MU=8 LDAMUL=0 PFTUNABLE=1 ALIGNX2A=0 ADDCFLAGS=0 GEMMBASED=0 AXPYBASED=1 \ ALLALIGNXY=0 LDYTOP=0 FNU=1 X87=0 \ ! MFLOP=-7.024868e+02,-7.719047e+02 ASM=GAS_x8664 \ ! CFLAGS='-x assembler-with-cpp -DPFADIST=128 -DPFXDIST=512 -DPFYDIST=1024' \ ! COMP='gcc' --- 1,37 ---- ID=900002 ROUT='dmvn_sse.c' AUTH='R. Clint Whaley' TA='N' KNAME='ATL_dmvnk__900002' \ ! rankR=0 CacheElts=26624 SSE=3 alignA=0 alignY=16 alignX=16 minM=24 minN=2 \ ! NU=2 MU=24 LDAMUL=0 PFTUNABLE=1 ALIGNX2A=0 ADDCFLAGS=0 GEMMBASED=0 AXPYBASED=1 \ ALLALIGNXY=0 LDYTOP=0 FNU=1 X87=0 \ ! MFLOP=-2.025492e+03,-2.465174e+03 ASM=GAS_x8664 \ ! CFLAGS='-x assembler-with-cpp -DPFIA=prefetcht0 -DPFADIST=576 -DPFXDIST=128 -DPFYDIST=192' \ COMP='gcc' ! ID=900005 ROUT='dmvn_sse.c' AUTH='R. Clint Whaley' TA='N' KNAME='ATL_dmvnk__900005' \ ! rankR=1 CacheElts=26624 SSE=3 alignA=16 alignY=16 alignX=16 minM=8 minN=8 \ ! NU=8 MU=8 LDAMUL=16 PFTUNABLE=1 ALIGNX2A=0 ADDCFLAGS=0 GEMMBASED=0 AXPYBASED=1 \ ALLALIGNXY=0 LDYTOP=0 FNU=1 X87=0 \ ! MFLOP=-2.027557e+03,-2.048439e+03,0.000000e+00,-6.465084e+03,-7.033689e+03 \ ASM=GAS_x8664 \ ! CFLAGS='-x assembler-with-cpp -DPFIA=prefetcht1 -DPFIX=prefetcht0 -DPFIY=prefetchnta -DPFADIST=0 -DPFXDIST=448 -DPFYDIST=256' \ COMP='gcc' ! ID=900004 ROUT='dmvn_sse.c' AUTH='R. Clint Whaley' TA='N' KNAME='ATL_dmvnk__900004' \ ! rankR=0 CacheElts=26624 SSE=3 alignA=0 alignY=16 alignX=16 minM=8 minN=8 \ ! NU=8 MU=8 LDAMUL=0 PFTUNABLE=1 ALIGNX2A=0 ADDCFLAGS=0 GEMMBASED=0 AXPYBASED=1 \ ALLALIGNXY=0 LDYTOP=0 FNU=1 X87=0 \ ! MFLOP=0.000000e+00,0.000000e+00,0.000000e+00,-6.203419e+03,-6.886336e+03 \ ! ASM=GAS_x8664 \ ! CFLAGS='-x assembler-with-cpp -DPFIA=prefetchnta -DPFIX=prefetcht0 -DPFADIST=0 -DPFXDIST=192 -DPFYDIST=0' \ ! COMP='gcc' ! ID=900004 ROUT='dmvn_sse.c' AUTH='R. Clint Whaley' TA='N' KNAME='ATL_dmvnk__900004' \ ! rankR=0 CacheElts=3768 SSE=3 alignA=0 alignY=16 alignX=16 minM=8 minN=8 \ ! NU=8 MU=8 LDAMUL=0 PFTUNABLE=1 ALIGNX2A=0 ADDCFLAGS=0 GEMMBASED=0 AXPYBASED=1 \ ALLALIGNXY=0 LDYTOP=0 FNU=1 X87=0 \ ! MFLOP=0.000000e+00,0.000000e+00,0.000000e+00,0.000000e+00,-7.978343e+03 \ ASM=GAS_x8664 \ ! CFLAGS='-x assembler-with-cpp -DPFIA=prefetchnta -DPFIY=prefetcht1 -DPFADIST=0 -DPFXDIST=0 -DPFYDIST=128' \ COMP='gcc' ID=900002 ROUT='dmvn_sse.c' AUTH='R. Clint Whaley' TA='N' KNAME='ATL_dmvnk__900002' \ ! rankR=0 CacheElts=3768 SSE=3 alignA=0 alignY=16 alignX=16 minM=24 minN=2 \ ! NU=2 MU=24 LDAMUL=0 PFTUNABLE=1 ALIGNX2A=0 ADDCFLAGS=0 GEMMBASED=0 AXPYBASED=1 \ ALLALIGNXY=0 LDYTOP=0 FNU=1 X87=0 \ ! MFLOP=-2.065846e+03,-2.310732e+03 ASM=GAS_x8664 \ ! CFLAGS='-x assembler-with-cpp -DPFXDIST=128 -DPFYDIST=0' COMP='gcc' Index: dMVTK.sum =================================================================== RCS file: /cvsroot/math-atlas/AtlasBase/Clint/misc/ARCHDEF/Core264SSE3/kern/gcc/dMVTK.sum,v retrieving revision 1.8 retrieving revision 1.9 diff -C2 -d -r1.8 -r1.9 *** dMVTK.sum 29 Oct 2010 23:33:52 -0000 1.8 --- dMVTK.sum 30 Oct 2010 01:20:39 -0000 1.9 *************** *** 1,58 **** ID=900002 ROUT='dmvt_sse.c' AUTH='R. Clint Whaley' TA='T' KNAME='ATL_dmvtk__900002' \ ! rankR=0 CacheElts=16384 SSE=3 alignA=0 alignY=16 alignX=16 minM=8 minN=1 \ ! NU=1 MU=8 LDAMUL=0 PFTUNABLE=1 ALIGNX2A=0 ADDCFLAGS=0 GEMMBASED=0 AXPYBASED=0 \ ALLALIGNXY=0 LDYTOP=0 FNU=1 X87=0 \ ! MFLOP=-6.845809e+02,-8.176735e+02 ASM=GAS_x8664 \ ! CFLAGS='-x assembler-with-cpp -DPFIA=prefetchnta -DPFIY=prefetcht1 -DPFADIST=1664 -DPFXDIST=256 -DPFYDIST=0' \ ! COMP='gcc' ! ID=900009 ROUT='dmvt_sse.c' AUTH='R. Clint Whaley' TA='T' KNAME='ATL_dmvtk__900009' \ ! rankR=3 CacheElts=16384 SSE=3 alignA=16 alignY=16 alignX=16 minM=8 minN=10 \ ! NU=10 MU=8 LDAMUL=16 PFTUNABLE=1 ALIGNX2A=0 ADDCFLAGS=0 GEMMBASED=0 \ ! AXPYBASED=0 ALLALIGNXY=0 LDYTOP=0 FNU=1 X87=0 \ ! MFLOP=-5.979128e+02,-6.425698e+02,0.000000e+00,-5.067152e+03,-4.527881e+03 \ ! ASM=GAS_x8664 \ ! CFLAGS='-x assembler-with-cpp -DPFADIST=0 -DPFXDIST=128 -DPFYDIST=256' \ COMP='gcc' ID=2 ROUT='ATL_dgemvT_2x8_sse3.c' AUTH='R. Clint Whaley' TA='T' KNAME='ATL_dmvtk__2' \ ! rankR=2 CacheElts=16384 SSE=0 alignA=0 alignY=16 alignX=0 minM=0 minN=8 \ ! NU=8 MU=2 LDAMUL=16 PFTUNABLE=0 ALIGNX2A=1 ADDCFLAGS=0 GEMMBASED=0 AXPYBASED=0 \ ! ALLALIGNXY=0 LDYTOP=0 FNU=0 X87=0 \ ! MFLOP=-6.596378e+02,-6.646367e+02,0.000000e+00,-4.947005e+03,-6.984322e+03 ! ID=900006 ROUT='dmvt_sse.c' AUTH='R. Clint Whaley' TA='T' KNAME='ATL_dmvtk__900006' \ ! rankR=1 CacheElts=16384 SSE=3 alignA=16 alignY=16 alignX=16 minM=8 minN=4 \ ! NU=4 MU=8 LDAMUL=16 PFTUNABLE=1 ALIGNX2A=0 ADDCFLAGS=0 GEMMBASED=0 AXPYBASED=0 \ ! ALLALIGNXY=0 LDYTOP=0 FNU=1 X87=0 \ ! MFLOP=-5.923111e+02,-6.518792e+02,0.000000e+00,-3.787492e+03,-6.320513e+03 \ ! ASM=GAS_x8664 CFLAGS='-x assembler-with-cpp' COMP='gcc' ! ID=900007 ROUT='dmvt_C.c' AUTH='R. Clint Whaley' TA='T' KNAME='ATL_dmvtk__900007' \ ! rankR=0 CacheElts=16384 SSE=0 alignA=0 alignY=0 alignX=0 minM=2 minN=8 \ ! NU=8 MU=2 LDAMUL=0 PFTUNABLE=1 ALIGNX2A=0 ADDCFLAGS=0 GEMMBASED=0 AXPYBASED=0 \ ! ALLALIGNXY=0 LDYTOP=0 FNU=1 X87=0 \ ! MFLOP=0.000000e+00,0.000000e+00,0.000000e+00,-3.292669e+03,-4.088346e+03 \ ! CFLAGS='-fomit-frame-pointer -mfpmath=sse -msse3 -O2 -m64 -DPFIA=prefetcht2 -DPFIX=prefetcht1 -DPFYDIST=128' ! ID=2 ROUT='ATL_dgemvT_2x8_sse3.c' AUTH='R. Clint Whaley' TA='T' KNAME='ATL_dmvtk__2' \ ! rankR=2 CacheElts=3850 SSE=0 alignA=0 alignY=16 alignX=0 minM=0 minN=8 \ NU=8 MU=2 LDAMUL=16 PFTUNABLE=0 ALIGNX2A=1 ADDCFLAGS=0 GEMMBASED=0 AXPYBASED=0 \ ALLALIGNXY=0 LDYTOP=0 FNU=0 X87=0 \ ! MFLOP=-6.596378e+02,-6.646367e+02,0.000000e+00,0.000000e+00,-6.984322e+03 ! ID=900006 ROUT='dmvt_sse.c' AUTH='R. Clint Whaley' TA='T' KNAME='ATL_dmvtk__900006' \ ! rankR=1 CacheElts=3850 SSE=3 alignA=16 alignY=16 alignX=16 minM=8 minN=4 \ ! NU=4 MU=8 LDAMUL=16 PFTUNABLE=1 ALIGNX2A=0 ADDCFLAGS=0 GEMMBASED=0 AXPYBASED=0 \ ALLALIGNXY=0 LDYTOP=0 FNU=1 X87=0 \ ! MFLOP=-5.923111e+02,-6.518792e+02,0.000000e+00,0.000000e+00,-6.681424e+03 \ ASM=GAS_x8664 \ ! CFLAGS='-x assembler-with-cpp -DPFADIST=0 -DPFXDIST=256 -DPFYDIST=128' \ COMP='gcc' ! ID=900007 ROUT='dmvt_C.c' AUTH='R. Clint Whaley' TA='T' KNAME='ATL_dmvtk__900007' \ ! rankR=0 CacheElts=3850 SSE=0 alignA=0 alignY=0 alignX=0 minM=2 minN=8 \ ! NU=8 MU=2 LDAMUL=0 PFTUNABLE=1 ALIGNX2A=0 ADDCFLAGS=0 GEMMBASED=0 AXPYBASED=0 \ ALLALIGNXY=0 LDYTOP=0 FNU=1 X87=0 \ ! MFLOP=0.000000e+00,0.000000e+00,0.000000e+00,-3.296523e+03,-4.114734e+03 \ ! CFLAGS='-fomit-frame-pointer -mfpmath=sse -msse3 -O2 -m64 -DPFIA=prefetchnta -DPFIX=prefetcht2 -DPFIY=prefetcht0 -DPFADIST=0 -DPFYDIST=0' ID=900002 ROUT='dmvt_sse.c' AUTH='R. Clint Whaley' TA='T' KNAME='ATL_dmvtk__900002' \ ! rankR=0 CacheElts=3850 SSE=3 alignA=0 alignY=16 alignX=16 minM=8 minN=1 \ ! NU=1 MU=8 LDAMUL=0 PFTUNABLE=1 ALIGNX2A=0 ADDCFLAGS=0 GEMMBASED=0 AXPYBASED=0 \ ALLALIGNXY=0 LDYTOP=0 FNU=1 X87=0 \ ! MFLOP=-7.056153e+02,-7.888170e+02 ASM=GAS_x8664 \ ! CFLAGS='-x assembler-with-cpp -DPFADIST=128 -DPFXDIST=1792 -DPFYDIST=256' \ ! COMP='gcc' --- 1,34 ---- ID=900002 ROUT='dmvt_sse.c' AUTH='R. Clint Whaley' TA='T' KNAME='ATL_dmvtk__900002' \ ! rankR=0 CacheElts=32768 SSE=3 alignA=0 alignY=16 alignX=16 minM=24 minN=2 \ ! NU=2 MU=24 LDAMUL=0 PFTUNABLE=1 ALIGNX2A=0 ADDCFLAGS=0 GEMMBASED=0 AXPYBASED=0 \ ALLALIGNXY=0 LDYTOP=0 FNU=1 X87=0 \ ! MFLOP=-2.063952e+03,-2.533194e+03 ASM=GAS_x8664 \ ! CFLAGS='-x assembler-with-cpp -DPFIA=prefetcht0 -DPFIY=prefetcht0 -DPFADIST=768 -DPFXDIST=0 -DPFYDIST=256' \ COMP='gcc' ID=2 ROUT='ATL_dgemvT_2x8_sse3.c' AUTH='R. Clint Whaley' TA='T' KNAME='ATL_dmvtk__2' \ ! rankR=1 CacheElts=32768 SSE=0 alignA=0 alignY=16 alignX=0 minM=0 minN=8 \ NU=8 MU=2 LDAMUL=16 PFTUNABLE=0 ALIGNX2A=1 ADDCFLAGS=0 GEMMBASED=0 AXPYBASED=0 \ ALLALIGNXY=0 LDYTOP=0 FNU=0 X87=0 \ ! MFLOP=-1.932877e+03,-1.953017e+03,0.000000e+00,-6.343135e+03,-7.145821e+03 ! ID=900008 ROUT='dmvt_sse.c' AUTH='R. Clint Whaley' TA='T' KNAME='ATL_dmvtk__900008' \ ! rankR=0 CacheElts=32768 SSE=3 alignA=0 alignY=16 alignX=16 minM=8 minN=6 \ ! NU=6 MU=8 LDAMUL=0 PFTUNABLE=1 ALIGNX2A=0 ADDCFLAGS=0 GEMMBASED=0 AXPYBASED=0 \ ALLALIGNXY=0 LDYTOP=0 FNU=1 X87=0 \ ! MFLOP=0.000000e+00,0.000000e+00,0.000000e+00,-5.951610e+03,-6.134438e+03 \ ASM=GAS_x8664 \ ! CFLAGS='-x assembler-with-cpp -DPFIX=prefetchnta -DPFIY=prefetcht0 -DPFADIST=0 -DPFXDIST=1280 -DPFYDIST=256' \ COMP='gcc' ! ID=900005 ROUT='dmvt_sse.c' AUTH='R. Clint Whaley' TA='T' KNAME='ATL_dmvtk__900005' \ ! rankR=0 CacheElts=3686 SSE=3 alignA=0 alignY=16 alignX=16 minM=24 minN=8 \ ! NU=8 MU=24 LDAMUL=0 PFTUNABLE=1 ALIGNX2A=0 ADDCFLAGS=0 GEMMBASED=0 AXPYBASED=0 \ ALLALIGNXY=0 LDYTOP=0 FNU=1 X87=0 \ ! MFLOP=0.000000e+00,0.000000e+00,0.000000e+00,0.000000e+00,-8.043420e+03 \ ! ASM=GAS_x8664 \ ! CFLAGS='-x assembler-with-cpp -DPFIA=prefetchnta -DPFIX=prefetcht0 -DPFADIST=0 -DPFXDIST=0 -DPFYDIST=448' \ ! COMP='gcc' ID=900002 ROUT='dmvt_sse.c' AUTH='R. Clint Whaley' TA='T' KNAME='ATL_dmvtk__900002' \ ! rankR=0 CacheElts=3686 SSE=3 alignA=0 alignY=16 alignX=16 minM=24 minN=2 \ ! NU=2 MU=24 LDAMUL=0 PFTUNABLE=1 ALIGNX2A=0 ADDCFLAGS=0 GEMMBASED=0 AXPYBASED=0 \ ALLALIGNXY=0 LDYTOP=0 FNU=1 X87=0 \ ! MFLOP=-2.120502e+03,-2.376783e+03 ASM=GAS_x8664 \ ! CFLAGS='-x assembler-with-cpp -DPFXDIST=256 -DPFYDIST=192' COMP='gcc' Index: dR1K.sum =================================================================== RCS file: /cvsroot/math-atlas/AtlasBase/Clint/misc/ARCHDEF/Core264SSE3/kern/gcc/dR1K.sum,v retrieving revision 1.8 retrieving revision 1.9 diff -C2 -d -r1.8 -r1.9 *** dR1K.sum 29 Oct 2010 23:33:52 -0000 1.8 --- dR1K.sum 30 Oct 2010 01:20:39 -0000 1.9 *************** *** 1,62 **** ID=900002 ROUT='dr1_sse.c' AUTH='R. Clint Whaley' KNAME='ATL_dgerk__900002' \ ! rankR=0 CacheElts=32768 SSE=3 alignA=0 alignY=16 alignX=16 minM=8 minN=2 \ ! NU=2 MU=8 LDAMUL=0 PFTUNABLE=1 ALIGNX2A=0 ADDCFLAGS=0 FNU=1 INCYISONE=1 \ ! X87=0 \ ! MFLOP=-5.713103e+02,-5.713103e+02 ASM=GAS_x8664 \ ! CFLAGS='-x assembler-with-cpp -DPFIA=prefetcht1 -DPFIX=prefetcht1 -DPFADIST=512 -DPFXDIST=0 -DPFYDIST=128' \ ! COMP='gcc' ! ID=6 ROUT='ATL_dgerk_4x8_sse.c' AUTH='R. Clint Whaley' KNAME='ATL_dgerk__6' \ ! rankR=3 CacheElts=32768 SSE=3 alignA=0 alignY=0 alignX=0 minM=0 minN=0 \ ! NU=4 MU=8 LDAMUL=16 PFTUNABLE=0 ALIGNX2A=1 ADDCFLAGS=0 FNU=0 INCYISONE=0 \ ! X87=0 \ ! MFLOP=-4.814511e+02,-5.358372e+02,0.000000e+00,-3.463635e+03,-4.406780e+03 ! ID=900009 ROUT='dr1_sse.c' AUTH='R. Clint Whaley' KNAME='ATL_dgerk__900009' \ ! rankR=2 CacheElts=32768 SSE=3 alignA=16 alignY=16 alignX=16 minM=8 minN=4 \ ! NU=4 MU=8 LDAMUL=16 PFTUNABLE=1 ALIGNX2A=0 ADDCFLAGS=0 FNU=1 INCYISONE=1 \ X87=0 \ ! MFLOP=-4.740158e+02,-5.530732e+02,0.000000e+00,-3.420273e+03,-4.590250e+03 \ ! ASM=GAS_x8664 CFLAGS='-x assembler-with-cpp -DPFADIST=0 -DPFXDIST=128' \ COMP='gcc' ! ID=900003 ROUT='dr1_sse.c' AUTH='R. Clint Whaley' KNAME='ATL_dgerk__900003' \ ! rankR=1 CacheElts=32768 SSE=3 alignA=16 alignY=16 alignX=16 minM=8 minN=2 \ ! NU=2 MU=8 LDAMUL=16 PFTUNABLE=1 ALIGNX2A=0 ADDCFLAGS=0 FNU=1 INCYISONE=1 \ ! X87=0 \ ! MFLOP=-5.087824e+02,-5.716577e+02,0.000000e+00,-3.216009e+03,-4.317224e+03 \ ! ASM=GAS_x8664 CFLAGS='-x assembler-with-cpp' COMP='gcc' ! ID=900007 ROUT='dr1_C.c' AUTH='R. Clint Whaley' KNAME='ATL_dgerk__900007' \ ! rankR=0 CacheElts=32768 SSE=0 alignA=0 alignY=0 alignX=0 minM=1 minN=8 \ ! NU=8 MU=1 LDAMUL=0 PFTUNABLE=1 ALIGNX2A=0 ADDCFLAGS=0 FNU=1 INCYISONE=1 \ ! X87=0 \ ! MFLOP=0.000000e+00,0.000000e+00,0.000000e+00,-2.600666e+03,-3.064204e+03 \ ! CFLAGS='-fomit-frame-pointer -mfpmath=sse -msse3 -O2 -m64 -DPFIA=prefetcht2 -DPFIX=prefetcht2 -DPFIY=prefetcht0 -DPFADIST=0 -DPFXDIST=0 -DPFYDIST=384' ! ID=900009 ROUT='dr1_sse.c' AUTH='R. Clint Whaley' KNAME='ATL_dgerk__900009' \ ! rankR=3 CacheElts=3604 SSE=3 alignA=16 alignY=16 alignX=16 minM=8 minN=4 \ ! NU=4 MU=8 LDAMUL=16 PFTUNABLE=1 ALIGNX2A=0 ADDCFLAGS=0 FNU=1 INCYISONE=1 \ X87=0 \ ! MFLOP=-4.740158e+02,-5.530732e+02,0.000000e+00,-1.600000e+03,-4.654021e+03 \ ASM=GAS_x8664 \ ! CFLAGS='-x assembler-with-cpp -DPFADIST=0 -DPFXDIST=128 -DPFYDIST=256' \ COMP='gcc' ! ID=6 ROUT='ATL_dgerk_4x8_sse.c' AUTH='R. Clint Whaley' KNAME='ATL_dgerk__6' \ ! rankR=2 CacheElts=3604 SSE=3 alignA=0 alignY=0 alignX=0 minM=0 minN=0 \ ! NU=4 MU=8 LDAMUL=16 PFTUNABLE=0 ALIGNX2A=1 ADDCFLAGS=0 FNU=0 INCYISONE=0 \ ! X87=0 \ ! MFLOP=-4.814511e+02,-5.358372e+02,0.000000e+00,0.000000e+00,-4.406780e+03 ! ID=900003 ROUT='dr1_sse.c' AUTH='R. Clint Whaley' KNAME='ATL_dgerk__900003' \ ! rankR=1 CacheElts=3604 SSE=3 alignA=16 alignY=16 alignX=16 minM=8 minN=2 \ ! NU=2 MU=8 LDAMUL=16 PFTUNABLE=1 ALIGNX2A=0 ADDCFLAGS=0 FNU=1 INCYISONE=1 \ ! X87=0 \ ! MFLOP=-5.087824e+02,-5.716577e+02,0.000000e+00,0.000000e+00,-4.317224e+03 \ ! ASM=GAS_x8664 CFLAGS='-x assembler-with-cpp' COMP='gcc' ! ID=900007 ROUT='dr1_C.c' AUTH='R. Clint Whaley' KNAME='ATL_dgerk__900007' \ ! rankR=0 CacheElts=3604 SSE=0 alignA=0 alignY=0 alignX=0 minM=1 minN=8 \ ! NU=8 MU=1 LDAMUL=0 PFTUNABLE=1 ALIGNX2A=0 ADDCFLAGS=0 FNU=1 INCYISONE=1 \ X87=0 \ ! MFLOP=0.000000e+00,0.000000e+00,0.000000e+00,-2.592030e+03,-3.072310e+03 \ ! CFLAGS='-fomit-frame-pointer -mfpmath=sse -msse3 -O2 -m64 -DPFIA=prefetchnta -DPFXDIST=0' ! ID=900001 ROUT='dr1_C.c' AUTH='R. Clint Whaley' KNAME='ATL_dgerk__900001' \ ! rankR=0 CacheElts=3604 SSE=0 alignA=0 alignY=0 alignX=0 minM=32 minN=2 \ ! NU=2 MU=32 LDAMUL=0 PFTUNABLE=1 ALIGNX2A=0 ADDCFLAGS=0 FNU=1 INCYISONE=1 \ X87=0 \ ! MFLOP=-5.040471e+02,-5.564499e+02 \ ! CFLAGS='-fomit-frame-pointer -mfpmath=sse -msse3 -O2 -m64 -DPFADIST=0 -DPFXDIST=0 -DPFYDIST=128' --- 1,28 ---- ID=900002 ROUT='dr1_sse.c' AUTH='R. Clint Whaley' KNAME='ATL_dgerk__900002' \ ! rankR=0 CacheElts=26624 SSE=3 alignA=0 alignY=16 alignX=16 minM=16 minN=2 \ ! NU=2 MU=16 LDAMUL=0 PFTUNABLE=1 ALIGNX2A=0 ADDCFLAGS=0 FNU=1 INCYISONE=1 \ X87=0 \ ! MFLOP=-1.841971e+03,-1.841971e+03 ASM=GAS_x8664 \ ! CFLAGS='-x assembler-with-cpp -DPFIX=prefetcht0 -DPFIY=prefetcht0 -DPFADIST=576 -DPFXDIST=512 -DPFYDIST=128' \ COMP='gcc' ! ID=900007 ROUT='dr1_sse.c' AUTH='R. Clint Whaley' KNAME='ATL_dgerk__900007' \ ! rankR=0 CacheElts=26624 SSE=3 alignA=0 alignY=16 alignX=16 minM=8 minN=6 \ ! NU=6 MU=8 LDAMUL=0 PFTUNABLE=1 ALIGNX2A=0 ADDCFLAGS=0 FNU=1 INCYISONE=1 \ X87=0 \ ! MFLOP=0.000000e+00,0.000000e+00,0.000000e+00,-4.451065e+03,-4.328288e+03 \ ASM=GAS_x8664 \ ! CFLAGS='-x assembler-with-cpp -DPFIA=prefetchnta -DPFIX=prefetcht0 -DPFADIST=0 -DPFXDIST=192 -DPFYDIST=256' \ COMP='gcc' ! ID=900005 ROUT='dr1_sse.c' AUTH='R. Clint Whaley' KNAME='ATL_dgerk__900005' \ ! rankR=0 CacheElts=3522 SSE=3 alignA=0 alignY=16 alignX=16 minM=8 minN=4 \ ! NU=4 MU=8 LDAMUL=0 PFTUNABLE=1 ALIGNX2A=0 ADDCFLAGS=0 FNU=1 INCYISONE=1 \ X87=0 \ ! MFLOP=0.000000e+00,0.000000e+00,0.000000e+00,0.000000e+00,-4.911114e+03 \ ! ASM=GAS_x8664 \ ! CFLAGS='-x assembler-with-cpp -DPFIX=prefetcht1 -DPFADIST=256' COMP='gcc' ! ID=900002 ROUT='dr1_sse.c' AUTH='R. Clint Whaley' KNAME='ATL_dgerk__900002' \ ! rankR=0 CacheElts=3522 SSE=3 alignA=0 alignY=16 alignX=16 minM=16 minN=2 \ ! NU=2 MU=16 LDAMUL=0 PFTUNABLE=1 ALIGNX2A=0 ADDCFLAGS=0 FNU=1 INCYISONE=1 \ X87=0 \ ! MFLOP=-1.609676e+03,-1.827604e+03 ASM=GAS_x8664 \ ! CFLAGS='-x assembler-with-cpp -DPFADIST=256' COMP='gcc' Index: dR2K.sum =================================================================== RCS file: /cvsroot/math-atlas/AtlasBase/Clint/misc/ARCHDEF/Core264SSE3/kern/gcc/dR2K.sum,v retrieving revision 1.6 retrieving revision 1.7 diff -C2 -d -r1.6 -r1.7 *** dR2K.sum 29 Oct 2010 23:33:52 -0000 1.6 --- dR2K.sum 30 Oct 2010 01:20:39 -0000 1.7 *************** *** 1,15 **** ID=900002 ROUT='dr2_sse.c' AUTH='R. Clint Whaley' KNAME='ATL_dger2k__900002' \ ! rankR=0 CacheElts=32768 SSE=3 alignA=0 alignY=16 alignX=16 minM=56 minN=2 \ ! NU=2 MU=56 LDAMUL=0 PFTUNABLE=1 ALIGNX2A=0 ADDCFLAGS=0 FNU=1 INCYISONE=1 \ X87=0 \ ! MFLOP=-9.276838e+02,-1.131530e+03 ASM=GAS_x8664 \ ! CFLAGS='-x assembler-with-cpp -DPFXDIST=320 -DPFYDIST=0' COMP='gcc' ID=900008 ROUT='dr2_sse.c' AUTH='R. Clint Whaley' KNAME='ATL_dger2k__900008' \ ! rankR=2 CacheElts=32768 SSE=3 alignA=16 alignY=16 alignX=16 minM=16 \ ! minN=5 NU=5 MU=16 LDAMUL=16 PFTUNABLE=1 ALIGNX2A=0 ADDCFLAGS=0 FNU=1 \ ! INCYISONE=1 X87=0 \ ! MFLOP=-8.951151e+02,-1.044676e+03,0.000000e+00,-6.217282e+03,-5.023061e+03 \ ASM=GAS_x8664 \ ! CFLAGS='-x assembler-with-cpp -DPFIA=prefetchnta -DPFIX=prefetcht2 -DPFIY=prefetcht2 -DPFADIST=0 -DPFYDIST=128' \ COMP='gcc' ID=4 ROUT='ATL_dger2k_2x2_sse3.c' AUTH='R. Clint Whaley' KNAME='ATL_dger2k__4' \ --- 1,15 ---- ID=900002 ROUT='dr2_sse.c' AUTH='R. Clint Whaley' KNAME='ATL_dger2k__900002' \ ! rankR=0 CacheElts=32768 SSE=3 alignA=0 alignY=16 alignX=16 minM=16 minN=2 \ ! NU=2 MU=16 LDAMUL=0 PFTUNABLE=1 ALIGNX2A=0 ADDCFLAGS=0 FNU=1 INCYISONE=1 \ X87=0 \ ! MFLOP=-2.984606e+03,-3.588692e+03 ASM=GAS_x8664 \ ! CFLAGS='-x assembler-with-cpp -DPFADIST=448 -DPFYDIST=192' COMP='gcc' ID=900008 ROUT='dr2_sse.c' AUTH='R. Clint Whaley' KNAME='ATL_dger2k__900008' \ ! rankR=2 CacheElts=32768 SSE=3 alignA=16 alignY=16 alignX=16 minM=8 minN=5 \ ! NU=5 MU=8 LDAMUL=16 PFTUNABLE=1 ALIGNX2A=0 ADDCFLAGS=0 FNU=1 INCYISONE=1 \ ! X87=0 \ ! MFLOP=-3.019768e+03,-3.310418e+03,0.000000e+00,-6.095681e+03,-5.716172e+03 \ ASM=GAS_x8664 \ ! CFLAGS='-x assembler-with-cpp -DPFADIST=0 -DPFXDIST=256 -DPFYDIST=256' \ COMP='gcc' ID=4 ROUT='ATL_dger2k_2x2_sse3.c' AUTH='R. Clint Whaley' KNAME='ATL_dger2k__4' \ *************** *** 17,52 **** NU=2 MU=2 LDAMUL=16 PFTUNABLE=0 ALIGNX2A=0 ADDCFLAGS=0 FNU=1 INCYISONE=0 \ X87=0 \ ! MFLOP=-9.779651e+02,-1.099505e+03,0.000000e+00,-5.435554e+03,-2.801769e+03 \ CFLAGS='-fomit-frame-pointer -mfpmath=sse -msse3 -O2 -DATL_ALIGNED -DATL_USEREAL' \ COMP='gcc' ! ID=900004 ROUT='dr2_C.c' AUTH='R. Clint Whaley' KNAME='ATL_dger2k__900004' \ ! rankR=0 CacheElts=32768 SSE=0 alignA=0 alignY=0 alignX=0 minM=4 minN=1 \ ! NU=1 MU=4 LDAMUL=0 PFTUNABLE=1 ALIGNX2A=0 ADDCFLAGS=0 FNU=1 INCYISONE=1 \ ! X87=0 \ ! MFLOP=0.000000e+00,0.000000e+00,0.000000e+00,-2.928973e+03,-2.885300e+03 \ ! CFLAGS='-fomit-frame-pointer -mfpmath=sse -msse3 -O2 -m64 -DPFIX=prefetcht1 -DPFIY=prefetchnta -DPFYDIST=128' ! ID=900008 ROUT='dr2_sse.c' AUTH='R. Clint Whaley' KNAME='ATL_dger2k__900008' \ ! rankR=2 CacheElts=3850 SSE=3 alignA=16 alignY=16 alignX=16 minM=16 minN=5 \ ! NU=5 MU=16 LDAMUL=16 PFTUNABLE=1 ALIGNX2A=0 ADDCFLAGS=0 FNU=1 INCYISONE=1 \ ! X87=0 \ ! MFLOP=-8.951151e+02,-1.044676e+03,0.000000e+00,-2.740894e+03,-5.023061e+03 \ ! ASM=GAS_x8664 CFLAGS='-x assembler-with-cpp' COMP='gcc' ! ID=3 ROUT='ATL_dger2k_2x2_sse3.c' AUTH='R. Clint Whaley' KNAME='ATL_dger2k__3' \ ! rankR=1 CacheElts=3850 SSE=2 alignA=16 alignY=16 alignX=16 minM=0 minN=2 \ ! NU=2 MU=2 LDAMUL=16 PFTUNABLE=0 ALIGNX2A=0 ADDCFLAGS=0 FNU=1 INCYISONE=0 \ X87=0 \ ! MFLOP=-9.750347e+02,-1.114012e+03,0.000000e+00,0.000000e+00,-4.863884e+03 \ ! CFLAGS='-fomit-frame-pointer -mfpmath=sse -msse3 -O2 -DATL_ALIGNED' \ COMP='gcc' ! ID=900004 ROUT='dr2_C.c' AUTH='R. Clint Whaley' KNAME='ATL_dger2k__900004' \ ! rankR=0 CacheElts=3850 SSE=0 alignA=0 alignY=0 alignX=0 minM=4 minN=1 \ ! NU=1 MU=4 LDAMUL=0 PFTUNABLE=1 ALIGNX2A=0 ADDCFLAGS=0 FNU=1 INCYISONE=1 \ X87=0 \ ! MFLOP=0.000000e+00,0.000000e+00,0.000000e+00,0.000000e+00,-3.062050e+03 \ ! CFLAGS='-fomit-frame-pointer -mfpmath=sse -msse3 -O2 -m64 -DPFIA=prefetcht1 -DPFIX=prefetcht1 -DPFIY=prefetcht0 -DPFADIST=0 -DPFYDIST=128' ! ID=900001 ROUT='dr2_C.c' AUTH='R. Clint Whaley' KNAME='ATL_dger2k__900001' \ ! rankR=0 CacheElts=3850 SSE=0 alignA=0 alignY=0 alignX=0 minM=2 minN=1 \ ! NU=1 MU=2 LDAMUL=0 PFTUNABLE=1 ALIGNX2A=0 ADDCFLAGS=0 FNU=1 INCYISONE=1 \ X87=0 \ ! MFLOP=-9.806080e+02,-1.043580e+03 \ ! CFLAGS='-fomit-frame-pointer -mfpmath=sse -msse3 -O2 -m64 -DPFYDIST=1600' --- 17,43 ---- NU=2 MU=2 LDAMUL=16 PFTUNABLE=0 ALIGNX2A=0 ADDCFLAGS=0 FNU=1 INCYISONE=0 \ X87=0 \ ! MFLOP=-2.782555e+03,-3.177497e+03,0.000000e+00,-5.562726e+03,-2.810595e+03 \ CFLAGS='-fomit-frame-pointer -mfpmath=sse -msse3 -O2 -DATL_ALIGNED -DATL_USEREAL' \ COMP='gcc' ! ID=900004 ROUT='dr2_sse.c' AUTH='R. Clint Whaley' KNAME='ATL_dger2k__900004' \ ! rankR=0 CacheElts=32768 SSE=3 alignA=0 alignY=16 alignX=16 minM=24 minN=4 \ ! NU=4 MU=24 LDAMUL=0 PFTUNABLE=1 ALIGNX2A=0 ADDCFLAGS=0 FNU=1 INCYISONE=1 \ X87=0 \ ! MFLOP=0.000000e+00,0.000000e+00,0.000000e+00,-4.423501e+03,-6.618111e+03 \ ! ASM=GAS_x8664 \ ! CFLAGS='-x assembler-with-cpp -DPFIA=prefetcht0 -DPFIX=prefetcht1 -DPFIY=prefetchnta -DPFADIST=128 -DPFXDIST=384 -DPFYDIST=128' \ COMP='gcc' ! ID=900004 ROUT='dr2_sse.c' AUTH='R. Clint Whaley' KNAME='ATL_dger2k__900004' \ ! rankR=0 CacheElts=2375 SSE=3 alignA=0 alignY=16 alignX=16 minM=24 minN=4 \ ! NU=4 MU=24 LDAMUL=0 PFTUNABLE=1 ALIGNX2A=0 ADDCFLAGS=0 FNU=1 INCYISONE=1 \ X87=0 \ ! MFLOP=0.000000e+00,0.000000e+00,0.000000e+00,0.000000e+00,-6.842289e+03 \ ! ASM=GAS_x8664 \ ! CFLAGS='-x assembler-with-cpp -DPFIA=prefetcht2 -DPFIX=prefetcht0 -DPFIY=prefetcht1 -DPFADIST=0 -DPFXDIST=192 -DPFYDIST=256' \ ! COMP='gcc' ! ID=900002 ROUT='dr2_sse.c' AUTH='R. Clint Whaley' KNAME='ATL_dger2k__900002' \ ! rankR=0 CacheElts=2375 SSE=3 alignA=0 alignY=16 alignX=16 minM=16 minN=2 \ ! NU=2 MU=16 LDAMUL=0 PFTUNABLE=1 ALIGNX2A=0 ADDCFLAGS=0 FNU=1 INCYISONE=1 \ X87=0 \ ! MFLOP=-3.034269e+03,-3.313463e+03 ASM=GAS_x8664 \ ! CFLAGS='-x assembler-with-cpp -DPFYDIST=0' COMP='gcc' Index: sMVNK.sum =================================================================== RCS file: /cvsroot/math-atlas/AtlasBase/Clint/misc/ARCHDEF/Core264SSE3/kern/gcc/sMVNK.sum,v retrieving revision 1.5 retrieving revision 1.6 diff -C2 -d -r1.5 -r1.6 *** sMVNK.sum 29 Oct 2010 23:33:52 -0000 1.5 --- sMVNK.sum 30 Oct 2010 01:20:39 -0000 1.6 *************** *** 1,64 **** ! ID=900001 ROUT='smvn_C.c' AUTH='R. Clint Whaley' TA='N' KNAME='ATL_smvnk__900001' \ ! rankR=0 CacheElts=36864 SSE=0 alignA=0 alignY=0 alignX=0 minM=2 minN=4 \ ! NU=4 MU=2 LDAMUL=0 PFTUNABLE=1 ALIGNX2A=0 ADDCFLAGS=0 GEMMBASED=0 AXPYBASED=1 \ ALLALIGNXY=0 LDYTOP=0 FNU=1 X87=0 \ ! MFLOP=-1.421887e+03,-1.608062e+03 \ ! CFLAGS='-fomit-frame-pointer -mfpmath=sse -msse3 -O2 -m64 -DPFIA=prefetcht0 -DPFIY=prefetcht1 -DPFADIST=0 -DPFYDIST=0' ! ID=900006 ROUT='smvn_sse.c' AUTH='R. Clint Whaley' TA='N' KNAME='ATL_smvnk__900006' \ ! rankR=3 CacheElts=36864 SSE=3 alignA=16 alignY=16 alignX=16 minM=16 \ ! minN=4 NU=4 MU=16 LDAMUL=16 PFTUNABLE=1 ALIGNX2A=0 ADDCFLAGS=0 GEMMBASED=0 \ AXPYBASED=1 ALLALIGNXY=0 LDYTOP=0 FNU=1 X87=0 \ ! MFLOP=-1.382933e+03,-1.596011e+03,0.000000e+00,-8.212706e+03,-9.444444e+03 \ ASM=GAS_x8664 \ ! CFLAGS='-x assembler-with-cpp -DPFADIST=0 -DPFXDIST=192 -DPFYDIST=384' \ COMP='gcc' ! ID=2 ROUT='ATL_sgemvN_8x4_sse.c' AUTH='R. Clint Whaley' TA='N' KNAME='ATL_smvnk__2' \ ! rankR=2 CacheElts=36864 SSE=1 alignA=0 alignY=16 alignX=0 minM=0 minN=0 \ ! NU=4 MU=8 LDAMUL=16 PFTUNABLE=0 ALIGNX2A=1 ADDCFLAGS=0 GEMMBASED=0 AXPYBASED=1 \ ! ALLALIGNXY=0 LDYTOP=0 FNU=0 X87=0 \ ! MFLOP=-1.462021e+03,-1.612652e+03,0.000000e+00,-7.434983e+03,-8.803571e+03 ! ID=900003 ROUT='smvn_sse.c' AUTH='R. Clint Whaley' TA='N' KNAME='ATL_smvnk__900003' \ ! rankR=1 CacheElts=36864 SSE=3 alignA=16 alignY=16 alignX=16 minM=80 \ ! minN=2 NU=2 MU=80 LDAMUL=16 PFTUNABLE=1 ALIGNX2A=0 ADDCFLAGS=0 GEMMBASED=0 \ AXPYBASED=1 ALLALIGNXY=0 LDYTOP=0 FNU=1 X87=0 \ ! MFLOP=-1.374508e+03,-1.573829e+03,0.000000e+00,-7.018069e+03,-7.424699e+03 \ ! ASM=GAS_x8664 CFLAGS='-x assembler-with-cpp' COMP='gcc' ! ID=900005 ROUT='smvn_sse.c' AUTH='R. Clint Whaley' TA='N' KNAME='ATL_smvnk__900005' \ ! rankR=0 CacheElts=36864 SSE=3 alignA=0 alignY=16 alignX=16 minM=16 minN=4 \ ! NU=4 MU=16 LDAMUL=0 PFTUNABLE=1 ALIGNX2A=0 ADDCFLAGS=0 GEMMBASED=0 AXPYBASED=1 \ ! ALLALIGNXY=0 LDYTOP=0 FNU=1 X87=0 \ ! MFLOP=0.000000e+00,0.000000e+00,0.000000e+00,-4.055397e+03,-4.279514e+03 \ ASM=GAS_x8664 \ ! CFLAGS='-x assembler-with-cpp -DPFIA=prefetchnta -DPFIX=prefetcht0 -DPFIY=prefetcht1 -DPFADIST=128 -DPFXDIST=128' \ COMP='gcc' - ID=900006 ROUT='smvn_sse.c' AUTH='R. Clint Whaley' TA='N' KNAME='ATL_smvnk__900006' \ - rankR=3 CacheElts=8192 SSE=3 alignA=16 alignY=16 alignX=16 minM=16 minN=4 \ - NU=4 MU=16 LDAMUL=16 PFTUNABLE=1 ALIGNX2A=0 ADDCFLAGS=0 GEMMBASED=0 \ - AXPYBASED=1 ALLALIGNXY=0 LDYTOP=0 FNU=1 X87=0 \ - MFLOP=-1.382933e+03,-1.596011e+03,0.000000e+00,0.000000e+00,-9.722587e+03 \ - ASM=GAS_x8664 CFLAGS='-x assembler-with-cpp -DPFADIST=0' COMP='gcc' - ID=2 ROUT='ATL_sgemvN_8x4_sse.c' AUTH='R. Clint Whaley' TA='N' KNAME='ATL_smvnk__2' \ - rankR=2 CacheElts=8192 SSE=1 alignA=0 alignY=16 alignX=0 minM=0 minN=0 \ - NU=4 MU=8 LDAMUL=16 PFTUNABLE=0 ALIGNX2A=1 ADDCFLAGS=0 GEMMBASED=0 AXPYBASED=1 \ - ALLALIGNXY=0 LDYTOP=0 FNU=0 X87=0 \ - MFLOP=-1.462021e+03,-1.612652e+03,0.000000e+00,0.000000e+00,-8.803571e+03 - ID=900003 ROUT='smvn_sse.c' AUTH='R. Clint Whaley' TA='N' KNAME='ATL_smvnk__900003' \ - rankR=1 CacheElts=8192 SSE=3 alignA=16 alignY=16 alignX=16 minM=80 minN=2 \ - NU=2 MU=80 LDAMUL=16 PFTUNABLE=1 ALIGNX2A=0 ADDCFLAGS=0 GEMMBASED=0 \ - AXPYBASED=1 ALLALIGNXY=0 LDYTOP=0 FNU=1 X87=0 \ - MFLOP=-1.374508e+03,-1.573829e+03,0.000000e+00,0.000000e+00,-7.424699e+03 \ - ASM=GAS_x8664 CFLAGS='-x assembler-with-cpp' COMP='gcc' ID=900005 ROUT='smvn_sse.c' AUTH='R. Clint Whaley' TA='N' KNAME='ATL_smvnk__900005' \ ! rankR=0 CacheElts=8192 SSE=3 alignA=0 alignY=16 alignX=16 minM=16 minN=4 \ ! NU=4 MU=16 LDAMUL=0 PFTUNABLE=1 ALIGNX2A=0 ADDCFLAGS=0 GEMMBASED=0 AXPYBASED=1 \ ALLALIGNXY=0 LDYTOP=0 FNU=1 X87=0 \ ! MFLOP=0.000000e+00,0.000000e+00,0.000000e+00,0.000000e+00,-4.232002e+03 \ ASM=GAS_x8664 \ ! CFLAGS='-x assembler-with-cpp -DPFIA=prefetcht1 -DPFIY=prefetcht0 -DPFADIST=0 -DPFXDIST=128 -DPFYDIST=832' \ COMP='gcc' ! ID=900001 ROUT='smvn_C.c' AUTH='R. Clint Whaley' TA='N' KNAME='ATL_smvnk__900001' \ ! rankR=0 CacheElts=8192 SSE=0 alignA=0 alignY=0 alignX=0 minM=2 minN=4 \ ! NU=4 MU=2 LDAMUL=0 PFTUNABLE=1 ALIGNX2A=0 ADDCFLAGS=0 GEMMBASED=0 AXPYBASED=1 \ ALLALIGNXY=0 LDYTOP=0 FNU=1 X87=0 \ ! MFLOP=-1.431032e+03,-1.596147e+03 \ ! CFLAGS='-fomit-frame-pointer -mfpmath=sse -msse3 -O2 -m64 -DPFADIST=0 -DPFYDIST=0' --- 1,37 ---- ! ID=900002 ROUT='smvn_sse.c' AUTH='R. Clint Whaley' TA='N' KNAME='ATL_smvnk__900002' \ ! rankR=0 CacheElts=57344 SSE=3 alignA=0 alignY=16 alignX=16 minM=32 minN=4 \ ! NU=4 MU=32 LDAMUL=0 PFTUNABLE=1 ALIGNX2A=0 ADDCFLAGS=0 GEMMBASED=0 AXPYBASED=1 \ ALLALIGNXY=0 LDYTOP=0 FNU=1 X87=0 \ ! MFLOP=-4.046816e+03,-4.695770e+03 ASM=GAS_x8664 \ ! CFLAGS='-x assembler-with-cpp -DPFIA=prefetcht0 -DPFIY=prefetcht2 -DPFADIST=384 -DPFXDIST=0 -DPFYDIST=256' \ ! COMP='gcc' ! ID=900008 ROUT='smvn_sse.c' AUTH='R. Clint Whaley' TA='N' KNAME='ATL_smvnk__900008' \ ! rankR=1 CacheElts=57344 SSE=3 alignA=16 alignY=16 alignX=16 minM=16 \ ! minN=12 NU=12 MU=16 LDAMUL=16 PFTUNABLE=1 ALIGNX2A=0 ADDCFLAGS=0 GEMMBASED=0 \ AXPYBASED=1 ALLALIGNXY=0 LDYTOP=0 FNU=1 X87=0 \ ! MFLOP=-3.252172e+03,-3.809663e+03,0.000000e+00,-1.326065e+04,-1.434403e+04 \ ASM=GAS_x8664 \ ! CFLAGS='-x assembler-with-cpp -DPFIA=prefetcht0 -DPFIX=prefetcht2 -DPFIY=prefetchnta -DPFADIST=0 -DPFXDIST=320 -DPFYDIST=192' \ COMP='gcc' ! ID=900007 ROUT='smvn_sse.c' AUTH='R. Clint Whaley' TA='N' KNAME='ATL_smvnk__900007' \ ! rankR=0 CacheElts=57344 SSE=3 alignA=0 alignY=16 alignX=16 minM=16 minN=12 \ ! NU=12 MU=16 LDAMUL=0 PFTUNABLE=1 ALIGNX2A=0 ADDCFLAGS=0 GEMMBASED=0 \ AXPYBASED=1 ALLALIGNXY=0 LDYTOP=0 FNU=1 X87=0 \ ! MFLOP=0.000000e+00,0.000000e+00,0.000000e+00,-1.177907e+04,-1.225333e+04 \ ASM=GAS_x8664 \ ! CFLAGS='-x assembler-with-cpp -DPFIA=prefetcht2 -DPFIX=prefetcht2 -DPFIY=prefetcht0 -DPFADIST=0 -DPFXDIST=192 -DPFYDIST=0' \ COMP='gcc' ID=900005 ROUT='smvn_sse.c' AUTH='R. Clint Whaley' TA='N' KNAME='ATL_smvnk__900005' \ ! rankR=0 CacheElts=4096 SSE=3 alignA=0 alignY=16 alignX=16 minM=16 minN=8 \ ! NU=8 MU=16 LDAMUL=0 PFTUNABLE=1 ALIGNX2A=0 ADDCFLAGS=0 GEMMBASED=0 AXPYBASED=1 \ ALLALIGNXY=0 LDYTOP=0 FNU=1 X87=0 \ ! MFLOP=0.000000e+00,0.000000e+00,0.000000e+00,0.000000e+00,-1.540818e+04 \ ASM=GAS_x8664 \ ! CFLAGS='-x assembler-with-cpp -DPFIA=prefetcht1 -DPFADIST=0 -DPFXDIST=128 -DPFYDIST=384' \ COMP='gcc' ! ID=900002 ROUT='smvn_sse.c' AUTH='R. Clint Whaley' TA='N' KNAME='ATL_smvnk__900002' \ ! rankR=0 CacheElts=4096 SSE=3 alignA=0 alignY=16 alignX=16 minM=32 minN=4 \ ! NU=4 MU=32 LDAMUL=0 PFTUNABLE=1 ALIGNX2A=0 ADDCFLAGS=0 GEMMBASED=0 AXPYBASED=1 \ ALLALIGNXY=0 LDYTOP=0 FNU=1 X87=0 \ ! MFLOP=-4.223665e+03,-4.483205e+03 ASM=GAS_x8664 \ ! CFLAGS='-x assembler-with-cpp -DPFADIST=192 -DPFYDIST=256' COMP='gcc' Index: sMVTK.sum =================================================================== RCS file: /cvsroot/math-atlas/AtlasBase/Clint/misc/ARCHDEF/Core264SSE3/kern/gcc/sMVTK.sum,v retrieving revision 1.5 retrieving revision 1.6 diff -C2 -d -r1.5 -r1.6 *** sMVTK.sum 29 Oct 2010 23:33:52 -0000 1.5 --- sMVTK.sum 30 Oct 2010 01:20:39 -0000 1.6 *************** *** 1,66 **** ! ID=900001 ROUT='smvt_C.c' AUTH='R. Clint Whaley' TA='T' KNAME='ATL_smvtk__900001' \ ! rankR=0 CacheElts=49152 SSE=0 alignA=0 alignY=0 alignX=0 minM=2 minN=4 \ ! NU=4 MU=2 LDAMUL=0 PFTUNABLE=1 ALIGNX2A=0 ADDCFLAGS=0 GEMMBASED=0 AXPYBASED=0 \ ALLALIGNXY=0 LDYTOP=0 FNU=1 X87=0 \ ! MFLOP=-1.391000e+03,-1.573593e+03 \ ! CFLAGS='-fomit-frame-pointer -mfpmath=sse -msse3 -O2 -m64 -DPFIA=prefetcht2 -DPFIX=prefetchnta -DPFIY=prefetcht2 -DPFADIST=128 -DPFXDIST=320 -DPFYDIST=128' ! ID=900009 ROUT='smvt_sse.c' AUTH='R. Clint Whaley' TA='T' KNAME='ATL_smvtk__900009' \ ! rankR=3 CacheElts=49152 SSE=3 alignA=16 alignY=16 alignX=16 minM=16 \ ! minN=4 NU=4 MU=16 LDAMUL=16 PFTUNABLE=1 ALIGNX2A=0 ADDCF... [truncated message content] |