[Math-atlas-commits] CVS: AtlasBase/Clint/misc/ARCHDEF/HPPA20/gcc/gemm cCleanK,NONE,1.1 cCleanM,NONE
Brought to you by:
rwhaley,
tonyc040457
Update of /cvsroot/math-atlas/AtlasBase/Clint/misc/ARCHDEF/HPPA20/gcc/gemm In directory sc8-pr-cvs1.sourceforge.net:/tmp/cvs-serv16539/Clint/misc/ARCHDEF/HPPA20/gcc/gemm Added Files: cCleanK cCleanM cCleanN cMMRES cNB cNCNB cXover.h cbestNN_0x0x0 cbestNN_0x0x80 cbestNN_80x80x80 cbestNT_0x0x0 cbestNT_0x0x80 cbestNT_80x80x80 cbestTN_0x0x0 cbestTN_0x0x80 cbestTN_80x80x80 cbestTT_0x0x0 cbestTT_0x0x80 cbestTT_80x80x80 cgMMRES cuCleanK cuCleanKF cuCleanM cuCleanMF cuCleanN cuCleanNF cuMMRES dCleanK dCleanM dCleanN dMMRES dNB dNCNB dXover.h dbestNN_0x0x0 dbestNN_0x0x80 dbestNN_80x80x80 dbestNT_0x0x0 dbestNT_0x0x80 dbestNT_80x80x80 dbestTN_0x0x0 dbestTN_0x0x80 dbestTN_80x80x80 dbestTT_0x0x0 dbestTT_0x0x80 dbestTT_80x80x80 dgMMRES dnreg duCleanK duCleanKF duCleanM duCleanMF duCleanN duCleanNF duMMRES sCleanK sCleanM sCleanN sMMRES sNB sNCNB sXover.h sbestNN_0x0x0 sbestNN_0x0x80 sbestNN_80x80x80 sbestNT_0x0x0 sbestNT_0x0x80 sbestNT_80x80x80 sbestTN_0x0x0 sbestTN_0x0x80 sbestTN_80x80x80 sbestTT_0x0x0 sbestTT_0x0x80 sbestTT_80x80x80 sgMMRES snreg suCleanK suCleanKF suCleanM suCleanMF suCleanN suCleanNF suMMRES zCleanK zCleanM zCleanN zMMRES zNB zNCNB zXover.h zbestNN_0x0x0 zbestNN_0x0x80 zbestNN_80x80x80 zbestNT_0x0x0 zbestNT_0x0x80 zbestNT_80x80x80 zbestTN_0x0x0 zbestTN_0x0x80 zbestTN_80x80x80 zbestTT_0x0x0 zbestTT_0x0x80 zbestTT_80x80x80 zgMMRES zuCleanK zuCleanKF zuCleanM zuCleanMF zuCleanN zuCleanNF zuMMRES Log Message: hppa20 fixes --- NEW FILE: cCleanK --- KB MULADD LAT NB MU NU KU FFTCH IFTCH NFTCH GEN-MFLOP SPC-MFLOP 80 1 1 80 6 6 80 0 6 3 -738.21 -640.84 79 1 1 80 6 6 79 0 6 3 -724.05 -640.84 78 1 1 80 6 6 78 0 6 3 -691.97 -640.84 77 1 1 80 6 6 77 0 6 3 -698.79 -640.84 76 1 1 80 6 6 76 0 6 3 -714.44 -640.84 75 1 1 80 6 6 75 0 6 3 -691.15 -640.84 74 1 1 80 6 6 74 0 6 3 -716.41 -640.84 73 1 1 80 6 6 73 0 6 3 -687.11 -640.84 72 1 1 80 6 6 72 0 6 3 -732.35 -640.84 71 1 1 80 6 6 71 0 6 3 -719.08 -640.84 70 1 1 80 6 6 70 0 6 3 -681.39 -640.84 69 1 1 80 6 6 69 0 6 3 -671.53 -640.84 68 1 1 80 6 6 68 0 6 3 -731.62 -640.84 67 1 1 80 6 6 67 0 6 3 -739.57 -640.84 66 1 1 80 6 6 66 0 6 3 -708.08 -640.84 65 1 1 80 6 6 65 0 6 3 -726.60 -640.84 64 1 1 80 6 6 64 0 6 3 -714.88 -640.84 63 1 1 80 6 6 63 0 6 3 -709.62 -640.84 62 1 1 80 6 6 62 0 6 3 -692.47 -640.84 61 1 1 80 6 6 61 0 6 3 -702.93 -640.84 60 1 1 80 6 6 60 0 6 3 -680.15 -640.84 59 1 1 80 6 6 59 0 6 3 -681.62 -640.84 58 1 1 80 6 6 58 0 6 3 -655.49 -640.84 57 1 1 80 6 6 57 0 6 3 -678.28 -640.84 56 1 1 80 6 6 56 0 6 3 -676.17 -640.84 55 1 1 80 6 6 55 0 6 3 -666.95 -640.84 54 1 1 80 6 6 54 0 6 3 -670.30 -640.84 53 1 1 80 6 6 53 0 6 3 -670.03 -640.84 52 1 1 80 6 6 52 0 6 3 -676.13 -640.84 51 1 1 80 6 6 51 0 6 3 -667.33 -640.84 50 1 1 80 6 6 50 0 6 3 -673.49 -640.84 49 1 1 80 6 6 49 0 6 3 -677.17 -640.84 48 1 1 80 6 6 48 0 6 3 -681.07 -640.84 47 1 1 80 6 6 47 0 6 3 -673.73 -640.84 46 1 1 80 6 6 46 0 6 3 -676.53 -640.84 45 1 1 80 6 6 45 0 6 3 -675.98 -640.84 44 1 1 80 6 6 44 0 6 3 -676.97 -640.84 43 1 1 80 6 6 43 0 6 3 -675.50 -640.84 42 1 1 80 6 6 42 0 6 3 -680.07 -640.84 41 1 1 80 6 6 41 0 6 3 -676.12 -640.84 40 1 1 80 6 6 40 0 6 3 -676.24 -640.84 39 1 1 80 6 6 39 0 6 3 -671.89 -640.84 38 1 1 80 6 6 38 0 6 3 -676.26 -640.84 37 1 1 80 6 6 37 0 6 3 -678.86 -640.84 36 1 1 80 6 6 36 0 6 3 -667.88 -640.84 35 1 1 80 6 6 35 0 6 3 -669.50 -640.84 34 1 1 80 6 6 34 0 6 3 -676.45 -640.84 33 1 1 80 6 6 33 0 6 3 -670.84 -640.84 32 1 1 80 6 6 32 0 6 3 -666.77 -640.84 31 1 1 80 6 6 31 0 6 3 -669.49 -640.84 30 1 1 80 6 6 30 0 6 3 -669.58 -640.84 29 1 1 80 6 6 29 0 6 3 -674.84 -640.84 28 1 1 80 6 6 28 0 6 3 -673.73 -640.84 27 1 1 80 6 6 27 0 6 3 -672.62 -640.84 26 1 1 80 6 6 26 0 6 3 -663.57 -640.84 25 1 1 80 6 6 25 0 6 3 -665.71 -640.84 24 1 1 80 6 6 24 0 6 3 -653.19 -640.84 23 1 1 80 6 6 23 0 6 3 -655.48 -640.84 22 1 1 80 6 6 22 0 6 3 -660.73 -640.84 21 1 1 80 6 6 21 0 6 3 -670.22 -640.84 20 1 1 80 6 6 20 0 6 3 -659.27 -640.84 19 1 1 80 6 6 19 0 6 3 -656.99 -640.84 18 1 1 80 6 6 18 0 6 3 -652.89 -640.84 17 1 1 80 6 6 17 0 6 3 -668.03 -640.84 16 1 1 80 6 6 16 0 6 3 -651.68 -640.84 15 1 1 80 6 6 15 0 6 3 -654.86 -640.84 14 1 1 80 6 6 14 0 6 3 -655.87 -640.84 13 1 1 80 6 6 13 0 6 3 -649.45 -640.84 0 1 1 80 6 6 1 0 6 3 -602.48 -640.84 --- NEW FILE: cCleanM --- MULADD LAT NB MU NU KU FFTCH IFTCH NFTCH MFLOP 1 1 80 6 6 80 0 6 3 -700.70 --- NEW FILE: cCleanN --- MULADD LAT NB MU NU KU FFTCH IFTCH NFTCH MFLOP 1 1 80 6 6 80 0 6 3 -701.67 --- NEW FILE: cMMRES --- MULADD LAT NB MU NU KU FFTCH IFTCH NFTCH MFLOP 1 1 80 6 6 80 0 6 3 -816.77 ICASE NB MFLOP ROUT AUTHOR 324 80 -2163.30 "ATL_smm4x4x16_hppa.c" "R. Clint Whaley" --- NEW FILE: cNB --- 1 80 --- NEW FILE: cNCNB --- 80 --- NEW FILE: cXover.h --- #ifndef CXOVER_H #define CXOVER_H #define ATL_3NB 240 #define NN_MNK_M 18000 #define NN_MNK_N 18000 #define NN_MNK_MN 64000 #define NN_MNK_K 297680 #define NN_MNK_GE 1000 #define NT_MNK_M 8000 #define NT_MNK_N 297680 #define NT_MNK_MN 64000 #define NT_MNK_K 564480 #define NT_MNK_GE 3375 #define TN_MNK_M 8000 #define TN_MNK_N 8000 #define TN_MNK_MN 64000 #define TN_MNK_K 564480 #define TN_MNK_GE 1000 #define TT_MNK_M 18000 #define TT_MNK_N 8000 #define TT_MNK_MN 64000 #define TT_MNK_K 8000 #define TT_MNK_GE 3375 #endif --- NEW FILE: cbestNN_0x0x0 --- MULADD LAT NB MU NU KU FFTCH IFTCH NFTCH MFLOP 1 1 80 6 6 8 0 6 3 -692.80 --- NEW FILE: cbestNN_0x0x80 --- MULADD LAT NB MU NU KU FFTCH IFTCH NFTCH MFLOP 1 3 80 6 6 80 0 6 3 -709.14 --- NEW FILE: cbestNN_80x80x80 --- MULADD LAT NB MU NU KU FFTCH IFTCH NFTCH MFLOP 1 1 80 6 6 80 0 6 3 -698.20 --- NEW FILE: cbestNT_0x0x0 --- MULADD LAT NB MU NU KU FFTCH IFTCH NFTCH MFLOP 1 4 80 6 6 1 0 6 3 -649.68 --- NEW FILE: cbestNT_0x0x80 --- MULADD LAT NB MU NU KU FFTCH IFTCH NFTCH MFLOP 1 3 80 6 6 4 0 6 3 -749.67 --- NEW FILE: cbestNT_80x80x80 --- MULADD LAT NB MU NU KU FFTCH IFTCH NFTCH MFLOP 1 1 80 6 6 4 0 6 3 -747.70 --- NEW FILE: cbestTN_0x0x0 --- MULADD LAT NB MU NU KU FFTCH IFTCH NFTCH MFLOP 1 1 80 6 6 1 0 6 3 -609.45 --- NEW FILE: cbestTN_0x0x80 --- MULADD LAT NB MU NU KU FFTCH IFTCH NFTCH MFLOP 1 6 80 6 6 80 0 6 3 -766.44 --- NEW FILE: cbestTN_80x80x80 --- MULADD LAT NB MU NU KU FFTCH IFTCH NFTCH MFLOP 1 6 80 6 6 80 0 6 3 -766.44 --- NEW FILE: cbestTT_0x0x0 --- MULADD LAT NB MU NU KU FFTCH IFTCH NFTCH MFLOP 1 6 80 6 6 8 0 6 3 -747.34 --- NEW FILE: cbestTT_0x0x80 --- MULADD LAT NB MU NU KU FFTCH IFTCH NFTCH MFLOP 1 1 80 6 6 4 0 6 3 -748.41 --- NEW FILE: cbestTT_80x80x80 --- MULADD LAT NB MU NU KU FFTCH IFTCH NFTCH MFLOP 1 1 80 6 6 4 0 6 3 -748.41 --- NEW FILE: cgMMRES --- MULADD LAT NB MU NU KU FFTCH IFTCH NFTCH MFLOP 1 1 80 6 6 80 0 6 3 -820.62 --- NEW FILE: cuCleanK --- MULT ICASE FIXED NB NB0 NB1 NB2 MFLOP ROUT 2 1 3 1 80 70 40 16 -415.52 ATL_mm4x4x2_1_prefCU.c 16 324 1 80 64 32 16 -2076.53 ATL_smm4x4x16_hppa.c --- NEW FILE: cuCleanKF --- MULT ICASE FIXED NB 1 16 324 1 80 --- NEW FILE: cuCleanM --- MULT ICASE FIXED NB NB0 NB1 NB2 MFLOP ROUT 2 1 311 0 80 70 40 16 -370.48 ATL_mm6x8x8_1p.c 4 324 0 80 68 40 16 -2111.18 ATL_smm4x4x16_hppa.c --- NEW FILE: cuCleanMF --- MULT ICASE FIXED NB 1 4 324 0 80 --- NEW FILE: cuCleanN --- MULT ICASE FIXED NB NB0 NB1 NB2 MFLOP ROUT 2 3 6 0 80 69 39 18 -321.61 ATL_mm4x3x8p.c 4 324 0 80 68 40 16 -2111.54 ATL_smm4x4x16_hppa.c --- NEW FILE: cuCleanNF --- MULT ICASE FIXED NB 1 4 324 0 80 --- NEW FILE: cuMMRES --- CASE NB MFLOP ROUTINE 324 80 -2163.30 "ATL_smm4x4x16_hppa.c" "R. Clint Whaley" --- NEW FILE: dCleanK --- KB MULADD LAT NB MU NU KU FFTCH IFTCH NFTCH GEN-MFLOP SPC-MFLOP 80 1 2 80 6 3 80 1 4 1 -1766.63 -1587.81 79 1 2 80 6 3 79 1 4 1 -1693.09 -1576.79 78 1 2 80 6 3 78 1 4 1 -1521.93 -1381.18 77 1 2 80 6 3 77 1 4 1 -1617.22 -1502.09 76 1 2 80 6 3 76 1 4 1 -1647.24 -1460.79 75 1 2 80 6 3 75 1 4 1 -1585.78 -1499.71 74 1 2 80 6 3 74 1 4 1 -1580.67 -1372.92 73 1 2 80 6 3 73 1 4 1 -1651.64 -1538.54 72 1 2 80 6 3 72 1 4 1 -1763.81 -1561.75 71 1 2 80 6 3 71 1 4 1 -1689.51 -1572.11 70 1 2 80 6 3 70 1 4 1 -1519.60 -1382.92 69 1 2 80 6 3 69 1 4 1 -1608.31 -1499.38 68 1 2 80 6 3 68 1 4 1 -1645.67 -1465.04 67 1 2 80 6 3 67 1 4 1 -1586.82 -1492.01 66 1 2 80 6 3 66 1 4 1 -1581.19 -1367.87 65 1 2 80 6 3 65 1 4 1 -1652.37 -1531.62 64 1 2 80 6 3 64 1 4 1 -1759.66 -1542.31 63 1 2 80 6 3 63 1 4 1 -1688.47 -1558.71 62 1 2 80 6 3 62 1 4 1 -1520.56 -1369.77 61 1 2 80 6 3 61 1 4 1 -1614.73 -1487.09 60 1 2 80 6 3 60 1 4 1 -1640.78 -1454.99 59 1 2 80 6 3 59 1 4 1 -1586.62 -1484.77 58 1 2 80 6 3 58 1 4 1 -1580.47 -1368.54 57 1 2 80 6 3 57 1 4 1 -1647.34 -1528.00 56 1 2 80 6 3 56 1 4 1 -1754.41 -1542.15 55 1 2 80 6 3 55 1 4 1 -1684.84 -1553.24 54 1 2 80 6 3 54 1 4 1 -1517.65 -1371.08 53 1 2 80 6 3 53 1 4 1 -1612.01 -1482.66 52 1 2 80 6 3 52 1 4 1 -1637.90 -1452.10 51 1 2 80 6 3 51 1 4 1 -1587.27 -1458.27 50 1 2 80 6 3 50 1 4 1 -1559.84 -1348.77 49 1 2 80 6 3 49 1 4 1 -1646.65 -1485.98 48 1 2 80 6 3 48 1 4 1 -1745.59 -1517.42 47 1 2 80 6 3 47 1 4 1 -1678.01 -1533.78 46 1 2 80 6 3 46 1 4 1 -1516.98 -1349.23 45 1 2 80 6 3 45 1 4 1 -1607.29 -1472.41 44 1 2 80 6 3 44 1 4 1 -1630.73 -1438.44 43 1 2 80 6 3 43 1 4 1 -1582.02 -1465.46 42 1 2 80 6 3 42 1 4 1 -1564.56 -1353.06 41 1 2 80 6 3 41 1 4 1 -1639.11 -1488.35 40 1 2 80 6 3 40 1 4 1 -1736.06 -1504.42 39 1 2 80 6 3 39 1 4 1 -1667.37 -1516.02 38 1 2 80 6 3 38 1 4 1 -1514.63 -1352.02 37 1 2 80 6 3 37 1 4 1 -1605.03 -1448.04 36 1 2 80 6 3 36 1 4 1 -1622.51 -1422.28 35 1 2 80 6 3 35 1 4 1 -1576.27 -1444.97 34 1 2 80 6 3 34 1 4 1 -1556.29 -1327.45 33 1 2 80 6 3 33 1 4 1 -1632.44 -1452.53 32 1 2 80 6 3 32 1 4 1 -1717.75 -1471.66 31 1 2 80 6 3 31 1 4 1 -1655.83 -1475.18 30 1 2 80 6 3 30 1 4 1 -1508.23 -1325.22 29 1 2 80 6 3 29 1 4 1 -1595.00 -1447.85 28 1 2 80 6 3 28 1 4 1 -1611.38 -1427.27 27 1 2 80 6 3 27 1 4 1 -1572.67 -1458.82 26 1 2 80 6 3 26 1 4 1 -1539.41 -1334.25 25 1 2 80 6 3 25 1 4 1 -1615.81 -1443.99 24 1 2 80 6 3 24 1 4 1 -1694.94 -1471.40 23 1 2 80 6 3 23 1 4 1 -1632.76 -1458.88 22 1 2 80 6 3 22 1 4 1 -1496.02 -1316.91 21 1 2 80 6 3 21 1 4 1 -1581.60 -1417.27 20 1 2 80 6 3 20 1 4 1 -1587.78 -1364.42 19 1 2 80 6 3 19 1 4 1 -1563.93 -1405.56 18 1 2 80 6 3 18 1 4 1 -1511.77 -1286.38 17 1 2 80 6 3 17 1 4 1 -1591.99 -1391.92 16 1 2 80 6 3 16 1 4 1 -1645.67 -1385.75 15 1 2 80 6 3 15 1 4 1 -1595.28 -1379.66 14 1 2 80 6 3 14 1 4 1 -1487.33 -1281.13 13 1 2 80 6 3 13 1 4 1 -1555.52 -1343.43 12 1 2 80 6 3 12 1 4 1 -1537.29 -1286.04 11 1 2 80 6 3 11 1 4 1 -1538.77 -1309.73 10 1 2 80 6 3 10 1 4 1 -1455.52 -1194.47 9 1 2 80 6 3 9 1 4 1 -1488.17 -1267.21 8 1 2 80 6 3 8 1 4 1 -1511.26 -1191.37 7 1 2 80 6 3 7 1 4 1 -1417.28 -1162.08 6 1 2 80 6 3 6 1 4 1 -1316.38 -1042.65 5 1 2 80 6 3 5 1 4 1 -1292.40 -1019.83 4 1 2 80 6 3 4 1 4 1 -1231.77 -1016.82 3 1 2 80 6 3 3 1 4 1 -1104.98 -1016.82 0 1 2 80 6 3 1 1 4 1 -888.95 -1016.82 --- NEW FILE: dCleanM --- MULADD LAT NB MU NU KU FFTCH IFTCH NFTCH MFLOP 1 2 80 6 3 80 1 4 1 -1775.67 --- NEW FILE: dCleanN --- MULADD LAT NB MU NU KU FFTCH IFTCH NFTCH MFLOP 1 2 80 6 3 80 1 4 1 -1793.01 --- NEW FILE: dMMRES --- MULADD LAT NB MU NU KU FFTCH IFTCH NFTCH MFLOP 1 2 80 6 3 80 1 4 1 -1806.50 ICASE NB MFLOP ROUT AUTHOR 325 80 -1821.25 "ATL_dmm4x4x16_hppa.c" "R. Clint Whaley" --- NEW FILE: dNB --- 1 80 --- NEW FILE: dNCNB --- 80 --- NEW FILE: dXover.h --- #ifndef DXOVER_H #define DXOVER_H #define ATL_3NB 240 #define NN_MNK_M 18202320 #define NN_MNK_N 18202320 #define NN_MNK_MN 3052800 #define NN_MNK_K 564480 #define NN_MNK_GE 108531333 #define NT_MNK_M 7938000 #define NT_MNK_N 8000 #define NT_MNK_MN 3052800 #define NT_MNK_K 564480 #define NT_MNK_GE 1000 #define TN_MNK_M 25267520 #define TN_MNK_N 19365120 #define TN_MNK_MN 2147483647 #define TN_MNK_K 8000 #define TN_MNK_GE 592704 #define TT_MNK_M 2099520 #define TT_MNK_N 8000 #define TT_MNK_MN 3052800 #define TT_MNK_K 564480 #define TT_MNK_GE 592704 #endif --- NEW FILE: dbestNN_0x0x0 --- MULADD LAT NB MU NU KU FFTCH IFTCH NFTCH MFLOP 1 2 80 6 3 12 1 4 1 -1440.53 --- NEW FILE: dbestNN_0x0x80 --- MULADD LAT NB MU NU KU FFTCH IFTCH NFTCH MFLOP 1 6 80 6 3 4 1 4 1 -1458.02 --- NEW FILE: dbestNN_80x80x80 --- MULADD LAT NB MU NU KU FFTCH IFTCH NFTCH MFLOP 1 6 80 6 3 80 1 4 1 -1430.63 --- NEW FILE: dbestNT_0x0x0 --- MULADD LAT NB MU NU KU FFTCH IFTCH NFTCH MFLOP 1 3 80 6 3 8 1 4 1 -1307.21 --- NEW FILE: dbestNT_0x0x80 --- MULADD LAT NB MU NU KU FFTCH IFTCH NFTCH MFLOP 1 4 80 6 3 80 1 4 1 -1357.23 --- NEW FILE: dbestNT_80x80x80 --- MULADD LAT NB MU NU KU FFTCH IFTCH NFTCH MFLOP 1 8 80 6 3 80 1 4 1 -1400.46 --- NEW FILE: dbestTN_0x0x0 --- MULADD LAT NB MU NU KU FFTCH IFTCH NFTCH MFLOP 1 2 80 6 3 16 1 4 1 -1585.40 --- NEW FILE: dbestTN_0x0x80 --- MULADD LAT NB MU NU KU FFTCH IFTCH NFTCH MFLOP 1 4 80 6 3 80 1 4 1 -1760.65 --- NEW FILE: dbestTN_80x80x80 --- MULADD LAT NB MU NU KU FFTCH IFTCH NFTCH MFLOP 1 5 80 6 3 80 1 4 1 -1802.33 --- NEW FILE: dbestTT_0x0x0 --- MULADD LAT NB MU NU KU FFTCH IFTCH NFTCH MFLOP 1 2 80 6 3 12 1 4 1 -1454.63 --- NEW FILE: dbestTT_0x0x80 --- MULADD LAT NB MU NU KU FFTCH IFTCH NFTCH MFLOP 1 6 80 6 3 80 1 4 1 -1435.23 --- NEW FILE: dbestTT_80x80x80 --- MULADD LAT NB MU NU KU FFTCH IFTCH NFTCH MFLOP 1 3 80 6 3 80 1 4 1 -1451.25 --- NEW FILE: dgMMRES --- MULADD LAT NB MU NU KU FFTCH IFTCH NFTCH MFLOP 1 2 80 6 3 80 1 4 1 -1806.50 --- NEW FILE: dnreg --- 33 --- NEW FILE: duCleanK --- MULT ICASE FIXED NB NB0 NB1 NB2 MFLOP ROUT 2 1 3 1 80 70 40 16 -1147.34 ATL_mm4x4x2_1_prefCU.c 16 325 1 80 64 32 16 -1732.24 ATL_dmm4x4x16_hppa.c --- NEW FILE: duCleanKF --- MULT ICASE FIXED NB 0 --- NEW FILE: duCleanM --- MULT ICASE FIXED NB NB0 NB1 NB2 MFLOP ROUT 2 1 314 0 80 70 40 16 -598.39 ATL_mm6x8x8_1p.c 4 325 0 80 68 40 16 -1589.00 ATL_dmm4x4x16_hppa.c --- NEW FILE: duCleanMF --- MULT ICASE FIXED NB 1 4 325 0 80 --- NEW FILE: duCleanN --- MULT ICASE FIXED NB NB0 NB1 NB2 MFLOP ROUT 2 3 6 0 80 69 39 18 -982.72 ATL_mm4x3x8p.c 4 325 0 80 68 40 16 -1589.18 ATL_dmm4x4x16_hppa.c --- NEW FILE: duCleanNF --- MULT ICASE FIXED NB 0 --- NEW FILE: duMMRES --- CASE NB MFLOP ROUTINE 325 80 -1821.25 "ATL_dmm4x4x16_hppa.c" "R. Clint Whaley" --- NEW FILE: sCleanK --- KB MULADD LAT NB MU NU KU FFTCH IFTCH NFTCH GEN-MFLOP SPC-MFLOP 80 1 1 80 6 6 80 0 6 3 -1050.78 -589.25 79 1 1 80 6 6 79 0 6 3 -1002.57 -586.35 78 1 1 80 6 6 78 0 6 3 -896.97 -576.92 77 1 1 80 6 6 77 0 6 3 -967.06 -579.98 76 1 1 80 6 6 76 0 6 3 -870.60 -581.37 75 1 1 80 6 6 75 0 6 3 -892.20 -578.77 74 1 1 80 6 6 74 0 6 3 -860.87 -577.05 73 1 1 80 6 6 73 0 6 3 -885.36 -579.74 72 1 1 80 6 6 72 0 6 3 -909.62 -585.82 71 1 1 80 6 6 71 0 6 3 -991.18 -578.85 70 1 1 80 6 6 70 0 6 3 -897.43 -575.13 69 1 1 80 6 6 69 0 6 3 -883.59 -588.28 68 1 1 80 6 6 68 0 6 3 -1014.35 -580.03 67 1 1 80 6 6 67 0 6 3 -1026.57 -580.89 66 1 1 80 6 6 66 0 6 3 -990.69 -577.18 65 1 1 80 6 6 65 0 6 3 -993.61 -577.98 64 1 1 80 6 6 64 0 6 3 -1037.96 -590.25 63 1 1 80 6 6 63 0 6 3 -1006.98 -583.02 62 1 1 80 6 6 62 0 6 3 -1021.73 -578.58 61 1 1 80 6 6 61 0 6 3 -884.27 -580.23 60 1 1 80 6 6 60 0 6 3 -1008.15 -577.80 59 1 1 80 6 6 59 0 6 3 -984.01 -589.66 58 1 1 80 6 6 58 0 6 3 -864.41 -577.56 57 1 1 80 6 6 57 0 6 3 -992.65 -581.21 56 1 1 80 6 6 56 0 6 3 -1001.96 -586.41 55 1 1 80 6 6 55 0 6 3 -993.16 -577.12 54 1 1 80 6 6 54 0 6 3 -996.14 -577.97 53 1 1 80 6 6 53 0 6 3 -1001.06 -582.94 52 1 1 80 6 6 52 0 6 3 -1001.44 -580.77 51 1 1 80 6 6 51 0 6 3 -995.00 -582.08 50 1 1 80 6 6 50 0 6 3 -993.23 -576.87 49 1 1 80 6 6 49 0 6 3 -991.92 -590.41 48 1 1 80 6 6 48 0 6 3 -1027.26 -587.37 47 1 1 80 6 6 47 0 6 3 -1000.89 -582.23 46 1 1 80 6 6 46 0 6 3 -989.15 -579.03 45 1 1 80 6 6 45 0 6 3 -992.22 -576.41 44 1 1 80 6 6 44 0 6 3 -997.99 -582.14 43 1 1 80 6 6 43 0 6 3 -998.07 -581.00 42 1 1 80 6 6 42 0 6 3 -988.62 -576.30 41 1 1 80 6 6 41 0 6 3 -990.16 -578.96 40 1 1 80 6 6 40 0 6 3 -1010.52 -580.13 39 1 1 80 6 6 39 0 6 3 -990.61 -589.93 38 1 1 80 6 6 38 0 6 3 -986.36 -574.77 37 1 1 80 6 6 37 0 6 3 -996.94 -582.06 36 1 1 80 6 6 36 0 6 3 -993.50 -580.36 35 1 1 80 6 6 35 0 6 3 -987.37 -575.24 34 1 1 80 6 6 34 0 6 3 -986.07 -576.49 33 1 1 80 6 6 33 0 6 3 -982.24 -579.97 32 1 1 80 6 6 32 0 6 3 -1010.07 -584.06 31 1 1 80 6 6 31 0 6 3 -989.32 -578.59 30 1 1 80 6 6 30 0 6 3 -983.63 -571.12 29 1 1 80 6 6 29 0 6 3 -989.19 -593.40 28 1 1 80 6 6 28 0 6 3 -995.26 -575.56 27 1 1 80 6 6 27 0 6 3 -988.24 -579.58 26 1 1 80 6 6 26 0 6 3 -979.39 -575.51 25 1 1 80 6 6 25 0 6 3 -979.17 -573.44 24 1 1 80 6 6 24 0 6 3 -989.40 -581.88 23 1 1 80 6 6 23 0 6 3 -976.71 -580.49 22 1 1 80 6 6 22 0 6 3 -975.12 -577.55 21 1 1 80 6 6 21 0 6 3 -975.00 -578.12 20 1 1 80 6 6 20 0 6 3 -978.68 -568.51 19 1 1 80 6 6 19 0 6 3 -974.24 -602.84 18 1 1 80 6 6 18 0 6 3 -976.06 -571.83 17 1 1 80 6 6 17 0 6 3 -969.09 -577.78 16 1 1 80 6 6 16 0 6 3 -968.17 -576.49 15 1 1 80 6 6 15 0 6 3 -958.08 -564.19 14 1 1 80 6 6 14 0 6 3 -956.01 -567.26 13 1 1 80 6 6 13 0 6 3 -935.54 -570.76 12 1 1 80 6 6 12 0 6 3 -926.13 -563.96 11 1 1 80 6 6 11 0 6 3 -916.29 -563.84 10 1 1 80 6 6 10 0 6 3 -909.87 -563.84 9 1 1 80 6 6 9 0 6 3 -891.14 -563.84 8 1 1 80 6 6 8 0 6 3 -868.52 -563.84 7 1 1 80 6 6 7 0 6 3 -846.58 -563.84 6 1 1 80 6 6 6 0 6 3 -830.30 -563.84 5 1 1 80 6 6 5 0 6 3 -733.68 -563.84 4 1 1 80 6 6 4 0 6 3 -709.29 -563.84 3 1 1 80 6 6 3 0 6 3 -672.81 -563.84 2 1 1 80 6 6 2 0 6 3 -586.62 -563.84 0 1 1 80 6 6 1 0 6 3 -408.05 -563.84 --- NEW FILE: sCleanM --- MULADD LAT NB MU NU KU FFTCH IFTCH NFTCH MFLOP 1 1 80 6 6 80 0 6 3 -798.57 --- NEW FILE: sCleanN --- MULADD LAT NB MU NU KU FFTCH IFTCH NFTCH MFLOP 1 1 80 6 6 80 0 6 3 -815.05 --- NEW FILE: sMMRES --- MULADD LAT NB MU NU KU FFTCH IFTCH NFTCH MFLOP 1 1 80 6 6 80 0 6 3 -1051.05 ICASE NB MFLOP ROUT AUTHOR 324 80 -2089.44 "ATL_smm4x4x16_hppa.c" "R. Clint Whaley" --- NEW FILE: sNB --- 1 80 --- NEW FILE: sNCNB --- 80 --- NEW FILE: sXover.h --- #ifndef SXOVER_H #define SXOVER_H #define ATL_3NB 240 #define NN_MNK_M 8000 #define NN_MNK_N 297680 #define NN_MNK_MN 64000 #define NN_MNK_K 224720 #define NN_MNK_GE 226981 #define NT_MNK_M 8000 #define NT_MNK_N 8000 #define NT_MNK_MN 64000 #define NT_MNK_K 8000 #define NT_MNK_GE 1000 #define TN_MNK_M 564480 #define TN_MNK_N 564480 #define TN_MNK_MN 537600 #define TN_MNK_K 564480 #define TN_MNK_GE 592704 #define TT_MNK_M 564480 #define TT_MNK_N 8000 #define TT_MNK_MN 64000 #define TT_MNK_K 297680 #define TT_MNK_GE 592704 #endif --- NEW FILE: sbestNN_0x0x0 --- MULADD LAT NB MU NU KU FFTCH IFTCH NFTCH MFLOP 1 6 80 6 6 8 0 6 3 -610.17 --- NEW FILE: sbestNN_0x0x80 --- MULADD LAT NB MU NU KU FFTCH IFTCH NFTCH MFLOP 1 6 80 6 6 80 0 6 3 -759.15 --- NEW FILE: sbestNN_80x80x80 --- MULADD LAT NB MU NU KU FFTCH IFTCH NFTCH MFLOP 1 5 80 6 6 80 0 6 3 -759.34 --- NEW FILE: sbestNT_0x0x0 --- MULADD LAT NB MU NU KU FFTCH IFTCH NFTCH MFLOP 1 3 80 6 6 8 0 6 3 -700.39 --- NEW FILE: sbestNT_0x0x80 --- MULADD LAT NB MU NU KU FFTCH IFTCH NFTCH MFLOP 1 5 80 6 6 80 0 6 3 -642.97 --- NEW FILE: sbestNT_80x80x80 --- MULADD LAT NB MU NU KU FFTCH IFTCH NFTCH MFLOP 1 1 80 6 6 1 0 6 3 -667.30 --- NEW FILE: sbestTN_0x0x0 --- MULADD LAT NB MU NU KU FFTCH IFTCH NFTCH MFLOP 1 1 80 6 6 8 0 6 3 -654.15 --- NEW FILE: sbestTN_0x0x80 --- MULADD LAT NB MU NU KU FFTCH IFTCH NFTCH MFLOP 1 4 80 6 6 80 0 6 3 -944.80 --- NEW FILE: sbestTN_80x80x80 --- MULADD LAT NB MU NU KU FFTCH IFTCH NFTCH MFLOP 1 8 80 6 6 80 0 6 3 -945.09 --- NEW FILE: sbestTT_0x0x0 --- MULADD LAT NB MU NU KU FFTCH IFTCH NFTCH MFLOP 1 3 80 6 6 12 0 6 3 -701.02 --- NEW FILE: sbestTT_0x0x80 --- MULADD LAT NB MU NU KU FFTCH IFTCH NFTCH MFLOP 1 1 80 6 6 80 0 6 3 -796.94 --- NEW FILE: sbestTT_80x80x80 --- MULADD LAT NB MU NU KU FFTCH IFTCH NFTCH MFLOP 1 6 80 6 6 80 0 6 3 -797.15 --- NEW FILE: sgMMRES --- MULADD LAT NB MU NU KU FFTCH IFTCH NFTCH MFLOP 1 1 80 6 6 80 0 6 3 -1051.05 --- NEW FILE: snreg --- 64 --- NEW FILE: suCleanK --- MULT ICASE FIXED NB NB0 NB1 NB2 MFLOP ROUT 2 1 3 1 80 70 40 16 -384.79 ATL_mm4x4x2_1_prefCU.c 16 324 1 80 64 32 16 -1983.68 ATL_smm4x4x16_hppa.c --- NEW FILE: suCleanKF --- MULT ICASE FIXED NB 1 16 324 1 80 --- NEW FILE: suCleanM --- MULT ICASE FIXED NB NB0 NB1 NB2 MFLOP ROUT 2 1 311 0 80 70 40 16 -376.95 ATL_mm6x8x8_1p.c 4 324 0 80 68 40 16 -1941.16 ATL_smm4x4x16_hppa.c --- NEW FILE: suCleanMF --- MULT ICASE FIXED NB 1 4 324 0 80 --- NEW FILE: suCleanN --- MULT ICASE FIXED NB NB0 NB1 NB2 MFLOP ROUT 2 3 6 0 80 69 39 18 -311.37 ATL_mm4x3x8p.c 4 324 0 80 68 40 16 -1936.54 ATL_smm4x4x16_hppa.c --- NEW FILE: suCleanNF --- MULT ICASE FIXED NB 1 4 324 0 80 --- NEW FILE: suMMRES --- CASE NB MFLOP ROUTINE 324 80 -2089.44 "ATL_smm4x4x16_hppa.c" "R. Clint Whaley" --- NEW FILE: zCleanK --- KB MULADD LAT NB MU NU KU FFTCH IFTCH NFTCH GEN-MFLOP SPC-MFLOP 80 1 6 80 6 3 20 1 4 5 -1742.95 -1624.17 79 1 6 80 6 3 20 1 4 5 -1831.48 -1624.17 0 1 6 80 6 3 8 1 4 5 -1623.51 -1624.17 --- NEW FILE: zCleanM --- MULADD LAT NB MU NU KU FFTCH IFTCH NFTCH MFLOP 1 6 80 6 3 20 1 4 5 -1762.64 --- NEW FILE: zCleanN --- MULADD LAT NB MU NU KU FFTCH IFTCH NFTCH MFLOP 1 6 80 6 3 20 1 4 5 -1767.63 --- NEW FILE: zMMRES --- MULADD LAT NB MU NU KU FFTCH IFTCH NFTCH MFLOP 1 6 80 6 3 20 1 4 5 -1754.73 ICASE NB MFLOP ROUT AUTHOR 325 80 -1933.00 "ATL_dmm4x4x16_hppa.c" "R. Clint Whaley" --- NEW FILE: zNB --- 1 80 --- NEW FILE: zNCNB --- 80 --- NEW FILE: zXover.h --- #ifndef ZXOVER_H #define ZXOVER_H #define ATL_3NB 240 #define NN_MNK_M 8000 #define NN_MNK_N 8000 #define NN_MNK_MN 64000 #define NN_MNK_K 564480 #define NN_MNK_GE 1000 #define NT_MNK_M 8000 #define NT_MNK_N 8000 #define NT_MNK_MN 64000 #define NT_MNK_K 72000 #define NT_MNK_GE 1000 #define TN_MNK_M 1190720 #define TN_MNK_N 3200000 #define TN_MNK_MN 2147483647 #define TN_MNK_K 1352000 #define TN_MNK_GE 1481544 #define TT_MNK_M 8000 #define TT_MNK_N 8000 #define TT_MNK_MN 64000 #define TT_MNK_K 176720 #define TT_MNK_GE 1000 #endif --- NEW FILE: zbestNN_0x0x0 --- MULADD LAT NB MU NU KU FFTCH IFTCH NFTCH MFLOP 1 3 80 6 3 8 1 4 5 -1516.83 --- NEW FILE: zbestNN_0x0x80 --- MULADD LAT NB MU NU KU FFTCH IFTCH NFTCH MFLOP 1 2 80 6 3 20 1 4 5 -1601.66 --- NEW FILE: zbestNN_80x80x80 --- MULADD LAT NB MU NU KU FFTCH IFTCH NFTCH MFLOP 1 3 80 6 3 20 1 4 5 -1500.79 --- NEW FILE: zbestNT_0x0x0 --- MULADD LAT NB MU NU KU FFTCH IFTCH NFTCH MFLOP 1 2 80 6 3 8 1 4 5 -1361.97 --- NEW FILE: zbestNT_0x0x80 --- MULADD LAT NB MU NU KU FFTCH IFTCH NFTCH MFLOP 1 2 80 6 3 20 1 4 5 -1439.20 --- NEW FILE: zbestNT_80x80x80 --- MULADD LAT NB MU NU KU FFTCH IFTCH NFTCH MFLOP 1 5 80 6 3 20 1 4 5 -1380.64 --- NEW FILE: zbestTN_0x0x0 --- MULADD LAT NB MU NU KU FFTCH IFTCH NFTCH MFLOP 1 2 80 6 3 8 1 4 5 -1643.94 --- NEW FILE: zbestTN_0x0x80 --- MULADD LAT NB MU NU KU FFTCH IFTCH NFTCH MFLOP 1 3 80 6 3 20 1 4 5 -1749.80 --- NEW FILE: zbestTN_80x80x80 --- MULADD LAT NB MU NU KU FFTCH IFTCH NFTCH MFLOP 1 6 80 6 3 20 1 4 5 -1797.14 --- NEW FILE: zbestTT_0x0x0 --- MULADD LAT NB MU NU KU FFTCH IFTCH NFTCH MFLOP 1 3 80 6 3 8 1 4 5 -1513.15 --- NEW FILE: zbestTT_0x0x80 --- MULADD LAT NB MU NU KU FFTCH IFTCH NFTCH MFLOP 1 2 80 6 3 4 1 4 5 -1505.85 --- NEW FILE: zbestTT_80x80x80 --- MULADD LAT NB MU NU KU FFTCH IFTCH NFTCH MFLOP 1 6 80 6 3 20 1 4 5 -1449.23 --- NEW FILE: zgMMRES --- MULADD LAT NB MU NU KU FFTCH IFTCH NFTCH MFLOP 1 2 80 6 3 20 1 4 1 -875.76 --- NEW FILE: zuCleanK --- MULT ICASE FIXED NB NB0 NB1 NB2 MFLOP ROUT 2 1 3 1 80 70 40 16 -1197.13 ATL_mm4x4x2_1_prefCU.c 16 325 1 80 64 32 16 -1827.33 ATL_dmm4x4x16_hppa.c --- NEW FILE: zuCleanKF --- MULT ICASE FIXED NB 1 16 325 1 80 --- NEW FILE: zuCleanM --- MULT ICASE FIXED NB NB0 NB1 NB2 MFLOP ROUT 2 1 314 0 80 70 40 16 -604.89 ATL_mm6x8x8_1p.c 4 325 0 80 68 40 16 -1815.09 ATL_dmm4x4x16_hppa.c --- NEW FILE: zuCleanMF --- MULT ICASE FIXED NB 1 4 325 0 80 --- NEW FILE: zuCleanN --- MULT ICASE FIXED NB NB0 NB1 NB2 MFLOP ROUT 2 3 6 0 80 69 39 18 -1005.65 ATL_mm4x3x8p.c 4 325 0 80 68 40 16 -1810.81 ATL_dmm4x4x16_hppa.c --- NEW FILE: zuCleanNF --- MULT ICASE FIXED NB 1 4 325 0 80 --- NEW FILE: zuMMRES --- CASE NB MFLOP ROUTINE 325 80 -1933.00 "ATL_dmm4x4x16_hppa.c" "R. Clint Whaley" |