-
Notifications
You must be signed in to change notification settings - Fork 4
/
Copy pathbdw.csv
We can make this file beautiful and searchable if this error is corrected: It looks like row 2 should actually have 1 column, instead of 5 in line 1.
126 lines (126 loc) · 7.39 KB
/
bdw.csv
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
Intel(R) Xeon(R) CPU D-1571 @ 1.30GHz
"reg64","add","latency","1.005435e+00","9.945939e-01"
"reg64","add","throughput","2.673515e-01","3.740394e+00"
"reg64","lea","latency","1.005118e+00","9.949084e-01"
"reg64","lea","throughput","5.030286e-01","1.987958e+00"
"reg64","xor dst,dst","latency","2.673577e-01","3.740307e+00"
"reg64","xor dst,dst","throughput","2.673202e-01","3.740833e+00"
"reg64","xor","latency","2.668270e-01","3.747747e+00"
"reg64","xor","throughput","2.669234e-01","3.746393e+00"
"reg64","load","latency","5.018156e+00","1.992764e-01"
"reg64","load","throughput","6.271042e-01","1.594631e+00"
"reg64","crc32","latency","3.008892e+00","3.323482e-01"
"reg64","crc32","throughput","1.004368e+00","9.956510e-01"
"reg64","store [mem+0]->load[mem+0]","latency","1.229579e+01","8.132862e-02"
"reg64","store [mem+0]->load[mem+0]","throughput","1.263294e+00","7.915815e-01"
"reg64","store [mem+0]->load[mem+1]","latency","2.005469e+01","4.986365e-02"
"reg64","store [mem+0]->load[mem+1]","throughput","1.403139e+01","7.126875e-02"
"m128","pxor","latency","2.792659e-01","3.580816e+00"
"m128","pxor","throughput","2.789258e-01","3.585183e+00"
"m128","padd","latency","1.001859e+00","9.981446e-01"
"m128","padd","throughput","5.019989e-01","1.992036e+00"
"m128","pmuldq","latency","5.007596e+00","1.996966e-01"
"m128","pmuldq","throughput","1.002865e+00","9.971433e-01"
"m128","loadps","throughput","5.020837e-01","1.991700e+00"
"m128","loadps->movq","latency","7.012644e+00","1.425996e-01"
"m128","movq->movq","latency","2.005775e+00","4.985604e-01"
"m128","movq->movq","throughput","1.004190e+00","9.958275e-01"
"m128","xorps","latency","2.786104e-01","3.589241e+00"
"m128","xorps","throughput","2.790360e-01","3.583767e+00"
"m128","addps","latency","3.006787e+00","3.325809e-01"
"m128","addps","throughput","1.003402e+00","9.966099e-01"
"m128","mulps","latency","3.006605e+00","3.326011e-01"
"m128","mulps","throughput","5.009242e-01","1.996310e+00"
"m128","divps","latency","1.101913e+01","9.075130e-02"
"m128","divps","throughput","5.018023e+00","1.992817e-01"
"m128","divpd","latency","1.001664e+01","9.983390e-02"
"m128","divpd","throughput","8.021761e+00","1.246609e-01"
"m128","rsqrtps","latency","5.007502e+00","1.997004e-01"
"m128","rsqrtps","throughput","1.003823e+00","9.961916e-01"
"m128","rcpps","latency","5.008220e+00","1.996717e-01"
"m128","rcpps","throughput","1.003651e+00","9.963626e-01"
"m128","blendps","latency","1.003578e+00","9.964348e-01"
"m128","blendps","throughput","3.341694e-01","2.992494e+00"
"m128","blendvps","latency","2.006539e+00","4.983705e-01"
"m128","blendvps","throughput","2.005635e+00","4.985952e-01"
"m128","pshufb","latency","1.002921e+00","9.970875e-01"
"m128","pshufb","throughput","1.001989e+00","9.980154e-01"
"m128","shufps","latency","1.002982e+00","9.970270e-01"
"m128","shufps","throughput","1.002853e+00","9.971551e-01"
"m128","pmullw","latency","5.007810e+00","1.996881e-01"
"m128","pmullw","throughput","1.002626e+00","9.973805e-01"
"m128","phaddd","latency","3.007200e+00","3.325353e-01"
"m128","phaddd","throughput","2.005810e+00","4.985518e-01"
"m128","haddps","latency","3.007363e+00","3.325172e-01"
"m128","haddps","throughput","2.005387e+00","4.986569e-01"
"m128","pinsrd","latency","2.007249e+00","4.981942e-01"
"m128","pinsrd","throughput","2.005805e+00","4.985529e-01"
"m128","pinsrd->pexr","latency","4.008767e+00","2.494533e-01"
"m128","dpps","latency","1.202906e+01","8.313203e-02"
"m128","dpps","throughput","2.321211e+00","4.308097e-01"
"m128","cvtps2dq","latency","3.006614e+00","3.326000e-01"
"m128","cvtps2dq","throughput","1.002633e+00","9.973737e-01"
"reg64","popcnt","latency","3.006188e+00","3.326472e-01"
"reg64","popcnt","throughput","1.003134e+00","9.968755e-01"
"m128","aesenc","latency","7.010418e+00","1.426448e-01"
"m128","aesenc","throughput","1.002947e+00","9.970614e-01"
"m128","aesenclast","latency","7.011492e+00","1.426230e-01"
"m128","aesenclast","throughput","1.002983e+00","9.970260e-01"
"m128","aesdec","latency","7.009893e+00","1.426555e-01"
"m128","aesdec","throughput","1.003703e+00","9.963104e-01"
"m128","aesdeclast","latency","7.010402e+00","1.426452e-01"
"m128","aesdeclast","throughput","1.002656e+00","9.973512e-01"
"m256","movaps [mem]","latency","1.003582e+00","9.964310e-01"
"m256","movaps [mem]","throughput","5.022303e-01","1.991118e+00"
"m256","vmovdqu [mem+1]","latency","1.003402e+00","9.966090e-01"
"m256","vmovdqu [mem+1]","throughput","5.015736e-01","1.993725e+00"
"m256","vmovdqu [mem+63] (cross cache)","latency","1.004246e+00","9.957720e-01"
"m256","vmovdqu [mem+63] (cross cache)","throughput","1.004481e+00","9.955392e-01"
"m256","vmovdqu [mem+2MB-1] (cross page)","latency","3.105519e+01","3.220074e-02"
"m256","vmovdqu [mem+2MB-1] (cross page)","throughput","3.104532e+01","3.221098e-02"
"m256","xorps","latency","2.791684e-01","3.582067e+00"
"m256","xorps","throughput","2.790542e-01","3.583533e+00"
"m256","mulps","latency","3.007174e+00","3.325381e-01"
"m256","mulps","throughput","5.015511e-01","1.993815e+00"
"m256","addps","latency","3.007763e+00","3.324730e-01"
"m256","addps","throughput","1.003600e+00","9.964127e-01"
"m256","divps","latency","1.719467e+01","5.815756e-02"
"m256","divps","throughput","1.009360e+01","9.907269e-02"
"m256","divpd","latency","1.908511e+01","5.239688e-02"
"m256","divpd","throughput","1.616323e+01","6.186883e-02"
"m256","rsqrtps","latency","7.013317e+00","1.425859e-01"
"m256","rsqrtps","throughput","2.006882e+00","4.982853e-01"
"m256","rcpps","latency","7.013340e+00","1.425854e-01"
"m256","rcpps","throughput","2.004963e+00","4.987623e-01"
"m256","sqrtps","latency","1.808487e+01","5.529484e-02"
"m256","sqrtps","throughput","1.409339e+01","7.095526e-02"
"m256","vperm2f128","latency","3.006833e+00","3.325758e-01"
"m256","vperm2f128","throughput","1.002868e+00","9.971400e-01"
"m256","pxor","latency","2.788529e-01","3.586120e+00"
"m256","pxor","throughput","2.780111e-01","3.596979e+00"
"m256","paddd","latency","1.002739e+00","9.972681e-01"
"m256","paddd","throughput","5.009634e-01","1.996154e+00"
"m256","vpermps","latency","3.008312e+00","3.324123e-01"
"m256","vpermps","throughput","1.003438e+00","9.965739e-01"
"m256","vpermpd","latency","3.006010e+00","3.326669e-01"
"m256","vpermpd","throughput","1.002575e+00","9.974315e-01"
"m256","vpmovsxwd","latency","3.006030e+00","3.326647e-01"
"m256","vpmovsxwd","throughput","1.003455e+00","9.965573e-01"
"m256","vpgatherdd","latency","2.115726e+01","4.726510e-02"
"m256","vpgatherdd","throughput","6.039028e+00","1.655896e-01"
"m256","gather32(<ld+ins>x8 + perm)","latency","1.703472e+01","5.870364e-02"
"m256","gather32(<ld+ins>x8 + perm)","throughput","8.018219e+00","1.247160e-01"
"m256","vgatherdpd","latency","1.819990e+01","5.494535e-02"
"m256","vgatherdpd","throughput","5.037717e+00","1.985026e-01"
"m256","gather64(<ld+ins>x4 + perm)","latency","1.217406e+01","8.214183e-02"
"m256","gather64(<ld+ins>x4 + perm)","throughput","4.007869e+00","2.495092e-01"
"m256","vpshufb","latency","1.006102e+00","9.939352e-01"
"m256","vpshufb","throughput","1.003021e+00","9.969881e-01"
"m256","vfmaps","latency","5.008734e+00","1.996512e-01"
"m256","vfmaps","throughput","5.014875e-01","1.994068e+00"
"m256","vfmapd","latency","5.008636e+00","1.996551e-01"
"m256","vfmapd","throughput","5.010047e-01","1.995989e+00"
"m128","vfmaps","latency","5.008727e+00","1.996515e-01"
"m128","vfmaps","throughput","5.016058e-01","1.993597e+00"
"m128","vfmapd","latency","5.008312e+00","1.996681e-01"
"m128","vfmapd","throughput","5.009094e-01","1.996369e+00"