File tree 4 files changed +6
-1
lines changed
4 files changed +6
-1
lines changed Original file line number Diff line number Diff line change @@ -45,7 +45,7 @@ fma_dot:
45
45
vaddps %ymm0 ,%ymm8 ,%ymm0
46
46
47
47
/* TODO: horizontally sum ymm0 */
48
-
48
+ vzeroupper
49
49
retq
50
50
51
51
.data
Original file line number Diff line number Diff line change @@ -68,6 +68,7 @@ fma_gemm48:
68
68
dec %rcx
69
69
jnz loop_row
70
70
71
+ vzeroupper
71
72
pop %rbx
72
73
retq
73
74
Original file line number Diff line number Diff line change @@ -186,6 +186,7 @@ fma_gemm96:
186
186
dec %rcx
187
187
jnz loop_row
188
188
189
+ vzeroupper
189
190
pop %rbx
190
191
retq
191
192
Original file line number Diff line number Diff line change @@ -28,6 +28,7 @@ def gen_gemm48():
28
28
print (' dec %rcx' )
29
29
print (' jnz loop_row' )
30
30
31
+ print (' vzeroupper' )
31
32
print (' retq' )
32
33
33
34
print ('.data' )
@@ -69,6 +70,7 @@ def gen_gemm96():
69
70
print (' dec %rcx' )
70
71
print (' jnz loop_row' )
71
72
73
+ print (' vzeroupper' )
72
74
print (' retq' )
73
75
74
76
print ('.data' )
@@ -129,6 +131,7 @@ def gen_transform_cols(working_set):
129
131
130
132
if working_set != 'L1' :
131
133
print (' sfence' )
134
+ print (' vzeroupper' )
132
135
print (' pop %rbx' )
133
136
print (' retq' )
134
137
You can’t perform that action at this time.
0 commit comments