From d1c9b0393727e51fedc21d845db69f7c1dd84cd0 Mon Sep 17 00:00:00 2001 From: kaiburjack Date: Mon, 15 Aug 2022 20:07:20 +0200 Subject: [PATCH] Zero ymm2 with vpxor xmm2 using AVX's implicit zeroing of upper register parts https://stackoverflow.com/questions/44578967/what-is-the-most-efficient-way-to-clear-a-single-or-a-few-zmm-registers-on-knigh#answer-44841054 --- sse_amd64.s | 2 +- 1 file changed, 1 insertion(+), 1 deletion(-) diff --git a/sse_amd64.s b/sse_amd64.s index 8016696..f7223fd 100644 --- a/sse_amd64.s +++ b/sse_amd64.s @@ -48,7 +48,7 @@ TEXT ·onlySpaces32(SB),NOSPLIT, $0 VMOVDQU (DI), Y0 VMOVDQA Y0, Y1 VPCMPGTB ·spc<>(SB), Y0, Y0 - VPXOR Y2, Y2, Y2 + VPXOR X2, X2, X2 VPCMPGTB Y1, Y2, Y2 VPOR Y2, Y0, Y0 VPMOVMSKB Y0, AX