commit | b1ef5eee90d8748d5273fa3e6bb618dd4f925135 | [log] [tgz] |
---|---|---|
author | Eric Biggers <ebiggers@google.com> | Mon Mar 10 10:27:59 2025 -0700 |
committer | Boringssl LUCI CQ <boringssl-scoped@luci-project-accounts.iam.gserviceaccount.com> | Mon Mar 10 15:08:12 2025 -0700 |
tree | ee02f0a56674c59842bfc37299d25b73e19baeb0 | |
parent | c2f05fa29436cb346d36d166d99fe9aa859b60b0 [diff] |
Fix missing vzeroupper in poly_Rq_mul()

poly_Rq_mul() uses ymm registers, so vzeroupper needs to be executed before it returns in order to avoid slowing down subsequent SSE code.

Change-Id: Id85e4ede05c612e0edf4c92a298531dd4c358bf4
Reviewed-on: https://boringssl-review.googlesource.com/c/boringssl/+/77229
Reviewed-by: David Benjamin <davidben@google.com>
Commit-Queue: David Benjamin <davidben@google.com>

```diff
diff --git a/crypto/hrss/asm/poly_rq_mul.S b/crypto/hrss/asm/poly_rq_mul.S
index 2b99d0e..abbc4e3 100644
--- a/crypto/hrss/asm/poly_rq_mul.S
+++ b/crypto/hrss/asm/poly_rq_mul.S
@@ -8475,6 +8475,7 @@
 vpaddw 2752(%r8), %ymm11, %ymm11
 vpand mask_mod8192(%rip), %ymm11, %ymm11
 vmovdqu %ymm11, 1320(%rdi)
+vzeroupper
 pop %r12
 .cfi_restore r12
 pop %rbp
```