Skip to content

Instantly share code, notes, and snippets.

@tanakamura
Created February 1, 2017 23:29
Show Gist options
  • Select an option

  • Save tanakamura/984bc948056369b0c3f4330578e53bc9 to your computer and use it in GitHub Desktop.

Select an option

Save tanakamura/984bc948056369b0c3f4330578e53bc9 to your computer and use it in GitHub Desktop.
.text
.globl run_4fmaps
//-----------------------------------------------------------------------
// extern void run_4fmaps(
//     float dst[16],          // rdi
//     const float src0[64],   // rsi
//     const float src1[4]);   // rdx
//
// Computes, for i = 0..15:
//     dst[i] += src0[16*0 + i] * src1[0]
//             + src0[16*1 + i] * src1[1]
//             + src0[16*2 + i] * src1[2]
//             + src0[16*3 + i] * src1[3]
// using a single AVX512_4FMAPS v4fmaddps instruction.
//
// Syntax: GNU as, AT&T operand order (sources first, destination last).
// ABI:    System V AMD64 (arguments in rdi, rsi, rdx).
// Out:    dst[0..15] updated in place; no return value.
// Clobb:  zmm0-zmm3, zmm8.
// Align:  none required (all vector accesses use vmovups).
//-----------------------------------------------------------------------
run_4fmaps:
// zmm8 = accumulator, seeded with the current contents of dst.
        vmovups (%rdi), %zmm8

// zmm0..zmm3 = the four 16-float rows of src0. v4fmaddps reads its
// vector source as a block of four consecutive registers whose first
// register number is a multiple of four, so the rows must sit in
// zmm0, zmm1, zmm2, zmm3 in this order.
        vmovups 64*0(%rsi), %zmm0
        vmovups 64*1(%rsi), %zmm1
        vmovups 64*2(%rsi), %zmm2
        vmovups 64*3(%rsi), %zmm3

// AT&T order is: m128 scalars, first register of the source block,
// accumulator. The accumulator (zmm8) must therefore be the LAST
// operand; with zmm8 and zmm0 swapped the result would land in zmm0 and
// the store below would write dst back unmodified.
        v4fmaddps (%rdx), %zmm0, %zmm8

// Write the accumulated result back to dst.
        vmovups %zmm8, (%rdi)
        ret
Sign up for free to join this conversation on GitHub. Already have an account? Sign in to comment