Skip to content

Commit

Permalink
implement qs8 x8c4 pack using avxvnni
Browse files Browse the repository at this point in the history
  • Loading branch information
kylo5aby committed Nov 22, 2024
1 parent 7798ad0 commit de0567c
Show file tree
Hide file tree
Showing 7 changed files with 1,076 additions and 0 deletions.
2 changes: 2 additions & 0 deletions cmake/gen/avxvnni_microkernels.cmake
Original file line number Diff line number Diff line change
Expand Up @@ -132,6 +132,8 @@ SET(NON_PROD_AVXVNNI_MICROKERNEL_SRCS
src/qd8-f32-qc8w-igemm/gen/qd8-f32-qc8w-igemm-7x8c8-minmax-avxvnni.c
src/qd8-f32-qc8w-igemm/gen/qd8-f32-qc8w-igemm-8x8c8-minmax-avxvnni-prfm.c
src/qd8-f32-qc8w-igemm/gen/qd8-f32-qc8w-igemm-8x8c8-minmax-avxvnni.c
src/qs8-packw/gen/qs8-packw-x8c4-gemm-goi-avxvnni-prfm.c
src/qs8-packw/gen/qs8-packw-x8c4-gemm-goi-avxvnni.c
src/qs8-packw/gen/qs8-packw-x16c8-gemm-goi-avxvnni-prfm.c
src/qs8-packw/gen/qs8-packw-x16c8-gemm-goi-avxvnni.c
src/qs8-qc8w-gemm/gen/qs8-qc8w-gemm-1x8c8-minmax-fp32-avxvnni.c
Expand Down
2 changes: 2 additions & 0 deletions gen/avxvnni_microkernels.bzl
Original file line number Diff line number Diff line change
Expand Up @@ -129,6 +129,8 @@ NON_PROD_AVXVNNI_MICROKERNEL_SRCS = [
"src/qd8-f32-qc8w-igemm/gen/qd8-f32-qc8w-igemm-7x8c8-minmax-avxvnni.c",
"src/qd8-f32-qc8w-igemm/gen/qd8-f32-qc8w-igemm-8x8c8-minmax-avxvnni-prfm.c",
"src/qd8-f32-qc8w-igemm/gen/qd8-f32-qc8w-igemm-8x8c8-minmax-avxvnni.c",
"src/qs8-packw/gen/qs8-packw-x8c4-gemm-goi-avxvnni-prfm.c",
"src/qs8-packw/gen/qs8-packw-x8c4-gemm-goi-avxvnni.c",
"src/qs8-packw/gen/qs8-packw-x16c8-gemm-goi-avxvnni-prfm.c",
"src/qs8-packw/gen/qs8-packw-x16c8-gemm-goi-avxvnni.c",
"src/qs8-qc8w-gemm/gen/qs8-qc8w-gemm-1x8c8-minmax-fp32-avxvnni.c",
Expand Down
2 changes: 2 additions & 0 deletions scripts/generate-x8-packw.sh
Original file line number Diff line number Diff line change
Expand Up @@ -33,6 +33,8 @@ tools/xngen src/x8-packw/kr-scalar.c.in -D NR=16 -D KR=8 -D TYPE=int8_t -D IZP=1

### AVXVNNI micro-kernels
### C4 and C8 packing
tools/xngen src/x8-packw/kr-c4-avxvnni.c.in -D NR=8 -D KR=4 -D DATATYPE=QS8 -D TYPE=int8_t -D IZP=0 -D AVX=2 -D PREFETCH=0 -o src/qs8-packw/gen/qs8-packw-x8c4-gemm-goi-avxvnni.c &
tools/xngen src/x8-packw/kr-c4-avxvnni.c.in -D NR=8 -D KR=4 -D DATATYPE=QS8 -D TYPE=int8_t -D IZP=0 -D AVX=2 -D PREFETCH=1 -o src/qs8-packw/gen/qs8-packw-x8c4-gemm-goi-avxvnni-prfm.c &
tools/xngen src/x8-packw/kr-avxvnni.c.in -D NR=8 -D KR=8 -D DATATYPE=QS8 -D TYPE=int8_t -D IZP=0 -D AVX=2 -D PREFETCH=0 -o src/qs8-packw/gen/qs8-packw-x8c8-gemm-goi-avxvnni.c &
tools/xngen src/x8-packw/kr-avxvnni.c.in -D NR=8 -D KR=8 -D DATATYPE=QS8 -D TYPE=int8_t -D IZP=0 -D AVX=2 -D PREFETCH=1 -o src/qs8-packw/gen/qs8-packw-x8c8-gemm-goi-avxvnni-prfm.c &
tools/xngen src/x8-packw/kr-avxvnni.c.in -D NR=8 -D KR=8 -D DATATYPE=QS8 -D TYPE=int8_t -D IZP=128 -D AVX=2 -D PREFETCH=0 -o src/qs8-qu8-packw/gen/qs8-qu8-packw-x8c8-gemm-goi-avxvnni.c &
Expand Down
Loading

0 comments on commit de0567c

Please sign in to comment.