@@ -28,12 +28,21 @@ ifneq ($(filter arm% aarch%,$(UNAME_M)),)
2828 src/quant/tq1_neon_sdot.c src/quant/tq1_neon.c src/quant/tq1_scalar.c \
2929 src/quant/q8_neon.c src/quant/q8_scalar.c \
3030 src/quant/q4_neon_sdot.c src/quant/q4_neon.c src/quant/q4_scalar.c \
31+ src/quant/q4_1_neon.c src/quant/q4_1_scalar.c \
32+ src/quant/bf16_neon.c src/quant/bf16_scalar.c \
3133 src/quant/q6k_neon.c src/quant/q6k_scalar.c \
3234 src/quant/q8k_neon.c src/quant/q8k_scalar.c \
3335 src/quant/q4k_neon.c src/quant/q4k_scalar.c \
3436 src/quant/q5k_neon.c src/quant/q5k_scalar.c \
3537 src/quant/q3k_neon.c src/quant/q3k_scalar.c \
36- src/quant/q2k_neon.c src/quant/q2k_scalar.c
38+ src/quant/q2k_neon.c src/quant/q2k_scalar.c \
39+ src/quant/iq4nl_neon.c src/quant/iq4nl_scalar.c \
40+ src/quant/iq4xs_neon.c src/quant/iq4xs_scalar.c \
41+ src/quant/iq3xxs_neon.c src/quant/iq3xxs_scalar.c \
42+ src/quant/iq3s_neon.c src/quant/iq3s_scalar.c \
43+ src/quant/iq2xxs_neon.c src/quant/iq2xxs_scalar.c \
44+ src/quant/iq2xs_neon.c src/quant/iq2xs_scalar.c \
45+ src/quant/iq2s_neon.c src/quant/iq2s_scalar.c
3746
3847 TRANSFORMER_BACKEND = src/transformer/rmsnorm_neon.c src/transformer/rmsnorm_scalar.c \
3948 src/transformer/gqa_neon.c src/transformer/gqa_scalar.c \
4554 src/quant/tq2_scalar.c src/quant/tq1_scalar.c \
4655 src/quant/q8_avx2.c src/quant/q8_scalar.c \
4756 src/quant/q4_avx2.c src/quant/q4_scalar.c \
57+ src/quant/q4_1_avx2.c src/quant/q4_1_scalar.c \
58+ src/quant/bf16_avx2.c src/quant/bf16_scalar.c \
4859 src/quant/q6k_avx2.c src/quant/q6k_scalar.c \
4960 src/quant/q8k_avx2.c src/quant/q8k_scalar.c \
5061 src/quant/q4k_avx2.c src/quant/q4k_scalar.c \
5162 src/quant/q5k_avx2.c src/quant/q5k_scalar.c \
5263 src/quant/q3k_avx2.c src/quant/q3k_scalar.c \
53- src/quant/q2k_avx2.c src/quant/q2k_scalar.c
64+ src/quant/q2k_avx2.c src/quant/q2k_scalar.c \
65+ src/quant/iq4nl_avx2.c src/quant/iq4nl_scalar.c \
66+ src/quant/iq4xs_avx2.c src/quant/iq4xs_scalar.c \
67+ src/quant/iq3xxs_avx2.c src/quant/iq3xxs_scalar.c \
68+ src/quant/iq3s_avx2.c src/quant/iq3s_scalar.c \
69+ src/quant/iq2xxs_avx2.c src/quant/iq2xxs_scalar.c \
70+ src/quant/iq2xs_avx2.c src/quant/iq2xs_scalar.c \
71+ src/quant/iq2s_avx2.c src/quant/iq2s_scalar.c
5472
5573 TRANSFORMER_BACKEND = src/transformer/rmsnorm_avx2.c src/transformer/rmsnorm_scalar.c \
5674 src/transformer/gqa_avx2.c src/transformer/gqa_scalar.c \
@@ -158,12 +176,21 @@ AVX2_QUANT_SRCS = $(QUANT_COMMON) \
158176 src/quant/tq2_scalar.c src/quant/tq1_scalar.c \
159177 src/quant/q8_avx2.c src/quant/q8_scalar.c \
160178 src/quant/q4_avx2.c src/quant/q4_scalar.c \
179+ src/quant/q4_1_avx2.c src/quant/q4_1_scalar.c \
180+ src/quant/bf16_avx2.c src/quant/bf16_scalar.c \
161181 src/quant/q6k_avx2.c src/quant/q6k_scalar.c \
162182 src/quant/q8k_avx2.c src/quant/q8k_scalar.c \
163183 src/quant/q4k_avx2.c src/quant/q4k_scalar.c \
164184 src/quant/q5k_avx2.c src/quant/q5k_scalar.c \
165185 src/quant/q3k_avx2.c src/quant/q3k_scalar.c \
166- src/quant/q2k_avx2.c src/quant/q2k_scalar.c
186+ src/quant/q2k_avx2.c src/quant/q2k_scalar.c \
187+ src/quant/iq4nl_avx2.c src/quant/iq4nl_scalar.c \
188+ src/quant/iq4xs_avx2.c src/quant/iq4xs_scalar.c \
189+ src/quant/iq3xxs_avx2.c src/quant/iq3xxs_scalar.c \
190+ src/quant/iq3s_avx2.c src/quant/iq3s_scalar.c \
191+ src/quant/iq2xxs_avx2.c src/quant/iq2xxs_scalar.c \
192+ src/quant/iq2xs_avx2.c src/quant/iq2xs_scalar.c \
193+ src/quant/iq2s_avx2.c src/quant/iq2s_scalar.c
167194
168195AVX2_TRANSFORMER_BACKEND = src/transformer/rmsnorm_avx2.c src/transformer/rmsnorm_scalar.c \
169196 src/transformer/gqa_avx2.c src/transformer/gqa_scalar.c \
0 commit comments