@@ -1927,27 +1927,6 @@ exec_config_t determine_thread_config(int prob_m, int prob_n, int prob_k,
19271927 __CALL_IF(NUM_BITS, 4 , N_BLOCKS, K_BLOCKS, false , false , 4 , NUM_THREADS) \
19281928 __CALL_IF(NUM_BITS, 4 , N_BLOCKS, K_BLOCKS, false , false , 8 , NUM_THREADS)
19291929
1930- #define AWQ_CALL_IF (NUM_BITS, N_BLOCKS, K_BLOCKS, NUM_THREADS) \
1931- __CALL_IF(NUM_BITS, 1 , N_BLOCKS, K_BLOCKS, false , true , -1 , NUM_THREADS) \
1932- __CALL_IF(NUM_BITS, 1 , N_BLOCKS, K_BLOCKS, false , true , 2 , NUM_THREADS) \
1933- __CALL_IF(NUM_BITS, 1 , N_BLOCKS, K_BLOCKS, false , true , 4 , NUM_THREADS) \
1934- __CALL_IF(NUM_BITS, 1 , N_BLOCKS, K_BLOCKS, false , true , 8 , NUM_THREADS) \
1935- \
1936- __CALL_IF(NUM_BITS, 2 , N_BLOCKS, K_BLOCKS, false , true , -1 , NUM_THREADS) \
1937- __CALL_IF(NUM_BITS, 2 , N_BLOCKS, K_BLOCKS, false , true , 2 , NUM_THREADS) \
1938- __CALL_IF(NUM_BITS, 2 , N_BLOCKS, K_BLOCKS, false , true , 4 , NUM_THREADS) \
1939- __CALL_IF(NUM_BITS, 2 , N_BLOCKS, K_BLOCKS, false , true , 8 , NUM_THREADS) \
1940- \
1941- __CALL_IF(NUM_BITS, 3 , N_BLOCKS, K_BLOCKS, false , true , -1 , NUM_THREADS) \
1942- __CALL_IF(NUM_BITS, 3 , N_BLOCKS, K_BLOCKS, false , true , 2 , NUM_THREADS) \
1943- __CALL_IF(NUM_BITS, 3 , N_BLOCKS, K_BLOCKS, false , true , 4 , NUM_THREADS) \
1944- __CALL_IF(NUM_BITS, 3 , N_BLOCKS, K_BLOCKS, false , true , 8 , NUM_THREADS) \
1945- \
1946- __CALL_IF(NUM_BITS, 4 , N_BLOCKS, K_BLOCKS, false , true , -1 , NUM_THREADS) \
1947- __CALL_IF(NUM_BITS, 4 , N_BLOCKS, K_BLOCKS, false , true , 2 , NUM_THREADS) \
1948- __CALL_IF(NUM_BITS, 4 , N_BLOCKS, K_BLOCKS, false , true , 4 , NUM_THREADS) \
1949- __CALL_IF(NUM_BITS, 4 , N_BLOCKS, K_BLOCKS, false , true , 8 , NUM_THREADS)
1950-
19511930template <typename scalar_t>
19521931void marlin_mm_f16i4(const void * A, const void * B, void * C, void * C_tmp,
19531932 void * s, void * zp, void * g_idx, void * perm, void * a_tmp,
@@ -2089,14 +2068,6 @@ void marlin_mm_f16i4(const void* A, const void* B, void* C, void* C_tmp,
20892068 GPTQ_CALL_IF (8 , 8 , 4 , 128 )
20902069 GPTQ_CALL_IF (8 , 4 , 8 , 128 )
20912070
2092- AWQ_CALL_IF (4 , 16 , 4 , 256 )
2093- AWQ_CALL_IF (4 , 8 , 8 , 256 )
2094- AWQ_CALL_IF (4 , 8 , 4 , 128 )
2095- AWQ_CALL_IF (4 , 4 , 8 , 128 )
2096- AWQ_CALL_IF (8 , 16 , 4 , 256 )
2097- AWQ_CALL_IF (8 , 8 , 8 , 256 )
2098- AWQ_CALL_IF (8 , 8 , 4 , 128 )
2099- AWQ_CALL_IF (8 , 4 , 8 , 128 )
21002071 else {
21012072 TORCH_CHECK (false , " Unsupported shapes: MNK = [" , prob_m, " , " , prob_n,
21022073 " , " , prob_k, " ]" , " , has_act_order = " , has_act_order,
0 commit comments