@@ -7656,7 +7656,7 @@ size_t ggml_quantize_chunk(
76567656 int64_t nrows ,
76577657 int64_t n_per_row ,
76587658 const float * imatrix ) {
7659- const int64_t n = ( int64_t ) nrows * n_per_row ;
7659+ const int64_t n = nrows * n_per_row ;
76607660
76617661 if (ggml_quantize_requires_imatrix (type )) {
76627662 GGML_ASSERT (imatrix != NULL );
@@ -7673,21 +7673,21 @@ size_t ggml_quantize_chunk(
76737673 size_t result = 0 ;
76747674
76757675 switch (type ) {
7676- case GGML_TYPE_Q1_0 : result = quantize_q1_0 (src + start , (char * ) dst + start_row * row_size , nrows , n_per_row , imatrix ); break ;
7677- case GGML_TYPE_Q4_0 : result = quantize_q4_0 (src + start , (char * ) dst + start_row * row_size , nrows , n_per_row , imatrix ); break ;
7678- case GGML_TYPE_Q4_1 : result = quantize_q4_1 (src + start , (char * ) dst + start_row * row_size , nrows , n_per_row , imatrix ); break ;
7679- case GGML_TYPE_Q5_0 : result = quantize_q5_0 (src + start , (char * ) dst + start_row * row_size , nrows , n_per_row , imatrix ); break ;
7680- case GGML_TYPE_Q5_1 : result = quantize_q5_1 (src + start , (char * ) dst + start_row * row_size , nrows , n_per_row , imatrix ); break ;
7681- case GGML_TYPE_Q8_0 : result = quantize_q8_0 (src + start , (char * ) dst + start_row * row_size , nrows , n_per_row , imatrix ); break ;
7682- case GGML_TYPE_MXFP4 : result = quantize_mxfp4 (src + start , (char * ) dst + start_row * row_size , nrows , n_per_row , imatrix ); break ;
7683- case GGML_TYPE_NVFP4 : result = quantize_nvfp4 (src + start , (char * ) dst + start_row * row_size , nrows , n_per_row , imatrix ); break ;
7684- case GGML_TYPE_Q2_K : result = quantize_q2_K (src + start , (char * ) dst + start_row * row_size , nrows , n_per_row , imatrix ); break ;
7685- case GGML_TYPE_Q3_K : result = quantize_q3_K (src + start , (char * ) dst + start_row * row_size , nrows , n_per_row , imatrix ); break ;
7686- case GGML_TYPE_Q4_K : result = quantize_q4_K (src + start , (char * ) dst + start_row * row_size , nrows , n_per_row , imatrix ); break ;
7687- case GGML_TYPE_Q5_K : result = quantize_q5_K (src + start , (char * ) dst + start_row * row_size , nrows , n_per_row , imatrix ); break ;
7688- case GGML_TYPE_Q6_K : result = quantize_q6_K (src + start , (char * ) dst + start_row * row_size , nrows , n_per_row , imatrix ); break ;
7689- case GGML_TYPE_TQ1_0 : result = quantize_tq1_0 (src + start , (char * ) dst + start_row * row_size , nrows , n_per_row , imatrix ); break ;
7690- case GGML_TYPE_TQ2_0 : result = quantize_tq2_0 (src + start , (char * ) dst + start_row * row_size , nrows , n_per_row , imatrix ); break ;
7676+ case GGML_TYPE_Q1_0 : result = quantize_q1_0 (src + start , (char * ) dst + start_row * row_size , nrows , n_per_row , imatrix ); break ;
7677+ case GGML_TYPE_Q4_0 : result = quantize_q4_0 (src + start , (char * ) dst + start_row * row_size , nrows , n_per_row , imatrix ); break ;
7678+ case GGML_TYPE_Q4_1 : result = quantize_q4_1 (src + start , (char * ) dst + start_row * row_size , nrows , n_per_row , imatrix ); break ;
7679+ case GGML_TYPE_Q5_0 : result = quantize_q5_0 (src + start , (char * ) dst + start_row * row_size , nrows , n_per_row , imatrix ); break ;
7680+ case GGML_TYPE_Q5_1 : result = quantize_q5_1 (src + start , (char * ) dst + start_row * row_size , nrows , n_per_row , imatrix ); break ;
7681+ case GGML_TYPE_Q8_0 : result = quantize_q8_0 (src + start , (char * ) dst + start_row * row_size , nrows , n_per_row , imatrix ); break ;
7682+ case GGML_TYPE_MXFP4 : result = quantize_mxfp4 (src + start , (char * ) dst + start_row * row_size , nrows , n_per_row , imatrix ); break ;
7683+ case GGML_TYPE_NVFP4 : result = quantize_nvfp4 (src + start , (char * ) dst + start_row * row_size , nrows , n_per_row , imatrix ); break ;
7684+ case GGML_TYPE_Q2_K : result = quantize_q2_K (src + start , (char * ) dst + start_row * row_size , nrows , n_per_row , imatrix ); break ;
7685+ case GGML_TYPE_Q3_K : result = quantize_q3_K (src + start , (char * ) dst + start_row * row_size , nrows , n_per_row , imatrix ); break ;
7686+ case GGML_TYPE_Q4_K : result = quantize_q4_K (src + start , (char * ) dst + start_row * row_size , nrows , n_per_row , imatrix ); break ;
7687+ case GGML_TYPE_Q5_K : result = quantize_q5_K (src + start , (char * ) dst + start_row * row_size , nrows , n_per_row , imatrix ); break ;
7688+ case GGML_TYPE_Q6_K : result = quantize_q6_K (src + start , (char * ) dst + start_row * row_size , nrows , n_per_row , imatrix ); break ;
7689+ case GGML_TYPE_TQ1_0 : result = quantize_tq1_0 (src + start , (char * ) dst + start_row * row_size , nrows , n_per_row , imatrix ); break ;
7690+ case GGML_TYPE_TQ2_0 : result = quantize_tq2_0 (src + start , (char * ) dst + start_row * row_size , nrows , n_per_row , imatrix ); break ;
76917691 case GGML_TYPE_IQ2_XXS : result = quantize_iq2_xxs (src + start , (char * ) dst + start_row * row_size , nrows , n_per_row , imatrix ); break ;
76927692 case GGML_TYPE_IQ2_XS : result = quantize_iq2_xs (src + start , (char * ) dst + start_row * row_size , nrows , n_per_row , imatrix ); break ;
76937693 case GGML_TYPE_IQ3_XXS : result = quantize_iq3_xxs (src + start , (char * ) dst + start_row * row_size , nrows , n_per_row , imatrix ); break ;
@@ -7752,9 +7752,9 @@ struct ggml_threadpool_params ggml_threadpool_params_default(int n_threads) {
77527752}
77537753
77547754bool ggml_threadpool_params_match (const struct ggml_threadpool_params * p0 , const struct ggml_threadpool_params * p1 ) {
7755- if (p0 -> n_threads != p1 -> n_threads ) return false;
7756- if (p0 -> prio != p1 -> prio ) return false;
7757- if (p0 -> poll != p1 -> poll ) return false;
7758- if (p0 -> strict_cpu != p1 -> strict_cpu ) return false;
7755+ if (p0 -> n_threads != p1 -> n_threads ) return false;
7756+ if (p0 -> prio != p1 -> prio ) return false;
7757+ if (p0 -> poll != p1 -> poll ) return false;
7758+ if (p0 -> strict_cpu != p1 -> strict_cpu ) return false;
77597759 return memcmp (p0 -> cpumask , p1 -> cpumask , GGML_MAX_N_THREADS ) == 0 ;
77607760}
0 commit comments