@@ -397,6 +397,7 @@ static results_perplexity perplexity(llama_context * ctx, const gpt_params & par
397
397
}
398
398
);
399
399
const size_t num_prune = std::min (pass_results.size (), prune_target);
400
+ if (num_prune > 0 ) printf (" \n Pruning: " );
400
401
for (size_t temp = 0 , pruned = 0 ; temp < pass_results.size (); temp++) {
401
402
int32_t lidx = std::get<0 >(pass_results[temp]);
402
403
if (anti_mode) {
@@ -405,17 +406,17 @@ static results_perplexity perplexity(llama_context * ctx, const gpt_params & par
405
406
}
406
407
if (lidx == curr_best_layer && std::get<1 >(pass_results[temp]) == curr_best_type) continue ;
407
408
extremes[lidx] |= std::get<1 >(pass_results[temp]);
408
- printf (" \n Prune [%zu] : %d (%d) - %.2f\n " , pruned + 1 , lidx,
409
+ printf (" [%zu: %d (%d) - %.2f], " , pruned + 1 , lidx,
409
410
std::get<1 >(pass_results[temp]), std::get<2 >(pass_results[temp]));
410
411
if (++pruned >= num_prune) break ;
411
412
}
412
413
}
413
414
pass_results.clear ();
414
- printf (" \n\n ADD %c%3d - ppl vs ref %.4f" ,
415
+ printf (" \n\n ADD %c%3d - ppl vs ref %.4f - cur:[ " ,
415
416
int (label[curr_best_type]), curr_best_layer,
416
417
curr_best_ppl - ref_ppl);
417
418
if (!anti_mode) {
418
- if (curr_best_ppl > ref_ppl * 1.75 ) break ;
419
+ // if (curr_best_ppl > ref_ppl * 1.75) break;
419
420
skip_types[curr_best_layer] += curr_best_type;
420
421
skips.push_back (curr_best_type == 1 ? curr_best_layer : curr_best_layer + n_layers);
421
422
}
@@ -426,6 +427,10 @@ static results_perplexity perplexity(llama_context * ctx, const gpt_params & par
426
427
for (int32_t new_sl = 0 ; new_sl < n_layers; new_sl++) {
427
428
skip_types[new_sl] = (skip_types[new_sl] & 3 ) | (extremes[new_sl] << 2 );
428
429
}
430
+ for (int32_t i = 0 ; i < n_layers; i++) {
431
+ const int val = mask ^ (skip_types[i] & 3 );
432
+ printf (" %d%s" , val, i < n_layers - 1 ? " , " : " ]" );
433
+ }
429
434
for (int32_t new_sl = 0 ; new_sl < n_layers; new_sl++) {
430
435
int32_t curr_skipped = (skip_types[new_sl] >> 2 ) | (skip_types[new_sl] & 3 );
431
436
// printf("||%d, %d\n", new_sl, curr_skipped);
0 commit comments