narySt committed on
Commit
6b2577f
·
verified ·
1 Parent(s): c17eac7

Upload folder using huggingface_hub

Browse files
fixed_eval_results/hnet_fixed_length_results/eval_config.yaml ADDED
@@ -0,0 +1,29 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ model:
2
+ config_path: /workspace/byte-llms-code/hnet_project/configs/hnet_2stage_XL_code.json
3
+ checkpoint_path: /workspace/byte-llms-code/hnet_project/checkpoints/hnet_2stage_XL_code.pt
4
+ data:
5
+ path: /workspace/byte-llms-code/code_completion_exp/datasets/data_V4_full
6
+ max_context_len: 4096
7
+ max_target_len: 256
8
+ num_workers: 0
9
+ pin_memory: true
10
+ max_train_samples: null
11
+ max_val_samples: null
12
+ paths:
13
+ checkpoints_dir: /workspace/byte-llms-code/code_completion_exp/hnet-ckpts
14
+ initial_checkpoint: null
15
+ output_dir: /workspace/byte-llms-code/code_completion_exp/hnet-ckpts/eval_results
16
+ evaluation:
17
+ batch_size: 16
18
+ max_samples: null
19
+ compute_bpb: true
20
+ bleu_tokenize: none
21
+ use_amp: true
22
+ save_predictions: true
23
+ generation:
24
+ max_length: 512
25
+ temperature: 0.1
26
+ top_k: 0
27
+ top_p: 1.0
28
+ seed: 42
29
+ device: cuda
fixed_eval_results/hnet_fixed_length_results/metrics_03-22-final.txt ADDED
@@ -0,0 +1,17 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ Checkpoint: 03-22-final.pt
2
+ ================================================================================
3
+
4
+ exact_match: 0.37318365718844376
5
+ token_accuracy: 0.482588638384026
6
+ bleu: 20.854804726838726
7
+ bpb: 1.349107179428066
8
+ num_samples: 35098
9
+ gen_wall_time_s: 2863.6849117436213
10
+ gen_samples_per_s: 12.25623666069804
11
+ gen_time_per_sample_ms: 81.59111378835323
12
+ gen_chars_per_s: 360.7617569109473
13
+ gen_batch_mean_ms: 2610.469381717066
14
+ gen_batch_p50_ms: 1890.1621060213074
15
+ gen_batch_p95_ms: 9530.616011167876
16
+ gen_batch_max_ms: 22047.994011896662
17
+ gen_num_batches: 1097
fixed_eval_results/hnet_fixed_length_results/predictions_03-22-final.txt ADDED
The diff for this file is too large to render. See raw diff
 
fixed_eval_results/hnet_fixed_length_results/summary.txt ADDED
@@ -0,0 +1,6 @@
 
 
 
 
 
 
 
1
+ EVALUATION SUMMARY
2
+ ==================================================================================================
3
+
4
+ Checkpoint Exact Match Token Acc BLEU BPB ms/sample samp/s
5
+ --------------------------------------------------------------------------------------------------
6
+ 03-22-final 37.32% 48.26% 20.85 1.35 81.6 12.26
fixed_eval_results/pythia_14b_fixed_results/eval_config.yaml ADDED
@@ -0,0 +1,29 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ data:
2
+ path: /workspace/byte-llms-code/code_completion_exp/datasets/data_V4_full
3
+ max_context_len: 4096
4
+ max_target_len: 256
5
+ num_workers: 4
6
+ pin_memory: true
7
+ model:
8
+ name: EleutherAI/pythia-1.4b
9
+ checkpoint_path: null
10
+ from_scratch: false
11
+ paths:
12
+ checkpoints_dir: /workspace/byte-llms-code/code_completion_exp/pythia_1_4b_rerun/pythia_1_4b_lr_2e-5
13
+ initial_checkpoint: null
14
+ output_dir: /workspace/byte-llms-code/code_completion_exp/pythia_1_4b_rerun/pythia_1_4b_lr_2e-5/eval_results
15
+ evaluation:
16
+ batch_size: 16
17
+ max_samples: null
18
+ compute_perplexity: true
19
+ bleu_tokenize: none
20
+ save_predictions: true
21
+ use_amp: true
22
+ generation:
23
+ max_new_tokens: 256
24
+ temperature: 0.1
25
+ top_k: 0
26
+ top_p: 1.0
27
+ do_sample: true
28
+ seed: 42
29
+ device: cuda
fixed_eval_results/pythia_14b_fixed_results/metrics_model_final.txt ADDED
@@ -0,0 +1,17 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ Checkpoint: model_final.pt
2
+ ================================================================================
3
+
4
+ exact_match: 0.34876631147073905
5
+ token_accuracy: 0.363837459168535
6
+ bleu: 19.70712343277282
7
+ perplexity: 319.0512224116374
8
+ num_samples: 35098
9
+ gen_wall_time_s: 893.0648033486214
10
+ gen_samples_per_s: 39.3006194717305
11
+ gen_time_per_sample_ms: 25.444891542213842
12
+ gen_chars_per_s: 1033.2542459853112
13
+ gen_batch_mean_ms: 797.1702183922795
14
+ gen_batch_p50_ms: 605.6874099886045
15
+ gen_batch_p95_ms: 1458.250489202328
16
+ gen_batch_max_ms: 20027.544419048354
17
+ gen_num_batches: 1097
fixed_eval_results/pythia_14b_fixed_results/predictions_model_final.txt ADDED
The diff for this file is too large to render. See raw diff
 
fixed_eval_results/pythia_14b_fixed_results/summary.txt ADDED
@@ -0,0 +1,6 @@
 
 
 
 
 
 
 
1
+ EVALUATION SUMMARY
2
+ ==================================================================================================
3
+
4
+ Checkpoint Exact Match Token Acc BLEU PERPLEXITY ms/sample samp/s
5
+ --------------------------------------------------------------------------------------------------
6
+ model_final 34.88% 36.38% 19.71 319.05 25.4 39.30