Upload folder using huggingface_hub
Browse files- fixed_eval_results/hnet_fixed_length_results/eval_config.yaml +29 -0
- fixed_eval_results/hnet_fixed_length_results/metrics_03-22-final.txt +17 -0
- fixed_eval_results/hnet_fixed_length_results/predictions_03-22-final.txt +0 -0
- fixed_eval_results/hnet_fixed_length_results/summary.txt +6 -0
- fixed_eval_results/pythia_14b_fixed_results/eval_config.yaml +29 -0
- fixed_eval_results/pythia_14b_fixed_results/metrics_model_final.txt +17 -0
- fixed_eval_results/pythia_14b_fixed_results/predictions_model_final.txt +0 -0
- fixed_eval_results/pythia_14b_fixed_results/summary.txt +6 -0
fixed_eval_results/hnet_fixed_length_results/eval_config.yaml
ADDED
|
@@ -0,0 +1,29 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
model:
|
| 2 |
+
config_path: /workspace/byte-llms-code/hnet_project/configs/hnet_2stage_XL_code.json
|
| 3 |
+
checkpoint_path: /workspace/byte-llms-code/hnet_project/checkpoints/hnet_2stage_XL_code.pt
|
| 4 |
+
data:
|
| 5 |
+
path: /workspace/byte-llms-code/code_completion_exp/datasets/data_V4_full
|
| 6 |
+
max_context_len: 4096
|
| 7 |
+
max_target_len: 256
|
| 8 |
+
num_workers: 0
|
| 9 |
+
pin_memory: true
|
| 10 |
+
max_train_samples: null
|
| 11 |
+
max_val_samples: null
|
| 12 |
+
paths:
|
| 13 |
+
checkpoints_dir: /workspace/byte-llms-code/code_completion_exp/hnet-ckpts
|
| 14 |
+
initial_checkpoint: null
|
| 15 |
+
output_dir: /workspace/byte-llms-code/code_completion_exp/hnet-ckpts/eval_results
|
| 16 |
+
evaluation:
|
| 17 |
+
batch_size: 16
|
| 18 |
+
max_samples: null
|
| 19 |
+
compute_bpb: true
|
| 20 |
+
bleu_tokenize: none
|
| 21 |
+
use_amp: true
|
| 22 |
+
save_predictions: true
|
| 23 |
+
generation:
|
| 24 |
+
max_length: 512
|
| 25 |
+
temperature: 0.1
|
| 26 |
+
top_k: 0
|
| 27 |
+
top_p: 1.0
|
| 28 |
+
seed: 42
|
| 29 |
+
device: cuda
|
fixed_eval_results/hnet_fixed_length_results/metrics_03-22-final.txt
ADDED
|
@@ -0,0 +1,17 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
Checkpoint: 03-22-final.pt
|
| 2 |
+
================================================================================
|
| 3 |
+
|
| 4 |
+
exact_match: 0.37318365718844376
|
| 5 |
+
token_accuracy: 0.482588638384026
|
| 6 |
+
bleu: 20.854804726838726
|
| 7 |
+
bpb: 1.349107179428066
|
| 8 |
+
num_samples: 35098
|
| 9 |
+
gen_wall_time_s: 2863.6849117436213
|
| 10 |
+
gen_samples_per_s: 12.25623666069804
|
| 11 |
+
gen_time_per_sample_ms: 81.59111378835323
|
| 12 |
+
gen_chars_per_s: 360.7617569109473
|
| 13 |
+
gen_batch_mean_ms: 2610.469381717066
|
| 14 |
+
gen_batch_p50_ms: 1890.1621060213074
|
| 15 |
+
gen_batch_p95_ms: 9530.616011167876
|
| 16 |
+
gen_batch_max_ms: 22047.994011896662
|
| 17 |
+
gen_num_batches: 1097
|
fixed_eval_results/hnet_fixed_length_results/predictions_03-22-final.txt
ADDED
|
The diff for this file is too large to render.
See raw diff
|
|
|
fixed_eval_results/hnet_fixed_length_results/summary.txt
ADDED
|
@@ -0,0 +1,6 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
EVALUATION SUMMARY
|
| 2 |
+
==================================================================================================
|
| 3 |
+
|
| 4 |
+
Checkpoint Exact Match Token Acc BLEU BPB ms/sample samp/s
|
| 5 |
+
--------------------------------------------------------------------------------------------------
|
| 6 |
+
03-22-final 37.32% 48.26% 20.85 1.35 81.6 12.26
|
fixed_eval_results/pythia_14b_fixed_results/eval_config.yaml
ADDED
|
@@ -0,0 +1,29 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
data:
|
| 2 |
+
path: /workspace/byte-llms-code/code_completion_exp/datasets/data_V4_full
|
| 3 |
+
max_context_len: 4096
|
| 4 |
+
max_target_len: 256
|
| 5 |
+
num_workers: 4
|
| 6 |
+
pin_memory: true
|
| 7 |
+
model:
|
| 8 |
+
name: EleutherAI/pythia-1.4b
|
| 9 |
+
checkpoint_path: null
|
| 10 |
+
from_scratch: false
|
| 11 |
+
paths:
|
| 12 |
+
checkpoints_dir: /workspace/byte-llms-code/code_completion_exp/pythia_1_4b_rerun/pythia_1_4b_lr_2e-5
|
| 13 |
+
initial_checkpoint: null
|
| 14 |
+
output_dir: /workspace/byte-llms-code/code_completion_exp/pythia_1_4b_rerun/pythia_1_4b_lr_2e-5/eval_results
|
| 15 |
+
evaluation:
|
| 16 |
+
batch_size: 16
|
| 17 |
+
max_samples: null
|
| 18 |
+
compute_perplexity: true
|
| 19 |
+
bleu_tokenize: none
|
| 20 |
+
save_predictions: true
|
| 21 |
+
use_amp: true
|
| 22 |
+
generation:
|
| 23 |
+
max_new_tokens: 256
|
| 24 |
+
temperature: 0.1
|
| 25 |
+
top_k: 0
|
| 26 |
+
top_p: 1.0
|
| 27 |
+
do_sample: true
|
| 28 |
+
seed: 42
|
| 29 |
+
device: cuda
|
fixed_eval_results/pythia_14b_fixed_results/metrics_model_final.txt
ADDED
|
@@ -0,0 +1,17 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
Checkpoint: model_final.pt
|
| 2 |
+
================================================================================
|
| 3 |
+
|
| 4 |
+
exact_match: 0.34876631147073905
|
| 5 |
+
token_accuracy: 0.363837459168535
|
| 6 |
+
bleu: 19.70712343277282
|
| 7 |
+
perplexity: 319.0512224116374
|
| 8 |
+
num_samples: 35098
|
| 9 |
+
gen_wall_time_s: 893.0648033486214
|
| 10 |
+
gen_samples_per_s: 39.3006194717305
|
| 11 |
+
gen_time_per_sample_ms: 25.444891542213842
|
| 12 |
+
gen_chars_per_s: 1033.2542459853112
|
| 13 |
+
gen_batch_mean_ms: 797.1702183922795
|
| 14 |
+
gen_batch_p50_ms: 605.6874099886045
|
| 15 |
+
gen_batch_p95_ms: 1458.250489202328
|
| 16 |
+
gen_batch_max_ms: 20027.544419048354
|
| 17 |
+
gen_num_batches: 1097
|
fixed_eval_results/pythia_14b_fixed_results/predictions_model_final.txt
ADDED
|
The diff for this file is too large to render.
See raw diff
|
|
|
fixed_eval_results/pythia_14b_fixed_results/summary.txt
ADDED
|
@@ -0,0 +1,6 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
EVALUATION SUMMARY
|
| 2 |
+
==================================================================================================
|
| 3 |
+
|
| 4 |
+
Checkpoint Exact Match Token Acc BLEU PERPLEXITY ms/sample samp/s
|
| 5 |
+
--------------------------------------------------------------------------------------------------
|
| 6 |
+
model_final 34.88% 36.38% 19.71 319.05 25.4 39.30
|