Upload folder using huggingface_hub

Files changed (8) hide show

fixed_eval_results/hnet_fixed_length_results/eval_config.yaml ADDED Viewed

+model:
+  config_path: /workspace/byte-llms-code/hnet_project/configs/hnet_2stage_XL_code.json
+  checkpoint_path: /workspace/byte-llms-code/hnet_project/checkpoints/hnet_2stage_XL_code.pt
+data:
+  path: /workspace/byte-llms-code/code_completion_exp/datasets/data_V4_full
+  max_context_len: 4096
+  max_target_len: 256
+  num_workers: 0
+  pin_memory: true
+  max_train_samples: null
+  max_val_samples: null
+paths:
+  checkpoints_dir: /workspace/byte-llms-code/code_completion_exp/hnet-ckpts
+  initial_checkpoint: null
+  output_dir: /workspace/byte-llms-code/code_completion_exp/hnet-ckpts/eval_results
+evaluation:
+  batch_size: 16
+  max_samples: null
+  compute_bpb: true
+  bleu_tokenize: none
+  use_amp: true
+  save_predictions: true
+generation:
+  max_length: 512
+  temperature: 0.1
+  top_k: 0
+  top_p: 1.0
+seed: 42
+device: cuda

fixed_eval_results/hnet_fixed_length_results/metrics_03-22-final.txt ADDED Viewed

+Checkpoint: 03-22-final.pt
+================================================================================
+exact_match: 0.37318365718844376
+token_accuracy: 0.482588638384026
+bleu: 20.854804726838726
+bpb: 1.349107179428066
+num_samples: 35098
+gen_wall_time_s: 2863.6849117436213
+gen_samples_per_s: 12.25623666069804
+gen_time_per_sample_ms: 81.59111378835323
+gen_chars_per_s: 360.7617569109473
+gen_batch_mean_ms: 2610.469381717066
+gen_batch_p50_ms: 1890.1621060213074
+gen_batch_p95_ms: 9530.616011167876
+gen_batch_max_ms: 22047.994011896662
+gen_num_batches: 1097

fixed_eval_results/hnet_fixed_length_results/predictions_03-22-final.txt ADDED Viewed

The diff for this file is too large to render. See raw diff

fixed_eval_results/hnet_fixed_length_results/summary.txt ADDED Viewed

+EVALUATION SUMMARY
+==================================================================================================
+Checkpoint                      Exact Match    Token Acc     BLEU          BPB  ms/sample   samp/s
+--------------------------------------------------------------------------------------------------
+03-22-final                          37.32%       48.26%    20.85         1.35       81.6    12.26

fixed_eval_results/pythia_14b_fixed_results/eval_config.yaml ADDED Viewed

+data:
+  path: /workspace/byte-llms-code/code_completion_exp/datasets/data_V4_full
+  max_context_len: 4096
+  max_target_len: 256
+  num_workers: 4
+  pin_memory: true
+model:
+  name: EleutherAI/pythia-1.4b
+  checkpoint_path: null
+  from_scratch: false
+paths:
+  checkpoints_dir: /workspace/byte-llms-code/code_completion_exp/pythia_1_4b_rerun/pythia_1_4b_lr_2e-5
+  initial_checkpoint: null
+  output_dir: /workspace/byte-llms-code/code_completion_exp/pythia_1_4b_rerun/pythia_1_4b_lr_2e-5/eval_results
+evaluation:
+  batch_size: 16
+  max_samples: null
+  compute_perplexity: true
+  bleu_tokenize: none
+  save_predictions: true
+  use_amp: true
+generation:
+  max_new_tokens: 256
+  temperature: 0.1
+  top_k: 0
+  top_p: 1.0
+  do_sample: true
+seed: 42
+device: cuda

fixed_eval_results/pythia_14b_fixed_results/metrics_model_final.txt ADDED Viewed

+Checkpoint: model_final.pt
+================================================================================
+exact_match: 0.34876631147073905
+token_accuracy: 0.363837459168535
+bleu: 19.70712343277282
+perplexity: 319.0512224116374
+num_samples: 35098
+gen_wall_time_s: 893.0648033486214
+gen_samples_per_s: 39.3006194717305
+gen_time_per_sample_ms: 25.444891542213842
+gen_chars_per_s: 1033.2542459853112
+gen_batch_mean_ms: 797.1702183922795
+gen_batch_p50_ms: 605.6874099886045
+gen_batch_p95_ms: 1458.250489202328
+gen_batch_max_ms: 20027.544419048354
+gen_num_batches: 1097

fixed_eval_results/pythia_14b_fixed_results/predictions_model_final.txt ADDED Viewed

The diff for this file is too large to render. See raw diff

fixed_eval_results/pythia_14b_fixed_results/summary.txt ADDED Viewed

+EVALUATION SUMMARY
+==================================================================================================
+Checkpoint                      Exact Match    Token Acc     BLEU   PERPLEXITY  ms/sample   samp/s
+--------------------------------------------------------------------------------------------------
+model_final                          34.88%       36.38%    19.71       319.05       25.4    39.30