| { |
| "config": { |
| "seed": 42, |
| "device": "cuda", |
| "dtype": "bfloat16", |
| "benchmark": { |
| "repeats": 3, |
| "batch_sizes": [ |
| 1, |
| 2, |
| 4, |
| 8, |
| 16 |
| ], |
| "max_new_tokens": [ |
| 64, |
| 128 |
| ], |
| "stop_on_eos": true, |
| "measure_memory": true, |
| "collect_traces": true, |
| "continue_on_error": true, |
| "warmup": { |
| "enabled": true |
| } |
| }, |
| "workloads": { |
| "synthetic": { |
| "enabled": false, |
| "prompt_byte_buckets": [ |
| 256, |
| 1024 |
| ], |
| "samples_per_bucket": 128 |
| }, |
| "code": { |
| "enabled": true, |
| "data_path": "code_completion_exp/datasets/data_V4_full", |
| "split": "validation", |
| "prompt_byte_buckets": [ |
| 256, |
| 1024 |
| ], |
| "samples_per_bucket": 128, |
| "max_samples_to_scan": 5000 |
| } |
| }, |
| "models": { |
| "enabled": [ |
| "hnet", |
| "hnet_serial", |
| "bolmo", |
| "pythia" |
| ], |
| "hnet": { |
| "config_path": "hnet_project/configs/hnet_2stage_XL_code.json", |
| "checkpoint_path": "hnet_project/checkpoints/hnet_2stage_XL_code.pt" |
| }, |
| "hnet_serial": { |
| "config_path": "hnet_project/configs/hnet_2stage_XL_code.json", |
| "checkpoint_path": "hnet_project/checkpoints/hnet_2stage_XL_code.pt" |
| }, |
| "bolmo": { |
| "model_name": "allenai/Bolmo-1B", |
| "cache_dir": "cache/bolmo", |
| "local_files_only": false |
| }, |
| "pythia": { |
| "model_name": "EleutherAI/pythia-1b", |
| "cache_dir": "cache/hf", |
| "local_files_only": false, |
| "max_context_len": 4096 |
| } |
| }, |
| "paths": { |
| "output_root": "generation_speed_exp/outputs" |
| } |
| }, |
| "repo_root": "/workspace/byte-llms-code", |
| "workloads": { |
| "code/256B": 128, |
| "code/1024B": 128 |
| }, |
| "environment": { |
| "timestamp": "2026-05-10T23:04:30", |
| "hostname": "e41665783a40", |
| "platform": "Linux-6.8.0-110-generic-x86_64-with-glibc2.39", |
| "python": "3.12.0 | packaged by Anaconda, Inc. | (main, Oct 2 2023, 17:29:18) [GCC 11.2.0]", |
| "git_commit": "21e26deacf90f77563e3834cfb46e6dc64f52d6e", |
| "git_branch": "feature/generation-bench", |
| "git_dirty": false, |
| "torch": "2.6.0+cu124", |
| "torch_cuda": "12.4", |
| "cuda_available": true, |
| "transformers": "4.57.6", |
| "cuda_devices": [ |
| { |
| "index": 0, |
| "name": "NVIDIA A100X", |
| "total_memory_mb": 81341.8125, |
| "major": 8, |
| "minor": 0 |
| }, |
| { |
| "index": 1, |
| "name": "NVIDIA A100X", |
| "total_memory_mb": 81341.8125, |
| "major": 8, |
| "minor": 0 |
| } |
| ], |
| "nvidia_smi": "NVIDIA A100X, 81920 MiB, 570.86.10\nNVIDIA A100X, 81920 MiB, 570.86.10" |
| } |
| } |