NextTerm-440M-Checkpoints / checkpoint_manifest.json
N8Programs's picture
Add files using upload-large-folder tool
451a228 verified
{
"repo": "N8Programs/NextTerm-440M-Checkpoints",
"format": "transformers save_pretrained subfolders",
"recommended_checkpoint": "checkpoints/final_latest",
"oeis_vocab_size": 16,
"stop_token_ids": [
11,
13,
14
],
"checkpoints": [
{
"name": "best_val",
"subfolder": "checkpoints/best_val",
"trained_tokens": 9500200875,
"dtype": "float32",
"rope_basis": "HF/Qwen split-half RoPE basis",
"source_rope_basis": "custom interleaved even/odd RoPE basis",
"transformers_compatible": true
},
{
"name": "checkpoint_tokens_012000258345",
"subfolder": "checkpoints/checkpoint_tokens_012000258345",
"trained_tokens": 12000258345,
"dtype": "float32",
"rope_basis": "HF/Qwen split-half RoPE basis",
"source_rope_basis": "custom interleaved even/odd RoPE basis",
"transformers_compatible": true
},
{
"name": "checkpoint_tokens_012500265837",
"subfolder": "checkpoints/checkpoint_tokens_012500265837",
"trained_tokens": 12500265837,
"dtype": "float32",
"rope_basis": "HF/Qwen split-half RoPE basis",
"source_rope_basis": "custom interleaved even/odd RoPE basis",
"transformers_compatible": true
},
{
"name": "checkpoint_tokens_013000266889",
"subfolder": "checkpoints/checkpoint_tokens_013000266889",
"trained_tokens": 13000266889,
"dtype": "float32",
"rope_basis": "HF/Qwen split-half RoPE basis",
"source_rope_basis": "custom interleaved even/odd RoPE basis",
"transformers_compatible": true
},
{
"name": "checkpoint_tokens_013500289737",
"subfolder": "checkpoints/checkpoint_tokens_013500289737",
"trained_tokens": 13500289737,
"dtype": "float32",
"rope_basis": "HF/Qwen split-half RoPE basis",
"source_rope_basis": "custom interleaved even/odd RoPE basis",
"transformers_compatible": true
},
{
"name": "final_latest",
"subfolder": "checkpoints/final_latest",
"trained_tokens": 13999999995,
"dtype": "float32",
"rope_basis": "HF/Qwen split-half RoPE basis",
"source_rope_basis": "custom interleaved even/odd RoPE basis",
"transformers_compatible": true
}
]
}