FartingBackwards committed on
Commit
3fef913
·
verified ·
1 Parent(s): 3b0d3f5

Update transformer/config.json

Browse files

The committed transformer/config.json describes the 14B architecture, but the weights in this repo are the 1.3B checkpoint. This PR corrects the architecture fields to match the 1.3B weights.

Files changed (1) hide show
  1. transformer/config.json +3 -3
transformer/config.json CHANGED
@@ -5,12 +5,12 @@
5
  "attention_head_dim": 128,
6
  "cross_attn_norm": true,
7
  "eps": 1e-06,
8
- "ffn_dim": 13824,
9
  "freq_dim": 256,
10
  "image_dim": null,
11
  "in_channels": 16,
12
- "num_attention_heads": 40,
13
- "num_layers": 40,
14
  "out_channels": 16,
15
  "patch_size": [
16
  1,
 
5
  "attention_head_dim": 128,
6
  "cross_attn_norm": true,
7
  "eps": 1e-06,
8
+ "ffn_dim": 8960,
9
  "freq_dim": 256,
10
  "image_dim": null,
11
  "in_channels": 16,
12
+ "num_attention_heads": 12,
13
+ "num_layers": 30,
14
  "out_channels": 16,
15
  "patch_size": [
16
  1,