Student Watery zhuoyang20 committed on
Commit
5b73fdf
·
0 Parent(s):

Duplicate from mit-han-lab/foreact-pretrained

Browse files

Co-authored-by: Zhuoyang Zhang <zhuoyang20@users.noreply.huggingface.co>

.gitattributes ADDED
@@ -0,0 +1,36 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ *.7z filter=lfs diff=lfs merge=lfs -text
2
+ *.arrow filter=lfs diff=lfs merge=lfs -text
3
+ *.bin filter=lfs diff=lfs merge=lfs -text
4
+ *.bz2 filter=lfs diff=lfs merge=lfs -text
5
+ *.ckpt filter=lfs diff=lfs merge=lfs -text
6
+ *.ftz filter=lfs diff=lfs merge=lfs -text
7
+ *.gz filter=lfs diff=lfs merge=lfs -text
8
+ *.h5 filter=lfs diff=lfs merge=lfs -text
9
+ *.joblib filter=lfs diff=lfs merge=lfs -text
10
+ *.lfs.* filter=lfs diff=lfs merge=lfs -text
11
+ *.mlmodel filter=lfs diff=lfs merge=lfs -text
12
+ *.model filter=lfs diff=lfs merge=lfs -text
13
+ *.msgpack filter=lfs diff=lfs merge=lfs -text
14
+ *.npy filter=lfs diff=lfs merge=lfs -text
15
+ *.npz filter=lfs diff=lfs merge=lfs -text
16
+ *.onnx filter=lfs diff=lfs merge=lfs -text
17
+ *.ot filter=lfs diff=lfs merge=lfs -text
18
+ *.parquet filter=lfs diff=lfs merge=lfs -text
19
+ *.pb filter=lfs diff=lfs merge=lfs -text
20
+ *.pickle filter=lfs diff=lfs merge=lfs -text
21
+ *.pkl filter=lfs diff=lfs merge=lfs -text
22
+ *.pt filter=lfs diff=lfs merge=lfs -text
23
+ *.pth filter=lfs diff=lfs merge=lfs -text
24
+ *.rar filter=lfs diff=lfs merge=lfs -text
25
+ *.safetensors filter=lfs diff=lfs merge=lfs -text
26
+ saved_model/**/* filter=lfs diff=lfs merge=lfs -text
27
+ *.tar.* filter=lfs diff=lfs merge=lfs -text
28
+ *.tar filter=lfs diff=lfs merge=lfs -text
29
+ *.tflite filter=lfs diff=lfs merge=lfs -text
30
+ *.tgz filter=lfs diff=lfs merge=lfs -text
31
+ *.wasm filter=lfs diff=lfs merge=lfs -text
32
+ *.xz filter=lfs diff=lfs merge=lfs -text
33
+ *.zip filter=lfs diff=lfs merge=lfs -text
34
+ *.zst filter=lfs diff=lfs merge=lfs -text
35
+ *tfevents* filter=lfs diff=lfs merge=lfs -text
36
+ trainer_state.json filter=lfs diff=lfs merge=lfs -text
config.json ADDED
@@ -0,0 +1,28 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "_gradient_checkpointing": false,
3
+ "architectures": [
4
+ "VisualForesight"
5
+ ],
6
+ "attn_implementation": null,
7
+ "diffusion_model_id": "Efficient-Large-Model/Sana_1600M_512px_diffusers",
8
+ "dtype": "bfloat16",
9
+ "in_channels": 32,
10
+ "input_size": [
11
+ 15,
12
+ 20
13
+ ],
14
+ "max_input_text_tokens": 256,
15
+ "mllm_id": "google/gemma-2-2b-it",
16
+ "model_type": "visualforesight",
17
+ "modules_to_freeze": [
18
+ "vae",
19
+ "mllm_backbone"
20
+ ],
21
+ "modules_to_unfreeze": [],
22
+ "noise_scheduler_id": "Efficient-Large-Model/Sana_1600M_512px_diffusers",
23
+ "scheduler_id": "Efficient-Large-Model/Sana_1600M_512px_diffusers",
24
+ "system_prompt": "You are a robot and should focus on your actions. Generate a new image that meets the user's instruction while maintaining consistency with the original input where appropriate.",
25
+ "transformers_version": "4.57.1",
26
+ "vae_downsample_f": 32,
27
+ "vae_id": "Efficient-Large-Model/Sana_1600M_512px_diffusers"
28
+ }
model-00001-of-00003.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:c4d5fd396dea2b11f3ba1220232ac2148069ddfcd26773dcc29585c0a4fee0f7
3
+ size 4988029512
model-00002-of-00003.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:735169436251e2fb0876ec54085828bf178b87ef70c8a2d0a2c4b9b63a537f95
3
+ size 4999982648
model-00003-of-00003.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:9b508be211e31684541f48733a991ed6cebdd7022f0d4097c62c2f10749970e2
3
+ size 253880534
model.safetensors.index.json ADDED
The diff for this file is too large to render. See raw diff