wonwonn committed on
Commit
8bb44ef
·
verified ·
1 Parent(s): a4ea3ff

Upload LoRA adapter (pcagent-7B-human-only)

Browse files
Files changed (50) hide show
  1. .gitattributes +4 -0
  2. README.md +62 -0
  3. adapter_config.json +127 -0
  4. adapter_model.safetensors +3 -0
  5. all_results.json +8 -0
  6. chat_template.jinja +7 -0
  7. checkpoint-1200/README.md +208 -0
  8. checkpoint-1200/adapter_config.json +127 -0
  9. checkpoint-1200/adapter_model.safetensors +3 -0
  10. checkpoint-1200/chat_template.jinja +7 -0
  11. checkpoint-1200/optimizer.pt +3 -0
  12. checkpoint-1200/processor_config.json +63 -0
  13. checkpoint-1200/rng_state.pth +3 -0
  14. checkpoint-1200/scheduler.pt +3 -0
  15. checkpoint-1200/tokenizer.json +3 -0
  16. checkpoint-1200/tokenizer_config.json +31 -0
  17. checkpoint-1200/trainer_state.json +0 -0
  18. checkpoint-1200/training_args.bin +3 -0
  19. checkpoint-1300/README.md +208 -0
  20. checkpoint-1300/adapter_config.json +127 -0
  21. checkpoint-1300/adapter_model.safetensors +3 -0
  22. checkpoint-1300/chat_template.jinja +7 -0
  23. checkpoint-1300/optimizer.pt +3 -0
  24. checkpoint-1300/processor_config.json +63 -0
  25. checkpoint-1300/rng_state.pth +3 -0
  26. checkpoint-1300/scheduler.pt +3 -0
  27. checkpoint-1300/tokenizer.json +3 -0
  28. checkpoint-1300/tokenizer_config.json +31 -0
  29. checkpoint-1300/trainer_state.json +0 -0
  30. checkpoint-1300/training_args.bin +3 -0
  31. checkpoint-1388/README.md +208 -0
  32. checkpoint-1388/adapter_config.json +127 -0
  33. checkpoint-1388/adapter_model.safetensors +3 -0
  34. checkpoint-1388/chat_template.jinja +7 -0
  35. checkpoint-1388/optimizer.pt +3 -0
  36. checkpoint-1388/processor_config.json +63 -0
  37. checkpoint-1388/rng_state.pth +3 -0
  38. checkpoint-1388/scheduler.pt +3 -0
  39. checkpoint-1388/tokenizer.json +3 -0
  40. checkpoint-1388/tokenizer_config.json +31 -0
  41. checkpoint-1388/trainer_state.json +0 -0
  42. checkpoint-1388/training_args.bin +3 -0
  43. processor_config.json +63 -0
  44. tokenizer.json +3 -0
  45. tokenizer_config.json +31 -0
  46. train_results.json +8 -0
  47. trainer_log.jsonl +0 -0
  48. trainer_state.json +0 -0
  49. training_args.bin +3 -0
  50. training_loss.png +0 -0
.gitattributes CHANGED
@@ -33,3 +33,7 @@ saved_model/**/* filter=lfs diff=lfs merge=lfs -text
33
  *.zip filter=lfs diff=lfs merge=lfs -text
34
  *.zst filter=lfs diff=lfs merge=lfs -text
35
  *tfevents* filter=lfs diff=lfs merge=lfs -text
 
 
 
 
 
33
  *.zip filter=lfs diff=lfs merge=lfs -text
34
  *.zst filter=lfs diff=lfs merge=lfs -text
35
  *tfevents* filter=lfs diff=lfs merge=lfs -text
36
+ checkpoint-1200/tokenizer.json filter=lfs diff=lfs merge=lfs -text
37
+ checkpoint-1300/tokenizer.json filter=lfs diff=lfs merge=lfs -text
38
+ checkpoint-1388/tokenizer.json filter=lfs diff=lfs merge=lfs -text
39
+ tokenizer.json filter=lfs diff=lfs merge=lfs -text
README.md ADDED
@@ -0,0 +1,62 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ ---
2
+ library_name: peft
3
+ license: other
4
+ base_model: Qwen/Qwen2.5-VL-7B-Instruct
5
+ tags:
6
+ - base_model:adapter:Qwen/Qwen2.5-VL-7B-Instruct
7
+ - llama-factory
8
+ - lora
9
+ - transformers
10
+ pipeline_tag: text-generation
11
+ model-index:
12
+ - name: pcagent-7B-human-only
13
+ results: []
14
+ ---
15
+
16
+ <!-- This model card has been generated automatically according to the information the Trainer had access to. You
17
+ should probably proofread and complete it, then remove this comment. -->
18
+
19
+ # pcagent-7B-human-only
20
+
21
+ This model is a fine-tuned version of [Qwen/Qwen2.5-VL-7B-Instruct](https://huggingface.co/Qwen/Qwen2.5-VL-7B-Instruct) on the pc-agent-e-action-only dataset.
22
+
23
+ ## Model description
24
+
25
+ More information needed
26
+
27
+ ## Intended uses & limitations
28
+
29
+ More information needed
30
+
31
+ ## Training and evaluation data
32
+
33
+ More information needed
34
+
35
+ ## Training procedure
36
+
37
+ ### Training hyperparameters
38
+
39
+ The following hyperparameters were used during training:
40
+ - learning_rate: 2e-05
41
+ - train_batch_size: 2
42
+ - eval_batch_size: 8
43
+ - seed: 42
44
+ - distributed_type: multi-GPU
45
+ - gradient_accumulation_steps: 2
46
+ - total_train_batch_size: 4
47
+ - optimizer: Use OptimizerNames.ADAMW_TORCH with betas=(0.9,0.999) and epsilon=1e-08 and optimizer_args=No additional optimizer arguments
48
+ - lr_scheduler_type: cosine
49
+ - lr_scheduler_warmup_steps: 0.05
50
+ - num_epochs: 2
51
+
52
+ ### Training results
53
+
54
+
55
+
56
+ ### Framework versions
57
+
58
+ - PEFT 0.18.1
59
+ - Transformers 5.2.0
60
+ - Pytorch 2.5.1+cu124
61
+ - Datasets 4.0.0
62
+ - Tokenizers 0.22.2
adapter_config.json ADDED
@@ -0,0 +1,127 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "alora_invocation_tokens": null,
3
+ "alpha_pattern": {},
4
+ "arrow_config": null,
5
+ "auto_mapping": null,
6
+ "base_model_name_or_path": "Qwen/Qwen2.5-VL-7B-Instruct",
7
+ "bias": "none",
8
+ "corda_config": null,
9
+ "ensure_weight_tying": false,
10
+ "eva_config": null,
11
+ "exclude_modules": null,
12
+ "fan_in_fan_out": false,
13
+ "inference_mode": true,
14
+ "init_lora_weights": true,
15
+ "layer_replication": null,
16
+ "layers_pattern": null,
17
+ "layers_to_transform": null,
18
+ "loftq_config": {},
19
+ "lora_alpha": 128,
20
+ "lora_bias": false,
21
+ "lora_dropout": 0.05,
22
+ "megatron_config": null,
23
+ "megatron_core": "megatron.core",
24
+ "modules_to_save": null,
25
+ "peft_type": "LORA",
26
+ "peft_version": "0.18.1",
27
+ "qalora_group_size": 16,
28
+ "r": 64,
29
+ "rank_pattern": {},
30
+ "revision": null,
31
+ "target_modules": [
32
+ "layers.9.mlp.up_proj",
33
+ "layers.26.mlp.gate_proj",
34
+ "layers.11.mlp.gate_proj",
35
+ "layers.7.mlp.gate_proj",
36
+ "layers.5.mlp.up_proj",
37
+ "layers.11.mlp.down_proj",
38
+ "layers.22.mlp.down_proj",
39
+ "layers.15.mlp.down_proj",
40
+ "layers.4.mlp.gate_proj",
41
+ "layers.18.mlp.gate_proj",
42
+ "layers.3.mlp.gate_proj",
43
+ "layers.22.mlp.up_proj",
44
+ "layers.14.mlp.gate_proj",
45
+ "layers.15.mlp.up_proj",
46
+ "layers.27.mlp.up_proj",
47
+ "layers.19.mlp.up_proj",
48
+ "layers.13.mlp.down_proj",
49
+ "layers.13.mlp.up_proj",
50
+ "layers.17.mlp.up_proj",
51
+ "layers.2.mlp.down_proj",
52
+ "layers.27.mlp.down_proj",
53
+ "layers.8.mlp.gate_proj",
54
+ "layers.0.mlp.gate_proj",
55
+ "layers.3.mlp.down_proj",
56
+ "layers.5.mlp.gate_proj",
57
+ "layers.4.mlp.up_proj",
58
+ "layers.23.mlp.up_proj",
59
+ "layers.10.mlp.gate_proj",
60
+ "layers.25.mlp.up_proj",
61
+ "layers.18.mlp.down_proj",
62
+ "layers.25.mlp.gate_proj",
63
+ "layers.24.mlp.down_proj",
64
+ "layers.16.mlp.up_proj",
65
+ "layers.16.mlp.down_proj",
66
+ "layers.11.mlp.up_proj",
67
+ "layers.6.mlp.gate_proj",
68
+ "layers.26.mlp.up_proj",
69
+ "layers.20.mlp.down_proj",
70
+ "layers.12.mlp.up_proj",
71
+ "layers.24.mlp.gate_proj",
72
+ "k_proj",
73
+ "layers.21.mlp.down_proj",
74
+ "layers.13.mlp.gate_proj",
75
+ "layers.20.mlp.up_proj",
76
+ "layers.18.mlp.up_proj",
77
+ "layers.9.mlp.gate_proj",
78
+ "layers.15.mlp.gate_proj",
79
+ "layers.27.mlp.gate_proj",
80
+ "layers.6.mlp.up_proj",
81
+ "layers.7.mlp.down_proj",
82
+ "layers.23.mlp.gate_proj",
83
+ "q_proj",
84
+ "layers.22.mlp.gate_proj",
85
+ "layers.26.mlp.down_proj",
86
+ "layers.17.mlp.gate_proj",
87
+ "layers.1.mlp.down_proj",
88
+ "layers.12.mlp.gate_proj",
89
+ "layers.17.mlp.down_proj",
90
+ "layers.7.mlp.up_proj",
91
+ "layers.19.mlp.gate_proj",
92
+ "layers.3.mlp.up_proj",
93
+ "layers.0.mlp.up_proj",
94
+ "layers.19.mlp.down_proj",
95
+ "layers.8.mlp.up_proj",
96
+ "o_proj",
97
+ "layers.5.mlp.down_proj",
98
+ "layers.23.mlp.down_proj",
99
+ "layers.25.mlp.down_proj",
100
+ "layers.0.mlp.down_proj",
101
+ "layers.1.mlp.up_proj",
102
+ "layers.10.mlp.down_proj",
103
+ "layers.1.mlp.gate_proj",
104
+ "layers.16.mlp.gate_proj",
105
+ "v_proj",
106
+ "layers.2.mlp.up_proj",
107
+ "layers.6.mlp.down_proj",
108
+ "layers.14.mlp.down_proj",
109
+ "layers.9.mlp.down_proj",
110
+ "layers.20.mlp.gate_proj",
111
+ "layers.10.mlp.up_proj",
112
+ "layers.4.mlp.down_proj",
113
+ "layers.21.mlp.up_proj",
114
+ "layers.14.mlp.up_proj",
115
+ "layers.8.mlp.down_proj",
116
+ "layers.24.mlp.up_proj",
117
+ "layers.2.mlp.gate_proj",
118
+ "layers.21.mlp.gate_proj",
119
+ "layers.12.mlp.down_proj"
120
+ ],
121
+ "target_parameters": null,
122
+ "task_type": "CAUSAL_LM",
123
+ "trainable_token_indices": null,
124
+ "use_dora": false,
125
+ "use_qalora": false,
126
+ "use_rslora": false
127
+ }
adapter_model.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:99989965bee7500af2705e7939be60be62bf4fb6710d0482710af7a07a4e0e5e
3
+ size 645981584
all_results.json ADDED
@@ -0,0 +1,8 @@
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "epoch": 2.0,
3
+ "total_flos": 1.0037139745307361e+18,
4
+ "train_loss": 0.7883986402571374,
5
+ "train_runtime": 11184.8694,
6
+ "train_samples_per_second": 0.496,
7
+ "train_steps_per_second": 0.124
8
+ }
chat_template.jinja ADDED
@@ -0,0 +1,7 @@
 
 
 
 
 
 
 
 
1
+ {% set image_count = namespace(value=0) %}{% set video_count = namespace(value=0) %}{% for message in messages %}{% if loop.first and message['role'] != 'system' %}<|im_start|>system
2
+ You are a helpful assistant.<|im_end|>
3
+ {% endif %}<|im_start|>{{ message['role'] }}
4
+ {% if message['content'] is string %}{{ message['content'] }}<|im_end|>
5
+ {% else %}{% for content in message['content'] %}{% if content['type'] == 'image' or 'image' in content or 'image_url' in content %}{% set image_count.value = image_count.value + 1 %}{% if add_vision_id %}Picture {{ image_count.value }}: {% endif %}<|vision_start|><|image_pad|><|vision_end|>{% elif content['type'] == 'video' or 'video' in content %}{% set video_count.value = video_count.value + 1 %}{% if add_vision_id %}Video {{ video_count.value }}: {% endif %}<|vision_start|><|video_pad|><|vision_end|>{% elif 'text' in content %}{{ content['text'] }}{% endif %}{% endfor %}<|im_end|>
6
+ {% endif %}{% endfor %}{% if add_generation_prompt %}<|im_start|>assistant
7
+ {% endif %}
checkpoint-1200/README.md ADDED
@@ -0,0 +1,208 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ ---
2
+ base_model: Qwen/Qwen2.5-VL-7B-Instruct
3
+ library_name: peft
4
+ pipeline_tag: text-generation
5
+ tags:
6
+ - base_model:adapter:Qwen/Qwen2.5-VL-7B-Instruct
7
+ - llama-factory
8
+ - lora
9
+ - transformers
10
+ ---
11
+
12
+ # Model Card for pcagent-7B-human-only (checkpoint-1200)
13
+
14
+ <!-- Provide a quick summary of what the model is/does. -->
15
+
16
+
17
+
18
+ ## Model Details
19
+
20
+ ### Model Description
21
+
22
+ <!-- Provide a longer summary of what this model is. -->
23
+
24
+
25
+
26
+ - **Developed by:** [More Information Needed]
27
+ - **Funded by [optional]:** [More Information Needed]
28
+ - **Shared by [optional]:** [More Information Needed]
29
+ - **Model type:** [More Information Needed]
30
+ - **Language(s) (NLP):** [More Information Needed]
31
+ - **License:** [More Information Needed]
32
+ - **Finetuned from model [optional]:** Qwen/Qwen2.5-VL-7B-Instruct
33
+
34
+ ### Model Sources [optional]
35
+
36
+ <!-- Provide the basic links for the model. -->
37
+
38
+ - **Repository:** [More Information Needed]
39
+ - **Paper [optional]:** [More Information Needed]
40
+ - **Demo [optional]:** [More Information Needed]
41
+
42
+ ## Uses
43
+
44
+ <!-- Address questions around how the model is intended to be used, including the foreseeable users of the model and those affected by the model. -->
45
+
46
+ ### Direct Use
47
+
48
+ <!-- This section is for the model use without fine-tuning or plugging into a larger ecosystem/app. -->
49
+
50
+ [More Information Needed]
51
+
52
+ ### Downstream Use [optional]
53
+
54
+ <!-- This section is for the model use when fine-tuned for a task, or when plugged into a larger ecosystem/app -->
55
+
56
+ [More Information Needed]
57
+
58
+ ### Out-of-Scope Use
59
+
60
+ <!-- This section addresses misuse, malicious use, and uses that the model will not work well for. -->
61
+
62
+ [More Information Needed]
63
+
64
+ ## Bias, Risks, and Limitations
65
+
66
+ <!-- This section is meant to convey both technical and sociotechnical limitations. -->
67
+
68
+ [More Information Needed]
69
+
70
+ ### Recommendations
71
+
72
+ <!-- This section is meant to convey recommendations with respect to the bias, risk, and technical limitations. -->
73
+
74
+ Users (both direct and downstream) should be made aware of the risks, biases and limitations of the model. More information needed for further recommendations.
75
+
76
+ ## How to Get Started with the Model
77
+
78
+ Use the code below to get started with the model.
79
+
80
+ [More Information Needed]
81
+
82
+ ## Training Details
83
+
84
+ ### Training Data
85
+
86
+ <!-- This should link to a Dataset Card, perhaps with a short stub of information on what the training data is all about as well as documentation related to data pre-processing or additional filtering. -->
87
+
88
+ [More Information Needed]
89
+
90
+ ### Training Procedure
91
+
92
+ <!-- This relates heavily to the Technical Specifications. Content here should link to that section when it is relevant to the training procedure. -->
93
+
94
+ #### Preprocessing [optional]
95
+
96
+ [More Information Needed]
97
+
98
+
99
+ #### Training Hyperparameters
100
+
101
+ - **Training regime:** [More Information Needed] <!--fp32, fp16 mixed precision, bf16 mixed precision, bf16 non-mixed precision, fp16 non-mixed precision, fp8 mixed precision -->
102
+
103
+ #### Speeds, Sizes, Times [optional]
104
+
105
+ <!-- This section provides information about throughput, start/end time, checkpoint size if relevant, etc. -->
106
+
107
+ [More Information Needed]
108
+
109
+ ## Evaluation
110
+
111
+ <!-- This section describes the evaluation protocols and provides the results. -->
112
+
113
+ ### Testing Data, Factors & Metrics
114
+
115
+ #### Testing Data
116
+
117
+ <!-- This should link to a Dataset Card if possible. -->
118
+
119
+ [More Information Needed]
120
+
121
+ #### Factors
122
+
123
+ <!-- These are the things the evaluation is disaggregating by, e.g., subpopulations or domains. -->
124
+
125
+ [More Information Needed]
126
+
127
+ #### Metrics
128
+
129
+ <!-- These are the evaluation metrics being used, ideally with a description of why. -->
130
+
131
+ [More Information Needed]
132
+
133
+ ### Results
134
+
135
+ [More Information Needed]
136
+
137
+ #### Summary
138
+
139
+
140
+
141
+ ## Model Examination [optional]
142
+
143
+ <!-- Relevant interpretability work for the model goes here -->
144
+
145
+ [More Information Needed]
146
+
147
+ ## Environmental Impact
148
+
149
+ <!-- Total emissions (in grams of CO2eq) and additional considerations, such as electricity usage, go here. Edit the suggested text below accordingly -->
150
+
151
+ Carbon emissions can be estimated using the [Machine Learning Impact calculator](https://mlco2.github.io/impact#compute) presented in [Lacoste et al. (2019)](https://arxiv.org/abs/1910.09700).
152
+
153
+ - **Hardware Type:** [More Information Needed]
154
+ - **Hours used:** [More Information Needed]
155
+ - **Cloud Provider:** [More Information Needed]
156
+ - **Compute Region:** [More Information Needed]
157
+ - **Carbon Emitted:** [More Information Needed]
158
+
159
+ ## Technical Specifications [optional]
160
+
161
+ ### Model Architecture and Objective
162
+
163
+ [More Information Needed]
164
+
165
+ ### Compute Infrastructure
166
+
167
+ [More Information Needed]
168
+
169
+ #### Hardware
170
+
171
+ [More Information Needed]
172
+
173
+ #### Software
174
+
175
+ [More Information Needed]
176
+
177
+ ## Citation [optional]
178
+
179
+ <!-- If there is a paper or blog post introducing the model, the APA and Bibtex information for that should go in this section. -->
180
+
181
+ **BibTeX:**
182
+
183
+ [More Information Needed]
184
+
185
+ **APA:**
186
+
187
+ [More Information Needed]
188
+
189
+ ## Glossary [optional]
190
+
191
+ <!-- If relevant, include terms and calculations in this section that can help readers understand the model or model card. -->
192
+
193
+ [More Information Needed]
194
+
195
+ ## More Information [optional]
196
+
197
+ [More Information Needed]
198
+
199
+ ## Model Card Authors [optional]
200
+
201
+ [More Information Needed]
202
+
203
+ ## Model Card Contact
204
+
205
+ [More Information Needed]
206
+ ### Framework versions
207
+
208
+ - PEFT 0.18.1
checkpoint-1200/adapter_config.json ADDED
@@ -0,0 +1,127 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "alora_invocation_tokens": null,
3
+ "alpha_pattern": {},
4
+ "arrow_config": null,
5
+ "auto_mapping": null,
6
+ "base_model_name_or_path": "Qwen/Qwen2.5-VL-7B-Instruct",
7
+ "bias": "none",
8
+ "corda_config": null,
9
+ "ensure_weight_tying": false,
10
+ "eva_config": null,
11
+ "exclude_modules": null,
12
+ "fan_in_fan_out": false,
13
+ "inference_mode": true,
14
+ "init_lora_weights": true,
15
+ "layer_replication": null,
16
+ "layers_pattern": null,
17
+ "layers_to_transform": null,
18
+ "loftq_config": {},
19
+ "lora_alpha": 128,
20
+ "lora_bias": false,
21
+ "lora_dropout": 0.05,
22
+ "megatron_config": null,
23
+ "megatron_core": "megatron.core",
24
+ "modules_to_save": null,
25
+ "peft_type": "LORA",
26
+ "peft_version": "0.18.1",
27
+ "qalora_group_size": 16,
28
+ "r": 64,
29
+ "rank_pattern": {},
30
+ "revision": null,
31
+ "target_modules": [
32
+ "layers.9.mlp.up_proj",
33
+ "layers.26.mlp.gate_proj",
34
+ "layers.11.mlp.gate_proj",
35
+ "layers.7.mlp.gate_proj",
36
+ "layers.5.mlp.up_proj",
37
+ "layers.11.mlp.down_proj",
38
+ "layers.22.mlp.down_proj",
39
+ "layers.15.mlp.down_proj",
40
+ "layers.4.mlp.gate_proj",
41
+ "layers.18.mlp.gate_proj",
42
+ "layers.3.mlp.gate_proj",
43
+ "layers.22.mlp.up_proj",
44
+ "layers.14.mlp.gate_proj",
45
+ "layers.15.mlp.up_proj",
46
+ "layers.27.mlp.up_proj",
47
+ "layers.19.mlp.up_proj",
48
+ "layers.13.mlp.down_proj",
49
+ "layers.13.mlp.up_proj",
50
+ "layers.17.mlp.up_proj",
51
+ "layers.2.mlp.down_proj",
52
+ "layers.27.mlp.down_proj",
53
+ "layers.8.mlp.gate_proj",
54
+ "layers.0.mlp.gate_proj",
55
+ "layers.3.mlp.down_proj",
56
+ "layers.5.mlp.gate_proj",
57
+ "layers.4.mlp.up_proj",
58
+ "layers.23.mlp.up_proj",
59
+ "layers.10.mlp.gate_proj",
60
+ "layers.25.mlp.up_proj",
61
+ "layers.18.mlp.down_proj",
62
+ "layers.25.mlp.gate_proj",
63
+ "layers.24.mlp.down_proj",
64
+ "layers.16.mlp.up_proj",
65
+ "layers.16.mlp.down_proj",
66
+ "layers.11.mlp.up_proj",
67
+ "layers.6.mlp.gate_proj",
68
+ "layers.26.mlp.up_proj",
69
+ "layers.20.mlp.down_proj",
70
+ "layers.12.mlp.up_proj",
71
+ "layers.24.mlp.gate_proj",
72
+ "k_proj",
73
+ "layers.21.mlp.down_proj",
74
+ "layers.13.mlp.gate_proj",
75
+ "layers.20.mlp.up_proj",
76
+ "layers.18.mlp.up_proj",
77
+ "layers.9.mlp.gate_proj",
78
+ "layers.15.mlp.gate_proj",
79
+ "layers.27.mlp.gate_proj",
80
+ "layers.6.mlp.up_proj",
81
+ "layers.7.mlp.down_proj",
82
+ "layers.23.mlp.gate_proj",
83
+ "q_proj",
84
+ "layers.22.mlp.gate_proj",
85
+ "layers.26.mlp.down_proj",
86
+ "layers.17.mlp.gate_proj",
87
+ "layers.1.mlp.down_proj",
88
+ "layers.12.mlp.gate_proj",
89
+ "layers.17.mlp.down_proj",
90
+ "layers.7.mlp.up_proj",
91
+ "layers.19.mlp.gate_proj",
92
+ "layers.3.mlp.up_proj",
93
+ "layers.0.mlp.up_proj",
94
+ "layers.19.mlp.down_proj",
95
+ "layers.8.mlp.up_proj",
96
+ "o_proj",
97
+ "layers.5.mlp.down_proj",
98
+ "layers.23.mlp.down_proj",
99
+ "layers.25.mlp.down_proj",
100
+ "layers.0.mlp.down_proj",
101
+ "layers.1.mlp.up_proj",
102
+ "layers.10.mlp.down_proj",
103
+ "layers.1.mlp.gate_proj",
104
+ "layers.16.mlp.gate_proj",
105
+ "v_proj",
106
+ "layers.2.mlp.up_proj",
107
+ "layers.6.mlp.down_proj",
108
+ "layers.14.mlp.down_proj",
109
+ "layers.9.mlp.down_proj",
110
+ "layers.20.mlp.gate_proj",
111
+ "layers.10.mlp.up_proj",
112
+ "layers.4.mlp.down_proj",
113
+ "layers.21.mlp.up_proj",
114
+ "layers.14.mlp.up_proj",
115
+ "layers.8.mlp.down_proj",
116
+ "layers.24.mlp.up_proj",
117
+ "layers.2.mlp.gate_proj",
118
+ "layers.21.mlp.gate_proj",
119
+ "layers.12.mlp.down_proj"
120
+ ],
121
+ "target_parameters": null,
122
+ "task_type": "CAUSAL_LM",
123
+ "trainable_token_indices": null,
124
+ "use_dora": false,
125
+ "use_qalora": false,
126
+ "use_rslora": false
127
+ }
checkpoint-1200/adapter_model.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:18a873fda14e72a55e5f4eef70eb98c5a405940c1ab76a814093857de19849a0
3
+ size 645981584
checkpoint-1200/chat_template.jinja ADDED
@@ -0,0 +1,7 @@
 
 
 
 
 
 
 
 
1
+ {% set image_count = namespace(value=0) %}{% set video_count = namespace(value=0) %}{% for message in messages %}{% if loop.first and message['role'] != 'system' %}<|im_start|>system
2
+ You are a helpful assistant.<|im_end|>
3
+ {% endif %}<|im_start|>{{ message['role'] }}
4
+ {% if message['content'] is string %}{{ message['content'] }}<|im_end|>
5
+ {% else %}{% for content in message['content'] %}{% if content['type'] == 'image' or 'image' in content or 'image_url' in content %}{% set image_count.value = image_count.value + 1 %}{% if add_vision_id %}Picture {{ image_count.value }}: {% endif %}<|vision_start|><|image_pad|><|vision_end|>{% elif content['type'] == 'video' or 'video' in content %}{% set video_count.value = video_count.value + 1 %}{% if add_vision_id %}Video {{ video_count.value }}: {% endif %}<|vision_start|><|video_pad|><|vision_end|>{% elif 'text' in content %}{{ content['text'] }}{% endif %}{% endfor %}<|im_end|>
6
+ {% endif %}{% endfor %}{% if add_generation_prompt %}<|im_start|>assistant
7
+ {% endif %}
checkpoint-1200/optimizer.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:c736d925f7766dd032404c01d99b673514e0df167feae1d13333c757ba1893ae
3
+ size 1292176234
checkpoint-1200/processor_config.json ADDED
@@ -0,0 +1,63 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "image_processor": {
3
+ "data_format": "channels_first",
4
+ "do_convert_rgb": true,
5
+ "do_normalize": true,
6
+ "do_rescale": true,
7
+ "do_resize": true,
8
+ "image_mean": [
9
+ 0.48145466,
10
+ 0.4578275,
11
+ 0.40821073
12
+ ],
13
+ "image_processor_type": "Qwen2VLImageProcessorFast",
14
+ "image_std": [
15
+ 0.26862954,
16
+ 0.26130258,
17
+ 0.27577711
18
+ ],
19
+ "merge_size": 2,
20
+ "patch_size": 14,
21
+ "resample": 3,
22
+ "rescale_factor": 0.00392156862745098,
23
+ "size": {
24
+ "longest_edge": 12845056,
25
+ "shortest_edge": 3136
26
+ },
27
+ "temporal_patch_size": 2
28
+ },
29
+ "processor_class": "Qwen2_5_VLProcessor",
30
+ "video_processor": {
31
+ "data_format": "channels_first",
32
+ "default_to_square": true,
33
+ "do_convert_rgb": true,
34
+ "do_normalize": true,
35
+ "do_rescale": true,
36
+ "do_resize": true,
37
+ "do_sample_frames": false,
38
+ "image_mean": [
39
+ 0.48145466,
40
+ 0.4578275,
41
+ 0.40821073
42
+ ],
43
+ "image_processor_type": "Qwen2VLImageProcessor",
44
+ "image_std": [
45
+ 0.26862954,
46
+ 0.26130258,
47
+ 0.27577711
48
+ ],
49
+ "max_frames": 768,
50
+ "merge_size": 2,
51
+ "min_frames": 4,
52
+ "patch_size": 14,
53
+ "resample": 3,
54
+ "rescale_factor": 0.00392156862745098,
55
+ "return_metadata": false,
56
+ "size": {
57
+ "longest_edge": 12845056,
58
+ "shortest_edge": 3136
59
+ },
60
+ "temporal_patch_size": 2,
61
+ "video_processor_type": "Qwen2VLVideoProcessor"
62
+ }
63
+ }
checkpoint-1200/rng_state.pth ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:858f7fc09bee30a3a299d5b07c5dd77679a9b77dd1c96241862056644d3072de
3
+ size 14244
checkpoint-1200/scheduler.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:72ec3fd9d2b3b9072c219f368074730e1e3f64dfe773b44380754ae0a56bc1ab
3
+ size 1064
checkpoint-1200/tokenizer.json ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:3fd169731d2cbde95e10bf356d66d5997fd885dd8dbb6fb4684da3f23b2585d8
3
+ size 11421892
checkpoint-1200/tokenizer_config.json ADDED
@@ -0,0 +1,31 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "add_prefix_space": false,
3
+ "backend": "tokenizers",
4
+ "bos_token": null,
5
+ "clean_up_tokenization_spaces": false,
6
+ "eos_token": "<|im_end|>",
7
+ "errors": "replace",
8
+ "extra_special_tokens": [
9
+ "<|im_start|>",
10
+ "<|im_end|>",
11
+ "<|object_ref_start|>",
12
+ "<|object_ref_end|>",
13
+ "<|box_start|>",
14
+ "<|box_end|>",
15
+ "<|quad_start|>",
16
+ "<|quad_end|>",
17
+ "<|vision_start|>",
18
+ "<|vision_end|>",
19
+ "<|vision_pad|>",
20
+ "<|image_pad|>",
21
+ "<|video_pad|>"
22
+ ],
23
+ "is_local": false,
24
+ "model_max_length": 131072,
25
+ "pad_token": "<|endoftext|>",
26
+ "padding_side": "right",
27
+ "processor_class": "Qwen2_5_VLProcessor",
28
+ "split_special_tokens": false,
29
+ "tokenizer_class": "Qwen2Tokenizer",
30
+ "unk_token": null
31
+ }
checkpoint-1200/trainer_state.json ADDED
The diff for this file is too large to render. See raw diff
 
checkpoint-1200/training_args.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:0742392223bf62bf3e233a68f09ba267cf039dfafb723ee8590bd8f637eaecfb
3
+ size 5176
checkpoint-1300/README.md ADDED
@@ -0,0 +1,208 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ ---
2
+ base_model: Qwen/Qwen2.5-VL-7B-Instruct
3
+ library_name: peft
4
+ pipeline_tag: text-generation
5
+ tags:
6
+ - base_model:adapter:Qwen/Qwen2.5-VL-7B-Instruct
7
+ - llama-factory
8
+ - lora
9
+ - transformers
10
+ ---
11
+
12
+ # Model Card for pcagent-7B-human-only (checkpoint-1300)
13
+
14
+ <!-- Provide a quick summary of what the model is/does. -->
15
+
16
+
17
+
18
+ ## Model Details
19
+
20
+ ### Model Description
21
+
22
+ <!-- Provide a longer summary of what this model is. -->
23
+
24
+
25
+
26
+ - **Developed by:** [More Information Needed]
27
+ - **Funded by [optional]:** [More Information Needed]
28
+ - **Shared by [optional]:** [More Information Needed]
29
+ - **Model type:** [More Information Needed]
30
+ - **Language(s) (NLP):** [More Information Needed]
31
+ - **License:** [More Information Needed]
32
+ - **Finetuned from model [optional]:** Qwen/Qwen2.5-VL-7B-Instruct
33
+
34
+ ### Model Sources [optional]
35
+
36
+ <!-- Provide the basic links for the model. -->
37
+
38
+ - **Repository:** [More Information Needed]
39
+ - **Paper [optional]:** [More Information Needed]
40
+ - **Demo [optional]:** [More Information Needed]
41
+
42
+ ## Uses
43
+
44
+ <!-- Address questions around how the model is intended to be used, including the foreseeable users of the model and those affected by the model. -->
45
+
46
+ ### Direct Use
47
+
48
+ <!-- This section is for the model use without fine-tuning or plugging into a larger ecosystem/app. -->
49
+
50
+ [More Information Needed]
51
+
52
+ ### Downstream Use [optional]
53
+
54
+ <!-- This section is for the model use when fine-tuned for a task, or when plugged into a larger ecosystem/app -->
55
+
56
+ [More Information Needed]
57
+
58
+ ### Out-of-Scope Use
59
+
60
+ <!-- This section addresses misuse, malicious use, and uses that the model will not work well for. -->
61
+
62
+ [More Information Needed]
63
+
64
+ ## Bias, Risks, and Limitations
65
+
66
+ <!-- This section is meant to convey both technical and sociotechnical limitations. -->
67
+
68
+ [More Information Needed]
69
+
70
+ ### Recommendations
71
+
72
+ <!-- This section is meant to convey recommendations with respect to the bias, risk, and technical limitations. -->
73
+
74
+ Users (both direct and downstream) should be made aware of the risks, biases and limitations of the model. More information needed for further recommendations.
75
+
76
+ ## How to Get Started with the Model
77
+
78
+ Use the code below to get started with the model.
79
+
80
+ [More Information Needed]
81
+
82
+ ## Training Details
83
+
84
+ ### Training Data
85
+
86
+ <!-- This should link to a Dataset Card, perhaps with a short stub of information on what the training data is all about as well as documentation related to data pre-processing or additional filtering. -->
87
+
88
+ [More Information Needed]
89
+
90
+ ### Training Procedure
91
+
92
+ <!-- This relates heavily to the Technical Specifications. Content here should link to that section when it is relevant to the training procedure. -->
93
+
94
+ #### Preprocessing [optional]
95
+
96
+ [More Information Needed]
97
+
98
+
99
+ #### Training Hyperparameters
100
+
101
+ - **Training regime:** [More Information Needed] <!--fp32, fp16 mixed precision, bf16 mixed precision, bf16 non-mixed precision, fp16 non-mixed precision, fp8 mixed precision -->
102
+
103
+ #### Speeds, Sizes, Times [optional]
104
+
105
+ <!-- This section provides information about throughput, start/end time, checkpoint size if relevant, etc. -->
106
+
107
+ [More Information Needed]
108
+
109
+ ## Evaluation
110
+
111
+ <!-- This section describes the evaluation protocols and provides the results. -->
112
+
113
+ ### Testing Data, Factors & Metrics
114
+
115
+ #### Testing Data
116
+
117
+ <!-- This should link to a Dataset Card if possible. -->
118
+
119
+ [More Information Needed]
120
+
121
+ #### Factors
122
+
123
+ <!-- These are the things the evaluation is disaggregating by, e.g., subpopulations or domains. -->
124
+
125
+ [More Information Needed]
126
+
127
+ #### Metrics
128
+
129
+ <!-- These are the evaluation metrics being used, ideally with a description of why. -->
130
+
131
+ [More Information Needed]
132
+
133
+ ### Results
134
+
135
+ [More Information Needed]
136
+
137
+ #### Summary
138
+
139
+
140
+
141
+ ## Model Examination [optional]
142
+
143
+ <!-- Relevant interpretability work for the model goes here -->
144
+
145
+ [More Information Needed]
146
+
147
+ ## Environmental Impact
148
+
149
+ <!-- Total emissions (in grams of CO2eq) and additional considerations, such as electricity usage, go here. Edit the suggested text below accordingly -->
150
+
151
+ Carbon emissions can be estimated using the [Machine Learning Impact calculator](https://mlco2.github.io/impact#compute) presented in [Lacoste et al. (2019)](https://arxiv.org/abs/1910.09700).
152
+
153
+ - **Hardware Type:** [More Information Needed]
154
+ - **Hours used:** [More Information Needed]
155
+ - **Cloud Provider:** [More Information Needed]
156
+ - **Compute Region:** [More Information Needed]
157
+ - **Carbon Emitted:** [More Information Needed]
158
+
159
+ ## Technical Specifications [optional]
160
+
161
+ ### Model Architecture and Objective
162
+
163
+ [More Information Needed]
164
+
165
+ ### Compute Infrastructure
166
+
167
+ [More Information Needed]
168
+
169
+ #### Hardware
170
+
171
+ [More Information Needed]
172
+
173
+ #### Software
174
+
175
+ [More Information Needed]
176
+
177
+ ## Citation [optional]
178
+
179
+ <!-- If there is a paper or blog post introducing the model, the APA and Bibtex information for that should go in this section. -->
180
+
181
+ **BibTeX:**
182
+
183
+ [More Information Needed]
184
+
185
+ **APA:**
186
+
187
+ [More Information Needed]
188
+
189
+ ## Glossary [optional]
190
+
191
+ <!-- If relevant, include terms and calculations in this section that can help readers understand the model or model card. -->
192
+
193
+ [More Information Needed]
194
+
195
+ ## More Information [optional]
196
+
197
+ [More Information Needed]
198
+
199
+ ## Model Card Authors [optional]
200
+
201
+ [More Information Needed]
202
+
203
+ ## Model Card Contact
204
+
205
+ [More Information Needed]
206
+ ### Framework versions
207
+
208
+ - PEFT 0.18.1
checkpoint-1300/adapter_config.json ADDED
@@ -0,0 +1,127 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "alora_invocation_tokens": null,
3
+ "alpha_pattern": {},
4
+ "arrow_config": null,
5
+ "auto_mapping": null,
6
+ "base_model_name_or_path": "Qwen/Qwen2.5-VL-7B-Instruct",
7
+ "bias": "none",
8
+ "corda_config": null,
9
+ "ensure_weight_tying": false,
10
+ "eva_config": null,
11
+ "exclude_modules": null,
12
+ "fan_in_fan_out": false,
13
+ "inference_mode": true,
14
+ "init_lora_weights": true,
15
+ "layer_replication": null,
16
+ "layers_pattern": null,
17
+ "layers_to_transform": null,
18
+ "loftq_config": {},
19
+ "lora_alpha": 128,
20
+ "lora_bias": false,
21
+ "lora_dropout": 0.05,
22
+ "megatron_config": null,
23
+ "megatron_core": "megatron.core",
24
+ "modules_to_save": null,
25
+ "peft_type": "LORA",
26
+ "peft_version": "0.18.1",
27
+ "qalora_group_size": 16,
28
+ "r": 64,
29
+ "rank_pattern": {},
30
+ "revision": null,
31
+ "target_modules": [
32
+ "layers.9.mlp.up_proj",
33
+ "layers.26.mlp.gate_proj",
34
+ "layers.11.mlp.gate_proj",
35
+ "layers.7.mlp.gate_proj",
36
+ "layers.5.mlp.up_proj",
37
+ "layers.11.mlp.down_proj",
38
+ "layers.22.mlp.down_proj",
39
+ "layers.15.mlp.down_proj",
40
+ "layers.4.mlp.gate_proj",
41
+ "layers.18.mlp.gate_proj",
42
+ "layers.3.mlp.gate_proj",
43
+ "layers.22.mlp.up_proj",
44
+ "layers.14.mlp.gate_proj",
45
+ "layers.15.mlp.up_proj",
46
+ "layers.27.mlp.up_proj",
47
+ "layers.19.mlp.up_proj",
48
+ "layers.13.mlp.down_proj",
49
+ "layers.13.mlp.up_proj",
50
+ "layers.17.mlp.up_proj",
51
+ "layers.2.mlp.down_proj",
52
+ "layers.27.mlp.down_proj",
53
+ "layers.8.mlp.gate_proj",
54
+ "layers.0.mlp.gate_proj",
55
+ "layers.3.mlp.down_proj",
56
+ "layers.5.mlp.gate_proj",
57
+ "layers.4.mlp.up_proj",
58
+ "layers.23.mlp.up_proj",
59
+ "layers.10.mlp.gate_proj",
60
+ "layers.25.mlp.up_proj",
61
+ "layers.18.mlp.down_proj",
62
+ "layers.25.mlp.gate_proj",
63
+ "layers.24.mlp.down_proj",
64
+ "layers.16.mlp.up_proj",
65
+ "layers.16.mlp.down_proj",
66
+ "layers.11.mlp.up_proj",
67
+ "layers.6.mlp.gate_proj",
68
+ "layers.26.mlp.up_proj",
69
+ "layers.20.mlp.down_proj",
70
+ "layers.12.mlp.up_proj",
71
+ "layers.24.mlp.gate_proj",
72
+ "k_proj",
73
+ "layers.21.mlp.down_proj",
74
+ "layers.13.mlp.gate_proj",
75
+ "layers.20.mlp.up_proj",
76
+ "layers.18.mlp.up_proj",
77
+ "layers.9.mlp.gate_proj",
78
+ "layers.15.mlp.gate_proj",
79
+ "layers.27.mlp.gate_proj",
80
+ "layers.6.mlp.up_proj",
81
+ "layers.7.mlp.down_proj",
82
+ "layers.23.mlp.gate_proj",
83
+ "q_proj",
84
+ "layers.22.mlp.gate_proj",
85
+ "layers.26.mlp.down_proj",
86
+ "layers.17.mlp.gate_proj",
87
+ "layers.1.mlp.down_proj",
88
+ "layers.12.mlp.gate_proj",
89
+ "layers.17.mlp.down_proj",
90
+ "layers.7.mlp.up_proj",
91
+ "layers.19.mlp.gate_proj",
92
+ "layers.3.mlp.up_proj",
93
+ "layers.0.mlp.up_proj",
94
+ "layers.19.mlp.down_proj",
95
+ "layers.8.mlp.up_proj",
96
+ "o_proj",
97
+ "layers.5.mlp.down_proj",
98
+ "layers.23.mlp.down_proj",
99
+ "layers.25.mlp.down_proj",
100
+ "layers.0.mlp.down_proj",
101
+ "layers.1.mlp.up_proj",
102
+ "layers.10.mlp.down_proj",
103
+ "layers.1.mlp.gate_proj",
104
+ "layers.16.mlp.gate_proj",
105
+ "v_proj",
106
+ "layers.2.mlp.up_proj",
107
+ "layers.6.mlp.down_proj",
108
+ "layers.14.mlp.down_proj",
109
+ "layers.9.mlp.down_proj",
110
+ "layers.20.mlp.gate_proj",
111
+ "layers.10.mlp.up_proj",
112
+ "layers.4.mlp.down_proj",
113
+ "layers.21.mlp.up_proj",
114
+ "layers.14.mlp.up_proj",
115
+ "layers.8.mlp.down_proj",
116
+ "layers.24.mlp.up_proj",
117
+ "layers.2.mlp.gate_proj",
118
+ "layers.21.mlp.gate_proj",
119
+ "layers.12.mlp.down_proj"
120
+ ],
121
+ "target_parameters": null,
122
+ "task_type": "CAUSAL_LM",
123
+ "trainable_token_indices": null,
124
+ "use_dora": false,
125
+ "use_qalora": false,
126
+ "use_rslora": false
127
+ }
checkpoint-1300/adapter_model.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:a12b670909e8ec91a552773e057b4cabcc87df8325bcca39e4eb6a5f44c6a0a6
3
+ size 645981584
checkpoint-1300/chat_template.jinja ADDED
@@ -0,0 +1,7 @@
 
 
 
 
 
 
 
 
1
+ {% set image_count = namespace(value=0) %}{% set video_count = namespace(value=0) %}{% for message in messages %}{% if loop.first and message['role'] != 'system' %}<|im_start|>system
2
+ You are a helpful assistant.<|im_end|>
3
+ {% endif %}<|im_start|>{{ message['role'] }}
4
+ {% if message['content'] is string %}{{ message['content'] }}<|im_end|>
5
+ {% else %}{% for content in message['content'] %}{% if content['type'] == 'image' or 'image' in content or 'image_url' in content %}{% set image_count.value = image_count.value + 1 %}{% if add_vision_id %}Picture {{ image_count.value }}: {% endif %}<|vision_start|><|image_pad|><|vision_end|>{% elif content['type'] == 'video' or 'video' in content %}{% set video_count.value = video_count.value + 1 %}{% if add_vision_id %}Video {{ video_count.value }}: {% endif %}<|vision_start|><|video_pad|><|vision_end|>{% elif 'text' in content %}{{ content['text'] }}{% endif %}{% endfor %}<|im_end|>
6
+ {% endif %}{% endfor %}{% if add_generation_prompt %}<|im_start|>assistant
7
+ {% endif %}
checkpoint-1300/optimizer.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:907d3e0ce1338d0dd38466f7ba09b5d32dde5e768728cdbc2d8142c5752d3be3
3
+ size 1292176234
checkpoint-1300/processor_config.json ADDED
@@ -0,0 +1,63 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "image_processor": {
3
+ "data_format": "channels_first",
4
+ "do_convert_rgb": true,
5
+ "do_normalize": true,
6
+ "do_rescale": true,
7
+ "do_resize": true,
8
+ "image_mean": [
9
+ 0.48145466,
10
+ 0.4578275,
11
+ 0.40821073
12
+ ],
13
+ "image_processor_type": "Qwen2VLImageProcessorFast",
14
+ "image_std": [
15
+ 0.26862954,
16
+ 0.26130258,
17
+ 0.27577711
18
+ ],
19
+ "merge_size": 2,
20
+ "patch_size": 14,
21
+ "resample": 3,
22
+ "rescale_factor": 0.00392156862745098,
23
+ "size": {
24
+ "longest_edge": 12845056,
25
+ "shortest_edge": 3136
26
+ },
27
+ "temporal_patch_size": 2
28
+ },
29
+ "processor_class": "Qwen2_5_VLProcessor",
30
+ "video_processor": {
31
+ "data_format": "channels_first",
32
+ "default_to_square": true,
33
+ "do_convert_rgb": true,
34
+ "do_normalize": true,
35
+ "do_rescale": true,
36
+ "do_resize": true,
37
+ "do_sample_frames": false,
38
+ "image_mean": [
39
+ 0.48145466,
40
+ 0.4578275,
41
+ 0.40821073
42
+ ],
43
+ "image_processor_type": "Qwen2VLImageProcessor",
44
+ "image_std": [
45
+ 0.26862954,
46
+ 0.26130258,
47
+ 0.27577711
48
+ ],
49
+ "max_frames": 768,
50
+ "merge_size": 2,
51
+ "min_frames": 4,
52
+ "patch_size": 14,
53
+ "resample": 3,
54
+ "rescale_factor": 0.00392156862745098,
55
+ "return_metadata": false,
56
+ "size": {
57
+ "longest_edge": 12845056,
58
+ "shortest_edge": 3136
59
+ },
60
+ "temporal_patch_size": 2,
61
+ "video_processor_type": "Qwen2VLVideoProcessor"
62
+ }
63
+ }
checkpoint-1300/rng_state.pth ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:2c007b8c46529bfec9c1720caae32f726e24c0c9428547874d516118c380b527
3
+ size 14244
checkpoint-1300/scheduler.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:4d3f4add932db57be28cf66f8035b1efa01988674b5e2de2f653ded19a9b35e4
3
+ size 1064
checkpoint-1300/tokenizer.json ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:3fd169731d2cbde95e10bf356d66d5997fd885dd8dbb6fb4684da3f23b2585d8
3
+ size 11421892
checkpoint-1300/tokenizer_config.json ADDED
@@ -0,0 +1,31 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "add_prefix_space": false,
3
+ "backend": "tokenizers",
4
+ "bos_token": null,
5
+ "clean_up_tokenization_spaces": false,
6
+ "eos_token": "<|im_end|>",
7
+ "errors": "replace",
8
+ "extra_special_tokens": [
9
+ "<|im_start|>",
10
+ "<|im_end|>",
11
+ "<|object_ref_start|>",
12
+ "<|object_ref_end|>",
13
+ "<|box_start|>",
14
+ "<|box_end|>",
15
+ "<|quad_start|>",
16
+ "<|quad_end|>",
17
+ "<|vision_start|>",
18
+ "<|vision_end|>",
19
+ "<|vision_pad|>",
20
+ "<|image_pad|>",
21
+ "<|video_pad|>"
22
+ ],
23
+ "is_local": false,
24
+ "model_max_length": 131072,
25
+ "pad_token": "<|endoftext|>",
26
+ "padding_side": "right",
27
+ "processor_class": "Qwen2_5_VLProcessor",
28
+ "split_special_tokens": false,
29
+ "tokenizer_class": "Qwen2Tokenizer",
30
+ "unk_token": null
31
+ }
checkpoint-1300/trainer_state.json ADDED
The diff for this file is too large to render. See raw diff
 
checkpoint-1300/training_args.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:0742392223bf62bf3e233a68f09ba267cf039dfafb723ee8590bd8f637eaecfb
3
+ size 5176
checkpoint-1388/README.md ADDED
@@ -0,0 +1,208 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ ---
2
+ base_model: Qwen/Qwen2.5-VL-7B-Instruct
3
+ library_name: peft
4
+ pipeline_tag: text-generation
5
+ tags:
6
+ - base_model:adapter:Qwen/Qwen2.5-VL-7B-Instruct
7
+ - llama-factory
8
+ - lora
9
+ - transformers
10
+ ---
11
+
12
+ # Model Card for Model ID
13
+
14
+ <!-- Provide a quick summary of what the model is/does. -->
15
+
16
+
17
+
18
+ ## Model Details
19
+
20
+ ### Model Description
21
+
22
+ <!-- Provide a longer summary of what this model is. -->
23
+
24
+
25
+
26
+ - **Developed by:** [More Information Needed]
27
+ - **Funded by [optional]:** [More Information Needed]
28
+ - **Shared by [optional]:** [More Information Needed]
29
+ - **Model type:** [More Information Needed]
30
+ - **Language(s) (NLP):** [More Information Needed]
31
+ - **License:** [More Information Needed]
32
+ - **Finetuned from model [optional]:** [More Information Needed]
33
+
34
+ ### Model Sources [optional]
35
+
36
+ <!-- Provide the basic links for the model. -->
37
+
38
+ - **Repository:** [More Information Needed]
39
+ - **Paper [optional]:** [More Information Needed]
40
+ - **Demo [optional]:** [More Information Needed]
41
+
42
+ ## Uses
43
+
44
+ <!-- Address questions around how the model is intended to be used, including the foreseeable users of the model and those affected by the model. -->
45
+
46
+ ### Direct Use
47
+
48
+ <!-- This section is for the model use without fine-tuning or plugging into a larger ecosystem/app. -->
49
+
50
+ [More Information Needed]
51
+
52
+ ### Downstream Use [optional]
53
+
54
+ <!-- This section is for the model use when fine-tuned for a task, or when plugged into a larger ecosystem/app -->
55
+
56
+ [More Information Needed]
57
+
58
+ ### Out-of-Scope Use
59
+
60
+ <!-- This section addresses misuse, malicious use, and uses that the model will not work well for. -->
61
+
62
+ [More Information Needed]
63
+
64
+ ## Bias, Risks, and Limitations
65
+
66
+ <!-- This section is meant to convey both technical and sociotechnical limitations. -->
67
+
68
+ [More Information Needed]
69
+
70
+ ### Recommendations
71
+
72
+ <!-- This section is meant to convey recommendations with respect to the bias, risk, and technical limitations. -->
73
+
74
+ Users (both direct and downstream) should be made aware of the risks, biases and limitations of the model. More information needed for further recommendations.
75
+
76
+ ## How to Get Started with the Model
77
+
78
+ Use the code below to get started with the model.
79
+
80
+ [More Information Needed]
81
+
82
+ ## Training Details
83
+
84
+ ### Training Data
85
+
86
+ <!-- This should link to a Dataset Card, perhaps with a short stub of information on what the training data is all about as well as documentation related to data pre-processing or additional filtering. -->
87
+
88
+ [More Information Needed]
89
+
90
+ ### Training Procedure
91
+
92
+ <!-- This relates heavily to the Technical Specifications. Content here should link to that section when it is relevant to the training procedure. -->
93
+
94
+ #### Preprocessing [optional]
95
+
96
+ [More Information Needed]
97
+
98
+
99
+ #### Training Hyperparameters
100
+
101
+ - **Training regime:** [More Information Needed] <!--fp32, fp16 mixed precision, bf16 mixed precision, bf16 non-mixed precision, fp16 non-mixed precision, fp8 mixed precision -->
102
+
103
+ #### Speeds, Sizes, Times [optional]
104
+
105
+ <!-- This section provides information about throughput, start/end time, checkpoint size if relevant, etc. -->
106
+
107
+ [More Information Needed]
108
+
109
+ ## Evaluation
110
+
111
+ <!-- This section describes the evaluation protocols and provides the results. -->
112
+
113
+ ### Testing Data, Factors & Metrics
114
+
115
+ #### Testing Data
116
+
117
+ <!-- This should link to a Dataset Card if possible. -->
118
+
119
+ [More Information Needed]
120
+
121
+ #### Factors
122
+
123
+ <!-- These are the things the evaluation is disaggregating by, e.g., subpopulations or domains. -->
124
+
125
+ [More Information Needed]
126
+
127
+ #### Metrics
128
+
129
+ <!-- These are the evaluation metrics being used, ideally with a description of why. -->
130
+
131
+ [More Information Needed]
132
+
133
+ ### Results
134
+
135
+ [More Information Needed]
136
+
137
+ #### Summary
138
+
139
+
140
+
141
+ ## Model Examination [optional]
142
+
143
+ <!-- Relevant interpretability work for the model goes here -->
144
+
145
+ [More Information Needed]
146
+
147
+ ## Environmental Impact
148
+
149
+ <!-- Total emissions (in grams of CO2eq) and additional considerations, such as electricity usage, go here. Edit the suggested text below accordingly -->
150
+
151
+ Carbon emissions can be estimated using the [Machine Learning Impact calculator](https://mlco2.github.io/impact#compute) presented in [Lacoste et al. (2019)](https://arxiv.org/abs/1910.09700).
152
+
153
+ - **Hardware Type:** [More Information Needed]
154
+ - **Hours used:** [More Information Needed]
155
+ - **Cloud Provider:** [More Information Needed]
156
+ - **Compute Region:** [More Information Needed]
157
+ - **Carbon Emitted:** [More Information Needed]
158
+
159
+ ## Technical Specifications [optional]
160
+
161
+ ### Model Architecture and Objective
162
+
163
+ [More Information Needed]
164
+
165
+ ### Compute Infrastructure
166
+
167
+ [More Information Needed]
168
+
169
+ #### Hardware
170
+
171
+ [More Information Needed]
172
+
173
+ #### Software
174
+
175
+ [More Information Needed]
176
+
177
+ ## Citation [optional]
178
+
179
+ <!-- If there is a paper or blog post introducing the model, the APA and Bibtex information for that should go in this section. -->
180
+
181
+ **BibTeX:**
182
+
183
+ [More Information Needed]
184
+
185
+ **APA:**
186
+
187
+ [More Information Needed]
188
+
189
+ ## Glossary [optional]
190
+
191
+ <!-- If relevant, include terms and calculations in this section that can help readers understand the model or model card. -->
192
+
193
+ [More Information Needed]
194
+
195
+ ## More Information [optional]
196
+
197
+ [More Information Needed]
198
+
199
+ ## Model Card Authors [optional]
200
+
201
+ [More Information Needed]
202
+
203
+ ## Model Card Contact
204
+
205
+ [More Information Needed]
206
+ ### Framework versions
207
+
208
+ - PEFT 0.18.1
checkpoint-1388/adapter_config.json ADDED
@@ -0,0 +1,127 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "alora_invocation_tokens": null,
3
+ "alpha_pattern": {},
4
+ "arrow_config": null,
5
+ "auto_mapping": null,
6
+ "base_model_name_or_path": "Qwen/Qwen2.5-VL-7B-Instruct",
7
+ "bias": "none",
8
+ "corda_config": null,
9
+ "ensure_weight_tying": false,
10
+ "eva_config": null,
11
+ "exclude_modules": null,
12
+ "fan_in_fan_out": false,
13
+ "inference_mode": true,
14
+ "init_lora_weights": true,
15
+ "layer_replication": null,
16
+ "layers_pattern": null,
17
+ "layers_to_transform": null,
18
+ "loftq_config": {},
19
+ "lora_alpha": 128,
20
+ "lora_bias": false,
21
+ "lora_dropout": 0.05,
22
+ "megatron_config": null,
23
+ "megatron_core": "megatron.core",
24
+ "modules_to_save": null,
25
+ "peft_type": "LORA",
26
+ "peft_version": "0.18.1",
27
+ "qalora_group_size": 16,
28
+ "r": 64,
29
+ "rank_pattern": {},
30
+ "revision": null,
31
+ "target_modules": [
32
+ "layers.9.mlp.up_proj",
33
+ "layers.26.mlp.gate_proj",
34
+ "layers.11.mlp.gate_proj",
35
+ "layers.7.mlp.gate_proj",
36
+ "layers.5.mlp.up_proj",
37
+ "layers.11.mlp.down_proj",
38
+ "layers.22.mlp.down_proj",
39
+ "layers.15.mlp.down_proj",
40
+ "layers.4.mlp.gate_proj",
41
+ "layers.18.mlp.gate_proj",
42
+ "layers.3.mlp.gate_proj",
43
+ "layers.22.mlp.up_proj",
44
+ "layers.14.mlp.gate_proj",
45
+ "layers.15.mlp.up_proj",
46
+ "layers.27.mlp.up_proj",
47
+ "layers.19.mlp.up_proj",
48
+ "layers.13.mlp.down_proj",
49
+ "layers.13.mlp.up_proj",
50
+ "layers.17.mlp.up_proj",
51
+ "layers.2.mlp.down_proj",
52
+ "layers.27.mlp.down_proj",
53
+ "layers.8.mlp.gate_proj",
54
+ "layers.0.mlp.gate_proj",
55
+ "layers.3.mlp.down_proj",
56
+ "layers.5.mlp.gate_proj",
57
+ "layers.4.mlp.up_proj",
58
+ "layers.23.mlp.up_proj",
59
+ "layers.10.mlp.gate_proj",
60
+ "layers.25.mlp.up_proj",
61
+ "layers.18.mlp.down_proj",
62
+ "layers.25.mlp.gate_proj",
63
+ "layers.24.mlp.down_proj",
64
+ "layers.16.mlp.up_proj",
65
+ "layers.16.mlp.down_proj",
66
+ "layers.11.mlp.up_proj",
67
+ "layers.6.mlp.gate_proj",
68
+ "layers.26.mlp.up_proj",
69
+ "layers.20.mlp.down_proj",
70
+ "layers.12.mlp.up_proj",
71
+ "layers.24.mlp.gate_proj",
72
+ "k_proj",
73
+ "layers.21.mlp.down_proj",
74
+ "layers.13.mlp.gate_proj",
75
+ "layers.20.mlp.up_proj",
76
+ "layers.18.mlp.up_proj",
77
+ "layers.9.mlp.gate_proj",
78
+ "layers.15.mlp.gate_proj",
79
+ "layers.27.mlp.gate_proj",
80
+ "layers.6.mlp.up_proj",
81
+ "layers.7.mlp.down_proj",
82
+ "layers.23.mlp.gate_proj",
83
+ "q_proj",
84
+ "layers.22.mlp.gate_proj",
85
+ "layers.26.mlp.down_proj",
86
+ "layers.17.mlp.gate_proj",
87
+ "layers.1.mlp.down_proj",
88
+ "layers.12.mlp.gate_proj",
89
+ "layers.17.mlp.down_proj",
90
+ "layers.7.mlp.up_proj",
91
+ "layers.19.mlp.gate_proj",
92
+ "layers.3.mlp.up_proj",
93
+ "layers.0.mlp.up_proj",
94
+ "layers.19.mlp.down_proj",
95
+ "layers.8.mlp.up_proj",
96
+ "o_proj",
97
+ "layers.5.mlp.down_proj",
98
+ "layers.23.mlp.down_proj",
99
+ "layers.25.mlp.down_proj",
100
+ "layers.0.mlp.down_proj",
101
+ "layers.1.mlp.up_proj",
102
+ "layers.10.mlp.down_proj",
103
+ "layers.1.mlp.gate_proj",
104
+ "layers.16.mlp.gate_proj",
105
+ "v_proj",
106
+ "layers.2.mlp.up_proj",
107
+ "layers.6.mlp.down_proj",
108
+ "layers.14.mlp.down_proj",
109
+ "layers.9.mlp.down_proj",
110
+ "layers.20.mlp.gate_proj",
111
+ "layers.10.mlp.up_proj",
112
+ "layers.4.mlp.down_proj",
113
+ "layers.21.mlp.up_proj",
114
+ "layers.14.mlp.up_proj",
115
+ "layers.8.mlp.down_proj",
116
+ "layers.24.mlp.up_proj",
117
+ "layers.2.mlp.gate_proj",
118
+ "layers.21.mlp.gate_proj",
119
+ "layers.12.mlp.down_proj"
120
+ ],
121
+ "target_parameters": null,
122
+ "task_type": "CAUSAL_LM",
123
+ "trainable_token_indices": null,
124
+ "use_dora": false,
125
+ "use_qalora": false,
126
+ "use_rslora": false
127
+ }
checkpoint-1388/adapter_model.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:99989965bee7500af2705e7939be60be62bf4fb6710d0482710af7a07a4e0e5e
3
+ size 645981584
checkpoint-1388/chat_template.jinja ADDED
@@ -0,0 +1,7 @@
 
 
 
 
 
 
 
 
1
+ {% set image_count = namespace(value=0) %}{% set video_count = namespace(value=0) %}{% for message in messages %}{% if loop.first and message['role'] != 'system' %}<|im_start|>system
2
+ You are a helpful assistant.<|im_end|>
3
+ {% endif %}<|im_start|>{{ message['role'] }}
4
+ {% if message['content'] is string %}{{ message['content'] }}<|im_end|>
5
+ {% else %}{% for content in message['content'] %}{% if content['type'] == 'image' or 'image' in content or 'image_url' in content %}{% set image_count.value = image_count.value + 1 %}{% if add_vision_id %}Picture {{ image_count.value }}: {% endif %}<|vision_start|><|image_pad|><|vision_end|>{% elif content['type'] == 'video' or 'video' in content %}{% set video_count.value = video_count.value + 1 %}{% if add_vision_id %}Video {{ video_count.value }}: {% endif %}<|vision_start|><|video_pad|><|vision_end|>{% elif 'text' in content %}{{ content['text'] }}{% endif %}{% endfor %}<|im_end|>
6
+ {% endif %}{% endfor %}{% if add_generation_prompt %}<|im_start|>assistant
7
+ {% endif %}
checkpoint-1388/optimizer.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:17d1e94b9fd6c0ecaf7f0f316b014008e63f23d40fb2401c1bf7cb4bd870665c
3
+ size 1292176234
checkpoint-1388/processor_config.json ADDED
@@ -0,0 +1,63 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "image_processor": {
3
+ "data_format": "channels_first",
4
+ "do_convert_rgb": true,
5
+ "do_normalize": true,
6
+ "do_rescale": true,
7
+ "do_resize": true,
8
+ "image_mean": [
9
+ 0.48145466,
10
+ 0.4578275,
11
+ 0.40821073
12
+ ],
13
+ "image_processor_type": "Qwen2VLImageProcessorFast",
14
+ "image_std": [
15
+ 0.26862954,
16
+ 0.26130258,
17
+ 0.27577711
18
+ ],
19
+ "merge_size": 2,
20
+ "patch_size": 14,
21
+ "resample": 3,
22
+ "rescale_factor": 0.00392156862745098,
23
+ "size": {
24
+ "longest_edge": 12845056,
25
+ "shortest_edge": 3136
26
+ },
27
+ "temporal_patch_size": 2
28
+ },
29
+ "processor_class": "Qwen2_5_VLProcessor",
30
+ "video_processor": {
31
+ "data_format": "channels_first",
32
+ "default_to_square": true,
33
+ "do_convert_rgb": true,
34
+ "do_normalize": true,
35
+ "do_rescale": true,
36
+ "do_resize": true,
37
+ "do_sample_frames": false,
38
+ "image_mean": [
39
+ 0.48145466,
40
+ 0.4578275,
41
+ 0.40821073
42
+ ],
43
+ "image_processor_type": "Qwen2VLImageProcessor",
44
+ "image_std": [
45
+ 0.26862954,
46
+ 0.26130258,
47
+ 0.27577711
48
+ ],
49
+ "max_frames": 768,
50
+ "merge_size": 2,
51
+ "min_frames": 4,
52
+ "patch_size": 14,
53
+ "resample": 3,
54
+ "rescale_factor": 0.00392156862745098,
55
+ "return_metadata": false,
56
+ "size": {
57
+ "longest_edge": 12845056,
58
+ "shortest_edge": 3136
59
+ },
60
+ "temporal_patch_size": 2,
61
+ "video_processor_type": "Qwen2VLVideoProcessor"
62
+ }
63
+ }
checkpoint-1388/rng_state.pth ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:fde47c12c783fddaab2b60f8d617e42db9837ed7a3e6232b98d4fb5d313414d3
3
+ size 14244
checkpoint-1388/scheduler.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:d21a998ea052e5537e9308629e2889dd950e4bc958983b7ef5ef4692756deff2
3
+ size 1064
checkpoint-1388/tokenizer.json ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:3fd169731d2cbde95e10bf356d66d5997fd885dd8dbb6fb4684da3f23b2585d8
3
+ size 11421892
checkpoint-1388/tokenizer_config.json ADDED
@@ -0,0 +1,31 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "add_prefix_space": false,
3
+ "backend": "tokenizers",
4
+ "bos_token": null,
5
+ "clean_up_tokenization_spaces": false,
6
+ "eos_token": "<|im_end|>",
7
+ "errors": "replace",
8
+ "extra_special_tokens": [
9
+ "<|im_start|>",
10
+ "<|im_end|>",
11
+ "<|object_ref_start|>",
12
+ "<|object_ref_end|>",
13
+ "<|box_start|>",
14
+ "<|box_end|>",
15
+ "<|quad_start|>",
16
+ "<|quad_end|>",
17
+ "<|vision_start|>",
18
+ "<|vision_end|>",
19
+ "<|vision_pad|>",
20
+ "<|image_pad|>",
21
+ "<|video_pad|>"
22
+ ],
23
+ "is_local": false,
24
+ "model_max_length": 131072,
25
+ "pad_token": "<|endoftext|>",
26
+ "padding_side": "right",
27
+ "processor_class": "Qwen2_5_VLProcessor",
28
+ "split_special_tokens": false,
29
+ "tokenizer_class": "Qwen2Tokenizer",
30
+ "unk_token": null
31
+ }
checkpoint-1388/trainer_state.json ADDED
The diff for this file is too large to render. See raw diff
 
checkpoint-1388/training_args.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:0742392223bf62bf3e233a68f09ba267cf039dfafb723ee8590bd8f637eaecfb
3
+ size 5176
processor_config.json ADDED
@@ -0,0 +1,63 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "image_processor": {
3
+ "data_format": "channels_first",
4
+ "do_convert_rgb": true,
5
+ "do_normalize": true,
6
+ "do_rescale": true,
7
+ "do_resize": true,
8
+ "image_mean": [
9
+ 0.48145466,
10
+ 0.4578275,
11
+ 0.40821073
12
+ ],
13
+ "image_processor_type": "Qwen2VLImageProcessorFast",
14
+ "image_std": [
15
+ 0.26862954,
16
+ 0.26130258,
17
+ 0.27577711
18
+ ],
19
+ "merge_size": 2,
20
+ "patch_size": 14,
21
+ "resample": 3,
22
+ "rescale_factor": 0.00392156862745098,
23
+ "size": {
24
+ "longest_edge": 12845056,
25
+ "shortest_edge": 3136
26
+ },
27
+ "temporal_patch_size": 2
28
+ },
29
+ "processor_class": "Qwen2_5_VLProcessor",
30
+ "video_processor": {
31
+ "data_format": "channels_first",
32
+ "default_to_square": true,
33
+ "do_convert_rgb": true,
34
+ "do_normalize": true,
35
+ "do_rescale": true,
36
+ "do_resize": true,
37
+ "do_sample_frames": false,
38
+ "image_mean": [
39
+ 0.48145466,
40
+ 0.4578275,
41
+ 0.40821073
42
+ ],
43
+ "image_processor_type": "Qwen2VLImageProcessor",
44
+ "image_std": [
45
+ 0.26862954,
46
+ 0.26130258,
47
+ 0.27577711
48
+ ],
49
+ "max_frames": 768,
50
+ "merge_size": 2,
51
+ "min_frames": 4,
52
+ "patch_size": 14,
53
+ "resample": 3,
54
+ "rescale_factor": 0.00392156862745098,
55
+ "return_metadata": false,
56
+ "size": {
57
+ "longest_edge": 12845056,
58
+ "shortest_edge": 3136
59
+ },
60
+ "temporal_patch_size": 2,
61
+ "video_processor_type": "Qwen2VLVideoProcessor"
62
+ }
63
+ }
tokenizer.json ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:3fd169731d2cbde95e10bf356d66d5997fd885dd8dbb6fb4684da3f23b2585d8
3
+ size 11421892
tokenizer_config.json ADDED
@@ -0,0 +1,31 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "add_prefix_space": false,
3
+ "backend": "tokenizers",
4
+ "bos_token": null,
5
+ "clean_up_tokenization_spaces": false,
6
+ "eos_token": "<|im_end|>",
7
+ "errors": "replace",
8
+ "extra_special_tokens": [
9
+ "<|im_start|>",
10
+ "<|im_end|>",
11
+ "<|object_ref_start|>",
12
+ "<|object_ref_end|>",
13
+ "<|box_start|>",
14
+ "<|box_end|>",
15
+ "<|quad_start|>",
16
+ "<|quad_end|>",
17
+ "<|vision_start|>",
18
+ "<|vision_end|>",
19
+ "<|vision_pad|>",
20
+ "<|image_pad|>",
21
+ "<|video_pad|>"
22
+ ],
23
+ "is_local": false,
24
+ "model_max_length": 131072,
25
+ "pad_token": "<|endoftext|>",
26
+ "padding_side": "right",
27
+ "processor_class": "Qwen2_5_VLProcessor",
28
+ "split_special_tokens": false,
29
+ "tokenizer_class": "Qwen2Tokenizer",
30
+ "unk_token": null
31
+ }
train_results.json ADDED
@@ -0,0 +1,8 @@
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "epoch": 2.0,
3
+ "total_flos": 1.0037139745307361e+18,
4
+ "train_loss": 0.7883986402571374,
5
+ "train_runtime": 11184.8694,
6
+ "train_samples_per_second": 0.496,
7
+ "train_steps_per_second": 0.124
8
+ }
trainer_log.jsonl ADDED
The diff for this file is too large to render. See raw diff
 
trainer_state.json ADDED
The diff for this file is too large to render. See raw diff
 
training_args.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:0742392223bf62bf3e233a68f09ba267cf039dfafb723ee8590bd8f637eaecfb
3
+ size 5176
training_loss.png ADDED