A-Mahla HF Staff commited on
Commit
cba23e4
·
verified ·
1 Parent(s): 677741e

Model save

Browse files
README.md CHANGED
@@ -1,13 +1,9 @@
1
  ---
2
  base_model: Qwen/Qwen2.5-VL-3B-Instruct
3
- datasets: smolagents/aguvis-stage-2
4
  library_name: transformers
5
  model_name: Qwen2.5-VL-3B-Instruct-Agentic-GUI
6
  tags:
7
  - generated_from_trainer
8
- - open-r1
9
- - vision-language
10
- - vlm
11
  - trl
12
  - sft
13
  licence: license
@@ -15,7 +11,7 @@ licence: license
15
 
16
  # Model Card for Qwen2.5-VL-3B-Instruct-Agentic-GUI
17
 
18
- This model is a fine-tuned version of [Qwen/Qwen2.5-VL-3B-Instruct](https://huggingface.co/Qwen/Qwen2.5-VL-3B-Instruct) on the [smolagents/aguvis-stage-2](https://huggingface.co/datasets/smolagents/aguvis-stage-2) dataset.
19
  It has been trained using [TRL](https://github.com/huggingface/trl).
20
 
21
  ## Quick start
@@ -31,7 +27,7 @@ print(output["generated_text"])
31
 
32
  ## Training procedure
33
 
34
- [<img src="https://raw.githubusercontent.com/wandb/assets/main/wandb-github-badge-28.svg" alt="Visualize in Weights & Biases" width="150" height="24"/>](https://wandb.ai/huggingface/smolagents/runs/7y8mgnns)
35
 
36
 
37
  This model was trained with SFT.
 
1
  ---
2
  base_model: Qwen/Qwen2.5-VL-3B-Instruct
 
3
  library_name: transformers
4
  model_name: Qwen2.5-VL-3B-Instruct-Agentic-GUI
5
  tags:
6
  - generated_from_trainer
 
 
 
7
  - trl
8
  - sft
9
  licence: license
 
11
 
12
  # Model Card for Qwen2.5-VL-3B-Instruct-Agentic-GUI
13
 
14
+ This model is a fine-tuned version of [Qwen/Qwen2.5-VL-3B-Instruct](https://huggingface.co/Qwen/Qwen2.5-VL-3B-Instruct).
15
  It has been trained using [TRL](https://github.com/huggingface/trl).
16
 
17
  ## Quick start
 
27
 
28
  ## Training procedure
29
 
30
+ [<img src="https://raw.githubusercontent.com/wandb/assets/main/wandb-github-badge-28.svg" alt="Visualize in Weights & Biases" width="150" height="24"/>](https://wandb.ai/huggingface/smolagents/runs/6le3ndu5)
31
 
32
 
33
  This model was trained with SFT.
all_results.json CHANGED
@@ -5,9 +5,9 @@
5
  "eval_samples_per_second": 12.121,
6
  "eval_steps_per_second": 0.38,
7
  "total_flos": 1.2125984924893184e+16,
8
- "train_loss": 0.645972225476395,
9
- "train_runtime": 88419.8411,
10
  "train_samples": 360252,
11
- "train_samples_per_second": 4.074,
12
- "train_steps_per_second": 0.008
13
  }
 
5
  "eval_samples_per_second": 12.121,
6
  "eval_steps_per_second": 0.38,
7
  "total_flos": 1.2125984924893184e+16,
8
+ "train_loss": 0.0,
9
+ "train_runtime": 1.4965,
10
  "train_samples": 360252,
11
+ "train_samples_per_second": 240725.021,
12
+ "train_steps_per_second": 470.422
13
  }
config.json CHANGED
@@ -5,13 +5,9 @@
5
  "attention_dropout": 0.0,
6
  "bos_token_id": 151643,
7
  "eos_token_id": 151645,
8
- "vision_start_token_id": 151652,
9
- "vision_end_token_id": 151653,
10
- "vision_token_id": 151654,
11
- "image_token_id": 151655,
12
- "video_token_id": 151656,
13
  "hidden_act": "silu",
14
  "hidden_size": 2048,
 
15
  "initializer_range": 0.02,
16
  "intermediate_size": 11008,
17
  "max_position_embeddings": 128000,
@@ -21,41 +17,89 @@
21
  "num_hidden_layers": 36,
22
  "num_key_value_heads": 2,
23
  "rms_norm_eps": 1e-06,
 
 
 
 
 
 
 
 
 
24
  "rope_theta": 1000000.0,
25
  "sliding_window": 32768,
26
- "tie_word_embeddings": true,
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
27
  "torch_dtype": "bfloat16",
28
- "transformers_version": "4.41.2",
29
- "use_cache": true,
30
  "use_sliding_window": false,
 
31
  "vision_config": {
32
  "depth": 32,
 
 
 
 
 
 
33
  "hidden_act": "silu",
34
  "hidden_size": 1280,
 
 
 
35
  "intermediate_size": 3420,
 
36
  "num_heads": 16,
37
- "in_chans": 3,
38
  "out_hidden_size": 2048,
39
  "patch_size": 14,
40
  "spatial_merge_size": 2,
41
  "spatial_patch_size": 14,
42
- "window_size": 112,
43
- "fullatt_block_indexes": [
44
- 7,
45
- 15,
46
- 23,
47
- 31
48
- ],
49
  "tokens_per_second": 2,
50
- "temporal_patch_size": 2
51
- },
52
- "rope_scaling": {
53
- "type": "mrope",
54
- "mrope_section": [
55
- 16,
56
- 24,
57
- 24
58
- ]
59
  },
 
 
 
60
  "vocab_size": 151936
61
- }
 
5
  "attention_dropout": 0.0,
6
  "bos_token_id": 151643,
7
  "eos_token_id": 151645,
 
 
 
 
 
8
  "hidden_act": "silu",
9
  "hidden_size": 2048,
10
+ "image_token_id": 151655,
11
  "initializer_range": 0.02,
12
  "intermediate_size": 11008,
13
  "max_position_embeddings": 128000,
 
17
  "num_hidden_layers": 36,
18
  "num_key_value_heads": 2,
19
  "rms_norm_eps": 1e-06,
20
+ "rope_scaling": {
21
+ "mrope_section": [
22
+ 16,
23
+ 24,
24
+ 24
25
+ ],
26
+ "rope_type": "default",
27
+ "type": "default"
28
+ },
29
  "rope_theta": 1000000.0,
30
  "sliding_window": 32768,
31
+ "text_config": {
32
+ "architectures": [
33
+ "Qwen2_5_VLForConditionalGeneration"
34
+ ],
35
+ "attention_dropout": 0.0,
36
+ "bos_token_id": 151643,
37
+ "eos_token_id": 151645,
38
+ "hidden_act": "silu",
39
+ "hidden_size": 2048,
40
+ "image_token_id": null,
41
+ "initializer_range": 0.02,
42
+ "intermediate_size": 11008,
43
+ "max_position_embeddings": 128000,
44
+ "max_window_layers": 70,
45
+ "model_type": "qwen2_5_vl_text",
46
+ "num_attention_heads": 16,
47
+ "num_hidden_layers": 36,
48
+ "num_key_value_heads": 2,
49
+ "rms_norm_eps": 1e-06,
50
+ "rope_scaling": {
51
+ "mrope_section": [
52
+ 16,
53
+ 24,
54
+ 24
55
+ ],
56
+ "rope_type": "default",
57
+ "type": "default"
58
+ },
59
+ "rope_theta": 1000000.0,
60
+ "sliding_window": 32768,
61
+ "tie_word_embeddings": true,
62
+ "torch_dtype": "bfloat16",
63
+ "use_cache": true,
64
+ "use_sliding_window": false,
65
+ "video_token_id": null,
66
+ "vision_end_token_id": 151653,
67
+ "vision_start_token_id": 151652,
68
+ "vision_token_id": 151654,
69
+ "vocab_size": 151936
70
+ },
71
  "torch_dtype": "bfloat16",
72
+ "transformers_version": "4.52.3",
73
+ "use_cache": false,
74
  "use_sliding_window": false,
75
+ "video_token_id": 151656,
76
  "vision_config": {
77
  "depth": 32,
78
+ "fullatt_block_indexes": [
79
+ 7,
80
+ 15,
81
+ 23,
82
+ 31
83
+ ],
84
  "hidden_act": "silu",
85
  "hidden_size": 1280,
86
+ "in_channels": 3,
87
+ "in_chans": 3,
88
+ "initializer_range": 0.02,
89
  "intermediate_size": 3420,
90
+ "model_type": "qwen2_5_vl",
91
  "num_heads": 16,
 
92
  "out_hidden_size": 2048,
93
  "patch_size": 14,
94
  "spatial_merge_size": 2,
95
  "spatial_patch_size": 14,
96
+ "temporal_patch_size": 2,
 
 
 
 
 
 
97
  "tokens_per_second": 2,
98
+ "torch_dtype": "bfloat16",
99
+ "window_size": 112
 
 
 
 
 
 
 
100
  },
101
+ "vision_end_token_id": 151653,
102
+ "vision_start_token_id": 151652,
103
+ "vision_token_id": 151654,
104
  "vocab_size": 151936
105
+ }
model-00001-of-00002.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:f6fe409f01b313692f8fc9bf506320a5c7b9ed2d303aff08eef15b69ce82e9e4
3
- size 4997750728
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:c0bd1bf2cdf09d2aba3c8913a60dffeae4c7e482ec4a7109b5283c72b75ba007
3
+ size 4997756664
model-00002-of-00002.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:84db7fa01549bbd8c5e5be9331d00a837d5b874cca1c05f967072c2fefa61c05
3
- size 2511587152
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:464b852d99ffe18b4ab4fbf725c2b3d95ae58db3d6390d3a191ca55799407cbf
3
+ size 2511590128
model.safetensors.index.json CHANGED
The diff for this file is too large to render. See raw diff
 
tokenizer_config.json CHANGED
@@ -1,209 +1,207 @@
1
  {
2
- "add_bos_token": false,
3
- "add_prefix_space": false,
4
- "added_tokens_decoder": {
5
- "151643": {
6
- "content": "<|endoftext|>",
7
- "lstrip": false,
8
- "normalized": false,
9
- "rstrip": false,
10
- "single_word": false,
11
- "special": true
12
- },
13
- "151644": {
14
- "content": "<|im_start|>",
15
- "lstrip": false,
16
- "normalized": false,
17
- "rstrip": false,
18
- "single_word": false,
19
- "special": true
20
- },
21
- "151645": {
22
- "content": "<|im_end|>",
23
- "lstrip": false,
24
- "normalized": false,
25
- "rstrip": false,
26
- "single_word": false,
27
- "special": true
28
- },
29
- "151646": {
30
- "content": "<|object_ref_start|>",
31
- "lstrip": false,
32
- "normalized": false,
33
- "rstrip": false,
34
- "single_word": false,
35
- "special": true
36
- },
37
- "151647": {
38
- "content": "<|object_ref_end|>",
39
- "lstrip": false,
40
- "normalized": false,
41
- "rstrip": false,
42
- "single_word": false,
43
- "special": true
44
- },
45
- "151648": {
46
- "content": "<|box_start|>",
47
- "lstrip": false,
48
- "normalized": false,
49
- "rstrip": false,
50
- "single_word": false,
51
- "special": true
52
- },
53
- "151649": {
54
- "content": "<|box_end|>",
55
- "lstrip": false,
56
- "normalized": false,
57
- "rstrip": false,
58
- "single_word": false,
59
- "special": true
60
- },
61
- "151650": {
62
- "content": "<|quad_start|>",
63
- "lstrip": false,
64
- "normalized": false,
65
- "rstrip": false,
66
- "single_word": false,
67
- "special": true
68
- },
69
- "151651": {
70
- "content": "<|quad_end|>",
71
- "lstrip": false,
72
- "normalized": false,
73
- "rstrip": false,
74
- "single_word": false,
75
- "special": true
76
- },
77
- "151652": {
78
- "content": "<|vision_start|>",
79
- "lstrip": false,
80
- "normalized": false,
81
- "rstrip": false,
82
- "single_word": false,
83
- "special": true
84
- },
85
- "151653": {
86
- "content": "<|vision_end|>",
87
- "lstrip": false,
88
- "normalized": false,
89
- "rstrip": false,
90
- "single_word": false,
91
- "special": true
92
- },
93
- "151654": {
94
- "content": "<|vision_pad|>",
95
- "lstrip": false,
96
- "normalized": false,
97
- "rstrip": false,
98
- "single_word": false,
99
- "special": true
100
- },
101
- "151655": {
102
- "content": "<|image_pad|>",
103
- "lstrip": false,
104
- "normalized": false,
105
- "rstrip": false,
106
- "single_word": false,
107
- "special": true
108
- },
109
- "151656": {
110
- "content": "<|video_pad|>",
111
- "lstrip": false,
112
- "normalized": false,
113
- "rstrip": false,
114
- "single_word": false,
115
- "special": true
116
- },
117
- "151657": {
118
- "content": "<tool_call>",
119
- "lstrip": false,
120
- "normalized": false,
121
- "rstrip": false,
122
- "single_word": false,
123
- "special": false
124
- },
125
- "151658": {
126
- "content": "</tool_call>",
127
- "lstrip": false,
128
- "normalized": false,
129
- "rstrip": false,
130
- "single_word": false,
131
- "special": false
132
- },
133
- "151659": {
134
- "content": "<|fim_prefix|>",
135
- "lstrip": false,
136
- "normalized": false,
137
- "rstrip": false,
138
- "single_word": false,
139
- "special": false
140
- },
141
- "151660": {
142
- "content": "<|fim_middle|>",
143
- "lstrip": false,
144
- "normalized": false,
145
- "rstrip": false,
146
- "single_word": false,
147
- "special": false
148
- },
149
- "151661": {
150
- "content": "<|fim_suffix|>",
151
- "lstrip": false,
152
- "normalized": false,
153
- "rstrip": false,
154
- "single_word": false,
155
- "special": false
156
- },
157
- "151662": {
158
- "content": "<|fim_pad|>",
159
- "lstrip": false,
160
- "normalized": false,
161
- "rstrip": false,
162
- "single_word": false,
163
- "special": false
164
- },
165
- "151663": {
166
- "content": "<|repo_name|>",
167
- "lstrip": false,
168
- "normalized": false,
169
- "rstrip": false,
170
- "single_word": false,
171
- "special": false
172
- },
173
- "151664": {
174
- "content": "<|file_sep|>",
175
- "lstrip": false,
176
- "normalized": false,
177
- "rstrip": false,
178
- "single_word": false,
179
- "special": false
180
- }
181
- },
182
- "additional_special_tokens": [
183
- "<|im_start|>",
184
- "<|im_end|>",
185
- "<|object_ref_start|>",
186
- "<|object_ref_end|>",
187
- "<|box_start|>",
188
- "<|box_end|>",
189
- "<|quad_start|>",
190
- "<|quad_end|>",
191
- "<|vision_start|>",
192
- "<|vision_end|>",
193
- "<|vision_pad|>",
194
- "<|image_pad|>",
195
- "<|video_pad|>"
196
- ],
197
- "bos_token": null,
198
- "clean_up_tokenization_spaces": false,
199
- "eos_token": "<|im_end|>",
200
- "errors": "replace",
201
- "extra_special_tokens": {},
202
- "model_max_length": 131072,
203
- "pad_token": "<|endoftext|>",
204
- "processor_class": "Qwen2_5_VLProcessor",
205
- "split_special_tokens": false,
206
- "tokenizer_class": "Qwen2Tokenizer",
207
- "unk_token": null,
208
- "chat_template": "{% set image_count = namespace(value=0) %}{% set video_count = namespace(value=0) %}{% for message in messages %}{% if loop.first and message['role'] != 'system' %}<|im_start|>system\nYou are a helpful assistant.<|im_end|>\n{% endif %}<|im_start|>{{ message['role'] }}\n{% if message['content'] is string %}{{ message['content'] }}<|im_end|>\n{% else %}{% for content in message['content'] %}{% if content['type'] == 'image' or 'image' in content or 'image_url' in content %}{% set image_count.value = image_count.value + 1 %}{% if add_vision_id %}Picture {{ image_count.value }}: {% endif %}<|vision_start|><|image_pad|><|vision_end|>{% elif content['type'] == 'video' or 'video' in content %}{% set video_count.value = video_count.value + 1 %}{% if add_vision_id %}Video {{ video_count.value }}: {% endif %}<|vision_start|><|video_pad|><|vision_end|>{% elif 'text' in content %}{{ content['text'] }}{% endif %}{% endfor %}<|im_end|>\n{% endif %}{% endfor %}{% if add_generation_prompt %}<|im_start|>assistant\n{% endif %}"
209
- }
 
1
  {
2
+ "add_bos_token": false,
3
+ "add_prefix_space": false,
4
+ "added_tokens_decoder": {
5
+ "151643": {
6
+ "content": "<|endoftext|>",
7
+ "lstrip": false,
8
+ "normalized": false,
9
+ "rstrip": false,
10
+ "single_word": false,
11
+ "special": true
12
+ },
13
+ "151644": {
14
+ "content": "<|im_start|>",
15
+ "lstrip": false,
16
+ "normalized": false,
17
+ "rstrip": false,
18
+ "single_word": false,
19
+ "special": true
20
+ },
21
+ "151645": {
22
+ "content": "<|im_end|>",
23
+ "lstrip": false,
24
+ "normalized": false,
25
+ "rstrip": false,
26
+ "single_word": false,
27
+ "special": true
28
+ },
29
+ "151646": {
30
+ "content": "<|object_ref_start|>",
31
+ "lstrip": false,
32
+ "normalized": false,
33
+ "rstrip": false,
34
+ "single_word": false,
35
+ "special": true
36
+ },
37
+ "151647": {
38
+ "content": "<|object_ref_end|>",
39
+ "lstrip": false,
40
+ "normalized": false,
41
+ "rstrip": false,
42
+ "single_word": false,
43
+ "special": true
44
+ },
45
+ "151648": {
46
+ "content": "<|box_start|>",
47
+ "lstrip": false,
48
+ "normalized": false,
49
+ "rstrip": false,
50
+ "single_word": false,
51
+ "special": true
52
+ },
53
+ "151649": {
54
+ "content": "<|box_end|>",
55
+ "lstrip": false,
56
+ "normalized": false,
57
+ "rstrip": false,
58
+ "single_word": false,
59
+ "special": true
60
+ },
61
+ "151650": {
62
+ "content": "<|quad_start|>",
63
+ "lstrip": false,
64
+ "normalized": false,
65
+ "rstrip": false,
66
+ "single_word": false,
67
+ "special": true
68
+ },
69
+ "151651": {
70
+ "content": "<|quad_end|>",
71
+ "lstrip": false,
72
+ "normalized": false,
73
+ "rstrip": false,
74
+ "single_word": false,
75
+ "special": true
76
+ },
77
+ "151652": {
78
+ "content": "<|vision_start|>",
79
+ "lstrip": false,
80
+ "normalized": false,
81
+ "rstrip": false,
82
+ "single_word": false,
83
+ "special": true
84
+ },
85
+ "151653": {
86
+ "content": "<|vision_end|>",
87
+ "lstrip": false,
88
+ "normalized": false,
89
+ "rstrip": false,
90
+ "single_word": false,
91
+ "special": true
92
+ },
93
+ "151654": {
94
+ "content": "<|vision_pad|>",
95
+ "lstrip": false,
96
+ "normalized": false,
97
+ "rstrip": false,
98
+ "single_word": false,
99
+ "special": true
100
+ },
101
+ "151655": {
102
+ "content": "<|image_pad|>",
103
+ "lstrip": false,
104
+ "normalized": false,
105
+ "rstrip": false,
106
+ "single_word": false,
107
+ "special": true
108
+ },
109
+ "151656": {
110
+ "content": "<|video_pad|>",
111
+ "lstrip": false,
112
+ "normalized": false,
113
+ "rstrip": false,
114
+ "single_word": false,
115
+ "special": true
116
+ },
117
+ "151657": {
118
+ "content": "<tool_call>",
119
+ "lstrip": false,
120
+ "normalized": false,
121
+ "rstrip": false,
122
+ "single_word": false,
123
+ "special": false
124
+ },
125
+ "151658": {
126
+ "content": "</tool_call>",
127
+ "lstrip": false,
128
+ "normalized": false,
129
+ "rstrip": false,
130
+ "single_word": false,
131
+ "special": false
132
+ },
133
+ "151659": {
134
+ "content": "<|fim_prefix|>",
135
+ "lstrip": false,
136
+ "normalized": false,
137
+ "rstrip": false,
138
+ "single_word": false,
139
+ "special": false
140
+ },
141
+ "151660": {
142
+ "content": "<|fim_middle|>",
143
+ "lstrip": false,
144
+ "normalized": false,
145
+ "rstrip": false,
146
+ "single_word": false,
147
+ "special": false
148
+ },
149
+ "151661": {
150
+ "content": "<|fim_suffix|>",
151
+ "lstrip": false,
152
+ "normalized": false,
153
+ "rstrip": false,
154
+ "single_word": false,
155
+ "special": false
156
+ },
157
+ "151662": {
158
+ "content": "<|fim_pad|>",
159
+ "lstrip": false,
160
+ "normalized": false,
161
+ "rstrip": false,
162
+ "single_word": false,
163
+ "special": false
164
+ },
165
+ "151663": {
166
+ "content": "<|repo_name|>",
167
+ "lstrip": false,
168
+ "normalized": false,
169
+ "rstrip": false,
170
+ "single_word": false,
171
+ "special": false
172
+ },
173
+ "151664": {
174
+ "content": "<|file_sep|>",
175
+ "lstrip": false,
176
+ "normalized": false,
177
+ "rstrip": false,
178
+ "single_word": false,
179
+ "special": false
180
+ }
181
+ },
182
+ "additional_special_tokens": [
183
+ "<|im_start|>",
184
+ "<|im_end|>",
185
+ "<|object_ref_start|>",
186
+ "<|object_ref_end|>",
187
+ "<|box_start|>",
188
+ "<|box_end|>",
189
+ "<|quad_start|>",
190
+ "<|quad_end|>",
191
+ "<|vision_start|>",
192
+ "<|vision_end|>",
193
+ "<|vision_pad|>",
194
+ "<|image_pad|>",
195
+ "<|video_pad|>"
196
+ ],
197
+ "bos_token": null,
198
+ "clean_up_tokenization_spaces": false,
199
+ "eos_token": "<|im_end|>",
200
+ "errors": "replace",
201
+ "extra_special_tokens": {},
202
+ "model_max_length": 131072,
203
+ "pad_token": "<|endoftext|>",
204
+ "split_special_tokens": false,
205
+ "tokenizer_class": "Qwen2Tokenizer",
206
+ "unk_token": null
207
+ }
 
 
train_results.json CHANGED
@@ -1,8 +1,8 @@
1
  {
2
  "total_flos": 1.2125984924893184e+16,
3
- "train_loss": 0.645972225476395,
4
- "train_runtime": 88419.8411,
5
  "train_samples": 360252,
6
- "train_samples_per_second": 4.074,
7
- "train_steps_per_second": 0.008
8
  }
 
1
  {
2
  "total_flos": 1.2125984924893184e+16,
3
+ "train_loss": 0.0,
4
+ "train_runtime": 1.4965,
5
  "train_samples": 360252,
6
+ "train_samples_per_second": 240725.021,
7
+ "train_steps_per_second": 470.422
8
  }
trainer_state.json CHANGED
@@ -1341,14 +1341,12 @@
1341
  },
1342
  {
1343
  "epoch": 1.0,
1344
- "mean_token_accuracy": 0.8058657122069391,
1345
- "num_tokens": 834374055.0,
1346
  "step": 704,
1347
  "total_flos": 1.2125984924893184e+16,
1348
- "train_loss": 0.645972225476395,
1349
- "train_runtime": 88419.8411,
1350
- "train_samples_per_second": 4.074,
1351
- "train_steps_per_second": 0.008
1352
  }
1353
  ],
1354
  "logging_steps": 5,
 
1341
  },
1342
  {
1343
  "epoch": 1.0,
 
 
1344
  "step": 704,
1345
  "total_flos": 1.2125984924893184e+16,
1346
+ "train_loss": 0.0,
1347
+ "train_runtime": 1.4965,
1348
+ "train_samples_per_second": 240725.021,
1349
+ "train_steps_per_second": 470.422
1350
  }
1351
  ],
1352
  "logging_steps": 5,
training_args.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:75510d220562276768a262cdef788e60d531dcda3cc93519d59555c01f5d8f88
3
  size 7416
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:9200a5447fbc68c080f36c064447506ad8c2651fb30799814fe17b6d621ddb08
3
  size 7416