Upload folder using huggingface_hub
Browse files- .gitattributes +3 -0
- README.md +63 -0
- adapter_config.json +42 -0
- adapter_model.safetensors +3 -0
- chat_template.jinja +154 -0
- checkpoint-500/README.md +210 -0
- checkpoint-500/adapter_config.json +42 -0
- checkpoint-500/adapter_model.safetensors +3 -0
- checkpoint-500/chat_template.jinja +154 -0
- checkpoint-500/optimizer.pt +3 -0
- checkpoint-500/processor_config.json +63 -0
- checkpoint-500/rng_state.pth +3 -0
- checkpoint-500/scheduler.pt +3 -0
- checkpoint-500/tokenizer.json +3 -0
- checkpoint-500/tokenizer_config.json +33 -0
- checkpoint-500/trainer_state.json +3534 -0
- checkpoint-500/training_args.bin +3 -0
- checkpoint-770/README.md +210 -0
- checkpoint-770/adapter_config.json +42 -0
- checkpoint-770/adapter_model.safetensors +3 -0
- checkpoint-770/chat_template.jinja +154 -0
- checkpoint-770/optimizer.pt +3 -0
- checkpoint-770/processor_config.json +63 -0
- checkpoint-770/rng_state.pth +3 -0
- checkpoint-770/scheduler.pt +3 -0
- checkpoint-770/tokenizer.json +3 -0
- checkpoint-770/tokenizer_config.json +33 -0
- checkpoint-770/trainer_state.json +0 -0
- checkpoint-770/training_args.bin +3 -0
- eval.json +601 -0
- eval.md +63 -0
- predictions.jsonl +98 -0
- processor_config.json +63 -0
- tokenizer.json +3 -0
- tokenizer_config.json +33 -0
.gitattributes
CHANGED
|
@@ -33,3 +33,6 @@ saved_model/**/* filter=lfs diff=lfs merge=lfs -text
|
|
| 33 |
*.zip filter=lfs diff=lfs merge=lfs -text
|
| 34 |
*.zst filter=lfs diff=lfs merge=lfs -text
|
| 35 |
*tfevents* filter=lfs diff=lfs merge=lfs -text
|
|
|
|
|
|
|
|
|
|
|
|
| 33 |
*.zip filter=lfs diff=lfs merge=lfs -text
|
| 34 |
*.zst filter=lfs diff=lfs merge=lfs -text
|
| 35 |
*tfevents* filter=lfs diff=lfs merge=lfs -text
|
| 36 |
+
checkpoint-500/tokenizer.json filter=lfs diff=lfs merge=lfs -text
|
| 37 |
+
checkpoint-770/tokenizer.json filter=lfs diff=lfs merge=lfs -text
|
| 38 |
+
tokenizer.json filter=lfs diff=lfs merge=lfs -text
|
README.md
ADDED
|
@@ -0,0 +1,63 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
---
|
| 2 |
+
base_model: Qwen/Qwen3.5-9B
|
| 3 |
+
library_name: peft
|
| 4 |
+
model_name: v21_semantic_boundaries
|
| 5 |
+
tags:
|
| 6 |
+
- base_model:adapter:Qwen/Qwen3.5-9B
|
| 7 |
+
- lora
|
| 8 |
+
- sft
|
| 9 |
+
- transformers
|
| 10 |
+
- trl
|
| 11 |
+
- unsloth
|
| 12 |
+
licence: license
|
| 13 |
+
pipeline_tag: text-generation
|
| 14 |
+
---
|
| 15 |
+
|
| 16 |
+
# Model Card for v21_semantic_boundaries
|
| 17 |
+
|
| 18 |
+
This model is a fine-tuned version of [Qwen/Qwen3.5-9B](https://huggingface.co/Qwen/Qwen3.5-9B).
|
| 19 |
+
It has been trained using [TRL](https://github.com/huggingface/trl).
|
| 20 |
+
|
| 21 |
+
## Quick start
|
| 22 |
+
|
| 23 |
+
```python
|
| 24 |
+
from transformers import pipeline
|
| 25 |
+
|
| 26 |
+
question = "If you had a time machine, but could only go to the past or the future once and never return, which would you choose and why?"
|
| 27 |
+
generator = pipeline("text-generation", model="None", device="cuda")
|
| 28 |
+
output = generator([{"role": "user", "content": question}], max_new_tokens=128, return_full_text=False)[0]
|
| 29 |
+
print(output["generated_text"])
|
| 30 |
+
```
|
| 31 |
+
|
| 32 |
+
## Training procedure
|
| 33 |
+
|
| 34 |
+
|
| 35 |
+
|
| 36 |
+
|
| 37 |
+
This model was trained with SFT.
|
| 38 |
+
|
| 39 |
+
### Framework versions
|
| 40 |
+
|
| 41 |
+
- PEFT 0.18.1
|
| 42 |
+
- TRL: 0.24.0
|
| 43 |
+
- Transformers: 5.3.0
|
| 44 |
+
- Pytorch: 2.10.0
|
| 45 |
+
- Datasets: 4.6.1
|
| 46 |
+
- Tokenizers: 0.22.2
|
| 47 |
+
|
| 48 |
+
## Citations
|
| 49 |
+
|
| 50 |
+
|
| 51 |
+
|
| 52 |
+
Cite TRL as:
|
| 53 |
+
|
| 54 |
+
```bibtex
|
| 55 |
+
@misc{vonwerra2022trl,
|
| 56 |
+
title = {{TRL: Transformer Reinforcement Learning}},
|
| 57 |
+
author = {Leandro von Werra and Younes Belkada and Lewis Tunstall and Edward Beeching and Tristan Thrush and Nathan Lambert and Shengyi Huang and Kashif Rasul and Quentin Gallou{\'e}dec},
|
| 58 |
+
year = 2020,
|
| 59 |
+
journal = {GitHub repository},
|
| 60 |
+
publisher = {GitHub},
|
| 61 |
+
howpublished = {\url{https://github.com/huggingface/trl}}
|
| 62 |
+
}
|
| 63 |
+
```
|
adapter_config.json
ADDED
|
@@ -0,0 +1,42 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
{
|
| 2 |
+
"alora_invocation_tokens": null,
|
| 3 |
+
"alpha_pattern": {},
|
| 4 |
+
"arrow_config": null,
|
| 5 |
+
"auto_mapping": {
|
| 6 |
+
"base_model_class": "Qwen3_5ForConditionalGeneration",
|
| 7 |
+
"parent_library": "transformers.models.qwen3_5.modeling_qwen3_5",
|
| 8 |
+
"unsloth_fixed": true
|
| 9 |
+
},
|
| 10 |
+
"base_model_name_or_path": "Qwen/Qwen3.5-9B",
|
| 11 |
+
"bias": "none",
|
| 12 |
+
"corda_config": null,
|
| 13 |
+
"ensure_weight_tying": false,
|
| 14 |
+
"eva_config": null,
|
| 15 |
+
"exclude_modules": null,
|
| 16 |
+
"fan_in_fan_out": false,
|
| 17 |
+
"inference_mode": true,
|
| 18 |
+
"init_lora_weights": true,
|
| 19 |
+
"layer_replication": null,
|
| 20 |
+
"layers_pattern": null,
|
| 21 |
+
"layers_to_transform": null,
|
| 22 |
+
"loftq_config": {},
|
| 23 |
+
"lora_alpha": 16,
|
| 24 |
+
"lora_bias": false,
|
| 25 |
+
"lora_dropout": 0,
|
| 26 |
+
"megatron_config": null,
|
| 27 |
+
"megatron_core": "megatron.core",
|
| 28 |
+
"modules_to_save": null,
|
| 29 |
+
"peft_type": "LORA",
|
| 30 |
+
"peft_version": "0.18.1",
|
| 31 |
+
"qalora_group_size": 16,
|
| 32 |
+
"r": 16,
|
| 33 |
+
"rank_pattern": {},
|
| 34 |
+
"revision": null,
|
| 35 |
+
"target_modules": "(?:.*?(?:language|text).*?(?:self_attn|attention|attn|mlp|feed_forward|ffn|dense).*?(?:qkv|proj|linear_fc1|linear_fc2|out_proj|in_proj_qkv|in_proj_z|in_proj_b|in_proj_a|gate_proj|up_proj|down_proj|q_proj|k_proj|v_proj|o_proj).*?)|(?:\\bmodel\\.layers\\.[\\d]{1,}\\.(?:self_attn|attention|attn|mlp|feed_forward|ffn|dense)\\.(?:(?:qkv|proj|linear_fc1|linear_fc2|out_proj|in_proj_qkv|in_proj_z|in_proj_b|in_proj_a|gate_proj|up_proj|down_proj|q_proj|k_proj|v_proj|o_proj)))",
|
| 36 |
+
"target_parameters": null,
|
| 37 |
+
"task_type": "CAUSAL_LM",
|
| 38 |
+
"trainable_token_indices": null,
|
| 39 |
+
"use_dora": false,
|
| 40 |
+
"use_qalora": false,
|
| 41 |
+
"use_rslora": false
|
| 42 |
+
}
|
adapter_model.safetensors
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:8dc94603f0c6e625c9716499f91c5acf38deff4596e0ed2ca5fc3a4f5126806c
|
| 3 |
+
size 173188512
|
chat_template.jinja
ADDED
|
@@ -0,0 +1,154 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
{%- set image_count = namespace(value=0) %}
|
| 2 |
+
{%- set video_count = namespace(value=0) %}
|
| 3 |
+
{%- macro render_content(content, do_vision_count, is_system_content=false) %}
|
| 4 |
+
{%- if content is string %}
|
| 5 |
+
{{- content }}
|
| 6 |
+
{%- elif content is iterable and content is not mapping %}
|
| 7 |
+
{%- for item in content %}
|
| 8 |
+
{%- if 'image' in item or 'image_url' in item or item.type == 'image' %}
|
| 9 |
+
{%- if is_system_content %}
|
| 10 |
+
{{- raise_exception('System message cannot contain images.') }}
|
| 11 |
+
{%- endif %}
|
| 12 |
+
{%- if do_vision_count %}
|
| 13 |
+
{%- set image_count.value = image_count.value + 1 %}
|
| 14 |
+
{%- endif %}
|
| 15 |
+
{%- if add_vision_id %}
|
| 16 |
+
{{- 'Picture ' ~ image_count.value ~ ': ' }}
|
| 17 |
+
{%- endif %}
|
| 18 |
+
{{- '<|vision_start|><|image_pad|><|vision_end|>' }}
|
| 19 |
+
{%- elif 'video' in item or item.type == 'video' %}
|
| 20 |
+
{%- if is_system_content %}
|
| 21 |
+
{{- raise_exception('System message cannot contain videos.') }}
|
| 22 |
+
{%- endif %}
|
| 23 |
+
{%- if do_vision_count %}
|
| 24 |
+
{%- set video_count.value = video_count.value + 1 %}
|
| 25 |
+
{%- endif %}
|
| 26 |
+
{%- if add_vision_id %}
|
| 27 |
+
{{- 'Video ' ~ video_count.value ~ ': ' }}
|
| 28 |
+
{%- endif %}
|
| 29 |
+
{{- '<|vision_start|><|video_pad|><|vision_end|>' }}
|
| 30 |
+
{%- elif 'text' in item %}
|
| 31 |
+
{{- item.text }}
|
| 32 |
+
{%- else %}
|
| 33 |
+
{{- raise_exception('Unexpected item type in content.') }}
|
| 34 |
+
{%- endif %}
|
| 35 |
+
{%- endfor %}
|
| 36 |
+
{%- elif content is none or content is undefined %}
|
| 37 |
+
{{- '' }}
|
| 38 |
+
{%- else %}
|
| 39 |
+
{{- raise_exception('Unexpected content type.') }}
|
| 40 |
+
{%- endif %}
|
| 41 |
+
{%- endmacro %}
|
| 42 |
+
{%- if not messages %}
|
| 43 |
+
{{- raise_exception('No messages provided.') }}
|
| 44 |
+
{%- endif %}
|
| 45 |
+
{%- if tools and tools is iterable and tools is not mapping %}
|
| 46 |
+
{{- '<|im_start|>system\n' }}
|
| 47 |
+
{{- "# Tools\n\nYou have access to the following functions:\n\n<tools>" }}
|
| 48 |
+
{%- for tool in tools %}
|
| 49 |
+
{{- "\n" }}
|
| 50 |
+
{{- tool | tojson }}
|
| 51 |
+
{%- endfor %}
|
| 52 |
+
{{- "\n</tools>" }}
|
| 53 |
+
{{- '\n\nIf you choose to call a function ONLY reply in the following format with NO suffix:\n\n<tool_call>\n<function=example_function_name>\n<parameter=example_parameter_1>\nvalue_1\n</parameter>\n<parameter=example_parameter_2>\nThis is the value for the second parameter\nthat can span\nmultiple lines\n</parameter>\n</function>\n</tool_call>\n\n<IMPORTANT>\nReminder:\n- Function calls MUST follow the specified format: an inner <function=...></function> block must be nested within <tool_call></tool_call> XML tags\n- Required parameters MUST be specified\n- You may provide optional reasoning for your function call in natural language BEFORE the function call, but NOT after\n- If there is no function call available, answer the question like normal with your current knowledge and do not tell the user about function calls\n</IMPORTANT>' }}
|
| 54 |
+
{%- if messages[0].role == 'system' %}
|
| 55 |
+
{%- set content = render_content(messages[0].content, false, true)|trim %}
|
| 56 |
+
{%- if content %}
|
| 57 |
+
{{- '\n\n' + content }}
|
| 58 |
+
{%- endif %}
|
| 59 |
+
{%- endif %}
|
| 60 |
+
{{- '<|im_end|>\n' }}
|
| 61 |
+
{%- else %}
|
| 62 |
+
{%- if messages[0].role == 'system' %}
|
| 63 |
+
{%- set content = render_content(messages[0].content, false, true)|trim %}
|
| 64 |
+
{{- '<|im_start|>system\n' + content + '<|im_end|>\n' }}
|
| 65 |
+
{%- endif %}
|
| 66 |
+
{%- endif %}
|
| 67 |
+
{%- set ns = namespace(multi_step_tool=true, last_query_index=messages|length - 1) %}
|
| 68 |
+
{%- for message in messages[::-1] %}
|
| 69 |
+
{%- set index = (messages|length - 1) - loop.index0 %}
|
| 70 |
+
{%- if ns.multi_step_tool and message.role == "user" %}
|
| 71 |
+
{%- set content = render_content(message.content, false)|trim %}
|
| 72 |
+
{%- if not(content.startswith('<tool_response>') and content.endswith('</tool_response>')) %}
|
| 73 |
+
{%- set ns.multi_step_tool = false %}
|
| 74 |
+
{%- set ns.last_query_index = index %}
|
| 75 |
+
{%- endif %}
|
| 76 |
+
{%- endif %}
|
| 77 |
+
{%- endfor %}
|
| 78 |
+
{%- if ns.multi_step_tool %}
|
| 79 |
+
{{- raise_exception('No user query found in messages.') }}
|
| 80 |
+
{%- endif %}
|
| 81 |
+
{%- for message in messages %}
|
| 82 |
+
{%- set content = render_content(message.content, true)|trim %}
|
| 83 |
+
{%- if message.role == "system" %}
|
| 84 |
+
{%- if not loop.first %}
|
| 85 |
+
{{- raise_exception('System message must be at the beginning.') }}
|
| 86 |
+
{%- endif %}
|
| 87 |
+
{%- elif message.role == "user" %}
|
| 88 |
+
{{- '<|im_start|>' + message.role + '\n' + content + '<|im_end|>' + '\n' }}
|
| 89 |
+
{%- elif message.role == "assistant" %}
|
| 90 |
+
{%- set reasoning_content = '' %}
|
| 91 |
+
{%- if message.reasoning_content is string %}
|
| 92 |
+
{%- set reasoning_content = message.reasoning_content %}
|
| 93 |
+
{%- else %}
|
| 94 |
+
{%- if '</think>' in content %}
|
| 95 |
+
{%- set reasoning_content = content.split('</think>')[0].rstrip('\n').split('<think>')[-1].lstrip('\n') %}
|
| 96 |
+
{%- set content = content.split('</think>')[-1].lstrip('\n') %}
|
| 97 |
+
{%- endif %}
|
| 98 |
+
{%- endif %}
|
| 99 |
+
{%- set reasoning_content = reasoning_content|trim %}
|
| 100 |
+
{%- if loop.index0 > ns.last_query_index %}
|
| 101 |
+
{{- '<|im_start|>' + message.role + '\n<think>\n' + reasoning_content + '\n</think>\n\n' + content }}
|
| 102 |
+
{%- else %}
|
| 103 |
+
{{- '<|im_start|>' + message.role + '\n' + content }}
|
| 104 |
+
{%- endif %}
|
| 105 |
+
{%- if message.tool_calls and message.tool_calls is iterable and message.tool_calls is not mapping %}
|
| 106 |
+
{%- for tool_call in message.tool_calls %}
|
| 107 |
+
{%- if tool_call.function is defined %}
|
| 108 |
+
{%- set tool_call = tool_call.function %}
|
| 109 |
+
{%- endif %}
|
| 110 |
+
{%- if loop.first %}
|
| 111 |
+
{%- if content|trim %}
|
| 112 |
+
{{- '\n\n<tool_call>\n<function=' + tool_call.name + '>\n' }}
|
| 113 |
+
{%- else %}
|
| 114 |
+
{{- '<tool_call>\n<function=' + tool_call.name + '>\n' }}
|
| 115 |
+
{%- endif %}
|
| 116 |
+
{%- else %}
|
| 117 |
+
{{- '\n<tool_call>\n<function=' + tool_call.name + '>\n' }}
|
| 118 |
+
{%- endif %}
|
| 119 |
+
{%- if tool_call.arguments is defined %}
|
| 120 |
+
{%- for args_name, args_value in tool_call.arguments|items %}
|
| 121 |
+
{{- '<parameter=' + args_name + '>\n' }}
|
| 122 |
+
{%- set args_value = args_value | tojson | safe if args_value is mapping or (args_value is sequence and args_value is not string) else args_value | string %}
|
| 123 |
+
{{- args_value }}
|
| 124 |
+
{{- '\n</parameter>\n' }}
|
| 125 |
+
{%- endfor %}
|
| 126 |
+
{%- endif %}
|
| 127 |
+
{{- '</function>\n</tool_call>' }}
|
| 128 |
+
{%- endfor %}
|
| 129 |
+
{%- endif %}
|
| 130 |
+
{{- '<|im_end|>\n' }}
|
| 131 |
+
{%- elif message.role == "tool" %}
|
| 132 |
+
{%- if loop.previtem and loop.previtem.role != "tool" %}
|
| 133 |
+
{{- '<|im_start|>user' }}
|
| 134 |
+
{%- endif %}
|
| 135 |
+
{{- '\n<tool_response>\n' }}
|
| 136 |
+
{{- content }}
|
| 137 |
+
{{- '\n</tool_response>' }}
|
| 138 |
+
{%- if not loop.last and loop.nextitem.role != "tool" %}
|
| 139 |
+
{{- '<|im_end|>\n' }}
|
| 140 |
+
{%- elif loop.last %}
|
| 141 |
+
{{- '<|im_end|>\n' }}
|
| 142 |
+
{%- endif %}
|
| 143 |
+
{%- else %}
|
| 144 |
+
{{- raise_exception('Unexpected message role.') }}
|
| 145 |
+
{%- endif %}
|
| 146 |
+
{%- endfor %}
|
| 147 |
+
{%- if add_generation_prompt %}
|
| 148 |
+
{{- '<|im_start|>assistant\n' }}
|
| 149 |
+
{%- if enable_thinking is defined and enable_thinking is false %}
|
| 150 |
+
{{- '<think>\n\n</think>\n\n' }}
|
| 151 |
+
{%- else %}
|
| 152 |
+
{{- '<think>\n' }}
|
| 153 |
+
{%- endif %}
|
| 154 |
+
{%- endif %}
|
checkpoint-500/README.md
ADDED
|
@@ -0,0 +1,210 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
---
|
| 2 |
+
base_model: Qwen/Qwen3.5-9B
|
| 3 |
+
library_name: peft
|
| 4 |
+
pipeline_tag: text-generation
|
| 5 |
+
tags:
|
| 6 |
+
- base_model:adapter:Qwen/Qwen3.5-9B
|
| 7 |
+
- lora
|
| 8 |
+
- sft
|
| 9 |
+
- transformers
|
| 10 |
+
- trl
|
| 11 |
+
- unsloth
|
| 12 |
+
---
|
| 13 |
+
|
| 14 |
+
# Model Card for Model ID
|
| 15 |
+
|
| 16 |
+
<!-- Provide a quick summary of what the model is/does. -->
|
| 17 |
+
|
| 18 |
+
|
| 19 |
+
|
| 20 |
+
## Model Details
|
| 21 |
+
|
| 22 |
+
### Model Description
|
| 23 |
+
|
| 24 |
+
<!-- Provide a longer summary of what this model is. -->
|
| 25 |
+
|
| 26 |
+
|
| 27 |
+
|
| 28 |
+
- **Developed by:** [More Information Needed]
|
| 29 |
+
- **Funded by [optional]:** [More Information Needed]
|
| 30 |
+
- **Shared by [optional]:** [More Information Needed]
|
| 31 |
+
- **Model type:** [More Information Needed]
|
| 32 |
+
- **Language(s) (NLP):** [More Information Needed]
|
| 33 |
+
- **License:** [More Information Needed]
|
| 34 |
+
- **Finetuned from model [optional]:** [More Information Needed]
|
| 35 |
+
|
| 36 |
+
### Model Sources [optional]
|
| 37 |
+
|
| 38 |
+
<!-- Provide the basic links for the model. -->
|
| 39 |
+
|
| 40 |
+
- **Repository:** [More Information Needed]
|
| 41 |
+
- **Paper [optional]:** [More Information Needed]
|
| 42 |
+
- **Demo [optional]:** [More Information Needed]
|
| 43 |
+
|
| 44 |
+
## Uses
|
| 45 |
+
|
| 46 |
+
<!-- Address questions around how the model is intended to be used, including the foreseeable users of the model and those affected by the model. -->
|
| 47 |
+
|
| 48 |
+
### Direct Use
|
| 49 |
+
|
| 50 |
+
<!-- This section is for the model use without fine-tuning or plugging into a larger ecosystem/app. -->
|
| 51 |
+
|
| 52 |
+
[More Information Needed]
|
| 53 |
+
|
| 54 |
+
### Downstream Use [optional]
|
| 55 |
+
|
| 56 |
+
<!-- This section is for the model use when fine-tuned for a task, or when plugged into a larger ecosystem/app -->
|
| 57 |
+
|
| 58 |
+
[More Information Needed]
|
| 59 |
+
|
| 60 |
+
### Out-of-Scope Use
|
| 61 |
+
|
| 62 |
+
<!-- This section addresses misuse, malicious use, and uses that the model will not work well for. -->
|
| 63 |
+
|
| 64 |
+
[More Information Needed]
|
| 65 |
+
|
| 66 |
+
## Bias, Risks, and Limitations
|
| 67 |
+
|
| 68 |
+
<!-- This section is meant to convey both technical and sociotechnical limitations. -->
|
| 69 |
+
|
| 70 |
+
[More Information Needed]
|
| 71 |
+
|
| 72 |
+
### Recommendations
|
| 73 |
+
|
| 74 |
+
<!-- This section is meant to convey recommendations with respect to the bias, risk, and technical limitations. -->
|
| 75 |
+
|
| 76 |
+
Users (both direct and downstream) should be made aware of the risks, biases and limitations of the model. More information needed for further recommendations.
|
| 77 |
+
|
| 78 |
+
## How to Get Started with the Model
|
| 79 |
+
|
| 80 |
+
Use the code below to get started with the model.
|
| 81 |
+
|
| 82 |
+
[More Information Needed]
|
| 83 |
+
|
| 84 |
+
## Training Details
|
| 85 |
+
|
| 86 |
+
### Training Data
|
| 87 |
+
|
| 88 |
+
<!-- This should link to a Dataset Card, perhaps with a short stub of information on what the training data is all about as well as documentation related to data pre-processing or additional filtering. -->
|
| 89 |
+
|
| 90 |
+
[More Information Needed]
|
| 91 |
+
|
| 92 |
+
### Training Procedure
|
| 93 |
+
|
| 94 |
+
<!-- This relates heavily to the Technical Specifications. Content here should link to that section when it is relevant to the training procedure. -->
|
| 95 |
+
|
| 96 |
+
#### Preprocessing [optional]
|
| 97 |
+
|
| 98 |
+
[More Information Needed]
|
| 99 |
+
|
| 100 |
+
|
| 101 |
+
#### Training Hyperparameters
|
| 102 |
+
|
| 103 |
+
- **Training regime:** [More Information Needed] <!--fp32, fp16 mixed precision, bf16 mixed precision, bf16 non-mixed precision, fp16 non-mixed precision, fp8 mixed precision -->
|
| 104 |
+
|
| 105 |
+
#### Speeds, Sizes, Times [optional]
|
| 106 |
+
|
| 107 |
+
<!-- This section provides information about throughput, start/end time, checkpoint size if relevant, etc. -->
|
| 108 |
+
|
| 109 |
+
[More Information Needed]
|
| 110 |
+
|
| 111 |
+
## Evaluation
|
| 112 |
+
|
| 113 |
+
<!-- This section describes the evaluation protocols and provides the results. -->
|
| 114 |
+
|
| 115 |
+
### Testing Data, Factors & Metrics
|
| 116 |
+
|
| 117 |
+
#### Testing Data
|
| 118 |
+
|
| 119 |
+
<!-- This should link to a Dataset Card if possible. -->
|
| 120 |
+
|
| 121 |
+
[More Information Needed]
|
| 122 |
+
|
| 123 |
+
#### Factors
|
| 124 |
+
|
| 125 |
+
<!-- These are the things the evaluation is disaggregating by, e.g., subpopulations or domains. -->
|
| 126 |
+
|
| 127 |
+
[More Information Needed]
|
| 128 |
+
|
| 129 |
+
#### Metrics
|
| 130 |
+
|
| 131 |
+
<!-- These are the evaluation metrics being used, ideally with a description of why. -->
|
| 132 |
+
|
| 133 |
+
[More Information Needed]
|
| 134 |
+
|
| 135 |
+
### Results
|
| 136 |
+
|
| 137 |
+
[More Information Needed]
|
| 138 |
+
|
| 139 |
+
#### Summary
|
| 140 |
+
|
| 141 |
+
|
| 142 |
+
|
| 143 |
+
## Model Examination [optional]
|
| 144 |
+
|
| 145 |
+
<!-- Relevant interpretability work for the model goes here -->
|
| 146 |
+
|
| 147 |
+
[More Information Needed]
|
| 148 |
+
|
| 149 |
+
## Environmental Impact
|
| 150 |
+
|
| 151 |
+
<!-- Total emissions (in grams of CO2eq) and additional considerations, such as electricity usage, go here. Edit the suggested text below accordingly -->
|
| 152 |
+
|
| 153 |
+
Carbon emissions can be estimated using the [Machine Learning Impact calculator](https://mlco2.github.io/impact#compute) presented in [Lacoste et al. (2019)](https://arxiv.org/abs/1910.09700).
|
| 154 |
+
|
| 155 |
+
- **Hardware Type:** [More Information Needed]
|
| 156 |
+
- **Hours used:** [More Information Needed]
|
| 157 |
+
- **Cloud Provider:** [More Information Needed]
|
| 158 |
+
- **Compute Region:** [More Information Needed]
|
| 159 |
+
- **Carbon Emitted:** [More Information Needed]
|
| 160 |
+
|
| 161 |
+
## Technical Specifications [optional]
|
| 162 |
+
|
| 163 |
+
### Model Architecture and Objective
|
| 164 |
+
|
| 165 |
+
[More Information Needed]
|
| 166 |
+
|
| 167 |
+
### Compute Infrastructure
|
| 168 |
+
|
| 169 |
+
[More Information Needed]
|
| 170 |
+
|
| 171 |
+
#### Hardware
|
| 172 |
+
|
| 173 |
+
[More Information Needed]
|
| 174 |
+
|
| 175 |
+
#### Software
|
| 176 |
+
|
| 177 |
+
[More Information Needed]
|
| 178 |
+
|
| 179 |
+
## Citation [optional]
|
| 180 |
+
|
| 181 |
+
<!-- If there is a paper or blog post introducing the model, the APA and Bibtex information for that should go in this section. -->
|
| 182 |
+
|
| 183 |
+
**BibTeX:**
|
| 184 |
+
|
| 185 |
+
[More Information Needed]
|
| 186 |
+
|
| 187 |
+
**APA:**
|
| 188 |
+
|
| 189 |
+
[More Information Needed]
|
| 190 |
+
|
| 191 |
+
## Glossary [optional]
|
| 192 |
+
|
| 193 |
+
<!-- If relevant, include terms and calculations in this section that can help readers understand the model or model card. -->
|
| 194 |
+
|
| 195 |
+
[More Information Needed]
|
| 196 |
+
|
| 197 |
+
## More Information [optional]
|
| 198 |
+
|
| 199 |
+
[More Information Needed]
|
| 200 |
+
|
| 201 |
+
## Model Card Authors [optional]
|
| 202 |
+
|
| 203 |
+
[More Information Needed]
|
| 204 |
+
|
| 205 |
+
## Model Card Contact
|
| 206 |
+
|
| 207 |
+
[More Information Needed]
|
| 208 |
+
### Framework versions
|
| 209 |
+
|
| 210 |
+
- PEFT 0.18.1
|
checkpoint-500/adapter_config.json
ADDED
|
@@ -0,0 +1,42 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
{
|
| 2 |
+
"alora_invocation_tokens": null,
|
| 3 |
+
"alpha_pattern": {},
|
| 4 |
+
"arrow_config": null,
|
| 5 |
+
"auto_mapping": {
|
| 6 |
+
"base_model_class": "Qwen3_5ForConditionalGeneration",
|
| 7 |
+
"parent_library": "transformers.models.qwen3_5.modeling_qwen3_5",
|
| 8 |
+
"unsloth_fixed": true
|
| 9 |
+
},
|
| 10 |
+
"base_model_name_or_path": "Qwen/Qwen3.5-9B",
|
| 11 |
+
"bias": "none",
|
| 12 |
+
"corda_config": null,
|
| 13 |
+
"ensure_weight_tying": false,
|
| 14 |
+
"eva_config": null,
|
| 15 |
+
"exclude_modules": null,
|
| 16 |
+
"fan_in_fan_out": false,
|
| 17 |
+
"inference_mode": true,
|
| 18 |
+
"init_lora_weights": true,
|
| 19 |
+
"layer_replication": null,
|
| 20 |
+
"layers_pattern": null,
|
| 21 |
+
"layers_to_transform": null,
|
| 22 |
+
"loftq_config": {},
|
| 23 |
+
"lora_alpha": 16,
|
| 24 |
+
"lora_bias": false,
|
| 25 |
+
"lora_dropout": 0,
|
| 26 |
+
"megatron_config": null,
|
| 27 |
+
"megatron_core": "megatron.core",
|
| 28 |
+
"modules_to_save": null,
|
| 29 |
+
"peft_type": "LORA",
|
| 30 |
+
"peft_version": "0.18.1",
|
| 31 |
+
"qalora_group_size": 16,
|
| 32 |
+
"r": 16,
|
| 33 |
+
"rank_pattern": {},
|
| 34 |
+
"revision": null,
|
| 35 |
+
"target_modules": "(?:.*?(?:language|text).*?(?:self_attn|attention|attn|mlp|feed_forward|ffn|dense).*?(?:qkv|proj|linear_fc1|linear_fc2|out_proj|in_proj_qkv|in_proj_z|in_proj_b|in_proj_a|gate_proj|up_proj|down_proj|q_proj|k_proj|v_proj|o_proj).*?)|(?:\\bmodel\\.layers\\.[\\d]{1,}\\.(?:self_attn|attention|attn|mlp|feed_forward|ffn|dense)\\.(?:(?:qkv|proj|linear_fc1|linear_fc2|out_proj|in_proj_qkv|in_proj_z|in_proj_b|in_proj_a|gate_proj|up_proj|down_proj|q_proj|k_proj|v_proj|o_proj)))",
|
| 36 |
+
"target_parameters": null,
|
| 37 |
+
"task_type": "CAUSAL_LM",
|
| 38 |
+
"trainable_token_indices": null,
|
| 39 |
+
"use_dora": false,
|
| 40 |
+
"use_qalora": false,
|
| 41 |
+
"use_rslora": false
|
| 42 |
+
}
|
checkpoint-500/adapter_model.safetensors
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:7302f5a435c3f2311801ee617b710886c58a92e7197b37676d81ea4261f5f7b9
|
| 3 |
+
size 173188512
|
checkpoint-500/chat_template.jinja
ADDED
|
@@ -0,0 +1,154 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
{%- set image_count = namespace(value=0) %}
|
| 2 |
+
{%- set video_count = namespace(value=0) %}
|
| 3 |
+
{%- macro render_content(content, do_vision_count, is_system_content=false) %}
|
| 4 |
+
{%- if content is string %}
|
| 5 |
+
{{- content }}
|
| 6 |
+
{%- elif content is iterable and content is not mapping %}
|
| 7 |
+
{%- for item in content %}
|
| 8 |
+
{%- if 'image' in item or 'image_url' in item or item.type == 'image' %}
|
| 9 |
+
{%- if is_system_content %}
|
| 10 |
+
{{- raise_exception('System message cannot contain images.') }}
|
| 11 |
+
{%- endif %}
|
| 12 |
+
{%- if do_vision_count %}
|
| 13 |
+
{%- set image_count.value = image_count.value + 1 %}
|
| 14 |
+
{%- endif %}
|
| 15 |
+
{%- if add_vision_id %}
|
| 16 |
+
{{- 'Picture ' ~ image_count.value ~ ': ' }}
|
| 17 |
+
{%- endif %}
|
| 18 |
+
{{- '<|vision_start|><|image_pad|><|vision_end|>' }}
|
| 19 |
+
{%- elif 'video' in item or item.type == 'video' %}
|
| 20 |
+
{%- if is_system_content %}
|
| 21 |
+
{{- raise_exception('System message cannot contain videos.') }}
|
| 22 |
+
{%- endif %}
|
| 23 |
+
{%- if do_vision_count %}
|
| 24 |
+
{%- set video_count.value = video_count.value + 1 %}
|
| 25 |
+
{%- endif %}
|
| 26 |
+
{%- if add_vision_id %}
|
| 27 |
+
{{- 'Video ' ~ video_count.value ~ ': ' }}
|
| 28 |
+
{%- endif %}
|
| 29 |
+
{{- '<|vision_start|><|video_pad|><|vision_end|>' }}
|
| 30 |
+
{%- elif 'text' in item %}
|
| 31 |
+
{{- item.text }}
|
| 32 |
+
{%- else %}
|
| 33 |
+
{{- raise_exception('Unexpected item type in content.') }}
|
| 34 |
+
{%- endif %}
|
| 35 |
+
{%- endfor %}
|
| 36 |
+
{%- elif content is none or content is undefined %}
|
| 37 |
+
{{- '' }}
|
| 38 |
+
{%- else %}
|
| 39 |
+
{{- raise_exception('Unexpected content type.') }}
|
| 40 |
+
{%- endif %}
|
| 41 |
+
{%- endmacro %}
|
| 42 |
+
{%- if not messages %}
|
| 43 |
+
{{- raise_exception('No messages provided.') }}
|
| 44 |
+
{%- endif %}
|
| 45 |
+
{%- if tools and tools is iterable and tools is not mapping %}
|
| 46 |
+
{{- '<|im_start|>system\n' }}
|
| 47 |
+
{{- "# Tools\n\nYou have access to the following functions:\n\n<tools>" }}
|
| 48 |
+
{%- for tool in tools %}
|
| 49 |
+
{{- "\n" }}
|
| 50 |
+
{{- tool | tojson }}
|
| 51 |
+
{%- endfor %}
|
| 52 |
+
{{- "\n</tools>" }}
|
| 53 |
+
{{- '\n\nIf you choose to call a function ONLY reply in the following format with NO suffix:\n\n<tool_call>\n<function=example_function_name>\n<parameter=example_parameter_1>\nvalue_1\n</parameter>\n<parameter=example_parameter_2>\nThis is the value for the second parameter\nthat can span\nmultiple lines\n</parameter>\n</function>\n</tool_call>\n\n<IMPORTANT>\nReminder:\n- Function calls MUST follow the specified format: an inner <function=...></function> block must be nested within <tool_call></tool_call> XML tags\n- Required parameters MUST be specified\n- You may provide optional reasoning for your function call in natural language BEFORE the function call, but NOT after\n- If there is no function call available, answer the question like normal with your current knowledge and do not tell the user about function calls\n</IMPORTANT>' }}
|
| 54 |
+
{%- if messages[0].role == 'system' %}
|
| 55 |
+
{%- set content = render_content(messages[0].content, false, true)|trim %}
|
| 56 |
+
{%- if content %}
|
| 57 |
+
{{- '\n\n' + content }}
|
| 58 |
+
{%- endif %}
|
| 59 |
+
{%- endif %}
|
| 60 |
+
{{- '<|im_end|>\n' }}
|
| 61 |
+
{%- else %}
|
| 62 |
+
{%- if messages[0].role == 'system' %}
|
| 63 |
+
{%- set content = render_content(messages[0].content, false, true)|trim %}
|
| 64 |
+
{{- '<|im_start|>system\n' + content + '<|im_end|>\n' }}
|
| 65 |
+
{%- endif %}
|
| 66 |
+
{%- endif %}
|
| 67 |
+
{%- set ns = namespace(multi_step_tool=true, last_query_index=messages|length - 1) %}
|
| 68 |
+
{%- for message in messages[::-1] %}
|
| 69 |
+
{%- set index = (messages|length - 1) - loop.index0 %}
|
| 70 |
+
{%- if ns.multi_step_tool and message.role == "user" %}
|
| 71 |
+
{%- set content = render_content(message.content, false)|trim %}
|
| 72 |
+
{%- if not(content.startswith('<tool_response>') and content.endswith('</tool_response>')) %}
|
| 73 |
+
{%- set ns.multi_step_tool = false %}
|
| 74 |
+
{%- set ns.last_query_index = index %}
|
| 75 |
+
{%- endif %}
|
| 76 |
+
{%- endif %}
|
| 77 |
+
{%- endfor %}
|
| 78 |
+
{%- if ns.multi_step_tool %}
|
| 79 |
+
{{- raise_exception('No user query found in messages.') }}
|
| 80 |
+
{%- endif %}
|
| 81 |
+
{%- for message in messages %}
|
| 82 |
+
{%- set content = render_content(message.content, true)|trim %}
|
| 83 |
+
{%- if message.role == "system" %}
|
| 84 |
+
{%- if not loop.first %}
|
| 85 |
+
{{- raise_exception('System message must be at the beginning.') }}
|
| 86 |
+
{%- endif %}
|
| 87 |
+
{%- elif message.role == "user" %}
|
| 88 |
+
{{- '<|im_start|>' + message.role + '\n' + content + '<|im_end|>' + '\n' }}
|
| 89 |
+
{%- elif message.role == "assistant" %}
|
| 90 |
+
{%- set reasoning_content = '' %}
|
| 91 |
+
{%- if message.reasoning_content is string %}
|
| 92 |
+
{%- set reasoning_content = message.reasoning_content %}
|
| 93 |
+
{%- else %}
|
| 94 |
+
{%- if '</think>' in content %}
|
| 95 |
+
{%- set reasoning_content = content.split('</think>')[0].rstrip('\n').split('<think>')[-1].lstrip('\n') %}
|
| 96 |
+
{%- set content = content.split('</think>')[-1].lstrip('\n') %}
|
| 97 |
+
{%- endif %}
|
| 98 |
+
{%- endif %}
|
| 99 |
+
{%- set reasoning_content = reasoning_content|trim %}
|
| 100 |
+
{%- if loop.index0 > ns.last_query_index %}
|
| 101 |
+
{{- '<|im_start|>' + message.role + '\n<think>\n' + reasoning_content + '\n</think>\n\n' + content }}
|
| 102 |
+
{%- else %}
|
| 103 |
+
{{- '<|im_start|>' + message.role + '\n' + content }}
|
| 104 |
+
{%- endif %}
|
| 105 |
+
{%- if message.tool_calls and message.tool_calls is iterable and message.tool_calls is not mapping %}
|
| 106 |
+
{%- for tool_call in message.tool_calls %}
|
| 107 |
+
{%- if tool_call.function is defined %}
|
| 108 |
+
{%- set tool_call = tool_call.function %}
|
| 109 |
+
{%- endif %}
|
| 110 |
+
{%- if loop.first %}
|
| 111 |
+
{%- if content|trim %}
|
| 112 |
+
{{- '\n\n<tool_call>\n<function=' + tool_call.name + '>\n' }}
|
| 113 |
+
{%- else %}
|
| 114 |
+
{{- '<tool_call>\n<function=' + tool_call.name + '>\n' }}
|
| 115 |
+
{%- endif %}
|
| 116 |
+
{%- else %}
|
| 117 |
+
{{- '\n<tool_call>\n<function=' + tool_call.name + '>\n' }}
|
| 118 |
+
{%- endif %}
|
| 119 |
+
{%- if tool_call.arguments is defined %}
|
| 120 |
+
{%- for args_name, args_value in tool_call.arguments|items %}
|
| 121 |
+
{{- '<parameter=' + args_name + '>\n' }}
|
| 122 |
+
{%- set args_value = args_value | tojson | safe if args_value is mapping or (args_value is sequence and args_value is not string) else args_value | string %}
|
| 123 |
+
{{- args_value }}
|
| 124 |
+
{{- '\n</parameter>\n' }}
|
| 125 |
+
{%- endfor %}
|
| 126 |
+
{%- endif %}
|
| 127 |
+
{{- '</function>\n</tool_call>' }}
|
| 128 |
+
{%- endfor %}
|
| 129 |
+
{%- endif %}
|
| 130 |
+
{{- '<|im_end|>\n' }}
|
| 131 |
+
{%- elif message.role == "tool" %}
|
| 132 |
+
{%- if loop.previtem and loop.previtem.role != "tool" %}
|
| 133 |
+
{{- '<|im_start|>user' }}
|
| 134 |
+
{%- endif %}
|
| 135 |
+
{{- '\n<tool_response>\n' }}
|
| 136 |
+
{{- content }}
|
| 137 |
+
{{- '\n</tool_response>' }}
|
| 138 |
+
{%- if not loop.last and loop.nextitem.role != "tool" %}
|
| 139 |
+
{{- '<|im_end|>\n' }}
|
| 140 |
+
{%- elif loop.last %}
|
| 141 |
+
{{- '<|im_end|>\n' }}
|
| 142 |
+
{%- endif %}
|
| 143 |
+
{%- else %}
|
| 144 |
+
{{- raise_exception('Unexpected message role.') }}
|
| 145 |
+
{%- endif %}
|
| 146 |
+
{%- endfor %}
|
| 147 |
+
{%- if add_generation_prompt %}
|
| 148 |
+
{{- '<|im_start|>assistant\n' }}
|
| 149 |
+
{%- if enable_thinking is defined and enable_thinking is false %}
|
| 150 |
+
{{- '<think>\n\n</think>\n\n' }}
|
| 151 |
+
{%- else %}
|
| 152 |
+
{{- '<think>\n' }}
|
| 153 |
+
{%- endif %}
|
| 154 |
+
{%- endif %}
|
checkpoint-500/optimizer.pt
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:91d2126200d3f2000e846fc2c5efb0503b7dc1e60da6cc626874b080c19aeaf4
|
| 3 |
+
size 88617029
|
checkpoint-500/processor_config.json
ADDED
|
@@ -0,0 +1,63 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
{
|
| 2 |
+
"image_processor": {
|
| 3 |
+
"data_format": "channels_first",
|
| 4 |
+
"do_convert_rgb": true,
|
| 5 |
+
"do_normalize": true,
|
| 6 |
+
"do_rescale": true,
|
| 7 |
+
"do_resize": true,
|
| 8 |
+
"image_mean": [
|
| 9 |
+
0.5,
|
| 10 |
+
0.5,
|
| 11 |
+
0.5
|
| 12 |
+
],
|
| 13 |
+
"image_processor_type": "Qwen2VLImageProcessorFast",
|
| 14 |
+
"image_std": [
|
| 15 |
+
0.5,
|
| 16 |
+
0.5,
|
| 17 |
+
0.5
|
| 18 |
+
],
|
| 19 |
+
"merge_size": 2,
|
| 20 |
+
"patch_size": 16,
|
| 21 |
+
"resample": 3,
|
| 22 |
+
"rescale_factor": 0.00392156862745098,
|
| 23 |
+
"size": {
|
| 24 |
+
"longest_edge": 16777216,
|
| 25 |
+
"shortest_edge": 65536
|
| 26 |
+
},
|
| 27 |
+
"temporal_patch_size": 2
|
| 28 |
+
},
|
| 29 |
+
"processor_class": "Qwen3VLProcessor",
|
| 30 |
+
"video_processor": {
|
| 31 |
+
"data_format": "channels_first",
|
| 32 |
+
"default_to_square": true,
|
| 33 |
+
"do_convert_rgb": true,
|
| 34 |
+
"do_normalize": true,
|
| 35 |
+
"do_rescale": true,
|
| 36 |
+
"do_resize": true,
|
| 37 |
+
"do_sample_frames": true,
|
| 38 |
+
"fps": 2,
|
| 39 |
+
"image_mean": [
|
| 40 |
+
0.5,
|
| 41 |
+
0.5,
|
| 42 |
+
0.5
|
| 43 |
+
],
|
| 44 |
+
"image_std": [
|
| 45 |
+
0.5,
|
| 46 |
+
0.5,
|
| 47 |
+
0.5
|
| 48 |
+
],
|
| 49 |
+
"max_frames": 768,
|
| 50 |
+
"merge_size": 2,
|
| 51 |
+
"min_frames": 4,
|
| 52 |
+
"patch_size": 16,
|
| 53 |
+
"resample": 3,
|
| 54 |
+
"rescale_factor": 0.00392156862745098,
|
| 55 |
+
"return_metadata": false,
|
| 56 |
+
"size": {
|
| 57 |
+
"longest_edge": 25165824,
|
| 58 |
+
"shortest_edge": 4096
|
| 59 |
+
},
|
| 60 |
+
"temporal_patch_size": 2,
|
| 61 |
+
"video_processor_type": "Qwen3VLVideoProcessor"
|
| 62 |
+
}
|
| 63 |
+
}
|
checkpoint-500/rng_state.pth
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:3d6d8fafcd1ee268414be5acf0366296af5b03d60871978712eac1979cb42d65
|
| 3 |
+
size 14645
|
checkpoint-500/scheduler.pt
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:cc7746ec87c19743016407a58d3acdb0930ab84f523fb5edda75bbf4563c6928
|
| 3 |
+
size 1465
|
checkpoint-500/tokenizer.json
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:263dcc3feef53d558a357d52941ff3649fa9cd9a3199934376f2bbf615d49ffc
|
| 3 |
+
size 19989610
|
checkpoint-500/tokenizer_config.json
ADDED
|
@@ -0,0 +1,33 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
{
|
| 2 |
+
"add_prefix_space": false,
|
| 3 |
+
"audio_bos_token": "<|audio_start|>",
|
| 4 |
+
"audio_eos_token": "<|audio_end|>",
|
| 5 |
+
"audio_token": "<|audio_pad|>",
|
| 6 |
+
"backend": "tokenizers",
|
| 7 |
+
"bos_token": null,
|
| 8 |
+
"clean_up_tokenization_spaces": false,
|
| 9 |
+
"eos_token": "<|im_end|>",
|
| 10 |
+
"errors": "replace",
|
| 11 |
+
"image_token": "<|image_pad|>",
|
| 12 |
+
"is_local": false,
|
| 13 |
+
"model_max_length": 262144,
|
| 14 |
+
"model_specific_special_tokens": {
|
| 15 |
+
"audio_bos_token": "<|audio_start|>",
|
| 16 |
+
"audio_eos_token": "<|audio_end|>",
|
| 17 |
+
"audio_token": "<|audio_pad|>",
|
| 18 |
+
"image_token": "<|image_pad|>",
|
| 19 |
+
"video_token": "<|video_pad|>",
|
| 20 |
+
"vision_bos_token": "<|vision_start|>",
|
| 21 |
+
"vision_eos_token": "<|vision_end|>"
|
| 22 |
+
},
|
| 23 |
+
"pad_token": "<|endoftext|>",
|
| 24 |
+
"padding_side": "right",
|
| 25 |
+
"pretokenize_regex": "(?i:'s|'t|'re|'ve|'m|'ll|'d)|[^\\r\\n\\p{L}\\p{N}]?[\\p{L}\\p{M}]+|\\p{N}| ?[^\\s\\p{L}\\p{M}\\p{N}]+[\\r\\n]*|\\s*[\\r\\n]+|\\s+(?!\\S)|\\s+",
|
| 26 |
+
"processor_class": "Qwen3VLProcessor",
|
| 27 |
+
"split_special_tokens": false,
|
| 28 |
+
"tokenizer_class": "TokenizersBackend",
|
| 29 |
+
"unk_token": null,
|
| 30 |
+
"video_token": "<|video_pad|>",
|
| 31 |
+
"vision_bos_token": "<|vision_start|>",
|
| 32 |
+
"vision_eos_token": "<|vision_end|>"
|
| 33 |
+
}
|
checkpoint-500/trainer_state.json
ADDED
|
@@ -0,0 +1,3534 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
{
|
| 2 |
+
"best_global_step": null,
|
| 3 |
+
"best_metric": null,
|
| 4 |
+
"best_model_checkpoint": null,
|
| 5 |
+
"epoch": 3.5992779783393503,
|
| 6 |
+
"eval_steps": 770,
|
| 7 |
+
"global_step": 500,
|
| 8 |
+
"is_hyper_param_search": false,
|
| 9 |
+
"is_local_process_zero": true,
|
| 10 |
+
"is_world_process_zero": true,
|
| 11 |
+
"log_history": [
|
| 12 |
+
{
|
| 13 |
+
"epoch": 0.007220216606498195,
|
| 14 |
+
"grad_norm": 2.68963885307312,
|
| 15 |
+
"learning_rate": 0.0,
|
| 16 |
+
"loss": 1.880106806755066,
|
| 17 |
+
"step": 1
|
| 18 |
+
},
|
| 19 |
+
{
|
| 20 |
+
"epoch": 0.01444043321299639,
|
| 21 |
+
"grad_norm": 2.3691370487213135,
|
| 22 |
+
"learning_rate": 8e-05,
|
| 23 |
+
"loss": 1.882678508758545,
|
| 24 |
+
"step": 2
|
| 25 |
+
},
|
| 26 |
+
{
|
| 27 |
+
"epoch": 0.021660649819494584,
|
| 28 |
+
"grad_norm": 3.7024030685424805,
|
| 29 |
+
"learning_rate": 0.00016,
|
| 30 |
+
"loss": 1.9426246881484985,
|
| 31 |
+
"step": 3
|
| 32 |
+
},
|
| 33 |
+
{
|
| 34 |
+
"epoch": 0.02888086642599278,
|
| 35 |
+
"grad_norm": 0.7646510601043701,
|
| 36 |
+
"learning_rate": 0.00024,
|
| 37 |
+
"loss": 1.6261038780212402,
|
| 38 |
+
"step": 4
|
| 39 |
+
},
|
| 40 |
+
{
|
| 41 |
+
"epoch": 0.036101083032490974,
|
| 42 |
+
"grad_norm": 0.6628475189208984,
|
| 43 |
+
"learning_rate": 0.00032,
|
| 44 |
+
"loss": 1.478842854499817,
|
| 45 |
+
"step": 5
|
| 46 |
+
},
|
| 47 |
+
{
|
| 48 |
+
"epoch": 0.04332129963898917,
|
| 49 |
+
"grad_norm": 0.7141556143760681,
|
| 50 |
+
"learning_rate": 0.0004,
|
| 51 |
+
"loss": 1.1376413106918335,
|
| 52 |
+
"step": 6
|
| 53 |
+
},
|
| 54 |
+
{
|
| 55 |
+
"epoch": 0.05054151624548736,
|
| 56 |
+
"grad_norm": 0.7212001085281372,
|
| 57 |
+
"learning_rate": 0.0003999983135391464,
|
| 58 |
+
"loss": 1.0410869121551514,
|
| 59 |
+
"step": 7
|
| 60 |
+
},
|
| 61 |
+
{
|
| 62 |
+
"epoch": 0.05776173285198556,
|
| 63 |
+
"grad_norm": 0.7515780925750732,
|
| 64 |
+
"learning_rate": 0.0003999932541850271,
|
| 65 |
+
"loss": 0.8246882557868958,
|
| 66 |
+
"step": 8
|
| 67 |
+
},
|
| 68 |
+
{
|
| 69 |
+
"epoch": 0.06498194945848375,
|
| 70 |
+
"grad_norm": 2.474442481994629,
|
| 71 |
+
"learning_rate": 0.0003999848220229661,
|
| 72 |
+
"loss": 0.7787771821022034,
|
| 73 |
+
"step": 9
|
| 74 |
+
},
|
| 75 |
+
{
|
| 76 |
+
"epoch": 0.07220216606498195,
|
| 77 |
+
"grad_norm": 1.2009592056274414,
|
| 78 |
+
"learning_rate": 0.0003999730171951686,
|
| 79 |
+
"loss": 0.6830324530601501,
|
| 80 |
+
"step": 10
|
| 81 |
+
},
|
| 82 |
+
{
|
| 83 |
+
"epoch": 0.07942238267148015,
|
| 84 |
+
"grad_norm": 0.7545379996299744,
|
| 85 |
+
"learning_rate": 0.00039995783990071825,
|
| 86 |
+
"loss": 0.7438161969184875,
|
| 87 |
+
"step": 11
|
| 88 |
+
},
|
| 89 |
+
{
|
| 90 |
+
"epoch": 0.08664259927797834,
|
| 91 |
+
"grad_norm": 0.9728625416755676,
|
| 92 |
+
"learning_rate": 0.0003999392903955744,
|
| 93 |
+
"loss": 0.6851149797439575,
|
| 94 |
+
"step": 12
|
| 95 |
+
},
|
| 96 |
+
{
|
| 97 |
+
"epoch": 0.09386281588447654,
|
| 98 |
+
"grad_norm": 0.5509404540061951,
|
| 99 |
+
"learning_rate": 0.00039991736899256693,
|
| 100 |
+
"loss": 0.5853980183601379,
|
| 101 |
+
"step": 13
|
| 102 |
+
},
|
| 103 |
+
{
|
| 104 |
+
"epoch": 0.10108303249097472,
|
| 105 |
+
"grad_norm": 0.715829074382782,
|
| 106 |
+
"learning_rate": 0.0003998920760613919,
|
| 107 |
+
"loss": 0.7855823040008545,
|
| 108 |
+
"step": 14
|
| 109 |
+
},
|
| 110 |
+
{
|
| 111 |
+
"epoch": 0.10830324909747292,
|
| 112 |
+
"grad_norm": 0.6777167320251465,
|
| 113 |
+
"learning_rate": 0.0003998634120286046,
|
| 114 |
+
"loss": 0.5202292799949646,
|
| 115 |
+
"step": 15
|
| 116 |
+
},
|
| 117 |
+
{
|
| 118 |
+
"epoch": 0.11552346570397112,
|
| 119 |
+
"grad_norm": 0.5348321199417114,
|
| 120 |
+
"learning_rate": 0.0003998313773776128,
|
| 121 |
+
"loss": 0.6527559757232666,
|
| 122 |
+
"step": 16
|
| 123 |
+
},
|
| 124 |
+
{
|
| 125 |
+
"epoch": 0.12274368231046931,
|
| 126 |
+
"grad_norm": 0.4939132332801819,
|
| 127 |
+
"learning_rate": 0.0003997959726486683,
|
| 128 |
+
"loss": 0.584251880645752,
|
| 129 |
+
"step": 17
|
| 130 |
+
},
|
| 131 |
+
{
|
| 132 |
+
"epoch": 0.1299638989169675,
|
| 133 |
+
"grad_norm": 0.47802454233169556,
|
| 134 |
+
"learning_rate": 0.00039975719843885805,
|
| 135 |
+
"loss": 0.5235528349876404,
|
| 136 |
+
"step": 18
|
| 137 |
+
},
|
| 138 |
+
{
|
| 139 |
+
"epoch": 0.1371841155234657,
|
| 140 |
+
"grad_norm": 0.44072362780570984,
|
| 141 |
+
"learning_rate": 0.0003997150554020938,
|
| 142 |
+
"loss": 0.5184933543205261,
|
| 143 |
+
"step": 19
|
| 144 |
+
},
|
| 145 |
+
{
|
| 146 |
+
"epoch": 0.1444043321299639,
|
| 147 |
+
"grad_norm": 0.4251253306865692,
|
| 148 |
+
"learning_rate": 0.00039966954424910147,
|
| 149 |
+
"loss": 0.6167617440223694,
|
| 150 |
+
"step": 20
|
| 151 |
+
},
|
| 152 |
+
{
|
| 153 |
+
"epoch": 0.15162454873646208,
|
| 154 |
+
"grad_norm": 0.5198166370391846,
|
| 155 |
+
"learning_rate": 0.00039962066574740886,
|
| 156 |
+
"loss": 0.7412333488464355,
|
| 157 |
+
"step": 21
|
| 158 |
+
},
|
| 159 |
+
{
|
| 160 |
+
"epoch": 0.1588447653429603,
|
| 161 |
+
"grad_norm": 0.44667476415634155,
|
| 162 |
+
"learning_rate": 0.00039956842072133266,
|
| 163 |
+
"loss": 0.6361726522445679,
|
| 164 |
+
"step": 22
|
| 165 |
+
},
|
| 166 |
+
{
|
| 167 |
+
"epoch": 0.16606498194945848,
|
| 168 |
+
"grad_norm": 0.40787550806999207,
|
| 169 |
+
"learning_rate": 0.0003995128100519649,
|
| 170 |
+
"loss": 0.49531102180480957,
|
| 171 |
+
"step": 23
|
| 172 |
+
},
|
| 173 |
+
{
|
| 174 |
+
"epoch": 0.17328519855595667,
|
| 175 |
+
"grad_norm": 0.4681910276412964,
|
| 176 |
+
"learning_rate": 0.00039945383467715766,
|
| 177 |
+
"loss": 0.584551990032196,
|
| 178 |
+
"step": 24
|
| 179 |
+
},
|
| 180 |
+
{
|
| 181 |
+
"epoch": 0.18050541516245489,
|
| 182 |
+
"grad_norm": 0.41188451647758484,
|
| 183 |
+
"learning_rate": 0.00039939149559150753,
|
| 184 |
+
"loss": 0.6003429889678955,
|
| 185 |
+
"step": 25
|
| 186 |
+
},
|
| 187 |
+
{
|
| 188 |
+
"epoch": 0.18772563176895307,
|
| 189 |
+
"grad_norm": 0.43262341618537903,
|
| 190 |
+
"learning_rate": 0.0003993257938463389,
|
| 191 |
+
"loss": 0.5725842118263245,
|
| 192 |
+
"step": 26
|
| 193 |
+
},
|
| 194 |
+
{
|
| 195 |
+
"epoch": 0.19494584837545126,
|
| 196 |
+
"grad_norm": 0.45091742277145386,
|
| 197 |
+
"learning_rate": 0.0003992567305496859,
|
| 198 |
+
"loss": 0.6373569965362549,
|
| 199 |
+
"step": 27
|
| 200 |
+
},
|
| 201 |
+
{
|
| 202 |
+
"epoch": 0.20216606498194944,
|
| 203 |
+
"grad_norm": 0.3687536120414734,
|
| 204 |
+
"learning_rate": 0.00039918430686627406,
|
| 205 |
+
"loss": 0.4958152174949646,
|
| 206 |
+
"step": 28
|
| 207 |
+
},
|
| 208 |
+
{
|
| 209 |
+
"epoch": 0.20938628158844766,
|
| 210 |
+
"grad_norm": 0.3994904160499573,
|
| 211 |
+
"learning_rate": 0.00039910852401750036,
|
| 212 |
+
"loss": 0.6146813631057739,
|
| 213 |
+
"step": 29
|
| 214 |
+
},
|
| 215 |
+
{
|
| 216 |
+
"epoch": 0.21660649819494585,
|
| 217 |
+
"grad_norm": 0.41312268376350403,
|
| 218 |
+
"learning_rate": 0.0003990293832814129,
|
| 219 |
+
"loss": 0.5313689708709717,
|
| 220 |
+
"step": 30
|
| 221 |
+
},
|
| 222 |
+
{
|
| 223 |
+
"epoch": 0.22382671480144403,
|
| 224 |
+
"grad_norm": 0.37877994775772095,
|
| 225 |
+
"learning_rate": 0.0003989468859926893,
|
| 226 |
+
"loss": 0.5694329738616943,
|
| 227 |
+
"step": 31
|
| 228 |
+
},
|
| 229 |
+
{
|
| 230 |
+
"epoch": 0.23104693140794225,
|
| 231 |
+
"grad_norm": 0.32251644134521484,
|
| 232 |
+
"learning_rate": 0.0003988610335426139,
|
| 233 |
+
"loss": 0.4476504921913147,
|
| 234 |
+
"step": 32
|
| 235 |
+
},
|
| 236 |
+
{
|
| 237 |
+
"epoch": 0.23826714801444043,
|
| 238 |
+
"grad_norm": 0.40205422043800354,
|
| 239 |
+
"learning_rate": 0.0003987718273790548,
|
| 240 |
+
"loss": 0.4696302115917206,
|
| 241 |
+
"step": 33
|
| 242 |
+
},
|
| 243 |
+
{
|
| 244 |
+
"epoch": 0.24548736462093862,
|
| 245 |
+
"grad_norm": 0.3664834201335907,
|
| 246 |
+
"learning_rate": 0.0003986792690064389,
|
| 247 |
+
"loss": 0.5304725170135498,
|
| 248 |
+
"step": 34
|
| 249 |
+
},
|
| 250 |
+
{
|
| 251 |
+
"epoch": 0.2527075812274368,
|
| 252 |
+
"grad_norm": 0.5150560736656189,
|
| 253 |
+
"learning_rate": 0.000398583359985727,
|
| 254 |
+
"loss": 0.5886795520782471,
|
| 255 |
+
"step": 35
|
| 256 |
+
},
|
| 257 |
+
{
|
| 258 |
+
"epoch": 0.259927797833935,
|
| 259 |
+
"grad_norm": 0.37544649839401245,
|
| 260 |
+
"learning_rate": 0.0003984841019343872,
|
| 261 |
+
"loss": 0.6374161839485168,
|
| 262 |
+
"step": 36
|
| 263 |
+
},
|
| 264 |
+
{
|
| 265 |
+
"epoch": 0.26714801444043323,
|
| 266 |
+
"grad_norm": 0.3426123857498169,
|
| 267 |
+
"learning_rate": 0.0003983814965263676,
|
| 268 |
+
"loss": 0.507249116897583,
|
| 269 |
+
"step": 37
|
| 270 |
+
},
|
| 271 |
+
{
|
| 272 |
+
"epoch": 0.2743682310469314,
|
| 273 |
+
"grad_norm": 0.36909183859825134,
|
| 274 |
+
"learning_rate": 0.00039827554549206836,
|
| 275 |
+
"loss": 0.5216564536094666,
|
| 276 |
+
"step": 38
|
| 277 |
+
},
|
| 278 |
+
{
|
| 279 |
+
"epoch": 0.2815884476534296,
|
| 280 |
+
"grad_norm": 0.3864560127258301,
|
| 281 |
+
"learning_rate": 0.00039816625061831206,
|
| 282 |
+
"loss": 0.4607892632484436,
|
| 283 |
+
"step": 39
|
| 284 |
+
},
|
| 285 |
+
{
|
| 286 |
+
"epoch": 0.2888086642599278,
|
| 287 |
+
"grad_norm": 0.3553301692008972,
|
| 288 |
+
"learning_rate": 0.0003980536137483141,
|
| 289 |
+
"loss": 0.6021184921264648,
|
| 290 |
+
"step": 40
|
| 291 |
+
},
|
| 292 |
+
{
|
| 293 |
+
"epoch": 0.296028880866426,
|
| 294 |
+
"grad_norm": 0.3300604224205017,
|
| 295 |
+
"learning_rate": 0.0003979376367816511,
|
| 296 |
+
"loss": 0.49985307455062866,
|
| 297 |
+
"step": 41
|
| 298 |
+
},
|
| 299 |
+
{
|
| 300 |
+
"epoch": 0.30324909747292417,
|
| 301 |
+
"grad_norm": 0.3894491493701935,
|
| 302 |
+
"learning_rate": 0.0003978183216742292,
|
| 303 |
+
"loss": 0.5403987169265747,
|
| 304 |
+
"step": 42
|
| 305 |
+
},
|
| 306 |
+
{
|
| 307 |
+
"epoch": 0.3104693140794224,
|
| 308 |
+
"grad_norm": 0.32339245080947876,
|
| 309 |
+
"learning_rate": 0.0003976956704382511,
|
| 310 |
+
"loss": 0.5262795090675354,
|
| 311 |
+
"step": 43
|
| 312 |
+
},
|
| 313 |
+
{
|
| 314 |
+
"epoch": 0.3176895306859206,
|
| 315 |
+
"grad_norm": 0.3121689260005951,
|
| 316 |
+
"learning_rate": 0.00039756968514218166,
|
| 317 |
+
"loss": 0.4988410174846649,
|
| 318 |
+
"step": 44
|
| 319 |
+
},
|
| 320 |
+
{
|
| 321 |
+
"epoch": 0.3249097472924188,
|
| 322 |
+
"grad_norm": 0.37562957406044006,
|
| 323 |
+
"learning_rate": 0.0003974403679107138,
|
| 324 |
+
"loss": 0.5539376735687256,
|
| 325 |
+
"step": 45
|
| 326 |
+
},
|
| 327 |
+
{
|
| 328 |
+
"epoch": 0.33212996389891697,
|
| 329 |
+
"grad_norm": 0.3560684323310852,
|
| 330 |
+
"learning_rate": 0.0003973077209247319,
|
| 331 |
+
"loss": 0.4829791784286499,
|
| 332 |
+
"step": 46
|
| 333 |
+
},
|
| 334 |
+
{
|
| 335 |
+
"epoch": 0.33935018050541516,
|
| 336 |
+
"grad_norm": 0.3543923497200012,
|
| 337 |
+
"learning_rate": 0.0003971717464212755,
|
| 338 |
+
"loss": 0.4733068346977234,
|
| 339 |
+
"step": 47
|
| 340 |
+
},
|
| 341 |
+
{
|
| 342 |
+
"epoch": 0.34657039711191334,
|
| 343 |
+
"grad_norm": 0.3253995180130005,
|
| 344 |
+
"learning_rate": 0.0003970324466935013,
|
| 345 |
+
"loss": 0.4318773150444031,
|
| 346 |
+
"step": 48
|
| 347 |
+
},
|
| 348 |
+
{
|
| 349 |
+
"epoch": 0.35379061371841153,
|
| 350 |
+
"grad_norm": 0.3587929904460907,
|
| 351 |
+
"learning_rate": 0.0003968898240906447,
|
| 352 |
+
"loss": 0.6348429322242737,
|
| 353 |
+
"step": 49
|
| 354 |
+
},
|
| 355 |
+
{
|
| 356 |
+
"epoch": 0.36101083032490977,
|
| 357 |
+
"grad_norm": 0.3772837519645691,
|
| 358 |
+
"learning_rate": 0.0003967438810179802,
|
| 359 |
+
"loss": 0.5192855596542358,
|
| 360 |
+
"step": 50
|
| 361 |
+
},
|
| 362 |
+
{
|
| 363 |
+
"epoch": 0.36823104693140796,
|
| 364 |
+
"grad_norm": 0.3878256380558014,
|
| 365 |
+
"learning_rate": 0.0003965946199367804,
|
| 366 |
+
"loss": 0.4653000831604004,
|
| 367 |
+
"step": 51
|
| 368 |
+
},
|
| 369 |
+
{
|
| 370 |
+
"epoch": 0.37545126353790614,
|
| 371 |
+
"grad_norm": 0.306704044342041,
|
| 372 |
+
"learning_rate": 0.00039644204336427506,
|
| 373 |
+
"loss": 0.46054646372795105,
|
| 374 |
+
"step": 52
|
| 375 |
+
},
|
| 376 |
+
{
|
| 377 |
+
"epoch": 0.38267148014440433,
|
| 378 |
+
"grad_norm": 0.3290722072124481,
|
| 379 |
+
"learning_rate": 0.0003962861538736084,
|
| 380 |
+
"loss": 0.4637136459350586,
|
| 381 |
+
"step": 53
|
| 382 |
+
},
|
| 383 |
+
{
|
| 384 |
+
"epoch": 0.3898916967509025,
|
| 385 |
+
"grad_norm": 0.3877376914024353,
|
| 386 |
+
"learning_rate": 0.00039612695409379557,
|
| 387 |
+
"loss": 0.6008591651916504,
|
| 388 |
+
"step": 54
|
| 389 |
+
},
|
| 390 |
+
{
|
| 391 |
+
"epoch": 0.3971119133574007,
|
| 392 |
+
"grad_norm": 0.3738860785961151,
|
| 393 |
+
"learning_rate": 0.00039596444670967864,
|
| 394 |
+
"loss": 0.49255216121673584,
|
| 395 |
+
"step": 55
|
| 396 |
+
},
|
| 397 |
+
{
|
| 398 |
+
"epoch": 0.4043321299638989,
|
| 399 |
+
"grad_norm": 0.43176719546318054,
|
| 400 |
+
"learning_rate": 0.0003957986344618809,
|
| 401 |
+
"loss": 0.6328399777412415,
|
| 402 |
+
"step": 56
|
| 403 |
+
},
|
| 404 |
+
{
|
| 405 |
+
"epoch": 0.41155234657039713,
|
| 406 |
+
"grad_norm": 0.34965041279792786,
|
| 407 |
+
"learning_rate": 0.00039562952014676116,
|
| 408 |
+
"loss": 0.5274545550346375,
|
| 409 |
+
"step": 57
|
| 410 |
+
},
|
| 411 |
+
{
|
| 412 |
+
"epoch": 0.4187725631768953,
|
| 413 |
+
"grad_norm": 0.3525114059448242,
|
| 414 |
+
"learning_rate": 0.000395457106616366,
|
| 415 |
+
"loss": 0.5174035429954529,
|
| 416 |
+
"step": 58
|
| 417 |
+
},
|
| 418 |
+
{
|
| 419 |
+
"epoch": 0.4259927797833935,
|
| 420 |
+
"grad_norm": 0.36805179715156555,
|
| 421 |
+
"learning_rate": 0.0003952813967783822,
|
| 422 |
+
"loss": 0.5132086277008057,
|
| 423 |
+
"step": 59
|
| 424 |
+
},
|
| 425 |
+
{
|
| 426 |
+
"epoch": 0.4332129963898917,
|
| 427 |
+
"grad_norm": 0.3320341110229492,
|
| 428 |
+
"learning_rate": 0.00039510239359608735,
|
| 429 |
+
"loss": 0.47466331720352173,
|
| 430 |
+
"step": 60
|
| 431 |
+
},
|
| 432 |
+
{
|
| 433 |
+
"epoch": 0.4404332129963899,
|
| 434 |
+
"grad_norm": 0.36727970838546753,
|
| 435 |
+
"learning_rate": 0.0003949201000883001,
|
| 436 |
+
"loss": 0.5845056772232056,
|
| 437 |
+
"step": 61
|
| 438 |
+
},
|
| 439 |
+
{
|
| 440 |
+
"epoch": 0.44765342960288806,
|
| 441 |
+
"grad_norm": 0.31494706869125366,
|
| 442 |
+
"learning_rate": 0.000394734519329329,
|
| 443 |
+
"loss": 0.5123739242553711,
|
| 444 |
+
"step": 62
|
| 445 |
+
},
|
| 446 |
+
{
|
| 447 |
+
"epoch": 0.4548736462093863,
|
| 448 |
+
"grad_norm": 0.31959858536720276,
|
| 449 |
+
"learning_rate": 0.00039454565444892094,
|
| 450 |
+
"loss": 0.3888605237007141,
|
| 451 |
+
"step": 63
|
| 452 |
+
},
|
| 453 |
+
{
|
| 454 |
+
"epoch": 0.4620938628158845,
|
| 455 |
+
"grad_norm": 0.4212755262851715,
|
| 456 |
+
"learning_rate": 0.0003943535086322083,
|
| 457 |
+
"loss": 0.6065781712532043,
|
| 458 |
+
"step": 64
|
| 459 |
+
},
|
| 460 |
+
{
|
| 461 |
+
"epoch": 0.4693140794223827,
|
| 462 |
+
"grad_norm": 0.2938922643661499,
|
| 463 |
+
"learning_rate": 0.0003941580851196549,
|
| 464 |
+
"loss": 0.47488927841186523,
|
| 465 |
+
"step": 65
|
| 466 |
+
},
|
| 467 |
+
{
|
| 468 |
+
"epoch": 0.47653429602888087,
|
| 469 |
+
"grad_norm": 0.27896228432655334,
|
| 470 |
+
"learning_rate": 0.00039395938720700196,
|
| 471 |
+
"loss": 0.36559349298477173,
|
| 472 |
+
"step": 66
|
| 473 |
+
},
|
| 474 |
+
{
|
| 475 |
+
"epoch": 0.48375451263537905,
|
| 476 |
+
"grad_norm": 0.34284013509750366,
|
| 477 |
+
"learning_rate": 0.0003937574182452118,
|
| 478 |
+
"loss": 0.49944937229156494,
|
| 479 |
+
"step": 67
|
| 480 |
+
},
|
| 481 |
+
{
|
| 482 |
+
"epoch": 0.49097472924187724,
|
| 483 |
+
"grad_norm": 0.3411049544811249,
|
| 484 |
+
"learning_rate": 0.00039355218164041194,
|
| 485 |
+
"loss": 0.5018436312675476,
|
| 486 |
+
"step": 68
|
| 487 |
+
},
|
| 488 |
+
{
|
| 489 |
+
"epoch": 0.4981949458483754,
|
| 490 |
+
"grad_norm": 0.35431182384490967,
|
| 491 |
+
"learning_rate": 0.0003933436808538375,
|
| 492 |
+
"loss": 0.42643067240715027,
|
| 493 |
+
"step": 69
|
| 494 |
+
},
|
| 495 |
+
{
|
| 496 |
+
"epoch": 0.5054151624548736,
|
| 497 |
+
"grad_norm": 0.3351145386695862,
|
| 498 |
+
"learning_rate": 0.00039313191940177256,
|
| 499 |
+
"loss": 0.5355833768844604,
|
| 500 |
+
"step": 70
|
| 501 |
+
},
|
| 502 |
+
{
|
| 503 |
+
"epoch": 0.5126353790613718,
|
| 504 |
+
"grad_norm": 0.3065779507160187,
|
| 505 |
+
"learning_rate": 0.00039291690085549105,
|
| 506 |
+
"loss": 0.4329970180988312,
|
| 507 |
+
"step": 71
|
| 508 |
+
},
|
| 509 |
+
{
|
| 510 |
+
"epoch": 0.51985559566787,
|
| 511 |
+
"grad_norm": 0.5208595395088196,
|
| 512 |
+
"learning_rate": 0.00039269862884119664,
|
| 513 |
+
"loss": 0.5850666165351868,
|
| 514 |
+
"step": 72
|
| 515 |
+
},
|
| 516 |
+
{
|
| 517 |
+
"epoch": 0.5270758122743683,
|
| 518 |
+
"grad_norm": 0.3183553218841553,
|
| 519 |
+
"learning_rate": 0.00039247710703996144,
|
| 520 |
+
"loss": 0.5500473380088806,
|
| 521 |
+
"step": 73
|
| 522 |
+
},
|
| 523 |
+
{
|
| 524 |
+
"epoch": 0.5342960288808665,
|
| 525 |
+
"grad_norm": 0.32788676023483276,
|
| 526 |
+
"learning_rate": 0.0003922523391876638,
|
| 527 |
+
"loss": 0.5200982093811035,
|
| 528 |
+
"step": 74
|
| 529 |
+
},
|
| 530 |
+
{
|
| 531 |
+
"epoch": 0.5415162454873647,
|
| 532 |
+
"grad_norm": 0.2959986925125122,
|
| 533 |
+
"learning_rate": 0.00039202432907492566,
|
| 534 |
+
"loss": 0.4983074963092804,
|
| 535 |
+
"step": 75
|
| 536 |
+
},
|
| 537 |
+
{
|
| 538 |
+
"epoch": 0.5487364620938628,
|
| 539 |
+
"grad_norm": 0.32182440161705017,
|
| 540 |
+
"learning_rate": 0.0003917930805470483,
|
| 541 |
+
"loss": 0.44362854957580566,
|
| 542 |
+
"step": 76
|
| 543 |
+
},
|
| 544 |
+
{
|
| 545 |
+
"epoch": 0.555956678700361,
|
| 546 |
+
"grad_norm": 0.2816471755504608,
|
| 547 |
+
"learning_rate": 0.00039155859750394754,
|
| 548 |
+
"loss": 0.44515836238861084,
|
| 549 |
+
"step": 77
|
| 550 |
+
},
|
| 551 |
+
{
|
| 552 |
+
"epoch": 0.5631768953068592,
|
| 553 |
+
"grad_norm": 0.290783554315567,
|
| 554 |
+
"learning_rate": 0.0003913208839000882,
|
| 555 |
+
"loss": 0.46542418003082275,
|
| 556 |
+
"step": 78
|
| 557 |
+
},
|
| 558 |
+
{
|
| 559 |
+
"epoch": 0.5703971119133574,
|
| 560 |
+
"grad_norm": 0.366773396730423,
|
| 561 |
+
"learning_rate": 0.0003910799437444171,
|
| 562 |
+
"loss": 0.5370551943778992,
|
| 563 |
+
"step": 79
|
| 564 |
+
},
|
| 565 |
+
{
|
| 566 |
+
"epoch": 0.5776173285198556,
|
| 567 |
+
"grad_norm": 0.32066911458969116,
|
| 568 |
+
"learning_rate": 0.0003908357811002957,
|
| 569 |
+
"loss": 0.5146384239196777,
|
| 570 |
+
"step": 80
|
| 571 |
+
},
|
| 572 |
+
{
|
| 573 |
+
"epoch": 0.5848375451263538,
|
| 574 |
+
"grad_norm": 0.3420974016189575,
|
| 575 |
+
"learning_rate": 0.00039058840008543135,
|
| 576 |
+
"loss": 0.6218519806861877,
|
| 577 |
+
"step": 81
|
| 578 |
+
},
|
| 579 |
+
{
|
| 580 |
+
"epoch": 0.592057761732852,
|
| 581 |
+
"grad_norm": 0.3156997263431549,
|
| 582 |
+
"learning_rate": 0.000390337804871808,
|
| 583 |
+
"loss": 0.549630343914032,
|
| 584 |
+
"step": 82
|
| 585 |
+
},
|
| 586 |
+
{
|
| 587 |
+
"epoch": 0.5992779783393501,
|
| 588 |
+
"grad_norm": 0.3494798541069031,
|
| 589 |
+
"learning_rate": 0.00039008399968561597,
|
| 590 |
+
"loss": 0.5499352216720581,
|
| 591 |
+
"step": 83
|
| 592 |
+
},
|
| 593 |
+
{
|
| 594 |
+
"epoch": 0.6064981949458483,
|
| 595 |
+
"grad_norm": 0.3652164936065674,
|
| 596 |
+
"learning_rate": 0.0003898269888071803,
|
| 597 |
+
"loss": 0.5562577843666077,
|
| 598 |
+
"step": 84
|
| 599 |
+
},
|
| 600 |
+
{
|
| 601 |
+
"epoch": 0.6137184115523465,
|
| 602 |
+
"grad_norm": 0.34751319885253906,
|
| 603 |
+
"learning_rate": 0.0003895667765708887,
|
| 604 |
+
"loss": 0.5954532027244568,
|
| 605 |
+
"step": 85
|
| 606 |
+
},
|
| 607 |
+
{
|
| 608 |
+
"epoch": 0.6209386281588448,
|
| 609 |
+
"grad_norm": 0.28338274359703064,
|
| 610 |
+
"learning_rate": 0.0003893033673651189,
|
| 611 |
+
"loss": 0.4894581735134125,
|
| 612 |
+
"step": 86
|
| 613 |
+
},
|
| 614 |
+
{
|
| 615 |
+
"epoch": 0.628158844765343,
|
| 616 |
+
"grad_norm": 0.29019951820373535,
|
| 617 |
+
"learning_rate": 0.00038903676563216394,
|
| 618 |
+
"loss": 0.4635826349258423,
|
| 619 |
+
"step": 87
|
| 620 |
+
},
|
| 621 |
+
{
|
| 622 |
+
"epoch": 0.6353790613718412,
|
| 623 |
+
"grad_norm": 0.2782176434993744,
|
| 624 |
+
"learning_rate": 0.00038876697586815763,
|
| 625 |
+
"loss": 0.4121658205986023,
|
| 626 |
+
"step": 88
|
| 627 |
+
},
|
| 628 |
+
{
|
| 629 |
+
"epoch": 0.6425992779783394,
|
| 630 |
+
"grad_norm": 0.27983078360557556,
|
| 631 |
+
"learning_rate": 0.0003884940026229988,
|
| 632 |
+
"loss": 0.40188780426979065,
|
| 633 |
+
"step": 89
|
| 634 |
+
},
|
| 635 |
+
{
|
| 636 |
+
"epoch": 0.6498194945848376,
|
| 637 |
+
"grad_norm": 0.2786664366722107,
|
| 638 |
+
"learning_rate": 0.0003882178505002744,
|
| 639 |
+
"loss": 0.44132208824157715,
|
| 640 |
+
"step": 90
|
| 641 |
+
},
|
| 642 |
+
{
|
| 643 |
+
"epoch": 0.6570397111913358,
|
| 644 |
+
"grad_norm": 0.3355483412742615,
|
| 645 |
+
"learning_rate": 0.0003879385241571817,
|
| 646 |
+
"loss": 0.512315034866333,
|
| 647 |
+
"step": 91
|
| 648 |
+
},
|
| 649 |
+
{
|
| 650 |
+
"epoch": 0.6642599277978339,
|
| 651 |
+
"grad_norm": 0.29554808139801025,
|
| 652 |
+
"learning_rate": 0.0003876560283044503,
|
| 653 |
+
"loss": 0.4540112018585205,
|
| 654 |
+
"step": 92
|
| 655 |
+
},
|
| 656 |
+
{
|
| 657 |
+
"epoch": 0.6714801444043321,
|
| 658 |
+
"grad_norm": 0.3431720435619354,
|
| 659 |
+
"learning_rate": 0.00038737036770626214,
|
| 660 |
+
"loss": 0.45164141058921814,
|
| 661 |
+
"step": 93
|
| 662 |
+
},
|
| 663 |
+
{
|
| 664 |
+
"epoch": 0.6787003610108303,
|
| 665 |
+
"grad_norm": 0.37090009450912476,
|
| 666 |
+
"learning_rate": 0.0003870815471801714,
|
| 667 |
+
"loss": 0.4878736734390259,
|
| 668 |
+
"step": 94
|
| 669 |
+
},
|
| 670 |
+
{
|
| 671 |
+
"epoch": 0.6859205776173285,
|
| 672 |
+
"grad_norm": 0.35553082823753357,
|
| 673 |
+
"learning_rate": 0.0003867895715970231,
|
| 674 |
+
"loss": 0.5573399662971497,
|
| 675 |
+
"step": 95
|
| 676 |
+
},
|
| 677 |
+
{
|
| 678 |
+
"epoch": 0.6931407942238267,
|
| 679 |
+
"grad_norm": 0.30914071202278137,
|
| 680 |
+
"learning_rate": 0.00038649444588087115,
|
| 681 |
+
"loss": 0.5417919754981995,
|
| 682 |
+
"step": 96
|
| 683 |
+
},
|
| 684 |
+
{
|
| 685 |
+
"epoch": 0.7003610108303249,
|
| 686 |
+
"grad_norm": 0.27384090423583984,
|
| 687 |
+
"learning_rate": 0.0003861961750088954,
|
| 688 |
+
"loss": 0.4475242793560028,
|
| 689 |
+
"step": 97
|
| 690 |
+
},
|
| 691 |
+
{
|
| 692 |
+
"epoch": 0.7075812274368231,
|
| 693 |
+
"grad_norm": 0.2919006049633026,
|
| 694 |
+
"learning_rate": 0.0003858947640113171,
|
| 695 |
+
"loss": 0.44341611862182617,
|
| 696 |
+
"step": 98
|
| 697 |
+
},
|
| 698 |
+
{
|
| 699 |
+
"epoch": 0.7148014440433214,
|
| 700 |
+
"grad_norm": 0.33408623933792114,
|
| 701 |
+
"learning_rate": 0.000385590217971315,
|
| 702 |
+
"loss": 0.5056685209274292,
|
| 703 |
+
"step": 99
|
| 704 |
+
},
|
| 705 |
+
{
|
| 706 |
+
"epoch": 0.7220216606498195,
|
| 707 |
+
"grad_norm": 0.3498390018939972,
|
| 708 |
+
"learning_rate": 0.0003852825420249386,
|
| 709 |
+
"loss": 0.45975226163864136,
|
| 710 |
+
"step": 100
|
| 711 |
+
},
|
| 712 |
+
{
|
| 713 |
+
"epoch": 0.7292418772563177,
|
| 714 |
+
"grad_norm": 0.32381942868232727,
|
| 715 |
+
"learning_rate": 0.0003849717413610224,
|
| 716 |
+
"loss": 0.43437302112579346,
|
| 717 |
+
"step": 101
|
| 718 |
+
},
|
| 719 |
+
{
|
| 720 |
+
"epoch": 0.7364620938628159,
|
| 721 |
+
"grad_norm": 0.30022308230400085,
|
| 722 |
+
"learning_rate": 0.0003846578212210979,
|
| 723 |
+
"loss": 0.41799411177635193,
|
| 724 |
+
"step": 102
|
| 725 |
+
},
|
| 726 |
+
{
|
| 727 |
+
"epoch": 0.7436823104693141,
|
| 728 |
+
"grad_norm": 0.31061094999313354,
|
| 729 |
+
"learning_rate": 0.0003843407868993054,
|
| 730 |
+
"loss": 0.5682204365730286,
|
| 731 |
+
"step": 103
|
| 732 |
+
},
|
| 733 |
+
{
|
| 734 |
+
"epoch": 0.7509025270758123,
|
| 735 |
+
"grad_norm": 0.31062883138656616,
|
| 736 |
+
"learning_rate": 0.0003840206437423047,
|
| 737 |
+
"loss": 0.3520132303237915,
|
| 738 |
+
"step": 104
|
| 739 |
+
},
|
| 740 |
+
{
|
| 741 |
+
"epoch": 0.7581227436823105,
|
| 742 |
+
"grad_norm": 0.36826908588409424,
|
| 743 |
+
"learning_rate": 0.00038369739714918464,
|
| 744 |
+
"loss": 0.546819269657135,
|
| 745 |
+
"step": 105
|
| 746 |
+
},
|
| 747 |
+
{
|
| 748 |
+
"epoch": 0.7653429602888087,
|
| 749 |
+
"grad_norm": 0.35304203629493713,
|
| 750 |
+
"learning_rate": 0.00038337105257137263,
|
| 751 |
+
"loss": 0.5633726716041565,
|
| 752 |
+
"step": 106
|
| 753 |
+
},
|
| 754 |
+
{
|
| 755 |
+
"epoch": 0.7725631768953068,
|
| 756 |
+
"grad_norm": 0.2879215478897095,
|
| 757 |
+
"learning_rate": 0.00038304161551254207,
|
| 758 |
+
"loss": 0.42212507128715515,
|
| 759 |
+
"step": 107
|
| 760 |
+
},
|
| 761 |
+
{
|
| 762 |
+
"epoch": 0.779783393501805,
|
| 763 |
+
"grad_norm": 0.32802048325538635,
|
| 764 |
+
"learning_rate": 0.0003827090915285202,
|
| 765 |
+
"loss": 0.4973101019859314,
|
| 766 |
+
"step": 108
|
| 767 |
+
},
|
| 768 |
+
{
|
| 769 |
+
"epoch": 0.7870036101083032,
|
| 770 |
+
"grad_norm": 0.29462599754333496,
|
| 771 |
+
"learning_rate": 0.0003823734862271937,
|
| 772 |
+
"loss": 0.4543662667274475,
|
| 773 |
+
"step": 109
|
| 774 |
+
},
|
| 775 |
+
{
|
| 776 |
+
"epoch": 0.7942238267148014,
|
| 777 |
+
"grad_norm": 0.34288832545280457,
|
| 778 |
+
"learning_rate": 0.0003820348052684146,
|
| 779 |
+
"loss": 0.5599743127822876,
|
| 780 |
+
"step": 110
|
| 781 |
+
},
|
| 782 |
+
{
|
| 783 |
+
"epoch": 0.8014440433212996,
|
| 784 |
+
"grad_norm": 0.2871699333190918,
|
| 785 |
+
"learning_rate": 0.00038169305436390477,
|
| 786 |
+
"loss": 0.5132560133934021,
|
| 787 |
+
"step": 111
|
| 788 |
+
},
|
| 789 |
+
{
|
| 790 |
+
"epoch": 0.8086642599277978,
|
| 791 |
+
"grad_norm": 0.3307580053806305,
|
| 792 |
+
"learning_rate": 0.00038134823927715933,
|
| 793 |
+
"loss": 0.5319223403930664,
|
| 794 |
+
"step": 112
|
| 795 |
+
},
|
| 796 |
+
{
|
| 797 |
+
"epoch": 0.8158844765342961,
|
| 798 |
+
"grad_norm": 0.3292873799800873,
|
| 799 |
+
"learning_rate": 0.0003810003658233498,
|
| 800 |
+
"loss": 0.5933513045310974,
|
| 801 |
+
"step": 113
|
| 802 |
+
},
|
| 803 |
+
{
|
| 804 |
+
"epoch": 0.8231046931407943,
|
| 805 |
+
"grad_norm": 0.34675127267837524,
|
| 806 |
+
"learning_rate": 0.0003806494398692258,
|
| 807 |
+
"loss": 0.6370081901550293,
|
| 808 |
+
"step": 114
|
| 809 |
+
},
|
| 810 |
+
{
|
| 811 |
+
"epoch": 0.8303249097472925,
|
| 812 |
+
"grad_norm": 0.31837624311447144,
|
| 813 |
+
"learning_rate": 0.00038029546733301615,
|
| 814 |
+
"loss": 0.44530773162841797,
|
| 815 |
+
"step": 115
|
| 816 |
+
},
|
| 817 |
+
{
|
| 818 |
+
"epoch": 0.8375451263537906,
|
| 819 |
+
"grad_norm": 0.3014152944087982,
|
| 820 |
+
"learning_rate": 0.0003799384541843291,
|
| 821 |
+
"loss": 0.5310161113739014,
|
| 822 |
+
"step": 116
|
| 823 |
+
},
|
| 824 |
+
{
|
| 825 |
+
"epoch": 0.8447653429602888,
|
| 826 |
+
"grad_norm": 0.30693644285202026,
|
| 827 |
+
"learning_rate": 0.00037957840644405164,
|
| 828 |
+
"loss": 0.5011177659034729,
|
| 829 |
+
"step": 117
|
| 830 |
+
},
|
| 831 |
+
{
|
| 832 |
+
"epoch": 0.851985559566787,
|
| 833 |
+
"grad_norm": 0.2840467095375061,
|
| 834 |
+
"learning_rate": 0.000379215330184248,
|
| 835 |
+
"loss": 0.37618446350097656,
|
| 836 |
+
"step": 118
|
| 837 |
+
},
|
| 838 |
+
{
|
| 839 |
+
"epoch": 0.8592057761732852,
|
| 840 |
+
"grad_norm": 0.3380180597305298,
|
| 841 |
+
"learning_rate": 0.00037884923152805715,
|
| 842 |
+
"loss": 0.5536396503448486,
|
| 843 |
+
"step": 119
|
| 844 |
+
},
|
| 845 |
+
{
|
| 846 |
+
"epoch": 0.8664259927797834,
|
| 847 |
+
"grad_norm": 0.30026137828826904,
|
| 848 |
+
"learning_rate": 0.00037848011664958956,
|
| 849 |
+
"loss": 0.5487097501754761,
|
| 850 |
+
"step": 120
|
| 851 |
+
},
|
| 852 |
+
{
|
| 853 |
+
"epoch": 0.8736462093862816,
|
| 854 |
+
"grad_norm": 0.3990669250488281,
|
| 855 |
+
"learning_rate": 0.00037810799177382325,
|
| 856 |
+
"loss": 0.34712734818458557,
|
| 857 |
+
"step": 121
|
| 858 |
+
},
|
| 859 |
+
{
|
| 860 |
+
"epoch": 0.8808664259927798,
|
| 861 |
+
"grad_norm": 0.3168427646160126,
|
| 862 |
+
"learning_rate": 0.0003777328631764986,
|
| 863 |
+
"loss": 0.44405245780944824,
|
| 864 |
+
"step": 122
|
| 865 |
+
},
|
| 866 |
+
{
|
| 867 |
+
"epoch": 0.8880866425992779,
|
| 868 |
+
"grad_norm": 0.2761262059211731,
|
| 869 |
+
"learning_rate": 0.0003773547371840124,
|
| 870 |
+
"loss": 0.4112606942653656,
|
| 871 |
+
"step": 123
|
| 872 |
+
},
|
| 873 |
+
{
|
| 874 |
+
"epoch": 0.8953068592057761,
|
| 875 |
+
"grad_norm": 0.27056002616882324,
|
| 876 |
+
"learning_rate": 0.00037697362017331164,
|
| 877 |
+
"loss": 0.45218032598495483,
|
| 878 |
+
"step": 124
|
| 879 |
+
},
|
| 880 |
+
{
|
| 881 |
+
"epoch": 0.9025270758122743,
|
| 882 |
+
"grad_norm": 0.2833767831325531,
|
| 883 |
+
"learning_rate": 0.00037658951857178543,
|
| 884 |
+
"loss": 0.4833817481994629,
|
| 885 |
+
"step": 125
|
| 886 |
+
},
|
| 887 |
+
{
|
| 888 |
+
"epoch": 0.9097472924187726,
|
| 889 |
+
"grad_norm": 0.30818742513656616,
|
| 890 |
+
"learning_rate": 0.0003762024388571569,
|
| 891 |
+
"loss": 0.4847618341445923,
|
| 892 |
+
"step": 126
|
| 893 |
+
},
|
| 894 |
+
{
|
| 895 |
+
"epoch": 0.9169675090252708,
|
| 896 |
+
"grad_norm": 0.32447490096092224,
|
| 897 |
+
"learning_rate": 0.00037581238755737405,
|
| 898 |
+
"loss": 0.5068320035934448,
|
| 899 |
+
"step": 127
|
| 900 |
+
},
|
| 901 |
+
{
|
| 902 |
+
"epoch": 0.924187725631769,
|
| 903 |
+
"grad_norm": 0.307781845331192,
|
| 904 |
+
"learning_rate": 0.0003754193712504992,
|
| 905 |
+
"loss": 0.455619752407074,
|
| 906 |
+
"step": 128
|
| 907 |
+
},
|
| 908 |
+
{
|
| 909 |
+
"epoch": 0.9314079422382672,
|
| 910 |
+
"grad_norm": 0.29909971356391907,
|
| 911 |
+
"learning_rate": 0.00037502339656459853,
|
| 912 |
+
"loss": 0.5618020296096802,
|
| 913 |
+
"step": 129
|
| 914 |
+
},
|
| 915 |
+
{
|
| 916 |
+
"epoch": 0.9386281588447654,
|
| 917 |
+
"grad_norm": 0.33699020743370056,
|
| 918 |
+
"learning_rate": 0.0003746244701776302,
|
| 919 |
+
"loss": 0.50435870885849,
|
| 920 |
+
"step": 130
|
| 921 |
+
},
|
| 922 |
+
{
|
| 923 |
+
"epoch": 0.9458483754512635,
|
| 924 |
+
"grad_norm": 0.2932925820350647,
|
| 925 |
+
"learning_rate": 0.0003742225988173315,
|
| 926 |
+
"loss": 0.503471314907074,
|
| 927 |
+
"step": 131
|
| 928 |
+
},
|
| 929 |
+
{
|
| 930 |
+
"epoch": 0.9530685920577617,
|
| 931 |
+
"grad_norm": 0.27647075057029724,
|
| 932 |
+
"learning_rate": 0.00037381778926110567,
|
| 933 |
+
"loss": 0.4979417324066162,
|
| 934 |
+
"step": 132
|
| 935 |
+
},
|
| 936 |
+
{
|
| 937 |
+
"epoch": 0.9602888086642599,
|
| 938 |
+
"grad_norm": 0.23902934789657593,
|
| 939 |
+
"learning_rate": 0.00037341004833590734,
|
| 940 |
+
"loss": 0.4127359390258789,
|
| 941 |
+
"step": 133
|
| 942 |
+
},
|
| 943 |
+
{
|
| 944 |
+
"epoch": 0.9675090252707581,
|
| 945 |
+
"grad_norm": 0.3308359980583191,
|
| 946 |
+
"learning_rate": 0.0003729993829181276,
|
| 947 |
+
"loss": 0.6199836730957031,
|
| 948 |
+
"step": 134
|
| 949 |
+
},
|
| 950 |
+
{
|
| 951 |
+
"epoch": 0.9747292418772563,
|
| 952 |
+
"grad_norm": 0.30997487902641296,
|
| 953 |
+
"learning_rate": 0.00037258579993347795,
|
| 954 |
+
"loss": 0.5043972134590149,
|
| 955 |
+
"step": 135
|
| 956 |
+
},
|
| 957 |
+
{
|
| 958 |
+
"epoch": 0.9819494584837545,
|
| 959 |
+
"grad_norm": 0.5225651264190674,
|
| 960 |
+
"learning_rate": 0.00037216930635687357,
|
| 961 |
+
"loss": 0.5078832507133484,
|
| 962 |
+
"step": 136
|
| 963 |
+
},
|
| 964 |
+
{
|
| 965 |
+
"epoch": 0.9891696750902527,
|
| 966 |
+
"grad_norm": 0.2910468280315399,
|
| 967 |
+
"learning_rate": 0.00037174990921231557,
|
| 968 |
+
"loss": 0.5478032827377319,
|
| 969 |
+
"step": 137
|
| 970 |
+
},
|
| 971 |
+
{
|
| 972 |
+
"epoch": 0.9963898916967509,
|
| 973 |
+
"grad_norm": 0.3448226749897003,
|
| 974 |
+
"learning_rate": 0.00037132761557277257,
|
| 975 |
+
"loss": 0.5461761355400085,
|
| 976 |
+
"step": 138
|
| 977 |
+
},
|
| 978 |
+
{
|
| 979 |
+
"epoch": 1.0,
|
| 980 |
+
"grad_norm": 0.5731388926506042,
|
| 981 |
+
"learning_rate": 0.00037090243256006155,
|
| 982 |
+
"loss": 0.39478886127471924,
|
| 983 |
+
"step": 139
|
| 984 |
+
},
|
| 985 |
+
{
|
| 986 |
+
"epoch": 1.0072202166064983,
|
| 987 |
+
"grad_norm": 0.3017331659793854,
|
| 988 |
+
"learning_rate": 0.0003704743673447276,
|
| 989 |
+
"loss": 0.3729703426361084,
|
| 990 |
+
"step": 140
|
| 991 |
+
},
|
| 992 |
+
{
|
| 993 |
+
"epoch": 1.0144404332129964,
|
| 994 |
+
"grad_norm": 0.29272574186325073,
|
| 995 |
+
"learning_rate": 0.0003700434271459229,
|
| 996 |
+
"loss": 0.45498228073120117,
|
| 997 |
+
"step": 141
|
| 998 |
+
},
|
| 999 |
+
{
|
| 1000 |
+
"epoch": 1.0216606498194947,
|
| 1001 |
+
"grad_norm": 0.2818097770214081,
|
| 1002 |
+
"learning_rate": 0.0003696096192312852,
|
| 1003 |
+
"loss": 0.37411680817604065,
|
| 1004 |
+
"step": 142
|
| 1005 |
+
},
|
| 1006 |
+
{
|
| 1007 |
+
"epoch": 1.0288808664259927,
|
| 1008 |
+
"grad_norm": 0.31325557827949524,
|
| 1009 |
+
"learning_rate": 0.00036917295091681526,
|
| 1010 |
+
"loss": 0.4299224019050598,
|
| 1011 |
+
"step": 143
|
| 1012 |
+
},
|
| 1013 |
+
{
|
| 1014 |
+
"epoch": 1.036101083032491,
|
| 1015 |
+
"grad_norm": 0.2971343994140625,
|
| 1016 |
+
"learning_rate": 0.0003687334295667533,
|
| 1017 |
+
"loss": 0.4103966951370239,
|
| 1018 |
+
"step": 144
|
| 1019 |
+
},
|
| 1020 |
+
{
|
| 1021 |
+
"epoch": 1.0433212996389891,
|
| 1022 |
+
"grad_norm": 0.32004889845848083,
|
| 1023 |
+
"learning_rate": 0.00036829106259345465,
|
| 1024 |
+
"loss": 0.49494248628616333,
|
| 1025 |
+
"step": 145
|
| 1026 |
+
},
|
| 1027 |
+
{
|
| 1028 |
+
"epoch": 1.0505415162454874,
|
| 1029 |
+
"grad_norm": 0.29688122868537903,
|
| 1030 |
+
"learning_rate": 0.00036784585745726535,
|
| 1031 |
+
"loss": 0.4550933241844177,
|
| 1032 |
+
"step": 146
|
| 1033 |
+
},
|
| 1034 |
+
{
|
| 1035 |
+
"epoch": 1.0577617328519855,
|
| 1036 |
+
"grad_norm": 0.3322184681892395,
|
| 1037 |
+
"learning_rate": 0.00036739782166639556,
|
| 1038 |
+
"loss": 0.46367114782333374,
|
| 1039 |
+
"step": 147
|
| 1040 |
+
},
|
| 1041 |
+
{
|
| 1042 |
+
"epoch": 1.0649819494584838,
|
| 1043 |
+
"grad_norm": 0.267844021320343,
|
| 1044 |
+
"learning_rate": 0.00036694696277679367,
|
| 1045 |
+
"loss": 0.33760106563568115,
|
| 1046 |
+
"step": 148
|
| 1047 |
+
},
|
| 1048 |
+
{
|
| 1049 |
+
"epoch": 1.0722021660649819,
|
| 1050 |
+
"grad_norm": 0.3240787386894226,
|
| 1051 |
+
"learning_rate": 0.0003664932883920182,
|
| 1052 |
+
"loss": 0.43709027767181396,
|
| 1053 |
+
"step": 149
|
| 1054 |
+
},
|
| 1055 |
+
{
|
| 1056 |
+
"epoch": 1.0794223826714802,
|
| 1057 |
+
"grad_norm": 0.29441356658935547,
|
| 1058 |
+
"learning_rate": 0.00036603680616311015,
|
| 1059 |
+
"loss": 0.4205693304538727,
|
| 1060 |
+
"step": 150
|
| 1061 |
+
},
|
| 1062 |
+
{
|
| 1063 |
+
"epoch": 1.0866425992779782,
|
| 1064 |
+
"grad_norm": 0.33195292949676514,
|
| 1065 |
+
"learning_rate": 0.00036557752378846357,
|
| 1066 |
+
"loss": 0.44472751021385193,
|
| 1067 |
+
"step": 151
|
| 1068 |
+
},
|
| 1069 |
+
{
|
| 1070 |
+
"epoch": 1.0938628158844765,
|
| 1071 |
+
"grad_norm": 0.3113086223602295,
|
| 1072 |
+
"learning_rate": 0.00036511544901369597,
|
| 1073 |
+
"loss": 0.3894999921321869,
|
| 1074 |
+
"step": 152
|
| 1075 |
+
},
|
| 1076 |
+
{
|
| 1077 |
+
"epoch": 1.1010830324909748,
|
| 1078 |
+
"grad_norm": 0.30926311016082764,
|
| 1079 |
+
"learning_rate": 0.00036465058963151744,
|
| 1080 |
+
"loss": 0.33893927931785583,
|
| 1081 |
+
"step": 153
|
| 1082 |
+
},
|
| 1083 |
+
{
|
| 1084 |
+
"epoch": 1.108303249097473,
|
| 1085 |
+
"grad_norm": 0.31725767254829407,
|
| 1086 |
+
"learning_rate": 0.00036418295348159967,
|
| 1087 |
+
"loss": 0.4384872019290924,
|
| 1088 |
+
"step": 154
|
| 1089 |
+
},
|
| 1090 |
+
{
|
| 1091 |
+
"epoch": 1.1155234657039712,
|
| 1092 |
+
"grad_norm": 0.3411625027656555,
|
| 1093 |
+
"learning_rate": 0.00036371254845044297,
|
| 1094 |
+
"loss": 0.4130849838256836,
|
| 1095 |
+
"step": 155
|
| 1096 |
+
},
|
| 1097 |
+
{
|
| 1098 |
+
"epoch": 1.1227436823104693,
|
| 1099 |
+
"grad_norm": 0.3470022976398468,
|
| 1100 |
+
"learning_rate": 0.0003632393824712444,
|
| 1101 |
+
"loss": 0.4436883330345154,
|
| 1102 |
+
"step": 156
|
| 1103 |
+
},
|
| 1104 |
+
{
|
| 1105 |
+
"epoch": 1.1299638989169676,
|
| 1106 |
+
"grad_norm": 0.31315702199935913,
|
| 1107 |
+
"learning_rate": 0.00036276346352376266,
|
| 1108 |
+
"loss": 0.39922523498535156,
|
| 1109 |
+
"step": 157
|
| 1110 |
+
},
|
| 1111 |
+
{
|
| 1112 |
+
"epoch": 1.1371841155234657,
|
| 1113 |
+
"grad_norm": 0.36140701174736023,
|
| 1114 |
+
"learning_rate": 0.00036228479963418465,
|
| 1115 |
+
"loss": 0.44266432523727417,
|
| 1116 |
+
"step": 158
|
| 1117 |
+
},
|
| 1118 |
+
{
|
| 1119 |
+
"epoch": 1.144404332129964,
|
| 1120 |
+
"grad_norm": 0.37621912360191345,
|
| 1121 |
+
"learning_rate": 0.0003618033988749895,
|
| 1122 |
+
"loss": 0.3703776001930237,
|
| 1123 |
+
"step": 159
|
| 1124 |
+
},
|
| 1125 |
+
{
|
| 1126 |
+
"epoch": 1.151624548736462,
|
| 1127 |
+
"grad_norm": 0.40457242727279663,
|
| 1128 |
+
"learning_rate": 0.0003613192693648125,
|
| 1129 |
+
"loss": 0.48410341143608093,
|
| 1130 |
+
"step": 160
|
| 1131 |
+
},
|
| 1132 |
+
{
|
| 1133 |
+
"epoch": 1.1588447653429603,
|
| 1134 |
+
"grad_norm": 0.35907864570617676,
|
| 1135 |
+
"learning_rate": 0.00036083241926830833,
|
| 1136 |
+
"loss": 0.3249608874320984,
|
| 1137 |
+
"step": 161
|
| 1138 |
+
},
|
| 1139 |
+
{
|
| 1140 |
+
"epoch": 1.1660649819494584,
|
| 1141 |
+
"grad_norm": 0.3328985869884491,
|
| 1142 |
+
"learning_rate": 0.00036034285679601336,
|
| 1143 |
+
"loss": 0.3642440140247345,
|
| 1144 |
+
"step": 162
|
| 1145 |
+
},
|
| 1146 |
+
{
|
| 1147 |
+
"epoch": 1.1732851985559567,
|
| 1148 |
+
"grad_norm": 0.3639651834964752,
|
| 1149 |
+
"learning_rate": 0.00035985059020420695,
|
| 1150 |
+
"loss": 0.4125223457813263,
|
| 1151 |
+
"step": 163
|
| 1152 |
+
},
|
| 1153 |
+
{
|
| 1154 |
+
"epoch": 1.1805054151624548,
|
| 1155 |
+
"grad_norm": 0.3122009038925171,
|
| 1156 |
+
"learning_rate": 0.0003593556277947725,
|
| 1157 |
+
"loss": 0.26333218812942505,
|
| 1158 |
+
"step": 164
|
| 1159 |
+
},
|
| 1160 |
+
{
|
| 1161 |
+
"epoch": 1.187725631768953,
|
| 1162 |
+
"grad_norm": 0.3917737901210785,
|
| 1163 |
+
"learning_rate": 0.0003588579779150572,
|
| 1164 |
+
"loss": 0.41683149337768555,
|
| 1165 |
+
"step": 165
|
| 1166 |
+
},
|
| 1167 |
+
{
|
| 1168 |
+
"epoch": 1.1949458483754514,
|
| 1169 |
+
"grad_norm": 0.3892008066177368,
|
| 1170 |
+
"learning_rate": 0.00035835764895773164,
|
| 1171 |
+
"loss": 0.34965166449546814,
|
| 1172 |
+
"step": 166
|
| 1173 |
+
},
|
| 1174 |
+
{
|
| 1175 |
+
"epoch": 1.2021660649819494,
|
| 1176 |
+
"grad_norm": 0.32206663489341736,
|
| 1177 |
+
"learning_rate": 0.0003578546493606477,
|
| 1178 |
+
"loss": 0.3289134204387665,
|
| 1179 |
+
"step": 167
|
| 1180 |
+
},
|
| 1181 |
+
{
|
| 1182 |
+
"epoch": 1.2093862815884477,
|
| 1183 |
+
"grad_norm": 0.373098760843277,
|
| 1184 |
+
"learning_rate": 0.0003573489876066967,
|
| 1185 |
+
"loss": 0.37044239044189453,
|
| 1186 |
+
"step": 168
|
| 1187 |
+
},
|
| 1188 |
+
{
|
| 1189 |
+
"epoch": 1.2166064981949458,
|
| 1190 |
+
"grad_norm": 0.4301343262195587,
|
| 1191 |
+
"learning_rate": 0.00035684067222366614,
|
| 1192 |
+
"loss": 0.46339157223701477,
|
| 1193 |
+
"step": 169
|
| 1194 |
+
},
|
| 1195 |
+
{
|
| 1196 |
+
"epoch": 1.2238267148014441,
|
| 1197 |
+
"grad_norm": 0.3458724915981293,
|
| 1198 |
+
"learning_rate": 0.00035632971178409603,
|
| 1199 |
+
"loss": 0.41736456751823425,
|
| 1200 |
+
"step": 170
|
| 1201 |
+
},
|
| 1202 |
+
{
|
| 1203 |
+
"epoch": 1.2310469314079422,
|
| 1204 |
+
"grad_norm": 0.45238223671913147,
|
| 1205 |
+
"learning_rate": 0.0003558161149051341,
|
| 1206 |
+
"loss": 0.4182761311531067,
|
| 1207 |
+
"step": 171
|
| 1208 |
+
},
|
| 1209 |
+
{
|
| 1210 |
+
"epoch": 1.2382671480144405,
|
| 1211 |
+
"grad_norm": 0.32411810755729675,
|
| 1212 |
+
"learning_rate": 0.0003552998902483907,
|
| 1213 |
+
"loss": 0.30536049604415894,
|
| 1214 |
+
"step": 172
|
| 1215 |
+
},
|
| 1216 |
+
{
|
| 1217 |
+
"epoch": 1.2454873646209386,
|
| 1218 |
+
"grad_norm": 0.40648043155670166,
|
| 1219 |
+
"learning_rate": 0.0003547810465197926,
|
| 1220 |
+
"loss": 0.45940107107162476,
|
| 1221 |
+
"step": 173
|
| 1222 |
+
},
|
| 1223 |
+
{
|
| 1224 |
+
"epoch": 1.2527075812274369,
|
| 1225 |
+
"grad_norm": 0.34474775195121765,
|
| 1226 |
+
"learning_rate": 0.00035425959246943614,
|
| 1227 |
+
"loss": 0.4267578423023224,
|
| 1228 |
+
"step": 174
|
| 1229 |
+
},
|
| 1230 |
+
{
|
| 1231 |
+
"epoch": 1.259927797833935,
|
| 1232 |
+
"grad_norm": 0.33473461866378784,
|
| 1233 |
+
"learning_rate": 0.00035373553689143977,
|
| 1234 |
+
"loss": 0.31750980019569397,
|
| 1235 |
+
"step": 175
|
| 1236 |
+
},
|
| 1237 |
+
{
|
| 1238 |
+
"epoch": 1.2671480144404332,
|
| 1239 |
+
"grad_norm": 0.29968079924583435,
|
| 1240 |
+
"learning_rate": 0.0003532088886237956,
|
| 1241 |
+
"loss": 0.3412264883518219,
|
| 1242 |
+
"step": 176
|
| 1243 |
+
},
|
| 1244 |
+
{
|
| 1245 |
+
"epoch": 1.2743682310469313,
|
| 1246 |
+
"grad_norm": 0.3362952172756195,
|
| 1247 |
+
"learning_rate": 0.00035267965654822063,
|
| 1248 |
+
"loss": 0.347223162651062,
|
| 1249 |
+
"step": 177
|
| 1250 |
+
},
|
| 1251 |
+
{
|
| 1252 |
+
"epoch": 1.2815884476534296,
|
| 1253 |
+
"grad_norm": 0.38441580533981323,
|
| 1254 |
+
"learning_rate": 0.0003521478495900065,
|
| 1255 |
+
"loss": 0.4132072925567627,
|
| 1256 |
+
"step": 178
|
| 1257 |
+
},
|
| 1258 |
+
{
|
| 1259 |
+
"epoch": 1.288808664259928,
|
| 1260 |
+
"grad_norm": 0.3259715437889099,
|
| 1261 |
+
"learning_rate": 0.00035161347671786947,
|
| 1262 |
+
"loss": 0.3259287476539612,
|
| 1263 |
+
"step": 179
|
| 1264 |
+
},
|
| 1265 |
+
{
|
| 1266 |
+
"epoch": 1.296028880866426,
|
| 1267 |
+
"grad_norm": 0.30564218759536743,
|
| 1268 |
+
"learning_rate": 0.00035107654694379876,
|
| 1269 |
+
"loss": 0.33284130692481995,
|
| 1270 |
+
"step": 180
|
| 1271 |
+
},
|
| 1272 |
+
{
|
| 1273 |
+
"epoch": 1.303249097472924,
|
| 1274 |
+
"grad_norm": 0.3464779853820801,
|
| 1275 |
+
"learning_rate": 0.0003505370693229049,
|
| 1276 |
+
"loss": 0.3613452613353729,
|
| 1277 |
+
"step": 181
|
| 1278 |
+
},
|
| 1279 |
+
{
|
| 1280 |
+
"epoch": 1.3104693140794224,
|
| 1281 |
+
"grad_norm": 0.4113422632217407,
|
| 1282 |
+
"learning_rate": 0.0003499950529532668,
|
| 1283 |
+
"loss": 0.49952858686447144,
|
| 1284 |
+
"step": 182
|
| 1285 |
+
},
|
| 1286 |
+
{
|
| 1287 |
+
"epoch": 1.3176895306859207,
|
| 1288 |
+
"grad_norm": 0.3503414988517761,
|
| 1289 |
+
"learning_rate": 0.0003494505069757782,
|
| 1290 |
+
"loss": 0.43928611278533936,
|
| 1291 |
+
"step": 183
|
| 1292 |
+
},
|
| 1293 |
+
{
|
| 1294 |
+
"epoch": 1.3249097472924187,
|
| 1295 |
+
"grad_norm": 0.3231402337551117,
|
| 1296 |
+
"learning_rate": 0.000348903440573994,
|
| 1297 |
+
"loss": 0.35302072763442993,
|
| 1298 |
+
"step": 184
|
| 1299 |
+
},
|
| 1300 |
+
{
|
| 1301 |
+
"epoch": 1.332129963898917,
|
| 1302 |
+
"grad_norm": 0.3849830627441406,
|
| 1303 |
+
"learning_rate": 0.00034835386297397486,
|
| 1304 |
+
"loss": 0.42382097244262695,
|
| 1305 |
+
"step": 185
|
| 1306 |
+
},
|
| 1307 |
+
{
|
| 1308 |
+
"epoch": 1.339350180505415,
|
| 1309 |
+
"grad_norm": 0.35116714239120483,
|
| 1310 |
+
"learning_rate": 0.00034780178344413185,
|
| 1311 |
+
"loss": 0.3274853229522705,
|
| 1312 |
+
"step": 186
|
| 1313 |
+
},
|
| 1314 |
+
{
|
| 1315 |
+
"epoch": 1.3465703971119134,
|
| 1316 |
+
"grad_norm": 0.3941578269004822,
|
| 1317 |
+
"learning_rate": 0.0003472472112950701,
|
| 1318 |
+
"loss": 0.34617680311203003,
|
| 1319 |
+
"step": 187
|
| 1320 |
+
},
|
| 1321 |
+
{
|
| 1322 |
+
"epoch": 1.3537906137184115,
|
| 1323 |
+
"grad_norm": 0.32104700803756714,
|
| 1324 |
+
"learning_rate": 0.00034669015587943184,
|
| 1325 |
+
"loss": 0.39410364627838135,
|
| 1326 |
+
"step": 188
|
| 1327 |
+
},
|
| 1328 |
+
{
|
| 1329 |
+
"epoch": 1.3610108303249098,
|
| 1330 |
+
"grad_norm": 0.42431211471557617,
|
| 1331 |
+
"learning_rate": 0.00034613062659173867,
|
| 1332 |
+
"loss": 0.49896761775016785,
|
| 1333 |
+
"step": 189
|
| 1334 |
+
},
|
| 1335 |
+
{
|
| 1336 |
+
"epoch": 1.3682310469314078,
|
| 1337 |
+
"grad_norm": 0.4387979209423065,
|
| 1338 |
+
"learning_rate": 0.00034556863286823284,
|
| 1339 |
+
"loss": 0.4435005784034729,
|
| 1340 |
+
"step": 190
|
| 1341 |
+
},
|
| 1342 |
+
{
|
| 1343 |
+
"epoch": 1.3754512635379061,
|
| 1344 |
+
"grad_norm": 0.3983216881752014,
|
| 1345 |
+
"learning_rate": 0.00034500418418671855,
|
| 1346 |
+
"loss": 0.44415876269340515,
|
| 1347 |
+
"step": 191
|
| 1348 |
+
},
|
| 1349 |
+
{
|
| 1350 |
+
"epoch": 1.3826714801444044,
|
| 1351 |
+
"grad_norm": 0.30740320682525635,
|
| 1352 |
+
"learning_rate": 0.00034443729006640184,
|
| 1353 |
+
"loss": 0.36664414405822754,
|
| 1354 |
+
"step": 192
|
| 1355 |
+
},
|
| 1356 |
+
{
|
| 1357 |
+
"epoch": 1.3898916967509025,
|
| 1358 |
+
"grad_norm": 0.35397860407829285,
|
| 1359 |
+
"learning_rate": 0.0003438679600677302,
|
| 1360 |
+
"loss": 0.36680418252944946,
|
| 1361 |
+
"step": 193
|
| 1362 |
+
},
|
| 1363 |
+
{
|
| 1364 |
+
"epoch": 1.3971119133574006,
|
| 1365 |
+
"grad_norm": 0.3522591292858124,
|
| 1366 |
+
"learning_rate": 0.0003432962037922312,
|
| 1367 |
+
"loss": 0.3908054232597351,
|
| 1368 |
+
"step": 194
|
| 1369 |
+
},
|
| 1370 |
+
{
|
| 1371 |
+
"epoch": 1.404332129963899,
|
| 1372 |
+
"grad_norm": 0.36350661516189575,
|
| 1373 |
+
"learning_rate": 0.0003427220308823505,
|
| 1374 |
+
"loss": 0.34363672137260437,
|
| 1375 |
+
"step": 195
|
| 1376 |
+
},
|
| 1377 |
+
{
|
| 1378 |
+
"epoch": 1.4115523465703972,
|
| 1379 |
+
"grad_norm": 0.3392064869403839,
|
| 1380 |
+
"learning_rate": 0.00034214545102128946,
|
| 1381 |
+
"loss": 0.40172988176345825,
|
| 1382 |
+
"step": 196
|
| 1383 |
+
},
|
| 1384 |
+
{
|
| 1385 |
+
"epoch": 1.4187725631768953,
|
| 1386 |
+
"grad_norm": 0.3826808035373688,
|
| 1387 |
+
"learning_rate": 0.0003415664739328418,
|
| 1388 |
+
"loss": 0.4292600452899933,
|
| 1389 |
+
"step": 197
|
| 1390 |
+
},
|
| 1391 |
+
{
|
| 1392 |
+
"epoch": 1.4259927797833936,
|
| 1393 |
+
"grad_norm": 0.4102179706096649,
|
| 1394 |
+
"learning_rate": 0.00034098510938122947,
|
| 1395 |
+
"loss": 0.40238481760025024,
|
| 1396 |
+
"step": 198
|
| 1397 |
+
},
|
| 1398 |
+
{
|
| 1399 |
+
"epoch": 1.4332129963898916,
|
| 1400 |
+
"grad_norm": 0.38712596893310547,
|
| 1401 |
+
"learning_rate": 0.00034040136717093796,
|
| 1402 |
+
"loss": 0.3980088233947754,
|
| 1403 |
+
"step": 199
|
| 1404 |
+
},
|
| 1405 |
+
{
|
| 1406 |
+
"epoch": 1.44043321299639,
|
| 1407 |
+
"grad_norm": 0.35182803869247437,
|
| 1408 |
+
"learning_rate": 0.0003398152571465512,
|
| 1409 |
+
"loss": 0.3569096028804779,
|
| 1410 |
+
"step": 200
|
| 1411 |
+
},
|
| 1412 |
+
{
|
| 1413 |
+
"epoch": 1.447653429602888,
|
| 1414 |
+
"grad_norm": 0.4129750728607178,
|
| 1415 |
+
"learning_rate": 0.0003392267891925854,
|
| 1416 |
+
"loss": 0.4729324281215668,
|
| 1417 |
+
"step": 201
|
| 1418 |
+
},
|
| 1419 |
+
{
|
| 1420 |
+
"epoch": 1.4548736462093863,
|
| 1421 |
+
"grad_norm": 0.3427615463733673,
|
| 1422 |
+
"learning_rate": 0.000338635973233322,
|
| 1423 |
+
"loss": 0.38466876745224,
|
| 1424 |
+
"step": 202
|
| 1425 |
+
},
|
| 1426 |
+
{
|
| 1427 |
+
"epoch": 1.4620938628158844,
|
| 1428 |
+
"grad_norm": 0.29937732219696045,
|
| 1429 |
+
"learning_rate": 0.0003380428192326411,
|
| 1430 |
+
"loss": 0.24431845545768738,
|
| 1431 |
+
"step": 203
|
| 1432 |
+
},
|
| 1433 |
+
{
|
| 1434 |
+
"epoch": 1.4693140794223827,
|
| 1435 |
+
"grad_norm": 0.35563215613365173,
|
| 1436 |
+
"learning_rate": 0.00033744733719385253,
|
| 1437 |
+
"loss": 0.34825772047042847,
|
| 1438 |
+
"step": 204
|
| 1439 |
+
},
|
| 1440 |
+
{
|
| 1441 |
+
"epoch": 1.476534296028881,
|
| 1442 |
+
"grad_norm": 0.3395077586174011,
|
| 1443 |
+
"learning_rate": 0.0003368495371595279,
|
| 1444 |
+
"loss": 0.37704023718833923,
|
| 1445 |
+
"step": 205
|
| 1446 |
+
},
|
| 1447 |
+
{
|
| 1448 |
+
"epoch": 1.483754512635379,
|
| 1449 |
+
"grad_norm": 0.32358789443969727,
|
| 1450 |
+
"learning_rate": 0.0003362494292113308,
|
| 1451 |
+
"loss": 0.29866379499435425,
|
| 1452 |
+
"step": 206
|
| 1453 |
+
},
|
| 1454 |
+
{
|
| 1455 |
+
"epoch": 1.4909747292418771,
|
| 1456 |
+
"grad_norm": 0.44219517707824707,
|
| 1457 |
+
"learning_rate": 0.00033564702346984684,
|
| 1458 |
+
"loss": 0.5036117434501648,
|
| 1459 |
+
"step": 207
|
| 1460 |
+
},
|
| 1461 |
+
{
|
| 1462 |
+
"epoch": 1.4981949458483754,
|
| 1463 |
+
"grad_norm": 0.358549565076828,
|
| 1464 |
+
"learning_rate": 0.00033504233009441287,
|
| 1465 |
+
"loss": 0.42227745056152344,
|
| 1466 |
+
"step": 208
|
| 1467 |
+
},
|
| 1468 |
+
{
|
| 1469 |
+
"epoch": 1.5054151624548737,
|
| 1470 |
+
"grad_norm": 0.3784799575805664,
|
| 1471 |
+
"learning_rate": 0.0003344353592829461,
|
| 1472 |
+
"loss": 0.4267178773880005,
|
| 1473 |
+
"step": 209
|
| 1474 |
+
},
|
| 1475 |
+
{
|
| 1476 |
+
"epoch": 1.5126353790613718,
|
| 1477 |
+
"grad_norm": 0.3619599938392639,
|
| 1478 |
+
"learning_rate": 0.00033382612127177166,
|
| 1479 |
+
"loss": 0.4075395166873932,
|
| 1480 |
+
"step": 210
|
| 1481 |
+
},
|
| 1482 |
+
{
|
| 1483 |
+
"epoch": 1.5198555956678699,
|
| 1484 |
+
"grad_norm": 0.44484809041023254,
|
| 1485 |
+
"learning_rate": 0.0003332146263354501,
|
| 1486 |
+
"loss": 0.5016494989395142,
|
| 1487 |
+
"step": 211
|
| 1488 |
+
},
|
| 1489 |
+
{
|
| 1490 |
+
"epoch": 1.5270758122743682,
|
| 1491 |
+
"grad_norm": 0.34379443526268005,
|
| 1492 |
+
"learning_rate": 0.00033260088478660407,
|
| 1493 |
+
"loss": 0.317508339881897,
|
| 1494 |
+
"step": 212
|
| 1495 |
+
},
|
| 1496 |
+
{
|
| 1497 |
+
"epoch": 1.5342960288808665,
|
| 1498 |
+
"grad_norm": 0.4008065164089203,
|
| 1499 |
+
"learning_rate": 0.0003319849069757446,
|
| 1500 |
+
"loss": 0.3974913954734802,
|
| 1501 |
+
"step": 213
|
| 1502 |
+
},
|
| 1503 |
+
{
|
| 1504 |
+
"epoch": 1.5415162454873648,
|
| 1505 |
+
"grad_norm": 0.4006946384906769,
|
| 1506 |
+
"learning_rate": 0.00033136670329109624,
|
| 1507 |
+
"loss": 0.5162532925605774,
|
| 1508 |
+
"step": 214
|
| 1509 |
+
},
|
| 1510 |
+
{
|
| 1511 |
+
"epoch": 1.5487364620938628,
|
| 1512 |
+
"grad_norm": 0.32255908846855164,
|
| 1513 |
+
"learning_rate": 0.0003307462841584223,
|
| 1514 |
+
"loss": 0.37669965624809265,
|
| 1515 |
+
"step": 215
|
| 1516 |
+
},
|
| 1517 |
+
{
|
| 1518 |
+
"epoch": 1.555956678700361,
|
| 1519 |
+
"grad_norm": 0.7169090509414673,
|
| 1520 |
+
"learning_rate": 0.0003301236600408484,
|
| 1521 |
+
"loss": 0.4477896988391876,
|
| 1522 |
+
"step": 216
|
| 1523 |
+
},
|
| 1524 |
+
{
|
| 1525 |
+
"epoch": 1.5631768953068592,
|
| 1526 |
+
"grad_norm": 0.3694959580898285,
|
| 1527 |
+
"learning_rate": 0.00032949884143868675,
|
| 1528 |
+
"loss": 0.45744967460632324,
|
| 1529 |
+
"step": 217
|
| 1530 |
+
},
|
| 1531 |
+
{
|
| 1532 |
+
"epoch": 1.5703971119133575,
|
| 1533 |
+
"grad_norm": 0.3709769546985626,
|
| 1534 |
+
"learning_rate": 0.0003288718388892583,
|
| 1535 |
+
"loss": 0.4952532947063446,
|
| 1536 |
+
"step": 218
|
| 1537 |
+
},
|
| 1538 |
+
{
|
| 1539 |
+
"epoch": 1.5776173285198556,
|
| 1540 |
+
"grad_norm": 0.29159069061279297,
|
| 1541 |
+
"learning_rate": 0.00032824266296671567,
|
| 1542 |
+
"loss": 0.28994375467300415,
|
| 1543 |
+
"step": 219
|
| 1544 |
+
},
|
| 1545 |
+
{
|
| 1546 |
+
"epoch": 1.5848375451263537,
|
| 1547 |
+
"grad_norm": 0.3600374460220337,
|
| 1548 |
+
"learning_rate": 0.0003276113242818645,
|
| 1549 |
+
"loss": 0.43825557827949524,
|
| 1550 |
+
"step": 220
|
| 1551 |
+
},
|
| 1552 |
+
{
|
| 1553 |
+
"epoch": 1.592057761732852,
|
| 1554 |
+
"grad_norm": 0.2843645215034485,
|
| 1555 |
+
"learning_rate": 0.0003269778334819846,
|
| 1556 |
+
"loss": 0.32124435901641846,
|
| 1557 |
+
"step": 221
|
| 1558 |
+
},
|
| 1559 |
+
{
|
| 1560 |
+
"epoch": 1.5992779783393503,
|
| 1561 |
+
"grad_norm": 0.3688318431377411,
|
| 1562 |
+
"learning_rate": 0.0003263422012506502,
|
| 1563 |
+
"loss": 0.4742942750453949,
|
| 1564 |
+
"step": 222
|
| 1565 |
+
},
|
| 1566 |
+
{
|
| 1567 |
+
"epoch": 1.6064981949458483,
|
| 1568 |
+
"grad_norm": 0.3213002383708954,
|
| 1569 |
+
"learning_rate": 0.00032570443830755015,
|
| 1570 |
+
"loss": 0.42100387811660767,
|
| 1571 |
+
"step": 223
|
| 1572 |
+
},
|
| 1573 |
+
{
|
| 1574 |
+
"epoch": 1.6137184115523464,
|
| 1575 |
+
"grad_norm": 0.3240319490432739,
|
| 1576 |
+
"learning_rate": 0.0003250645554083068,
|
| 1577 |
+
"loss": 0.29403799772262573,
|
| 1578 |
+
"step": 224
|
| 1579 |
+
},
|
| 1580 |
+
{
|
| 1581 |
+
"epoch": 1.6209386281588447,
|
| 1582 |
+
"grad_norm": 0.3569975197315216,
|
| 1583 |
+
"learning_rate": 0.0003244225633442948,
|
| 1584 |
+
"loss": 0.4555712938308716,
|
| 1585 |
+
"step": 225
|
| 1586 |
+
},
|
| 1587 |
+
{
|
| 1588 |
+
"epoch": 1.628158844765343,
|
| 1589 |
+
"grad_norm": 0.43396008014678955,
|
| 1590 |
+
"learning_rate": 0.00032377847294245895,
|
| 1591 |
+
"loss": 0.4877527356147766,
|
| 1592 |
+
"step": 226
|
| 1593 |
+
},
|
| 1594 |
+
{
|
| 1595 |
+
"epoch": 1.6353790613718413,
|
| 1596 |
+
"grad_norm": 0.3694853186607361,
|
| 1597 |
+
"learning_rate": 0.0003231322950651316,
|
| 1598 |
+
"loss": 0.41299888491630554,
|
| 1599 |
+
"step": 227
|
| 1600 |
+
},
|
| 1601 |
+
{
|
| 1602 |
+
"epoch": 1.6425992779783394,
|
| 1603 |
+
"grad_norm": 0.3358525335788727,
|
| 1604 |
+
"learning_rate": 0.00032248404060985,
|
| 1605 |
+
"loss": 0.4551587998867035,
|
| 1606 |
+
"step": 228
|
| 1607 |
+
},
|
| 1608 |
+
{
|
| 1609 |
+
"epoch": 1.6498194945848375,
|
| 1610 |
+
"grad_norm": 0.38492903113365173,
|
| 1611 |
+
"learning_rate": 0.0003218337205091715,
|
| 1612 |
+
"loss": 0.4316423535346985,
|
| 1613 |
+
"step": 229
|
| 1614 |
+
},
|
| 1615 |
+
{
|
| 1616 |
+
"epoch": 1.6570397111913358,
|
| 1617 |
+
"grad_norm": 0.34664952754974365,
|
| 1618 |
+
"learning_rate": 0.0003211813457304902,
|
| 1619 |
+
"loss": 0.39314523339271545,
|
| 1620 |
+
"step": 230
|
| 1621 |
+
},
|
| 1622 |
+
{
|
| 1623 |
+
"epoch": 1.664259927797834,
|
| 1624 |
+
"grad_norm": 0.3254722058773041,
|
| 1625 |
+
"learning_rate": 0.00032052692727585133,
|
| 1626 |
+
"loss": 0.3327226936817169,
|
| 1627 |
+
"step": 231
|
| 1628 |
+
},
|
| 1629 |
+
{
|
| 1630 |
+
"epoch": 1.6714801444043321,
|
| 1631 |
+
"grad_norm": 0.4386709928512573,
|
| 1632 |
+
"learning_rate": 0.0003198704761817658,
|
| 1633 |
+
"loss": 0.4558185935020447,
|
| 1634 |
+
"step": 232
|
| 1635 |
+
},
|
| 1636 |
+
{
|
| 1637 |
+
"epoch": 1.6787003610108302,
|
| 1638 |
+
"grad_norm": 0.5447010397911072,
|
| 1639 |
+
"learning_rate": 0.00031921200351902446,
|
| 1640 |
+
"loss": 0.48867422342300415,
|
| 1641 |
+
"step": 233
|
| 1642 |
+
},
|
| 1643 |
+
{
|
| 1644 |
+
"epoch": 1.6859205776173285,
|
| 1645 |
+
"grad_norm": 0.2976516783237457,
|
| 1646 |
+
"learning_rate": 0.000318551520392511,
|
| 1647 |
+
"loss": 0.3376544117927551,
|
| 1648 |
+
"step": 234
|
| 1649 |
+
},
|
| 1650 |
+
{
|
| 1651 |
+
"epoch": 1.6931407942238268,
|
| 1652 |
+
"grad_norm": 0.3854595124721527,
|
| 1653 |
+
"learning_rate": 0.00031788903794101477,
|
| 1654 |
+
"loss": 0.45083147287368774,
|
| 1655 |
+
"step": 235
|
| 1656 |
+
},
|
| 1657 |
+
{
|
| 1658 |
+
"epoch": 1.7003610108303249,
|
| 1659 |
+
"grad_norm": 0.37051668763160706,
|
| 1660 |
+
"learning_rate": 0.00031722456733704297,
|
| 1661 |
+
"loss": 0.4483460485935211,
|
| 1662 |
+
"step": 236
|
| 1663 |
+
},
|
| 1664 |
+
{
|
| 1665 |
+
"epoch": 1.707581227436823,
|
| 1666 |
+
"grad_norm": 0.42628687620162964,
|
| 1667 |
+
"learning_rate": 0.0003165581197866322,
|
| 1668 |
+
"loss": 0.5173429250717163,
|
| 1669 |
+
"step": 237
|
| 1670 |
+
},
|
| 1671 |
+
{
|
| 1672 |
+
"epoch": 1.7148014440433212,
|
| 1673 |
+
"grad_norm": 0.44184717535972595,
|
| 1674 |
+
"learning_rate": 0.0003158897065291596,
|
| 1675 |
+
"loss": 0.45995786786079407,
|
| 1676 |
+
"step": 238
|
| 1677 |
+
},
|
| 1678 |
+
{
|
| 1679 |
+
"epoch": 1.7220216606498195,
|
| 1680 |
+
"grad_norm": 0.3687286376953125,
|
| 1681 |
+
"learning_rate": 0.00031521933883715293,
|
| 1682 |
+
"loss": 0.33321040868759155,
|
| 1683 |
+
"step": 239
|
| 1684 |
+
},
|
| 1685 |
+
{
|
| 1686 |
+
"epoch": 1.7292418772563178,
|
| 1687 |
+
"grad_norm": 0.3514050841331482,
|
| 1688 |
+
"learning_rate": 0.00031454702801610103,
|
| 1689 |
+
"loss": 0.3461155891418457,
|
| 1690 |
+
"step": 240
|
| 1691 |
+
},
|
| 1692 |
+
{
|
| 1693 |
+
"epoch": 1.736462093862816,
|
| 1694 |
+
"grad_norm": 0.4148181676864624,
|
| 1695 |
+
"learning_rate": 0.0003138727854042627,
|
| 1696 |
+
"loss": 0.4323638677597046,
|
| 1697 |
+
"step": 241
|
| 1698 |
+
},
|
| 1699 |
+
{
|
| 1700 |
+
"epoch": 1.743682310469314,
|
| 1701 |
+
"grad_norm": 0.44285446405410767,
|
| 1702 |
+
"learning_rate": 0.0003131966223724756,
|
| 1703 |
+
"loss": 0.4780181646347046,
|
| 1704 |
+
"step": 242
|
| 1705 |
+
},
|
| 1706 |
+
{
|
| 1707 |
+
"epoch": 1.7509025270758123,
|
| 1708 |
+
"grad_norm": 0.3196166157722473,
|
| 1709 |
+
"learning_rate": 0.00031251855032396464,
|
| 1710 |
+
"loss": 0.3380797505378723,
|
| 1711 |
+
"step": 243
|
| 1712 |
+
},
|
| 1713 |
+
{
|
| 1714 |
+
"epoch": 1.7581227436823106,
|
| 1715 |
+
"grad_norm": 0.48847395181655884,
|
| 1716 |
+
"learning_rate": 0.0003118385806941494,
|
| 1717 |
+
"loss": 0.4878506064414978,
|
| 1718 |
+
"step": 244
|
| 1719 |
+
},
|
| 1720 |
+
{
|
| 1721 |
+
"epoch": 1.7653429602888087,
|
| 1722 |
+
"grad_norm": 0.398876816034317,
|
| 1723 |
+
"learning_rate": 0.0003111567249504515,
|
| 1724 |
+
"loss": 0.4532281458377838,
|
| 1725 |
+
"step": 245
|
| 1726 |
+
},
|
| 1727 |
+
{
|
| 1728 |
+
"epoch": 1.7725631768953067,
|
| 1729 |
+
"grad_norm": 0.34218019247055054,
|
| 1730 |
+
"learning_rate": 0.0003104729945921012,
|
| 1731 |
+
"loss": 0.3738666772842407,
|
| 1732 |
+
"step": 246
|
| 1733 |
+
},
|
| 1734 |
+
{
|
| 1735 |
+
"epoch": 1.779783393501805,
|
| 1736 |
+
"grad_norm": 0.4071042835712433,
|
| 1737 |
+
"learning_rate": 0.0003097874011499433,
|
| 1738 |
+
"loss": 0.4437788724899292,
|
| 1739 |
+
"step": 247
|
| 1740 |
+
},
|
| 1741 |
+
{
|
| 1742 |
+
"epoch": 1.7870036101083033,
|
| 1743 |
+
"grad_norm": 0.35893604159355164,
|
| 1744 |
+
"learning_rate": 0.0003090999561862428,
|
| 1745 |
+
"loss": 0.35174691677093506,
|
| 1746 |
+
"step": 248
|
| 1747 |
+
},
|
| 1748 |
+
{
|
| 1749 |
+
"epoch": 1.7942238267148014,
|
| 1750 |
+
"grad_norm": 0.34495967626571655,
|
| 1751 |
+
"learning_rate": 0.0003084106712944899,
|
| 1752 |
+
"loss": 0.34072697162628174,
|
| 1753 |
+
"step": 249
|
| 1754 |
+
},
|
| 1755 |
+
{
|
| 1756 |
+
"epoch": 1.8014440433212995,
|
| 1757 |
+
"grad_norm": 0.4653945565223694,
|
| 1758 |
+
"learning_rate": 0.0003077195580992045,
|
| 1759 |
+
"loss": 0.45023709535598755,
|
| 1760 |
+
"step": 250
|
| 1761 |
+
},
|
| 1762 |
+
{
|
| 1763 |
+
"epoch": 1.8086642599277978,
|
| 1764 |
+
"grad_norm": 0.42124322056770325,
|
| 1765 |
+
"learning_rate": 0.0003070266282557401,
|
| 1766 |
+
"loss": 0.4846741557121277,
|
| 1767 |
+
"step": 251
|
| 1768 |
+
},
|
| 1769 |
+
{
|
| 1770 |
+
"epoch": 1.815884476534296,
|
| 1771 |
+
"grad_norm": 0.38208404183387756,
|
| 1772 |
+
"learning_rate": 0.0003063318934500872,
|
| 1773 |
+
"loss": 0.3900390565395355,
|
| 1774 |
+
"step": 252
|
| 1775 |
+
},
|
| 1776 |
+
{
|
| 1777 |
+
"epoch": 1.8231046931407944,
|
| 1778 |
+
"grad_norm": 0.3911641538143158,
|
| 1779 |
+
"learning_rate": 0.0003056353653986764,
|
| 1780 |
+
"loss": 0.3795917332172394,
|
| 1781 |
+
"step": 253
|
| 1782 |
+
},
|
| 1783 |
+
{
|
| 1784 |
+
"epoch": 1.8303249097472925,
|
| 1785 |
+
"grad_norm": 0.34185168147087097,
|
| 1786 |
+
"learning_rate": 0.00030493705584818065,
|
| 1787 |
+
"loss": 0.39876672625541687,
|
| 1788 |
+
"step": 254
|
| 1789 |
+
},
|
| 1790 |
+
{
|
| 1791 |
+
"epoch": 1.8375451263537905,
|
| 1792 |
+
"grad_norm": 0.4229717552661896,
|
| 1793 |
+
"learning_rate": 0.000304236976575317,
|
| 1794 |
+
"loss": 0.357430100440979,
|
| 1795 |
+
"step": 255
|
| 1796 |
+
},
|
| 1797 |
+
{
|
| 1798 |
+
"epoch": 1.8447653429602888,
|
| 1799 |
+
"grad_norm": 0.35156992077827454,
|
| 1800 |
+
"learning_rate": 0.0003035351393866485,
|
| 1801 |
+
"loss": 0.37869274616241455,
|
| 1802 |
+
"step": 256
|
| 1803 |
+
},
|
| 1804 |
+
{
|
| 1805 |
+
"epoch": 1.8519855595667871,
|
| 1806 |
+
"grad_norm": 0.3945099711418152,
|
| 1807 |
+
"learning_rate": 0.0003028315561183845,
|
| 1808 |
+
"loss": 0.45211949944496155,
|
| 1809 |
+
"step": 257
|
| 1810 |
+
},
|
| 1811 |
+
{
|
| 1812 |
+
"epoch": 1.8592057761732852,
|
| 1813 |
+
"grad_norm": 0.31473544239997864,
|
| 1814 |
+
"learning_rate": 0.0003021262386361814,
|
| 1815 |
+
"loss": 0.32624444365501404,
|
| 1816 |
+
"step": 258
|
| 1817 |
+
},
|
| 1818 |
+
{
|
| 1819 |
+
"epoch": 1.8664259927797833,
|
| 1820 |
+
"grad_norm": 0.4487520158290863,
|
| 1821 |
+
"learning_rate": 0.00030141919883494247,
|
| 1822 |
+
"loss": 0.48553428053855896,
|
| 1823 |
+
"step": 259
|
| 1824 |
+
},
|
| 1825 |
+
{
|
| 1826 |
+
"epoch": 1.8736462093862816,
|
| 1827 |
+
"grad_norm": 0.3847423791885376,
|
| 1828 |
+
"learning_rate": 0.00030071044863861713,
|
| 1829 |
+
"loss": 0.457511842250824,
|
| 1830 |
+
"step": 260
|
| 1831 |
+
},
|
| 1832 |
+
{
|
| 1833 |
+
"epoch": 1.8808664259927799,
|
| 1834 |
+
"grad_norm": 0.3822494447231293,
|
| 1835 |
+
"learning_rate": 0.00030000000000000003,
|
| 1836 |
+
"loss": 0.38700124621391296,
|
| 1837 |
+
"step": 261
|
| 1838 |
+
},
|
| 1839 |
+
{
|
| 1840 |
+
"epoch": 1.888086642599278,
|
| 1841 |
+
"grad_norm": 0.37934961915016174,
|
| 1842 |
+
"learning_rate": 0.0002992878649005293,
|
| 1843 |
+
"loss": 0.4150720238685608,
|
| 1844 |
+
"step": 262
|
| 1845 |
+
},
|
| 1846 |
+
{
|
| 1847 |
+
"epoch": 1.895306859205776,
|
| 1848 |
+
"grad_norm": 0.37126392126083374,
|
| 1849 |
+
"learning_rate": 0.00029857405535008467,
|
| 1850 |
+
"loss": 0.3389851450920105,
|
| 1851 |
+
"step": 263
|
| 1852 |
+
},
|
| 1853 |
+
{
|
| 1854 |
+
"epoch": 1.9025270758122743,
|
| 1855 |
+
"grad_norm": 0.3264472484588623,
|
| 1856 |
+
"learning_rate": 0.0002978585833867847,
|
| 1857 |
+
"loss": 0.327554315328598,
|
| 1858 |
+
"step": 264
|
| 1859 |
+
},
|
| 1860 |
+
{
|
| 1861 |
+
"epoch": 1.9097472924187726,
|
| 1862 |
+
"grad_norm": 0.3889877200126648,
|
| 1863 |
+
"learning_rate": 0.00029714146107678413,
|
| 1864 |
+
"loss": 0.4393918812274933,
|
| 1865 |
+
"step": 265
|
| 1866 |
+
},
|
| 1867 |
+
{
|
| 1868 |
+
"epoch": 1.916967509025271,
|
| 1869 |
+
"grad_norm": 0.4926806092262268,
|
| 1870 |
+
"learning_rate": 0.0002964227005140698,
|
| 1871 |
+
"loss": 0.5468560457229614,
|
| 1872 |
+
"step": 266
|
| 1873 |
+
},
|
| 1874 |
+
{
|
| 1875 |
+
"epoch": 1.924187725631769,
|
| 1876 |
+
"grad_norm": 0.4259951114654541,
|
| 1877 |
+
"learning_rate": 0.0002957023138202573,
|
| 1878 |
+
"loss": 0.39216533303260803,
|
| 1879 |
+
"step": 267
|
| 1880 |
+
},
|
| 1881 |
+
{
|
| 1882 |
+
"epoch": 1.931407942238267,
|
| 1883 |
+
"grad_norm": 0.39791861176490784,
|
| 1884 |
+
"learning_rate": 0.00029498031314438626,
|
| 1885 |
+
"loss": 0.37104716897010803,
|
| 1886 |
+
"step": 268
|
| 1887 |
+
},
|
| 1888 |
+
{
|
| 1889 |
+
"epoch": 1.9386281588447654,
|
| 1890 |
+
"grad_norm": 0.3682475686073303,
|
| 1891 |
+
"learning_rate": 0.0002942567106627155,
|
| 1892 |
+
"loss": 0.41986221075057983,
|
| 1893 |
+
"step": 269
|
| 1894 |
+
},
|
| 1895 |
+
{
|
| 1896 |
+
"epoch": 1.9458483754512637,
|
| 1897 |
+
"grad_norm": 0.3230769634246826,
|
| 1898 |
+
"learning_rate": 0.00029353151857851735,
|
| 1899 |
+
"loss": 0.35548532009124756,
|
| 1900 |
+
"step": 270
|
| 1901 |
+
},
|
| 1902 |
+
{
|
| 1903 |
+
"epoch": 1.9530685920577617,
|
| 1904 |
+
"grad_norm": 0.4607864320278168,
|
| 1905 |
+
"learning_rate": 0.0002928047491218727,
|
| 1906 |
+
"loss": 0.4246275722980499,
|
| 1907 |
+
"step": 271
|
| 1908 |
+
},
|
| 1909 |
+
{
|
| 1910 |
+
"epoch": 1.9602888086642598,
|
| 1911 |
+
"grad_norm": 0.4302678108215332,
|
| 1912 |
+
"learning_rate": 0.0002920764145494638,
|
| 1913 |
+
"loss": 0.42147913575172424,
|
| 1914 |
+
"step": 272
|
| 1915 |
+
},
|
| 1916 |
+
{
|
| 1917 |
+
"epoch": 1.967509025270758,
|
| 1918 |
+
"grad_norm": 0.36212071776390076,
|
| 1919 |
+
"learning_rate": 0.00029134652714436814,
|
| 1920 |
+
"loss": 0.4659682512283325,
|
| 1921 |
+
"step": 273
|
| 1922 |
+
},
|
| 1923 |
+
{
|
| 1924 |
+
"epoch": 1.9747292418772564,
|
| 1925 |
+
"grad_norm": 0.31535375118255615,
|
| 1926 |
+
"learning_rate": 0.00029061509921585107,
|
| 1927 |
+
"loss": 0.38229790329933167,
|
| 1928 |
+
"step": 274
|
| 1929 |
+
},
|
| 1930 |
+
{
|
| 1931 |
+
"epoch": 1.9819494584837545,
|
| 1932 |
+
"grad_norm": 0.3685518801212311,
|
| 1933 |
+
"learning_rate": 0.0002898821430991582,
|
| 1934 |
+
"loss": 0.46467846632003784,
|
| 1935 |
+
"step": 275
|
| 1936 |
+
},
|
| 1937 |
+
{
|
| 1938 |
+
"epoch": 1.9891696750902526,
|
| 1939 |
+
"grad_norm": 0.3998563885688782,
|
| 1940 |
+
"learning_rate": 0.0002891476711553077,
|
| 1941 |
+
"loss": 0.42970407009124756,
|
| 1942 |
+
"step": 276
|
| 1943 |
+
},
|
| 1944 |
+
{
|
| 1945 |
+
"epoch": 1.9963898916967509,
|
| 1946 |
+
"grad_norm": 0.35800614953041077,
|
| 1947 |
+
"learning_rate": 0.00028841169577088115,
|
| 1948 |
+
"loss": 0.4408795237541199,
|
| 1949 |
+
"step": 277
|
| 1950 |
+
},
|
| 1951 |
+
{
|
| 1952 |
+
"epoch": 2.0,
|
| 1953 |
+
"grad_norm": 0.5006654858589172,
|
| 1954 |
+
"learning_rate": 0.0002876742293578155,
|
| 1955 |
+
"loss": 0.38447684049606323,
|
| 1956 |
+
"step": 278
|
| 1957 |
+
},
|
| 1958 |
+
{
|
| 1959 |
+
"epoch": 2.0072202166064983,
|
| 1960 |
+
"grad_norm": 0.31330448389053345,
|
| 1961 |
+
"learning_rate": 0.00028693528435319305,
|
| 1962 |
+
"loss": 0.30373793840408325,
|
| 1963 |
+
"step": 279
|
| 1964 |
+
},
|
| 1965 |
+
{
|
| 1966 |
+
"epoch": 2.0144404332129966,
|
| 1967 |
+
"grad_norm": 0.29946643114089966,
|
| 1968 |
+
"learning_rate": 0.0002861948732190319,
|
| 1969 |
+
"loss": 0.26699960231781006,
|
| 1970 |
+
"step": 280
|
| 1971 |
+
},
|
| 1972 |
+
{
|
| 1973 |
+
"epoch": 2.0216606498194944,
|
| 1974 |
+
"grad_norm": 0.26591944694519043,
|
| 1975 |
+
"learning_rate": 0.0002854530084420762,
|
| 1976 |
+
"loss": 0.23807109892368317,
|
| 1977 |
+
"step": 281
|
| 1978 |
+
},
|
| 1979 |
+
{
|
| 1980 |
+
"epoch": 2.0288808664259927,
|
| 1981 |
+
"grad_norm": 0.34681931138038635,
|
| 1982 |
+
"learning_rate": 0.00028470970253358487,
|
| 1983 |
+
"loss": 0.32200539112091064,
|
| 1984 |
+
"step": 282
|
| 1985 |
+
},
|
| 1986 |
+
{
|
| 1987 |
+
"epoch": 2.036101083032491,
|
| 1988 |
+
"grad_norm": 0.3542478382587433,
|
| 1989 |
+
"learning_rate": 0.0002839649680291211,
|
| 1990 |
+
"loss": 0.3349723815917969,
|
| 1991 |
+
"step": 283
|
| 1992 |
+
},
|
| 1993 |
+
{
|
| 1994 |
+
"epoch": 2.0433212996389893,
|
| 1995 |
+
"grad_norm": 0.3007175624370575,
|
| 1996 |
+
"learning_rate": 0.0002832188174883408,
|
| 1997 |
+
"loss": 0.2172810435295105,
|
| 1998 |
+
"step": 284
|
| 1999 |
+
},
|
| 2000 |
+
{
|
| 2001 |
+
"epoch": 2.050541516245487,
|
| 2002 |
+
"grad_norm": 0.381719708442688,
|
| 2003 |
+
"learning_rate": 0.00028247126349478075,
|
| 2004 |
+
"loss": 0.3058876693248749,
|
| 2005 |
+
"step": 285
|
| 2006 |
+
},
|
| 2007 |
+
{
|
| 2008 |
+
"epoch": 2.0577617328519855,
|
| 2009 |
+
"grad_norm": 0.4056151211261749,
|
| 2010 |
+
"learning_rate": 0.0002817223186556463,
|
| 2011 |
+
"loss": 0.25402823090553284,
|
| 2012 |
+
"step": 286
|
| 2013 |
+
},
|
| 2014 |
+
{
|
| 2015 |
+
"epoch": 2.064981949458484,
|
| 2016 |
+
"grad_norm": 0.5069922804832458,
|
| 2017 |
+
"learning_rate": 0.00028097199560159913,
|
| 2018 |
+
"loss": 0.2375117838382721,
|
| 2019 |
+
"step": 287
|
| 2020 |
+
},
|
| 2021 |
+
{
|
| 2022 |
+
"epoch": 2.072202166064982,
|
| 2023 |
+
"grad_norm": 0.574663519859314,
|
| 2024 |
+
"learning_rate": 0.00028022030698654374,
|
| 2025 |
+
"loss": 0.3134710490703583,
|
| 2026 |
+
"step": 288
|
| 2027 |
+
},
|
| 2028 |
+
{
|
| 2029 |
+
"epoch": 2.07942238267148,
|
| 2030 |
+
"grad_norm": 0.5239531993865967,
|
| 2031 |
+
"learning_rate": 0.00027946726548741443,
|
| 2032 |
+
"loss": 0.20423674583435059,
|
| 2033 |
+
"step": 289
|
| 2034 |
+
},
|
| 2035 |
+
{
|
| 2036 |
+
"epoch": 2.0866425992779782,
|
| 2037 |
+
"grad_norm": 0.5845417976379395,
|
| 2038 |
+
"learning_rate": 0.0002787128838039612,
|
| 2039 |
+
"loss": 0.3297584354877472,
|
| 2040 |
+
"step": 290
|
| 2041 |
+
},
|
| 2042 |
+
{
|
| 2043 |
+
"epoch": 2.0938628158844765,
|
| 2044 |
+
"grad_norm": 0.47120949625968933,
|
| 2045 |
+
"learning_rate": 0.00027795717465853585,
|
| 2046 |
+
"loss": 0.32672739028930664,
|
| 2047 |
+
"step": 291
|
| 2048 |
+
},
|
| 2049 |
+
{
|
| 2050 |
+
"epoch": 2.101083032490975,
|
| 2051 |
+
"grad_norm": 0.40136632323265076,
|
| 2052 |
+
"learning_rate": 0.00027720015079587743,
|
| 2053 |
+
"loss": 0.23871661722660065,
|
| 2054 |
+
"step": 292
|
| 2055 |
+
},
|
| 2056 |
+
{
|
| 2057 |
+
"epoch": 2.108303249097473,
|
| 2058 |
+
"grad_norm": 0.5156406164169312,
|
| 2059 |
+
"learning_rate": 0.00027644182498289677,
|
| 2060 |
+
"loss": 0.23360338807106018,
|
| 2061 |
+
"step": 293
|
| 2062 |
+
},
|
| 2063 |
+
{
|
| 2064 |
+
"epoch": 2.115523465703971,
|
| 2065 |
+
"grad_norm": 0.4302510917186737,
|
| 2066 |
+
"learning_rate": 0.0002756822100084621,
|
| 2067 |
+
"loss": 0.31100887060165405,
|
| 2068 |
+
"step": 294
|
| 2069 |
+
},
|
| 2070 |
+
{
|
| 2071 |
+
"epoch": 2.1227436823104693,
|
| 2072 |
+
"grad_norm": 0.3673456609249115,
|
| 2073 |
+
"learning_rate": 0.00027492131868318246,
|
| 2074 |
+
"loss": 0.21802300214767456,
|
| 2075 |
+
"step": 295
|
| 2076 |
+
},
|
| 2077 |
+
{
|
| 2078 |
+
"epoch": 2.1299638989169676,
|
| 2079 |
+
"grad_norm": 0.32138535380363464,
|
| 2080 |
+
"learning_rate": 0.00027415916383919216,
|
| 2081 |
+
"loss": 0.19008119404315948,
|
| 2082 |
+
"step": 296
|
| 2083 |
+
},
|
| 2084 |
+
{
|
| 2085 |
+
"epoch": 2.137184115523466,
|
| 2086 |
+
"grad_norm": 0.3203730285167694,
|
| 2087 |
+
"learning_rate": 0.00027339575832993444,
|
| 2088 |
+
"loss": 0.1889929622411728,
|
| 2089 |
+
"step": 297
|
| 2090 |
+
},
|
| 2091 |
+
{
|
| 2092 |
+
"epoch": 2.1444043321299637,
|
| 2093 |
+
"grad_norm": 0.4612288773059845,
|
| 2094 |
+
"learning_rate": 0.0002726311150299443,
|
| 2095 |
+
"loss": 0.22323200106620789,
|
| 2096 |
+
"step": 298
|
| 2097 |
+
},
|
| 2098 |
+
{
|
| 2099 |
+
"epoch": 2.151624548736462,
|
| 2100 |
+
"grad_norm": 0.36709311604499817,
|
| 2101 |
+
"learning_rate": 0.00027186524683463155,
|
| 2102 |
+
"loss": 0.20466932654380798,
|
| 2103 |
+
"step": 299
|
| 2104 |
+
},
|
| 2105 |
+
{
|
| 2106 |
+
"epoch": 2.1588447653429603,
|
| 2107 |
+
"grad_norm": 0.4253864586353302,
|
| 2108 |
+
"learning_rate": 0.0002710981666600636,
|
| 2109 |
+
"loss": 0.2431459128856659,
|
| 2110 |
+
"step": 300
|
| 2111 |
+
},
|
| 2112 |
+
{
|
| 2113 |
+
"epoch": 2.1660649819494586,
|
| 2114 |
+
"grad_norm": 0.4018993675708771,
|
| 2115 |
+
"learning_rate": 0.00027032988744274736,
|
| 2116 |
+
"loss": 0.2751820385456085,
|
| 2117 |
+
"step": 301
|
| 2118 |
+
},
|
| 2119 |
+
{
|
| 2120 |
+
"epoch": 2.1732851985559565,
|
| 2121 |
+
"grad_norm": 0.4428861737251282,
|
| 2122 |
+
"learning_rate": 0.000269560422139411,
|
| 2123 |
+
"loss": 0.269814133644104,
|
| 2124 |
+
"step": 302
|
| 2125 |
+
},
|
| 2126 |
+
{
|
| 2127 |
+
"epoch": 2.1805054151624548,
|
| 2128 |
+
"grad_norm": 0.47122061252593994,
|
| 2129 |
+
"learning_rate": 0.00026878978372678564,
|
| 2130 |
+
"loss": 0.22829411923885345,
|
| 2131 |
+
"step": 303
|
| 2132 |
+
},
|
| 2133 |
+
{
|
| 2134 |
+
"epoch": 2.187725631768953,
|
| 2135 |
+
"grad_norm": 0.4426339268684387,
|
| 2136 |
+
"learning_rate": 0.00026801798520138646,
|
| 2137 |
+
"loss": 0.2637779414653778,
|
| 2138 |
+
"step": 304
|
| 2139 |
+
},
|
| 2140 |
+
{
|
| 2141 |
+
"epoch": 2.1949458483754514,
|
| 2142 |
+
"grad_norm": 0.4073690176010132,
|
| 2143 |
+
"learning_rate": 0.0002672450395792935,
|
| 2144 |
+
"loss": 0.1904142051935196,
|
| 2145 |
+
"step": 305
|
| 2146 |
+
},
|
| 2147 |
+
{
|
| 2148 |
+
"epoch": 2.2021660649819497,
|
| 2149 |
+
"grad_norm": 0.4896828234195709,
|
| 2150 |
+
"learning_rate": 0.00026647095989593193,
|
| 2151 |
+
"loss": 0.34650635719299316,
|
| 2152 |
+
"step": 306
|
| 2153 |
+
},
|
| 2154 |
+
{
|
| 2155 |
+
"epoch": 2.2093862815884475,
|
| 2156 |
+
"grad_norm": 0.48900970816612244,
|
| 2157 |
+
"learning_rate": 0.0002656957592058528,
|
| 2158 |
+
"loss": 0.2542106807231903,
|
| 2159 |
+
"step": 307
|
| 2160 |
+
},
|
| 2161 |
+
{
|
| 2162 |
+
"epoch": 2.216606498194946,
|
| 2163 |
+
"grad_norm": 0.4600171446800232,
|
| 2164 |
+
"learning_rate": 0.0002649194505825121,
|
| 2165 |
+
"loss": 0.21008341014385223,
|
| 2166 |
+
"step": 308
|
| 2167 |
+
},
|
| 2168 |
+
{
|
| 2169 |
+
"epoch": 2.223826714801444,
|
| 2170 |
+
"grad_norm": 0.43380653858184814,
|
| 2171 |
+
"learning_rate": 0.00026414204711805103,
|
| 2172 |
+
"loss": 0.2683791518211365,
|
| 2173 |
+
"step": 309
|
| 2174 |
+
},
|
| 2175 |
+
{
|
| 2176 |
+
"epoch": 2.2310469314079424,
|
| 2177 |
+
"grad_norm": 0.5792773365974426,
|
| 2178 |
+
"learning_rate": 0.0002633635619230746,
|
| 2179 |
+
"loss": 0.33160915970802307,
|
| 2180 |
+
"step": 310
|
| 2181 |
+
},
|
| 2182 |
+
{
|
| 2183 |
+
"epoch": 2.2382671480144403,
|
| 2184 |
+
"grad_norm": 0.5626965165138245,
|
| 2185 |
+
"learning_rate": 0.0002625840081264309,
|
| 2186 |
+
"loss": 0.26700398325920105,
|
| 2187 |
+
"step": 311
|
| 2188 |
+
},
|
| 2189 |
+
{
|
| 2190 |
+
"epoch": 2.2454873646209386,
|
| 2191 |
+
"grad_norm": 0.4952887296676636,
|
| 2192 |
+
"learning_rate": 0.00026180339887498953,
|
| 2193 |
+
"loss": 0.2689879536628723,
|
| 2194 |
+
"step": 312
|
| 2195 |
+
},
|
| 2196 |
+
{
|
| 2197 |
+
"epoch": 2.252707581227437,
|
| 2198 |
+
"grad_norm": 0.4501405656337738,
|
| 2199 |
+
"learning_rate": 0.0002610217473334199,
|
| 2200 |
+
"loss": 0.26021096110343933,
|
| 2201 |
+
"step": 313
|
| 2202 |
+
},
|
| 2203 |
+
{
|
| 2204 |
+
"epoch": 2.259927797833935,
|
| 2205 |
+
"grad_norm": 0.36552777886390686,
|
| 2206 |
+
"learning_rate": 0.00026023906668396933,
|
| 2207 |
+
"loss": 0.26156651973724365,
|
| 2208 |
+
"step": 314
|
| 2209 |
+
},
|
| 2210 |
+
{
|
| 2211 |
+
"epoch": 2.2671480144404335,
|
| 2212 |
+
"grad_norm": 0.3733731806278229,
|
| 2213 |
+
"learning_rate": 0.00025945537012624054,
|
| 2214 |
+
"loss": 0.21406950056552887,
|
| 2215 |
+
"step": 315
|
| 2216 |
+
},
|
| 2217 |
+
{
|
| 2218 |
+
"epoch": 2.2743682310469313,
|
| 2219 |
+
"grad_norm": 0.4240867495536804,
|
| 2220 |
+
"learning_rate": 0.00025867067087696923,
|
| 2221 |
+
"loss": 0.32105109095573425,
|
| 2222 |
+
"step": 316
|
| 2223 |
+
},
|
| 2224 |
+
{
|
| 2225 |
+
"epoch": 2.2815884476534296,
|
| 2226 |
+
"grad_norm": 0.4198870360851288,
|
| 2227 |
+
"learning_rate": 0.000257884982169801,
|
| 2228 |
+
"loss": 0.3047807216644287,
|
| 2229 |
+
"step": 317
|
| 2230 |
+
},
|
| 2231 |
+
{
|
| 2232 |
+
"epoch": 2.288808664259928,
|
| 2233 |
+
"grad_norm": 0.4444144666194916,
|
| 2234 |
+
"learning_rate": 0.00025709831725506845,
|
| 2235 |
+
"loss": 0.23268437385559082,
|
| 2236 |
+
"step": 318
|
| 2237 |
+
},
|
| 2238 |
+
{
|
| 2239 |
+
"epoch": 2.2960288808664258,
|
| 2240 |
+
"grad_norm": 0.41258376836776733,
|
| 2241 |
+
"learning_rate": 0.00025631068939956726,
|
| 2242 |
+
"loss": 0.26838576793670654,
|
| 2243 |
+
"step": 319
|
| 2244 |
+
},
|
| 2245 |
+
{
|
| 2246 |
+
"epoch": 2.303249097472924,
|
| 2247 |
+
"grad_norm": 0.5179259777069092,
|
| 2248 |
+
"learning_rate": 0.00025552211188633293,
|
| 2249 |
+
"loss": 0.2882261574268341,
|
| 2250 |
+
"step": 320
|
| 2251 |
+
},
|
| 2252 |
+
{
|
| 2253 |
+
"epoch": 2.3104693140794224,
|
| 2254 |
+
"grad_norm": 0.4838998019695282,
|
| 2255 |
+
"learning_rate": 0.0002547325980144166,
|
| 2256 |
+
"loss": 0.30366814136505127,
|
| 2257 |
+
"step": 321
|
| 2258 |
+
},
|
| 2259 |
+
{
|
| 2260 |
+
"epoch": 2.3176895306859207,
|
| 2261 |
+
"grad_norm": 0.4862940311431885,
|
| 2262 |
+
"learning_rate": 0.0002539421610986605,
|
| 2263 |
+
"loss": 0.29283270239830017,
|
| 2264 |
+
"step": 322
|
| 2265 |
+
},
|
| 2266 |
+
{
|
| 2267 |
+
"epoch": 2.324909747292419,
|
| 2268 |
+
"grad_norm": 0.441685289144516,
|
| 2269 |
+
"learning_rate": 0.000253150814469474,
|
| 2270 |
+
"loss": 0.22393643856048584,
|
| 2271 |
+
"step": 323
|
| 2272 |
+
},
|
| 2273 |
+
{
|
| 2274 |
+
"epoch": 2.332129963898917,
|
| 2275 |
+
"grad_norm": 0.39844486117362976,
|
| 2276 |
+
"learning_rate": 0.0002523585714726081,
|
| 2277 |
+
"loss": 0.17744283378124237,
|
| 2278 |
+
"step": 324
|
| 2279 |
+
},
|
| 2280 |
+
{
|
| 2281 |
+
"epoch": 2.339350180505415,
|
| 2282 |
+
"grad_norm": 0.4977899491786957,
|
| 2283 |
+
"learning_rate": 0.0002515654454689307,
|
| 2284 |
+
"loss": 0.24069495499134064,
|
| 2285 |
+
"step": 325
|
| 2286 |
+
},
|
| 2287 |
+
{
|
| 2288 |
+
"epoch": 2.3465703971119134,
|
| 2289 |
+
"grad_norm": 0.4101859927177429,
|
| 2290 |
+
"learning_rate": 0.0002507714498342016,
|
| 2291 |
+
"loss": 0.25044453144073486,
|
| 2292 |
+
"step": 326
|
| 2293 |
+
},
|
| 2294 |
+
{
|
| 2295 |
+
"epoch": 2.3537906137184117,
|
| 2296 |
+
"grad_norm": 0.3521929085254669,
|
| 2297 |
+
"learning_rate": 0.0002499765979588462,
|
| 2298 |
+
"loss": 0.20651675760746002,
|
| 2299 |
+
"step": 327
|
| 2300 |
+
},
|
| 2301 |
+
{
|
| 2302 |
+
"epoch": 2.3610108303249095,
|
| 2303 |
+
"grad_norm": 0.5269883871078491,
|
| 2304 |
+
"learning_rate": 0.00024918090324773024,
|
| 2305 |
+
"loss": 0.301647424697876,
|
| 2306 |
+
"step": 328
|
| 2307 |
+
},
|
| 2308 |
+
{
|
| 2309 |
+
"epoch": 2.368231046931408,
|
| 2310 |
+
"grad_norm": 0.47672051191329956,
|
| 2311 |
+
"learning_rate": 0.0002483843791199335,
|
| 2312 |
+
"loss": 0.23506474494934082,
|
| 2313 |
+
"step": 329
|
| 2314 |
+
},
|
| 2315 |
+
{
|
| 2316 |
+
"epoch": 2.375451263537906,
|
| 2317 |
+
"grad_norm": 0.5546545386314392,
|
| 2318 |
+
"learning_rate": 0.00024758703900852375,
|
| 2319 |
+
"loss": 0.3066970705986023,
|
| 2320 |
+
"step": 330
|
| 2321 |
+
},
|
| 2322 |
+
{
|
| 2323 |
+
"epoch": 2.3826714801444044,
|
| 2324 |
+
"grad_norm": 0.3792511820793152,
|
| 2325 |
+
"learning_rate": 0.0002467888963603298,
|
| 2326 |
+
"loss": 0.20687991380691528,
|
| 2327 |
+
"step": 331
|
| 2328 |
+
},
|
| 2329 |
+
{
|
| 2330 |
+
"epoch": 2.3898916967509027,
|
| 2331 |
+
"grad_norm": 0.4949963092803955,
|
| 2332 |
+
"learning_rate": 0.00024598996463571474,
|
| 2333 |
+
"loss": 0.2865826189517975,
|
| 2334 |
+
"step": 332
|
| 2335 |
+
},
|
| 2336 |
+
{
|
| 2337 |
+
"epoch": 2.3971119133574006,
|
| 2338 |
+
"grad_norm": 0.4250241219997406,
|
| 2339 |
+
"learning_rate": 0.00024519025730834954,
|
| 2340 |
+
"loss": 0.25499409437179565,
|
| 2341 |
+
"step": 333
|
| 2342 |
+
},
|
| 2343 |
+
{
|
| 2344 |
+
"epoch": 2.404332129963899,
|
| 2345 |
+
"grad_norm": 0.30932316184043884,
|
| 2346 |
+
"learning_rate": 0.00024438978786498524,
|
| 2347 |
+
"loss": 0.18888786435127258,
|
| 2348 |
+
"step": 334
|
| 2349 |
+
},
|
| 2350 |
+
{
|
| 2351 |
+
"epoch": 2.411552346570397,
|
| 2352 |
+
"grad_norm": 0.5183025002479553,
|
| 2353 |
+
"learning_rate": 0.00024358856980522556,
|
| 2354 |
+
"loss": 0.2950358986854553,
|
| 2355 |
+
"step": 335
|
| 2356 |
+
},
|
| 2357 |
+
{
|
| 2358 |
+
"epoch": 2.4187725631768955,
|
| 2359 |
+
"grad_norm": 0.46398693323135376,
|
| 2360 |
+
"learning_rate": 0.00024278661664129948,
|
| 2361 |
+
"loss": 0.28177422285079956,
|
| 2362 |
+
"step": 336
|
| 2363 |
+
},
|
| 2364 |
+
{
|
| 2365 |
+
"epoch": 2.4259927797833933,
|
| 2366 |
+
"grad_norm": 0.4938473701477051,
|
| 2367 |
+
"learning_rate": 0.00024198394189783317,
|
| 2368 |
+
"loss": 0.31616371870040894,
|
| 2369 |
+
"step": 337
|
| 2370 |
+
},
|
| 2371 |
+
{
|
| 2372 |
+
"epoch": 2.4332129963898916,
|
| 2373 |
+
"grad_norm": 0.4439496099948883,
|
| 2374 |
+
"learning_rate": 0.00024118055911162198,
|
| 2375 |
+
"loss": 0.2702808380126953,
|
| 2376 |
+
"step": 338
|
| 2377 |
+
},
|
| 2378 |
+
{
|
| 2379 |
+
"epoch": 2.44043321299639,
|
| 2380 |
+
"grad_norm": 0.45705899596214294,
|
| 2381 |
+
"learning_rate": 0.00024037648183140205,
|
| 2382 |
+
"loss": 0.33506399393081665,
|
| 2383 |
+
"step": 339
|
| 2384 |
+
},
|
| 2385 |
+
{
|
| 2386 |
+
"epoch": 2.4476534296028882,
|
| 2387 |
+
"grad_norm": 0.4123782217502594,
|
| 2388 |
+
"learning_rate": 0.00023957172361762199,
|
| 2389 |
+
"loss": 0.2569669783115387,
|
| 2390 |
+
"step": 340
|
| 2391 |
+
},
|
| 2392 |
+
{
|
| 2393 |
+
"epoch": 2.4548736462093865,
|
| 2394 |
+
"grad_norm": 0.5178057551383972,
|
| 2395 |
+
"learning_rate": 0.00023876629804221402,
|
| 2396 |
+
"loss": 0.2357858568429947,
|
| 2397 |
+
"step": 341
|
| 2398 |
+
},
|
| 2399 |
+
{
|
| 2400 |
+
"epoch": 2.4620938628158844,
|
| 2401 |
+
"grad_norm": 0.5206875205039978,
|
| 2402 |
+
"learning_rate": 0.0002379602186883652,
|
| 2403 |
+
"loss": 0.30847087502479553,
|
| 2404 |
+
"step": 342
|
| 2405 |
+
},
|
| 2406 |
+
{
|
| 2407 |
+
"epoch": 2.4693140794223827,
|
| 2408 |
+
"grad_norm": 0.4264805018901825,
|
| 2409 |
+
"learning_rate": 0.00023715349915028823,
|
| 2410 |
+
"loss": 0.27529531717300415,
|
| 2411 |
+
"step": 343
|
| 2412 |
+
},
|
| 2413 |
+
{
|
| 2414 |
+
"epoch": 2.476534296028881,
|
| 2415 |
+
"grad_norm": 0.5162002444267273,
|
| 2416 |
+
"learning_rate": 0.00023634615303299233,
|
| 2417 |
+
"loss": 0.3068305253982544,
|
| 2418 |
+
"step": 344
|
| 2419 |
+
},
|
| 2420 |
+
{
|
| 2421 |
+
"epoch": 2.483754512635379,
|
| 2422 |
+
"grad_norm": 0.45099541544914246,
|
| 2423 |
+
"learning_rate": 0.00023553819395205378,
|
| 2424 |
+
"loss": 0.2681335508823395,
|
| 2425 |
+
"step": 345
|
| 2426 |
+
},
|
| 2427 |
+
{
|
| 2428 |
+
"epoch": 2.490974729241877,
|
| 2429 |
+
"grad_norm": 0.49566006660461426,
|
| 2430 |
+
"learning_rate": 0.00023472963553338613,
|
| 2431 |
+
"loss": 0.2626950144767761,
|
| 2432 |
+
"step": 346
|
| 2433 |
+
},
|
| 2434 |
+
{
|
| 2435 |
+
"epoch": 2.4981949458483754,
|
| 2436 |
+
"grad_norm": 0.4181882441043854,
|
| 2437 |
+
"learning_rate": 0.00023392049141301055,
|
| 2438 |
+
"loss": 0.2935839891433716,
|
| 2439 |
+
"step": 347
|
| 2440 |
+
},
|
| 2441 |
+
{
|
| 2442 |
+
"epoch": 2.5054151624548737,
|
| 2443 |
+
"grad_norm": 0.4298352897167206,
|
| 2444 |
+
"learning_rate": 0.000233110775236826,
|
| 2445 |
+
"loss": 0.2565048038959503,
|
| 2446 |
+
"step": 348
|
| 2447 |
+
},
|
| 2448 |
+
{
|
| 2449 |
+
"epoch": 2.512635379061372,
|
| 2450 |
+
"grad_norm": 0.46044519543647766,
|
| 2451 |
+
"learning_rate": 0.00023230050066037872,
|
| 2452 |
+
"loss": 0.2740374207496643,
|
| 2453 |
+
"step": 349
|
| 2454 |
+
},
|
| 2455 |
+
{
|
| 2456 |
+
"epoch": 2.51985559566787,
|
| 2457 |
+
"grad_norm": 0.3774242401123047,
|
| 2458 |
+
"learning_rate": 0.00023148968134863233,
|
| 2459 |
+
"loss": 0.23688335716724396,
|
| 2460 |
+
"step": 350
|
| 2461 |
+
},
|
| 2462 |
+
{
|
| 2463 |
+
"epoch": 2.527075812274368,
|
| 2464 |
+
"grad_norm": 0.4179275631904602,
|
| 2465 |
+
"learning_rate": 0.00023067833097573714,
|
| 2466 |
+
"loss": 0.2116960883140564,
|
| 2467 |
+
"step": 351
|
| 2468 |
+
},
|
| 2469 |
+
{
|
| 2470 |
+
"epoch": 2.5342960288808665,
|
| 2471 |
+
"grad_norm": 0.5179049968719482,
|
| 2472 |
+
"learning_rate": 0.0002298664632247994,
|
| 2473 |
+
"loss": 0.2446313500404358,
|
| 2474 |
+
"step": 352
|
| 2475 |
+
},
|
| 2476 |
+
{
|
| 2477 |
+
"epoch": 2.5415162454873648,
|
| 2478 |
+
"grad_norm": 0.44997915625572205,
|
| 2479 |
+
"learning_rate": 0.000229054091787651,
|
| 2480 |
+
"loss": 0.3158394694328308,
|
| 2481 |
+
"step": 353
|
| 2482 |
+
},
|
| 2483 |
+
{
|
| 2484 |
+
"epoch": 2.5487364620938626,
|
| 2485 |
+
"grad_norm": 0.41355574131011963,
|
| 2486 |
+
"learning_rate": 0.0002282412303646183,
|
| 2487 |
+
"loss": 0.2720823884010315,
|
| 2488 |
+
"step": 354
|
| 2489 |
+
},
|
| 2490 |
+
{
|
| 2491 |
+
"epoch": 2.555956678700361,
|
| 2492 |
+
"grad_norm": 0.36182165145874023,
|
| 2493 |
+
"learning_rate": 0.00022742789266429095,
|
| 2494 |
+
"loss": 0.22511911392211914,
|
| 2495 |
+
"step": 355
|
| 2496 |
+
},
|
| 2497 |
+
{
|
| 2498 |
+
"epoch": 2.563176895306859,
|
| 2499 |
+
"grad_norm": 0.43841102719306946,
|
| 2500 |
+
"learning_rate": 0.00022661409240329076,
|
| 2501 |
+
"loss": 0.21212677657604218,
|
| 2502 |
+
"step": 356
|
| 2503 |
+
},
|
| 2504 |
+
{
|
| 2505 |
+
"epoch": 2.5703971119133575,
|
| 2506 |
+
"grad_norm": 0.4933500289916992,
|
| 2507 |
+
"learning_rate": 0.0002257998433060407,
|
| 2508 |
+
"loss": 0.3581770956516266,
|
| 2509 |
+
"step": 357
|
| 2510 |
+
},
|
| 2511 |
+
{
|
| 2512 |
+
"epoch": 2.577617328519856,
|
| 2513 |
+
"grad_norm": 0.4325965344905853,
|
| 2514 |
+
"learning_rate": 0.00022498515910453296,
|
| 2515 |
+
"loss": 0.3252311646938324,
|
| 2516 |
+
"step": 358
|
| 2517 |
+
},
|
| 2518 |
+
{
|
| 2519 |
+
"epoch": 2.5848375451263537,
|
| 2520 |
+
"grad_norm": 0.45968931913375854,
|
| 2521 |
+
"learning_rate": 0.00022417005353809772,
|
| 2522 |
+
"loss": 0.3097744286060333,
|
| 2523 |
+
"step": 359
|
| 2524 |
+
},
|
| 2525 |
+
{
|
| 2526 |
+
"epoch": 2.592057761732852,
|
| 2527 |
+
"grad_norm": 0.43083667755126953,
|
| 2528 |
+
"learning_rate": 0.00022335454035317124,
|
| 2529 |
+
"loss": 0.25429341197013855,
|
| 2530 |
+
"step": 360
|
| 2531 |
+
},
|
| 2532 |
+
{
|
| 2533 |
+
"epoch": 2.5992779783393503,
|
| 2534 |
+
"grad_norm": 0.4504421353340149,
|
| 2535 |
+
"learning_rate": 0.00022253863330306425,
|
| 2536 |
+
"loss": 0.315784215927124,
|
| 2537 |
+
"step": 361
|
| 2538 |
+
},
|
| 2539 |
+
{
|
| 2540 |
+
"epoch": 2.606498194945848,
|
| 2541 |
+
"grad_norm": 0.44943565130233765,
|
| 2542 |
+
"learning_rate": 0.0002217223461477296,
|
| 2543 |
+
"loss": 0.22878926992416382,
|
| 2544 |
+
"step": 362
|
| 2545 |
+
},
|
| 2546 |
+
{
|
| 2547 |
+
"epoch": 2.6137184115523464,
|
| 2548 |
+
"grad_norm": 0.4279639720916748,
|
| 2549 |
+
"learning_rate": 0.00022090569265353072,
|
| 2550 |
+
"loss": 0.2623154819011688,
|
| 2551 |
+
"step": 363
|
| 2552 |
+
},
|
| 2553 |
+
{
|
| 2554 |
+
"epoch": 2.6209386281588447,
|
| 2555 |
+
"grad_norm": 0.4907088279724121,
|
| 2556 |
+
"learning_rate": 0.00022008868659300905,
|
| 2557 |
+
"loss": 0.317205548286438,
|
| 2558 |
+
"step": 364
|
| 2559 |
+
},
|
| 2560 |
+
{
|
| 2561 |
+
"epoch": 2.628158844765343,
|
| 2562 |
+
"grad_norm": 0.49302950501441956,
|
| 2563 |
+
"learning_rate": 0.000219271341744652,
|
| 2564 |
+
"loss": 0.30752891302108765,
|
| 2565 |
+
"step": 365
|
| 2566 |
+
},
|
| 2567 |
+
{
|
| 2568 |
+
"epoch": 2.6353790613718413,
|
| 2569 |
+
"grad_norm": 0.38831761479377747,
|
| 2570 |
+
"learning_rate": 0.00021845367189266042,
|
| 2571 |
+
"loss": 0.27115532755851746,
|
| 2572 |
+
"step": 366
|
| 2573 |
+
},
|
| 2574 |
+
{
|
| 2575 |
+
"epoch": 2.6425992779783396,
|
| 2576 |
+
"grad_norm": 0.47725188732147217,
|
| 2577 |
+
"learning_rate": 0.00021763569082671635,
|
| 2578 |
+
"loss": 0.20296484231948853,
|
| 2579 |
+
"step": 367
|
| 2580 |
+
},
|
| 2581 |
+
{
|
| 2582 |
+
"epoch": 2.6498194945848375,
|
| 2583 |
+
"grad_norm": 0.4198381006717682,
|
| 2584 |
+
"learning_rate": 0.00021681741234175027,
|
| 2585 |
+
"loss": 0.22836127877235413,
|
| 2586 |
+
"step": 368
|
| 2587 |
+
},
|
| 2588 |
+
{
|
| 2589 |
+
"epoch": 2.6570397111913358,
|
| 2590 |
+
"grad_norm": 0.5218875408172607,
|
| 2591 |
+
"learning_rate": 0.00021599885023770835,
|
| 2592 |
+
"loss": 0.29816269874572754,
|
| 2593 |
+
"step": 369
|
| 2594 |
+
},
|
| 2595 |
+
{
|
| 2596 |
+
"epoch": 2.664259927797834,
|
| 2597 |
+
"grad_norm": 0.4321244955062866,
|
| 2598 |
+
"learning_rate": 0.00021518001831932022,
|
| 2599 |
+
"loss": 0.21631377935409546,
|
| 2600 |
+
"step": 370
|
| 2601 |
+
},
|
| 2602 |
+
{
|
| 2603 |
+
"epoch": 2.671480144404332,
|
| 2604 |
+
"grad_norm": 0.4036301374435425,
|
| 2605 |
+
"learning_rate": 0.00021436093039586552,
|
| 2606 |
+
"loss": 0.19903570413589478,
|
| 2607 |
+
"step": 371
|
| 2608 |
+
},
|
| 2609 |
+
{
|
| 2610 |
+
"epoch": 2.67870036101083,
|
| 2611 |
+
"grad_norm": 0.543828010559082,
|
| 2612 |
+
"learning_rate": 0.00021354160028094153,
|
| 2613 |
+
"loss": 0.2922933101654053,
|
| 2614 |
+
"step": 372
|
| 2615 |
+
},
|
| 2616 |
+
{
|
| 2617 |
+
"epoch": 2.6859205776173285,
|
| 2618 |
+
"grad_norm": 0.5146738290786743,
|
| 2619 |
+
"learning_rate": 0.00021272204179222982,
|
| 2620 |
+
"loss": 0.2749359607696533,
|
| 2621 |
+
"step": 373
|
| 2622 |
+
},
|
| 2623 |
+
{
|
| 2624 |
+
"epoch": 2.693140794223827,
|
| 2625 |
+
"grad_norm": 0.47690504789352417,
|
| 2626 |
+
"learning_rate": 0.00021190226875126352,
|
| 2627 |
+
"loss": 0.296896755695343,
|
| 2628 |
+
"step": 374
|
| 2629 |
+
},
|
| 2630 |
+
{
|
| 2631 |
+
"epoch": 2.700361010830325,
|
| 2632 |
+
"grad_norm": 0.545520007610321,
|
| 2633 |
+
"learning_rate": 0.000211082294983194,
|
| 2634 |
+
"loss": 0.27578210830688477,
|
| 2635 |
+
"step": 375
|
| 2636 |
+
},
|
| 2637 |
+
{
|
| 2638 |
+
"epoch": 2.707581227436823,
|
| 2639 |
+
"grad_norm": 0.42757925391197205,
|
| 2640 |
+
"learning_rate": 0.00021026213431655792,
|
| 2641 |
+
"loss": 0.2315436154603958,
|
| 2642 |
+
"step": 376
|
| 2643 |
+
},
|
| 2644 |
+
{
|
| 2645 |
+
"epoch": 2.7148014440433212,
|
| 2646 |
+
"grad_norm": 0.5044121146202087,
|
| 2647 |
+
"learning_rate": 0.0002094418005830439,
|
| 2648 |
+
"loss": 0.34600791335105896,
|
| 2649 |
+
"step": 377
|
| 2650 |
+
},
|
| 2651 |
+
{
|
| 2652 |
+
"epoch": 2.7220216606498195,
|
| 2653 |
+
"grad_norm": 0.5155430436134338,
|
| 2654 |
+
"learning_rate": 0.00020862130761725917,
|
| 2655 |
+
"loss": 0.3247469663619995,
|
| 2656 |
+
"step": 378
|
| 2657 |
+
},
|
| 2658 |
+
{
|
| 2659 |
+
"epoch": 2.729241877256318,
|
| 2660 |
+
"grad_norm": 0.5196051001548767,
|
| 2661 |
+
"learning_rate": 0.00020780066925649634,
|
| 2662 |
+
"loss": 0.3277815878391266,
|
| 2663 |
+
"step": 379
|
| 2664 |
+
},
|
| 2665 |
+
{
|
| 2666 |
+
"epoch": 2.7364620938628157,
|
| 2667 |
+
"grad_norm": 0.44720444083213806,
|
| 2668 |
+
"learning_rate": 0.00020697989934050025,
|
| 2669 |
+
"loss": 0.25156158208847046,
|
| 2670 |
+
"step": 380
|
| 2671 |
+
},
|
| 2672 |
+
{
|
| 2673 |
+
"epoch": 2.743682310469314,
|
| 2674 |
+
"grad_norm": 0.43984708189964294,
|
| 2675 |
+
"learning_rate": 0.00020615901171123412,
|
| 2676 |
+
"loss": 0.28022634983062744,
|
| 2677 |
+
"step": 381
|
| 2678 |
+
},
|
| 2679 |
+
{
|
| 2680 |
+
"epoch": 2.7509025270758123,
|
| 2681 |
+
"grad_norm": 0.47703853249549866,
|
| 2682 |
+
"learning_rate": 0.00020533802021264648,
|
| 2683 |
+
"loss": 0.2780344486236572,
|
| 2684 |
+
"step": 382
|
| 2685 |
+
},
|
| 2686 |
+
{
|
| 2687 |
+
"epoch": 2.7581227436823106,
|
| 2688 |
+
"grad_norm": 0.43746253848075867,
|
| 2689 |
+
"learning_rate": 0.00020451693869043763,
|
| 2690 |
+
"loss": 0.23613542318344116,
|
| 2691 |
+
"step": 383
|
| 2692 |
+
},
|
| 2693 |
+
{
|
| 2694 |
+
"epoch": 2.765342960288809,
|
| 2695 |
+
"grad_norm": 0.41468992829322815,
|
| 2696 |
+
"learning_rate": 0.00020369578099182597,
|
| 2697 |
+
"loss": 0.3185104429721832,
|
| 2698 |
+
"step": 384
|
| 2699 |
+
},
|
| 2700 |
+
{
|
| 2701 |
+
"epoch": 2.7725631768953067,
|
| 2702 |
+
"grad_norm": 0.5149108171463013,
|
| 2703 |
+
"learning_rate": 0.0002028745609653147,
|
| 2704 |
+
"loss": 0.2768135070800781,
|
| 2705 |
+
"step": 385
|
| 2706 |
+
},
|
| 2707 |
+
{
|
| 2708 |
+
"epoch": 2.779783393501805,
|
| 2709 |
+
"grad_norm": 0.47348129749298096,
|
| 2710 |
+
"learning_rate": 0.00020205329246045798,
|
| 2711 |
+
"loss": 0.31962212920188904,
|
| 2712 |
+
"step": 386
|
| 2713 |
+
},
|
| 2714 |
+
{
|
| 2715 |
+
"epoch": 2.7870036101083033,
|
| 2716 |
+
"grad_norm": 0.4738944172859192,
|
| 2717 |
+
"learning_rate": 0.00020123198932762778,
|
| 2718 |
+
"loss": 0.23498407006263733,
|
| 2719 |
+
"step": 387
|
| 2720 |
+
},
|
| 2721 |
+
{
|
| 2722 |
+
"epoch": 2.794223826714801,
|
| 2723 |
+
"grad_norm": 0.48899075388908386,
|
| 2724 |
+
"learning_rate": 0.0002004106654177798,
|
| 2725 |
+
"loss": 0.23857903480529785,
|
| 2726 |
+
"step": 388
|
| 2727 |
+
},
|
| 2728 |
+
{
|
| 2729 |
+
"epoch": 2.8014440433212995,
|
| 2730 |
+
"grad_norm": 0.45867517590522766,
|
| 2731 |
+
"learning_rate": 0.00019958933458222026,
|
| 2732 |
+
"loss": 0.3246588706970215,
|
| 2733 |
+
"step": 389
|
| 2734 |
+
},
|
| 2735 |
+
{
|
| 2736 |
+
"epoch": 2.808664259927798,
|
| 2737 |
+
"grad_norm": 0.5840234160423279,
|
| 2738 |
+
"learning_rate": 0.0001987680106723723,
|
| 2739 |
+
"loss": 0.2935522198677063,
|
| 2740 |
+
"step": 390
|
| 2741 |
+
},
|
| 2742 |
+
{
|
| 2743 |
+
"epoch": 2.815884476534296,
|
| 2744 |
+
"grad_norm": 0.3764658272266388,
|
| 2745 |
+
"learning_rate": 0.00019794670753954204,
|
| 2746 |
+
"loss": 0.2096547782421112,
|
| 2747 |
+
"step": 391
|
| 2748 |
+
},
|
| 2749 |
+
{
|
| 2750 |
+
"epoch": 2.8231046931407944,
|
| 2751 |
+
"grad_norm": 0.44675493240356445,
|
| 2752 |
+
"learning_rate": 0.00019712543903468535,
|
| 2753 |
+
"loss": 0.2988222539424896,
|
| 2754 |
+
"step": 392
|
| 2755 |
+
},
|
| 2756 |
+
{
|
| 2757 |
+
"epoch": 2.8303249097472927,
|
| 2758 |
+
"grad_norm": 0.43063509464263916,
|
| 2759 |
+
"learning_rate": 0.00019630421900817407,
|
| 2760 |
+
"loss": 0.2222481369972229,
|
| 2761 |
+
"step": 393
|
| 2762 |
+
},
|
| 2763 |
+
{
|
| 2764 |
+
"epoch": 2.8375451263537905,
|
| 2765 |
+
"grad_norm": 0.47969475388526917,
|
| 2766 |
+
"learning_rate": 0.00019548306130956242,
|
| 2767 |
+
"loss": 0.26167353987693787,
|
| 2768 |
+
"step": 394
|
| 2769 |
+
},
|
| 2770 |
+
{
|
| 2771 |
+
"epoch": 2.844765342960289,
|
| 2772 |
+
"grad_norm": 0.47235366702079773,
|
| 2773 |
+
"learning_rate": 0.00019466197978735354,
|
| 2774 |
+
"loss": 0.30541300773620605,
|
| 2775 |
+
"step": 395
|
| 2776 |
+
},
|
| 2777 |
+
{
|
| 2778 |
+
"epoch": 2.851985559566787,
|
| 2779 |
+
"grad_norm": 0.47744160890579224,
|
| 2780 |
+
"learning_rate": 0.00019384098828876598,
|
| 2781 |
+
"loss": 0.23645427823066711,
|
| 2782 |
+
"step": 396
|
| 2783 |
+
},
|
| 2784 |
+
{
|
| 2785 |
+
"epoch": 2.859205776173285,
|
| 2786 |
+
"grad_norm": 0.5037774443626404,
|
| 2787 |
+
"learning_rate": 0.00019302010065949988,
|
| 2788 |
+
"loss": 0.26774662733078003,
|
| 2789 |
+
"step": 397
|
| 2790 |
+
},
|
| 2791 |
+
{
|
| 2792 |
+
"epoch": 2.8664259927797833,
|
| 2793 |
+
"grad_norm": 0.4689895510673523,
|
| 2794 |
+
"learning_rate": 0.0001921993307435037,
|
| 2795 |
+
"loss": 0.3405228853225708,
|
| 2796 |
+
"step": 398
|
| 2797 |
+
},
|
| 2798 |
+
{
|
| 2799 |
+
"epoch": 2.8736462093862816,
|
| 2800 |
+
"grad_norm": 0.44282686710357666,
|
| 2801 |
+
"learning_rate": 0.00019137869238274093,
|
| 2802 |
+
"loss": 0.26063668727874756,
|
| 2803 |
+
"step": 399
|
| 2804 |
+
},
|
| 2805 |
+
{
|
| 2806 |
+
"epoch": 2.88086642599278,
|
| 2807 |
+
"grad_norm": 0.4379267990589142,
|
| 2808 |
+
"learning_rate": 0.0001905581994169562,
|
| 2809 |
+
"loss": 0.26478758454322815,
|
| 2810 |
+
"step": 400
|
| 2811 |
+
},
|
| 2812 |
+
{
|
| 2813 |
+
"epoch": 2.888086642599278,
|
| 2814 |
+
"grad_norm": 0.519749641418457,
|
| 2815 |
+
"learning_rate": 0.00018973786568344205,
|
| 2816 |
+
"loss": 0.31215131282806396,
|
| 2817 |
+
"step": 401
|
| 2818 |
+
},
|
| 2819 |
+
{
|
| 2820 |
+
"epoch": 2.895306859205776,
|
| 2821 |
+
"grad_norm": 0.4515770375728607,
|
| 2822 |
+
"learning_rate": 0.000188917705016806,
|
| 2823 |
+
"loss": 0.2881377339363098,
|
| 2824 |
+
"step": 402
|
| 2825 |
+
},
|
| 2826 |
+
{
|
| 2827 |
+
"epoch": 2.9025270758122743,
|
| 2828 |
+
"grad_norm": 0.4650344252586365,
|
| 2829 |
+
"learning_rate": 0.0001880977312487365,
|
| 2830 |
+
"loss": 0.2557958960533142,
|
| 2831 |
+
"step": 403
|
| 2832 |
+
},
|
| 2833 |
+
{
|
| 2834 |
+
"epoch": 2.9097472924187726,
|
| 2835 |
+
"grad_norm": 0.4621173143386841,
|
| 2836 |
+
"learning_rate": 0.0001872779582077702,
|
| 2837 |
+
"loss": 0.23401126265525818,
|
| 2838 |
+
"step": 404
|
| 2839 |
+
},
|
| 2840 |
+
{
|
| 2841 |
+
"epoch": 2.916967509025271,
|
| 2842 |
+
"grad_norm": 0.4094926118850708,
|
| 2843 |
+
"learning_rate": 0.00018645839971905852,
|
| 2844 |
+
"loss": 0.24556361138820648,
|
| 2845 |
+
"step": 405
|
| 2846 |
+
},
|
| 2847 |
+
{
|
| 2848 |
+
"epoch": 2.9241877256317688,
|
| 2849 |
+
"grad_norm": 0.48592710494995117,
|
| 2850 |
+
"learning_rate": 0.0001856390696041345,
|
| 2851 |
+
"loss": 0.27918654680252075,
|
| 2852 |
+
"step": 406
|
| 2853 |
+
},
|
| 2854 |
+
{
|
| 2855 |
+
"epoch": 2.931407942238267,
|
| 2856 |
+
"grad_norm": 0.4039171040058136,
|
| 2857 |
+
"learning_rate": 0.00018481998168067983,
|
| 2858 |
+
"loss": 0.22918914258480072,
|
| 2859 |
+
"step": 407
|
| 2860 |
+
},
|
| 2861 |
+
{
|
| 2862 |
+
"epoch": 2.9386281588447654,
|
| 2863 |
+
"grad_norm": 0.5521522760391235,
|
| 2864 |
+
"learning_rate": 0.0001840011497622917,
|
| 2865 |
+
"loss": 0.35596632957458496,
|
| 2866 |
+
"step": 408
|
| 2867 |
+
},
|
| 2868 |
+
{
|
| 2869 |
+
"epoch": 2.9458483754512637,
|
| 2870 |
+
"grad_norm": 0.5527123212814331,
|
| 2871 |
+
"learning_rate": 0.0001831825876582498,
|
| 2872 |
+
"loss": 0.25526192784309387,
|
| 2873 |
+
"step": 409
|
| 2874 |
+
},
|
| 2875 |
+
{
|
| 2876 |
+
"epoch": 2.953068592057762,
|
| 2877 |
+
"grad_norm": 0.4386238157749176,
|
| 2878 |
+
"learning_rate": 0.0001823643091732837,
|
| 2879 |
+
"loss": 0.2627878189086914,
|
| 2880 |
+
"step": 410
|
| 2881 |
+
},
|
| 2882 |
+
{
|
| 2883 |
+
"epoch": 2.96028880866426,
|
| 2884 |
+
"grad_norm": 0.48318973183631897,
|
| 2885 |
+
"learning_rate": 0.00018154632810733962,
|
| 2886 |
+
"loss": 0.29408901929855347,
|
| 2887 |
+
"step": 411
|
| 2888 |
+
},
|
| 2889 |
+
{
|
| 2890 |
+
"epoch": 2.967509025270758,
|
| 2891 |
+
"grad_norm": 0.5193997025489807,
|
| 2892 |
+
"learning_rate": 0.00018072865825534805,
|
| 2893 |
+
"loss": 0.2762555480003357,
|
| 2894 |
+
"step": 412
|
| 2895 |
+
},
|
| 2896 |
+
{
|
| 2897 |
+
"epoch": 2.9747292418772564,
|
| 2898 |
+
"grad_norm": 0.488490492105484,
|
| 2899 |
+
"learning_rate": 0.000179911313406991,
|
| 2900 |
+
"loss": 0.3119064271450043,
|
| 2901 |
+
"step": 413
|
| 2902 |
+
},
|
| 2903 |
+
{
|
| 2904 |
+
"epoch": 2.9819494584837543,
|
| 2905 |
+
"grad_norm": 0.4461340010166168,
|
| 2906 |
+
"learning_rate": 0.00017909430734646935,
|
| 2907 |
+
"loss": 0.2738839089870453,
|
| 2908 |
+
"step": 414
|
| 2909 |
+
},
|
| 2910 |
+
{
|
| 2911 |
+
"epoch": 2.9891696750902526,
|
| 2912 |
+
"grad_norm": 0.4488433003425598,
|
| 2913 |
+
"learning_rate": 0.0001782776538522704,
|
| 2914 |
+
"loss": 0.25788843631744385,
|
| 2915 |
+
"step": 415
|
| 2916 |
+
},
|
| 2917 |
+
{
|
| 2918 |
+
"epoch": 2.996389891696751,
|
| 2919 |
+
"grad_norm": 0.5179741382598877,
|
| 2920 |
+
"learning_rate": 0.0001774613666969358,
|
| 2921 |
+
"loss": 0.2556946575641632,
|
| 2922 |
+
"step": 416
|
| 2923 |
+
},
|
| 2924 |
+
{
|
| 2925 |
+
"epoch": 3.0,
|
| 2926 |
+
"grad_norm": 0.6138741374015808,
|
| 2927 |
+
"learning_rate": 0.00017664545964682878,
|
| 2928 |
+
"loss": 0.23274531960487366,
|
| 2929 |
+
"step": 417
|
| 2930 |
+
},
|
| 2931 |
+
{
|
| 2932 |
+
"epoch": 3.0072202166064983,
|
| 2933 |
+
"grad_norm": 0.27745357155799866,
|
| 2934 |
+
"learning_rate": 0.00017582994646190233,
|
| 2935 |
+
"loss": 0.14754480123519897,
|
| 2936 |
+
"step": 418
|
| 2937 |
+
},
|
| 2938 |
+
{
|
| 2939 |
+
"epoch": 3.0144404332129966,
|
| 2940 |
+
"grad_norm": 0.40759217739105225,
|
| 2941 |
+
"learning_rate": 0.00017501484089546708,
|
| 2942 |
+
"loss": 0.21522817015647888,
|
| 2943 |
+
"step": 419
|
| 2944 |
+
},
|
| 2945 |
+
{
|
| 2946 |
+
"epoch": 3.0216606498194944,
|
| 2947 |
+
"grad_norm": 0.3123788833618164,
|
| 2948 |
+
"learning_rate": 0.00017420015669395938,
|
| 2949 |
+
"loss": 0.15608534216880798,
|
| 2950 |
+
"step": 420
|
| 2951 |
+
},
|
| 2952 |
+
{
|
| 2953 |
+
"epoch": 3.0288808664259927,
|
| 2954 |
+
"grad_norm": 0.4599035978317261,
|
| 2955 |
+
"learning_rate": 0.00017338590759670934,
|
| 2956 |
+
"loss": 0.1309528797864914,
|
| 2957 |
+
"step": 421
|
| 2958 |
+
},
|
| 2959 |
+
{
|
| 2960 |
+
"epoch": 3.036101083032491,
|
| 2961 |
+
"grad_norm": 0.38352325558662415,
|
| 2962 |
+
"learning_rate": 0.00017257210733570916,
|
| 2963 |
+
"loss": 0.1724625676870346,
|
| 2964 |
+
"step": 422
|
| 2965 |
+
},
|
| 2966 |
+
{
|
| 2967 |
+
"epoch": 3.0433212996389893,
|
| 2968 |
+
"grad_norm": 0.44771838188171387,
|
| 2969 |
+
"learning_rate": 0.00017175876963538178,
|
| 2970 |
+
"loss": 0.1661359965801239,
|
| 2971 |
+
"step": 423
|
| 2972 |
+
},
|
| 2973 |
+
{
|
| 2974 |
+
"epoch": 3.050541516245487,
|
| 2975 |
+
"grad_norm": 0.5998123288154602,
|
| 2976 |
+
"learning_rate": 0.00017094590821234906,
|
| 2977 |
+
"loss": 0.1318468153476715,
|
| 2978 |
+
"step": 424
|
| 2979 |
+
},
|
| 2980 |
+
{
|
| 2981 |
+
"epoch": 3.0577617328519855,
|
| 2982 |
+
"grad_norm": 0.47632187604904175,
|
| 2983 |
+
"learning_rate": 0.00017013353677520064,
|
| 2984 |
+
"loss": 0.10464094579219818,
|
| 2985 |
+
"step": 425
|
| 2986 |
+
},
|
| 2987 |
+
{
|
| 2988 |
+
"epoch": 3.064981949458484,
|
| 2989 |
+
"grad_norm": 0.3745962083339691,
|
| 2990 |
+
"learning_rate": 0.00016932166902426288,
|
| 2991 |
+
"loss": 0.10677687078714371,
|
| 2992 |
+
"step": 426
|
| 2993 |
+
},
|
| 2994 |
+
{
|
| 2995 |
+
"epoch": 3.072202166064982,
|
| 2996 |
+
"grad_norm": 0.6340925693511963,
|
| 2997 |
+
"learning_rate": 0.00016851031865136763,
|
| 2998 |
+
"loss": 0.1600916087627411,
|
| 2999 |
+
"step": 427
|
| 3000 |
+
},
|
| 3001 |
+
{
|
| 3002 |
+
"epoch": 3.07942238267148,
|
| 3003 |
+
"grad_norm": 0.8183390498161316,
|
| 3004 |
+
"learning_rate": 0.00016769949933962127,
|
| 3005 |
+
"loss": 0.13513822853565216,
|
| 3006 |
+
"step": 428
|
| 3007 |
+
},
|
| 3008 |
+
{
|
| 3009 |
+
"epoch": 3.0866425992779782,
|
| 3010 |
+
"grad_norm": 0.8068543076515198,
|
| 3011 |
+
"learning_rate": 0.00016688922476317398,
|
| 3012 |
+
"loss": 0.14319300651550293,
|
| 3013 |
+
"step": 429
|
| 3014 |
+
},
|
| 3015 |
+
{
|
| 3016 |
+
"epoch": 3.0938628158844765,
|
| 3017 |
+
"grad_norm": 0.6381204128265381,
|
| 3018 |
+
"learning_rate": 0.00016607950858698946,
|
| 3019 |
+
"loss": 0.1376371830701828,
|
| 3020 |
+
"step": 430
|
| 3021 |
+
},
|
| 3022 |
+
{
|
| 3023 |
+
"epoch": 3.101083032490975,
|
| 3024 |
+
"grad_norm": 0.5576755404472351,
|
| 3025 |
+
"learning_rate": 0.00016527036446661395,
|
| 3026 |
+
"loss": 0.14407199621200562,
|
| 3027 |
+
"step": 431
|
| 3028 |
+
},
|
| 3029 |
+
{
|
| 3030 |
+
"epoch": 3.108303249097473,
|
| 3031 |
+
"grad_norm": 0.6089445948600769,
|
| 3032 |
+
"learning_rate": 0.00016446180604794627,
|
| 3033 |
+
"loss": 0.1575869917869568,
|
| 3034 |
+
"step": 432
|
| 3035 |
+
},
|
| 3036 |
+
{
|
| 3037 |
+
"epoch": 3.115523465703971,
|
| 3038 |
+
"grad_norm": 0.6250684857368469,
|
| 3039 |
+
"learning_rate": 0.0001636538469670077,
|
| 3040 |
+
"loss": 0.17905279994010925,
|
| 3041 |
+
"step": 433
|
| 3042 |
+
},
|
| 3043 |
+
{
|
| 3044 |
+
"epoch": 3.1227436823104693,
|
| 3045 |
+
"grad_norm": 0.4243159592151642,
|
| 3046 |
+
"learning_rate": 0.00016284650084971185,
|
| 3047 |
+
"loss": 0.12401723116636276,
|
| 3048 |
+
"step": 434
|
| 3049 |
+
},
|
| 3050 |
+
{
|
| 3051 |
+
"epoch": 3.1299638989169676,
|
| 3052 |
+
"grad_norm": 0.4369412362575531,
|
| 3053 |
+
"learning_rate": 0.00016203978131163485,
|
| 3054 |
+
"loss": 0.11108125746250153,
|
| 3055 |
+
"step": 435
|
| 3056 |
+
},
|
| 3057 |
+
{
|
| 3058 |
+
"epoch": 3.137184115523466,
|
| 3059 |
+
"grad_norm": 0.45113661885261536,
|
| 3060 |
+
"learning_rate": 0.000161233701957786,
|
| 3061 |
+
"loss": 0.1364113986492157,
|
| 3062 |
+
"step": 436
|
| 3063 |
+
},
|
| 3064 |
+
{
|
| 3065 |
+
"epoch": 3.1444043321299637,
|
| 3066 |
+
"grad_norm": 0.33899277448654175,
|
| 3067 |
+
"learning_rate": 0.00016042827638237806,
|
| 3068 |
+
"loss": 0.1253184676170349,
|
| 3069 |
+
"step": 437
|
| 3070 |
+
},
|
| 3071 |
+
{
|
| 3072 |
+
"epoch": 3.151624548736462,
|
| 3073 |
+
"grad_norm": 0.48023247718811035,
|
| 3074 |
+
"learning_rate": 0.000159623518168598,
|
| 3075 |
+
"loss": 0.1729699671268463,
|
| 3076 |
+
"step": 438
|
| 3077 |
+
},
|
| 3078 |
+
{
|
| 3079 |
+
"epoch": 3.1588447653429603,
|
| 3080 |
+
"grad_norm": 0.4260300397872925,
|
| 3081 |
+
"learning_rate": 0.00015881944088837804,
|
| 3082 |
+
"loss": 0.1630483865737915,
|
| 3083 |
+
"step": 439
|
| 3084 |
+
},
|
| 3085 |
+
{
|
| 3086 |
+
"epoch": 3.1660649819494586,
|
| 3087 |
+
"grad_norm": 0.34896689653396606,
|
| 3088 |
+
"learning_rate": 0.00015801605810216685,
|
| 3089 |
+
"loss": 0.14477582275867462,
|
| 3090 |
+
"step": 440
|
| 3091 |
+
},
|
| 3092 |
+
{
|
| 3093 |
+
"epoch": 3.1732851985559565,
|
| 3094 |
+
"grad_norm": 0.46189841628074646,
|
| 3095 |
+
"learning_rate": 0.00015721338335870057,
|
| 3096 |
+
"loss": 0.16415920853614807,
|
| 3097 |
+
"step": 441
|
| 3098 |
+
},
|
| 3099 |
+
{
|
| 3100 |
+
"epoch": 3.1805054151624548,
|
| 3101 |
+
"grad_norm": 0.40856343507766724,
|
| 3102 |
+
"learning_rate": 0.00015641143019477446,
|
| 3103 |
+
"loss": 0.12028312683105469,
|
| 3104 |
+
"step": 442
|
| 3105 |
+
},
|
| 3106 |
+
{
|
| 3107 |
+
"epoch": 3.187725631768953,
|
| 3108 |
+
"grad_norm": 0.36561018228530884,
|
| 3109 |
+
"learning_rate": 0.00015561021213501483,
|
| 3110 |
+
"loss": 0.12599362432956696,
|
| 3111 |
+
"step": 443
|
| 3112 |
+
},
|
| 3113 |
+
{
|
| 3114 |
+
"epoch": 3.1949458483754514,
|
| 3115 |
+
"grad_norm": 0.4341471493244171,
|
| 3116 |
+
"learning_rate": 0.0001548097426916505,
|
| 3117 |
+
"loss": 0.14446969330310822,
|
| 3118 |
+
"step": 444
|
| 3119 |
+
},
|
| 3120 |
+
{
|
| 3121 |
+
"epoch": 3.2021660649819497,
|
| 3122 |
+
"grad_norm": 0.3864421844482422,
|
| 3123 |
+
"learning_rate": 0.00015401003536428534,
|
| 3124 |
+
"loss": 0.11642799526453018,
|
| 3125 |
+
"step": 445
|
| 3126 |
+
},
|
| 3127 |
+
{
|
| 3128 |
+
"epoch": 3.2093862815884475,
|
| 3129 |
+
"grad_norm": 0.5154263973236084,
|
| 3130 |
+
"learning_rate": 0.00015321110363967035,
|
| 3131 |
+
"loss": 0.17028403282165527,
|
| 3132 |
+
"step": 446
|
| 3133 |
+
},
|
| 3134 |
+
{
|
| 3135 |
+
"epoch": 3.216606498194946,
|
| 3136 |
+
"grad_norm": 0.4077145755290985,
|
| 3137 |
+
"learning_rate": 0.0001524129609914763,
|
| 3138 |
+
"loss": 0.11544163525104523,
|
| 3139 |
+
"step": 447
|
| 3140 |
+
},
|
| 3141 |
+
{
|
| 3142 |
+
"epoch": 3.223826714801444,
|
| 3143 |
+
"grad_norm": 0.41609570384025574,
|
| 3144 |
+
"learning_rate": 0.00015161562088006648,
|
| 3145 |
+
"loss": 0.1203891783952713,
|
| 3146 |
+
"step": 448
|
| 3147 |
+
},
|
| 3148 |
+
{
|
| 3149 |
+
"epoch": 3.2310469314079424,
|
| 3150 |
+
"grad_norm": 0.430624783039093,
|
| 3151 |
+
"learning_rate": 0.00015081909675226975,
|
| 3152 |
+
"loss": 0.09192588925361633,
|
| 3153 |
+
"step": 449
|
| 3154 |
+
},
|
| 3155 |
+
{
|
| 3156 |
+
"epoch": 3.2382671480144403,
|
| 3157 |
+
"grad_norm": 0.5538221001625061,
|
| 3158 |
+
"learning_rate": 0.0001500234020411538,
|
| 3159 |
+
"loss": 0.16532525420188904,
|
| 3160 |
+
"step": 450
|
| 3161 |
+
},
|
| 3162 |
+
{
|
| 3163 |
+
"epoch": 3.2454873646209386,
|
| 3164 |
+
"grad_norm": 0.6360041499137878,
|
| 3165 |
+
"learning_rate": 0.00014922855016579845,
|
| 3166 |
+
"loss": 0.13534685969352722,
|
| 3167 |
+
"step": 451
|
| 3168 |
+
},
|
| 3169 |
+
{
|
| 3170 |
+
"epoch": 3.252707581227437,
|
| 3171 |
+
"grad_norm": 0.556538462638855,
|
| 3172 |
+
"learning_rate": 0.00014843455453106925,
|
| 3173 |
+
"loss": 0.16164641082286835,
|
| 3174 |
+
"step": 452
|
| 3175 |
+
},
|
| 3176 |
+
{
|
| 3177 |
+
"epoch": 3.259927797833935,
|
| 3178 |
+
"grad_norm": 0.8166404366493225,
|
| 3179 |
+
"learning_rate": 0.00014764142852739193,
|
| 3180 |
+
"loss": 0.17865729331970215,
|
| 3181 |
+
"step": 453
|
| 3182 |
+
},
|
| 3183 |
+
{
|
| 3184 |
+
"epoch": 3.2671480144404335,
|
| 3185 |
+
"grad_norm": 0.6231580972671509,
|
| 3186 |
+
"learning_rate": 0.00014684918553052603,
|
| 3187 |
+
"loss": 0.11281149089336395,
|
| 3188 |
+
"step": 454
|
| 3189 |
+
},
|
| 3190 |
+
{
|
| 3191 |
+
"epoch": 3.2743682310469313,
|
| 3192 |
+
"grad_norm": 0.5884938836097717,
|
| 3193 |
+
"learning_rate": 0.00014605783890133948,
|
| 3194 |
+
"loss": 0.15221013128757477,
|
| 3195 |
+
"step": 455
|
| 3196 |
+
},
|
| 3197 |
+
{
|
| 3198 |
+
"epoch": 3.2815884476534296,
|
| 3199 |
+
"grad_norm": 0.40336933732032776,
|
| 3200 |
+
"learning_rate": 0.00014526740198558344,
|
| 3201 |
+
"loss": 0.08725619316101074,
|
| 3202 |
+
"step": 456
|
| 3203 |
+
},
|
| 3204 |
+
{
|
| 3205 |
+
"epoch": 3.288808664259928,
|
| 3206 |
+
"grad_norm": 0.7082973718643188,
|
| 3207 |
+
"learning_rate": 0.0001444778881136671,
|
| 3208 |
+
"loss": 0.1795981079339981,
|
| 3209 |
+
"step": 457
|
| 3210 |
+
},
|
| 3211 |
+
{
|
| 3212 |
+
"epoch": 3.2960288808664258,
|
| 3213 |
+
"grad_norm": 0.44312670826911926,
|
| 3214 |
+
"learning_rate": 0.0001436893106004328,
|
| 3215 |
+
"loss": 0.11532506346702576,
|
| 3216 |
+
"step": 458
|
| 3217 |
+
},
|
| 3218 |
+
{
|
| 3219 |
+
"epoch": 3.303249097472924,
|
| 3220 |
+
"grad_norm": 0.4892312288284302,
|
| 3221 |
+
"learning_rate": 0.0001429016827449316,
|
| 3222 |
+
"loss": 0.15218153595924377,
|
| 3223 |
+
"step": 459
|
| 3224 |
+
},
|
| 3225 |
+
{
|
| 3226 |
+
"epoch": 3.3104693140794224,
|
| 3227 |
+
"grad_norm": 0.36000511050224304,
|
| 3228 |
+
"learning_rate": 0.000142115017830199,
|
| 3229 |
+
"loss": 0.1174839586019516,
|
| 3230 |
+
"step": 460
|
| 3231 |
+
},
|
| 3232 |
+
{
|
| 3233 |
+
"epoch": 3.3176895306859207,
|
| 3234 |
+
"grad_norm": 0.42502933740615845,
|
| 3235 |
+
"learning_rate": 0.00014132932912303082,
|
| 3236 |
+
"loss": 0.1354883909225464,
|
| 3237 |
+
"step": 461
|
| 3238 |
+
},
|
| 3239 |
+
{
|
| 3240 |
+
"epoch": 3.324909747292419,
|
| 3241 |
+
"grad_norm": 0.5004318356513977,
|
| 3242 |
+
"learning_rate": 0.00014054462987375947,
|
| 3243 |
+
"loss": 0.14879979193210602,
|
| 3244 |
+
"step": 462
|
| 3245 |
+
},
|
| 3246 |
+
{
|
| 3247 |
+
"epoch": 3.332129963898917,
|
| 3248 |
+
"grad_norm": 0.5428838729858398,
|
| 3249 |
+
"learning_rate": 0.00013976093331603072,
|
| 3250 |
+
"loss": 0.1601594090461731,
|
| 3251 |
+
"step": 463
|
| 3252 |
+
},
|
| 3253 |
+
{
|
| 3254 |
+
"epoch": 3.339350180505415,
|
| 3255 |
+
"grad_norm": 0.5523360967636108,
|
| 3256 |
+
"learning_rate": 0.00013897825266658015,
|
| 3257 |
+
"loss": 0.1349392980337143,
|
| 3258 |
+
"step": 464
|
| 3259 |
+
},
|
| 3260 |
+
{
|
| 3261 |
+
"epoch": 3.3465703971119134,
|
| 3262 |
+
"grad_norm": 0.4672771394252777,
|
| 3263 |
+
"learning_rate": 0.00013819660112501054,
|
| 3264 |
+
"loss": 0.1563996523618698,
|
| 3265 |
+
"step": 465
|
| 3266 |
+
},
|
| 3267 |
+
{
|
| 3268 |
+
"epoch": 3.3537906137184117,
|
| 3269 |
+
"grad_norm": 0.4747507870197296,
|
| 3270 |
+
"learning_rate": 0.00013741599187356917,
|
| 3271 |
+
"loss": 0.12792187929153442,
|
| 3272 |
+
"step": 466
|
| 3273 |
+
},
|
| 3274 |
+
{
|
| 3275 |
+
"epoch": 3.3610108303249095,
|
| 3276 |
+
"grad_norm": 0.4293171167373657,
|
| 3277 |
+
"learning_rate": 0.00013663643807692547,
|
| 3278 |
+
"loss": 0.13704359531402588,
|
| 3279 |
+
"step": 467
|
| 3280 |
+
},
|
| 3281 |
+
{
|
| 3282 |
+
"epoch": 3.368231046931408,
|
| 3283 |
+
"grad_norm": 0.406646728515625,
|
| 3284 |
+
"learning_rate": 0.00013585795288194902,
|
| 3285 |
+
"loss": 0.14688344299793243,
|
| 3286 |
+
"step": 468
|
| 3287 |
+
},
|
| 3288 |
+
{
|
| 3289 |
+
"epoch": 3.375451263537906,
|
| 3290 |
+
"grad_norm": 0.44870486855506897,
|
| 3291 |
+
"learning_rate": 0.00013508054941748792,
|
| 3292 |
+
"loss": 0.11994664371013641,
|
| 3293 |
+
"step": 469
|
| 3294 |
+
},
|
| 3295 |
+
{
|
| 3296 |
+
"epoch": 3.3826714801444044,
|
| 3297 |
+
"grad_norm": 0.46383994817733765,
|
| 3298 |
+
"learning_rate": 0.00013430424079414728,
|
| 3299 |
+
"loss": 0.13228918612003326,
|
| 3300 |
+
"step": 470
|
| 3301 |
+
},
|
| 3302 |
+
{
|
| 3303 |
+
"epoch": 3.3898916967509027,
|
| 3304 |
+
"grad_norm": 0.873016893863678,
|
| 3305 |
+
"learning_rate": 0.0001335290401040681,
|
| 3306 |
+
"loss": 0.14495904743671417,
|
| 3307 |
+
"step": 471
|
| 3308 |
+
},
|
| 3309 |
+
{
|
| 3310 |
+
"epoch": 3.3971119133574006,
|
| 3311 |
+
"grad_norm": 0.5575613975524902,
|
| 3312 |
+
"learning_rate": 0.0001327549604207066,
|
| 3313 |
+
"loss": 0.17171433568000793,
|
| 3314 |
+
"step": 472
|
| 3315 |
+
},
|
| 3316 |
+
{
|
| 3317 |
+
"epoch": 3.404332129963899,
|
| 3318 |
+
"grad_norm": 0.541860818862915,
|
| 3319 |
+
"learning_rate": 0.00013198201479861353,
|
| 3320 |
+
"loss": 0.14465925097465515,
|
| 3321 |
+
"step": 473
|
| 3322 |
+
},
|
| 3323 |
+
{
|
| 3324 |
+
"epoch": 3.411552346570397,
|
| 3325 |
+
"grad_norm": 0.5210021734237671,
|
| 3326 |
+
"learning_rate": 0.00013121021627321438,
|
| 3327 |
+
"loss": 0.15102122724056244,
|
| 3328 |
+
"step": 474
|
| 3329 |
+
},
|
| 3330 |
+
{
|
| 3331 |
+
"epoch": 3.4187725631768955,
|
| 3332 |
+
"grad_norm": 0.46373456716537476,
|
| 3333 |
+
"learning_rate": 0.00013043957786058904,
|
| 3334 |
+
"loss": 0.15518702566623688,
|
| 3335 |
+
"step": 475
|
| 3336 |
+
},
|
| 3337 |
+
{
|
| 3338 |
+
"epoch": 3.4259927797833933,
|
| 3339 |
+
"grad_norm": 0.48513785004615784,
|
| 3340 |
+
"learning_rate": 0.00012967011255725263,
|
| 3341 |
+
"loss": 0.14110815525054932,
|
| 3342 |
+
"step": 476
|
| 3343 |
+
},
|
| 3344 |
+
{
|
| 3345 |
+
"epoch": 3.4332129963898916,
|
| 3346 |
+
"grad_norm": 0.5956123471260071,
|
| 3347 |
+
"learning_rate": 0.0001289018333399364,
|
| 3348 |
+
"loss": 0.14913466572761536,
|
| 3349 |
+
"step": 477
|
| 3350 |
+
},
|
| 3351 |
+
{
|
| 3352 |
+
"epoch": 3.44043321299639,
|
| 3353 |
+
"grad_norm": 0.5387746095657349,
|
| 3354 |
+
"learning_rate": 0.0001281347531653685,
|
| 3355 |
+
"loss": 0.14882197976112366,
|
| 3356 |
+
"step": 478
|
| 3357 |
+
},
|
| 3358 |
+
{
|
| 3359 |
+
"epoch": 3.4476534296028882,
|
| 3360 |
+
"grad_norm": 0.43160125613212585,
|
| 3361 |
+
"learning_rate": 0.00012736888497005578,
|
| 3362 |
+
"loss": 0.13204768300056458,
|
| 3363 |
+
"step": 479
|
| 3364 |
+
},
|
| 3365 |
+
{
|
| 3366 |
+
"epoch": 3.4548736462093865,
|
| 3367 |
+
"grad_norm": 0.41130170226097107,
|
| 3368 |
+
"learning_rate": 0.0001266042416700656,
|
| 3369 |
+
"loss": 0.13427188992500305,
|
| 3370 |
+
"step": 480
|
| 3371 |
+
},
|
| 3372 |
+
{
|
| 3373 |
+
"epoch": 3.4620938628158844,
|
| 3374 |
+
"grad_norm": 0.5126029253005981,
|
| 3375 |
+
"learning_rate": 0.00012584083616080786,
|
| 3376 |
+
"loss": 0.12719954550266266,
|
| 3377 |
+
"step": 481
|
| 3378 |
+
},
|
| 3379 |
+
{
|
| 3380 |
+
"epoch": 3.4693140794223827,
|
| 3381 |
+
"grad_norm": 0.4994872212409973,
|
| 3382 |
+
"learning_rate": 0.0001250786813168176,
|
| 3383 |
+
"loss": 0.15062202513217926,
|
| 3384 |
+
"step": 482
|
| 3385 |
+
},
|
| 3386 |
+
{
|
| 3387 |
+
"epoch": 3.476534296028881,
|
| 3388 |
+
"grad_norm": 0.4697980284690857,
|
| 3389 |
+
"learning_rate": 0.00012431778999153796,
|
| 3390 |
+
"loss": 0.14715459942817688,
|
| 3391 |
+
"step": 483
|
| 3392 |
+
},
|
| 3393 |
+
{
|
| 3394 |
+
"epoch": 3.483754512635379,
|
| 3395 |
+
"grad_norm": 0.5356115102767944,
|
| 3396 |
+
"learning_rate": 0.00012355817501710328,
|
| 3397 |
+
"loss": 0.12667298316955566,
|
| 3398 |
+
"step": 484
|
| 3399 |
+
},
|
| 3400 |
+
{
|
| 3401 |
+
"epoch": 3.490974729241877,
|
| 3402 |
+
"grad_norm": 0.48629310727119446,
|
| 3403 |
+
"learning_rate": 0.00012279984920412264,
|
| 3404 |
+
"loss": 0.12396648526191711,
|
| 3405 |
+
"step": 485
|
| 3406 |
+
},
|
| 3407 |
+
{
|
| 3408 |
+
"epoch": 3.4981949458483754,
|
| 3409 |
+
"grad_norm": 0.6295841336250305,
|
| 3410 |
+
"learning_rate": 0.00012204282534146414,
|
| 3411 |
+
"loss": 0.1579296588897705,
|
| 3412 |
+
"step": 486
|
| 3413 |
+
},
|
| 3414 |
+
{
|
| 3415 |
+
"epoch": 3.5054151624548737,
|
| 3416 |
+
"grad_norm": 0.524736225605011,
|
| 3417 |
+
"learning_rate": 0.00012128711619603885,
|
| 3418 |
+
"loss": 0.14176616072654724,
|
| 3419 |
+
"step": 487
|
| 3420 |
+
},
|
| 3421 |
+
{
|
| 3422 |
+
"epoch": 3.512635379061372,
|
| 3423 |
+
"grad_norm": 0.4429115355014801,
|
| 3424 |
+
"learning_rate": 0.0001205327345125856,
|
| 3425 |
+
"loss": 0.16075468063354492,
|
| 3426 |
+
"step": 488
|
| 3427 |
+
},
|
| 3428 |
+
{
|
| 3429 |
+
"epoch": 3.51985559566787,
|
| 3430 |
+
"grad_norm": 0.5202926993370056,
|
| 3431 |
+
"learning_rate": 0.00011977969301345627,
|
| 3432 |
+
"loss": 0.155876025557518,
|
| 3433 |
+
"step": 489
|
| 3434 |
+
},
|
| 3435 |
+
{
|
| 3436 |
+
"epoch": 3.527075812274368,
|
| 3437 |
+
"grad_norm": 0.5090999603271484,
|
| 3438 |
+
"learning_rate": 0.00011902800439840091,
|
| 3439 |
+
"loss": 0.1420796513557434,
|
| 3440 |
+
"step": 490
|
| 3441 |
+
},
|
| 3442 |
+
{
|
| 3443 |
+
"epoch": 3.5342960288808665,
|
| 3444 |
+
"grad_norm": 0.5266745686531067,
|
| 3445 |
+
"learning_rate": 0.0001182776813443537,
|
| 3446 |
+
"loss": 0.1911281943321228,
|
| 3447 |
+
"step": 491
|
| 3448 |
+
},
|
| 3449 |
+
{
|
| 3450 |
+
"epoch": 3.5415162454873648,
|
| 3451 |
+
"grad_norm": 0.4100717306137085,
|
| 3452 |
+
"learning_rate": 0.00011752873650521934,
|
| 3453 |
+
"loss": 0.12646690011024475,
|
| 3454 |
+
"step": 492
|
| 3455 |
+
},
|
| 3456 |
+
{
|
| 3457 |
+
"epoch": 3.5487364620938626,
|
| 3458 |
+
"grad_norm": 0.4897909164428711,
|
| 3459 |
+
"learning_rate": 0.00011678118251165929,
|
| 3460 |
+
"loss": 0.14893396198749542,
|
| 3461 |
+
"step": 493
|
| 3462 |
+
},
|
| 3463 |
+
{
|
| 3464 |
+
"epoch": 3.555956678700361,
|
| 3465 |
+
"grad_norm": 0.48633724451065063,
|
| 3466 |
+
"learning_rate": 0.00011603503197087893,
|
| 3467 |
+
"loss": 0.11430861800909042,
|
| 3468 |
+
"step": 494
|
| 3469 |
+
},
|
| 3470 |
+
{
|
| 3471 |
+
"epoch": 3.563176895306859,
|
| 3472 |
+
"grad_norm": 0.3797968327999115,
|
| 3473 |
+
"learning_rate": 0.00011529029746641522,
|
| 3474 |
+
"loss": 0.10336866229772568,
|
| 3475 |
+
"step": 495
|
| 3476 |
+
},
|
| 3477 |
+
{
|
| 3478 |
+
"epoch": 3.5703971119133575,
|
| 3479 |
+
"grad_norm": 0.4714502692222595,
|
| 3480 |
+
"learning_rate": 0.00011454699155792387,
|
| 3481 |
+
"loss": 0.12609894573688507,
|
| 3482 |
+
"step": 496
|
| 3483 |
+
},
|
| 3484 |
+
{
|
| 3485 |
+
"epoch": 3.577617328519856,
|
| 3486 |
+
"grad_norm": 0.5311459898948669,
|
| 3487 |
+
"learning_rate": 0.00011380512678096805,
|
| 3488 |
+
"loss": 0.14762037992477417,
|
| 3489 |
+
"step": 497
|
| 3490 |
+
},
|
| 3491 |
+
{
|
| 3492 |
+
"epoch": 3.5848375451263537,
|
| 3493 |
+
"grad_norm": 0.44842103123664856,
|
| 3494 |
+
"learning_rate": 0.00011306471564680703,
|
| 3495 |
+
"loss": 0.1137317568063736,
|
| 3496 |
+
"step": 498
|
| 3497 |
+
},
|
| 3498 |
+
{
|
| 3499 |
+
"epoch": 3.592057761732852,
|
| 3500 |
+
"grad_norm": 0.6083047986030579,
|
| 3501 |
+
"learning_rate": 0.0001123257706421845,
|
| 3502 |
+
"loss": 0.1538015455007553,
|
| 3503 |
+
"step": 499
|
| 3504 |
+
},
|
| 3505 |
+
{
|
| 3506 |
+
"epoch": 3.5992779783393503,
|
| 3507 |
+
"grad_norm": 0.454277902841568,
|
| 3508 |
+
"learning_rate": 0.00011158830422911882,
|
| 3509 |
+
"loss": 0.13900214433670044,
|
| 3510 |
+
"step": 500
|
| 3511 |
+
}
|
| 3512 |
+
],
|
| 3513 |
+
"logging_steps": 1,
|
| 3514 |
+
"max_steps": 770,
|
| 3515 |
+
"num_input_tokens_seen": 0,
|
| 3516 |
+
"num_train_epochs": 6,
|
| 3517 |
+
"save_steps": 500,
|
| 3518 |
+
"stateful_callbacks": {
|
| 3519 |
+
"TrainerControl": {
|
| 3520 |
+
"args": {
|
| 3521 |
+
"should_epoch_stop": false,
|
| 3522 |
+
"should_evaluate": false,
|
| 3523 |
+
"should_log": false,
|
| 3524 |
+
"should_save": true,
|
| 3525 |
+
"should_training_stop": false
|
| 3526 |
+
},
|
| 3527 |
+
"attributes": {}
|
| 3528 |
+
}
|
| 3529 |
+
},
|
| 3530 |
+
"total_flos": 5.525794067913907e+16,
|
| 3531 |
+
"train_batch_size": 1,
|
| 3532 |
+
"trial_name": null,
|
| 3533 |
+
"trial_params": null
|
| 3534 |
+
}
|
checkpoint-500/training_args.bin
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:3feb7d84776eed4718f792285c52122bc3b2372e4e090380a285a8afc9196989
|
| 3 |
+
size 5713
|
checkpoint-770/README.md
ADDED
|
@@ -0,0 +1,210 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
---
|
| 2 |
+
base_model: Qwen/Qwen3.5-9B
|
| 3 |
+
library_name: peft
|
| 4 |
+
pipeline_tag: text-generation
|
| 5 |
+
tags:
|
| 6 |
+
- base_model:adapter:Qwen/Qwen3.5-9B
|
| 7 |
+
- lora
|
| 8 |
+
- sft
|
| 9 |
+
- transformers
|
| 10 |
+
- trl
|
| 11 |
+
- unsloth
|
| 12 |
+
---
|
| 13 |
+
|
| 14 |
+
# Model Card for Model ID
|
| 15 |
+
|
| 16 |
+
<!-- Provide a quick summary of what the model is/does. -->
|
| 17 |
+
|
| 18 |
+
|
| 19 |
+
|
| 20 |
+
## Model Details
|
| 21 |
+
|
| 22 |
+
### Model Description
|
| 23 |
+
|
| 24 |
+
<!-- Provide a longer summary of what this model is. -->
|
| 25 |
+
|
| 26 |
+
|
| 27 |
+
|
| 28 |
+
- **Developed by:** [More Information Needed]
|
| 29 |
+
- **Funded by [optional]:** [More Information Needed]
|
| 30 |
+
- **Shared by [optional]:** [More Information Needed]
|
| 31 |
+
- **Model type:** [More Information Needed]
|
| 32 |
+
- **Language(s) (NLP):** [More Information Needed]
|
| 33 |
+
- **License:** [More Information Needed]
|
| 34 |
+
- **Finetuned from model [optional]:** [More Information Needed]
|
| 35 |
+
|
| 36 |
+
### Model Sources [optional]
|
| 37 |
+
|
| 38 |
+
<!-- Provide the basic links for the model. -->
|
| 39 |
+
|
| 40 |
+
- **Repository:** [More Information Needed]
|
| 41 |
+
- **Paper [optional]:** [More Information Needed]
|
| 42 |
+
- **Demo [optional]:** [More Information Needed]
|
| 43 |
+
|
| 44 |
+
## Uses
|
| 45 |
+
|
| 46 |
+
<!-- Address questions around how the model is intended to be used, including the foreseeable users of the model and those affected by the model. -->
|
| 47 |
+
|
| 48 |
+
### Direct Use
|
| 49 |
+
|
| 50 |
+
<!-- This section is for the model use without fine-tuning or plugging into a larger ecosystem/app. -->
|
| 51 |
+
|
| 52 |
+
[More Information Needed]
|
| 53 |
+
|
| 54 |
+
### Downstream Use [optional]
|
| 55 |
+
|
| 56 |
+
<!-- This section is for the model use when fine-tuned for a task, or when plugged into a larger ecosystem/app -->
|
| 57 |
+
|
| 58 |
+
[More Information Needed]
|
| 59 |
+
|
| 60 |
+
### Out-of-Scope Use
|
| 61 |
+
|
| 62 |
+
<!-- This section addresses misuse, malicious use, and uses that the model will not work well for. -->
|
| 63 |
+
|
| 64 |
+
[More Information Needed]
|
| 65 |
+
|
| 66 |
+
## Bias, Risks, and Limitations
|
| 67 |
+
|
| 68 |
+
<!-- This section is meant to convey both technical and sociotechnical limitations. -->
|
| 69 |
+
|
| 70 |
+
[More Information Needed]
|
| 71 |
+
|
| 72 |
+
### Recommendations
|
| 73 |
+
|
| 74 |
+
<!-- This section is meant to convey recommendations with respect to the bias, risk, and technical limitations. -->
|
| 75 |
+
|
| 76 |
+
Users (both direct and downstream) should be made aware of the risks, biases and limitations of the model. More information needed for further recommendations.
|
| 77 |
+
|
| 78 |
+
## How to Get Started with the Model
|
| 79 |
+
|
| 80 |
+
Use the code below to get started with the model.
|
| 81 |
+
|
| 82 |
+
[More Information Needed]
|
| 83 |
+
|
| 84 |
+
## Training Details
|
| 85 |
+
|
| 86 |
+
### Training Data
|
| 87 |
+
|
| 88 |
+
<!-- This should link to a Dataset Card, perhaps with a short stub of information on what the training data is all about as well as documentation related to data pre-processing or additional filtering. -->
|
| 89 |
+
|
| 90 |
+
[More Information Needed]
|
| 91 |
+
|
| 92 |
+
### Training Procedure
|
| 93 |
+
|
| 94 |
+
<!-- This relates heavily to the Technical Specifications. Content here should link to that section when it is relevant to the training procedure. -->
|
| 95 |
+
|
| 96 |
+
#### Preprocessing [optional]
|
| 97 |
+
|
| 98 |
+
[More Information Needed]
|
| 99 |
+
|
| 100 |
+
|
| 101 |
+
#### Training Hyperparameters
|
| 102 |
+
|
| 103 |
+
- **Training regime:** [More Information Needed] <!--fp32, fp16 mixed precision, bf16 mixed precision, bf16 non-mixed precision, fp16 non-mixed precision, fp8 mixed precision -->
|
| 104 |
+
|
| 105 |
+
#### Speeds, Sizes, Times [optional]
|
| 106 |
+
|
| 107 |
+
<!-- This section provides information about throughput, start/end time, checkpoint size if relevant, etc. -->
|
| 108 |
+
|
| 109 |
+
[More Information Needed]
|
| 110 |
+
|
| 111 |
+
## Evaluation
|
| 112 |
+
|
| 113 |
+
<!-- This section describes the evaluation protocols and provides the results. -->
|
| 114 |
+
|
| 115 |
+
### Testing Data, Factors & Metrics
|
| 116 |
+
|
| 117 |
+
#### Testing Data
|
| 118 |
+
|
| 119 |
+
<!-- This should link to a Dataset Card if possible. -->
|
| 120 |
+
|
| 121 |
+
[More Information Needed]
|
| 122 |
+
|
| 123 |
+
#### Factors
|
| 124 |
+
|
| 125 |
+
<!-- These are the things the evaluation is disaggregating by, e.g., subpopulations or domains. -->
|
| 126 |
+
|
| 127 |
+
[More Information Needed]
|
| 128 |
+
|
| 129 |
+
#### Metrics
|
| 130 |
+
|
| 131 |
+
<!-- These are the evaluation metrics being used, ideally with a description of why. -->
|
| 132 |
+
|
| 133 |
+
[More Information Needed]
|
| 134 |
+
|
| 135 |
+
### Results
|
| 136 |
+
|
| 137 |
+
[More Information Needed]
|
| 138 |
+
|
| 139 |
+
#### Summary
|
| 140 |
+
|
| 141 |
+
|
| 142 |
+
|
| 143 |
+
## Model Examination [optional]
|
| 144 |
+
|
| 145 |
+
<!-- Relevant interpretability work for the model goes here -->
|
| 146 |
+
|
| 147 |
+
[More Information Needed]
|
| 148 |
+
|
| 149 |
+
## Environmental Impact
|
| 150 |
+
|
| 151 |
+
<!-- Total emissions (in grams of CO2eq) and additional considerations, such as electricity usage, go here. Edit the suggested text below accordingly -->
|
| 152 |
+
|
| 153 |
+
Carbon emissions can be estimated using the [Machine Learning Impact calculator](https://mlco2.github.io/impact#compute) presented in [Lacoste et al. (2019)](https://arxiv.org/abs/1910.09700).
|
| 154 |
+
|
| 155 |
+
- **Hardware Type:** [More Information Needed]
|
| 156 |
+
- **Hours used:** [More Information Needed]
|
| 157 |
+
- **Cloud Provider:** [More Information Needed]
|
| 158 |
+
- **Compute Region:** [More Information Needed]
|
| 159 |
+
- **Carbon Emitted:** [More Information Needed]
|
| 160 |
+
|
| 161 |
+
## Technical Specifications [optional]
|
| 162 |
+
|
| 163 |
+
### Model Architecture and Objective
|
| 164 |
+
|
| 165 |
+
[More Information Needed]
|
| 166 |
+
|
| 167 |
+
### Compute Infrastructure
|
| 168 |
+
|
| 169 |
+
[More Information Needed]
|
| 170 |
+
|
| 171 |
+
#### Hardware
|
| 172 |
+
|
| 173 |
+
[More Information Needed]
|
| 174 |
+
|
| 175 |
+
#### Software
|
| 176 |
+
|
| 177 |
+
[More Information Needed]
|
| 178 |
+
|
| 179 |
+
## Citation [optional]
|
| 180 |
+
|
| 181 |
+
<!-- If there is a paper or blog post introducing the model, the APA and Bibtex information for that should go in this section. -->
|
| 182 |
+
|
| 183 |
+
**BibTeX:**
|
| 184 |
+
|
| 185 |
+
[More Information Needed]
|
| 186 |
+
|
| 187 |
+
**APA:**
|
| 188 |
+
|
| 189 |
+
[More Information Needed]
|
| 190 |
+
|
| 191 |
+
## Glossary [optional]
|
| 192 |
+
|
| 193 |
+
<!-- If relevant, include terms and calculations in this section that can help readers understand the model or model card. -->
|
| 194 |
+
|
| 195 |
+
[More Information Needed]
|
| 196 |
+
|
| 197 |
+
## More Information [optional]
|
| 198 |
+
|
| 199 |
+
[More Information Needed]
|
| 200 |
+
|
| 201 |
+
## Model Card Authors [optional]
|
| 202 |
+
|
| 203 |
+
[More Information Needed]
|
| 204 |
+
|
| 205 |
+
## Model Card Contact
|
| 206 |
+
|
| 207 |
+
[More Information Needed]
|
| 208 |
+
### Framework versions
|
| 209 |
+
|
| 210 |
+
- PEFT 0.18.1
|
checkpoint-770/adapter_config.json
ADDED
|
@@ -0,0 +1,42 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
{
|
| 2 |
+
"alora_invocation_tokens": null,
|
| 3 |
+
"alpha_pattern": {},
|
| 4 |
+
"arrow_config": null,
|
| 5 |
+
"auto_mapping": {
|
| 6 |
+
"base_model_class": "Qwen3_5ForConditionalGeneration",
|
| 7 |
+
"parent_library": "transformers.models.qwen3_5.modeling_qwen3_5",
|
| 8 |
+
"unsloth_fixed": true
|
| 9 |
+
},
|
| 10 |
+
"base_model_name_or_path": "Qwen/Qwen3.5-9B",
|
| 11 |
+
"bias": "none",
|
| 12 |
+
"corda_config": null,
|
| 13 |
+
"ensure_weight_tying": false,
|
| 14 |
+
"eva_config": null,
|
| 15 |
+
"exclude_modules": null,
|
| 16 |
+
"fan_in_fan_out": false,
|
| 17 |
+
"inference_mode": true,
|
| 18 |
+
"init_lora_weights": true,
|
| 19 |
+
"layer_replication": null,
|
| 20 |
+
"layers_pattern": null,
|
| 21 |
+
"layers_to_transform": null,
|
| 22 |
+
"loftq_config": {},
|
| 23 |
+
"lora_alpha": 16,
|
| 24 |
+
"lora_bias": false,
|
| 25 |
+
"lora_dropout": 0,
|
| 26 |
+
"megatron_config": null,
|
| 27 |
+
"megatron_core": "megatron.core",
|
| 28 |
+
"modules_to_save": null,
|
| 29 |
+
"peft_type": "LORA",
|
| 30 |
+
"peft_version": "0.18.1",
|
| 31 |
+
"qalora_group_size": 16,
|
| 32 |
+
"r": 16,
|
| 33 |
+
"rank_pattern": {},
|
| 34 |
+
"revision": null,
|
| 35 |
+
"target_modules": "(?:.*?(?:language|text).*?(?:self_attn|attention|attn|mlp|feed_forward|ffn|dense).*?(?:qkv|proj|linear_fc1|linear_fc2|out_proj|in_proj_qkv|in_proj_z|in_proj_b|in_proj_a|gate_proj|up_proj|down_proj|q_proj|k_proj|v_proj|o_proj).*?)|(?:\\bmodel\\.layers\\.[\\d]{1,}\\.(?:self_attn|attention|attn|mlp|feed_forward|ffn|dense)\\.(?:(?:qkv|proj|linear_fc1|linear_fc2|out_proj|in_proj_qkv|in_proj_z|in_proj_b|in_proj_a|gate_proj|up_proj|down_proj|q_proj|k_proj|v_proj|o_proj)))",
|
| 36 |
+
"target_parameters": null,
|
| 37 |
+
"task_type": "CAUSAL_LM",
|
| 38 |
+
"trainable_token_indices": null,
|
| 39 |
+
"use_dora": false,
|
| 40 |
+
"use_qalora": false,
|
| 41 |
+
"use_rslora": false
|
| 42 |
+
}
|
checkpoint-770/adapter_model.safetensors
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:8dc94603f0c6e625c9716499f91c5acf38deff4596e0ed2ca5fc3a4f5126806c
|
| 3 |
+
size 173188512
|
checkpoint-770/chat_template.jinja
ADDED
|
@@ -0,0 +1,154 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
{%- set image_count = namespace(value=0) %}
|
| 2 |
+
{%- set video_count = namespace(value=0) %}
|
| 3 |
+
{%- macro render_content(content, do_vision_count, is_system_content=false) %}
|
| 4 |
+
{%- if content is string %}
|
| 5 |
+
{{- content }}
|
| 6 |
+
{%- elif content is iterable and content is not mapping %}
|
| 7 |
+
{%- for item in content %}
|
| 8 |
+
{%- if 'image' in item or 'image_url' in item or item.type == 'image' %}
|
| 9 |
+
{%- if is_system_content %}
|
| 10 |
+
{{- raise_exception('System message cannot contain images.') }}
|
| 11 |
+
{%- endif %}
|
| 12 |
+
{%- if do_vision_count %}
|
| 13 |
+
{%- set image_count.value = image_count.value + 1 %}
|
| 14 |
+
{%- endif %}
|
| 15 |
+
{%- if add_vision_id %}
|
| 16 |
+
{{- 'Picture ' ~ image_count.value ~ ': ' }}
|
| 17 |
+
{%- endif %}
|
| 18 |
+
{{- '<|vision_start|><|image_pad|><|vision_end|>' }}
|
| 19 |
+
{%- elif 'video' in item or item.type == 'video' %}
|
| 20 |
+
{%- if is_system_content %}
|
| 21 |
+
{{- raise_exception('System message cannot contain videos.') }}
|
| 22 |
+
{%- endif %}
|
| 23 |
+
{%- if do_vision_count %}
|
| 24 |
+
{%- set video_count.value = video_count.value + 1 %}
|
| 25 |
+
{%- endif %}
|
| 26 |
+
{%- if add_vision_id %}
|
| 27 |
+
{{- 'Video ' ~ video_count.value ~ ': ' }}
|
| 28 |
+
{%- endif %}
|
| 29 |
+
{{- '<|vision_start|><|video_pad|><|vision_end|>' }}
|
| 30 |
+
{%- elif 'text' in item %}
|
| 31 |
+
{{- item.text }}
|
| 32 |
+
{%- else %}
|
| 33 |
+
{{- raise_exception('Unexpected item type in content.') }}
|
| 34 |
+
{%- endif %}
|
| 35 |
+
{%- endfor %}
|
| 36 |
+
{%- elif content is none or content is undefined %}
|
| 37 |
+
{{- '' }}
|
| 38 |
+
{%- else %}
|
| 39 |
+
{{- raise_exception('Unexpected content type.') }}
|
| 40 |
+
{%- endif %}
|
| 41 |
+
{%- endmacro %}
|
| 42 |
+
{%- if not messages %}
|
| 43 |
+
{{- raise_exception('No messages provided.') }}
|
| 44 |
+
{%- endif %}
|
| 45 |
+
{%- if tools and tools is iterable and tools is not mapping %}
|
| 46 |
+
{{- '<|im_start|>system\n' }}
|
| 47 |
+
{{- "# Tools\n\nYou have access to the following functions:\n\n<tools>" }}
|
| 48 |
+
{%- for tool in tools %}
|
| 49 |
+
{{- "\n" }}
|
| 50 |
+
{{- tool | tojson }}
|
| 51 |
+
{%- endfor %}
|
| 52 |
+
{{- "\n</tools>" }}
|
| 53 |
+
{{- '\n\nIf you choose to call a function ONLY reply in the following format with NO suffix:\n\n<tool_call>\n<function=example_function_name>\n<parameter=example_parameter_1>\nvalue_1\n</parameter>\n<parameter=example_parameter_2>\nThis is the value for the second parameter\nthat can span\nmultiple lines\n</parameter>\n</function>\n</tool_call>\n\n<IMPORTANT>\nReminder:\n- Function calls MUST follow the specified format: an inner <function=...></function> block must be nested within <tool_call></tool_call> XML tags\n- Required parameters MUST be specified\n- You may provide optional reasoning for your function call in natural language BEFORE the function call, but NOT after\n- If there is no function call available, answer the question like normal with your current knowledge and do not tell the user about function calls\n</IMPORTANT>' }}
|
| 54 |
+
{%- if messages[0].role == 'system' %}
|
| 55 |
+
{%- set content = render_content(messages[0].content, false, true)|trim %}
|
| 56 |
+
{%- if content %}
|
| 57 |
+
{{- '\n\n' + content }}
|
| 58 |
+
{%- endif %}
|
| 59 |
+
{%- endif %}
|
| 60 |
+
{{- '<|im_end|>\n' }}
|
| 61 |
+
{%- else %}
|
| 62 |
+
{%- if messages[0].role == 'system' %}
|
| 63 |
+
{%- set content = render_content(messages[0].content, false, true)|trim %}
|
| 64 |
+
{{- '<|im_start|>system\n' + content + '<|im_end|>\n' }}
|
| 65 |
+
{%- endif %}
|
| 66 |
+
{%- endif %}
|
| 67 |
+
{%- set ns = namespace(multi_step_tool=true, last_query_index=messages|length - 1) %}
|
| 68 |
+
{%- for message in messages[::-1] %}
|
| 69 |
+
{%- set index = (messages|length - 1) - loop.index0 %}
|
| 70 |
+
{%- if ns.multi_step_tool and message.role == "user" %}
|
| 71 |
+
{%- set content = render_content(message.content, false)|trim %}
|
| 72 |
+
{%- if not(content.startswith('<tool_response>') and content.endswith('</tool_response>')) %}
|
| 73 |
+
{%- set ns.multi_step_tool = false %}
|
| 74 |
+
{%- set ns.last_query_index = index %}
|
| 75 |
+
{%- endif %}
|
| 76 |
+
{%- endif %}
|
| 77 |
+
{%- endfor %}
|
| 78 |
+
{%- if ns.multi_step_tool %}
|
| 79 |
+
{{- raise_exception('No user query found in messages.') }}
|
| 80 |
+
{%- endif %}
|
| 81 |
+
{%- for message in messages %}
|
| 82 |
+
{%- set content = render_content(message.content, true)|trim %}
|
| 83 |
+
{%- if message.role == "system" %}
|
| 84 |
+
{%- if not loop.first %}
|
| 85 |
+
{{- raise_exception('System message must be at the beginning.') }}
|
| 86 |
+
{%- endif %}
|
| 87 |
+
{%- elif message.role == "user" %}
|
| 88 |
+
{{- '<|im_start|>' + message.role + '\n' + content + '<|im_end|>' + '\n' }}
|
| 89 |
+
{%- elif message.role == "assistant" %}
|
| 90 |
+
{%- set reasoning_content = '' %}
|
| 91 |
+
{%- if message.reasoning_content is string %}
|
| 92 |
+
{%- set reasoning_content = message.reasoning_content %}
|
| 93 |
+
{%- else %}
|
| 94 |
+
{%- if '</think>' in content %}
|
| 95 |
+
{%- set reasoning_content = content.split('</think>')[0].rstrip('\n').split('<think>')[-1].lstrip('\n') %}
|
| 96 |
+
{%- set content = content.split('</think>')[-1].lstrip('\n') %}
|
| 97 |
+
{%- endif %}
|
| 98 |
+
{%- endif %}
|
| 99 |
+
{%- set reasoning_content = reasoning_content|trim %}
|
| 100 |
+
{%- if loop.index0 > ns.last_query_index %}
|
| 101 |
+
{{- '<|im_start|>' + message.role + '\n<think>\n' + reasoning_content + '\n</think>\n\n' + content }}
|
| 102 |
+
{%- else %}
|
| 103 |
+
{{- '<|im_start|>' + message.role + '\n' + content }}
|
| 104 |
+
{%- endif %}
|
| 105 |
+
{%- if message.tool_calls and message.tool_calls is iterable and message.tool_calls is not mapping %}
|
| 106 |
+
{%- for tool_call in message.tool_calls %}
|
| 107 |
+
{%- if tool_call.function is defined %}
|
| 108 |
+
{%- set tool_call = tool_call.function %}
|
| 109 |
+
{%- endif %}
|
| 110 |
+
{%- if loop.first %}
|
| 111 |
+
{%- if content|trim %}
|
| 112 |
+
{{- '\n\n<tool_call>\n<function=' + tool_call.name + '>\n' }}
|
| 113 |
+
{%- else %}
|
| 114 |
+
{{- '<tool_call>\n<function=' + tool_call.name + '>\n' }}
|
| 115 |
+
{%- endif %}
|
| 116 |
+
{%- else %}
|
| 117 |
+
{{- '\n<tool_call>\n<function=' + tool_call.name + '>\n' }}
|
| 118 |
+
{%- endif %}
|
| 119 |
+
{%- if tool_call.arguments is defined %}
|
| 120 |
+
{%- for args_name, args_value in tool_call.arguments|items %}
|
| 121 |
+
{{- '<parameter=' + args_name + '>\n' }}
|
| 122 |
+
{%- set args_value = args_value | tojson | safe if args_value is mapping or (args_value is sequence and args_value is not string) else args_value | string %}
|
| 123 |
+
{{- args_value }}
|
| 124 |
+
{{- '\n</parameter>\n' }}
|
| 125 |
+
{%- endfor %}
|
| 126 |
+
{%- endif %}
|
| 127 |
+
{{- '</function>\n</tool_call>' }}
|
| 128 |
+
{%- endfor %}
|
| 129 |
+
{%- endif %}
|
| 130 |
+
{{- '<|im_end|>\n' }}
|
| 131 |
+
{%- elif message.role == "tool" %}
|
| 132 |
+
{%- if loop.previtem and loop.previtem.role != "tool" %}
|
| 133 |
+
{{- '<|im_start|>user' }}
|
| 134 |
+
{%- endif %}
|
| 135 |
+
{{- '\n<tool_response>\n' }}
|
| 136 |
+
{{- content }}
|
| 137 |
+
{{- '\n</tool_response>' }}
|
| 138 |
+
{%- if not loop.last and loop.nextitem.role != "tool" %}
|
| 139 |
+
{{- '<|im_end|>\n' }}
|
| 140 |
+
{%- elif loop.last %}
|
| 141 |
+
{{- '<|im_end|>\n' }}
|
| 142 |
+
{%- endif %}
|
| 143 |
+
{%- else %}
|
| 144 |
+
{{- raise_exception('Unexpected message role.') }}
|
| 145 |
+
{%- endif %}
|
| 146 |
+
{%- endfor %}
|
| 147 |
+
{%- if add_generation_prompt %}
|
| 148 |
+
{{- '<|im_start|>assistant\n' }}
|
| 149 |
+
{%- if enable_thinking is defined and enable_thinking is false %}
|
| 150 |
+
{{- '<think>\n\n</think>\n\n' }}
|
| 151 |
+
{%- else %}
|
| 152 |
+
{{- '<think>\n' }}
|
| 153 |
+
{%- endif %}
|
| 154 |
+
{%- endif %}
|
checkpoint-770/optimizer.pt
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:b589081ecc7eb3fc8ca1cffe8dc0cf8b74293cd27dbc861e9aa0caa6e15bfac3
|
| 3 |
+
size 88617029
|
checkpoint-770/processor_config.json
ADDED
|
@@ -0,0 +1,63 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
{
|
| 2 |
+
"image_processor": {
|
| 3 |
+
"data_format": "channels_first",
|
| 4 |
+
"do_convert_rgb": true,
|
| 5 |
+
"do_normalize": true,
|
| 6 |
+
"do_rescale": true,
|
| 7 |
+
"do_resize": true,
|
| 8 |
+
"image_mean": [
|
| 9 |
+
0.5,
|
| 10 |
+
0.5,
|
| 11 |
+
0.5
|
| 12 |
+
],
|
| 13 |
+
"image_processor_type": "Qwen2VLImageProcessorFast",
|
| 14 |
+
"image_std": [
|
| 15 |
+
0.5,
|
| 16 |
+
0.5,
|
| 17 |
+
0.5
|
| 18 |
+
],
|
| 19 |
+
"merge_size": 2,
|
| 20 |
+
"patch_size": 16,
|
| 21 |
+
"resample": 3,
|
| 22 |
+
"rescale_factor": 0.00392156862745098,
|
| 23 |
+
"size": {
|
| 24 |
+
"longest_edge": 16777216,
|
| 25 |
+
"shortest_edge": 65536
|
| 26 |
+
},
|
| 27 |
+
"temporal_patch_size": 2
|
| 28 |
+
},
|
| 29 |
+
"processor_class": "Qwen3VLProcessor",
|
| 30 |
+
"video_processor": {
|
| 31 |
+
"data_format": "channels_first",
|
| 32 |
+
"default_to_square": true,
|
| 33 |
+
"do_convert_rgb": true,
|
| 34 |
+
"do_normalize": true,
|
| 35 |
+
"do_rescale": true,
|
| 36 |
+
"do_resize": true,
|
| 37 |
+
"do_sample_frames": true,
|
| 38 |
+
"fps": 2,
|
| 39 |
+
"image_mean": [
|
| 40 |
+
0.5,
|
| 41 |
+
0.5,
|
| 42 |
+
0.5
|
| 43 |
+
],
|
| 44 |
+
"image_std": [
|
| 45 |
+
0.5,
|
| 46 |
+
0.5,
|
| 47 |
+
0.5
|
| 48 |
+
],
|
| 49 |
+
"max_frames": 768,
|
| 50 |
+
"merge_size": 2,
|
| 51 |
+
"min_frames": 4,
|
| 52 |
+
"patch_size": 16,
|
| 53 |
+
"resample": 3,
|
| 54 |
+
"rescale_factor": 0.00392156862745098,
|
| 55 |
+
"return_metadata": false,
|
| 56 |
+
"size": {
|
| 57 |
+
"longest_edge": 25165824,
|
| 58 |
+
"shortest_edge": 4096
|
| 59 |
+
},
|
| 60 |
+
"temporal_patch_size": 2,
|
| 61 |
+
"video_processor_type": "Qwen3VLVideoProcessor"
|
| 62 |
+
}
|
| 63 |
+
}
|
checkpoint-770/rng_state.pth
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:2922886dc37f9211a4affea61093cbe4db90c0a37e91e7edac63ec0cf7b13d45
|
| 3 |
+
size 14645
|
checkpoint-770/scheduler.pt
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:6842476510ef1a339b059738a5616f5fe7454531bf7f4f3bc53954af85a4a7f1
|
| 3 |
+
size 1465
|
checkpoint-770/tokenizer.json
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:263dcc3feef53d558a357d52941ff3649fa9cd9a3199934376f2bbf615d49ffc
|
| 3 |
+
size 19989610
|
checkpoint-770/tokenizer_config.json
ADDED
|
@@ -0,0 +1,33 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
{
|
| 2 |
+
"add_prefix_space": false,
|
| 3 |
+
"audio_bos_token": "<|audio_start|>",
|
| 4 |
+
"audio_eos_token": "<|audio_end|>",
|
| 5 |
+
"audio_token": "<|audio_pad|>",
|
| 6 |
+
"backend": "tokenizers",
|
| 7 |
+
"bos_token": null,
|
| 8 |
+
"clean_up_tokenization_spaces": false,
|
| 9 |
+
"eos_token": "<|im_end|>",
|
| 10 |
+
"errors": "replace",
|
| 11 |
+
"image_token": "<|image_pad|>",
|
| 12 |
+
"is_local": false,
|
| 13 |
+
"model_max_length": 262144,
|
| 14 |
+
"model_specific_special_tokens": {
|
| 15 |
+
"audio_bos_token": "<|audio_start|>",
|
| 16 |
+
"audio_eos_token": "<|audio_end|>",
|
| 17 |
+
"audio_token": "<|audio_pad|>",
|
| 18 |
+
"image_token": "<|image_pad|>",
|
| 19 |
+
"video_token": "<|video_pad|>",
|
| 20 |
+
"vision_bos_token": "<|vision_start|>",
|
| 21 |
+
"vision_eos_token": "<|vision_end|>"
|
| 22 |
+
},
|
| 23 |
+
"pad_token": "<|endoftext|>",
|
| 24 |
+
"padding_side": "right",
|
| 25 |
+
"pretokenize_regex": "(?i:'s|'t|'re|'ve|'m|'ll|'d)|[^\\r\\n\\p{L}\\p{N}]?[\\p{L}\\p{M}]+|\\p{N}| ?[^\\s\\p{L}\\p{M}\\p{N}]+[\\r\\n]*|\\s*[\\r\\n]+|\\s+(?!\\S)|\\s+",
|
| 26 |
+
"processor_class": "Qwen3VLProcessor",
|
| 27 |
+
"split_special_tokens": false,
|
| 28 |
+
"tokenizer_class": "TokenizersBackend",
|
| 29 |
+
"unk_token": null,
|
| 30 |
+
"video_token": "<|video_pad|>",
|
| 31 |
+
"vision_bos_token": "<|vision_start|>",
|
| 32 |
+
"vision_eos_token": "<|vision_end|>"
|
| 33 |
+
}
|
checkpoint-770/trainer_state.json
ADDED
|
The diff for this file is too large to render.
See raw diff
|
|
|
checkpoint-770/training_args.bin
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:3feb7d84776eed4718f792285c52122bc3b2372e4e090380a285a8afc9196989
|
| 3 |
+
size 5713
|
eval.json
ADDED
|
@@ -0,0 +1,601 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
{
|
| 2 |
+
"checkpoint": "outputs/checkpoint-770",
|
| 3 |
+
"num_samples": 98,
|
| 4 |
+
"retrieval_similarity": 0.7239,
|
| 5 |
+
"tIOU": 0.67,
|
| 6 |
+
"mAP_0.5": 0.5092,
|
| 7 |
+
"sim_pass": true,
|
| 8 |
+
"tiou_pass": true,
|
| 9 |
+
"map_pass": true,
|
| 10 |
+
"overall_pass": true,
|
| 11 |
+
"per_sample": [
|
| 12 |
+
{
|
| 13 |
+
"idx": 0,
|
| 14 |
+
"retrieval_sim": 0.6549,
|
| 15 |
+
"tIOU": 0.5277,
|
| 16 |
+
"mAP": 0.45
|
| 17 |
+
},
|
| 18 |
+
{
|
| 19 |
+
"idx": 1,
|
| 20 |
+
"retrieval_sim": 0.7739,
|
| 21 |
+
"tIOU": 0.808,
|
| 22 |
+
"mAP": 1.0
|
| 23 |
+
},
|
| 24 |
+
{
|
| 25 |
+
"idx": 2,
|
| 26 |
+
"retrieval_sim": 0.6433,
|
| 27 |
+
"tIOU": 1.0,
|
| 28 |
+
"mAP": 1.0
|
| 29 |
+
},
|
| 30 |
+
{
|
| 31 |
+
"idx": 3,
|
| 32 |
+
"retrieval_sim": 0.7473,
|
| 33 |
+
"tIOU": 0.6228,
|
| 34 |
+
"mAP": 0.45
|
| 35 |
+
},
|
| 36 |
+
{
|
| 37 |
+
"idx": 4,
|
| 38 |
+
"retrieval_sim": 0.7774,
|
| 39 |
+
"tIOU": 0.5406,
|
| 40 |
+
"mAP": 0.25
|
| 41 |
+
},
|
| 42 |
+
{
|
| 43 |
+
"idx": 5,
|
| 44 |
+
"retrieval_sim": 0.7924,
|
| 45 |
+
"tIOU": 0.3868,
|
| 46 |
+
"mAP": 0.05
|
| 47 |
+
},
|
| 48 |
+
{
|
| 49 |
+
"idx": 6,
|
| 50 |
+
"retrieval_sim": 0.7626,
|
| 51 |
+
"tIOU": 0.7779,
|
| 52 |
+
"mAP": 0.75
|
| 53 |
+
},
|
| 54 |
+
{
|
| 55 |
+
"idx": 7,
|
| 56 |
+
"retrieval_sim": 0.6476,
|
| 57 |
+
"tIOU": 0.806,
|
| 58 |
+
"mAP": 0.75
|
| 59 |
+
},
|
| 60 |
+
{
|
| 61 |
+
"idx": 8,
|
| 62 |
+
"retrieval_sim": 0.7355,
|
| 63 |
+
"tIOU": 0.752,
|
| 64 |
+
"mAP": 0.64
|
| 65 |
+
},
|
| 66 |
+
{
|
| 67 |
+
"idx": 9,
|
| 68 |
+
"retrieval_sim": 0.8859,
|
| 69 |
+
"tIOU": 0.6579,
|
| 70 |
+
"mAP": 0.5625
|
| 71 |
+
},
|
| 72 |
+
{
|
| 73 |
+
"idx": 10,
|
| 74 |
+
"retrieval_sim": 0.7486,
|
| 75 |
+
"tIOU": 0.7134,
|
| 76 |
+
"mAP": 0.8
|
| 77 |
+
},
|
| 78 |
+
{
|
| 79 |
+
"idx": 11,
|
| 80 |
+
"retrieval_sim": 0.6805,
|
| 81 |
+
"tIOU": 0.5,
|
| 82 |
+
"mAP": 0.2
|
| 83 |
+
},
|
| 84 |
+
{
|
| 85 |
+
"idx": 12,
|
| 86 |
+
"retrieval_sim": 0.7698,
|
| 87 |
+
"tIOU": 0.7164,
|
| 88 |
+
"mAP": 0.64
|
| 89 |
+
},
|
| 90 |
+
{
|
| 91 |
+
"idx": 13,
|
| 92 |
+
"retrieval_sim": 0.795,
|
| 93 |
+
"tIOU": 0.5923,
|
| 94 |
+
"mAP": 0.25
|
| 95 |
+
},
|
| 96 |
+
{
|
| 97 |
+
"idx": 14,
|
| 98 |
+
"retrieval_sim": 0.586,
|
| 99 |
+
"tIOU": 0.397,
|
| 100 |
+
"mAP": 0.2
|
| 101 |
+
},
|
| 102 |
+
{
|
| 103 |
+
"idx": 15,
|
| 104 |
+
"retrieval_sim": 0.5982,
|
| 105 |
+
"tIOU": 0.7678,
|
| 106 |
+
"mAP": 0.45
|
| 107 |
+
},
|
| 108 |
+
{
|
| 109 |
+
"idx": 16,
|
| 110 |
+
"retrieval_sim": 0.7116,
|
| 111 |
+
"tIOU": 0.5205,
|
| 112 |
+
"mAP": 0.4444
|
| 113 |
+
},
|
| 114 |
+
{
|
| 115 |
+
"idx": 17,
|
| 116 |
+
"retrieval_sim": 0.6879,
|
| 117 |
+
"tIOU": 0.3502,
|
| 118 |
+
"mAP": 0.0833
|
| 119 |
+
},
|
| 120 |
+
{
|
| 121 |
+
"idx": 18,
|
| 122 |
+
"retrieval_sim": 0.7088,
|
| 123 |
+
"tIOU": 0.75,
|
| 124 |
+
"mAP": 0.75
|
| 125 |
+
},
|
| 126 |
+
{
|
| 127 |
+
"idx": 19,
|
| 128 |
+
"retrieval_sim": 0.5611,
|
| 129 |
+
"tIOU": 0.7193,
|
| 130 |
+
"mAP": 0.75
|
| 131 |
+
},
|
| 132 |
+
{
|
| 133 |
+
"idx": 20,
|
| 134 |
+
"retrieval_sim": 0.5881,
|
| 135 |
+
"tIOU": 0.6111,
|
| 136 |
+
"mAP": 0.3333
|
| 137 |
+
},
|
| 138 |
+
{
|
| 139 |
+
"idx": 21,
|
| 140 |
+
"retrieval_sim": 0.7646,
|
| 141 |
+
"tIOU": 0.8172,
|
| 142 |
+
"mAP": 1.0
|
| 143 |
+
},
|
| 144 |
+
{
|
| 145 |
+
"idx": 22,
|
| 146 |
+
"retrieval_sim": 0.6744,
|
| 147 |
+
"tIOU": 1.0,
|
| 148 |
+
"mAP": 1.0
|
| 149 |
+
},
|
| 150 |
+
{
|
| 151 |
+
"idx": 23,
|
| 152 |
+
"retrieval_sim": 0.6437,
|
| 153 |
+
"tIOU": 0.7193,
|
| 154 |
+
"mAP": 0.6
|
| 155 |
+
},
|
| 156 |
+
{
|
| 157 |
+
"idx": 24,
|
| 158 |
+
"retrieval_sim": 0.6583,
|
| 159 |
+
"tIOU": 0.7193,
|
| 160 |
+
"mAP": 0.6
|
| 161 |
+
},
|
| 162 |
+
{
|
| 163 |
+
"idx": 25,
|
| 164 |
+
"retrieval_sim": 0.5824,
|
| 165 |
+
"tIOU": 0.0227,
|
| 166 |
+
"mAP": 0.0
|
| 167 |
+
},
|
| 168 |
+
{
|
| 169 |
+
"idx": 26,
|
| 170 |
+
"retrieval_sim": 0.8244,
|
| 171 |
+
"tIOU": 0.755,
|
| 172 |
+
"mAP": 0.8
|
| 173 |
+
},
|
| 174 |
+
{
|
| 175 |
+
"idx": 27,
|
| 176 |
+
"retrieval_sim": 0.7577,
|
| 177 |
+
"tIOU": 0.5731,
|
| 178 |
+
"mAP": 0.2667
|
| 179 |
+
},
|
| 180 |
+
{
|
| 181 |
+
"idx": 28,
|
| 182 |
+
"retrieval_sim": 0.6997,
|
| 183 |
+
"tIOU": 0.656,
|
| 184 |
+
"mAP": 0.8
|
| 185 |
+
},
|
| 186 |
+
{
|
| 187 |
+
"idx": 29,
|
| 188 |
+
"retrieval_sim": 0.7294,
|
| 189 |
+
"tIOU": 0.8276,
|
| 190 |
+
"mAP": 0.64
|
| 191 |
+
},
|
| 192 |
+
{
|
| 193 |
+
"idx": 30,
|
| 194 |
+
"retrieval_sim": 0.6245,
|
| 195 |
+
"tIOU": 0.5177,
|
| 196 |
+
"mAP": 0.3333
|
| 197 |
+
},
|
| 198 |
+
{
|
| 199 |
+
"idx": 31,
|
| 200 |
+
"retrieval_sim": 0.7857,
|
| 201 |
+
"tIOU": 1.0,
|
| 202 |
+
"mAP": 1.0
|
| 203 |
+
},
|
| 204 |
+
{
|
| 205 |
+
"idx": 32,
|
| 206 |
+
"retrieval_sim": 0.9162,
|
| 207 |
+
"tIOU": 0.3067,
|
| 208 |
+
"mAP": 0.1111
|
| 209 |
+
},
|
| 210 |
+
{
|
| 211 |
+
"idx": 33,
|
| 212 |
+
"retrieval_sim": 0.7914,
|
| 213 |
+
"tIOU": 0.4313,
|
| 214 |
+
"mAP": 0.0833
|
| 215 |
+
},
|
| 216 |
+
{
|
| 217 |
+
"idx": 34,
|
| 218 |
+
"retrieval_sim": 0.808,
|
| 219 |
+
"tIOU": 0.5406,
|
| 220 |
+
"mAP": 0.25
|
| 221 |
+
},
|
| 222 |
+
{
|
| 223 |
+
"idx": 35,
|
| 224 |
+
"retrieval_sim": 0.6768,
|
| 225 |
+
"tIOU": 0.7678,
|
| 226 |
+
"mAP": 0.45
|
| 227 |
+
},
|
| 228 |
+
{
|
| 229 |
+
"idx": 36,
|
| 230 |
+
"retrieval_sim": 0.7682,
|
| 231 |
+
"tIOU": 0.604,
|
| 232 |
+
"mAP": 0.64
|
| 233 |
+
},
|
| 234 |
+
{
|
| 235 |
+
"idx": 37,
|
| 236 |
+
"retrieval_sim": 0.8046,
|
| 237 |
+
"tIOU": 1.0,
|
| 238 |
+
"mAP": 1.0
|
| 239 |
+
},
|
| 240 |
+
{
|
| 241 |
+
"idx": 38,
|
| 242 |
+
"retrieval_sim": 0.8366,
|
| 243 |
+
"tIOU": 0.3989,
|
| 244 |
+
"mAP": 0.2
|
| 245 |
+
},
|
| 246 |
+
{
|
| 247 |
+
"idx": 39,
|
| 248 |
+
"retrieval_sim": 0.7443,
|
| 249 |
+
"tIOU": 0.5977,
|
| 250 |
+
"mAP": 0.3333
|
| 251 |
+
},
|
| 252 |
+
{
|
| 253 |
+
"idx": 40,
|
| 254 |
+
"retrieval_sim": 0.792,
|
| 255 |
+
"tIOU": 0.4645,
|
| 256 |
+
"mAP": 0.2667
|
| 257 |
+
},
|
| 258 |
+
{
|
| 259 |
+
"idx": 41,
|
| 260 |
+
"retrieval_sim": 0.717,
|
| 261 |
+
"tIOU": 0.8,
|
| 262 |
+
"mAP": 0.8
|
| 263 |
+
},
|
| 264 |
+
{
|
| 265 |
+
"idx": 42,
|
| 266 |
+
"retrieval_sim": 0.7654,
|
| 267 |
+
"tIOU": 0.5695,
|
| 268 |
+
"mAP": 0.3333
|
| 269 |
+
},
|
| 270 |
+
{
|
| 271 |
+
"idx": 43,
|
| 272 |
+
"retrieval_sim": 0.8456,
|
| 273 |
+
"tIOU": 0.5806,
|
| 274 |
+
"mAP": 0.2
|
| 275 |
+
},
|
| 276 |
+
{
|
| 277 |
+
"idx": 44,
|
| 278 |
+
"retrieval_sim": 0.621,
|
| 279 |
+
"tIOU": 0.6756,
|
| 280 |
+
"mAP": 0.75
|
| 281 |
+
},
|
| 282 |
+
{
|
| 283 |
+
"idx": 45,
|
| 284 |
+
"retrieval_sim": 0.5566,
|
| 285 |
+
"tIOU": 0.5743,
|
| 286 |
+
"mAP": 0.36
|
| 287 |
+
},
|
| 288 |
+
{
|
| 289 |
+
"idx": 46,
|
| 290 |
+
"retrieval_sim": 0.6792,
|
| 291 |
+
"tIOU": 0.5177,
|
| 292 |
+
"mAP": 0.2667
|
| 293 |
+
},
|
| 294 |
+
{
|
| 295 |
+
"idx": 47,
|
| 296 |
+
"retrieval_sim": 0.7737,
|
| 297 |
+
"tIOU": 0.604,
|
| 298 |
+
"mAP": 0.64
|
| 299 |
+
},
|
| 300 |
+
{
|
| 301 |
+
"idx": 48,
|
| 302 |
+
"retrieval_sim": 0.7256,
|
| 303 |
+
"tIOU": 0.6667,
|
| 304 |
+
"mAP": 0.6667
|
| 305 |
+
},
|
| 306 |
+
{
|
| 307 |
+
"idx": 49,
|
| 308 |
+
"retrieval_sim": 0.7957,
|
| 309 |
+
"tIOU": 0.7011,
|
| 310 |
+
"mAP": 1.0
|
| 311 |
+
},
|
| 312 |
+
{
|
| 313 |
+
"idx": 50,
|
| 314 |
+
"retrieval_sim": 0.7171,
|
| 315 |
+
"tIOU": 0.6695,
|
| 316 |
+
"mAP": 1.0
|
| 317 |
+
},
|
| 318 |
+
{
|
| 319 |
+
"idx": 51,
|
| 320 |
+
"retrieval_sim": 0.7459,
|
| 321 |
+
"tIOU": 0.6545,
|
| 322 |
+
"mAP": 0.2
|
| 323 |
+
},
|
| 324 |
+
{
|
| 325 |
+
"idx": 52,
|
| 326 |
+
"retrieval_sim": 0.8102,
|
| 327 |
+
"tIOU": 0.858,
|
| 328 |
+
"mAP": 0.6667
|
| 329 |
+
},
|
| 330 |
+
{
|
| 331 |
+
"idx": 53,
|
| 332 |
+
"retrieval_sim": 0.8126,
|
| 333 |
+
"tIOU": 0.7,
|
| 334 |
+
"mAP": 0.64
|
| 335 |
+
},
|
| 336 |
+
{
|
| 337 |
+
"idx": 54,
|
| 338 |
+
"retrieval_sim": 0.8128,
|
| 339 |
+
"tIOU": 0.6783,
|
| 340 |
+
"mAP": 0.64
|
| 341 |
+
},
|
| 342 |
+
{
|
| 343 |
+
"idx": 55,
|
| 344 |
+
"retrieval_sim": 0.6214,
|
| 345 |
+
"tIOU": 0.6223,
|
| 346 |
+
"mAP": 0.25
|
| 347 |
+
},
|
| 348 |
+
{
|
| 349 |
+
"idx": 56,
|
| 350 |
+
"retrieval_sim": 0.729,
|
| 351 |
+
"tIOU": 0.8333,
|
| 352 |
+
"mAP": 0.6
|
| 353 |
+
},
|
| 354 |
+
{
|
| 355 |
+
"idx": 57,
|
| 356 |
+
"retrieval_sim": 0.4982,
|
| 357 |
+
"tIOU": 0.4498,
|
| 358 |
+
"mAP": 0.2
|
| 359 |
+
},
|
| 360 |
+
{
|
| 361 |
+
"idx": 58,
|
| 362 |
+
"retrieval_sim": 0.6194,
|
| 363 |
+
"tIOU": 0.6983,
|
| 364 |
+
"mAP": 0.2
|
| 365 |
+
},
|
| 366 |
+
{
|
| 367 |
+
"idx": 59,
|
| 368 |
+
"retrieval_sim": 0.8932,
|
| 369 |
+
"tIOU": 0.4533,
|
| 370 |
+
"mAP": 0.16
|
| 371 |
+
},
|
| 372 |
+
{
|
| 373 |
+
"idx": 60,
|
| 374 |
+
"retrieval_sim": 0.8175,
|
| 375 |
+
"tIOU": 0.8333,
|
| 376 |
+
"mAP": 0.5
|
| 377 |
+
},
|
| 378 |
+
{
|
| 379 |
+
"idx": 61,
|
| 380 |
+
"retrieval_sim": 0.7364,
|
| 381 |
+
"tIOU": 1.0,
|
| 382 |
+
"mAP": 1.0
|
| 383 |
+
},
|
| 384 |
+
{
|
| 385 |
+
"idx": 62,
|
| 386 |
+
"retrieval_sim": 0.5125,
|
| 387 |
+
"tIOU": 0.6703,
|
| 388 |
+
"mAP": 0.45
|
| 389 |
+
},
|
| 390 |
+
{
|
| 391 |
+
"idx": 63,
|
| 392 |
+
"retrieval_sim": 0.7301,
|
| 393 |
+
"tIOU": 0.4913,
|
| 394 |
+
"mAP": 0.2667
|
| 395 |
+
},
|
| 396 |
+
{
|
| 397 |
+
"idx": 64,
|
| 398 |
+
"retrieval_sim": 0.8172,
|
| 399 |
+
"tIOU": 0.4682,
|
| 400 |
+
"mAP": 0.0667
|
| 401 |
+
},
|
| 402 |
+
{
|
| 403 |
+
"idx": 65,
|
| 404 |
+
"retrieval_sim": 0.6517,
|
| 405 |
+
"tIOU": 0.46,
|
| 406 |
+
"mAP": 0.2
|
| 407 |
+
},
|
| 408 |
+
{
|
| 409 |
+
"idx": 66,
|
| 410 |
+
"retrieval_sim": 0.7376,
|
| 411 |
+
"tIOU": 0.8333,
|
| 412 |
+
"mAP": 0.75
|
| 413 |
+
},
|
| 414 |
+
{
|
| 415 |
+
"idx": 67,
|
| 416 |
+
"retrieval_sim": 0.5759,
|
| 417 |
+
"tIOU": 0.7167,
|
| 418 |
+
"mAP": 0.1
|
| 419 |
+
},
|
| 420 |
+
{
|
| 421 |
+
"idx": 68,
|
| 422 |
+
"retrieval_sim": 0.609,
|
| 423 |
+
"tIOU": 0.4959,
|
| 424 |
+
"mAP": 0.0833
|
| 425 |
+
},
|
| 426 |
+
{
|
| 427 |
+
"idx": 69,
|
| 428 |
+
"retrieval_sim": 0.8242,
|
| 429 |
+
"tIOU": 0.6645,
|
| 430 |
+
"mAP": 0.5625
|
| 431 |
+
},
|
| 432 |
+
{
|
| 433 |
+
"idx": 70,
|
| 434 |
+
"retrieval_sim": 0.6911,
|
| 435 |
+
"tIOU": 0.5938,
|
| 436 |
+
"mAP": 0.2
|
| 437 |
+
},
|
| 438 |
+
{
|
| 439 |
+
"idx": 71,
|
| 440 |
+
"retrieval_sim": 0.8479,
|
| 441 |
+
"tIOU": 0.9167,
|
| 442 |
+
"mAP": 0.6667
|
| 443 |
+
},
|
| 444 |
+
{
|
| 445 |
+
"idx": 72,
|
| 446 |
+
"retrieval_sim": 0.7774,
|
| 447 |
+
"tIOU": 0.6362,
|
| 448 |
+
"mAP": 0.0833
|
| 449 |
+
},
|
| 450 |
+
{
|
| 451 |
+
"idx": 73,
|
| 452 |
+
"retrieval_sim": 0.5972,
|
| 453 |
+
"tIOU": 0.7009,
|
| 454 |
+
"mAP": 0.36
|
| 455 |
+
},
|
| 456 |
+
{
|
| 457 |
+
"idx": 74,
|
| 458 |
+
"retrieval_sim": 0.7639,
|
| 459 |
+
"tIOU": 0.6788,
|
| 460 |
+
"mAP": 0.2667
|
| 461 |
+
},
|
| 462 |
+
{
|
| 463 |
+
"idx": 75,
|
| 464 |
+
"retrieval_sim": 0.5832,
|
| 465 |
+
"tIOU": 1.0,
|
| 466 |
+
"mAP": 1.0
|
| 467 |
+
},
|
| 468 |
+
{
|
| 469 |
+
"idx": 76,
|
| 470 |
+
"retrieval_sim": 0.6452,
|
| 471 |
+
"tIOU": 0.6162,
|
| 472 |
+
"mAP": 0.3333
|
| 473 |
+
},
|
| 474 |
+
{
|
| 475 |
+
"idx": 77,
|
| 476 |
+
"retrieval_sim": 0.7192,
|
| 477 |
+
"tIOU": 0.6276,
|
| 478 |
+
"mAP": 0.45
|
| 479 |
+
},
|
| 480 |
+
{
|
| 481 |
+
"idx": 78,
|
| 482 |
+
"retrieval_sim": 0.8024,
|
| 483 |
+
"tIOU": 0.9145,
|
| 484 |
+
"mAP": 0.8
|
| 485 |
+
},
|
| 486 |
+
{
|
| 487 |
+
"idx": 79,
|
| 488 |
+
"retrieval_sim": 0.7551,
|
| 489 |
+
"tIOU": 0.88,
|
| 490 |
+
"mAP": 0.8
|
| 491 |
+
},
|
| 492 |
+
{
|
| 493 |
+
"idx": 80,
|
| 494 |
+
"retrieval_sim": 0.6141,
|
| 495 |
+
"tIOU": 0.7993,
|
| 496 |
+
"mAP": 1.0
|
| 497 |
+
},
|
| 498 |
+
{
|
| 499 |
+
"idx": 81,
|
| 500 |
+
"retrieval_sim": 0.698,
|
| 501 |
+
"tIOU": 0.7751,
|
| 502 |
+
"mAP": 0.36
|
| 503 |
+
},
|
| 504 |
+
{
|
| 505 |
+
"idx": 82,
|
| 506 |
+
"retrieval_sim": 0.7071,
|
| 507 |
+
"tIOU": 0.8,
|
| 508 |
+
"mAP": 0.8
|
| 509 |
+
},
|
| 510 |
+
{
|
| 511 |
+
"idx": 83,
|
| 512 |
+
"retrieval_sim": 0.8117,
|
| 513 |
+
"tIOU": 0.6667,
|
| 514 |
+
"mAP": 0.1
|
| 515 |
+
},
|
| 516 |
+
{
|
| 517 |
+
"idx": 84,
|
| 518 |
+
"retrieval_sim": 0.8008,
|
| 519 |
+
"tIOU": 0.856,
|
| 520 |
+
"mAP": 1.0
|
| 521 |
+
},
|
| 522 |
+
{
|
| 523 |
+
"idx": 85,
|
| 524 |
+
"retrieval_sim": 0.7408,
|
| 525 |
+
"tIOU": 0.6462,
|
| 526 |
+
"mAP": 0.45
|
| 527 |
+
},
|
| 528 |
+
{
|
| 529 |
+
"idx": 86,
|
| 530 |
+
"retrieval_sim": 0.7308,
|
| 531 |
+
"tIOU": 0.6831,
|
| 532 |
+
"mAP": 0.64
|
| 533 |
+
},
|
| 534 |
+
{
|
| 535 |
+
"idx": 87,
|
| 536 |
+
"retrieval_sim": 0.6958,
|
| 537 |
+
"tIOU": 0.7533,
|
| 538 |
+
"mAP": 0.75
|
| 539 |
+
},
|
| 540 |
+
{
|
| 541 |
+
"idx": 88,
|
| 542 |
+
"retrieval_sim": 0.8543,
|
| 543 |
+
"tIOU": 0.8289,
|
| 544 |
+
"mAP": 1.0
|
| 545 |
+
},
|
| 546 |
+
{
|
| 547 |
+
"idx": 89,
|
| 548 |
+
"retrieval_sim": 0.7159,
|
| 549 |
+
"tIOU": 0.5667,
|
| 550 |
+
"mAP": 0.2
|
| 551 |
+
},
|
| 552 |
+
{
|
| 553 |
+
"idx": 90,
|
| 554 |
+
"retrieval_sim": 0.837,
|
| 555 |
+
"tIOU": 0.8276,
|
| 556 |
+
"mAP": 0.64
|
| 557 |
+
},
|
| 558 |
+
{
|
| 559 |
+
"idx": 91,
|
| 560 |
+
"retrieval_sim": 0.8093,
|
| 561 |
+
"tIOU": 0.6382,
|
| 562 |
+
"mAP": 0.16
|
| 563 |
+
},
|
| 564 |
+
{
|
| 565 |
+
"idx": 92,
|
| 566 |
+
"retrieval_sim": 0.7542,
|
| 567 |
+
"tIOU": 1.0,
|
| 568 |
+
"mAP": 1.0
|
| 569 |
+
},
|
| 570 |
+
{
|
| 571 |
+
"idx": 93,
|
| 572 |
+
"retrieval_sim": 0.6445,
|
| 573 |
+
"tIOU": 0.82,
|
| 574 |
+
"mAP": 1.0
|
| 575 |
+
},
|
| 576 |
+
{
|
| 577 |
+
"idx": 94,
|
| 578 |
+
"retrieval_sim": 0.712,
|
| 579 |
+
"tIOU": 0.7667,
|
| 580 |
+
"mAP": 0.64
|
| 581 |
+
},
|
| 582 |
+
{
|
| 583 |
+
"idx": 95,
|
| 584 |
+
"retrieval_sim": 0.6122,
|
| 585 |
+
"tIOU": 0.4707,
|
| 586 |
+
"mAP": 0.16
|
| 587 |
+
},
|
| 588 |
+
{
|
| 589 |
+
"idx": 96,
|
| 590 |
+
"retrieval_sim": 0.7239,
|
| 591 |
+
"tIOU": 0.5453,
|
| 592 |
+
"mAP": 0.2
|
| 593 |
+
},
|
| 594 |
+
{
|
| 595 |
+
"idx": 97,
|
| 596 |
+
"retrieval_sim": 0.8103,
|
| 597 |
+
"tIOU": 0.4778,
|
| 598 |
+
"mAP": 0.1111
|
| 599 |
+
}
|
| 600 |
+
]
|
| 601 |
+
}
|
eval.md
ADDED
|
@@ -0,0 +1,63 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
# v1.0 Verification Results
|
| 2 |
+
|
| 3 |
+
## Summary
|
| 4 |
+
|
| 5 |
+
| Metric | Value | Threshold | Result |
|
| 6 |
+
|--------|-------|-----------|--------|
|
| 7 |
+
| retrieval_similarity | 0.7239 | >= 0.60 | PASS |
|
| 8 |
+
| tIOU | 0.6700 | >= 0.40 | PASS |
|
| 9 |
+
| mAP@0.5 | 0.5092 | >= 0.50 | PASS |
|
| 10 |
+
|
| 11 |
+
**Overall: PASS — v1.0 ACCEPTED**
|
| 12 |
+
|
| 13 |
+
## Details
|
| 14 |
+
|
| 15 |
+
- Checkpoint: `outputs/checkpoint-770` (step 770, eval_loss 0.5272)
|
| 16 |
+
- Predictions: `checkpoints/v21_semantic_boundaries/predictions.jsonl` (98 samples)
|
| 17 |
+
- Embedder: OpenAI text-embedding-3-small (production-aligned)
|
| 18 |
+
- Date: 2026-03-19
|
| 19 |
+
|
| 20 |
+
### Retrieval Similarity
|
| 21 |
+
|
| 22 |
+
- Mean: 0.7239
|
| 23 |
+
- Median: 0.7355
|
| 24 |
+
- Min: 0.4982, Max: 0.9162
|
| 25 |
+
- Excellent (>= 0.80): 22/98
|
| 26 |
+
- Good (>= 0.60): 87/98
|
| 27 |
+
- Acceptable (>= 0.40): 98/98
|
| 28 |
+
|
| 29 |
+
### Temporal IoU (tIOU)
|
| 30 |
+
|
| 31 |
+
- Mean: 0.6700
|
| 32 |
+
- Median: 0.6703
|
| 33 |
+
- Predictions with timestamps: 98/98
|
| 34 |
+
- References with timestamps: 98/98
|
| 35 |
+
|
| 36 |
+
### mAP@0.5
|
| 37 |
+
|
| 38 |
+
- Mean: 0.5092
|
| 39 |
+
|
| 40 |
+
## Production Embeddings (prior run)
|
| 41 |
+
|
| 42 |
+
For reference, the prior eval with OpenAI text-embedding-3-small on 20 pairs showed:
|
| 43 |
+
- mean_similarity: 0.6781
|
| 44 |
+
- production_ready: true
|
| 45 |
+
|
| 46 |
+
## Failure Analysis
|
| 47 |
+
|
| 48 |
+
All metrics pass. v1.0 is accepted for production.
|
| 49 |
+
|
| 50 |
+
## Per-Sample Scores (first 10)
|
| 51 |
+
|
| 52 |
+
| # | retrieval_sim | tIOU | mAP@0.5 | pred_events | ref_events |
|
| 53 |
+
|---|--------------|------|---------|-------------|------------|
|
| 54 |
+
| 0 | 0.6549 | 0.5277 | 0.4500 | 5 | 4 |
|
| 55 |
+
| 1 | 0.7739 | 0.8080 | 1.0000 | 5 | 5 |
|
| 56 |
+
| 2 | 0.6433 | 1.0000 | 1.0000 | 4 | 4 |
|
| 57 |
+
| 3 | 0.7473 | 0.6228 | 0.4500 | 5 | 4 |
|
| 58 |
+
| 4 | 0.7774 | 0.5406 | 0.2500 | 4 | 4 |
|
| 59 |
+
| 5 | 0.7924 | 0.3868 | 0.0500 | 4 | 5 |
|
| 60 |
+
| 6 | 0.7626 | 0.7779 | 0.7500 | 4 | 3 |
|
| 61 |
+
| 7 | 0.6476 | 0.8060 | 0.7500 | 4 | 3 |
|
| 62 |
+
| 8 | 0.7355 | 0.7520 | 0.6400 | 5 | 5 |
|
| 63 |
+
| 9 | 0.8859 | 0.6579 | 0.5625 | 4 | 4 |
|
predictions.jsonl
ADDED
|
@@ -0,0 +1,98 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
{"example_idx": 0, "prediction": "**2020.6s:** 12 people | A man with a backpack and a woman in a striped shirt stand in the foreground of a lush indoor...\n**2021.9s:** 15 people | The camera pans right to reveal a large decorative garden statue of a woman in a pink dress\n**2023.1s:** 14 people | A man in a white shirt bends over a map in the foreground while a woman and child stand nearby\n**2024.4s:** 12 people | A woman in a white shirt and a young girl in a blue dress enter the immediate foreground\n**2026.9s:** 10 people | A woman in a green dress walks toward the left as the camera continues to pan right", "reference": "**2020.6s:** 12 people | a couple on the left is seen attending to an open suitcase on the walkway\n**2021.9s:** 8 people | Camera pans left to focus on the couple with the suitcase as a woman in a floral shirt walks toward...\n**2024.4s:** 15 people | scene static, no change\n**2029.4s:** 18 people | Final pan past a large white tree trunk reveals a crowded upper-level walkway overlooking an escalator and the lower atrium"}
|
| 2 |
+
{"example_idx": 1, "prediction": "**890.6s:** 20+ people | Wide view of an airport terminal with a massive flight information board and a \"Thai Lion Air\" booth; travelers are...\n**891.9s:** 12 people | The camera pans left, focusing on a couple in the foreground walking past a \"BorPloen\" storefront\n**894.4s:** 15 people | A man in a black t-shirt and a woman in a grey hoodie walk across the frame in front of...\n**896.9s:** 18 people | scene static, no change\n**899.4s:** 10 people | The scene shifts to a \"Boarding Information\" area where passengers wait near stacks of grey cart covers", "reference": "**890.6s:** 25 people | Passengers gathered near a large international arrival flight board and information desks in the terminal hall\n**893.1s:** 12 people | scene static, no change\n**894.4s:** 16 people | Scene shows a \"SEA GAMES\" promotional wall and information booth with passengers walking by\n**896.9s:** 11 people | An elderly man with a cane moves into the foreground as the camera pans toward a \"Grab\" advertisement\n**899.4s:** 15 people | Camera reveals a check-in area with a \"Restricted Area\" sign and passengers standing in a queue"}
|
| 3 |
+
{"example_idx": 2, "prediction": "**2970.6s:** 12 people | a woman in black and a child in a blue shirt walk toward the center\n**2973.1s:** 10 people | A woman in a floral shirt and a man in a blue shirt move into the close foreground on the...\n**2975.6s:** 8 people | A woman in a grey shirt pulls a silver suitcase toward the camera while a young girl in a purple...\n**2978.1s:** 7 people | A woman in a black shirt and a young child in a blue shirt walk through the center of the...", "reference": "**2970.6s:** 12 people | Initial view of the airport walkway featuring a Disney Adventure display and travelers moving toward a decorated blue arch\n**2973.1s:** 10 people | The child in red has left the foreground, and a man in a grey polo shirt is now prominently positioned...\n**2975.6s:** 8 people | scene static, no change\n**2978.1s:** 9 people | A boy in a blue shirt and a woman in a white-and-pink shirt enter the immediate foreground from the left..."}
|
| 4 |
+
{"example_idx": 3, "prediction": "**1080.6s:** 9 people | Customers are seated at tables in a cafe with large windows overlooking an airport runway\n**1083.1s:** 11 people | A staff member in a blue uniform enters the frame from the left as more people gather in the terminal\n**1084.4s:** 15 people | The scene shifts to a busy terminal walkway with a McDonald's restaurant visible in the background\n**1086.9s:** 18 people | A woman with tattoos on her arms and a man with a backpack enter the foreground from the left\n**1089.4s:** 20 people | The crowd moves forward through the terminal past the McDonald's and a Burger King sign", "reference": "**1080.6s:** 10 people | patrons are seated at tables, including a woman with a black suitcase in the center and a couple in the...\n**1084.4s:** 15 people | travelers walk with luggage past a McDonald's, and cleaning staff is visible on the right; Significant scene change to a...\n**1085.6s:** 12 people | people are standing and walking throughout the terminal area\n**1086.9s:** 14 people | A new group of travelers enters the close foreground on the left, including a woman in a \"WHITE FOX\" tank..."}
|
| 5 |
+
{"example_idx": 4, "prediction": "**1460.6s:** 6 people | A man in a white shirt walks across the foreground past a \"KANTIN\" food service area\n**1463.1s:** 7 people | A man with a large green backpack enters the frame, walking toward the left\n**1465.6s:** 8 people | scene static, no change\n**1468.1s:** 12 people | The camera pans left to reveal a \"Home-Made Sweets\" shop and a group of people walking down a corridor in...", "reference": "**1460.6s:** 7 people | A man in a white shirt walks past the \"Rook & Tarry\" bar in a terminal\n**1464.4s:** 5 people | The view pans right to reveal an elevator entrance and several \"Soup Curry\" restaurant posters\n**1468.1s:** 8 people | The camera moves into an open corridor featuring flight information displays and an escalator\n**1469.4s:** 10 people | Multiple travelers walk down a corridor lined with food advertisements and blue storage crates"}
|
| 6 |
+
{"example_idx": 5, "prediction": "**1200.6s:** 15+ people | Tourists gather around a large Christmas tree and a indoor waterfall\n**1203.1s:** 15+ people | A man in a grey shirt and white shorts enters the foreground, moving toward the right\n**1205.6s:** 15+ people | A woman in a bright orange shirt enters the scene from the left, walking toward the Christmas tree\n**1208.1s:** 15+ people | The camera pans left to reveal a \"Shake Shack\" storefront with a queue of people waiting to enter", "reference": "**1200.6s:** 15 people | Crowded indoor garden area near a large decorated Christmas tree\n**1201.9s:** 15 people | A man in a maroon shirt and backpack walks across the foreground, momentarily obscuring the center of the frame\n**1204.4s:** 12 people | focus shifts to a woman in an orange shirt and a girl in a blue shirt standing nearby\n**1206.9s:** 14 people | The girl in the blue shirt walks across the foreground with a luggage cart while other tourists pose for photos...\n**1209.4s:** 10 people | scene static, no change"}
|
| 7 |
+
{"example_idx": 6, "prediction": "**560.6s:** 18 people | Travelers rest on benches and walk through a lush indoor garden featuring a large decorated Christmas tree and a \"KANTIN\"...\n**563.1s:** 22 people | scene static, no change\n**565.6s:** 25 people | scene static, no change\n**568.1s:** 28 people | The perspective shifts further right to reveal the \"Garden and Bar\" area, with people gathering near a lounge and the...", "reference": "**560.6s:** 18 people | Travellers rest with luggage on the left while others walk near a large Christmas tree and a festive wooden cabin...\n**564.4s:** 22 people | scene static, no change\n**568.1s:** 28 people | The scene shifts significantly to focus on an escalator area and a crowded walkway overlooking the multi-level vertical forest"}
|
| 8 |
+
{"example_idx": 7, "prediction": "**1620.6s:** 40+ people | High-angle view of a multi-level shopping mall with people on escalators and various retail floors\n**1623.1s:** 45+ people | scene static, no change\n**1625.6s:** 50+ people | scene static, no change\n**1629.4s:** 55+ people | scene static, no change", "reference": "**1620.6s:** 45 people | A wide-angle view of a multi-story shopping mall with people walking on various levels and using an escalator in the...\n**1624.4s:** 40 people | The camera tilts down to focus on the lower level, showing a LEGO display stand and a large group of...\n**1629.4s:** 55 people | The camera tilts back up to a wider shot, revealing the upper levels again and several new groups of people..."}
|
| 9 |
+
{"example_idx": 8, "prediction": "**540.6s:** 15+ people | A woman in a purple shirt walks away through a busy food court while a staff member in a blue...\n**541.9s:** 15+ people | scene static, no change\n**543.1s:** 15+ people | An elderly woman in a black floral shirt and a young girl enter the foreground from the right as the...\n**546.9s:** 15+ people | scene static, no change\n**549.4s:** 15+ people | scene static, no change", "reference": "**540.6s:** 18 people | A woman in a purple shirt walks through a crowded airport dining area past a man in a wheelchair with...\n**541.9s:** 22 people | scene static, no change\n**546.9s:** 10 people | scene static, no change\n**548.1s:** 8 people | A \"Potato Corner\" food stall comes into view as the woman in purple continues walking toward it\n**549.4s:** 11 people | scene static, no change"}
|
| 10 |
+
{"example_idx": 9, "prediction": "**1590.6s:** 15 people | Wide view of an airport terminal with passengers sitting in a waiting area and others walking in the distance\n**1594.4s:** 12 people | scene static, no change\n**1596.9s:** 10 people | The woman in white walks past a shop on the left while a man with a suitcase stands in the...\n**1599.4s:** 12 people | A robotic floor cleaner is now visible in the foreground as the woman in white exits the frame", "reference": "**1590.6s:** 9 people | Passengers walk through the terminal and sit in the waiting area while a robotic cleaner operates in the background\n**1593.1s:** 11 people | Two passengers, one in a white outfit and another in a tan shirt with a suitcase, walk toward the foreground\n**1595.6s:** 12 people | scene static, no change\n**1599.4s:** 10 people | scene static, no change"}
|
| 11 |
+
{"example_idx": 10, "prediction": "**530.6s:** 4 people | A robotic cleaner with a cartoon bear head stands in a wide airport corridor while a man in black walks...\n**531.9s:** 6 people | scene static, no change\n**534.4s:** 5 people | scene static, no change\n**536.9s:** 12 people | The camera reveals a busy food court seating area with travelers, including a woman with a stroller, eating at tables...\n**539.4s:** 15 people | A staff member in a purple uniform walks into the foreground of the bustling food court", "reference": "**530.6s:** 6 people | A wide hallway view with a cleaning robot in the foreground and several people walking in the distance toward a...\n**534.4s:** 7 people | As the camera approaches the food court, a staff member in a purple shirt walks across the frame while a...\n**538.1s:** 10 people | A woman in a white jacket enters the foreground from the right, passing by the Burger King counter where a...\n**539.4s:** 12 people | The staff member in purple returns to the foreground, and the background reveals a crowded dining area with many people..."}
|
| 12 |
+
{"example_idx": 11, "prediction": "**670.6s:** 12 people | a woman and child walk toward the left while others sit or stand near the food court entrance\n**674.4s:** 10 people | The camera pans right, focusing on a man with a large backpack standing near the railing as the woman and...\n**676.9s:** 5 people | scene static, no change\n**679.4s:** 15 people | The camera completes its pan to show the man with the backpack in the foreground while multiple people are seen...", "reference": "**670.6s:** 11 people | A woman in white pushes a stroller through a transit hall; Travelers on the right walk up a ramp past...\n**671.9s:** 10 people | The woman with the stroller moves significantly closer to the foreground\n**673.1s:** 9 people | The woman and stroller exit the frame as the camera begins to pan right\n**674.4s:** 8 people | scene static, no change\n**679.4s:** 11 people | A man with a large backpack and a travel bag enters the foreground from the right as the camera continues..."}
|
| 13 |
+
{"example_idx": 12, "prediction": "**1110.6s:** 6 people | View of a terminal corridor featuring \"Pang Chat\" and \"Dean & DeLuca\" shops with people walking and standing near the...\n**1111.9s:** 7 people | scene static, no change\n**1113.1s:** 15 people | A woman in a pink shirt appears in the foreground, pushing a luggage cart through the corridor\n**1114.4s:** 12 people | The camera pans right, showing the woman with the cart moving toward the right side of the frame as more...\n**1116.9s:** 14 people | scene static, no change", "reference": "**1110.6s:** 8 people | a woman browses bags while a man in a black jacket walks toward the camera\n**1111.9s:** 12 people | a man in a brown jacket pulls a suitcase toward the camera\n**1113.1s:** 17 people | A man in a pink shirt enters the foreground center, pushing a luggage cart toward the camera\n**1116.9s:** 21 people | focus shifts to a man in a white shirt at the cafe counter and a growing crowd in the background\n**1119.4s:** 21 people | A man in a white shirt and tan pants enters the scene from the right, walking toward the distant gates"}
|
| 14 |
+
{"example_idx": 13, "prediction": "**610.6s:** 15 people | People walk through a lush indoor garden past the \"Polo Ralph Lauren\" store\n**613.1s:** 22 people | A young boy in a black shirt runs across the foreground\n**615.6s:** 35 people | The camera pans to reveal a large crowd gathered at a viewing gallery near an escalator\n**618.1s:** 45 people | A massive crowd is visible on multiple levels as the camera reveals the full scale of the indoor waterfall", "reference": "**610.6s:** 15 people | A crowd gathers in a lush indoor garden near a rustic \"Polo Ralph Lauren\" cabin and a large decorated Christmas...\n**613.1s:** 25 people | scene static, no change\n**616.9s:** 50 people | A significant shift reveals a massive indoor waterfall in the background with a large crowd gathered along a glass railing...\n**619.4s:** 55 people | The pan concludes with a full view of the waterfall cascading into the center, with visitors appearing on escalators and..."}
|
| 15 |
+
{"example_idx": 14, "prediction": "**1600.6s:** 18 people | A man in a white t-shirt and black shorts sits on benches in an airport terminal, looking at his phone\n**1601.9s:** 20 people | scene static, no change\n**1603.1s:** 22 people | scene static, no change\n**1608.1s:** 25 people | A woman in a white jacket and a man in a blue shirt walk toward the camera through the terminal...", "reference": "**1600.6s:** 12 people | Initial view of an airport terminal waiting area featuring an \"Au We White Coffee\" stall, with a floor-cleaning robot in...\n**1603.1s:** 14 people | scene static, no change\n**1604.4s:** 15 people | scene static, no change\n**1606.9s:** 12 people | scene static, no change\n**1609.4s:** 13 people | The \"Starbucks\" stall is now fully visible on the right with several people nearby, as other travelers traverse the open..."}
|
| 16 |
+
{"example_idx": 15, "prediction": "**2910.6s:** 12 people | Visitors walk through a lush indoor garden featuring a large glass-and-steel structure and tropical foliage\n**2913.1s:** 14 people | A woman in a yellow shirt moves into the close foreground while a man in a white shirt and baseball...\n**2914.4s:** 15 people | A young girl in a blue shirt runs across the path as a woman in a white dress enters the...\n**2916.9s:** 12 people | The woman in the white dress moves to the center of the frame as the camera pans, following her movement...\n**2919.4s:** 14 people | scene static, no change", "reference": "**2910.6s:** 12 people | A group of people waits in line at the entrance of a botanical attraction, with a stroller parked in the...\n**2913.1s:** 15 people | scene static, no change\n**2914.4s:** 14 people | scene static, no change\n**2918.1s:** 12 people | scene static, no change"}
|
| 17 |
+
{"example_idx": 16, "prediction": "**710.6s:** 1 people | A man in a blue shirt walks across the terminal with a black suitcase\n**713.1s:** 1 people | scene static, no change\n**716.9s:** 40+ people | The camera pans right, revealing a large crowd of passengers and the \"Arrivals\" section on the lower level of the...", "reference": "**710.6s:** 0 people | Empty airport hallway with a marble pillar and a luggage cart; busy terminal levels are visible in the background\n**711.9s:** 1 people | A man in a black shirt enters the hallway from the left, pulling a black suitcase\n**718.1s:** 0 people | scene static, no change"}
|
| 18 |
+
{"example_idx": 17, "prediction": "**570.6s:** 6 people | Travelers walk through a corridor past a large pillar and a \"Visit Iceland\" poster\n**571.9s:** 15 people | A group of people gathers near a \"Castel\" booth in a busy terminal\n**573.1s:** 60+ people | High-angle view of a massive crowd in a large airport concourse with various booths and seating areas", "reference": "**570.6s:** 40+ people | Camera pans right from behind a large pillar, revealing a crowded station hall with travelers sitting on central benches\n**573.1s:** 70+ people | A traveler in a white jacket pulls a green suitcase across the tiled floor as the camera reveals the full...\n**574.4s:** 75+ people | A man in a grey hoodie and black backpack enters the lower-left foreground, walking toward the center of the hall\n**576.9s:** 80+ people | The camera pans further right to reveal a large glass elevator structure and several new pedestrians walking in the distance"}
|
| 19 |
+
{"example_idx": 18, "prediction": "**1690.6s:** 0 people | View of an airport runway through large glass windows\n**1694.4s:** 0 people | scene static, no change\n**1696.9s:** 0 people | A Japan Airlines airplane is taxiing across the foreground of the airfield", "reference": "**1690.6s:** 0 people | View from inside an airport terminal through glass windows overlooking the tarmac at dusk\n**1694.4s:** 0 people | Scene transition to a direct view of the runway where a white airplane is visible in the distance\n**1695.6s:** 1 people | A ground crew member appears near the bottom right as the wing of a second airplane enters the frame\n**1696.9s:** 2 people | A large airplane becomes fully visible on the right tarmac with two ground crew members standing nearby"}
|
| 20 |
+
{"example_idx": 19, "prediction": "**610.6s:** 6 people | A man in a grey shirt and a woman sit at a table in the foreground, while others queue at...\n**613.1s:** 5 people | scene static, no change\n**616.9s:** 3 people | scene static, no change\n**619.4s:** 4 people | A man in a black shirt stands at the Subway counter as another man walks down the hallway on the...", "reference": "**610.6s:** 8 people | wide view of a food court featuring Pepper Lunch and Subway with several patrons at counters and tables\n**614.4s:** 3 people | zoomed-in view of the Pepper Lunch counter as a staff member prepares an order\n**619.4s:** 2 people | focused view of the Subway counter as a man with a silver suitcase approaches to order"}
|
| 21 |
+
{"example_idx": 20, "prediction": "**2210.6s:** 12 people | A woman in a white hoodie walks through a lush indoor garden restaurant with other patrons seated at tables\n**2213.1s:** 14 people | The woman in the white hoodie moves further into the scene as more people appear in the background seating area\n**2215.6s:** 15 people | A man in a purple shirt and a woman in a black top enter the mid-ground, walking across the patio\n**2219.4s:** 12 people | scene static, no change", "reference": "**2210.6s:** 11 people | scene static, no change\n**2211.9s:** 10 people | scene static, no change\n**2213.1s:** 9 people | scene static, no change"}
|
| 22 |
+
{"example_idx": 21, "prediction": "**1130.6s:** 15+ people | Passengers wait in a terminal hallway; a couple walks away from the camera toward gates 1-6\n**1135.6s:** 15+ people | scene static, no change\n**1139.4s:** 15+ people | scene static, no change", "reference": "**1130.6s:** 12 people | Travelers sit on hallway benches while others walk toward distant gates past a Christmas tree\n**1136.9s:** 11 people | scene static, no change\n**1139.4s:** 10 people | Subtitles appear at the bottom as the camera nears gate signs and a \"Free Charging\" station"}
|
| 23 |
+
{"example_idx": 22, "prediction": "**390.6s:** 50+ people | A man in a white hat and a woman with a black backpack stand in the foreground as a large...\n**393.1s:** 50+ people | The foreground women exit the frame, revealing a boy in a yellow jersey and a girl in a red shirt...\n**395.6s:** 50+ people | The camera tilts upward, revealing the massive glass dome ceiling and the upper section of the waterfall\n**398.1s:** 50+ people | The view pans up to show the top of the waterfall cascading into the large circular pool below", "reference": "**390.6s:** 25 people | Visitors gather near the base of the indoor waterfall\n**393.1s:** 40 people | The camera tilts up, revealing tourists with large red and blue suitcases in the foreground and a growing crowd around...\n**395.6s:** 65 people | As the view expands, the pedestrian bridge and upper levels of the indoor forest become visible, showing a high density...\n**398.1s:** 85 people | scene static, no change"}
|
| 24 |
+
{"example_idx": 23, "prediction": "**1240.6s:** 25 people | scene static, no change\n**1243.1s:** 20 people | The camera pans right, bringing a man in a black shirt and backpack into the close foreground\n**1245.6s:** 18 people | A woman in a blue shirt enters the foreground from the right as the camera continues to track right\n**1248.1s:** 22 people | A man in a patterned black shirt and a woman in a blue hijab enter the frame from the right...\n**1249.4s:** 30 people | The camera reveals a large digital directory sign and a second Starbucks location as the crowd moves through the concourse", "reference": "**1240.6s:** 40+ people | Busy mall corridor with shoppers walking past a \"HANDS\" store and a Starbucks in the background\n**1244.4s:** 35+ people | Approaching a central escalator where people are descending; the perspective on the surrounding shops shifts closer\n**1249.4s:** 25+ people | View transitions into an open atrium featuring a large vertical advertisement banner"}
|
| 25 |
+
{"example_idx": 24, "prediction": "**40.6s:** 12 people | Wide view of an airport terminal with a pigeon on the floor and travelers with luggage walking in the distance\n**43.1s:** 18 people | The camera pans left to reveal a crowded walkway and a \"CardX\" credit card booth on the left side\n**45.6s:** 14 people | Two women in red dresses enter the foreground from the left as the camera approaches the Starbucks counter\n**46.9s:** 16 people | One of the women in red walks out of frame while a woman in a black dress enters from the...\n**49.4s:** 15 people | A man in a black cap and a woman in a black dress walk across the foreground in front of...", "reference": "**40.6s:** 14 people | A man in a dark suit pulls a suitcase toward the right while a monk in maroon robes walks in...\n**44.4s:** 10 people | scene static, no change\n**49.4s:** 20 people | A woman with a backpack enters the right foreground as the camera focuses on a crowded Starbucks seating area and..."}
|
| 26 |
+
{"example_idx": 25, "prediction": "**3000.6s:** 12 people | scene static, no change", "reference": "**2990.6s:** 15 people | A man in a grey polo shirt and a woman in a blue floral dress stand in the foreground of...\n**2993.1s:** 12 people | The foreground subjects change as a woman in a black dress and a young girl in a light blue dress...\n**2995.6s:** 10 people | scene static, no change\n**2998.1s:** 8 people | scene static, no change"}
|
| 27 |
+
{"example_idx": 26, "prediction": "**1970.6s:** 12 people | A group of people walk through a mall corridor past \"The Hub\" and \"Jack's Place\" cafes\n**1973.1s:** 15 people | The camera pans left, revealing a \"Red Fire Brigade\" themed train display and more shoppers\n**1975.6s:** 8 people | scene static, no change\n**1976.9s:** 6 people | Two women are seated at a table outside \"Jack's Place\" as the camera continues to pan\n**1979.4s:** 10 people | The view shifts to an escalator where several people are ascending to the next level of the mall", "reference": "**1970.6s:** 22 people | Initial view of a busy mall lobby with people queuing at \"LOBBY-E\" and walking past \"Andersen's\" bakery\n**1971.9s:** 28 people | scene static, no change\n**1976.9s:** 12 people | Perspective shifts to the entrance of \"Jack's Place\" and a \"Sanrio\" store featuring a large Hello Kitty digital display\n**1979.4s:** 4 people | Scene changes significantly as the camera moves onto an upward escalator, showing people standing on the steps ahead"}
|
| 28 |
+
{"example_idx": 27, "prediction": "**120.6s:** 1 people | Close-up of a self-service check-in kiosk screen displaying options for AirAsia and other airlines\n**121.9s:** 7 people | The camera pans right, revealing a wider view of the airport terminal with several passengers walking in the distance\n**124.4s:** 15 people | A large informational text overlay appears at the bottom of the screen as the camera continues to pan, showing a...\n**125.6s:** 20 people | The scene reveals a currency exchange area with \"Check-in\" and \"Exchange\" signs, and a significant increase in visible passenger traffic\n**129.4s:** 25 people | The camera pans further right to show a long queue of passengers waiting at the currency exchange counter", "reference": "**120.6s:** 3 people | Close-up of a self-service check-in kiosk at the airport with distant staff at counters\n**124.4s:** 12 people | Camera pans right to reveal a traveler sitting on a luggage cart in the main terminal concourse\n**126.9s:** 15 people | Perspective shifts toward currency exchange booths and a designated counter for people with disabilities"}
|
| 29 |
+
{"example_idx": 28, "prediction": "**730.6s:** 0 people | scene static, no change\n**735.6s:** 1 people | A man wearing a white mask and a black backpack enters the scene, pulling a blue suitcase through the shop...\n**736.9s:** 4 people | The man with the suitcase moves toward the left as other people become visible in the background shopping area\n**739.4s:** 6 people | The man with the suitcase exits to the left, leaving a woman in a black shirt visible in the background", "reference": "**730.6s:** 0 people | Close-up view of the \"SKY MUSEUM\" entrance wall with a monitor displaying aircraft footage\n**733.1s:** 0 people | The camera pans left, revealing a model airplane and a rope barrier in a brightly lit museum hallway\n**734.4s:** 12 people | Wide shot of the museum interior showing shop counters, various exhibits, and several visitors walking through the area\n**736.9s:** 10 people | A man wearing a face mask and a backpack enters the foreground from the left, pulling a grey suitcase past...\n**739.4s:** 8 people | The man with the suitcase moves deeper into the museum as the camera pans further right to reveal additional exhibit..."}
|
| 30 |
+
{"example_idx": 29, "prediction": "**1100.6s:** 15 people | Travelers walk through a busy airport corridor past McDonald's and a PangCha stall\n**1101.9s:** 12 people | scene static, no change\n**1103.1s:** 10 people | A woman in a black top walks away with a suitcase as the camera pans right, bringing a PangCha customer...\n**1106.9s:** 7 people | scene static, no change\n**1109.4s:** 9 people | A woman in a floral shirt appears in the foreground looking at her phone as the camera reveals more of...", "reference": "**1100.6s:** 15 people | Travelers stand and walk in a wide airport corridor near retail shops and seating areas\n**1101.9s:** 12 people | A woman in a pink shirt walks quickly across the foreground from right to left\n**1104.4s:** 10 people | scene static, no change\n**1106.9s:** 8 people | scene static, no change\n**1109.4s:** 9 people | A traveler browses merchandise at the \"Tastes of Thailand\" entrance while staff work behind the tea counter"}
|
| 31 |
+
{"example_idx": 30, "prediction": "**510.6s:** 35 people | High-angle view of a busy airport terminal with passengers walking through the hall and others gathered near check-in counters\n**513.1s:** 35 people | scene static, no change\n**516.9s:** 35 people | scene static, no change\n**519.4s:** 35 people | scene static, no change", "reference": "**510.6s:** 24 people | a woman in white walks towards the foreground while others use check-in kiosks\n**514.4s:** 22 people | A man in a blue shirt moves into the center foreground as the flow of passengers continues through the hall\n**518.1s:** 28 people | A large group of travelers walks down the main corridor, and several new passengers appear at the self-service kiosks on..."}
|
| 32 |
+
{"example_idx": 31, "prediction": "**140.6s:** 15 people | People walk through a bright mall corridor near an escalator and a \"HANDS\" store\n**143.1s:** 14 people | A woman in a grey coat walks toward the camera as others continue through the shopping area\n**145.6s:** 16 people | A man in a white t-shirt enters from the right while a man in a grey hoodie walks away\n**148.1s:** 15 people | A man in a grey t-shirt walks toward the camera as the crowd moves deeper into the mall\n**149.4s:** 14 people | A woman with a green backpack appears on the right as the man in the grey t-shirt moves into the...", "reference": "**140.6s:** 18 people | Pedestrians walk through a mall concourse past an escalator\n**143.1s:** 20 people | scene static, no change\n**145.6s:** 15 people | A woman pushing a blue luggage trolley enters the foreground, followed by a man in a light green shirt\n**148.1s:** 12 people | A woman in a black shirt and cap pushing a trolley enters the close foreground, obscuring much of the background...\n**149.4s:** 16 people | A man pushing a luggage trolley while looking at his phone dominates the foreground"}
|
| 33 |
+
{"example_idx": 32, "prediction": "**300.6s:** 50+ people | Wide shot of the indoor waterfall with tourists gathered at the base and along multiple levels of the surrounding garden\n**303.1s:** 30+ people | The camera tilts upward, shifting focus from the crowd to the top of the waterfall and the glass dome ceiling\n**304.4s:** 0 people | scene static, no change", "reference": "**300.6s:** 20+ people | Wide shot of the indoor waterfall base with visitors gathered around the viewing area and on multi-level balconies\n**301.9s:** 10+ people | Camera tilts upward to focus on the top of the central waterfall and the glass dome roof, showing fewer people...\n**309.4s:** 15+ people | scene static, no change"}
|
| 34 |
+
{"example_idx": 33, "prediction": "**30.6s:** 12 people | A man in a grey shirt walks through a food court with patrons seated at tables\n**35.6s:** 18 people | The scene shifts to a wide terminal view where a pigeon stands on the floor as travelers with luggage move...\n**36.9s:** 22 people | A woman in a patterned dress and a man pulling a blue suitcase approach the camera through the terminal walkway", "reference": "**30.6s:** 8 people | A woman walks through a food court past a noodle stall towards a seating area with multiple diners\n**33.1s:** 1 people | Close-up view of four prepared bowls of noodles displayed on a wooden counter with a staff member in the background\n**36.9s:** 20 people | A wide view of an airport terminal hallway featuring a pigeon in the foreground and travelers walking past currency exchange...\n**38.1s:** 22 people | A man in a blazer walks toward the camera while pulling a blue suitcase and talking on a phone, followed..."}
|
| 35 |
+
{"example_idx": 34, "prediction": "**240.6s:** 12 people | Visitors stand on a wooden walkway and a lower stone platform, some with luggage trolleys, overlooking a lush indoor garden...\n**243.1s:** 15 people | A man carrying a young child in a pink dress enters the scene from the right as the camera pans...\n**245.6s:** 14 people | The camera reveals the massive glass dome ceiling and the top of the waterfall as people continue to gather at...\n**248.1s:** 18 people | A significant shift in perspective shows a dense crowd of new visitors in the foreground, including a woman in a...", "reference": "**240.6s:** 10 people | Visitors walk along a lush indoor balcony overlooking a large central waterfall under a glass dome\n**244.4s:** 12 people | The camera moves closer to the crowd, revealing more individuals gathered near the railing to view the waterfall\n**248.1s:** 15 people | Foreground focus shifts to a man in a white shirt and another with a pink backpack as the camera advances...\n**249.4s:** 16 people | A man in a red shirt enters the foreground from the right, holding up a phone to take a photograph"}
|
| 36 |
+
{"example_idx": 35, "prediction": "**1150.6s:** 12 people | A woman in a grey top walks past a \"LOBBYC\" entrance while a man with a red backpack moves toward...\n**1151.9s:** 28 people | The camera pans to a crowded Apple Store area where a man in a grey shirt walks past the glass...\n**1154.4s:** 32 people | A man in a grey shirt enters the close foreground walking right, while a large crowd gathers near the store...\n**1156.9s:** 35 people | A man in a black \"Berkeley\" t-shirt and a woman in a grey shirt walk toward the camera through the...\n**1159.4s:** 38 people | A young boy in a blue shirt enters the foreground from the right as the crowd density in the background...", "reference": "**1150.6s:** 10+ people | scene static, no change\n**1151.9s:** 12+ people | Camera pans left as a man in a black shirt and red backpack walks across the foreground\n**1154.4s:** 25+ people | Camera reveals a crowded retail space\n**1158.1s:** 35+ people | scene static, no change"}
|
| 37 |
+
{"example_idx": 36, "prediction": "**2710.6s:** 6 people | A family group stands on a wooden observation deck around a large tree trunk, with a woman in a white...\n**2713.1s:** 8 people | A man in a black t-shirt and a woman in a floral dress enter the scene from the left, while...\n**2715.6s:** 4 people | The camera pans left, shifting focus from the visitors to the surrounding greenery and the distant waterfall\n**2716.9s:** 0 people | scene static, no change\n**2719.4s:** 0 people | scene static, no change", "reference": "**2710.6s:** 7 people | a man in a light green shirt sits in the foreground\n**2711.9s:** 6 people | The foreground man has left, and a family group of three is now clearly visible posing behind the woman taking...\n**2713.1s:** 7 people | A woman in a brown floral dress enters the scene on the right while the family continues to pose\n**2714.4s:** 9 people | Two more women join the posing group as the woman in the hijab prepares to take their picture\n**2719.4s:** 20+ people | The camera completes its pan, revealing a massive crowd gathered at the base of the waterfall in the distance"}
|
| 38 |
+
{"example_idx": 37, "prediction": "**2650.6s:** 12 people | A purple floral elephant statue sprays water in a lush indoor garden while visitors walk along a curved path\n**2653.1s:** 15 people | The camera pans right to reveal a Disney-themed photo op area featuring Ariel and other Disney characters\n**2655.6s:** 0 people | scene static, no change", "reference": "**2650.6s:** 8 people | A purple floral elephant statue stands beside a pond where people walk along a stone path\n**2653.1s:** 9 people | The camera pans right to reveal travelers with suitcases standing near a winding walkway surrounded by lush greenery\n**2655.6s:** 2 people | scene static, no change"}
|
| 39 |
+
{"example_idx": 38, "prediction": "**1030.6s:** 0 people | View of the \"Super Lounge\" entrance hallway with doors and a fire extinguisher\n**1031.9s:** 0 people | scene static, no change\n**1034.4s:** 1 people | A person with a bright green bag appears, standing by the window\n**1039.4s:** 1 people | scene static, no change", "reference": "**1030.6s:** 0 people | View of an empty hallway leading to the entrance of the \"Super Lounge.\"\n**1033.1s:** 1 people | A person is visible through the glass doors, standing by a window overlooking the airfield\n**1034.4s:** 2 people | Two individuals are now seen in the observation area beyond the automatic doors\n**1035.6s:** 3 people | scene static, no change\n**1036.9s:** 1 people | A person with a bright green bag stands alone by the window, looking out at the airfield"}
|
| 40 |
+
{"example_idx": 39, "prediction": "**2870.6s:** 3 people | A man and woman walk along a wooden path through a lush indoor garden, passing a large ornamental tree on...\n**2873.1s:** 12 people | scene static, no change\n**2874.4s:** 18 people | As the couple continues down the path, more visitors appear on an escalator to the left and in the background...\n**2878.1s:** 25 people | The camera pans left, revealing a crowded escalator and a larger crowd of visitors in the background shopping area", "reference": "**2870.6s:** 4 people | Three individuals walk away on a wooden path through a lush indoor garden\n**2874.4s:** 8 people | An elevated mesh walking net appears on the upper left with several people walking across it\n**2879.4s:** 12 people | Crowd density increases as more visitors become visible on the overhead net and a secondary walkway on the far left"}
|
| 41 |
+
{"example_idx": 40, "prediction": "**810.6s:** 6 people | A man carries a child past large windows while others sit at a cafe with model airplane displays\n**813.1s:** 12 people | View transitions to a lobby area with a large overhead airplane sculpture and travelers with luggage\n**816.9s:** 15 people | A man in a light blue shirt walks across the foreground of a busy terminal waiting area", "reference": "**810.6s:** 8 people | Visitors in an aviation museum view model aircraft and observe the airfield through large windows\n**811.9s:** 7 people | A man in a grey vest walks across the room while others remain at the observation windows\n**814.4s:** 2 people | A close-up of a white biplane model with a visitor's reflection visible in the background glass\n**816.9s:** 20+ people | Scene changes to a busy airport terminal area where travelers with luggage walk past a crowded seating area\n**818.1s:** 20+ people | a man with a black messenger bag walks toward the right"}
|
| 42 |
+
{"example_idx": 41, "prediction": "**1330.6s:** 1 people | Close-up of an Air Malaysia aircraft's nose and cockpit on the tarmac with a ground crew member visible on the...\n**1335.6s:** 0 people | scene static, no change\n**1336.9s:** 0 people | scene static, no change\n**1339.4s:** 0 people | scene static, no change", "reference": "**1330.6s:** 3 people | The nose of an AirAsia airplane is visible with two pilots in the cockpit and a ground crew member signaling...\n**1333.1s:** 2 people | scene static, no change\n**1335.6s:** 2 people | The airplane continues moving, revealing a large tiger graphic on the fuselage\n**1336.9s:** 0 people | The cockpit is no longer visible\n**1339.4s:** 0 people | The rear section of the plane passes by, showing the registration 9M-RAH and graphics of a sun bear and a..."}
|
| 43 |
+
{"example_idx": 42, "prediction": "**700.6s:** 9 people | People are seated at tables in a spacious lounge area with large windows and a staircase\n**701.9s:** 7 people | scene static, no change\n**703.1s:** 10 people | The camera pans to a hallway where several people are seated on a bench, and a woman walks toward the...\n**708.1s:** 0 people | scene static, no change", "reference": "**700.6s:** 7 people | Travelers are seated at tables in an airport dining area with large windows overlooking the tarmac\n**703.1s:** 5 people | The camera pans to a hallway where tables are stacked against a wall and a group of travelers waits with...\n**706.9s:** 6 people | scene static, no change"}
|
| 44 |
+
{"example_idx": 43, "prediction": "**460.6s:** 4 people | A large Gundam statue is visible in a display case within a busy terminal\n**461.9s:** 12 people | The scene shifts to a crowded terminal concourse with travelers walking past luggage carts and information boards\n**466.9s:** 25 people | A dense crowd of passengers moves through the hall as a subtitle about exploring upper levels appears on screen\n**468.1s:** 30+ people | The camera pans to reveal a large \"Toilets\" sign and a massive crowd of people in the background", "reference": "**460.6s:** 6 people | A large white and red Gundam statue is displayed behind a white chain fence in an airport terminal\n**461.9s:** 5 people | scene static, no change\n**463.1s:** 12 people | a woman in a denim vest pulls a red suitcase towards the right\n**464.4s:** 10 people | scene static, no change\n**468.1s:** 8 people | On-screen text appears as the camera follows the group towards the upper levels of the terminal"}
|
| 45 |
+
{"example_idx": 44, "prediction": "**710.6s:** 0 people | Wide view of the airport tarmac with an ANA plane parked at the gate and a service vehicle near the...\n**713.1s:** 0 people | The camera pans right, following an ANA plane as it taxis across the tarmac\n**716.9s:** 0 people | scene static, no change\n**719.4s:** 0 people | scene static, no change", "reference": "**710.6s:** 0 people | An ANA propeller plane is taxiing on the tarmac, viewed from behind a large foreground pillar\n**718.1s:** 0 people | Close-up of a warning sign in Japanese (\"Please do not touch\") on a glass partition with a JAL aircraft tail...\n**719.4s:** 0 people | Wide view of a Japan Airlines (JAL) aircraft docked at a gate with a jet bridge, and a second plane..."}
|
| 46 |
+
{"example_idx": 45, "prediction": "**330.6s:** 12 people | a woman in a black hijab stands on the left\n**331.9s:** 14 people | A woman in a brown jacket enters the foreground left as the woman in the hijab moves further into the...\n**333.1s:** 15 people | A man in a white t-shirt and a woman in a white dress walk toward the camera; a group of...\n**335.6s:** 12 people | A man with a large brown bag enters from the right as the previous group moves past the camera\n**338.1s:** 10 people | A woman in a red uniform appears on the right as a man in a black shirt walks toward the...", "reference": "**330.6s:** 18 people | Travelers with luggage carts walk through the airport terminal near the international departures sign\n**333.1s:** 17 people | A subtitle overlay appears at the bottom of the frame as travelers move deeper into the hall\n**334.4s:** 15 people | scene static, no change\n**336.9s:** 14 people | scene static, no change\n**338.1s:** 12 people | The camera pans to reveal a \"Care for safety\" booth and airport staff in red uniforms walking in the background"}
|
| 47 |
+
{"example_idx": 46, "prediction": "**2420.6s:** 6 people | A woman in a black dress and a woman in a blue patterned dress walk across a glass-floored bridge in...\n**2423.1s:** 7 people | A woman in a teal dress enters the scene from the right as the other two continue walking toward the...\n**2424.4s:** 8 people | A man in a white shirt and a woman in a light-colored dress appear in the background, walking toward the...\n**2425.6s:** 9 people | A woman with a backpack enters from the left foreground, and a man is seen sitting on the glass floor...\n**2428.1s:** 7 people | scene static, no change", "reference": "**2420.6s:** 7 people | Visitors walk across an elevated glass canopy bridge within a large indoor botanical garden\n**2424.4s:** 8 people | A visitor sits down on the glass floor to pose for a photo as a man in a white shirt...\n**2429.4s:** 7 people | scene static, no change"}
|
| 48 |
+
{"example_idx": 47, "prediction": "**210.6s:** 15+ people | Wide view of a multi-level mall with a \"COCORICE\" cafe and various shoppers in the distance\n**213.1s:** 12 people | Perspective shifts to a hallway where a man in a yellow shirt and a woman walk away from the camera\n**215.6s:** 14 people | A man in a grey shirt carrying a blue bag enters from the right as the digital screen updates to...\n**218.1s:** 16 people | A woman in a grey top enters from the right foreground, and a group of people gathers near an escalator...\n**219.4s:** 12 people | The camera pans to follow the woman in the grey top as she walks past a shop labeled \"CENTRAL WORLD\"...", "reference": "**210.6s:** 12 people | View of a \"COUCOU\" restaurant and shoppers on multiple mall levels from an upper-floor balcony\n**211.9s:** 10 people | scene static, no change\n**213.1s:** 8 people | Perspective shifts to follow a couple walking past a large digital billboard advertising \"Quick.\"\n**214.4s:** 7 people | A man in a blue cap with a backpack enters the foreground as the couple continues walking\n**219.4s:** 15 people | The group reaches an elevator lobby where several people, including one with a stroller, are waiting"}
|
| 49 |
+
{"example_idx": 48, "prediction": "**1370.6s:** 1 people | A Malaysia Airlines aircraft is parked at the gate with its cargo hold open, surrounded by several white baggage carts...\n**1376.9s:** 0 people | The scene changes to a different angle showing an AirAsia aircraft taxiing on the tarmac with its landing and taxi...", "reference": "**1370.6s:** 2 people | ground crew members are loading luggage into the cargo hold of an AirAsia aircraft via a conveyor belt system\n**1374.4s:** 0 people | scene static, no change\n**1376.9s:** 0 people | an AirAsia Airbus A320 is shown stationary on the tarmac with aircraft hangars and trees in the background"}
|
| 50 |
+
{"example_idx": 49, "prediction": "**2160.6s:** 12 people | Visitors stand on an elevated bridge overlooking a large indoor waterfall under a geometric glass dome\n**2165.6s:** 15 people | A Skytrain enters the bottom right foreground as more visitors appear on the bridge\n**2169.4s:** 8 people | scene static, no change", "reference": "**2160.6s:** 11 people | View of the Rain Vortex and bridge with tourists walking and taking photos under the glass dome\n**2163.1s:** 12 people | scene static, no change\n**2169.4s:** 7 people | scene static, no change"}
|
| 51 |
+
{"example_idx": 50, "prediction": "**800.6s:** 2 people | View of an airport museum display case featuring model airplanes\n**803.1s:** 1 people | A person in a white jacket appears on the left, looking out the window at the airfield\n**806.9s:** 6 people | The scene shifts to an airport observation deck where several people are gathered, with one individual taking a photo\n**809.4s:** 10 people | A wider view of the observation deck reveals a crowded lounge area with passengers seated and others walking in the...", "reference": "**800.6s:** 0 people | A display area features model airplanes and a \"ROKON JET\" poster behind blue stanchion ropes\n**801.9s:** 1 people | A woman wearing a black hat and a baby carrier stands by a large window looking out at the airport...\n**805.6s:** 0 people | The camera pans away from the window to show a clear view of parked ANA aircraft and airport service vehicles...\n**809.4s:** 2 people | The woman is joined by a man at the window as they observe the airplanes together"}
|
| 52 |
+
{"example_idx": 51, "prediction": "**380.6s:** 15 people | A man in a grey shirt and cap walks through a lush indoor garden while looking at his phone\n**381.9s:** 45 people | The man continues walking as a large crowd gathers around a central fountain in the background plaza\n**384.4s:** 55 people | scene static, no change\n**385.6s:** 50 people | The camera pans right, showing the crowd density near the fountain and a person in an orange shirt beginning to...\n**388.1s:** 60 people | A woman with a baby carrier enters the frame from the right as the camera focuses on the staircase and...", "reference": "**380.6s:** 30+ people | A man in a striped shirt walks up a staircase lined with lush green plants, while a couple sits on...\n**384.4s:** 25+ people | scene static, no change\n**386.9s:** 50+ people | The scene shifts to a wide view of the central indoor waterfall (Rain Vortex), with a large crowd of tourists...\n**388.1s:** 55+ people | A person with a black backpack enters the foreground on the right as the camera continues to pan across the..."}
|
| 53 |
+
{"example_idx": 52, "prediction": "**1270.6s:** 0 people | A Japan Airlines airplane is in flight, ascending into a clear blue sky\n**1276.9s:** 0 people | The airplane continues to climb, moving toward the upper right of the frame\n**1279.4s:** 0 people | scene static, no change", "reference": "**1270.6s:** 0 people | A Jetstar airplane is seen ascending into the sky immediately after takeoff\n**1279.4s:** 0 people | scene static, no change"}
|
| 54 |
+
{"example_idx": 53, "prediction": "**2000.6s:** 12 people | A man in a blue shirt leans over a table in a cafe area while others walk in the background\n**2001.9s:** 25 people | The camera pans right, revealing a large crowd of people walking through a bright indoor plaza with trees\n**2004.4s:** 30 people | A woman in a black shirt walks toward the camera in the foreground as the crowd moves through the center...\n**2008.1s:** 35 people | A man in a dark shirt and a woman pulling a suitcase walk toward the camera amidst the flowing crowd\n**2009.4s:** 40 people | The camera pans further left to reveal the \"CHECKING-IN\" entrance as a young girl in a white shirt walks into...", "reference": "**2000.6s:** 16 people | Customers dine at an outdoor cafe while travelers walk past a circular, glass-walled restaurant under a large glass dome\n**2001.9s:** 20 people | scene static, no change\n**2003.1s:** 24 people | A man in a blue shirt appears in the left foreground while the central walkway becomes more crowded with travelers\n**2006.9s:** 28 people | A woman in a black t-shirt and a man pulling a silver suitcase walk directly toward the camera from the...\n**2009.4s:** 32 people | The travelers with the suitcase move into the close foreground as a new woman in a white t-shirt enters from..."}
|
| 55 |
+
{"example_idx": 54, "prediction": "**1210.6s:** 15 people | scene static, no change\n**1211.9s:** 22 people | The camera pans left, revealing a crowded mall corridor and a man in a red shirt walking away\n**1214.4s:** 31 people | A wide view of the concourse shows an escalator and a Skechers store, with many travelers and shoppers moving through...\n**1216.9s:** 26 people | A woman in a white shirt pulling a red suitcase enters the foreground while the camera continues to pan\n**1219.4s:** 20 people | scene static, no change", "reference": "**1210.6s:** 18 people | Crowded mall corridor near a Shake Shack\n**1213.1s:** 20 people | A man in a red shirt moves to the left counter while a man in a white shirt and a...\n**1215.6s:** 19 people | The man in the dark grey shirt approaches the camera closely as a woman with a bright red suitcase enters...\n**1216.9s:** 18 people | A young girl in a pink shirt enters the foreground carrying a pink bag\n**1219.4s:** 21 people | A man in a dark polo shirt moves into the foreground on the left while the crowd near the escalator..."}
|
| 56 |
+
{"example_idx": 55, "prediction": "**440.6s:** 12 people | A man in a white hoodie walks through a terminal past luggage lockers and seated travelers\n**443.1s:** 14 people | A woman with a black backpack enters from the left as the man in the white hoodie continues toward the...\n**445.6s:** 18 people | The camera pans right to reveal a dense crowd gathered near a shop in the distance\n**448.1s:** 22 people | A detailed directional sign for \"4F Food Court\" and various food stalls appears in the foreground as the crowd moves...", "reference": "**440.6s:** 30+ people | others sit and stand in the large station hall\n**444.4s:** 35+ people | Two women, one in a maroon shirt and one in a black shirt, enter the left foreground\n**446.9s:** 30+ people | The foreground women have exited the frame, revealing a large crowd gathered in the distance near the JR station entrance\n**448.1s:** 25+ people | A woman in a long skirt and backpack walks from left to right"}
|
| 57 |
+
{"example_idx": 56, "prediction": "**1070.6s:** 15 people | Two attendants in red uniforms walk away through a terminal corridor past a \"Bakery & Coffee\" shop\n**1074.4s:** 12 people | The camera pans right, revealing the \"LukKarn Thai Royal Cooking\" restaurant and potential diners seated at outdoor-style tables\n**1076.9s:** 10 people | A closer view of the restaurant's entrance shows a man in a blue shirt standing near the seating area\n**1078.1s:** 12 people | The view shifts to the restaurant's interior, showing patrons seated at tables with large windows overlooking an airfield\n**1079.4s:** 15 people | A detailed view of the dining area reveals passengers eating at tables equipped with large glass panels for viewing the...", "reference": "**1070.6s:** 18 people | A crowded airport terminal hallway with travelers\n**1074.4s:** 10 people | The camera pans right toward the LukKaiThong restaurant entrance, where staff stand near a cleaning cart and patrons are seated...\n**1079.4s:** 6 people | scene static, no change"}
|
| 58 |
+
{"example_idx": 57, "prediction": "**30.6s:** 18 people | People gather around a large Christmas tree in an indoor garden featuring lush greenery and a waterfall\n**31.9s:** 16 people | A subtitle about airplane noise appears as the crowd density near the tree base decreases\n**35.6s:** 10 people | The subtitle disappears and the man in the light blue shirt raises his phone to capture the scene\n**38.1s:** 6 people | The man in the blue shirt moves out of view, revealing more of the tree and the surrounding forest-like environment", "reference": "**30.6s:** 18 people | scene static, no change\n**33.1s:** 15 people | A woman in a black patterned dress walks toward the right while a man in a white polo shirt moves...\n**34.4s:** 14 people | The man in the white polo shirt reaches the immediate foreground as a woman in a blue shirt poses with...\n**35.6s:** 12 people | The foreground man exits the frame, and the crowd thins out near the central walkway\n**39.4s:** 8 people | scene static, no change"}
|
| 59 |
+
{"example_idx": 58, "prediction": "**180.6s:** 12 people | a woman in a grey hoodie and another in a yellow shirt walk away in the center\n**181.9s:** 13 people | A woman in a red shirt enters from the right, walking toward the center\n**184.4s:** 12 people | The woman in red exits right; a woman with a large patterned bag enters from the left\n**185.6s:** 11 people | The woman with the patterned bag moves into the center foreground, partially obscuring the view of the concourse\n**188.1s:** 10 people | The woman with the patterned bag exits right, revealing a woman in a black shirt walking toward the camera on...", "reference": "**180.6s:** 15+ people | scene static, no change\n**181.9s:** 15+ people | scene static, no change\n**183.1s:** 15+ people | A woman and a young boy walk towards the camera, while a woman in a dark blue hoodie and patterned...\n**185.6s:** 12+ people | A worker pushing a cart with a large red bin enters the scene from the right as the pedestrians continue..."}
|
| 60 |
+
{"example_idx": 59, "prediction": "**990.6s:** 0 people | Close-up of mannequin legs in a museum display case wearing historical flight attendant uniforms\n**993.1s:** 0 people | Wide view of the \"History of Airports\" exhibit with model aircraft and vintage luggage on display\n**995.6s:** 2 people | A large model airplane is shown in a central display case while two visitors are visible in the background looking...\n**996.9s:** 4 people | A vintage white jacket is displayed next to a \"Vintage Jackets\" sign as more visitors appear in the background\n**999.4s:** 6 people | A group of visitors is gathered by a large glass partition in the background observing the exhibit", "reference": "**990.6s:** 0 people | A museum display featuring mannequins in historical airline uniforms behind a glass case\n**991.9s:** 5 people | A blurred view of several people walking through a brightly lit concourse or hallway\n**993.1s:** 0 people | A museum exhibition area with wall-mounted displays and model aircraft in glass cases\n**994.4s:** 2 people | A man and a woman stand by a museum exhibit, looking at displays of historical items and model planes\n**998.1s:** 3 people | A group of individuals stand in the background of a museum space, looking out through large windows"}
|
| 61 |
+
{"example_idx": 60, "prediction": "**400.6s:** 100+ people | Wide shot of the Jewel Changi Rain Vortex waterfall with a large crowd of visitors gathered around the viewing area...\n**403.1s:** 50+ people | The camera tilts upward, focusing on the top of the waterfall as it flows from the glass dome ceiling, shifting...", "reference": "**400.6s:** 100+ people | A large crowd of tourists gathers at the base of the Jewel Changi Rain Vortex waterfall, surrounded by lush indoor..."}
|
| 62 |
+
{"example_idx": 61, "prediction": "**940.6s:** 0 people | Close-up view of a historical timeline board showing text and dates related to New Chitose Airport's opening in 1988\n**943.1s:** 0 people | The camera pans right, revealing more details of the 1988 and 1994 timeline entries\n**945.6s:** 0 people | The pan continues to the left, bringing early timeline entries from 1979, 1981, and 1982 into view\n**948.1s:** 0 people | Significant shift to a different section of the board showcasing prehistoric and early aviation imagery, including a photo of a...\n**949.4s:** 0 people | The final pan reveals older photographs and illustrations, including a cartoon-style drawing of an early aircraft and a photo of...", "reference": "**940.6s:** 0 people | A wall-mounted informational display shows the history of New Chitose Airport, specifically the 1988 section titled \"New Chitose Airport is...\n**943.1s:** 0 people | scene static, no change\n**945.6s:** 0 people | scene static, no change\n**948.1s:** 0 people | Panning further left reveals historical entries from 1951, 1963, and 1978, accompanied by archival photos of the airport's development\n**949.4s:** 0 people | scene static, no change"}
|
| 63 |
+
{"example_idx": 62, "prediction": "**2960.6s:** 7 people | A man in black shorts and a woman in a grey shirt walk through a lush indoor garden with a...\n**2963.1s:** 11 people | scene static, no change\n**2965.6s:** 10 people | scene static, no change\n**2968.1s:** 12 people | scene static, no change", "reference": "**2960.6s:** 6 people | A walkway in an indoor garden with a child in the foreground and several people walking in the distance\n**2963.1s:** 9 people | A man with a backpack walks into the foreground while the camera focuses on a platform with blue gift boxes\n**2964.4s:** 7 people | A man carrying a child on his shoulders walks across the decorated platform alongside other visitors\n**2966.9s:** 7 people | A child in a red outfit sits on the floor near a blue structure while people walk toward a distant...\n**2968.1s:** 10 people | A group of people walks along a tree-lined path toward a large decorative archway"}
|
| 64 |
+
{"example_idx": 63, "prediction": "**1810.6s:** 25 people | A man in a black t-shirt pulls a suitcase through an airport terminal past a food court and seated travelers\n**1813.1s:** 5 people | scene static, no change\n**1819.4s:** 10 people | The camera pans right to reveal a \"Ya Kun Kaya Toast\" stall and a seating area where several passengers are...", "reference": "**1810.6s:** 18 people | A man in a black shirt pulls two suitcases down a wide airport corridor past food stalls and seating areas\n**1811.9s:** 12 people | A traveler with a backpack stops at the \"Thai Street Food\" stall while the man with suitcases continues down the...\n**1815.6s:** 10 people | A woman in a black shirt joins the man at the food stall counter\n**1816.9s:** 9 people | The man with the backpack departs, leaving the woman at the counter as the camera pans toward the next stall\n**1819.4s:** 14 people | A man in a blue polo shirt appears at the \"Au We White Coffee\" counter as the man with suitcases..."}
|
| 65 |
+
{"example_idx": 64, "prediction": "**570.6s:** 2 people | A staff member stands behind a noodle shop counter beneath large backlit menu displays\n**573.1s:** 4 people | scene static, no change\n**575.6s:** 1 people | The camera pans into a hallway, showing a person walking in the distance\n**576.9s:** 5 people | A group of people are seen sitting at tables in a dining area with luggage placed against the wall\n**579.4s:** 8 people | The KFC logo becomes clearly visible as the camera reveals more of the dining area and additional patrons", "reference": "**570.6s:** 2 people | A customer stands at the Imm Rice & Noodle counter while a staff member works behind it\n**574.4s:** 1 people | scene static, no change\n**578.1s:** 2 people | The view transitions to a seating area near a KFC where suitcases are parked by a wall"}
|
| 66 |
+
{"example_idx": 65, "prediction": "**1590.6s:** 2 people | View of the \"Royce Chocolate World\" storefront with people walking in the background\n**1593.1s:** 11 people | scene static, no change\n**1594.4s:** 10 people | scene static, no change\n**1596.9s:** 10 people | scene static, no change", "reference": "**1590.6s:** 3 people | a man with a backpack walks past a circular display\n**1591.9s:** 4 people | Transition to a different area of the shop\n**1593.1s:** 6 people | two women are packing items into a bag; New view of the service counter\n**1595.6s:** 8 people | pedestrians are walking through the corridor\n**1598.1s:** 11 people | a man pushes a cart with multiple suitcases on the left; Crowd density increases in the hallway"}
|
| 67 |
+
{"example_idx": 66, "prediction": "**2760.6s:** 6 people | A woman in a white vest and blue hat pulls a suitcase and carries a bag walks through a lush...\n**2763.1s:** 4 people | scene static, no change\n**2765.6s:** 15 people | A long queue of people is visible on the left side under a large, twisted metal sculpture\n**2768.1s:** 20 people | A woman and a young child enter the scene from the right, walking towards the camera under the sculpture", "reference": "**2760.6s:** 11 people | A man with a suitcase and paper bag walks through an indoor garden past a Marvel exhibition\n**2765.6s:** 8 people | scene static, no change\n**2768.1s:** 10 people | A woman and a child enter the foreground on the right near a large, reflective metal walkway"}
|
| 68 |
+
{"example_idx": 67, "prediction": "**1850.6s:** 25 people | a man in a white t-shirt and black cap is seated on the right looking at his phone\n**1851.9s:** 24 people | The man in the white t-shirt stands up and walks toward the background as a woman in a black shirt...\n**1853.1s:** 23 people | A man in a red shirt is now seen seated in the foreground right, looking at his phone\n**1854.4s:** 22 people | A man in a black shirt with a yellow scarf enters the frame from the right foreground\n**1856.9s:** 21 people | A man in a black shirt and blue jeans walks across the foreground from right to left", "reference": "**1850.6s:** 32 people | A crowded airport waiting area with multiple rows of seating\n**1851.9s:** 31 people | The digital advertisement on the central pillar has changed from a car image to blue text"}
|
| 69 |
+
{"example_idx": 68, "prediction": "**2920.6s:** 11 people | Crowded indoor garden walkway with visitors walking in multiple directions near a large cartoon bird sculpture\n**2923.1s:** 9 people | scene static, no change\n**2924.4s:** 10 people | A woman in a black shirt and grey skirt enters the foreground from the right\n**2926.9s:** 8 people | A person pushing a stroller becomes visible in the center of the path as the foreground woman moves out of...", "reference": "**2920.6s:** 12 people | A crowd of visitors walks towards the camera in a lush indoor garden atrium featuring a glass dome ceiling and...\n**2923.1s:** 8 people | The foreground crowd moves out of view, revealing a \"Jewel-Rassic Quest\" digital sign and a couple walking away down the...\n**2929.4s:** 10 people | A man carrying an infant in a front carrier enters the scene from the right foreground while others continue walking..."}
|
| 70 |
+
{"example_idx": 69, "prediction": "**0.6s:** 0 people | scene static, no change\n**1.9s:** 0 people | An AirAsia aircraft is seen landing on the runway\n**4.4s:** 0 people | A Thai Lion Air plane is taxiing across the foreground\n**8.1s:** 0 people | A second Lion Air aircraft is visible on the tarmac in the background", "reference": "**0.6s:** 0 people | An AirAsia aircraft lands on a runway at an airport during twilight\n**4.4s:** 0 people | Overlay text \"TOUR FROM HOME TV PRESENTS\" appears as an AirAsia plane taxies toward the camera\n**6.9s:** 5 people | Ground crew members in safety vests work near the cargo hold of a Myanmar Airways International aircraft\n**8.1s:** 0 people | A Thai Lion Air plane taxies on the runway with another aircraft visible in the background"}
|
| 71 |
+
{"example_idx": 70, "prediction": "**60.6s:** 0 people | Initial view of a modern airport terminal interior featuring a large glass elevator and complex steel truss architecture\n**61.9s:** 6 people | a \"LOVE\" sculpture is visible on the left with travelers walking in the background\n**64.4s:** 12 people | scene static, no change\n**66.9s:** 15 people | A group of travelers, including a woman in a red dress and others with luggage trolleys, gathers on the right...\n**68.1s:** 12 people | scene static, no change", "reference": "**60.6s:** 6 people | High-angle wide shot of the New Chitose Airport lobby featuring a large glass elevator structure and an intricate lattice ceiling\n**61.9s:** 12 people | Perspective shifts to ground level near a \"HOKKAIDO LOVE!\" sign where travelers are walking through the terminal\n**66.9s:** 14 people | A woman pushing a stroller enters the foreground from the right, moving across the lobby\n**69.4s:** 18 people | The scene shifts to show people using an escalator and walking towards the \"Gourmet World\" area"}
|
| 72 |
+
{"example_idx": 71, "prediction": "**1210.6s:** 12 people | View of an airport terminal featuring a long moving walkway on the left and a seating area on the right...\n**1216.9s:** 18 people | scene static, no change\n**1219.4s:** 22 people | Continued pan shows a dense crowd of travelers seated in a waiting area near large windows", "reference": "**1210.6s:** 14 people | Wide view of an airport corridor with a moving walkway on the left and several travelers walking in the distance\n**1216.9s:** 28 people | scene static, no change"}
|
| 73 |
+
{"example_idx": 72, "prediction": "**2540.6s:** 12 people | A woman in black and a man in a grey shirt pose for a photo on the high glass walkway...\n**2544.4s:** 15 people | scene static, no change\n**2545.6s:** 8 people | scene static, no change\n**2548.1s:** 25 people | The camera pans down to reveal a large crowd of people gathered at the base of the waterfall on the...", "reference": "**2540.6s:** 12 people | A man and woman are positioned on a glass walkway within a lush indoor garden under a large geometric glass...\n**2544.4s:** 32 people | scene static, no change\n**2546.9s:** 65 people | The couple on the walkway exits the frame as the camera focuses on the full waterfall and the dense crowds..."}
|
| 74 |
+
{"example_idx": 73, "prediction": "**1100.6s:** 18 people | A man in a yellow mascot costume stands near an escalator while travelers walk through a bright airport terminal past...\n**1101.9s:** 16 people | A couple carrying a child walks toward the camera as the mascot moves to the far left of the frame\n**1104.4s:** 15 people | The couple with the child passes into the foreground\n**1105.6s:** 14 people | scene static, no change\n**1108.1s:** 12 people | The children move toward the background as a man in a black t-shirt enters the scene from the right", "reference": "**1100.6s:** 14 people | A man walks with a purple suitcase past a Coach store as other travelers move through the mall\n**1101.9s:** 16 people | The man with the suitcase moves into the right foreground while more people walk towards the terminal\n**1105.6s:** 10 people | A woman in a black shirt enters the foreground while other travelers move towards the terminal gates\n**1108.1s:** 13 people | The woman in blue approaches as two men wheeling large suitcases walk towards the foreground\n**1109.4s:** 10 people | The woman in blue exits the frame as the two men with suitcases move into the foreground"}
|
| 75 |
+
{"example_idx": 74, "prediction": "**620.6s:** 4 people | Customers order at a Subway restaurant counter\n**624.4s:** 6 people | scene static, no change\n**626.9s:** 8 people | A man in a grey shirt appears in the foreground as the camera continues to pan right, revealing more of...\n**628.1s:** 10 people | A woman in a black and white patterned shirt enters the frame from the right\n**629.4s:** 12 people | A man in a blue shirt walks into the scene from the far right", "reference": "**620.6s:** 4 people | Front view of a Subway counter with two staff members preparing food and two customers waiting\n**626.9s:** 4 people | scene static, no change\n**628.1s:** 4 people | Close-up of the noodle shop counter as a customer in a plaid shirt interacts with the staff"}
|
| 76 |
+
{"example_idx": 75, "prediction": "**800.6s:** 12 people | Travelers with luggage stand near a storage area and information desk in a brightly lit terminal\n**803.1s:** 15 people | A man in a white shirt and straw hat stands by a blue suitcase as the camera pans toward a...\n**805.6s:** 18 people | A woman in a black shirt and pink mask enters the foreground while the camera continues to pan right, revealing...\n**808.1s:** 20 people | A man in a black t-shirt and a woman in a black shirt with a white shopping bag enter the...", "reference": "**800.6s:** 15 people | a man pushes a luggage cart in the center\n**803.1s:** 22 people | scene static, no change\n**805.6s:** 18 people | The view transitions to a hallway featuring a large vertical green wall on the right as people walk toward an...\n**808.1s:** 14 people | Travelers with luggage head toward the 'Customs Inspection' zone"}
|
| 77 |
+
{"example_idx": 76, "prediction": "**2950.6s:** 12 people | Visitors stand near a large mesh rope bridge and elevated green walkway in a sunlit indoor garden\n**2953.1s:** 18 people | scene static, no change\n**2958.1s:** 14 people | scene static, no change", "reference": "**2950.6s:** 6 people | Visitors pass through an entrance gate into an indoor park featuring a large geometric glass roof and lush greenery\n**2953.1s:** 15 people | The camera pans right to reveal an elevated netting structure where numerous people are walking and climbing high above the...\n**2956.9s:** 18 people | scene static, no change\n**2959.4s:** 12 people | Visitors walk along a curved pathway on the ground level, surrounded by dense tropical plants with the netting structure visible..."}
|
| 78 |
+
{"example_idx": 77, "prediction": "**400.6s:** 12 people | Travelers walk through a terminal hall under a \"Departures\" sign\n**403.1s:** 10 people | A woman in a yellow shirt pulls a suitcase toward the left foreground\n**405.6s:** 8 people | A staff member in a blue vest walks across the center of the hall\n**408.1s:** 15 people | The view transitions to an escalator looking down at a crowded lower level", "reference": "**400.6s:** 10 people | A group of travelers stands with luggage near an autonomous cleaning robot in a spacious airport terminal lobby\n**404.4s:** 12 people | A staff member in a safety vest walks directly across the foreground, momentarily obscuring the view of the terminal\n**405.6s:** 0 people | scene static, no change\n**406.9s:** 15 people | A staff member in a blue uniform pushes a luggage trolley on the right while a crowd of travelers is...\n**408.1s:** 16 people | A man pushing a stroller and another with a luggage cart walk towards the camera through the terminal corridor"}
|
| 79 |
+
{"example_idx": 78, "prediction": "**2250.6s:** 12 people | A woman in red plaid pants walks left carrying a baby in a carrier\n**2253.1s:** 14 people | A man in a grey shirt pushing a stroller enters from the background\n**2255.6s:** 15 people | A woman in a black shirt and a man in a blue shirt walk toward the camera\n**2256.9s:** 14 people | The woman in the black shirt moves into the close foreground on the left\n**2259.4s:** 12 people | scene static, no change", "reference": "**2250.6s:** 12 people | A woman in plaid walks toward the camera through a lush indoor garden while travelers rest on a bench with...\n**2253.1s:** 14 people | A woman pushing a stroller enters the walkway from the right, moving toward the foreground\n**2256.9s:** 15 people | A man pushing a second stroller appears in the background as the first stroller moves out of frame\n**2259.4s:** 13 people | The man with the stroller reaches the foreground while a man in a blue shirt walks across the background near..."}
|
| 80 |
+
{"example_idx": 79, "prediction": "**270.6s:** 8 people | A man in a black shirt walks past a shop towards a large terminal hall\n**271.9s:** 12 people | scene static, no change\n**273.1s:** 18 people | The perspective shifts to a wide view of the terminal, revealing a man in a black jacket walking away and...\n**275.6s:** 22 people | A woman with a white shopping bag enters the foreground from the right as the camera pans\n**278.1s:** 25 people | A man in a blue denim jacket pulling a red suitcase walks towards the camera through the busy terminal", "reference": "**270.6s:** 12 people | View of a souvenir shop with several shoppers\n**273.1s:** 14 people | The camera pans left, revealing a woman in a white top and black cardigan in the foreground right\n**275.6s:** 20 people | travelers with luggage are visible in the background\n**278.1s:** 30 people | In the main concourse, crowd density increases as a man with a red suitcase and other travelers navigate the open..."}
|
| 81 |
+
{"example_idx": 80, "prediction": "**2670.6s:** 12 people | scene static, no change\n**2674.4s:** 10 people | The three women have crossed the foreground, and two new women with suitcases enter from the right\n**2678.1s:** 8 people | A family group with several children and suitcases gathers on the path as the previous pedestrians move further away", "reference": "**2670.6s:** 11 people | Travelers walk past a large purple floral elephant sculpture in a lush indoor garden setting\n**2673.1s:** 13 people | Camera shifts to follow travelers with luggage as they navigate a curved wooden walkway\n**2678.1s:** 8 people | The path opens into a wider thoroughfare where travelers with multiple colorful suitcases are gathered"}
|
| 82 |
+
{"example_idx": 81, "prediction": "**1680.6s:** 10 people | Visitors stand on an observation deck, taking photos near a large indoor waterfall\n**1681.9s:** 8 people | A woman holding a baby appears in the foreground as the camera pans right\n**1683.1s:** 6 people | A man in a green shirt enters the foreground to take a photo\n**1684.4s:** 5 people | The man in green moves left, and the woman with the baby continues taking a picture\n**1685.6s:** 0 people | scene static, no change", "reference": "**1680.6s:** 12 people | Tourists gather on a balcony near a large indoor waterfall\n**1681.9s:** 10 people | A woman in an orange top moves into the foreground as others adjust their positions for photos\n**1683.1s:** 8 people | A man in a green shirt enters from the left while a woman poses with a purple teddy bear\n**1684.4s:** 6 people | scene static, no change\n**1686.9s:** 30+ people | The foreground group has moved out of view, revealing a wide perspective of the waterfall and crowds on lower levels"}
|
| 83 |
+
{"example_idx": 82, "prediction": "**750.6s:** 8 people | A man pushes a luggage cart toward the camera in an airport terminal\n**751.9s:** 12 people | scene static, no change\n**754.4s:** 15 people | scene static, no change\n**759.4s:** 20 people | A wider view of the terminal reveals more passengers walking through the concourse near the escalator", "reference": "**750.6s:** 11 people | View of a terminal hallway with \"Cafe Amazon\" on the left, a cleaning robot, and travelers with luggage\n**751.9s:** 11 people | scene static, no change\n**753.1s:** 7 people | A woman in a white shirt appears on the right as the camera approaches the escalator area\n**754.4s:** 5 people | Focus shifts to the \"Domestic Departures\" sign and a woman in black walking toward the background\n**759.4s:** 0 people | Close-up view of the directory on the Terminal Guide pillar"}
|
| 84 |
+
{"example_idx": 83, "prediction": "**600.6s:** 2 people | View of a KFC service counter with two employees standing behind the counter\n**603.1s:** 2 people | scene static, no change\n**605.6s:** 1 people | scene static, no change\n**606.9s:** 7 people | The scene shifts to a food court corridor, revealing a \"RADIO\" storefront and several patrons walking or seated at tables...\n**608.1s:** 9 people | A closer view of the food court seating area shows a man and two children at a table in the...", "reference": "**600.6s:** 2 people | Two staff members stand behind a KFC service counter under a bright menu display\n**608.1s:** 8 people | scene static, no change"}
|
| 85 |
+
{"example_idx": 84, "prediction": "**950.6s:** 0 people | Close-up of a historical timeline board showing black-and-white photos and text about aviation milestones\n**954.4s:** 0 people | The scene shifts to a museum hallway featuring a glass display case with vintage flight attendant mannequins\n**956.9s:** 0 people | A wide view of the hallway reveals a \"Toilets\" sign and a cartoonish blue bird graphic on the wall\n**958.1s:** 0 people | scene static, no change\n**959.4s:** 0 people | scene static, no change", "reference": "**950.6s:** 0 people | View of a historical aviation exhibit wall with photos and text detailing airport history from 1926 to 1978\n**955.6s:** 0 people | scene static, no change\n**956.9s:** 0 people | A display case containing five mannequins dressed in historical flight attendant uniforms comes into view\n**958.1s:** 1 people | A woman with a backpack enters the scene on the left, walking toward the \"Airport Theater\" while holding up a...\n**959.4s:** 0 people | scene static, no change"}
|
| 86 |
+
{"example_idx": 85, "prediction": "**300.6s:** 15 people | a woman in a grey top and white bag walks left while a man with a backpack stands near a...\n**303.1s:** 12 people | A woman in a red dress enters from the left as others continue walking through the terminal\n**305.6s:** 10 people | A woman pulling a white suitcase walks away from the camera towards the center of the hall\n**308.1s:** 12 people | A woman in a white shirt and black pants enters from the right, walking across the geometric patterned floor", "reference": "**300.6s:** 25 people | Wide view of a busy airport terminal with a souvenir shop and statue\n**303.1s:** 22 people | scene static, no change\n**305.6s:** 18 people | The foreground clears, revealing a woman with a white suitcase walking toward the background shops\n**306.9s:** 20 people | scene static, no change\n**309.4s:** 22 people | A man with a large red suitcase enters from the left while crowd density increases near the background stores"}
|
| 87 |
+
{"example_idx": 86, "prediction": "**320.6s:** 12 people | A man in a green cap and a woman in a black shirt walk away in the foreground of a...\n**321.9s:** 14 people | A woman in a white jacket and a man pulling a suitcase enter the scene from the left\n**323.1s:** 15 people | A man in a plaid shirt walks toward the camera while a woman in a black-and-white patterned top crosses the...\n**324.4s:** 14 people | A man in a light blue shirt enters from the left as others continue walking toward the shop\n**328.1s:** 12 people | A woman with a baby in a carrier and a man in a black shirt walk toward the camera", "reference": "**320.6s:** 15 people | Crowded airport hallway with travelers walking past confectionery shops and food stalls\n**321.9s:** 14 people | A woman with a suitcase and white shopping bag enters the foreground from the right\n**323.1s:** 16 people | A man in a plaid shirt enters the scene from the right foreground, walking towards the center\n**325.6s:** 14 people | A man in a grey t-shirt and shorts enters from the right foreground, walking towards the left\n**329.4s:** 13 people | Two women enter from the right foreground, walking quickly across the hallway"}
|
| 88 |
+
{"example_idx": 87, "prediction": "**830.6s:** 2 people | A man and a girl are seen inside a glass elevator shaft surrounded by lush vertical gardens and trees\n**835.6s:** 1 people | scene static, no change\n**838.1s:** 4 people | The scene shifts to an indoor terminal corridor where a couple walks past a McDonald's on the left and a...\n**839.4s:** 5 people | A young woman in a pink shirt enters the foreground from the right as the couple continues down the hallway", "reference": "**830.6s:** 10 people | View of a multi-level atrium with a glass dome ceiling, greenery, and glass elevators\n**834.4s:** 4 people | The perspective shifts to ground level, showing a child on a stone path amidst indoor bamboo\n**839.4s:** 10 people | The scene transitions to a mall corridor with shops and people walking"}
|
| 89 |
+
{"example_idx": 88, "prediction": "**2550.6s:** 40+ people | A Skytrain passes through the foreground tunnel as people gather around the base of the indoor waterfall\n**2553.1s:** 40+ people | The Skytrain has exited the foreground, providing a clear view of the circular water feature and the surrounding crowd\n**2556.9s:** 45+ people | scene static, no change\n**2559.4s:** 45+ people | scene static, no change", "reference": "**2550.6s:** 100+ people | the Skytrain track in the foreground is empty\n**2553.1s:** 100+ people | scene static, no change\n**2555.6s:** 100+ people | The Skytrain passes directly in front of the waterfall as it continues its crossing\n**2559.4s:** 100+ people | scene static, no change"}
|
| 90 |
+
{"example_idx": 89, "prediction": "**890.6s:** 12 people | A man in a plaid shirt stands by a window looking at airplanes while others wait in a line near...\n**893.1s:** 15 people | A woman in a light blue shirt enters the foreground from the right as the man in the plaid shirt...\n**894.4s:** 14 people | A man pushing a luggage cart and a woman in a black hijab walk toward the background\n**896.9s:** 12 people | A woman in a grey sweatshirt enters from the left foreground\n**899.4s:** 10 people | Several people, including a man in a black shirt and a woman in a light blue top, walk toward the...", "reference": "**890.6s:** 17 people | Initial view of an airport observation lounge with travelers looking out large windows and walking through the hall\n**893.1s:** 13 people | A woman in a white t-shirt walks across the foreground while a man pushes a luggage trolley down the center...\n**895.6s:** 12 people | the man with the luggage trolley continues away from the camera\n**898.1s:** 12 people | scene static, no change"}
|
| 91 |
+
{"example_idx": 90, "prediction": "**2090.6s:** 12 people | scene static, no change\n**2091.9s:** 14 people | The camera pans right, revealing a woman in a black top and a man in a white shirt walking away...\n**2093.1s:** 16 people | A family with a child in a stroller becomes the central subject as the camera follows their movement through the...\n**2096.9s:** 18 people | The family with the stroller moves into the foreground left, while a couple walks towards the camera from the background...\n**2099.4s:** 15 people | scene static, no change", "reference": "**2090.6s:** 8 people | a woman with a stroller is on the right\n**2091.9s:** 9 people | a man in a green patterned shirt appears on the right\n**2094.4s:** 13 people | A family with a stroller appears in the middle ground; crowd density increases in the background\n**2096.9s:** 15 people | two women appear walking toward the camera from the background right\n**2099.4s:** 16 people | The family with the stroller moves toward the left edge"}
|
| 92 |
+
{"example_idx": 91, "prediction": "**1040.6s:** 1 people | A woman with a bright green bag stands by a window, looking out at an airfield\n**1041.9s:** 2 people | A woman in a black dress descends an indoor staircase while carrying a patterned bag\n**1044.4s:** 2 people | Outdoors, a woman in a black dress with a floral bag walks toward the camera on a paved path\n**1045.6s:** 3 people | Two women ascend an outdoor staircase, one pulling a silver suitcase and the other carrying a white shopping bag\n**1048.1s:** 3 people | At the top of the stairs, the women move toward a gate surrounded by a tall metal fence and surveillance...", "reference": "**1040.6s:** 1 people | Standing by a large window overlooking an airfield, carrying a bright green bag\n**1041.9s:** 1 people | the person with the green bag is partially visible on the left; Perspective shifts to a tiled wall with a...\n**1044.4s:** 2 people | On an outdoor staircase, a woman in a dark dress descends with luggage while a blonde person ascends with a...\n**1046.9s:** 2 people | The woman with the luggage descends to the bottom left as the blonde person continues climbing the stairs\n**1049.4s:** 3 people | The blonde person reaches the top of the stairs, following another individual with a white suitcase"}
|
| 93 |
+
{"example_idx": 92, "prediction": "**1420.6s:** 15 people | A man in a white shirt and a woman with a yellow suitcase stand near a \"Tokyu\" shop entrance while...\n**1423.1s:** 12 people | A person with a colorful backpack enters the foreground, looking at a digital display kiosk as the crowd in the...\n**1425.6s:** 10 people | The camera pans right towards a \"Smoking Room\" sign as people walk down a corridor lined with shops\n**1428.1s:** 12 people | A group of people, including a couple in matching grey shirts, stands near a shop entrance as the camera continues...", "reference": "**1420.6s:** 12 people | A family is posing for a photo while travelers with luggage walk past shops\n**1423.1s:** 15 people | A group of people is visible further down the hallway near a restaurant entrance\n**1425.6s:** 18 people | Several people are queued or walking in the distance\n**1428.1s:** 14 people | A group of travelers with suitcases stands near the restaurant entrance"}
|
| 94 |
+
{"example_idx": 93, "prediction": "**650.6s:** 6 people | A man in a grey shirt walks away through a food court while a woman stands at a Thai food...\n**653.1s:** 12 people | The man continues walking past a seating area where several people are eating at tables on an artificial lawn\n**656.9s:** 15 people | scene static, no change\n**659.4s:** 0 people | scene static, no change", "reference": "**650.6s:** 7 people | A woman in a grey vest stands at a food counter while another woman in dark blue walks away down...\n**651.9s:** 8 people | The woman in the grey vest exits the scene as the camera moves forward, revealing a man in a grey...\n**656.9s:** 14 people | A staff member in a white shirt and face mask appears behind the food stall counter\n**659.4s:** 16 people | scene static, no change"}
|
| 95 |
+
{"example_idx": 94, "prediction": "**870.6s:** 0 people | Close-up of a decorative wall featuring a large map and model airplane\n**871.9s:** 5 people | scene static, no change\n**874.4s:** 15 people | scene static, no change\n**876.9s:** 20 people | Further right reveals a man in a black shirt walking toward the camera and a crowded background hallway\n**879.4s:** 25 people | a large crowd of travelers with luggage is visible near distant gates", "reference": "**870.6s:** 0 people | View of an airport terminal hall featuring a large abstract mural, decorative flags, and a small wooden shrine\n**871.9s:** 12 people | scene static, no change\n**874.4s:** 20 people | Panning continues to show a \"TAXI SERVICE\" counter and a wider view of the terminal with increased crowd density\n**875.6s:** 8 people | scene static, no change\n**876.9s:** 11 people | A woman walks across the foreground past the \"True\" booth while more people gather near the currency exchange and background..."}
|
| 96 |
+
{"example_idx": 95, "prediction": "**1180.6s:** 15 people | a man in a red shirt walks toward the camera while a man and two children stand near a luggage...\n**1181.9s:** 12 people | The man in the red shirt moves into the close foreground as the family near the coffee shop begins to...\n**1183.1s:** 10 people | scene static, no change\n**1186.9s:** 8 people | scene static, no change\n**1189.4s:** 7 people | A man in a grey shirt and green cap bends over to organize a luggage cart in the foreground as...", "reference": "**1180.6s:** 10 people | Travelers move through an airport corridor past a \"Mivana Coffee\" shop\n**1183.1s:** 0 people | scene static, no change\n**1184.4s:** 7 people | New viewpoint shows a \"Gates 1-6\" sign and an escalator as travelers walk toward the camera\n**1185.6s:** 1 people | The corridor clears of walking travelers, and a text overlay regarding boarding gates appears\n**1186.9s:** 2 people | A man begins descending the escalator while another traveler stands nearby with a luggage cart"}
|
| 97 |
+
{"example_idx": 96, "prediction": "**250.6s:** 6 people | A man in a black shirt checks his phone near a suitcase while a woman with a backpack walks through...\n**251.9s:** 10 people | The camera pans right to reveal a man in a white t-shirt and black backpack walking toward the foreground\n**254.4s:** 12 people | A woman in a blue denim jacket walks away as the camera tracks a growing crowd of travelers moving through...\n**258.1s:** 8 people | scene static, no change", "reference": "**250.6s:** 3 people | a woman in a green coat walks across the terminal floor near departure signs\n**251.9s:** 8 people | a woman in a white dress pulls a silver suitcase through the hall\n**253.1s:** 12 people | a crowd is visible in the background\n**255.6s:** 10 people | scene static, no change\n**259.4s:** 9 people | scene static, no change"}
|
| 98 |
+
{"example_idx": 97, "prediction": "**1140.6s:** 0 people | A Korean Air passenger jet is taxiing on the airport runway, moving from left to right\n**1145.6s:** 0 people | scene static, no change\n**1146.9s:** 0 people | The Korean Air aircraft continues to taxi, turning slightly as it moves further down the runway", "reference": "**1140.6s:** 0 people | A Japan Airlines airplane is taxiing on the tarmac, viewed from its rear-left side\n**1143.1s:** 0 people | scene static, no change\n**1145.6s:** 0 people | scene static, no change"}
|
processor_config.json
ADDED
|
@@ -0,0 +1,63 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
{
|
| 2 |
+
"image_processor": {
|
| 3 |
+
"data_format": "channels_first",
|
| 4 |
+
"do_convert_rgb": true,
|
| 5 |
+
"do_normalize": true,
|
| 6 |
+
"do_rescale": true,
|
| 7 |
+
"do_resize": true,
|
| 8 |
+
"image_mean": [
|
| 9 |
+
0.5,
|
| 10 |
+
0.5,
|
| 11 |
+
0.5
|
| 12 |
+
],
|
| 13 |
+
"image_processor_type": "Qwen2VLImageProcessorFast",
|
| 14 |
+
"image_std": [
|
| 15 |
+
0.5,
|
| 16 |
+
0.5,
|
| 17 |
+
0.5
|
| 18 |
+
],
|
| 19 |
+
"merge_size": 2,
|
| 20 |
+
"patch_size": 16,
|
| 21 |
+
"resample": 3,
|
| 22 |
+
"rescale_factor": 0.00392156862745098,
|
| 23 |
+
"size": {
|
| 24 |
+
"longest_edge": 16777216,
|
| 25 |
+
"shortest_edge": 65536
|
| 26 |
+
},
|
| 27 |
+
"temporal_patch_size": 2
|
| 28 |
+
},
|
| 29 |
+
"processor_class": "Qwen3VLProcessor",
|
| 30 |
+
"video_processor": {
|
| 31 |
+
"data_format": "channels_first",
|
| 32 |
+
"default_to_square": true,
|
| 33 |
+
"do_convert_rgb": true,
|
| 34 |
+
"do_normalize": true,
|
| 35 |
+
"do_rescale": true,
|
| 36 |
+
"do_resize": true,
|
| 37 |
+
"do_sample_frames": true,
|
| 38 |
+
"fps": 2,
|
| 39 |
+
"image_mean": [
|
| 40 |
+
0.5,
|
| 41 |
+
0.5,
|
| 42 |
+
0.5
|
| 43 |
+
],
|
| 44 |
+
"image_std": [
|
| 45 |
+
0.5,
|
| 46 |
+
0.5,
|
| 47 |
+
0.5
|
| 48 |
+
],
|
| 49 |
+
"max_frames": 768,
|
| 50 |
+
"merge_size": 2,
|
| 51 |
+
"min_frames": 4,
|
| 52 |
+
"patch_size": 16,
|
| 53 |
+
"resample": 3,
|
| 54 |
+
"rescale_factor": 0.00392156862745098,
|
| 55 |
+
"return_metadata": false,
|
| 56 |
+
"size": {
|
| 57 |
+
"longest_edge": 25165824,
|
| 58 |
+
"shortest_edge": 4096
|
| 59 |
+
},
|
| 60 |
+
"temporal_patch_size": 2,
|
| 61 |
+
"video_processor_type": "Qwen3VLVideoProcessor"
|
| 62 |
+
}
|
| 63 |
+
}
|
tokenizer.json
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:87a7830d63fcf43bf241c3c5242e96e62dd3fdc29224ca26fed8ea333db72de4
|
| 3 |
+
size 19989343
|
tokenizer_config.json
ADDED
|
@@ -0,0 +1,33 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
{
|
| 2 |
+
"add_prefix_space": false,
|
| 3 |
+
"audio_bos_token": "<|audio_start|>",
|
| 4 |
+
"audio_eos_token": "<|audio_end|>",
|
| 5 |
+
"audio_token": "<|audio_pad|>",
|
| 6 |
+
"backend": "tokenizers",
|
| 7 |
+
"bos_token": null,
|
| 8 |
+
"clean_up_tokenization_spaces": false,
|
| 9 |
+
"eos_token": "<|im_end|>",
|
| 10 |
+
"errors": "replace",
|
| 11 |
+
"image_token": "<|image_pad|>",
|
| 12 |
+
"is_local": false,
|
| 13 |
+
"model_max_length": 262144,
|
| 14 |
+
"model_specific_special_tokens": {
|
| 15 |
+
"audio_bos_token": "<|audio_start|>",
|
| 16 |
+
"audio_eos_token": "<|audio_end|>",
|
| 17 |
+
"audio_token": "<|audio_pad|>",
|
| 18 |
+
"image_token": "<|image_pad|>",
|
| 19 |
+
"video_token": "<|video_pad|>",
|
| 20 |
+
"vision_bos_token": "<|vision_start|>",
|
| 21 |
+
"vision_eos_token": "<|vision_end|>"
|
| 22 |
+
},
|
| 23 |
+
"pad_token": "<|endoftext|>",
|
| 24 |
+
"padding_side": "right",
|
| 25 |
+
"pretokenize_regex": "(?i:'s|'t|'re|'ve|'m|'ll|'d)|[^\\r\\n\\p{L}\\p{N}]?[\\p{L}\\p{M}]+|\\p{N}| ?[^\\s\\p{L}\\p{M}\\p{N}]+[\\r\\n]*|\\s*[\\r\\n]+|\\s+(?!\\S)|\\s+",
|
| 26 |
+
"processor_class": "Qwen3VLProcessor",
|
| 27 |
+
"split_special_tokens": false,
|
| 28 |
+
"tokenizer_class": "TokenizersBackend",
|
| 29 |
+
"unk_token": null,
|
| 30 |
+
"video_token": "<|video_pad|>",
|
| 31 |
+
"vision_bos_token": "<|vision_start|>",
|
| 32 |
+
"vision_eos_token": "<|vision_end|>"
|
| 33 |
+
}
|