edbeeching HF Staff committed on
Commit
55054cc
·
verified ·
1 Parent(s): e4c2c81

Model save

Browse files
README.md CHANGED
@@ -5,7 +5,9 @@ model_name: Qwen3-4B-Base-SFT-tr5
5
  tags:
6
  - generated_from_trainer
7
  - trl
 
8
  - sft
 
9
  licence: license
10
  ---
11
 
 
5
  tags:
6
  - generated_from_trainer
7
  - trl
8
+ - trackio:https://huggingface.co/spaces/hf-imo-colab/trackio-distillation-sft
9
  - sft
10
+ - trackio
11
  licence: license
12
  ---
13
 
all_results.json CHANGED
@@ -1,9 +1,9 @@
1
  {
2
  "epoch": 4.6268656716417915,
3
- "total_flos": 829952540540928.0,
4
- "train_loss": 0.3511713839466533,
5
- "train_runtime": 18622.9131,
6
  "train_samples": 4281,
7
- "train_samples_per_second": 1.065,
8
- "train_steps_per_second": 0.033
9
  }
 
1
  {
2
  "epoch": 4.6268656716417915,
3
+ "total_flos": 829202911068160.0,
4
+ "train_loss": 0.33651591361530364,
5
+ "train_runtime": 10914.7384,
6
  "train_samples": 4281,
7
+ "train_samples_per_second": 1.818,
8
+ "train_steps_per_second": 0.057
9
  }
generation_config.json CHANGED
@@ -1,8 +1,6 @@
1
  {
2
  "do_sample": false,
3
- "eos_token_id": [
4
- 151643
5
- ],
6
  "max_new_tokens": 2048,
7
  "pad_token_id": 151643,
8
  "transformers_version": "5.3.0.dev0"
 
1
  {
2
  "do_sample": false,
3
+ "eos_token_id": 151643,
 
 
4
  "max_new_tokens": 2048,
5
  "pad_token_id": 151643,
6
  "transformers_version": "5.3.0.dev0"
train_results.json CHANGED
@@ -1,9 +1,9 @@
1
  {
2
  "epoch": 4.6268656716417915,
3
- "total_flos": 829952540540928.0,
4
- "train_loss": 0.3511713839466533,
5
- "train_runtime": 18622.9131,
6
  "train_samples": 4281,
7
- "train_samples_per_second": 1.065,
8
- "train_steps_per_second": 0.033
9
  }
 
1
  {
2
  "epoch": 4.6268656716417915,
3
+ "total_flos": 829202911068160.0,
4
+ "train_loss": 0.33651591361530364,
5
+ "train_runtime": 10914.7384,
6
  "train_samples": 4281,
7
+ "train_samples_per_second": 1.818,
8
+ "train_steps_per_second": 0.057
9
  }
trainer_state.json CHANGED
The diff for this file is too large to render. See raw diff