Incomple committed on
Commit
2d2d0d2
·
verified ·
1 Parent(s): 48d12a7

End of training

Browse files
Files changed (4) hide show
  1. README.md +3 -3
  2. all_results.json +2 -2
  3. train_results.json +2 -2
  4. trainer_state.json +2 -2
README.md CHANGED
@@ -3,10 +3,10 @@ library_name: peft
3
  license: llama3.1
4
  base_model: meta-llama/Llama-3.1-8B-Instruct
5
  tags:
6
- - trl
7
- - dpo
8
  - llama-factory
9
  - lora
 
 
10
  - generated_from_trainer
11
  model-index:
12
  - name: Llama-3.1-8B-Instruct_holistic
@@ -18,7 +18,7 @@ should probably proofread and complete it, then remove this comment. -->
18
 
19
  # Llama-3.1-8B-Instruct_holistic
20
 
21
- This model is a fine-tuned version of [meta-llama/Llama-3.1-8B-Instruct](https://huggingface.co/meta-llama/Llama-3.1-8B-Instruct) on an unknown dataset.
22
 
23
  ## Model description
24
 
 
3
  license: llama3.1
4
  base_model: meta-llama/Llama-3.1-8B-Instruct
5
  tags:
 
 
6
  - llama-factory
7
  - lora
8
+ - trl
9
+ - dpo
10
  - generated_from_trainer
11
  model-index:
12
  - name: Llama-3.1-8B-Instruct_holistic
 
18
 
19
  # Llama-3.1-8B-Instruct_holistic
20
 
21
+ This model is a fine-tuned version of [meta-llama/Llama-3.1-8B-Instruct](https://huggingface.co/meta-llama/Llama-3.1-8B-Instruct) on the holistic dataset.
22
 
23
  ## Model description
24
 
all_results.json CHANGED
@@ -2,7 +2,7 @@
2
  "epoch": 0.9997303855486654,
3
  "total_flos": 1.1904720283191214e+18,
4
  "train_loss": 0.15248539275464632,
5
- "train_runtime": 30996.046,
6
- "train_samples_per_second": 0.479,
7
  "train_steps_per_second": 0.06
8
  }
 
2
  "epoch": 0.9997303855486654,
3
  "total_flos": 1.1904720283191214e+18,
4
  "train_loss": 0.15248539275464632,
5
+ "train_runtime": 30932.1025,
6
+ "train_samples_per_second": 0.48,
7
  "train_steps_per_second": 0.06
8
  }
train_results.json CHANGED
@@ -2,7 +2,7 @@
2
  "epoch": 0.9997303855486654,
3
  "total_flos": 1.1904720283191214e+18,
4
  "train_loss": 0.15248539275464632,
5
- "train_runtime": 30996.046,
6
- "train_samples_per_second": 0.479,
7
  "train_steps_per_second": 0.06
8
  }
 
2
  "epoch": 0.9997303855486654,
3
  "total_flos": 1.1904720283191214e+18,
4
  "train_loss": 0.15248539275464632,
5
+ "train_runtime": 30932.1025,
6
+ "train_samples_per_second": 0.48,
7
  "train_steps_per_second": 0.06
8
  }
trainer_state.json CHANGED
@@ -298,8 +298,8 @@
298
  "step": 1854,
299
  "total_flos": 1.1904720283191214e+18,
300
  "train_loss": 0.15248539275464632,
301
- "train_runtime": 30996.046,
302
- "train_samples_per_second": 0.479,
303
  "train_steps_per_second": 0.06
304
  }
305
  ],
 
298
  "step": 1854,
299
  "total_flos": 1.1904720283191214e+18,
300
  "train_loss": 0.15248539275464632,
301
+ "train_runtime": 30932.1025,
302
+ "train_samples_per_second": 0.48,
303
  "train_steps_per_second": 0.06
304
  }
305
  ],