cpiuk committed on
Commit
241a47f
·
verified ·
1 Parent(s): e829e30

Add v3 training summary

Browse files
training_data_v3/training_summary.json ADDED
@@ -0,0 +1,64 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "model": "unsloth/Phi-4-mini-instruct",
3
+ "lora": {
4
+ "r": 32,
5
+ "alpha": 32,
6
+ "targets": [
7
+ "q_proj",
8
+ "k_proj",
9
+ "v_proj",
10
+ "o_proj",
11
+ "gate_proj",
12
+ "up_proj",
13
+ "down_proj"
14
+ ]
15
+ },
16
+ "training": {
17
+ "epochs": 7,
18
+ "batch_size": 32,
19
+ "grad_accum": 2,
20
+ "effective_batch": 64,
21
+ "lr": 0.0002,
22
+ "max_seq_len": 512,
23
+ "packing": true,
24
+ "optimizer": "adamw_8bit",
25
+ "scheduler": "cosine",
26
+ "warmup_steps": 30
27
+ },
28
+ "dataset": {
29
+ "train": 9268,
30
+ "val": 1034,
31
+ "total": 10302
32
+ },
33
+ "total_steps": 870,
34
+ "loss_curve": [
35
+ {
36
+ "epoch": 1.0,
37
+ "eval_loss": 0.40697577595710754
38
+ },
39
+ {
40
+ "epoch": 2.0,
41
+ "eval_loss": 0.14752867817878723
42
+ },
43
+ {
44
+ "epoch": 3.0,
45
+ "eval_loss": 0.09198899567127228
46
+ },
47
+ {
48
+ "epoch": 4.0,
49
+ "eval_loss": 0.06869391351938248
50
+ },
51
+ {
52
+ "epoch": 5.0,
53
+ "eval_loss": 0.06067777797579765
54
+ },
55
+ {
56
+ "epoch": 6.0,
57
+ "eval_loss": 0.05765723064541817
58
+ }
59
+ ],
60
+ "final_train_loss": 0.0327,
61
+ "final_eval_loss": 0.05765723064541817,
62
+ "gpu": "NVIDIA RTX A6000 48GB",
63
+ "framework": "Unsloth 2026.4.4 + TRL SFTTrainer"
64
+ }