HuggingBaymax committed on
Commit
b6e6903
·
verified ·
1 Parent(s): 1dff3c8

Pushed the IDEFICS2 fine-tuned model.

Browse files
checkpoint-25/adapter_model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:5b966f7d4ed03a7cc5f0d9f12d11c6a36291778d9bbbf782adafd78784a19840
3
  size 93378688
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:211756393169a47923b018f9f1a4c1ff9fbedf416c232c273405a6535035e520
3
  size 93378688
checkpoint-25/optimizer.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:acbe89ccd613a30390efd87c851995b5d2229722780b43fab32b11d369a27e7d
3
  size 48071944
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:b442cfd495fcaa5f9aa918d20aa7676a7668d382bc9867031a88d6c6e08e7d26
3
  size 48071944
checkpoint-25/rng_state.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:614fcea8e73d817edc55868e83a17dea664dce6af99624cd6b07cf229ea0cb30
3
  size 14244
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:17389751b3edcf49720757d9d28af25dc2449922678632e2f6f5f61dd49356cb
3
  size 14244
checkpoint-25/scheduler.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:e38cb40a67374f1832bcdea2ecae7e9ba187f61562de69b9f4a08e86aa1a8369
3
  size 1064
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:6222650a495ea54e976d1599e55e1eec1dfa515e390e5f653027100568b23eb1
3
  size 1064
checkpoint-25/trainer_state.json CHANGED
@@ -10,53 +10,53 @@
10
  "log_history": [
11
  {
12
  "epoch": 0.08,
13
- "grad_norm": 40.98280334472656,
14
- "learning_rate": 0.000168,
15
- "loss": 5.6666,
16
  "step": 5
17
  },
18
  {
19
  "epoch": 0.16,
20
- "grad_norm": 9.209188461303711,
21
- "learning_rate": 0.00012800000000000002,
22
- "loss": 0.6902,
23
  "step": 10
24
  },
25
  {
26
  "epoch": 0.16,
27
- "eval_loss": 0.462746798992157,
28
- "eval_runtime": 346.7059,
29
- "eval_samples_per_second": 0.577,
30
- "eval_steps_per_second": 0.288,
31
  "step": 10
32
  },
33
  {
34
  "epoch": 0.24,
35
- "grad_norm": 5.505237102508545,
36
- "learning_rate": 8.800000000000001e-05,
37
- "loss": 0.4216,
38
  "step": 15
39
  },
40
  {
41
  "epoch": 0.32,
42
- "grad_norm": 6.111878871917725,
43
- "learning_rate": 4.8e-05,
44
- "loss": 0.3347,
45
  "step": 20
46
  },
47
  {
48
  "epoch": 0.32,
49
- "eval_loss": 0.34206879138946533,
50
- "eval_runtime": 345.9828,
51
- "eval_samples_per_second": 0.578,
52
- "eval_steps_per_second": 0.289,
53
  "step": 20
54
  },
55
  {
56
  "epoch": 0.4,
57
- "grad_norm": 3.1234376430511475,
58
- "learning_rate": 8.000000000000001e-06,
59
- "loss": 0.2831,
60
  "step": 25
61
  }
62
  ],
@@ -77,7 +77,7 @@
77
  "attributes": {}
78
  }
79
  },
80
- "total_flos": 1864510458066432.0,
81
  "train_batch_size": 2,
82
  "trial_name": null,
83
  "trial_params": null
 
10
  "log_history": [
11
  {
12
  "epoch": 0.08,
13
+ "grad_norm": 250.87176513671875,
14
+ "learning_rate": 0.00018400000000000003,
15
+ "loss": 7.6096,
16
  "step": 5
17
  },
18
  {
19
  "epoch": 0.16,
20
+ "grad_norm": 31.689001083374023,
21
+ "learning_rate": 0.000144,
22
+ "loss": 2.8395,
23
  "step": 10
24
  },
25
  {
26
  "epoch": 0.16,
27
+ "eval_loss": 1.5643075704574585,
28
+ "eval_runtime": 335.0339,
29
+ "eval_samples_per_second": 0.597,
30
+ "eval_steps_per_second": 0.298,
31
  "step": 10
32
  },
33
  {
34
  "epoch": 0.24,
35
+ "grad_norm": 6.646055221557617,
36
+ "learning_rate": 0.00010400000000000001,
37
+ "loss": 0.9643,
38
  "step": 15
39
  },
40
  {
41
  "epoch": 0.32,
42
+ "grad_norm": 4.9765520095825195,
43
+ "learning_rate": 6.400000000000001e-05,
44
+ "loss": 0.3674,
45
  "step": 20
46
  },
47
  {
48
  "epoch": 0.32,
49
+ "eval_loss": 0.36727723479270935,
50
+ "eval_runtime": 334.6508,
51
+ "eval_samples_per_second": 0.598,
52
+ "eval_steps_per_second": 0.299,
53
  "step": 20
54
  },
55
  {
56
  "epoch": 0.4,
57
+ "grad_norm": 3.7046844959259033,
58
+ "learning_rate": 2.4e-05,
59
+ "loss": 0.2732,
60
  "step": 25
61
  }
62
  ],
 
77
  "attributes": {}
78
  }
79
  },
80
+ "total_flos": 1976516367999360.0,
81
  "train_batch_size": 2,
82
  "trial_name": null,
83
  "trial_params": null
checkpoint-25/training_args.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:c1d6473005f07867644da79cc6c4e621e7921819ba6d9ec1fa889bd7c906a9f8
3
  size 5240
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:6befa3566f15769a7c667b3c47ab9f99e4cfced81d36604ee1e11af15a613d72
3
  size 5240