nomsgadded committed on
Commit
cae50e6
1 Parent(s): 460664f

End of training

Browse files
Files changed (4) hide show
  1. README.md +3 -1
  2. all_results.json +5 -5
  3. train_results.json +5 -5
  4. trainer_state.json +12 -24
README.md CHANGED
@@ -2,6 +2,8 @@
2
  license: other
3
  base_model: nvidia/mit-b0
4
  tags:
 
 
5
  - generated_from_trainer
6
  model-index:
7
  - name: Segments
@@ -13,7 +15,7 @@ should probably proofread and complete it, then remove this comment. -->
13
 
14
  # Segments
15
 
16
- This model is a fine-tuned version of [nvidia/mit-b0](https://huggingface.co/nvidia/mit-b0) on an unknown dataset.
17
 
18
  ## Model description
19
 
 
2
  license: other
3
  base_model: nvidia/mit-b0
4
  tags:
5
+ - image-segmentation
6
+ - vision
7
  - generated_from_trainer
8
  model-index:
9
  - name: Segments
 
15
 
16
  # Segments
17
 
18
+ This model is a fine-tuned version of [nvidia/mit-b0](https://huggingface.co/nvidia/mit-b0) on the segments/sidewalk-semantic dataset.
19
 
20
  ## Model description
21
 
all_results.json CHANGED
@@ -1,5 +1,5 @@
1
  {
2
- "epoch": 19.81,
3
  "eval_accuracy_construction-bridge": 0.0,
4
  "eval_accuracy_construction-building": 0.9044887536731845,
5
  "eval_accuracy_construction-door": 0.0,
@@ -77,8 +77,8 @@
77
  "eval_runtime": 166.5888,
78
  "eval_samples_per_second": 0.9,
79
  "eval_steps_per_second": 0.114,
80
- "train_loss": 1.3936616789619878,
81
- "train_runtime": 1998.0806,
82
- "train_samples_per_second": 8.508,
83
- "train_steps_per_second": 0.531
84
  }
 
1
  {
2
+ "epoch": 0.99,
3
  "eval_accuracy_construction-bridge": 0.0,
4
  "eval_accuracy_construction-building": 0.9044887536731845,
5
  "eval_accuracy_construction-door": 0.0,
 
77
  "eval_runtime": 166.5888,
78
  "eval_samples_per_second": 0.9,
79
  "eval_steps_per_second": 0.114,
80
+ "train_loss": 3.0431386119914503,
81
+ "train_runtime": 103.8023,
82
+ "train_samples_per_second": 8.189,
83
+ "train_steps_per_second": 0.511
84
  }
train_results.json CHANGED
@@ -1,7 +1,7 @@
1
  {
2
- "epoch": 19.81,
3
- "train_loss": 1.3936616789619878,
4
- "train_runtime": 1998.0806,
5
- "train_samples_per_second": 8.508,
6
- "train_steps_per_second": 0.531
7
  }
 
1
  {
2
+ "epoch": 0.99,
3
+ "train_loss": 3.0431386119914503,
4
+ "train_runtime": 103.8023,
5
+ "train_samples_per_second": 8.189,
6
+ "train_steps_per_second": 0.511
7
  }
trainer_state.json CHANGED
@@ -1,40 +1,28 @@
1
  {
2
  "best_metric": null,
3
  "best_model_checkpoint": null,
4
- "epoch": 19.813084112149532,
5
  "eval_steps": 500,
6
- "global_step": 1060,
7
  "is_hyper_param_search": false,
8
  "is_local_process_zero": true,
9
  "is_world_process_zero": true,
10
  "log_history": [
11
  {
12
- "epoch": 9.35,
13
- "learning_rate": 2.641509433962264e-05,
14
- "loss": 1.7451,
15
- "step": 500
16
- },
17
- {
18
- "epoch": 18.69,
19
- "learning_rate": 2.830188679245283e-06,
20
- "loss": 1.087,
21
- "step": 1000
22
- },
23
- {
24
- "epoch": 19.81,
25
- "step": 1060,
26
- "total_flos": 2.9595008832425165e+17,
27
- "train_loss": 1.3936616789619878,
28
- "train_runtime": 1998.0806,
29
- "train_samples_per_second": 8.508,
30
- "train_steps_per_second": 0.531
31
  }
32
  ],
33
  "logging_steps": 500,
34
- "max_steps": 1060,
35
- "num_train_epochs": 20,
36
  "save_steps": 200,
37
- "total_flos": 2.9595008832425165e+17,
38
  "trial_name": null,
39
  "trial_params": null
40
  }
 
1
  {
2
  "best_metric": null,
3
  "best_model_checkpoint": null,
4
+ "epoch": 0.9906542056074766,
5
  "eval_steps": 500,
6
+ "global_step": 53,
7
  "is_hyper_param_search": false,
8
  "is_local_process_zero": true,
9
  "is_world_process_zero": true,
10
  "log_history": [
11
  {
12
+ "epoch": 0.99,
13
+ "step": 53,
14
+ "total_flos": 1.4897641867444224e+16,
15
+ "train_loss": 3.0431386119914503,
16
+ "train_runtime": 103.8023,
17
+ "train_samples_per_second": 8.189,
18
+ "train_steps_per_second": 0.511
 
 
 
 
 
 
 
 
 
 
 
 
19
  }
20
  ],
21
  "logging_steps": 500,
22
+ "max_steps": 53,
23
+ "num_train_epochs": 1,
24
  "save_steps": 200,
25
+ "total_flos": 1.4897641867444224e+16,
26
  "trial_name": null,
27
  "trial_params": null
28
  }