kevinoli commited on
Commit
9c811ce
1 Parent(s): f75dba2

End of training

Browse files
all_results.json CHANGED
@@ -1,12 +1,12 @@
1
  {
2
  "epoch": 4.0,
3
- "eval_loss": 0.49561700224876404,
4
- "eval_runtime": 72.0108,
5
- "eval_samples_per_second": 16.761,
6
- "eval_steps_per_second": 2.097,
7
- "total_flos": 7811792839259640.0,
8
- "train_loss": 0.07694113771750283,
9
- "train_runtime": 16520.0957,
10
- "train_samples_per_second": 2.629,
11
- "train_steps_per_second": 1.314
12
  }
 
1
  {
2
  "epoch": 4.0,
3
+ "eval_loss": 0.17657655477523804,
4
+ "eval_runtime": 7.3821,
5
+ "eval_samples_per_second": 16.391,
6
+ "eval_steps_per_second": 2.167,
7
+ "total_flos": 8593187978196360.0,
8
+ "train_loss": 0.0035514953327706023,
9
+ "train_runtime": 1405.6232,
10
+ "train_samples_per_second": 33.984,
11
+ "train_steps_per_second": 16.992
12
  }
eval_results.json CHANGED
@@ -1,7 +1,7 @@
1
  {
2
  "epoch": 4.0,
3
- "eval_loss": 0.49561700224876404,
4
- "eval_runtime": 72.0108,
5
- "eval_samples_per_second": 16.761,
6
- "eval_steps_per_second": 2.097
7
  }
 
1
  {
2
  "epoch": 4.0,
3
+ "eval_loss": 0.17657655477523804,
4
+ "eval_runtime": 7.3821,
5
+ "eval_samples_per_second": 16.391,
6
+ "eval_steps_per_second": 2.167
7
  }
runs/Aug23_10-36-57_winter-park/events.out.tfevents.1724432742.winter-park.1153123.1 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:8c02e9bee007be85dbdcda75ef4b7c638613cf554c9da4539f759c6239bc99ce
3
+ size 316
train_results.json CHANGED
@@ -1,8 +1,8 @@
1
  {
2
  "epoch": 4.0,
3
- "total_flos": 7811792839259640.0,
4
- "train_loss": 0.07694113771750283,
5
- "train_runtime": 16520.0957,
6
- "train_samples_per_second": 2.629,
7
- "train_steps_per_second": 1.314
8
  }
 
1
  {
2
  "epoch": 4.0,
3
+ "total_flos": 8593187978196360.0,
4
+ "train_loss": 0.0035514953327706023,
5
+ "train_runtime": 1405.6232,
6
+ "train_samples_per_second": 33.984,
7
+ "train_steps_per_second": 16.992
8
  }
trainer_state.json CHANGED
@@ -1,9 +1,9 @@
1
  {
2
- "best_metric": 0.49561700224876404,
3
- "best_model_checkpoint": "./output/clip-finetuned-csu-p14-336-e4l57-l/checkpoint-21000",
4
  "epoch": 4.0,
5
  "eval_steps": 500,
6
- "global_step": 21712,
7
  "is_hyper_param_search": false,
8
  "is_local_process_zero": true,
9
  "is_world_process_zero": true,
@@ -653,18 +653,78 @@
653
  "eval_steps_per_second": 2.025,
654
  "step": 21500
655
  },
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
656
  {
657
  "epoch": 4.0,
658
- "step": 21712,
659
- "total_flos": 7811792839259640.0,
660
- "train_loss": 0.07694113771750283,
661
- "train_runtime": 16520.0957,
662
- "train_samples_per_second": 2.629,
663
- "train_steps_per_second": 1.314
664
  }
665
  ],
666
  "logging_steps": 500,
667
- "max_steps": 21712,
668
  "num_input_tokens_seen": 0,
669
  "num_train_epochs": 4,
670
  "save_steps": 500,
@@ -680,7 +740,7 @@
680
  "attributes": {}
681
  }
682
  },
683
- "total_flos": 7811792839259640.0,
684
  "train_batch_size": 2,
685
  "trial_name": null,
686
  "trial_params": null
 
1
  {
2
+ "best_metric": 0.17657655477523804,
3
+ "best_model_checkpoint": "./output/clip-finetuned-csu-p14-336-e4l57-l/checkpoint-23500",
4
  "epoch": 4.0,
5
  "eval_steps": 500,
6
+ "global_step": 23884,
7
  "is_hyper_param_search": false,
8
  "is_local_process_zero": true,
9
  "is_world_process_zero": true,
 
653
  "eval_steps_per_second": 2.025,
654
  "step": 21500
655
  },
656
+ {
657
+ "epoch": 3.6844749623178696,
658
+ "grad_norm": 0.022144177928566933,
659
+ "learning_rate": 3.944062971026629e-08,
660
+ "loss": 0.0432,
661
+ "step": 22000
662
+ },
663
+ {
664
+ "epoch": 3.6844749623178696,
665
+ "eval_loss": 0.17835669219493866,
666
+ "eval_runtime": 7.4507,
667
+ "eval_samples_per_second": 16.24,
668
+ "eval_steps_per_second": 2.147,
669
+ "step": 22000
670
+ },
671
+ {
672
+ "epoch": 3.7682130296432756,
673
+ "grad_norm": 2.4324751279891643e-07,
674
+ "learning_rate": 2.897337129459052e-08,
675
+ "loss": 0.0461,
676
+ "step": 22500
677
+ },
678
+ {
679
+ "epoch": 3.7682130296432756,
680
+ "eval_loss": 0.17669138312339783,
681
+ "eval_runtime": 7.5623,
682
+ "eval_samples_per_second": 16.0,
683
+ "eval_steps_per_second": 2.116,
684
+ "step": 22500
685
+ },
686
+ {
687
+ "epoch": 3.851951096968682,
688
+ "grad_norm": 4.172260048562748e-07,
689
+ "learning_rate": 1.8506112878914754e-08,
690
+ "loss": 0.0513,
691
+ "step": 23000
692
+ },
693
+ {
694
+ "epoch": 3.851951096968682,
695
+ "eval_loss": 0.1774093359708786,
696
+ "eval_runtime": 7.8193,
697
+ "eval_samples_per_second": 15.475,
698
+ "eval_steps_per_second": 2.046,
699
+ "step": 23000
700
+ },
701
+ {
702
+ "epoch": 3.935689164294088,
703
+ "grad_norm": 0.5274502038955688,
704
+ "learning_rate": 8.038854463238988e-09,
705
+ "loss": 0.0326,
706
+ "step": 23500
707
+ },
708
+ {
709
+ "epoch": 3.935689164294088,
710
+ "eval_loss": 0.17657655477523804,
711
+ "eval_runtime": 7.7889,
712
+ "eval_samples_per_second": 15.535,
713
+ "eval_steps_per_second": 2.054,
714
+ "step": 23500
715
+ },
716
  {
717
  "epoch": 4.0,
718
+ "step": 23884,
719
+ "total_flos": 8593187978196360.0,
720
+ "train_loss": 0.0035514953327706023,
721
+ "train_runtime": 1405.6232,
722
+ "train_samples_per_second": 33.984,
723
+ "train_steps_per_second": 16.992
724
  }
725
  ],
726
  "logging_steps": 500,
727
+ "max_steps": 23884,
728
  "num_input_tokens_seen": 0,
729
  "num_train_epochs": 4,
730
  "save_steps": 500,
 
740
  "attributes": {}
741
  }
742
  },
743
+ "total_flos": 8593187978196360.0,
744
  "train_batch_size": 2,
745
  "trial_name": null,
746
  "trial_params": null