fajrijrifa committed on
Commit
4327584
1 Parent(s): 5513ce0

Model save

Browse files
Files changed (3) hide show
  1. README.md +3 -3
  2. config.json +1 -1
  3. config_sentence_transformers.json +2 -2
README.md CHANGED
@@ -40,7 +40,7 @@ The following hyperparameters were used during training:
40
  - distributed_type: multi-GPU
41
  - optimizer: Adam with betas=(0.9,0.999) and epsilon=1e-08
42
  - lr_scheduler_type: linear
43
- - num_epochs: 5.0
44
  - mixed_precision_training: Native AMP
45
 
46
  ### Training results
@@ -50,6 +50,6 @@ The following hyperparameters were used during training:
50
  ### Framework versions
51
 
52
  - Transformers 4.44.2
53
- - Pytorch 2.4.1+cu121
54
- - Datasets 3.0.0
55
  - Tokenizers 0.19.1
 
40
  - distributed_type: multi-GPU
41
  - optimizer: Adam with betas=(0.9,0.999) and epsilon=1e-08
42
  - lr_scheduler_type: linear
43
+ - num_epochs: 50.0
44
  - mixed_precision_training: Native AMP
45
 
46
  ### Training results
 
50
  ### Framework versions
51
 
52
  - Transformers 4.44.2
53
+ - Pytorch 2.5.0+cu121
54
+ - Datasets 3.0.2
55
  - Tokenizers 0.19.1
config.json CHANGED
@@ -1,5 +1,5 @@
1
  {
2
- "_name_or_path": "/content/drive/MyDrive/THESIS_MSIT/checkpoint-3450",
3
  "architectures": [
4
  "XLMRobertaModel"
5
  ],
 
1
  {
2
+ "_name_or_path": "/content/drive/MyDrive/THESIS_MSIT",
3
  "architectures": [
4
  "XLMRobertaModel"
5
  ],
config_sentence_transformers.json CHANGED
@@ -1,8 +1,8 @@
1
  {
2
  "__version__": {
3
- "sentence_transformers": "3.1.1",
4
  "transformers": "4.44.2",
5
- "pytorch": "2.4.1+cu121"
6
  },
7
  "prompts": {},
8
  "default_prompt_name": null,
 
1
  {
2
  "__version__": {
3
+ "sentence_transformers": "3.2.1",
4
  "transformers": "4.44.2",
5
+ "pytorch": "2.5.0+cu121"
6
  },
7
  "prompts": {},
8
  "default_prompt_name": null,