fajrijrifa
committed on
Commit
•
4327584
1
Parent(s):
5513ce0
Model save
Browse files
- README.md +3 -3
- config.json +1 -1
- config_sentence_transformers.json +2 -2
README.md
CHANGED
@@ -40,7 +40,7 @@ The following hyperparameters were used during training:
|
|
40 |
- distributed_type: multi-GPU
|
41 |
- optimizer: Adam with betas=(0.9,0.999) and epsilon=1e-08
|
42 |
- lr_scheduler_type: linear
|
43 |
-
- num_epochs:
|
44 |
- mixed_precision_training: Native AMP
|
45 |
|
46 |
### Training results
|
@@ -50,6 +50,6 @@ The following hyperparameters were used during training:
|
|
50 |
### Framework versions
|
51 |
|
52 |
- Transformers 4.44.2
|
53 |
-
- Pytorch 2.
|
54 |
-
- Datasets 3.0.
|
55 |
- Tokenizers 0.19.1
|
|
|
40 |
- distributed_type: multi-GPU
|
41 |
- optimizer: Adam with betas=(0.9,0.999) and epsilon=1e-08
|
42 |
- lr_scheduler_type: linear
|
43 |
+
- num_epochs: 50.0
|
44 |
- mixed_precision_training: Native AMP
|
45 |
|
46 |
### Training results
|
|
|
50 |
### Framework versions
|
51 |
|
52 |
- Transformers 4.44.2
|
53 |
+
- Pytorch 2.5.0+cu121
|
54 |
+
- Datasets 3.0.2
|
55 |
- Tokenizers 0.19.1
|
config.json
CHANGED
@@ -1,5 +1,5 @@
|
|
1 |
{
|
2 |
-
"_name_or_path": "/content/drive/MyDrive/THESIS_MSIT
|
3 |
"architectures": [
|
4 |
"XLMRobertaModel"
|
5 |
],
|
|
|
1 |
{
|
2 |
+
"_name_or_path": "/content/drive/MyDrive/THESIS_MSIT",
|
3 |
"architectures": [
|
4 |
"XLMRobertaModel"
|
5 |
],
|
config_sentence_transformers.json
CHANGED
@@ -1,8 +1,8 @@
|
|
1 |
{
|
2 |
"__version__": {
|
3 |
-
"sentence_transformers": "3.
|
4 |
"transformers": "4.44.2",
|
5 |
-
"pytorch": "2.
|
6 |
},
|
7 |
"prompts": {},
|
8 |
"default_prompt_name": null,
|
|
|
1 |
{
|
2 |
"__version__": {
|
3 |
+
"sentence_transformers": "3.2.1",
|
4 |
"transformers": "4.44.2",
|
5 |
+
"pytorch": "2.5.0+cu121"
|
6 |
},
|
7 |
"prompts": {},
|
8 |
"default_prompt_name": null,
|