kardosdrur
committed on
Commit
•
79cea8d
1
Parent(s):
228ed50
Saved model checkpoint after epoch 0
Browse files
- .gitattributes +1 -0
- README.md +2 -2
- model.safetensors +1 -1
.gitattributes
CHANGED
@@ -34,3 +34,4 @@ saved_model/**/* filter=lfs diff=lfs merge=lfs -text
|
|
34 |
*.zst filter=lfs diff=lfs merge=lfs -text
|
35 |
*tfevents* filter=lfs diff=lfs merge=lfs -text
|
36 |
model.safetensors filter=lfs diff=lfs merge=lfs -text
|
|
|
|
34 |
*.zst filter=lfs diff=lfs merge=lfs -text
|
35 |
*tfevents* filter=lfs diff=lfs merge=lfs -text
|
36 |
model.safetensors filter=lfs diff=lfs merge=lfs -text
|
37 |
+
.git/lfs/objects/fb/47/fb47583d9ebb29cc3a89ffd4acaa3c3c7376f14705eda1a9f62f076dd44a9813 filter=lfs diff=lfs merge=lfs -text
|
README.md
CHANGED
@@ -100,7 +100,7 @@ The model was trained with the parameters:
|
|
100 |
Parameters of the fit()-Method:
|
101 |
```
|
102 |
{
|
103 |
-
"epochs":
|
104 |
"evaluator": "dfm_sentence_trf.evaluation.task_evaluator.TaskListEvaluator",
|
105 |
"max_grad_norm": 1,
|
106 |
"optimizer_class": "<class 'torch.optim.adamw.AdamW'>",
|
@@ -108,7 +108,7 @@ Parameters of the fit()-Method:
|
|
108 |
"lr": 2e-05
|
109 |
},
|
110 |
"scheduler": "WarmupLinear",
|
111 |
-
"steps_per_epoch":
|
112 |
"warmup_steps": 100,
|
113 |
"weight_decay": 0.01
|
114 |
}
|
|
|
100 |
Parameters of the fit()-Method:
|
101 |
```
|
102 |
{
|
103 |
+
"epochs": 20,
|
104 |
"evaluator": "dfm_sentence_trf.evaluation.task_evaluator.TaskListEvaluator",
|
105 |
"max_grad_norm": 1,
|
106 |
"optimizer_class": "<class 'torch.optim.adamw.AdamW'>",
|
|
|
108 |
"lr": 2e-05
|
109 |
},
|
110 |
"scheduler": "WarmupLinear",
|
111 |
+
"steps_per_epoch": 5000,
|
112 |
"warmup_steps": 100,
|
113 |
"weight_decay": 0.01
|
114 |
}
|
model.safetensors
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 87532520
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:4074bdfa870dd130ef7020cca37ef2afa2e98d99afbf525e0bba156a51f06808
|
3 |
size 87532520
|