end
Browse files- checkpoints/checkpoint_epoch=2499.ckpt +3 -0
- checkpoints/checkpoint_epoch=2599.ckpt +3 -0
- checkpoints/checkpoint_epoch=2699.ckpt +3 -0
- checkpoints/checkpoint_epoch=2799.ckpt +3 -0
- checkpoints/checkpoint_epoch=2899.ckpt +3 -0
- checkpoints/checkpoint_epoch=2999.ckpt +3 -0
- checkpoints/checkpoint_epoch=3099.ckpt +3 -0
- checkpoints/checkpoint_epoch=3199.ckpt +3 -0
- checkpoints/checkpoint_epoch=3299.ckpt +3 -0
- checkpoints/checkpoint_epoch=3399.ckpt +3 -0
- checkpoints/last.ckpt +2 -2
- tensorboard/version_0/events.out.tfevents.1729438040.842e86ef2042.2233.0 +2 -2
- train.log +40 -0
checkpoints/checkpoint_epoch=2499.ckpt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:1846fa7198ed55388dcf730520e72a98f9b9483056f92c8964d558c0f88ed9de
|
3 |
+
size 218842306
|
checkpoints/checkpoint_epoch=2599.ckpt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:673384e1021c0005a3345ee17c6c14239d4453c7c940db013f319aad6aeadb13
|
3 |
+
size 218842306
|
checkpoints/checkpoint_epoch=2699.ckpt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:ca43ec07f833b767266fe851928f7c1ef1628ad0cac426792bfe329aec4c826c
|
3 |
+
size 218842306
|
checkpoints/checkpoint_epoch=2799.ckpt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:e2ed31508937a591157d1dd6889283068875abb2cee50b46225e4de155834a45
|
3 |
+
size 218842306
|
checkpoints/checkpoint_epoch=2899.ckpt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:37de60f9729a3dff88b541339e9ad211b9145b5aeef0f0467e882dd875cd3fd2
|
3 |
+
size 218842306
|
checkpoints/checkpoint_epoch=2999.ckpt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:0e0cc706f2c29a483e4910dfe3f3657f8133956c651a21593a52bb1d59cdfb64
|
3 |
+
size 218842306
|
checkpoints/checkpoint_epoch=3099.ckpt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:eca36c56b5f11e944cdaef9edbfe818a05820dd6193d4fa69d54e7fe5088fc7d
|
3 |
+
size 218842306
|
checkpoints/checkpoint_epoch=3199.ckpt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:500c384d4c23cc412030e4140cb3fecce934850493abf7c361c06d45a0b48fdc
|
3 |
+
size 218842306
|
checkpoints/checkpoint_epoch=3299.ckpt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:ffc03785b0dd0607f4a6e2565869e87466571d84ced1ee5d363ed8e414f24080
|
3 |
+
size 218842306
|
checkpoints/checkpoint_epoch=3399.ckpt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:3fd4d59e487b7fd27149d6a19cec7b7611c7a0de940e15b51c0f8c3e3b20a526
|
3 |
+
size 218842306
|
checkpoints/last.ckpt
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
-
size
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:5182282e82fcbdbb45e5c04fa38b164ad1a81cfc1094cd2dbaf7cb3f1bd895c3
|
3 |
+
size 218842306
|
tensorboard/version_0/events.out.tfevents.1729438040.842e86ef2042.2233.0
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
-
size
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:296e938933539883d4f8c288af09ddfedaaef4435d1dcb125ffcf93357cae1f8
|
3 |
+
size 1066585206
|
train.log
CHANGED
@@ -11,3 +11,43 @@
|
|
11 |
[2024-10-20 15:27:20,323][__main__][INFO] - Instantiating trainer <lightning.pytorch.trainer.Trainer>
|
12 |
[2024-10-20 15:27:20,367][__main__][INFO] - Logging hyperparameters!
|
13 |
[2024-10-20 15:27:20,422][__main__][INFO] - Starting training!
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
11 |
[2024-10-20 15:27:20,323][__main__][INFO] - Instantiating trainer <lightning.pytorch.trainer.Trainer>
|
12 |
[2024-10-20 15:27:20,367][__main__][INFO] - Logging hyperparameters!
|
13 |
[2024-10-20 15:27:20,422][__main__][INFO] - Starting training!
|
14 |
+
[2024-10-22 01:31:06,012][matcha.utils.utils][ERROR] -
|
15 |
+
Traceback (most recent call last):
|
16 |
+
File "/workspace/Matcha-TTS/matcha/utils/utils.py", line 77, in wrap
|
17 |
+
metric_dict, object_dict = task_func(cfg=cfg)
|
18 |
+
File "/workspace/Matcha-TTS/matcha/train.py", line 79, in train
|
19 |
+
trainer.fit(model=model, datamodule=datamodule, ckpt_path=cfg.get("ckpt_path"))
|
20 |
+
File "/opt/conda/lib/python3.10/site-packages/lightning/pytorch/trainer/trainer.py", line 538, in fit
|
21 |
+
call._call_and_handle_interrupt(
|
22 |
+
File "/opt/conda/lib/python3.10/site-packages/lightning/pytorch/trainer/call.py", line 47, in _call_and_handle_interrupt
|
23 |
+
return trainer_fn(*args, **kwargs)
|
24 |
+
File "/opt/conda/lib/python3.10/site-packages/lightning/pytorch/trainer/trainer.py", line 574, in _fit_impl
|
25 |
+
self._run(model, ckpt_path=ckpt_path)
|
26 |
+
File "/opt/conda/lib/python3.10/site-packages/lightning/pytorch/trainer/trainer.py", line 981, in _run
|
27 |
+
results = self._run_stage()
|
28 |
+
File "/opt/conda/lib/python3.10/site-packages/lightning/pytorch/trainer/trainer.py", line 1025, in _run_stage
|
29 |
+
self.fit_loop.run()
|
30 |
+
File "/opt/conda/lib/python3.10/site-packages/lightning/pytorch/loops/fit_loop.py", line 206, in run
|
31 |
+
self.on_advance_end()
|
32 |
+
File "/opt/conda/lib/python3.10/site-packages/lightning/pytorch/loops/fit_loop.py", line 378, in on_advance_end
|
33 |
+
call._call_callback_hooks(trainer, "on_train_epoch_end", monitoring_callbacks=True)
|
34 |
+
File "/opt/conda/lib/python3.10/site-packages/lightning/pytorch/trainer/call.py", line 218, in _call_callback_hooks
|
35 |
+
fn(trainer, trainer.lightning_module, *args, **kwargs)
|
36 |
+
File "/opt/conda/lib/python3.10/site-packages/lightning/pytorch/callbacks/model_checkpoint.py", line 326, in on_train_epoch_end
|
37 |
+
self._save_last_checkpoint(trainer, monitor_candidates)
|
38 |
+
File "/opt/conda/lib/python3.10/site-packages/lightning/pytorch/callbacks/model_checkpoint.py", line 696, in _save_last_checkpoint
|
39 |
+
self._save_checkpoint(trainer, filepath)
|
40 |
+
File "/opt/conda/lib/python3.10/site-packages/lightning/pytorch/callbacks/model_checkpoint.py", line 390, in _save_checkpoint
|
41 |
+
trainer.save_checkpoint(filepath, self.save_weights_only)
|
42 |
+
File "/opt/conda/lib/python3.10/site-packages/lightning/pytorch/trainer/trainer.py", line 1365, in save_checkpoint
|
43 |
+
self.strategy.save_checkpoint(checkpoint, filepath, storage_options=storage_options)
|
44 |
+
File "/opt/conda/lib/python3.10/site-packages/lightning/pytorch/strategies/strategy.py", line 490, in save_checkpoint
|
45 |
+
self.checkpoint_io.save_checkpoint(checkpoint, filepath, storage_options=storage_options)
|
46 |
+
File "/opt/conda/lib/python3.10/site-packages/lightning/fabric/plugins/io/torch_io.py", line 58, in save_checkpoint
|
47 |
+
_atomic_save(checkpoint, path)
|
48 |
+
File "/opt/conda/lib/python3.10/site-packages/lightning/fabric/utilities/cloud_io.py", line 90, in _atomic_save
|
49 |
+
f.write(bytesbuffer.getvalue())
|
50 |
+
File "/opt/conda/lib/python3.10/site-packages/fsspec/implementations/local.py", line 373, in write
|
51 |
+
return self.f.write(*args, **kwargs)
|
52 |
+
OSError: [Errno 28] No space left on device
|
53 |
+
[2024-10-22 01:31:06,020][matcha.utils.utils][INFO] - Output dir: /workspace/Matcha-TTS/logs/train/darkman/runs/2024-10-20_15-27-18
|