diff --git "a/train.ipynb" "b/train.ipynb" --- "a/train.ipynb" +++ "b/train.ipynb" @@ -3,21 +3,62 @@ { "cell_type": "code", "execution_count": 1, - "id": "1a08ff40", + "id": "8d07f027", "metadata": {}, "outputs": [ { "name": "stderr", "output_type": "stream", "text": [ - "Using custom data configuration default-8bef3afded73c387\n", - "Reusing dataset json (/workspace/.cache/huggingface/datasets/json/default-8bef3afded73c387/0.0.0/ac0ca5f5289a6cf108e706efcf040422dbbfa8e658dee6a819f20d76bb84d26b)\n" + "Using custom data configuration default-8f1be135afea2a5e\n" + ] + }, + { + "name": "stdout", + "output_type": "stream", + "text": [ + "Downloading and preparing dataset json/default to /workspace/.cache/huggingface/datasets/json/default-8f1be135afea2a5e/0.0.0/ac0ca5f5289a6cf108e706efcf040422dbbfa8e658dee6a819f20d76bb84d26b...\n" + ] + }, + { + "data": { + "application/vnd.jupyter.widget-view+json": { + "model_id": "1b68f3c845a14540b7fa4feb0b78d3e9", + "version_major": 2, + "version_minor": 0 + }, + "text/plain": [ + " 0%| | 0/1 [00:00, ?it/s]" + ] + }, + "metadata": {}, + "output_type": "display_data" + }, + { + "data": { + "application/vnd.jupyter.widget-view+json": { + "model_id": "54002c8dc2044b3987377cf519579109", + "version_major": 2, + "version_minor": 0 + }, + "text/plain": [ + " 0%| | 0/1 [00:00, ?it/s]" + ] + }, + "metadata": {}, + "output_type": "display_data" + }, + { + "name": "stdout", + "output_type": "stream", + "text": [ + "Dataset json downloaded and prepared to /workspace/.cache/huggingface/datasets/json/default-8f1be135afea2a5e/0.0.0/ac0ca5f5289a6cf108e706efcf040422dbbfa8e658dee6a819f20d76bb84d26b. Subsequent calls will reuse this data.\n" ] }, { "data": { "application/vnd.jupyter.widget-view+json": { - "model_id": "19b2e8b501604f2daa38a71c2cffd8de", + "model_id": "861f78e0c3b3458faa9cc42cde173d84", "version_major": 2, "version_minor": 0 }, @@ -32,14 +73,55 @@ "name": "stderr", "output_type": "stream", "text": [ - "Using custom data configuration default-ee895f61a8bce75c\n", - "Reusing dataset json (/workspace/.cache/huggingface/datasets/json/default-ee895f61a8bce75c/0.0.0/ac0ca5f5289a6cf108e706efcf040422dbbfa8e658dee6a819f20d76bb84d26b)\n" + "Using custom data configuration default-cb03ad945d4a24ac\n" + ] + }, + { + "name": "stdout", + "output_type": "stream", + "text": [ + "Downloading and preparing dataset json/default to /workspace/.cache/huggingface/datasets/json/default-cb03ad945d4a24ac/0.0.0/ac0ca5f5289a6cf108e706efcf040422dbbfa8e658dee6a819f20d76bb84d26b...\n" ] }, { "data": { "application/vnd.jupyter.widget-view+json": { - "model_id": "e3ad786830e94c4898a43c3a426b4f0c", + "model_id": "f61b1f0086c340f9a8b2d9f20a08e0c1", + "version_major": 2, + "version_minor": 0 + }, + "text/plain": [ + " 0%| | 0/1 [00:00, ?it/s]" + ] + }, + "metadata": {}, + "output_type": "display_data" + }, + { + "data": { + "application/vnd.jupyter.widget-view+json": { + "model_id": "7d18344e823a4848a9b98cfdec90b2ce", + "version_major": 2, + "version_minor": 0 + }, + "text/plain": [ + " 0%| | 0/1 [00:00, ?it/s]" + ] + }, + "metadata": {}, + "output_type": "display_data" + }, + { + "name": "stdout", + "output_type": "stream", + "text": [ + "Dataset json downloaded and prepared to /workspace/.cache/huggingface/datasets/json/default-cb03ad945d4a24ac/0.0.0/ac0ca5f5289a6cf108e706efcf040422dbbfa8e658dee6a819f20d76bb84d26b. Subsequent calls will reuse this data.\n" + ] + }, + { + "data": { + "application/vnd.jupyter.widget-view+json": { + "model_id": "77bc9aad0b494696942e0fbd0663a29c", "version_major": 2, "version_minor": 0 }, @@ -54,14 +136,55 @@ "name": "stderr", "output_type": "stream", "text": [ - "Using custom data configuration default-85a752aaa77917b6\n", - "Reusing dataset json (/workspace/.cache/huggingface/datasets/json/default-85a752aaa77917b6/0.0.0/ac0ca5f5289a6cf108e706efcf040422dbbfa8e658dee6a819f20d76bb84d26b)\n" + "Using custom data configuration default-eec7a48f9eca7cd5\n" + ] + }, + { + "name": "stdout", + "output_type": "stream", + "text": [ + "Downloading and preparing dataset json/default to /workspace/.cache/huggingface/datasets/json/default-eec7a48f9eca7cd5/0.0.0/ac0ca5f5289a6cf108e706efcf040422dbbfa8e658dee6a819f20d76bb84d26b...\n" + ] + }, + { + "data": { + "application/vnd.jupyter.widget-view+json": { + "model_id": "200634fba7454dc5a611c6a79855bc42", + "version_major": 2, + "version_minor": 0 + }, + "text/plain": [ + " 0%| | 0/1 [00:00, ?it/s]" + ] + }, + "metadata": {}, + "output_type": "display_data" + }, + { + "data": { + "application/vnd.jupyter.widget-view+json": { + "model_id": "d2246049976343659ce829d6c1f1e42e", + "version_major": 2, + "version_minor": 0 + }, + "text/plain": [ + " 0%| | 0/1 [00:00, ?it/s]" + ] + }, + "metadata": {}, + "output_type": "display_data" + }, + { + "name": "stdout", + "output_type": "stream", + "text": [ + "Dataset json downloaded and prepared to /workspace/.cache/huggingface/datasets/json/default-eec7a48f9eca7cd5/0.0.0/ac0ca5f5289a6cf108e706efcf040422dbbfa8e658dee6a819f20d76bb84d26b. Subsequent calls will reuse this data.\n" ] }, { "data": { "application/vnd.jupyter.widget-view+json": { - "model_id": "47b6125c2b994076b4182ff75942cf01", + "model_id": "43219229d82c4e2a9d3cb916d1b56801", "version_major": 2, "version_minor": 0 }, @@ -92,9 +215,7 @@ "\n", "def load_local_dataset(dsname):\n", " d = datasets.load_dataset('json', data_files=f'/workspace/data/{dsname}.json')\n", - " d = d.cast_column('path', datasets.features.Audio(sampling_rate=16000))\n", - " d = d.rename_column('path', 'audio')\n", - " d = d.rename_column('transcription', 'sentence')\n", + " d = d.cast_column('audio', datasets.features.Audio(sampling_rate=16000))\n", " return d\n", "\n", "ovm = load_local_dataset('ovm')\n", @@ -107,7 +228,7 @@ { "cell_type": "code", "execution_count": 2, - "id": "60022ef2", + "id": "890ba811", "metadata": {}, "outputs": [ { @@ -143,17 +264,17 @@ { "cell_type": "code", "execution_count": 3, - "id": "ffe44f86", + "id": "3855ccb3", "metadata": {}, "outputs": [ { "data": { "text/plain": [ - "{'audio': {'path': '/workspace/data/pscr/sound_110619_001010-1555.wav',\n", - " 'array': array([0.00177002, 0.00085449, 0.00042725, ..., 0.056427 , 0.04852295,\n", - " 0.03656006], dtype=float32),\n", + "{'audio': {'path': '/workspace/data/vystadial2016/train/10/62/vad-2015-09-20--12-34-27.561625.wav',\n", + " 'array': array([ 0.00564575, 0.00588989, 0.00363159, ..., -0.01358032,\n", + " -0.01220703, -0.00946045], dtype=float32),\n", " 'sampling_rate': 16000},\n", - " 'sentence': 'děkuji pane ministře nevim co bude obsahovat ten',\n", + " 'sentence': 'olomouc hlavní nádraží',\n", " 'path': None}" ] }, @@ -171,7 +292,7 @@ { "cell_type": "code", "execution_count": 4, - "id": "cf977436", + "id": "7c896f08", "metadata": {}, "outputs": [ { @@ -201,7 +322,7 @@ { "cell_type": "code", "execution_count": null, - "id": "d4dc3c39", + "id": "2eb3eb20", "metadata": {}, "outputs": [], "source": [] @@ -209,7 +330,7 @@ { "cell_type": "code", "execution_count": 5, - "id": "a80782b9", + "id": "f43b8d3d", "metadata": { "id": "ZcVsD0ETElrR" }, @@ -264,13 +385,13 @@ { "cell_type": "code", "execution_count": 6, - "id": "3666167a", + "id": "d1fd4858", "metadata": {}, "outputs": [ { "data": { "application/vnd.jupyter.widget-view+json": { - "model_id": "0c6540473c674c09a2b9dd25c78d56bb", + "model_id": "10a4628ef8454147a54a6d97fefe3532", "version_major": 2, "version_minor": 0 }, @@ -297,7 +418,7 @@ { "cell_type": "code", "execution_count": null, - "id": "1bac3c43", + "id": "ffb2e6ba", "metadata": {}, "outputs": [], "source": [] @@ -305,7 +426,7 @@ { "cell_type": "code", "execution_count": 7, - "id": "c716c423", + "id": "9acd28b1", "metadata": { "id": "LwCshNbbeRZR" }, @@ -320,13 +441,13 @@ { "cell_type": "code", "execution_count": 8, - "id": "521e5ffb", + "id": "c009de89", "metadata": {}, "outputs": [ { "data": { "application/vnd.jupyter.widget-view+json": { - "model_id": "e2d45ce36e7743a58141aa97afa52594", + "model_id": "d7103c4475a9464cb7dd5c66a68ddbf7", "version_major": 2, "version_minor": 0 }, @@ -399,7 +520,7 @@ { "cell_type": "code", "execution_count": 9, - "id": "1a217a7a", + "id": "7b237346", "metadata": { "id": "npbIbBoLgaFX" }, @@ -426,7 +547,7 @@ { "cell_type": "code", "execution_count": 10, - "id": "5f709e78", + "id": "a08bda02", "metadata": {}, "outputs": [ { @@ -455,7 +576,7 @@ { "cell_type": "code", "execution_count": null, - "id": "9c8441aa", + "id": "154e541c", "metadata": {}, "outputs": [], "source": [] @@ -463,7 +584,7 @@ { "cell_type": "code", "execution_count": 11, - "id": "e17037d8", + "id": "411e1255", "metadata": { "colab": { "base_uri": "https://localhost:8080/" @@ -492,7 +613,7 @@ { "cell_type": "code", "execution_count": null, - "id": "24c934e4", + "id": "e3f0c2f5", "metadata": {}, "outputs": [], "source": [] @@ -500,7 +621,7 @@ { "cell_type": "code", "execution_count": 12, - "id": "176e054d", + "id": "8ab39e55", "metadata": { "colab": { "base_uri": "https://localhost:8080/", @@ -519,7 +640,7 @@ { "cell_type": "code", "execution_count": 13, - "id": "b26ff01c", + "id": "5c1c8b06", "metadata": { "id": "A1XApZBAF2zr" }, @@ -531,7 +652,7 @@ { "cell_type": "code", "execution_count": 14, - "id": "55245bee", + "id": "b4b326f8", "metadata": { "id": "kAR0-2KLkopp" }, @@ -545,7 +666,7 @@ { "cell_type": "code", "execution_count": 15, - "id": "17d24172", + "id": "30a92bc9", "metadata": { "id": "KYZtoW-tlZgl" }, @@ -559,7 +680,7 @@ { "cell_type": "code", "execution_count": 16, - "id": "6d7d04c5", + "id": "de95a6dc", "metadata": { "id": "kMv1VGCJoX8D" }, @@ -572,7 +693,7 @@ { "cell_type": "code", "execution_count": null, - "id": "3f9ac963", + "id": "6369313a", "metadata": { "colab": { "base_uri": "https://localhost:8080/", @@ -587,7 +708,7 @@ { "cell_type": "code", "execution_count": 17, - "id": "d214b124", + "id": "d74c0b80", "metadata": { "colab": { "base_uri": "https://localhost:8080/", @@ -604,7 +725,7 @@ { "cell_type": "code", "execution_count": 18, - "id": "c630337a", + "id": "a8b4ce20", "metadata": { "colab": { "base_uri": "https://localhost:8080/" @@ -616,9 +737,9 @@ { "data": { "text/plain": [ - "{'path': '/workspace/data/pscr/sound_110619_001010-1555.wav',\n", - " 'array': array([0.00177002, 0.00085449, 0.00042725, ..., 0.056427 , 0.04852295,\n", - " 0.03656006], dtype=float32),\n", + "{'path': '/workspace/data/vystadial2016/train/10/62/vad-2015-09-20--12-34-27.561625.wav',\n", + " 'array': array([ 0.00564575, 0.00588989, 0.00363159, ..., -0.01358032,\n", + " -0.01220703, -0.00946045], dtype=float32),\n", " 'sampling_rate': 16000}" ] }, @@ -634,7 +755,7 @@ { "cell_type": "code", "execution_count": 19, - "id": "e8cc7fa2", + "id": "8a006882", "metadata": { "id": "rrv65aj7G95i" }, @@ -648,7 +769,7 @@ { "cell_type": "code", "execution_count": 20, - "id": "b46aa8cd", + "id": "fc328f00", "metadata": { "colab": { "base_uri": "https://localhost:8080/" @@ -660,9 +781,9 @@ { "data": { "text/plain": [ - "{'path': '/workspace/data/pscr/sound_110619_001010-1555.wav',\n", - " 'array': array([0.00177002, 0.00085449, 0.00042725, ..., 0.056427 , 0.04852295,\n", - " 0.03656006], dtype=float32),\n", + "{'path': '/workspace/data/vystadial2016/train/10/62/vad-2015-09-20--12-34-27.561625.wav',\n", + " 'array': array([ 0.00564575, 0.00588989, 0.00363159, ..., -0.01358032,\n", + " -0.01220703, -0.00946045], dtype=float32),\n", " 'sampling_rate': 16000}" ] }, @@ -678,7 +799,7 @@ { "cell_type": "code", "execution_count": 21, - "id": "ed9fb5e2", + "id": "14fc4dc7", "metadata": { "colab": { "base_uri": "https://localhost:8080/", @@ -692,7 +813,7 @@ "name": "stdout", "output_type": "stream", "text": [ - "máš ho tady\n" + "dobrý den chtěl bych jet\n" ] }, { @@ -700,7 +821,7 @@ "text/html": [ "\n", " \n", " " @@ -728,7 +849,7 @@ { "cell_type": "code", "execution_count": 22, - "id": "1d66bd44", + "id": "5607b522", "metadata": { "id": "eJY7I0XAwe9p" }, @@ -749,7 +870,7 @@ { "cell_type": "code", "execution_count": 23, - "id": "f5360bdd", + "id": "00e34422", "metadata": { "colab": { "base_uri": "https://localhost:8080/", @@ -786,7 +907,7 @@ { "data": { "application/vnd.jupyter.widget-view+json": { - "model_id": "c97a52c72198489f89a4481f722ac35a", + "model_id": "45634e805c76453a94ffac3f287df33f", "version_major": 2, "version_minor": 0 }, @@ -813,7 +934,7 @@ { "cell_type": "code", "execution_count": 24, - "id": "5e8bb4ee", + "id": "4207ffd0", "metadata": { "id": "tborvC9hx88e" }, @@ -874,7 +995,7 @@ { "cell_type": "code", "execution_count": 25, - "id": "98dfd52e", + "id": "2b346d91", "metadata": { "id": "lbQf5GuZyQ4_" }, @@ -886,7 +1007,7 @@ { "cell_type": "code", "execution_count": 26, - "id": "5efc8697", + "id": "3afc8d2a", "metadata": { "id": "9Xsux2gmyXso" }, @@ -902,7 +1023,7 @@ { "cell_type": "code", "execution_count": 27, - "id": "ec29ec29", + "id": "9119abc6", "metadata": { "id": "1XZ-kjweyTy_" }, @@ -927,7 +1048,7 @@ { "cell_type": "code", "execution_count": 28, - "id": "d6d68f86", + "id": "172587ca", "metadata": { "colab": { "base_uri": "https://localhost:8080/" @@ -940,7 +1061,7 @@ "name": "stderr", "output_type": "stream", "text": [ - "Some weights of the model checkpoint at facebook/wav2vec2-xls-r-300m were not used when initializing Wav2Vec2ForCTC: ['project_hid.weight', 'quantizer.weight_proj.bias', 'quantizer.codevectors', 'quantizer.weight_proj.weight', 'project_q.bias', 'project_hid.bias', 'project_q.weight']\n", + "Some weights of the model checkpoint at facebook/wav2vec2-xls-r-300m were not used when initializing Wav2Vec2ForCTC: ['project_hid.bias', 'project_q.weight', 'quantizer.weight_proj.bias', 'project_hid.weight', 'quantizer.weight_proj.weight', 'project_q.bias', 'quantizer.codevectors']\n", "- This IS expected if you are initializing Wav2Vec2ForCTC from the checkpoint of a model trained on another task or with another architecture (e.g. initializing a BertForSequenceClassification model from a BertForPreTraining model).\n", "- This IS NOT expected if you are initializing Wav2Vec2ForCTC from the checkpoint of a model that you expect to be exactly identical (initializing a BertForSequenceClassification model from a BertForSequenceClassification model).\n", "Some weights of Wav2Vec2ForCTC were not initialized from the model checkpoint at facebook/wav2vec2-xls-r-300m and are newly initialized: ['lm_head.weight', 'lm_head.bias']\n", @@ -955,7 +1076,7 @@ " #\"comodoro/wav2vec2-xls-r-300m-cs-cv8\", \n", " \"facebook/wav2vec2-xls-r-300m\", \n", " attention_dropout=0.1,\n", - " hidden_dropout=0.1,\n", + " hidden_dropout=0.2,\n", " feat_proj_dropout=0.0,\n", " mask_time_prob=0.1,\n", " layerdrop=0.1,\n", @@ -968,7 +1089,7 @@ { "cell_type": "code", "execution_count": 29, - "id": "23d91592", + "id": "94625b79", "metadata": { "id": "oGI8zObtZ3V0" }, @@ -989,7 +1110,7 @@ { "cell_type": "code", "execution_count": 30, - "id": "bf112a3a", + "id": "9c173ad4", "metadata": { "id": "KbeKSV7uzGPP" }, @@ -1000,18 +1121,18 @@ "training_args = TrainingArguments(\n", " output_dir=repo_name,\n", " group_by_length=True,\n", - " per_device_train_batch_size=16,\n", + " per_device_train_batch_size=32,\n", " gradient_accumulation_steps=1,\n", " eval_accumulation_steps=1,\n", " evaluation_strategy=\"steps\",\n", - " num_train_epochs=50,\n", + " num_train_epochs=5,\n", " gradient_checkpointing=True,\n", " fp16=True,\n", " save_steps=800,\n", " eval_steps=800,\n", " logging_steps=250,\n", - " learning_rate=1e-5,\n", - " warmup_steps=600,\n", + " learning_rate=1e-4,\n", + " warmup_steps=800,\n", " save_total_limit=2,\n", " report_to=\"tensorboard\"\n", ")" @@ -1020,7 +1141,7 @@ { "cell_type": "code", "execution_count": 31, - "id": "6d209cae", + "id": "38cc611b", "metadata": { "colab": { "base_uri": "https://localhost:8080/" @@ -1054,7 +1175,7 @@ { "cell_type": "code", "execution_count": 32, - "id": "350ccf96", + "id": "ab7b22fa", "metadata": { "colab": { "base_uri": "https://localhost:8080/", @@ -1073,11 +1194,11 @@ " warnings.warn(\n", "***** Running training *****\n", " Num examples = 159605\n", - " Num Epochs = 50\n", - " Instantaneous batch size per device = 16\n", - " Total train batch size (w. parallel, distributed & accumulation) = 16\n", + " Num Epochs = 5\n", + " Instantaneous batch size per device = 32\n", + " Total train batch size (w. parallel, distributed & accumulation) = 32\n", " Gradient Accumulation steps = 1\n", - " Total optimization steps = 498800\n" + " Total optimization steps = 24940\n" ] }, { @@ -1086,8 +1207,8 @@ "\n", "
800 | \n", - "4.750000 | \n", - "3.766450 | \n", + "3.420300 | \n", + "3.314820 | \n", "1.000000 | \n", "1.000000 | \n", "||
1600 | \n", - "3.479800 | \n", - "3.361168 | \n", - "1.000000 | \n", - "1.000000 | \n", + "2.815100 | \n", + "0.850840 | \n", + "0.893788 | \n", + "0.234479 | \n", "
2400 | \n", - "3.331700 | \n", - "3.301482 | \n", - "1.000000 | \n", - "1.000000 | \n", + "0.941100 | \n", + "0.333538 | \n", + "0.372315 | \n", + "0.084735 | \n", "
3200 | \n", - "3.197300 | \n", - "2.584765 | \n", - "0.999802 | \n", - "0.856619 | \n", + "0.740800 | \n", + "0.257277 | \n", + "0.283963 | \n", + "0.064233 | \n", "
4000 | \n", - "1.807400 | \n", - "0.908614 | \n", - "0.640853 | \n", - "0.151860 | \n", + "0.651600 | \n", + "0.236474 | \n", + "0.258103 | \n", + "0.059464 | \n", "
4800 | \n", - "1.342100 | \n", - "0.550420 | \n", - "0.432450 | \n", - "0.095473 | \n", + "0.624200 | \n", + "0.203933 | \n", + "0.243332 | \n", + "0.054062 | \n", "
5600 | \n", - "1.132700 | \n", - "0.394087 | \n", - "0.347781 | \n", - "0.073488 | \n", + "0.575400 | \n", + "0.183210 | \n", + "0.215611 | \n", + "0.048234 | \n", "
6400 | \n", - "0.999300 | \n", - "0.323176 | \n", - "0.293804 | \n", - "0.061316 | \n", + "0.562600 | \n", + "0.182699 | \n", + "0.209116 | \n", + "0.046281 | \n", "
7200 | \n", - "0.928100 | \n", - "0.273187 | \n", - "0.263014 | \n", - "0.054848 | \n", + "0.534200 | \n", + "0.174398 | \n", + "0.203315 | \n", + "0.046776 | \n", "
8000 | \n", - "0.897600 | \n", - "0.244686 | \n", - "0.247510 | \n", - "0.051767 | \n", + "0.496500 | \n", + "0.170528 | \n", + "0.196285 | \n", + "0.044429 | \n", "
8800 | \n", - "0.813400 | \n", - "0.227193 | \n", - "0.236362 | \n", - "0.049280 | \n", + "0.504700 | \n", + "0.160374 | \n", + "0.188880 | \n", + "0.042167 | \n", "
9600 | \n", - "0.775800 | \n", - "0.211454 | \n", - "0.225769 | \n", - "0.047510 | \n", + "0.481400 | \n", + "0.160427 | \n", + "0.182742 | \n", + "0.041052 | \n", "
10400 | \n", - "0.757200 | \n", - "0.200528 | \n", - "0.216522 | \n", - "0.045622 | \n", + "0.447100 | \n", + "0.156585 | \n", + "0.182207 | \n", + "0.040592 | \n", "
11200 | \n", - "0.729700 | \n", - "0.194056 | \n", - "0.210582 | \n", - "0.044185 | \n", + "0.450900 | \n", + "0.161888 | \n", + "0.185296 | \n", + "0.043243 | \n", "
12000 | \n", - "0.698300 | \n", - "0.189558 | \n", - "0.205671 | \n", - "0.043360 | \n", + "0.441500 | \n", + "0.151254 | \n", + "0.176386 | \n", + "0.039725 | \n", "
12800 | \n", - "0.681800 | \n", - "0.180987 | \n", - "0.198444 | \n", - "0.042125 | \n", + "0.431300 | \n", + "0.151478 | \n", + "0.173930 | \n", + "0.039213 | \n", "
13600 | \n", - "0.644600 | \n", - "0.176266 | \n", - "0.191612 | \n", - "0.040599 | \n", + "0.416300 | \n", + "0.144519 | \n", + "0.169515 | \n", + "0.037672 | \n", "
14400 | \n", - "0.645400 | \n", - "0.167550 | \n", - "0.188999 | \n", - "0.040012 | \n", + "0.414200 | \n", + "0.147759 | \n", + "0.169871 | \n", + "0.038473 | \n", "
15200 | \n", - "0.646100 | \n", - "0.166065 | \n", - "0.182326 | \n", - "0.038584 | \n", + "0.418400 | \n", + "0.143047 | \n", + "0.166921 | \n", + "0.037583 | \n", "
16000 | \n", - "0.648300 | \n", - "0.165056 | \n", - "0.180920 | \n", - "0.038490 | \n", + "0.388600 | \n", + "0.143273 | \n", + "0.164426 | \n", + "0.037388 | \n", "
16800 | \n", - "0.622600 | \n", - "0.158542 | \n", - "0.178583 | \n", - "0.038353 | \n", + "0.379500 | \n", + "0.142606 | \n", + "0.164822 | \n", + "0.037258 | \n", "
17600 | \n", - "0.602400 | \n", - "0.152548 | \n", - "0.174485 | \n", - "0.037284 | \n", + "0.385900 | \n", + "0.135660 | \n", + "0.160446 | \n", + "0.036143 | \n", "
18400 | \n", - "0.615900 | \n", - "0.153470 | \n", - "0.174366 | \n", - "0.037303 | \n", + "0.376200 | \n", + "0.134396 | \n", + "0.155832 | \n", + "0.034930 | \n", "
19200 | \n", - "0.587300 | \n", - "0.149551 | \n", - "0.169594 | \n", - "0.036240 | \n", + "0.384000 | \n", + "0.137933 | \n", + "0.157595 | \n", + "0.035875 | \n", "
20000 | \n", - "0.582300 | \n", - "0.147552 | \n", - "0.169594 | \n", - "0.036146 | \n", + "0.376200 | \n", + "0.134363 | \n", + "0.153892 | \n", + "0.034552 | \n", "
20800 | \n", - "0.541400 | \n", - "0.145685 | \n", - "0.167792 | \n", - "0.035813 | \n", + "0.355900 | \n", + "0.133945 | \n", + "0.152526 | \n", + "0.035080 | \n", "
21600 | \n", - "0.571100 | \n", - "0.146135 | \n", - "0.167455 | \n", - "0.036029 | \n", + "0.368300 | \n", + "0.131489 | \n", + "0.151753 | \n", + "0.034226 | \n", "
22400 | \n", - "0.565000 | \n", - "0.142886 | \n", - "0.164624 | \n", - "0.035194 | \n", + "0.357200 | \n", + "0.130721 | \n", + "0.150664 | \n", + "0.034154 | \n", "
23200 | \n", - "0.555500 | \n", - "0.141050 | \n", - "0.162901 | \n", - "0.034871 | \n", + "0.349400 | \n", + "0.129449 | \n", + "0.149100 | \n", + "0.033476 | \n", "
24000 | \n", - "0.522600 | \n", - "0.140978 | \n", - "0.162050 | \n", - "0.034359 | \n", + "0.347600 | \n", + "0.128731 | \n", + "0.149120 | \n", + "0.033597 | \n", "
24800 | \n", - "0.535000 | \n", - "0.137778 | \n", - "0.160585 | \n", - "0.035011 | \n", - "||||
25600 | \n", - "0.552500 | \n", - "0.136405 | \n", - "0.159119 | \n", - "0.034666 | \n", - "||||
26400 | \n", - "0.519000 | \n", - "0.138575 | \n", - "0.157397 | \n", - "0.034004 | \n", - "||||
27200 | \n", - "0.522700 | \n", - "0.132574 | \n", - "0.159060 | \n", - "0.034317 | \n", - "||||
28000 | \n", - "0.493100 | \n", - "0.133862 | \n", - "0.155753 | \n", - "0.033766 | \n", - "||||
28800 | \n", - "0.494900 | \n", - "0.132223 | \n", - "0.154723 | \n", - "0.033183 | \n", - "||||
29600 | \n", - "0.509100 | \n", - "0.131310 | \n", - "0.153535 | \n", - "0.033147 | \n", - "||||
30400 | \n", - "0.487900 | \n", - "0.128967 | \n", - "0.150704 | \n", - "0.032260 | \n", - "||||
31200 | \n", - "0.500500 | \n", - "0.130414 | \n", - "0.151654 | \n", - "0.032628 | \n", + "0.347500 | \n", + "0.127098 | \n", + "0.147457 | \n", + "0.032896 | \n", "
"
@@ -1395,7 +1460,7 @@
"Configuration saved in wav2vec2-xls-r-300m-cs-250/checkpoint-800/config.json\n",
"Model weights saved in wav2vec2-xls-r-300m-cs-250/checkpoint-800/pytorch_model.bin\n",
"Configuration saved in wav2vec2-xls-r-300m-cs-250/checkpoint-800/preprocessor_config.json\n",
- "Deleting older checkpoint [wav2vec2-xls-r-300m-cs-250/checkpoint-4000] due to args.save_total_limit\n",
+ "Deleting older checkpoint [wav2vec2-xls-r-300m-cs-250/checkpoint-30400] due to args.save_total_limit\n",
"The following columns in the evaluation set don't have a corresponding argument in `Wav2Vec2ForCTC.forward` and have been ignored: input_length.\n",
"***** Running Evaluation *****\n",
" Num examples = 7267\n",
@@ -1404,7 +1469,7 @@
"Configuration saved in wav2vec2-xls-r-300m-cs-250/checkpoint-1600/config.json\n",
"Model weights saved in wav2vec2-xls-r-300m-cs-250/checkpoint-1600/pytorch_model.bin\n",
"Configuration saved in wav2vec2-xls-r-300m-cs-250/checkpoint-1600/preprocessor_config.json\n",
- "Deleting older checkpoint [wav2vec2-xls-r-300m-cs-250/checkpoint-4800] due to args.save_total_limit\n",
+ "Deleting older checkpoint [wav2vec2-xls-r-300m-cs-250/checkpoint-31200] due to args.save_total_limit\n",
"The following columns in the evaluation set don't have a corresponding argument in `Wav2Vec2ForCTC.forward` and have been ignored: input_length.\n",
"***** Running Evaluation *****\n",
" Num examples = 7267\n",
@@ -1666,101 +1731,22 @@
"Model weights saved in wav2vec2-xls-r-300m-cs-250/checkpoint-24800/pytorch_model.bin\n",
"Configuration saved in wav2vec2-xls-r-300m-cs-250/checkpoint-24800/preprocessor_config.json\n",
"Deleting older checkpoint [wav2vec2-xls-r-300m-cs-250/checkpoint-23200] due to args.save_total_limit\n",
- "The following columns in the evaluation set don't have a corresponding argument in `Wav2Vec2ForCTC.forward` and have been ignored: input_length.\n",
- "***** Running Evaluation *****\n",
- " Num examples = 7267\n",
- " Batch size = 8\n",
- "Saving model checkpoint to wav2vec2-xls-r-300m-cs-250/checkpoint-25600\n",
- "Configuration saved in wav2vec2-xls-r-300m-cs-250/checkpoint-25600/config.json\n",
- "Model weights saved in wav2vec2-xls-r-300m-cs-250/checkpoint-25600/pytorch_model.bin\n",
- "Configuration saved in wav2vec2-xls-r-300m-cs-250/checkpoint-25600/preprocessor_config.json\n",
- "Deleting older checkpoint [wav2vec2-xls-r-300m-cs-250/checkpoint-24000] due to args.save_total_limit\n",
- "The following columns in the evaluation set don't have a corresponding argument in `Wav2Vec2ForCTC.forward` and have been ignored: input_length.\n",
- "***** Running Evaluation *****\n",
- " Num examples = 7267\n",
- " Batch size = 8\n",
- "Saving model checkpoint to wav2vec2-xls-r-300m-cs-250/checkpoint-26400\n",
- "Configuration saved in wav2vec2-xls-r-300m-cs-250/checkpoint-26400/config.json\n",
- "Model weights saved in wav2vec2-xls-r-300m-cs-250/checkpoint-26400/pytorch_model.bin\n",
- "Configuration saved in wav2vec2-xls-r-300m-cs-250/checkpoint-26400/preprocessor_config.json\n",
- "Deleting older checkpoint [wav2vec2-xls-r-300m-cs-250/checkpoint-24800] due to args.save_total_limit\n",
- "The following columns in the evaluation set don't have a corresponding argument in `Wav2Vec2ForCTC.forward` and have been ignored: input_length.\n",
- "***** Running Evaluation *****\n",
- " Num examples = 7267\n",
- " Batch size = 8\n",
- "Saving model checkpoint to wav2vec2-xls-r-300m-cs-250/checkpoint-27200\n",
- "Configuration saved in wav2vec2-xls-r-300m-cs-250/checkpoint-27200/config.json\n",
- "Model weights saved in wav2vec2-xls-r-300m-cs-250/checkpoint-27200/pytorch_model.bin\n",
- "Configuration saved in wav2vec2-xls-r-300m-cs-250/checkpoint-27200/preprocessor_config.json\n",
- "Deleting older checkpoint [wav2vec2-xls-r-300m-cs-250/checkpoint-25600] due to args.save_total_limit\n",
- "The following columns in the evaluation set don't have a corresponding argument in `Wav2Vec2ForCTC.forward` and have been ignored: input_length.\n",
- "***** Running Evaluation *****\n",
- " Num examples = 7267\n",
- " Batch size = 8\n",
- "Saving model checkpoint to wav2vec2-xls-r-300m-cs-250/checkpoint-28000\n",
- "Configuration saved in wav2vec2-xls-r-300m-cs-250/checkpoint-28000/config.json\n",
- "Model weights saved in wav2vec2-xls-r-300m-cs-250/checkpoint-28000/pytorch_model.bin\n",
- "Configuration saved in wav2vec2-xls-r-300m-cs-250/checkpoint-28000/preprocessor_config.json\n",
- "Deleting older checkpoint [wav2vec2-xls-r-300m-cs-250/checkpoint-26400] due to args.save_total_limit\n",
- "The following columns in the evaluation set don't have a corresponding argument in `Wav2Vec2ForCTC.forward` and have been ignored: input_length.\n",
- "***** Running Evaluation *****\n",
- " Num examples = 7267\n",
- " Batch size = 8\n",
- "Saving model checkpoint to wav2vec2-xls-r-300m-cs-250/checkpoint-28800\n",
- "Configuration saved in wav2vec2-xls-r-300m-cs-250/checkpoint-28800/config.json\n",
- "Model weights saved in wav2vec2-xls-r-300m-cs-250/checkpoint-28800/pytorch_model.bin\n",
- "Configuration saved in wav2vec2-xls-r-300m-cs-250/checkpoint-28800/preprocessor_config.json\n",
- "Deleting older checkpoint [wav2vec2-xls-r-300m-cs-250/checkpoint-27200] due to args.save_total_limit\n",
- "The following columns in the evaluation set don't have a corresponding argument in `Wav2Vec2ForCTC.forward` and have been ignored: input_length.\n",
- "***** Running Evaluation *****\n",
- " Num examples = 7267\n",
- " Batch size = 8\n",
- "Saving model checkpoint to wav2vec2-xls-r-300m-cs-250/checkpoint-29600\n",
- "Configuration saved in wav2vec2-xls-r-300m-cs-250/checkpoint-29600/config.json\n",
- "Model weights saved in wav2vec2-xls-r-300m-cs-250/checkpoint-29600/pytorch_model.bin\n",
- "Configuration saved in wav2vec2-xls-r-300m-cs-250/checkpoint-29600/preprocessor_config.json\n",
- "Deleting older checkpoint [wav2vec2-xls-r-300m-cs-250/checkpoint-28000] due to args.save_total_limit\n",
- "The following columns in the evaluation set don't have a corresponding argument in `Wav2Vec2ForCTC.forward` and have been ignored: input_length.\n",
- "***** Running Evaluation *****\n",
- " Num examples = 7267\n",
- " Batch size = 8\n",
- "Saving model checkpoint to wav2vec2-xls-r-300m-cs-250/checkpoint-30400\n",
- "Configuration saved in wav2vec2-xls-r-300m-cs-250/checkpoint-30400/config.json\n",
- "Model weights saved in wav2vec2-xls-r-300m-cs-250/checkpoint-30400/pytorch_model.bin\n",
- "Configuration saved in wav2vec2-xls-r-300m-cs-250/checkpoint-30400/preprocessor_config.json\n",
- "Deleting older checkpoint [wav2vec2-xls-r-300m-cs-250/checkpoint-28800] due to args.save_total_limit\n",
- "The following columns in the evaluation set don't have a corresponding argument in `Wav2Vec2ForCTC.forward` and have been ignored: input_length.\n",
- "***** Running Evaluation *****\n",
- " Num examples = 7267\n",
- " Batch size = 8\n",
- "Saving model checkpoint to wav2vec2-xls-r-300m-cs-250/checkpoint-31200\n",
- "Configuration saved in wav2vec2-xls-r-300m-cs-250/checkpoint-31200/config.json\n",
- "Model weights saved in wav2vec2-xls-r-300m-cs-250/checkpoint-31200/pytorch_model.bin\n",
- "Configuration saved in wav2vec2-xls-r-300m-cs-250/checkpoint-31200/preprocessor_config.json\n",
- "Deleting older checkpoint [wav2vec2-xls-r-300m-cs-250/checkpoint-29600] due to args.save_total_limit\n"
+ "\n",
+ "\n",
+ "Training completed. Do not forget to share your model on huggingface.co/models =)\n",
+ "\n",
+ "\n"
]
},
{
- "ename": "KeyboardInterrupt",
- "evalue": "",
- "output_type": "error",
- "traceback": [
- "\u001b[0;31m---------------------------------------------------------------------------\u001b[0m",
- "\u001b[0;31mKeyboardInterrupt\u001b[0m Traceback (most recent call last)",
- "\u001b[0;32m