Training in progress, step 1000

Files changed:
- added_tokens.json +1 -2
- nohup.out +0 -0
- pytorch_model.bin +1 -1
- run.sh +1 -1
- runs/Jul20_11-05-05_tknadmin-System-Product-Name/1689843926.5927894/events.out.tfevents.1689843926.tknadmin-System-Product-Name.2399.1 +3 -0
- runs/Jul20_11-05-05_tknadmin-System-Product-Name/events.out.tfevents.1689843926.tknadmin-System-Product-Name.2399.0 +3 -0
- special_tokens_map.json +2 -2
- tokenizer_config.json +1 -1
- training_args.bin +1 -1
- vocab.json +1 -0
added_tokens.json
CHANGED
@@ -17,7 +17,6 @@
   "<|da|>": 50285,
   "<|de|>": 50261,
   "<|el|>": 50281,
-  "<|endoftext|>": 50257,
   "<|en|>": 50259,
   "<|es|>": 50262,
   "<|et|>": 50307,
@@ -30,6 +29,7 @@
   "<|gu|>": 50333,
   "<|haw|>": 50352,
   "<|ha|>": 50354,
+  "<|he|>": 50279,
   "<|hi|>": 50276,
   "<|hr|>": 50291,
   "<|ht|>": 50339,
@@ -38,7 +38,6 @@
   "<|id|>": 50275,
   "<|is|>": 50311,
   "<|it|>": 50274,
-  "<|iw|>": 50279,
   "<|ja|>": 50266,
   "<|jw|>": 50356,
   "<|ka|>": 50329,
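Net effect of this diff: the deprecated ISO 639 code <|iw|> is dropped in favor of <|he|> for Hebrew (both map to id 50279), and <|endoftext|> moves out of added_tokens.json into the base vocabulary (see the vocab.json hunk below). A minimal sketch to confirm the remap after pulling this checkpoint; the repo id is a placeholder, not taken from the diff:

# Minimal sketch, assuming transformers is installed; the repo id below is hypothetical.
from transformers import WhisperTokenizer

tokenizer = WhisperTokenizer.from_pretrained("your-username/whisper-small-eu")

# <|he|> now holds the id the deprecated <|iw|> alias used to occupy.
assert tokenizer.convert_tokens_to_ids("<|he|>") == 50279
# The removed alias should no longer appear among the added tokens.
assert "<|iw|>" not in tokenizer.get_added_vocab()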
nohup.out
ADDED
The diff for this file is too large to render. See raw diff.
pytorch_model.bin
CHANGED
@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:
+oid sha256:dde53cf5fed853761b41e7ea0af91878d15f20c79d2499a3c3bf33d1288db232
 size 967102601
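pytorch_model.bin is tracked with Git LFS, so the commit only rewrites the three-line pointer file; the oid is the SHA-256 of the actual 967 MB checkpoint (the old hash is truncated in this view). A small sketch for verifying a downloaded weight file against the pointer's oid:

# Sketch: hash a downloaded LFS object and compare it to the pointer's oid.
import hashlib

def sha256_of(path, chunk_size=1 << 20):
    h = hashlib.sha256()
    with open(path, "rb") as f:
        for chunk in iter(lambda: f.read(chunk_size), b""):
            h.update(chunk)
    return h.hexdigest()

expected = "dde53cf5fed853761b41e7ea0af91878d15f20c79d2499a3c3bf33d1288db232"
assert sha256_of("pytorch_model.bin") == expected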
run.sh
CHANGED
@@ -1,6 +1,6 @@
 python run_speech_recognition_seq2seq_streaming.py \
 	--model_name_or_path="openai/whisper-small" \
-	--dataset_name="mozilla-foundation/
+	--dataset_name="mozilla-foundation/common_voice_13_0" \
 	--dataset_config_name="eu" \
 	--language="basque" \
 	--train_split_name="train+validation" \
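The only change to run.sh pins the dataset id to mozilla-foundation/common_voice_13_0 (the old value is cut off in this view). For a "train+validation" split in streaming mode, the script presumably loads each split separately and interleaves them, roughly as in this sketch; the exact mechanics inside run_speech_recognition_seq2seq_streaming.py are an assumption here:

# Sketch of the streaming load implied by the run.sh flags; this mirrors a common
# pattern for combining splits in streaming mode, not necessarily the script's code.
from datasets import interleave_datasets, load_dataset

splits = [
    load_dataset(
        "mozilla-foundation/common_voice_13_0",  # --dataset_name
        "eu",                                    # --dataset_config_name
        split=name,
        streaming=True,
    )
    for name in "train+validation".split("+")    # --train_split_name
]
train = interleave_datasets(splits)
# One Basque Common Voice example; the dataset is gated, so Hub login may be required.
print(next(iter(train)))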
runs/Jul20_11-05-05_tknadmin-System-Product-Name/1689843926.5927894/events.out.tfevents.1689843926.tknadmin-System-Product-Name.2399.1
ADDED
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:4da669066da0745142fafdae02990c3ba43e82dcf98bd6ded128e5f548f9536f
+size 5884
runs/Jul20_11-05-05_tknadmin-System-Product-Name/events.out.tfevents.1689843926.tknadmin-System-Product-Name.2399.0
ADDED
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:b34c8a964304c86412222ffbf172dded1cd8302326d17eb5246c5ec42d396c61
+size 10864
special_tokens_map.json
CHANGED
@@ -22,7 +22,7 @@
   "<|hi|>",
   "<|fi|>",
   "<|vi|>",
-  "<|
+  "<|he|>",
   "<|uk|>",
   "<|el|>",
   "<|ms|>",
@@ -124,7 +124,7 @@
   },
   "pad_token": "<|endoftext|>",
   "unk_token": {
-    "content": "",
+    "content": "<|endoftext|>",
     "lstrip": false,
     "normalized": true,
     "rstrip": false,
tokenizer_config.json
CHANGED
@@ -27,7 +27,7 @@
   "tokenizer_class": "WhisperTokenizer",
   "unk_token": {
     "__type": "AddedToken",
-    "content": "",
+    "content": "<|endoftext|>",
     "lstrip": false,
     "normalized": true,
     "rstrip": false,
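special_tokens_map.json and tokenizer_config.json make the same fix: the unk_token content was an empty string and now follows Whisper's convention of reusing <|endoftext|>, which also serves as the pad token. A quick sanity check, again with a placeholder repo id:

# Sketch: the unk and pad tokens should now both resolve to <|endoftext|> (id 50257).
from transformers import WhisperTokenizer

tokenizer = WhisperTokenizer.from_pretrained("your-username/whisper-small-eu")  # hypothetical repo id
assert tokenizer.unk_token == "<|endoftext|>"
assert tokenizer.unk_token_id == tokenizer.pad_token_id == 50257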
training_args.bin
CHANGED
@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:
+oid sha256:3d621f52817860d9aa272439631c6b2bfec18ad203c2627c0ed03f1989afcad1
 size 3643
vocab.json
CHANGED
@@ -314,6 +314,7 @@
   ";;": 35746,
   "<": 27,
   "</": 3433,
+  "<|endoftext|>": 50257,
   "=": 28,
   "=\"": 13114,
   "=\"#": 34106,
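With this hunk, <|endoftext|> lives in the base vocabulary instead of added_tokens.json; its id stays 50257 either way. Checking the raw file directly, as a sketch:

# Sketch: inspect the raw vocab file from a local clone of the repo.
import json

with open("vocab.json") as f:
    vocab = json.load(f)
assert vocab["<|endoftext|>"] == 50257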