Training in progress, epoch 1
Browse files- config.json +45 -159
- model.safetensors +2 -2
- preprocessor_config.json +3 -3
- runs/Jun24_13-45-10_ip-10-192-12-219/events.out.tfevents.1750772727.ip-10-192-12-219.20599.0 +3 -0
- runs/Jun24_15-23-31_ip-10-192-12-219/events.out.tfevents.1750778629.ip-10-192-12-219.113148.0 +3 -0
- runs/Jun24_15-26-40_ip-10-192-12-219/events.out.tfevents.1750778817.ip-10-192-12-219.113148.1 +3 -0
- training_args.bin +2 -2
config.json
CHANGED
|
@@ -3,178 +3,64 @@
|
|
| 3 |
"ASTForAudioClassification"
|
| 4 |
],
|
| 5 |
"attention_probs_dropout_prob": 0.0,
|
| 6 |
-
"frequency_stride":
|
| 7 |
"hidden_act": "gelu",
|
| 8 |
"hidden_dropout_prob": 0.0,
|
| 9 |
"hidden_size": 768,
|
| 10 |
"id2label": {
|
| 11 |
"0": "_silence_",
|
| 12 |
"1": "_unknown_",
|
| 13 |
-
"10": "
|
| 14 |
-
"11": "
|
| 15 |
-
"12": "
|
| 16 |
-
"13": "
|
| 17 |
-
"14": "
|
| 18 |
-
"15": "
|
| 19 |
-
"16": "
|
| 20 |
-
"17": "
|
| 21 |
-
"18": "
|
| 22 |
-
"19": "
|
| 23 |
-
"2": "
|
| 24 |
-
"20": "
|
| 25 |
-
"21": "
|
| 26 |
-
"22": "
|
| 27 |
-
"
|
| 28 |
-
"
|
| 29 |
-
"
|
| 30 |
-
"
|
| 31 |
-
"
|
| 32 |
-
"
|
| 33 |
-
"
|
| 34 |
-
"3": "apple",
|
| 35 |
-
"30": "iron",
|
| 36 |
-
"31": "jelly",
|
| 37 |
-
"32": "juice",
|
| 38 |
-
"33": "jump",
|
| 39 |
-
"34": "key",
|
| 40 |
-
"35": "kid",
|
| 41 |
-
"36": "kite",
|
| 42 |
-
"37": "lamp",
|
| 43 |
-
"38": "leaf",
|
| 44 |
-
"39": "lion",
|
| 45 |
-
"4": "arm",
|
| 46 |
-
"40": "milk",
|
| 47 |
-
"41": "monkey",
|
| 48 |
-
"42": "moon",
|
| 49 |
-
"43": "nest",
|
| 50 |
-
"44": "net",
|
| 51 |
-
"45": "nose",
|
| 52 |
-
"46": "ocean",
|
| 53 |
-
"47": "open",
|
| 54 |
-
"48": "orange",
|
| 55 |
-
"49": "pen",
|
| 56 |
-
"5": "ball",
|
| 57 |
-
"50": "pig",
|
| 58 |
-
"51": "pizza",
|
| 59 |
-
"52": "queen",
|
| 60 |
-
"53": "question",
|
| 61 |
-
"54": "quiet",
|
| 62 |
-
"55": "red",
|
| 63 |
-
"56": "room",
|
| 64 |
-
"57": "run",
|
| 65 |
-
"58": "six",
|
| 66 |
-
"59": "snake",
|
| 67 |
-
"6": "bear",
|
| 68 |
-
"60": "star",
|
| 69 |
-
"61": "sun",
|
| 70 |
-
"62": "tiger",
|
| 71 |
-
"63": "toy",
|
| 72 |
-
"64": "tree",
|
| 73 |
-
"65": "umbrella",
|
| 74 |
-
"66": "under",
|
| 75 |
-
"67": "unlike",
|
| 76 |
-
"68": "van",
|
| 77 |
-
"69": "vest",
|
| 78 |
-
"7": "bed",
|
| 79 |
-
"70": "violin",
|
| 80 |
-
"71": "water",
|
| 81 |
-
"72": "white",
|
| 82 |
-
"73": "window",
|
| 83 |
-
"74": "year",
|
| 84 |
-
"75": "yellow",
|
| 85 |
-
"76": "youth",
|
| 86 |
-
"77": "zero",
|
| 87 |
-
"78": "zone",
|
| 88 |
-
"79": "zoo",
|
| 89 |
-
"8": "box",
|
| 90 |
-
"9": "cake"
|
| 91 |
},
|
| 92 |
"initializer_range": 0.02,
|
| 93 |
"intermediate_size": 3072,
|
| 94 |
"label2id": {
|
| 95 |
"_silence_": "0",
|
| 96 |
"_unknown_": "1",
|
| 97 |
-
"
|
| 98 |
-
"
|
| 99 |
-
"
|
| 100 |
-
"
|
| 101 |
-
"
|
| 102 |
-
"
|
| 103 |
-
"
|
| 104 |
-
"
|
| 105 |
-
"
|
| 106 |
-
"
|
| 107 |
-
"
|
| 108 |
-
"
|
| 109 |
-
"
|
| 110 |
-
"
|
| 111 |
-
"
|
| 112 |
-
"
|
| 113 |
-
"
|
| 114 |
-
"
|
| 115 |
-
"
|
| 116 |
-
"
|
| 117 |
-
"
|
| 118 |
-
"gate": "23",
|
| 119 |
-
"gold": "24",
|
| 120 |
-
"hand": "25",
|
| 121 |
-
"hat": "26",
|
| 122 |
-
"home": "27",
|
| 123 |
-
"ice": "28",
|
| 124 |
-
"ill": "29",
|
| 125 |
-
"iron": "30",
|
| 126 |
-
"jelly": "31",
|
| 127 |
-
"juice": "32",
|
| 128 |
-
"jump": "33",
|
| 129 |
-
"key": "34",
|
| 130 |
-
"kid": "35",
|
| 131 |
-
"kite": "36",
|
| 132 |
-
"lamp": "37",
|
| 133 |
-
"leaf": "38",
|
| 134 |
-
"lion": "39",
|
| 135 |
-
"milk": "40",
|
| 136 |
-
"monkey": "41",
|
| 137 |
-
"moon": "42",
|
| 138 |
-
"nest": "43",
|
| 139 |
-
"net": "44",
|
| 140 |
-
"nose": "45",
|
| 141 |
-
"ocean": "46",
|
| 142 |
-
"open": "47",
|
| 143 |
-
"orange": "48",
|
| 144 |
-
"pen": "49",
|
| 145 |
-
"pig": "50",
|
| 146 |
-
"pizza": "51",
|
| 147 |
-
"queen": "52",
|
| 148 |
-
"question": "53",
|
| 149 |
-
"quiet": "54",
|
| 150 |
-
"red": "55",
|
| 151 |
-
"room": "56",
|
| 152 |
-
"run": "57",
|
| 153 |
-
"six": "58",
|
| 154 |
-
"snake": "59",
|
| 155 |
-
"star": "60",
|
| 156 |
-
"sun": "61",
|
| 157 |
-
"tiger": "62",
|
| 158 |
-
"toy": "63",
|
| 159 |
-
"tree": "64",
|
| 160 |
-
"umbrella": "65",
|
| 161 |
-
"under": "66",
|
| 162 |
-
"unlike": "67",
|
| 163 |
-
"van": "68",
|
| 164 |
-
"vest": "69",
|
| 165 |
-
"violin": "70",
|
| 166 |
-
"water": "71",
|
| 167 |
-
"white": "72",
|
| 168 |
-
"window": "73",
|
| 169 |
-
"year": "74",
|
| 170 |
-
"yellow": "75",
|
| 171 |
-
"youth": "76",
|
| 172 |
-
"zero": "77",
|
| 173 |
-
"zone": "78",
|
| 174 |
-
"zoo": "79"
|
| 175 |
},
|
| 176 |
"layer_norm_eps": 1e-12,
|
| 177 |
-
"max_length":
|
| 178 |
"model_type": "audio-spectrogram-transformer",
|
| 179 |
"num_attention_heads": 12,
|
| 180 |
"num_hidden_layers": 12,
|
|
@@ -182,7 +68,7 @@
|
|
| 182 |
"patch_size": 16,
|
| 183 |
"problem_type": "single_label_classification",
|
| 184 |
"qkv_bias": true,
|
| 185 |
-
"time_stride":
|
| 186 |
"torch_dtype": "float32",
|
| 187 |
"transformers_version": "4.51.3"
|
| 188 |
}
|
|
|
|
| 3 |
"ASTForAudioClassification"
|
| 4 |
],
|
| 5 |
"attention_probs_dropout_prob": 0.0,
|
| 6 |
+
"frequency_stride": 12,
|
| 7 |
"hidden_act": "gelu",
|
| 8 |
"hidden_dropout_prob": 0.0,
|
| 9 |
"hidden_size": 768,
|
| 10 |
"id2label": {
|
| 11 |
"0": "_silence_",
|
| 12 |
"1": "_unknown_",
|
| 13 |
+
"10": "four",
|
| 14 |
+
"11": "fox",
|
| 15 |
+
"12": "green",
|
| 16 |
+
"13": "horse",
|
| 17 |
+
"14": "nine",
|
| 18 |
+
"15": "one",
|
| 19 |
+
"16": "red",
|
| 20 |
+
"17": "seven",
|
| 21 |
+
"18": "six",
|
| 22 |
+
"19": "ten",
|
| 23 |
+
"2": "black",
|
| 24 |
+
"20": "three",
|
| 25 |
+
"21": "two",
|
| 26 |
+
"22": "white",
|
| 27 |
+
"3": "blue",
|
| 28 |
+
"4": "brown",
|
| 29 |
+
"5": "cat",
|
| 30 |
+
"6": "dog",
|
| 31 |
+
"7": "eight",
|
| 32 |
+
"8": "fish",
|
| 33 |
+
"9": "five"
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 34 |
},
|
| 35 |
"initializer_range": 0.02,
|
| 36 |
"intermediate_size": 3072,
|
| 37 |
"label2id": {
|
| 38 |
"_silence_": "0",
|
| 39 |
"_unknown_": "1",
|
| 40 |
+
"black": "2",
|
| 41 |
+
"blue": "3",
|
| 42 |
+
"brown": "4",
|
| 43 |
+
"cat": "5",
|
| 44 |
+
"dog": "6",
|
| 45 |
+
"eight": "7",
|
| 46 |
+
"fish": "8",
|
| 47 |
+
"five": "9",
|
| 48 |
+
"four": "10",
|
| 49 |
+
"fox": "11",
|
| 50 |
+
"green": "12",
|
| 51 |
+
"horse": "13",
|
| 52 |
+
"nine": "14",
|
| 53 |
+
"one": "15",
|
| 54 |
+
"red": "16",
|
| 55 |
+
"seven": "17",
|
| 56 |
+
"six": "18",
|
| 57 |
+
"ten": "19",
|
| 58 |
+
"three": "20",
|
| 59 |
+
"two": "21",
|
| 60 |
+
"white": "22"
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 61 |
},
|
| 62 |
"layer_norm_eps": 1e-12,
|
| 63 |
+
"max_length": 1024,
|
| 64 |
"model_type": "audio-spectrogram-transformer",
|
| 65 |
"num_attention_heads": 12,
|
| 66 |
"num_hidden_layers": 12,
|
|
|
|
| 68 |
"patch_size": 16,
|
| 69 |
"problem_type": "single_label_classification",
|
| 70 |
"qkv_bias": true,
|
| 71 |
+
"time_stride": 12,
|
| 72 |
"torch_dtype": "float32",
|
| 73 |
"transformers_version": "4.51.3"
|
| 74 |
}
|
model.safetensors
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
-
size
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:2aa6cfa17d8f6b8ec8b65063f7776dec8e12965f7f449dcf90e8686d10b811e7
|
| 3 |
+
size 343742580
|
preprocessor_config.json
CHANGED
|
@@ -2,12 +2,12 @@
|
|
| 2 |
"do_normalize": true,
|
| 3 |
"feature_extractor_type": "ASTFeatureExtractor",
|
| 4 |
"feature_size": 1,
|
| 5 |
-
"max_length":
|
| 6 |
-
"mean": -
|
| 7 |
"num_mel_bins": 128,
|
| 8 |
"padding_side": "right",
|
| 9 |
"padding_value": 0.0,
|
| 10 |
"return_attention_mask": false,
|
| 11 |
"sampling_rate": 16000,
|
| 12 |
-
"std":
|
| 13 |
}
|
|
|
|
| 2 |
"do_normalize": true,
|
| 3 |
"feature_extractor_type": "ASTFeatureExtractor",
|
| 4 |
"feature_size": 1,
|
| 5 |
+
"max_length": 1024,
|
| 6 |
+
"mean": -4.2677393,
|
| 7 |
"num_mel_bins": 128,
|
| 8 |
"padding_side": "right",
|
| 9 |
"padding_value": 0.0,
|
| 10 |
"return_attention_mask": false,
|
| 11 |
"sampling_rate": 16000,
|
| 12 |
+
"std": 4.5689974
|
| 13 |
}
|
runs/Jun24_13-45-10_ip-10-192-12-219/events.out.tfevents.1750772727.ip-10-192-12-219.20599.0
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:99e5f5de41bfe81645fdac5f77661af105cef8a557066f066983adb5f8d6c5c4
|
| 3 |
+
size 56970
|
runs/Jun24_15-23-31_ip-10-192-12-219/events.out.tfevents.1750778629.ip-10-192-12-219.113148.0
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:14fcd3673ea91968409a2f6adb8b6a5ad55d068573a2872f4826beadcf6349fd
|
| 3 |
+
size 6832
|
runs/Jun24_15-26-40_ip-10-192-12-219/events.out.tfevents.1750778817.ip-10-192-12-219.113148.1
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:4a341c342b2a0e72057f9c4fa9ee3f177beb02e954afa25175295e8a20dad7d9
|
| 3 |
+
size 153606
|
training_args.bin
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
-
size
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:4a3be538dafb46e36e32c403a2562dace028434f1b4b4a7c52490f2b3164bc2e
|
| 3 |
+
size 5777
|