mahmoudmamdouh13 committed on
Commit
2101fe5
·
verified ·
1 Parent(s): 5bf0c4d

Training in progress, epoch 1

Browse files
config.json CHANGED
@@ -3,178 +3,64 @@
3
  "ASTForAudioClassification"
4
  ],
5
  "attention_probs_dropout_prob": 0.0,
6
- "frequency_stride": 10,
7
  "hidden_act": "gelu",
8
  "hidden_dropout_prob": 0.0,
9
  "hidden_size": 768,
10
  "id2label": {
11
  "0": "_silence_",
12
  "1": "_unknown_",
13
- "10": "car",
14
- "11": "cat",
15
- "12": "doctor",
16
- "13": "dog",
17
- "14": "door",
18
- "15": "ear",
19
- "16": "egg",
20
- "17": "elephant",
21
- "18": "fan",
22
- "19": "fish",
23
- "2": "air",
24
- "20": "fox",
25
- "21": "frog",
26
- "22": "game",
27
- "23": "gate",
28
- "24": "gold",
29
- "25": "hand",
30
- "26": "hat",
31
- "27": "home",
32
- "28": "ice",
33
- "29": "ill",
34
- "3": "apple",
35
- "30": "iron",
36
- "31": "jelly",
37
- "32": "juice",
38
- "33": "jump",
39
- "34": "key",
40
- "35": "kid",
41
- "36": "kite",
42
- "37": "lamp",
43
- "38": "leaf",
44
- "39": "lion",
45
- "4": "arm",
46
- "40": "milk",
47
- "41": "monkey",
48
- "42": "moon",
49
- "43": "nest",
50
- "44": "net",
51
- "45": "nose",
52
- "46": "ocean",
53
- "47": "open",
54
- "48": "orange",
55
- "49": "pen",
56
- "5": "ball",
57
- "50": "pig",
58
- "51": "pizza",
59
- "52": "queen",
60
- "53": "question",
61
- "54": "quiet",
62
- "55": "red",
63
- "56": "room",
64
- "57": "run",
65
- "58": "six",
66
- "59": "snake",
67
- "6": "bear",
68
- "60": "star",
69
- "61": "sun",
70
- "62": "tiger",
71
- "63": "toy",
72
- "64": "tree",
73
- "65": "umbrella",
74
- "66": "under",
75
- "67": "unlike",
76
- "68": "van",
77
- "69": "vest",
78
- "7": "bed",
79
- "70": "violin",
80
- "71": "water",
81
- "72": "white",
82
- "73": "window",
83
- "74": "year",
84
- "75": "yellow",
85
- "76": "youth",
86
- "77": "zero",
87
- "78": "zone",
88
- "79": "zoo",
89
- "8": "box",
90
- "9": "cake"
91
  },
92
  "initializer_range": 0.02,
93
  "intermediate_size": 3072,
94
  "label2id": {
95
  "_silence_": "0",
96
  "_unknown_": "1",
97
- "air": "2",
98
- "apple": "3",
99
- "arm": "4",
100
- "ball": "5",
101
- "bear": "6",
102
- "bed": "7",
103
- "box": "8",
104
- "cake": "9",
105
- "car": "10",
106
- "cat": "11",
107
- "doctor": "12",
108
- "dog": "13",
109
- "door": "14",
110
- "ear": "15",
111
- "egg": "16",
112
- "elephant": "17",
113
- "fan": "18",
114
- "fish": "19",
115
- "fox": "20",
116
- "frog": "21",
117
- "game": "22",
118
- "gate": "23",
119
- "gold": "24",
120
- "hand": "25",
121
- "hat": "26",
122
- "home": "27",
123
- "ice": "28",
124
- "ill": "29",
125
- "iron": "30",
126
- "jelly": "31",
127
- "juice": "32",
128
- "jump": "33",
129
- "key": "34",
130
- "kid": "35",
131
- "kite": "36",
132
- "lamp": "37",
133
- "leaf": "38",
134
- "lion": "39",
135
- "milk": "40",
136
- "monkey": "41",
137
- "moon": "42",
138
- "nest": "43",
139
- "net": "44",
140
- "nose": "45",
141
- "ocean": "46",
142
- "open": "47",
143
- "orange": "48",
144
- "pen": "49",
145
- "pig": "50",
146
- "pizza": "51",
147
- "queen": "52",
148
- "question": "53",
149
- "quiet": "54",
150
- "red": "55",
151
- "room": "56",
152
- "run": "57",
153
- "six": "58",
154
- "snake": "59",
155
- "star": "60",
156
- "sun": "61",
157
- "tiger": "62",
158
- "toy": "63",
159
- "tree": "64",
160
- "umbrella": "65",
161
- "under": "66",
162
- "unlike": "67",
163
- "van": "68",
164
- "vest": "69",
165
- "violin": "70",
166
- "water": "71",
167
- "white": "72",
168
- "window": "73",
169
- "year": "74",
170
- "yellow": "75",
171
- "youth": "76",
172
- "zero": "77",
173
- "zone": "78",
174
- "zoo": "79"
175
  },
176
  "layer_norm_eps": 1e-12,
177
- "max_length": 128,
178
  "model_type": "audio-spectrogram-transformer",
179
  "num_attention_heads": 12,
180
  "num_hidden_layers": 12,
@@ -182,7 +68,7 @@
182
  "patch_size": 16,
183
  "problem_type": "single_label_classification",
184
  "qkv_bias": true,
185
- "time_stride": 10,
186
  "torch_dtype": "float32",
187
  "transformers_version": "4.51.3"
188
  }
 
3
  "ASTForAudioClassification"
4
  ],
5
  "attention_probs_dropout_prob": 0.0,
6
+ "frequency_stride": 12,
7
  "hidden_act": "gelu",
8
  "hidden_dropout_prob": 0.0,
9
  "hidden_size": 768,
10
  "id2label": {
11
  "0": "_silence_",
12
  "1": "_unknown_",
13
+ "10": "four",
14
+ "11": "fox",
15
+ "12": "green",
16
+ "13": "horse",
17
+ "14": "nine",
18
+ "15": "one",
19
+ "16": "red",
20
+ "17": "seven",
21
+ "18": "six",
22
+ "19": "ten",
23
+ "2": "black",
24
+ "20": "three",
25
+ "21": "two",
26
+ "22": "white",
27
+ "3": "blue",
28
+ "4": "brown",
29
+ "5": "cat",
30
+ "6": "dog",
31
+ "7": "eight",
32
+ "8": "fish",
33
+ "9": "five"
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
34
  },
35
  "initializer_range": 0.02,
36
  "intermediate_size": 3072,
37
  "label2id": {
38
  "_silence_": "0",
39
  "_unknown_": "1",
40
+ "black": "2",
41
+ "blue": "3",
42
+ "brown": "4",
43
+ "cat": "5",
44
+ "dog": "6",
45
+ "eight": "7",
46
+ "fish": "8",
47
+ "five": "9",
48
+ "four": "10",
49
+ "fox": "11",
50
+ "green": "12",
51
+ "horse": "13",
52
+ "nine": "14",
53
+ "one": "15",
54
+ "red": "16",
55
+ "seven": "17",
56
+ "six": "18",
57
+ "ten": "19",
58
+ "three": "20",
59
+ "two": "21",
60
+ "white": "22"
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
61
  },
62
  "layer_norm_eps": 1e-12,
63
+ "max_length": 1024,
64
  "model_type": "audio-spectrogram-transformer",
65
  "num_attention_heads": 12,
66
  "num_hidden_layers": 12,
 
68
  "patch_size": 16,
69
  "problem_type": "single_label_classification",
70
  "qkv_bias": true,
71
+ "time_stride": 12,
72
  "torch_dtype": "float32",
73
  "transformers_version": "4.51.3"
74
  }
model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:aad6886ca688689e5142e159174f38c01f967712cd687699f304025ac568307f
3
- size 341749072
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:2aa6cfa17d8f6b8ec8b65063f7776dec8e12965f7f449dcf90e8686d10b811e7
3
+ size 343742580
preprocessor_config.json CHANGED
@@ -2,12 +2,12 @@
2
  "do_normalize": true,
3
  "feature_extractor_type": "ASTFeatureExtractor",
4
  "feature_size": 1,
5
- "max_length": 128,
6
- "mean": -6.845978,
7
  "num_mel_bins": 128,
8
  "padding_side": "right",
9
  "padding_value": 0.0,
10
  "return_attention_mask": false,
11
  "sampling_rate": 16000,
12
- "std": 5.5654526
13
  }
 
2
  "do_normalize": true,
3
  "feature_extractor_type": "ASTFeatureExtractor",
4
  "feature_size": 1,
5
+ "max_length": 1024,
6
+ "mean": -4.2677393,
7
  "num_mel_bins": 128,
8
  "padding_side": "right",
9
  "padding_value": 0.0,
10
  "return_attention_mask": false,
11
  "sampling_rate": 16000,
12
+ "std": 4.5689974
13
  }
runs/Jun24_13-45-10_ip-10-192-12-219/events.out.tfevents.1750772727.ip-10-192-12-219.20599.0 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:99e5f5de41bfe81645fdac5f77661af105cef8a557066f066983adb5f8d6c5c4
3
+ size 56970
runs/Jun24_15-23-31_ip-10-192-12-219/events.out.tfevents.1750778629.ip-10-192-12-219.113148.0 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:14fcd3673ea91968409a2f6adb8b6a5ad55d068573a2872f4826beadcf6349fd
3
+ size 6832
runs/Jun24_15-26-40_ip-10-192-12-219/events.out.tfevents.1750778817.ip-10-192-12-219.113148.1 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:4a341c342b2a0e72057f9c4fa9ee3f177beb02e954afa25175295e8a20dad7d9
3
+ size 153606
training_args.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:a069d67b065ce361b1b3f330f79ee54299b538bba0cd4d23fbbdde581a5e7d95
3
- size 5841
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:4a3be538dafb46e36e32c403a2562dace028434f1b4b4a7c52490f2b3164bc2e
3
+ size 5777