Skip to content

Commit a58ed0a

Browse files
committed
Updated notebook to 20*12 values.
1 parent f268a7c commit a58ed0a

File tree

4 files changed

+32
-31
lines changed

4 files changed

+32
-31
lines changed
38 Bytes
Binary file not shown.
38 Bytes
Binary file not shown.

code/test.ipynb

Lines changed: 32 additions & 31 deletions
Original file line numberDiff line numberDiff line change
@@ -2,7 +2,7 @@
22
"cells": [
33
{
44
"cell_type": "code",
5-
"execution_count": 1,
5+
"execution_count": 2,
66
"metadata": {},
77
"outputs": [],
88
"source": [
@@ -16,7 +16,7 @@
1616
},
1717
{
1818
"cell_type": "code",
19-
"execution_count": 52,
19+
"execution_count": 20,
2020
"metadata": {},
2121
"outputs": [],
2222
"source": [
@@ -26,19 +26,20 @@
2626
" return a[p], b[p]\n",
2727
" \n",
2828
"def get_data_set(count, speakers):\n",
29-
" third = int(count/speakers)\n",
29+
" nn_input_chunks_per_speaker = int(count/speakers)\n",
3030
" X = np.zeros((count, 12*20))\n",
3131
" y = np.zeros(count, dtype='uint8')\n",
3232
" \n",
33-
" coefficients_per_speaker = third * 20\n",
33+
" frames_per_speaker = nn_input_chunks_per_speaker * 20\n",
3434
" \n",
3535
" all_speakers = []\n",
36+
" \n",
3637
" for i in range(0, speakers):\n",
3738
" all_speakers.append([])\n",
3839
" index = 0\n",
39-
" while (len(all_speakers[i]) < coefficients_per_speaker):\n",
40+
" while (len(all_speakers[i]) < frames_per_speaker):\n",
4041
" print(index, end=\"\\r\")\n",
41-
" y_, sr = Utils.load_file(f\"C:\\\\Users\\\\SCU8BH\\\\Documents\\\\T3000\\\\Studienarbeit\\\\Data\\\\50_speakers_audio_data\\\\Speaker{i+30:04}\\\\Speaker{i+30:02}_{index:03}.wav\")\n",
42+
" y_, sr = Utils.load_file(f\"/home/henry/Downloads/archive/50_speakers_audio_data/Speaker_{10+i:04}/Speaker_{10+i:04}_{index:05}.wav\")\n",
4243
" \n",
4344
" y_ = AudioPreprocessor.remove_noise(y=y_, sr=sr)\n",
4445
" y_ = AudioPreprocessor.remove_silence(y=y_)\n",
@@ -54,8 +55,8 @@
5455
" print()\n",
5556
" \n",
5657
" for i in range(0, speakers):\n",
57-
" for j in range(0, third):\n",
58-
" X[i*third + j] = np.concatenate((all_speakers[i][20*j][1:13], \n",
58+
" for j in range(0, nn_input_chunks_per_speaker):\n",
59+
" X[i*nn_input_chunks_per_speaker + j] = np.concatenate((all_speakers[i][20*j][1:13], \n",
5960
" all_speakers[i][20*j+1][1:13], \n",
6061
" all_speakers[i][20*j+2][1:13],\n",
6162
" all_speakers[i][20*j+3][1:13],\n",
@@ -76,25 +77,25 @@
7677
" all_speakers[i][20*j+18][1:13],\n",
7778
" all_speakers[i][20*j+19][1:13]\n",
7879
" ))\n",
79-
" y[i*third + j] = i\n",
80+
" y[i*nn_input_chunks_per_speaker + j] = i\n",
8081
" \n",
8182
" return X, y"
8283
]
8384
},
8485
{
8586
"cell_type": "code",
86-
"execution_count": 53,
87+
"execution_count": 21,
8788
"metadata": {},
8889
"outputs": [
8990
{
9091
"name": "stdout",
9192
"output_type": "stream",
9293
"text": [
9394
"8\n",
94-
"11\n",
95+
"9\n",
9596
"9\n",
9697
"10\n",
97-
"10\n"
98+
"9\n"
9899
]
99100
}
100101
],
@@ -106,28 +107,28 @@
106107
},
107108
{
108109
"cell_type": "code",
109-
"execution_count": 63,
110+
"execution_count": 28,
110111
"metadata": {},
111112
"outputs": [
112113
{
113114
"name": "stdout",
114115
"output_type": "stream",
115116
"text": [
116117
"[0 0 0 ... 4 4 4]\n",
117-
"[4 2 3 ... 2 2 4]\n",
118-
"29/29 [==============================] - 0s 1ms/step - loss: 2.1533e-05 - accuracy: 1.0000\n",
119-
"Test accuracy: 1.0\n",
120-
"Test loss: 2.1533451217692345e-05\n",
121-
"4/4 [==============================] - 0s 1ms/step\n",
122-
"[4 2 2 2 2 2 2 2 2 2 2 2 1 4 2 2 1 1 1 1 2 2 4 2 1 2 2 2 2 2 2 4 2 2 2 2 2\n",
123-
" 2 2 2 2 2 2 2 2 2 2 2 0 2 2 2 2 4 1 2 2 2 2 2 1 2 3 1 1 2 2 2 4 2 4 2 2 2\n",
124-
" 2 2 2 2 4 1 0 2 4 2 4 2 4 2 1 2 4 2 3 3 2 2 2 2 2 2 2 4 3 4 1 0 2 1 2 2 4\n",
125-
" 2 2 4 2 2 0 0 0]\n",
126-
"6\n",
127-
"14\n",
128-
"79\n",
129-
"4\n",
130-
"16\n"
118+
"[2 3 2 ... 0 4 2]\n",
119+
"29/29 [==============================] - 0s 1ms/step - loss: 0.8353 - accuracy: 0.6485\n",
120+
"Test accuracy: 0.6484715938568115\n",
121+
"Test loss: 0.8353310227394104\n",
122+
"4/4 [==============================] - 0s 2ms/step\n",
123+
"[2 4 2 4 4 4 4 4 2 4 0 2 2 2 1 2 2 4 2 3 4 4 3 4 2 2 3 3 2 2 2 4 4 2 3 4 4\n",
124+
" 0 4 0 2 4 2 4 4 4 4 4 2 3 0 2 2 4 2 2 4 2 0 2 4 2 2 4 4 2 0 4 2 2 4 4 2 2\n",
125+
" 3 0 2 4 3 2 2 2 4 2 2 0 4 0 3 4 3 2 2 0 4 2 0 2 2 4 3 2 2 4 2 0 2 2 2 4 4\n",
126+
" 2 2 2 2 2 2 4]\n",
127+
"12\n",
128+
"1\n",
129+
"54\n",
130+
"11\n",
131+
"40\n"
131132
]
132133
}
133134
],
@@ -154,7 +155,7 @@
154155
" print(f\"Test loss: {test_loss}\")\n",
155156
" \n",
156157
" \n",
157-
" y_, sr = Utils.load_file(f\"C:\\\\Users\\\\SCU8BH\\\\Documents\\\\T3000\\\\Studienarbeit\\\\Data\\\\50_speakers_audio_data\\\\Speaker0032\\\\Speaker32_012.wav\")\n",
158+
" y_, sr = Utils.load_file(f\"/home/henry/Downloads/archive/50_speakers_audio_data/Speaker_0014/Speaker_0014_00020.wav\")\n",
158159
" \n",
159160
" y_ = AudioPreprocessor.remove_noise(y=y_, sr=sr)\n",
160161
" y_ = AudioPreprocessor.remove_silence(y=y_)\n",
@@ -207,7 +208,7 @@
207208
],
208209
"metadata": {
209210
"kernelspec": {
210-
"display_name": "Python 3.10.4 64-bit",
211+
"display_name": "Python 3",
211212
"language": "python",
212213
"name": "python3"
213214
},
@@ -221,12 +222,12 @@
221222
"name": "python",
222223
"nbconvert_exporter": "python",
223224
"pygments_lexer": "ipython3",
224-
"version": "3.10.4"
225+
"version": "3.10.6 (main, Nov 14 2022, 16:10:14) [GCC 11.3.0]"
225226
},
226227
"orig_nbformat": 4,
227228
"vscode": {
228229
"interpreter": {
229-
"hash": "2fc4d7ba6602d69fe52dcf13f0361bb9556610661c910f56182baab83bdef03f"
230+
"hash": "916dbcbb3f70747c44a77c7bcd40155683ae19c65e1c03b4aa3499c5328201f1"
230231
}
231232
}
232233
},
38 Bytes
Binary file not shown.

0 commit comments

Comments
 (0)