
Commit 4af20b7
update stuff for last two tutorials
1 parent 13fc156

4 files changed: +110 −75 lines

exercise12_HyperParameterTuning.ipynb

Lines changed: 22 additions & 24 deletions
@@ -27,17 +27,17 @@
 "id": "46f6f98a-12a4-4bcd-975e-18a7d404cb9c",
 "metadata": {},
 "source": [
-"# Exercise 12\n",
+"# Multiclass Classification with Hyper Parameter Tuning\n",
 "\n",
-"## Multiclass Classification with Hyper Parameter Tuning\n",
-"\n",
-"- Softmax Activation Function at Output\n",
-"- CategoricalCrossentropy Loss\n",
-"- Split Data into Training, Validating, Testing Set\n",
-"- Avoid Over-/Underfit by\n",
-" - deploying Early Stopping\n",
-" - deploying Hyper Parameter Tuning using Keras Tuner\n",
-"- we use convenient stuff from Scikit-learn"
+"- **Softmax** activation function at output\n",
+"- Categorical crossentropy loss\n",
+"- Split data into training, validating, testing data sets\n",
+" - training, validating used for hyper parameter tuning (validation serves as the unseen test data here)\n",
+" - training, testing used to train/test the best model (the test data was never used before and is used here only once to finally check model performance)\n",
+"- Avoid over-/underfit by\n",
+" - deploying early stopping\n",
+" - deploying hyper parameter tuning using Keras Tuner\n",
+"- we use convenient stuff from scikit-learn"
 ]
 },
 {
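
Note on the bullet "deploying early stopping" above: the callback setup itself is not part of this diff. A minimal, hypothetical sketch of how such a callback is typically wired into model.fit (the patience value and the fit arguments are assumptions, not the notebook's code):

    import tensorflow.keras as keras

    # stop when the validation loss has not improved for `patience` epochs
    # and roll back to the best weights seen during training
    early_stop = keras.callbacks.EarlyStopping(monitor='val_loss',
                                               patience=5,  # assumed value
                                               restore_best_weights=True)
    # model.fit(X_train, Y_train, validation_data=(X_val, Y_val),
    #           epochs=100, callbacks=[early_stop])
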
@@ -67,8 +67,8 @@
 "import tensorflow.keras.backend as K\n",
 "import time\n",
 "\n",
-"print('TF version', tf.__version__, # we used 2.4.3\n",
-" '\\nKeras version', keras.__version__, # we used 2.4.0\n",
+"print('TF version', tf.__version__, # we used 2.10.0\n",
+" '\\nKeras version', keras.__version__, # we used 2.10.0\n",
 " '\\nKeras Tuner version', kt.__version__) # we used 1.1.0\n",
 "verbose = 1 # plot training status"
 ]
@@ -78,7 +78,7 @@
 "id": "5249aa49-d2da-4aec-be0a-769001eb010d",
 "metadata": {},
 "source": [
-"## Folder Structure"
+"## Folder Structure For Log Data"
 ]
 },
 {
@@ -134,12 +134,12 @@
 "source": [
 "nlabels = 3 # number of classes\n",
 "labels = np.arange(nlabels) # we encode as integers\n",
-"nx = 2*nlabels # number of features\n",
+"nx = 2*nlabels # number of features, here we use 6\n",
 "m = 100000 # data examples\n",
 "\n",
-"train_size = 7/10 # 7/10 of whole data set\n",
-"validate_size = 3/10 * 2/3 # 1/5 of whole data set\n",
-"test_size = 1 - train_size - validate_size # must be > 0\n",
+"train_size = 7/10 # 7/10 of the whole data set\n",
+"validate_size = 3/10 * 2/3 # 1/5 of the whole data set\n",
+"test_size = 1 - train_size - validate_size # remaining data, must be > 0\n",
 "\n",
 "X, Y = make_classification(n_samples=m,\n",
 " n_features=nx, n_informative=nx,\n",
@@ -159,9 +159,7 @@
 "X_val, X_test, Y_val, Y_test = train_test_split(\n",
 " X_tmp, Y_tmp, train_size=val_size, random_state=None)\n",
 "\n",
-"m_train = X_train.shape[0]\n",
-"m_val = X_val.shape[0]\n",
-"m_test = X_test.shape[0]\n",
+"m_train, m_val, m_test = X_train.shape[0], X_val.shape[0], X_test.shape[0]\n",
 "\n",
 "print(train_size, validate_size, test_size)\n",
 "print(m_train, m_val, m_test, m_train+m_val+m_test == m)\n",
@@ -197,7 +195,7 @@
 "metadata": {},
 "outputs": [],
 "source": [
-"# in future we might also consider dropout / regularization in the model\n",
+"# as homework we might also consider dropout and regularization in the model\n",
 "def build_model(hp): # with hyper parameter ranges\n",
 " model = keras.Sequential()\n",
 " # input layer\n",
@@ -238,7 +236,7 @@
 "model = build_model(kt.HyperParameters())\n",
 "hptuner = kt.RandomSearch(\n",
 " hypermodel=build_model,\n",
-" objective='val_categorical_accuracy', # on val data!\n",
+" objective='val_categorical_accuracy', # check performance on val data!\n",
 " max_trials=max_trials,\n",
 " executions_per_trial=executions_per_trial,\n",
 " overwrite=True,\n",
@@ -288,7 +286,7 @@
 "outputs": [],
 "source": [
 "# we might check the best XX models in detail\n",
-"# for didactical purpose we choose only the very best one\n",
+"# for didactic purposes we choose only the very best one, located at index [0]:\n",
 "model = hptuner.get_best_models(num_models=1)[0]\n",
 "model.save(tf_logdir+'/best_model')"
 ]
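
Note: get_best_models returns a list sorted by the tuner objective, best first, hence index [0]. A hedged sketch of the surrounding Keras Tuner calls, assuming the hptuner object from the cell above (the commented search arguments are assumptions):

    # hptuner.search(X_train, Y_train, validation_data=(X_val, Y_val),
    #                epochs=epochs, batch_size=batch_size)
    best_hp = hptuner.get_best_hyperparameters(num_trials=1)[0]
    print(best_hp.values)  # dict of the winning hyper parameter values
    model = hptuner.get_best_models(num_models=1)[0]
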
@@ -326,7 +324,7 @@
 "source": [
 "# load best model and reset weights\n",
 "model = keras.models.load_model(tf_logdir+'/best_model')\n",
-"reset_weights(model)\n",
+"reset_weights(model) # start training from scratch\n",
 "print(model.summary())"
 ]
 },
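
Note: reset_weights is defined elsewhere in the notebook and is not shown in this diff. A minimal sketch of one common way to re-initialize a Keras model so the tuned architecture can be retrained from scratch (this is an assumption about the helper, not its actual code):

    def reset_weights(model):
        # re-draw every Dense layer's weights from its own initializers
        for layer in model.layers:
            if hasattr(layer, 'kernel_initializer'):
                layer.kernel.assign(layer.kernel_initializer(layer.kernel.shape))
            if hasattr(layer, 'bias_initializer') and layer.bias is not None:
                layer.bias.assign(layer.bias_initializer(layer.bias.shape))
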

exercise12_MulticlassClassification_CategoricalCrossentropy.ipynb

Lines changed: 26 additions & 25 deletions
@@ -27,14 +27,12 @@
 "id": "46f6f98a-12a4-4bcd-975e-18a7d404cb9c",
 "metadata": {},
 "source": [
-"# Exercise 12\n",
-"\n",
-"## Multiclass Classification\n",
-"- One Hot Encoding\n",
+"# Multiclass Classification\n",
+"- One Hot encoding\n",
 "- Data set splitting into train, test\n",
-"- Softmax Activation Function at Output\n",
-"- CategoricalCrossentropy loss\n",
-"- we use convenient stuff from Scikit-learn\n"
+"- **Softmax** activation function at output layer\n",
+"- categorical cross-entropy loss\n",
+"- we use convenient stuff from scikit-learn"
 ]
 },
 {
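
Note on the "One Hot encoding" bullet: one hot encoding maps each integer class label to a unit vector, which is the target format CategoricalCrossentropy expects. A small self-contained example (the toy labels are an assumption, not notebook data):

    import numpy as np
    from sklearn.preprocessing import OneHotEncoder

    y = np.array([0, 2, 1, 2])             # integer labels for 3 classes
    encoder = OneHotEncoder(sparse=False)  # newer scikit-learn uses sparse_output=False
    Y = encoder.fit_transform(y.reshape(-1, 1))
    print(Y)
    # [[1. 0. 0.]
    #  [0. 0. 1.]
    #  [0. 1. 0.]
    #  [0. 0. 1.]]
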
@@ -61,8 +59,10 @@
 "import tensorflow.keras as keras\n",
 "# import tensorflow.keras.backend as K\n",
 "\n",
-"print('TF version', tf.__version__, # we used 2.4.3\n",
-" '\\nKeras version', keras.__version__) # we used 2.4.0\n",
+"print('TF version', tf.__version__, # we used 2.10.0\n",
+" '\\nKeras version', keras.__version__) # we used 2.10.0\n",
+"\n",
+"tf.keras.backend.set_floatx('float64') # we could use double precision\n",
 "\n",
 "verbose = 1 # plot training status"
 ]
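
Note on the added set_floatx line: it switches the global default dtype, so all subsequently created layers build float64 weights. A quick check, as a sketch independent of the notebook:

    import tensorflow as tf

    tf.keras.backend.set_floatx('float64')
    layer = tf.keras.layers.Dense(4)
    layer.build(input_shape=(None, 3))  # force weight creation
    print(layer.kernel.dtype)           # float64
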
@@ -72,7 +72,7 @@
 "id": "8902728d-14a9-4f64-8f49-364953c88f08",
 "metadata": {},
 "source": [
-"## Data Synthesis / One Hot Encoding / Splitting"
+"## Data Synthesis, One Hot Encoding, Train/Test Splitting"
 ]
 },
 {
@@ -86,9 +86,9 @@
 "labels = np.arange(nlabels) # we encode as integers\n",
 "\n",
 "m = int(5/4*80000) # data examples\n",
-"nx = 2*nlabels # number of features\n",
+"nx = 2*nlabels # number of features, we set it to 6 here\n",
 "\n",
-"train_size = 4/5 # 80% are used for training\n",
+"train_size = 4/5 # 80% of data are used for training\n",
 "\n",
 "X, Y = make_classification(n_samples=m,\n",
 " n_features=nx, n_informative=nx,\n",
@@ -100,9 +100,8 @@
 "encoder = OneHotEncoder(sparse=False)\n",
 "Y = encoder.fit_transform(Y.reshape(-1, 1))\n",
 "\n",
-"X_train, X_test,\\\n",
-" Y_train, Y_test = train_test_split(\n",
-" X, Y, train_size=train_size, random_state=None)\n",
+"X_train, X_test, Y_train, Y_test = train_test_split(\n",
+" X, Y, train_size=train_size, random_state=None)\n",
 "m_train = X_train.shape[0]\n",
 "m_test = X_test.shape[0]\n",
 "print('m_train', m_train)\n",
@@ -116,7 +115,7 @@
 "id": "c0445a58-1b59-4e48-84df-2ebe2d233649",
 "metadata": {},
 "source": [
-"## Setup of Model "
+"## Setup of Model Using Fully Connected Layers"
 ]
 },
 {
@@ -126,27 +125,29 @@
 "metadata": {},
 "outputs": [],
 "source": [
-"# hyper parameters should be learned as well,\n",
-"# for this toy example we set them for reasonable\n",
-"# computing time and results\n",
+"# hyper parameters should be learned as well, however for this toy example\n",
+"# we set them for reasonable computing time and appropriate results\n",
 "epochs = 10\n",
-"batch_size = 32\n",
 "no_perceptron_in_hl = np.array([2*nx, 4*nx, nlabels])\n",
+"batch_size = 32\n",
 "\n",
+"# model architecture\n",
 "optimizer = keras.optimizers.Adam()\n",
-"loss = keras.losses.CategoricalCrossentropy(\n",
-" from_logits=False, label_smoothing=0)\n",
+"loss = keras.losses.CategoricalCrossentropy(from_logits=False,\n",
+" label_smoothing=0)\n",
 "metrics = [keras.metrics.CategoricalCrossentropy(),\n",
 " keras.metrics.CategoricalAccuracy()]\n",
 "\n",
 "model = keras.Sequential()\n",
-"# input layer\n",
+"# apply input layer\n",
 "model.add(keras.Input(shape=(nx,)))\n",
-"# hidden layers\n",
+"# apply hidden layers\n",
 "for n in no_perceptron_in_hl:\n",
 " model.add(keras.layers.Dense(n, activation='relu'))\n",
-"# output layer with softmax for multi-label classificaton\n",
+"# apply output layer with softmax for multiclass classification\n",
 "model.add(keras.layers.Dense(nlabels, activation='softmax'))\n",
+"# let TF compile the model architecture; one key step in compiling\n",
+"# is to set up the forward and backward propagation workflow through the model\n",
 "model.compile(optimizer=optimizer, loss=loss, metrics=metrics)\n",
 "print(model.summary())\n",
 "# tw = np.sum([K.count_params(w) for w in model.trainable_weights])\n",

exercise12_MusicGenreClassification.ipynb

Lines changed: 17 additions & 12 deletions
@@ -27,7 +27,7 @@
 "id": "a46602eb-0171-412d-990c-a0a63f4d47f9",
 "metadata": {},
 "source": [
-"# Exercise 12: Music Genre Classification\n",
+"# Music Genre Classification with Fully Connected Layers\n",
 "\n",
 "In this toy example we have a special look at\n",
 "- feature design (loudness, crest, peak, rms, spectral weight)\n",
@@ -89,8 +89,8 @@
 "import time\n",
 "\n",
 "\n",
-"print('TF version', tf.__version__, # we used 2.4.3\n",
-" '\\nKeras version', keras.__version__, # we used 2.4.0\n",
+"print('TF version', tf.__version__, # we used 2.10.0\n",
+" '\\nKeras version', keras.__version__, # we used 2.10.0\n",
 " '\\nKeras Tuner version', kt.__version__) # we used 1.1.0\n",
 "verbose = 1 # plot training status"
 ]
@@ -100,7 +100,7 @@
 "id": "41669170-f69b-43e4-acc8-8ab001d90404",
 "metadata": {},
 "source": [
-"## Folder Structure"
+"## Folder Structure for Log Data"
 ]
 },
 {
@@ -111,7 +111,7 @@
 "outputs": [],
 "source": [
 "audiofolder = './audio_ex12/'\n",
-"ex_str = 'ex12_'\n",
+"ex_str = 'mgc_'\n",
 "time_str = '%Y_%m_%d_%H_%M_'\n",
 "\n",
 "\n",
@@ -271,8 +271,13 @@
 "metadata": {},
 "outputs": [],
 "source": [
-"# with np.load(audiofolder+'/_raw_data.npz') as data: # use this line when features were extracted above\n",
+"# we use this option when features were extracted in cell [5] above\n",
+"# with np.load(audiofolder+'/_raw_data.npz') as data:\n",
+"\n",
+"# we use this when we want to use the 'large' toy example data set\n",
 "# with np.load(audiofolder+'/_raw_data_large.npz') as data:\n",
+"\n",
+"# we use this when we want to use the 'small' toy example data set\n",
 "with np.load(audiofolder+'/_raw_data_small.npz') as data:\n",
 "\n",
 " Xdata = data['Xdata']\n",
@@ -387,7 +392,7 @@
 "# 9 crest_lin\n",
 "# 10 crest_db\n",
 "# 11 low_high_ratio\n",
-"# 2, 3, 5, 7, 8, 10, 11 might be useful:\n",
+"# the seven features [2, 3, 5, 7, 8, 10, 11] might be useful:\n",
 "which_features = [2, 3, 5, 7, 8, 10, 11]\n",
 "X = np.copy(Xdata_norm[:, which_features])\n",
 "Y = np.copy(Ydata)\n",
@@ -458,7 +463,7 @@
 "source": [
 "train_size = 5/10\n",
 "validate_size = 5/10 * 1/2\n",
-"test_size = 1 - train_size - validate_size # must be > 0\n",
+"test_size = 1 - train_size - validate_size # remaining data, must be > 0\n",
 "\n",
 "# split into train, val, test data:\n",
 "X_train, X_tmp, Y_train, Y_tmp = train_test_split(\n",
@@ -517,7 +522,7 @@
 "metadata": {},
 "outputs": [],
 "source": [
-"# in future we might also consider dropout / regularization in the model\n",
+"# as homework we might also consider dropout / regularization in the model\n",
 "def build_model(hp): # with hyper parameter ranges\n",
 " model = keras.Sequential()\n",
 " # input layer\n",
@@ -558,7 +563,7 @@
 "model = build_model(kt.HyperParameters())\n",
 "hptuner = kt.RandomSearch(\n",
 " hypermodel=build_model,\n",
-" objective='val_categorical_accuracy', # on val data!\n",
+" objective='val_categorical_accuracy', # check performance on val data!\n",
 " max_trials=max_trials,\n",
 " executions_per_trial=executions_per_trial,\n",
 " overwrite=True,\n",
@@ -608,7 +613,7 @@
 "outputs": [],
 "source": [
 "# we might check (train) the best XX models in detail\n",
-"# for didactical purpose we choose only the very best one\n",
+"# for didactic purposes we choose only the very best one, located at index [0]:\n",
 "model = hptuner.get_best_models(num_models=1)[0]\n",
 "model.save(tf_logdir+'/best_model')"
 ]
@@ -646,7 +651,7 @@
 "source": [
 "# load best model and reset weights\n",
 "model = keras.models.load_model(tf_logdir+'/best_model')\n",
-"reset_weights(model)\n",
+"reset_weights(model) # start training from scratch\n",
 "print(model.summary())"
 ]
 },
