solidglue
diff --git a/‎02_Keras/02_01_The_sequential_model.ipynb‎
Lines changed: 301 additions & 3 deletions b/‎02_Keras/02_01_The_sequential_model.ipynb‎
Lines changed: 301 additions & 3 deletions
@@ -1,19 +1,317 @@
 {
  "cells": [
+  {
+   "cell_type": "code",
+   "execution_count": 1,
+   "metadata": {},
+   "outputs": [
+    {
+     "name": "stdout",
+     "output_type": "stream",
+     "text": [
+      "WARNING:tensorflow:From c:\\Users\\yuanshuai\\AppData\\Local\\anaconda3\\envs\\tensorflow2\\Lib\\site-packages\\keras\\src\\losses.py:2976: The name tf.losses.sparse_softmax_cross_entropy is deprecated. Please use tf.compat.v1.losses.sparse_softmax_cross_entropy instead.\n",
+      "\n"
+     ]
+    }
+   ],
+   "source": [
+    "import tensorflow as tf\n",
+    "import keras\n",
+    "from keras import layers\n",
+    "\n",
+    "### Sequential模型"
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": 3,
+   "metadata": {},
+   "outputs": [
+    {
+     "name": "stdout",
+     "output_type": "stream",
+     "text": [
+      "WARNING:tensorflow:From c:\\Users\\yuanshuai\\AppData\\Local\\anaconda3\\envs\\tensorflow2\\Lib\\site-packages\\keras\\src\\backend.py:873: The name tf.get_default_graph is deprecated. Please use tf.compat.v1.get_default_graph instead.\n",
+      "\n"
+     ]
+    }
+   ],
+   "source": [
+    "### 2.1.1 何时使用顺序模型\n",
+    "#序列模型适用于每个层恰好有一个输入张量和一个输出张量的普通层堆栈。\n",
+    "\n",
+    "#示意性地，以下模型：Sequential\n",
+    "# Define Sequential model with 3 layers\n",
+    "model = keras.Sequential(\n",
+    "    [\n",
+    "        layers.Dense(2, activation=\"relu\", name=\"layer1\"),\n",
+    "        layers.Dense(3, activation=\"relu\", name=\"layer2\"),\n",
+    "        layers.Dense(4, name=\"layer3\"),\n",
+    "    ]\n",
+    ")\n",
+    "# Call model on a test input\n",
+    "x = tf.ones((3, 3))\n",
+    "y = model(x)"
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": 4,
+   "metadata": {},
+   "outputs": [],
+   "source": [
+    "#等效于此函数：\n",
+    "# Create 3 layers\n",
+    "layer1 = layers.Dense(2, activation=\"relu\", name=\"layer1\")\n",
+    "layer2 = layers.Dense(3, activation=\"relu\", name=\"layer2\")\n",
+    "layer3 = layers.Dense(4, name=\"layer3\")\n",
+    "\n",
+    "# Call layers on a test input\n",
+    "x = tf.ones((3, 3))\n",
+    "y = layer3(layer2(layer1(x)))"
+   ]
+  },
   {
    "cell_type": "code",
    "execution_count": null,
    "metadata": {},
    "outputs": [],
    "source": [
-    "#TODO\n",
-    "#INFO: demo用，单输入单输出 "
+    "## 在以下情况下，顺序模型不适用：\n",
+    "#   您的模型具有多个输入或多个输出\n",
+    "#   任何图层都具有多个输入或多个输出\n",
+    "#   您需要进行图层共享\n",
+    "#   您需要非线性拓扑（例如残差连接、多分支 模型）\n",
+    "\n"
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": 5,
+   "metadata": {},
+   "outputs": [],
+   "source": [
+    "### 2.1.2 创建顺序模型\n",
+    "#您可以通过将层列表传递给 Sequentiald的构造函数来创建 Sequential模型：\n",
+    "model = keras.Sequential(\n",
+    "    [\n",
+    "        layers.Dense(2, activation=\"relu\"),\n",
+    "        layers.Dense(3, activation=\"relu\"),\n",
+    "        layers.Dense(4),\n",
+    "    ]\n",
+    ")"
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": 6,
+   "metadata": {},
+   "outputs": [
+    {
+     "data": {
+      "text/plain": [
+       "[<keras.src.layers.core.dense.Dense at 0x1ba1a83a010>,\n",
+       " <keras.src.layers.core.dense.Dense at 0x1ba1a6e1410>,\n",
+       " <keras.src.layers.core.dense.Dense at 0x1ba18782190>]"
+      ]
+     },
+     "execution_count": 6,
+     "metadata": {},
+     "output_type": "execute_result"
+    }
+   ],
+   "source": [
+    "#其图层可通过以下属性访问：layers\n",
+    "model.layers"
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": 8,
+   "metadata": {},
+   "outputs": [],
+   "source": [
+    "#您还可以通过以下方法以增量方式创建顺序模型：add()\n",
+    "model = keras.Sequential()\n",
+    "model.add(layers.Dense(2, activation=\"relu\"))\n",
+    "model.add(layers.Dense(3, activation=\"relu\"))\n",
+    "model.add(layers.Dense(4))"
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": 9,
+   "metadata": {},
+   "outputs": [
+    {
+     "name": "stdout",
+     "output_type": "stream",
+     "text": [
+      "2\n"
+     ]
+    }
+   ],
+   "source": [
+    "#请注意，还有一种相应的方法可以删除图层： 顺序模型的行为非常类似于层列表。pop()\n",
+    "model.pop()\n",
+    "print(len(model.layers))  # 2"
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": 10,
+   "metadata": {},
+   "outputs": [],
+   "source": [
+    "#另请注意，Sequential 构造函数接受一个参数，就像 Keras 中的任何图层或模型。\n",
+    "#这对于注释 TensorBoard 图形很有用 具有语义上有意义的名称。name\n",
+    "\n",
+    "model = keras.Sequential(name=\"my_sequential\")\n",
+    "model.add(layers.Dense(2, activation=\"relu\", name=\"layer1\"))\n",
+    "model.add(layers.Dense(3, activation=\"relu\", name=\"layer2\"))\n",
+    "model.add(layers.Dense(4, name=\"layer3\"))"
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": 11,
+   "metadata": {},
+   "outputs": [
+    {
+     "data": {
+      "text/plain": [
+       "[]"
+      ]
+     },
+     "execution_count": 11,
+     "metadata": {},
+     "output_type": "execute_result"
+    }
+   ],
+   "source": [
+    "### 2.1.3 提前指定输入形状\n",
+    "#通常，Keras中的所有层都需要知道其输入的形状，以便能够创建其权重。\n",
+    "#因此，当您创建这样的层时，最初它没有权重：\n",
+    "layer = layers.Dense(3)\n",
+    "layer.weights  # Empty"
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": 12,
+   "metadata": {},
+   "outputs": [
+    {
+     "data": {
+      "text/plain": [
+       "[<tf.Variable 'dense_6/kernel:0' shape=(4, 3) dtype=float32, numpy=\n",
+       " array([[ 0.51047623, -0.17564982, -0.6607744 ],\n",
+       "        [ 0.7689657 ,  0.17553306,  0.82802343],\n",
+       "        [-0.13806897, -0.24232322,  0.18856204],\n",
+       "        [ 0.36269712, -0.23856878, -0.25139934]], dtype=float32)>,\n",
+       " <tf.Variable 'dense_6/bias:0' shape=(3,) dtype=float32, numpy=array([0., 0., 0.], dtype=float32)>]"
+      ]
+     },
+     "execution_count": 12,
+     "metadata": {},
+     "output_type": "execute_result"
+    }
+   ],
+   "source": [
+    "#它在第一次调用输入时创建其权重，因为形状 权重取决于输入的形状：\n",
+    "# Call layer on a test input\n",
+    "x = tf.ones((1, 4))\n",
+    "y = layer(x)\n",
+    "layer.weights  # Now it has weights, of shape (4, 3) and (3,)"
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": 13,
+   "metadata": {},
+   "outputs": [
+    {
+     "name": "stdout",
+     "output_type": "stream",
+     "text": [
+      "Number of weights after calling the model: 6\n"
+     ]
+    }
+   ],
+   "source": [
+    "#当然，这也适用于Sequential模型。当您实例化一个没有输入形状的Sequential模型时，\n",
+    "#它不是“构建”的：它没有权重（调用model.weights会导致一个错误，说明这一点）。\n",
+    "#权重是在模型第一次看到一些输入数据时创建的：\n",
+    "model = keras.Sequential(\n",
+    "    [\n",
+    "        layers.Dense(2, activation=\"relu\"),\n",
+    "        layers.Dense(3, activation=\"relu\"),\n",
+    "        layers.Dense(4),\n",
+    "    ]\n",
+    ")  # No weights at this stage!\n",
+    "\n",
+    "# At this point, you can't do this:\n",
+    "# model.weights\n",
+    "\n",
+    "# You also can't do this:\n",
+    "# model.summary()\n",
+    "\n",
+    "# Call the model on a test input\n",
+    "x = tf.ones((1, 4))\n",
+    "y = model(x)\n",
+    "print(\"Number of weights after calling the model:\", len(model.weights))  # 6"
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": 14,
+   "metadata": {},
+   "outputs": [
+    {
+     "name": "stdout",
+     "output_type": "stream",
+     "text": [
+      "Model: \"sequential_3\"\n",
+      "_________________________________________________________________\n",
+      " Layer (type)                Output Shape              Param #   \n",
+      "=================================================================\n",
+      " dense_7 (Dense)             (1, 2)                    10        \n",
+      "                                                                 \n",
+      " dense_8 (Dense)             (1, 3)                    9         \n",
+      "                                                                 \n",
+      " dense_9 (Dense)             (1, 4)                    16        \n",
+      "                                                                 \n",
+      "=================================================================\n",
+      "Total params: 35 (140.00 Byte)\n",
+      "Trainable params: 35 (140.00 Byte)\n",
+      "Non-trainable params: 0 (0.00 Byte)\n",
+      "_________________________________________________________________\n"
+     ]
+    }
+   ],
+   "source": [
+    "#“构建”模型后，可以调用其方法来显示其 内容：summary()\n",
+    "model.summary()"
    ]
   }
  ],
  "metadata": {
+  "kernelspec": {
+   "display_name": "Python 3",
+   "language": "python",
+   "name": "python3"
+  },
   "language_info": {
-   "name": "python"
+   "codemirror_mode": {
+    "name": "ipython",
+    "version": 3
+   },
+   "file_extension": ".py",
+   "mimetype": "text/x-python",
+   "name": "python",
+   "nbconvert_exporter": "python",
+   "pygments_lexer": "ipython3",
+   "version": "3.11.8"
   }
  },
  "nbformat": 4,