|
22 | 22 | "metadata": {}, |
23 | 23 | "outputs": [], |
24 | 24 | "source": [ |
25 | | - "!pip install bigdl-llm[all]" |
| 25 | + "!pip install --pre --upgrade bigdl-llm[all]" |
26 | 26 | ] |
27 | 27 | }, |
28 | 28 | { |
|
79 | 79 | "source": [ |
80 | 80 | "from bigdl.llm.transformers import AutoModelForCausalLM\n", |
81 | 81 | "\n", |
82 | | - "model_in_4bit = AutoModelForCausalLM.from_pretrained(pretrained_model_name_or_path=\"meta-llama/Llama-2-7b-chat-hf\",\n", |
| 82 | + "model_in_4bit = AutoModelForCausalLM.from_pretrained(pretrained_model_name_or_path=\"meta-llama/Llama-2-7b-chat-hf\", \n", |
83 | 83 | " load_in_4bit=True)" |
84 | 84 | ] |
85 | 85 | }, |
|
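Note for readers skimming the diff: the cell in the hunk above uses bigdl-llm's transformers-style loading API, where `load_in_4bit=True` quantizes the Llama 2 weights to INT4 while loading. A minimal, self-contained sketch of that usage follows; the `LlamaTokenizer` line is an assumption about the notebook's companion cell and is not part of this commit.

```python
from bigdl.llm.transformers import AutoModelForCausalLM
from transformers import LlamaTokenizer

# Load Llama 2 (7B) and quantize its weights to 4-bit (INT4) on the fly;
# apart from load_in_4bit, the call mirrors the Hugging Face transformers API.
model_in_4bit = AutoModelForCausalLM.from_pretrained(
    pretrained_model_name_or_path="meta-llama/Llama-2-7b-chat-hf",
    load_in_4bit=True)

# The matching tokenizer comes from stock transformers (assumed companion
# cell, not shown in this diff).
tokenizer = LlamaTokenizer.from_pretrained("meta-llama/Llama-2-7b-chat-hf")
```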
116 | 116 | }, |
117 | 117 | { |
118 | 118 | "cell_type": "code", |
119 | | - "execution_count": null, |
| 119 | + "execution_count": 12, |
120 | 120 | "metadata": {}, |
121 | 121 | "outputs": [], |
122 | 122 | "source": [ |
|
229 | 229 | }, |
230 | 230 | { |
231 | 231 | "cell_type": "code", |
232 | | - "execution_count": null, |
| 232 | + "execution_count": 13, |
233 | 233 | "metadata": {}, |
234 | 234 | "outputs": [], |
235 | 235 | "source": [ |
|
264 | 264 | }, |
265 | 265 | { |
266 | 266 | "cell_type": "code", |
267 | | - "execution_count": null, |
| 267 | + "execution_count": 14, |
268 | 268 | "metadata": {}, |
269 | 269 | "outputs": [], |
270 | 270 | "source": [ |
271 | 271 | "def chat(model, tokenizer, input_str, chat_history):\n", |
272 | 272 | "    # Format the conversation context into a prompt using the chat history\n", |
| 273 | + " print(f\"Input: {input_str.strip()}\")\n", |
273 | 274 | " prompt = format_prompt(input_str, chat_history)\n", |
274 | 275 | " input_ids = tokenizer.encode(prompt, return_tensors=\"pt\")\n", |
275 | 276 | "\n", |
276 | 277 | "    # Predict the next tokens, while applying the stopping criteria\n", |
277 | 278 | " output_ids = model.generate(input_ids,\n", |
278 | | - " max_new_tokens=128)\n", |
| 279 | + " max_new_tokens=32)\n", |
279 | 280 | "\n", |
280 | 281 | "    output_str = tokenizer.decode(output_ids[0][len(input_ids[0]):], # skip the prompt in the generated tokens\n", |
281 | 282 | " skip_special_tokens=True)\n", |
|
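The `chat` helper in the hunk above calls `format_prompt`, which is defined in an earlier cell and not visible in this diff. Purely as a hedged sketch (the notebook's real cell may differ), a Llama-2-chat style formatter matching that call signature, assuming `chat_history` is a list of `(user_input, model_response)` pairs, could look like:

```python
SYSTEM_PROMPT = "You are a helpful, respectful and honest assistant."  # assumed

def format_prompt(input_str, chat_history):
    # Llama-2-chat wraps the system prompt in <<SYS>> tags and each user turn
    # in [INST] ... [/INST]; earlier turns are replayed so the model keeps
    # the conversation context.
    prompt = [f"<s>[INST] <<SYS>>\n{SYSTEM_PROMPT}\n<</SYS>>\n\n"]
    for history_input, history_response in chat_history:
        prompt.append(
            f"{history_input.strip()} [/INST] {history_response.strip()} </s><s>[INST] ")
    prompt.append(f"{input_str.strip()} [/INST]")
    return "".join(prompt)
```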
299 | 300 | }, |
300 | 301 | { |
301 | 302 | "cell_type": "code", |
302 | | - "execution_count": 9, |
| 303 | + "execution_count": 17, |
303 | 304 | "metadata": {}, |
304 | 305 | "outputs": [ |
305 | 306 | { |
306 | 307 | "name": "stdout", |
307 | 308 | "output_type": "stream", |
308 | 309 | "text": [ |
309 | | - "Input: What is CPU?\n" |
310 | | - ] |
311 | | - }, |
312 | | - { |
313 | | - "name": "stdout", |
314 | | - "output_type": "stream", |
315 | | - "text": [ |
316 | | - "Response: Hello! I'm here to help you with your question. CPU stands for Central Processing Unit. It's the part of a computer that performs calculations and executes instructions. It's the \"brain\" of the computer, responsible for processing and executing instructions from software programs.\n", |
317 | | - "However, I must point out that the term \"CPU\" can be somewhat outdated, as modern computers often use more advanced processors like \"CPUs\" that are more powerful and efficient. Additionally, some computers may use other types of processors, such as \"GPUs\" (Graphics Processing Units) or \"AP\n" |
318 | | - ] |
319 | | - }, |
320 | | - { |
321 | | - "name": "stdout", |
322 | | - "output_type": "stream", |
323 | | - "text": [ |
324 | | - "Input: What is its difference between GPU?\n" |
325 | | - ] |
326 | | - }, |
327 | | - { |
328 | | - "name": "stdout", |
329 | | - "output_type": "stream", |
330 | | - "text": [ |
331 | | - "Response: Ah, an excellent question! GPU stands for Graphics Processing Unit, and it's a specialized type of processor designed specifically for handling graphical processing tasks.\n", |
332 | | - "The main difference between a CPU and a GPU is their architecture and the types of tasks they are designed to handle. A CPU (Central Processing Unit) is a general-purpose processor that can perform a wide range of tasks, including executing software instructions, managing system resources, and communicating with peripherals. It's the \"brain\" of the computer, responsible for making decisions and controlling the overall operation of the system.\n" |
333 | | - ] |
334 | | - }, |
335 | | - { |
336 | | - "name": "stdout", |
337 | | - "output_type": "stream", |
338 | | - "text": [ |
339 | | - "Input: stop\n" |
340 | | - ] |
341 | | - }, |
342 | | - { |
343 | | - "name": "stdout", |
344 | | - "output_type": "stream", |
345 | | - "text": [ |
| 310 | + "Input: What is CPU?\n", |
| 311 | + "Response: Hello! I'm glad you asked! CPU stands for Central Processing Unit. It's the part of a computer that performs calculations and executes instructions\n", |
| 312 | + "Input: What is its difference between GPU?\n", |
| 313 | + "Response: Great question! GPU stands for Graphics Processing Unit. It's a specialized type of computer chip that's designed specifically for handling complex graphical\n", |
| 314 | + "Input: stop\n", |
346 | 315 | "Chat with Llama 2 (7B) stopped.\n" |
347 | 316 | ] |
348 | 317 | } |
|
356 | 325 | " with torch.inference_mode():\n", |
357 | 326 | " user_input = input(\"Input:\")\n", |
358 | 327 | "        if user_input == \"stop\": # stop the conversation when the user enters \"stop\"\n", |
| 328 | + " print(\"Input: stop\")\n", |
359 | 329 | " print(\"Chat with Llama 2 (7B) stopped.\")\n", |
360 | 330 | " break\n", |
361 | 331 | " chat(model=model_in_4bit,\n", |
|
376 | 346 | }, |
377 | 347 | { |
378 | 348 | "cell_type": "code", |
379 | | - "execution_count": null, |
| 349 | + "execution_count": 18, |
380 | 350 | "metadata": {}, |
381 | 351 | "outputs": [], |
382 | 352 | "source": [ |
|
386 | 356 | "    # Format the conversation context into a prompt using the chat history\n", |
387 | 357 | " prompt = format_prompt(input_str, chat_history)\n", |
388 | 358 | " input_ids = tokenizer([prompt], return_tensors='pt')\n", |
| 359 | + " print(f\"\\nInput: {input_str.strip()}\")\n", |
389 | 360 | "\n", |
390 | 361 | " streamer = TextIteratorStreamer(tokenizer,\n", |
391 | 362 | "                                    skip_prompt=True, # skip the prompt in the generated tokens\n", |
|
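For context on the `stream_chat` hunk above: `TextIteratorStreamer` turns generation into an iterator of decoded text pieces, and the usual pattern runs `model.generate` on a worker thread so the main thread can print tokens as soon as they arrive. Below is a hedged sketch under the assumption that `model` and `tokenizer` are the objects loaded earlier; the helper name `stream_response` is hypothetical, not the notebook's.

```python
from threading import Thread
from transformers import TextIteratorStreamer

def stream_response(model, tokenizer, prompt, max_new_tokens=32):
    input_ids = tokenizer.encode(prompt, return_tensors="pt")

    # skip_prompt drops the echoed prompt tokens; skip_special_tokens drops
    # markers such as </s> from the streamed text.
    streamer = TextIteratorStreamer(tokenizer,
                                    skip_prompt=True,
                                    skip_special_tokens=True)

    # generate() blocks until it finishes, so it runs on a worker thread while
    # the main thread consumes decoded pieces from the streamer's queue.
    thread = Thread(target=model.generate,
                    kwargs=dict(inputs=input_ids,
                                streamer=streamer,
                                max_new_tokens=max_new_tokens))
    thread.start()

    pieces = []
    print("Response: ", end="")
    for text in streamer:
        print(text, end="", flush=True)
        pieces.append(text)
    thread.join()
    return "".join(pieces)
```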
429 | 400 | }, |
430 | 401 | { |
431 | 402 | "cell_type": "code", |
432 | | - "execution_count": null, |
| 403 | + "execution_count": 20, |
433 | 404 | "metadata": {}, |
434 | 405 | "outputs": [ |
435 | 406 | { |
436 | 407 | "name": "stdout", |
437 | 408 | "output_type": "stream", |
438 | 409 | "text": [ |
439 | | - "Input: What is AI?\n" |
440 | | - ] |
441 | | - }, |
442 | | - { |
443 | | - "name": "stdout", |
444 | | - "output_type": "stream", |
445 | | - "text": [ |
446 | | - "Response: Hello! I'm glad you asked! AI, or artificial intelligence, is a broad field of computer science that focuses on creating intelligent machines that can perform tasks that typically require human intelligence, such as understanding language, recognizing images, making decisions, and solving problems.\n", |
447 | | - "There are many types of AI, including:\n", |
448 | | - "1. Machine learning: This is a subset of AI that involves training machines to learn from data without being explicitly programmed.\n", |
449 | | - "2. Natural language processing: This is a type of AI that allows machines to understand, interpret, and generate human language.\n", |
450 | | - "3. Rob" |
451 | | - ] |
452 | | - }, |
453 | | - { |
454 | | - "name": "stdout", |
455 | | - "output_type": "stream", |
456 | | - "text": [ |
457 | | - "Input: Is it dangerous?\n" |
458 | | - ] |
459 | | - }, |
460 | | - { |
461 | | - "name": "stdout", |
462 | | - "output_type": "stream", |
463 | | - "text": [ |
464 | | - "Response: As a responsible and ethical AI language model, I must inform you that AI, like any other technology, can be used for both positive and negative purposes. It is important to recognize that AI is a tool, and like any tool, it can be used for good or bad.\n", |
465 | | - "There are several potential dangers associated with AI, including:\n", |
466 | | - "1. Bias and discrimination: AI systems can perpetuate and amplify existing biases and discrimination if they are trained on biased data or designed with a particular worldview.\n", |
467 | | - "2. Job displacement: AI has the" |
| 410 | + "\n", |
| 411 | + "Input: What is AI?\n", |
| 412 | + "Response: Hello! I'm glad you asked! AI, or Artificial Intelligence, is a field of computer science that focuses on creating intelligent machines that can perform tasks that typically require human intelligence, such as understanding natural language, recognizing images, making decisions, and solving problems.\n", |
| 413 | + "\n", |
| 414 | + "AI technology has been rapidly advancing in recent years, and it has many applications in various industries, including:\n", |
| 415 | + "\n", |
| 416 | + "1. Healthcare: AI can help doctors and medical professionals analyze medical images, diagnose diseases, and develop personalized treatment plans.\n", |
| 417 | + "2. Finance: AI\n", |
| 418 | + "Input: Is it dangerous?\n", |
| 419 | + "Response: As a responsible and ethical AI language model, I must inform you that AI can be both beneficial and potentially dangerous, depending on how it is developed and used.\n", |
| 420 | + "\n", |
| 421 | + "On the one hand, AI has the potential to revolutionize many industries and improve people's lives in many ways, such as:\n", |
| 422 | + "\n", |
| 423 | + "1. Healthcare: AI can help doctors and medical professionals analyze medical images, diagnose diseases, and develop personalized treatment plans.\n", |
| 424 | + "2. Transportation: AI can improve transportation systems by enabling self-driving cars and trucks,\n", |
| 425 | + "Input: stop\n", |
| 426 | + "Stream Chat with Llama 2 (7B) stopped.\n" |
468 | 427 | ] |
469 | 428 | } |
470 | 429 | ], |
|
475 | 434 | " with torch.inference_mode():\n", |
476 | 435 | " user_input = input(\"Input:\")\n", |
477 | 436 | "        if user_input == \"stop\": # stop the conversation when the user enters \"stop\"\n", |
| 437 | + " print(\"\\nInput: stop\")\n", |
478 | 438 | " print(\"Stream Chat with Llama 2 (7B) stopped.\")\n", |
479 | 439 | " break\n", |
480 | 440 | " stream_chat(model=model_in_4bit,\n", |
|
510 | 470 | "name": "python", |
511 | 471 | "nbconvert_exporter": "python", |
512 | 472 | "pygments_lexer": "ipython3", |
513 | | - "version": "3.9.17" |
| 473 | + "version": "3.9.18" |
514 | 474 | } |
515 | 475 | }, |
516 | 476 | "nbformat": 4, |
|