eric496
diff --git a/‎0. Data Type.ipynb
Lines changed: 303 additions & 0 deletions b/‎0. Data Type.ipynb
Lines changed: 303 additions & 0 deletions
@@ -0,0 +1,303 @@
+{
+ "cells": [
+  {
+   "cell_type": "code",
+   "execution_count": 1,
+   "metadata": {},
+   "outputs": [],
+   "source": [
+    "import numpy as np"
+   ]
+  },
+  {
+   "cell_type": "markdown",
+   "metadata": {},
+   "source": [
+    "### A list of NumPy Data Types"
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": 2,
+   "metadata": {},
+   "outputs": [
+    {
+     "data": {
+      "text/html": [
+       "<div>\n",
+       "<style scoped>\n",
+       "    .dataframe tbody tr th:only-of-type {\n",
+       "        vertical-align: middle;\n",
+       "    }\n",
+       "\n",
+       "    .dataframe tbody tr th {\n",
+       "        vertical-align: top;\n",
+       "    }\n",
+       "\n",
+       "    .dataframe thead th {\n",
+       "        text-align: right;\n",
+       "    }\n",
+       "</style>\n",
+       "<table border=\"1\" class=\"dataframe\">\n",
+       "  <thead>\n",
+       "    <tr style=\"text-align: right;\">\n",
+       "      <th></th>\n",
+       "      <th>Type</th>\n",
+       "      <th>Type Code</th>\n",
+       "    </tr>\n",
+       "  </thead>\n",
+       "  <tbody>\n",
+       "    <tr>\n",
+       "      <th>0</th>\n",
+       "      <td>int8</td>\n",
+       "      <td>i1</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>1</th>\n",
+       "      <td>uint8</td>\n",
+       "      <td>u1</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>2</th>\n",
+       "      <td>int16</td>\n",
+       "      <td>i2</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>3</th>\n",
+       "      <td>uint16</td>\n",
+       "      <td>u2</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>4</th>\n",
+       "      <td>int32</td>\n",
+       "      <td>i4</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>5</th>\n",
+       "      <td>uint32</td>\n",
+       "      <td>u4</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>6</th>\n",
+       "      <td>int64</td>\n",
+       "      <td>i8</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>7</th>\n",
+       "      <td>uint64</td>\n",
+       "      <td>u8</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>8</th>\n",
+       "      <td>float16</td>\n",
+       "      <td>f2</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>9</th>\n",
+       "      <td>float32</td>\n",
+       "      <td>f4 or f</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>10</th>\n",
+       "      <td>float64</td>\n",
+       "      <td>f8 or d</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>11</th>\n",
+       "      <td>float128</td>\n",
+       "      <td>f16 or g</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>12</th>\n",
+       "      <td>complex64</td>\n",
+       "      <td>c8</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>13</th>\n",
+       "      <td>complex128</td>\n",
+       "      <td>c16</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>14</th>\n",
+       "      <td>bool</td>\n",
+       "      <td></td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>15</th>\n",
+       "      <td>object</td>\n",
+       "      <td>O</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>16</th>\n",
+       "      <td>string_</td>\n",
+       "      <td>S</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>17</th>\n",
+       "      <td>unicode_</td>\n",
+       "      <td>U</td>\n",
+       "    </tr>\n",
+       "  </tbody>\n",
+       "</table>\n",
+       "</div>"
+      ],
+      "text/plain": [
+       "          Type Type Code\n",
+       "0         int8        i1\n",
+       "1        uint8        u1\n",
+       "2        int16        i2\n",
+       "3       uint16        u2\n",
+       "4        int32        i4\n",
+       "5       uint32        u4\n",
+       "6        int64        i8\n",
+       "7       uint64        u8\n",
+       "8      float16        f2\n",
+       "9      float32   f4 or f\n",
+       "10     float64   f8 or d\n",
+       "11    float128  f16 or g\n",
+       "12   complex64        c8\n",
+       "13  complex128       c16\n",
+       "14        bool          \n",
+       "15      object         O\n",
+       "16     string_         S\n",
+       "17    unicode_         U"
+      ]
+     },
+     "execution_count": 2,
+     "metadata": {},
+     "output_type": "execute_result"
+    }
+   ],
+   "source": [
+    "import pandas as pd\n",
+    "\n",
+    "# Reference table of NumPy dtypes: one (dtype name, type code) pair per row,\n",
+    "# listed in display order.\n",
+    "# NOTE(review): NumPy's own character code for bool is '?'; the blank entry is\n",
+    "# kept as-is here so the table still matches the saved output.\n",
+    "dtypes = pd.DataFrame(\n",
+    "    [\n",
+    "        ('int8', 'i1'),\n",
+    "        ('uint8', 'u1'),\n",
+    "        ('int16', 'i2'),\n",
+    "        ('uint16', 'u2'),\n",
+    "        ('int32', 'i4'),\n",
+    "        ('uint32', 'u4'),\n",
+    "        ('int64', 'i8'),\n",
+    "        ('uint64', 'u8'),\n",
+    "        ('float16', 'f2'),\n",
+    "        ('float32', 'f4 or f'),\n",
+    "        ('float64', 'f8 or d'),\n",
+    "        ('float128', 'f16 or g'),\n",
+    "        ('complex64', 'c8'),\n",
+    "        ('complex128', 'c16'),\n",
+    "        ('bool', ''),\n",
+    "        ('object', 'O'),\n",
+    "        ('string_', 'S'),\n",
+    "        ('unicode_', 'U'),\n",
+    "    ],\n",
+    "    columns=['Type', 'Type Code'],\n",
+    ")\n",
+    "\n",
+    "dtypes"
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": 3,
+   "metadata": {},
+   "outputs": [
+    {
+     "name": "stdout",
+     "output_type": "stream",
+     "text": [
+      "[1. 2. 3.]\n",
+      "float32\n",
+      "[1.+2.j 3.-4.j]\n",
+      "complex64\n",
+      "[False  True  True]\n",
+      "bool\n"
+     ]
+    }
+   ],
+   "source": [
+    "# Create arrays with an explicit dtype. The dtype may be given either as a\n",
+    "# type-code string ('f4') or as a NumPy scalar type (np.complex64, np.bool_).\n",
+    "arr = np.array([1, 2, 3], dtype='f4')\n",
+    "print(arr)\n",
+    "print(arr.dtype)\n",
+    "\n",
+    "arr = np.array([1+2j, 3-4j], dtype=np.complex64)\n",
+    "print(arr)\n",
+    "print(arr.dtype)\n",
+    "\n",
+    "# np.bool_ is used instead of np.bool: the np.bool alias was deprecated in\n",
+    "# NumPy 1.20 and removed in 1.24, where it raises AttributeError.\n",
+    "arr = np.array([0, 1, 1], dtype=np.bool_)\n",
+    "print(arr)\n",
+    "print(arr.dtype)"
+   ]
+  },
+  {
+   "cell_type": "markdown",
+   "metadata": {},
+   "source": [
+    "### String Data Types"
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": 4,
+   "metadata": {},
+   "outputs": [
+    {
+     "name": "stdout",
+     "output_type": "stream",
+     "text": [
+      "[b'abc' b'def']\n",
+      "|S3\n"
+     ]
+    }
+   ],
+   "source": [
+    "# An 'S<n>' dtype (here 'S3') caps each element at n bytes;\n",
+    "# any longer input string is truncated to fit ('defg' -> b'def').\n",
+    "s = np.array(['abc', 'defg'], dtype=np.dtype('S3'))\n",
+    "print(s, s.dtype, sep='\\n')"
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": 5,
+   "metadata": {},
+   "outputs": [
+    {
+     "name": "stdout",
+     "output_type": "stream",
+     "text": [
+      "|S3\n",
+      "<U3\n"
+     ]
+    }
+   ],
+   "source": [
+    "# NumPy byte-string and unicode dtypes are fixed-length.\n",
+    "# When no length is given, the longest element of the input sets the width.\n",
+    "# np.bytes_ / np.str_ are used instead of the np.string_ / np.unicode_ aliases,\n",
+    "# which were removed in NumPy 2.0; the resulting dtypes are the same.\n",
+    "arr = np.array(['a', 'ab', 'abc'], dtype=np.bytes_)\n",
+    "print(arr.dtype)\n",
+    "\n",
+    "arr = np.array(['a', 'ab', 'abc'], dtype=np.str_)\n",
+    "print(arr.dtype)"
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": 6,
+   "metadata": {},
+   "outputs": [],
+   "source": [
+    "# What do the \"|\" and \"<\" prefixes in the dtypes above mean?\n",
+    "# They are byte-order indicators: \"<\" is little-endian and \"|\" means byte order does not apply.\n",
+    "# The details are beyond the scope of this tutorial; see\n",
+    "# https://numpy.org/doc/stable/reference/generated/numpy.dtype.byteorder.html\n",
+    "# and https://en.wikipedia.org/wiki/Endianness"
+   ]
+  }
+ ],
+ "metadata": {
+  "kernelspec": {
+   "display_name": "Python 3",
+   "language": "python",
+   "name": "python3"
+  },
+  "language_info": {
+   "codemirror_mode": {
+    "name": "ipython",
+    "version": 3
+   },
+   "file_extension": ".py",
+   "mimetype": "text/x-python",
+   "name": "python",
+   "nbconvert_exporter": "python",
+   "pygments_lexer": "ipython3",
+   "version": "3.6.6"
+  }
+ },
+ "nbformat": 4,
+ "nbformat_minor": 2
+}