feat: 新增技能扩展N12一章相关示例源码

2023-01-26 12:13:27 +08:00
parent ed5238b04f
commit 924966e89e
1 changed files with 816 additions and 0 deletions
--- a/code/newsletter/N12/tablib.ipynb
+++ b/code/newsletter/N12/tablib.ipynb
@@ -0,0 +1,816 @@
+{
+ "cells": [
+  {
+   "cell_type": "markdown",
+   "metadata": {},
+   "source": [
+    "## 创建一个 Dataset"
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": 1,
+   "metadata": {},
+   "outputs": [
+    {
+     "name": "stdout",
+     "output_type": "stream",
+     "text": [
+      "100gle|male|author\n"
+     ]
+    }
+   ],
+   "source": [
+    "import tablib\n",
+    "\n",
+    "data = tablib.Dataset([\"100gle\", \"male\", \"author\"])\n",
+    "print(data)"
+   ]
+  },
+  {
+   "cell_type": "markdown",
+   "metadata": {},
+   "source": [
+    "## 为 Dataset 设置字段名"
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": 2,
+   "metadata": {},
+   "outputs": [
+    {
+     "name": "stdout",
+     "output_type": "stream",
+     "text": [
+      "name  |gender|job   \n",
+      "------|------|------\n",
+      "100gle|male  |author\n"
+     ]
+    }
+   ],
+   "source": [
+    "data.headers = (\"name\", \"gender\", \"job\")\n",
+    "print(data)"
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": 3,
+   "metadata": {},
+   "outputs": [
+    {
+     "name": "stdout",
+     "output_type": "stream",
+     "text": [
+      "a|b|c\n",
+      "-|-|-\n",
+      "1|2|3\n",
+      "4|5|6\n"
+     ]
+    }
+   ],
+   "source": [
+    "data = tablib.Dataset(\n",
+    "    *[[1, 2, 3], [4, 5, 6]],\n",
+    "    headers=[\"a\", \"b\", \"c\"],\n",
+    ")\n",
+    "\n",
+    "print(data)"
+   ]
+  },
+  {
+   "cell_type": "markdown",
+   "metadata": {},
+   "source": [
+    "## 将数据添加进 Dataset 中"
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": 4,
+   "metadata": {},
+   "outputs": [
+    {
+     "name": "stdout",
+     "output_type": "stream",
+     "text": [
+      "name  |gender|job       \n",
+      "------|------|----------\n",
+      "100gle|male  |author    \n",
+      "100gle|male  |programmer\n"
+     ]
+    }
+   ],
+   "source": [
+    "data = tablib.Dataset()\n",
+    "data.headers = (\"name\", \"gender\", \"job\")\n",
+    "data.append([\"100gle\", \"male\", \"author\"])\n",
+    "data.append([\"100gle\", \"male\", \"programmer\"])\n",
+    "\n",
+    "print(data)"
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": 5,
+   "metadata": {},
+   "outputs": [
+    {
+     "name": "stdout",
+     "output_type": "stream",
+     "text": [
+      "name  |gender|job       \n",
+      "------|------|----------\n",
+      "Marry |female|artist    \n",
+      "100gle|male  |author    \n",
+      "100gle|male  |programmer\n"
+     ]
+    }
+   ],
+   "source": [
+    "data.lpush([\"Marry\", \"female\", \"artist\"])\n",
+    "print(data)"
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": 6,
+   "metadata": {},
+   "outputs": [
+    {
+     "name": "stdout",
+     "output_type": "stream",
+     "text": [
+      "name  |gender|job       |tag\n",
+      "------|------|----------|---\n",
+      "Marry |female|artist    |1  \n",
+      "100gle|male  |author    |2  \n",
+      "100gle|male  |programmer|3  \n"
+     ]
+    }
+   ],
+   "source": [
+    "data.append_col([1, 2, 3], header=\"tag\")\n",
+    "print(data)"
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": 7,
+   "metadata": {},
+   "outputs": [
+    {
+     "name": "stdout",
+     "output_type": "stream",
+     "text": [
+      "id|name  |gender|job       |tag\n",
+      "--|------|------|----------|---\n",
+      "a |Marry |female|artist    |1  \n",
+      "b |100gle|male  |author    |2  \n",
+      "c |100gle|male  |programmer|3  \n"
+     ]
+    }
+   ],
+   "source": [
+    "data.lpush_col([\"a\", \"b\", \"c\"], header=\"id\")\n",
+    "print(data)"
+   ]
+  },
+  {
+   "cell_type": "markdown",
+   "metadata": {},
+   "source": [
+    "## 索引与删除 Dataset 数据"
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": 8,
+   "metadata": {},
+   "outputs": [
+    {
+     "data": {
+      "text/plain": [
+       "['Marry', '100gle', '100gle']"
+      ]
+     },
+     "execution_count": 8,
+     "metadata": {},
+     "output_type": "execute_result"
+    }
+   ],
+   "source": [
+    "data[\"name\"]"
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": 9,
+   "metadata": {},
+   "outputs": [
+    {
+     "data": {
+      "text/plain": [
+       "['artist', 'author', 'programmer']"
+      ]
+     },
+     "execution_count": 9,
+     "metadata": {},
+     "output_type": "execute_result"
+    }
+   ],
+   "source": [
+    "data.get_col(3)"
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": 10,
+   "metadata": {},
+   "outputs": [
+    {
+     "data": {
+      "text/plain": [
+       "('a', 'Marry', 'female', 'artist', 1)"
+      ]
+     },
+     "execution_count": 10,
+     "metadata": {},
+     "output_type": "execute_result"
+    }
+   ],
+   "source": [
+    "data[0]"
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": 11,
+   "metadata": {},
+   "outputs": [
+    {
+     "data": {
+      "text/plain": [
+       "[('b', '100gle', 'male', 'author', 2),\n",
+       " ('c', '100gle', 'male', 'programmer', 3)]"
+      ]
+     },
+     "execution_count": 11,
+     "metadata": {},
+     "output_type": "execute_result"
+    }
+   ],
+   "source": [
+    "data[1:]"
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": 12,
+   "metadata": {},
+   "outputs": [
+    {
+     "data": {
+      "text/plain": [
+       "('c', '100gle', 'male', 'programmer', 3)"
+      ]
+     },
+     "execution_count": 12,
+     "metadata": {},
+     "output_type": "execute_result"
+    }
+   ],
+   "source": [
+    "data[-1]"
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": 13,
+   "metadata": {},
+   "outputs": [
+    {
+     "name": "stdout",
+     "output_type": "stream",
+     "text": [
+      "id|name  |gender|job       |tag\n",
+      "--|------|------|----------|---\n",
+      "b |100gle|male  |author    |2  \n",
+      "c |100gle|male  |programmer|3  \n"
+     ]
+    }
+   ],
+   "source": [
+    "del data[0]\n",
+    "print(data)"
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": 14,
+   "metadata": {},
+   "outputs": [
+    {
+     "name": "stdout",
+     "output_type": "stream",
+     "text": [
+      "id|name  |job       |tag\n",
+      "--|------|----------|---\n",
+      "b |100gle|author    |2  \n",
+      "c |100gle|programmer|3  \n"
+     ]
+    }
+   ],
+   "source": [
+    "del data[\"gender\"]\n",
+    "print(data)"
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": 15,
+   "metadata": {},
+   "outputs": [
+    {
+     "name": "stdout",
+     "output_type": "stream",
+     "text": [
+      "\n"
+     ]
+    }
+   ],
+   "source": [
+    "data.wipe()\n",
+    "print(data)"
+   ]
+  },
+  {
+   "cell_type": "markdown",
+   "metadata": {},
+   "source": [
+    "## 通过标签筛选数据"
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": 16,
+   "metadata": {},
+   "outputs": [
+    {
+     "name": "stdout",
+     "output_type": "stream",
+     "text": [
+      "id                                  |title                  |content           |create_at \n",
+      "------------------------------------|-----------------------|------------------|----------\n",
+      "f2097b2c-6d62-469a-a7ee-d44e53fc5458|URL Schema 的 1000 种使用方式|如何使用 URL Schema...|2022-09-06\n",
+      "2cb43639-a76f-4e9f-8e7f-d7c5809b5489|Python 基础快速入门          |快速入门 Python...    |2022-09-06\n",
+      "9eca4106-6520-4b82-93fd-a273eaf0cb6f|使用 Tablib 来完成数据表格操作    |有关 Tablib 的使用技巧...|2022-10-01\n",
+      "cbcf0041-5198-47c7-84e5-e9a88bd09ecc|使用 Django 从零打造一个博客系统   |Django 基础...      |2022-09-30\n"
+     ]
+    }
+   ],
+   "source": [
+    "from uuid import uuid4\n",
+    "\n",
+    "import tablib\n",
+    "\n",
+    "# Each entry pairs a row (id, title, content, create_at) with the tags attached to that row.\n",
+    "records = [\n",
+    "    (\n",
+    "        (uuid4(), \"URL Schema 的 1000 种使用方式\", \"如何使用 URL Schema...\", \"2022-09-06\"),\n",
+    "        [\"iOS\", \"Automatic\"],\n",
+    "    ),\n",
+    "    ((uuid4(), \"Python 基础快速入门\", \"快速入门 Python...\", \"2022-09-06\"), [\"Python\", \"Basic\"]),\n",
+    "    (\n",
+    "        (uuid4(), \"使用 Tablib 来完成数据表格操作\", \"有关 Tablib 的使用技巧...\", \"2022-10-01\"),\n",
+    "        [\"Python\", \"Python Library\"],\n",
+    "    ),\n",
+    "    (\n",
+    "        (uuid4(), \"使用 Django 从零打造一个博客系统\", \"Django 基础...\", \"2022-09-30\"),\n",
+    "        [\"Python\", \"Web\", \"Django\", \"Python Library\"],\n",
+    "    ),\n",
+    "]\n",
+    "blogs = tablib.Dataset(headers=[\"id\", \"title\", \"content\", \"create_at\"])\n",
+    "for row_values, row_tags in records:\n",
+    "    blogs.append(row_values, tags=row_tags)\n",
+    "\n",
+    "print(blogs)"
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": 17,
+   "metadata": {},
+   "outputs": [
+    {
+     "data": {
+      "text/plain": [
+       "[OrderedDict([('id', UUID('f2097b2c-6d62-469a-a7ee-d44e53fc5458')),\n",
+       "              ('title', 'URL Schema 的 1000 种使用方式'),\n",
+       "              ('content', '如何使用 URL Schema...'),\n",
+       "              ('create_at', '2022-09-06')])]"
+      ]
+     },
+     "execution_count": 17,
+     "metadata": {},
+     "output_type": "execute_result"
+    }
+   ],
+   "source": [
+    "blogs.filter([\"iOS\"]).dict"
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": 18,
+   "metadata": {},
+   "outputs": [
+    {
+     "data": {
+      "text/plain": [
+       "[OrderedDict([('id', UUID('2cb43639-a76f-4e9f-8e7f-d7c5809b5489')),\n",
+       "              ('title', 'Python 基础快速入门'),\n",
+       "              ('content', '快速入门 Python...'),\n",
+       "              ('create_at', '2022-09-06')]),\n",
+       " OrderedDict([('id', UUID('9eca4106-6520-4b82-93fd-a273eaf0cb6f')),\n",
+       "              ('title', '使用 Tablib 来完成数据表格操作'),\n",
+       "              ('content', '有关 Tablib 的使用技巧...'),\n",
+       "              ('create_at', '2022-10-01')]),\n",
+       " OrderedDict([('id', UUID('cbcf0041-5198-47c7-84e5-e9a88bd09ecc')),\n",
+       "              ('title', '使用 Django 从零打造一个博客系统'),\n",
+       "              ('content', 'Django 基础...'),\n",
+       "              ('create_at', '2022-09-30')])]"
+      ]
+     },
+     "execution_count": 18,
+     "metadata": {},
+     "output_type": "execute_result"
+    }
+   ],
+   "source": [
+    "blogs.filter([\"Python\"]).dict"
+   ]
+  },
+  {
+   "cell_type": "markdown",
+   "metadata": {},
+   "source": [
+    "## 动态列"
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": 19,
+   "metadata": {},
+   "outputs": [
+    {
+     "name": "stdout",
+     "output_type": "stream",
+     "text": [
+      "title                  |content           |create_at \n",
+      "-----------------------|------------------|----------\n",
+      "URL Schema 的 1000 种使用方式|如何使用 URL Schema...|2022-09-06\n",
+      "Python 基础快速入门          |快速入门 Python...    |2022-09-06\n",
+      "使用 Tablib 来完成数据表格操作    |有关 Tablib 的使用技巧...|2022-10-01\n",
+      "使用 Django 从零打造一个博客系统   |Django 基础...      |2022-09-30\n"
+     ]
+    }
+   ],
+   "source": [
+    "del blogs[\"id\"]\n",
+    "print(blogs)"
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": 20,
+   "metadata": {},
+   "outputs": [
+    {
+     "name": "stdout",
+     "output_type": "stream",
+     "text": [
+      "title                  |content           |create_at |uid                                 \n",
+      "-----------------------|------------------|----------|------------------------------------\n",
+      "URL Schema 的 1000 种使用方式|如何使用 URL Schema...|2022-09-06|140f7af0-63fc-43b9-847b-666c76075cfb\n",
+      "Python 基础快速入门          |快速入门 Python...    |2022-09-06|5ec020fd-6a10-4c4b-935c-19220f642b92\n",
+      "使用 Tablib 来完成数据表格操作    |有关 Tablib 的使用技巧...|2022-10-01|6c3f75f6-a9f0-490e-9725-de7ec2712323\n",
+      "使用 Django 从零打造一个博客系统   |Django 基础...      |2022-09-30|d5e9c8ac-3d8e-4c98-be5f-d9ba4182cecf\n"
+     ]
+    }
+   ],
+   "source": [
+    "def uid(row):\n",
+    "    \"\"\"Return a new random UUID; `row` is accepted but not used.\"\"\"\n",
+    "    return uuid4()\n",
+    "\n",
+    "blogs.append_col(uid, header=\"uid\")\n",
+    "print(blogs)"
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": 21,
+   "metadata": {},
+   "outputs": [
+    {
+     "name": "stdout",
+     "output_type": "stream",
+     "text": [
+      "title                  |content           |create_at |uid                                 |month\n",
+      "-----------------------|------------------|----------|------------------------------------|-----\n",
+      "URL Schema 的 1000 种使用方式|如何使用 URL Schema...|2022-09-06|140f7af0-63fc-43b9-847b-666c76075cfb|9    \n",
+      "Python 基础快速入门          |快速入门 Python...    |2022-09-06|5ec020fd-6a10-4c4b-935c-19220f642b92|9    \n",
+      "使用 Tablib 来完成数据表格操作    |有关 Tablib 的使用技巧...|2022-10-01|6c3f75f6-a9f0-490e-9725-de7ec2712323|10   \n",
+      "使用 Django 从零打造一个博客系统   |Django 基础...      |2022-09-30|d5e9c8ac-3d8e-4c98-be5f-d9ba4182cecf|9    \n"
+     ]
+    }
+   ],
+   "source": [
+    "from datetime import datetime\n",
+    "\n",
+    "create_at_idx = blogs.headers.index(\"create_at\")  # locate the column by name, not by position\n",
+    "\n",
+    "def month(row):\n",
+    "    \"\"\"Return the month number parsed from the row's `create_at` string (format YYYY-MM-DD).\"\"\"\n",
+    "    return datetime.strptime(row[create_at_idx], \"%Y-%m-%d\").month\n",
+    "\n",
+    "blogs.append_col(month, header=\"month\")\n",
+    "print(blogs)"
+   ]
+  },
+  {
+   "cell_type": "markdown",
+   "metadata": {},
+   "source": [
+    "## 读取数据并转换成 Dataset"
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": 22,
+   "metadata": {},
+   "outputs": [
+    {
+     "name": "stdout",
+     "output_type": "stream",
+     "text": [
+      "id|name  |email             \n",
+      "--|------|------------------\n",
+      "1 |100gle|100gle@example.com\n",
+      "2 |Steve |steve@example.com \n",
+      "3 |Harry |harry@example.com \n"
+     ]
+    }
+   ],
+   "source": [
+    "import tablib\n",
+    "\n",
+    "csv_text = \"\"\"\\\n",
+    "id,name,email\n",
+    "1,100gle,100gle@example.com\n",
+    "2,Steve,steve@example.com\n",
+    "3,Harry,harry@example.com\n",
+    "\"\"\"\n",
+    "# Pass the format explicitly instead of relying on tablib's auto-detection.\n",
+    "data = tablib.Dataset().load(csv_text, format=\"csv\")\n",
+    "print(data)"
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": 23,
+   "metadata": {},
+   "outputs": [
+    {
+     "name": "stdout",
+     "output_type": "stream",
+     "text": [
+      "id|name  |email             \n",
+      "--|------|------------------\n",
+      "1 |100gle|100gle@example.com\n",
+      "2 |Steve |steve@example.com \n",
+      "3 |Harry |harry@example.com \n"
+     ]
+    }
+   ],
+   "source": [
+    "json_text = \"\"\"\\\n",
+    "[\n",
+    "    {\n",
+    "        \"id\": 1,\n",
+    "        \"name\": \"100gle\",\n",
+    "        \"email\": \"100gle@example.com\"\n",
+    "    },\n",
+    "    {\n",
+    "        \"id\": 2,\n",
+    "        \"name\": \"Steve\",\n",
+    "        \"email\": \"steve@example.com\"\n",
+    "    },\n",
+    "    {\n",
+    "        \"id\": 3,\n",
+    "        \"name\": \"Harry\",\n",
+    "        \"email\": \"harry@example.com\"\n",
+    "    }\n",
+    "]\n",
+    "\"\"\"\n",
+    "# Named `json_text` so the stdlib module name `json` is not shadowed in the notebook namespace.\n",
+    "data = tablib.Dataset().load(json_text, format=\"json\")\n",
+    "print(data)"
+   ]
+  },
+  {
+   "cell_type": "markdown",
+   "metadata": {},
+   "source": [
+    "## 将 Dataset 数据导出"
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": 24,
+   "metadata": {},
+   "outputs": [
+    {
+     "data": {
+      "text/plain": [
+       "[OrderedDict([('id', 1), ('name', '100gle'), ('email', '100gle@example.com')]),\n",
+       " OrderedDict([('id', 2), ('name', 'Steve'), ('email', 'steve@example.com')]),\n",
+       " OrderedDict([('id', 3), ('name', 'Harry'), ('email', 'harry@example.com')])]"
+      ]
+     },
+     "execution_count": 24,
+     "metadata": {},
+     "output_type": "execute_result"
+    }
+   ],
+   "source": [
+    "data.dict"
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": 25,
+   "metadata": {},
+   "outputs": [
+    {
+     "data": {
+      "text/plain": [
+       "'[{\"id\": 1, \"name\": \"100gle\", \"email\": \"100gle@example.com\"}, {\"id\": 2, \"name\": \"Steve\", \"email\": \"steve@example.com\"}, {\"id\": 3, \"name\": \"Harry\", \"email\": \"harry@example.com\"}]'"
+      ]
+     },
+     "execution_count": 25,
+     "metadata": {},
+     "output_type": "execute_result"
+    }
+   ],
+   "source": [
+    "data.json"
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": 26,
+   "metadata": {},
+   "outputs": [
+    {
+     "data": {
+      "text/plain": [
+       "'- {email: 100gle@example.com, id: 1, name: 100gle}\\n- {email: steve@example.com, id: 2, name: Steve}\\n- {email: harry@example.com, id: 3, name: Harry}\\n'"
+      ]
+     },
+     "execution_count": 26,
+     "metadata": {},
+     "output_type": "execute_result"
+    }
+   ],
+   "source": [
+    "data.yaml"
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": 27,
+   "metadata": {},
+   "outputs": [
+    {
+     "data": {
+      "text/plain": [
+       "'  id  name    email\\n   1  100gle  100gle@example.com\\n   2  Steve   steve@example.com\\n   3  Harry   harry@example.com'"
+      ]
+     },
+     "execution_count": 27,
+     "metadata": {},
+     "output_type": "execute_result"
+    }
+   ],
+   "source": [
+    "data.cli"
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": 28,
+   "metadata": {},
+   "outputs": [
+    {
+     "name": "stdout",
+     "output_type": "stream",
+     "text": [
+      "+------+--------+--------------------+\n",
+      "|   id | name   | email              |\n",
+      "+======+========+====================+\n",
+      "|    1 | 100gle | 100gle@example.com |\n",
+      "+------+--------+--------------------+\n",
+      "|    2 | Steve  | steve@example.com  |\n",
+      "+------+--------+--------------------+\n",
+      "|    3 | Harry  | harry@example.com  |\n",
+      "+------+--------+--------------------+\n"
+     ]
+    }
+   ],
+   "source": [
+    "print(data.export(\"cli\", tablefmt=\"grid\"))"
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": 29,
+   "metadata": {},
+   "outputs": [
+    {
+     "name": "stdout",
+     "output_type": "stream",
+     "text": [
+      "╒══════╤════════╤════════════════════╕\n",
+      "│   id │ name   │ email              │\n",
+      "╞══════╪════════╪════════════════════╡\n",
+      "│    1 │ 100gle │ 100gle@example.com │\n",
+      "├──────┼────────┼────────────────────┤\n",
+      "│    2 │ Steve  │ steve@example.com  │\n",
+      "├──────┼────────┼────────────────────┤\n",
+      "│    3 │ Harry  │ harry@example.com  │\n",
+      "╘══════╧════════╧════════════════════╛\n"
+     ]
+    }
+   ],
+   "source": [
+    "print(data.export(\"cli\", tablefmt=\"fancy_grid\"))"
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": 30,
+   "metadata": {},
+   "outputs": [
+    {
+     "name": "stdout",
+     "output_type": "stream",
+     "text": [
+      "||id||name||email||\n",
+      "|1|100gle|100gle@example.com|\n",
+      "|2|Steve|steve@example.com|\n",
+      "|3|Harry|harry@example.com|\n"
+     ]
+    }
+   ],
+   "source": [
+    "print(data.export(\"jira\"))"
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": null,
+   "metadata": {},
+   "outputs": [],
+   "source": []
+  }
+ ],
+ "metadata": {
+  "kernelspec": {
+   "display_name": "Python 3.9.0 ('pandas-startup')",
+   "language": "python",
+   "name": "python3"
+  },
+  "language_info": {
+   "codemirror_mode": {
+    "name": "ipython",
+    "version": 3
+   },
+   "file_extension": ".py",
+   "mimetype": "text/x-python",
+   "name": "python",
+   "nbconvert_exporter": "python",
+   "pygments_lexer": "ipython3",
+   "version": "3.9.0"
+  },
+  "orig_nbformat": 4,
+  "vscode": {
+   "interpreter": {
+    "hash": "13977d4cc82dee5f9d9535ceb495bd0ab12a43c33c664e5f0d53c24cf634b67f"
+   }
+  }
+ },
+ "nbformat": 4,
+ "nbformat_minor": 2
+}