You can not select more than 25 topics Topics must start with a chinese character,a letter or number, can include dashes ('-') and can be up to 35 characters long.

02-LeNet5.ipynb 5.1 kB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157
  1. {
  2. "cells": [
  3. {
  4. "cell_type": "markdown",
  5. "metadata": {},
  6. "source": [
  7. "# LeNet5\n",
  8. "\n",
  9. "LeNet 诞生于 1994 年,是最早的卷积神经网络之一,并且推动了深度学习领域的发展。自从 1988 年开始,在多次迭代后这个开拓性成果被命名为 LeNet5。LeNet5 的架构的提出是基于如下的观点:图像的特征分布在整张图像上,通过带有可学习参数的卷积,从而有效的减少了参数数量,能够在多个位置上提取相似特征。\n",
  10. "\n",
  11. "在LeNet5提出的时候,没有 GPU 帮助训练,甚至 CPU 的速度也很慢,因此,LeNet5的规模并不大。其包含七个处理层,每一层都包含可训练参数(权重),当时使用的输入数据是 $32 \\times 32$ 像素的图像。LeNet-5 这个网络虽然很小,但是它包含了深度学习的基本模块:卷积层,池化层,全连接层。它是其他深度学习模型的基础,这里对LeNet5进行深入分析和讲解,通过实例分析,加深对与卷积层和池化层的理解。"
  12. ]
  13. },
  14. {
  15. "cell_type": "code",
  16. "execution_count": 1,
  17. "metadata": {
  18. "collapsed": true
  19. },
  20. "outputs": [],
  21. "source": [
  22. "import sys\n",
  23. "sys.path.append('..')\n",
  24. "\n",
  25. "import numpy as np\n",
  26. "import torch\n",
  27. "from torch import nn\n",
  28. "from torch.autograd import Variable\n",
  29. "from torchvision.datasets import CIFAR10\n",
  30. "from torchvision import transforms as tfs"
  31. ]
  32. },
  33. {
  34. "cell_type": "code",
  35. "execution_count": 1,
  36. "metadata": {
  37. "collapsed": true
  38. },
  39. "outputs": [],
  40. "source": [
  41. "import torch\n",
  42. "from torch import nn\n",
  43. "\n",
  44. "lenet5 = nn.Sequential(\n",
  45. " nn.Conv2d(1, 6, kernel_size=5, padding=2), nn.Sigmoid(),\n",
  46. " nn.AvgPool2d(kernel_size=2, stride=2),\n",
  47. " nn.Conv2d(6, 16, kernel_size=5), nn.Sigmoid(),\n",
  48. " nn.AvgPool2d(kernel_size=2, stride=2),\n",
  49. " nn.Flatten(),\n",
  50. " nn.Linear(16 * 5 * 5, 120), nn.Sigmoid(),\n",
  51. " nn.Linear(120, 84), nn.Sigmoid(),\n",
  52. " nn.Linear(84, 10) )"
  53. ]
  54. },
  55. {
  56. "cell_type": "code",
  57. "execution_count": null,
  58. "metadata": {
  59. "collapsed": true
  60. },
  61. "outputs": [],
  62. "source": [
  63. "from utils import train\n",
  64. "\n",
  65. "# 使用数据增强\n",
  66. "def train_tf(x):\n",
  67. " im_aug = tfs.Compose([\n",
  68. " tfs.Resize(224),\n",
  69. " tfs.ToTensor(),\n",
  70. " tfs.Normalize([0.5, 0.5, 0.5], [0.5, 0.5, 0.5])\n",
  71. " ])\n",
  72. " x = im_aug(x)\n",
  73. " return x\n",
  74. "\n",
  75. "def test_tf(x):\n",
  76. " im_aug = tfs.Compose([\n",
  77. " tfs.Resize(224),\n",
  78. " tfs.ToTensor(),\n",
  79. " tfs.Normalize([0.5, 0.5, 0.5], [0.5, 0.5, 0.5])\n",
  80. " ])\n",
  81. " x = im_aug(x)\n",
  82. " return x\n",
  83. " \n",
  84. "train_set = CIFAR10('../../data', train=True, transform=train_tf)\n",
  85. "train_data = torch.utils.data.DataLoader(train_set, batch_size=64, shuffle=True)\n",
  86. "test_set = CIFAR10('../../data', train=False, transform=test_tf)\n",
  87. "test_data = torch.utils.data.DataLoader(test_set, batch_size=128, shuffle=False)\n",
  88. "\n",
  89. "net = lenet5\n",
  90. "optimizer = torch.optim.SGD(net.parameters(), lr=1e-1)\n",
  91. "criterion = nn.CrossEntropyLoss()"
  92. ]
  93. },
  94. {
  95. "cell_type": "code",
  96. "execution_count": null,
  97. "metadata": {
  98. "collapsed": true
  99. },
  100. "outputs": [],
  101. "source": [
  102. "(l_train_loss, l_train_acc, l_valid_loss, l_valid_acc) = train(net, \n",
  103. " train_data, test_data, \n",
  104. " 20, \n",
  105. " optimizer, criterion,\n",
  106. " use_cuda=False)"
  107. ]
  108. },
  109. {
  110. "cell_type": "code",
  111. "execution_count": null,
  112. "metadata": {
  113. "collapsed": true
  114. },
  115. "outputs": [],
  116. "source": [
  117. "import matplotlib.pyplot as plt\n",
  118. "%matplotlib inline\n",
  119. "\n",
  120. "plt.plot(l_train_loss, label='train')\n",
  121. "plt.plot(l_valid_loss, label='valid')\n",
  122. "plt.xlabel('epoch')\n",
  123. "plt.legend(loc='best')\n",
  124. "plt.savefig('fig-res-lenet5-train-validate-loss.pdf')\n",
  125. "plt.show()\n",
  126. "\n",
  127. "plt.plot(l_train_acc, label='train')\n",
  128. "plt.plot(l_valid_acc, label='valid')\n",
  129. "plt.xlabel('epoch')\n",
  130. "plt.legend(loc='best')\n",
  131. "plt.savefig('fig-res-lenet5-train-validate-acc.pdf')\n",
  132. "plt.show()"
  133. ]
  134. }
  135. ],
  136. "metadata": {
  137. "kernelspec": {
  138. "display_name": "Python 3",
  139. "language": "python",
  140. "name": "python3"
  141. },
  142. "language_info": {
  143. "codemirror_mode": {
  144. "name": "ipython",
  145. "version": 3
  146. },
  147. "file_extension": ".py",
  148. "mimetype": "text/x-python",
  149. "name": "python",
  150. "nbconvert_exporter": "python",
  151. "pygments_lexer": "ipython3",
  152. "version": "3.5.4"
  153. }
  154. },
  155. "nbformat": 4,
  156. "nbformat_minor": 2
  157. }

机器学习越来越多应用到飞行器、机器人等领域,其目的是利用计算机实现类似人类的智能,从而实现装备的智能化与无人化。本课程旨在引导学生掌握机器学习的基本知识、典型方法与技术,通过具体的应用案例激发学生对该学科的兴趣,鼓励学生能够从人工智能的角度来分析、解决飞行器、机器人所面临的问题和挑战。本课程主要内容包括Python编程基础,机器学习模型,无监督学习、监督学习、深度学习基础知识与实现,并学习如何利用机器学习解决实际问题,从而全面提升自我的《综合能力》。