Commit 347b8a4

sayankotor authored and simflin committed
seminar03
1 parent 123b524 commit 347b8a4

10 files changed: +1554 −0 lines changed
week03_convnets/README.md

Lines changed: 19 additions & 0 deletions
__Note__: Seminars assume that you remember batch normalization and dropout from the last lecture. If you don't, go recap week2.


## Materials
- [russian] Convolutional networks - [video](https://yadi.sk/i/hDIkaR4H3EtnXM)
- [english] Convolutional networks (Karpathy) - [video](https://www.youtube.com/watch?v=AQirPKrAyDg)

- Reading
  - http://cs231n.github.io/convolutional-networks/
  - http://cs231n.github.io/understanding-cnn/
  - [a deep learning neophyte cheat sheet](http://www.kdnuggets.com/2016/03/must-know-tips-deep-learning-part-1.html)
  - [more material on vision](https://bavm2013.splashthat.com/img/events/46439/assets/34a7.ranzato.pdf)
  - a [CNN trainer in a browser](https://cs.stanford.edu/people/karpathy/convnetjs/demo/cifar10.html)


## Assignment

As usual, go to seminar_pytorch.ipynb and follow the instructions from there.

There's also ./other_frameworks if you're more into theano/tf.
Lines changed: 156 additions & 0 deletions

The added file is a Jupyter notebook; its cells are rendered below.

**Cell 1 (code):**

```python
import torch, torch.nn as nn
import torch.nn.functional as F
from torch.autograd import Variable

# a special module that converts [batch, channel, w, h] to [batch, units]
class Flatten(nn.Module):
    def forward(self, input):
        return input.view(input.size(0), -1)
```

**Cell 2 (code):**

```python
# assuming input shape [batch, 3, 64, 64]
cnn = nn.Sequential(
    nn.Conv2d(in_channels=3, out_channels=2048, kernel_size=(3, 3)),
    nn.Conv2d(in_channels=2048, out_channels=1024, kernel_size=(3, 3)),
    nn.Conv2d(in_channels=1024, out_channels=512, kernel_size=(3, 3)),
    nn.ReLU(),
    nn.MaxPool2d((6, 6)),
    nn.Conv2d(in_channels=6, out_channels=32, kernel_size=(20, 20)),
    nn.Conv2d(in_channels=32, out_channels=64, kernel_size=(20, 20)),
    nn.Conv2d(in_channels=64, out_channels=128, kernel_size=(20, 20)),
    nn.Softmax(),
    Flatten(),
    nn.Linear(64, 256),
    nn.Softmax(),
    nn.Linear(256, 10),
    nn.Sigmoid(),
    nn.Dropout(0.5)
)
```

**Cell 3 (markdown):** a long run of empty code fences (presumably spoiler space before the answers), followed by:

# Book of grudges
* Input channels are wrong literally half the time (after pooling, after flatten).
* Too many filters for the first 3x3 convolution: it produces an enormous matrix while there just aren't enough relevant combinations of 3x3 patches (overkill).
* Usually, the further you go, the more filters you need.
* Large filters (e.g. 10x10) are generally bad practice, and you definitely need more than 10 of them.
* The second 10x10 convolution gets an 8x6x6 image as input, so it's technically unable to perform such a convolution.
* A softmax nonlinearity effectively makes only one or a few neurons of the entire layer "fire", rendering a 512-neuron layer almost useless. Softmax at the output layer is okay, though.
* Dropout after probability prediction is just lame: a few random classes get probability 0, so your probabilities no longer sum to 1 and cross-entropy goes to -inf.

The last cell is empty; the notebook metadata declares a Python 3 kernel (nbformat 4).
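The grudges above translate into a few concrete rules: grow the filter count with depth, put nonlinearities between convolutions, keep softmax out of hidden layers, and apply dropout before the classifier rather than after the probabilities. As a sketch only (this is not the seminar's official solution; all layer sizes here are illustrative choices), a repaired architecture for the same `[batch, 3, 64, 64]` input might look like:

```python
import torch, torch.nn as nn

class Flatten(nn.Module):
    def forward(self, x):
        return x.view(x.size(0), -1)

# hypothetical fix: few filters early, more later; ReLU between convs;
# no softmax/sigmoid in hidden layers; dropout BEFORE the final linear
# layer, and raw logits (no activation) at the output.
cnn = nn.Sequential(
    nn.Conv2d(3, 32, kernel_size=3, padding=1),   # -> [batch, 32, 64, 64]
    nn.ReLU(),
    nn.MaxPool2d(2),                              # -> [batch, 32, 32, 32]
    nn.Conv2d(32, 64, kernel_size=3, padding=1),  # -> [batch, 64, 32, 32]
    nn.ReLU(),
    nn.MaxPool2d(2),                              # -> [batch, 64, 16, 16]
    Flatten(),                                    # -> [batch, 64 * 16 * 16]
    nn.Dropout(0.5),
    nn.Linear(64 * 16 * 16, 10),                  # logits for 10 classes
)

x = torch.randn(4, 3, 64, 64)
logits = cnn(x)
print(logits.shape)  # torch.Size([4, 10])
```

Note how every `in_channels` matches the previous layer's output and the `Linear` input size is the actual flattened feature count, which fixes the shape grudges directly.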

week03_convnets/load_images.py

Whitespace-only changes.
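The last grudge in the notebook above (dropout applied after probability predictions) can be demonstrated in a few lines. With `p=0.5`, `nn.Dropout` zeroes roughly half the entries and scales the survivors by `1/(1-p) = 2`, so a valid probability vector stops summing to 1:

```python
import torch, torch.nn as nn

torch.manual_seed(0)
probs = torch.softmax(torch.randn(1, 10), dim=-1)  # a valid distribution
drop = nn.Dropout(0.5)
drop.train()                                       # dropout is active in train mode

dropped = drop(probs)  # zeros some entries, scales the rest by 2

print(float(probs.sum()))    # ≈ 1.0
print(float(dropped.sum()))  # almost surely not 1.0 anymore
# any class whose probability was zeroed now makes log(p) = -inf,
# which is exactly how cross-entropy blows up.
```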

0 commit comments