tatsy
diff --git a/‎.vscode/settings.json
+3 b/‎.vscode/settings.json
+3
diff --git a/‎_contents/python/logistic-regression-01.md
+6-5 b/‎_contents/python/logistic-regression-01.md
+6-5
diff --git a/‎_contents/python/logistic-regression-02.md
+1-1 b/‎_contents/python/logistic-regression-02.md
+1-1
diff --git a/‎_contents/python/read-binary.md
+2-1 b/‎_contents/python/read-binary.md
+2-1
diff --git a/‎_programs/python/.gitignore
+2-1 b/‎_programs/python/.gitignore
+2-1
diff --git a/‎_programs/python/environment.yaml
+13 b/‎_programs/python/environment.yaml
+13
diff --git a/‎_programs/python/convolution-network.ipynb ‎_programs/python/gan/convolution-network.ipynb b/‎_programs/python/convolution-network.ipynb ‎_programs/python/gan/convolution-network.ipynb
diff --git a/‎_programs/python/logistic/.ipynb_checkpoints/logistic_regression_01-checkpoint.ipynb
+222 b/‎_programs/python/logistic/.ipynb_checkpoints/logistic_regression_01-checkpoint.ipynb
+222
diff --git a/‎_programs/python/download.py ‎_programs/python/logistic/download.py
+29-12 b/‎_programs/python/download.py ‎_programs/python/logistic/download.py
+29-12
@@ -0,0 +1,3 @@
+{
+    "python.pythonPath": "/Users/tatsuya/miniconda3/bin/python"
+}
@@ -18,17 +18,17 @@ $$
 
 $$
 \begin{aligned}
-    \mathbf{y} = \text{sigmoid}(\mathbf{Ax} + \mathbf{b}) \\
-    \mathbf{y} = \text{softmax}(\mathbf{Ax} + \mathbf{b}) \\
+    \mathbf{y} &= \text{sigmoid}(\mathbf{Ax} + \mathbf{b}) \\
+    \mathbf{y} &= \text{softmax}(\mathbf{Ax} + \mathbf{b}) \\
 \end{aligned}
 $$
 
 のようにする。特にsigmoid関数を使うものをロジスティック回帰という(softmaxを使うものも含む場合もある)。なお、sigmoid関数、softmax関数はそれぞれ次のように表される。
 
 $$
 \begin{aligned}
-    \text{sigmoid}(x) = \frac{1}{1 + e^{-x}} \\
-    \text{softmax}(\mathbf{x})_i = \frac{e^{x_i}}{\sum_{k=1}^d e^{x_k}}
+    \text{sigmoid}(x) &= \frac{1}{1 + e^{-x}} \\
+    \text{softmax}(\mathbf{x})_i &= \frac{e^{x_i}}{\sum_{k=1}^d e^{x_k}}
 \end{aligned}
 $$ 
 
@@ -55,7 +55,8 @@ X = X.astype('float32')
 
 ```python
 from sklearn.linear_model import LogisticRegression
-clf = LogisticRegression(random_state=0, multi_class='multinomial', max_iter=20).fit(X, y)
+clf = LogisticRegression(random_state=0, multi_class='multinomial', max_iter=20)
+clf.fit(X, y)
 ```
 
 少し時間がかかるが、しばらくすると学習が終わる。なお上記のコード内での `y` は整数型のラベルを格納したNumPyの配列で良い(分かりやすくするために名前を変更した)。
 
@@ -132,7 +132,7 @@ dLdb = np.dot(dLdt, dtdb)
 
 ### 確率的勾配法
 
-ただ、残念なことにMNISTの場合でいえば60000もある学習データ全てに対しての平均を計算することは、計算効率があまり良くない。今回は数字が10種類しかないので、おそらく60000万個を一度に考えなくても、それなりの数のデータをサンプルして勾配を計算すれば全体の平均で計算した勾配と似たものが得られそうだ。
+ただ、残念なことにMNISTの場合でいえば60000もある学習データ全てに対しての平均を計算することは、計算効率があまり良くない。今回は数字が10種類しかないので、おそらく60000個を一度に考えなくても、それなりの数のデータをサンプルして勾配を計算すれば全体の平均で計算した勾配と似たものが得られそうだ。
 
 このような確率的なサンプリングにより選んだデータから勾配を計算する方法を確率的勾配法と呼ぶ。特に最急降下法の勾配を、サンプルしたデータから計算する方法を**確率的最急降下法** (SGD = stochastic gradient descent) と呼ぶ。今回のMNISTのケースで言えば、だいたい30-50くらいのサンプルを取って勾配を計算すれば、十分にうまく収束する。
 
 
@@ -66,9 +66,10 @@ pixels = np.asarray(pixels, dtype='uint8')
 pixels = pixels.reshape((height, width))
 ```
 
-試しに表示してみる。
+次に**Matplotlib**を使って、この画像を表示してみる。
 
 ```python
+import matplotlib.pyplot as plt
 plt.imshow(pixels)
 plt.show()
 ```
 
@@ -1,4 +1,5 @@
 .ipynb_checkpoints/*
-mnist/*
+*/mnist/*
+*/kmnist/*
 
 .DS_Store
@@ -0,0 +1,13 @@
+name: beginners
+channels:
+  - conda-forge
+dependencies:
+  - python>=3
+  - numpy
+  - scipy
+  - opencv
+  - requests
+  - matplotlib
+  - scikit-learn
+  - scikit-image
+  - conda-forge::jupyterlab
@@ -0,0 +1,222 @@
+{
+ "cells": [
+  {
+   "cell_type": "markdown",
+   "metadata": {},
+   "source": [
+    "# ロジスティック回帰 -その1-"
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": 1,
+   "metadata": {},
+   "outputs": [],
+   "source": [
+    "import os\n",
+    "import struct\n",
+    "import numpy as np\n",
+    "import matplotlib.pyplot as plt\n",
+    "from sklearn.linear_model import LogisticRegression"
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": 2,
+   "metadata": {},
+   "outputs": [],
+   "source": [
+    "# MNISTのファイル (あらかじめダウンロードしておく)\n",
+    "train_image_file = 'mnist/train-images-idx3-ubyte'\n",
+    "train_label_file = 'mnist/train-labels-idx1-ubyte'\n",
+    "test_image_file = 'mnist/t10k-images-idx3-ubyte'\n",
+    "test_label_file = 'mnist/t10k-labels-idx1-ubyte'"
+   ]
+  },
+  {
+   "cell_type": "markdown",
+   "metadata": {},
+   "source": [
+    "## データの読み込み"
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": 3,
+   "metadata": {},
+   "outputs": [],
+   "source": [
+    "def load_images(filename):\n",
+    "    \"\"\"Load MNIST images from an IDX image file.\n",
+    "\n",
+    "    Returns a float32 array of shape (n_images, height, width, 1)\n",
+    "    with pixel values scaled to [0, 1].\n",
+    "\n",
+    "    Raises RuntimeError when the magic number is not 2051 or when the\n",
+    "    file holds fewer pixel bytes than its header announces.\n",
+    "    \"\"\"\n",
+    "\n",
+    "    # The context manager closes the file even when a check below raises.\n",
+    "    with open(filename, 'rb') as fp:\n",
+    "        # Magic number (big-endian int32)\n",
+    "        magic = struct.unpack('>i', fp.read(4))[0]\n",
+    "        if magic != 2051:\n",
+    "            raise RuntimeError('Invalid MNIST file!')\n",
+    "\n",
+    "        # Image count and per-image size (three big-endian int32 values)\n",
+    "        n_images, height, width = struct.unpack('>iii', fp.read(4 * 3))\n",
+    "\n",
+    "        # Raw pixel bytes, one unsigned byte per pixel\n",
+    "        total_pixels = n_images * height * width\n",
+    "        data = fp.read(total_pixels)\n",
+    "\n",
+    "    if len(data) != total_pixels:\n",
+    "        raise RuntimeError('Invalid MNIST file!')\n",
+    "\n",
+    "    # View the bytes as uint8 directly instead of unpacking one Python int per pixel.\n",
+    "    images = np.frombuffer(data, dtype='uint8')\n",
+    "    images = images.reshape((n_images, height, width, 1))\n",
+    "\n",
+    "    # Rescale to [0, 1]; astype copies, so the result is a fresh writable array.\n",
+    "    return images.astype('float32') / 255.0"
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": 4,
+   "metadata": {},
+   "outputs": [],
+   "source": [
+    "def load_labels(filename):\n",
+    "    \"\"\"Load MNIST labels from an IDX label file.\n",
+    "\n",
+    "    Returns a one-dimensional int32 array with one entry per label.\n",
+    "\n",
+    "    Raises RuntimeError when the magic number is not 2049.\n",
+    "    \"\"\"\n",
+    "\n",
+    "    # The context manager closes the file even when the magic check raises.\n",
+    "    with open(filename, 'rb') as fp:\n",
+    "        # Magic number (big-endian int32)\n",
+    "        magic = struct.unpack('>i', fp.read(4))[0]\n",
+    "        if magic != 2049:\n",
+    "            raise RuntimeError('Invalid MNIST file!')\n",
+    "\n",
+    "        # Number of labels (big-endian int32)\n",
+    "        n_labels = struct.unpack('>i', fp.read(4))[0]\n",
+    "\n",
+    "        # One unsigned byte per label; unpack fails if the file is truncated.\n",
+    "        labels = struct.unpack('>' + 'B' * n_labels, fp.read(n_labels))\n",
+    "\n",
+    "    return np.asarray(labels, dtype='int32')"
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": 5,
+   "metadata": {},
+   "outputs": [],
+   "source": [
+    "def to_onehot(labels, n_classes=10):\n",
+    "    \"\"\"Convert integer labels to one-hot rows.\n",
+    "\n",
+    "    labels: integer array of class indices in [0, n_classes).\n",
+    "    n_classes: number of classes; defaults to 10, the original fixed value.\n",
+    "\n",
+    "    Returns a float array of shape labels.shape + (n_classes,).\n",
+    "    \"\"\"\n",
+    "    # Indexing the identity matrix by label picks the matching unit row.\n",
+    "    return np.identity(n_classes)[labels]"
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": 6,
+   "metadata": {},
+   "outputs": [],
+   "source": [
+    "images = load_images(train_image_file)\n",
+    "labels = load_labels(train_label_file)\n",
+    "onehot = to_onehot(labels)"
+   ]
+  },
+  {
+   "cell_type": "markdown",
+   "metadata": {},
+   "source": [
+    "## scikit-learnによるロジスティック回帰"
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": 7,
+   "metadata": {},
+   "outputs": [
+    {
+     "name": "stderr",
+     "output_type": "stream",
+     "text": [
+      "/Users/tatsuya/miniconda3/envs/beginners/lib/python3.9/site-packages/sklearn/linear_model/_logistic.py:763: ConvergenceWarning: lbfgs failed to converge (status=1):\n",
+      "STOP: TOTAL NO. of ITERATIONS REACHED LIMIT.\n",
+      "\n",
+      "Increase the number of iterations (max_iter) or scale the data as shown in:\n",
+      "    https://scikit-learn.org/stable/modules/preprocessing.html\n",
+      "Please also refer to the documentation for alternative solver options:\n",
+      "    https://scikit-learn.org/stable/modules/linear_model.html#logistic-regression\n",
+      "  n_iter_i = _check_optimize_result(\n"
+     ]
+    },
+    {
+     "data": {
+      "text/plain": [
+       "LogisticRegression(max_iter=20, multi_class='multinomial', random_state=0)"
+      ]
+     },
+     "execution_count": 7,
+     "metadata": {},
+     "output_type": "execute_result"
+    }
+   ],
+   "source": [
+    "n = len(images)\n",
+    "X = images.reshape((n, -1))\n",
+    "y = labels.reshape((n))\n",
+    "clf = LogisticRegression(random_state=0, multi_class='multinomial', max_iter=20)\n",
+    "clf.fit(X, y)"
+   ]
+  },
+  {
+   "cell_type": "markdown",
+   "metadata": {},
+   "source": [
+    "## テストデータを用いた精度計算"
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": 8,
+   "metadata": {},
+   "outputs": [
+    {
+     "name": "stdout",
+     "output_type": "stream",
+     "text": [
+      "Accuracy: 0.9130\n"
+     ]
+    }
+   ],
+   "source": [
+    "test_images = load_images(test_image_file)\n",
+    "test_labels = load_labels(test_label_file)\n",
+    "# Flatten each image to one feature row; take the row count from the data rather than hard-coding 10000.\n",
+    "pred_labels = clf.predict(test_images.reshape(len(test_images), -1))\n",
+    "# Fraction of test samples whose predicted label equals the true label.\n",
+    "acc = (pred_labels == test_labels).mean()\n",
+    "print('Accuracy: {:.4f}'.format(acc))"
+   ]
+  }
+ ],
+ "metadata": {
+  "kernelspec": {
+   "display_name": "Python 3",
+   "language": "python",
+   "name": "python3"
+  },
+  "language_info": {
+   "codemirror_mode": {
+    "name": "ipython",
+    "version": 3
+   },
+   "file_extension": ".py",
+   "mimetype": "text/x-python",
+   "name": "python",
+   "nbconvert_exporter": "python",
+   "pygments_lexer": "ipython3",
+   "version": "3.9.1"
+  }
+ },
+ "nbformat": 4,
+ "nbformat_minor": 4
+}
@@ -1,26 +1,19 @@
-import gzip
 import os
 import sys
+import gzip
 
 import requests
 
-url = 'http://yann.lecun.com/exdb/mnist/'
-x_train_file = 'train-images-idx3-ubyte.gz'
-y_train_file = 'train-labels-idx1-ubyte.gz'
-x_test_file = 't10k-images-idx3-ubyte.gz'
-y_test_file = 't10k-labels-idx1-ubyte.gz'
-
 curdir = os.path.abspath(os.path.dirname(__file__))
-outdir = os.path.join(curdir, 'mnist')
 
 CHUNK_SIZE = 32768
 
 
-def main():
+def download(name, url, files):
+    outdir = os.path.join(curdir, name)
     if not os.path.exists(outdir):
         os.makedirs(outdir)
 
-    files = [x_train_file, y_train_file, x_test_file, y_test_file]
     for f in files:
         # Download files
         session = requests.Session()
@@ -44,11 +37,35 @@ def main():
 
         # Unzip
         unzip_file = os.path.splitext(local_file)[0]
-        with open(unzip_file, 'wb') as fout, gzip.open(local_file,
-                                                       'rb') as fin:
+        with open(unzip_file, 'wb') as fout, gzip.open(local_file, 'rb') as fin:
             data = fin.read()
             fout.write(data)
 
+        os.remove(local_file)
+
+
+def main():
+    """Ask which dataset to fetch and download its four archive files.
+
+    The menu is printed and the prompt repeated until the user enters a
+    number that selects one of the listed datasets; non-numeric or
+    out-of-range answers re-prompt instead of crashing.
+    """
+    urls = [
+        ('mnist', 'http://yann.lecun.com/exdb/mnist/'),
+        ('kmnist', 'http://codh.rois.ac.jp/kmnist/dataset/kmnist/'),
+    ]
+
+    # Menu numbers are 1-based, so 0 means "no valid choice yet".
+    target = 0
+    while not 1 <= target <= len(urls):
+        for i, (name, url) in enumerate(urls):
+            print('[%d] %s: %s' % (i + 1, name, url))
+        try:
+            target = int(input('Choose dataset to download: '))
+        except ValueError:
+            # Not a number: reset and show the menu again.
+            target = 0
+
+    name, url = urls[target - 1]
+    # Both datasets publish their files under the same four names.
+    files = [
+        'train-images-idx3-ubyte.gz',
+        'train-labels-idx1-ubyte.gz',
+        't10k-images-idx3-ubyte.gz',
+        't10k-labels-idx1-ubyte.gz',
+    ]
+    download(name, url, files)
+
 
 if __name__ == '__main__':
     main()
Original file line number	Diff line number	Diff line change
`@@ -0,0 +1,3 @@`
	`1`	`+{`
	`2`	`+ "python.pythonPath": "/Users/tatsuya/miniconda3/bin/python"`
	`3`	`+}`