diff --git a/Workshop_notebooks/Day1_notebook/logistic_regression.ipynb b/Workshop_notebooks/Day1_notebook/logistic_regression.ipynb new file mode 100644 index 0000000..cfb9783 --- /dev/null +++ b/Workshop_notebooks/Day1_notebook/logistic_regression.ipynb @@ -0,0 +1,197 @@ +{ + "cells": [ + { + "cell_type": "code", + "execution_count": 134, + "metadata": { + "collapsed": true + }, + "outputs": [], + "source": [ + "import numpy as np\n", + "from sklearn.linear_model import LogisticRegression\n", + "from sklearn.model_selection import train_test_split" + ] + }, + { + "cell_type": "code", + "execution_count": 135, + "metadata": {}, + "outputs": [], + "source": [ + "from GetData.read_data import get_stock_data\n", + "from datetime import datetime" + ] + }, + { + "cell_type": "code", + "execution_count": 136, + "metadata": {}, + "outputs": [], + "source": [ + "Amazon = get_stock_data(name = 'AMZN', start = datetime(2017, 1, 1), end=datetime(2019, 1, 1))" + ] + }, + { + "cell_type": "code", + "execution_count": 178, + "metadata": {}, + "outputs": [], + "source": [ + "# Binary label: 1 where Close is above its mean over the whole series, else 0.\n", + "y = 1 * ((Amazon.Close - np.mean(Amazon.Close))>0)" + ] + }, + { + "cell_type": "code", + "execution_count": 179, + "metadata": {}, + "outputs": [], + "source": [ + "" + ] + }, + { + "cell_type": "code", + "execution_count": 179, + "metadata": {}, + "outputs": [], + "source": [ + "# NOTE: y is a threshold of Close and Close is the only feature, so near-perfect accuracy is expected by construction.\n", + "[train_data_x, test_data_x, train_data_y, test_data_y] = train_test_split(Amazon.Close, y, test_size=0.3, random_state=5)" + ] + }, + { + "cell_type": "code", + "execution_count": 180, + "metadata": {}, + "outputs": [], + "source": [ + "LG = LogisticRegression(solver='lbfgs')" + ] + }, + { + "cell_type": "code", + "execution_count": 181, + "metadata": {}, + "outputs": [ + { + "name": "stdout", + "output_type": "stream", + "text": [ + "LogisticRegression(C=1.0, class_weight=None, dual=False, fit_intercept=True,\n intercept_scaling=1, max_iter=100, multi_class='warn',\n n_jobs=None, penalty='l2', random_state=None, solver='lbfgs',\n tol=0.0001, verbose=0, 
 warm_start=False)\n" + ] + } + ], + "source": [ + "# scikit-learn estimators take a 2-D (n_samples, n_features) X, hence reshape(-1, 1) on the single feature.\n", + "train_x = np.asarray(train_data_x).reshape(-1, 1)\n", + "test_x = np.asarray(test_data_x).reshape(-1, 1)\n", + "train_y = np.asarray(train_data_y)\n", + "test_y = np.asarray(test_data_y)\n", + "estimator = LG.fit(train_x, train_y)\n", + "print(estimator)" + ] + }, + { + "cell_type": "code", + "execution_count": 192, + "metadata": {}, + "outputs": [ + { + "name": "stdout", + "output_type": "stream", + "text": [ + "[0 1 0 0 0 0 0 0 0 0 0 0 0 1 0 1 0 0 1 0 0 1 0 0 1 0 0 1 0 0 1 0 0 0 1 1 1\n 1 1 0 0 0 1 1 0 0 0 1 0 0 0 1 0 1 1 1 0 1 1 0 1 1 1 1 0 1 0 0 1 0 0 1 1 0\n 0 0 0 0 0 0 0 0 0 1 0 1 0 1 0 0 0 0 0]\n" + ] + } + ], + "source": [ + "y_hat = estimator.predict(test_x)\n", + "print(y_hat)" + ] + }, + { + "cell_type": "code", + "execution_count": 193, + "metadata": {}, + "outputs": [ + { + "data": { + "text/plain": [ + "100.0" + ] + }, + "execution_count": 193, + "metadata": {}, + "output_type": "execute_result" + } + ], + "source": [ + "accuracy = np.mean(test_y == y_hat) * 100\n", + "accuracy" + ] + }, + { + "cell_type": "code", + "execution_count": 197, + "metadata": { + "collapsed": true + }, + "outputs": [ + { + "data": { + "text/plain": [ + "[]" + ] + }, + "execution_count": 197, + "metadata": {}, + "output_type": "execute_result" + }, + { + "data": { + "image/png": "\n", + "text/plain": [ + "
" + ] + }, + "metadata": {}, + "output_type": "display_data" + } + ], + "source": [ + "import matplotlib.pyplot as plt\n", + "plt.plot(range(0, len(y_hat)), y_hat)" + ] + }, + { + "cell_type": "code", + "execution_count": null, + "metadata": {}, + "outputs": [], + "source": [] + } + ], + "metadata": { + "kernelspec": { + "display_name": "Python 2", + "language": "python", + "name": "python2" + }, + "language_info": { + "codemirror_mode": { + "name": "ipython", + "version": 2 + }, + "file_extension": ".py", + "mimetype": "text/x-python", + "name": "python", + "nbconvert_exporter": "python", + "pygments_lexer": "ipython2", + "version": "2.7.6" + } + }, + "nbformat": 4, + "nbformat_minor": 0 +}