diff --git a/2-Regression/1-Tools/notebook.ipynb b/2-Regression/1-Tools/notebook.ipynb index 5dfc6f31..9388433f 100644 --- a/2-Regression/1-Tools/notebook.ipynb +++ b/2-Regression/1-Tools/notebook.ipynb @@ -33,7 +33,7 @@ }, { "cell_type": "code", - "execution_count": 1, + "execution_count": 238, "metadata": {}, "outputs": [ { @@ -50,7 +50,7 @@ }, { "cell_type": "code", - "execution_count": 27, + "execution_count": 239, "metadata": {}, "outputs": [], "source": [ @@ -61,7 +61,7 @@ }, { "cell_type": "code", - "execution_count": 28, + "execution_count": 240, "metadata": {}, "outputs": [ { @@ -90,11 +90,136 @@ }, { "cell_type": "code", - "execution_count": 30, + "execution_count": 241, "metadata": {}, "outputs": [], "source": [ - "X = X[:, np.newaxis, 2]" + "# print(X.shape) -> 442*10 feature\n", + "X = X[:, np.newaxis, 9]\n", + "# print(X.shape) -> 442*1 feature\n" + ] + }, + { + "source": [ + "Split both the features (X) and the targets (y) into a training set and a test set" + ], + "cell_type": "markdown", + "metadata": {} + }, + { + "cell_type": "code", + "execution_count": 242, + "metadata": {}, + "outputs": [], + "source": [ + "X_train, X_test, y_train, y_test = model_selection.train_test_split(X, y, test_size=0.33)\n", + "# print(X_test.shape)\n", + "# print(y_test.shape)\n", + "# print(y_train.shape)\n", + "# print(X_train.shape)" + ] + }, + { + "source": [ + "Creation of a Linear model (using linear regression) from the training subsets" + ], + "cell_type": "markdown", + "metadata": {} + }, + { + "cell_type": "code", + "execution_count": 243, + "metadata": {}, + "outputs": [ + { + "output_type": "execute_result", + "data": { + "text/plain": [ + "LinearRegression()" + ] + }, + "metadata": {}, + "execution_count": 243 + } + ], + "source": [ + " model = linear_model.LinearRegression()\n", + " model.fit(X_train, y_train)" + ] + }, + { + "source": [ + "Making predictions" + ], + "cell_type": "markdown", + "metadata": {} + }, + { + "cell_type": "code", +
"execution_count": 244, + "metadata": {}, + "outputs": [], + "source": [ + "y_pred = model.predict(X_test)" + ] + }, + { + "source": [ + "Making a graphic represenntation with the actual testing data and the linear estimations(can be represented by a line)." + ], + "cell_type": "markdown", + "metadata": {} + }, + { + "cell_type": "code", + "execution_count": 245, + "metadata": {}, + "outputs": [ + { + "output_type": "display_data", + "data": { + "text/plain": "
", + "image/svg+xml": "\r\n\r\n\r\n \r\n \r\n \r\n \r\n 2021-07-19T02:34:28.560224\r\n image/svg+xml\r\n \r\n \r\n Matplotlib v3.4.1, https://matplotlib.org/\r\n \r\n \r\n \r\n \r\n \r\n \r\n \r\n \r\n \r\n \r\n \r\n \r\n \r\n \r\n \r\n \r\n \r\n \r\n \r\n \r\n \r\n \r\n \r\n \r\n \r\n \r\n \r\n \r\n \r\n \r\n \r\n \r\n \r\n \r\n \r\n \r\n \r\n \r\n \r\n \r\n \r\n \r\n \r\n \r\n \r\n \r\n \r\n \r\n \r\n \r\n \r\n \r\n \r\n \r\n \r\n \r\n \r\n \r\n \r\n \r\n \r\n \r\n \r\n \r\n \r\n \r\n \r\n \r\n \r\n \r\n \r\n \r\n \r\n \r\n \r\n \r\n \r\n \r\n \r\n \r\n \r\n \r\n \r\n \r\n \r\n \r\n \r\n \r\n \r\n \r\n \r\n \r\n \r\n \r\n \r\n \r\n \r\n \r\n \r\n \r\n \r\n \r\n \r\n \r\n \r\n \r\n \r\n \r\n \r\n \r\n \r\n \r\n \r\n \r\n \r\n \r\n \r\n \r\n \r\n \r\n \r\n \r\n \r\n \r\n \r\n \r\n \r\n \r\n \r\n \r\n \r\n \r\n \r\n \r\n \r\n \r\n \r\n \r\n \r\n \r\n \r\n \r\n \r\n \r\n \r\n \r\n \r\n \r\n \r\n \r\n \r\n \r\n \r\n \r\n \r\n \r\n \r\n \r\n \r\n \r\n \r\n \r\n \r\n \r\n \r\n \r\n \r\n \r\n \r\n \r\n \r\n \r\n \r\n \r\n \r\n \r\n \r\n \r\n \r\n \r\n \r\n \r\n \r\n \r\n \r\n \r\n \r\n \r\n \r\n \r\n \r\n \r\n \r\n \r\n \r\n \r\n \r\n \r\n \r\n \r\n \r\n \r\n \r\n \r\n \r\n \r\n \r\n \r\n \r\n \r\n \r\n \r\n \r\n \r\n \r\n \r\n \r\n \r\n \r\n \r\n \r\n \r\n \r\n \r\n \r\n \r\n \r\n \r\n \r\n \r\n \r\n \r\n \r\n \r\n \r\n \r\n \r\n \r\n \r\n \r\n \r\n \r\n \r\n \r\n \r\n \r\n \r\n \r\n \r\n \r\n \r\n \r\n \r\n \r\n \r\n \r\n \r\n \r\n \r\n \r\n \r\n \r\n \r\n \r\n \r\n \r\n \r\n \r\n \r\n \r\n \r\n \r\n \r\n \r\n \r\n \r\n \r\n \r\n \r\n \r\n \r\n \r\n \r\n \r\n \r\n \r\n \r\n \r\n \r\n \r\n \r\n \r\n \r\n \r\n \r\n \r\n \r\n \r\n \r\n \r\n \r\n \r\n \r\n \r\n \r\n \r\n \r\n \r\n \r\n \r\n \r\n \r\n \r\n \r\n \r\n \r\n \r\n \r\n \r\n \r\n \r\n \r\n \r\n \r\n \r\n \r\n \r\n \r\n \r\n \r\n \r\n \r\n \r\n \r\n \r\n \r\n \r\n \r\n \r\n \r\n \r\n \r\n \r\n \r\n \r\n \r\n \r\n \r\n \r\n \r\n \r\n \r\n \r\n \r\n \r\n \r\n \r\n \r\n \r\n \r\n \r\n \r\n \r\n \r\n \r\n \r\n \r\n 
\r\n \r\n \r\n \r\n \r\n \r\n \r\n \r\n \r\n \r\n \r\n \r\n \r\n \r\n \r\n \r\n \r\n \r\n \r\n \r\n \r\n \r\n \r\n \r\n \r\n \r\n \r\n \r\n \r\n \r\n \r\n \r\n \r\n \r\n \r\n\r\n", + "image/png": "\n" + }, + "metadata": { + "needs_background": "light" + } + } + ], + "source": [ + " plt.scatter(X_test, y_test, color='black')\n", + " plt.plot(X_test, y_pred, color='blue', linewidth=3)\n", + " plt.show()" + ] + }, + { + "source": [ + "## Assignment" + ], + "cell_type": "markdown", + "metadata": {} + }, + { + "cell_type": "code", + "execution_count": 246, + "metadata": {}, + "outputs": [ + { + "output_type": "stream", + "name": "stdout", + "text": [ + "[[ 5. 162. 60.]\n [ 2. 110. 60.]\n [ 12. 101. 101.]\n [ 12. 105. 37.]\n [ 13. 155. 58.]\n [ 4. 101. 42.]\n [ 8. 101. 38.]\n [ 6. 125. 40.]\n [ 15. 200. 40.]\n [ 17. 251. 250.]\n [ 17. 120. 38.]\n [ 13. 210. 115.]\n [ 14. 215. 105.]\n [ 1. 50. 50.]\n [ 6. 70. 31.]\n [ 12. 210. 120.]\n [ 4. 60. 25.]\n [ 11. 230. 80.]\n [ 15. 225. 73.]\n [ 2. 110. 43.]]\n" + ] + } + ], + "source": [ + "X ,y= datasets.load_linnerud( return_X_y=True, as_frame=False)\n", + "# print(X.shape)\n", + "# print(X[0])\n", + "# Target \n", + "print(X)\n", + "X = X[:, np.newaxis, 1]\n" ] }, {