{
 "cells": [
  {
   "cell_type": "markdown",
   "id": "overview",
   "metadata": {},
   "source": [
    "# Used-car sell price: linear regression\n",
    "\n",
    "Fits `LinearRegression` to predict `Sell Price($)` from `Mileage` and `Age(yrs)` using the rows of `carprices.csv` (the `Car Model` column is dropped), holding out 20% of the rows for scoring.\n",
    "\n",
    "Saved outputs were cleared; use **Restart Kernel -> Run All** to regenerate them. For reference, the previously saved run (same seed) reported 10 training rows, 3 test rows and a test score of about 0.92."
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "id": "imports",
   "metadata": {},
   "outputs": [],
   "source": [
    "%matplotlib inline\n",
    "import matplotlib.pyplot as plt\n",
    "import pandas as pd\n",
    "from sklearn.linear_model import LinearRegression\n",
    "from sklearn.model_selection import train_test_split"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "id": "config",
   "metadata": {},
   "outputs": [],
   "source": [
    "DATA_PATH = \"carprices.csv\"\n",
    "DROPPED_COLUMNS = [\"Car Model\"]  # removed before modelling\n",
    "TARGET_COLUMN = \"Sell Price($)\"\n",
    "TEST_SIZE = 0.2\n",
    "# A fixed random_state makes the train/test split identical on every run;\n",
    "# without it the rows are re-shuffled randomly each time.\n",
    "SEED = 10"
   ]
  },
  {
   "cell_type": "markdown",
   "id": "load-data-header",
   "metadata": {},
   "source": [
    "## Load data\n",
    "\n",
    "The raw frame is kept untouched in `cars_raw`, so this cell can be re-run safely."
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "id": "load-data",
   "metadata": {},
   "outputs": [],
   "source": [
    "cars_raw = pd.read_csv(DATA_PATH)\n",
    "cars = cars_raw.drop(columns=DROPPED_COLUMNS)\n",
    "assert TARGET_COLUMN in cars.columns, f\"missing target column {TARGET_COLUMN!r}\"\n",
    "cars"
   ]
  },
  {
   "cell_type": "markdown",
   "id": "features-header",
   "metadata": {},
   "source": [
    "## Features and target\n",
    "\n",
    "Every column except the target is used as a predictor."
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "id": "features",
   "metadata": {},
   "outputs": [],
   "source": [
    "X = cars.drop(columns=[TARGET_COLUMN])\n",
    "y = cars[TARGET_COLUMN]"
   ]
  },
  {
   "cell_type": "markdown",
   "id": "explore-header",
   "metadata": {},
   "source": [
    "## Explore\n",
    "\n",
    "One scatter panel per predictor against the sell price, to eyeball whether a linear fit is plausible."
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "id": "explore",
   "metadata": {},
   "outputs": [],
   "source": [
    "n_panels = len(X.columns)\n",
    "fig, axes = plt.subplots(1, n_panels, figsize=(5 * n_panels, 4), sharey=True, squeeze=False)\n",
    "for ax, column in zip(axes[0], X.columns):\n",
    "    ax.scatter(X[column], y)\n",
    "    ax.set(xlabel=column, title=f\"{TARGET_COLUMN} vs {column}\")\n",
    "axes[0, 0].set_ylabel(TARGET_COLUMN)\n",
    "fig.tight_layout();"
   ]
  },
  {
   "cell_type": "markdown",
   "id": "split-header",
   "metadata": {},
   "source": [
    "## Train/test split"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "id": "split",
   "metadata": {},
   "outputs": [],
   "source": [
    "X_train, X_test, y_train, y_test = train_test_split(\n",
    "    X, y, test_size=TEST_SIZE, random_state=SEED\n",
    ")\n",
    "assert len(X_train) + len(X_test) == len(cars)\n",
    "len(X_train), len(X_test)"
   ]
  },
  {
   "cell_type": "markdown",
   "id": "model-header",
   "metadata": {},
   "source": [
    "## Fit and evaluate"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "id": "fit",
   "metadata": {},
   "outputs": [],
   "source": [
    "lr = LinearRegression()\n",
    "lr.fit(X_train, y_train);"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "id": "predict",
   "metadata": {},
   "outputs": [],
   "source": [
    "# Show predictions next to the held-out prices so the errors are visible at a glance.\n",
    "pd.DataFrame({\"actual\": y_test, \"predicted\": lr.predict(X_test)})"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "id": "score",
   "metadata": {},
   "outputs": [],
   "source": [
    "lr.score(X_test, y_test)"
   ]
  },
  {
   "cell_type": "markdown",
   "id": "results-note",
   "metadata": {},
   "source": [
    "## Notes\n",
    "\n",
    "- `score` reports the coefficient of determination (R^2) on the held-out rows.\n",
    "- The held-out set is only a few rows, so the score is a rough indication rather than a stable estimate."
   ]
  }
 ],
 "metadata": {
  "kernelspec": {
   "display_name": "Python 3 (ipykernel)",
   "language": "python",
   "name": "python3"
  },
  "language_info": {
   "codemirror_mode": {
    "name": "ipython",
    "version": 3
   },
   "file_extension": ".py",
   "mimetype": "text/x-python",
   "name": "python",
   "nbconvert_exporter": "python",
   "pygments_lexer": "ipython3",
   "version": "3.7.9"
  }
 },
 "nbformat": 4,
 "nbformat_minor": 5
}