Добавлен анализ данных в JupyterLab
This commit is contained in:
parent
beea950236
commit
c6fb265a2f
21
movies.csv
Normal file
21
movies.csv
Normal file
@ -0,0 +1,21 @@
|
|||||||
|
title,year,country,rating,duration,genre
|
||||||
|
The Shawshank Redemption,1994,USA,9.3,142,Drama
|
||||||
|
The Godfather,1972,USA,9.2,175,Crime
|
||||||
|
The Dark Knight,2008,USA,9.0,152,Action
|
||||||
|
Pulp Fiction,1994,USA,8.9,154,Crime
|
||||||
|
Forrest Gump,1994,USA,8.8,142,Drama
|
||||||
|
Inception,2010,USA,8.8,148,Sci-Fi
|
||||||
|
Fight Club,1999,USA,8.8,139,Drama
|
||||||
|
Interstellar,2014,USA,8.7,169,Sci-Fi
|
||||||
|
The Matrix,1999,USA,8.7,136,Sci-Fi
|
||||||
|
Gladiator,2000,USA,8.5,155,Action
|
||||||
|
The Green Mile,1999,USA,8.6,189,Drama
|
||||||
|
Whiplash,2014,USA,8.5,106,Drama
|
||||||
|
Parasite,2019,South Korea,8.5,132,Thriller
|
||||||
|
Joker,2019,USA,8.4,122,Drama
|
||||||
|
Avengers Endgame,2019,USA,8.4,181,Action
|
||||||
|
Django Unchained,2012,USA,8.5,165,Western
|
||||||
|
The Departed,2006,USA,8.5,151,Crime
|
||||||
|
The Prestige,2006,USA,8.5,130,Drama
|
||||||
|
Coco,2017,USA,8.4,105,Animation
|
||||||
|
WALL-E,2008,USA,8.4,98,Animation
|
||||||
|
@ -1,5 +1,102 @@
|
|||||||
|
anyio==4.13.0
|
||||||
|
argon2-cffi==25.1.0
|
||||||
|
argon2-cffi-bindings==25.1.0
|
||||||
|
arrow==1.4.0
|
||||||
|
asttokens==3.0.1
|
||||||
|
async-lru==2.3.0
|
||||||
|
attrs==26.1.0
|
||||||
|
babel==2.18.0
|
||||||
|
beautifulsoup4==4.14.3
|
||||||
|
bleach==6.3.0
|
||||||
|
certifi==2026.5.20
|
||||||
|
cffi==2.0.0
|
||||||
|
charset-normalizer==3.4.7
|
||||||
|
colorama==0.4.6
|
||||||
|
comm==0.2.3
|
||||||
|
contourpy==1.3.3
|
||||||
|
cycler==0.12.1
|
||||||
|
debugpy==1.8.20
|
||||||
|
decorator==5.3.1
|
||||||
|
defusedxml==0.7.1
|
||||||
|
executing==2.2.1
|
||||||
|
fastjsonschema==2.21.2
|
||||||
|
fonttools==4.63.0
|
||||||
|
fqdn==1.5.1
|
||||||
|
h11==0.16.0
|
||||||
|
httpcore==1.0.9
|
||||||
|
httpx==0.28.1
|
||||||
|
idna==3.16
|
||||||
|
ipykernel==7.2.0
|
||||||
|
ipython==9.13.0
|
||||||
|
ipython_pygments_lexers==1.1.1
|
||||||
|
isoduration==20.11.0
|
||||||
|
jedi==0.20.0
|
||||||
|
Jinja2==3.1.6
|
||||||
|
json5==0.14.0
|
||||||
|
jsonpointer==3.1.1
|
||||||
|
jsonschema==4.26.0
|
||||||
|
jsonschema-specifications==2025.9.1
|
||||||
|
jupyter-events==0.12.1
|
||||||
|
jupyter-lsp==2.3.1
|
||||||
|
jupyter_client==8.8.0
|
||||||
|
jupyter_core==5.9.1
|
||||||
|
jupyter_server==2.18.2
|
||||||
|
jupyter_server_terminals==0.5.4
|
||||||
|
jupyterlab==4.5.7
|
||||||
|
jupyterlab_pygments==0.3.0
|
||||||
|
jupyterlab_server==2.28.0
|
||||||
|
kiwisolver==1.5.0
|
||||||
|
lark==1.3.1
|
||||||
|
MarkupSafe==3.0.3
|
||||||
|
matplotlib==3.10.9
|
||||||
|
matplotlib-inline==0.2.2
|
||||||
|
mistune==3.2.1
|
||||||
|
nbclient==0.10.4
|
||||||
|
nbconvert==7.17.1
|
||||||
|
nbformat==5.10.4
|
||||||
|
nest-asyncio==1.6.0
|
||||||
|
notebook_shim==0.2.4
|
||||||
numpy==2.4.6
|
numpy==2.4.6
|
||||||
|
packaging==26.2
|
||||||
pandas==3.0.3
|
pandas==3.0.3
|
||||||
|
pandocfilters==1.5.1
|
||||||
|
parso==0.8.7
|
||||||
|
pillow==12.2.0
|
||||||
|
platformdirs==4.9.6
|
||||||
|
prometheus_client==0.25.0
|
||||||
|
prompt_toolkit==3.0.52
|
||||||
|
psutil==7.2.2
|
||||||
|
pure_eval==0.2.3
|
||||||
|
pycparser==3.0
|
||||||
|
Pygments==2.20.0
|
||||||
|
pyparsing==3.3.2
|
||||||
python-dateutil==2.9.0.post0
|
python-dateutil==2.9.0.post0
|
||||||
|
python-json-logger==4.1.0
|
||||||
|
pywinpty==3.0.3
|
||||||
|
PyYAML==6.0.3
|
||||||
|
pyzmq==27.1.0
|
||||||
|
referencing==0.37.0
|
||||||
|
requests==2.34.2
|
||||||
|
rfc3339-validator==0.1.4
|
||||||
|
rfc3986-validator==0.1.1
|
||||||
|
rfc3987-syntax==1.1.0
|
||||||
|
rpds-py==0.30.0
|
||||||
|
seaborn==0.13.2
|
||||||
|
Send2Trash==2.1.0
|
||||||
|
setuptools==82.0.1
|
||||||
six==1.17.0
|
six==1.17.0
|
||||||
|
soupsieve==2.8.4
|
||||||
|
stack-data==0.6.3
|
||||||
|
terminado==0.18.1
|
||||||
|
tinycss2==1.4.0
|
||||||
|
tornado==6.5.6
|
||||||
|
tqdm==4.67.3
|
||||||
|
traitlets==5.15.0
|
||||||
|
typing_extensions==4.15.0
|
||||||
tzdata==2026.2
|
tzdata==2026.2
|
||||||
|
uri-template==1.3.0
|
||||||
|
urllib3==2.7.0
|
||||||
|
wcwidth==0.7.0
|
||||||
|
webcolors==25.10.0
|
||||||
|
webencodings==0.5.1
|
||||||
|
websocket-client==1.9.0
|
||||||
|
|||||||
156
week2_analysis.ipynb
Normal file
156
week2_analysis.ipynb
Normal file
@ -0,0 +1,156 @@
|
|||||||
|
{
|
||||||
|
"cells": [
|
||||||
|
{
|
||||||
|
"cell_type": "code",
|
||||||
|
"execution_count": null,
|
||||||
|
"id": "e7297b19-5736-4a17-911d-645849a628a6",
|
||||||
|
"metadata": {},
|
||||||
|
"outputs": [],
|
||||||
|
"source": [
|
||||||
|
"import pandas as pd\n",
|
||||||
|
"import numpy as np\n",
|
||||||
|
"import matplotlib.pyplot as plt\n",
|
||||||
|
"import seaborn as sns\n",
|
||||||
|
"from tqdm import tqdm\n",
|
||||||
|
"import time"
|
||||||
|
]
|
||||||
|
},
|
||||||
|
{
|
||||||
|
"cell_type": "code",
|
||||||
|
"execution_count": null,
|
||||||
|
"id": "711ef140-61f6-4b64-8fcf-598247617d65",
|
||||||
|
"metadata": {},
|
||||||
|
"outputs": [],
|
||||||
|
"source": [
|
||||||
|
"df = pd.read_csv(\"movies.csv\")\n",
|
||||||
|
"\n",
|
||||||
|
"print(\"Размер таблицы:\", df.shape)\n",
|
||||||
|
"df.head()"
|
||||||
|
]
|
||||||
|
},
|
||||||
|
{
|
||||||
|
"cell_type": "code",
|
||||||
|
"execution_count": null,
|
||||||
|
"id": "8d269a73-b428-421b-a9e7-e1158368d099",
|
||||||
|
"metadata": {},
|
||||||
|
"outputs": [],
|
||||||
|
"source": [
|
||||||
|
"df.info()"
|
||||||
|
]
|
||||||
|
},
|
||||||
|
{
|
||||||
|
"cell_type": "code",
|
||||||
|
"execution_count": null,
|
||||||
|
"id": "965d5583-2cc3-409c-8db4-a7a00494a6ed",
|
||||||
|
"metadata": {},
|
||||||
|
"outputs": [],
|
||||||
|
"source": [
|
||||||
|
"df.describe()"
|
||||||
|
]
|
||||||
|
},
|
||||||
|
{
|
||||||
|
"cell_type": "code",
|
||||||
|
"execution_count": null,
|
||||||
|
"id": "c74ac668-6c80-49c8-8b72-eea13fdf5ded",
|
||||||
|
"metadata": {},
|
||||||
|
"outputs": [],
|
||||||
|
"source": [
|
||||||
|
"df.isnull().sum()"
|
||||||
|
]
|
||||||
|
},
|
||||||
|
{
|
||||||
|
"cell_type": "code",
|
||||||
|
"execution_count": null,
|
||||||
|
"id": "4940a598-773c-4f6e-8bce-e841404eebc3",
|
||||||
|
"metadata": {},
|
||||||
|
"outputs": [],
|
||||||
|
"source": [
|
||||||
|
"plt.figure(figsize=(8, 5))\n",
|
||||||
|
"sns.histplot(df[\"rating\"], bins=8, kde=True)\n",
|
||||||
|
"plt.title(\"Распределение рейтингов фильмов\")\n",
|
||||||
|
"plt.xlabel(\"Рейтинг\")\n",
|
||||||
|
"plt.ylabel(\"Количество фильмов\")\n",
|
||||||
|
"plt.show()"
|
||||||
|
]
|
||||||
|
},
|
||||||
|
{
|
||||||
|
"cell_type": "code",
|
||||||
|
"execution_count": null,
|
||||||
|
"id": "906ffd6f-e7a2-402a-9a33-40a075cc5685",
|
||||||
|
"metadata": {},
|
||||||
|
"outputs": [],
|
||||||
|
"source": [
|
||||||
|
"plt.figure(figsize=(8, 5))\n",
|
||||||
|
"sns.scatterplot(data=df, x=\"year\", y=\"rating\", hue=\"genre\")\n",
|
||||||
|
"plt.title(\"Связь года выпуска и рейтинга фильма\")\n",
|
||||||
|
"plt.xlabel(\"Год выпуска\")\n",
|
||||||
|
"plt.ylabel(\"Рейтинг\")\n",
|
||||||
|
"plt.legend(title=\"Жанр\", bbox_to_anchor=(1.05, 1), loc=\"upper left\")\n",
|
||||||
|
"plt.show()"
|
||||||
|
]
|
||||||
|
},
|
||||||
|
{
|
||||||
|
"cell_type": "code",
|
||||||
|
"execution_count": null,
|
||||||
|
"id": "a05e677a-74e7-4a3a-adce-02f8dc04153e",
|
||||||
|
"metadata": {},
|
||||||
|
"outputs": [],
|
||||||
|
"source": [
|
||||||
|
"plt.figure(figsize=(10, 5))\n",
|
||||||
|
"sns.boxplot(data=df, x=\"genre\", y=\"rating\")\n",
|
||||||
|
"plt.title(\"Распределение рейтингов по жанрам\")\n",
|
||||||
|
"plt.xlabel(\"Жанр\")\n",
|
||||||
|
"plt.ylabel(\"Рейтинг\")\n",
|
||||||
|
"plt.xticks(rotation=45)\n",
|
||||||
|
"plt.show()"
|
||||||
|
]
|
||||||
|
},
|
||||||
|
{
|
||||||
|
"cell_type": "code",
|
||||||
|
"execution_count": null,
|
||||||
|
"id": "55e5ea86-f072-419c-b937-d752f8fec4e3",
|
||||||
|
"metadata": {},
|
||||||
|
"outputs": [],
|
||||||
|
"source": [
|
||||||
|
"ratings = df[\"rating\"].to_numpy()\n",
|
||||||
|
"\n",
|
||||||
|
"print(\"Средний рейтинг:\", np.mean(ratings))\n",
|
||||||
|
"print(\"Минимальный рейтинг:\", np.min(ratings))\n",
|
||||||
|
"print(\"Максимальный рейтинг:\", np.max(ratings))\n",
|
||||||
|
"print(\"Стандартное отклонение:\", np.std(ratings))"
|
||||||
|
]
|
||||||
|
},
|
||||||
|
{
|
||||||
|
"cell_type": "code",
|
||||||
|
"execution_count": null,
|
||||||
|
"id": "86546195-d108-4c55-9401-9d7017d96277",
|
||||||
|
"metadata": {},
|
||||||
|
"outputs": [],
|
||||||
|
"source": [
|
||||||
|
"for i in tqdm(range(100)):\n",
|
||||||
|
" time.sleep(0.01)"
|
||||||
|
]
|
||||||
|
}
|
||||||
|
],
|
||||||
|
"metadata": {
|
||||||
|
"kernelspec": {
|
||||||
|
"display_name": "Python 3 (ipykernel)",
|
||||||
|
"language": "python",
|
||||||
|
"name": "python3"
|
||||||
|
},
|
||||||
|
"language_info": {
|
||||||
|
"codemirror_mode": {
|
||||||
|
"name": "ipython",
|
||||||
|
"version": 3
|
||||||
|
},
|
||||||
|
"file_extension": ".py",
|
||||||
|
"mimetype": "text/x-python",
|
||||||
|
"name": "python",
|
||||||
|
"nbconvert_exporter": "python",
|
||||||
|
"pygments_lexer": "ipython3",
|
||||||
|
"version": "3.14.5"
|
||||||
|
}
|
||||||
|
},
|
||||||
|
"nbformat": 4,
|
||||||
|
"nbformat_minor": 5
|
||||||
|
}
|
||||||
Loading…
Reference in New Issue
Block a user