diff --git a/analysis_external.ipynb b/analysis_external.ipynb new file mode 100644 index 0000000..310a641 --- /dev/null +++ b/analysis_external.ipynb @@ -0,0 +1,1032 @@ +{ + "cells": [ + { + "cell_type": "code", + "execution_count": 1, + "metadata": {}, + "outputs": [ + { + "name": "stdout", + "output_type": "stream", + "text": [ + "Requirement already satisfied: textblob in /Users/sayaka/.pyenv/versions/3.10.12/lib/python3.10/site-packages (0.18.0.post0)\n", + "Requirement already satisfied: nltk>=3.8 in /Users/sayaka/.pyenv/versions/3.10.12/lib/python3.10/site-packages (from textblob) (3.9.1)\n", + "Requirement already satisfied: click in /Users/sayaka/.pyenv/versions/3.10.12/lib/python3.10/site-packages (from nltk>=3.8->textblob) (8.1.6)\n", + "Requirement already satisfied: joblib in /Users/sayaka/.pyenv/versions/3.10.12/lib/python3.10/site-packages (from nltk>=3.8->textblob) (1.3.2)\n", + "Requirement already satisfied: regex>=2021.8.3 in /Users/sayaka/.pyenv/versions/3.10.12/lib/python3.10/site-packages (from nltk>=3.8->textblob) (2023.6.3)\n", + "Requirement already satisfied: tqdm in /Users/sayaka/.pyenv/versions/3.10.12/lib/python3.10/site-packages (from nltk>=3.8->textblob) (4.64.0)\n", + "\n", + "\u001b[1m[\u001b[0m\u001b[34;49mnotice\u001b[0m\u001b[1;39;49m]\u001b[0m\u001b[39;49m A new release of pip is available: \u001b[0m\u001b[31;49m24.2\u001b[0m\u001b[39;49m -> \u001b[0m\u001b[32;49m24.3.1\u001b[0m\n", + "\u001b[1m[\u001b[0m\u001b[34;49mnotice\u001b[0m\u001b[1;39;49m]\u001b[0m\u001b[39;49m To update, run: \u001b[0m\u001b[32;49mpip install --upgrade pip\u001b[0m\n", + "Note: you may need to restart the kernel to use updated packages.\n" + ] + } + ], + "source": [ + "pip install textblob\n" + ] + }, + { + "cell_type": "code", + "execution_count": 5, + "metadata": {}, + "outputs": [], + "source": [ + "\n", + "import pandas as pd\n", + "import matplotlib.pyplot as plt\n", + "import seaborn as sns\n", + "from textblob import TextBlob # For sentiment analysis if needed\n", + "\n", + "# Load the dataset\n", + "data = pd.read_csv(\"TMDB_movie_dataset_v11.csv\")" + ] + }, + { + "cell_type": "code", + "execution_count": 11, + "metadata": {}, + "outputs": [ + { + "data": { + "text/html": [ + "
\n", + " | id | \n", + "title | \n", + "vote_average | \n", + "vote_count | \n", + "status | \n", + "release_date | \n", + "revenue | \n", + "runtime | \n", + "adult | \n", + "backdrop_path | \n", + "... | \n", + "original_title | \n", + "overview | \n", + "popularity | \n", + "poster_path | \n", + "tagline | \n", + "genres | \n", + "production_companies | \n", + "production_countries | \n", + "spoken_languages | \n", + "keywords | \n", + "
---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|
0 | \n", + "27205 | \n", + "Inception | \n", + "8.364 | \n", + "34495 | \n", + "Released | \n", + "2010-07-15 | \n", + "825532764 | \n", + "148 | \n", + "False | \n", + "/8ZTVqvKDQ8emSGUEMjsS4yHAwrp.jpg | \n", + "... | \n", + "Inception | \n", + "Cobb, a skilled thief who commits corporate es... | \n", + "83.952 | \n", + "/oYuLEt3zVCKq57qu2F8dT7NIa6f.jpg | \n", + "Your mind is the scene of the crime. | \n", + "Action, Science Fiction, Adventure | \n", + "Legendary Pictures, Syncopy, Warner Bros. Pict... | \n", + "United Kingdom, United States of America | \n", + "English, French, Japanese, Swahili | \n", + "rescue, mission, dream, airplane, paris, franc... | \n", + "
1 | \n", + "157336 | \n", + "Interstellar | \n", + "8.417 | \n", + "32571 | \n", + "Released | \n", + "2014-11-05 | \n", + "701729206 | \n", + "169 | \n", + "False | \n", + "/pbrkL804c8yAv3zBZR4QPEafpAR.jpg | \n", + "... | \n", + "Interstellar | \n", + "The adventures of a group of explorers who mak... | \n", + "140.241 | \n", + "/gEU2QniE6E77NI6lCU6MxlNBvIx.jpg | \n", + "Mankind was born on Earth. It was never meant ... | \n", + "Adventure, Drama, Science Fiction | \n", + "Legendary Pictures, Syncopy, Lynda Obst Produc... | \n", + "United Kingdom, United States of America | \n", + "English | \n", + "rescue, future, spacecraft, race against time,... | \n", + "
2 | \n", + "155 | \n", + "The Dark Knight | \n", + "8.512 | \n", + "30619 | \n", + "Released | \n", + "2008-07-16 | \n", + "1004558444 | \n", + "152 | \n", + "False | \n", + "/nMKdUUepR0i5zn0y1T4CsSB5chy.jpg | \n", + "... | \n", + "The Dark Knight | \n", + "Batman raises the stakes in his war on crime. ... | \n", + "130.643 | \n", + "/qJ2tW6WMUDux911r6m7haRef0WH.jpg | \n", + "Welcome to a world without rules. | \n", + "Drama, Action, Crime, Thriller | \n", + "DC Comics, Legendary Pictures, Syncopy, Isobel... | \n", + "United Kingdom, United States of America | \n", + "English, Mandarin | \n", + "joker, sadism, chaos, secret identity, crime f... | \n", + "
3 | \n", + "19995 | \n", + "Avatar | \n", + "7.573 | \n", + "29815 | \n", + "Released | \n", + "2009-12-15 | \n", + "2923706026 | \n", + "162 | \n", + "False | \n", + "/vL5LR6WdxWPjLPFRLe133jXWsh5.jpg | \n", + "... | \n", + "Avatar | \n", + "In the 22nd century, a paraplegic Marine is di... | \n", + "79.932 | \n", + "/kyeqWdyUXW608qlYkRqosgbbJyK.jpg | \n", + "Enter the world of Pandora. | \n", + "Action, Adventure, Fantasy, Science Fiction | \n", + "Dune Entertainment, Lightstorm Entertainment, ... | \n", + "United States of America, United Kingdom | \n", + "English, Spanish | \n", + "future, society, culture clash, space travel, ... | \n", + "
4 | \n", + "24428 | \n", + "The Avengers | \n", + "7.710 | \n", + "29166 | \n", + "Released | \n", + "2012-04-25 | \n", + "1518815515 | \n", + "143 | \n", + "False | \n", + "/9BBTo63ANSmhC4e6r62OJFuK2GL.jpg | \n", + "... | \n", + "The Avengers | \n", + "When an unexpected enemy emerges and threatens... | \n", + "98.082 | \n", + "/RYMX2wcKCBAr24UyPD7xwmjaTn.jpg | \n", + "Some assembly required. | \n", + "Science Fiction, Action, Adventure | \n", + "Marvel Studios | \n", + "United States of America | \n", + "English, Hindi, Russian | \n", + "new york city, superhero, shield, based on com... | \n", + "
... | \n", + "... | \n", + "... | \n", + "... | \n", + "... | \n", + "... | \n", + "... | \n", + "... | \n", + "... | \n", + "... | \n", + "... | \n", + "... | \n", + "... | \n", + "... | \n", + "... | \n", + "... | \n", + "... | \n", + "... | \n", + "... | \n", + "... | \n", + "... | \n", + "... | \n", + "
1128262 | \n", + "775064 | \n", + "Schoolgirls Holiday | \n", + "0.000 | \n", + "0 | \n", + "Released | \n", + "2016-10-20 | \n", + "0 | \n", + "0 | \n", + "True | \n", + "/f1wBCtJOjr10ntxhAl9KDS3iuBc.jpg | \n", + "... | \n", + "Schoolgirls Holiday | \n", + "Every holiday has its own stories. Get into t... | \n", + "0.600 | \n", + "/A4xzsrwnUshl3xLwrzXyhVlN4eK.jpg | \n", + "NaN | \n", + "NaN | \n", + "Video Art Holland | \n", + "NaN | \n", + "NaN | \n", + "NaN | \n", + "
1128263 | \n", + "775065 | \n", + "Window | \n", + "0.000 | \n", + "0 | \n", + "Released | \n", + "2012-03-26 | \n", + "0 | \n", + "15 | \n", + "False | \n", + "NaN | \n", + "... | \n", + "Logs | \n", + "Mr. Schmidt, a young man who is recovering fro... | \n", + "0.600 | \n", + "/Ad9h4c3c6wpN9e2oZ0bk9STpkRW.jpg | \n", + "NaN | \n", + "Mystery, Drama | \n", + "Tarhun Sisters | \n", + "Latvia | \n", + "NaN | \n", + "NaN | \n", + "
1128264 | \n", + "775067 | \n", + "How to Get Away With Cheating | \n", + "0.000 | \n", + "0 | \n", + "Released | \n", + "2018-01-01 | \n", + "0 | \n", + "105 | \n", + "False | \n", + "/rTZfGs1d7VHLPQoUMzTWw2wPweQ.jpg | \n", + "... | \n", + "How to Get Away With Cheating | \n", + "Although Professor Alex P. Keating and his wif... | \n", + "0.600 | \n", + "/xEDLbhYyEBqoWpX8lydrlbrovkt.jpg | \n", + "NaN | \n", + "Thriller | \n", + "NaN | \n", + "NaN | \n", + "NaN | \n", + "NaN | \n", + "
1128265 | \n", + "279414 | \n", + "Once My Mother | \n", + "0.000 | \n", + "0 | \n", + "Released | \n", + "2014-07-24 | \n", + "0 | \n", + "75 | \n", + "False | \n", + "NaN | \n", + "... | \n", + "Once My Mother | \n", + "Australian filmmaker Sophia Turkiewicz investi... | \n", + "0.600 | \n", + "NaN | \n", + "NaN | \n", + "History, Documentary, War, Family | \n", + "Change Focus Media | \n", + "Ukraine, Australia, Poland | \n", + "English | \n", + "daughter, mother, parent child relationship, r... | \n", + "
1128266 | \n", + "1383393 | \n", + "Honkai: Star Rail - Harmony Greets the New Year | \n", + "0.000 | \n", + "0 | \n", + "Released | \n", + "2024-02-07 | \n", + "0 | \n", + "4 | \n", + "False | \n", + "None | \n", + "... | \n", + "Honkai: Star Rail - Harmony Greets the New Year | \n", + "A new year dawns and prosperity beckons. In a ... | \n", + "0.600 | \n", + "/ly1xMzCfsEWlweFiMv8Xbc5kAhE.jpg | \n", + "NaN | \n", + "Animation, Science Fiction | \n", + "NaN | \n", + "NaN | \n", + "NaN | \n", + "honkai | \n", + "
1128267 rows × 24 columns
\n", + "