diff --git "a/notebook.ipynb" "b/notebook.ipynb" new file mode 100644--- /dev/null +++ "b/notebook.ipynb" @@ -0,0 +1,2684 @@ +{ + "cells": [ + { + "cell_type": "code", + "execution_count": 2, + "id": "04fb6bab", + "metadata": {}, + "outputs": [], + "source": [ + "import pandas as pd" + ] + }, + { + "cell_type": "code", + "execution_count": 3, + "id": "0442ec60", + "metadata": {}, + "outputs": [], + "source": [ + "movies = pd.read_csv('./data/movies.csv')\n", + "credits = pd.read_csv('./data/credits.csv')" + ] + }, + { + "cell_type": "code", + "execution_count": 4, + "id": "2e772eac", + "metadata": {}, + "outputs": [ + { + "data": { + "text/html": [ + "
\n", + " | budget | \n", + "genres | \n", + "homepage | \n", + "id | \n", + "keywords | \n", + "original_language | \n", + "original_title | \n", + "overview | \n", + "popularity | \n", + "production_companies | \n", + "production_countries | \n", + "release_date | \n", + "revenue | \n", + "runtime | \n", + "spoken_languages | \n", + "status | \n", + "tagline | \n", + "title | \n", + "vote_average | \n", + "vote_count | \n", + "
---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|
0 | \n", + "237000000 | \n", + "[{\"id\": 28, \"name\": \"Action\"}, {\"id\": 12, \"nam... | \n", + "http://www.avatarmovie.com/ | \n", + "19995 | \n", + "[{\"id\": 1463, \"name\": \"culture clash\"}, {\"id\":... | \n", + "en | \n", + "Avatar | \n", + "In the 22nd century, a paraplegic Marine is di... | \n", + "150.437577 | \n", + "[{\"name\": \"Ingenious Film Partners\", \"id\": 289... | \n", + "[{\"iso_3166_1\": \"US\", \"name\": \"United States o... | \n", + "2009-12-10 | \n", + "2787965087 | \n", + "162.0 | \n", + "[{\"iso_639_1\": \"en\", \"name\": \"English\"}, {\"iso... | \n", + "Released | \n", + "Enter the World of Pandora. | \n", + "Avatar | \n", + "7.2 | \n", + "11800 | \n", + "
\n", + " | budget | \n", + "genres | \n", + "homepage | \n", + "movie_id | \n", + "keywords | \n", + "original_language | \n", + "original_title | \n", + "overview | \n", + "popularity | \n", + "production_companies | \n", + "production_countries | \n", + "release_date | \n", + "revenue | \n", + "runtime | \n", + "spoken_languages | \n", + "status | \n", + "tagline | \n", + "title | \n", + "vote_average | \n", + "vote_count | \n", + "
---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|
0 | \n", + "237000000 | \n", + "[{\"id\": 28, \"name\": \"Action\"}, {\"id\": 12, \"nam... | \n", + "http://www.avatarmovie.com/ | \n", + "19995 | \n", + "[{\"id\": 1463, \"name\": \"culture clash\"}, {\"id\":... | \n", + "en | \n", + "Avatar | \n", + "In the 22nd century, a paraplegic Marine is di... | \n", + "150.437577 | \n", + "[{\"name\": \"Ingenious Film Partners\", \"id\": 289... | \n", + "[{\"iso_3166_1\": \"US\", \"name\": \"United States o... | \n", + "2009-12-10 | \n", + "2787965087 | \n", + "162.0 | \n", + "[{\"iso_639_1\": \"en\", \"name\": \"English\"}, {\"iso... | \n", + "Released | \n", + "Enter the World of Pandora. | \n", + "Avatar | \n", + "7.2 | \n", + "11800 | \n", + "
\n", + " | movie_id | \n", + "title | \n", + "cast | \n", + "crew | \n", + "
---|---|---|---|---|
0 | \n", + "19995 | \n", + "Avatar | \n", + "[{\"cast_id\": 242, \"character\": \"Jake Sully\", \"... | \n", + "[{\"credit_id\": \"52fe48009251416c750aca23\", \"de... | \n", + "
\n", + " | budget | \n", + "genres | \n", + "homepage | \n", + "movie_id | \n", + "keywords | \n", + "original_language | \n", + "original_title | \n", + "overview | \n", + "popularity | \n", + "production_companies | \n", + "... | \n", + "revenue | \n", + "runtime | \n", + "spoken_languages | \n", + "status | \n", + "tagline | \n", + "title | \n", + "vote_average | \n", + "vote_count | \n", + "cast | \n", + "crew | \n", + "
---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|
0 | \n", + "237000000 | \n", + "[{\"id\": 28, \"name\": \"Action\"}, {\"id\": 12, \"nam... | \n", + "http://www.avatarmovie.com/ | \n", + "19995 | \n", + "[{\"id\": 1463, \"name\": \"culture clash\"}, {\"id\":... | \n", + "en | \n", + "Avatar | \n", + "In the 22nd century, a paraplegic Marine is di... | \n", + "150.437577 | \n", + "[{\"name\": \"Ingenious Film Partners\", \"id\": 289... | \n", + "... | \n", + "2787965087 | \n", + "162.0 | \n", + "[{\"iso_639_1\": \"en\", \"name\": \"English\"}, {\"iso... | \n", + "Released | \n", + "Enter the World of Pandora. | \n", + "Avatar | \n", + "7.2 | \n", + "11800 | \n", + "[{\"cast_id\": 242, \"character\": \"Jake Sully\", \"... | \n", + "[{\"credit_id\": \"52fe48009251416c750aca23\", \"de... | \n", + "
1 rows × 22 columns
\n", + "\n", + " | budget | \n", + "movie_id | \n", + "popularity | \n", + "revenue | \n", + "runtime | \n", + "vote_average | \n", + "vote_count | \n", + "
---|---|---|---|---|---|---|---|
count | \n", + "4.803000e+03 | \n", + "4803.000000 | \n", + "4803.000000 | \n", + "4.803000e+03 | \n", + "4801.000000 | \n", + "4803.000000 | \n", + "4803.000000 | \n", + "
mean | \n", + "2.904504e+07 | \n", + "57165.484281 | \n", + "21.492301 | \n", + "8.226064e+07 | \n", + "106.875859 | \n", + "6.092172 | \n", + "690.217989 | \n", + "
std | \n", + "4.072239e+07 | \n", + "88694.614033 | \n", + "31.816650 | \n", + "1.628571e+08 | \n", + "22.611935 | \n", + "1.194612 | \n", + "1234.585891 | \n", + "
min | \n", + "0.000000e+00 | \n", + "5.000000 | \n", + "0.000000 | \n", + "0.000000e+00 | \n", + "0.000000 | \n", + "0.000000 | \n", + "0.000000 | \n", + "
25% | \n", + "7.900000e+05 | \n", + "9014.500000 | \n", + "4.668070 | \n", + "0.000000e+00 | \n", + "94.000000 | \n", + "5.600000 | \n", + "54.000000 | \n", + "
50% | \n", + "1.500000e+07 | \n", + "14629.000000 | \n", + "12.921594 | \n", + "1.917000e+07 | \n", + "103.000000 | \n", + "6.200000 | \n", + "235.000000 | \n", + "
75% | \n", + "4.000000e+07 | \n", + "58610.500000 | \n", + "28.313505 | \n", + "9.291719e+07 | \n", + "118.000000 | \n", + "6.800000 | \n", + "737.000000 | \n", + "
max | \n", + "3.800000e+08 | \n", + "459488.000000 | \n", + "875.581305 | \n", + "2.787965e+09 | \n", + "338.000000 | \n", + "10.000000 | \n", + "13752.000000 | \n", + "
\n", + " | budget | \n", + "genres | \n", + "homepage | \n", + "movie_id | \n", + "keywords | \n", + "original_language | \n", + "original_title | \n", + "overview | \n", + "popularity | \n", + "production_companies | \n", + "... | \n", + "revenue | \n", + "runtime | \n", + "spoken_languages | \n", + "status | \n", + "tagline | \n", + "title | \n", + "vote_average | \n", + "vote_count | \n", + "cast | \n", + "crew | \n", + "
---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|
0 | \n", + "237000000 | \n", + "[{\"id\": 28, \"name\": \"Action\"}, {\"id\": 12, \"nam... | \n", + "http://www.avatarmovie.com/ | \n", + "19995 | \n", + "[{\"id\": 1463, \"name\": \"culture clash\"}, {\"id\":... | \n", + "en | \n", + "Avatar | \n", + "In the 22nd century, a paraplegic Marine is di... | \n", + "150.437577 | \n", + "[{\"name\": \"Ingenious Film Partners\", \"id\": 289... | \n", + "... | \n", + "2787965087 | \n", + "162.0 | \n", + "[{\"iso_639_1\": \"en\", \"name\": \"English\"}, {\"iso... | \n", + "Released | \n", + "Enter the World of Pandora. | \n", + "Avatar | \n", + "7.2 | \n", + "11800 | \n", + "[{\"cast_id\": 242, \"character\": \"Jake Sully\", \"... | \n", + "[{\"credit_id\": \"52fe48009251416c750aca23\", \"de... | \n", + "
1 rows × 22 columns
\n", + "\n", + " | movie_id | \n", + "title | \n", + "overview | \n", + "genres | \n", + "keywords | \n", + "cast | \n", + "crew | \n", + "
---|---|---|---|---|---|---|---|
0 | \n", + "19995 | \n", + "Avatar | \n", + "In the 22nd century, a paraplegic Marine is di... | \n", + "[{\"id\": 28, \"name\": \"Action\"}, {\"id\": 12, \"nam... | \n", + "[{\"id\": 1463, \"name\": \"culture clash\"}, {\"id\":... | \n", + "[{\"cast_id\": 242, \"character\": \"Jake Sully\", \"... | \n", + "[{\"credit_id\": \"52fe48009251416c750aca23\", \"de... | \n", + "
\n", + " | movie_id | \n", + "title | \n", + "overview | \n", + "genres | \n", + "keywords | \n", + "cast | \n", + "crew | \n", + "
---|---|---|---|---|---|---|---|
0 | \n", + "19995 | \n", + "Avatar | \n", + "In the 22nd century, a paraplegic Marine is di... | \n", + "[Action, Adventure, Fantasy, Science Fiction] | \n", + "[culture clash, future, space war, space colon... | \n", + "[{\"cast_id\": 242, \"character\": \"Jake Sully\", \"... | \n", + "[{\"credit_id\": \"52fe48009251416c750aca23\", \"de... | \n", + "
\n", + " | movie_id | \n", + "title | \n", + "overview | \n", + "genres | \n", + "keywords | \n", + "cast | \n", + "crew | \n", + "
---|---|---|---|---|---|---|---|
0 | \n", + "19995 | \n", + "Avatar | \n", + "In the 22nd century, a paraplegic Marine is di... | \n", + "[Action, Adventure, Fantasy, Science Fiction] | \n", + "[culture clash, future, space war, space colon... | \n", + "[Sam Worthington, Zoe Saldana, Sigourney Weaver] | \n", + "[{\"credit_id\": \"52fe48009251416c750aca23\", \"de... | \n", + "
1 | \n", + "285 | \n", + "Pirates of the Caribbean: At World's End | \n", + "Captain Barbossa, long believed to be dead, ha... | \n", + "[Adventure, Fantasy, Action] | \n", + "[ocean, drug abuse, exotic island, east india ... | \n", + "[Johnny Depp, Orlando Bloom, Keira Knightley] | \n", + "[{\"credit_id\": \"52fe4232c3a36847f800b579\", \"de... | \n", + "
2 | \n", + "206647 | \n", + "Spectre | \n", + "A cryptic message from Bond’s past sends him o... | \n", + "[Action, Adventure, Crime] | \n", + "[spy, based on novel, secret agent, sequel, mi... | \n", + "[Daniel Craig, Christoph Waltz, Léa Seydoux] | \n", + "[{\"credit_id\": \"54805967c3a36829b5002c41\", \"de... | \n", + "
\n", + " | movie_id | \n", + "title | \n", + "overview | \n", + "genres | \n", + "keywords | \n", + "cast | \n", + "crew | \n", + "
---|---|---|---|---|---|---|---|
0 | \n", + "19995 | \n", + "Avatar | \n", + "In the 22nd century, a paraplegic Marine is di... | \n", + "[Action, Adventure, Fantasy, Science Fiction] | \n", + "[culture clash, future, space war, space colon... | \n", + "[Sam Worthington, Zoe Saldana, Sigourney Weaver] | \n", + "[James Cameron] | \n", + "
1 | \n", + "285 | \n", + "Pirates of the Caribbean: At World's End | \n", + "Captain Barbossa, long believed to be dead, ha... | \n", + "[Adventure, Fantasy, Action] | \n", + "[ocean, drug abuse, exotic island, east india ... | \n", + "[Johnny Depp, Orlando Bloom, Keira Knightley] | \n", + "[Gore Verbinski] | \n", + "
\n", + " | movie_id | \n", + "title | \n", + "overview | \n", + "genres | \n", + "keywords | \n", + "cast | \n", + "crew | \n", + "
---|---|---|---|---|---|---|---|
0 | \n", + "19995 | \n", + "Avatar | \n", + "In the 22nd century, a paraplegic Marine is di... | \n", + "[Action, Adventure, Fantasy, ScienceFiction] | \n", + "[cultureclash, future, spacewar, spacecolony, ... | \n", + "[SamWorthington, ZoeSaldana, SigourneyWeaver] | \n", + "[JamesCameron] | \n", + "
\n", + " | movie_id | \n", + "title | \n", + "overview | \n", + "genres | \n", + "keywords | \n", + "cast | \n", + "crew | \n", + "
---|---|---|---|---|---|---|---|
0 | \n", + "19995 | \n", + "Avatar | \n", + "[In, the, 22nd, century,, a, paraplegic, Marin... | \n", + "[Action, Adventure, Fantasy, ScienceFiction] | \n", + "[cultureclash, future, spacewar, spacecolony, ... | \n", + "[SamWorthington, ZoeSaldana, SigourneyWeaver] | \n", + "[JamesCameron] | \n", + "
1 | \n", + "285 | \n", + "Pirates of the Caribbean: At World's End | \n", + "[Captain, Barbossa,, long, believed, to, be, d... | \n", + "[Adventure, Fantasy, Action] | \n", + "[ocean, drugabuse, exoticisland, eastindiatrad... | \n", + "[JohnnyDepp, OrlandoBloom, KeiraKnightley] | \n", + "[GoreVerbinski] | \n", + "
\n", + " | movie_id | \n", + "title | \n", + "overview | \n", + "genres | \n", + "keywords | \n", + "cast | \n", + "crew | \n", + "tags | \n", + "
---|---|---|---|---|---|---|---|---|
0 | \n", + "19995 | \n", + "Avatar | \n", + "[In, the, 22nd, century,, a, paraplegic, Marin... | \n", + "[Action, Adventure, Fantasy, ScienceFiction] | \n", + "[cultureclash, future, spacewar, spacecolony, ... | \n", + "[SamWorthington, ZoeSaldana, SigourneyWeaver] | \n", + "[JamesCameron] | \n", + "[Action, Adventure, Fantasy, ScienceFiction, c... | \n", + "
1 | \n", + "285 | \n", + "Pirates of the Caribbean: At World's End | \n", + "[Captain, Barbossa,, long, believed, to, be, d... | \n", + "[Adventure, Fantasy, Action] | \n", + "[ocean, drugabuse, exoticisland, eastindiatrad... | \n", + "[JohnnyDepp, OrlandoBloom, KeiraKnightley] | \n", + "[GoreVerbinski] | \n", + "[Adventure, Fantasy, Action, ocean, drugabuse,... | \n", + "
2 | \n", + "206647 | \n", + "Spectre | \n", + "[A, cryptic, message, from, Bond’s, past, send... | \n", + "[Action, Adventure, Crime] | \n", + "[spy, basedonnovel, secretagent, sequel, mi6, ... | \n", + "[DanielCraig, ChristophWaltz, LéaSeydoux] | \n", + "[SamMendes] | \n", + "[Action, Adventure, Crime, spy, basedonnovel, ... | \n", + "
3 | \n", + "49026 | \n", + "The Dark Knight Rises | \n", + "[Following, the, death, of, District, Attorney... | \n", + "[Action, Crime, Drama, Thriller] | \n", + "[dccomics, crimefighter, terrorist, secretiden... | \n", + "[ChristianBale, MichaelCaine, GaryOldman] | \n", + "[ChristopherNolan] | \n", + "[Action, Crime, Drama, Thriller, dccomics, cri... | \n", + "
4 | \n", + "49529 | \n", + "John Carter | \n", + "[John, Carter, is, a, war-weary,, former, mili... | \n", + "[Action, Adventure, ScienceFiction] | \n", + "[basedonnovel, mars, medallion, spacetravel, p... | \n", + "[TaylorKitsch, LynnCollins, SamanthaMorton] | \n", + "[AndrewStanton] | \n", + "[Action, Adventure, ScienceFiction, basedonnov... | \n", + "
\n", + " | movie_id | \n", + "title | \n", + "tags | \n", + "
---|---|---|---|
0 | \n", + "19995 | \n", + "Avatar | \n", + "[Action, Adventure, Fantasy, ScienceFiction, c... | \n", + "
1 | \n", + "285 | \n", + "Pirates of the Caribbean: At World's End | \n", + "[Adventure, Fantasy, Action, ocean, drugabuse,... | \n", + "
\n", + " | movie_id | \n", + "title | \n", + "tags | \n", + "
---|---|---|---|
0 | \n", + "19995 | \n", + "Avatar | \n", + "action adventure fantasy sciencefiction cultur... | \n", + "
1 | \n", + "285 | \n", + "Pirates of the Caribbean: At World's End | \n", + "adventure fantasy action ocean drugabuse exoti... | \n", + "