diff --git a/notebooks/suresh_template.ipynb b/notebooks/suresh_template.ipynb new file mode 100644 index 0000000..509ff72 --- /dev/null +++ b/notebooks/suresh_template.ipynb @@ -0,0 +1,2907 @@ +{ + "cells": [ + { + "cell_type": "markdown", + "metadata": {}, + "source": [ + "# Title" + ] + }, + { + "cell_type": "code", + "execution_count": 2, + "metadata": {}, + "outputs": [ + { + "name": "stdout", + "output_type": "stream", + "text": [ + "2017-07-03 16:52:06 \n", + "\n", + "CPython 3.6.1\n", + "IPython 6.1.0\n", + "\n", + "pea 0.0.7\n", + "pandas 0.20.2\n", + "\n", + "compiler : MSC v.1900 64 bit (AMD64)\n", + "system : Windows\n", + "release : 7\n", + "machine : AMD64\n", + "processor : Intel64 Family 6 Model 42 Stepping 7, GenuineIntel\n", + "CPU cores : 8\n", + "interpreter: 64bit\n" + ] + } + ], + "source": [ + "import os\n", + "import pandas as pd\n", + "import settings\n", + "import etl\n", + "\n", + "%matplotlib inline\n", + "\n", + "%load_ext watermark\n", + "%watermark -d -t -v -m -p pea,pandas" + ] + }, + { + "cell_type": "code", + "execution_count": 3, + "metadata": { + "collapsed": true + }, + "outputs": [], + "source": [ + "data = etl.Data()" + ] + }, + { + "cell_type": "markdown", + "metadata": {}, + "source": [ + "## Available DataFrames\n", + "\n", + "the Data object has 3 DataFrames available movie, keyword, and genre. keyword and genre can be linked back to movie by the index column and the index of movie" + ] + }, + { + "cell_type": "code", + "execution_count": 4, + "metadata": {}, + "outputs": [ + { + "data": { + "text/html": [ + "
| \n", + " | color | \n", + "director_name | \n", + "num_critic_for_reviews | \n", + "duration | \n", + "director_facebook_likes | \n", + "actor_3_facebook_likes | \n", + "actor_2_name | \n", + "actor_1_facebook_likes | \n", + "gross | \n", + "genres | \n", + "... | \n", + "country | \n", + "content_rating | \n", + "budget | \n", + "title_year | \n", + "actor_2_facebook_likes | \n", + "imdb_score | \n", + "aspect_ratio | \n", + "movie_facebook_likes | \n", + "net | \n", + "profitable | \n", + "
|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|
| 0 | \n", + "Color | \n", + "James Cameron | \n", + "723.0 | \n", + "178.0 | \n", + "0.0 | \n", + "855.0 | \n", + "Joel David Moore | \n", + "1000.0 | \n", + "760505847.0 | \n", + "Action|Adventure|Fantasy|Sci-Fi | \n", + "... | \n", + "USA | \n", + "PG-13 | \n", + "237000000.0 | \n", + "2009-01-01 | \n", + "936.0 | \n", + "7.9 | \n", + "1.78 | \n", + "33000 | \n", + "523505847.0 | \n", + "1 | \n", + "
| 1 | \n", + "Color | \n", + "Gore Verbinski | \n", + "302.0 | \n", + "169.0 | \n", + "563.0 | \n", + "1000.0 | \n", + "Orlando Bloom | \n", + "40000.0 | \n", + "309404152.0 | \n", + "Action|Adventure|Fantasy | \n", + "... | \n", + "USA | \n", + "PG-13 | \n", + "300000000.0 | \n", + "2007-01-01 | \n", + "5000.0 | \n", + "7.1 | \n", + "2.35 | \n", + "0 | \n", + "9404152.0 | \n", + "1 | \n", + "
| 2 | \n", + "Color | \n", + "Sam Mendes | \n", + "602.0 | \n", + "148.0 | \n", + "0.0 | \n", + "161.0 | \n", + "Rory Kinnear | \n", + "11000.0 | \n", + "200074175.0 | \n", + "Action|Adventure|Thriller | \n", + "... | \n", + "UK | \n", + "PG-13 | \n", + "245000000.0 | \n", + "2015-01-01 | \n", + "393.0 | \n", + "6.8 | \n", + "2.35 | \n", + "85000 | \n", + "-44925825.0 | \n", + "0 | \n", + "
| 3 | \n", + "Color | \n", + "Christopher Nolan | \n", + "813.0 | \n", + "164.0 | \n", + "22000.0 | \n", + "23000.0 | \n", + "Christian Bale | \n", + "27000.0 | \n", + "448130642.0 | \n", + "Action|Thriller | \n", + "... | \n", + "USA | \n", + "PG-13 | \n", + "250000000.0 | \n", + "2012-01-01 | \n", + "23000.0 | \n", + "8.5 | \n", + "2.35 | \n", + "164000 | \n", + "198130642.0 | \n", + "1 | \n", + "
| 4 | \n", + "NaN | \n", + "Doug Walker | \n", + "NaN | \n", + "NaN | \n", + "131.0 | \n", + "NaN | \n", + "Rob Walker | \n", + "131.0 | \n", + "NaN | \n", + "Documentary | \n", + "... | \n", + "NaN | \n", + "NaN | \n", + "NaN | \n", + "NaT | \n", + "12.0 | \n", + "7.1 | \n", + "NaN | \n", + "0 | \n", + "NaN | \n", + "0 | \n", + "
| 5 | \n", + "Color | \n", + "Andrew Stanton | \n", + "462.0 | \n", + "132.0 | \n", + "475.0 | \n", + "530.0 | \n", + "Samantha Morton | \n", + "640.0 | \n", + "73058679.0 | \n", + "Action|Adventure|Sci-Fi | \n", + "... | \n", + "USA | \n", + "PG-13 | \n", + "263700000.0 | \n", + "2012-01-01 | \n", + "632.0 | \n", + "6.6 | \n", + "2.35 | \n", + "24000 | \n", + "-190641321.0 | \n", + "0 | \n", + "
| 6 | \n", + "Color | \n", + "Sam Raimi | \n", + "392.0 | \n", + "156.0 | \n", + "0.0 | \n", + "4000.0 | \n", + "James Franco | \n", + "24000.0 | \n", + "336530303.0 | \n", + "Action|Adventure|Romance | \n", + "... | \n", + "USA | \n", + "PG-13 | \n", + "258000000.0 | \n", + "2007-01-01 | \n", + "11000.0 | \n", + "6.2 | \n", + "2.35 | \n", + "0 | \n", + "78530303.0 | \n", + "1 | \n", + "
| 7 | \n", + "Color | \n", + "Nathan Greno | \n", + "324.0 | \n", + "100.0 | \n", + "15.0 | \n", + "284.0 | \n", + "Donna Murphy | \n", + "799.0 | \n", + "200807262.0 | \n", + "Adventure|Animation|Comedy|Family|Fantasy|Musi... | \n", + "... | \n", + "USA | \n", + "PG | \n", + "260000000.0 | \n", + "2010-01-01 | \n", + "553.0 | \n", + "7.8 | \n", + "1.85 | \n", + "29000 | \n", + "-59192738.0 | \n", + "0 | \n", + "
| 8 | \n", + "Color | \n", + "Joss Whedon | \n", + "635.0 | \n", + "141.0 | \n", + "0.0 | \n", + "19000.0 | \n", + "Robert Downey Jr. | \n", + "26000.0 | \n", + "458991599.0 | \n", + "Action|Adventure|Sci-Fi | \n", + "... | \n", + "USA | \n", + "PG-13 | \n", + "250000000.0 | \n", + "2015-01-01 | \n", + "21000.0 | \n", + "7.5 | \n", + "2.35 | \n", + "118000 | \n", + "208991599.0 | \n", + "1 | \n", + "
| 9 | \n", + "Color | \n", + "David Yates | \n", + "375.0 | \n", + "153.0 | \n", + "282.0 | \n", + "10000.0 | \n", + "Daniel Radcliffe | \n", + "25000.0 | \n", + "301956980.0 | \n", + "Adventure|Family|Fantasy|Mystery | \n", + "... | \n", + "UK | \n", + "PG | \n", + "250000000.0 | \n", + "2009-01-01 | \n", + "11000.0 | \n", + "7.5 | \n", + "2.35 | \n", + "10000 | \n", + "51956980.0 | \n", + "1 | \n", + "
| 10 | \n", + "Color | \n", + "Zack Snyder | \n", + "673.0 | \n", + "183.0 | \n", + "0.0 | \n", + "2000.0 | \n", + "Lauren Cohan | \n", + "15000.0 | \n", + "330249062.0 | \n", + "Action|Adventure|Sci-Fi | \n", + "... | \n", + "USA | \n", + "PG-13 | \n", + "250000000.0 | \n", + "2016-01-01 | \n", + "4000.0 | \n", + "6.9 | \n", + "2.35 | \n", + "197000 | \n", + "80249062.0 | \n", + "1 | \n", + "
| 11 | \n", + "Color | \n", + "Bryan Singer | \n", + "434.0 | \n", + "169.0 | \n", + "0.0 | \n", + "903.0 | \n", + "Marlon Brando | \n", + "18000.0 | \n", + "200069408.0 | \n", + "Action|Adventure|Sci-Fi | \n", + "... | \n", + "USA | \n", + "PG-13 | \n", + "209000000.0 | \n", + "2006-01-01 | \n", + "10000.0 | \n", + "6.1 | \n", + "2.35 | \n", + "0 | \n", + "-8930592.0 | \n", + "0 | \n", + "
| 12 | \n", + "Color | \n", + "Marc Forster | \n", + "403.0 | \n", + "106.0 | \n", + "395.0 | \n", + "393.0 | \n", + "Mathieu Amalric | \n", + "451.0 | \n", + "168368427.0 | \n", + "Action|Adventure | \n", + "... | \n", + "UK | \n", + "PG-13 | \n", + "200000000.0 | \n", + "2008-01-01 | \n", + "412.0 | \n", + "6.7 | \n", + "2.35 | \n", + "0 | \n", + "-31631573.0 | \n", + "0 | \n", + "
| 13 | \n", + "Color | \n", + "Gore Verbinski | \n", + "313.0 | \n", + "151.0 | \n", + "563.0 | \n", + "1000.0 | \n", + "Orlando Bloom | \n", + "40000.0 | \n", + "423032628.0 | \n", + "Action|Adventure|Fantasy | \n", + "... | \n", + "USA | \n", + "PG-13 | \n", + "225000000.0 | \n", + "2006-01-01 | \n", + "5000.0 | \n", + "7.3 | \n", + "2.35 | \n", + "5000 | \n", + "198032628.0 | \n", + "1 | \n", + "
| 14 | \n", + "Color | \n", + "Gore Verbinski | \n", + "450.0 | \n", + "150.0 | \n", + "563.0 | \n", + "1000.0 | \n", + "Ruth Wilson | \n", + "40000.0 | \n", + "89289910.0 | \n", + "Action|Adventure|Western | \n", + "... | \n", + "USA | \n", + "PG-13 | \n", + "215000000.0 | \n", + "2013-01-01 | \n", + "2000.0 | \n", + "6.5 | \n", + "2.35 | \n", + "48000 | \n", + "-125710090.0 | \n", + "0 | \n", + "
| 15 | \n", + "Color | \n", + "Zack Snyder | \n", + "733.0 | \n", + "143.0 | \n", + "0.0 | \n", + "748.0 | \n", + "Christopher Meloni | \n", + "15000.0 | \n", + "291021565.0 | \n", + "Action|Adventure|Fantasy|Sci-Fi | \n", + "... | \n", + "USA | \n", + "PG-13 | \n", + "225000000.0 | \n", + "2013-01-01 | \n", + "3000.0 | \n", + "7.2 | \n", + "2.35 | \n", + "118000 | \n", + "66021565.0 | \n", + "1 | \n", + "
| 16 | \n", + "Color | \n", + "Andrew Adamson | \n", + "258.0 | \n", + "150.0 | \n", + "80.0 | \n", + "201.0 | \n", + "Pierfrancesco Favino | \n", + "22000.0 | \n", + "141614023.0 | \n", + "Action|Adventure|Family|Fantasy | \n", + "... | \n", + "USA | \n", + "PG | \n", + "225000000.0 | \n", + "2008-01-01 | \n", + "216.0 | \n", + "6.6 | \n", + "2.35 | \n", + "0 | \n", + "-83385977.0 | \n", + "0 | \n", + "
| 17 | \n", + "Color | \n", + "Joss Whedon | \n", + "703.0 | \n", + "173.0 | \n", + "0.0 | \n", + "19000.0 | \n", + "Robert Downey Jr. | \n", + "26000.0 | \n", + "623279547.0 | \n", + "Action|Adventure|Sci-Fi | \n", + "... | \n", + "USA | \n", + "PG-13 | \n", + "220000000.0 | \n", + "2012-01-01 | \n", + "21000.0 | \n", + "8.1 | \n", + "1.85 | \n", + "123000 | \n", + "403279547.0 | \n", + "1 | \n", + "
| 18 | \n", + "Color | \n", + "Rob Marshall | \n", + "448.0 | \n", + "136.0 | \n", + "252.0 | \n", + "1000.0 | \n", + "Sam Claflin | \n", + "40000.0 | \n", + "241063875.0 | \n", + "Action|Adventure|Fantasy | \n", + "... | \n", + "USA | \n", + "PG-13 | \n", + "250000000.0 | \n", + "2011-01-01 | \n", + "11000.0 | \n", + "6.7 | \n", + "2.35 | \n", + "58000 | \n", + "-8936125.0 | \n", + "0 | \n", + "
| 19 | \n", + "Color | \n", + "Barry Sonnenfeld | \n", + "451.0 | \n", + "106.0 | \n", + "188.0 | \n", + "718.0 | \n", + "Michael Stuhlbarg | \n", + "10000.0 | \n", + "179020854.0 | \n", + "Action|Adventure|Comedy|Family|Fantasy|Sci-Fi | \n", + "... | \n", + "USA | \n", + "PG-13 | \n", + "225000000.0 | \n", + "2012-01-01 | \n", + "816.0 | \n", + "6.8 | \n", + "1.85 | \n", + "40000 | \n", + "-45979146.0 | \n", + "0 | \n", + "
| 20 | \n", + "Color | \n", + "Peter Jackson | \n", + "422.0 | \n", + "164.0 | \n", + "0.0 | \n", + "773.0 | \n", + "Adam Brown | \n", + "5000.0 | \n", + "255108370.0 | \n", + "Adventure|Fantasy | \n", + "... | \n", + "New Zealand | \n", + "PG-13 | \n", + "250000000.0 | \n", + "2014-01-01 | \n", + "972.0 | \n", + "7.5 | \n", + "2.35 | \n", + "65000 | \n", + "5108370.0 | \n", + "1 | \n", + "
| 21 | \n", + "Color | \n", + "Marc Webb | \n", + "599.0 | \n", + "153.0 | \n", + "464.0 | \n", + "963.0 | \n", + "Andrew Garfield | \n", + "15000.0 | \n", + "262030663.0 | \n", + "Action|Adventure|Fantasy | \n", + "... | \n", + "USA | \n", + "PG-13 | \n", + "230000000.0 | \n", + "2012-01-01 | \n", + "10000.0 | \n", + "7.0 | \n", + "2.35 | \n", + "56000 | \n", + "32030663.0 | \n", + "1 | \n", + "
| 22 | \n", + "Color | \n", + "Ridley Scott | \n", + "343.0 | \n", + "156.0 | \n", + "0.0 | \n", + "738.0 | \n", + "William Hurt | \n", + "891.0 | \n", + "105219735.0 | \n", + "Action|Adventure|Drama|History | \n", + "... | \n", + "USA | \n", + "PG-13 | \n", + "200000000.0 | \n", + "2010-01-01 | \n", + "882.0 | \n", + "6.7 | \n", + "2.35 | \n", + "17000 | \n", + "-94780265.0 | \n", + "0 | \n", + "
| 23 | \n", + "Color | \n", + "Peter Jackson | \n", + "509.0 | \n", + "186.0 | \n", + "0.0 | \n", + "773.0 | \n", + "Adam Brown | \n", + "5000.0 | \n", + "258355354.0 | \n", + "Adventure|Fantasy | \n", + "... | \n", + "USA | \n", + "PG-13 | \n", + "225000000.0 | \n", + "2013-01-01 | \n", + "972.0 | \n", + "7.9 | \n", + "2.35 | \n", + "83000 | \n", + "33355354.0 | \n", + "1 | \n", + "
| 24 | \n", + "Color | \n", + "Chris Weitz | \n", + "251.0 | \n", + "113.0 | \n", + "129.0 | \n", + "1000.0 | \n", + "Eva Green | \n", + "16000.0 | \n", + "70083519.0 | \n", + "Adventure|Family|Fantasy | \n", + "... | \n", + "USA | \n", + "PG-13 | \n", + "180000000.0 | \n", + "2007-01-01 | \n", + "6000.0 | \n", + "6.1 | \n", + "2.35 | \n", + "0 | \n", + "-109916481.0 | \n", + "0 | \n", + "
| 25 | \n", + "Color | \n", + "Peter Jackson | \n", + "446.0 | \n", + "201.0 | \n", + "0.0 | \n", + "84.0 | \n", + "Thomas Kretschmann | \n", + "6000.0 | \n", + "218051260.0 | \n", + "Action|Adventure|Drama|Romance | \n", + "... | \n", + "New Zealand | \n", + "PG-13 | \n", + "207000000.0 | \n", + "2005-01-01 | \n", + "919.0 | \n", + "7.2 | \n", + "2.35 | \n", + "0 | \n", + "11051260.0 | \n", + "1 | \n", + "
| 26 | \n", + "Color | \n", + "James Cameron | \n", + "315.0 | \n", + "194.0 | \n", + "0.0 | \n", + "794.0 | \n", + "Kate Winslet | \n", + "29000.0 | \n", + "658672302.0 | \n", + "Drama|Romance | \n", + "... | \n", + "USA | \n", + "PG-13 | \n", + "200000000.0 | \n", + "1997-01-01 | \n", + "14000.0 | \n", + "7.7 | \n", + "2.35 | \n", + "26000 | \n", + "458672302.0 | \n", + "1 | \n", + "
| 27 | \n", + "Color | \n", + "Anthony Russo | \n", + "516.0 | \n", + "147.0 | \n", + "94.0 | \n", + "11000.0 | \n", + "Scarlett Johansson | \n", + "21000.0 | \n", + "407197282.0 | \n", + "Action|Adventure|Sci-Fi | \n", + "... | \n", + "USA | \n", + "PG-13 | \n", + "250000000.0 | \n", + "2016-01-01 | \n", + "19000.0 | \n", + "8.2 | \n", + "2.35 | \n", + "72000 | \n", + "157197282.0 | \n", + "1 | \n", + "
| 28 | \n", + "Color | \n", + "Peter Berg | \n", + "377.0 | \n", + "131.0 | \n", + "532.0 | \n", + "627.0 | \n", + "Alexander Skarsgård | \n", + "14000.0 | \n", + "65173160.0 | \n", + "Action|Adventure|Sci-Fi|Thriller | \n", + "... | \n", + "USA | \n", + "PG-13 | \n", + "209000000.0 | \n", + "2012-01-01 | \n", + "10000.0 | \n", + "5.9 | \n", + "2.35 | \n", + "44000 | \n", + "-143826840.0 | \n", + "0 | \n", + "
| 29 | \n", + "Color | \n", + "Colin Trevorrow | \n", + "644.0 | \n", + "124.0 | \n", + "365.0 | \n", + "1000.0 | \n", + "Judy Greer | \n", + "3000.0 | \n", + "652177271.0 | \n", + "Action|Adventure|Sci-Fi|Thriller | \n", + "... | \n", + "USA | \n", + "PG-13 | \n", + "150000000.0 | \n", + "2015-01-01 | \n", + "2000.0 | \n", + "7.0 | \n", + "2.00 | \n", + "150000 | \n", + "502177271.0 | \n", + "1 | \n", + "
| ... | \n", + "... | \n", + "... | \n", + "... | \n", + "... | \n", + "... | \n", + "... | \n", + "... | \n", + "... | \n", + "... | \n", + "... | \n", + "... | \n", + "... | \n", + "... | \n", + "... | \n", + "... | \n", + "... | \n", + "... | \n", + "... | \n", + "... | \n", + "... | \n", + "... | \n", + "
| 5013 | \n", + "Color | \n", + "Eric Eason | \n", + "28.0 | \n", + "79.0 | \n", + "3.0 | \n", + "42.0 | \n", + "Panchito Gómez | \n", + "93.0 | \n", + "NaN | \n", + "Drama|Family | \n", + "... | \n", + "USA | \n", + "NaN | \n", + "24000.0 | \n", + "2002-01-01 | \n", + "46.0 | \n", + "7.0 | \n", + "1.78 | \n", + "61 | \n", + "NaN | \n", + "0 | \n", + "
| 5014 | \n", + "Color | \n", + "Uwe Boll | \n", + "58.0 | \n", + "80.0 | \n", + "892.0 | \n", + "492.0 | \n", + "Katharine Isabelle | \n", + "986.0 | \n", + "NaN | \n", + "Action|Crime|Thriller | \n", + "... | \n", + "Canada | \n", + "R | \n", + "NaN | \n", + "2009-01-01 | \n", + "918.0 | \n", + "6.3 | \n", + "2.35 | \n", + "0 | \n", + "NaN | \n", + "0 | \n", + "
| 5015 | \n", + "Black and White | \n", + "Richard Linklater | \n", + "61.0 | \n", + "100.0 | \n", + "0.0 | \n", + "0.0 | \n", + "Richard Linklater | \n", + "5.0 | \n", + "1227508.0 | \n", + "Comedy|Drama | \n", + "... | \n", + "USA | \n", + "R | \n", + "23000.0 | \n", + "1991-01-01 | \n", + "0.0 | \n", + "7.1 | \n", + "1.37 | \n", + "2000 | \n", + "1204508.0 | \n", + "1 | \n", + "
| 5016 | \n", + "Color | \n", + "Joseph Mazzella | \n", + "NaN | \n", + "90.0 | \n", + "0.0 | \n", + "9.0 | \n", + "Mikaal Bates | \n", + "313.0 | \n", + "NaN | \n", + "Crime|Drama|Thriller | \n", + "... | \n", + "USA | \n", + "NaN | \n", + "25000.0 | \n", + "2015-01-01 | \n", + "25.0 | \n", + "4.8 | \n", + "NaN | \n", + "33 | \n", + "NaN | \n", + "0 | \n", + "
| 5017 | \n", + "Color | \n", + "Travis Legge | \n", + "1.0 | \n", + "90.0 | \n", + "138.0 | \n", + "138.0 | \n", + "Suzi Lorraine | \n", + "370.0 | \n", + "NaN | \n", + "Comedy|Romance | \n", + "... | \n", + "USA | \n", + "NaN | \n", + "22000.0 | \n", + "2013-01-01 | \n", + "184.0 | \n", + "3.3 | \n", + "1.78 | \n", + "200 | \n", + "NaN | \n", + "0 | \n", + "
| 5018 | \n", + "Color | \n", + "Alex Kendrick | \n", + "5.0 | \n", + "120.0 | \n", + "589.0 | \n", + "4.0 | \n", + "Lisa Arnold | \n", + "51.0 | \n", + "NaN | \n", + "Drama | \n", + "... | \n", + "USA | \n", + "NaN | \n", + "20000.0 | \n", + "2003-01-01 | \n", + "49.0 | \n", + "6.9 | \n", + "1.85 | \n", + "725 | \n", + "NaN | \n", + "0 | \n", + "
| 5019 | \n", + "Color | \n", + "Marcus Nispel | \n", + "43.0 | \n", + "91.0 | \n", + "158.0 | \n", + "265.0 | \n", + "Brittany Curran | \n", + "630.0 | \n", + "NaN | \n", + "Horror|Mystery|Thriller | \n", + "... | \n", + "USA | \n", + "R | \n", + "NaN | \n", + "2015-01-01 | \n", + "512.0 | \n", + "4.6 | \n", + "1.85 | \n", + "0 | \n", + "NaN | \n", + "0 | \n", + "
| 5020 | \n", + "NaN | \n", + "Brandon Landers | \n", + "NaN | \n", + "143.0 | \n", + "8.0 | \n", + "8.0 | \n", + "Alana Kaniewski | \n", + "720.0 | \n", + "NaN | \n", + "Drama|Horror|Thriller | \n", + "... | \n", + "USA | \n", + "NaN | \n", + "17350.0 | \n", + "2011-01-01 | \n", + "19.0 | \n", + "3.0 | \n", + "NaN | \n", + "33 | \n", + "NaN | \n", + "0 | \n", + "
| 5021 | \n", + "Color | \n", + "Jay Duplass | \n", + "51.0 | \n", + "85.0 | \n", + "157.0 | \n", + "10.0 | \n", + "Katie Aselton | \n", + "830.0 | \n", + "192467.0 | \n", + "Comedy|Drama|Romance | \n", + "... | \n", + "USA | \n", + "R | \n", + "15000.0 | \n", + "2005-01-01 | \n", + "224.0 | \n", + "6.6 | \n", + "NaN | \n", + "297 | \n", + "177467.0 | \n", + "1 | \n", + "
| 5022 | \n", + "Black and White | \n", + "Jim Chuchu | \n", + "6.0 | \n", + "60.0 | \n", + "0.0 | \n", + "4.0 | \n", + "Olwenya Maina | \n", + "147.0 | \n", + "NaN | \n", + "Drama | \n", + "... | \n", + "Kenya | \n", + "NaN | \n", + "15000.0 | \n", + "2014-01-01 | \n", + "19.0 | \n", + "7.4 | \n", + "NaN | \n", + "45 | \n", + "NaN | \n", + "0 | \n", + "
| 5023 | \n", + "Color | \n", + "Daryl Wein | \n", + "22.0 | \n", + "88.0 | \n", + "38.0 | \n", + "211.0 | \n", + "Heather Burns | \n", + "331.0 | \n", + "76382.0 | \n", + "Romance | \n", + "... | \n", + "USA | \n", + "NaN | \n", + "15000.0 | \n", + "2009-01-01 | \n", + "212.0 | \n", + "6.2 | \n", + "2.35 | \n", + "324 | \n", + "61382.0 | \n", + "1 | \n", + "
| 5024 | \n", + "Color | \n", + "Jason Trost | \n", + "42.0 | \n", + "78.0 | \n", + "91.0 | \n", + "86.0 | \n", + "Jason Trost | \n", + "407.0 | \n", + "NaN | \n", + "Sci-Fi|Thriller | \n", + "... | \n", + "USA | \n", + "Unrated | \n", + "20000.0 | \n", + "2011-01-01 | \n", + "91.0 | \n", + "4.0 | \n", + "2.35 | \n", + "835 | \n", + "NaN | \n", + "0 | \n", + "
| 5025 | \n", + "Color | \n", + "John Waters | \n", + "73.0 | \n", + "108.0 | \n", + "0.0 | \n", + "105.0 | \n", + "Mink Stole | \n", + "462.0 | \n", + "180483.0 | \n", + "Comedy|Crime|Horror | \n", + "... | \n", + "USA | \n", + "NC-17 | \n", + "10000.0 | \n", + "1972-01-01 | \n", + "143.0 | \n", + "6.1 | \n", + "1.37 | \n", + "0 | \n", + "170483.0 | \n", + "1 | \n", + "
| 5026 | \n", + "Color | \n", + "Olivier Assayas | \n", + "81.0 | \n", + "110.0 | \n", + "107.0 | \n", + "45.0 | \n", + "Béatrice Dalle | \n", + "576.0 | \n", + "136007.0 | \n", + "Drama|Music|Romance | \n", + "... | \n", + "France | \n", + "R | \n", + "4500.0 | \n", + "2004-01-01 | \n", + "133.0 | \n", + "6.9 | \n", + "2.35 | \n", + "171 | \n", + "131507.0 | \n", + "1 | \n", + "
| 5027 | \n", + "Color | \n", + "Jafar Panahi | \n", + "64.0 | \n", + "90.0 | \n", + "397.0 | \n", + "0.0 | \n", + "Nargess Mamizadeh | \n", + "5.0 | \n", + "673780.0 | \n", + "Drama | \n", + "... | \n", + "Iran | \n", + "Not Rated | \n", + "10000.0 | \n", + "2000-01-01 | \n", + "0.0 | \n", + "7.5 | \n", + "1.85 | \n", + "697 | \n", + "663780.0 | \n", + "1 | \n", + "
| 5028 | \n", + "Black and White | \n", + "Ivan Kavanagh | \n", + "12.0 | \n", + "83.0 | \n", + "18.0 | \n", + "0.0 | \n", + "Michael Parle | \n", + "10.0 | \n", + "NaN | \n", + "Horror | \n", + "... | \n", + "Ireland | \n", + "NaN | \n", + "10000.0 | \n", + "2007-01-01 | \n", + "5.0 | \n", + "6.7 | \n", + "1.33 | \n", + "105 | \n", + "NaN | \n", + "0 | \n", + "
| 5029 | \n", + "Color | \n", + "Kiyoshi Kurosawa | \n", + "78.0 | \n", + "111.0 | \n", + "62.0 | \n", + "6.0 | \n", + "Anna Nakagawa | \n", + "89.0 | \n", + "94596.0 | \n", + "Crime|Horror|Mystery|Thriller | \n", + "... | \n", + "Japan | \n", + "NaN | \n", + "1000000.0 | \n", + "1997-01-01 | \n", + "13.0 | \n", + "7.4 | \n", + "1.85 | \n", + "817 | \n", + "-905404.0 | \n", + "0 | \n", + "
| 5030 | \n", + "Color | \n", + "Tadeo Garcia | \n", + "NaN | \n", + "84.0 | \n", + "5.0 | \n", + "12.0 | \n", + "Michael Cortez | \n", + "21.0 | \n", + "NaN | \n", + "Drama | \n", + "... | \n", + "USA | \n", + "NaN | \n", + "NaN | \n", + "2004-01-01 | \n", + "20.0 | \n", + "6.1 | \n", + "NaN | \n", + "22 | \n", + "NaN | \n", + "0 | \n", + "
| 5031 | \n", + "Color | \n", + "Thomas L. Phillips | \n", + "13.0 | \n", + "82.0 | \n", + "120.0 | \n", + "84.0 | \n", + "Joe Coffey | \n", + "785.0 | \n", + "NaN | \n", + "Comedy|Horror|Thriller | \n", + "... | \n", + "USA | \n", + "NaN | \n", + "200000.0 | \n", + "2012-01-01 | \n", + "98.0 | \n", + "5.4 | \n", + "16.00 | \n", + "424 | \n", + "NaN | \n", + "0 | \n", + "
| 5032 | \n", + "Color | \n", + "Ash Baron-Cohen | \n", + "10.0 | \n", + "98.0 | \n", + "3.0 | \n", + "152.0 | \n", + "Stanley B. Herman | \n", + "789.0 | \n", + "NaN | \n", + "Crime|Drama | \n", + "... | \n", + "USA | \n", + "NaN | \n", + "NaN | \n", + "1995-01-01 | \n", + "194.0 | \n", + "6.4 | \n", + "NaN | \n", + "20 | \n", + "NaN | \n", + "0 | \n", + "
| 5033 | \n", + "Color | \n", + "Shane Carruth | \n", + "143.0 | \n", + "77.0 | \n", + "291.0 | \n", + "8.0 | \n", + "David Sullivan | \n", + "291.0 | \n", + "424760.0 | \n", + "Drama|Sci-Fi|Thriller | \n", + "... | \n", + "USA | \n", + "PG-13 | \n", + "7000.0 | \n", + "2004-01-01 | \n", + "45.0 | \n", + "7.0 | \n", + "1.85 | \n", + "19000 | \n", + "417760.0 | \n", + "1 | \n", + "
| 5034 | \n", + "Color | \n", + "Neill Dela Llana | \n", + "35.0 | \n", + "80.0 | \n", + "0.0 | \n", + "0.0 | \n", + "Edgar Tancangco | \n", + "0.0 | \n", + "70071.0 | \n", + "Thriller | \n", + "... | \n", + "Philippines | \n", + "Not Rated | \n", + "7000.0 | \n", + "2005-01-01 | \n", + "0.0 | \n", + "6.3 | \n", + "NaN | \n", + "74 | \n", + "63071.0 | \n", + "1 | \n", + "
| 5035 | \n", + "Color | \n", + "Robert Rodriguez | \n", + "56.0 | \n", + "81.0 | \n", + "0.0 | \n", + "6.0 | \n", + "Peter Marquardt | \n", + "121.0 | \n", + "2040920.0 | \n", + "Action|Crime|Drama|Romance|Thriller | \n", + "... | \n", + "USA | \n", + "R | \n", + "7000.0 | \n", + "1992-01-01 | \n", + "20.0 | \n", + "6.9 | \n", + "1.37 | \n", + "0 | \n", + "2033920.0 | \n", + "1 | \n", + "
| 5036 | \n", + "Color | \n", + "Anthony Vallone | \n", + "NaN | \n", + "84.0 | \n", + "2.0 | \n", + "2.0 | \n", + "John Considine | \n", + "45.0 | \n", + "NaN | \n", + "Crime|Drama | \n", + "... | \n", + "USA | \n", + "PG-13 | \n", + "3250.0 | \n", + "2005-01-01 | \n", + "44.0 | \n", + "7.8 | \n", + "NaN | \n", + "4 | \n", + "NaN | \n", + "0 | \n", + "
| 5037 | \n", + "Color | \n", + "Edward Burns | \n", + "14.0 | \n", + "95.0 | \n", + "0.0 | \n", + "133.0 | \n", + "Caitlin FitzGerald | \n", + "296.0 | \n", + "4584.0 | \n", + "Comedy|Drama | \n", + "... | \n", + "USA | \n", + "Not Rated | \n", + "9000.0 | \n", + "2011-01-01 | \n", + "205.0 | \n", + "6.4 | \n", + "NaN | \n", + "413 | \n", + "-4416.0 | \n", + "0 | \n", + "
| 5038 | \n", + "Color | \n", + "Scott Smith | \n", + "1.0 | \n", + "87.0 | \n", + "2.0 | \n", + "318.0 | \n", + "Daphne Zuniga | \n", + "637.0 | \n", + "NaN | \n", + "Comedy|Drama | \n", + "... | \n", + "Canada | \n", + "NaN | \n", + "NaN | \n", + "2013-01-01 | \n", + "470.0 | \n", + "7.7 | \n", + "NaN | \n", + "84 | \n", + "NaN | \n", + "0 | \n", + "
| 5039 | \n", + "Color | \n", + "NaN | \n", + "43.0 | \n", + "43.0 | \n", + "NaN | \n", + "319.0 | \n", + "Valorie Curry | \n", + "841.0 | \n", + "NaN | \n", + "Crime|Drama|Mystery|Thriller | \n", + "... | \n", + "USA | \n", + "TV-14 | \n", + "NaN | \n", + "NaT | \n", + "593.0 | \n", + "7.5 | \n", + "16.00 | \n", + "32000 | \n", + "NaN | \n", + "0 | \n", + "
| 5040 | \n", + "Color | \n", + "Benjamin Roberds | \n", + "13.0 | \n", + "76.0 | \n", + "0.0 | \n", + "0.0 | \n", + "Maxwell Moody | \n", + "0.0 | \n", + "NaN | \n", + "Drama|Horror|Thriller | \n", + "... | \n", + "USA | \n", + "NaN | \n", + "1400.0 | \n", + "2013-01-01 | \n", + "0.0 | \n", + "6.3 | \n", + "NaN | \n", + "16 | \n", + "NaN | \n", + "0 | \n", + "
| 5041 | \n", + "Color | \n", + "Daniel Hsia | \n", + "14.0 | \n", + "100.0 | \n", + "0.0 | \n", + "489.0 | \n", + "Daniel Henney | \n", + "946.0 | \n", + "10443.0 | \n", + "Comedy|Drama|Romance | \n", + "... | \n", + "USA | \n", + "PG-13 | \n", + "NaN | \n", + "2012-01-01 | \n", + "719.0 | \n", + "6.3 | \n", + "2.35 | \n", + "660 | \n", + "NaN | \n", + "0 | \n", + "
| 5042 | \n", + "Color | \n", + "Jon Gunn | \n", + "43.0 | \n", + "90.0 | \n", + "16.0 | \n", + "16.0 | \n", + "Brian Herzlinger | \n", + "86.0 | \n", + "85222.0 | \n", + "Documentary | \n", + "... | \n", + "USA | \n", + "PG | \n", + "1100.0 | \n", + "2004-01-01 | \n", + "23.0 | \n", + "6.6 | \n", + "1.85 | \n", + "456 | \n", + "84122.0 | \n", + "1 | \n", + "
5043 rows × 30 columns
\n", + "| \n", + " | index | \n", + "plot_keywords | \n", + "
|---|---|---|
| 0 | \n", + "0 | \n", + "avatar | \n", + "
| 1 | \n", + "0 | \n", + "future | \n", + "
| 2 | \n", + "0 | \n", + "marine | \n", + "
| 3 | \n", + "0 | \n", + "native | \n", + "
| 4 | \n", + "0 | \n", + "paraplegic | \n", + "
| 5 | \n", + "1 | \n", + "goddess | \n", + "
| 6 | \n", + "1 | \n", + "marriage ceremony | \n", + "
| 7 | \n", + "1 | \n", + "marriage proposal | \n", + "
| 8 | \n", + "1 | \n", + "pirate | \n", + "
| 9 | \n", + "1 | \n", + "singapore | \n", + "
| 10 | \n", + "2 | \n", + "bomb | \n", + "
| 11 | \n", + "2 | \n", + "espionage | \n", + "
| 12 | \n", + "2 | \n", + "sequel | \n", + "
| 13 | \n", + "2 | \n", + "spy | \n", + "
| 14 | \n", + "2 | \n", + "terrorist | \n", + "
| 15 | \n", + "3 | \n", + "deception | \n", + "
| 16 | \n", + "3 | \n", + "imprisonment | \n", + "
| 17 | \n", + "3 | \n", + "lawlessness | \n", + "
| 18 | \n", + "3 | \n", + "police officer | \n", + "
| 19 | \n", + "3 | \n", + "terrorist plot | \n", + "
| 20 | \n", + "4 | \n", + "\n", + " |
| 21 | \n", + "5 | \n", + "alien | \n", + "
| 22 | \n", + "5 | \n", + "american civil war | \n", + "
| 23 | \n", + "5 | \n", + "male nipple | \n", + "
| 24 | \n", + "5 | \n", + "mars | \n", + "
| 25 | \n", + "5 | \n", + "princess | \n", + "
| 26 | \n", + "6 | \n", + "sandman | \n", + "
| 27 | \n", + "6 | \n", + "spider man | \n", + "
| 28 | \n", + "6 | \n", + "symbiote | \n", + "
| 29 | \n", + "6 | \n", + "venom | \n", + "
| ... | \n", + "... | \n", + "... | \n", + "
| 24220 | \n", + "5034 | \n", + "security guard | \n", + "
| 24221 | \n", + "5034 | \n", + "squatter | \n", + "
| 24222 | \n", + "5035 | \n", + "assassin | \n", + "
| 24223 | \n", + "5035 | \n", + "death | \n", + "
| 24224 | \n", + "5035 | \n", + "guitar | \n", + "
| 24225 | \n", + "5035 | \n", + "gun | \n", + "
| 24226 | \n", + "5035 | \n", + "mariachi | \n", + "
| 24227 | \n", + "5036 | \n", + "jewell | \n", + "
| 24228 | \n", + "5036 | \n", + "mongol | \n", + "
| 24229 | \n", + "5036 | \n", + "nostradamus | \n", + "
| 24230 | \n", + "5036 | \n", + "stepnicka | \n", + "
| 24231 | \n", + "5036 | \n", + "vallone | \n", + "
| 24232 | \n", + "5037 | \n", + "written and directed by cast member | \n", + "
| 24233 | \n", + "5038 | \n", + "fraud | \n", + "
| 24234 | \n", + "5038 | \n", + "postal worker | \n", + "
| 24235 | \n", + "5038 | \n", + "prison | \n", + "
| 24236 | \n", + "5038 | \n", + "theft | \n", + "
| 24237 | \n", + "5038 | \n", + "trial | \n", + "
| 24238 | \n", + "5039 | \n", + "cult | \n", + "
| 24239 | \n", + "5039 | \n", + "fbi | \n", + "
| 24240 | \n", + "5039 | \n", + "hideout | \n", + "
| 24241 | \n", + "5039 | \n", + "prison escape | \n", + "
| 24242 | \n", + "5039 | \n", + "serial killer | \n", + "
| 24243 | \n", + "5040 | \n", + "\n", + " |
| 24244 | \n", + "5041 | \n", + "\n", + " |
| 24245 | \n", + "5042 | \n", + "actress name in title | \n", + "
| 24246 | \n", + "5042 | \n", + "crush | \n", + "
| 24247 | \n", + "5042 | \n", + "date | \n", + "
| 24248 | \n", + "5042 | \n", + "four word title | \n", + "
| 24249 | \n", + "5042 | \n", + "video camera | \n", + "
24250 rows × 2 columns
\n", + "| \n", + " | index | \n", + "genres | \n", + "
|---|---|---|
| 0 | \n", + "0 | \n", + "Action | \n", + "
| 1 | \n", + "0 | \n", + "Adventure | \n", + "
| 2 | \n", + "0 | \n", + "Fantasy | \n", + "
| 3 | \n", + "0 | \n", + "Sci-Fi | \n", + "
| 4 | \n", + "1 | \n", + "Action | \n", + "
| 5 | \n", + "1 | \n", + "Adventure | \n", + "
| 6 | \n", + "1 | \n", + "Fantasy | \n", + "
| 7 | \n", + "2 | \n", + "Action | \n", + "
| 8 | \n", + "2 | \n", + "Adventure | \n", + "
| 9 | \n", + "2 | \n", + "Thriller | \n", + "
| 10 | \n", + "3 | \n", + "Action | \n", + "
| 11 | \n", + "3 | \n", + "Thriller | \n", + "
| 12 | \n", + "4 | \n", + "Documentary | \n", + "
| 13 | \n", + "5 | \n", + "Action | \n", + "
| 14 | \n", + "5 | \n", + "Adventure | \n", + "
| 15 | \n", + "5 | \n", + "Sci-Fi | \n", + "
| 16 | \n", + "6 | \n", + "Action | \n", + "
| 17 | \n", + "6 | \n", + "Adventure | \n", + "
| 18 | \n", + "6 | \n", + "Romance | \n", + "
| 19 | \n", + "7 | \n", + "Adventure | \n", + "
| 20 | \n", + "7 | \n", + "Animation | \n", + "
| 21 | \n", + "7 | \n", + "Comedy | \n", + "
| 22 | \n", + "7 | \n", + "Family | \n", + "
| 23 | \n", + "7 | \n", + "Fantasy | \n", + "
| 24 | \n", + "7 | \n", + "Musical | \n", + "
| 25 | \n", + "7 | \n", + "Romance | \n", + "
| 26 | \n", + "8 | \n", + "Action | \n", + "
| 27 | \n", + "8 | \n", + "Adventure | \n", + "
| 28 | \n", + "8 | \n", + "Sci-Fi | \n", + "
| 29 | \n", + "9 | \n", + "Adventure | \n", + "
| ... | \n", + "... | \n", + "... | \n", + "
| 14474 | \n", + "5031 | \n", + "Horror | \n", + "
| 14475 | \n", + "5031 | \n", + "Thriller | \n", + "
| 14476 | \n", + "5032 | \n", + "Crime | \n", + "
| 14477 | \n", + "5032 | \n", + "Drama | \n", + "
| 14478 | \n", + "5033 | \n", + "Drama | \n", + "
| 14479 | \n", + "5033 | \n", + "Sci-Fi | \n", + "
| 14480 | \n", + "5033 | \n", + "Thriller | \n", + "
| 14481 | \n", + "5034 | \n", + "Thriller | \n", + "
| 14482 | \n", + "5035 | \n", + "Action | \n", + "
| 14483 | \n", + "5035 | \n", + "Crime | \n", + "
| 14484 | \n", + "5035 | \n", + "Drama | \n", + "
| 14485 | \n", + "5035 | \n", + "Romance | \n", + "
| 14486 | \n", + "5035 | \n", + "Thriller | \n", + "
| 14487 | \n", + "5036 | \n", + "Crime | \n", + "
| 14488 | \n", + "5036 | \n", + "Drama | \n", + "
| 14489 | \n", + "5037 | \n", + "Comedy | \n", + "
| 14490 | \n", + "5037 | \n", + "Drama | \n", + "
| 14491 | \n", + "5038 | \n", + "Comedy | \n", + "
| 14492 | \n", + "5038 | \n", + "Drama | \n", + "
| 14493 | \n", + "5039 | \n", + "Crime | \n", + "
| 14494 | \n", + "5039 | \n", + "Drama | \n", + "
| 14495 | \n", + "5039 | \n", + "Mystery | \n", + "
| 14496 | \n", + "5039 | \n", + "Thriller | \n", + "
| 14497 | \n", + "5040 | \n", + "Drama | \n", + "
| 14498 | \n", + "5040 | \n", + "Horror | \n", + "
| 14499 | \n", + "5040 | \n", + "Thriller | \n", + "
| 14500 | \n", + "5041 | \n", + "Comedy | \n", + "
| 14501 | \n", + "5041 | \n", + "Drama | \n", + "
| 14502 | \n", + "5041 | \n", + "Romance | \n", + "
| 14503 | \n", + "5042 | \n", + "Documentary | \n", + "
14504 rows × 2 columns
\n", + "