import pandas as pd
# load the movies workbook into a dataframe
excel_path = "movies.xlsx"
mov = pd.read_excel(excel_path)
# preview the first 7 rows (positional slice, same rows as head(7))
mov.iloc[:7]
| | Title | US Gross | Worldwide Gross | Production Budget | Release Date | Distributor | Source | Major Genre | Creative Type | Director | Rotten Tomatoes Rating | IMDB Rating | IMDB Votes |
|---|---|---|---|---|---|---|---|---|---|---|---|---|---|
| 0 | The Land Girls | 146083 | 146083 | 8000000.0 | 1998-06-12 00:00:00 | Gramercy | NaN | NaN | NaN | NaN | NaN | 6.1 | 1071.0 |
| 1 | First Love, Last Rites | 10876 | 10876 | 300000.0 | 1998-08-07 00:00:00 | Strand | NaN | Drama | NaN | NaN | NaN | 6.9 | 207.0 |
| 2 | I Married a Strange Person | 203134 | 203134 | 250000.0 | 1998-08-28 00:00:00 | Lionsgate | NaN | Comedy | NaN | NaN | NaN | 6.8 | 865.0 |
| 3 | Let's Talk About Sex | 373615 | 373615 | 300000.0 | 1998-09-11 00:00:00 | Fine Line | NaN | Comedy | NaN | NaN | 13.0 | NaN | NaN |
| 4 | Slam | 1009819 | 1087521 | 1000000.0 | 1998-10-09 00:00:00 | Trimark | Original Screenplay | Drama | Contemporary Fiction | NaN | 62.0 | 3.4 | 165.0 |
| 5 | Mississippi Mermaid | 24551 | 2624551 | 1600000.0 | 1999-01-15 00:00:00 | MGM | NaN | NaN | NaN | NaN | NaN | NaN | NaN |
| 6 | Following | 44705 | 44705 | 6000.0 | 1999-04-04 00:00:00 | Zeitgeist | NaN | NaN | NaN | Christopher Nolan | NaN | 7.7 | 15133.0 |
# preview the final 5 rows (positional slice, same rows as tail())
mov.iloc[-5:]
| | Title | US Gross | Worldwide Gross | Production Budget | Release Date | Distributor | Source | Major Genre | Creative Type | Director | Rotten Tomatoes Rating | IMDB Rating | IMDB Votes |
|---|---|---|---|---|---|---|---|---|---|---|---|---|---|
| 3196 | Zack and Miri Make a Porno | 31452765 | 36851125 | 24000000.0 | 2008-10-31 00:00:00 | Weinstein Co. | Original Screenplay | Comedy | Contemporary Fiction | Kevin Smith | 65.0 | 7.0 | 55687.0 |
| 3197 | Zodiac | 33080084 | 83080084 | 85000000.0 | 2007-03-02 00:00:00 | Paramount Pictures | Based on Book/Short Story | Thriller/Suspense | Dramatization | David Fincher | 89.0 | NaN | NaN |
| 3198 | Zoom | 11989328 | 12506188 | 35000000.0 | 2006-08-11 00:00:00 | Sony Pictures | Based on Comic/Graphic Novel | Adventure | Super Hero | Peter Hewitt | 3.0 | 3.4 | 7424.0 |
| 3199 | The Legend of Zorro | 45575336 | 141475336 | 80000000.0 | 2005-10-28 00:00:00 | Sony Pictures | Remake | Adventure | Historical Fiction | Martin Campbell | 26.0 | 5.7 | 21161.0 |
| 3200 | The Mask of Zorro | 93828745 | 233700000 | 65000000.0 | 1998-07-17 00:00:00 | Sony Pictures | Remake | Adventure | Historical Fiction | Martin Campbell | 82.0 | 6.7 | 4789.0 |
# list the column labels (for a dataframe, keys() returns the columns Index)
mov.keys()
Index(['Title', 'US Gross', 'Worldwide Gross', 'Production Budget',
'Release Date', 'Distributor', 'Source', 'Major Genre', 'Creative Type',
'Director', 'Rotten Tomatoes Rating', 'IMDB Rating', 'IMDB Votes'],
dtype='object')
# pull out the production budget column as a Series
mov.loc[:, 'Production Budget']
0 8000000.0
1 300000.0
2 250000.0
3 300000.0
4 1000000.0
...
3196 24000000.0
3197 85000000.0
3198 35000000.0
3199 80000000.0
3200 65000000.0
Name: Production Budget, Length: 3201, dtype: float64
# number of rows in the dataframe (first entry of its shape)
mov.shape[0]
3201
# largest production budget in the dataset
budget = mov['Production Budget']
budget.max()
300000000.0
# smallest production budget in the dataset
budget = mov['Production Budget']
budget.min()
218.0
# summary statistics for the IMDB vote counts
imdb_votes = mov['IMDB Votes']
imdb_votes.describe()
count 2988.000000
mean 29908.644578
std 44937.582335
min 18.000000
25% 4828.500000
50% 15106.000000
75% 35810.500000
max 519541.000000
Name: IMDB Votes, dtype: float64
# keep only the rows whose Director is Steven Spielberg
is_spielberg = mov['Director'].eq('Steven Spielberg')
mov_ss = mov.loc[is_spielberg]
mov_ss
| | Title | US Gross | Worldwide Gross | Production Budget | Release Date | Distributor | Source | Major Genre | Creative Type | Director | Rotten Tomatoes Rating | IMDB Rating | IMDB Votes |
|---|---|---|---|---|---|---|---|---|---|---|---|---|---|
| 22 | 1941 | 34175000 | 94875000 | 32000000.0 | 1979-12-14 00:00:00 | Universal | Original Screenplay | Comedy | Historical Fiction | Steven Spielberg | 33.0 | 5.6 | 13364.0 |
| 163 | Close Encounters of the Third Kind | 166000000 | 337700000 | 20000000.0 | 1977-11-16 00:00:00 | Sony Pictures | Original Screenplay | Adventure | Science Fiction | Steven Spielberg | 95.0 | 7.8 | 59049.0 |
| 183 | The Color Purple | 93589701 | 93589701 | 15000000.0 | 1985-12-18 00:00:00 | Warner Bros. | Based on Book/Short Story | Drama | Historical Fiction | Steven Spielberg | 88.0 | 7.7 | 26962.0 |
| 296 | ET: The Extra-Terrestrial | 435110554 | 792910554 | 10500000.0 | 1982-06-11 00:00:00 | Universal | Original Screenplay | Drama | Science Fiction | Steven Spielberg | NaN | 7.9 | 105028.0 |
| 429 | Hook | 119654823 | 300854823 | 70000000.0 | 1991-12-11 00:00:00 | Sony Pictures | Based on Book/Short Story | Adventure | Kids Fiction | Steven Spielberg | 24.0 | 6.2 | 60159.0 |
| 485 | Jurassic Park | 357067947 | 923067947 | 63000000.0 | 1993-06-10 00:00:00 | Universal | Based on Book/Short Story | Action | Science Fiction | Steven Spielberg | 87.0 | 7.9 | 151365.0 |
| 487 | Jaws | 260000000 | 470700000 | 12000000.0 | 1975-06-20 00:00:00 | Universal | Based on Book/Short Story | Horror | Contemporary Fiction | Steven Spielberg | 100.0 | 8.3 | 138017.0 |
| 640 | Indiana Jones and the Temple of Doom | 179880271 | 333080271 | 28000000.0 | 1984-05-23 00:00:00 | Paramount Pictures | Original Screenplay | Adventure | Historical Fiction | Steven Spielberg | 85.0 | 7.5 | 110761.0 |
| 641 | Indiana Jones and the Last Crusade | 197171806 | 474171806 | 48000000.0 | 1989-05-24 00:00:00 | Paramount Pictures | Original Screenplay | Adventure | Historical Fiction | Steven Spielberg | 89.0 | 8.3 | 171572.0 |
| 767 | Raiders of the Lost Ark | 245034358 | 386800358 | 20000000.0 | 1981-06-12 00:00:00 | Paramount Pictures | Original Screenplay | Adventure | Historical Fiction | Steven Spielberg | NaN | 8.7 | 242661.0 |
| 816 | Schindler's List | 96067179 | 321200000 | 25000000.0 | 1993-12-15 00:00:00 | Universal | Based on Real Life Events | Drama | Dramatization | Steven Spielberg | 97.0 | 8.9 | 276283.0 |
| 993 | Twilight Zone: The Movie | 29500000 | 29500000 | 10000000.0 | 1983-06-24 00:00:00 | Warner Bros. | Based on TV | Horror | Fantasy | Steven Spielberg | 67.0 | 6.3 | 12054.0 |
| 1167 | Amistad | 44212592 | 44212592 | 40000000.0 | 1997-12-12 00:00:00 | Dreamworks SKG | Based on Real Life Events | Drama | Dramatization | Steven Spielberg | 77.0 | 7.1 | 28477.0 |
| 1208 | Artificial Intelligence: AI | 78616689 | 235900000 | 90000000.0 | 2001-06-29 00:00:00 | Warner Bros. | Based on Book/Short Story | Drama | Science Fiction | Steven Spielberg | NaN | 6.9 | 91901.0 |
| 1418 | Catch Me if You Can | 164606800 | 351106800 | 52000000.0 | 2002-12-25 00:00:00 | Dreamworks SKG | Based on Book/Short Story | Drama | Dramatization | Steven Spielberg | 96.0 | 5.7 | 224.0 |
| 2029 | Indiana Jones and the Kingdom of the Crystal S... | 317023851 | 786558145 | 185000000.0 | 2008-05-22 00:00:00 | Paramount Pictures | Original Screenplay | Adventure | Historical Fiction | Steven Spielberg | 77.0 | 6.6 | 135071.0 |
| 2217 | The Lost World: Jurassic Park | 229086679 | 786686679 | 75000000.0 | 1997-05-22 00:00:00 | Universal | Based on Book/Short Story | Action | Science Fiction | Steven Spielberg | NaN | 6.0 | 77124.0 |
| 2347 | Minority Report | 132024714 | 358824714 | 102000000.0 | 2002-06-21 00:00:00 | 20th Century Fox | Based on Book/Short Story | Action | Science Fiction | Steven Spielberg | 91.0 | 7.7 | 135142.0 |
| 2372 | Munich | 47379090 | 130279090 | 75000000.0 | 2005-12-23 00:00:00 | Universal | Based on Real Life Events | Drama | Dramatization | Steven Spielberg | 78.0 | 7.8 | 79529.0 |
| 2893 | Saving Private Ryan | 216335085 | 481635085 | 65000000.0 | 1998-07-24 00:00:00 | Dreamworks SKG | Original Screenplay | Drama | Historical Fiction | Steven Spielberg | 91.0 | 8.5 | 270540.0 |
| 2967 | The Adventures of Tintin: Secret of the Unicorn | 0 | 0 | 130000000.0 | 2011-12-23 00:00:00 | Paramount Pictures | Based on Comic/Graphic Novel | Adventure | Contemporary Fiction | Steven Spielberg | NaN | NaN | NaN |
| 2998 | The Terminal | 77073959 | 218673959 | 75000000.0 | 2004-06-18 00:00:00 | Dreamworks SKG | Based on Real Life Events | Drama | Dramatization | Steven Spielberg | 60.0 | 7.1 | 79803.0 |
| 3099 | The War of the Worlds | 234280354 | 591745532 | 132000000.0 | 2005-06-29 00:00:00 | Paramount Pictures | Remake | Action | Science Fiction | Steven Spielberg | NaN | 7.2 | 12074.0 |
# Spielberg title(s) with the highest US gross (ties would all be shown)
top_us_gross = mov_ss['US Gross'].max()
mov_ss.loc[mov_ss['US Gross'].eq(top_us_gross)]
| | Title | US Gross | Worldwide Gross | Production Budget | Release Date | Distributor | Source | Major Genre | Creative Type | Director | Rotten Tomatoes Rating | IMDB Rating | IMDB Votes |
|---|---|---|---|---|---|---|---|---|---|---|---|---|---|
| 296 | ET: The Extra-Terrestrial | 435110554 | 792910554 | 10500000.0 | 1982-06-11 00:00:00 | Universal | Original Screenplay | Drama | Science Fiction | Steven Spielberg | NaN | 7.9 | 105028.0 |
# Spielberg title(s) with the highest worldwide gross (ties would all be shown)
top_worldwide_gross = mov_ss['Worldwide Gross'].max()
mov_ss.loc[mov_ss['Worldwide Gross'].eq(top_worldwide_gross)]
| | Title | US Gross | Worldwide Gross | Production Budget | Release Date | Distributor | Source | Major Genre | Creative Type | Director | Rotten Tomatoes Rating | IMDB Rating | IMDB Votes |
|---|---|---|---|---|---|---|---|---|---|---|---|---|---|
| 485 | Jurassic Park | 357067947 | 923067947 | 63000000.0 | 1993-06-10 00:00:00 | Universal | Based on Book/Short Story | Action | Science Fiction | Steven Spielberg | 87.0 | 7.9 | 151365.0 |
# Spielberg title(s) with the lowest US gross (ties would all be shown)
# NOTE(review): the matching row has a US Gross of 0, which may be a
# placeholder for unreported figures rather than a real total -- confirm
lowest_us_gross = mov_ss['US Gross'].min()
mov_ss.loc[mov_ss['US Gross'].eq(lowest_us_gross)]
| | Title | US Gross | Worldwide Gross | Production Budget | Release Date | Distributor | Source | Major Genre | Creative Type | Director | Rotten Tomatoes Rating | IMDB Rating | IMDB Votes |
|---|---|---|---|---|---|---|---|---|---|---|---|---|---|
| 2967 | The Adventures of Tintin: Secret of the Unicorn | 0 | 0 | 130000000.0 | 2011-12-23 00:00:00 | Paramount Pictures | Based on Comic/Graphic Novel | Adventure | Contemporary Fiction | Steven Spielberg | NaN | NaN | NaN |