# IPython shell escape: runs `pwd` and stores its output lines in file_path.
# NOTE(review): the trailing "#%cd%" looks like a reminder of the Windows
# equivalent command — confirm.
file_path = !pwd #%cd%
print(file_path)
['/home/jujubinha/opensubtitle']
import pandas as pd
pd.set_option('display.max_columns', 500)
import numpy as np
import requests
import base64
import gzip
# Download the IMDb title datasets, keep each raw .gz file on disk and cache
# the parsed table as a pickle so later cells can reload it without
# downloading or parsing again.
for dataset in ['basics','ratings']: #,'akas']:
    raw_data = requests.get('https://datasets.imdbws.com/title.'+dataset+'.tsv.gz', timeout=60)
    # Stop on an HTTP error instead of saving an error page as a ".gz" file
    # that would only fail later, inside read_csv, with a confusing message.
    raw_data.raise_for_status()
    with open(dataset+'.gz', 'wb') as file:
        file.write(raw_data.content)
    # Parse only after the with-block has closed (and flushed) the file.
    # The two-character separator r'\t' is treated by pandas as a regular
    # expression, which is why the python engine is requested.
    df = pd.read_csv(dataset+'.gz', compression='gzip', sep=r'\t', engine='python')
    df.to_pickle(dataset+'.pickle')
# Reload both tables from their pickle caches and preview the first rows of
# the basics table.
basics, ratings = (pd.read_pickle(name + '.pickle') for name in ('basics', 'ratings'))
#akas = pd.read_pickle('akas.pickle')
basics.head()
<style scoped>
.dataframe tbody tr th:only-of-type {
vertical-align: middle;
}
</style>
.dataframe tbody tr th {
vertical-align: top;
}
.dataframe thead th {
text-align: right;
}
tconst | titleType | primaryTitle | originalTitle | isAdult | startYear | endYear | runtimeMinutes | genres | |
---|---|---|---|---|---|---|---|---|---|
0 | tt0000001 | short | Carmencita | Carmencita | 0 | 1894 | \N | 1 | Documentary,Short |
1 | tt0000002 | short | Le clown et ses chiens | Le clown et ses chiens | 0 | 1892 | \N | 5 | Animation,Short |
2 | tt0000003 | short | Pauvre Pierrot | Pauvre Pierrot | 0 | 1892 | \N | 4 | Animation,Comedy,Romance |
3 | tt0000004 | short | Un bon bock | Un bon bock | 0 | 1892 | \N | \N | Animation,Short |
4 | tt0000005 | short | Blacksmith Scene | Blacksmith Scene | 0 | 1893 | \N | 1 | Comedy,Short |
# Preview the first rows of the ratings table.
ratings.head()
<style scoped>
.dataframe tbody tr th:only-of-type {
vertical-align: middle;
}
</style>
.dataframe tbody tr th {
vertical-align: top;
}
.dataframe thead th {
text-align: right;
}
tconst | averageRating | numVotes | |
---|---|---|---|
0 | tt0000001 | 5.8 | 1486 |
1 | tt0000002 | 6.4 | 179 |
2 | tt0000003 | 6.6 | 1119 |
3 | tt0000004 | 6.4 | 109 |
4 | tt0000005 | 6.2 | 1822 |
# Join title metadata with its rating on the shared 'tconst' key, then plot
# vote count against average rating for every joined title.
final = basics.merge(ratings, on='tconst')
final.plot.scatter(
    x='averageRating',
    y='numVotes',
    alpha=0.1,
    figsize=(15, 15),
)
<matplotlib.axes._subplots.AxesSubplot at 0x7f41f8829710>
# Show the column dtypes of the merged table.
final.dtypes
tconst object
titleType object
primaryTitle object
originalTitle object
isAdult int64
startYear object
endYear object
runtimeMinutes object
genres object
averageRating float64
numVotes int64
dtype: object
# Disabled experiment: turn the comma-separated genres string into a list.
#final['genres'] = final['genres'].str.split(',')
# List the distinct title types present in the merged table.
final['titleType'].unique()
array(['short', 'movie', 'tvMovie', 'tvSeries', 'tvEpisode', 'tvShort',
'tvMiniSeries', 'tvSpecial', 'video', 'videoGame'], dtype=object)
def arruma(series):
    """Convert a column of numeric strings to numbers.

    Values that cannot be parsed as a number become NaN instead of raising.
    ``downcast='integer'`` asks pandas for the smallest integer dtype that
    fits; a result that contains NaN stays floating point.

    Parameters
    ----------
    series : pandas.Series
        Column to convert.

    Returns
    -------
    pandas.Series
        The numeric version of ``series``.
    """
    # 'coerce' is the documented spelling; the previous 'coerse' is rejected
    # by current pandas with "invalid error value specified".
    return pd.to_numeric(series, errors='coerce', downcast='integer') #.fillna(0).astype(int).replace(0,'')
# Give the columns proper dtypes: isAdult becomes a boolean, and the three
# numeric columns that were read as strings go through arruma().
final['isAdult'] = final['isAdult'].astype(bool)
for column in ('runtimeMinutes', 'startYear', 'endYear'):
    final[column] = arruma(final[column])
# Cache the cleaned table, then show the resulting dtypes.
final.to_pickle('final.pickle')
final.dtypes
tconst object
titleType object
primaryTitle object
originalTitle object
isAdult bool
startYear float64
endYear float64
runtimeMinutes float64
genres object
averageRating float64
numVotes int64
dtype: object
# Display the cleaned, merged table.
final
<style scoped>
.dataframe tbody tr th:only-of-type {
vertical-align: middle;
}
</style>
.dataframe tbody tr th {
vertical-align: top;
}
.dataframe thead th {
text-align: right;
}
tconst | titleType | primaryTitle | originalTitle | isAdult | startYear | endYear | runtimeMinutes | genres | averageRating | numVotes | |
---|---|---|---|---|---|---|---|---|---|---|---|
0 | tt0000001 | short | Carmencita | Carmencita | False | 1894.0 | NaN | 1.0 | Documentary,Short | 5.8 | 1486 |
1 | tt0000002 | short | Le clown et ses chiens | Le clown et ses chiens | False | 1892.0 | NaN | 5.0 | Animation,Short | 6.4 | 179 |
2 | tt0000003 | short | Pauvre Pierrot | Pauvre Pierrot | False | 1892.0 | NaN | 4.0 | Animation,Comedy,Romance | 6.6 | 1119 |
3 | tt0000004 | short | Un bon bock | Un bon bock | False | 1892.0 | NaN | NaN | Animation,Short | 6.4 | 109 |
4 | tt0000005 | short | Blacksmith Scene | Blacksmith Scene | False | 1893.0 | NaN | 1.0 | Comedy,Short | 6.2 | 1822 |
5 | tt0000006 | short | Chinese Opium Den | Chinese Opium Den | False | 1894.0 | NaN | 1.0 | Short | 5.6 | 96 |
6 | tt0000007 | short | Corbett and Courtney Before the Kinetograph | Corbett and Courtney Before the Kinetograph | False | 1894.0 | NaN | 1.0 | Short,Sport | 5.5 | 596 |
7 | tt0000008 | short | Edison Kinetoscopic Record of a Sneeze | Edison Kinetoscopic Record of a Sneeze | False | 1894.0 | NaN | 1.0 | Documentary,Short | 5.6 | 1587 |
8 | tt0000009 | movie | Miss Jerry | Miss Jerry | False | 1894.0 | NaN | 45.0 | Romance | 5.5 | 77 |
9 | tt0000010 | short | Exiting the Factory | La sortie de l'usine Lumière à Lyon | False | 1895.0 | NaN | 1.0 | Documentary,Short | 6.9 | 5287 |
10 | tt0000011 | short | Akrobatisches Potpourri | Akrobatisches Potpourri | False | 1895.0 | NaN | 1.0 | Documentary,Short | 5.4 | 220 |
11 | tt0000012 | short | The Arrival of a Train | L'arrivée d'un train à La Ciotat | False | 1896.0 | NaN | 1.0 | Documentary,Short | 7.4 | 8961 |
12 | tt0000013 | short | The Photographical Congress Arrives in Lyon | Neuville-sur-Saône: Débarquement du congrès de... | False | 1895.0 | NaN | 1.0 | Documentary,Short | 5.8 | 1374 |
13 | tt0000014 | short | The Sprinkler Sprinkled | L'arroseur arrosé | False | 1895.0 | NaN | 1.0 | Comedy,Short | 7.2 | 3901 |
14 | tt0000015 | short | Autour d'une cabine | Autour d'une cabine | False | 1894.0 | NaN | 2.0 | Animation,Short | 6.2 | 694 |
15 | tt0000016 | short | Barque sortant du port | Barque sortant du port | False | 1895.0 | NaN | 1.0 | Documentary,Short | 5.9 | 1019 |
16 | tt0000017 | short | Italienischer Bauerntanz | Italienischer Bauerntanz | False | 1895.0 | NaN | 1.0 | Documentary,Short | 4.8 | 202 |
17 | tt0000018 | short | Das boxende Känguruh | Das boxende Känguruh | False | 1895.0 | NaN | 1.0 | Short | 5.5 | 424 |
18 | tt0000019 | short | The Clown Barber | The Clown Barber | False | 1898.0 | NaN | NaN | Comedy,Short | 6.6 | 13 |
19 | tt0000020 | short | The Derby 1895 | The Derby 1895 | False | 1895.0 | NaN | 1.0 | Documentary,Short,Sport | 5.1 | 233 |
20 | tt0000022 | short | Blacksmith Scene | Les forgerons | False | 1895.0 | NaN | 1.0 | Documentary,Short | 5.2 | 766 |
21 | tt0000023 | short | The Sea | Baignade en mer | False | 1895.0 | NaN | 1.0 | Documentary,Short | 5.7 | 971 |
22 | tt0000024 | short | Opening of the Kiel Canal | Opening of the Kiel Canal | False | 1895.0 | NaN | NaN | News,Short | 5.8 | 21 |
23 | tt0000025 | short | The Oxford and Cambridge University Boat Race | The Oxford and Cambridge University Boat Race | False | 1895.0 | NaN | NaN | News,Short,Sport | 4.8 | 19 |
24 | tt0000026 | short | The Messers. Lumière at Cards | Partie d'écarté | False | 1896.0 | NaN | 1.0 | Documentary,Short | 5.7 | 1173 |
25 | tt0000027 | short | Cordeliers' Square in Lyon | Place des Cordeliers à Lyon | False | 1895.0 | NaN | 1.0 | Documentary,Short | 5.6 | 801 |
26 | tt0000028 | short | Fishing for Goldfish | La pêche aux poissons rouges | False | 1895.0 | NaN | 1.0 | Documentary,Short | 5.2 | 729 |
27 | tt0000029 | short | Baby's Dinner | Repas de bébé | False | 1895.0 | NaN | 1.0 | Documentary,Short | 5.9 | 2531 |
28 | tt0000030 | short | Rough Sea at Dover | Rough Sea at Dover | False | 1895.0 | NaN | 1.0 | Documentary,Short | 5.3 | 618 |
29 | tt0000031 | short | Jumping the Blanket | Le saut à la couverture | False | 1895.0 | NaN | 1.0 | Documentary,Short | 5.6 | 710 |
... | ... | ... | ... | ... | ... | ... | ... | ... | ... | ... | ... |
922739 | tt9910056 | tvEpisode | 205 (Auditions) | 205 (Auditions) | False | 2019.0 | NaN | 84.0 | Game-Show,Music,Reality-TV | 6.9 | 14 |
922740 | tt9910118 | tvEpisode | Episode #7.4 | Episode #7.4 | False | 2019.0 | NaN | NaN | Reality-TV | 7.4 | 10 |
922741 | tt9910120 | tvEpisode | Episode #7.5 | Episode #7.5 | False | 2019.0 | NaN | NaN | Reality-TV | 7.4 | 8 |
922742 | tt9910122 | tvEpisode | Episode #7.6 | Episode #7.6 | False | 2019.0 | NaN | NaN | Reality-TV | 6.9 | 8 |
922743 | tt9910124 | tvEpisode | Episode #7.7 | Episode #7.7 | False | 2019.0 | NaN | NaN | Reality-TV | 7.1 | 8 |
922744 | tt9910506 | short | Bulanti | Bulanti | False | 2017.0 | NaN | 7.0 | Short | 8.7 | 7 |
922745 | tt9910572 | tvEpisode | Jûgo to juin | Jûgo to juin | False | 2019.0 | NaN | NaN | Action,Adventure,Animation | 8.3 | 19 |
922746 | tt9910728 | tvSeries | Zalim Istanbul | Zalim Istanbul | False | 2019.0 | NaN | 120.0 | Drama | 8.9 | 7 |
922747 | tt9911774 | movie | Padmavyuhathile Abhimanyu | Padmavyuhathile Abhimanyu | False | 2019.0 | NaN | 130.0 | Drama | 8.5 | 363 |
922748 | tt9913056 | movie | Swarm Season | Swarm Season | False | 2019.0 | NaN | 86.0 | Documentary | 6.2 | 5 |
922749 | tt9913084 | movie | Diabolik sono io | Diabolik sono io | False | 2019.0 | NaN | 75.0 | Documentary | 6.2 | 6 |
922750 | tt9913544 | tvMovie | Un Américain nommé Kazan | Un Américain nommé Kazan | False | 2018.0 | NaN | 53.0 | Biography,Documentary | 6.6 | 5 |
922751 | tt9914120 | tvEpisode | Episode #1.2 | Episode #1.2 | False | 2019.0 | NaN | NaN | Biography,Drama,History | 7.0 | 9 |
922752 | tt9914156 | tvEpisode | Triple Frontier | Triple Frontier | False | 2019.0 | NaN | NaN | Talk-Show | 6.4 | 132 |
922753 | tt9914286 | movie | Sokagin Çocuklari | Sokagin Çocuklari | False | 2019.0 | NaN | 98.0 | Drama,Family | 9.7 | 59 |
922754 | tt9914458 | video | Alien Messiah | Alien Messiah | False | 2019.0 | NaN | 75.0 | Sci-Fi | 2.5 | 13 |
922755 | tt9914546 | tvSeries | Moja Generacija Z | Moja Generacija Z | False | 2019.0 | NaN | 30.0 | Comedy | 3.7 | 25 |
922756 | tt9915144 | tvSeries | Never Ever | Never Ever | False | 2018.0 | NaN | NaN | Documentary,Talk-Show | 10.0 | 6 |
922757 | tt9915686 | tvSeries | Khatra Khatra Khatra | Khatra Khatra Khatra | False | 2019.0 | NaN | NaN | Reality-TV | 8.4 | 14 |
922758 | tt9915898 | tvEpisode | Time for Farewell! Pudding's One Last Request! | Time for Farewell! Pudding's One Last Request! | False | 2019.0 | NaN | NaN | Action,Adventure,Animation | 9.1 | 36 |
922759 | tt9915906 | tvEpisode | The World in Shock! The Fifth Emperor of the S... | The World in Shock! The Fifth Emperor of the S... | False | 2019.0 | NaN | NaN | Action,Adventure,Animation | 7.5 | 23 |
922760 | tt9915910 | tvEpisode | Episode #1.34 | Episode #1.34 | False | 2019.0 | NaN | NaN | Comedy,Romance | 8.6 | 28 |
922761 | tt9916114 | tvEpisode | Nothing But Truffle | Nothing But Truffle | False | 2019.0 | NaN | NaN | Action,Adventure,Animation | 6.0 | 5 |
922762 | tt9916192 | tvMovie | Danielle Darrieux: Il est poli d'être gai! | Danielle Darrieux: Il est poli d'être gai! | False | 2019.0 | NaN | 53.0 | Biography | 7.8 | 5 |
922763 | tt9916316 | tvEpisode | Tim Mälzer vs. Max Strohe | Tim Mälzer vs. Max Strohe | False | 2019.0 | NaN | NaN | Reality-TV | 8.4 | 5 |
922764 | tt9916380 | tvSeries | Meie aasta Aafrikas | Meie aasta Aafrikas | False | 2019.0 | NaN | 43.0 | Adventure,Comedy,Family | 9.7 | 58 |
922765 | tt9916420 | tvEpisode | Episode #21.1 | Episode #21.1 | False | 2019.0 | NaN | NaN | Comedy,Game-Show | 7.0 | 5 |
922766 | tt9916460 | tvMovie | Pink Taxi | Pink Taxi | False | 2019.0 | NaN | NaN | Comedy | 9.2 | 12 |
922767 | tt9916720 | short | The Nun 2 | The Nun 2 | False | 2019.0 | NaN | 10.0 | Horror,Short | 5.2 | 11 |
922768 | tt9916766 | tvEpisode | Episode #10.15 | Episode #10.15 | False | 2019.0 | NaN | 43.0 | Family,Reality-TV | 7.2 | 5 |
922769 rows × 11 columns
# Keep only the rows whose titleType is 'movie'. The explicit .copy() makes
# `movie` an independent frame, so adding columns to it later does not
# trigger pandas' SettingWithCopyWarning.
movie = final[final.titleType == 'movie'].copy()
movie
<style scoped>
.dataframe tbody tr th:only-of-type {
vertical-align: middle;
}
</style>
.dataframe tbody tr th {
vertical-align: top;
}
.dataframe thead th {
text-align: right;
}
tconst | titleType | primaryTitle | originalTitle | isAdult | startYear | endYear | runtimeMinutes | genres | averageRating | numVotes | |
---|---|---|---|---|---|---|---|---|---|---|---|
8 | tt0000009 | movie | Miss Jerry | Miss Jerry | False | 1894.0 | NaN | 45.0 | Romance | 5.5 | 77 |
143 | tt0000147 | movie | The Corbett-Fitzsimmons Fight | The Corbett-Fitzsimmons Fight | False | 1897.0 | NaN | 20.0 | Documentary,News,Sport | 5.2 | 290 |
237 | tt0000335 | movie | Soldiers of the Cross | Soldiers of the Cross | False | 1900.0 | NaN | NaN | Biography,Drama | 6.3 | 39 |
343 | tt0000574 | movie | The Story of the Kelly Gang | The Story of the Kelly Gang | False | 1906.0 | NaN | 70.0 | Biography,Crime,Drama | 6.2 | 505 |
361 | tt0000615 | movie | Robbery Under Arms | Robbery Under Arms | False | 1907.0 | NaN | NaN | Drama | 4.8 | 14 |
367 | tt0000630 | movie | Hamlet | Amleto | False | 1908.0 | NaN | NaN | Drama | 2.9 | 11 |
394 | tt0000675 | movie | Don Quijote | Don Quijote | False | 1908.0 | NaN | NaN | Drama | 4.3 | 10 |
395 | tt0000676 | movie | Don Álvaro o la fuerza del sino | Don Álvaro o la fuerza del sino | False | 1908.0 | NaN | NaN | Drama | 3.8 | 8 |
396 | tt0000679 | movie | The Fairylogue and Radio-Plays | The Fairylogue and Radio-Plays | False | 1908.0 | NaN | 120.0 | Adventure,Fantasy | 4.8 | 33 |
428 | tt0000739 | movie | El pastorcito de Torrente | El pastorcito de Torrente | False | 1908.0 | NaN | NaN | Drama | 6.1 | 8 |
457 | tt0000793 | movie | Andreas Hofer | Andreas Hofer | False | 1909.0 | NaN | NaN | Drama | 4.4 | 8 |
497 | tt0000862 | movie | Faldgruben | Faldgruben | False | 1909.0 | NaN | NaN | \N | 4.6 | 9 |
510 | tt0000886 | movie | Hamlet, Prince of Denmark | Hamlet | False | 1910.0 | NaN | NaN | Drama | 5.1 | 19 |
513 | tt0000891 | movie | Cycle Rider and the Witch | Heksen og cyklisten | False | 1909.0 | NaN | NaN | \N | 5.1 | 17 |
538 | tt0000941 | movie | Locura de amor | Locura de amor | False | 1909.0 | NaN | NaN | Drama | 4.4 | 9 |
562 | tt0000992 | movie | De onde Veje | De onde Veje | False | 1909.0 | NaN | NaN | \N | 4.6 | 8 |
575 | tt0001028 | movie | Salome Mad | Salome Mad | False | 1909.0 | NaN | NaN | Comedy | 4.1 | 9 |
582 | tt0001038 | movie | Sherlock Holmes VI | Sherlock Holmes VI | False | 1910.0 | NaN | NaN | \N | 4.1 | 12 |
585 | tt0001049 | movie | Gøngehøvdingen | Gøngehøvdingen | False | 1909.0 | NaN | NaN | Drama,War | 3.8 | 8 |
604 | tt0001101 | movie | Abraham Lincoln's Clemency | Abraham Lincoln's Clemency | False | 1910.0 | NaN | NaN | \N | 4.5 | 15 |
611 | tt0001112 | movie | Amleto | Amleto | False | 1910.0 | NaN | NaN | Drama | 3.4 | 15 |
612 | tt0001113 | movie | Amor gitano | Amor gitano | False | 1910.0 | NaN | NaN | \N | 5.5 | 8 |
613 | tt0001115 | movie | Ansigttyven I | Ansigttyven I | False | 1910.0 | NaN | NaN | Crime | 4.7 | 11 |
614 | tt0001116 | movie | Ansigttyven II | Ansigttyven II | False | 1910.0 | NaN | NaN | \N | 4.9 | 10 |
619 | tt0001122 | movie | The Red Inn | L'auberge rouge | False | 1910.0 | NaN | NaN | \N | 5.2 | 8 |
630 | tt0001159 | movie | The Connecticut Yankee | The Connecticut Yankee | False | 1910.0 | NaN | NaN | \N | 5.5 | 8 |
633 | tt0001175 | movie | Camille | La dame aux camélias | False | 1912.0 | NaN | NaN | Drama,Romance | 5.6 | 22 |
635 | tt0001184 | movie | Don Juan de Serrallonga | Don Juan de Serrallonga | False | 1910.0 | NaN | 58.0 | Adventure,Drama | 3.1 | 10 |
637 | tt0001186 | movie | Dorothy and the Scarecrow in Oz | Dorothy and the Scarecrow in Oz | False | 1910.0 | NaN | NaN | \N | 5.2 | 43 |
651 | tt0001230 | movie | Gentleman Joe | Gentleman Joe | False | 1910.0 | NaN | NaN | \N | 5.0 | 8 |
... | ... | ... | ... | ... | ... | ... | ... | ... | ... | ... | ... |
922443 | tt9863566 | movie | Urbanus: De Vuilnisheld | Urbanus: De Vuilnisheld | False | 2019.0 | NaN | 72.0 | Animation,Comedy | 5.1 | 24 |
922463 | tt9866284 | movie | The Far Green Country | The Far Green Country | False | 2018.0 | NaN | 69.0 | Documentary | 7.5 | 16 |
922465 | tt9866344 | movie | Mon Ami Walid | Mon Ami Walid | False | 2019.0 | NaN | 72.0 | Comedy,Drama | 6.9 | 15 |
922467 | tt9866700 | movie | Paranormal Investigation | Paranormal Investigation | False | 2018.0 | NaN | 92.0 | Horror,Thriller | 3.6 | 244 |
922469 | tt9866736 | movie | Rise: Ini Kalilah | Rise: Ini Kalilah | False | 2018.0 | NaN | NaN | \N | 5.7 | 6 |
922519 | tt9870612 | movie | Randy Writes a Novel | Randy Writes a Novel | False | 2018.0 | NaN | 70.0 | Comedy | 9.2 | 18 |
922521 | tt9870726 | movie | Gholamreza Takhti | Gholamreza Takhti | False | 2019.0 | NaN | NaN | Biography,Drama,Sport | 7.1 | 47 |
922531 | tt9872556 | movie | Momenti di trascurabile felicità | Momenti di trascurabile felicità | False | 2019.0 | NaN | 93.0 | Comedy | 6.6 | 121 |
922532 | tt9872616 | movie | Marid | Marid | False | 2019.0 | NaN | NaN | Horror | 4.2 | 10 |
922556 | tt9878504 | movie | Hollywood aan de schelde | Hollywood aan de schelde | False | 2018.0 | NaN | 119.0 | Documentary | 7.6 | 5 |
922573 | tt9880724 | movie | Verdict 19 | Verdict 19 | False | 2019.0 | NaN | NaN | Biography,Documentary,Drama | 10.0 | 13 |
922579 | tt9881616 | movie | La filla d'algú | La filla d'algú | False | 2019.0 | NaN | NaN | Drama | 8.0 | 5 |
922617 | tt9886806 | movie | Conversazione su Tiresia | Conversazione su Tiresia | False | 2018.0 | NaN | NaN | Documentary | 8.4 | 5 |
922623 | tt9887568 | movie | Turned Out | Turned Out | False | 2019.0 | NaN | 131.0 | Drama | 8.7 | 7 |
922626 | tt9888844 | movie | Vosotros sois mi película | Vosotros sois mi película | False | 2019.0 | NaN | 98.0 | Documentary | 4.2 | 179 |
922648 | tt9894098 | movie | Sathru | Sathru | False | 2019.0 | NaN | 129.0 | Thriller | 7.5 | 20 |
922649 | tt9894394 | movie | Upin & Ipin: The Lone Gibbon Kris | Upin & Ipin: Keris Siamang Tunggal | False | 2019.0 | NaN | 100.0 | Animation | 8.6 | 180 |
922668 | tt9899290 | movie | Band Together with Logic | Band Together with Logic | False | 2019.0 | NaN | NaN | Documentary | 8.8 | 9 |
922670 | tt9899850 | movie | The Agitation | Ashoftegi | False | 2019.0 | NaN | NaN | Drama,Thriller | 4.6 | 8 |
922672 | tt9900180 | movie | Aavahayami | Aavahayami | False | 2017.0 | NaN | 97.0 | Mystery | 10.0 | 8 |
922677 | tt9900552 | movie | The Sacred Riana: Beginning | The Sacred Riana: Beginning | False | 2019.0 | NaN | 111.0 | Horror | 6.7 | 13 |
922698 | tt9903716 | movie | Jessie | Jessie | False | 2019.0 | NaN | 106.0 | Horror,Thriller | 9.2 | 89 |
922709 | tt9905412 | movie | Ottam | Ottam | False | 2019.0 | NaN | 120.0 | Drama | 8.2 | 504 |
922710 | tt9905462 | movie | Pengalila | Pengalila | False | 2019.0 | NaN | 111.0 | Drama | 8.5 | 597 |
922711 | tt9905476 | movie | Hand Rolled | Hand Rolled | False | 2019.0 | NaN | 90.0 | Documentary | 10.0 | 12 |
922731 | tt9908960 | movie | Pliusas | Pliusas | False | 2018.0 | NaN | 90.0 | Comedy | 4.2 | 6 |
922747 | tt9911774 | movie | Padmavyuhathile Abhimanyu | Padmavyuhathile Abhimanyu | False | 2019.0 | NaN | 130.0 | Drama | 8.5 | 363 |
922748 | tt9913056 | movie | Swarm Season | Swarm Season | False | 2019.0 | NaN | 86.0 | Documentary | 6.2 | 5 |
922749 | tt9913084 | movie | Diabolik sono io | Diabolik sono io | False | 2019.0 | NaN | 75.0 | Documentary | 6.2 | 6 |
922753 | tt9914286 | movie | Sokagin Çocuklari | Sokagin Çocuklari | False | 2019.0 | NaN | 98.0 | Drama,Family | 9.7 | 59 |
232382 rows × 11 columns
# Plot release year against average rating for the movie rows.
movie.plot.scatter(
    x='averageRating',
    y='startYear',
    alpha=0.1,
    figsize=(15, 15),
)
<matplotlib.axes._subplots.AxesSubplot at 0x7f41ee91b3c8>
def onehot(df):
    r"""Add one 0/1 indicator column per genre found in ``df['genres']``.

    Each ``genres`` value is a comma-separated list of genre names. The
    placeholder ``\N`` is not treated as a genre and gets no column.
    Non-string values (such as NaN) are treated as having no genres.

    The new columns are named ``genre_<name>`` and are appended in order of
    first appearance. A row gets 1 only when the genre is one of its
    comma-separated entries exactly, so a ``Musical`` row is not counted as
    ``Music``.

    Parameters
    ----------
    df : pandas.DataFrame
        Frame with a ``genres`` column. It is modified in place.

    Returns
    -------
    pandas.DataFrame
        The same ``df`` object, with the indicator columns added.
    """
    missing = '\\N'

    # Collect the distinct genre names, keeping first-seen order so the
    # column order is deterministic.
    categories = []
    seen = set()
    for value in df['genres'].unique():
        if not isinstance(value, str):
            continue
        for genre in value.split(','):
            if genre != missing and genre not in seen:
                seen.add(genre)
                categories.append(genre)

    # Split every row once, then test exact membership per genre.
    row_genres = [
        set(value.split(',')) if isinstance(value, str) else set()
        for value in df['genres']
    ]
    for genre in categories:
        df['genre_' + genre] = [int(genre in genres) for genres in row_genres]
    return df
# onehot() adds the genre_* columns to the frame it is given and returns that
# same frame, so `m` and `movie` refer to one object.
m = onehot(movie)
m
/home/jujubinha/.local/lib/python3.6/site-packages/ipykernel_launcher.py:10: SettingWithCopyWarning:
A value is trying to be set on a copy of a slice from a DataFrame.
Try using .loc[row_indexer,col_indexer] = value instead
See the caveats in the documentation: http://pandas.pydata.org/pandas-docs/stable/indexing.html#indexing-view-versus-copy
# Remove the CWD from sys.path while we load stuff.
<style scoped>
.dataframe tbody tr th:only-of-type {
vertical-align: middle;
}
</style>
.dataframe tbody tr th {
vertical-align: top;
}
.dataframe thead th {
text-align: right;
}
tconst | titleType | primaryTitle | originalTitle | isAdult | startYear | endYear | runtimeMinutes | genres | averageRating | numVotes | genre_Romance | genre_Documentary | genre_News | genre_Sport | genre_Biography | genre_Drama | genre_Crime | genre_Adventure | genre_Fantasy | genre_Comedy | genre_War | genre_Family | genre_History | genre_Sci-Fi | genre_Thriller | genre_Mystery | genre_Horror | genre_Action | genre_Western | genre_Music | genre_Animation | genre_Musical | genre_Short | genre_Film-Noir | genre_Talk-Show | genre_Adult | genre_Reality-TV | genre_Game-Show | |
---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|
8 | tt0000009 | movie | Miss Jerry | Miss Jerry | False | 1894.0 | NaN | 45.0 | Romance | 5.5 | 77 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 |
143 | tt0000147 | movie | The Corbett-Fitzsimmons Fight | The Corbett-Fitzsimmons Fight | False | 1897.0 | NaN | 20.0 | Documentary,News,Sport | 5.2 | 290 | 0 | 1 | 1 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 |
237 | tt0000335 | movie | Soldiers of the Cross | Soldiers of the Cross | False | 1900.0 | NaN | NaN | Biography,Drama | 6.3 | 39 | 0 | 0 | 0 | 0 | 1 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 |
343 | tt0000574 | movie | The Story of the Kelly Gang | The Story of the Kelly Gang | False | 1906.0 | NaN | 70.0 | Biography,Crime,Drama | 6.2 | 505 | 0 | 0 | 0 | 0 | 1 | 1 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 |
361 | tt0000615 | movie | Robbery Under Arms | Robbery Under Arms | False | 1907.0 | NaN | NaN | Drama | 4.8 | 14 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 |
367 | tt0000630 | movie | Hamlet | Amleto | False | 1908.0 | NaN | NaN | Drama | 2.9 | 11 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 |
394 | tt0000675 | movie | Don Quijote | Don Quijote | False | 1908.0 | NaN | NaN | Drama | 4.3 | 10 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 |
395 | tt0000676 | movie | Don Álvaro o la fuerza del sino | Don Álvaro o la fuerza del sino | False | 1908.0 | NaN | NaN | Drama | 3.8 | 8 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 |
396 | tt0000679 | movie | The Fairylogue and Radio-Plays | The Fairylogue and Radio-Plays | False | 1908.0 | NaN | 120.0 | Adventure,Fantasy | 4.8 | 33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 |
428 | tt0000739 | movie | El pastorcito de Torrente | El pastorcito de Torrente | False | 1908.0 | NaN | NaN | Drama | 6.1 | 8 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 |
457 | tt0000793 | movie | Andreas Hofer | Andreas Hofer | False | 1909.0 | NaN | NaN | Drama | 4.4 | 8 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 |
497 | tt0000862 | movie | Faldgruben | Faldgruben | False | 1909.0 | NaN | NaN | \N | 4.6 | 9 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 |
510 | tt0000886 | movie | Hamlet, Prince of Denmark | Hamlet | False | 1910.0 | NaN | NaN | Drama | 5.1 | 19 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 |
513 | tt0000891 | movie | Cycle Rider and the Witch | Heksen og cyklisten | False | 1909.0 | NaN | NaN | \N | 5.1 | 17 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 |
538 | tt0000941 | movie | Locura de amor | Locura de amor | False | 1909.0 | NaN | NaN | Drama | 4.4 | 9 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 |
562 | tt0000992 | movie | De onde Veje | De onde Veje | False | 1909.0 | NaN | NaN | \N | 4.6 | 8 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 |
575 | tt0001028 | movie | Salome Mad | Salome Mad | False | 1909.0 | NaN | NaN | Comedy | 4.1 | 9 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 |
582 | tt0001038 | movie | Sherlock Holmes VI | Sherlock Holmes VI | False | 1910.0 | NaN | NaN | \N | 4.1 | 12 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 |
585 | tt0001049 | movie | Gøngehøvdingen | Gøngehøvdingen | False | 1909.0 | NaN | NaN | Drama,War | 3.8 | 8 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 |
604 | tt0001101 | movie | Abraham Lincoln's Clemency | Abraham Lincoln's Clemency | False | 1910.0 | NaN | NaN | \N | 4.5 | 15 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 |
611 | tt0001112 | movie | Amleto | Amleto | False | 1910.0 | NaN | NaN | Drama | 3.4 | 15 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 |
612 | tt0001113 | movie | Amor gitano | Amor gitano | False | 1910.0 | NaN | NaN | \N | 5.5 | 8 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 |
613 | tt0001115 | movie | Ansigttyven I | Ansigttyven I | False | 1910.0 | NaN | NaN | Crime | 4.7 | 11 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 |
614 | tt0001116 | movie | Ansigttyven II | Ansigttyven II | False | 1910.0 | NaN | NaN | \N | 4.9 | 10 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 |
619 | tt0001122 | movie | The Red Inn | L'auberge rouge | False | 1910.0 | NaN | NaN | \N | 5.2 | 8 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 |
630 | tt0001159 | movie | The Connecticut Yankee | The Connecticut Yankee | False | 1910.0 | NaN | NaN | \N | 5.5 | 8 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 |
633 | tt0001175 | movie | Camille | La dame aux camélias | False | 1912.0 | NaN | NaN | Drama,Romance | 5.6 | 22 | 1 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 |
635 | tt0001184 | movie | Don Juan de Serrallonga | Don Juan de Serrallonga | False | 1910.0 | NaN | 58.0 | Adventure,Drama | 3.1 | 10 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 |
637 | tt0001186 | movie | Dorothy and the Scarecrow in Oz | Dorothy and the Scarecrow in Oz | False | 1910.0 | NaN | NaN | \N | 5.2 | 43 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 |
651 | tt0001230 | movie | Gentleman Joe | Gentleman Joe | False | 1910.0 | NaN | NaN | \N | 5.0 | 8 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 |
... | ... | ... | ... | ... | ... | ... | ... | ... | ... | ... | ... | ... | ... | ... | ... | ... | ... | ... | ... | ... | ... | ... | ... | ... | ... | ... | ... | ... | ... | ... | ... | ... | ... | ... | ... | ... | ... | ... | ... |
922443 | tt9863566 | movie | Urbanus: De Vuilnisheld | Urbanus: De Vuilnisheld | False | 2019.0 | NaN | 72.0 | Animation,Comedy | 5.1 | 24 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 |
922463 | tt9866284 | movie | The Far Green Country | The Far Green Country | False | 2018.0 | NaN | 69.0 | Documentary | 7.5 | 16 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 |
922465 | tt9866344 | movie | Mon Ami Walid | Mon Ami Walid | False | 2019.0 | NaN | 72.0 | Comedy,Drama | 6.9 | 15 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 |
922467 | tt9866700 | movie | Paranormal Investigation | Paranormal Investigation | False | 2018.0 | NaN | 92.0 | Horror,Thriller | 3.6 | 244 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 |
922469 | tt9866736 | movie | Rise: Ini Kalilah | Rise: Ini Kalilah | False | 2018.0 | NaN | NaN | \N | 5.7 | 6 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 |
922519 | tt9870612 | movie | Randy Writes a Novel | Randy Writes a Novel | False | 2018.0 | NaN | 70.0 | Comedy | 9.2 | 18 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 |
922521 | tt9870726 | movie | Gholamreza Takhti | Gholamreza Takhti | False | 2019.0 | NaN | NaN | Biography,Drama,Sport | 7.1 | 47 | 0 | 0 | 0 | 1 | 1 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 |
922531 | tt9872556 | movie | Momenti di trascurabile felicità | Momenti di trascurabile felicità | False | 2019.0 | NaN | 93.0 | Comedy | 6.6 | 121 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 |
922532 | tt9872616 | movie | Marid | Marid | False | 2019.0 | NaN | NaN | Horror | 4.2 | 10 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 |
922556 | tt9878504 | movie | Hollywood aan de schelde | Hollywood aan de schelde | False | 2018.0 | NaN | 119.0 | Documentary | 7.6 | 5 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 |
922573 | tt9880724 | movie | Verdict 19 | Verdict 19 | False | 2019.0 | NaN | NaN | Biography,Documentary,Drama | 10.0 | 13 | 0 | 1 | 0 | 0 | 1 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 |
922579 | tt9881616 | movie | La filla d'algú | La filla d'algú | False | 2019.0 | NaN | NaN | Drama | 8.0 | 5 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 |
922617 | tt9886806 | movie | Conversazione su Tiresia | Conversazione su Tiresia | False | 2018.0 | NaN | NaN | Documentary | 8.4 | 5 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 |
922623 | tt9887568 | movie | Turned Out | Turned Out | False | 2019.0 | NaN | 131.0 | Drama | 8.7 | 7 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 |
922626 | tt9888844 | movie | Vosotros sois mi película | Vosotros sois mi película | False | 2019.0 | NaN | 98.0 | Documentary | 4.2 | 179 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 |
922648 | tt9894098 | movie | Sathru | Sathru | False | 2019.0 | NaN | 129.0 | Thriller | 7.5 | 20 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 |
922649 | tt9894394 | movie | Upin & Ipin: The Lone Gibbon Kris | Upin & Ipin: Keris Siamang Tunggal | False | 2019.0 | NaN | 100.0 | Animation | 8.6 | 180 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 |
922668 | tt9899290 | movie | Band Together with Logic | Band Together with Logic | False | 2019.0 | NaN | NaN | Documentary | 8.8 | 9 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 |
922670 | tt9899850 | movie | The Agitation | Ashoftegi | False | 2019.0 | NaN | NaN | Drama,Thriller | 4.6 | 8 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 |
922672 | tt9900180 | movie | Aavahayami | Aavahayami | False | 2017.0 | NaN | 97.0 | Mystery | 10.0 | 8 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 |
922677 | tt9900552 | movie | The Sacred Riana: Beginning | The Sacred Riana: Beginning | False | 2019.0 | NaN | 111.0 | Horror | 6.7 | 13 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 |
922698 | tt9903716 | movie | Jessie | Jessie | False | 2019.0 | NaN | 106.0 | Horror,Thriller | 9.2 | 89 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 |
922709 | tt9905412 | movie | Ottam | Ottam | False | 2019.0 | NaN | 120.0 | Drama | 8.2 | 504 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 |
922710 | tt9905462 | movie | Pengalila | Pengalila | False | 2019.0 | NaN | 111.0 | Drama | 8.5 | 597 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 |
922711 | tt9905476 | movie | Hand Rolled | Hand Rolled | False | 2019.0 | NaN | 90.0 | Documentary | 10.0 | 12 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 |
922731 | tt9908960 | movie | Pliusas | Pliusas | False | 2018.0 | NaN | 90.0 | Comedy | 4.2 | 6 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 |
922747 | tt9911774 | movie | Padmavyuhathile Abhimanyu | Padmavyuhathile Abhimanyu | False | 2019.0 | NaN | 130.0 | Drama | 8.5 | 363 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 |
922748 | tt9913056 | movie | Swarm Season | Swarm Season | False | 2019.0 | NaN | 86.0 | Documentary | 6.2 | 5 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 |
922749 | tt9913084 | movie | Diabolik sono io | Diabolik sono io | False | 2019.0 | NaN | 75.0 | Documentary | 6.2 | 6 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 |
922753 | tt9914286 | movie | Sokagin Çocuklari | Sokagin Çocuklari | False | 2019.0 | NaN | 98.0 | Drama,Family | 9.7 | 59 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 |
232382 rows × 39 columns
# Summarise every column of m; include='all' reports on the non-numeric
# columns (count/unique/top/freq) as well as the numeric ones.
m.describe(include='all')
<style scoped>
.dataframe tbody tr th:only-of-type {
vertical-align: middle;
}
</style>
.dataframe tbody tr th {
vertical-align: top;
}
.dataframe thead th {
text-align: right;
}
tconst | titleType | primaryTitle | originalTitle | isAdult | startYear | endYear | runtimeMinutes | genres | averageRating | numVotes | genre_Romance | genre_Documentary | genre_News | genre_Sport | genre_Biography | genre_Drama | genre_Crime | genre_Adventure | genre_Fantasy | genre_Comedy | genre_War | genre_Family | genre_History | genre_Sci-Fi | genre_Thriller | genre_Mystery | genre_Horror | genre_Action | genre_Western | genre_Music | genre_Animation | genre_Musical | genre_Short | genre_Film-Noir | genre_Talk-Show | genre_Adult | genre_Reality-TV | genre_Game-Show | |
---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|
count | 232382 | 232382 | 232382 | 232382 | 232382 | 232369.000000 | 0.0 | 203722.000000 | 232382 | 232382.000000 | 2.323820e+05 | 232382.000000 | 232382.000000 | 232382.000000 | 232382.000000 | 232382.000000 | 232382.000000 | 232382.000000 | 232382.000000 | 232382.000000 | 232382.000000 | 232382.000000 | 232382.000000 | 232382.000000 | 232382.000000 | 232382.000000 | 232382.00000 | 232382.000000 | 232382.000000 | 232382.000000 | 232382.000000 | 232382.000000 | 232382.000000 | 232382.000000 | 232382.000000 | 232382.000000 | 232382.000000 | 232382.000000 | 232382.000000 |
unique | 232382 | 1 | 209088 | 214717 | 2 | NaN | NaN | NaN | 1240 | NaN | NaN | NaN | NaN | NaN | NaN | NaN | NaN | NaN | NaN | NaN | NaN | NaN | NaN | NaN | NaN | NaN | NaN | NaN | NaN | NaN | NaN | NaN | NaN | NaN | NaN | NaN | NaN | NaN | NaN |
top | tt0879224 | movie | Hamlet | Hamlet | False | NaN | NaN | NaN | Drama | NaN | NaN | NaN | NaN | NaN | NaN | NaN | NaN | NaN | NaN | NaN | NaN | NaN | NaN | NaN | NaN | NaN | NaN | NaN | NaN | NaN | NaN | NaN | NaN | NaN | NaN | NaN | NaN | NaN | NaN |
freq | 1 | 232382 | 24 | 22 | 228436 | NaN | NaN | NaN | 39453 | NaN | NaN | NaN | NaN | NaN | NaN | NaN | NaN | NaN | NaN | NaN | NaN | NaN | NaN | NaN | NaN | NaN | NaN | NaN | NaN | NaN | NaN | NaN | NaN | NaN | NaN | NaN | NaN | NaN | NaN |
mean | NaN | NaN | NaN | NaN | NaN | 1990.587256 | NaN | 94.028181 | NaN | 6.229305 | 3.192833e+03 | 0.111343 | 0.135097 | 0.002707 | 0.011124 | 0.029047 | 0.438278 | 0.084585 | 0.066408 | 0.028483 | 0.253488 | 0.022218 | 0.038088 | 0.026228 | 0.024223 | 0.079085 | 0.03564 | 0.067652 | 0.105929 | 0.017850 | 0.046406 | 0.016034 | 0.023573 | 0.000026 | 0.003275 | 0.000009 | 0.015935 | 0.000116 | 0.000009 |
std | NaN | NaN | NaN | NaN | NaN | 25.398874 | NaN | 123.160258 | NaN | 1.342428 | 2.993927e+04 | 0.314557 | 0.341827 | 0.051956 | 0.104882 | 0.167939 | 0.496177 | 0.278264 | 0.248994 | 0.166349 | 0.435009 | 0.147391 | 0.191410 | 0.159814 | 0.153741 | 0.269872 | 0.18539 | 0.251148 | 0.307747 | 0.132406 | 0.210364 | 0.125606 | 0.151716 | 0.005081 | 0.057132 | 0.002934 | 0.125224 | 0.010778 | 0.002934 |
min | NaN | NaN | NaN | NaN | NaN | 1894.000000 | NaN | 1.000000 | NaN | 1.000000 | 5.000000e+00 | 0.000000 | 0.000000 | 0.000000 | 0.000000 | 0.000000 | 0.000000 | 0.000000 | 0.000000 | 0.000000 | 0.000000 | 0.000000 | 0.000000 | 0.000000 | 0.000000 | 0.000000 | 0.00000 | 0.000000 | 0.000000 | 0.000000 | 0.000000 | 0.000000 | 0.000000 | 0.000000 | 0.000000 | 0.000000 | 0.000000 | 0.000000 | 0.000000 |
25% | NaN | NaN | NaN | NaN | NaN | 1974.000000 | NaN | 81.000000 | NaN | 5.400000 | 1.400000e+01 | 0.000000 | 0.000000 | 0.000000 | 0.000000 | 0.000000 | 0.000000 | 0.000000 | 0.000000 | 0.000000 | 0.000000 | 0.000000 | 0.000000 | 0.000000 | 0.000000 | 0.000000 | 0.00000 | 0.000000 | 0.000000 | 0.000000 | 0.000000 | 0.000000 | 0.000000 | 0.000000 | 0.000000 | 0.000000 | 0.000000 | 0.000000 | 0.000000 |
50% | NaN | NaN | NaN | NaN | NaN | 2000.000000 | NaN | 91.000000 | NaN | 6.400000 | 4.500000e+01 | 0.000000 | 0.000000 | 0.000000 | 0.000000 | 0.000000 | 0.000000 | 0.000000 | 0.000000 | 0.000000 | 0.000000 | 0.000000 | 0.000000 | 0.000000 | 0.000000 | 0.000000 | 0.00000 | 0.000000 | 0.000000 | 0.000000 | 0.000000 | 0.000000 | 0.000000 | 0.000000 | 0.000000 | 0.000000 | 0.000000 | 0.000000 | 0.000000 |
75% | NaN | NaN | NaN | NaN | NaN | 2011.000000 | NaN | 102.000000 | NaN | 7.100000 | 2.450000e+02 | 0.000000 | 0.000000 | 0.000000 | 0.000000 | 0.000000 | 1.000000 | 0.000000 | 0.000000 | 0.000000 | 1.000000 | 0.000000 | 0.000000 | 0.000000 | 0.000000 | 0.000000 | 0.00000 | 0.000000 | 0.000000 | 0.000000 | 0.000000 | 0.000000 | 0.000000 | 0.000000 | 0.000000 | 0.000000 | 0.000000 | 0.000000 | 0.000000 |
max | NaN | NaN | NaN | NaN | NaN | 2019.000000 | NaN | 51420.000000 | NaN | 10.000000 | 2.070726e+06 | 1.000000 | 1.000000 | 1.000000 | 1.000000 | 1.000000 | 1.000000 | 1.000000 | 1.000000 | 1.000000 | 1.000000 | 1.000000 | 1.000000 | 1.000000 | 1.000000 | 1.000000 | 1.00000 | 1.000000 | 1.000000 | 1.000000 | 1.000000 | 1.000000 | 1.000000 | 1.000000 | 1.000000 | 1.000000 | 1.000000 | 1.000000 | 1.000000 |
# Build one string per title by concatenating its one-hot genre_* flags.
#
# Take an explicit copy first: pandas reports that `m` is a copy of a slice of
# another DataFrame, and adding a column to such an object raises
# SettingWithCopyWarning.
m = m.copy()

genre_columns = list(m.columns[m.columns.str.startswith('genre_')])

# Seed every row with an empty string. The previous seed, pd.Series(0), was
# aligned on the index when assigned, so every row whose label was not 0
# received NaN and each resulting string ended in a spurious "nan".
m['output'] = ''

for c in genre_columns:
    # Each flag is prepended, so the finished string lists the flags in
    # reverse column order (last genre_* column first, first one last).
    m['output'] = m[c].astype(str) + m['output']
/home/jujubinha/.local/lib/python3.6/site-packages/ipykernel_launcher.py:1: SettingWithCopyWarning:
A value is trying to be set on a copy of a slice from a DataFrame.
Try using .loc[row_indexer,col_indexer] = value instead
See the caveats in the documentation: http://pandas.pydata.org/pandas-docs/stable/indexing.html#indexing-view-versus-copy
"""Entry point for launching an IPython kernel.
/home/jujubinha/.local/lib/python3.6/site-packages/ipykernel_launcher.py:3: SettingWithCopyWarning:
A value is trying to be set on a copy of a slice from a DataFrame.
Try using .loc[row_indexer,col_indexer] = value instead
See the caveats in the documentation: http://pandas.pydata.org/pandas-docs/stable/indexing.html#indexing-view-versus-copy
This is separate from the ipykernel package so we can avoid doing imports until
# Display m to inspect the 'output' column built from the genre_* flags.
m
<style scoped>
.dataframe tbody tr th:only-of-type {
vertical-align: middle;
}
</style>
.dataframe tbody tr th {
vertical-align: top;
}
.dataframe thead th {
text-align: right;
}
tconst | titleType | primaryTitle | originalTitle | isAdult | startYear | endYear | runtimeMinutes | genres | averageRating | numVotes | genre_Romance | genre_Documentary | genre_News | genre_Sport | genre_Biography | genre_Drama | genre_Crime | genre_Adventure | genre_Fantasy | genre_Comedy | genre_War | genre_Family | genre_History | genre_Sci-Fi | genre_Thriller | genre_Mystery | genre_Horror | genre_Action | genre_Western | genre_Music | genre_Animation | genre_Musical | genre_Short | genre_Film-Noir | genre_Talk-Show | genre_Adult | genre_Reality-TV | genre_Game-Show | output | |
---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|
8 | tt0000009 | movie | Miss Jerry | Miss Jerry | False | 1894.0 | NaN | 45.0 | Romance | 5.5 | 77 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0000000000000000000000000001nan |
143 | tt0000147 | movie | The Corbett-Fitzsimmons Fight | The Corbett-Fitzsimmons Fight | False | 1897.0 | NaN | 20.0 | Documentary,News,Sport | 5.2 | 290 | 0 | 1 | 1 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0000000000000000000000001110nan |
237 | tt0000335 | movie | Soldiers of the Cross | Soldiers of the Cross | False | 1900.0 | NaN | NaN | Biography,Drama | 6.3 | 39 | 0 | 0 | 0 | 0 | 1 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0000000000000000000000110000nan |
343 | tt0000574 | movie | The Story of the Kelly Gang | The Story of the Kelly Gang | False | 1906.0 | NaN | 70.0 | Biography,Crime,Drama | 6.2 | 505 | 0 | 0 | 0 | 0 | 1 | 1 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0000000000000000000001110000nan |
361 | tt0000615 | movie | Robbery Under Arms | Robbery Under Arms | False | 1907.0 | NaN | NaN | Drama | 4.8 | 14 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0000000000000000000000100000nan |
367 | tt0000630 | movie | Hamlet | Amleto | False | 1908.0 | NaN | NaN | Drama | 2.9 | 11 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0000000000000000000000100000nan |
394 | tt0000675 | movie | Don Quijote | Don Quijote | False | 1908.0 | NaN | NaN | Drama | 4.3 | 10 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0000000000000000000000100000nan |
395 | tt0000676 | movie | Don Álvaro o la fuerza del sino | Don Álvaro o la fuerza del sino | False | 1908.0 | NaN | NaN | Drama | 3.8 | 8 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0000000000000000000000100000nan |
396 | tt0000679 | movie | The Fairylogue and Radio-Plays | The Fairylogue and Radio-Plays | False | 1908.0 | NaN | 120.0 | Adventure,Fantasy | 4.8 | 33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0000000000000000000110000000nan |
428 | tt0000739 | movie | El pastorcito de Torrente | El pastorcito de Torrente | False | 1908.0 | NaN | NaN | Drama | 6.1 | 8 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0000000000000000000000100000nan |
457 | tt0000793 | movie | Andreas Hofer | Andreas Hofer | False | 1909.0 | NaN | NaN | Drama | 4.4 | 8 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0000000000000000000000100000nan |
497 | tt0000862 | movie | Faldgruben | Faldgruben | False | 1909.0 | NaN | NaN | \N | 4.6 | 9 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0000000000000000000000000000nan |
510 | tt0000886 | movie | Hamlet, Prince of Denmark | Hamlet | False | 1910.0 | NaN | NaN | Drama | 5.1 | 19 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0000000000000000000000100000nan |
513 | tt0000891 | movie | Cycle Rider and the Witch | Heksen og cyklisten | False | 1909.0 | NaN | NaN | \N | 5.1 | 17 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0000000000000000000000000000nan |
538 | tt0000941 | movie | Locura de amor | Locura de amor | False | 1909.0 | NaN | NaN | Drama | 4.4 | 9 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0000000000000000000000100000nan |
562 | tt0000992 | movie | De onde Veje | De onde Veje | False | 1909.0 | NaN | NaN | \N | 4.6 | 8 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0000000000000000000000000000nan |
575 | tt0001028 | movie | Salome Mad | Salome Mad | False | 1909.0 | NaN | NaN | Comedy | 4.1 | 9 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0000000000000000001000000000nan |
582 | tt0001038 | movie | Sherlock Holmes VI | Sherlock Holmes VI | False | 1910.0 | NaN | NaN | \N | 4.1 | 12 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0000000000000000000000000000nan |
585 | tt0001049 | movie | Gøngehøvdingen | Gøngehøvdingen | False | 1909.0 | NaN | NaN | Drama,War | 3.8 | 8 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0000000000000000010000100000nan |
604 | tt0001101 | movie | Abraham Lincoln's Clemency | Abraham Lincoln's Clemency | False | 1910.0 | NaN | NaN | \N | 4.5 | 15 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0000000000000000000000000000nan |
611 | tt0001112 | movie | Amleto | Amleto | False | 1910.0 | NaN | NaN | Drama | 3.4 | 15 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0000000000000000000000100000nan |
612 | tt0001113 | movie | Amor gitano | Amor gitano | False | 1910.0 | NaN | NaN | \N | 5.5 | 8 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0000000000000000000000000000nan |
613 | tt0001115 | movie | Ansigttyven I | Ansigttyven I | False | 1910.0 | NaN | NaN | Crime | 4.7 | 11 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0000000000000000000001000000nan |
614 | tt0001116 | movie | Ansigttyven II | Ansigttyven II | False | 1910.0 | NaN | NaN | \N | 4.9 | 10 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0000000000000000000000000000nan |
619 | tt0001122 | movie | The Red Inn | L'auberge rouge | False | 1910.0 | NaN | NaN | \N | 5.2 | 8 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0000000000000000000000000000nan |
630 | tt0001159 | movie | The Connecticut Yankee | The Connecticut Yankee | False | 1910.0 | NaN | NaN | \N | 5.5 | 8 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0000000000000000000000000000nan |
633 | tt0001175 | movie | Camille | La dame aux camélias | False | 1912.0 | NaN | NaN | Drama,Romance | 5.6 | 22 | 1 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0000000000000000000000100001nan |
635 | tt0001184 | movie | Don Juan de Serrallonga | Don Juan de Serrallonga | False | 1910.0 | NaN | 58.0 | Adventure,Drama | 3.1 | 10 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0000000000000000000010100000nan |
637 | tt0001186 | movie | Dorothy and the Scarecrow in Oz | Dorothy and the Scarecrow in Oz | False | 1910.0 | NaN | NaN | \N | 5.2 | 43 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0000000000000000000000000000nan |
651 | tt0001230 | movie | Gentleman Joe | Gentleman Joe | False | 1910.0 | NaN | NaN | \N | 5.0 | 8 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0000000000000000000000000000nan |
... | ... | ... | ... | ... | ... | ... | ... | ... | ... | ... | ... | ... | ... | ... | ... | ... | ... | ... | ... | ... | ... | ... | ... | ... | ... | ... | ... | ... | ... | ... | ... | ... | ... | ... | ... | ... | ... | ... | ... | ... |
922443 | tt9863566 | movie | Urbanus: De Vuilnisheld | Urbanus: De Vuilnisheld | False | 2019.0 | NaN | 72.0 | Animation,Comedy | 5.1 | 24 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0000000100000000001000000000nan |
922463 | tt9866284 | movie | The Far Green Country | The Far Green Country | False | 2018.0 | NaN | 69.0 | Documentary | 7.5 | 16 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0000000000000000000000000010nan |
922465 | tt9866344 | movie | Mon Ami Walid | Mon Ami Walid | False | 2019.0 | NaN | 72.0 | Comedy,Drama | 6.9 | 15 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0000000000000000001000100000nan |
922467 | tt9866700 | movie | Paranormal Investigation | Paranormal Investigation | False | 2018.0 | NaN | 92.0 | Horror,Thriller | 3.6 | 244 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0000000000010100000000000000nan |
922469 | tt9866736 | movie | Rise: Ini Kalilah | Rise: Ini Kalilah | False | 2018.0 | NaN | NaN | \N | 5.7 | 6 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0000000000000000000000000000nan |
922519 | tt9870612 | movie | Randy Writes a Novel | Randy Writes a Novel | False | 2018.0 | NaN | 70.0 | Comedy | 9.2 | 18 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0000000000000000001000000000nan |
922521 | tt9870726 | movie | Gholamreza Takhti | Gholamreza Takhti | False | 2019.0 | NaN | NaN | Biography,Drama,Sport | 7.1 | 47 | 0 | 0 | 0 | 1 | 1 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0000000000000000000000111000nan |
922531 | tt9872556 | movie | Momenti di trascurabile felicità | Momenti di trascurabile felicità | False | 2019.0 | NaN | 93.0 | Comedy | 6.6 | 121 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0000000000000000001000000000nan |
922532 | tt9872616 | movie | Marid | Marid | False | 2019.0 | NaN | NaN | Horror | 4.2 | 10 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0000000000010000000000000000nan |
922556 | tt9878504 | movie | Hollywood aan de schelde | Hollywood aan de schelde | False | 2018.0 | NaN | 119.0 | Documentary | 7.6 | 5 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0000000000000000000000000010nan |
922573 | tt9880724 | movie | Verdict 19 | Verdict 19 | False | 2019.0 | NaN | NaN | Biography,Documentary,Drama | 10.0 | 13 | 0 | 1 | 0 | 0 | 1 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0000000000000000000000110010nan |
922579 | tt9881616 | movie | La filla d'algú | La filla d'algú | False | 2019.0 | NaN | NaN | Drama | 8.0 | 5 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0000000000000000000000100000nan |
922617 | tt9886806 | movie | Conversazione su Tiresia | Conversazione su Tiresia | False | 2018.0 | NaN | NaN | Documentary | 8.4 | 5 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0000000000000000000000000010nan |
922623 | tt9887568 | movie | Turned Out | Turned Out | False | 2019.0 | NaN | 131.0 | Drama | 8.7 | 7 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0000000000000000000000100000nan |
922626 | tt9888844 | movie | Vosotros sois mi película | Vosotros sois mi película | False | 2019.0 | NaN | 98.0 | Documentary | 4.2 | 179 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0000000000000000000000000010nan |
922648 | tt9894098 | movie | Sathru | Sathru | False | 2019.0 | NaN | 129.0 | Thriller | 7.5 | 20 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0000000000000100000000000000nan |
922649 | tt9894394 | movie | Upin & Ipin: The Lone Gibbon Kris | Upin & Ipin: Keris Siamang Tunggal | False | 2019.0 | NaN | 100.0 | Animation | 8.6 | 180 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0000000100000000000000000000nan |
922668 | tt9899290 | movie | Band Together with Logic | Band Together with Logic | False | 2019.0 | NaN | NaN | Documentary | 8.8 | 9 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0000000000000000000000000010nan |
922670 | tt9899850 | movie | The Agitation | Ashoftegi | False | 2019.0 | NaN | NaN | Drama,Thriller | 4.6 | 8 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0000000000000100000000100000nan |
922672 | tt9900180 | movie | Aavahayami | Aavahayami | False | 2017.0 | NaN | 97.0 | Mystery | 10.0 | 8 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0000000000001000000000000000nan |
922677 | tt9900552 | movie | The Sacred Riana: Beginning | The Sacred Riana: Beginning | False | 2019.0 | NaN | 111.0 | Horror | 6.7 | 13 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0000000000010000000000000000nan |
922698 | tt9903716 | movie | Jessie | Jessie | False | 2019.0 | NaN | 106.0 | Horror,Thriller | 9.2 | 89 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0000000000010100000000000000nan |
922709 | tt9905412 | movie | Ottam | Ottam | False | 2019.0 | NaN | 120.0 | Drama | 8.2 | 504 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0000000000000000000000100000nan |
922710 | tt9905462 | movie | Pengalila | Pengalila | False | 2019.0 | NaN | 111.0 | Drama | 8.5 | 597 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0000000000000000000000100000nan |
922711 | tt9905476 | movie | Hand Rolled | Hand Rolled | False | 2019.0 | NaN | 90.0 | Documentary | 10.0 | 12 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0000000000000000000000000010nan |
922731 | tt9908960 | movie | Pliusas | Pliusas | False | 2018.0 | NaN | 90.0 | Comedy | 4.2 | 6 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0000000000000000001000000000nan |
922747 | tt9911774 | movie | Padmavyuhathile Abhimanyu | Padmavyuhathile Abhimanyu | False | 2019.0 | NaN | 130.0 | Drama | 8.5 | 363 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0000000000000000000000100000nan |
922748 | tt9913056 | movie | Swarm Season | Swarm Season | False | 2019.0 | NaN | 86.0 | Documentary | 6.2 | 5 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0000000000000000000000000010nan |
922749 | tt9913084 | movie | Diabolik sono io | Diabolik sono io | False | 2019.0 | NaN | 75.0 | Documentary | 6.2 | 6 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0000000000000000000000000010nan |
922753 | tt9914286 | movie | Sokagin Çocuklari | Sokagin Çocuklari | False | 2019.0 | NaN | 98.0 | Drama,Family | 9.7 | 59 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0000000000000000100000100000nan |
232382 rows × 40 columns
Index(['genre_Romance', 'genre_Documentary', 'genre_News', 'genre_Sport',
'genre_Biography', 'genre_Drama', 'genre_Crime', 'genre_Adventure',
'genre_Fantasy', 'genre_Comedy', 'genre_War', 'genre_Family',
'genre_History', 'genre_Sci-Fi', 'genre_Thriller', 'genre_Mystery',
'genre_Horror', 'genre_Action', 'genre_Western', 'genre_Music',
'genre_Animation', 'genre_Musical', 'genre_Short', 'genre_Film-Noir',
'genre_Talk-Show', 'genre_Adult', 'genre_Reality-TV',
'genre_Game-Show'],
dtype='object')