import pandas as pd
import numpy as np
import matplotlib.pyplot as plt
# Read the titles CSV into a DataFrame and preview its first rows.
csv_path = './DataSets/netflix_titles.csv'
df = pd.read_csv(filepath_or_buffer=csv_path)
df.head()
 | show_id | type | title | director | cast | country | date_added | release_year | rating | duration | listed_in | description |
---|---|---|---|---|---|---|---|---|---|---|---|---|
0 | s1 | Movie | Dick Johnson Is Dead | Kirsten Johnson | NaN | United States | September 25, 2021 | 2020 | PG-13 | 90 min | Documentaries | As her father nears the end of his life, filmm... |
1 | s2 | TV Show | Blood & Water | NaN | Ama Qamata, Khosi Ngema, Gail Mabalane, Thaban... | South Africa | September 24, 2021 | 2021 | TV-MA | 2 Seasons | International TV Shows, TV Dramas, TV Mysteries | After crossing paths at a party, a Cape Town t... |
2 | s3 | TV Show | Ganglands | Julien Leclercq | Sami Bouajila, Tracy Gotoas, Samuel Jouy, Nabi... | NaN | September 24, 2021 | 2021 | TV-MA | 1 Season | Crime TV Shows, International TV Shows, TV Act... | To protect his family from a powerful drug lor... |
3 | s4 | TV Show | Jailbirds New Orleans | NaN | NaN | NaN | September 24, 2021 | 2021 | TV-MA | 1 Season | Docuseries, Reality TV | Feuds, flirtations and toilet talk go down amo... |
4 | s5 | TV Show | Kota Factory | NaN | Mayur More, Jitendra Kumar, Ranjan Raj, Alam K... | India | September 24, 2021 | 2021 | TV-MA | 2 Seasons | International TV Shows, Romantic TV Shows, TV ... | In a city of coaching centers known to train I... |
# Count titles per (release_year, type) pair. `count()` tallies the non-null
# show_id values in each group.
n = df.groupby(['release_year', 'type'], as_index=False).show_id.count()
n.columns = ['release_year', 'type', 'count']

# Reshape to one row per release year with one column per title type.
# The frame to pivot is `n`, built just above.
pivot = n.pivot(index='release_year', columns='type', values='count').reset_index()

# A year/type combination with no rows in `n` comes out of the pivot as NaN;
# treat it as a count of zero.
pivot = pivot.fillna(0)
pivot.head()
type | release_year | Movie | TV Show |
---|---|---|---|
0 | 1925 | 0.0 | 1.0 |
1 | 1942 | 2.0 | 0.0 |
2 | 1943 | 3.0 | 0.0 |
3 | 1944 | 3.0 | 0.0 |
4 | 1945 | 3.0 | 1.0 |
# Single-axes figure, sized up front (width, height in inches).
fig, ax = plt.subplots(figsize=(18.5, 10.5))

# One line per title type: yearly counts from the pivot table against release year.
years = pivot.release_year
ax.plot(years, pivot.Movie, label='Movies')
ax.plot(years, pivot['TV Show'], label='Tv Shows')

# Axis labels and chart title.
ax.set(
    xlabel='Year of Release',
    ylabel='Number of Movies/TV Shows',
    title="Trend Chart",
)

# Free-text annotation placed in data coordinates (x = year, y = count).
ax.text(
    1970,
    400,
    'Majority Movies are released after 2000 and Tv Shows mostly after 2010',
)

ax.grid()
# Trailing semicolon keeps the notebook from echoing the Legend object.
ax.legend();