In [ ]:
import pandas as pd
import matplotlib.pyplot as plt
# Load the Netflix titles CSV into `df`, the frame the analysis cells below read from.
# The path is relative, so the file must be in the notebook's working directory.
df = pd.read_csv(filepath_or_buffer='netflix_titles.csv')
How has the number of Netflix titles changed over the years (release_year)?
In [2]:
# Tally titles per release year. value_counts() orders by frequency, so
# sort_index() is what puts the years in chronological order for the line plot.
release_trend = (
    df['release_year']
    .value_counts()
    .sort_index()
)

# Explicit figure/axes handles instead of the implicit pyplot state machine.
fig, ax = plt.subplots(figsize=(10, 5))
ax.plot(release_trend.index, release_trend.values, marker='o', color='teal')
ax.set_title("Total Netflix Titles by Release Year")
ax.set_xlabel("Release Year")
ax.set_ylabel("Number of Titles")
ax.grid(True)
fig.tight_layout()
plt.show()
- Number of Titles Added to Netflix Each Year
In [3]:
# Parse `date_added` into datetimes and derive the year each title was added.
#
# NOTE(review): the raw strings are assumed to sometimes carry stray leading or
# trailing whitespace (e.g. " August 4, 2017") -- confirm against the CSV. When
# pandas infers one format from the first value, such strings fail to match and
# errors='coerce' silently turns them into NaT, dropping those titles from the
# yearly counts. Stripping first avoids that loss.
date_added_raw = df['date_added']
if not pd.api.types.is_datetime64_any_dtype(date_added_raw):
    # Only raw text needs cleaning. Skipping this once the column is already
    # datetime keeps the cell safe to re-run (`.str` is not available then).
    date_added_raw = date_added_raw.str.strip()

# Unparseable or missing dates become NaT rather than raising.
df['date_added'] = pd.to_datetime(date_added_raw, errors='coerce')
df['added_year'] = df['date_added'].dt.year

# value_counts() skips NaN years by default; sort_index() orders them chronologically.
added_trend = df['added_year'].value_counts().sort_index()

fig, ax = plt.subplots(figsize=(10, 5))
ax.plot(added_trend.index, added_trend.values, marker='o', color='green')
ax.set_title("Number of Titles Added to Netflix Each Year")
ax.set_xlabel("Year Added")
ax.set_ylabel("Number of Titles")
ax.grid(True)
fig.tight_layout()
plt.show()
- Yearly Trend of Content Additions by Rating
In [4]:
# Yearly additions broken down by rating, limited to the five most common ratings.
#
# The date columns are (re)derived here so the cell also works when run on its
# own; pd.to_datetime() leaves an already-parsed column unchanged.
df['date_added'] = pd.to_datetime(df['date_added'], errors='coerce')
df['added_year'] = df['date_added'].dt.year

# Rows = year added, columns = rating, values = number of titles (0 where none).
rating_trend = df.groupby(['added_year', 'rating']).size().unstack(fill_value=0)

# The top ratings are ranked over ALL rows, while the pivot above only contains
# ratings that occur on rows with a usable `added_year`. Plain column selection
# would raise KeyError if a top rating had no dated rows, so reindex() is used
# and fills such a column with zeros. Passing a plain list keeps the existing
# column-axis name, which pandas uses as the legend title.
top_ratings = df['rating'].value_counts().head(5).index
rating_trend = rating_trend.reindex(columns=list(top_ratings), fill_value=0)

# Draw onto an explicit axes rather than relying on plt.gca() picking up the
# most recently created figure.
fig, ax = plt.subplots(figsize=(10, 5))
rating_trend.plot(ax=ax, marker='o')
ax.set_title("Yearly Trend of Content Additions by Rating")
ax.set_xlabel("Year Added")
ax.set_ylabel("Number of Titles")
ax.grid(True)
fig.tight_layout()
plt.show()
- Trend of “Comedies” Titles Over Time
In [5]:
# Count, per year added, the titles whose genre listing mentions "Comedies".
#
# The date columns are (re)derived here so the cell can run on its own;
# unparseable dates become NaT and therefore have no year.
parsed_dates = pd.to_datetime(df['date_added'], errors='coerce')
df['date_added'] = parsed_dates
df['added_year'] = parsed_dates.dt.year

# Substring match: any `listed_in` value containing "Comedies" qualifies.
# na=False treats rows with a missing listing as non-matches.
is_comedy = df['listed_in'].str.contains("Comedies", na=False)
comedies = df[is_comedy]
comedies_trend = comedies['added_year'].value_counts().sort_index()

fig, ax = plt.subplots(figsize=(10, 5))
ax.plot(comedies_trend.index, comedies_trend.values, marker='o', color='orange')
ax.set_title("Number of 'Comedies' Titles Added Over Time")
ax.set_xlabel("Year Added")
ax.set_ylabel("Number of Comedies")
ax.grid(True)
fig.tight_layout()
plt.show()