# Skip to content
import pandas as pd
import numpy as np
# Load the movies and credits tables from CSV files in the working directory.
movies = pd.read_csv('tmdb_5000_movies.csv')
credits = pd.read_csv('tmdb_5000_credits.csv')

# Exploratory peeks at the raw tables. These are bare expressions: their
# values are displayed only in an interactive/notebook session and are
# otherwise evaluated and discarded.
movies.head()
movies.columns
movies.shape
credits.head()

# Combine both tables on the shared 'title' column (inner join by default).
# NOTE(review): a join on 'title' pairs every movies row with every credits
# row carrying the same title, so repeated titles would multiply rows --
# confirm titles are unique or that this is intended.
movies = movies.merge(credits, on='title')

# Inspect the merged frame: dimensions, first row, per-column summary
# (info() prints it), a few columns of interest, and the number of rows that
# are exact duplicates of an earlier row.
movies.shape
movies.head(1)
movies.info()
movies[['budget', 'cast', 'overview']].head()
movies.duplicated().sum()

# Look at the raw 'genres' value of the second row.
movies.iloc[1]['genres']
import ast
def convert(text: str) -> list:
    """Return the ``'name'`` value of every entry in a stringified list.

    Args:
        text: Source text of a Python literal that evaluates to an iterable
            of mappings, each having a ``'name'`` key, for example
            ``'[{"id": 28, "name": "Action"}]'``.

    Returns:
        A list with the ``'name'`` values in their original order; an empty
        list when the literal is empty (``'[]'``).

    Raises:
        ValueError, SyntaxError: If ``text`` is not a valid Python literal
            (other errors documented for ``ast.literal_eval`` may also
            propagate).
        KeyError: If an entry has no ``'name'`` key.
    """
    # literal_eval parses literals only; it never executes arbitrary code.
    return [entry['name'] for entry in ast.literal_eval(text)]
# Replace each stringified genre list with the list of genre names.
# Bracket assignment is used because attribute-style assignment only targets
# a column when one with that name already exists; otherwise it silently sets
# a plain attribute on the DataFrame object.
movies['genres'] = movies['genres'].apply(convert)