Learn practical skills, build real-world projects, and advance your career

Importing the required Python libraries and loading the dataset

import numpy as np
import pandas as pd
import seaborn as sns #visualization
import matplotlib.pyplot as plt #visualization
%matplotlib inline
sns.set(color_codes = True)
from wordcloud import WordCloud
# Load the TMDB movies CSV into a DataFrame.
# NOTE: this is an absolute, machine-specific Windows path; adjust it when
# running the notebook anywhere else.
tmdb_csv_path = r'C:\Users\Aditya Saha\Downloads\tmdb_metadata\tmdb_movies_data.csv'
df = pd.read_csv(tmdb_csv_path)

# A bare expression at the end of a notebook cell renders the frame.
df

Finding the dimensions of the DataFrame

# Dimensions of the loaded frame as a (rows, columns) tuple.
df.shape
(10866, 21)
# Column labels of the frame as a plain Python list.
df.columns.tolist()
['id',
 'imdb_id',
 'popularity',
 'budget',
 'revenue',
 'original_title',
 'cast',
 'homepage',
 'director',
 'tagline',
 'keywords',
 'overview',
 'runtime',
 'genres',
 'production_companies',
 'release_date',
 'vote_count',
 'vote_average',
 'release_year',
 'budget_adj',
 'revenue_adj']