# April Challenge
# Start coding here...
import pandas as pd
# Load the products CSV into the working DataFrame used by the rest of the script.
olp = pd.read_csv('olist_products_dataset.csv')
# A bare `olp` expression is evaluated and thrown away outside an interactive
# prompt, so print it explicitly to actually see the preview.
print(olp)

# Explore the dataset
olp.info()  # writes column names, non-null counts and dtypes to stdout itself
print(olp.describe())  # summary statistics of the dataset

# Check for missing values
print(olp.isnull().sum())  # number of missing values in each column

# Clean the dataset
# Reassign instead of using inplace=True: same resulting rows, but the
# statement reads as a plain transformation and can be chained later.
olp = olp.drop_duplicates()  # drop duplicate rows