Skip to content
Analysis of Lego sets
Understanding Lego sets popularity
💾 The data
(source):
DataFrameas
df
variable
[1]
SELECT *
FROM setsAverage number of Lego sets released per year
DataFrameas
df
variable
[51]
SELECT year,COUNT(set_num) as Lego_sets_Per_Year
FROM sets
GROUP BY year
ORDER BY year;Average number of Lego parts per year
DataFrameas
df
variable
SELECT year,ROUND(AVG(num_parts),2) as Average_Lego_Parts
FROM sets
GROUP BY year
ORDER BY year;Data Visualization for Average number of Lego parts per year
DataFrameas
df
variable
[13]
SELECT year,ROUND(AVG(num_parts),2) as Average_Lego_Parts
FROM sets
GROUP BY year
ORDER BY year;DataFrameas
df
variable
[15]
SELECT year,ROUND(AVG(num_parts),2) as Average_Lego_Parts
FROM sets
GROUP BY year
ORDER BY Average_Lego_Parts DESC
LIMIT 10;Five most Popular Colours used in Lego Parts
DataFrameas
df
variable
[21]
SELECT name,COUNT(color_id) as Total
FROM inventory_parts as ip
LEFT JOIN colors as c
on ip.color_id=c.id
GROUP BY name
ORDER BY Total DESC
LIMIT 5;The proportion of Lego parts that are transparent
DataFrameas
df
variable
[37]
WITH Total_Parts as
(SELECT COUNT(part_num) as Total
FROM inventory_parts)
SELECT is_trans,ROUND(COUNT(part_num) * 100.0/(select Total FROM Total_Parts),2) as Proportion_of_Lego_Parts
FROM inventory_parts as ip
LEFT JOIN colors as c
on ip.color_id=c.id
GROUP BY is_trans;The 5 rarest lego bricks