-
Notifications
You must be signed in to change notification settings - Fork 1
Expand file tree
/
Copy pathSQL Zepto Data Analysis Project.sql
More file actions
136 lines (112 loc) · 3.24 KB
/
SQL Zepto Data Analysis Project.sql
File metadata and controls
136 lines (112 loc) · 3.24 KB
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
129
130
131
132
133
134
135
136
-- SELECT * FROM sqlProject.zepto;
-- Rebuild the product table from scratch.
-- WARNING: the DROP discards any rows already present in sqlproject.zepto.
DROP TABLE IF EXISTS sqlproject.zepto;

CREATE TABLE sqlproject.zepto (
    sku_id                 SERIAL PRIMARY KEY,     -- auto-generated surrogate key
    Category               VARCHAR(120),
    name                   VARCHAR(150) NOT NULL,  -- only non-key column declared NOT NULL
    mrp                    NUMERIC(8,2),           -- NOTE(review): presumably loaded in paise; confirm against the data load
    discountPercent        NUMERIC(5,2),
    availableQuantity      INTEGER,
    discountedSellingPrice NUMERIC(8,2),           -- NOTE(review): presumably same unit as mrp; confirm
    weightInGms            INTEGER,
    outOfStock             BOOLEAN,
    quantity               INTEGER
);
-- Data exploration
-- Total number of rows in the table.
-- COUNT(*) counts rows directly; COUNT(name) counts non-NULL names and only
-- matches the row count because name is declared NOT NULL.
SELECT COUNT(*) AS total_rows
FROM sqlproject.zepto;
-- Sample data: peek at ten rows (no ORDER BY, so which ten is up to the engine).
SELECT z.*
FROM sqlproject.zepto AS z
LIMIT 10;
-- NULL check: list every row that is missing a value in at least one
-- descriptive column. sku_id is not tested because it is the primary key.
SELECT z.*
FROM sqlproject.zepto AS z
WHERE z.name IS NULL                    -- cannot match while name stays NOT NULL
   OR z.Category IS NULL
   OR z.mrp IS NULL
   OR z.discountPercent IS NULL
   OR z.discountedSellingPrice IS NULL
   OR z.weightInGms IS NULL
   OR z.availableQuantity IS NULL
   OR z.outOfStock IS NULL
   OR z.quantity IS NULL;
-- Distinct product categories, alphabetically.
SELECT z.Category
FROM sqlproject.zepto AS z
GROUP BY z.Category
ORDER BY z.Category;
-- Products in stock vs out of stock.
-- COUNT(*) counts every row in the group. The previous COUNT(quantity) skipped
-- rows whose quantity is NULL (the column is nullable), undercounting products.
SELECT
    outOfStock,
    COUNT(*)
FROM sqlproject.zepto
GROUP BY outOfStock;
-- Product names that appear on more than one row (SKU), most repeated first.
-- COUNT(*) is used so that rows with a NULL quantity still count as a SKU;
-- COUNT(quantity) would ignore them and could hide a duplicated name.
-- name is added as a tie-breaker so equal counts come back in a stable order.
SELECT
    name,
    COUNT(*) AS "Number of SKUs"
FROM sqlproject.zepto
GROUP BY name
HAVING COUNT(*) > 1
ORDER BY COUNT(*) DESC, name;
-- Data cleaning
-- Step 1: inspect rows where either price column is exactly 0.
SELECT z.*
FROM sqlproject.zepto AS z
WHERE 0 IN (z.mrp, z.discountedSellingPrice);

-- Step 2: remove rows whose MRP is 0.
-- NOTE(review): the inspection above also surfaces rows with
-- discountedSellingPrice = 0, but only mrp = 0 rows are deleted here;
-- confirm that leaving those rows in place is intended.
DELETE FROM sqlproject.zepto
WHERE mrp = 0;
-- Convert paise to rupees: divide both price columns by 100.
-- There is intentionally no WHERE clause, so every row in the table is updated.
-- CAUTION: this statement is not idempotent. Each execution divides the stored
-- values by 100 again, so run it exactly once per data load.
UPDATE sqlproject.zepto
SET mrp = mrp / 100.0,
discountedSellingPrice = discountedSellingPrice / 100.0;
-- Eyeball the converted prices.
SELECT mrp, discountedSellingPrice FROM sqlproject.zepto;
-- Data analysis
-- Q1. Find the top 10 best-value products based on the discount percentage.
-- Rows with a NULL discountPercent are excluded: on engines that sort NULLs
-- first under DESC (e.g. PostgreSQL) they would otherwise fill the top 10.
-- mrp and name act as tie-breakers so the 10 rows returned are repeatable.
SELECT DISTINCT
    name,
    mrp,
    discountPercent
FROM sqlproject.zepto
WHERE discountPercent IS NOT NULL
ORDER BY discountPercent DESC, mrp DESC, name
LIMIT 10;
-- Q2. Which high-MRP products are out of stock?
-- "High MRP" is defined by this query as mrp > 300.
SELECT
    z.name,
    z.mrp
FROM sqlproject.zepto AS z
WHERE z.mrp > 300
  AND z.outOfStock = TRUE
GROUP BY z.name, z.mrp          -- collapses repeated (name, mrp) pairs
ORDER BY z.mrp DESC;
-- Q3. Estimated revenue per category: selling price times units available,
-- summed over the category and listed from lowest to highest.
SELECT
    z.Category,
    SUM(z.discountedSellingPrice * z.availableQuantity) AS total_revenue
FROM sqlproject.zepto AS z
GROUP BY z.Category
ORDER BY total_revenue ASC;
-- Q4. Products priced above ₹500 (MRP) that carry a discount below 10%.
SELECT
    z.name,
    z.mrp,
    z.discountPercent
FROM sqlproject.zepto AS z
WHERE z.discountPercent < 10
  AND z.mrp > 500
GROUP BY z.name, z.mrp, z.discountPercent   -- collapses repeated rows
ORDER BY z.mrp DESC, z.discountPercent DESC;
-- Q5. Identify the top 5 categories offering the highest average discount percentage.
-- AVG already ignores NULL discounts; the WHERE filter additionally drops
-- categories that have no discount values at all. Their NULL average would
-- otherwise sort first under DESC on engines such as PostgreSQL.
-- Category is a tie-breaker so equal averages come back in a stable order.
SELECT
    Category,
    ROUND(AVG(discountPercent), 2) AS avg_discount
FROM sqlproject.zepto
WHERE discountPercent IS NOT NULL
GROUP BY Category
ORDER BY avg_discount DESC, Category
LIMIT 5;
-- Q6. Price per gram for products weighing 100 g or more (the bound is
-- inclusive), cheapest per gram first. The ratio is rounded to 2 decimals.
SELECT DISTINCT
    z.name,
    z.weightInGms,
    z.discountedSellingPrice,
    ROUND(z.discountedSellingPrice / z.weightInGms, 2) AS price_per_gram
FROM sqlproject.zepto AS z
WHERE z.weightInGms >= 100
ORDER BY price_per_gram ASC;
-- Q7. Group the products into weight categories: Low, Medium, Bulk.
--   Low    : under 1000 g
--   Medium : 1000 g up to (not including) 5000 g
--   Bulk   : 5000 g and above
-- The Bulk branch is tested explicitly so that a NULL weight, for which every
-- comparison is UNKNOWN, is reported as 'Unknown' instead of falling through
-- to 'Bulk'.
SELECT DISTINCT
    name,
    weightInGms,
    CASE
        WHEN weightInGms < 1000  THEN 'Low'
        WHEN weightInGms < 5000  THEN 'Medium'
        WHEN weightInGms >= 5000 THEN 'Bulk'
        ELSE 'Unknown'
    END AS weight_category
FROM sqlproject.zepto;
-- Q8. Total inventory weight per category: per-unit weight in grams times
-- units available, summed over the category and listed lightest first.
SELECT
    z.Category,
    SUM(z.weightInGms * z.availableQuantity) AS total_weight
FROM sqlproject.zepto AS z
GROUP BY z.Category
ORDER BY total_weight ASC;