-
Notifications
You must be signed in to change notification settings - Fork 0
Expand file tree
/
Copy pathSQL Queries.sql
More file actions
226 lines (167 loc) · 4.63 KB
/
SQL Queries.sql
File metadata and controls
226 lines (167 loc) · 4.63 KB
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
129
130
131
132
133
134
135
136
137
138
139
140
141
142
143
144
145
146
147
148
149
150
151
152
153
154
155
156
157
158
159
160
161
162
163
164
165
166
167
168
169
170
171
172
173
174
175
176
177
178
179
180
181
182
183
184
185
186
187
188
189
190
191
192
193
194
195
196
197
198
199
200
201
202
203
204
205
206
207
208
209
210
211
212
213
214
215
216
217
218
219
220
221
222
223
-- SQL Retail Sales Analysis
CREATE DATABASE sales;
USE sales;
DROP TABLE IF EXISTS retail_sales;
-- Create TABLE
CREATE TABLE retail_sales
(
transaction_id INT PRIMARY KEY,
sale_date DATE,
sale_time TIME,
customer_id INT,
gender VARCHAR(15),
age INT,
category VARCHAR(15),
quantity INT,
price_per_unit FLOAT,
cogs FLOAT,
total_sale FLOAT
);
SELECT * FROM retail_sales;
SELECT * FROM retail_sales limit 10;
SELECT COUNT(*) FROM retail_sales;
-- Data Cleaning
SELECT * FROM retail_sales
WHERE
transaction_id IS NULL
OR
sale_date IS NULL
OR
sale_time IS NULL
OR
gender IS NULL
OR
category IS NULL
OR
quantity IS NULL
OR
cogs IS NULL
OR
total_sale IS NULL;
SET SQL_SAFE_UPDATES = 0;
DELETE FROM retail_sales
WHERE
transaction_id IS NULL
OR
sale_date IS NULL
OR
sale_time IS NULL
OR
gender IS NULL
OR
category IS NULL
OR
quantity IS NULL
OR
cogs IS NULL
OR
total_sale IS NULL;
SET SQL_SAFE_UPDATES = 1;
SELECT * FROM retail_sales;
-- Data Exploration
-- How many sales we have?
SELECT COUNT(*) AS total_records FROM retail_sales;
-- How many uniuque customers we have ?
SELECT COUNT(DISTINCT customer_id) as unique_customer FROM retail_sales;
-- Write a query to find all unique product categories.
SELECT DISTINCT category FROM retail_sales;
-- Data Analysis & Business Key Problems & Answers
-- My Analysis & Findings
SELECT * FROM retail_sales;
-- Q.1 Write a SQL query to retrieve all columns for sales made on '2022-11-05'.
SELECT *
FROM retail_sales
WHERE sale_date = '2022-11-05';
/* Q.2 Write a SQL query to retrieve all transactions where the category is 'Clothing' and the quantity
sold is more than 3 in the month of Nov-2022 */
SELECT * FROM retail_sales
WHERE category = 'Clothing'
AND quantity > 3
AND DATE_FORMAT(sale_date, '%Y-%m') = '2022-11';
-- Q.3 Write a SQL query to calculate the total sales (total_sale) for each category.
SELECT
category,
SUM(total_sale) AS total_sales,
COUNT(*) AS total_orders
FROM retail_sales
GROUP BY category;
-- Q.4 Write a SQL query to find the average age of customers who purchased items from the 'Beauty' category.
SELECT category, ROUND(AVG(age),0) AS average_age
FROM retail_sales
WHERE category = 'Beauty';
-- Q.5 Write a SQL query to find all transactions where the total_sale is greater than 1000.
SELECT *
FROM retail_sales
WHERE total_sale > 1000;
/* Q.6 Write a SQL query to find the total number of transactions (transaction_id) made by each gender in
each category. */
SELECT
category,
gender,
COUNT(transaction_id) AS total_transaction
FROM retail_sales
GROUP BY category, gender
ORDER BY 1;
/* Q.7 Write a SQL query to calculate the average sale for each month. Find out best selling
month in each year */
SELECT * FROM (
SELECT
YEAR(sale_date) as year,
MONTH(sale_date) as month,
ROUND(AVG(total_sale), 2) as avg_sale,
RANK() OVER(PARTITION BY YEAR(sale_date) ORDER BY AVG(total_sale) DESC) as rank_num
FROM retail_sales
GROUP BY 1, 2
) as t1
WHERE rank_num = 1;
-- Q.8 Write a SQL query to find the top 5 customers based on the highest total sales
SELECT
customer_id,
SUM(total_sale) as total_sales
FROM retail_sales
GROUP BY 1
ORDER BY 2 DESC
LIMIT 5;
-- Q.9 Write a SQL query to find the number of unique customers who purchased items from each category.
SELECT
category,
COUNT(DISTINCT customer_id) AS total_unique_customers
FROM retail_sales
GROUP BY category;
-- Q.10 Write a SQL query to create each shift and number of orders
-- (Example Morning <=12, Afternoon Between 12 & 17, Evening >17)
WITH hourly_sales AS (
SELECT *,
CASE
WHEN HOUR(sale_time) < 12 THEN 'Morning'
WHEN HOUR(sale_time) BETWEEN 12 AND 17 THEN 'Afternoon'
ELSE 'Evening'
END AS shift
FROM retail_sales
)
SELECT
shift,
COUNT(*) as total_orders
FROM hourly_sales
GROUP BY shift;
select * from retail_Sales;
DESCRIBE retail_sales;
-- Business Insights (Summary KPIs)
-- Total records (transactions)
SELECT COUNT(*) AS total_transactions
FROM retail_sales;
-- Unique customers
SELECT COUNT(DISTINCT customer_id) AS unique_customers
FROM retail_sales;
-- Total revenue
SELECT ROUND(SUM(total_sale), 2) AS total_revenue
FROM retail_sales;
-- Total categories
SELECT COUNT(DISTINCT category) AS total_categories
FROM retail_sales;
SELECT
category,
ROUND(100 * SUM(total_sale) / (SELECT SUM(total_sale) FROM retail_sales), 1) AS revenue_share_pct
FROM retail_sales
GROUP BY category
ORDER BY revenue_share_pct DESC;