-
Notifications
You must be signed in to change notification settings - Fork 0
Expand file tree
/
Copy pathSQL QUERY PRJ 1.sql
More file actions
197 lines (154 loc) · 3.79 KB
/
SQL QUERY PRJ 1.sql
File metadata and controls
197 lines (154 loc) · 3.79 KB
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
129
130
131
132
133
134
135
136
137
138
139
140
141
142
143
144
145
146
147
148
149
150
151
152
153
154
155
156
157
158
159
160
161
162
163
164
165
166
167
168
169
170
171
172
173
174
175
176
177
178
179
180
181
182
183
184
185
186
187
188
189
190
191
192
193
194
195
196
197
-- Retail_Sales_Analysis
select * from retail_sale
--Create Table
Create Table retail_sale
(
transactions_id int primary key,
sale_date date
sale_time time
customer_id int
gender varchar(15)
age int
category varchar(30)
quantity int
price_per_unit float
cogs float
total_sale float
)
Select * from retail_sale
--Data cleaning
Select
count(*)
from retail_sale
Select transactions_id
from retail_sale
where transactions_id is null
Select * from retail_sale
where transactions_id is null
or
sale_date is null
or
sale_time is null
or
customer_id is null
or
category is null
or
total_sale is null
Delete from retail_sale
where transactions_id is null
or
sale_date is null
or
sale_time is null
or
customer_id is null
or
category is null
or
total_sale is null
--Exploration of data
-- How many sales do we have ?
Select
count(total_sale)
from retail_sale
--How many unique customers do we have?
Select
count(Distinct customer_id) AS Num_of_Customers
from retail_sale
--How many unique Categories do we have?
Select
Distinct category
from retail_sale
--Buisness key Problems & Answers
--Q.1Write a SQL query to retrieve all columns for sales made on '2022-11-05':
Select * from retail_sale
where sale_date = '2022-11-05'
-- Q.2 Write a SQL query to retrieve all transactions where the category is 'Clothing' and the quantity sold is more than 4 in the month of Nov-2022:
Select
*
from retail_sale
where
category= 'Clothing'
and -
TO_CHAR(sale_date, 'YYYY-MM') = '2022-11'
and
quantity >=4
10 in the month of Nov-2022
-- Q.3 Write a SQL query to calculate the total sales (total_sale) for each category.
Select
category,
sum(total_sale) as net_sales,
count(*) as total_sales
From retail_sale
Group by category;
-- Q.4 Write a SQL query to find the average age of customers who purchased items from the 'Beauty' category.
Select
round(avg(age), 2)
From
retail_sale
Where
category= 'Beauty'
-- Q.5 Write a SQL query to find all transactions where the total_sale is greater than 1000.
Select
*
From
retail_sale
Where
total_sale > 1000
-- Q.6 Write a SQL query to find the total number of transactions (transaction_id) made by each gender in each category.
Select
category,
gender,
count(*) as total_trans
From retail_sale
group by gender, category
order by 1
-- Q.7 Write a SQL query to calculate the average sale for each month. Find out best selling month in each year
select
year,
month,
avg_sales
from(
select
extract(YEAR from sale_date) as year,
extract(MONTH from sale_date) as month,
avg(total_sale) as avg_sales,
rank() over(partition by extract(YEAR from sale_date) order by avg(total_sale) desc) as rank
from retail_sale
group by 1,2
) as t1
where rank = 1
-- Q.8 Write a SQL query to find the top 5 customers based on the highest total sales
select
customer_id as customers,
sum(total_sale) as total_sale
from retail_sale
group by 1
order by 2 desc
limit 5
-- Q.9 Write a SQL query to find the number of unique customers who purchased items from each category.
select
category,
count(distinct customer_id)
from retail_sale
group by 1
-- Q.10 Write a SQL query to create each shift and number of orders (Example Morning <12, Afternoon Between 12 & 17, Evening >17). Find out which shift has the most orders.
With hourly_sale
as
(
select *,
case
when extract(HOUR From sale_time) < 12 then 'Morning'
when extract(HOUR FROM sale_time) BETWEEN 12 AND 17 then 'Afternoon'
else 'Evening'
END as Shift
from retail_sale
)
Select
shift,
count(*) as total_orders
From hourly_sale
Group by 1
Order by 2 Desc
--End of Project