Brazilian E-Commerce Public Dataset by Olist의 데이터셋을 사용하여 파이썬 및 sql로 데이터 분석을 진행.
-> order_items 테이블을 기준으로 products, product_translation 테이블을 결합.
SELECT
product_category_name_translation.product_category_name_english,
COUNT(order_items.product_id) AS order_product
FROM order_items
LEFT JOIN products
ON order_items.product_id = products.product_id
# 포루투갈어로 되어있는 상품명을 영어로 변환하는 작업
LEFT JOIN product_category_name_translation
ON products.product_category_name = product_category_name_translation.product_category_name
GROUP BY product_category_name_translation.product_category_name_english
ORDER BY order_product DESC
# 상위 10개의 상품만 출력
LIMIT 10
SELECT
product_category_name_translation.product_category_name_english,
COUNT(order_items.product_id) AS order_product
FROM order_items
LEFT JOIN products
ON order_items.product_id = products.product_id
LEFT JOIN product_category_name_translation
ON products.product_category_name = product_category_name_translation.product_category_name
GROUP BY product_category_name_translation.product_category_name_english
ORDER BY order_product
# 하위 10개의 상품만 출력
LIMIT 10
-> order_payments 데이터셋을 사용하여 분석
SELECT
payment_type,
COUNT(payment_type) AS num_order
FROM order_payments
GROUP BY payment_type
ORDER BY num_order DESC
SELECT
customer_state,
COUNT(customer_state) AS count_state
FROM customers
GROUP BY customer_state
ORDER BY count_state DESC
LIMIT 10
SELECT
customer_state,
COUNT(customer_state) AS count_state
FROM customers
GROUP BY customer_state
ORDER BY count_state
LIMIT 10