Outcome
The goal of this project is to uncover customers’ opinions toward the current products of a tutoring services company and find the product efficacy using statistical methods.
I designed a survey for existing customers to research their attitudes and preferences regarding in-person-based vs. online-based courses. Discovering the potential features that can be added to current courses. I also designed and analyzed statistical experiments to investigate the potential benefits of switching to one of 3 new curricula for the educational programs provided by the company. The analysis is conducted using SQL and Tableau.
Presentation
SQL Scripts for Experiment Results
USE CASE4;
DROP VIEW IF EXISTS DataWarehouse;
CREATE VIEW DataWarehouse AS
SELECT E.student_id, E.program, E.date, E.location, E.score_reading, E.score_writing, E.score_MathNoCalc, E.score_MathCalc,
S.district,
CASE
WHEN district = 'St. Paul' THEN 'Current'
WHEN district = 'Lake Oswego' THEN 'A'
WHEN district = 'Camas' THEN 'B'
WHEN district = 'Riverdale' THEN 'C'
END AS Educational_Program,
LAG(date)
OVER (
PARTITION BY student_id
ORDER BY date
) AS last_date
FROM evals E
JOIN students S
ON E.student_id = S.student_id;
DROP VIEW IF EXISTS DataWarehouse_Obj2;
CREATE VIEW DataWarehouse_Obj2 AS
SELECT *,
# Date Diff
DATEDIFF(date, last_date) AS date_diff,
# Score Improvement
score_reading - LAG(score_reading)
OVER (
PARTITION BY student_id
ORDER BY date
) AS reading_improvement,
score_writing - LAG(score_writing)
OVER (
PARTITION BY student_id
ORDER BY date
) AS writing_improvement,
score_mathNoCalc - LAG(score_mathNoCalc)
OVER (
PARTITION BY student_id
ORDER BY date
) AS mathNoCalc_improvement,
score_mathCalc - LAG(score_mathCalc)
OVER (
PARTITION BY student_id
ORDER BY date
) AS mathCalc_improvement,
# Binary
IF(program = 'skills', '1', '0') AS is_skills,
IF(Educational_Program = 'Current', '1', '0') AS is_current,
IF(Educational_Program = 'A', '1', '0') AS is_A,
IF(Educational_Program = 'B', '1', '0') AS is_B,
IF(Educational_Program = 'C', '1', '0') AS is_C
FROM DataWarehouse;
SELECT * FROM DataWarehouse_Obj2;