Forked from taka-treasuredata/uncv_path_list.sql
Last active
September 28, 2016 03:44
-
-
Save toru-takahashi/533d6eb47eb83c0878971a2870d17209 to your computer and use it in GitHub Desktop.
This file contains bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters
-- Hive | |
SELECT user, TD_X_RANK(user) AS node_id, page_id, category, time | |
FROM | |
( | |
SELECT | |
raw_data.user, page_id, category, raw_data.time AS time | |
FROM | |
( | |
SELECT user, page_id, category, time | |
FROM raw_data_201501 | |
GROUP BY user, page_id, category, time | |
HAVING TD_TIME_RANGE(time,'2015-01-01','2015-02-01') | |
) raw_data | |
LEFT OUTER JOIN | |
( | |
SELECT user, cv_id, cv_category, cv_level, time | |
FROM itmd_conversion_history | |
GROUP BY user, cv_id, cv_category, cv_level, time | |
-- signupのみをコンバージョンとみなす -- | |
HAVING cv_category='signup' | |
AND TD_TIME_RANGE(time,'2015-01-01','2015-02-01') | |
) cv_history | |
ON | |
( raw_data.user=cv_history.user ) | |
-- conversion history に存在しなかったユーザーを絞り込み -- | |
WHERE cv_history.user IS NULL | |
ORDER BY user, time | |
) t | |
WHERE user IS NOT NULL | |
ORDER BY user, time |
Sign up for free
to join this conversation on GitHub.
Already have an account?
Sign in to comment