diff --git a/.gitignore b/.gitignore new file mode 100644 index 0000000..74880c7 --- /dev/null +++ b/.gitignore @@ -0,0 +1 @@ +pyspark_env/ diff --git a/data/clickhouse/courses/._SUCCESS.crc b/data/clickhouse/courses/._SUCCESS.crc new file mode 100644 index 0000000..3b7b044 Binary files /dev/null and b/data/clickhouse/courses/._SUCCESS.crc differ diff --git a/data/clickhouse/courses/.part-00000-3fe222ff-e4ff-40ed-bbad-b4fa49529f40-c000.csv.crc b/data/clickhouse/courses/.part-00000-3fe222ff-e4ff-40ed-bbad-b4fa49529f40-c000.csv.crc new file mode 100644 index 0000000..7f8986e Binary files /dev/null and b/data/clickhouse/courses/.part-00000-3fe222ff-e4ff-40ed-bbad-b4fa49529f40-c000.csv.crc differ diff --git a/data/clickhouse/courses/_SUCCESS b/data/clickhouse/courses/_SUCCESS new file mode 100644 index 0000000..e69de29 diff --git a/data/clickhouse/courses/part-00000-3fe222ff-e4ff-40ed-bbad-b4fa49529f40-c000.csv b/data/clickhouse/courses/part-00000-3fe222ff-e4ff-40ed-bbad-b4fa49529f40-c000.csv new file mode 100644 index 0000000..3f1ac16 --- /dev/null +++ b/data/clickhouse/courses/part-00000-3fe222ff-e4ff-40ed-bbad-b4fa49529f40-c000.csv @@ -0,0 +1,4 @@ +id,title,category,created_at +2.000000000000000000,Python для анализа данных,programming,2023-01-15 +1.000000000000000000,SQL для начинающих,data,2023-01-01 +3.000000000000000000,BI с нуля,business,2023-03-01 diff --git a/data/clickhouse/enrollments/._SUCCESS.crc b/data/clickhouse/enrollments/._SUCCESS.crc new file mode 100644 index 0000000..3b7b044 Binary files /dev/null and b/data/clickhouse/enrollments/._SUCCESS.crc differ diff --git a/data/clickhouse/enrollments/.part-00000-b55c9f68-b565-4cd7-9379-2469697c8def-c000.csv.crc b/data/clickhouse/enrollments/.part-00000-b55c9f68-b565-4cd7-9379-2469697c8def-c000.csv.crc new file mode 100644 index 0000000..e302d8a Binary files /dev/null and b/data/clickhouse/enrollments/.part-00000-b55c9f68-b565-4cd7-9379-2469697c8def-c000.csv.crc differ diff --git a/data/clickhouse/enrollments/_SUCCESS b/data/clickhouse/enrollments/_SUCCESS new file mode 100644 index 0000000..e69de29 diff --git a/data/clickhouse/enrollments/part-00000-b55c9f68-b565-4cd7-9379-2469697c8def-c000.csv b/data/clickhouse/enrollments/part-00000-b55c9f68-b565-4cd7-9379-2469697c8def-c000.csv new file mode 100644 index 0000000..fe120de --- /dev/null +++ b/data/clickhouse/enrollments/part-00000-b55c9f68-b565-4cd7-9379-2469697c8def-c000.csv @@ -0,0 +1,6 @@ +id,user_id,course_id,enrolled_at +2.000000000000000000,1,2,2023-02-01 +5.000000000000000000,4,3,2023-04-01 +1.000000000000000000,1,1,2023-01-15 +3.000000000000000000,2,1,2023-01-20 +4.000000000000000000,3,2,2023-03-05 diff --git a/data/clickhouse/lesson_views/._SUCCESS.crc b/data/clickhouse/lesson_views/._SUCCESS.crc new file mode 100644 index 0000000..3b7b044 Binary files /dev/null and b/data/clickhouse/lesson_views/._SUCCESS.crc differ diff --git a/data/clickhouse/lesson_views/.part-00000-0a022985-d877-45e1-bd29-ab290b80ada8-c000.csv.crc b/data/clickhouse/lesson_views/.part-00000-0a022985-d877-45e1-bd29-ab290b80ada8-c000.csv.crc new file mode 100644 index 0000000..9369955 Binary files /dev/null and b/data/clickhouse/lesson_views/.part-00000-0a022985-d877-45e1-bd29-ab290b80ada8-c000.csv.crc differ diff --git a/data/clickhouse/lesson_views/_SUCCESS b/data/clickhouse/lesson_views/_SUCCESS new file mode 100644 index 0000000..e69de29 diff --git a/data/clickhouse/lesson_views/part-00000-0a022985-d877-45e1-bd29-ab290b80ada8-c000.csv b/data/clickhouse/lesson_views/part-00000-0a022985-d877-45e1-bd29-ab290b80ada8-c000.csv new file mode 100644 index 0000000..e023b46 --- /dev/null +++ b/data/clickhouse/lesson_views/part-00000-0a022985-d877-45e1-bd29-ab290b80ada8-c000.csv @@ -0,0 +1,7 @@ +id,user_id,lesson_id,viewed_at +5.000000000000000000,4,4,2023-04-02T10:00:00.000+03:00 +6.000000000000000000,4,5,2023-04-03T10:00:00.000+03:00 +4.000000000000000000,3,3,2023-03-06T12:00:00.000+03:00 +1.000000000000000000,1,1,2023-01-16T10:00:00.000+03:00 +2.000000000000000000,1,2,2023-01-16T10:15:00.000+03:00 +3.000000000000000000,2,1,2023-01-21T09:00:00.000+03:00 diff --git a/data/clickhouse/lessons/._SUCCESS.crc b/data/clickhouse/lessons/._SUCCESS.crc new file mode 100644 index 0000000..3b7b044 Binary files /dev/null and b/data/clickhouse/lessons/._SUCCESS.crc differ diff --git a/data/clickhouse/lessons/.part-00000-1ba47d91-bbfd-426e-b4c4-5bac0f7fed60-c000.csv.crc b/data/clickhouse/lessons/.part-00000-1ba47d91-bbfd-426e-b4c4-5bac0f7fed60-c000.csv.crc new file mode 100644 index 0000000..9e0d9f9 Binary files /dev/null and b/data/clickhouse/lessons/.part-00000-1ba47d91-bbfd-426e-b4c4-5bac0f7fed60-c000.csv.crc differ diff --git a/data/clickhouse/lessons/_SUCCESS b/data/clickhouse/lessons/_SUCCESS new file mode 100644 index 0000000..e69de29 diff --git a/data/clickhouse/lessons/part-00000-1ba47d91-bbfd-426e-b4c4-5bac0f7fed60-c000.csv b/data/clickhouse/lessons/part-00000-1ba47d91-bbfd-426e-b4c4-5bac0f7fed60-c000.csv new file mode 100644 index 0000000..992a5d6 --- /dev/null +++ b/data/clickhouse/lessons/part-00000-1ba47d91-bbfd-426e-b4c4-5bac0f7fed60-c000.csv @@ -0,0 +1,6 @@ +id,course_id,title,duration_min +5.000000000000000000,3,Метрики и дашборды,18 +2.000000000000000000,1,JOIN,15 +4.000000000000000000,3,Основы BI,12 +1.000000000000000000,1,SELECT и FROM,10 +3.000000000000000000,2,Pandas,20 diff --git a/data/clickhouse/users/._SUCCESS.crc b/data/clickhouse/users/._SUCCESS.crc new file mode 100644 index 0000000..3b7b044 Binary files /dev/null and b/data/clickhouse/users/._SUCCESS.crc differ diff --git a/data/clickhouse/users/.part-00000-79e87344-f2e1-4e8c-ae08-472ab133b841-c000.csv.crc b/data/clickhouse/users/.part-00000-79e87344-f2e1-4e8c-ae08-472ab133b841-c000.csv.crc new file mode 100644 index 0000000..dfbbf4b Binary files /dev/null and b/data/clickhouse/users/.part-00000-79e87344-f2e1-4e8c-ae08-472ab133b841-c000.csv.crc differ diff --git a/data/clickhouse/users/_SUCCESS b/data/clickhouse/users/_SUCCESS new file mode 100644 index 0000000..e69de29 diff --git a/data/clickhouse/users/part-00000-79e87344-f2e1-4e8c-ae08-472ab133b841-c000.csv b/data/clickhouse/users/part-00000-79e87344-f2e1-4e8c-ae08-472ab133b841-c000.csv new file mode 100644 index 0000000..f49f0ab --- /dev/null +++ b/data/clickhouse/users/part-00000-79e87344-f2e1-4e8c-ae08-472ab133b841-c000.csv @@ -0,0 +1,6 @@ +id,name,age,email,registration_date +4.000000000000000000,Diana,28,diana@mail.com,2023-03-01 +3.000000000000000000,Charlie,22,charlie@mail.com,2023-02-20 +2.000000000000000000,Bob,30,bob@gmail.com,2023-02-05 +5.000000000000000000,Ethan,35,ethan@gmail.com,2023-03-10 +1.000000000000000000,Alice,25,alice@mail.com,2023-01-10 diff --git a/data/greenplum/dim_course/._SUCCESS.crc b/data/greenplum/dim_course/._SUCCESS.crc new file mode 100644 index 0000000..3b7b044 Binary files /dev/null and b/data/greenplum/dim_course/._SUCCESS.crc differ diff --git a/data/greenplum/dim_course/.part-00000-649ca74f-2283-48cd-8c05-4ddcdc9c965f-c000.csv.crc b/data/greenplum/dim_course/.part-00000-649ca74f-2283-48cd-8c05-4ddcdc9c965f-c000.csv.crc new file mode 100644 index 0000000..e46e171 Binary files /dev/null and b/data/greenplum/dim_course/.part-00000-649ca74f-2283-48cd-8c05-4ddcdc9c965f-c000.csv.crc differ diff --git a/data/greenplum/dim_course/_SUCCESS b/data/greenplum/dim_course/_SUCCESS new file mode 100644 index 0000000..e69de29 diff --git a/data/greenplum/dim_course/part-00000-649ca74f-2283-48cd-8c05-4ddcdc9c965f-c000.csv b/data/greenplum/dim_course/part-00000-649ca74f-2283-48cd-8c05-4ddcdc9c965f-c000.csv new file mode 100644 index 0000000..ad2e3fe --- /dev/null +++ b/data/greenplum/dim_course/part-00000-649ca74f-2283-48cd-8c05-4ddcdc9c965f-c000.csv @@ -0,0 +1,4 @@ +course_id,title,category +2,Python для анализа данных,programming +3,BI с нуля,business +1,SQL для начинающих,data diff --git a/data/greenplum/dim_lesson/._SUCCESS.crc b/data/greenplum/dim_lesson/._SUCCESS.crc new file mode 100644 index 0000000..3b7b044 Binary files /dev/null and b/data/greenplum/dim_lesson/._SUCCESS.crc differ diff --git a/data/greenplum/dim_lesson/.part-00000-50809363-8e16-4ec2-8caf-47074b281021-c000.csv.crc b/data/greenplum/dim_lesson/.part-00000-50809363-8e16-4ec2-8caf-47074b281021-c000.csv.crc new file mode 100644 index 0000000..8e4d31c Binary files /dev/null and b/data/greenplum/dim_lesson/.part-00000-50809363-8e16-4ec2-8caf-47074b281021-c000.csv.crc differ diff --git a/data/greenplum/dim_lesson/_SUCCESS b/data/greenplum/dim_lesson/_SUCCESS new file mode 100644 index 0000000..e69de29 diff --git a/data/greenplum/dim_lesson/part-00000-50809363-8e16-4ec2-8caf-47074b281021-c000.csv b/data/greenplum/dim_lesson/part-00000-50809363-8e16-4ec2-8caf-47074b281021-c000.csv new file mode 100644 index 0000000..797f475 --- /dev/null +++ b/data/greenplum/dim_lesson/part-00000-50809363-8e16-4ec2-8caf-47074b281021-c000.csv @@ -0,0 +1,6 @@ +lesson_id,title,duration_min,course_id +5,Метрики и дашборды,18,3 +1,SELECT и FROM,10,1 +3,Pandas,20,2 +4,Основы BI,12,3 +2,JOIN,15,1 diff --git a/data/greenplum/dim_user/._SUCCESS.crc b/data/greenplum/dim_user/._SUCCESS.crc new file mode 100644 index 0000000..3b7b044 Binary files /dev/null and b/data/greenplum/dim_user/._SUCCESS.crc differ diff --git a/data/greenplum/dim_user/.part-00000-d05900af-4ef1-4c92-8c32-c9cecac6e029-c000.csv.crc b/data/greenplum/dim_user/.part-00000-d05900af-4ef1-4c92-8c32-c9cecac6e029-c000.csv.crc new file mode 100644 index 0000000..c097ade Binary files /dev/null and b/data/greenplum/dim_user/.part-00000-d05900af-4ef1-4c92-8c32-c9cecac6e029-c000.csv.crc differ diff --git a/data/greenplum/dim_user/_SUCCESS b/data/greenplum/dim_user/_SUCCESS new file mode 100644 index 0000000..e69de29 diff --git a/data/greenplum/dim_user/part-00000-d05900af-4ef1-4c92-8c32-c9cecac6e029-c000.csv b/data/greenplum/dim_user/part-00000-d05900af-4ef1-4c92-8c32-c9cecac6e029-c000.csv new file mode 100644 index 0000000..5bc7b33 --- /dev/null +++ b/data/greenplum/dim_user/part-00000-d05900af-4ef1-4c92-8c32-c9cecac6e029-c000.csv @@ -0,0 +1,6 @@ +user_id,name,age,email,registration_date +1,Alice,25,alice@mail.com,2023-01-10 +5,Ethan,35,ethan@gmail.com,2023-03-10 +2,Bob,30,bob@gmail.com,2023-02-05 +3,Charlie,22,charlie@mail.com,2023-02-20 +4,Diana,28,diana@mail.com,2023-03-01 diff --git a/data/greenplum/fact_enrollments/._SUCCESS.crc b/data/greenplum/fact_enrollments/._SUCCESS.crc new file mode 100644 index 0000000..3b7b044 Binary files /dev/null and b/data/greenplum/fact_enrollments/._SUCCESS.crc differ diff --git a/data/greenplum/fact_enrollments/.part-00000-d311fabc-8fdc-47ee-9104-12970d7f94dc-c000.csv.crc b/data/greenplum/fact_enrollments/.part-00000-d311fabc-8fdc-47ee-9104-12970d7f94dc-c000.csv.crc new file mode 100644 index 0000000..f94d252 Binary files /dev/null and b/data/greenplum/fact_enrollments/.part-00000-d311fabc-8fdc-47ee-9104-12970d7f94dc-c000.csv.crc differ diff --git a/data/greenplum/fact_enrollments/_SUCCESS b/data/greenplum/fact_enrollments/_SUCCESS new file mode 100644 index 0000000..e69de29 diff --git a/data/greenplum/fact_enrollments/part-00000-d311fabc-8fdc-47ee-9104-12970d7f94dc-c000.csv b/data/greenplum/fact_enrollments/part-00000-d311fabc-8fdc-47ee-9104-12970d7f94dc-c000.csv new file mode 100644 index 0000000..98482fe --- /dev/null +++ b/data/greenplum/fact_enrollments/part-00000-d311fabc-8fdc-47ee-9104-12970d7f94dc-c000.csv @@ -0,0 +1,6 @@ +user_id,course_id,enrolled_at +1,2,2023-02-01T00:00:00.000+03:00 +1,1,2023-01-15T00:00:00.000+03:00 +4,3,2023-04-01T00:00:00.000+03:00 +2,1,2023-01-20T00:00:00.000+03:00 +3,2,2023-03-05T00:00:00.000+03:00 diff --git a/data/greenplum/fact_lesson_views/._SUCCESS.crc b/data/greenplum/fact_lesson_views/._SUCCESS.crc new file mode 100644 index 0000000..3b7b044 Binary files /dev/null and b/data/greenplum/fact_lesson_views/._SUCCESS.crc differ diff --git a/data/greenplum/fact_lesson_views/.part-00000-f8a87f91-7c0d-4669-b996-3e985d8c4d5f-c000.csv.crc b/data/greenplum/fact_lesson_views/.part-00000-f8a87f91-7c0d-4669-b996-3e985d8c4d5f-c000.csv.crc new file mode 100644 index 0000000..6bf7ebe Binary files /dev/null and b/data/greenplum/fact_lesson_views/.part-00000-f8a87f91-7c0d-4669-b996-3e985d8c4d5f-c000.csv.crc differ diff --git a/data/greenplum/fact_lesson_views/_SUCCESS b/data/greenplum/fact_lesson_views/_SUCCESS new file mode 100644 index 0000000..e69de29 diff --git a/data/greenplum/fact_lesson_views/part-00000-f8a87f91-7c0d-4669-b996-3e985d8c4d5f-c000.csv b/data/greenplum/fact_lesson_views/part-00000-f8a87f91-7c0d-4669-b996-3e985d8c4d5f-c000.csv new file mode 100644 index 0000000..3524f89 --- /dev/null +++ b/data/greenplum/fact_lesson_views/part-00000-f8a87f91-7c0d-4669-b996-3e985d8c4d5f-c000.csv @@ -0,0 +1,7 @@ +user_id,lesson_id,course_id,viewed_at +1,2,1,2023-01-16T10:15:00.000+03:00 +1,1,1,2023-01-16T10:00:00.000+03:00 +4,4,3,2023-04-02T10:00:00.000+03:00 +3,3,2,2023-03-06T12:00:00.000+03:00 +2,1,1,2023-01-21T09:00:00.000+03:00 +4,5,3,2023-04-03T10:00:00.000+03:00 diff --git a/data/marts/clickhouse/course_completion_rate/._SUCCESS.crc b/data/marts/clickhouse/course_completion_rate/._SUCCESS.crc new file mode 100644 index 0000000..3b7b044 Binary files /dev/null and b/data/marts/clickhouse/course_completion_rate/._SUCCESS.crc differ diff --git a/data/marts/clickhouse/course_completion_rate/.part-00000-c4867fff-8099-44f4-b764-96b073565cbf-c000.csv.crc b/data/marts/clickhouse/course_completion_rate/.part-00000-c4867fff-8099-44f4-b764-96b073565cbf-c000.csv.crc new file mode 100644 index 0000000..a8602de Binary files /dev/null and b/data/marts/clickhouse/course_completion_rate/.part-00000-c4867fff-8099-44f4-b764-96b073565cbf-c000.csv.crc differ diff --git a/data/marts/clickhouse/course_completion_rate/_SUCCESS b/data/marts/clickhouse/course_completion_rate/_SUCCESS new file mode 100644 index 0000000..e69de29 diff --git a/data/marts/clickhouse/course_completion_rate/part-00000-c4867fff-8099-44f4-b764-96b073565cbf-c000.csv b/data/marts/clickhouse/course_completion_rate/part-00000-c4867fff-8099-44f4-b764-96b073565cbf-c000.csv new file mode 100644 index 0000000..0d85c86 --- /dev/null +++ b/data/marts/clickhouse/course_completion_rate/part-00000-c4867fff-8099-44f4-b764-96b073565cbf-c000.csv @@ -0,0 +1,6 @@ +user_id,user_name,course_id,course_title,lessons_in_course,lessons_viewed,completion_rate +1,Alice,1,SQL для начинающих,2,2,1.0 +1,Alice,2,Python для анализа данных,1,0,0.0 +2,Bob,1,SQL для начинающих,2,1,0.5 +3,Charlie,2,Python для анализа данных,1,1,1.0 +4,Diana,3,BI с нуля,2,2,1.0 diff --git a/data/marts/clickhouse/inactive_users_summary/._SUCCESS.crc b/data/marts/clickhouse/inactive_users_summary/._SUCCESS.crc new file mode 100644 index 0000000..3b7b044 Binary files /dev/null and b/data/marts/clickhouse/inactive_users_summary/._SUCCESS.crc differ diff --git a/data/marts/clickhouse/inactive_users_summary/.part-00000-f06a0d71-9736-4628-bb4e-38dc5be14d15-c000.csv.crc b/data/marts/clickhouse/inactive_users_summary/.part-00000-f06a0d71-9736-4628-bb4e-38dc5be14d15-c000.csv.crc new file mode 100644 index 0000000..6329fa2 Binary files /dev/null and b/data/marts/clickhouse/inactive_users_summary/.part-00000-f06a0d71-9736-4628-bb4e-38dc5be14d15-c000.csv.crc differ diff --git a/data/marts/clickhouse/inactive_users_summary/_SUCCESS b/data/marts/clickhouse/inactive_users_summary/_SUCCESS new file mode 100644 index 0000000..e69de29 diff --git a/data/marts/clickhouse/inactive_users_summary/part-00000-f06a0d71-9736-4628-bb4e-38dc5be14d15-c000.csv b/data/marts/clickhouse/inactive_users_summary/part-00000-f06a0d71-9736-4628-bb4e-38dc5be14d15-c000.csv new file mode 100644 index 0000000..484fef8 --- /dev/null +++ b/data/marts/clickhouse/inactive_users_summary/part-00000-f06a0d71-9736-4628-bb4e-38dc5be14d15-c000.csv @@ -0,0 +1,2 @@ +user_id,user_name,user_email,user_age,user_registration_date,enrollments_count +5,Ethan,ethan@gmail.com,35,2023-03-10,0 diff --git a/data/marts/clickhouse/lesson_popularity_summary/._SUCCESS.crc b/data/marts/clickhouse/lesson_popularity_summary/._SUCCESS.crc new file mode 100644 index 0000000..3b7b044 Binary files /dev/null and b/data/marts/clickhouse/lesson_popularity_summary/._SUCCESS.crc differ diff --git a/data/marts/clickhouse/lesson_popularity_summary/.part-00000-8115cf5c-950f-4566-9655-a4eb5a49c3b3-c000.csv.crc b/data/marts/clickhouse/lesson_popularity_summary/.part-00000-8115cf5c-950f-4566-9655-a4eb5a49c3b3-c000.csv.crc new file mode 100644 index 0000000..40eec70 Binary files /dev/null and b/data/marts/clickhouse/lesson_popularity_summary/.part-00000-8115cf5c-950f-4566-9655-a4eb5a49c3b3-c000.csv.crc differ diff --git a/data/marts/clickhouse/lesson_popularity_summary/_SUCCESS b/data/marts/clickhouse/lesson_popularity_summary/_SUCCESS new file mode 100644 index 0000000..e69de29 diff --git a/data/marts/clickhouse/lesson_popularity_summary/part-00000-8115cf5c-950f-4566-9655-a4eb5a49c3b3-c000.csv b/data/marts/clickhouse/lesson_popularity_summary/part-00000-8115cf5c-950f-4566-9655-a4eb5a49c3b3-c000.csv new file mode 100644 index 0000000..9939a3d --- /dev/null +++ b/data/marts/clickhouse/lesson_popularity_summary/part-00000-8115cf5c-950f-4566-9655-a4eb5a49c3b3-c000.csv @@ -0,0 +1,6 @@ +lesson_id,lesson_title,course_id,course_title,total_views,unique_users,first_view,last_view +1,SELECT и FROM,1,SQL для начинающих,2,2,2023-01-16T10:00:00.000+03:00,2023-01-21T09:00:00.000+03:00 +2,JOIN,1,SQL для начинающих,1,1,2023-01-16T10:15:00.000+03:00,2023-01-16T10:15:00.000+03:00 +3,Pandas,2,Python для анализа данных,1,1,2023-03-06T12:00:00.000+03:00,2023-03-06T12:00:00.000+03:00 +4,Основы BI,3,BI с нуля,1,1,2023-04-02T10:00:00.000+03:00,2023-04-02T10:00:00.000+03:00 +5,Метрики и дашборды,3,BI с нуля,1,1,2023-04-03T10:00:00.000+03:00,2023-04-03T10:00:00.000+03:00 diff --git a/data/marts/greenplum/course_completion_rate/._SUCCESS.crc b/data/marts/greenplum/course_completion_rate/._SUCCESS.crc new file mode 100644 index 0000000..3b7b044 Binary files /dev/null and b/data/marts/greenplum/course_completion_rate/._SUCCESS.crc differ diff --git a/data/marts/greenplum/course_completion_rate/.part-00000-e353fa40-b1ae-4614-8932-8c694ff4295f-c000.csv.crc b/data/marts/greenplum/course_completion_rate/.part-00000-e353fa40-b1ae-4614-8932-8c694ff4295f-c000.csv.crc new file mode 100644 index 0000000..a8602de Binary files /dev/null and b/data/marts/greenplum/course_completion_rate/.part-00000-e353fa40-b1ae-4614-8932-8c694ff4295f-c000.csv.crc differ diff --git a/data/marts/greenplum/course_completion_rate/_SUCCESS b/data/marts/greenplum/course_completion_rate/_SUCCESS new file mode 100644 index 0000000..e69de29 diff --git a/data/marts/greenplum/course_completion_rate/part-00000-e353fa40-b1ae-4614-8932-8c694ff4295f-c000.csv b/data/marts/greenplum/course_completion_rate/part-00000-e353fa40-b1ae-4614-8932-8c694ff4295f-c000.csv new file mode 100644 index 0000000..0d85c86 --- /dev/null +++ b/data/marts/greenplum/course_completion_rate/part-00000-e353fa40-b1ae-4614-8932-8c694ff4295f-c000.csv @@ -0,0 +1,6 @@ +user_id,user_name,course_id,course_title,lessons_in_course,lessons_viewed,completion_rate +1,Alice,1,SQL для начинающих,2,2,1.0 +1,Alice,2,Python для анализа данных,1,0,0.0 +2,Bob,1,SQL для начинающих,2,1,0.5 +3,Charlie,2,Python для анализа данных,1,1,1.0 +4,Diana,3,BI с нуля,2,2,1.0 diff --git a/data/marts/greenplum/inactive_users_summary/._SUCCESS.crc b/data/marts/greenplum/inactive_users_summary/._SUCCESS.crc new file mode 100644 index 0000000..3b7b044 Binary files /dev/null and b/data/marts/greenplum/inactive_users_summary/._SUCCESS.crc differ diff --git a/data/marts/greenplum/inactive_users_summary/.part-00000-cf2138fd-4baa-4151-b5f5-630b6a4b5e58-c000.csv.crc b/data/marts/greenplum/inactive_users_summary/.part-00000-cf2138fd-4baa-4151-b5f5-630b6a4b5e58-c000.csv.crc new file mode 100644 index 0000000..f3885aa Binary files /dev/null and b/data/marts/greenplum/inactive_users_summary/.part-00000-cf2138fd-4baa-4151-b5f5-630b6a4b5e58-c000.csv.crc differ diff --git a/data/marts/greenplum/inactive_users_summary/_SUCCESS b/data/marts/greenplum/inactive_users_summary/_SUCCESS new file mode 100644 index 0000000..e69de29 diff --git a/data/marts/greenplum/inactive_users_summary/part-00000-cf2138fd-4baa-4151-b5f5-630b6a4b5e58-c000.csv b/data/marts/greenplum/inactive_users_summary/part-00000-cf2138fd-4baa-4151-b5f5-630b6a4b5e58-c000.csv new file mode 100644 index 0000000..0a03e95 --- /dev/null +++ b/data/marts/greenplum/inactive_users_summary/part-00000-cf2138fd-4baa-4151-b5f5-630b6a4b5e58-c000.csv @@ -0,0 +1,2 @@ +user_id,user_name,email,age,registration_date,enrollments_count +5,Ethan,ethan@gmail.com,35,2023-03-10,0 diff --git a/data/marts/greenplum/lesson_popularity_summary/._SUCCESS.crc b/data/marts/greenplum/lesson_popularity_summary/._SUCCESS.crc new file mode 100644 index 0000000..3b7b044 Binary files /dev/null and b/data/marts/greenplum/lesson_popularity_summary/._SUCCESS.crc differ diff --git a/data/marts/greenplum/lesson_popularity_summary/.part-00000-4e240af5-02fb-4c41-a17f-eb33ee5153a4-c000.csv.crc b/data/marts/greenplum/lesson_popularity_summary/.part-00000-4e240af5-02fb-4c41-a17f-eb33ee5153a4-c000.csv.crc new file mode 100644 index 0000000..40eec70 Binary files /dev/null and b/data/marts/greenplum/lesson_popularity_summary/.part-00000-4e240af5-02fb-4c41-a17f-eb33ee5153a4-c000.csv.crc differ diff --git a/data/marts/greenplum/lesson_popularity_summary/_SUCCESS b/data/marts/greenplum/lesson_popularity_summary/_SUCCESS new file mode 100644 index 0000000..e69de29 diff --git a/data/marts/greenplum/lesson_popularity_summary/part-00000-4e240af5-02fb-4c41-a17f-eb33ee5153a4-c000.csv b/data/marts/greenplum/lesson_popularity_summary/part-00000-4e240af5-02fb-4c41-a17f-eb33ee5153a4-c000.csv new file mode 100644 index 0000000..9939a3d --- /dev/null +++ b/data/marts/greenplum/lesson_popularity_summary/part-00000-4e240af5-02fb-4c41-a17f-eb33ee5153a4-c000.csv @@ -0,0 +1,6 @@ +lesson_id,lesson_title,course_id,course_title,total_views,unique_users,first_view,last_view +1,SELECT и FROM,1,SQL для начинающих,2,2,2023-01-16T10:00:00.000+03:00,2023-01-21T09:00:00.000+03:00 +2,JOIN,1,SQL для начинающих,1,1,2023-01-16T10:15:00.000+03:00,2023-01-16T10:15:00.000+03:00 +3,Pandas,2,Python для анализа данных,1,1,2023-03-06T12:00:00.000+03:00,2023-03-06T12:00:00.000+03:00 +4,Основы BI,3,BI с нуля,1,1,2023-04-02T10:00:00.000+03:00,2023-04-02T10:00:00.000+03:00 +5,Метрики и дашборды,3,BI с нуля,1,1,2023-04-03T10:00:00.000+03:00,2023-04-03T10:00:00.000+03:00 diff --git a/data/marts/postgresql/course_summary/._SUCCESS.crc b/data/marts/postgresql/course_summary/._SUCCESS.crc new file mode 100644 index 0000000..3b7b044 Binary files /dev/null and b/data/marts/postgresql/course_summary/._SUCCESS.crc differ diff --git a/data/marts/postgresql/course_summary/.part-00000-7777b1b0-c1ca-4556-a247-6b27cf47f938-c000.csv.crc b/data/marts/postgresql/course_summary/.part-00000-7777b1b0-c1ca-4556-a247-6b27cf47f938-c000.csv.crc new file mode 100644 index 0000000..9971373 Binary files /dev/null and b/data/marts/postgresql/course_summary/.part-00000-7777b1b0-c1ca-4556-a247-6b27cf47f938-c000.csv.crc differ diff --git a/data/marts/postgresql/course_summary/_SUCCESS b/data/marts/postgresql/course_summary/_SUCCESS new file mode 100644 index 0000000..e69de29 diff --git a/data/marts/postgresql/course_summary/part-00000-7777b1b0-c1ca-4556-a247-6b27cf47f938-c000.csv b/data/marts/postgresql/course_summary/part-00000-7777b1b0-c1ca-4556-a247-6b27cf47f938-c000.csv new file mode 100644 index 0000000..43d90df --- /dev/null +++ b/data/marts/postgresql/course_summary/part-00000-7777b1b0-c1ca-4556-a247-6b27cf47f938-c000.csv @@ -0,0 +1,4 @@ +course_id,course_title,total_views,unique_users,lessons_count,avg_views_per_user,first_viewed_at,last_viewed_at +1,SQL для начинающих,3,2,2,1.5,2023-01-16T10:00:00.000+03:00,2023-01-21T09:00:00.000+03:00 +2,Python для анализа данных,1,2,1,0.5,2023-03-06T12:00:00.000+03:00,2023-03-06T12:00:00.000+03:00 +3,BI с нуля,2,1,2,2.0,2023-04-02T10:00:00.000+03:00,2023-04-03T10:00:00.000+03:00 diff --git a/data/marts/postgresql/platform_summary/._SUCCESS.crc b/data/marts/postgresql/platform_summary/._SUCCESS.crc new file mode 100644 index 0000000..3b7b044 Binary files /dev/null and b/data/marts/postgresql/platform_summary/._SUCCESS.crc differ diff --git a/data/marts/postgresql/platform_summary/.part-00000-188edaca-41e1-43e5-98bb-d9bced06bdf1-c000.csv.crc b/data/marts/postgresql/platform_summary/.part-00000-188edaca-41e1-43e5-98bb-d9bced06bdf1-c000.csv.crc new file mode 100644 index 0000000..c438de6 Binary files /dev/null and b/data/marts/postgresql/platform_summary/.part-00000-188edaca-41e1-43e5-98bb-d9bced06bdf1-c000.csv.crc differ diff --git a/data/marts/postgresql/platform_summary/_SUCCESS b/data/marts/postgresql/platform_summary/_SUCCESS new file mode 100644 index 0000000..e69de29 diff --git a/data/marts/postgresql/platform_summary/part-00000-188edaca-41e1-43e5-98bb-d9bced06bdf1-c000.csv b/data/marts/postgresql/platform_summary/part-00000-188edaca-41e1-43e5-98bb-d9bced06bdf1-c000.csv new file mode 100644 index 0000000..d1671a6 --- /dev/null +++ b/data/marts/postgresql/platform_summary/part-00000-188edaca-41e1-43e5-98bb-d9bced06bdf1-c000.csv @@ -0,0 +1,2 @@ +total_users,total_courses,total_lessons,users_with_views,avg_lessons_per_course,avg_views_per_lesson +5,3,5,4,1.67,2.6 diff --git a/data/marts/postgresql/user_activity_summary/._SUCCESS.crc b/data/marts/postgresql/user_activity_summary/._SUCCESS.crc new file mode 100644 index 0000000..3b7b044 Binary files /dev/null and b/data/marts/postgresql/user_activity_summary/._SUCCESS.crc differ diff --git a/data/marts/postgresql/user_activity_summary/.part-00000-0ed600f1-d0ee-432a-86f0-f7e2e95eb025-c000.csv.crc b/data/marts/postgresql/user_activity_summary/.part-00000-0ed600f1-d0ee-432a-86f0-f7e2e95eb025-c000.csv.crc new file mode 100644 index 0000000..54e40f2 Binary files /dev/null and b/data/marts/postgresql/user_activity_summary/.part-00000-0ed600f1-d0ee-432a-86f0-f7e2e95eb025-c000.csv.crc differ diff --git a/data/marts/postgresql/user_activity_summary/_SUCCESS b/data/marts/postgresql/user_activity_summary/_SUCCESS new file mode 100644 index 0000000..e69de29 diff --git a/data/marts/postgresql/user_activity_summary/part-00000-0ed600f1-d0ee-432a-86f0-f7e2e95eb025-c000.csv b/data/marts/postgresql/user_activity_summary/part-00000-0ed600f1-d0ee-432a-86f0-f7e2e95eb025-c000.csv new file mode 100644 index 0000000..10bf4b9 --- /dev/null +++ b/data/marts/postgresql/user_activity_summary/part-00000-0ed600f1-d0ee-432a-86f0-f7e2e95eb025-c000.csv @@ -0,0 +1,5 @@ +user_id,name,enrollment_count,viewed_lessons_count,last_view,first_view,engagement_rate +2,Bob,1,1,2023-01-21T09:00:00.000+03:00,2023-01-21T09:00:00.000+03:00,50.0% +1,Alice,2,2,2023-01-16T10:15:00.000+03:00,2023-01-16T10:00:00.000+03:00,66.67% +3,Charlie,1,1,2023-03-06T12:00:00.000+03:00,2023-03-06T12:00:00.000+03:00,100.0% +4,Diana,1,2,2023-04-03T10:00:00.000+03:00,2023-04-02T10:00:00.000+03:00,100.0% diff --git a/data/postgresql/courses/._SUCCESS.crc b/data/postgresql/courses/._SUCCESS.crc new file mode 100644 index 0000000..3b7b044 Binary files /dev/null and b/data/postgresql/courses/._SUCCESS.crc differ diff --git a/data/postgresql/courses/.part-00000-590b85f0-27d0-4842-bc89-bbe601542e72-c000.csv.crc b/data/postgresql/courses/.part-00000-590b85f0-27d0-4842-bc89-bbe601542e72-c000.csv.crc new file mode 100644 index 0000000..9bcdab1 Binary files /dev/null and b/data/postgresql/courses/.part-00000-590b85f0-27d0-4842-bc89-bbe601542e72-c000.csv.crc differ diff --git a/data/postgresql/courses/_SUCCESS b/data/postgresql/courses/_SUCCESS new file mode 100644 index 0000000..e69de29 diff --git a/data/postgresql/courses/part-00000-590b85f0-27d0-4842-bc89-bbe601542e72-c000.csv b/data/postgresql/courses/part-00000-590b85f0-27d0-4842-bc89-bbe601542e72-c000.csv new file mode 100644 index 0000000..5f19346 --- /dev/null +++ b/data/postgresql/courses/part-00000-590b85f0-27d0-4842-bc89-bbe601542e72-c000.csv @@ -0,0 +1,4 @@ +id,title,category,created_at +1,SQL для начинающих,data,2023-01-01 +2,Python для анализа данных,programming,2023-01-15 +3,BI с нуля,business,2023-03-01 diff --git a/data/postgresql/enrollments/._SUCCESS.crc b/data/postgresql/enrollments/._SUCCESS.crc new file mode 100644 index 0000000..3b7b044 Binary files /dev/null and b/data/postgresql/enrollments/._SUCCESS.crc differ diff --git a/data/postgresql/enrollments/.part-00000-ea9b6889-39de-4b73-9772-55366146f7f7-c000.csv.crc b/data/postgresql/enrollments/.part-00000-ea9b6889-39de-4b73-9772-55366146f7f7-c000.csv.crc new file mode 100644 index 0000000..00aade4 Binary files /dev/null and b/data/postgresql/enrollments/.part-00000-ea9b6889-39de-4b73-9772-55366146f7f7-c000.csv.crc differ diff --git a/data/postgresql/enrollments/_SUCCESS b/data/postgresql/enrollments/_SUCCESS new file mode 100644 index 0000000..e69de29 diff --git a/data/postgresql/enrollments/part-00000-ea9b6889-39de-4b73-9772-55366146f7f7-c000.csv b/data/postgresql/enrollments/part-00000-ea9b6889-39de-4b73-9772-55366146f7f7-c000.csv new file mode 100644 index 0000000..995a0cc --- /dev/null +++ b/data/postgresql/enrollments/part-00000-ea9b6889-39de-4b73-9772-55366146f7f7-c000.csv @@ -0,0 +1,6 @@ +id,user_id,course_id,enrolled_at +1,1,1,2023-01-15 +2,1,2,2023-02-01 +3,2,1,2023-01-20 +4,3,2,2023-03-05 +5,4,3,2023-04-01 diff --git a/data/postgresql/lesson_views/._SUCCESS.crc b/data/postgresql/lesson_views/._SUCCESS.crc new file mode 100644 index 0000000..3b7b044 Binary files /dev/null and b/data/postgresql/lesson_views/._SUCCESS.crc differ diff --git a/data/postgresql/lesson_views/.part-00000-4388aea9-9203-4df1-925b-bfe2cc27cdf0-c000.csv.crc b/data/postgresql/lesson_views/.part-00000-4388aea9-9203-4df1-925b-bfe2cc27cdf0-c000.csv.crc new file mode 100644 index 0000000..2628fb8 Binary files /dev/null and b/data/postgresql/lesson_views/.part-00000-4388aea9-9203-4df1-925b-bfe2cc27cdf0-c000.csv.crc differ diff --git a/data/postgresql/lesson_views/_SUCCESS b/data/postgresql/lesson_views/_SUCCESS new file mode 100644 index 0000000..e69de29 diff --git a/data/postgresql/lesson_views/part-00000-4388aea9-9203-4df1-925b-bfe2cc27cdf0-c000.csv b/data/postgresql/lesson_views/part-00000-4388aea9-9203-4df1-925b-bfe2cc27cdf0-c000.csv new file mode 100644 index 0000000..944cdfb --- /dev/null +++ b/data/postgresql/lesson_views/part-00000-4388aea9-9203-4df1-925b-bfe2cc27cdf0-c000.csv @@ -0,0 +1,7 @@ +id,user_id,lesson_id,viewed_at +1,1,1,2023-01-16T10:00:00.000+03:00 +2,1,2,2023-01-16T10:15:00.000+03:00 +3,2,1,2023-01-21T09:00:00.000+03:00 +4,3,3,2023-03-06T12:00:00.000+03:00 +5,4,4,2023-04-02T10:00:00.000+03:00 +6,4,5,2023-04-03T10:00:00.000+03:00 diff --git a/data/postgresql/lessons/._SUCCESS.crc b/data/postgresql/lessons/._SUCCESS.crc new file mode 100644 index 0000000..3b7b044 Binary files /dev/null and b/data/postgresql/lessons/._SUCCESS.crc differ diff --git a/data/postgresql/lessons/.part-00000-35ab76dc-0f6b-48ef-9a8d-5a6396efdb9e-c000.csv.crc b/data/postgresql/lessons/.part-00000-35ab76dc-0f6b-48ef-9a8d-5a6396efdb9e-c000.csv.crc new file mode 100644 index 0000000..a91e186 Binary files /dev/null and b/data/postgresql/lessons/.part-00000-35ab76dc-0f6b-48ef-9a8d-5a6396efdb9e-c000.csv.crc differ diff --git a/data/postgresql/lessons/_SUCCESS b/data/postgresql/lessons/_SUCCESS new file mode 100644 index 0000000..e69de29 diff --git a/data/postgresql/lessons/part-00000-35ab76dc-0f6b-48ef-9a8d-5a6396efdb9e-c000.csv b/data/postgresql/lessons/part-00000-35ab76dc-0f6b-48ef-9a8d-5a6396efdb9e-c000.csv new file mode 100644 index 0000000..38d29a7 --- /dev/null +++ b/data/postgresql/lessons/part-00000-35ab76dc-0f6b-48ef-9a8d-5a6396efdb9e-c000.csv @@ -0,0 +1,6 @@ +id,course_id,title,duration_min +1,1,SELECT и FROM,10 +2,1,JOIN,15 +3,2,Pandas,20 +4,3,Основы BI,12 +5,3,Метрики и дашборды,18 diff --git a/data/postgresql/users/._SUCCESS.crc b/data/postgresql/users/._SUCCESS.crc new file mode 100644 index 0000000..3b7b044 Binary files /dev/null and b/data/postgresql/users/._SUCCESS.crc differ diff --git a/data/postgresql/users/.part-00000-c5d54c54-96a4-4465-ac64-2e090564e64c-c000.csv.crc b/data/postgresql/users/.part-00000-c5d54c54-96a4-4465-ac64-2e090564e64c-c000.csv.crc new file mode 100644 index 0000000..793bb33 Binary files /dev/null and b/data/postgresql/users/.part-00000-c5d54c54-96a4-4465-ac64-2e090564e64c-c000.csv.crc differ diff --git a/data/postgresql/users/_SUCCESS b/data/postgresql/users/_SUCCESS new file mode 100644 index 0000000..e69de29 diff --git a/data/postgresql/users/part-00000-c5d54c54-96a4-4465-ac64-2e090564e64c-c000.csv b/data/postgresql/users/part-00000-c5d54c54-96a4-4465-ac64-2e090564e64c-c000.csv new file mode 100644 index 0000000..8cc56d0 --- /dev/null +++ b/data/postgresql/users/part-00000-c5d54c54-96a4-4465-ac64-2e090564e64c-c000.csv @@ -0,0 +1,6 @@ +id,name,age,email,registration_date +1,Alice,25,alice@mail.com,2023-01-10 +2,Bob,30,bob@gmail.com,2023-02-05 +3,Charlie,22,charlie@mail.com,2023-02-20 +4,Diana,28,diana@mail.com,2023-03-01 +5,Ethan,35,ethan@gmail.com,2023-03-10 diff --git a/jars/clickhouse-jdbc-0.3.2-shaded.jar b/jars/clickhouse-jdbc-0.3.2-shaded.jar new file mode 100644 index 0000000..a4cf5c6 Binary files /dev/null and b/jars/clickhouse-jdbc-0.3.2-shaded.jar differ diff --git a/jars/postgresql-42.6.0.jar b/jars/postgresql-42.6.0.jar new file mode 100644 index 0000000..02f902a Binary files /dev/null and b/jars/postgresql-42.6.0.jar differ