├── .gitignore ├── .scalafmt.conf ├── LICENSE ├── README.md ├── img └── pic1.jpg ├── pom.xml ├── script ├── create_dataset.py ├── crontab.py ├── deploy.py ├── submit.py └── topic.py ├── sql ├── impala.sql ├── window_data_move.sql ├── window_partition_shift.sql └── window_view_alter.sql └── src ├── main ├── resources │ ├── application.conf │ ├── ip2region.db │ └── log4j.properties └── scala │ └── com │ └── wzx │ ├── common │ ├── Constant.scala │ ├── FilePath.scala │ └── TableName.scala │ ├── entity │ ├── Event.scala │ └── Profile.scala │ ├── extracting │ ├── NewRegisterExtract.scala │ └── VideoVisitOver100.scala │ ├── mock │ └── Upload2Kafka.scala │ ├── sink │ └── KuduSink.scala │ ├── streaming │ ├── DataExtract.scala │ └── ProfileMapper.scala │ └── util │ ├── DateUtil.scala │ ├── IpUtil.scala │ ├── OptionUtil.scala │ └── TransformUtil.scala └── test ├── resources ├── log4j.properties └── mock_data └── scala └── com └── wzx ├── extracting ├── NewRegisterExtractTest.scala └── VideoVisitOver100Test.scala ├── mock └── Upload2KafkaTest.scala └── streaming ├── DataExtractTest.scala └── ProfileMapperTest.scala /.gitignore: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/wzx140/LabelLogAnalysis/HEAD/.gitignore -------------------------------------------------------------------------------- /.scalafmt.conf: -------------------------------------------------------------------------------- 1 | version = 2.5.0 -------------------------------------------------------------------------------- /LICENSE: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/wzx140/LabelLogAnalysis/HEAD/LICENSE -------------------------------------------------------------------------------- /README.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/wzx140/LabelLogAnalysis/HEAD/README.md -------------------------------------------------------------------------------- /img/pic1.jpg: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/wzx140/LabelLogAnalysis/HEAD/img/pic1.jpg -------------------------------------------------------------------------------- /pom.xml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/wzx140/LabelLogAnalysis/HEAD/pom.xml -------------------------------------------------------------------------------- /script/create_dataset.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/wzx140/LabelLogAnalysis/HEAD/script/create_dataset.py -------------------------------------------------------------------------------- /script/crontab.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/wzx140/LabelLogAnalysis/HEAD/script/crontab.py -------------------------------------------------------------------------------- /script/deploy.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/wzx140/LabelLogAnalysis/HEAD/script/deploy.py -------------------------------------------------------------------------------- /script/submit.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/wzx140/LabelLogAnalysis/HEAD/script/submit.py -------------------------------------------------------------------------------- /script/topic.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/wzx140/LabelLogAnalysis/HEAD/script/topic.py -------------------------------------------------------------------------------- /sql/impala.sql: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/wzx140/LabelLogAnalysis/HEAD/sql/impala.sql -------------------------------------------------------------------------------- /sql/window_data_move.sql: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/wzx140/LabelLogAnalysis/HEAD/sql/window_data_move.sql -------------------------------------------------------------------------------- /sql/window_partition_shift.sql: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/wzx140/LabelLogAnalysis/HEAD/sql/window_partition_shift.sql -------------------------------------------------------------------------------- /sql/window_view_alter.sql: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/wzx140/LabelLogAnalysis/HEAD/sql/window_view_alter.sql -------------------------------------------------------------------------------- /src/main/resources/application.conf: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/wzx140/LabelLogAnalysis/HEAD/src/main/resources/application.conf -------------------------------------------------------------------------------- /src/main/resources/ip2region.db: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/wzx140/LabelLogAnalysis/HEAD/src/main/resources/ip2region.db -------------------------------------------------------------------------------- /src/main/resources/log4j.properties: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/wzx140/LabelLogAnalysis/HEAD/src/main/resources/log4j.properties -------------------------------------------------------------------------------- /src/main/scala/com/wzx/common/Constant.scala: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/wzx140/LabelLogAnalysis/HEAD/src/main/scala/com/wzx/common/Constant.scala -------------------------------------------------------------------------------- /src/main/scala/com/wzx/common/FilePath.scala: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/wzx140/LabelLogAnalysis/HEAD/src/main/scala/com/wzx/common/FilePath.scala -------------------------------------------------------------------------------- /src/main/scala/com/wzx/common/TableName.scala: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/wzx140/LabelLogAnalysis/HEAD/src/main/scala/com/wzx/common/TableName.scala -------------------------------------------------------------------------------- /src/main/scala/com/wzx/entity/Event.scala: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/wzx140/LabelLogAnalysis/HEAD/src/main/scala/com/wzx/entity/Event.scala -------------------------------------------------------------------------------- /src/main/scala/com/wzx/entity/Profile.scala: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/wzx140/LabelLogAnalysis/HEAD/src/main/scala/com/wzx/entity/Profile.scala -------------------------------------------------------------------------------- /src/main/scala/com/wzx/extracting/NewRegisterExtract.scala: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/wzx140/LabelLogAnalysis/HEAD/src/main/scala/com/wzx/extracting/NewRegisterExtract.scala -------------------------------------------------------------------------------- /src/main/scala/com/wzx/extracting/VideoVisitOver100.scala: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/wzx140/LabelLogAnalysis/HEAD/src/main/scala/com/wzx/extracting/VideoVisitOver100.scala -------------------------------------------------------------------------------- /src/main/scala/com/wzx/mock/Upload2Kafka.scala: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/wzx140/LabelLogAnalysis/HEAD/src/main/scala/com/wzx/mock/Upload2Kafka.scala -------------------------------------------------------------------------------- /src/main/scala/com/wzx/sink/KuduSink.scala: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/wzx140/LabelLogAnalysis/HEAD/src/main/scala/com/wzx/sink/KuduSink.scala -------------------------------------------------------------------------------- /src/main/scala/com/wzx/streaming/DataExtract.scala: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/wzx140/LabelLogAnalysis/HEAD/src/main/scala/com/wzx/streaming/DataExtract.scala -------------------------------------------------------------------------------- /src/main/scala/com/wzx/streaming/ProfileMapper.scala: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/wzx140/LabelLogAnalysis/HEAD/src/main/scala/com/wzx/streaming/ProfileMapper.scala -------------------------------------------------------------------------------- /src/main/scala/com/wzx/util/DateUtil.scala: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/wzx140/LabelLogAnalysis/HEAD/src/main/scala/com/wzx/util/DateUtil.scala -------------------------------------------------------------------------------- /src/main/scala/com/wzx/util/IpUtil.scala: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/wzx140/LabelLogAnalysis/HEAD/src/main/scala/com/wzx/util/IpUtil.scala -------------------------------------------------------------------------------- /src/main/scala/com/wzx/util/OptionUtil.scala: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/wzx140/LabelLogAnalysis/HEAD/src/main/scala/com/wzx/util/OptionUtil.scala -------------------------------------------------------------------------------- /src/main/scala/com/wzx/util/TransformUtil.scala: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/wzx140/LabelLogAnalysis/HEAD/src/main/scala/com/wzx/util/TransformUtil.scala -------------------------------------------------------------------------------- /src/test/resources/log4j.properties: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/wzx140/LabelLogAnalysis/HEAD/src/test/resources/log4j.properties -------------------------------------------------------------------------------- /src/test/resources/mock_data: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/wzx140/LabelLogAnalysis/HEAD/src/test/resources/mock_data -------------------------------------------------------------------------------- /src/test/scala/com/wzx/extracting/NewRegisterExtractTest.scala: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/wzx140/LabelLogAnalysis/HEAD/src/test/scala/com/wzx/extracting/NewRegisterExtractTest.scala -------------------------------------------------------------------------------- /src/test/scala/com/wzx/extracting/VideoVisitOver100Test.scala: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/wzx140/LabelLogAnalysis/HEAD/src/test/scala/com/wzx/extracting/VideoVisitOver100Test.scala -------------------------------------------------------------------------------- /src/test/scala/com/wzx/mock/Upload2KafkaTest.scala: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/wzx140/LabelLogAnalysis/HEAD/src/test/scala/com/wzx/mock/Upload2KafkaTest.scala -------------------------------------------------------------------------------- /src/test/scala/com/wzx/streaming/DataExtractTest.scala: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/wzx140/LabelLogAnalysis/HEAD/src/test/scala/com/wzx/streaming/DataExtractTest.scala -------------------------------------------------------------------------------- /src/test/scala/com/wzx/streaming/ProfileMapperTest.scala: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/wzx140/LabelLogAnalysis/HEAD/src/test/scala/com/wzx/streaming/ProfileMapperTest.scala --------------------------------------------------------------------------------