├── .gitignore
├── LICENSE
├── README.md
├── pom.xml
└── src
    ├── main
        └── java
        │   ├── cn
        │       └── net
        │       │   └── communion
        │       │       └── sync
        │       │           ├── elasticsearch
        │       │               └── Client.java
        │       │           ├── entity
        │       │               ├── JobInfo.java
        │       │               └── Node.java
        │       │           ├── helper
        │       │               └── SysProps.java
        │       │           ├── main
        │       │               └── App.java
        │       │           ├── quartz
        │       │               ├── JobScheduler.java
        │       │               └── Listener.java
        │       │           ├── service
        │       │               └── JdbcConnector.java
        │       │           └── task
        │       │               └── Task.java
        │   ├── log4j.properties
        │   └── spring
        │       ├── root.xml
        │       └── xml
        │           ├── client.xml
        │           ├── db.xml
        │           ├── jobs.xml
        │           └── nodes.xml
    └── test
        └── java
            └── cn
                └── net
                    └── communion
                        └── sync
                            └── AppTest.java


/.gitignore:
--------------------------------------------------------------------------------
1 | /target
2 | .settings
3 | .classpath
4 | .project
5 | *.log
6 | sys.properties


--------------------------------------------------------------------------------
/LICENSE:
--------------------------------------------------------------------------------
 1 | The MIT License (MIT)
 2 | 
 3 | Copyright (c) 2016 GongDexing
 4 | 
 5 | Permission is hereby granted, free of charge, to any person obtaining a copy
 6 | of this software and associated documentation files (the "Software"), to deal
 7 | in the Software without restriction, including without limitation the rights
 8 | to use, copy, modify, merge, publish, distribute, sublicense, and/or sell
 9 | copies of the Software, and to permit persons to whom the Software is
10 | furnished to do so, subject to the following conditions:
11 | 
12 | The above copyright notice and this permission notice shall be included in all
13 | copies or substantial portions of the Software.
14 | 
15 | THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
16 | IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
17 | FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL THE
18 | AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
19 | LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM,
20 | OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN THE
21 | SOFTWARE.
22 | 


--------------------------------------------------------------------------------
/README.md:
--------------------------------------------------------------------------------
  1 | ## elasticsearch-mysql简单实用的同步工具
  2 | 简单实用的同步工具，实现mysql数据库中数据定期同步到elasticsearch，只需简单的配置，便能达到非凡的效果。
  3 | 
  4 | ## 配置说明
  5 | 主要配置在spring/xml目录下面的四个xml文件中
  6 | - **client.xml**：配置cluster.name(集群名称)，集群名称要和elasticsearch保持一致，可以参考elasticsearch.yaml文件
  7 | - **db.xml**：配置mysql数据库的连接方式，数据连接池使用的Druid，主要是设置url、username、password，其他采用默认配置即可
  8 | - **jobs.xml**：配置数据同步的任务，可以配置多个job，每个job包括：name(任务名称，不要出现重复)、index(elasticsearch的索引)、type(elasticsearch的type)、cron(任务的调度机制)、sql(查询mysql的sql语句)、step(分页查询的的每页数量limit x, **step**)、params(sql语句的参数，用于实现增量同步)、paramTypes(参数类型)
  9 | - **nodes.xml**：配置同步到的elasticsearch节点，可以配置多个，每个节点包括：ip(节点的ip地址)、port(节点的端口，一般为9300)
 10 | 
 11 | ## 编译运行
 12 | > git clone git@192.168.1.244:hainan-bigdata/elasticsearch-mysql.git<br/>
 13 | > cd elasticsearch-mysql<br/>
 14 | > mvn clean package<br/>
 15 | > java -jar target/elasticsearch-mysql-0.0.1-SNAPSHOT.jar
 16 | 
 17 | ## 测试
 18 | > $ curl -XGET "127.0.0.1:9200/data/comment/_search?pretty"<br/>
 19 | 
 20 | ```js
 21 |  {
 22 |    "took" : 34,
 23 |    "timed_out" : false,
 24 |    "_shards" : {
 25 |      "total" : 5,
 26 |      "successful" : 5,
 27 |      "failed" : 0
 28 |    },
 29 |    "hits" : {
 30 |      "total" : 39,
 31 |      "max_score" : 1.0,
 32 |      "hits" : [
 33 |        {
 34 |          "_index" : "data",
 35 |          "_type" : "comment",
 36 |          ...
 37 | ```
 38 | 
 39 | ## 实现原理
 40 | ### 增量同步
 41 | 为了提供同步的效率和对数据库的压力，建议在配置是都采用增量同步的方式，前提是数据表中有设置与时间相关的字段，根据该字段每次同步只会同步新的数据，而不是把已经同步过的字段再同步一遍。
 42 | ##### 举例说明
 43 | ```
 44 |  <bean class="cn.net.communion.sync.entity.JobInfo"
 45 |   p:name="job2"
 46 |   p:index="data"
 47 |   p:type="comment"
 48 |   p:cron="0/10 * * * * ?"
 49 |   p:sql="select id,comment from tbl_comment where time > ?"
 50 |   p:params="sys.lastTime2"
 51 |   p:paramTypes="12"/>
 52 | ```
 53 | 在job2的配置中设置sql的条件为 **time > ?** ，而 **?** 指的是 **sys.lastTime2** ，这样每次同步都只会上次同步后更新的数据，**sys.lastTime2** 的名称可以随意更改，但是不要出现重复，每次同步完以后， 将开始同步的时间会为**value**， **sys.lastTime2** 作为 **key** 更新到sys.properties文件中。
 54 | > sys.properties文件内容举例
 55 | 
 56 | ```
 57 | #last job finish at
 58 | #Wed Dec 21 15:08:10 CST 2016
 59 | sys.lastTime2=2016-12-21T15\:08\:10.003
 60 | sys.lastTime1=2016-12-21T15\:08\:10.002
 61 | ```
 62 | 
 63 | 因此，要想实现全量同步也非常简单，只需将sys.properties文件删除即可，  当程序没有检测到sys.properties文件，便会将所有的数据同步到elasticsearch中。
 64 | ### 调度机制
 65 | 采用quartz实现任务调度，最小的粒度可以到秒级，涉及quartz相关的代码主要在JobScheduler.java和Listener.java两个文件中
 66 | > JobScheduler部分代码片段
 67 | 
 68 | ```java
 69 | public JobScheduler pushJobs(Collection<JobInfo> infos) {
 70 |     infos.forEach(info -> {
 71 |         JobDetail job = newJob(Task.class).withIdentity(info.getName(), "jobs").build();
 72 |         job.getJobDataMap().put("jobInfo", info);
 73 |         CronTrigger trigger = newTrigger().withIdentity(info.getName(), "triggers")
 74 |                 .withSchedule(cronSchedule(info.getCron())).build();
 75 |         try {
 76 |             scheduler.scheduleJob(job, trigger);
 77 |         } catch (SchedulerException e) {
 78 |             e.printStackTrace();
 79 |         }
 80 |     });
 81 |     return this;
 82 | }
 83 | 
 84 | public boolean isRunning(String jobKey) {
 85 |     try {
 86 |         for (JobExecutionContext context : scheduler.getCurrentlyExecutingJobs()) {
 87 |             if (context.getJobDetail().getKey().getName().equals(jobKey)) {
 88 |                 return true;
 89 |             }
 90 |         }
 91 |     } catch (SchedulerException e) {
 92 |         logger.info("get jobs status failed");
 93 |         e.printStackTrace();
 94 |     }
 95 |     return false;
 96 | }
 97 | 
 98 | public void start() throws SchedulerException {
 99 |     scheduler.start();
100 | }
101 | ```
102 | 
103 | 代码说明：
104 | - **pushJobs()** 实现将jobs.xml配置的job添加进quartz的scheduler中
105 | - **isRunning()** 根据job.name检测某个任务是否处于运行状态，对于调度间隔比较短或者同步时间的比较的任务，可能出现新的任务已经开始然而上个任务还未执行完成，这时新的任务会直接被取消执行
106 | - **start()** 启动任务调度
107 | 
108 | 
109 | > Listener部分代码片段
110 | 
111 | ```java
112 | @Override
113 | public void jobToBeExecuted(JobExecutionContext context) {
114 |     String jobKey = context.getJobDetail().getKey().getName();
115 |     boolean isCancel = JobScheduler.getInstance().isRunning(jobKey);
116 |     context.getJobDetail().getJobDataMap().put("cancel", isCancel);
117 | }
118 | ```
119 | 代码说明:
120 | - 每一个任务执行之前均会调用 **jobToBeExecuted()** ，在该方法中调用 **JobScheduler** 的 **isRunning** 并且设置 **isCancel** 值，如果 **isCancel** 为 **true** 便会取消任务的执行。
121 | 


--------------------------------------------------------------------------------
/pom.xml:
--------------------------------------------------------------------------------
  1 | <project xmlns="http://maven.apache.org/POM/4.0.0" xmlns:xsi="http://www.w3.org/2001/XMLSchema-instance"
  2 | 	xsi:schemaLocation="http://maven.apache.org/POM/4.0.0 http://maven.apache.org/xsd/maven-4.0.0.xsd">
  3 | 	<modelVersion>4.0.0</modelVersion>
  4 | 
  5 | 	<groupId>cn.net.communion</groupId>
  6 | 	<artifactId>elasticsearch-mysql</artifactId>
  7 | 	<version>0.0.1-SNAPSHOT</version>
  8 | 	<packaging>jar</packaging>
  9 | 
 10 | 	<name>elasticsearch-mysql</name>
 11 | 	<url>http://maven.apache.org</url>
 12 | 
 13 | 	<properties>
 14 | 		<project.build.sourceEncoding>UTF-8</project.build.sourceEncoding>
 15 | 	</properties>
 16 | 
 17 | 	<dependencies>
 18 | 		<dependency>
 19 | 			<groupId>junit</groupId>
 20 | 			<artifactId>junit</artifactId>
 21 | 			<version>3.8.1</version>
 22 | 			<scope>test</scope>
 23 | 		</dependency>
 24 | 		<dependency>
 25 | 		    <groupId>org.springframework</groupId>
 26 | 		    <artifactId>spring-core</artifactId>
 27 | 		    <version>4.3.4.RELEASE</version>
 28 | 		</dependency>
 29 | 		
 30 | 		<dependency>
 31 | 		    <groupId>org.springframework</groupId>
 32 | 		    <artifactId>spring-context</artifactId>
 33 | 		    <version>4.3.4.RELEASE</version>
 34 | 		</dependency>
 35 | 		<dependency>
 36 | 		    <groupId>org.springframework</groupId>
 37 | 		    <artifactId>spring-jdbc</artifactId>
 38 | 		    <version>4.3.4.RELEASE</version>
 39 | 		</dependency>
 40 | 		<dependency>
 41 | 		    <groupId>org.springframework</groupId>
 42 | 		    <artifactId>spring-beans</artifactId>
 43 | 		    <version>4.3.4.RELEASE</version>
 44 | 		</dependency>		
 45 | 		<dependency>
 46 | 			<groupId>mysql</groupId>
 47 | 			<artifactId>mysql-connector-java</artifactId>
 48 | 			<version>5.1.22</version>
 49 | 		</dependency>
 50 | 		<dependency>
 51 | 			<groupId>org.quartz-scheduler</groupId>
 52 | 			<artifactId>quartz</artifactId>
 53 | 			<version>2.1.3</version>
 54 | 		</dependency>
 55 | 		<dependency>
 56 | 			<groupId>log4j</groupId>
 57 | 			<artifactId>log4j</artifactId>
 58 | 			<version>1.2.14</version>
 59 | 		</dependency>
 60 | 		<dependency>
 61 | 		    <groupId>org.apache.logging.log4j</groupId>
 62 | 		    <artifactId>log4j-to-slf4j</artifactId>
 63 | 		    <version>2.7</version>
 64 | 		</dependency>
 65 | 		<dependency>
 66 | 		    <groupId>org.slf4j</groupId>
 67 | 		    <artifactId>slf4j-api</artifactId>
 68 | 		    <version>1.7.21</version>
 69 | 		</dependency>
 70 | 		<dependency>
 71 | 		    <groupId>org.slf4j</groupId>
 72 | 		    <artifactId>slf4j-simple</artifactId>
 73 | 		    <version>1.7.21</version>
 74 | 		</dependency>
 75 | 		<dependency>
 76 | 		    <groupId>com.alibaba</groupId>
 77 | 		    <artifactId>druid</artifactId>
 78 | 		    <version>1.0.27</version>
 79 | 		</dependency>
 80 | 		<dependency>
 81 | 		    <groupId>org.elasticsearch.client</groupId>
 82 | 		    <artifactId>transport</artifactId>
 83 | 		    <version>5.1.1</version>
 84 | 		</dependency>
 85 | 		<dependency>
 86 | 		    <groupId>org.elasticsearch</groupId>
 87 | 		    <artifactId>elasticsearch</artifactId>
 88 | 		    <version>5.1.1</version>
 89 | 		</dependency>		
 90 | 	</dependencies>
 91 | 
 92 | 	<build>
 93 | 		<plugins>
 94 | 			<plugin>
 95 | 				<groupId>org.apache.maven.plugins</groupId>
 96 | 				<artifactId>maven-jar-plugin</artifactId>
 97 | 				<configuration>
 98 | 					<archive>
 99 | 						<manifest>
100 | 							<addClasspath>true</addClasspath>
101 | 							<classpathPrefix>lib/</classpathPrefix>
102 | 							<mainClass>cn.net.communion.sync.main.App</mainClass>
103 | 						</manifest>
104 | 					</archive>
105 | 				</configuration>
106 | 			</plugin>
107 | 			<plugin>
108 | 				<groupId>org.apache.maven.plugins</groupId>
109 | 				<artifactId>maven-dependency-plugin</artifactId>
110 | 				<executions>
111 | 					<execution>
112 | 						<id>copy</id>
113 | 						<phase>package</phase>
114 | 						<goals>
115 | 							<goal>copy-dependencies</goal>
116 | 						</goals>
117 | 						<configuration>
118 | 							<outputDirectory>${project.build.directory}/lib</outputDirectory>
119 | 						</configuration>
120 | 					</execution>
121 | 				</executions>
122 | 			</plugin>
123 | 		</plugins>
124 | 		<resources>
125 | 			<resource>
126 | 				<directory>src/main/java</directory>
127 | 				<includes>
128 | 					<include>**/*.properties</include>
129 | 					<include>**/*.xml</include>
130 | 				</includes>
131 | 				<filtering>true</filtering>
132 | 			</resource>
133 | 		</resources>
134 | 	</build>
135 | </project>
136 | 


--------------------------------------------------------------------------------
/src/main/java/cn/net/communion/sync/elasticsearch/Client.java:
--------------------------------------------------------------------------------
 1 | package cn.net.communion.sync.elasticsearch;
 2 | 
 3 | import java.net.InetAddress;
 4 | import java.net.UnknownHostException;
 5 | import java.util.List;
 6 | import java.util.Map;
 7 | import java.util.Set;
 8 | 
 9 | import org.apache.log4j.Logger;
10 | import org.elasticsearch.action.bulk.BulkRequestBuilder;
11 | import org.elasticsearch.action.search.SearchResponse;
12 | import org.elasticsearch.client.transport.TransportClient;
13 | import org.elasticsearch.common.settings.Settings;
14 | import org.elasticsearch.common.transport.InetSocketTransportAddress;
15 | import org.elasticsearch.transport.client.PreBuiltTransportClient;
16 | 
17 | import cn.net.communion.sync.entity.Node;
18 | 
19 | public class Client {
20 |     private static TransportClient client;
21 |     private static Logger logger = Logger.getLogger(Client.class);
22 | 
23 |     private Client(String clusterName, Set<Node> nodes) {
24 |         Settings settings = Settings.builder().put("client.transport.sniff", true)
25 |                 .put("cluster.name", clusterName).build();
26 |         client = new PreBuiltTransportClient(settings);
27 |         nodes.stream().forEach(node -> {
28 |             try {
29 |                 client.addTransportAddress(new InetSocketTransportAddress(
30 |                         InetAddress.getByName(node.getIp()), node.getPort()));
31 |             } catch (UnknownHostException e) {
32 |                 e.printStackTrace();
33 |             }
34 |         });
35 |     }
36 | 
37 |     public static boolean bulkIndex(String index, String type, List<Map<String, Object>> list) {
38 |         BulkRequestBuilder bulkRequest = client.prepareBulk();
39 |         list.stream().forEach(map -> {
40 |             bulkRequest.add(
41 |                     client.prepareIndex(index, type, String.valueOf(map.get("id"))).setSource(map));
42 |         });
43 |         return !bulkRequest.get().hasFailures();
44 |     }
45 | 
46 |     public static void searchAll() {
47 |         SearchResponse response = client.prepareSearch().get();
48 |         response.getHits().forEach(hit -> {
49 |             logger.info(hit.getSource());
50 |         });
51 |     }
52 | 
53 |     public static void searchByIndexType(String index, String type) {
54 |         SearchResponse response = client.prepareSearch(index).setTypes(type).get();
55 |         logger.info(index + "-" + type);
56 |         logger.info(response);
57 |     }
58 | 
59 |     public static void shutdown() {
60 |         client.close();
61 |     }
62 | 
63 | }
64 | 


--------------------------------------------------------------------------------
/src/main/java/cn/net/communion/sync/entity/JobInfo.java:
--------------------------------------------------------------------------------
 1 | package cn.net.communion.sync.entity;
 2 | 
 3 | public class JobInfo {
 4 |     private String name;
 5 |     private String index;
 6 |     private String type;
 7 |     private String cron;
 8 |     private String sql;
 9 |     private long step = 1000;
10 |     private String[] params;
11 |     private int[] paramTypes;
12 | 
13 |     public String getName() {
14 |         return name;
15 |     }
16 | 
17 |     public void setName(String name) {
18 |         this.name = name;
19 |     }
20 | 
21 |     public String getIndex() {
22 |         return index;
23 |     }
24 | 
25 |     public void setIndex(String index) {
26 |         this.index = index;
27 |     }
28 | 
29 |     public String getType() {
30 |         return type;
31 |     }
32 | 
33 |     public void setType(String type) {
34 |         this.type = type;
35 |     }
36 | 
37 |     public String getCron() {
38 |         return cron;
39 |     }
40 | 
41 |     public void setCron(String cron) {
42 |         this.cron = cron;
43 |     }
44 | 
45 |     public String getSql() {
46 |         return sql;
47 |     }
48 | 
49 |     public void setSql(String sql) {
50 |         this.sql = sql;
51 |     }
52 | 
53 |     public long getStep() {
54 |         return step;
55 |     }
56 | 
57 |     public void setStep(long step) {
58 |         this.step = step;
59 |     }
60 | 
61 |     public String[] getParams() {
62 |         return params;
63 |     }
64 | 
65 |     public void setParams(String[] params) {
66 |         this.params = params;
67 |     }
68 | 
69 |     public int[] getParamTypes() {
70 |         return paramTypes;
71 |     }
72 | 
73 |     public void setParamTypes(int[] paramTypes) {
74 |         this.paramTypes = paramTypes;
75 |     }
76 | }
77 | 


--------------------------------------------------------------------------------
/src/main/java/cn/net/communion/sync/entity/Node.java:
--------------------------------------------------------------------------------
 1 | package cn.net.communion.sync.entity;
 2 | 
 3 | public class Node {
 4 |     private String ip = "127.0.0.1";
 5 |     private int port = 9300;
 6 | 
 7 |     public String getIp() {
 8 |         return ip;
 9 |     }
10 | 
11 |     public void setIp(String ip) {
12 |         this.ip = ip;
13 |     }
14 | 
15 |     public int getPort() {
16 |         return port;
17 |     }
18 | 
19 |     public void setPort(int port) {
20 |         this.port = port;
21 |     }
22 | }
23 | 


--------------------------------------------------------------------------------
/src/main/java/cn/net/communion/sync/helper/SysProps.java:
--------------------------------------------------------------------------------
 1 | package cn.net.communion.sync.helper;
 2 | 
 3 | import java.io.File;
 4 | import java.io.FileInputStream;
 5 | import java.io.FileNotFoundException;
 6 | import java.io.FileOutputStream;
 7 | import java.io.IOException;
 8 | import java.io.OutputStream;
 9 | import java.util.Properties;
10 | 
11 | import org.apache.log4j.Logger;
12 | 
13 | public class SysProps {
14 |     private static Logger logger = Logger.getLogger(SysProps.class);
15 |     private static String path = "sys.properties";;
16 |     private static Properties props = new Properties();
17 | 
18 | 
19 |     static {
20 |         try {
21 |             File file = new File(path);
22 |             if (!file.exists()) {
23 |                 file.createNewFile();
24 |             }
25 |             props.load(new FileInputStream(file));
26 |         } catch (FileNotFoundException e) {
27 |             e.printStackTrace();
28 |             System.exit(-1);
29 |         } catch (IOException e) {
30 |             System.exit(-1);
31 |         }
32 |     }
33 | 
34 |     public static String get(String key) {
35 |         return props.getProperty(key);
36 |     }
37 | 
38 |     public static String get(String key, String defaultValue) {
39 |         return props.getProperty(key, defaultValue);
40 |     }
41 | 
42 |     public static void update(String key, String value) {
43 |         try {
44 |             OutputStream fos = new FileOutputStream(path);
45 |             props.setProperty(key, value);
46 |             props.store(fos, "last job finish at");
47 |             fos.close();
48 |         } catch (IOException e) {
49 |             logger.info("update " + key + " failed");
50 |         }
51 |     }
52 | }
53 | 


--------------------------------------------------------------------------------
/src/main/java/cn/net/communion/sync/main/App.java:
--------------------------------------------------------------------------------
 1 | package cn.net.communion.sync.main;
 2 | 
 3 | import java.util.Optional;
 4 | import java.util.Set;
 5 | 
 6 | import org.apache.log4j.Logger;
 7 | import org.quartz.SchedulerException;
 8 | import org.springframework.context.support.ClassPathXmlApplicationContext;
 9 | 
10 | import cn.net.communion.sync.elasticsearch.Client;
11 | import cn.net.communion.sync.entity.JobInfo;
12 | import cn.net.communion.sync.quartz.JobScheduler;
13 | 
14 | public class App {
15 |     Logger logger = Logger.getLogger(App.class);
16 |     ClassPathXmlApplicationContext context;
17 | 
18 |     public App() {
19 |         this.context = new ClassPathXmlApplicationContext("/spring/root.xml");
20 |     }
21 | 
22 |     public void start() {
23 |         JobScheduler jobScheduler = JobScheduler.getInstance();
24 |         Optional<Set<JobInfo>> optional = Optional.of((Set<JobInfo>) context.getBean("jobs"));
25 |         optional.ifPresent(infos -> {
26 |             try {
27 | 
28 |                 jobScheduler.pushJobs(infos).start();
29 |             } catch (SchedulerException e) {
30 |                 Client.shutdown();
31 |                 JobScheduler.getInstance().shutdown();
32 |                 System.exit(1);
33 |             }
34 |         });
35 |     }
36 | 
37 |     public static void main(String[] args) {
38 |         new App().start();
39 |     }
40 | 
41 | }
42 | 


--------------------------------------------------------------------------------
/src/main/java/cn/net/communion/sync/quartz/JobScheduler.java:
--------------------------------------------------------------------------------
 1 | package cn.net.communion.sync.quartz;
 2 | 
 3 | import static org.quartz.CronScheduleBuilder.cronSchedule;
 4 | import static org.quartz.JobBuilder.newJob;
 5 | import static org.quartz.TriggerBuilder.newTrigger;
 6 | import static org.quartz.impl.matchers.EverythingMatcher.allJobs;
 7 | 
 8 | import java.util.Collection;
 9 | 
10 | import org.apache.log4j.Logger;
11 | import org.quartz.CronTrigger;
12 | import org.quartz.JobDetail;
13 | import org.quartz.JobExecutionContext;
14 | import org.quartz.Scheduler;
15 | import org.quartz.SchedulerException;
16 | import org.quartz.SchedulerFactory;
17 | import org.quartz.impl.StdSchedulerFactory;
18 | 
19 | import cn.net.communion.sync.entity.JobInfo;
20 | import cn.net.communion.sync.task.Task;
21 | 
22 | public class JobScheduler {
23 |     private Logger logger = Logger.getLogger(getClass());
24 |     private Scheduler scheduler;
25 |     private static JobScheduler instance = new JobScheduler();
26 | 
27 |     private JobScheduler() {
28 |         SchedulerFactory sf = new StdSchedulerFactory();
29 |         try {
30 |             scheduler = sf.getScheduler();
31 |             scheduler.getListenerManager().addJobListener(new Listener(), allJobs());
32 |         } catch (SchedulerException e) {
33 |             e.printStackTrace();
34 |         }
35 |     }
36 | 
37 |     public static JobScheduler getInstance() {
38 |         return instance;
39 |     }
40 | 
41 |     public JobScheduler pushJobs(Collection<JobInfo> infos) {
42 |         infos.forEach(info -> {
43 |             JobDetail job = newJob(Task.class).withIdentity(info.getName(), "jobs").build();
44 |             job.getJobDataMap().put("jobInfo", info);
45 |             CronTrigger trigger = newTrigger().withIdentity(info.getName(), "triggers")
46 |                     .withSchedule(cronSchedule(info.getCron())).build();
47 |             try {
48 |                 scheduler.scheduleJob(job, trigger);
49 |             } catch (SchedulerException e) {
50 |                 e.printStackTrace();
51 |             }
52 |         });
53 |         return this;
54 |     }
55 | 
56 |     public boolean isRunning(String jobKey) {
57 |         try {
58 |             for (JobExecutionContext context : scheduler.getCurrentlyExecutingJobs()) {
59 |                 // logger.info(context.getJobDetail().getKey().getName() + " is running");
60 |                 if (context.getJobDetail().getKey().getName().equals(jobKey)) {
61 |                     return true;
62 |                 }
63 |             }
64 |         } catch (SchedulerException e) {
65 |             logger.info("get jobs status failed");
66 |             e.printStackTrace();
67 |         }
68 |         return false;
69 |     }
70 | 
71 |     public void start() throws SchedulerException {
72 |         scheduler.start();
73 |     }
74 | 
75 |     public void shutdown() {
76 |         try {
77 |             scheduler.shutdown(true);
78 |         } catch (SchedulerException e) {
79 |             e.printStackTrace();
80 |         }
81 |     }
82 | }
83 | 


--------------------------------------------------------------------------------
/src/main/java/cn/net/communion/sync/quartz/Listener.java:
--------------------------------------------------------------------------------
 1 | package cn.net.communion.sync.quartz;
 2 | 
 3 | import org.quartz.JobExecutionContext;
 4 | import org.quartz.JobExecutionException;
 5 | import org.quartz.JobListener;
 6 | 
 7 | public class Listener implements JobListener {
 8 | 
 9 | 
10 |     @Override
11 |     public String getName() {
12 |         return "Job_Listener";
13 |     }
14 | 
15 |     @Override
16 |     public void jobToBeExecuted(JobExecutionContext context) {
17 |         String jobKey = context.getJobDetail().getKey().getName();
18 |         boolean isCancel = JobScheduler.getInstance().isRunning(jobKey);
19 |         context.getJobDetail().getJobDataMap().put("cancel", isCancel);
20 |     }
21 | 
22 |     @Override
23 |     public void jobExecutionVetoed(JobExecutionContext context) {
24 | 
25 |     }
26 | 
27 |     @Override
28 |     public void jobWasExecuted(JobExecutionContext context, JobExecutionException jobException) {
29 | 
30 |     }
31 | }
32 | 


--------------------------------------------------------------------------------
/src/main/java/cn/net/communion/sync/service/JdbcConnector.java:
--------------------------------------------------------------------------------
 1 | package cn.net.communion.sync.service;
 2 | 
 3 | import java.util.List;
 4 | import java.util.Map;
 5 | 
 6 | import org.apache.log4j.Logger;
 7 | import org.springframework.beans.factory.annotation.Autowired;
 8 | import org.springframework.jdbc.core.JdbcTemplate;
 9 | import org.springframework.stereotype.Component;
10 | 
11 | @Component
12 | public class JdbcConnector {
13 |     Logger logger = Logger.getLogger(JdbcConnector.class);
14 |     private static JdbcTemplate template;
15 | 
16 |     @Autowired
17 |     public JdbcConnector(JdbcTemplate jdbcTemplate) {
18 |         template = jdbcTemplate;
19 |     }
20 | 
21 |     // public void queryTest() {
22 |     // List<Map<String, Object>> list =
23 |     // jdbcTemplate.queryForList("select id,isbn from tbl_book limit 2");
24 |     // // list.stream().map((m) -> logger.info(m.toString()));
25 |     // list.forEach(m -> logger.info(m.toString()));
26 |     // }
27 | 
28 |     public static List<Map<String, Object>> query(String sql) {
29 |         return template.queryForList(sql);
30 |     }
31 | 
32 |     public static List<Map<String, Object>> query(String sql, Object[] params, int[] paramTypes) {
33 |         return template.queryForList(sql, params, paramTypes);
34 |     }
35 | }
36 | 


--------------------------------------------------------------------------------
/src/main/java/cn/net/communion/sync/task/Task.java:
--------------------------------------------------------------------------------
 1 | package cn.net.communion.sync.task;
 2 | 
 3 | import java.time.LocalDateTime;
 4 | import java.util.ArrayList;
 5 | import java.util.List;
 6 | import java.util.Map;
 7 | 
 8 | import org.apache.log4j.Logger;
 9 | import org.quartz.Job;
10 | import org.quartz.JobDataMap;
11 | import org.quartz.JobExecutionContext;
12 | import org.quartz.JobExecutionException;
13 | 
14 | import cn.net.communion.sync.elasticsearch.Client;
15 | import cn.net.communion.sync.entity.JobInfo;
16 | import cn.net.communion.sync.helper.SysProps;
17 | import cn.net.communion.sync.service.JdbcConnector;
18 | 
19 | public class Task implements Job {
20 |     Logger logger = Logger.getLogger(Task.class);
21 | 
22 |     @Override
23 |     public void execute(JobExecutionContext context) throws JobExecutionException {
24 |         JobDataMap data = context.getJobDetail().getJobDataMap();
25 |         JobInfo info = (JobInfo) data.get("jobInfo");
26 |         if (data.getBoolean("cancel")) {
27 |             logger.info(info.getName() + " new task just be canceled, this job is in running");
28 |             return;
29 |         }
30 |         String[] params = info.getParams();
31 |         int[] paramTypes = info.getParamTypes();
32 |         long sum = 0;
33 |         String time = LocalDateTime.now().toString();
34 |         while (true) {
35 |             String sql = info.getSql() + limitAddStep(sum, info.getStep());
36 |             List<Map<String, Object>> result =
37 |                     (info.getSql().indexOf("?") > 0 && params != null && paramTypes != null)
38 |                             ? JdbcConnector.query(sql, parseSysParams(params), paramTypes)
39 |                             : JdbcConnector.query(sql);
40 |             sum += result.size();
41 |             if (result.size() > 0 && Client.bulkIndex(info.getIndex(), info.getType(), result)) {
42 |                 logger.info(info.getName() + " has already sync " + sum + " records successfully");
43 |             }
44 |             if (result.size() < 10000) {
45 |                 logger.info(info.getName() + " sync end, this job total records: " + sum);
46 |                 break;
47 |             }
48 |         }
49 |         updateSysParams(info.getParams(), time);
50 |     }
51 | 
52 |     private String limitAddStep(long start, long step) {
53 |         return new StringBuilder(" limit ").append(start).append(",").append(step).toString();
54 |     }
55 | 
56 |     private Object[] parseSysParams(String[] params) {
57 |         List<Object> list = new ArrayList<Object>();
58 |         for (int index = 0; index < params.length; index++) {
59 |             list.add(SysProps.get(params[index], ""));
60 |         }
61 |         return list.toArray();
62 |     }
63 | 
64 |     private void updateSysParams(String[] params, String value) {
65 |         for (int index = 0; index < params.length; index++) {
66 |             SysProps.update(params[index], value);
67 |         }
68 |     }
69 | }
70 | 


--------------------------------------------------------------------------------
/src/main/java/log4j.properties:
--------------------------------------------------------------------------------
 1 | #定义3个输出端
 2 | log4j.rootCategory=info,A1
 3 | #log4j.rootCategory=info,A1,A2
 4 | 
 5 | #定义A1输出到控制器
 6 | log4j.appender.A1=org.apache.log4j.ConsoleAppender
 7 | #定义A1的布局模式为PaternLayout
 8 | log4j.appender.A1.layout=org.apache.log4j.PatternLayout
 9 | # 定义A1的输出格式
10 | log4j.appender.A1.layout.ConversionPattern=%4p [%t] (%F:%L) - %m%n
11 | 
12 | #定义A2输出到文件
13 | #log4j.appender.A2=org.apache.log4j.RollingFileAppender
14 | #定义A2输出到哪个文件
15 | #log4j.appender.A2.File=./databaseSync.log
16 | #定义A2输出文件的最大长度
17 | #log4j.appender.A2.MaxFileSize = 10MB
18 | #定义A2的备份文件数
19 | #log4j.appender.A2.MaxBackupIndex = 10
20 | #定义A2的布局模式为PatternLayout
21 | #log4j.appender.A2.layout=org.apache.log4j.PatternLayout
22 | #定义A2的输出模式
23 | #log4j.appender.A2.layout.ConversionPattern=%d{yyyy-MM-dd hh:mm:ss}:%p %t %c - %m%n
24 | appender.console.type = Console
25 | appender.console.name = console
26 | appender.console.layout.type = PatternLayout
27 | 
28 | rootLogger.level = info
29 | rootLogger.appenderRef.console.ref = console
30 | 


--------------------------------------------------------------------------------
/src/main/java/spring/root.xml:
--------------------------------------------------------------------------------
 1 | <?xml version="1.0" encoding="UTF-8"?>
 2 | <beans xmlns="http://www.springframework.org/schema/beans"
 3 | 	xmlns:xsi="http://www.w3.org/2001/XMLSchema-instance"
 4 | 	xmlns:context="http://www.springframework.org/schema/context"
 5 | 	xmlns:p="http://www.springframework.org/schema/p"
 6 | 	xsi:schemaLocation="http://www.springframework.org/schema/beans http://www.springframework.org/schema/beans/spring-beans.xsd
 7 |         http://www.springframework.org/schema/context http://www.springframework.org/schema/context/spring-context.xsd">
 8 | 	<context:component-scan base-package="cn.net.communion.sync"/> 
 9 |     <!-- 将多个配置文件读取到容器中，交给Spring管理 -->  
10 |     <context:property-placeholder location="classpath:/spring/props/*.properties"/>
11 |     <import resource="/xml/*.xml" />
12 | </beans>


--------------------------------------------------------------------------------
/src/main/java/spring/xml/client.xml:
--------------------------------------------------------------------------------
 1 | <?xml version="1.0" encoding="UTF-8"?>
 2 | <beans xmlns="http://www.springframework.org/schema/beans"
 3 | xmlns:xsi="http://www.w3.org/2001/XMLSchema-instance"
 4 | xmlns:p="http://www.springframework.org/schema/p"
 5 | xsi:schemaLocation="http://www.springframework.org/schema/beans
 6 | http://www.springframework.org/schema/beans/spring-beans.xsd">
 7 |     <bean class="cn.net.communion.sync.elasticsearch.Client">
 8 |     	<constructor-arg value="my-application"/><!-- cluster.name -->
 9 |     	<constructor-arg ref="nodes"/>
10 |     </bean>
11 | </beans>


--------------------------------------------------------------------------------
/src/main/java/spring/xml/db.xml:
--------------------------------------------------------------------------------
 1 | <?xml version="1.0" encoding="UTF-8"?>
 2 | <beans xmlns="http://www.springframework.org/schema/beans"
 3 | 	xmlns:xsi="http://www.w3.org/2001/XMLSchema-instance"
 4 | 	xmlns:jdbc="http://www.springframework.org/schema/jdbc" 
 5 | 	xsi:schemaLocation="http://www.springframework.org/schema/beans http://www.springframework.org/schema/beans/spring-beans.xsd">
 6 | 	<bean id="dataSource" class="com.alibaba.druid.pool.DruidDataSource"
 7 | 		init-method="init" destroy-method="close">
 8 | 		<!-- 基本属性 url、user、password -->
 9 | 		<property name="url" value="jdbc:mysql://localhost:3306/hainan_demo?useUnicode=true&amp;characterEncoding=UTF-8" />
10 | 		<property name="username" value="root" />
11 | 		<property name="password" value="123456" />
12 | 		<!-- 配置初始化大小、最小、最大 -->
13 | 		<property name="initialSize" value="1" />
14 | 		<property name="minIdle" value="1" />
15 | 		<property name="maxActive" value="20" />
16 | 		<!-- 配置获取连接等待超时的时间 -->
17 | 		<property name="maxWait" value="60000" />
18 | 		<!-- 配置间隔多久才进行一次检测，检测需要关闭的空闲连接，单位是毫秒 -->
19 | 		<property name="timeBetweenEvictionRunsMillis" value="60000" />
20 | 		<!-- 配置一个连接在池中最小生存的时间，单位是毫秒 -->
21 | 		<property name="minEvictableIdleTimeMillis" value="300000" />
22 | 		<property name="validationQuery" value="SELECT 'x'" />
23 | 		<property name="testWhileIdle" value="true" />
24 | 		<property name="testOnBorrow" value="false" />
25 | 		<property name="testOnReturn" value="false" />
26 | 		<!-- 打开PSCache，并且指定每个连接上PSCache的大小 -->
27 | 		<property name="poolPreparedStatements" value="true" />
28 | 		<property name="maxPoolPreparedStatementPerConnectionSize"
29 | 			value="20" />
30 | 		<!-- 配置监控统计拦截的filters -->
31 | 		<property name="filters" value="stat" />
32 | 	</bean>
33 | 	<bean id="jdbcTemplate" class="org.springframework.jdbc.core.JdbcTemplate">
34 | 		<property name="dataSource" ref="dataSource"/>
35 | 	</bean>
36 | </beans>


--------------------------------------------------------------------------------
/src/main/java/spring/xml/jobs.xml:
--------------------------------------------------------------------------------
 1 | <?xml version="1.0" encoding="UTF-8"?>
 2 | <beans xmlns="http://www.springframework.org/schema/beans"
 3 | xmlns:xsi="http://www.w3.org/2001/XMLSchema-instance"
 4 | xmlns:p="http://www.springframework.org/schema/p"
 5 | xmlns:util="http://www.springframework.org/schema/util"
 6 | xsi:schemaLocation="http://www.springframework.org/schema/beans http://www.springframework.org/schema/beans/spring-beans.xsd
 7 | 	http://www.springframework.org/schema/util http://www.springframework.org/schema/util/spring-util.xsd">
 8 | 	<!-- DATE:91,VARCHAR:12,INTEGER:4,SMALLINT:5,BIGINT:-5,TINYINT:-6,TIMESTAMP:93-->
 9 | 	<!-- 尽量保证每个数据表有个时间字段，用于增量同步，提高同步效率，每个job的params最好不要相同, step用于设置每次同步的数量，默认为1000条-->
10 | 	<!-- 同步的字段必须包括id -->
11 | 	<util:set id="jobs">
12 | 		<bean class="cn.net.communion.sync.entity.JobInfo"
13 | 			p:name="job1" 
14 | 			p:index="data" 
15 | 			p:type="book" 
16 | 			p:cron="0/10 * * * * ?" 
17 | 			p:sql="select id,author,title,publisher,words,summary,img,rating from tbl_book where updateTime > ?"
18 | 			p:step="50000" 
19 | 			p:params="sys.lastTime1"
20 | 			p:paramTypes="12"/>	
21 | 		<bean class="cn.net.communion.sync.entity.JobInfo"
22 | 			p:name="job2" 
23 | 			p:index="data" 
24 | 			p:type="comment" 
25 | 			p:cron="0/10 * * * * ?" 
26 | 			p:sql="select id,comment from tbl_comment where time > ?" 
27 | 			p:params="sys.lastTime2"
28 | 			p:paramTypes="12"/>
29 | 	</util:set>
30 | </beans>


--------------------------------------------------------------------------------
/src/main/java/spring/xml/nodes.xml:
--------------------------------------------------------------------------------
 1 | <?xml version="1.0" encoding="UTF-8"?>
 2 | <beans xmlns="http://www.springframework.org/schema/beans"
 3 | xmlns:xsi="http://www.w3.org/2001/XMLSchema-instance"
 4 | xmlns:p="http://www.springframework.org/schema/p"
 5 | xmlns:util="http://www.springframework.org/schema/util"
 6 | xsi:schemaLocation="http://www.springframework.org/schema/beans http://www.springframework.org/schema/beans/spring-beans.xsd
 7 | 	http://www.springframework.org/schema/util http://www.springframework.org/schema/util/spring-util.xsd">
 8 | 	<util:set id="nodes">
 9 | 		<bean class="cn.net.communion.sync.entity.Node" 
10 | 			p:ip="127.0.0.1" 
11 | 			p:port="9300"/>		
12 | 	</util:set>
13 | </beans>


--------------------------------------------------------------------------------
/src/test/java/cn/net/communion/sync/AppTest.java:
--------------------------------------------------------------------------------
 1 | package cn.net.communion.sync;
 2 | 
 3 | import junit.framework.Test;
 4 | import junit.framework.TestCase;
 5 | import junit.framework.TestSuite;
 6 | 
 7 | /**
 8 |  * Unit test for simple App.
 9 |  */
10 | public class AppTest 
11 |     extends TestCase
12 | {
13 |     /**
14 |      * Create the test case
15 |      *
16 |      * @param testName name of the test case
17 |      */
18 |     public AppTest( String testName )
19 |     {
20 |         super( testName );
21 |     }
22 | 
23 |     /**
24 |      * @return the suite of tests being tested
25 |      */
26 |     public static Test suite()
27 |     {
28 |         return new TestSuite( AppTest.class );
29 |     }
30 | 
31 |     /**
32 |      * Rigourous Test :-)
33 |      */
34 |     public void testApp()
35 |     {
36 |         assertTrue( true );
37 |     }
38 | }
39 | 


--------------------------------------------------------------------------------