{"id":40313,"date":"2022-11-10T13:55:26","date_gmt":"2023-07-06T13:47:05","guid":{"rendered":"https:\/\/www.silicloud.com\/zh\/blog\/%e4%bd%bf%e7%94%a8spring-boot%e5%92%8cspring-integration%e7%9a%84%e7%bd%91%e7%bb%9c%e7%88%ac%e8%99%ab\/"},"modified":"2024-01-15T10:34:10","modified_gmt":"2024-01-15T02:34:10","slug":"%e4%bd%bf%e7%94%a8spring-boot%e5%92%8cspring-integration%e7%9a%84%e7%bd%91%e7%bb%9c%e7%88%ac%e8%99%ab","status":"publish","type":"post","link":"https:\/\/www.silicloud.com\/zh\/blog\/%e4%bd%bf%e7%94%a8spring-boot%e5%92%8cspring-integration%e7%9a%84%e7%bd%91%e7%bb%9c%e7%88%ac%e8%99%ab\/","title":{"rendered":"\u4f7f\u7528Spring Boot\u548cSpring Integration\u7684\u7f51\u7edc\u722c\u866b"},"content":{"rendered":"<p>\u6211\u4eec\u5c06\u4f7f\u7528Spring Boot\u548cSpring Integration\u6765\u521b\u5efa\u4e00\u4e2a\u7b80\u5355\u7684\u722c\u866b\uff0c\u4e0d\u9700\u8981\u4f7f\u7528XML\uff0c\u53ea\u4f7f\u7528Java Config\u3002<\/p>\n<h2>\u524d\u63d0\u6761\u4ef6 (Prerequisites)<\/h2>\n<p>\u8bf7\u4e8b\u5148\u5b89\u88c5\u4ee5\u4e0b\u8f6f\u4ef6\u3002<\/p>\n<ul class=\"post-ul\">\n<li>JDK 6 or later<\/li>\n<li>Maven 3.0 or later<\/li>\n<\/ul>\n<h2>\u7b80\u800c\u8a00\u4e4b<\/h2>\n<p>\u6240\u5f00\u53d1\u7684\u7f51\u7edc\u722c\u866b\u4f1a\u901a\u8fc7\u6293\u53d6\u7ef4\u57fa\u767e\u79d1\u7684\u8f6c\u50a8\u5217\u8868\u6765\u83b7\u53d6\u4ee5\u4e0b\u7684\u4fe1\u606f\u3002<\/p>\n<div>\n<div class=\"post-table\">\n<table>\n<thead>\n<tr><th>timestamp<\/th><th>id<\/th><th>ref<\/th><th>status<\/th><\/tr>\n<\/thead>\n<tbody>\n<tr><td>2014-05-31 01:57:31<\/td><td>nowiki<\/td><td>nowiki\/20140530<\/td><td>Dump in progress<\/td><\/tr>\n<tr><td>2014-05-31 01:57:32<\/td><td>trwiki<\/td><td>trwiki\/20140530<\/td><td>Dump in progress<\/td><\/tr>\n<tr><td>2014-05-30 14:38:08<\/td><td>anwiki<\/td><td>anwiki\/20140530<\/td><td>Dump complete<\/td><\/tr>\n<tr><td>2014-05-30 14:30:29<\/td><td>viwiktionary<\/td><td>viwiktionary\/20140530<\/td><td>Dump complete<\/td><\/tr>\n<tr><td>2014-05-30 13:02:57<\/td><td>ckbwiki<\/td><td>ckbwiki\/20140530<\/td><td>Dump complete<\/td><\/tr>\n<tr><td>&#8230;<\/td><td>&#8230;<\/td><td>&#8230;<\/td><td>&#8230;<\/td><\/tr>\n<\/tbody>\n<\/table>\n<\/div>\n<\/div>\n<h2>pom.xml =&gt; \u9879\u76ee\u5bf9\u8c61\u6a21\u578b\u6587\u4ef6 (Project Object Model \u6587\u4ef6)<\/h2>\n<pre 
class=\"post-pre\"><code>    <span class=\"nt\">&lt;parent&gt;<\/span>\r\n        <span class=\"nt\">&lt;groupId&gt;<\/span>org.springframework.boot<span class=\"nt\">&lt;\/groupId&gt;<\/span>\r\n        <span class=\"nt\">&lt;artifactId&gt;<\/span>spring-boot-starter-parent<span class=\"nt\">&lt;\/artifactId&gt;<\/span>\r\n        <span class=\"nt\">&lt;version&gt;<\/span>1.1.0.M2<span class=\"nt\">&lt;\/version&gt;<\/span>\r\n        <span class=\"nt\">&lt;relativePath\/&gt;<\/span>\r\n    <span class=\"nt\">&lt;\/parent&gt;<\/span>\r\n\r\n    <span class=\"nt\">&lt;dependencies&gt;<\/span>\r\n        <span class=\"nt\">&lt;dependency&gt;<\/span>\r\n            <span class=\"nt\">&lt;groupId&gt;<\/span>org.springframework.boot<span class=\"nt\">&lt;\/groupId&gt;<\/span>\r\n            <span class=\"nt\">&lt;artifactId&gt;<\/span>spring-boot-starter-integration<span class=\"nt\">&lt;\/artifactId&gt;<\/span>\r\n        <span class=\"nt\">&lt;\/dependency&gt;<\/span>\r\n        <span class=\"nt\">&lt;dependency&gt;<\/span>\r\n            <span class=\"nt\">&lt;groupId&gt;<\/span>org.jsoup<span class=\"nt\">&lt;\/groupId&gt;<\/span>\r\n            <span class=\"nt\">&lt;artifactId&gt;<\/span>jsoup<span class=\"nt\">&lt;\/artifactId&gt;<\/span>\r\n            <span class=\"nt\">&lt;version&gt;<\/span>1.7.3<span class=\"nt\">&lt;\/version&gt;<\/span>\r\n        <span class=\"nt\">&lt;\/dependency&gt;<\/span>\r\n    <span class=\"nt\">&lt;\/dependencies&gt;<\/span>\r\n\r\n    <span class=\"nt\">&lt;repositories&gt;<\/span>\r\n        <span class=\"nt\">&lt;repository&gt;<\/span>\r\n            <span class=\"nt\">&lt;id&gt;<\/span>spring-milestones<span class=\"nt\">&lt;\/id&gt;<\/span>\r\n            <span class=\"nt\">&lt;url&gt;<\/span>http:\/\/repo.spring.io\/milestone\/<span class=\"nt\">&lt;\/url&gt;<\/span>\r\n        <span class=\"nt\">&lt;\/repository&gt;<\/span>\r\n    <span 
class=\"nt\">&lt;\/repositories&gt;<\/span>\r\n<\/code><\/pre>\n<p>\u56e0\u4e3a\u5728\u8fdb\u884c\u7f51\u9875\u6293\u53d6\u65f6\u4f7f\u7528\u4e86jsoup\uff0c\u6240\u4ee5\u5c06\u5176\u6574\u5408\u5230pom.xml\u4e2d\u3002<\/p>\n<h2>\u4e0b\u8f7d\u5668<\/h2>\n<p>\u4e0b\u8f7d\u5668\u4f1a\u5b9a\u671f\u4ece\u6307\u5b9a\u7684URL\u4e0b\u8f7dHTML\u3002<\/p>\n<pre class=\"post-pre\"><code><span class=\"nd\">@MessageEndpoint<\/span>\r\n<span class=\"kd\">public<\/span> <span class=\"kd\">class<\/span> <span class=\"nc\">Downloader<\/span> <span class=\"o\">{<\/span>\r\n    <span class=\"nd\">@Autowired<\/span>\r\n    <span class=\"kd\">private<\/span> <span class=\"nc\">CrawlerConfig<\/span> <span class=\"n\">config<\/span><span class=\"o\">;<\/span>\r\n\r\n    <span class=\"nd\">@Autowired<\/span>\r\n    <span class=\"kd\">private<\/span> <span class=\"nc\">RestTemplate<\/span> <span class=\"n\">template<\/span><span class=\"o\">;<\/span>\r\n\r\n    <span class=\"nd\">@InboundChannelAdapter<\/span><span class=\"o\">(<\/span><span class=\"n\">value<\/span> <span class=\"o\">=<\/span> <span class=\"s\">\"channel1\"<\/span><span class=\"o\">,<\/span> <span class=\"n\">poller<\/span> <span class=\"o\">=<\/span> <span class=\"nd\">@Poller<\/span><span class=\"o\">(<\/span><span class=\"s\">\"downloadTrigger\"<\/span><span class=\"o\">))<\/span>\r\n    <span class=\"kd\">public<\/span> <span class=\"nc\">ResponseEntity<\/span><span class=\"o\">&lt;<\/span><span class=\"nc\">String<\/span><span class=\"o\">&gt;<\/span> <span class=\"nf\">download<\/span><span class=\"o\">()<\/span> <span class=\"o\">{<\/span>\r\n        <span class=\"nc\">String<\/span> <span class=\"n\">url<\/span> <span class=\"o\">=<\/span> <span class=\"n\">config<\/span><span class=\"o\">.<\/span><span class=\"na\">getUrl<\/span><span class=\"o\">();<\/span>\r\n        <span class=\"nc\">ResponseEntity<\/span><span class=\"o\">&lt;<\/span><span class=\"nc\">String<\/span><span class=\"o\">&gt;<\/span> <span 
class=\"n\">entity<\/span> <span class=\"o\">=<\/span> <span class=\"n\">template<\/span><span class=\"o\">.<\/span><span class=\"na\">getForEntity<\/span><span class=\"o\">(<\/span><span class=\"n\">url<\/span><span class=\"o\">,<\/span> <span class=\"nc\">String<\/span><span class=\"o\">.<\/span><span class=\"na\">class<\/span><span class=\"o\">);<\/span>\r\n        <span class=\"k\">return<\/span> <span class=\"n\">entity<\/span><span class=\"o\">;<\/span>\r\n    <span class=\"o\">}<\/span>\r\n<span class=\"o\">}<\/span>\r\n<\/code><\/pre>\n<p>\u4e0b\u8f7d\u7684HTML\u4ee5ResponseEntity\u7c7b\u7684\u5b9e\u4f8b\u5f62\u5f0f\u53d1\u9001\u7ed9channel1\u3002<br \/>\n\u4e0b\u8f7d\u9891\u7387\u7531\u5916\u90e8\u7684downloadTrigger bean\u5b9a\u4e49\u3002<\/p>\n<h2>\u6293\u53d6\u5668 (Scraper)<\/h2>\n<p>Scraper \u4eceHTML\u4e2d\u63d0\u53d6\u6240\u9700\u90e8\u5206\u3002<\/p>\n<pre class=\"post-pre\"><code><span class=\"nd\">@MessageEndpoint<\/span>\r\n<span class=\"kd\">public<\/span> <span class=\"kd\">class<\/span> <span class=\"nc\">Scraper<\/span> <span class=\"o\">{<\/span>\r\n    <span class=\"kd\">private<\/span> <span class=\"kd\">final<\/span> <span class=\"nc\">Pattern<\/span> <span class=\"n\">patter<\/span> <span class=\"o\">=<\/span> <span class=\"nc\">Pattern<\/span><span class=\"o\">.<\/span><span class=\"na\">compile<\/span><span class=\"o\">(<\/span><span class=\"s\">\"^&lt;li&gt;\\\\d{4}-\\\\d{2}-\\\\d{2} \\\\d{2}:\\\\d{2}:\\\\d{2} \\\\S+\"<\/span><span class=\"o\">);<\/span>\r\n\r\n    <span class=\"nd\">@Splitter<\/span><span class=\"o\">(<\/span><span class=\"n\">inputChannel<\/span> <span class=\"o\">=<\/span> <span class=\"s\">\"channel1\"<\/span><span class=\"o\">,<\/span> <span class=\"n\">outputChannel<\/span> <span class=\"o\">=<\/span> <span class=\"s\">\"channel2\"<\/span><span class=\"o\">)<\/span>\r\n    <span class=\"kd\">public<\/span> <span class=\"nc\">List<\/span><span class=\"o\">&lt;<\/span><span class=\"nc\">Element<\/span><span 
class=\"o\">&gt;<\/span> <span class=\"nf\">scrape<\/span><span class=\"o\">(<\/span><span class=\"nc\">ResponseEntity<\/span><span class=\"o\">&lt;<\/span><span class=\"nc\">String<\/span><span class=\"o\">&gt;<\/span> <span class=\"n\">payload<\/span><span class=\"o\">)<\/span> <span class=\"o\">{<\/span>\r\n        <span class=\"nc\">String<\/span> <span class=\"n\">html<\/span> <span class=\"o\">=<\/span> <span class=\"n\">payload<\/span><span class=\"o\">.<\/span><span class=\"na\">getBody<\/span><span class=\"o\">();<\/span>\r\n        <span class=\"kd\">final<\/span> <span class=\"nc\">Document<\/span> <span class=\"n\">htmlDoc<\/span> <span class=\"o\">=<\/span> <span class=\"nc\">Jsoup<\/span><span class=\"o\">.<\/span><span class=\"na\">parse<\/span><span class=\"o\">(<\/span><span class=\"n\">html<\/span><span class=\"o\">);<\/span>\r\n        <span class=\"kd\">final<\/span> <span class=\"nc\">Elements<\/span> <span class=\"n\">anchorNodes<\/span> <span class=\"o\">=<\/span> <span class=\"n\">htmlDoc<\/span><span class=\"o\">.<\/span><span class=\"na\">select<\/span><span class=\"o\">(<\/span><span class=\"s\">\"body\"<\/span><span class=\"o\">).<\/span><span class=\"na\">select<\/span><span class=\"o\">(<\/span><span class=\"s\">\"ul\"<\/span><span class=\"o\">).<\/span><span class=\"na\">select<\/span><span class=\"o\">(<\/span><span class=\"s\">\"li\"<\/span><span class=\"o\">);<\/span>\r\n\r\n        <span class=\"kd\">final<\/span> <span class=\"nc\">List<\/span><span class=\"o\">&lt;<\/span><span class=\"nc\">Element<\/span><span class=\"o\">&gt;<\/span> <span class=\"n\">anchorList<\/span> <span class=\"o\">=<\/span> <span class=\"k\">new<\/span> <span class=\"nc\">ArrayList<\/span><span class=\"o\">&lt;<\/span><span class=\"nc\">Element<\/span><span class=\"o\">&gt;();<\/span>\r\n        <span class=\"n\">anchorNodes<\/span><span class=\"o\">.<\/span><span class=\"na\">traverse<\/span><span class=\"o\">(<\/span><span class=\"k\">new<\/span> 
<span class=\"nc\">NodeVisitor<\/span><span class=\"o\">()<\/span> <span class=\"o\">{<\/span>\r\n            <span class=\"nd\">@Override<\/span>\r\n            <span class=\"kd\">public<\/span> <span class=\"kt\">void<\/span> <span class=\"nf\">head<\/span><span class=\"o\">(<\/span><span class=\"n\">org<\/span><span class=\"o\">.<\/span><span class=\"na\">jsoup<\/span><span class=\"o\">.<\/span><span class=\"na\">nodes<\/span><span class=\"o\">.<\/span><span class=\"na\">Node<\/span> <span class=\"n\">node<\/span><span class=\"o\">,<\/span> <span class=\"kt\">int<\/span> <span class=\"n\">depth<\/span><span class=\"o\">)<\/span> <span class=\"o\">{<\/span>\r\n                <span class=\"k\">if<\/span> <span class=\"o\">(<\/span><span class=\"n\">node<\/span> <span class=\"k\">instanceof<\/span> <span class=\"n\">org<\/span><span class=\"o\">.<\/span><span class=\"na\">jsoup<\/span><span class=\"o\">.<\/span><span class=\"na\">nodes<\/span><span class=\"o\">.<\/span><span class=\"na\">Element<\/span><span class=\"o\">)<\/span> <span class=\"o\">{<\/span>\r\n                    <span class=\"nc\">Element<\/span> <span class=\"n\">e<\/span> <span class=\"o\">=<\/span> <span class=\"o\">(<\/span><span class=\"nc\">Element<\/span><span class=\"o\">)<\/span><span class=\"n\">node<\/span><span class=\"o\">;<\/span>\r\n                    <span class=\"n\">anchorList<\/span><span class=\"o\">.<\/span><span class=\"na\">add<\/span><span class=\"o\">(<\/span><span class=\"n\">e<\/span><span class=\"o\">);<\/span>\r\n                <span class=\"o\">}<\/span>\r\n            <span class=\"o\">}<\/span>\r\n\r\n            <span class=\"nd\">@Override<\/span>\r\n            <span class=\"kd\">public<\/span> <span class=\"kt\">void<\/span> <span class=\"nf\">tail<\/span><span class=\"o\">(<\/span><span class=\"nc\">Node<\/span> <span class=\"n\">node<\/span><span class=\"o\">,<\/span> <span class=\"kt\">int<\/span> <span class=\"n\">depth<\/span><span class=\"o\">)<\/span> 
<span class=\"o\">{<\/span>\r\n            <span class=\"o\">}<\/span>\r\n        <span class=\"o\">});<\/span>\r\n\r\n        <span class=\"k\">return<\/span> <span class=\"n\">anchorList<\/span><span class=\"o\">;<\/span>\r\n    <span class=\"o\">}<\/span>\r\n\r\n    <span class=\"nd\">@Filter<\/span><span class=\"o\">(<\/span><span class=\"n\">inputChannel<\/span> <span class=\"o\">=<\/span> <span class=\"s\">\"channel2\"<\/span><span class=\"o\">,<\/span> <span class=\"n\">outputChannel<\/span> <span class=\"o\">=<\/span> <span class=\"s\">\"channel3\"<\/span><span class=\"o\">)<\/span>\r\n    <span class=\"kd\">public<\/span> <span class=\"kt\">boolean<\/span> <span class=\"nf\">filter<\/span><span class=\"o\">(<\/span><span class=\"nc\">Element<\/span> <span class=\"n\">payload<\/span><span class=\"o\">)<\/span> <span class=\"o\">{<\/span>\r\n        <span class=\"nc\">Matcher<\/span> <span class=\"n\">m<\/span> <span class=\"o\">=<\/span> <span class=\"n\">patter<\/span><span class=\"o\">.<\/span><span class=\"na\">matcher<\/span><span class=\"o\">(<\/span><span class=\"n\">payload<\/span><span class=\"o\">.<\/span><span class=\"na\">toString<\/span><span class=\"o\">());<\/span>\r\n        <span class=\"k\">return<\/span> <span class=\"n\">m<\/span><span class=\"o\">.<\/span><span class=\"na\">find<\/span><span class=\"o\">();<\/span>\r\n    <span class=\"o\">}<\/span>\r\n\r\n    <span class=\"nd\">@Transformer<\/span><span class=\"o\">(<\/span><span class=\"n\">inputChannel<\/span> <span class=\"o\">=<\/span> <span class=\"s\">\"channel3\"<\/span><span class=\"o\">,<\/span> <span class=\"n\">outputChannel<\/span> <span class=\"o\">=<\/span> <span class=\"s\">\"channel4\"<\/span><span class=\"o\">)<\/span>\r\n    <span class=\"kd\">public<\/span> <span class=\"nc\">DumpEntry<\/span> <span class=\"nf\">convert<\/span><span class=\"o\">(<\/span><span class=\"nc\">Element<\/span> <span class=\"n\">payload<\/span><span class=\"o\">)<\/span> <span 
class=\"kd\">throws<\/span> <span class=\"nc\">ParseException<\/span> <span class=\"o\">{<\/span>\r\n        <span class=\"nc\">String<\/span> <span class=\"n\">dateStr<\/span> <span class=\"o\">=<\/span> <span class=\"n\">payload<\/span><span class=\"o\">.<\/span><span class=\"na\">ownText<\/span><span class=\"o\">().<\/span><span class=\"na\">substring<\/span><span class=\"o\">(<\/span><span class=\"mi\">0<\/span><span class=\"o\">,<\/span> <span class=\"mi\">19<\/span><span class=\"o\">);<\/span>\r\n\r\n        <span class=\"nc\">DateFormat<\/span> <span class=\"n\">format<\/span> <span class=\"o\">=<\/span> <span class=\"k\">new<\/span> <span class=\"nc\">SimpleDateFormat<\/span><span class=\"o\">(<\/span><span class=\"s\">\"yyyy-MM-dd hh:mm:ss\"<\/span><span class=\"o\">);<\/span>\r\n        <span class=\"n\">format<\/span><span class=\"o\">.<\/span><span class=\"na\">setTimeZone<\/span><span class=\"o\">(<\/span><span class=\"nc\">TimeZone<\/span><span class=\"o\">.<\/span><span class=\"na\">getTimeZone<\/span><span class=\"o\">(<\/span><span class=\"s\">\"GMT\"<\/span><span class=\"o\">));<\/span>\r\n\r\n        <span class=\"nc\">Date<\/span> <span class=\"n\">timestamp<\/span> <span class=\"o\">=<\/span> <span class=\"n\">format<\/span><span class=\"o\">.<\/span><span class=\"na\">parse<\/span><span class=\"o\">(<\/span><span class=\"n\">dateStr<\/span><span class=\"o\">);<\/span>\r\n\r\n        <span class=\"nc\">Elements<\/span> <span class=\"n\">list<\/span> <span class=\"o\">=<\/span> <span class=\"n\">payload<\/span><span class=\"o\">.<\/span><span class=\"na\">select<\/span><span class=\"o\">(<\/span><span class=\"s\">\"a\"<\/span><span class=\"o\">);<\/span>\r\n        <span class=\"nc\">String<\/span> <span class=\"n\">id<\/span><span class=\"o\">;<\/span>\r\n        <span class=\"nc\">String<\/span> <span class=\"n\">ref<\/span><span class=\"o\">;<\/span>\r\n        <span class=\"k\">if<\/span> <span class=\"o\">(<\/span><span 
class=\"n\">list<\/span><span class=\"o\">.<\/span><span class=\"na\">size<\/span><span class=\"o\">()<\/span> <span class=\"o\">&gt;<\/span> <span class=\"mi\">0<\/span><span class=\"o\">)<\/span> <span class=\"o\">{<\/span>\r\n            <span class=\"nc\">Element<\/span> <span class=\"n\">a<\/span> <span class=\"o\">=<\/span> <span class=\"n\">list<\/span><span class=\"o\">.<\/span><span class=\"na\">get<\/span><span class=\"o\">(<\/span><span class=\"mi\">0<\/span><span class=\"o\">);<\/span>\r\n            <span class=\"n\">id<\/span> <span class=\"o\">=<\/span> <span class=\"n\">a<\/span><span class=\"o\">.<\/span><span class=\"na\">ownText<\/span><span class=\"o\">();<\/span>\r\n            <span class=\"n\">ref<\/span> <span class=\"o\">=<\/span> <span class=\"n\">a<\/span><span class=\"o\">.<\/span><span class=\"na\">attr<\/span><span class=\"o\">(<\/span><span class=\"s\">\"href\"<\/span><span class=\"o\">);<\/span>\r\n        <span class=\"o\">}<\/span> <span class=\"k\">else<\/span> <span class=\"o\">{<\/span>\r\n            <span class=\"n\">id<\/span> <span class=\"o\">=<\/span> <span class=\"s\">\"private data\"<\/span><span class=\"o\">;<\/span>\r\n            <span class=\"n\">ref<\/span> <span class=\"o\">=<\/span> <span class=\"kc\">null<\/span><span class=\"o\">;<\/span>\r\n        <span class=\"o\">}<\/span>\r\n\r\n        <span class=\"nc\">Element<\/span> <span class=\"n\">span<\/span> <span class=\"o\">=<\/span> <span class=\"n\">payload<\/span><span class=\"o\">.<\/span><span class=\"na\">select<\/span><span class=\"o\">(<\/span><span class=\"s\">\"span\"<\/span><span class=\"o\">).<\/span><span class=\"na\">get<\/span><span class=\"o\">(<\/span><span class=\"mi\">0<\/span><span class=\"o\">);<\/span>\r\n        <span class=\"nc\">String<\/span> <span class=\"n\">status<\/span> <span class=\"o\">=<\/span> <span class=\"n\">span<\/span><span class=\"o\">.<\/span><span class=\"na\">ownText<\/span><span class=\"o\">();<\/span>\r\n\r\n        
<span class=\"k\">return<\/span> <span class=\"k\">new<\/span> <span class=\"nf\">DumpEntry<\/span><span class=\"o\">(<\/span><span class=\"n\">timestamp<\/span><span class=\"o\">,<\/span> <span class=\"n\">id<\/span><span class=\"o\">,<\/span> <span class=\"n\">ref<\/span><span class=\"o\">,<\/span> <span class=\"n\">status<\/span><span class=\"o\">);<\/span>\r\n    <span class=\"o\">}<\/span>\r\n<span class=\"o\">}<\/span>\r\n<\/code><\/pre>\n<p>\u4ecechannel1\u63a5\u6536\u5230\u7684HTML\u4e2d\u63d0\u53d6\u51fabody\/ul\/li\u5143\u7d20\uff0c\u5e76\u7b5b\u9009\u51fa\u6240\u9700\u7684li\u5143\u7d20\uff0c\u5c06li\u5143\u7d20\u8f6c\u6362\u4e3aDumpEntry\u5e76\u53d1\u9001\u5230channel4\u4e2d\u3002<\/p>\n<h2>DumpEntry \u2192 \u6570\u636e\u9879<\/h2>\n<p>DumpEntry\u662f\u6307\u4ee3\u76ee\u6807\u90e8\u5206\u7684\u5b9e\u4f53\u3002<\/p>\n<pre class=\"post-pre\"><code><span class=\"kd\">public<\/span> <span class=\"kd\">class<\/span> <span class=\"nc\">DumpEntry<\/span> <span class=\"kd\">implements<\/span> <span class=\"nc\">Serializable<\/span> <span class=\"o\">{<\/span>\r\n    <span class=\"kd\">private<\/span> <span class=\"nc\">Date<\/span> <span class=\"n\">timestamp<\/span><span class=\"o\">;<\/span>\r\n    <span class=\"kd\">private<\/span> <span class=\"nc\">String<\/span> <span class=\"n\">id<\/span><span class=\"o\">;<\/span>\r\n    <span class=\"kd\">private<\/span> <span class=\"nc\">String<\/span> <span class=\"n\">ref<\/span><span class=\"o\">;<\/span>\r\n    <span class=\"kd\">private<\/span> <span class=\"nc\">String<\/span> <span class=\"n\">status<\/span><span class=\"o\">;<\/span>\r\n\r\n    <span class=\"kd\">public<\/span> <span class=\"nf\">DumpEntry<\/span><span class=\"o\">(<\/span><span class=\"nc\">Date<\/span> <span class=\"n\">timestamp<\/span><span class=\"o\">,<\/span> <span class=\"nc\">String<\/span> <span class=\"n\">id<\/span><span class=\"o\">,<\/span> <span class=\"nc\">String<\/span> <span class=\"n\">ref<\/span><span 
class=\"o\">,<\/span> <span class=\"nc\">String<\/span> <span class=\"n\">status<\/span><span class=\"o\">)<\/span> <span class=\"o\">{<\/span>\r\n        <span class=\"k\">this<\/span><span class=\"o\">.<\/span><span class=\"na\">timestamp<\/span> <span class=\"o\">=<\/span> <span class=\"n\">timestamp<\/span><span class=\"o\">;<\/span>\r\n        <span class=\"k\">this<\/span><span class=\"o\">.<\/span><span class=\"na\">id<\/span> <span class=\"o\">=<\/span> <span class=\"n\">id<\/span><span class=\"o\">;<\/span>\r\n        <span class=\"k\">this<\/span><span class=\"o\">.<\/span><span class=\"na\">ref<\/span> <span class=\"o\">=<\/span> <span class=\"n\">ref<\/span><span class=\"o\">;<\/span>\r\n        <span class=\"k\">this<\/span><span class=\"o\">.<\/span><span class=\"na\">status<\/span> <span class=\"o\">=<\/span> <span class=\"n\">status<\/span><span class=\"o\">;<\/span>\r\n    <span class=\"o\">}<\/span>\r\n\r\n    <span class=\"kd\">public<\/span> <span class=\"nc\">Date<\/span> <span class=\"nf\">getTimestamp<\/span><span class=\"o\">()<\/span> <span class=\"o\">{<\/span>\r\n        <span class=\"k\">return<\/span> <span class=\"n\">timestamp<\/span><span class=\"o\">;<\/span>\r\n    <span class=\"o\">}<\/span>\r\n\r\n    <span class=\"kd\">public<\/span> <span class=\"nc\">String<\/span> <span class=\"nf\">getId<\/span><span class=\"o\">()<\/span> <span class=\"o\">{<\/span>\r\n        <span class=\"k\">return<\/span> <span class=\"n\">id<\/span><span class=\"o\">;<\/span>\r\n    <span class=\"o\">}<\/span>\r\n\r\n    <span class=\"kd\">public<\/span> <span class=\"nc\">String<\/span> <span class=\"nf\">getRef<\/span><span class=\"o\">()<\/span> <span class=\"o\">{<\/span>\r\n        <span class=\"k\">return<\/span> <span class=\"n\">ref<\/span><span class=\"o\">;<\/span>\r\n    <span class=\"o\">}<\/span>\r\n\r\n    <span class=\"kd\">public<\/span> <span class=\"nc\">String<\/span> <span class=\"nf\">getStatus<\/span><span class=\"o\">()<\/span> 
<span class=\"o\">{<\/span>\r\n        <span class=\"k\">return<\/span> <span class=\"n\">status<\/span><span class=\"o\">;<\/span>\r\n    <span class=\"o\">}<\/span>\r\n\r\n    <span class=\"nd\">@Override<\/span>\r\n    <span class=\"kd\">public<\/span> <span class=\"kt\">boolean<\/span> <span class=\"nf\">equals<\/span><span class=\"o\">(<\/span><span class=\"nc\">Object<\/span> <span class=\"n\">o<\/span><span class=\"o\">)<\/span> <span class=\"o\">{<\/span>\r\n        <span class=\"k\">if<\/span> <span class=\"o\">(<\/span><span class=\"k\">this<\/span> <span class=\"o\">==<\/span> <span class=\"n\">o<\/span><span class=\"o\">)<\/span> <span class=\"k\">return<\/span> <span class=\"kc\">true<\/span><span class=\"o\">;<\/span>\r\n        <span class=\"k\">if<\/span> <span class=\"o\">(!(<\/span><span class=\"n\">o<\/span> <span class=\"k\">instanceof<\/span> <span class=\"nc\">DumpEntry<\/span><span class=\"o\">))<\/span> <span class=\"k\">return<\/span> <span class=\"kc\">false<\/span><span class=\"o\">;<\/span>\r\n\r\n        <span class=\"nc\">DumpEntry<\/span> <span class=\"n\">dumpEntry<\/span> <span class=\"o\">=<\/span> <span class=\"o\">(<\/span><span class=\"nc\">DumpEntry<\/span><span class=\"o\">)<\/span> <span class=\"n\">o<\/span><span class=\"o\">;<\/span>\r\n\r\n        <span class=\"k\">if<\/span> <span class=\"o\">(!<\/span><span class=\"n\">id<\/span><span class=\"o\">.<\/span><span class=\"na\">equals<\/span><span class=\"o\">(<\/span><span class=\"n\">dumpEntry<\/span><span class=\"o\">.<\/span><span class=\"na\">id<\/span><span class=\"o\">))<\/span> <span class=\"k\">return<\/span> <span class=\"kc\">false<\/span><span class=\"o\">;<\/span>\r\n        <span class=\"k\">if<\/span> <span class=\"o\">(!<\/span><span class=\"n\">ref<\/span><span class=\"o\">.<\/span><span class=\"na\">equals<\/span><span class=\"o\">(<\/span><span class=\"n\">dumpEntry<\/span><span class=\"o\">.<\/span><span class=\"na\">ref<\/span><span 
class=\"o\">))<\/span> <span class=\"k\">return<\/span> <span class=\"kc\">false<\/span><span class=\"o\">;<\/span>\r\n        <span class=\"k\">if<\/span> <span class=\"o\">(!<\/span><span class=\"n\">status<\/span><span class=\"o\">.<\/span><span class=\"na\">equals<\/span><span class=\"o\">(<\/span><span class=\"n\">dumpEntry<\/span><span class=\"o\">.<\/span><span class=\"na\">status<\/span><span class=\"o\">))<\/span> <span class=\"k\">return<\/span> <span class=\"kc\">false<\/span><span class=\"o\">;<\/span>\r\n        <span class=\"k\">if<\/span> <span class=\"o\">(!<\/span><span class=\"n\">timestamp<\/span><span class=\"o\">.<\/span><span class=\"na\">equals<\/span><span class=\"o\">(<\/span><span class=\"n\">dumpEntry<\/span><span class=\"o\">.<\/span><span class=\"na\">timestamp<\/span><span class=\"o\">))<\/span> <span class=\"k\">return<\/span> <span class=\"kc\">false<\/span><span class=\"o\">;<\/span>\r\n\r\n        <span class=\"k\">return<\/span> <span class=\"kc\">true<\/span><span class=\"o\">;<\/span>\r\n    <span class=\"o\">}<\/span>\r\n\r\n    <span class=\"nd\">@Override<\/span>\r\n    <span class=\"kd\">public<\/span> <span class=\"kt\">int<\/span> <span class=\"nf\">hashCode<\/span><span class=\"o\">()<\/span> <span class=\"o\">{<\/span>\r\n        <span class=\"kt\">int<\/span> <span class=\"n\">result<\/span> <span class=\"o\">=<\/span> <span class=\"n\">timestamp<\/span><span class=\"o\">.<\/span><span class=\"na\">hashCode<\/span><span class=\"o\">();<\/span>\r\n        <span class=\"n\">result<\/span> <span class=\"o\">=<\/span> <span class=\"mi\">31<\/span> <span class=\"o\">*<\/span> <span class=\"n\">result<\/span> <span class=\"o\">+<\/span> <span class=\"n\">id<\/span><span class=\"o\">.<\/span><span class=\"na\">hashCode<\/span><span class=\"o\">();<\/span>\r\n        <span class=\"n\">result<\/span> <span class=\"o\">=<\/span> <span class=\"mi\">31<\/span> <span class=\"o\">*<\/span> <span class=\"n\">result<\/span> <span 
class=\"o\">+<\/span> <span class=\"n\">ref<\/span><span class=\"o\">.<\/span><span class=\"na\">hashCode<\/span><span class=\"o\">();<\/span>\r\n        <span class=\"n\">result<\/span> <span class=\"o\">=<\/span> <span class=\"mi\">31<\/span> <span class=\"o\">*<\/span> <span class=\"n\">result<\/span> <span class=\"o\">+<\/span> <span class=\"n\">status<\/span><span class=\"o\">.<\/span><span class=\"na\">hashCode<\/span><span class=\"o\">();<\/span>\r\n        <span class=\"k\">return<\/span> <span class=\"n\">result<\/span><span class=\"o\">;<\/span>\r\n    <span class=\"o\">}<\/span>\r\n\r\n    <span class=\"nd\">@Override<\/span>\r\n    <span class=\"kd\">public<\/span> <span class=\"nc\">String<\/span> <span class=\"nf\">toString<\/span><span class=\"o\">()<\/span> <span class=\"o\">{<\/span>\r\n        <span class=\"k\">return<\/span> <span class=\"s\">\"DumpEntry{\"<\/span> <span class=\"o\">+<\/span>\r\n                <span class=\"s\">\"timestamp=\"<\/span> <span class=\"o\">+<\/span> <span class=\"n\">timestamp<\/span> <span class=\"o\">+<\/span>\r\n                <span class=\"s\">\", id='\"<\/span> <span class=\"o\">+<\/span> <span class=\"n\">id<\/span> <span class=\"o\">+<\/span> <span class=\"sc\">'\\''<\/span> <span class=\"o\">+<\/span>\r\n                <span class=\"s\">\", ref='\"<\/span> <span class=\"o\">+<\/span> <span class=\"n\">ref<\/span> <span class=\"o\">+<\/span> <span class=\"sc\">'\\''<\/span> <span class=\"o\">+<\/span>\r\n                <span class=\"s\">\", status='\"<\/span> <span class=\"o\">+<\/span> <span class=\"n\">status<\/span> <span class=\"o\">+<\/span> <span class=\"sc\">'\\''<\/span> <span class=\"o\">+<\/span>\r\n                <span class=\"sc\">'}'<\/span><span class=\"o\">;<\/span>\r\n    <span class=\"o\">}<\/span>\r\n<span class=\"o\">}<\/span>\r\n<\/code><\/pre>\n<h2>\u722c\u866b\u914d\u7f6e (CrawlerConfig)<\/h2>\n<p>\u8fd9\u662f\u5173\u4e8e\u722c\u866b\u8bbe\u7f6e\u7684\u8bf4\u660e\u3002<\/p>\n<pre 
class=\"post-pre\"><code><span class=\"nd\">@Component<\/span>\r\n<span class=\"nd\">@ConfigurationProperties<\/span>\r\n<span class=\"kd\">public<\/span> <span class=\"kd\">class<\/span> <span class=\"nc\">CrawlerConfig<\/span> <span class=\"o\">{<\/span>\r\n    <span class=\"kd\">private<\/span> <span class=\"kd\">static<\/span> <span class=\"kd\">final<\/span> <span class=\"nc\">String<\/span> <span class=\"no\">DEFAULT_URL<\/span> <span class=\"o\">=<\/span> <span class=\"s\">\"http:\/\/dumps.wikimedia.org\/backup-index.html\"<\/span><span class=\"o\">;<\/span>\r\n    <span class=\"kd\">private<\/span> <span class=\"kd\">static<\/span> <span class=\"kd\">final<\/span> <span class=\"kt\">long<\/span> <span class=\"no\">DEFAULT_DOWNLOAD_INTERVAL<\/span> <span class=\"o\">=<\/span> <span class=\"nc\">TimeUnit<\/span><span class=\"o\">.<\/span><span class=\"na\">HOURS<\/span><span class=\"o\">.<\/span><span class=\"na\">toMillis<\/span><span class=\"o\">(<\/span><span class=\"mi\">1<\/span><span class=\"o\">);<\/span>\r\n    <span class=\"kd\">private<\/span> <span class=\"nc\">String<\/span> <span class=\"n\">url<\/span> <span class=\"o\">=<\/span> <span class=\"no\">DEFAULT_URL<\/span><span class=\"o\">;<\/span>\r\n    <span class=\"kd\">private<\/span> <span class=\"kt\">long<\/span> <span class=\"n\">downloadInterval<\/span> <span class=\"o\">=<\/span> <span class=\"no\">DEFAULT_DOWNLOAD_INTERVAL<\/span><span class=\"o\">;<\/span>\r\n\r\n    <span class=\"kd\">public<\/span> <span class=\"nc\">String<\/span> <span class=\"nf\">getUrl<\/span><span class=\"o\">()<\/span> <span class=\"o\">{<\/span>\r\n        <span class=\"k\">return<\/span> <span class=\"n\">url<\/span><span class=\"o\">;<\/span>\r\n    <span class=\"o\">}<\/span>\r\n\r\n    <span class=\"kd\">public<\/span> <span class=\"kt\">void<\/span> <span class=\"nf\">setUrl<\/span><span class=\"o\">(<\/span><span class=\"nc\">String<\/span> <span class=\"n\">url<\/span><span class=\"o\">)<\/span> <span 
class=\"o\">{<\/span>\r\n        <span class=\"k\">this<\/span><span class=\"o\">.<\/span><span class=\"na\">url<\/span> <span class=\"o\">=<\/span> <span class=\"n\">url<\/span><span class=\"o\">;<\/span>\r\n    <span class=\"o\">}<\/span>\r\n\r\n    <span class=\"kd\">public<\/span> <span class=\"kt\">long<\/span> <span class=\"nf\">getDownloadInterval<\/span><span class=\"o\">()<\/span> <span class=\"o\">{<\/span>\r\n        <span class=\"k\">return<\/span> <span class=\"n\">downloadInterval<\/span><span class=\"o\">;<\/span>\r\n    <span class=\"o\">}<\/span>\r\n\r\n    <span class=\"kd\">public<\/span> <span class=\"kt\">void<\/span> <span class=\"nf\">setDownloadInterval<\/span><span class=\"o\">(<\/span><span class=\"kt\">long<\/span> <span class=\"n\">downloadInterval<\/span><span class=\"o\">)<\/span> <span class=\"o\">{<\/span>\r\n        <span class=\"k\">this<\/span><span class=\"o\">.<\/span><span class=\"na\">downloadInterval<\/span> <span class=\"o\">=<\/span> <span class=\"n\">downloadInterval<\/span><span class=\"o\">;<\/span>\r\n    <span class=\"o\">}<\/span>\r\n\r\n    <span class=\"nd\">@Override<\/span>\r\n    <span class=\"kd\">public<\/span> <span class=\"kt\">boolean<\/span> <span class=\"nf\">equals<\/span><span class=\"o\">(<\/span><span class=\"nc\">Object<\/span> <span class=\"n\">o<\/span><span class=\"o\">)<\/span> <span class=\"o\">{<\/span>\r\n        <span class=\"k\">if<\/span> <span class=\"o\">(<\/span><span class=\"k\">this<\/span> <span class=\"o\">==<\/span> <span class=\"n\">o<\/span><span class=\"o\">)<\/span> <span class=\"k\">return<\/span> <span class=\"kc\">true<\/span><span class=\"o\">;<\/span>\r\n        <span class=\"k\">if<\/span> <span class=\"o\">(<\/span><span class=\"n\">o<\/span> <span class=\"o\">==<\/span> <span class=\"kc\">null<\/span> <span class=\"o\">||<\/span> <span class=\"n\">getClass<\/span><span class=\"o\">()<\/span> <span class=\"o\">!=<\/span> <span class=\"n\">o<\/span><span 
class=\"o\">.<\/span><span class=\"na\">getClass<\/span><span class=\"o\">())<\/span> <span class=\"k\">return<\/span> <span class=\"kc\">false<\/span><span class=\"o\">;<\/span>\r\n\r\n        <span class=\"nc\">CrawlerConfig<\/span> <span class=\"n\">that<\/span> <span class=\"o\">=<\/span> <span class=\"o\">(<\/span><span class=\"nc\">CrawlerConfig<\/span><span class=\"o\">)<\/span> <span class=\"n\">o<\/span><span class=\"o\">;<\/span>\r\n\r\n        <span class=\"k\">if<\/span> <span class=\"o\">(<\/span><span class=\"n\">downloadInterval<\/span> <span class=\"o\">!=<\/span> <span class=\"n\">that<\/span><span class=\"o\">.<\/span><span class=\"na\">downloadInterval<\/span><span class=\"o\">)<\/span> <span class=\"k\">return<\/span> <span class=\"kc\">false<\/span><span class=\"o\">;<\/span>\r\n        <span class=\"k\">if<\/span> <span class=\"o\">(!<\/span><span class=\"n\">url<\/span><span class=\"o\">.<\/span><span class=\"na\">equals<\/span><span class=\"o\">(<\/span><span class=\"n\">that<\/span><span class=\"o\">.<\/span><span class=\"na\">url<\/span><span class=\"o\">))<\/span> <span class=\"k\">return<\/span> <span class=\"kc\">false<\/span><span class=\"o\">;<\/span>\r\n\r\n        <span class=\"k\">return<\/span> <span class=\"kc\">true<\/span><span class=\"o\">;<\/span>\r\n    <span class=\"o\">}<\/span>\r\n\r\n    <span class=\"nd\">@Override<\/span>\r\n    <span class=\"kd\">public<\/span> <span class=\"kt\">int<\/span> <span class=\"nf\">hashCode<\/span><span class=\"o\">()<\/span> <span class=\"o\">{<\/span>\r\n        <span class=\"kt\">int<\/span> <span class=\"n\">result<\/span> <span class=\"o\">=<\/span> <span class=\"n\">url<\/span><span class=\"o\">.<\/span><span class=\"na\">hashCode<\/span><span class=\"o\">();<\/span>\r\n        <span class=\"n\">result<\/span> <span class=\"o\">=<\/span> <span class=\"mi\">31<\/span> <span class=\"o\">*<\/span> <span class=\"n\">result<\/span> <span class=\"o\">+<\/span> <span 
class=\"o\">(<\/span><span class=\"kt\">int<\/span><span class=\"o\">)<\/span> <span class=\"o\">(<\/span><span class=\"n\">downloadInterval<\/span> <span class=\"o\">^<\/span> <span class=\"o\">(<\/span><span class=\"n\">downloadInterval<\/span> <span class=\"o\">&gt;&gt;&gt;<\/span> <span class=\"mi\">32<\/span><span class=\"o\">));<\/span>\r\n        <span class=\"k\">return<\/span> <span class=\"n\">result<\/span><span class=\"o\">;<\/span>\r\n    <span class=\"o\">}<\/span>\r\n\r\n    <span class=\"nd\">@Override<\/span>\r\n    <span class=\"kd\">public<\/span> <span class=\"nc\">String<\/span> <span class=\"nf\">toString<\/span><span class=\"o\">()<\/span> <span class=\"o\">{<\/span>\r\n        <span class=\"k\">return<\/span> <span class=\"s\">\"CrawlerConfig{\"<\/span> <span class=\"o\">+<\/span>\r\n                <span class=\"s\">\"url='\"<\/span> <span class=\"o\">+<\/span> <span class=\"n\">url<\/span> <span class=\"o\">+<\/span> <span class=\"sc\">'\\''<\/span> <span class=\"o\">+<\/span>\r\n                <span class=\"s\">\", downloadInterval=\"<\/span> <span class=\"o\">+<\/span> <span class=\"n\">downloadInterval<\/span> <span class=\"o\">+<\/span>\r\n                <span class=\"sc\">'}'<\/span><span class=\"o\">;<\/span>\r\n    <span class=\"o\">}<\/span>\r\n<span class=\"o\">}<\/span>\r\n<\/code><\/pre>\n<p>\u9ed8\u8ba4\u60c5\u51b5\u4e0b\uff0c\u6bcf\u96941\u5c0f\u65f6\u4ece&#8221;http:\/\/dumps.wikimedia.org\/backup-index.html&#8221;\u4e0b\u8f7dHTML\u6587\u4ef6\u3002<\/p>\n<h2>\u722c\u866b\u5e94\u7528<\/h2>\n<p>\u6700\u540e\u662f\u5e94\u7528\u7a0b\u5e8f\u7c7b\u3002<\/p>\n<pre class=\"post-pre\"><code><span class=\"nd\">@Configuration<\/span>\r\n<span class=\"nd\">@ComponentScan<\/span>\r\n<span class=\"nd\">@EnableAutoConfiguration<\/span>\r\n<span class=\"nd\">@EnableConfigurationProperties<\/span>\r\n<span class=\"kd\">public<\/span> <span class=\"kd\">class<\/span> <span class=\"nc\">CrawlerApp<\/span> <span class=\"o\">{<\/span>\r\n    
<span class=\"kd\">private<\/span> <span class=\"kd\">static<\/span> <span class=\"nc\">Logger<\/span> <span class=\"no\">LOG<\/span> <span class=\"o\">=<\/span> <span class=\"nc\">LoggerFactory<\/span><span class=\"o\">.<\/span><span class=\"na\">getLogger<\/span><span class=\"o\">(<\/span><span class=\"nc\">CrawlerApp<\/span><span class=\"o\">.<\/span><span class=\"na\">class<\/span><span class=\"o\">);<\/span>\r\n\r\n    <span class=\"kd\">public<\/span> <span class=\"kd\">static<\/span> <span class=\"kt\">void<\/span> <span class=\"nf\">main<\/span><span class=\"o\">(<\/span><span class=\"nc\">String<\/span><span class=\"o\">[]<\/span> <span class=\"n\">args<\/span><span class=\"o\">)<\/span> <span class=\"kd\">throws<\/span> <span class=\"nc\">Exception<\/span> <span class=\"o\">{<\/span>\r\n        <span class=\"nc\">ApplicationContext<\/span> <span class=\"n\">ctx<\/span> <span class=\"o\">=<\/span> <span class=\"nc\">SpringApplication<\/span><span class=\"o\">.<\/span><span class=\"na\">run<\/span><span class=\"o\">(<\/span><span class=\"nc\">CrawlerApp<\/span><span class=\"o\">.<\/span><span class=\"na\">class<\/span><span class=\"o\">,<\/span> <span class=\"n\">args<\/span><span class=\"o\">);<\/span>\r\n        <span class=\"nc\">System<\/span><span class=\"o\">.<\/span><span class=\"na\">in<\/span><span class=\"o\">.<\/span><span class=\"na\">read<\/span><span class=\"o\">();<\/span>\r\n        <span class=\"nc\">Runtime<\/span><span class=\"o\">.<\/span><span class=\"na\">getRuntime<\/span><span class=\"o\">().<\/span><span class=\"na\">exit<\/span><span class=\"o\">(<\/span><span class=\"nc\">SpringApplication<\/span><span class=\"o\">.<\/span><span class=\"na\">exit<\/span><span class=\"o\">(<\/span><span class=\"n\">ctx<\/span><span class=\"o\">));<\/span>\r\n    <span class=\"o\">}<\/span>\r\n\r\n    <span class=\"nd\">@Autowired<\/span>\r\n    <span class=\"kd\">private<\/span> <span class=\"nc\">CrawlerConfig<\/span> <span 
class=\"n\">config<\/span><span class=\"o\">;<\/span>\r\n\r\n    <span class=\"nd\">@PostConstruct<\/span>\r\n    <span class=\"kd\">public<\/span> <span class=\"kt\">void<\/span> <span class=\"nf\">postConstruct<\/span><span class=\"o\">()<\/span> <span class=\"o\">{<\/span>\r\n        <span class=\"no\">LOG<\/span><span class=\"o\">.<\/span><span class=\"na\">info<\/span><span class=\"o\">(<\/span><span class=\"s\">\"starting crawler with config={}\"<\/span><span class=\"o\">,<\/span> <span class=\"n\">config<\/span><span class=\"o\">);<\/span>\r\n    <span class=\"o\">}<\/span>\r\n\r\n    <span class=\"nd\">@MessageEndpoint<\/span>\r\n    <span class=\"kd\">public<\/span> <span class=\"kd\">static<\/span> <span class=\"kd\">class<\/span> <span class=\"nc\">Endpoint<\/span> <span class=\"o\">{<\/span>\r\n        <span class=\"nd\">@ServiceActivator<\/span><span class=\"o\">(<\/span><span class=\"n\">inputChannel<\/span><span class=\"o\">=<\/span><span class=\"s\">\"channel4\"<\/span><span class=\"o\">)<\/span>\r\n        <span class=\"kd\">public<\/span> <span class=\"kt\">void<\/span> <span class=\"nf\">log<\/span><span class=\"o\">(<\/span><span class=\"nc\">DumpEntry<\/span> <span class=\"n\">payload<\/span><span class=\"o\">)<\/span> <span class=\"o\">{<\/span>\r\n            <span class=\"no\">LOG<\/span><span class=\"o\">.<\/span><span class=\"na\">info<\/span><span class=\"o\">(<\/span><span class=\"s\">\"entry={}\"<\/span><span class=\"o\">,<\/span> <span class=\"n\">payload<\/span><span class=\"o\">);<\/span>\r\n        <span class=\"o\">}<\/span>\r\n    <span class=\"o\">}<\/span>\r\n\r\n    <span class=\"nd\">@Bean<\/span>\r\n    <span class=\"kd\">public<\/span> <span class=\"nc\">RestTemplate<\/span> <span class=\"nf\">restTemplate<\/span><span class=\"o\">()<\/span> <span class=\"o\">{<\/span>\r\n        <span class=\"k\">return<\/span> <span class=\"k\">new<\/span> <span class=\"nf\">RestTemplate<\/span><span class=\"o\">();<\/span>\r\n    <span 
class=\"o\">}<\/span>\r\n\r\n    <span class=\"nd\">@Bean<\/span>\r\n    <span class=\"kd\">public<\/span> <span class=\"nc\">PollerMetadata<\/span> <span class=\"nf\">downloadTrigger<\/span><span class=\"o\">()<\/span> <span class=\"o\">{<\/span>\r\n        <span class=\"nc\">PeriodicTrigger<\/span> <span class=\"n\">trigger<\/span> <span class=\"o\">=<\/span> <span class=\"k\">new<\/span> <span class=\"nc\">PeriodicTrigger<\/span><span class=\"o\">(<\/span><span class=\"n\">config<\/span><span class=\"o\">.<\/span><span class=\"na\">getDownloadInterval<\/span><span class=\"o\">());<\/span>\r\n        <span class=\"n\">trigger<\/span><span class=\"o\">.<\/span><span class=\"na\">setFixedRate<\/span><span class=\"o\">(<\/span><span class=\"kc\">true<\/span><span class=\"o\">);<\/span>\r\n        <span class=\"nc\">PollerMetadata<\/span> <span class=\"n\">pollerMetadata<\/span> <span class=\"o\">=<\/span> <span class=\"k\">new<\/span> <span class=\"nc\">PollerMetadata<\/span><span class=\"o\">();<\/span>\r\n        <span class=\"n\">pollerMetadata<\/span><span class=\"o\">.<\/span><span class=\"na\">setTrigger<\/span><span class=\"o\">(<\/span><span class=\"n\">trigger<\/span><span class=\"o\">);<\/span>\r\n        <span class=\"n\">pollerMetadata<\/span><span class=\"o\">.<\/span><span class=\"na\">setMaxMessagesPerPoll<\/span><span class=\"o\">(<\/span><span class=\"mi\">1<\/span><span class=\"o\">);<\/span>\r\n        <span class=\"k\">return<\/span> <span class=\"n\">pollerMetadata<\/span><span class=\"o\">;<\/span>\r\n    <span class=\"o\">}<\/span>\r\n\r\n    <span class=\"nd\">@Bean<\/span>\r\n    <span class=\"kd\">public<\/span> <span class=\"nc\">MessageChannel<\/span> <span class=\"nf\">channel1<\/span><span class=\"o\">()<\/span> <span class=\"o\">{<\/span>\r\n        <span class=\"k\">return<\/span> <span class=\"k\">new<\/span> <span class=\"nf\">QueueChannel<\/span><span class=\"o\">(<\/span><span class=\"mi\">10<\/span><span 
class=\"o\">);<\/span>\r\n    <span class=\"o\">}<\/span>\r\n\r\n    <span class=\"nd\">@Bean<\/span>\r\n    <span class=\"kd\">public<\/span> <span class=\"nc\">MessageChannel<\/span> <span class=\"nf\">channel2<\/span><span class=\"o\">()<\/span> <span class=\"o\">{<\/span>\r\n        <span class=\"k\">return<\/span> <span class=\"k\">new<\/span> <span class=\"nf\">DirectChannel<\/span><span class=\"o\">();<\/span>\r\n    <span class=\"o\">}<\/span>\r\n\r\n    <span class=\"nd\">@Bean<\/span>\r\n    <span class=\"kd\">public<\/span> <span class=\"nc\">MessageChannel<\/span> <span class=\"nf\">channel3<\/span><span class=\"o\">()<\/span> <span class=\"o\">{<\/span>\r\n        <span class=\"k\">return<\/span> <span class=\"k\">new<\/span> <span class=\"nf\">DirectChannel<\/span><span class=\"o\">();<\/span>\r\n    <span class=\"o\">}<\/span>\r\n\r\n    <span class=\"nd\">@Bean<\/span>\r\n    <span class=\"kd\">public<\/span> <span class=\"nc\">MessageChannel<\/span> <span class=\"nf\">channel4<\/span><span class=\"o\">()<\/span> <span class=\"o\">{<\/span>\r\n        <span class=\"k\">return<\/span> <span class=\"k\">new<\/span> <span class=\"nf\">QueueChannel<\/span><span class=\"o\">(<\/span><span class=\"mi\">10<\/span><span class=\"o\">);<\/span>\r\n    <span class=\"o\">}<\/span>\r\n\r\n    <span class=\"c1\">\/\/ &lt;int:poller id=\"poller\" default=\"true\" fixed-rate=\"10\"\/&gt;<\/span>\r\n    <span class=\"nd\">@Bean<\/span><span class=\"o\">(<\/span><span class=\"n\">name<\/span> <span class=\"o\">=<\/span> <span class=\"nc\">PollerMetadata<\/span><span class=\"o\">.<\/span><span class=\"na\">DEFAULT_POLLER<\/span><span class=\"o\">)<\/span>\r\n    <span class=\"kd\">public<\/span> <span class=\"nc\">PollerMetadata<\/span> <span class=\"nf\">poller<\/span><span class=\"o\">()<\/span> <span class=\"o\">{<\/span>\r\n        <span class=\"nc\">PeriodicTrigger<\/span> <span class=\"n\">trigger<\/span> <span class=\"o\">=<\/span> <span class=\"k\">new<\/span> 
<span class=\"nc\">PeriodicTrigger<\/span><span class=\"o\">(<\/span><span class=\"mi\">10<\/span><span class=\"o\">);<\/span>\r\n        <span class=\"n\">trigger<\/span><span class=\"o\">.<\/span><span class=\"na\">setFixedRate<\/span><span class=\"o\">(<\/span><span class=\"kc\">true<\/span><span class=\"o\">);<\/span>\r\n        <span class=\"nc\">PollerMetadata<\/span> <span class=\"n\">pollerMetadata<\/span> <span class=\"o\">=<\/span> <span class=\"k\">new<\/span> <span class=\"nc\">PollerMetadata<\/span><span class=\"o\">();<\/span>\r\n        <span class=\"n\">pollerMetadata<\/span><span class=\"o\">.<\/span><span class=\"na\">setTrigger<\/span><span class=\"o\">(<\/span><span class=\"n\">trigger<\/span><span class=\"o\">);<\/span>\r\n        <span class=\"k\">return<\/span> <span class=\"n\">pollerMetadata<\/span><span class=\"o\">;<\/span>\r\n    <span class=\"o\">}<\/span>\r\n<span class=\"o\">}<\/span>\r\n<\/code><\/pre>\n<p>\u5728CrawlerApp\u4e2d\uff0c\u6211\u4eec\u5b9a\u4e49\u4e86downloadTrigger\u7684\u4e0b\u8f7d\u95f4\u9694\uff0c\u4ee5\u53ca\u5b9a\u4e49\u4e86channel1\u5230channel4\u7684\u5404\u4e2a\u9891\u9053\u3002<\/p>\n<p>\u6b64\u5916\uff0cCrawlerApp\u5728\u63a5\u6536\u6765\u81eachannel4\u7684DumpEntry\u540e\u5c06\u5176\u8f93\u51fa\u5230\u65e5\u5fd7\u4e2d\u3002\u5b9e\u9645\u4e0a\uff0c\u5b83\u4f1a\u4e0e\u5916\u90e8\u7cfb\u7edf\u8fdb\u884c\u534f\u4f5c\uff0c\u6bd4\u5982\u5c06\u5176\u5199\u5165\u6587\u4ef6\u3001\u4fdd\u5b58\u5230\u6570\u636e\u5e93\u6216\u53d1\u9001\u5230\u6d88\u606f\u961f\u5217\u7b49\u3002<\/p>\n<h2>\u8fd0\u884c\u65b9\u6cd5\u548c\u5b9e\u4f8b<\/h2>\n<p>\u4ee5\u4e0b\u662f\u6267\u884c\u65b9\u6cd5\uff1a<\/p>\n<pre class=\"post-pre\"><code>mvn package\r\njava -jar target\/spring-boot-integration-crawler-sample-1.0.jar\r\n<\/code><\/pre>\n<h2>\u5b8c\u6574\u6e90\u4ee3\u7801<\/h2>\n<pre class=\"post-pre\"><code>git clone 
https:\/\/github.com\/sunny4381\/spring-boot-integration-crawler-sample.git\r\n<\/code><\/pre>\n","protected":false},"excerpt":{"rendered":"<p>\u6211\u5011\u5c07\u4f7f\u7528Spring Boot\u548cSpring Integration\u4f86\u5275\u5efa\u4e00\u500b\u7c21\u55ae\u7684\u722c\u87f2\uff0c\u4e0d\u9700\u8981\u4f7f\u7528XML\uff0c [&hellip;]<\/p>\n","protected":false},"author":10,"featured_media":0,"comment_status":"closed","ping_status":"open","sticky":false,"template":"","format":"standard","meta":{"footnotes":""},"categories":[1],"tags":[],"class_list":["post-40313","post","type-post","status-publish","format-standard","hentry","category-uncategorized"],"yoast_head":"<!-- This site is optimized with the Yoast SEO Premium plugin v21.5 (Yoast SEO v21.5) - https:\/\/yoast.com\/wordpress\/plugins\/seo\/ -->\n<title>\u4f7f\u7528Spring Boot\u548cSpring Integration\u7684\u7f51\u7edc\u722c\u866b - Blog - Silicon Cloud<\/title>\n<meta name=\"robots\" content=\"index, follow, max-snippet:-1, max-image-preview:large, max-video-preview:-1\" \/>\n<link rel=\"canonical\" href=\"https:\/\/www.silicloud.com\/zh\/blog\/\u4f7f\u7528spring-boot\u548cspring-integration\u7684\u7f51\u7edc\u722c\u866b\/\" \/>\n<meta property=\"og:locale\" content=\"zh_CN\" \/>\n<meta property=\"og:type\" content=\"article\" \/>\n<meta property=\"og:title\" content=\"\u4f7f\u7528Spring Boot\u548cSpring Integration\u7684\u7f51\u7edc\u722c\u866b\" \/>\n<meta property=\"og:description\" content=\"\u6211\u5011\u5c07\u4f7f\u7528Spring Boot\u548cSpring Integration\u4f86\u5275\u5efa\u4e00\u500b\u7c21\u55ae\u7684\u722c\u87f2\uff0c\u4e0d\u9700\u8981\u4f7f\u7528XML\uff0c [&hellip;]\" \/>\n<meta property=\"og:url\" content=\"https:\/\/www.silicloud.com\/zh\/blog\/\u4f7f\u7528spring-boot\u548cspring-integration\u7684\u7f51\u7edc\u722c\u866b\/\" \/>\n<meta property=\"og:site_name\" content=\"Blog - Silicon Cloud\" \/>\n<meta property=\"article:published_time\" content=\"2023-07-06T13:47:05+00:00\" \/>\n<meta 
property=\"article:modified_time\" content=\"2024-01-15T02:34:10+00:00\" \/>\n<meta name=\"author\" content=\"\u5b87, \u534e\" \/>\n<meta name=\"twitter:card\" content=\"summary_large_image\" \/>\n<meta name=\"twitter:label1\" content=\"\u4f5c\u8005\" \/>\n\t<meta name=\"twitter:data1\" content=\"\u5b87, \u534e\" \/>\n\t<meta name=\"twitter:label2\" content=\"\u9884\u8ba1\u9605\u8bfb\u65f6\u95f4\" \/>\n\t<meta name=\"twitter:data2\" content=\"5 \u5206\" \/>\n<script type=\"application\/ld+json\" class=\"yoast-schema-graph\">{\"@context\":\"https:\/\/schema.org\",\"@graph\":[{\"@type\":\"WebPage\",\"@id\":\"https:\/\/www.silicloud.com\/zh\/blog\/%e4%bd%bf%e7%94%a8spring-boot%e5%92%8cspring-integration%e7%9a%84%e7%bd%91%e7%bb%9c%e7%88%ac%e8%99%ab\/\",\"url\":\"https:\/\/www.silicloud.com\/zh\/blog\/%e4%bd%bf%e7%94%a8spring-boot%e5%92%8cspring-integration%e7%9a%84%e7%bd%91%e7%bb%9c%e7%88%ac%e8%99%ab\/\",\"name\":\"\u4f7f\u7528Spring Boot\u548cSpring Integration\u7684\u7f51\u7edc\u722c\u866b - Blog - Silicon 
Cloud\",\"isPartOf\":{\"@id\":\"https:\/\/www.silicloud.com\/zh\/blog\/#website\"},\"datePublished\":\"2023-07-06T13:47:05+00:00\",\"dateModified\":\"2024-01-15T02:34:10+00:00\",\"author\":{\"@id\":\"https:\/\/www.silicloud.com\/zh\/blog\/#\/schema\/person\/513018e4e121d3add1b7c5de8be21458\"},\"breadcrumb\":{\"@id\":\"https:\/\/www.silicloud.com\/zh\/blog\/%e4%bd%bf%e7%94%a8spring-boot%e5%92%8cspring-integration%e7%9a%84%e7%bd%91%e7%bb%9c%e7%88%ac%e8%99%ab\/#breadcrumb\"},\"inLanguage\":\"zh-Hans\",\"potentialAction\":[{\"@type\":\"ReadAction\",\"target\":[\"https:\/\/www.silicloud.com\/zh\/blog\/%e4%bd%bf%e7%94%a8spring-boot%e5%92%8cspring-integration%e7%9a%84%e7%bd%91%e7%bb%9c%e7%88%ac%e8%99%ab\/\"]}]},{\"@type\":\"BreadcrumbList\",\"@id\":\"https:\/\/www.silicloud.com\/zh\/blog\/%e4%bd%bf%e7%94%a8spring-boot%e5%92%8cspring-integration%e7%9a%84%e7%bd%91%e7%bb%9c%e7%88%ac%e8%99%ab\/#breadcrumb\",\"itemListElement\":[{\"@type\":\"ListItem\",\"position\":1,\"name\":\"\u9996\u9875\",\"item\":\"https:\/\/www.silicloud.com\/zh\/blog\/\"},{\"@type\":\"ListItem\",\"position\":2,\"name\":\"\u4f7f\u7528Spring Boot\u548cSpring Integration\u7684\u7f51\u7edc\u722c\u866b\"}]},{\"@type\":\"WebSite\",\"@id\":\"https:\/\/www.silicloud.com\/zh\/blog\/#website\",\"url\":\"https:\/\/www.silicloud.com\/zh\/blog\/\",\"name\":\"Blog - Silicon Cloud\",\"description\":\"\",\"inLanguage\":\"zh-Hans\"},{\"@type\":\"Person\",\"@id\":\"https:\/\/www.silicloud.com\/zh\/blog\/#\/schema\/person\/513018e4e121d3add1b7c5de8be21458\",\"name\":\"\u5b87, \u534e\",\"image\":{\"@type\":\"ImageObject\",\"inLanguage\":\"zh-Hans\",\"@id\":\"https:\/\/www.silicloud.com\/zh\/blog\/#\/schema\/person\/image\/\",\"url\":\"https:\/\/secure.gravatar.com\/avatar\/63cd45cbc05a35fc4ff7637a163c83c4962ef58d27472726c3a3e0c9c5194f0f?s=96&d=mm&r=g\",\"contentUrl\":\"https:\/\/secure.gravatar.com\/avatar\/63cd45cbc05a35fc4ff7637a163c83c4962ef58d27472726c3a3e0c9c5194f0f?s=96&d=mm&r=g\",\"caption\":\"\u5b87, 
\u534e\"},\"url\":\"https:\/\/www.silicloud.com\/zh\/blog\/author\/yuhua\/\"},{\"@type\":\"ImageObject\",\"inLanguage\":\"zh-Hans\",\"@id\":\"https:\/\/www.silicloud.com\/zh\/blog\/%e4%bd%bf%e7%94%a8spring-boot%e5%92%8cspring-integration%e7%9a%84%e7%bd%91%e7%bb%9c%e7%88%ac%e8%99%ab\/#local-main-organization-logo\",\"url\":\"\",\"contentUrl\":\"\",\"caption\":\"Blog - Silicon Cloud\"}]}<\/script>\n<!-- \/ Yoast SEO Premium plugin. -->","yoast_head_json":{"title":"\u4f7f\u7528Spring Boot\u548cSpring Integration\u7684\u7f51\u7edc\u722c\u866b - Blog - Silicon Cloud","robots":{"index":"index","follow":"follow","max-snippet":"max-snippet:-1","max-image-preview":"max-image-preview:large","max-video-preview":"max-video-preview:-1"},"canonical":"https:\/\/www.silicloud.com\/zh\/blog\/\u4f7f\u7528spring-boot\u548cspring-integration\u7684\u7f51\u7edc\u722c\u866b\/","og_locale":"zh_CN","og_type":"article","og_title":"\u4f7f\u7528Spring Boot\u548cSpring Integration\u7684\u7f51\u7edc\u722c\u866b","og_description":"\u6211\u5011\u5c07\u4f7f\u7528Spring Boot\u548cSpring Integration\u4f86\u5275\u5efa\u4e00\u500b\u7c21\u55ae\u7684\u722c\u87f2\uff0c\u4e0d\u9700\u8981\u4f7f\u7528XML\uff0c [&hellip;]","og_url":"https:\/\/www.silicloud.com\/zh\/blog\/\u4f7f\u7528spring-boot\u548cspring-integration\u7684\u7f51\u7edc\u722c\u866b\/","og_site_name":"Blog - Silicon Cloud","article_published_time":"2023-07-06T13:47:05+00:00","article_modified_time":"2024-01-15T02:34:10+00:00","author":"\u5b87, \u534e","twitter_card":"summary_large_image","twitter_misc":{"\u4f5c\u8005":"\u5b87, \u534e","\u9884\u8ba1\u9605\u8bfb\u65f6\u95f4":"5 
\u5206"},"schema":{"@context":"https:\/\/schema.org","@graph":[{"@type":"WebPage","@id":"https:\/\/www.silicloud.com\/zh\/blog\/%e4%bd%bf%e7%94%a8spring-boot%e5%92%8cspring-integration%e7%9a%84%e7%bd%91%e7%bb%9c%e7%88%ac%e8%99%ab\/","url":"https:\/\/www.silicloud.com\/zh\/blog\/%e4%bd%bf%e7%94%a8spring-boot%e5%92%8cspring-integration%e7%9a%84%e7%bd%91%e7%bb%9c%e7%88%ac%e8%99%ab\/","name":"\u4f7f\u7528Spring Boot\u548cSpring Integration\u7684\u7f51\u7edc\u722c\u866b - Blog - Silicon Cloud","isPartOf":{"@id":"https:\/\/www.silicloud.com\/zh\/blog\/#website"},"datePublished":"2023-07-06T13:47:05+00:00","dateModified":"2024-01-15T02:34:10+00:00","author":{"@id":"https:\/\/www.silicloud.com\/zh\/blog\/#\/schema\/person\/513018e4e121d3add1b7c5de8be21458"},"breadcrumb":{"@id":"https:\/\/www.silicloud.com\/zh\/blog\/%e4%bd%bf%e7%94%a8spring-boot%e5%92%8cspring-integration%e7%9a%84%e7%bd%91%e7%bb%9c%e7%88%ac%e8%99%ab\/#breadcrumb"},"inLanguage":"zh-Hans","potentialAction":[{"@type":"ReadAction","target":["https:\/\/www.silicloud.com\/zh\/blog\/%e4%bd%bf%e7%94%a8spring-boot%e5%92%8cspring-integration%e7%9a%84%e7%bd%91%e7%bb%9c%e7%88%ac%e8%99%ab\/"]}]},{"@type":"BreadcrumbList","@id":"https:\/\/www.silicloud.com\/zh\/blog\/%e4%bd%bf%e7%94%a8spring-boot%e5%92%8cspring-integration%e7%9a%84%e7%bd%91%e7%bb%9c%e7%88%ac%e8%99%ab\/#breadcrumb","itemListElement":[{"@type":"ListItem","position":1,"name":"\u9996\u9875","item":"https:\/\/www.silicloud.com\/zh\/blog\/"},{"@type":"ListItem","position":2,"name":"\u4f7f\u7528Spring Boot\u548cSpring Integration\u7684\u7f51\u7edc\u722c\u866b"}]},{"@type":"WebSite","@id":"https:\/\/www.silicloud.com\/zh\/blog\/#website","url":"https:\/\/www.silicloud.com\/zh\/blog\/","name":"Blog - Silicon Cloud","description":"","inLanguage":"zh-Hans"},{"@type":"Person","@id":"https:\/\/www.silicloud.com\/zh\/blog\/#\/schema\/person\/513018e4e121d3add1b7c5de8be21458","name":"\u5b87, 
\u534e","image":{"@type":"ImageObject","inLanguage":"zh-Hans","@id":"https:\/\/www.silicloud.com\/zh\/blog\/#\/schema\/person\/image\/","url":"https:\/\/secure.gravatar.com\/avatar\/63cd45cbc05a35fc4ff7637a163c83c4962ef58d27472726c3a3e0c9c5194f0f?s=96&d=mm&r=g","contentUrl":"https:\/\/secure.gravatar.com\/avatar\/63cd45cbc05a35fc4ff7637a163c83c4962ef58d27472726c3a3e0c9c5194f0f?s=96&d=mm&r=g","caption":"\u5b87, \u534e"},"url":"https:\/\/www.silicloud.com\/zh\/blog\/author\/yuhua\/"},{"@type":"ImageObject","inLanguage":"zh-Hans","@id":"https:\/\/www.silicloud.com\/zh\/blog\/%e4%bd%bf%e7%94%a8spring-boot%e5%92%8cspring-integration%e7%9a%84%e7%bd%91%e7%bb%9c%e7%88%ac%e8%99%ab\/#local-main-organization-logo","url":"","contentUrl":"","caption":"Blog - Silicon Cloud"}]}},"_links":{"self":[{"href":"https:\/\/www.silicloud.com\/zh\/blog\/wp-json\/wp\/v2\/posts\/40313","targetHints":{"allow":["GET"]}}],"collection":[{"href":"https:\/\/www.silicloud.com\/zh\/blog\/wp-json\/wp\/v2\/posts"}],"about":[{"href":"https:\/\/www.silicloud.com\/zh\/blog\/wp-json\/wp\/v2\/types\/post"}],"author":[{"embeddable":true,"href":"https:\/\/www.silicloud.com\/zh\/blog\/wp-json\/wp\/v2\/users\/10"}],"replies":[{"embeddable":true,"href":"https:\/\/www.silicloud.com\/zh\/blog\/wp-json\/wp\/v2\/comments?post=40313"}],"version-history":[{"count":2,"href":"https:\/\/www.silicloud.com\/zh\/blog\/wp-json\/wp\/v2\/posts\/40313\/revisions"}],"predecessor-version":[{"id":58667,"href":"https:\/\/www.silicloud.com\/zh\/blog\/wp-json\/wp\/v2\/posts\/40313\/revisions\/58667"}],"wp:attachment":[{"href":"https:\/\/www.silicloud.com\/zh\/blog\/wp-json\/wp\/v2\/media?parent=40313"}],"wp:term":[{"taxonomy":"category","embeddable":true,"href":"https:\/\/www.silicloud.com\/zh\/blog\/wp-json\/wp\/v2\/categories?post=40313"},{"taxonomy":"post_tag","embeddable":true,"href":"https:\/\/www.silicloud.com\/zh\/blog\/wp-json\/wp\/v2\/tags?post=40313"}],"curies":[{"name":"wp","href":"https:\/\/api.w.org\/{rel}","templated":t
rue}]}}