{"id":46812,"date":"2023-09-13T10:11:34","date_gmt":"2023-07-25T06:26:54","guid":{"rendered":"https:\/\/www.silicloud.com\/zh\/blog\/%e6%a6%82%e8%a6%81%e5%9c%b0%e5%9b%9e%e9%a1%bepython%e6%9e%84%e5%bb%ba%e7%9a%84%e5%ae%9e%e6%97%b6%e5%a4%84%e7%90%86%e5%9f%ba%e7%a1%80%e8%ae%be%e6%96%bd%ef%bc%8c%e4%bb%a5%e6%bb%a1%e8%b6%b3%e6%88%91\/"},"modified":"2024-05-03T23:33:04","modified_gmt":"2024-05-03T15:33:04","slug":"%e6%a6%82%e8%a6%81%e5%9c%b0%e5%9b%9e%e9%a1%bepython%e6%9e%84%e5%bb%ba%e7%9a%84%e5%ae%9e%e6%97%b6%e5%a4%84%e7%90%86%e5%9f%ba%e7%a1%80%e8%ae%be%e6%96%bd%ef%bc%8c%e4%bb%a5%e6%bb%a1%e8%b6%b3%e6%88%91","status":"publish","type":"post","link":"https:\/\/www.silicloud.com\/zh\/blog\/%e6%a6%82%e8%a6%81%e5%9c%b0%e5%9b%9e%e9%a1%bepython%e6%9e%84%e5%bb%ba%e7%9a%84%e5%ae%9e%e6%97%b6%e5%a4%84%e7%90%86%e5%9f%ba%e7%a1%80%e8%ae%be%e6%96%bd%ef%bc%8c%e4%bb%a5%e6%bb%a1%e8%b6%b3%e6%88%91\/","title":{"rendered":"\u6982\u8981\u5730\u56de\u987ePython\u6784\u5efa\u7684\u5b9e\u65f6\u5904\u7406\u57fa\u7840\u8bbe\u65bd\uff0c\u4ee5\u6ee1\u8db3&#8221;\u6211\u60f3\u4e86\u89e3\u76ee\u524d\u7684\u6570\u636e\uff01&#8221;\u7684\u9700\u6c42"},"content":{"rendered":"<p>\u8fd9\u7bc7\u6587\u7ae0\u662fNTT\u901a\u4fe1\u5b98\u65b9\u5723\u8bde\u8282\u65e5\u5386\u7684\u6700\u540e\u4e00\u5929\u7684\u6587\u7ae0\u3002\u6ca1\u60f3\u5230\u6211\u7adf\u7136\u62c5\u4efb\u4e86\u6700\u540e\u4e00\u5929\u7684\u6587\u7ae0\u8d23\u4efb\uff0c\u771f\u662f\u4e0d\u597d\u610f\u601d\u3002<\/p>\n<p>\u8be5\u4f5c\u8005\u76ee\u524d\u5728\u6280\u672f\u5f00\u53d1\u90e8\u95e8\u5de5\u4f5c\uff0c\u8d1f\u8d23\u8fdb\u884c\u516c\u53f8\u5185\u5916\u5404\u79cd\u6570\u636e\u5206\u6790\u548c\u5f02\u5e38\u68c0\u6d4b\u6280\u672f\u7684\u7814\u7a76\u4e0e\u5f00\u53d1\u3002\u6700\u8fd1\u7684\u7814\u7a76\u6210\u679c\u5df2\u88abAAAI\u7684IAAI2018\u4f1a\u8bae\u91c7\u7eb3\u3002<\/p>\n<h3>\u9996\u5148<\/h3>\n<p>\u4e3a\u4e86\u8fc5\u901f\u5411\u56e2\u961f\u5185\u7684\u5404\u79cd\u670d\u52a1\u90e8\u95e8\u63d0\u4f9b\u5206\u6790\u7ed3\u679c\uff0c\u6211\u4eec
\u6b63\u5728\u56e2\u961f\u4e2d\u5efa\u7acb\u4f7f\u7528\u5f00\u6e90\u8f6f\u4ef6\u6784\u5efa\u7684\u5206\u6790\u57fa\u7840\u8bbe\u65bd\u3002\u5728\u8fdb\u884c\u62a5\u544a\u5206\u6790\u65f6\uff0c\u9700\u8981\u8fdb\u884c\u6570\u636e\u6c47\u603b\u548c\u5206\u6790\u5904\u7406\u3002\u6839\u636e\u89c2\u770b\u8005\u7684\u4e0d\u540c\uff0c\u4e5f\u6709\u5404\u79cd\u62a5\u544a\u95f4\u9694\uff08\u5206\u6790\u7ed3\u679c\u66f4\u65b0\u9891\u7387\uff09\u7684\u8981\u6c42\u3002\u4f8b\u5982\uff0c<\/p>\n<ul class=\"post-ul\">\n<li style=\"list-style-type: none;\">\n<ul class=\"post-ul\">\u5b9a\u671f\u7684\u306a\u30e1\u30fc\u30eb\u914d\u4fe1\u3001\u30c7\u30fc\u30bf\u306e\u6700\u65b0\u5316\u3001\u6a5f\u68b0\u5b66\u7fd2\u306e\u30e2\u30c7\u30eb\u306e\u66f4\u65b0\uff081\u65e5\u306b1\u56de\u306e\u30d0\u30c3\u30c1\u51e6\u7406\uff09<\/ul>\n<\/li>\n<\/ul>\n<p>&nbsp;<\/p>\n<ul class=\"post-ul\">\n<li style=\"list-style-type: none;\">\n<ul class=\"post-ul\">\uff11\u65e5\u306b\u4f55\u5ea6\u304b\u30c7\u30fc\u30bf\u306b\u30a2\u30af\u30bb\u30b9\u3057\u3066\u3001\u30c7\u30fc\u30bf\u306e\u72b6\u6cc1\u3092\u78ba\u8a8d\u3059\u308b\uff08\u25ef\u5206\u9593 \/ \u25ef\u6642\u9593\u3067\u306e\u30d0\u30c3\u30c1\u51e6\u7406\uff09<\/ul>\n<\/li>\n<\/ul>\n<p>&nbsp;<\/p>\n<ul 
class=\"post-ul\">\u5e38\u306b\u4eca\u306e\u30c7\u30fc\u30bf\u3092\u30e2\u30cb\u30bf\u30ea\u30f3\u30b0\u3057\u305f\u3044\uff08\u30cb\u30a2\u30ea\u30a2\u30eb\u30bf\u30a4\u30e0\u51e6\u7406\u3001\u30b9\u30c8\u30ea\u30fc\u30df\u30f3\u30b0\u51e6\u7406\uff09<\/ul>\n<p>\u7279\u522b\u662f\u6700\u8fd1\u7684\u793e\u4ea4\u8c08\u8bdd\u4e2d\uff0c\u7ecf\u5e38\u4f1a\u6d89\u53ca\u5230\u5e0c\u671b\u5b9e\u65f6\u67e5\u770b\u6570\u636e\u6216\u8005\u60f3\u77e5\u9053\u73b0\u5728\u7684\u60c5\u51b5\u8fd9\u6837\u7684\u8bdd\u9898\u3002\u5b9e\u9645\u4e0a\uff0c\u6bcf\u5929\u90fd\u4e0d\u4f1a\u4e00\u76f4\u76ef\u7740\u76d1\u89c6\u5668\u3002\u4f46\u662f\uff0c\u5728\u670d\u52a1\u51fa\u73b0\u6545\u969c\u65f6\uff0c\u53ef\u80fd\u4f1a\u9700\u8981\u7d27\u76ef\u76d1\u89c6\u5668\uff0c\u6e34\u671b\u5c3d\u5feb\u77e5\u9053\u6570\u636e\u662f\u5426\u5df2\u7ecf\u5230\u4e86\u6216\u8005\u73b0\u5728\u7684\u60c5\u51b5\u5982\u4f55\u3002\u53e6\u5916\uff0c\u5982\u679c\u80fd\u591f\u5728\u6f14\u793a\u4e2d\u5c55\u793a\u5b9e\u65f6\u8fd0\u884c\u7684\u8bdd\uff0c\u4e5f\u4f1a\u663e\u5f97\u5f88\u9177\uff01<\/p>\n<p>\u6211\u4eec\u5728\u5404\u79cd\u5f00\u6e90\u8f6f\u4ef6\u67b6\u6784\u4e0b\u5b9e\u65bd\u4e86\u8fd9\u6837\u7684\u5b9e\u65f6\u5206\u6790\uff0c\u5e76\u8fdb\u884c\u4e86\u9a8c\u8bc1\u548c\u5f15\u5165\u3002\u5728JANOG2 
39th\u4e2d\uff0c\u6211\u4eec\u7684\u540c\u4e8b@__kaname__\u8d1f\u8d23\u4e86\u4f7f\u7528pmacct-&gt;kafka-&gt;presto-&gt;re:dash\u8fdb\u884c\u5feb\u901f\u6d41\u5206\u6790\u7684\u62a5\u544a\u3002\u6211\u4eec\u516c\u53f8\u4e5f\u53d1\u5e03\u4e86\u6709\u5173\u7f51\u7edc\u6d41\u91cf\u6570\u636e\u7684\u5b9e\u65f6\u5206\u6790\u6848\u4f8b\u3002\u9664\u4e86\u8fd9\u6837\u7684\u7f51\u7edc\u6d41\u91cf\u6570\u636e\u5206\u6790\u5916\uff0c\u6211\u4eec\u8fd8\u4f7f\u7528\u5728\u4e92\u8054\u7f51\u4e0a\u5b89\u88c5\u7684\u4f20\u611f\u5668\uff08\u63a2\u6d4b\u5668\uff09\u6536\u96c6\u4e0d\u540c\u7684\u7f51\u7edc\u6d41\u91cf\u6570\u636e\uff0c\u5e76\u5728\u5404\u79cd\u89d2\u5ea6\u4e0a\u8fdb\u884c\u5206\u6790\u3002\u56e0\u6b64\uff0c\u5728\u672c\u6587\u4e2d\uff0c\u6211\u60f3\u5206\u4eab\u5173\u4e8e\u642d\u5efa\u57fa\u4e8eKafka+SparkStreaming\u7684\u5b9e\u65f6\u5904\u7406\u5e73\u53f0\u7684\u7ecf\u9a8c\u3002\u7531\u4e8e\u5bf9\u8bb8\u591a\u6280\u672f\u662f\u7b2c\u4e00\u6b21\u63a5\u89e6\uff0c\u6211\u5728\u5b66\u4e60\u7684\u540c\u65f6\u4e5f\u5728\u5b9e\u8df5\u4e2d\u79ef\u7d2f\u7ecf\u9a8c\u3002<\/p>\n<p>\u5728\u89e3\u91ca\u65f6\uff0c\u4f1a\u6d89\u53ca\u5230fluentd\u3001Docker\u3001Kafka\u3001Spark\u7b49\u672f\u8bed\uff0c\u4f46\u5728\u8fd9\u65b9\u9762\u6211\u4f1a\u5c3d\u91cf\u7528\u5e73\u6613\u7684\u8bed\u8a00\u8fdb\u884c\u89e3\u91ca\uff0c\u4f46\u4e0d\u4f1a\u8fc7\u591a\u5c55\u5f00\u3002<\/p>\n<h3>\u67b6\u6784\u8bbe\u8ba1<\/h3>\n<p>\u5047\u8bbe\u5728\u591a\u4e2a\u5730\u70b9\u5b89\u88c5\u4e86\u4f20\u611f\u5668\uff0c\u5e76\u4e14\u901a\u8fc7Fluentd\u5c06\u6570\u636e\u4fdd\u5b58\u5728\u4e91\u4e0a\u7684\u865a\u62df\u673a\u4e2d\u3002<\/p>\n<p>\u5728\u8fd9\u79cd\u60c5\u51b5\u4e0b\uff0c\u9700\u8981\u7684\u6761\u4ef6\u662f\uff0c<\/p>\n<ul class=\"post-ul\">\n<li style=\"list-style-type: none;\">\n<ul 
class=\"post-ul\">SQL\u30d9\u30fc\u30b9\u3067\u66f8\u3051\u308b\u51e6\u7406\u304c\u5fc5\u8981\u3002\u3059\u3067\u306b\u5206\u6790\u8005\u304c\u5229\u7528\u3057\u3066\u3044\u308bSQL\u30af\u30a8\u30ea\u304c\u8907\u6570\u5b58\u5728\u3059\u308b\u306e\u3067\u3001\u30ea\u30a2\u30eb\u30bf\u30a4\u30e0\u306b\u96c6\u8a08\u3059\u308b\u969b\u306b\u3082\u305d\u308c\u3092\u5229\u7528\u3067\u304d\u308b\u3088\u3046\u306b\u3057\u305f\u3044\u3002<\/ul>\n<\/li>\n<\/ul>\n<p>&nbsp;<\/p>\n<ul class=\"post-ul\">\n<li style=\"list-style-type: none;\">\n<ul class=\"post-ul\">Python\u30d9\u30fc\u30b9\u3067\u69cb\u7bc9\u3057\u305f\u3044\u3002\u30c1\u30fc\u30e0\u306e\u30b9\u30ad\u30eb\u30bb\u30c3\u30c8\u7684\u306bPython\u3067\u69cb\u7bc9\u3057\u305f\u307b\u3046\u304c\u30e1\u30f3\u30c6\u30ca\u30f3\u30b9\u30b3\u30b9\u30c8\u304c\u304b\u304b\u3089\u306a\u3044\u306e\u3068\u3001\u57fa\u76e4\u4e0a\u3067\u6a5f\u68b0\u5b66\u7fd2\u30e2\u30c7\u30ebAPI\u306e\u30a4\u30f3\u30bf\u30d5\u30a7\u30fc\u30b9\u3092\u3059\u3050\u306b\u5229\u7528\u3067\u304d\u308b\u305f\u3081\u3067\u3059\u3002<\/ul>\n<\/li>\n<\/ul>\n<p>&nbsp;<\/p>\n<ul class=\"post-ul\">\n<li style=\"list-style-type: none;\">\n<ul class=\"post-ul\">\u5206\u6790\u74b0\u5883\u306e\u518d\u73fe\u6027\u306e\u78ba\u4fdd\u306e\u305f\u3081\u3001Docker\u30b3\u30f3\u30c6\u30ca\u3067\u69cb\u7bc9\u3057\u305f\u3044\u3002<\/ul>\n<\/li>\n<\/ul>\n<p>&nbsp;<\/p>\n<ul 
class=\"post-ul\">Kibana\u3067\u306e\u53ef\u8996\u5316\u306e\u305f\u3081\u3001Elasticsearch\u306b\u30c7\u30fc\u30bf\u3092\u683c\u7d0d\u3057\u305f\u3044\u3002<\/ul>\n<p>\u57fa\u4e8e\u4e0a\u8ff0\u8981\u6c42\u548c\u5f53\u524d\u8d8b\u52bf\uff0c\u6211\u4eec\u51b3\u5b9a\u4f7f\u7528Docker\u5bb9\u5668\u5728Kafka\u548cSparkStreaming\u4e0a\u8fdb\u884c\u90e8\u7f72\uff0c\u5e76\u4f7f\u7528Python\u6784\u5efa\u6240\u6709\u5904\u7406\u8fc7\u7a0b\u3002<\/p>\n<p>\u9009\u62e9SparkStreaming\u7684\u539f\u56e0\u5305\u62ec\u4ee5\u4e0b\u51e0\u70b9\uff1a\u4e0d\u8981\u6c42\u5b9e\u65f6\u7c92\u5ea6\u5230\u51e0\u79d2\u7684\u7a0b\u5ea6\uff0cSparkSQL\u80fd\u591f\u4f7f\u7528SQL\u5904\u7406\u6d41\u5165\u7684\u6570\u636e\uff0c\u540c\u65f6\u53ef\u4ee5\u76f4\u63a5\u5728Python\u4e2d\u4f7f\u7528\u673a\u5668\u5b66\u4e60API\u3002<\/p>\n<p>\u4ee5\u4e0b\u662f\u67b6\u6784\u793a\u610f\u56fe\u3002\u672c\u6587\u6392\u9664\u4e86\u8282\u70b9\u6570\u3001\u96c6\u7fa4\u89c4\u6a21\u4ee5\u53ca\u673a\u5668\u5b66\u4e60API\u7b49\u65b9\u9762\u7684\u5185\u5bb9\u3002<\/p>\n<div><img decoding=\"async\" class=\"post-images\" title=\"\" src=\"https:\/\/cdn.silicloud.com\/blog-img\/blog\/img\/657d7af0913a08637a697aad\/15-0.png\" alt=\"advent.png\" \/><\/div>\n<p>\u6211\u5011\u4f7f\u7528\u7684\u7248\u672c\u5982\u4e0b\u6240\u5217\u3002<\/p>\n<ul class=\"post-ul\">\n<li style=\"list-style-type: none;\">\n<ul class=\"post-ul\">fluentd : 0.12.40<\/ul>\n<\/li>\n<\/ul>\n<p>&nbsp;<\/p>\n<ul class=\"post-ul\">\n<li style=\"list-style-type: none;\">\n<ul class=\"post-ul\">Kafka : 0.10.2.1<\/ul>\n<\/li>\n<\/ul>\n<p>&nbsp;<\/p>\n<ul class=\"post-ul\">\n<li style=\"list-style-type: none;\">\n<ul class=\"post-ul\">Spark : 2.2<\/ul>\n<\/li>\n<\/ul>\n<p>&nbsp;<\/p>\n<ul class=\"post-ul\">Elasticsearch : 
5.6.2<\/ul>\n<p>\u76ee\u524d\uff0cKafka\u96c6\u7fa4\u548cElasticsearch\u96c6\u7fa4\u5df2\u7ecf\u542f\u52a8\u3002<\/p>\n<h3>\u4ece\u4e91\u7aef\u7684Fluentd\u4f20\u9001\u5230Kafka<\/h3>\n<p>\u4e3a\u4e86\u5c06\u4ece\u6536\u96c6\u4f20\u611f\u5668\u53d1\u9001\u5230Kafka\uff0c\u6211\u4eec\u4f7f\u7528\u4e91\u73af\u5883\u7684fluentd\u4f5c\u4e3a\u4e2d\u7ee7\u3002\u4e3a\u6b64\uff0c\u6211\u4eec\u5c06\u7f16\u8f91fluent.conf\uff0c\u5e76\u4f7f\u7528fluent-plugin-kafka\u4f5c\u4e3a\u8f93\u51fa\u63d2\u4ef6\u53d1\u9001\u5230Kafka\u3002\u4ee5\u4e0b\u662f\u4e00\u4e2a\u793a\u4f8b\uff1a<\/p>\n<pre class=\"post-pre\"><code>&lt;match aaa&gt;\r\n  &lt;store&gt;\r\n    @type kafka_buffered\r\n    brokers XXX.XXX.XXX.XXX:9092\r\n    default_topic TOPIC_NAME\r\n    &lt;snip&gt;\r\n\r\n    # See fluentd document for buffer related parameters\r\n    max_send_retries 1\r\n    required_acks -1\r\n    ack_timeout nil\r\n    compression_codec gzip\r\n    kafka_agg_max_bytes 4096\r\n    kafka_agg_max_messages nil\r\n    max_send_limit_bytes 1000000\r\n    discard_kafka_delivery_failed false\r\n    monitoring_list []\r\n  &lt;\/store&gt;\r\n&lt;\/match&gt;\r\n<\/code><\/pre>\n<p>\u53c2\u6570\u8c03\u6574\u6309\u7167\u6587\u6863\u8fdb\u884c\uff0c\u4f46\u4e5f\u8fdb\u884c\u4e86\u8bbe\u7f6e\u5e76\u9650\u5236\u4e86 max_send_limit_bytes\u3002\u8bbe\u7f6e\u540e\u91cd\u65b0\u52a0\u8f7d\u540e\uff0c\u9891\u7e41\u51fa\u73b0\u4e86 forward error error=#&lt;Fluent::BufferQueueLimitError: queue size exceeds limit&gt; error_class=Fluent::BufferQueueLimitError \u7684\u9519\u8bef\u3002\u53c2\u8003\u8fc7\u5904\u7406\u7c7b\u4f3c\u9519\u8bef\u7684\u65b9\u6cd5\uff08\u5728 td-agent \u4e2d\u5904\u7406\u961f\u5217\u5927\u5c0f\u8d85\u8fc7\u9650\u5236\u7684\u65b9\u6cd5\uff09\uff0c\u5bf9 Fluentd 
\u7684\u865a\u62df\u673a\u5185\u5b58\u8fdb\u884c\u589e\u52a0\u6765\u5904\u7406\u3002<\/p>\n<h3>\u4ece\u4e91\u4e0a\u7684Kafka\u8fde\u63a5\u5230\u57fa\u7840\u8bbe\u65bd\u4e0a\u7684Kafka\u3002<\/h3>\n<p>\u5c06\u4e91\u7aef\u7684Kafka\u53d1\u9001\u6570\u636e\u5230\u57fa\u7840Kafka\u3002\u9700\u8981\u8fdb\u884c\u6570\u636e\u6e05\u6d17\u5904\u7406\uff0c\u4ee5\u4fbf\u66f4\u5bb9\u6613\u8fdb\u884c\u5206\u6790\u3002\u8fd9\u5305\u62ec\u4e3a\u539f\u59cb\u6570\u636e\u6dfb\u52a0\u8282\u70b9\u6807\u7b7e\u4fe1\u606f\u3001\u65f6\u95f4\u4fe1\u606f\u548c\u7edf\u8ba1\u4fe1\u606f\u7b49\u3002<\/p>\n<p>\u4e3a\u4e86\u4f7f\u7528SparkStreaming\u8fdb\u884c\u5904\u7406\uff0c\u9996\u5148\u8981\u786e\u4fdd\u5728\u4efb\u4f55\u73af\u5883\u4e0b\u90fd\u80fd\u4fdd\u8bc1\u53ef\u91cd\u73b0\u6027\uff0c\u6240\u4ee5\u9700\u8981\u6784\u5efaSpark\u7684Docker\u5bb9\u5668\u3002\u867d\u7136\u5df2\u7ecf\u6709\u516c\u5f00\u7684Spark Docker\u955c\u50cf\u6587\u4ef6\uff0c\u4f46\u662f\u7531\u4e8e\u5305\u542b\u4e86\u4e0d\u5fc5\u8981\u7684\u5e93\u7b49\u539f\u56e0\uff0c\u6ca1\u6709\u7b80\u5355\u7684\u955c\u50cf\u53ef\u7528\uff0c\u6240\u4ee5\u9700\u8981\u51c6\u5907Dockerfile\u3002\u5bf9\u4e8e\u4f7f\u7528Docker Swarm\u6784\u5efaApache Spark\u96c6\u7fa4\u7684\u53c2\u8003\u4e5f\u5f88\u6709\u5e2e\u52a9\u3002<\/p>\n<p>\u6211\u53ea\u4f1a\u63d0\u53d6Dockerfile\u4e2d\u7684\u91cd\u8981\u90e8\u5206\u3002<\/p>\n<p>\u5b89\u88c5Spark<\/p>\n<pre class=\"post-pre\"><code><span class=\"c\"># install spark<\/span>\r\n<span class=\"k\">RUN <\/span><span class=\"nb\">cd<\/span> \/tmp <span class=\"se\">\\\r\n<\/span>  <span class=\"o\">&amp;&amp;<\/span> curl <span class=\"nt\">-LO<\/span> http:\/\/ftp.jaist.ac.jp\/pub\/apache\/spark\/spark-2.2.0\/spark-2.2.0-bin-hadoop2.7.tgz <span class=\"se\">\\\r\n<\/span>  <span class=\"o\">&amp;&amp;<\/span> <span class=\"nb\">tar <\/span>zxf spark-2.2.0-bin-hadoop2.7.tgz <span class=\"se\">\\\r\n<\/span>  <span class=\"o\">&amp;&amp;<\/span> <span class=\"nb\">mv <\/span>spark-2.2.0-bin-hadoop2.7 
\/spark <span class=\"se\">\\\r\n<\/span>  <span class=\"o\">&amp;&amp;<\/span> <span class=\"nb\">rm <\/span>spark-2.2.0-bin-hadoop2.7.tgz\r\n<\/code><\/pre>\n<p>\u4f7f\u7528Spark\u65f6\uff0c\u9700\u8981\u4e0b\u8f7d\u5916\u90e8\u7684JAR\u6587\u4ef6\u3002\u8fd9\u4e9b\u6587\u4ef6\u5305\u62ecapache-log4j-extras-1.2.17.jar\uff0c\u7528\u4e8e\u4ee5JST\u65f6\u533a\u663e\u793a\u65e5\u5fd7\uff0c\u4ee5\u53caspark-streaming-kafka-0-8-assembly_2.11-2.2.0.jar\uff0c\u7528\u4e8e\u4eceKafka\u52a0\u8f7d\u6570\u636e\u3002<br \/>\n\u53e6\u5916\uff0c\u5982\u679c\u4f7f\u7528Structured Streaming\uff0c\u9700\u8981\u53c2\u8003Structured Streaming + Kafka Integration Guide\uff08Kafka broker\u7248\u672c0.10.0\u6216\u66f4\u9ad8\u7248\u672c\uff09\uff0c\u5e76\u4f7f\u7528spark-sql-kafka-0-10_2.11-2.2.0.jar\u3002<\/p>\n<pre class=\"post-pre\"><code><span class=\"c\"># add jar files<\/span>\r\n<span class=\"k\">RUN <\/span>curl <span class=\"nt\">-o<\/span> \/spark\/jars\/apache-log4j-extras-1.2.17.jar <span class=\"nt\">-L<\/span> <span class=\"s2\">\"https:\/\/www.apache.org\/dist\/logging\/log4j\/extras\/1.2.17\/apache-log4j-extras-1.2.17.jar\"<\/span>\r\n<span class=\"k\">RUN <\/span>curl <span class=\"nt\">-o<\/span> \/spark\/jars\/spark-sql-kafka-0-10_2.11-2.2.0.jar <span class=\"nt\">-L<\/span> <span class=\"s2\">\"http:\/\/central.maven.org\/maven2\/org\/apache\/spark\/spark-sql-kafka-0-10_2.11\/2.2.0\/spark-sql-kafka-0-10_2.11-2.2.0.jar\"<\/span>\r\n<span class=\"k\">RUN <\/span>curl <span class=\"nt\">-o<\/span> \/spark\/jars\/spark-streaming-kafka-0-8-assembly_2.11-2.2.0.jar <span 
class=\"s2\">\"http:\/\/central.maven.org\/maven2\/org\/apache\/spark\/spark-streaming-kafka-0-8-assembly_2.11\/2.2.0\/spark-streaming-kafka-0-8-assembly_2.11-2.2.0.jar\"<\/span>\r\n<\/code><\/pre>\n<p>\u5b89\u88c5\u7528\u4e8e\u5c06\u6570\u636e\u53d1\u5e03\u5230Kafka\u7684Python\u5e93\uff0c\u5e76\u901a\u8fc7\u73af\u5883\u53d8\u91cf\u8bbe\u7f6eSpark\u6240\u4f7f\u7528\u7684Python\u7248\u672c\u3002<\/p>\n<pre class=\"post-pre\"><code><span class=\"c\"># python packages<\/span>\r\n<span class=\"k\">RUN <\/span>pip3 <span class=\"nb\">install<\/span> <span class=\"nt\">--upgrade<\/span> pip setuptools\r\n<span class=\"k\">RUN <\/span>pip3 <span class=\"nb\">install <\/span>kafka-python\r\n\r\n<span class=\"c\"># set python3 for spark<\/span>\r\n<span class=\"k\">ENV<\/span><span class=\"s\"> PYSPARK_PYTHON=python3<\/span>\r\n<\/code><\/pre>\n<p>\u6784\u5efaDockerfile\u5e76\u751f\u6210\u955c\u50cf\u3002<\/p>\n<pre class=\"post-pre\"><code>$ docker build -t spark-streaming-load:latest .\r\n<\/code><\/pre>\n<p>\u4f7f\u7528docker-compose\u8fdb\u884c\u542f\u52a8\u3002\u5728\u6b64\u8fc7\u7a0b\u4e2d\uff0c\u5c06\u6302\u8f7dSpark\u7684\u914d\u7f6e\u6587\u4ef6\u5e76\u542f\u52a8\u3002<\/p>\n<pre class=\"post-pre\"><code><span class=\"na\">spark-streaming-load<\/span><span class=\"pi\">:<\/span>\r\n  <span class=\"na\">image<\/span><span class=\"pi\">:<\/span> <span class=\"s\">spark-streaming-load:latest<\/span>\r\n  <span class=\"na\">container_name<\/span><span class=\"pi\">:<\/span> <span class=\"s\">spark-streaming-load<\/span>\r\n  <span class=\"na\">hostname<\/span><span class=\"pi\">:<\/span> <span class=\"s\">spark-streaming-load<\/span>\r\n  <span class=\"na\">volumes<\/span><span class=\"pi\">:<\/span>\r\n    <span class=\"pi\">-<\/span> <span class=\"s\">\/data:\/data<\/span>\r\n    <span class=\"pi\">-<\/span> <span class=\"s\">\/spark\/conf\/load.spark-defaults.conf:\/spark\/conf\/defaults.conf<\/span>\r\n    <span class=\"pi\">-<\/span> <span 
class=\"s\">\/spark\/conf\/load.log4j.properties:\/spark\/conf\/log4j.properties<\/span>\r\n    <span class=\"pi\">-<\/span> <span class=\"s\">\/spark\/log:\/spark\/log<\/span>\r\n<\/code><\/pre>\n<p>\u5728load.spark-defaults.conf\u4e2d\u8bbe\u7f6e\u4e0eSpark\u6027\u80fd\u6709\u5173\u7684\u53c2\u6570\u3002\u5728\u5b98\u65b9\u6587\u6863\u4e2d\u67e5\u770b\u53c2\u6570\u7684\u5185\u5bb9\u3002\u4ee5\u4e0b\u662f\u793a\u4f8b\u3002\u5173\u4e8e\u53c2\u6570\u8c03\u4f18\u7684\u8be6\u7ec6\u4fe1\u606f\u5c06\u5728\u540e\u9762\u4ecb\u7ecd\u3002<\/p>\n<pre class=\"post-pre\"><code>spark.master                     local[2]\r\nspark.driver.memory              8g\r\nspark.executor.memory            8g\r\nspark.eventLog.enabled           true\r\nspark.streaming.concurrentJobs   1\r\n<\/code><\/pre>\n<p>\u901a\u8fc7\u8bbe\u7f6e\u65e5\u5fd7\u6587\u4ef6\uff0c\u53ef\u4ee5\u8bbe\u7f6e\u65e5\u5fd7\u7684\u8f93\u51fa\u4f4d\u7f6e\u548c\u683c\u5f0f\uff0c\u4ee5\u4fbf\u4e8e\u8fdb\u884c\u8c03\u8bd5\u3002<\/p>\n<p>\u8fdb\u884c\u5c06\u65e5\u5fd7\u8f93\u51fa\u5230\u6587\u4ef6\u7684\u8bbe\u7f6e\uff08\u53c2\u8003\uff1aSpark Streaming \u65e5\u5fd7\u914d\u7f6e\uff09\u3002\u6bcf\u4e2a\u6587\u4ef6\u6700\u591a\u5b58\u50a850MB\u6570\u636e\uff0c\u5982\u679c\u8d85\u8fc7\uff0c\u5c06\u5199\u5165\u5230\u53e6\u4e00\u4e2a\u6587\u4ef6\u4e2d\u3002\u8bbe\u7f6e\u4fdd\u5b58\u6700\u591a5\u4e2a\u6587\u4ef6\u3002<\/p>\n<pre class=\"post-pre\"><code><span class=\"c\"># Set everything to be logged to the console\r\n#log4j.rootCategory=INFO,console\r\n<\/span><span class=\"py\">log4j.rootCategory<\/span><span class=\"p\">=<\/span><span class=\"s\">INFO,rolling<\/span>\r\n\r\n<span class=\"c\"># logged to the rolling setting\r\n<\/span><span class=\"py\">log4j.appender.rolling<\/span><span class=\"p\">=<\/span><span class=\"s\">org.apache.log4j.RollingFileAppender<\/span>\r\n<span class=\"py\">log4j.appender.rolling.layout<\/span><span class=\"p\">=<\/span><span 
class=\"s\">org.apache.log4j.EnhancedPatternLayout<\/span>\r\n<span class=\"py\">log4j.appender.rolling.layout.conversionPattern<\/span><span class=\"p\">=<\/span><span class=\"s\">[%d{ISO8601}{GMT+9}]%-5p - %m%n<\/span>\r\n<span class=\"py\">log4j.appender.rolling.maxFileSize<\/span><span class=\"p\">=<\/span><span class=\"s\">50MB<\/span>\r\n<span class=\"py\">log4j.appender.rolling.maxBackupIndex<\/span><span class=\"p\">=<\/span><span class=\"s\">5<\/span>\r\n<span class=\"py\">log4j.appender.rolling.file<\/span><span class=\"p\">=<\/span><span class=\"s\">\/var\/log\/spark\/streaming_load.log<\/span>\r\n<span class=\"py\">log4j.appender.rolling.encoding<\/span><span class=\"p\">=<\/span><span class=\"s\">UTF-8<\/span>\r\n<\/code><\/pre>\n<p>\u5bf9\u4e8e\u65f6\u95f4\u523b\u5ea6\uff0c\u5c06\u6309\u7167\u4ee5\u4e0b\u683c\u5f0f\u8f93\u51fa\u3002\u88ab\u6ce8\u91ca\u7684\u884c\u662f\u9ed8\u8ba4\u8bbe\u7f6e\u3002<\/p>\n<pre class=\"post-pre\"><code><span class=\"c\">#log4j.appender.console.layout=org.apache.log4j.PatternLayout\r\n<\/span><span class=\"py\">log4j.appender.console.layout<\/span><span class=\"p\">=<\/span><span class=\"s\">org.apache.log4j.EnhancedPatternLayout<\/span>\r\n<span class=\"c\">#log4j.appender.console.layout.ConversionPattern=%d{yy\/MM\/dd HH:mm:ss\/zzz} %p %c{1}: %m%n\r\n<\/span><span class=\"py\">log4j.appender.console.layout.ConversionPattern<\/span><span class=\"p\">=<\/span><span class=\"s\">[%d{ISO8601}{GMT+9}]%-5p - %m%n<\/span>\r\n<\/code><\/pre>\n<p>\u7ed3\u679c\uff0c\u65e5\u5fd7\u88ab\u6210\u529f\u8f93\u51fa\u5230\u6587\u4ef6\u4e2d\u3002<\/p>\n<pre class=\"post-pre\"><code>&lt;snip&gt;\r\n[2017-11-01 14:25:26,413]INFO  - Running Spark version 2.2.0\r\n&lt;snip&gt;\r\n<\/code><\/pre>\n<p>\u6211\u5011\u5df2\u7d93\u5b8c\u6210\u4e86\u57fa\u672c\u7684\u8a2d\u7f6e\uff0c\u63a5\u4e0b\u4f86\u6e96\u5099Python\u8173\u672c\u3002\u4ee5\u4e0b\u662f\u4e00\u500b\u7bc4\u4f8b\uff0c\u6211\u5011\u5c07\u4f7f\u7528Direct 
Kafka\u4f86\u8f09\u5165\u6578\u64da\u3002<\/p>\n<pre class=\"post-pre\"><code><span class=\"c1\"># -*- coding:utf-8 -*-\r\n<\/span><span class=\"kn\">import<\/span> <span class=\"nn\">sys<\/span><span class=\"p\">,<\/span><span class=\"n\">json<\/span>\r\n<span class=\"kn\">from<\/span> <span class=\"nn\">datetime<\/span> <span class=\"kn\">import<\/span> <span class=\"n\">datetime<\/span>\r\n<span class=\"kn\">from<\/span> <span class=\"nn\">kafka<\/span> <span class=\"kn\">import<\/span> <span class=\"n\">KafkaProducer<\/span>\r\n<span class=\"kn\">from<\/span> <span class=\"nn\">collections<\/span> <span class=\"kn\">import<\/span> <span class=\"n\">defaultdict<\/span>\r\n<span class=\"kn\">from<\/span> <span class=\"nn\">pyspark.streaming<\/span> <span class=\"kn\">import<\/span> <span class=\"n\">StreamingContext<\/span>\r\n<span class=\"kn\">from<\/span> <span class=\"nn\">pyspark.streaming.kafka<\/span> <span class=\"kn\">import<\/span> <span class=\"n\">KafkaUtils<\/span>\r\n<span class=\"kn\">from<\/span> <span class=\"nn\">pyspark.sql<\/span> <span class=\"kn\">import<\/span> <span class=\"n\">SQLContext<\/span><span class=\"p\">,<\/span><span class=\"n\">SparkSession<\/span>\r\n\r\n<span class=\"k\">def<\/span> <span class=\"nf\">process<\/span><span class=\"p\">(<\/span><span class=\"n\">dstream<\/span><span class=\"p\">):<\/span>\r\n    <span class=\"c1\"># process\r\n<\/span>    <span class=\"o\">&lt;<\/span><span class=\"n\">\u7701\u7565<\/span><span class=\"o\">&gt;<\/span>\r\n\r\n    <span class=\"c1\"># Output\r\n<\/span>    <span class=\"n\">BROKER_HOSTS<\/span> <span class=\"o\">=<\/span> <span class=\"s\">\"XXX.XXX.XXX.XXX:9092\"<\/span>\r\n    <span class=\"n\">producer<\/span> <span class=\"o\">=<\/span> <span class=\"n\">KafkaProducer<\/span><span class=\"p\">(<\/span><span class=\"n\">bootstrap_servers<\/span> <span class=\"o\">=<\/span> <span class=\"n\">BROKER_HOSTS<\/span><span class=\"p\">,<\/span>\r\n                             <span 
class=\"n\">value_serializer<\/span> <span class=\"o\">=<\/span> <span class=\"k\">lambda<\/span> <span class=\"n\">v<\/span> <span class=\"p\">:<\/span> <span class=\"n\">json<\/span><span class=\"p\">.<\/span><span class=\"n\">dumps<\/span><span class=\"p\">(<\/span><span class=\"n\">v<\/span><span class=\"p\">).<\/span><span class=\"n\">encode<\/span><span class=\"p\">(<\/span><span class=\"s\">'utf-8'<\/span><span class=\"p\">))<\/span>\r\n    <span class=\"n\">producer<\/span><span class=\"p\">.<\/span><span class=\"n\">send<\/span><span class=\"p\">(<\/span><span class=\"s\">\"TOPIC_NAME\"<\/span><span class=\"p\">,<\/span> <span class=\"n\">data<\/span><span class=\"p\">)<\/span>\r\n\r\n<span class=\"k\">if<\/span> <span class=\"n\">__name__<\/span> <span class=\"o\">==<\/span> <span class=\"s\">\"__main__\"<\/span><span class=\"p\">:<\/span>\r\n\r\n    <span class=\"c1\"># 30\u79d2\u6bce\u306e\u30d0\u30c3\u30c1\u51e6\u7406\u3092\u7e70\u308a\u8fd4\u3059StreamingContext\r\n<\/span>    <span class=\"n\">spark<\/span> <span class=\"o\">=<\/span> <span class=\"p\">(<\/span><span class=\"n\">SparkSession<\/span><span class=\"p\">.<\/span><span class=\"n\">builder<\/span><span class=\"p\">.<\/span><span class=\"n\">getOrCreate<\/span><span class=\"p\">())<\/span>\r\n    <span class=\"n\">sc<\/span> <span class=\"o\">=<\/span> <span class=\"n\">spark<\/span><span class=\"p\">.<\/span><span class=\"n\">sparkContext<\/span>\r\n    <span class=\"n\">sqlContext<\/span> <span class=\"o\">=<\/span> <span class=\"n\">SQLContext<\/span><span class=\"p\">(<\/span><span class=\"n\">sc<\/span><span class=\"p\">)<\/span>\r\n    <span class=\"n\">ssc<\/span> <span class=\"o\">=<\/span> <span class=\"n\">StreamingContext<\/span><span class=\"p\">(<\/span><span class=\"n\">sc<\/span><span class=\"p\">,<\/span> <span class=\"mi\">30<\/span><span class=\"p\">)<\/span>\r\n\r\n    <span class=\"c1\"># kafka Direct Stream\r\n<\/span>    <span class=\"k\">def<\/span> <span 
class=\"nf\">my_utf8_decoder<\/span><span class=\"p\">(<\/span><span class=\"n\">s<\/span><span class=\"p\">):<\/span>\r\n        <span class=\"k\">try<\/span> <span class=\"p\">:<\/span>\r\n            <span class=\"k\">if<\/span> <span class=\"n\">s<\/span> <span class=\"ow\">is<\/span> <span class=\"bp\">None<\/span><span class=\"p\">:<\/span>\r\n                <span class=\"k\">return<\/span> <span class=\"s\">\"{}\"<\/span>\r\n            <span class=\"k\">return<\/span> <span class=\"n\">s<\/span><span class=\"p\">.<\/span><span class=\"n\">decode<\/span><span class=\"p\">(<\/span><span class=\"s\">'utf-8'<\/span><span class=\"p\">)<\/span>\r\n        <span class=\"k\">except<\/span> <span class=\"nb\">UnicodeDecodeError<\/span> <span class=\"p\">:<\/span>\r\n            <span class=\"k\">return<\/span> <span class=\"s\">\"{}\"<\/span>\r\n    <span class=\"n\">BROKERS_HOSTS<\/span> <span class=\"o\">=<\/span> <span class=\"s\">\"XXX.XXX.XXX.XXX:9092\"<\/span>\r\n    <span class=\"n\">kafkaStream<\/span> <span class=\"o\">=<\/span> <span class=\"n\">KafkaUtils<\/span><span class=\"p\">.<\/span><span class=\"n\">createDirectStream<\/span><span class=\"p\">(<\/span><span class=\"n\">ssc<\/span> <span class=\"o\">=<\/span> <span class=\"n\">ssc<\/span><span class=\"p\">,<\/span>\r\n                                                <span class=\"n\">topics<\/span> <span class=\"o\">=<\/span> <span class=\"p\">[<\/span><span class=\"s\">\"TOPIC_NAME\"<\/span><span class=\"p\">],<\/span>\r\n                                                <span class=\"n\">kafkaParams<\/span> <span class=\"o\">=<\/span> <span class=\"p\">{<\/span><span class=\"s\">\"metadata.broker.list\"<\/span> <span class=\"p\">:<\/span> <span class=\"n\">BROKERS_HOSTS<\/span><span class=\"p\">},<\/span>\r\n                                                <span class=\"n\">valueDecoder<\/span> <span class=\"o\">=<\/span> <span class=\"n\">my_utf8_decoder<\/span><span class=\"p\">)<\/span>\r\n\r\n    
<span class=\"c1\"># Parse\r\n<\/span>    <span class=\"n\">lines<\/span> <span class=\"o\">=<\/span> <span class=\"n\">kafkaStream<\/span><span class=\"p\">.<\/span><span class=\"nb\">map<\/span><span class=\"p\">(<\/span><span class=\"k\">lambda<\/span> <span class=\"n\">x<\/span><span class=\"p\">:<\/span> <span class=\"n\">x<\/span><span class=\"p\">[<\/span><span class=\"mi\">1<\/span><span class=\"p\">])<\/span>\r\n    <span class=\"n\">lines<\/span><span class=\"p\">.<\/span><span class=\"n\">foreachRDD<\/span><span class=\"p\">(<\/span><span class=\"n\">process<\/span><span class=\"p\">)<\/span>\r\n\r\n    <span class=\"c1\"># \u30b9\u30c8\u30ea\u30fc\u30e0\u51e6\u7406\u3092\u958b\u59cb\r\n<\/span>    <span class=\"n\">ssc<\/span><span class=\"p\">.<\/span><span class=\"n\">start<\/span><span class=\"p\">()<\/span>\r\n    <span class=\"n\">ssc<\/span><span class=\"p\">.<\/span><span class=\"n\">awaitTermination<\/span><span class=\"p\">()<\/span>\r\n<\/code><\/pre>\n<p>\u7531\u4e8eSpark\u6709\u4e00\u4e2a\u793a\u4f8b\u6587\u4ef6\uff0c\u6240\u4ee5\u57fa\u672c\u4e0a\u53ef\u4ee5\u901a\u8fc7\u53c2\u8003\u5b83\u6765\u8fd0\u884c\u3002\u4f46\u662f\u5728\u6301\u7eed\u8fd0\u884c\u65f6\uff0c\u4f1a\u53d1\u751f\u6765\u81eaKafka\u7684\u6570\u636e\u52a0\u8f7d\u65f6\u7684EOFError\u3002\u8fd9\u4f3c\u4e4e\u662f\u7531\u4e8e\u65e0\u6cd5\u89e3\u7801\u6570\u636e\u7684\u5b57\u7b26\u7f16\u7801\u5f15\u8d77\u7684\u3002\u56e0\u6b64\uff0c\u5728valueDecoder\u4e2d\u6dfb\u52a0\u4e86\u5f02\u5e38\u5904\u7406\u3002\u53d1\u751f\u8fd9\u4e2a\u7684\u539f\u56e0\u662f\u4f20\u611f\u5668\u6570\u636e\u83b7\u53d6\u7684\u9519\u8bef\uff0c\u5bfc\u81f4\u5076\u5c14\u51fa\u73b0\u5b57\u7b26\u4e32\u6570\u636e\u3002\u5728\u73b0\u5b9e\u95ee\u9898\u4e2d\uff0c\u8fd9\u79cd\u60c5\u51b5\u7ecf\u5e38\u53d1\u751f\u3002\u53c2\u8003\uff1a\u8fde\u63a5Flume\u63a8\u7279\u6d41\u5230Spark\u65f6\u51fa\u73b0UTF-8\u7f16\u7801\u9519\u8bef\u3002<\/p>\n<h4>\u4e3a\u4e86\u907f\u514d\u4efb\u52a1\u5806\u79ef\uff0c\u8fdb\u884c\u53c2\u65
70\u8c03\u6574\u3002<\/h4>\n<p>\u4e3a\u4e86\u7a33\u5b9a\u5730\u8fd0\u884cSparkStreaming\u4f5c\u4e1a\uff0c\u5fc5\u987b\u76d1\u89c6\u4f5c\u4e1a\u662f\u5426\u5806\u79ef\u7b49\u60c5\u51b5\u3002\u5982\u679c\u7f6e\u4e4b\u4e0d\u7406\uff0c\u4f5c\u4e1a\u5904\u7406\u5c06\u8d76\u4e0d\u4e0a\uff0c\u5bfc\u81f4\u6570\u636e\u5ef6\u8fdf\u3002\u4f8b\u5982\uff0c\u5728\u67d0\u4e2a\u65f6\u95f4\u70b9\u6570\u636e\u6025\u5267\u589e\u52a0\u6216\u8005\u6dfb\u52a0\u4e86\u7e41\u91cd\u7684\u5904\u7406\u4efb\u52a1\u65f6\u4f1a\u53d1\u751f\u8fd9\u79cd\u60c5\u51b5\u3002<\/p>\n<p>\u5728Spark\u7684\u8c03\u8bd5\u65e5\u5fd7\u4e2d\uff0c\u4f1a\u51fa\u73b0&#8221;INFO JobScheduler: Added jobs for time \u25ef\u25ef\u25ef ms&#8221;\uff0c\u4ece\u4e2d\u53ef\u4ee5\u610f\u8bc6\u5230\u51fa\u73b0\u4e86\u8fd9\u79cd\u60c5\u51b5\u3002<\/p>\n<p>\u5f53\u521d\uff0c\u6211\u6ce8\u610f\u5230\u8fd9\u4e2a\u65e5\u5fd7\u4e00\u76f4\u5728\u9891\u7e41\u8f93\u51fa\uff0c\u4e8e\u662f\u6211\u641c\u7d22\u4e86\u4e00\u4e0b\uff0c\u53d1\u73b0\u50cf\u662f\u5728\u6211\u7684Spark\u72ec\u7acb\u96c6\u7fa4\u4e2d\u8fde\u7eed\u6dfb\u52a0\u4e86\u4e00\u4e9b\u4efb\u52a1\uff0c\u9700\u8981\u8bf4\u660e\u7684\u662f\uff0c\u8fd9\u662f\u5728\u5904\u7406\u7ebf\u7a0b\u4e0d\u8db3\u7684\u60c5\u51b5\u4e0b\u4ea7\u751f\u7684INFO\u65e5\u5fd7\u3002<\/p>\n<p>\u867d\u7136\u4ec5\u4ec5\u589e\u52a0Spark\u7684\u5de5\u4f5c\u8282\u70b9\u6570\u91cf\u5e76\u4e0d\u80fd\u89e3\u51b3\u95ee\u9898\uff0c\u4f46\u63a5\u4e0b\u6765\u6211\u4eec\u5f00\u59cb\u7814\u7a76\u6027\u80fd\u8c03\u4f18\u3002<\/p>\n<p>\u5728\u6211\u8fdb\u884c\u641c\u7d22\u5e76\u627e\u5230\u7684\u6587\u7ae0\u4e2d\uff0c\u7279\u522b\u6709\u5e2e\u52a9\u7684\u662fLinkedin\u7684\u6280\u672f\u535a\u5ba2\u300aSpark Streaming : Performance Tuning With Kafka and Mesos\u300b\u3002\u6839\u636e\u6211\u7684\u7406\u89e3\uff0c\u5b83\u7684\u6458\u8981\u5982\u4e0b\uff1a<\/p>\n<ul class=\"post-ul\">\n<li style=\"list-style-type: none;\">\n<ul class=\"post-ul\">Receiver 
base\u3088\u308a\u3000Direct base\u63a8\u5968\u3002\u7406\u7531\u306f\u3001Kafka\u306e\u30c7\u30fc\u30bf\u30d1\u30fc\u30c6\u30a3\u30b7\u30e7\u30f3\u3054\u3068\u306b\u3001Spark\u306eRDD\u30921\u5bfe1\u3067\u5bfe\u5fdc\u3055\u305b\u308b\u3053\u3068\u304c\u3067\u304d\u308b\u3002\u7d50\u679c\u3001\u30b5\u30fc\u30d0\u306e\u30b3\u30a2\u6570\u3092\u30d5\u30eb\u306b\u6d3b\u7528\u3057\u3066\u51e6\u7406\u304c\u306f\u3084\u304f\u306a\u308b\u3002Kafka\u306e\u30c7\u30fc\u30bf\u30d1\u30fc\u30c6\u30a3\u30b7\u30e7\u30f3\u306f\u30b5\u30fc\u30d0\u306e\u30b3\u30a2\u6570\u306e\u7d042\u301c3\u500d\u306e\u307b\u3046\u304c\u30d5\u30eb\u306bCPU\u3092\u5229\u7528\u3067\u304d\u308b\uff08\u3089\u3057\u3044\uff09<\/ul>\n<\/li>\n<\/ul>\n<p>Batch Interval Parameter\u3092\u5c11\u3057\u305a\u3064\u5927\u304d\u304f\u3057\u3066\u8abf\u6574\u3059\u308b\u3002\u3053\u308c\u306f\u3001Spark\u306e\u30df\u30cb\u30d0\u30c3\u30c1\u306e\u9593\u9694\u306e\u3053\u3068\u3067\u3001ssc = StreamingContext(sc, XXX)\u306eXXX\u90e8\u5206\u3092\u8abf\u6574\u3057\u307e\u3059\u3002\u3053\u308c\u306f\u30b8\u30e7\u30d6\u306e\u5927\u304d\u3055\u3084\u8981\u4ef6\uff08RTB\u5e83\u544a\u914d\u4fe1\u306a\u3069\u3067\u306f\u304b\u306a\u308a\u30ad\u30e2\u306b\u306a\u308b\uff09\u306b\u3088\u3063\u3066\u6700\u9069\u306a\u306e\u3092\u8abf\u6574\u3057\u307e\u3059\u3002<\/p>\n<p>ConcurrentJobs Parameter 
\u3092\u5927\u304d\u304f\u3059\u308b\u3002\u30b8\u30e7\u30d6\u306e\u5b9f\u884c\u6570\u306e\u3053\u3068\u3067\u3001\u3053\u3053\u3092\u5927\u304d\u304f\u3059\u308b\u3068\u3001\u3042\u308b\u30b8\u30e7\u30d6\u306e\u51e6\u7406\u304c\u9045\u308c\u3066\u3044\u3066\u3082\u3001\u305d\u308c\u304c\u5b8c\u4e86\u3059\u308b\u306e\u3092\u5f85\u3064\u3053\u3068\u306a\u304f\u6b21\u306e\u30b8\u30e7\u30d6\u3092\u5b9f\u884c\u3059\u308b\u3053\u3068\u304c\u3067\u304d\u307e\u3059\u3002\u305f\u3060\u3057\u3001\u79c1\u306e\u610f\u898b\u3067\u3082\u3042\u308a\u307e\u3059\u304c\u3001\u672c\u6765\uff11\u3067\u3042\u308b\u306e\u304c\u671b\u307e\u3057\u3044\u3068\u601d\u3044\u307e\u3059\u3002\u7406\u7531\u306f\u3001\u305d\u3082\u305d\u3082\u30b8\u30e7\u30d6\u304c\u306a\u305c\u9045\u308c\u3066\u3044\u308b\u306e\u304b\u306e\u539f\u56e0\u304c\u30ed\u30b0\u4e0a\u3067\u898b\u3048\u306b\u304f\u304f\u306a\u308b\u305f\u3081\u3067\u3059\u3002<br \/>\nKafka\u306ePatition\u304c\u3042\u308b\u306a\u3089\u30011\u30df\u30cb\u30d0\u30c3\u30c1\u306e1\u30d1\u30fc\u30c6\u30a3\u30b7\u30e7\u30f3\u3042\u305f\u308a\u306e\u51e6\u7406\u30e1\u30c3\u30bb\u30fc\u30b8\u6570\u306e\u5236\u9650\u5024maxRatePerPartition\u3092\u8a2d\u5b9a\uff08\u30c7\u30d5\u30a9\u30eb\u30c8\u306fnot set\uff09\u3059\u308b\u3002\u3053\u308c\u306f\u3042\u308b\u30d1\u30fc\u30c6\u30a3\u30b7\u30e7\u30f3\u3067\u6025\u6fc0\u306a\u30c7\u30fc\u30bf\u304c\u5897\u3048\u3066\u3082\u3001\u5236\u9650\u5024\u3067\u30b3\u30f3\u30c8\u30ed\u30fc\u30eb\u3067\u304d\u308b\u3088\u3046\u306b\u3059\u308b\u305f\u3081\u306e\u30d1\u30e9\u30e1\u30fc\u30bf\u3067\u3059\u3002<\/p>\n<p>\u9664\u6b64\u4e4b\u5916\uff0cMapR\u7684\u300aApache Kafka\/Spark 
Streaming\u7cfb\u7edf\u7684\u6027\u80fd\u4f18\u5316-\u7535\u4fe1\u6848\u4f8b\u7814\u7a76\u300b\u4e5f\u5bf9\u7cfb\u7edf\u4e2d\u5de5\u4f5c\u8282\u70b9\u7684\u5185\u5b58\u5206\u914d\u7b49\u8fdb\u884c\u4e86\u4ecb\u7ecd\uff0c\u5bf9\u6211\u975e\u5e38\u6709\u53c2\u8003\u4ef7\u503c\u3002<\/p>\n<h3>\u5c06\u5361\u592b\u5361\u4e2d\u7684\u6570\u636e\u5bfc\u51fa\u5230Elasticsearch<\/h3>\n<p>\u6211\u5011\u958b\u59cb\u5c07\u6578\u64da\u7a4d\u7d2f\u5230\u57fa\u790e\u8a2d\u65bd\u4e0a\u7684 Kafka\u3002\u95dc\u65bc\u5982\u4f55\u4f7f\u7528\u9019\u4e9b\u6578\u64da\uff0c\u9019\u6b21\u6211\u5011\u5c07\u4f7f\u7528\u53e6\u4e00\u500b SparkStreaming \u4f86\u5c07\u9019\u4e9b\u6578\u64da\u5b58\u5132\u5230 ElasticSearch \u4e2d\uff0c\u4ee5\u4f9b\u5be6\u6642\u53ef\u8996\u5316\u4f7f\u7528\u3002\u4ee5\u4e0b\u662f\u793a\u4f8b\u4ee3\u78bc\u3002<\/p>\n<pre class=\"post-pre\"><code><span class=\"c1\"># -*- coding:utf-8 -*-\r\n<\/span><span class=\"kn\">import<\/span> <span class=\"nn\">json<\/span>\r\n<span class=\"kn\">from<\/span> <span class=\"nn\">datetime<\/span> <span class=\"kn\">import<\/span> <span class=\"n\">datetime<\/span>\r\n<span class=\"kn\">from<\/span> <span class=\"nn\">pyspark.streaming<\/span> <span class=\"kn\">import<\/span> <span class=\"n\">StreamingContext<\/span>\r\n<span class=\"kn\">from<\/span> <span class=\"nn\">pyspark.streaming.kafka<\/span> <span class=\"kn\">import<\/span> <span class=\"n\">KafkaUtils<\/span>\r\n<span class=\"kn\">from<\/span> <span class=\"nn\">pyspark.sql<\/span> <span class=\"kn\">import<\/span> <span class=\"n\">SQLContext<\/span><span class=\"p\">,<\/span><span class=\"n\">SparkSession<\/span><span class=\"p\">,<\/span><span class=\"n\">Row<\/span>\r\n<span class=\"kn\">from<\/span> <span class=\"nn\">utils.Schema<\/span> <span class=\"kn\">import<\/span> <span class=\"n\">Schema<\/span>\r\n<span class=\"kn\">from<\/span> <span class=\"nn\">utils.Select<\/span> <span class=\"kn\">import<\/span> <span class=\"n\">Select<\/span>\r\n<span 
class=\"kn\">from<\/span> <span class=\"nn\">utils.ElasticSpark<\/span> <span class=\"kn\">import<\/span> <span class=\"n\">ElasticSpark<\/span>\r\n\r\n<span class=\"k\">def<\/span> <span class=\"nf\">getSparkSessionInstance<\/span><span class=\"p\">(<\/span><span class=\"n\">sparkConf<\/span><span class=\"p\">):<\/span>\r\n    <span class=\"k\">if<\/span> <span class=\"p\">(<\/span><span class=\"s\">'sparkSessionSingletonInstance'<\/span> <span class=\"ow\">not<\/span> <span class=\"ow\">in<\/span> <span class=\"nb\">globals<\/span><span class=\"p\">()):<\/span>\r\n        <span class=\"nb\">globals<\/span><span class=\"p\">()[<\/span><span class=\"s\">'sparkSessionSingletonInstance'<\/span><span class=\"p\">]<\/span> <span class=\"o\">=<\/span> <span class=\"n\">SparkSession<\/span>\\\r\n            <span class=\"p\">.<\/span><span class=\"n\">builder<\/span>\\\r\n            <span class=\"p\">.<\/span><span class=\"n\">config<\/span><span class=\"p\">(<\/span><span class=\"n\">conf<\/span><span class=\"o\">=<\/span><span class=\"n\">sparkConf<\/span><span class=\"p\">)<\/span>\\\r\n            <span class=\"p\">.<\/span><span class=\"n\">getOrCreate<\/span><span class=\"p\">()<\/span>\r\n    <span class=\"k\">return<\/span> <span class=\"nb\">globals<\/span><span class=\"p\">()[<\/span><span class=\"s\">'sparkSessionSingletonInstance'<\/span><span class=\"p\">]<\/span>\r\n\r\n<span class=\"k\">def<\/span> <span class=\"nf\">process<\/span><span class=\"p\">(<\/span><span class=\"n\">dstream<\/span><span class=\"p\">):<\/span>\r\n    <span class=\"c1\"># dstream load\r\n<\/span>    <span class=\"n\">spark_dstream<\/span> <span class=\"o\">=<\/span> <span class=\"n\">getSparkSessionInstance<\/span><span class=\"p\">(<\/span><span class=\"n\">dstream<\/span><span class=\"p\">.<\/span><span class=\"n\">context<\/span><span class=\"p\">.<\/span><span class=\"n\">getConf<\/span><span class=\"p\">())<\/span>\r\n    <span class=\"n\">row<\/span> <span 
class=\"o\">=<\/span> <span class=\"n\">dstream<\/span><span class=\"p\">.<\/span><span class=\"nb\">map<\/span><span class=\"p\">(<\/span><span class=\"k\">lambda<\/span> <span class=\"n\">x<\/span><span class=\"p\">:<\/span> <span class=\"n\">Row<\/span><span class=\"p\">(<\/span>\r\n        <span class=\"n\">date<\/span> <span class=\"o\">=<\/span> <span class=\"n\">json<\/span><span class=\"p\">.<\/span><span class=\"n\">loads<\/span><span class=\"p\">(<\/span><span class=\"n\">x<\/span><span class=\"p\">)[<\/span><span class=\"s\">\"DATE\"<\/span><span class=\"p\">],<\/span> \r\n        <span class=\"n\">key<\/span> <span class=\"o\">=<\/span> <span class=\"n\">json<\/span><span class=\"p\">.<\/span><span class=\"n\">loads<\/span><span class=\"p\">(<\/span><span class=\"n\">x<\/span><span class=\"p\">)[<\/span><span class=\"s\">\"KEY\"<\/span><span class=\"p\">],<\/span>\r\n        <span class=\"n\">value<\/span> <span class=\"o\">=<\/span> <span class=\"nb\">float<\/span><span class=\"p\">(<\/span><span class=\"n\">json<\/span><span class=\"p\">.<\/span><span class=\"n\">loads<\/span><span class=\"p\">(<\/span><span class=\"n\">x<\/span><span class=\"p\">)[<\/span><span class=\"s\">\"VALUE\"<\/span><span class=\"p\">]))<\/span>\r\n    <span class=\"p\">)<\/span>\r\n\r\n    <span class=\"c1\"># schema setting\r\n<\/span>    <span class=\"n\">schema<\/span> <span class=\"o\">=<\/span> <span class=\"n\">Schema<\/span><span class=\"p\">()<\/span>\r\n    <span class=\"n\">row_df<\/span> <span class=\"o\">=<\/span> <span class=\"n\">spark_dstream<\/span><span class=\"p\">.<\/span><span class=\"n\">createDataFrame<\/span><span class=\"p\">(<\/span><span class=\"n\">row<\/span><span class=\"p\">,<\/span> <span class=\"n\">schema<\/span><span class=\"p\">.<\/span><span class=\"n\">get<\/span><span class=\"p\">())<\/span>\r\n    <span class=\"n\">row_df<\/span><span class=\"p\">.<\/span><span class=\"n\">show<\/span><span class=\"p\">()<\/span>\r\n\r\n    <span 
class=\"c1\"># Select and Filtering\r\n<\/span>    <span class=\"n\">ps<\/span> <span class=\"o\">=<\/span> <span class=\"n\">Select<\/span><span class=\"p\">(<\/span><span class=\"n\">spark<\/span> <span class=\"o\">=<\/span> <span class=\"n\">spark<\/span><span class=\"p\">,<\/span> <span class=\"n\">df<\/span> <span class=\"o\">=<\/span> <span class=\"n\">row_df<\/span><span class=\"p\">)<\/span>\r\n    <span class=\"n\">sql_df<\/span> <span class=\"o\">=<\/span> <span class=\"n\">ps<\/span><span class=\"p\">.<\/span><span class=\"n\">select<\/span><span class=\"p\">(<\/span><span class=\"n\">keyword<\/span> <span class=\"o\">=<\/span> <span class=\"s\">\"AAA\"<\/span><span class=\"p\">)<\/span>\r\n    <span class=\"n\">sql_df<\/span><span class=\"p\">.<\/span><span class=\"n\">show<\/span><span class=\"p\">()<\/span>\r\n\r\n    <span class=\"c1\"># To ES\r\n<\/span>    <span class=\"n\">es<\/span> <span class=\"o\">=<\/span> <span class=\"n\">ElasticSpark<\/span><span class=\"p\">()<\/span>\r\n    <span class=\"n\">es<\/span><span class=\"p\">.<\/span><span class=\"n\">df_write<\/span><span class=\"p\">(<\/span><span class=\"n\">sql_df<\/span><span class=\"p\">,<\/span> <span class=\"s\">\"BBB\"<\/span><span class=\"p\">,<\/span> <span class=\"s\">\"BBB\"<\/span><span class=\"p\">)<\/span>\r\n\r\n<span class=\"k\">if<\/span> <span class=\"n\">__name__<\/span> <span class=\"o\">==<\/span> <span class=\"s\">\"__main__\"<\/span><span class=\"p\">:<\/span>\r\n\r\n    <span class=\"c1\"># StreamingContext by Each 60 sec\r\n<\/span>    <span class=\"n\">spark<\/span> <span class=\"o\">=<\/span> <span class=\"p\">(<\/span><span class=\"n\">SparkSession<\/span><span class=\"p\">.<\/span><span class=\"n\">builder<\/span><span class=\"p\">.<\/span><span class=\"n\">getOrCreate<\/span><span class=\"p\">())<\/span>\r\n    <span class=\"n\">sc<\/span> <span class=\"o\">=<\/span> <span class=\"n\">spark<\/span><span class=\"p\">.<\/span><span 
class=\"n\">sparkContext<\/span>\r\n    <span class=\"n\">sqlContext<\/span> <span class=\"o\">=<\/span> <span class=\"n\">SQLContext<\/span><span class=\"p\">(<\/span><span class=\"n\">sc<\/span><span class=\"p\">)<\/span>\r\n    <span class=\"n\">ssc<\/span> <span class=\"o\">=<\/span> <span class=\"n\">StreamingContext<\/span><span class=\"p\">(<\/span><span class=\"n\">sc<\/span><span class=\"p\">,<\/span> <span class=\"mi\">60<\/span><span class=\"p\">)<\/span>\r\n\r\n    <span class=\"c1\"># kafka Direct Stream\r\n<\/span>    <span class=\"n\">BROKERS_HOSTS<\/span> <span class=\"o\">=<\/span> <span class=\"s\">\"XXX.XXX.XXX.XXX:9092\"<\/span>\r\n    <span class=\"n\">kafkaStream<\/span> <span class=\"o\">=<\/span> <span class=\"n\">KafkaUtils<\/span><span class=\"p\">.<\/span><span class=\"n\">createDirectStream<\/span><span class=\"p\">(<\/span><span class=\"n\">ssc<\/span> <span class=\"o\">=<\/span> <span class=\"n\">ssc<\/span><span class=\"p\">,<\/span>\r\n                                                <span class=\"n\">topics<\/span> <span class=\"o\">=<\/span> <span class=\"p\">[<\/span><span class=\"s\">\"TOPIC_NAME\"<\/span><span class=\"p\">],<\/span>\r\n                                                <span class=\"n\">kafkaParams<\/span> <span class=\"o\">=<\/span> <span class=\"p\">{<\/span><span class=\"s\">\"metadata.broker.list\"<\/span> <span class=\"p\">:<\/span> <span class=\"n\">BROKERS_HOSTS<\/span><span class=\"p\">})<\/span>\r\n    <span class=\"c1\"># Batch Process Define\r\n<\/span>    <span class=\"n\">lines<\/span> <span class=\"o\">=<\/span> <span class=\"n\">kafkaStream<\/span><span class=\"p\">.<\/span><span class=\"nb\">map<\/span><span class=\"p\">(<\/span><span class=\"k\">lambda<\/span> <span class=\"n\">x<\/span><span class=\"p\">:<\/span> <span class=\"n\">x<\/span><span class=\"p\">[<\/span><span class=\"mi\">1<\/span><span class=\"p\">])<\/span>\r\n    <span class=\"n\">lines<\/span><span class=\"p\">.<\/span><span 
class=\"n\">foreachRDD<\/span><span class=\"p\">(<\/span><span class=\"n\">process<\/span><span class=\"p\">)<\/span>\r\n\r\n    <span class=\"c1\"># Start\r\n<\/span>    <span class=\"n\">ssc<\/span><span class=\"p\">.<\/span><span class=\"n\">start<\/span><span class=\"p\">()<\/span>\r\n    <span class=\"n\">ssc<\/span><span class=\"p\">.<\/span><span class=\"n\">awaitTermination<\/span><span class=\"p\">()<\/span>\r\n<\/code><\/pre>\n<p>\u5927\u81f4\u4e0a\u4e0eSpark\u793a\u4f8b\u4ee3\u7801\u76f8\u540c\uff0c\u4f46\u4e3a\u4e86\u786e\u4fdd\u5176\u80fd\u591f\u5728\u5b9e\u9645\u5206\u6790\u4e2d\u4f7f\u7528\uff0c\u6211\u8fdb\u884c\u4e86\u4e00\u4e9b\u5904\u7406\u3002\u4ee5\u4e0b\u662f\u5927\u81f4\u7684\u6d41\u7a0b\u8bf4\u660e\u3002<\/p>\n<p>\u4e3a\u4e86\u4f7f\u7528Spark\u7684DataFrame\u7c7b\u578b\u5904\u7406\u6570\u636e\uff0c\u9996\u5148\u5c06RDD\u683c\u5f0f\u4ee5Row\u7c7b\u578b\u8fdb\u884c\u63cf\u8ff0\uff0c\u7136\u540e\u6784\u5efaDataFrame\u3002<\/p>\n<p>\u63a5\u4e0b\u6765\uff0c\u6211\u4eec\u5c06\u4f7f\u7528\u81ea\u5b9a\u4e49\u7684Schema\u7c7b\u6765\u5b9a\u4e49\u6bcf\u4e2a\u6570\u636e\u5217\u7684\u6a21\u5f0f\uff08\u4f8b\u5982\uff1a\u5b57\u7b26\u4e32\u3001\u6d6e\u70b9\u6570\u548c\u65e5\u671f\u7c7b\u578b\uff09\u3002\u793a\u4f8b\u5982\u4e0b\uff1a<\/p>\n<pre class=\"post-pre\"><code><span class=\"n\">schema<\/span> <span class=\"o\">=<\/span> <span class=\"n\">StructType<\/span><span class=\"p\">([<\/span>\r\n            <span class=\"n\">StructField<\/span><span class=\"p\">(<\/span><span class=\"s\">\"date\"<\/span><span class=\"p\">,<\/span> <span class=\"n\">TimestampType<\/span><span class=\"p\">(),<\/span> <span class=\"bp\">True<\/span><span class=\"p\">),<\/span>\r\n            <span class=\"n\">StructField<\/span><span class=\"p\">(<\/span><span class=\"s\">\"key\"<\/span><span class=\"p\">,<\/span> <span class=\"n\">StringType<\/span><span class=\"p\">(),<\/span> <span class=\"bp\">True<\/span><span class=\"p\">),<\/span>\r\n            <span 
class=\"n\">StructField<\/span><span class=\"p\">(<\/span><span class=\"s\">\"value\"<\/span><span class=\"p\">,<\/span> <span class=\"n\">FloatType<\/span><span class=\"p\">(),<\/span> <span class=\"bp\">True<\/span><span class=\"p\">)<\/span>\r\n<span class=\"p\">])<\/span>\r\n<\/code><\/pre>\n<p>\u63a5\u4e0b\u6765\uff0c\u6211\u4eec\u53ef\u4ee5\u4f7f\u7528\u81ea\u5b9a\u4e49\u7684Select\u7c7b\u57fa\u4e8eSpark SQL\u4ece\u6570\u636e\u4e2d\u9009\u62e9\u6240\u9700\u7684\u5217\uff0c\u6216\u8005\u4ec5\u63d0\u53d6\u4e0e\u6761\u4ef6\u5339\u914d\u7684\u884c\uff0c\u8fd8\u53ef\u4ee5\u4f7f\u7528Groupby\u7b49\u65b9\u6cd5\u8fdb\u884c\u7edf\u8ba1\u5904\u7406\u4ee5\u751f\u6210\u6570\u636e\u3002\u4ee5\u4e0b\u662f\u4e00\u4e2a\u4f8b\u5b50\uff1a<\/p>\n<pre class=\"post-pre\"><code><span class=\"n\">sql_df<\/span> <span class=\"o\">=<\/span> <span class=\"bp\">self<\/span><span class=\"p\">.<\/span><span class=\"n\">spark<\/span><span class=\"p\">.<\/span><span class=\"n\">sql<\/span><span class=\"p\">(<\/span><span class=\"s\">\"\"\"\r\n                select *\r\n                from df\r\n                where key rlike '^[a-z]+[0-9]{2}$' AND\r\n                      (value &gt; 0 AND value &lt; 100)\r\n            \"\"\"<\/span><span class=\"p\">)<\/span>\r\n<\/code><\/pre>\n<p>\u6700\u5f8c\uff0c\u5c07DataFrame\u6578\u64da\u5c0e\u5165\u5230Elasticsearch\u4e2d\u3002\u5728\u9019\u88e1\uff0c\u6578\u64da\u5c07\u901a\u904eElasticsearch\u7684\u57fa\u672c\u8eab\u4efd\u9a57\u8b49\u9032\u884c\u5b58\u5132\u3002\u9019\u88e1\u9700\u8981\u6ce8\u610f\u7684\u662f\uff0c\u6211\u767c\u73fees.nodes.wan.only\u7684\u9ed8\u8a8d\u503c\u4f3c\u4e4e\u662fFalse\uff0c\u4f46\u6211\u5728\u81ea\u5df1\u7684\u74b0\u5883\u4e2d\u5c07\u5176\u8a2d\u7f6e\u70baTrue\u3002\u6b64\u5916\uff0c\u6211\u9084\u5c07\u6dfb\u52a0\u7570\u5e38\u8655\u7406\uff0c\u4ee5\u78ba\u4fdd\u5728Elasticsearch\u670d\u52d9\u5b95\u6a5f\u6642\u4ecd\u7136\u80fd\u5920\u7e7c\u7e8c\u8655\u7406\u3002<\/p>\n<pre class=\"post-pre\"><code><span 
class=\"k\">try<\/span> <span class=\"p\">:<\/span>\r\n    <span class=\"n\">df<\/span><span class=\"p\">.<\/span><span class=\"n\">write<\/span>\\\r\n        <span class=\"p\">.<\/span><span class=\"nb\">format<\/span><span class=\"p\">(<\/span><span class=\"s\">\"org.elasticsearch.spark.sql\"<\/span><span class=\"p\">)<\/span>\\\r\n        <span class=\"p\">.<\/span><span class=\"n\">mode<\/span><span class=\"p\">(<\/span><span class=\"s\">'append'<\/span><span class=\"p\">)<\/span>\\\r\n        <span class=\"p\">.<\/span><span class=\"n\">option<\/span><span class=\"p\">(<\/span><span class=\"s\">\"es.nodes\"<\/span><span class=\"p\">,<\/span><span class=\"bp\">self<\/span><span class=\"p\">.<\/span><span class=\"n\">urls<\/span><span class=\"p\">)<\/span>\\\r\n        <span class=\"p\">.<\/span><span class=\"n\">option<\/span><span class=\"p\">(<\/span><span class=\"s\">\"es.port\"<\/span><span class=\"p\">,<\/span><span class=\"bp\">self<\/span><span class=\"p\">.<\/span><span class=\"n\">port<\/span><span class=\"p\">)<\/span>\\\r\n        <span class=\"p\">.<\/span><span class=\"n\">option<\/span><span class=\"p\">(<\/span><span class=\"s\">\"es.net.http.auth.user\"<\/span><span class=\"p\">,<\/span><span class=\"bp\">self<\/span><span class=\"p\">.<\/span><span class=\"n\">user<\/span><span class=\"p\">)<\/span>\\\r\n        <span class=\"p\">.<\/span><span class=\"n\">option<\/span><span class=\"p\">(<\/span><span class=\"s\">\"es.net.http.auth.pass\"<\/span><span class=\"p\">,<\/span><span class=\"bp\">self<\/span><span class=\"p\">.<\/span><span class=\"n\">password<\/span><span class=\"p\">)<\/span>\\\r\n        <span class=\"p\">.<\/span><span class=\"n\">option<\/span><span class=\"p\">(<\/span><span class=\"s\">\"es.nodes.wan.only\"<\/span><span class=\"p\">,<\/span> <span class=\"bp\">True<\/span><span class=\"p\">)<\/span>\\\r\n        <span class=\"p\">.<\/span><span class=\"n\">option<\/span><span class=\"p\">(<\/span><span 
class=\"s\">\"es.resource\"<\/span><span class=\"p\">,<\/span><span class=\"n\">index<\/span><span class=\"o\">+<\/span><span class=\"s\">\"\/\"<\/span><span class=\"o\">+<\/span><span class=\"n\">mapping<\/span><span class=\"p\">)<\/span>\\\r\n        <span class=\"p\">.<\/span><span class=\"n\">save<\/span><span class=\"p\">()<\/span>\r\n<span class=\"k\">except<\/span> <span class=\"n\">Py4JJavaError<\/span> <span class=\"p\">:<\/span> \r\n    <span class=\"k\">print<\/span><span class=\"p\">(<\/span><span class=\"s\">\"ERROR - Something wrong to import ES\"<\/span><span class=\"p\">)<\/span>\r\n<\/code><\/pre>\n<p>\u6700\u7ec8\u7ed3\u679c\u662f\u4ee5DataFrame\u5f62\u5f0f\u7684\u6570\u636e\u6d41\u5165\uff0c\u5e76\u88ab\u5bfc\u5165\u5230Elasticsearch\u4e2d\u3002<\/p>\n<pre class=\"post-pre\"><code>&lt;snip&gt;\r\nINFO DAGScheduler: Job 93 finished: showString at NativeMethodAccessorImpl.java:0, took 0.162547 s\r\n+---------------------+-------------+-----------+\r\n|                 date|          key|      value|\r\n+---------------------+-------------+-----------+\r\n|  2017-12-12 09:58:50|       abcc12|       3.72|\r\n+---------------------+-------------+-----------+\r\nINFO SparkContext: Starting job: runJob at EsSparkSQL.scala:101\r\n&lt;snip&gt;\r\n<\/code><\/pre>\n<p>\u7136\u540e\u53ef\u4ee5\u4f7f\u7528Kibana\u6309\u7167\u4e2a\u4eba\u559c\u597d\u6765\u67e5\u770b\u6570\u636e\u3002\u7701\u7565\u4e86\u6b64\u8bbe\u7f6e\u3002<\/p>\n<h3>\u56de\u987e\u6784\u5efa\u540e\u7684\u60c5\u51b5\u65f6<\/h3>\n<ul class=\"post-ul\">\n<li style=\"list-style-type: none;\">\n<ul 
class=\"post-ul\">Kafka\uff0bSparkStreaming\u3092\u4eca\u56de\u4e00\u304b\u3089\u4f5c\u308a\u307e\u3057\u305f\u3002\u30b5\u30f3\u30d7\u30eb\u30b3\u30fc\u30c9\u306f\u8272\u3005\u3042\u308b\u306e\u3067\u3059\u304c\u3001\u305d\u308c\u3092\u5b9f\u74b0\u5883\u3067\u52d5\u304b\u3059\u307e\u3067\u306e\u30d7\u30ed\u30bb\u30b9\u306f\u305d\u308c\u306e\u7d44\u307f\u5408\u308f\u305b\u3060\u3051\u3058\u3083\u89e3\u6c7a\u3057\u306a\u3044\u3053\u3068\u3082\u591a\u304b\u3063\u305f\u3067\u3059\u3002\u305d\u306e\u8fba\u306f\u3001\u5e45\u5e83\u3044\u5468\u8fba\u77e5\u8b58\u3092\u30ad\u30e3\u30c3\u30c1\u30a2\u30c3\u30d7\u3057\u306a\u304c\u3089\u3001\u3042\u3068\u306fStack Overflow\u306e\u691c\u7d22\u529b\u3002<\/ul>\n<\/li>\n<\/ul>\n<p>&nbsp;<\/p>\n<ul class=\"post-ul\">\n<li style=\"list-style-type: none;\">\n<ul class=\"post-ul\">\u30c7\u30fc\u30bf\u306e\u767a\u751f\u304b\u3089\u306eES\u3078\u306e\u683c\u7d0d\u307e\u3067\u306e\u30dc\u30c8\u30eb\u30cd\u30c3\u30af\u7b87\u6240\u306e\u5206\u6790\u306f\u3053\u308c\u304b\u3089\u5fc5\u8981\u306b\u306a\u308a\u305d\u3046\u3067\u3059\u3002Kafka\u3001Spark\u3001Elasticsearch\u3068\u30dc\u30c8\u30eb\u30cd\u30c3\u30af\u7b87\u6240\u3068\u306a\u308a\u5f97\u308b\u306e\u304c\u8907\u6570\u8003\u3048\u3089\u308c\u308b\u305f\u3081\u3001\u5207\u308a\u5206\u3051\u306e\u305f\u3081\u306b\u5404\u7a2e\u30d7\u30ed\u30bb\u30b9\u306e\u30e2\u30cb\u30bf\u30ea\u30f3\u30b0\u304c\u5fc5\u8981\u306b\u306a\u308a\u307e\u3059\u3002Spark Streaming\u306e\u6982\u8981\u3068\u691c\u8a3c\u30b7\u30ca\u30ea\u30aa\u306f\u8aad\u3093\u3067\u3044\u3066\u3001\u30dc\u30c8\u30eb\u30cd\u30c3\u30af\u7b87\u6240\u3092\u8abf\u3079\u308b\u52c9\u5f37\u306b\u306a\u308a\u307e\u3057\u305f\u3002<\/ul>\n<\/li>\n<\/ul>\n<p>&nbsp;<\/p>\n<ul class=\"post-ul\">\n<li style=\"list-style-type: none;\">\n<ul 
class=\"post-ul\">\u3069\u308c\u304f\u3089\u3044\u306e\u524d\u306e\u30c7\u30fc\u30bf\u3092\u898b\u305f\u3044\u3068\u3044\u3046\u30cb\u30fc\u30ba\u306b\u3053\u306e\u30a2\u30fc\u30ad\u30c6\u30af\u30c1\u30e3\u3060\u3068\u3069\u3053\u307e\u3067\u8010\u3048\u308c\u308b\u306e\u304b\u306f\u307e\u3060\u307e\u3060\u308f\u304b\u308a\u307e\u305b\u3093\u3002\u4f8b\u3048\u3070\u300110\u79d2\u5f8c\u306e\u30c7\u30fc\u30bf\u304c\u307f\u305f\u3044\u3068\u3044\u3063\u305f\u3053\u3068\u306b\u8010\u3048\u308c\u308b\u306e\u304b\u306a\u3069\u3002<\/ul>\n<\/li>\n<\/ul>\n<p>&nbsp;<\/p>\n<ul class=\"post-ul\">\u30bb\u30ad\u30e5\u30ea\u30c6\u30a3\u8981\u4ef6\u3092\u4eca\u56de\u306f\u7701\u3044\u3066\u3044\u307e\u3059\u304c\u3001SSL\u5316\u7b49\u3067\u30d1\u30d5\u30a9\u30fc\u30de\u30f3\u30b9\u304c\u3069\u306e\u7a0b\u5ea6\u843d\u3061\u308b\u306e\u304b\u3082\u6c17\u306b\u306a\u308a\u307e\u3059\u3002<\/ul>\n<p>\u6211\u5011\u5728\u904b\u7528\u4e2d\u7406\u89e3\u8981\u9ede\uff0c\u73fe\u5728\u9054\u5230\u4e86\u50c5\u4f7f\u7528Python\u5c31\u80fd\u5b8c\u6210\u8655\u7406\u7684\u80fd\u529b\uff0c\u6240\u4ee5\u5c07\u4f86\u6703\u671d\u8457\u66f4\u597d\u7684\u65b9\u5411\u52aa\u529b\u3002<\/p>\n<h3>\u5728\u6700\u540e<\/h3>\n<p>\u5728\u672c\u7bc7\u6587\u7ae0\u4e2d\uff0c\u4f5c\u8005\u56de\u987e\u4e86\u81ea\u5df1\u5728Python\u4e2d\u6784\u5efa\u5b9e\u65f6\u5904\u7406\u57fa\u7840\u8bbe\u65bd\u7684\u7ecf\u9a8c\u3002\u6700\u8fd1\u4e00\u76f4\u5728\u8fdb\u884c\u5f02\u5e38\u68c0\u6d4b\u6280\u672f\u7684\u7814\u7a76\u548c\u8bba\u6587\u5199\u4f5c\uff0c\u56e0\u6b64\u80fd\u591f\u4ee5\u4e00\u79cd\u65b0\u9c9c\u7684\u5fc3\u6001\u6765\u5904\u7406\u57fa\u7840\u8bbe\u65bd\u7684\u6784\u5efa\u3002\u56de\u987e\u8fc7\u7a0b\u4e2d\uff0c\u786e\u5b9e\u5b58\u5728\u4e00\u4e9b\u4e0d\u8db3\u4e4b\u5904\uff0c\u4f46\u901a\u8fc7\u53c2\u4e0e\u8282\u65e5\u7684\u673a\u4f1a\uff0c\u80fd\u591f\u5c06\u5176\u8f93\u51fa\u3002\u5bf9\u4e8e\u4e3a\u4ec0\u4e48\u4f1a\u505a\u8fd9\u6837\u7684\u4e8b\u60c5\u7b49\u4e00\u4e9b\u6734\u7d20\u7684\u610f\u89c1\u548c\u95
ee\u9898\uff0c\u6211\u4eec\u975e\u5e38\u6b22\u8fce\uff01\u4eab\u53d7\u6570\u636e\u5427\uff01<\/p>\n<div>\n<p>\u901a\u8fc7\u57fa\u4e8eJavaScript\u7684\u968f\u673a\u51fd\u6570\u8fdb\u884c\u516c\u5e73\u5224\u65ad\u6765\u51b3\u5b9a\u3002\u21a9<\/p>\n<p>\u65e5\u672c\u7f51\u7edc\u8fd0\u8425\u5546\u534f\u4f1a\u7684\u7f29\u5199\u3002\u65e8\u5728\u901a\u8fc7\u8ba8\u8bba\u3001\u7814\u7a76\u548c\u4ecb\u7ecd\u4e0e\u4e92\u8054\u7f51\u6280\u672f\u53ca\u76f8\u5173\u64cd\u4f5c\u4e8b\u9879\u6709\u5173\u7684\u4e8b\u5b9c\uff0c\u4e3a\u65e5\u672c\u7684\u4e92\u8054\u7f51\u6280\u672f\u4eba\u5458\u548c\u7528\u6237\u505a\u51fa\u8d21\u732e\u7684\u7ec4\u7ec7\uff08\u5b98\u65b9\u7f51\u9875\uff09\u21a9<\/p>\n<p>\u53ef\u4ee5\u5b9a\u671f\u5c06\u6587\u4ef6\u5199\u5165HDFS\u5e76\u4f5c\u4e3a\u51b7\u6570\u636e\u8fdb\u884c\u6c38\u4e45\u4fdd\u5b58\uff0c\u4e5f\u53ef\u4ee5\u901a\u8fc7\u673a\u5668\u5b66\u4e60\u5c06\u5206\u6790\u7ed3\u679c\u5b58\u50a8\u5728ES\u4e2d\u8003\u8651\u3002\u21a9<\/p>\n<\/div>\n","protected":false},"excerpt":{"rendered":"<p>\u8fd9\u7bc7\u6587\u7ae0\u662fNTT\u901a\u4fe1\u5b98\u65b9\u5723\u8bde\u8282\u65e5\u5386\u7684\u6700\u540e\u4e00\u5929\u7684\u6587\u7ae0\u3002\u6ca1\u60f3\u5230\u6211\u7adf\u7136\u62c5\u4efb\u4e86\u6700\u540e\u4e00\u5929\u7684\u6587\u7ae0\u8d23\u4efb\uff0c\u771f\u662f\u4e0d\u597d\u610f\u601d\u3002 \u8be5\u4f5c [&hellip;]<\/p>\n","protected":false},"author":7,"featured_media":0,"comment_status":"closed","ping_status":"open","sticky":false,"template":"","format":"standard","meta":{"footnotes":""},"categories":[1],"tags":[],"class_list":["post-46812","post","type-post","status-publish","format-standard","hentry","category-uncategorized"],"yoast_head":"<!-- This site is optimized with the Yoast SEO Premium plugin v21.5 (Yoast SEO v21.5) - https:\/\/yoast.com\/wordpress\/plugins\/seo\/ 
-->\n<title>\u6982\u8981\u5730\u56de\u987ePython\u6784\u5efa\u7684\u5b9e\u65f6\u5904\u7406\u57fa\u7840\u8bbe\u65bd\uff0c\u4ee5\u6ee1\u8db3&quot;\u6211\u60f3\u4e86\u89e3\u76ee\u524d\u7684\u6570\u636e\uff01&quot;\u7684\u9700\u6c42 - Blog - Silicon Cloud<\/title>\n<meta name=\"robots\" content=\"index, follow, max-snippet:-1, max-image-preview:large, max-video-preview:-1\" \/>\n<link rel=\"canonical\" href=\"https:\/\/www.silicloud.com\/zh\/blog\/\u6982\u8981\u5730\u56de\u987epython\u6784\u5efa\u7684\u5b9e\u65f6\u5904\u7406\u57fa\u7840\u8bbe\u65bd\uff0c\u4ee5\u6ee1\u8db3\u6211\/\" \/>\n<meta property=\"og:locale\" content=\"zh_CN\" \/>\n<meta property=\"og:type\" content=\"article\" \/>\n<meta property=\"og:title\" content=\"\u6982\u8981\u5730\u56de\u987ePython\u6784\u5efa\u7684\u5b9e\u65f6\u5904\u7406\u57fa\u7840\u8bbe\u65bd\uff0c\u4ee5\u6ee1\u8db3&quot;\u6211\u60f3\u4e86\u89e3\u76ee\u524d\u7684\u6570\u636e\uff01&quot;\u7684\u9700\u6c42\" \/>\n<meta property=\"og:description\" content=\"\u8fd9\u7bc7\u6587\u7ae0\u662fNTT\u901a\u4fe1\u5b98\u65b9\u5723\u8bde\u8282\u65e5\u5386\u7684\u6700\u540e\u4e00\u5929\u7684\u6587\u7ae0\u3002\u6ca1\u60f3\u5230\u6211\u7adf\u7136\u62c5\u4efb\u4e86\u6700\u540e\u4e00\u5929\u7684\u6587\u7ae0\u8d23\u4efb\uff0c\u771f\u662f\u4e0d\u597d\u610f\u601d\u3002 \u8be5\u4f5c [&hellip;]\" \/>\n<meta property=\"og:url\" content=\"https:\/\/www.silicloud.com\/zh\/blog\/\u6982\u8981\u5730\u56de\u987epython\u6784\u5efa\u7684\u5b9e\u65f6\u5904\u7406\u57fa\u7840\u8bbe\u65bd\uff0c\u4ee5\u6ee1\u8db3\u6211\/\" \/>\n<meta property=\"og:site_name\" content=\"Blog - Silicon Cloud\" \/>\n<meta property=\"article:published_time\" content=\"2023-07-25T06:26:54+00:00\" \/>\n<meta property=\"article:modified_time\" content=\"2024-05-03T15:33:04+00:00\" \/>\n<meta property=\"og:image\" content=\"https:\/\/cdn.silicloud.com\/blog-img\/blog\/img\/657d7af0913a08637a697aad\/15-0.png\" \/>\n<meta name=\"author\" content=\"\u79d1, \u9896\" \/>\n<meta name=\"twitter:card\" 
content=\"summary_large_image\" \/>\n<meta name=\"twitter:label1\" content=\"\u4f5c\u8005\" \/>\n\t<meta name=\"twitter:data1\" content=\"\u79d1, \u9896\" \/>\n\t<meta name=\"twitter:label2\" content=\"\u9884\u8ba1\u9605\u8bfb\u65f6\u95f4\" \/>\n\t<meta name=\"twitter:data2\" content=\"6 \u5206\" \/>\n<script type=\"application\/ld+json\" class=\"yoast-schema-graph\">{\"@context\":\"https:\/\/schema.org\",\"@graph\":[{\"@type\":\"WebPage\",\"@id\":\"https:\/\/www.silicloud.com\/zh\/blog\/%e6%a6%82%e8%a6%81%e5%9c%b0%e5%9b%9e%e9%a1%bepython%e6%9e%84%e5%bb%ba%e7%9a%84%e5%ae%9e%e6%97%b6%e5%a4%84%e7%90%86%e5%9f%ba%e7%a1%80%e8%ae%be%e6%96%bd%ef%bc%8c%e4%bb%a5%e6%bb%a1%e8%b6%b3%e6%88%91\/\",\"url\":\"https:\/\/www.silicloud.com\/zh\/blog\/%e6%a6%82%e8%a6%81%e5%9c%b0%e5%9b%9e%e9%a1%bepython%e6%9e%84%e5%bb%ba%e7%9a%84%e5%ae%9e%e6%97%b6%e5%a4%84%e7%90%86%e5%9f%ba%e7%a1%80%e8%ae%be%e6%96%bd%ef%bc%8c%e4%bb%a5%e6%bb%a1%e8%b6%b3%e6%88%91\/\",\"name\":\"\u6982\u8981\u5730\u56de\u987ePython\u6784\u5efa\u7684\u5b9e\u65f6\u5904\u7406\u57fa\u7840\u8bbe\u65bd\uff0c\u4ee5\u6ee1\u8db3\\\"\u6211\u60f3\u4e86\u89e3\u76ee\u524d\u7684\u6570\u636e\uff01\\\"\u7684\u9700\u6c42 - Blog - Silicon 
Cloud\",\"isPartOf\":{\"@id\":\"https:\/\/www.silicloud.com\/zh\/blog\/#website\"},\"datePublished\":\"2023-07-25T06:26:54+00:00\",\"dateModified\":\"2024-05-03T15:33:04+00:00\",\"author\":{\"@id\":\"https:\/\/www.silicloud.com\/zh\/blog\/#\/schema\/person\/8ca01ba7f7362ad4edb7da206a12f29e\"},\"breadcrumb\":{\"@id\":\"https:\/\/www.silicloud.com\/zh\/blog\/%e6%a6%82%e8%a6%81%e5%9c%b0%e5%9b%9e%e9%a1%bepython%e6%9e%84%e5%bb%ba%e7%9a%84%e5%ae%9e%e6%97%b6%e5%a4%84%e7%90%86%e5%9f%ba%e7%a1%80%e8%ae%be%e6%96%bd%ef%bc%8c%e4%bb%a5%e6%bb%a1%e8%b6%b3%e6%88%91\/#breadcrumb\"},\"inLanguage\":\"zh-Hans\",\"potentialAction\":[{\"@type\":\"ReadAction\",\"target\":[\"https:\/\/www.silicloud.com\/zh\/blog\/%e6%a6%82%e8%a6%81%e5%9c%b0%e5%9b%9e%e9%a1%bepython%e6%9e%84%e5%bb%ba%e7%9a%84%e5%ae%9e%e6%97%b6%e5%a4%84%e7%90%86%e5%9f%ba%e7%a1%80%e8%ae%be%e6%96%bd%ef%bc%8c%e4%bb%a5%e6%bb%a1%e8%b6%b3%e6%88%91\/\"]}]},{\"@type\":\"BreadcrumbList\",\"@id\":\"https:\/\/www.silicloud.com\/zh\/blog\/%e6%a6%82%e8%a6%81%e5%9c%b0%e5%9b%9e%e9%a1%bepython%e6%9e%84%e5%bb%ba%e7%9a%84%e5%ae%9e%e6%97%b6%e5%a4%84%e7%90%86%e5%9f%ba%e7%a1%80%e8%ae%be%e6%96%bd%ef%bc%8c%e4%bb%a5%e6%bb%a1%e8%b6%b3%e6%88%91\/#breadcrumb\",\"itemListElement\":[{\"@type\":\"ListItem\",\"position\":1,\"name\":\"\u9996\u9875\",\"item\":\"https:\/\/www.silicloud.com\/zh\/blog\/\"},{\"@type\":\"ListItem\",\"position\":2,\"name\":\"\u6982\u8981\u5730\u56de\u987ePython\u6784\u5efa\u7684\u5b9e\u65f6\u5904\u7406\u57fa\u7840\u8bbe\u65bd\uff0c\u4ee5\u6ee1\u8db3&#8221;\u6211\u60f3\u4e86\u89e3\u76ee\u524d\u7684\u6570\u636e\uff01&#8221;\u7684\u9700\u6c42\"}]},{\"@type\":\"WebSite\",\"@id\":\"https:\/\/www.silicloud.com\/zh\/blog\/#website\",\"url\":\"https:\/\/www.silicloud.com\/zh\/blog\/\",\"name\":\"Blog - Silicon Cloud\",\"description\":\"\",\"inLanguage\":\"zh-Hans\"},{\"@type\":\"Person\",\"@id\":\"https:\/\/www.silicloud.com\/zh\/blog\/#\/schema\/person\/8ca01ba7f7362ad4edb7da206a12f29e\",\"name\":\"\u79d1, 
\u9896\",\"image\":{\"@type\":\"ImageObject\",\"inLanguage\":\"zh-Hans\",\"@id\":\"https:\/\/www.silicloud.com\/zh\/blog\/#\/schema\/person\/image\/\",\"url\":\"https:\/\/secure.gravatar.com\/avatar\/8a6fb3cc7ba2f69d2189ba532aec4633ea7ed75ac0af162ec367cb3abc0fb2af?s=96&d=mm&r=g\",\"contentUrl\":\"https:\/\/secure.gravatar.com\/avatar\/8a6fb3cc7ba2f69d2189ba532aec4633ea7ed75ac0af162ec367cb3abc0fb2af?s=96&d=mm&r=g\",\"caption\":\"\u79d1, \u9896\"},\"url\":\"https:\/\/www.silicloud.com\/zh\/blog\/author\/keying\/\"},{\"@type\":\"ImageObject\",\"inLanguage\":\"zh-Hans\",\"@id\":\"https:\/\/www.silicloud.com\/zh\/blog\/%e6%a6%82%e8%a6%81%e5%9c%b0%e5%9b%9e%e9%a1%bepython%e6%9e%84%e5%bb%ba%e7%9a%84%e5%ae%9e%e6%97%b6%e5%a4%84%e7%90%86%e5%9f%ba%e7%a1%80%e8%ae%be%e6%96%bd%ef%bc%8c%e4%bb%a5%e6%bb%a1%e8%b6%b3%e6%88%91\/#local-main-organization-logo\",\"url\":\"\",\"contentUrl\":\"\",\"caption\":\"Blog - Silicon Cloud\"}]}<\/script>\n<!-- \/ Yoast SEO Premium plugin. -->","yoast_head_json":{"title":"\u6982\u8981\u5730\u56de\u987ePython\u6784\u5efa\u7684\u5b9e\u65f6\u5904\u7406\u57fa\u7840\u8bbe\u65bd\uff0c\u4ee5\u6ee1\u8db3\"\u6211\u60f3\u4e86\u89e3\u76ee\u524d\u7684\u6570\u636e\uff01\"\u7684\u9700\u6c42 - Blog - Silicon 
Cloud","robots":{"index":"index","follow":"follow","max-snippet":"max-snippet:-1","max-image-preview":"max-image-preview:large","max-video-preview":"max-video-preview:-1"},"canonical":"https:\/\/www.silicloud.com\/zh\/blog\/\u6982\u8981\u5730\u56de\u987epython\u6784\u5efa\u7684\u5b9e\u65f6\u5904\u7406\u57fa\u7840\u8bbe\u65bd\uff0c\u4ee5\u6ee1\u8db3\u6211\/","og_locale":"zh_CN","og_type":"article","og_title":"\u6982\u8981\u5730\u56de\u987ePython\u6784\u5efa\u7684\u5b9e\u65f6\u5904\u7406\u57fa\u7840\u8bbe\u65bd\uff0c\u4ee5\u6ee1\u8db3\"\u6211\u60f3\u4e86\u89e3\u76ee\u524d\u7684\u6570\u636e\uff01\"\u7684\u9700\u6c42","og_description":"\u8fd9\u7bc7\u6587\u7ae0\u662fNTT\u901a\u4fe1\u5b98\u65b9\u5723\u8bde\u8282\u65e5\u5386\u7684\u6700\u540e\u4e00\u5929\u7684\u6587\u7ae0\u3002\u6ca1\u60f3\u5230\u6211\u7adf\u7136\u62c5\u4efb\u4e86\u6700\u540e\u4e00\u5929\u7684\u6587\u7ae0\u8d23\u4efb\uff0c\u771f\u662f\u4e0d\u597d\u610f\u601d\u3002 \u8be5\u4f5c [&hellip;]","og_url":"https:\/\/www.silicloud.com\/zh\/blog\/\u6982\u8981\u5730\u56de\u987epython\u6784\u5efa\u7684\u5b9e\u65f6\u5904\u7406\u57fa\u7840\u8bbe\u65bd\uff0c\u4ee5\u6ee1\u8db3\u6211\/","og_site_name":"Blog - Silicon Cloud","article_published_time":"2023-07-25T06:26:54+00:00","article_modified_time":"2024-05-03T15:33:04+00:00","og_image":[{"url":"https:\/\/cdn.silicloud.com\/blog-img\/blog\/img\/657d7af0913a08637a697aad\/15-0.png"}],"author":"\u79d1, \u9896","twitter_card":"summary_large_image","twitter_misc":{"\u4f5c\u8005":"\u79d1, \u9896","\u9884\u8ba1\u9605\u8bfb\u65f6\u95f4":"6 
\u5206"},"schema":{"@context":"https:\/\/schema.org","@graph":[{"@type":"WebPage","@id":"https:\/\/www.silicloud.com\/zh\/blog\/%e6%a6%82%e8%a6%81%e5%9c%b0%e5%9b%9e%e9%a1%bepython%e6%9e%84%e5%bb%ba%e7%9a%84%e5%ae%9e%e6%97%b6%e5%a4%84%e7%90%86%e5%9f%ba%e7%a1%80%e8%ae%be%e6%96%bd%ef%bc%8c%e4%bb%a5%e6%bb%a1%e8%b6%b3%e6%88%91\/","url":"https:\/\/www.silicloud.com\/zh\/blog\/%e6%a6%82%e8%a6%81%e5%9c%b0%e5%9b%9e%e9%a1%bepython%e6%9e%84%e5%bb%ba%e7%9a%84%e5%ae%9e%e6%97%b6%e5%a4%84%e7%90%86%e5%9f%ba%e7%a1%80%e8%ae%be%e6%96%bd%ef%bc%8c%e4%bb%a5%e6%bb%a1%e8%b6%b3%e6%88%91\/","name":"\u6982\u8981\u5730\u56de\u987ePython\u6784\u5efa\u7684\u5b9e\u65f6\u5904\u7406\u57fa\u7840\u8bbe\u65bd\uff0c\u4ee5\u6ee1\u8db3\"\u6211\u60f3\u4e86\u89e3\u76ee\u524d\u7684\u6570\u636e\uff01\"\u7684\u9700\u6c42 - Blog - Silicon Cloud","isPartOf":{"@id":"https:\/\/www.silicloud.com\/zh\/blog\/#website"},"datePublished":"2023-07-25T06:26:54+00:00","dateModified":"2024-05-03T15:33:04+00:00","author":{"@id":"https:\/\/www.silicloud.com\/zh\/blog\/#\/schema\/person\/8ca01ba7f7362ad4edb7da206a12f29e"},"breadcrumb":{"@id":"https:\/\/www.silicloud.com\/zh\/blog\/%e6%a6%82%e8%a6%81%e5%9c%b0%e5%9b%9e%e9%a1%bepython%e6%9e%84%e5%bb%ba%e7%9a%84%e5%ae%9e%e6%97%b6%e5%a4%84%e7%90%86%e5%9f%ba%e7%a1%80%e8%ae%be%e6%96%bd%ef%bc%8c%e4%bb%a5%e6%bb%a1%e8%b6%b3%e6%88%91\/#breadcrumb"},"inLanguage":"zh-Hans","potentialAction":[{"@type":"ReadAction","target":["https:\/\/www.silicloud.com\/zh\/blog\/%e6%a6%82%e8%a6%81%e5%9c%b0%e5%9b%9e%e9%a1%bepython%e6%9e%84%e5%bb%ba%e7%9a%84%e5%ae%9e%e6%97%b6%e5%a4%84%e7%90%86%e5%9f%ba%e7%a1%80%e8%ae%be%e6%96%bd%ef%bc%8c%e4%bb%a5%e6%bb%a1%e8%b6%b3%e6%88%91\/"]}]},{"@type":"BreadcrumbList","@id":"https:\/\/www.silicloud.com\/zh\/blog\/%e6%a6%82%e8%a6%81%e5%9c%b0%e5%9b%9e%e9%a1%bepython%e6%9e%84%e5%bb%ba%e7%9a%84%e5%ae%9e%e6%97%b6%e5%a4%84%e7%90%86%e5%9f%ba%e7%a1%80%e8%ae%be%e6%96%bd%ef%bc%8c%e4%bb%a5%e6%bb%a1%e8%b6%b3%e6%88%91\/#breadcrumb","itemListElement":[{"@type":"ListItem","position":1
,"name":"\u9996\u9875","item":"https:\/\/www.silicloud.com\/zh\/blog\/"},{"@type":"ListItem","position":2,"name":"\u6982\u8981\u5730\u56de\u987ePython\u6784\u5efa\u7684\u5b9e\u65f6\u5904\u7406\u57fa\u7840\u8bbe\u65bd\uff0c\u4ee5\u6ee1\u8db3&#8221;\u6211\u60f3\u4e86\u89e3\u76ee\u524d\u7684\u6570\u636e\uff01&#8221;\u7684\u9700\u6c42"}]},{"@type":"WebSite","@id":"https:\/\/www.silicloud.com\/zh\/blog\/#website","url":"https:\/\/www.silicloud.com\/zh\/blog\/","name":"Blog - Silicon Cloud","description":"","inLanguage":"zh-Hans"},{"@type":"Person","@id":"https:\/\/www.silicloud.com\/zh\/blog\/#\/schema\/person\/8ca01ba7f7362ad4edb7da206a12f29e","name":"\u79d1, \u9896","image":{"@type":"ImageObject","inLanguage":"zh-Hans","@id":"https:\/\/www.silicloud.com\/zh\/blog\/#\/schema\/person\/image\/","url":"https:\/\/secure.gravatar.com\/avatar\/8a6fb3cc7ba2f69d2189ba532aec4633ea7ed75ac0af162ec367cb3abc0fb2af?s=96&d=mm&r=g","contentUrl":"https:\/\/secure.gravatar.com\/avatar\/8a6fb3cc7ba2f69d2189ba532aec4633ea7ed75ac0af162ec367cb3abc0fb2af?s=96&d=mm&r=g","caption":"\u79d1, \u9896"},"url":"https:\/\/www.silicloud.com\/zh\/blog\/author\/keying\/"},{"@type":"ImageObject","inLanguage":"zh-Hans","@id":"https:\/\/www.silicloud.com\/zh\/blog\/%e6%a6%82%e8%a6%81%e5%9c%b0%e5%9b%9e%e9%a1%bepython%e6%9e%84%e5%bb%ba%e7%9a%84%e5%ae%9e%e6%97%b6%e5%a4%84%e7%90%86%e5%9f%ba%e7%a1%80%e8%ae%be%e6%96%bd%ef%bc%8c%e4%bb%a5%e6%bb%a1%e8%b6%b3%e6%88%91\/#local-main-organization-logo","url":"","contentUrl":"","caption":"Blog - Silicon 
Cloud"}]}},"_links":{"self":[{"href":"https:\/\/www.silicloud.com\/zh\/blog\/wp-json\/wp\/v2\/posts\/46812","targetHints":{"allow":["GET"]}}],"collection":[{"href":"https:\/\/www.silicloud.com\/zh\/blog\/wp-json\/wp\/v2\/posts"}],"about":[{"href":"https:\/\/www.silicloud.com\/zh\/blog\/wp-json\/wp\/v2\/types\/post"}],"author":[{"embeddable":true,"href":"https:\/\/www.silicloud.com\/zh\/blog\/wp-json\/wp\/v2\/users\/7"}],"replies":[{"embeddable":true,"href":"https:\/\/www.silicloud.com\/zh\/blog\/wp-json\/wp\/v2\/comments?post=46812"}],"version-history":[{"count":2,"href":"https:\/\/www.silicloud.com\/zh\/blog\/wp-json\/wp\/v2\/posts\/46812\/revisions"}],"predecessor-version":[{"id":94769,"href":"https:\/\/www.silicloud.com\/zh\/blog\/wp-json\/wp\/v2\/posts\/46812\/revisions\/94769"}],"wp:attachment":[{"href":"https:\/\/www.silicloud.com\/zh\/blog\/wp-json\/wp\/v2\/media?parent=46812"}],"wp:term":[{"taxonomy":"category","embeddable":true,"href":"https:\/\/www.silicloud.com\/zh\/blog\/wp-json\/wp\/v2\/categories?post=46812"},{"taxonomy":"post_tag","embeddable":true,"href":"https:\/\/www.silicloud.com\/zh\/blog\/wp-json\/wp\/v2\/tags?post=46812"}],"curies":[{"name":"wp","href":"https:\/\/api.w.org\/{rel}","templated":true}]}}