{"id":1883,"date":"2024-12-20T14:51:00","date_gmt":"2024-12-20T06:51:00","guid":{"rendered":"https:\/\/aws-oncloudai.com\/?p=1883"},"modified":"2025-05-07T16:11:14","modified_gmt":"2025-05-07T08:11:14","slug":"learn-more-aws-glue-a-key-tool-for-modern-data-integration","status":"publish","type":"post","link":"https:\/\/aws-oncloudai.com\/zh_hk\/learn-more-aws-glue-a-key-tool-for-modern-data-integration\/","title":{"rendered":"\u6df1\u5165\u4e86\u89e3AWS Glue\uff1a\u73fe\u4ee3\u8cc7\u6599\u6574\u5408\u7684\u95dc\u9375\u5de5\u5177"},"content":{"rendered":"<p class=\"\" data-start=\"330\" data-end=\"579\">\u5728\u6578\u64da\u7206\u70b8\u6027\u6210\u9577\u7684\u4eca\u5929\uff0c\u4f01\u696d\u6b63\u4e0d\u65b7\u61c9\u5c0d\u5982\u4f55\u6574\u5408\u3001\u8655\u7406\u548c\u5206\u6790\u4f86\u81ea\u591a\u7a2e <strong data-start=\"364\" data-end=\"380\">data sources<\/strong> \u7684\u6d77\u91cf\u6578\u64da\u3002<strong data-start=\"387\" data-end=\"399\">AWS Glue<\/strong>\uff0c\u4f5c\u70ba <strong data-start=\"403\" data-end=\"426\">Amazon Web Services<\/strong>\uff08AWS\uff09\u63a8\u51fa\u7684\u4e00\u9805\u8a17\u7ba1\u5f0f <strong data-start=\"440\" data-end=\"448\">\u6578\u64da\u96c6\u6210<\/strong> \u670d\u52d9\uff0c\u6b63\u9010\u6f38\u6210\u70ba\u5efa\u69cb\u73fe\u4ee3 <strong data-start=\"462\" data-end=\"479\">data pipeline<\/strong> \u8207 <strong data-start=\"482\" data-end=\"496\">data lakes<\/strong> \u7684\u6838\u5fc3\u5de5\u5177\u3002\u5b83\u7c21\u5316\u4e86 <strong data-start=\"508\" data-end=\"522\">\u8cc7\u6599\u6e96\u5099\u3001\u8f49\u63db\u548c\u8f09\u5165<\/strong>\uff08ETL pipeline\uff09\u7684\u5168\u7a0b\uff0c\u5e6b\u52a9\u4f7f\u7528\u8005\u66f4\u5feb\u7372\u53d6 <strong data-start=\"550\" data-end=\"572\">data for analytics<\/strong> \u548c\u696d\u52d9\u6d1e\u5bdf\u3002<\/p>\n<p class=\"\" data-start=\"581\" data-end=\"638\">\u672c\u6587\u5c07\u5e36\u60a8\u6df1\u5165\u4e86\u89e3 <strong data-start=\"591\" data-end=\"603\">AWS Glue<\/strong> 
\u7684\u6838\u5fc3\u529f\u80fd\u3001\u5178\u578b\u4f7f\u7528\u60c5\u5883\u4ee5\u53ca\u5176\u5728\u81ea\u52d5\u5316\u8cc7\u6599\u8655\u7406\u548c\u6574\u5408\u65b9\u9762\u7684\u5353\u8d8a\u8868\u73fe\u3002<\/p>\n<p><img fetchpriority=\"high\" decoding=\"async\" class=\"aligncenter wp-image-1903 size-large\" src=\"http:\/\/aws-oncloudai.com\/wp-content\/uploads\/2024\/12\/\u514d\u8cbb-\u4e8c\u9032\u4f4d-\u4ee3\u78bc-\u50cf\u7d20-\u7684-\u514d\u8cbb\u7d20\u6750\u5716\u7247-\u7d20\u6750\u5716\u7247-1024x683.jpg\" alt=\"\" width=\"800\" height=\"534\" srcset=\"\" sizes=\"(max-width: 800px) 100vw, 800px\" data-srcset=\"\" \/><\/p>\n<p>&nbsp;<\/p>\n<h4>\u4ec0\u9ebc\u662fAWS Glue\uff1f<\/h4>\n<p class=\"\" data-start=\"363\" data-end=\"576\"><strong data-start=\"363\" data-end=\"375\">AWS Glue<\/strong> \u662f\u4e00\u9805\u7121\u4f3a\u670d\u5668\u3001\u5168\u8a17\u7ba1\u7684\u8cc7\u6599\u6574\u5408\u670d\u52d9\uff0c\u81f4\u529b\u65bc\u5e6b\u52a9\u4f7f\u7528\u8005\u8f15\u9b06 <strong data-start=\"405\" data-end=\"413\">\u6574\u5408\u6578\u64da<\/strong> \u4e26\u5c07\u5176\u7528\u65bc\u5206\u6790\u3001\u6a5f\u5668\u5b78\u7fd2\u6216\u61c9\u7528\u958b\u767c\u3002\u900f\u904e\u81ea\u52d5\u767c\u73fe\u8cc7\u6599\u7d50\u69cb\u3001<strong data-start=\"443\" data-end=\"458\">\u81ea\u52d5\u7522\u751fETL \u4f5c\u696d<\/strong> \u548c\u904b\u884c\u4f5c\u696d\uff0cGlue \u80fd\u5c07\u539f\u59cb\u8cc7\u6599\u5f9e\u591a\u7a2e <strong data-start=\"480\" data-end=\"487\">\u8cc7\u6599\u4f86\u6e90<\/strong> \u4e2d\u63d0\u53d6\u3001\u8f49\u63db\u70ba\u76ee\u6a19\u683c\u5f0f\uff0c\u4e26\u8f09\u5165\u5230 <strong data-start=\"505\" data-end=\"518\">Amazon S3<\/strong>\u3001<strong data-start=\"519\" data-end=\"533\">Amazon RDS<\/strong>\u3001<strong data-start=\"534\" data-end=\"562\">Amazon Redshift Spectrum<\/strong> \u7b49 <strong data-start=\"565\" data-end=\"573\">\u8cc7\u6599\u5132\u5b58<\/strong> \u4e2d\u3002<\/p>\n<p class=\"\" data-start=\"578\" 
data-end=\"642\">\u5176\u6700\u5927\u512a\u52e2\u5728\u65bc <strong data-start=\"586\" data-end=\"594\">\u7a0b\u5f0f\u78bc\u751f\u6210<\/strong> \u81ea\u52d5\u5316\u548c\u7121\u4f3a\u670d\u5668\u67b6\u69cb\uff0c\u4f7f\u7528\u8005\u7121\u9700\u7ba1\u7406\u5e95\u5c64\u8cc7\u6e90\uff0c\u5373\u53ef\u9ad8\u6548\u8a2d\u8a08\u548c\u904b\u884c\u5b8c\u6574\u7684 <strong data-start=\"630\" data-end=\"641\">ETL \u5de5\u4f5c\u6d41\u7a0b<\/strong>\u3002<\/p>\n<p>&nbsp;<\/p>\n<h4>\u00a0AWS Glue \u7684\u6838\u5fc3\u529f\u80fd<\/h4>\n<h5 data-start=\"668\" data-end=\"703\">1. Glue \u8cc7\u6599\u76ee\u9304\uff08Glue Data Catalog\uff09<\/h5>\n<p class=\"\" data-start=\"705\" data-end=\"878\">Glue \u63d0\u4f9b\u4e86\u4e00\u500b\u53ef\u64f4\u5c55\u7684 <strong data-start=\"720\" data-end=\"733\">Glue \u8cc7\u6599\u76ee\u9304<\/strong>\uff0c\u652f\u63f4\u81ea\u52d5\u722c\u53d6\u4e26\u5206\u985e\u8cc7\u6599\u3002\u5b83\u8a18\u9304\u4e86\u5143\u8cc7\u6599\uff08metadata\uff09\uff0c\u5305\u62ec\u8868\u7d50\u69cb\u3001\u5206\u5340\u53ca\u4f4d\u7f6e\uff0c\u53ef\u8207 <strong data-start=\"779\" data-end=\"804\">Apache Hive Metastore<\/strong> \u517c\u5bb9\uff0c\u4e26\u7121\u7e2b\u96c6\u6210\u5230 <strong data-start=\"815\" data-end=\"832\">Amazon Athena<\/strong>\u3001<strong data-start=\"833\" data-end=\"852\">Amazon Redshift<\/strong> \u4e2d\uff0c\u4fbf\u65bc\u5feb\u901f\u67e5\u8a62\u548c\u8a2a\u554f <strong data-start=\"865\" data-end=\"872\">\u8cc7\u6599\u6e56<\/strong> \u4e2d\u7684\u5167\u5bb9\u3002<\/p>\n<h5 data-start=\"880\" data-end=\"910\">2. 
\u81ea\u52d5\u7a0b\u5f0f\u78bc\u7522\u751f\uff08Code Generation\uff09<\/h5>\n<p class=\"\" data-start=\"912\" data-end=\"1007\">Glue \u6703\u6839\u64da\u8cc7\u6599\u4f86\u6e90\u548c\u76ee\u6a19\u81ea\u52d5\u751f\u6210 <strong data-start=\"931\" data-end=\"958\">Python \u6216Scala \u7684ETL \u8173\u672c<\/strong>\u3002\u9019\u7a2e <strong data-start=\"962\" data-end=\"970\">\u81ea\u52d5\u751f\u6210<\/strong> \u7684\u80fd\u529b\u986f\u8457\u63d0\u9ad8\u958b\u767c\u6548\u7387\uff0c\u5c24\u5176\u9069\u7528\u65bc\u5feb\u901f\u5efa\u7f6e\u548c\u90e8\u7f72 <strong data-start=\"996\" data-end=\"1006\">ETL \u7ba1\u9053<\/strong>\u3002<\/p>\n<h5 data-start=\"1009\" data-end=\"1034\">3. \u7121\u4f3a\u670d\u5668\u67b6\u69cb\uff08Serverless\uff09<\/h5>\n<p class=\"\" data-start=\"1036\" data-end=\"1100\">AWS Glue \u662f\u7121\u4f3a\u670d\u5668\u670d\u52d9\uff0c\u4e0d\u9700\u8981\u8a2d\u5b9a\u53e2\u96c6\u6216\u904b\u7b97\u8cc7\u6e90\u3002\u7cfb\u7d71\u6703\u6839\u64da\u4f5c\u696d\u898f\u6a21\u81ea\u52d5\u64f4\u5c55\u8cc7\u6e90\uff0c\u4e26\u6309\u79d2\u8a08\u8cbb\uff0c\u5e6b\u52a9\u4f7f\u7528\u8005\u512a\u5316\u8cc7\u6e90\u548c\u6210\u672c\u3002<\/p>\n<h5 data-start=\"1102\" data-end=\"1117\">4. \u591a\u7a2e\u8cc7\u6599\u683c\u5f0f\u652f\u6301<\/h5>\n<p class=\"\" data-start=\"1119\" data-end=\"1188\">Glue \u80fd\u8655\u7406\u5305\u62ecJSON\u3001CSV\u3001Avro\u3001Parquet\u3001ORC \u7b49\u5728\u5167\u7684\u7d50\u69cb\u5316\u8207\u534a\u7d50\u69cb\u5316\u6578\u64da\uff0c\u6eff\u8db3\u5404\u7a2e <strong data-start=\"1176\" data-end=\"1184\">\u8cc7\u6599\u8655\u7406<\/strong> \u9700\u6c42\u3002<\/p>\n<h5 data-start=\"1190\" data-end=\"1215\">5. 
Glue Studio\uff08\u8996\u89ba\u5316\u958b\u767c\uff09<\/h5>\n<p class=\"\" data-start=\"1217\" data-end=\"1302\"><strong data-start=\"1217\" data-end=\"1232\">Glue Studio<\/strong> \u662f\u9762\u5411\u958b\u767c\u8005\u7684\u5716\u5f62\u5316\u5de5\u5177\uff0c\u5141\u8a31\u4f7f\u7528\u8005\u900f\u904e\u62d6\u66f3\u5143\u4ef6\u4f86\u5efa\u69cb\u3001\u8abf\u8a66\u548c\u7ba1\u7406\u8907\u96dc\u7684 <strong data-start=\"1268\" data-end=\"1279\">ETL \u5de5\u4f5c\u6d41\u7a0b<\/strong>\u3002\u5373\u4f7f\u6c92\u6709\u7a0b\u5f0f\u8a2d\u8a08\u7d93\u9a57\uff0c\u4e5f\u80fd\u8f15\u9b06\u8a2d\u8a08\u8cc7\u6599\u6574\u5408\u4efb\u52d9\u3002<\/p>\n<h5 data-start=\"1304\" data-end=\"1334\">6. Glue DataBrew\uff1a\u7121\u9700\u7a0b\u5f0f\u78bc\u7684\u8cc7\u6599\u6e96\u5099<\/h5>\n<p class=\"\" data-start=\"1336\" data-end=\"1431\"><strong data-start=\"1336\" data-end=\"1353\">Glue DataBrew<\/strong> \u662fAWS Glue \u7684\u4e00\u90e8\u5206\uff0c\u5b83\u70ba\u975e\u6280\u8853\u7528\u6236\u63d0\u4f9b\u4e86\u4e00\u500b\u5716\u5f62\u5316\u4ecb\u9762\uff0c\u652f\u63f4\u8d85\u904e250 \u7a2e <strong data-start=\"1399\" data-end=\"1407\">\u8cc7\u6599\u8f49\u63db<\/strong> \u64cd\u4f5c\uff0c\u9069\u5408\u7528\u65bc <strong data-start=\"1416\" data-end=\"1430\">\u81ea\u52d5\u5316\u8cc7\u6599\u6e96\u5099\u7684\u8f49\u63db<\/strong>\u3002<\/p>\n<h5 data-start=\"1433\" data-end=\"1460\">7. 
\u5373\u6642\u4e32\u6d41\u8655\u7406\uff08Streaming ETL\uff09<\/h5>\n<p class=\"\" data-start=\"1462\" data-end=\"1554\">Glue \u652f\u63f4\u5373\u6642 <strong data-start=\"1472\" data-end=\"1480\">\u8cc7\u6599\u8655\u7406<\/strong>\uff0c\u53ef\u5f9e <strong data-start=\"1484\" data-end=\"1502\">Amazon Kinesis<\/strong> \u6216 <strong data-start=\"1505\" data-end=\"1521\">Apache Kafka<\/strong> \u7b49\u6d41\u670d\u52d9\u4e2d\u63a5\u6536\u8cc7\u6599\u4e26\u9032\u884c\u8f49\u63db\u8207\u5b58\u5132\uff0c\u6eff\u8db3\u5c0d\u4f4e\u5ef6\u9072\u8cc7\u6599\u5206\u6790\u7684\u9700\u6c42\u3002<\/p>\n<h5 data-start=\"1556\" data-end=\"1573\">8. \u81ea\u52d5\u5316\u8abf\u5ea6\u8207\u4f9d\u8cf4\u7ba1\u7406<\/h5>\n<p class=\"\" data-start=\"1575\" data-end=\"1635\">Glue \u5167\u5efa\u7684\u4efb\u52d9\u8abf\u5ea6\u5668\u652f\u63f4\u5b9a\u6642\u6216\u4e8b\u4ef6\u89f8\u767c\uff0c\u4e26\u53ef\u8a2d\u5b9a\u4efb\u52d9\u4f9d\u8cf4\u95dc\u4fc2\uff0c\u81ea\u52d5\u5efa\u7f6e\u548c\u57f7\u884c\u8907\u96dc\u7684 <strong data-start=\"1620\" data-end=\"1630\">ETL \u4f5c\u696d<\/strong> \u5de5\u4f5c\u6d41\u7a0b\u3002<\/p>\n<p>&nbsp;<\/p>\n<h4>AWS Glue \u7684\u95dc\u9375\u512a\u52e2<\/h4>\n<h5 data-start=\"1661\" data-end=\"1676\">1. \u7121\u9700\u7ba1\u7406\u57fa\u790e\u8a2d\u65bd<\/h5>\n<p class=\"\" data-start=\"1678\" data-end=\"1724\">Glue \u7684\u7121\u4f3a\u670d\u5668\u7279\u6027\u8b93\u4f7f\u7528\u8005\u7121\u9700\u914d\u7f6e\u4f3a\u670d\u5668\u6216\u7ba1\u7406\u96c6\u7fa4\uff0c\u5b8c\u5168\u7531AWS \u8ca0\u8cac\u8cc7\u6e90\u8abf\u5ea6\u8207\u7dad\u8b77\u3002<\/p>\n<h5 data-start=\"1726\" data-end=\"1742\">2. 
\u964d\u4f4e\u958b\u767c\u8207\u7dad\u904b\u6210\u672c<\/h5>\n<p class=\"\" data-start=\"1744\" data-end=\"1817\">\u900f\u904e <strong data-start=\"1747\" data-end=\"1755\">\u7a0b\u5f0f\u78bc\u751f\u6210<\/strong>\u3001Glue Studio \u548cGlue DataBrew\uff0c\u958b\u767c\u4eba\u54e1\u53ef\u4ee5\u5728\u6700\u77ed\u6642\u9593\u5167\u5b8c\u6210\u8907\u96dc\u7684\u8cc7\u6599\u6574\u5408\u5de5\u4f5c\uff0c\u986f\u8457\u964d\u4f4e\u4eba\u529b\u6210\u672c\u3002<\/p>\n<h5 data-start=\"1819\" data-end=\"1838\">3. \u8207AWS \u670d\u52d9\u6df1\u5ea6\u6574\u5408<\/h5>\n<p class=\"\" data-start=\"1840\" data-end=\"1961\">Glue \u8207 <strong data-start=\"1847\" data-end=\"1860\">Amazon S3<\/strong>\u3001<strong data-start=\"1861\" data-end=\"1889\">Amazon Redshift Spectrum<\/strong>\u3001<strong data-start=\"1890\" data-end=\"1900\">Athena<\/strong>\u3001<strong data-start=\"1901\" data-end=\"1908\">RDS<\/strong> \u7b49 <strong data-start=\"1911\" data-end=\"1934\">Amazon Web Services<\/strong> \u7dca\u5bc6\u6574\u5408\uff0c\u5efa\u7acb\u5b8c\u6574\u7684\u7aef\u5230\u7aef\u8cc7\u6599\u89e3\u6c7a\u65b9\u6848\u8b8a\u5f97\u66f4\u52a0\u5bb9\u6613\u3002<\/p>\n<h5 data-start=\"1963\" data-end=\"1977\">4. \u5f48\u6027\u8207\u53ef\u64f4\u5c55\u6027<\/h5>\n<p class=\"\" data-start=\"1979\" data-end=\"2018\">Glue \u80fd\u81ea\u52d5\u64f4\u5c55\u8655\u7406\u8cc7\u6e90\uff0c\u9069\u914d\u5f9e\u5c0f\u898f\u6a21\u8655\u7406\u4efb\u52d9\u5230PB \u7b49\u7d1a\u7684\u5927\u6578\u64da\u9700\u6c42\u3002<\/p>\n<h5 data-start=\"2020\" data-end=\"2033\">5. 
\u5373\u6642\u8655\u7406\u80fd\u529b<\/h5>\n<p class=\"\" data-start=\"2035\" data-end=\"2102\">\u900f\u904e <strong data-start=\"2038\" data-end=\"2055\">Streaming ETL<\/strong>\uff0cAWS Glue \u53ef\u5be6\u73fe\u8fd1\u5be6\u6642\u7684\u8cc7\u6599\u651d\u53d6\u8207\u8655\u7406\uff0c\u9069\u7528\u65bc\u8cc7\u6599\u76e3\u63a7\u3001\u65e5\u8a8c\u5206\u6790\u3001\u5373\u6642\u5100\u9336\u677f\u7b49\u60c5\u5883\u3002<\/p>\n<p>&nbsp;<\/p>\n<h4>\u4f7f\u7528\u5834\u666f<\/h4>\n<ul data-start=\"2118\" data-end=\"2417\">\n<li class=\"\" data-start=\"2118\" data-end=\"2172\">\n<p class=\"\" data-start=\"2120\" data-end=\"2172\"><strong data-start=\"2120\" data-end=\"2132\">\u8cc7\u6599\u6e56\u7ba1\u7406\u8207\u69cb\u5efa<\/strong>\uff1a\u81ea\u52d5\u767c\u73fe\u4e26\u8a3b\u518a <strong data-start=\"2141\" data-end=\"2154\">Amazon S3<\/strong> \u4e2d\u7684\u6578\u64da\uff0c\u5feb\u901f\u5efa\u7acb\u53ef\u67e5\u8a62\u7684\u6578\u64da\u6e56\u3002<\/p>\n<\/li>\n<li class=\"\" data-start=\"2173\" data-end=\"2241\">\n<p class=\"\" data-start=\"2175\" data-end=\"2241\"><strong data-start=\"2175\" data-end=\"2186\">\u81ea\u52d5\u5316\u6578\u64da\u7ba1\u9053<\/strong>\uff1a\u5efa\u69cb\u7aef\u5230\u7aef\u7684 <strong data-start=\"2194\" data-end=\"2204\">ETL \u7ba1\u9053<\/strong>\uff0c\u5c07\u4f86\u81ea\u591a\u7cfb\u7d71\u7684\u6578\u64da\u6574\u5408\u81f3\u7d71\u4e00\u5206\u6790\u5e73\u53f0\u5982Amazon Redshift\u3002<\/p>\n<\/li>\n<li class=\"\" data-start=\"2242\" data-end=\"2287\">\n<p class=\"\" data-start=\"2244\" data-end=\"2287\"><strong data-start=\"2244\" data-end=\"2255\">\u8cc7\u6599\u9077\u79fb\u8207\u6574\u5408<\/strong>\uff1a\u5c07\u672c\u6a5f\u8cc7\u6599\u5eab\u6216\u7b2c\u4e09\u65b9\u8cc7\u6599\u5e73\u53f0\u4e2d\u7684\u8cc7\u6599\u9077\u79fb\u4e26\u683c\u5f0f\u5316\u5f8c\u8f09\u5165\u5230\u96f2\u7aef\u3002<\/p>\n<\/li>\n<li class=\"\" data-start=\"2288\" data-end=\"2341\">\n<p class=\"\" data-start=\"2290\" data-end=\"2341\"><strong data-start=\"2290\" 
data-end=\"2300\">\u5373\u6642\u6578\u64da\u8655\u7406<\/strong>\uff1a\u501f\u52a9 <strong data-start=\"2304\" data-end=\"2321\">Streaming ETL<\/strong> \u529f\u80fd\uff0c\u5373\u6642\u6536\u96c6\u4e26\u8655\u7406\u65e5\u8a8c\u6216\u611f\u6e2c\u5668\u8cc7\u6599\u3002<\/p>\n<\/li>\n<li class=\"\" data-start=\"2342\" data-end=\"2417\">\n<p class=\"\" data-start=\"2344\" data-end=\"2417\"><strong data-start=\"2344\" data-end=\"2356\">\u6a5f\u5668\u5b78\u7fd2\u8cc7\u6599\u6e96\u5099<\/strong>\uff1a\u4f7f\u7528Glue DataBrew \u9032\u884c <strong data-start=\"2377\" data-end=\"2398\">\u8cc7\u6599\u6e05\u6d17\u3001\u7f3a\u5931\u503c\u586b\u5145\u3001\u53bb\u91cd\u3001\u6a19\u6e96\u5316<\/strong> \u7b49\u64cd\u4f5c\uff0c\u52a0\u901f\u6a5f\u5668\u5b78\u7fd2\u6a21\u578b\u7684\u958b\u767c\u6d41\u7a0b\u3002<\/p>\n<\/li>\n<\/ul>\n<p>&nbsp;<\/p>\n<h4>\u5b9a\u50f9\u6a21\u578b<\/h4>\n<p class=\"\" data-start=\"2433\" data-end=\"2452\">AWS Glue \u7684\u8a08\u8cbb\u6a5f\u5236\u4e3b\u8981\u5305\u62ec\uff1a<\/p>\n<ul data-start=\"2454\" data-end=\"2567\">\n<li class=\"\" data-start=\"2454\" data-end=\"2481\">\n<p class=\"\" data-start=\"2456\" data-end=\"2481\"><strong data-start=\"2456\" data-end=\"2466\">\u4f5c\u696d\u57f7\u884c\u6642\u9593<\/strong>\uff1a\u6309\u79d2\u8a08\u8cbb\uff0c\u6700\u4f4e1 \u5206\u9418\u8d77\uff1b<\/p>\n<\/li>\n<li class=\"\" data-start=\"2482\" data-end=\"2521\">\n<p class=\"\" data-start=\"2484\" data-end=\"2521\"><strong data-start=\"2484\" data-end=\"2494\">\u8cc7\u6599\u76ee\u9304\u5b58\u5132<\/strong>\uff1a\u6309 <strong data-start=\"2497\" data-end=\"2510\">Glue \u8cc7\u6599\u76ee\u9304<\/strong> \u4e2d\u5143\u8cc7\u6599\u689d\u76ee\u6578\u8a08\u8cbb\uff1b<\/p>\n<\/li>\n<li class=\"\" data-start=\"2522\" data-end=\"2567\">\n<p class=\"\" data-start=\"2524\" data-end=\"2567\"><strong data-start=\"2524\" data-end=\"2534\">\u6d41\u8655\u7406\u8cc7\u6599\u91cf<\/strong>\uff1a\u5728Streaming ETL 
\u4f5c\u696d\u4e2d\u8655\u7406\u7684\u8cc7\u6599\u6703\u7522\u751f\u984d\u5916\u8cbb\u7528\u3002<\/p>\n<\/li>\n<\/ul>\n<p class=\"\" data-start=\"2569\" data-end=\"2610\">Glue \u7684\u5f48\u6027\u5b9a\u50f9\u6a21\u5f0f\u8b93\u4f7f\u7528\u8005\u53ef\u4ee5\u6309\u9700\u64f4\u5c55\uff0c\u800c\u7121\u9700\u9810\u4ed8\u6216\u9810\u7559\u8cc7\u6e90\uff0c\u4fbf\u65bc\u6210\u672c\u63a7\u5236\u3002<\/p>\n<p>&nbsp;<\/p>\n<p><img decoding=\"async\" class=\"size-large wp-image-1490 aligncenter\" src=\"http:\/\/aws-oncloudai.com\/wp-content\/uploads\/2024\/12\/\u514d\u8d39-\u4ed8\u6b3e-\u4ed9-\u503c-\u7684-\u514d\u8d39\u7d20\u6750\u56fe\u7247-\u7d20\u6750\u56fe\u7247-1024x678.jpg\" alt=\"\" width=\"800\" height=\"530\" srcset=\"https:\/\/aws-oncloudai.com\/wp-content\/uploads\/2024\/12\/\u514d\u8d39-\u4ed8\u6b3e-\u4ed9-\u503c-\u7684-\u514d\u8d39\u7d20\u6750\u56fe\u7247-\u7d20\u6750\u56fe\u7247-1024x678.jpg 1024w, https:\/\/aws-oncloudai.com\/wp-content\/uploads\/2024\/12\/\u514d\u8d39-\u4ed8\u6b3e-\u4ed9-\u503c-\u7684-\u514d\u8d39\u7d20\u6750\u56fe\u7247-\u7d20\u6750\u56fe\u7247-300x199.jpg 300w, https:\/\/aws-oncloudai.com\/wp-content\/uploads\/2024\/12\/\u514d\u8d39-\u4ed8\u6b3e-\u4ed9-\u503c-\u7684-\u514d\u8d39\u7d20\u6750\u56fe\u7247-\u7d20\u6750\u56fe\u7247-768x509.jpg 768w, https:\/\/aws-oncloudai.com\/wp-content\/uploads\/2024\/12\/\u514d\u8d39-\u4ed8\u6b3e-\u4ed9-\u503c-\u7684-\u514d\u8d39\u7d20\u6750\u56fe\u7247-\u7d20\u6750\u56fe\u7247-1536x1017.jpg 1536w, https:\/\/aws-oncloudai.com\/wp-content\/uploads\/2024\/12\/\u514d\u8d39-\u4ed8\u6b3e-\u4ed9-\u503c-\u7684-\u514d\u8d39\u7d20\u6750\u56fe\u7247-\u7d20\u6750\u56fe\u7247-2048x1356.jpg 2048w\" sizes=\"(max-width: 800px) 100vw, 800px\" \/><\/p>\n<p>&nbsp;<\/p>\n<h4>\u5982\u4f55\u5feb\u901f\u958b\u59cb\u4f7f\u7528AWS Glue\uff1f<\/h4>\n<p>\u4ee5\u4e0b\u662f\u4f7f\u7528AWS Glue \u7684\u57fa\u672c\u6b65\u9a5f\uff1a<\/p>\n<ol>\n<li><strong>\u8cc7\u6599\u6e96\u5099<\/strong>\uff1a\u5c07\u8cc7\u6599\u5132\u5b58\u5230Amazon S3 
\u6216\u5176\u4ed6\u652f\u63f4\u7684\u5132\u5b58\u670d\u52d9\u3002<\/li>\n<li><strong>\u5efa\u7acb\u722c\u7db2\u5668<\/strong>\uff1a\u914d\u7f6eGlue \u722c\u7db2\u5668\uff0c\u81ea\u52d5\u767c\u73fe\u8cc7\u6599\u4f86\u6e90\u4e26\u7522\u751f\u8cc7\u6599\u76ee\u9304\u3002<\/li>\n<li><strong>\u5b9a\u7fa9ETL \u4f5c\u696d<\/strong>\uff1a\u900f\u904eGlue Studio \u6216\u76f4\u63a5\u7de8\u8f2f\u7a0b\u5f0f\u78bc\u5b9a\u7fa9ETL \u4f5c\u696d\u3002<\/li>\n<li><strong>\u904b\u884cETL \u4f5c\u696d<\/strong>\uff1a\u555f\u52d5ETL \u4f5c\u696d\uff0c\u5c07\u8cc7\u6599\u63d0\u53d6\u3001\u8f49\u63db\u4e26\u8f09\u5165\u5230\u76ee\u6a19\u5132\u5b58\u4e2d\u3002<\/li>\n<li><strong>\u6574\u5408\u5206\u6790\u5de5\u5177<\/strong>\uff1a\u5229\u7528Amazon Athena\u3001Redshift \u6216\u5176\u4ed6\u5de5\u5177\u5206\u6790\u8655\u7406\u5f8c\u7684\u8cc7\u6599\u3002<\/li>\n<\/ol>\n<p>&nbsp;<\/p>\n<h4>\u7e3d\u7d50<\/h4>\n<p class=\"\" data-start=\"2883\" data-end=\"3010\"><strong data-start=\"2883\" data-end=\"2895\">AWS Glue<\/strong> \u662f\u73fe\u4ee3\u4f01\u696d\u61c9\u5c0d\u8cc7\u6599\u6574\u5408\u6311\u6230\u7684\u5f37\u5927\u5de5\u5177\u3002\u5176 <strong data-start=\"2917\" data-end=\"2934\">serverless \u67b6\u69cb<\/strong>\u3001\u81ea\u52d5\u5316 <strong data-start=\"2939\" data-end=\"2949\">ETL \u4f5c\u696d<\/strong> \u7ba1\u7406\u3001\u8207 <strong data-start=\"2955\" data-end=\"2978\">Amazon Web Services<\/strong> \u5168\u751f\u614b\u7684\u6574\u5408\uff0c\u8b93\u4f01\u696d\u7121\u9700\u6df1\u539a\u958b\u767c\u80cc\u666f\u5373\u53ef\u8f15\u9b06\u5efa\u69cb\u8907\u96dc\u7684\u8cc7\u6599\u6d41\u3002<\/p>\n<p class=\"\" data-start=\"3012\" data-end=\"3113\">\u7121\u8ad6\u662f\u5efa\u7acb\u8cc7\u6599\u6e56\u3001\u5373\u6642\u8cc7\u6599\u8655\u7406\uff0c\u6216\u662f\u9077\u79fb\u8cc7\u6599\u548c\u6e96\u5099\u6a5f\u5668\u5b78\u7fd2\u8a13\u7df4\u6578\u64da\uff0cAWS Glue 
\u90fd\u63d0\u4f9b\u4e86\u9748\u6d3b\u9ad8\u6548\u7684\u89e3\u6c7a\u65b9\u6848\u3002\u5982\u679c\u60a8\u5e0c\u671b\u6253\u9020\u4e00\u500b\u53ef\u64f4\u5c55\u3001\u53ef\u7dad\u8b77\u4e14\u7d93\u6fdf\u7684\u8cc7\u6599\u5e73\u53f0\uff0cAWS Glue \u503c\u5f97\u6df1\u5165\u4e86\u89e3\u8207\u5be6\u8e10\uff01<\/p>","protected":false},"excerpt":{"rendered":"<p>\u5728\u8cc7\u6599\u7206\u70b8\u6027\u6210\u9577\u7684\u4eca\u5929\uff0c\u4f01\u696d\u6b63\u4e0d\u65b7\u61c9\u5c0d\u5982\u4f55\u6574\u5408\u3001\u8655\u7406\u548c\u5206\u6790\u4f86\u81ea\u591a\u7a2edata sources \u7684\u5927\u91cf\u8cc7\u6599\u3002 AWS Glue\uff0c\u4f5c\u70baAmazon Web Services\uff08AWS\uff09\u63a8\u51fa\u7684\u8a17\u7ba1\u5f0f\u8cc7\u6599\u6574\u5408\u670d\u52d9\uff0c\u6b63\u9010\u6f38\u6210\u70ba\u5efa\u7f6e\u73fe\u4ee3data pipeline \u8207data lakes \u7684\u6838\u5fc3\u5de5\u5177\u3002\u5b83\u7c21\u5316\u4e86\u8cc7\u6599\u6e96\u5099\u3001\u8f49\u63db\u548c\u8f09\u5165\uff08ETL pipeline\uff09\u7684\u6574\u500b\u904e\u7a0b\uff0c\u5e6b\u52a9\u4f7f\u7528\u8005\u66f4\u5feb\u53d6\u5f97data for analytics 
\u548c\u696d\u52d9\u6d1e\u5bdf\u3002<\/p>","protected":false},"author":1,"featured_media":1885,"comment_status":"open","ping_status":"open","sticky":false,"template":"","format":"standard","meta":{"footnotes":""},"categories":[65],"tags":[],"class_list":["post-1883","post","type-post","status-publish","format-standard","has-post-thumbnail","hentry","category-technical-sharing"],"_links":{"self":[{"href":"https:\/\/aws-oncloudai.com\/zh_hk\/wp-json\/wp\/v2\/posts\/1883","targetHints":{"allow":["GET"]}}],"collection":[{"href":"https:\/\/aws-oncloudai.com\/zh_hk\/wp-json\/wp\/v2\/posts"}],"about":[{"href":"https:\/\/aws-oncloudai.com\/zh_hk\/wp-json\/wp\/v2\/types\/post"}],"author":[{"embeddable":true,"href":"https:\/\/aws-oncloudai.com\/zh_hk\/wp-json\/wp\/v2\/users\/1"}],"replies":[{"embeddable":true,"href":"https:\/\/aws-oncloudai.com\/zh_hk\/wp-json\/wp\/v2\/comments?post=1883"}],"version-history":[{"count":0,"href":"https:\/\/aws-oncloudai.com\/zh_hk\/wp-json\/wp\/v2\/posts\/1883\/revisions"}],"wp:featuredmedia":[{"embeddable":true,"href":"https:\/\/aws-oncloudai.com\/zh_hk\/wp-json\/wp\/v2\/media\/1885"}],"wp:attachment":[{"href":"https:\/\/aws-oncloudai.com\/zh_hk\/wp-json\/wp\/v2\/media?parent=1883"}],"wp:term":[{"taxonomy":"category","embeddable":true,"href":"https:\/\/aws-oncloudai.com\/zh_hk\/wp-json\/wp\/v2\/categories?post=1883"},{"taxonomy":"post_tag","embeddable":true,"href":"https:\/\/aws-oncloudai.com\/zh_hk\/wp-json\/wp\/v2\/tags?post=1883"}],"curies":[{"name":"wp","href":"https:\/\/api.w.org\/{rel}","templated":true}]}}