{"id":12661,"date":"2024-04-16T15:19:20","date_gmt":"2024-04-16T07:19:20","guid":{"rendered":"https:\/\/nj.transwarp.cn:8180\/?p=12661"},"modified":"2024-04-16T15:28:11","modified_gmt":"2024-04-16T07:28:11","slug":"sqoop%e5%a4%84%e7%90%86clob%e5%8c%85%e5%90%ab%e6%8d%a2%e8%a1%8c%e7%ac%a6%e7%9a%84%e6%83%85%e5%86%b5","status":"publish","type":"post","link":"https:\/\/kbwp.transwarp.cn\/?p=12661","title":{"rendered":"sqoop\u5904\u7406clob\u5305\u542b\u6362\u884c\u7b26\u7684\u60c5\u51b5"},"content":{"rendered":"<h3>\u6982\u8981\u63cf\u8ff0<\/h3>\n<hr \/>\n<p>CLOB\u5b57\u6bb5\u4eceOracle\u5bfc\u5165\u5230inceptor\u65f6\uff0c\u5982\u679cCLOB\u4e2d\u6709\u6362\u884c\u7b26\uff0c\u5728\u5bfc\u5165hdfs\u7684\u65f6\u5019\uff0c\u6570\u636e\u6587\u4ef6\u6761\u6570\u4f1a\u5bf9\u4e0d\u4e0a\uff0c\u8fd9\u91cc\u63d0\u4f9bdemo\u53ca\u89e3\u51b3\u65b9\u6848\u3002<\/p>\n<h3>\u8be6\u7ec6\u8bf4\u660e<\/h3>\n<hr \/>\n<h4>1. \u521b\u5efaoracle\u539f\u8868\uff0cclob\u5217\u5305\u542b\u6362\u884c\u7b26<\/h4>\n<pre><code class=\"language-sql\">--\u521b\u5efa\u8868\nDROP TABLE tmp_clob;\nCREATE TABLE tmp_clob (name VARCHAR2(200),age NUMBER, c_clob CLOB);\n\n--\u63d2\u5165\u5305\u542b\u6362\u884c\u7b26\u7684\u6570\u636e\nDECLARE\n  my_clob CLOB;\nBEGIN\n  DBMS_LOB.CREATETEMPORARY(my_clob, TRUE);\n  DBMS_LOB.WRITE(my_clob, 12801, 1, RPAD('111111' || CHR(10), 12801, '1'));\n  INSERT INTO tmp_clob (name,age,c_clob) VALUES ('zhangsan',18,my_clob);\n  COMMIT;\nEND;\n\nSELECT CASE WHEN INSTR(c_clob, CHR(10)) > 0 THEN 'EXISTS' ELSE 'NOT EXISTS' END AS newline_check from tmp_clob;  --EXISTS<\/code><\/pre>\n<h4>2. 
\u4f7f\u7528TDH-Client\u5ba2\u6237\u7aef\u96c6\u6210\u7684sqoop\u547d\u4ee4\u5c06oracle\u6570\u636e\u5bfc\u5165\u5230hdfs\u8def\u5f84\u4e0b<\/h4>\n<pre><code class=\"language-shell\">sqoop import \\\n--connect jdbc:oracle:thin:@172.22.23.9:1521\/helowin \\\n--username lkw \\\n--password 123456  \\\n--table lkw.tmp_clob  \\\n--columns \"name,age,c_clob\" \\\n--split-by age -m 4 \\\n--target-dir \/tmp\/dst_clob10 \\\n--fields-terminated-by \"\\\\01\" \\\n--hive-drop-import-delims \\\n--null-string '\\\\N' \\\n--null-non-string '\\\\N'<\/code><\/pre>\n<p><strong>\u4eceHDFS\u8def\u5f84\u4e2d\u67e5\u770b\u5bfc\u5165\u7684\u6587\u4ef6\uff0c\u53ef\u4ee5\u770b\u5230\u67092\u6761\u6570\u636e<\/strong><\/p>\n<pre><code class=\"language-shell\">[root@kv1~]# hdfs dfs -ls \/tmp\/dst_clob10\n2024-04-16 14:56:50,742 INFO util.KerberosUtil: Using principal pattern: HTTP\/_HOST\nFound 2 items\n-rw-r--r--   3 hdfs hadoop          0 2024-04-16 14:55 \/tmp\/dst_clob10\/_SUCCESS\n-rw-r--r--   3 hdfs hadoop      12814 2024-04-16 14:55 \/tmp\/dst_clob10\/part-m-00000\n\n[root@kv1~]# hdfs dfs -cat \/tmp\/dst_clob10\/part-m-00000 | wc -l \n2024-04-16 15:15:54,513 INFO util.KerberosUtil: Using principal pattern: HTTP\/_HOST\n2<\/code><\/pre>\n<p><strong>\u8fd9\u91cc\u5982\u679c\u901a\u8fc7\u521b\u5efainceptor\u5916\u8868\u7684\u65b9\u5f0f\u80fd\u770b\u5230\u6570\u636e\u6362\u884c<\/strong><\/p>\n<pre><code class=\"language-sql\">DROP TABLE IF EXISTS test_clob01;\nCREATE EXTERNAL TABLE test_clob01\n(NAME STRING ,AGE INT,C_CLOB BINARY)\nROW FORMAT DELIMITED FIELDS TERMINATED BY '\\001'\nLOCATION '\/tmp\/dst_clob10\/';<\/code><\/pre>\n<h3>\u89e3\u51b3\u65b9\u6848<\/h3>\n<hr \/>\n<pre><code class=\"language-shell\">sqoop import \\\n--connect jdbc:oracle:thin:@172.22.23.9:1521\/helowin \\\n--username lkw \\\n--password 123456  \\\n--table lkw.tmp_clob  \\\n# \u6dfb\u52a0\u5982\u4e0b\u8fd9\u884c\n--map-column-java c_clob=String \\\n--columns \"name,age,c_clob\" \\\n--split-by age -m 4 
\\\n--target-dir \/tmp\/dst_clob12 \\\n--fields-terminated-by \"\\\\01\" \\\n# \uff01\uff01\uff01\u6ce8\u610f\uff1a\u8fd9\u91cc\u5fc5\u987b\u8981\u628a<code>--hive-drop-import-delims<\/code>\u5199\u4e0a\u53bb\n--hive-drop-import-delims \\\n--null-string '\\\\N' \\\n--null-non-string '\\\\N'<\/code><\/pre>\n<pre><code class=\"language-shell\">[root@kv1~]# hdfs dfs -ls \/tmp\/dst_clob12\/\n2024-04-16 15:15:45,446 INFO util.KerberosUtil: Using principal pattern: HTTP\/_HOST\nFound 2 items\n-rw-r--r--   3 hdfs hadoop          0 2024-04-16 15:15 \/tmp\/dst_clob12\/_SUCCESS\n-rw-r--r--   3 hdfs hadoop      12813 2024-04-16 15:15 \/tmp\/dst_clob12\/part-m-00000\n[root@kv1~]# hdfs dfs -cat \/tmp\/dst_clob12\/part-m-00000 | wc -l \n2024-04-16 15:15:54,513 INFO util.KerberosUtil: Using principal pattern: HTTP\/_HOST\n1<\/code><\/pre>\n<p><strong>Sqoop import\u53c2\u6570\u9009\u9879 <code>--hive-drop-import-delims<\/code> \u5bf9CLOB\u4e2d\u6362\u884c\u7b26\u662f\u6ca1\u6709\u6548\u679c\u7684\uff0c\u9700\u8981\u663e\u5f0f\u6dfb\u52a0<code>--map-column-java CLOB\u5217\u540d=String<\/code>\uff0c\u8fd9\u6837<code>--hive-drop-import-delims<\/code>\u624d\u80fd\u53bb\u9664CLOB\u4e2d\u7684\u6362\u884c\u7b26\u3002<\/strong><\/p>\n","protected":false},"excerpt":{"rendered":"<p>\u6982\u8981\u63cf\u8ff0 CLOB\u5b57\u6bb5\u4eceOracle\u5bfc\u5165\u5230inceptor\u65f6\uff0c\u5982\u679cCLOB\u4e2d\u6709\u6362\u884c\u7b26\uff0c\u5728\u5bfc\u5165hdfs\u7684\u65f6\u5019\uff0c ..<\/p>\n<div class=\"clear-fix\"><\/div>\n<p><a href=\"https:\/\/kbwp.transwarp.cn\/?p=12661\" title=\"read more...\">Read 
more<\/a><\/p>\n","protected":false},"author":12,"featured_media":0,"comment_status":"closed","ping_status":"closed","sticky":false,"template":"","format":"standard","meta":{"footnotes":""},"categories":[1],"tags":[],"class_list":["post-12661","post","type-post","status-publish","format-standard","hentry","category-uncategorized"],"acf":[],"_links":{"self":[{"href":"https:\/\/kbwp.transwarp.cn\/index.php?rest_route=\/wp\/v2\/posts\/12661","targetHints":{"allow":["GET"]}}],"collection":[{"href":"https:\/\/kbwp.transwarp.cn\/index.php?rest_route=\/wp\/v2\/posts"}],"about":[{"href":"https:\/\/kbwp.transwarp.cn\/index.php?rest_route=\/wp\/v2\/types\/post"}],"author":[{"embeddable":true,"href":"https:\/\/kbwp.transwarp.cn\/index.php?rest_route=\/wp\/v2\/users\/12"}],"replies":[{"embeddable":true,"href":"https:\/\/kbwp.transwarp.cn\/index.php?rest_route=%2Fwp%2Fv2%2Fcomments&post=12661"}],"version-history":[{"count":3,"href":"https:\/\/kbwp.transwarp.cn\/index.php?rest_route=\/wp\/v2\/posts\/12661\/revisions"}],"predecessor-version":[{"id":12672,"href":"https:\/\/kbwp.transwarp.cn\/index.php?rest_route=\/wp\/v2\/posts\/12661\/revisions\/12672"}],"wp:attachment":[{"href":"https:\/\/kbwp.transwarp.cn\/index.php?rest_route=%2Fwp%2Fv2%2Fmedia&parent=12661"}],"wp:term":[{"taxonomy":"category","embeddable":true,"href":"https:\/\/kbwp.transwarp.cn\/index.php?rest_route=%2Fwp%2Fv2%2Fcategories&post=12661"},{"taxonomy":"post_tag","embeddable":true,"href":"https:\/\/kbwp.transwarp.cn\/index.php?rest_route=%2Fwp%2Fv2%2Ftags&post=12661"}],"curies":[{"name":"wp","href":"https:\/\/api.w.org\/{rel}","templated":true}]}}