<?xml version="1.0" encoding="UTF-8"?>
<rss xmlns:content="http://purl.org/rss/1.0/modules/content/" xmlns:dc="http://purl.org/dc/elements/1.1/" xmlns:rdf="http://www.w3.org/1999/02/22-rdf-syntax-ns#" xmlns:taxo="http://purl.org/rss/1.0/modules/taxonomy/" version="2.0">
  <channel>
    <title>question Re: Sqoop --split-by on a string /varchar column in Support Questions</title>
    <link>https://community.cloudera.com/t5/Support-Questions/Sqoop-split-by-on-a-string-varchar-column/m-p/165530#M127892</link>
    <description>&lt;P&gt;The answer is outdated. It is possible to use a character attribute as the split-by attribute.&lt;/P&gt;&lt;P&gt;You only need to add -Dorg.apache.sqoop.splitter.allow_text_splitter=true&lt;/P&gt;&lt;P&gt;after your 'sqoop job' statement, like this:&lt;/P&gt;&lt;PRE&gt;sqoop job -Dorg.apache.sqoop.splitter.allow_text_splitter=true \
    --create ${JOB_NAME} \
    -- \
    import \
    --connect "${JDBC}" \
    --username ${SOURCE_USR} \
    --password-file ${PWD_FILE_PATH} \&lt;/PRE&gt;&lt;P&gt;There is no guarantee, though, that Sqoop splits your records evenly across your mappers.&lt;/P&gt;</description>
    <pubDate>Thu, 03 Nov 2016 20:10:30 GMT</pubDate>
    <dc:creator>rene_sluiter</dc:creator>
    <dc:date>2016-11-03T20:10:30Z</dc:date>
  </channel>
</rss>

