<?xml version="1.0" encoding="UTF-8"?>
<rss xmlns:content="http://purl.org/rss/1.0/modules/content/" xmlns:dc="http://purl.org/dc/elements/1.1/" xmlns:rdf="http://www.w3.org/1999/02/22-rdf-syntax-ns#" xmlns:taxo="http://purl.org/rss/1.0/modules/taxonomy/" version="2.0">
  <channel>
    <title>question impala split udf in Archives of Support Questions (Read Only)</title>
    <link>https://community.cloudera.com/t5/Archives-of-Support-Questions/impala-split-udf/m-p/21376#M3608</link>
    <description>&lt;P&gt;I am on CDH 5.2 using Impala 2.0&lt;/P&gt;&lt;P&gt;Does anybody know when the UDTF split function will be available? &amp;nbsp;&lt;/P&gt;&lt;P&gt;&amp;nbsp;&lt;/P&gt;&lt;P&gt;I have an array that is delimited by Pipe that has a max of 6 entries; min of 4&lt;/P&gt;&lt;P&gt;split[0], split[3] would have worked perfectly&lt;/P&gt;&lt;P&gt;&amp;nbsp;&lt;/P&gt;&lt;P&gt;Ideas are welcome on how to work around my challenge&amp;nbsp;&lt;/P&gt;&lt;P&gt;example&amp;nbsp;&lt;/P&gt;&lt;P&gt;aaaaaaaa|bbb|ccc|ddddddddddd|eeeeeeee|ffffff&lt;/P&gt;&lt;P&gt;&amp;nbsp;&lt;/P&gt;&lt;P&gt;a is variable length but always there&lt;/P&gt;&lt;P&gt;b may not be present&lt;/P&gt;&lt;P&gt;c may not be present&lt;/P&gt;&lt;P&gt;d, e and f are always there, with fixed length&lt;/P&gt;&lt;P&gt;&amp;nbsp;&lt;/P&gt;&lt;P&gt;I am thinking of a really convoluted usage of substr&lt;/P&gt;&lt;P&gt;&amp;nbsp;&lt;/P&gt;&lt;P&gt;&amp;nbsp;&lt;/P&gt;</description>
    <pubDate>Fri, 16 Sep 2022 09:12:19 GMT</pubDate>
    <dc:creator>scratch28</dc:creator>
    <dc:date>2022-09-16T09:12:19Z</dc:date>
    <item>
      <title>impala split udf</title>
      <link>https://community.cloudera.com/t5/Archives-of-Support-Questions/impala-split-udf/m-p/21376#M3608</link>
      <description>&lt;P&gt;I am on CDH 5.2 using Impala 2.0&lt;/P&gt;&lt;P&gt;Does anybody know when the UDTF split function will be available? &amp;nbsp;&lt;/P&gt;&lt;P&gt;&amp;nbsp;&lt;/P&gt;&lt;P&gt;I have an array that is delimited by Pipe that has a max of 6 entries; min of 4&lt;/P&gt;&lt;P&gt;split[0], split[3] would have worked perfectly&lt;/P&gt;&lt;P&gt;&amp;nbsp;&lt;/P&gt;&lt;P&gt;Ideas are welcome on how to work around my challenge&amp;nbsp;&lt;/P&gt;&lt;P&gt;example&amp;nbsp;&lt;/P&gt;&lt;P&gt;aaaaaaaa|bbb|ccc|ddddddddddd|eeeeeeee|ffffff&lt;/P&gt;&lt;P&gt;&amp;nbsp;&lt;/P&gt;&lt;P&gt;a is variable length but always there&lt;/P&gt;&lt;P&gt;b may not be present&lt;/P&gt;&lt;P&gt;c may not be present&lt;/P&gt;&lt;P&gt;d, e and f are always there, with fixed length&lt;/P&gt;&lt;P&gt;&amp;nbsp;&lt;/P&gt;&lt;P&gt;I am thinking of a really convoluted usage of substr&lt;/P&gt;&lt;P&gt;&amp;nbsp;&lt;/P&gt;&lt;P&gt;&amp;nbsp;&lt;/P&gt;</description>
      <pubDate>Fri, 16 Sep 2022 09:12:19 GMT</pubDate>
      <guid>https://community.cloudera.com/t5/Archives-of-Support-Questions/impala-split-udf/m-p/21376#M3608</guid>
      <dc:creator>scratch28</dc:creator>
      <dc:date>2022-09-16T09:12:19Z</dc:date>
    </item>
    <item>
      <title>Re: impala split udf</title>
      <link>https://community.cloudera.com/t5/Archives-of-Support-Questions/impala-split-udf/m-p/21586#M3609</link>
      <description>&lt;P class="p1"&gt;&amp;nbsp;&lt;/P&gt;&lt;PRE&gt;&amp;gt; select regexp_extract('aaaaaaaa|bbb|ccc|ddddddddddd|eeeeeeee|ffffff', '([a-z]+)\\|([a-z]+)\\|([a-z]+)\\|([a-z]+)\\|?([a-z]*)\\|?([a-z]*)', 1);
Query: select regexp_extract('aaaaaaaa|bbb|ccc|ddddddddddd|eeeeeeee|ffffff', '([a-z]+)\\|([a-z]+)\\|([a-z]+)\\|([a-z]+)\\|?([a-z]*)\\|?([a-z]*)', 1)
aaaaaaaa
Fetched 1 row(s) in 0.01s
&amp;nbsp;
&amp;gt; select regexp_extract('aaaaaaaa|bbb|ccc|ddddddddddd|eeeeeeee|ffffff', '([a-z]+)\\|([a-z]+)\\|([a-z]+)\\|([a-z]+)\\|?([a-z]*)\\|?([a-z]*)', 3);
Query: select regexp_extract('aaaaaaaa|bbb|ccc|ddddddddddd|eeeeeeee|ffffff', '([a-z]+)\\|([a-z]+)\\|([a-z]+)\\|([a-z]+)\\|?([a-z]*)\\|?([a-z]*)', 3)
ccc
Fetched 1 row(s) in 0.01s
&amp;nbsp;
&amp;gt; select regexp_extract('aaaaaaaa|bbb|ccc|ddddddddddd|eeeeeeee|ffffff', '([a-z]+)\\|([a-z]+)\\|([a-z]+)\\|([a-z]+)\\|?([a-z]*)\\|?([a-z]*)', 6);
Query: select regexp_extract('aaaaaaaa|bbb|ccc|ddddddddddd|eeeeeeee|ffffff', '([a-z]+)\\|([a-z]+)\\|([a-z]+)\\|([a-z]+)\\|?([a-z]*)\\|?([a-z]*)', 6)
ffffff
Fetched 1 row(s) in 0.01s
&amp;nbsp;
&amp;gt; select regexp_extract('aaaaaaaa|ddddddddddd|eeeeeeee|ffffff', '([a-z]+)\\|([a-z]+)\\|([a-z]+)\\|([a-z]+)\\|?([a-z]*)\\|?([a-z]*)', 1);
Query: select regexp_extract('aaaaaaaa|ddddddddddd|eeeeeeee|ffffff', '([a-z]+)\\|([a-z]+)\\|([a-z]+)\\|([a-z]+)\\|?([a-z]*)\\|?([a-z]*)', 1)
aaaaaaaa
Fetched 1 row(s) in 0.01s
&amp;nbsp;
&amp;gt; select regexp_extract('aaaaaaaa|ddddddddddd|eeeeeeee|ffffff', '([a-z]+)\\|([a-z]+)\\|([a-z]+)\\|([a-z]+)\\|?([a-z]*)\\|?([a-z]*)', 3);
Query: select regexp_extract('aaaaaaaa|ddddddddddd|eeeeeeee|ffffff', '([a-z]+)\\|([a-z]+)\\|([a-z]+)\\|([a-z]+)\\|?([a-z]*)\\|?([a-z]*)', 3)
eeeeeeee
Fetched 1 row(s) in 0.01s
&amp;nbsp;
&amp;gt; select regexp_extract('aaaaaaaa|ddddddddddd|eeeeeeee|ffffff', '([a-z]+)\\|([a-z]+)\\|([a-z]+)\\|([a-z]+)\\|?([a-z]*)\\|?([a-z]*)', 6);
Query: select regexp_extract('aaaaaaaa|ddddddddddd|eeeeeeee|ffffff', '([a-z]+)\\|([a-z]+)\\|([a-z]+)\\|([a-z]+)\\|?([a-z]*)\\|?([a-z]*)', 6)
""&lt;/PRE&gt;&lt;P&gt;&amp;nbsp;&lt;/P&gt;</description>
      <pubDate>Fri, 14 Nov 2014 15:36:33 GMT</pubDate>
      <guid>https://community.cloudera.com/t5/Archives-of-Support-Questions/impala-split-udf/m-p/21586#M3609</guid>
      <dc:creator>chaaaaaarlie</dc:creator>
      <dc:date>2014-11-14T15:36:33Z</dc:date>
    </item>
    <item>
      <title>Re: impala split udf</title>
      <link>https://community.cloudera.com/t5/Archives-of-Support-Questions/impala-split-udf/m-p/21763#M3610</link>
      <description>&lt;P&gt;somewhat better than me leveraging nested substr and reverses&lt;/P&gt;&lt;P&gt;&amp;nbsp;&lt;/P&gt;&lt;P&gt;but still wouldn't mind seeing the split function be brought in&lt;/P&gt;</description>
      <pubDate>Tue, 18 Nov 2014 19:36:34 GMT</pubDate>
      <guid>https://community.cloudera.com/t5/Archives-of-Support-Questions/impala-split-udf/m-p/21763#M3610</guid>
      <dc:creator>scratch28</dc:creator>
      <dc:date>2014-11-18T19:36:34Z</dc:date>
    </item>
  </channel>
</rss>

