<?xml version="1.0" encoding="UTF-8"?>
<rss xmlns:content="http://purl.org/rss/1.0/modules/content/" xmlns:dc="http://purl.org/dc/elements/1.1/" xmlns:rdf="http://www.w3.org/1999/02/22-rdf-syntax-ns#" xmlns:taxo="http://purl.org/rss/1.0/modules/taxonomy/" version="2.0">
  <channel>
    <title>question Re: Hbase filter query using pyspark in Support Questions</title>
    <link>https://community.cloudera.com/t5/Support-Questions/Hbase-filter-query-using-pyspark/m-p/382931#M244750</link>
    <description>&lt;P&gt;Hi&amp;nbsp;&lt;a href="https://community.cloudera.com/t5/user/viewprofilepage/user-id/109002"&gt;@Taries&lt;/a&gt;&amp;nbsp;&lt;/P&gt;&lt;P&gt;&lt;SPAN&gt;As I mentioned previously,&lt;/SPAN&gt;&lt;SPAN&gt; only the &lt;/SPAN&gt;hbase.spark.query.timerange&lt;SPAN&gt; parameter can be used for filtering data during read.&lt;/SPAN&gt;&lt;SPAN&gt; The &lt;/SPAN&gt;hbase.spark.scan&lt;SPAN&gt; parameter wouldn't be set for this purpose.&lt;/SPAN&gt;&lt;/P&gt;&lt;P&gt;To filter the data after reading, you can apply a Spark WHERE or filter clause with your desired conditions.&lt;/P&gt;&lt;P&gt;&amp;nbsp;&lt;/P&gt;</description>
    <pubDate>Wed, 31 Jan 2024 14:59:57 GMT</pubDate>
    <dc:creator>RangaReddy</dc:creator>
    <dc:date>2024-01-31T14:59:57Z</dc:date>
    <item>
      <title>Hbase filter query using pyspark</title>
      <link>https://community.cloudera.com/t5/Support-Questions/Hbase-filter-query-using-pyspark/m-p/382904#M244738</link>
      <description>&lt;P&gt;I am trying to pull the records from the Hbase based on the row key in pyspark using the following details&lt;/P&gt;&lt;P&gt;&amp;nbsp;&lt;/P&gt;&lt;P&gt;&lt;span class="lia-inline-image-display-wrapper lia-image-align-inline" image-alt="pyspark.JPG" style="width: 400px;"&gt;&lt;img src="https://community.cloudera.com/t5/image/serverpage/image-id/39622i3FC4BB8154713040/image-size/medium?v=v2&amp;amp;px=400" role="button" title="pyspark.JPG" alt="pyspark.JPG" /&gt;&lt;/span&gt;&lt;/P&gt;&lt;P&gt; &lt;/P&gt;&lt;P&gt;but the query returns all the records (i.e., without the filter applied). Can you please help me resolve the issue?&lt;/P&gt;&lt;P&gt;&amp;nbsp;&lt;/P&gt;</description>
      <pubDate>Wed, 31 Jan 2024 05:22:24 GMT</pubDate>
      <guid>https://community.cloudera.com/t5/Support-Questions/Hbase-filter-query-using-pyspark/m-p/382904#M244738</guid>
      <dc:creator>Taries</dc:creator>
      <dc:date>2024-01-31T05:22:24Z</dc:date>
    </item>
    <item>
      <title>Re: Hbase filter query using pyspark</title>
      <link>https://community.cloudera.com/t5/Support-Questions/Hbase-filter-query-using-pyspark/m-p/382907#M244740</link>
      <description>&lt;P&gt;&lt;a href="https://community.cloudera.com/t5/user/viewprofilepage/user-id/109002"&gt;@Taries&lt;/a&gt;,&amp;nbsp;Welcome to our community! To help you get the best possible answer, I have tagged in our HBase and Spark experts&amp;nbsp; &lt;a href="https://community.cloudera.com/t5/user/viewprofilepage/user-id/40384"&gt;@smdas&lt;/a&gt;&amp;nbsp; &lt;a href="https://community.cloudera.com/t5/user/viewprofilepage/user-id/78612"&gt;@RangaReddy&lt;/a&gt;&amp;nbsp;who may be able to assist you further.&lt;BR /&gt;&lt;BR /&gt;Please feel free to provide any additional information or details about your query, and we hope that you will find a satisfactory solution to your question.&lt;/P&gt;</description>
      <pubDate>Wed, 31 Jan 2024 07:02:11 GMT</pubDate>
      <guid>https://community.cloudera.com/t5/Support-Questions/Hbase-filter-query-using-pyspark/m-p/382907#M244740</guid>
      <dc:creator>VidyaSargur</dc:creator>
      <dc:date>2024-01-31T07:02:11Z</dc:date>
    </item>
    <item>
      <title>Re: Hbase filter query using pyspark</title>
      <link>https://community.cloudera.com/t5/Support-Questions/Hbase-filter-query-using-pyspark/m-p/382912#M244742</link>
      <description>&lt;P&gt;Hi&amp;nbsp;&lt;a href="https://community.cloudera.com/t5/user/viewprofilepage/user-id/109002"&gt;@Taries&lt;/a&gt;&amp;nbsp;&lt;/P&gt;&lt;P&gt;You need to use the following two parameters to apply filter.&lt;/P&gt;&lt;P&gt;hbase.spark.query.timerange.start&lt;/P&gt;&lt;P&gt;hbase.spark.query.timerange.end&lt;/P&gt;&lt;P&gt;&lt;STRONG&gt;Reference:&lt;/STRONG&gt;&lt;/P&gt;&lt;P&gt;&lt;A href="https://github.com/apache/hbase-connectors/blob/307607cf7287084b3ce49cdd96d094e2ede9363a/spark/hbase-spark/src/main/scala/org/apache/hadoop/hbase/spark/datasources/HBaseSparkConf.scala#L65" target="_blank"&gt;https://github.com/apache/hbase-connectors/blob/307607cf7287084b3ce49cdd96d094e2ede9363a/spark/hbase-spark/src/main/scala/org/apache/hadoop/hbase/spark/datasources/HBaseSparkConf.scala#L65&lt;/A&gt;&lt;/P&gt;</description>
      <pubDate>Wed, 31 Jan 2024 08:34:00 GMT</pubDate>
      <guid>https://community.cloudera.com/t5/Support-Questions/Hbase-filter-query-using-pyspark/m-p/382912#M244742</guid>
      <dc:creator>RangaReddy</dc:creator>
      <dc:date>2024-01-31T08:34:00Z</dc:date>
    </item>
    <item>
      <title>Re: Hbase filter query using pyspark</title>
      <link>https://community.cloudera.com/t5/Support-Questions/Hbase-filter-query-using-pyspark/m-p/382927#M244748</link>
      <description>&lt;P&gt;&lt;span class="lia-inline-image-display-wrapper lia-image-align-inline" image-alt="Taries_0-1706710173347.png" style="width: 400px;"&gt;&lt;img src="https://community.cloudera.com/t5/image/serverpage/image-id/39631iC4D950338464D2C1/image-size/medium?v=v2&amp;amp;px=400" role="button" title="Taries_0-1706710173347.png" alt="Taries_0-1706710173347.png" /&gt;&lt;/span&gt;&lt;/P&gt;&lt;P&gt;&amp;nbsp;&lt;/P&gt;&lt;P&gt;With the options given above, it only takes the timerange start and end into account and does not consider the rowkey passed along with it.&amp;nbsp;&lt;/P&gt;</description>
      <pubDate>Wed, 31 Jan 2024 14:09:35 GMT</pubDate>
      <guid>https://community.cloudera.com/t5/Support-Questions/Hbase-filter-query-using-pyspark/m-p/382927#M244748</guid>
      <dc:creator>Taries</dc:creator>
      <dc:date>2024-01-31T14:09:35Z</dc:date>
    </item>
    <item>
      <title>Re: Hbase filter query using pyspark</title>
      <link>https://community.cloudera.com/t5/Support-Questions/Hbase-filter-query-using-pyspark/m-p/382931#M244750</link>
      <description>&lt;P&gt;Hi&amp;nbsp;&lt;a href="https://community.cloudera.com/t5/user/viewprofilepage/user-id/109002"&gt;@Taries&lt;/a&gt;&amp;nbsp;&lt;/P&gt;&lt;P&gt;&lt;SPAN&gt;As I mentioned previously,&lt;/SPAN&gt;&lt;SPAN&gt; only the &lt;/SPAN&gt;hbase.spark.query.timerange&lt;SPAN&gt; parameter can be used for filtering data during read.&lt;/SPAN&gt;&lt;SPAN&gt; The &lt;/SPAN&gt;hbase.spark.scan&lt;SPAN&gt; parameter wouldn't be set for this purpose.&lt;/SPAN&gt;&lt;/P&gt;&lt;P&gt;To filter the data after reading, you can apply a Spark WHERE or filter clause with your desired conditions.&lt;/P&gt;&lt;P&gt;&amp;nbsp;&lt;/P&gt;</description>
      <pubDate>Wed, 31 Jan 2024 14:59:57 GMT</pubDate>
      <guid>https://community.cloudera.com/t5/Support-Questions/Hbase-filter-query-using-pyspark/m-p/382931#M244750</guid>
      <dc:creator>RangaReddy</dc:creator>
      <dc:date>2024-01-31T14:59:57Z</dc:date>
    </item>
    <item>
      <title>Re: Hbase filter query using pyspark</title>
      <link>https://community.cloudera.com/t5/Support-Questions/Hbase-filter-query-using-pyspark/m-p/383107#M244821</link>
      <description>&lt;P&gt;Hi&amp;nbsp;&lt;a href="https://community.cloudera.com/t5/user/viewprofilepage/user-id/109002"&gt;@Taries&lt;/a&gt;&amp;nbsp;&lt;/P&gt;&lt;P&gt;I hope you are doing well. Do you need any further help with this issue? If the above solutions helped in your case, please accept the solution. It will help others.&amp;nbsp;&lt;/P&gt;</description>
      <pubDate>Sun, 04 Feb 2024 15:46:28 GMT</pubDate>
      <guid>https://community.cloudera.com/t5/Support-Questions/Hbase-filter-query-using-pyspark/m-p/383107#M244821</guid>
      <dc:creator>RangaReddy</dc:creator>
      <dc:date>2024-02-04T15:46:28Z</dc:date>
    </item>
  </channel>
</rss>

