<?xml version="1.0" encoding="UTF-8"?>
<rss xmlns:content="http://purl.org/rss/1.0/modules/content/" xmlns:dc="http://purl.org/dc/elements/1.1/" xmlns:rdf="http://www.w3.org/1999/02/22-rdf-syntax-ns#" xmlns:taxo="http://purl.org/rss/1.0/modules/taxonomy/" version="2.0">
  <channel>
    <title>topic Re: Spark Big Data job in local mode - Configuring external hive metastore in Talend Studio</title>
    <link>https://community.qlik.com/t5/Talend-Studio/Spark-Big-Data-job-in-local-mode-Configuring-external-hive/m-p/2234726#M23992</link>
    <description>&lt;P&gt;&lt;A href="https://community.qlik.com/s/profile/0053p0000078APoAAM"&gt;@csapparapu&lt;/A&gt;, you can define it in the way described below, in&amp;nbsp;&lt;/P&gt; 
&lt;DIV class="depth-2 content-locale-en-US"&gt;
  Define the advanced settings 
&lt;/DIV&gt; 
&lt;DIV class="content-locale-en-US content-locale-en depth-2"&gt; 
 &lt;DIV&gt; 
  &lt;DIV class="body taskbody"&gt; 
   &lt;DIV class="abstract"&gt; 
    &lt;SPAN class="shortdesc"&gt;Define Spark advanced settings in the Studio to read Spark 2.0 jar files in your cluster.&lt;/SPAN&gt; 
   &lt;/DIV&gt; 
   &lt;DIV class="tasklabel"&gt;
     Procedure 
   &lt;/DIV&gt; 
   &lt;OL&gt; 
    &lt;LI&gt;&lt;SPAN class="ph cmd"&gt;In the&lt;SPAN&gt;&amp;nbsp;&lt;/SPAN&gt;&lt;SPAN class="ph uicontrol"&gt;Advanced properties&lt;/SPAN&gt;&lt;SPAN&gt;&amp;nbsp;&lt;/SPAN&gt;table, to add a row, click the plus symbol (&lt;SPAN class="ph uicontrol"&gt;+&lt;/SPAN&gt;).&lt;/SPAN&gt;&lt;/LI&gt; 
    &lt;LI&gt;&lt;SPAN class="ph cmd"&gt;In the&lt;SPAN&gt;&amp;nbsp;&lt;/SPAN&gt;&lt;SPAN class="ph uicontrol"&gt;Property&lt;/SPAN&gt;&lt;SPAN&gt;&amp;nbsp;&lt;/SPAN&gt;column, in double quotation marks, enter&lt;SPAN&gt;&amp;nbsp;spark.sql.hive.metastore.jars&lt;/SPAN&gt;. This parameter provides the names of jar files to be used by your Spark Job, as well as the paths to them in your cluster.&lt;/SPAN&gt;&lt;/LI&gt; 
   &lt;/OL&gt; 
  &lt;/DIV&gt; 
 &lt;/DIV&gt; 
&lt;/DIV&gt;</description>
    <pubDate>Mon, 04 Nov 2019 08:59:56 GMT</pubDate>
    <dc:creator>manodwhb</dc:creator>
    <dc:date>2019-11-04T08:59:56Z</dc:date>
    <item>
      <title>Spark Big Data job in local mode - Configuring external hive metastore</title>
      <link>https://community.qlik.com/t5/Talend-Studio/Spark-Big-Data-job-in-local-mode-Configuring-external-hive/m-p/2234725#M23991</link>
      <description>&lt;P&gt;Hello,&lt;/P&gt;
&lt;P&gt;My goal is to run a Spark Big Data batch job using Talend in local mode, no third party clusters or distributions.&lt;/P&gt;
&lt;P&gt;I want to save the output to S3, but before that I want to register that data as an external table in a hive metastore.&lt;/P&gt;
&lt;P&gt;I would like to use an external hive metastore database. I was able to connect to an external mysql database as the metastore from my spark-shell.&lt;/P&gt;
&lt;P&gt;&amp;nbsp;&lt;/P&gt;
&lt;P&gt;I am having trouble figuring out how to set the spark.sql.hive.metastore.jars property in the Run tab's Spark configuration. I couldn't find any information in the documentation.&lt;/P&gt;
&lt;P&gt;&amp;nbsp;&lt;/P&gt;
&lt;P&gt;Thanks for looking into this.&lt;/P&gt;
&lt;P&gt;Chandana&lt;/P&gt;</description>
      <pubDate>Sat, 16 Nov 2024 04:11:30 GMT</pubDate>
      <guid>https://community.qlik.com/t5/Talend-Studio/Spark-Big-Data-job-in-local-mode-Configuring-external-hive/m-p/2234725#M23991</guid>
      <dc:creator>csapparapu</dc:creator>
      <dc:date>2024-11-16T04:11:30Z</dc:date>
    </item>
    <item>
      <title>Re: Spark Big Data job in local mode - Configuring external hive metastore</title>
      <link>https://community.qlik.com/t5/Talend-Studio/Spark-Big-Data-job-in-local-mode-Configuring-external-hive/m-p/2234726#M23992</link>
      <description>&lt;P&gt;&lt;A href="https://community.qlik.com/s/profile/0053p0000078APoAAM"&gt;@csapparapu&lt;/A&gt;, you can define it in the way described below, in&amp;nbsp;&lt;/P&gt; 
&lt;DIV class="depth-2 content-locale-en-US"&gt;
  Define the advanced settings 
&lt;/DIV&gt; 
&lt;DIV class="content-locale-en-US content-locale-en depth-2"&gt; 
 &lt;DIV&gt; 
  &lt;DIV class="body taskbody"&gt; 
   &lt;DIV class="abstract"&gt; 
    &lt;SPAN class="shortdesc"&gt;Define Spark advanced settings in the Studio to read Spark 2.0 jar files in your cluster.&lt;/SPAN&gt; 
   &lt;/DIV&gt; 
   &lt;DIV class="tasklabel"&gt;
     Procedure 
   &lt;/DIV&gt; 
   &lt;OL&gt; 
    &lt;LI&gt;&lt;SPAN class="ph cmd"&gt;In the&lt;SPAN&gt;&amp;nbsp;&lt;/SPAN&gt;&lt;SPAN class="ph uicontrol"&gt;Advanced properties&lt;/SPAN&gt;&lt;SPAN&gt;&amp;nbsp;&lt;/SPAN&gt;table, to add a row, click the plus symbol (&lt;SPAN class="ph uicontrol"&gt;+&lt;/SPAN&gt;).&lt;/SPAN&gt;&lt;/LI&gt; 
    &lt;LI&gt;&lt;SPAN class="ph cmd"&gt;In the&lt;SPAN&gt;&amp;nbsp;&lt;/SPAN&gt;&lt;SPAN class="ph uicontrol"&gt;Property&lt;/SPAN&gt;&lt;SPAN&gt;&amp;nbsp;&lt;/SPAN&gt;column, in double quotation marks, enter&lt;SPAN&gt;&amp;nbsp;spark.sql.hive.metastore.jars&lt;/SPAN&gt;. This parameter provides the names of jar files to be used by your Spark Job, as well as the paths to them in your cluster.&lt;/SPAN&gt;&lt;/LI&gt; 
   &lt;/OL&gt; 
  &lt;/DIV&gt; 
 &lt;/DIV&gt; 
&lt;/DIV&gt;</description>
      <pubDate>Mon, 04 Nov 2019 08:59:56 GMT</pubDate>
      <guid>https://community.qlik.com/t5/Talend-Studio/Spark-Big-Data-job-in-local-mode-Configuring-external-hive/m-p/2234726#M23992</guid>
      <dc:creator>manodwhb</dc:creator>
      <dc:date>2019-11-04T08:59:56Z</dc:date>
    </item>
    <item>
      <title>Re: Spark Big Data job in local mode - Configuring external hive metastore</title>
      <link>https://community.qlik.com/t5/Talend-Studio/Spark-Big-Data-job-in-local-mode-Configuring-external-hive/m-p/2234727#M23993</link>
      <description>&lt;P&gt;&lt;A href="https://community.qlik.com/s/profile/0053p000007LKmJAAW"&gt;@manodwhb&lt;/A&gt;,&lt;/P&gt; 
&lt;P&gt;Thanks for your reply. My question was which jar files to include. I have tried several jar files, as shown below, but still cannot run spark-sql in local mode.&lt;/P&gt; 
&lt;P&gt;Do you have an example of a spark batch job in local mode with an external hive metastore?&lt;/P&gt; 
&lt;P&gt;Are these jar files comma separated?&lt;/P&gt; 
&lt;P&gt;&amp;nbsp;&lt;/P&gt; 
&lt;P&gt;"file:///Users/abc/.m2/repository/mysql/mysql-connector-java/8.0.18/mysql-connector-java-8.0.18.jar;file:///Applications/TalendStudio-7.2.1/studio/configuration/.m2/repository/org/talend/libraries/hadoop-common-2.8.1/6.0.0/hadoop-common-2.8.1-6.0.0.jar;file:///Applications/TalendStudio-7.2.1/studio/configuration/.m2/repository/org/talend/libraries/spark-hive_2.11-2.2.0/6.0.0/spark-hive_2.11-2.2.0-6.0.0.jar;/Applications/TalendStudio-7.2.1/studio/configuration/.m2/repository/org/talend/libraries/hadoop-hdfs-2.6.0.2.2.0.0-2041/6.0.0/hadoop-hdfs-2.6.0.2.2.0.0-2041-6.0.0.jar;file:///Applications/TalendStudio-7.2.1/studio/configuration/.m2/repository/org/talend/libraries/hive-exec-2.1.0-talend-nolang3/6.0.0/hive-exec-2.1.0-talend-nolang3-6.0.0.jar;file:///Applications/TalendStudio-7.2.1/studio/configuration/.m2/repository/org/talend/libraries/hive-jdbc-2.1.0-amzn-0/6.0.0/hive-jdbc-2.1.0-amzn-0-6.0.0.jar"&lt;/P&gt;</description>
      <pubDate>Fri, 08 Nov 2019 22:29:27 GMT</pubDate>
      <guid>https://community.qlik.com/t5/Talend-Studio/Spark-Big-Data-job-in-local-mode-Configuring-external-hive/m-p/2234727#M23993</guid>
      <dc:creator>csapparapu</dc:creator>
      <dc:date>2019-11-08T22:29:27Z</dc:date>
    </item>
  </channel>
</rss>

