<?xml version="1.0" encoding="UTF-8"?>
<rss xmlns:content="http://purl.org/rss/1.0/modules/content/" xmlns:dc="http://purl.org/dc/elements/1.1/" xmlns:rdf="http://www.w3.org/1999/02/22-rdf-syntax-ns#" xmlns:taxo="http://purl.org/rss/1.0/modules/taxonomy/" version="2.0">
  <channel>
    <title>topic Re: tFileOutputParquet - creating Parquet files in Talend Studio</title>
    <link>https://community.qlik.com/t5/Talend-Studio/tFileOutputParquet-creating-Parquet-files/m-p/2343371#M111134</link>
    <description>&lt;P&gt;Hello @Rui Motta​&amp;nbsp;,&lt;/P&gt;&lt;P&gt;It's a well-known issue with Hadoop on Windows&lt;/P&gt;&lt;P&gt;see https://cwiki.apache.org/confluence/display/HADOOP2/WindowsProblems&lt;/P&gt;&lt;P&gt;The solution is:&lt;/P&gt;&lt;OL&gt;&lt;LI&gt; git clone the repository https://github.com/steveloughran/winutils to your local machine&lt;/LI&gt;&lt;LI&gt; Set the environment variable %HADOOP_HOME% to point to the directory above the BIN dir containing WINUTILS.EXE; you need to restart the Studio for the change to take effect.&lt;/LI&gt;&lt;/OL&gt;&lt;P&gt;         Or&lt;/P&gt;&lt;P&gt;        set up a JVM parameter -Dhadoop.home.dir in the job's Run-&amp;gt;Advanced settings page, as shown below&lt;/P&gt;&lt;P&gt;          &lt;span class="lia-inline-image-display-wrapper" image-alt="0695b00000hraphAAA.png"&gt;&lt;img src="https://community.qlik.com/t5/image/serverpage/image-id/128267iAE74F69EEDA2FB1F/image-size/large?v=v2&amp;amp;px=999" role="button" title="0695b00000hraphAAA.png" alt="0695b00000hraphAAA.png" /&gt;&lt;/span&gt;&lt;/P&gt;</description>
    <pubDate>Wed, 10 May 2023 01:45:24 GMT</pubDate>
    <dc:creator>Anonymous</dc:creator>
    <dc:date>2023-05-10T01:45:24Z</dc:date>
    <item>
      <title>tFileOutputParquet - creating Parquet files</title>
      <link>https://community.qlik.com/t5/Talend-Studio/tFileOutputParquet-creating-Parquet-files/m-p/2343370#M111133</link>
      <description>&lt;P&gt;Hi there,&lt;/P&gt;&lt;P&gt;&lt;/P&gt;&lt;P&gt;&lt;/P&gt;&lt;P&gt;I created this very simple Job:&lt;/P&gt;&lt;P&gt;&lt;/P&gt;&lt;P&gt;&lt;/P&gt;&lt;P&gt;&lt;span class="lia-inline-image-display-wrapper" image-alt="0695b00000hrU6MAAU.png"&gt;&lt;img src="https://community.qlik.com/t5/image/serverpage/image-id/146970iFF4325212091E716/image-size/large?v=v2&amp;amp;px=999" role="button" title="0695b00000hrU6MAAU.png" alt="0695b00000hrU6MAAU.png" /&gt;&lt;/span&gt;&lt;/P&gt;&lt;P&gt;&lt;/P&gt;&lt;P&gt;&lt;/P&gt;&lt;P&gt;There's no problem when I run it in Talend Cloud Big Data.&lt;/P&gt;&lt;P&gt;But when I run the same Job on Talend Cloud Data Fabric, on the same computer, it gives me the following error:&lt;/P&gt;&lt;P&gt;&lt;/P&gt;&lt;P&gt;&lt;/P&gt;&lt;P&gt;"&lt;I&gt;Starting job ReadParquetFile at 12:41 09/05/2023.&lt;/I&gt;&lt;/P&gt;&lt;P&gt;&lt;I&gt;Error: Could not find or load main class Dhadoop.home.dir=C:\hadoop-3.3.0\bin&lt;/I&gt;&lt;/P&gt;&lt;P&gt;&lt;I&gt;Caused by: java.lang.ClassNotFoundException: Dhadoop.home.dir=C:\hadoop-3.3.0\bin&lt;/I&gt;&lt;/P&gt;&lt;P&gt;&lt;/P&gt;&lt;P&gt;&lt;/P&gt;&lt;P&gt;&lt;I&gt;Job ReadParquetFile ended at 12:41 09/05/2023. [Exit code&amp;nbsp;= 1]&lt;/I&gt;".&lt;/P&gt;&lt;P&gt;&lt;/P&gt;&lt;P&gt;&lt;/P&gt;&lt;P&gt;&lt;/P&gt;&lt;P&gt;&lt;/P&gt;&lt;P&gt;Can anyone please help me solve this issue?&lt;/P&gt;&lt;P&gt;&lt;/P&gt;&lt;P&gt;&lt;/P&gt;&lt;P&gt;I appreciate it.&lt;/P&gt;&lt;P&gt;&lt;/P&gt;&lt;P&gt;&lt;/P&gt;&lt;P&gt;Rui&lt;/P&gt;</description>
      <pubDate>Fri, 15 Nov 2024 21:50:08 GMT</pubDate>
      <guid>https://community.qlik.com/t5/Talend-Studio/tFileOutputParquet-creating-Parquet-files/m-p/2343370#M111133</guid>
      <dc:creator>RMotta2408</dc:creator>
      <dc:date>2024-11-15T21:50:08Z</dc:date>
    </item>
    <item>
      <title>Re: tFileOutputParquet - creating Parquet files</title>
      <link>https://community.qlik.com/t5/Talend-Studio/tFileOutputParquet-creating-Parquet-files/m-p/2343371#M111134</link>
      <description>&lt;P&gt;Hello @Rui Motta​&amp;nbsp;,&lt;/P&gt;&lt;P&gt;It's a well-known issue with Hadoop on Windows&lt;/P&gt;&lt;P&gt;see https://cwiki.apache.org/confluence/display/HADOOP2/WindowsProblems&lt;/P&gt;&lt;P&gt;The solution is:&lt;/P&gt;&lt;OL&gt;&lt;LI&gt; git clone the repository https://github.com/steveloughran/winutils to your local machine&lt;/LI&gt;&lt;LI&gt; Set the environment variable %HADOOP_HOME% to point to the directory above the BIN dir containing WINUTILS.EXE; you need to restart the Studio for the change to take effect.&lt;/LI&gt;&lt;/OL&gt;&lt;P&gt;         Or&lt;/P&gt;&lt;P&gt;        set up a JVM parameter -Dhadoop.home.dir in the job's Run-&amp;gt;Advanced settings page, as shown below&lt;/P&gt;&lt;P&gt;          &lt;span class="lia-inline-image-display-wrapper" image-alt="0695b00000hraphAAA.png"&gt;&lt;img src="https://community.qlik.com/t5/image/serverpage/image-id/128267iAE74F69EEDA2FB1F/image-size/large?v=v2&amp;amp;px=999" role="button" title="0695b00000hraphAAA.png" alt="0695b00000hraphAAA.png" /&gt;&lt;/span&gt;&lt;/P&gt;</description>
      <pubDate>Wed, 10 May 2023 01:45:24 GMT</pubDate>
      <guid>https://community.qlik.com/t5/Talend-Studio/tFileOutputParquet-creating-Parquet-files/m-p/2343371#M111134</guid>
      <dc:creator>Anonymous</dc:creator>
      <dc:date>2023-05-10T01:45:24Z</dc:date>
    </item>
    <item>
      <title>Re: tFileOutputParquet - creating Parquet files</title>
      <link>https://community.qlik.com/t5/Talend-Studio/tFileOutputParquet-creating-Parquet-files/m-p/2343372#M111135</link>
      <description>&lt;P&gt;@Aiming Chen​&amp;nbsp;, thank you so much for your help.&lt;/P&gt;&lt;P&gt;It worked like it was supposed to.&lt;/P&gt;&lt;P&gt;&amp;nbsp;&lt;/P&gt;&lt;P&gt;I really appreciate all the help you've been giving.&lt;/P&gt;&lt;P&gt;&amp;nbsp;&lt;/P&gt;&lt;P&gt;Rui&lt;/P&gt;</description>
      <pubDate>Thu, 11 May 2023 13:12:45 GMT</pubDate>
      <guid>https://community.qlik.com/t5/Talend-Studio/tFileOutputParquet-creating-Parquet-files/m-p/2343372#M111135</guid>
      <dc:creator>RMotta2408</dc:creator>
      <dc:date>2023-05-11T13:12:45Z</dc:date>
    </item>
  </channel>
</rss>

