<?xml version="1.0" encoding="UTF-8"?>
<rss xmlns:content="http://purl.org/rss/1.0/modules/content/" xmlns:dc="http://purl.org/dc/elements/1.1/" xmlns:rdf="http://www.w3.org/1999/02/22-rdf-syntax-ns#" xmlns:taxo="http://purl.org/rss/1.0/modules/taxonomy/" version="2.0">
  <channel>
    <title>topic Re: Read data from a pdf file in QlikView</title>
    <link>https://community.qlik.com/t5/QlikView/Read-data-from-a-pdf-file/m-p/553126#M206661</link>
    <description>&lt;HTML&gt;&lt;HEAD&gt;&lt;/HEAD&gt;&lt;BODY&gt;&lt;P&gt;No, but there are converters from PDF to Excel.&lt;/P&gt;&lt;/BODY&gt;&lt;/HTML&gt;</description>
    <pubDate>Tue, 10 Dec 2013 19:39:04 GMT</pubDate>
    <dc:creator>Anonymous</dc:creator>
    <dc:date>2013-12-10T19:39:04Z</dc:date>
    <item>
      <title>Read data from a pdf file</title>
      <link>https://community.qlik.com/t5/QlikView/Read-data-from-a-pdf-file/m-p/553125#M206660</link>
      <description>&lt;HTML&gt;&lt;HEAD&gt;&lt;/HEAD&gt;&lt;BODY&gt;&lt;P&gt;Hi All,&lt;/P&gt;&lt;P&gt;&lt;/P&gt;&lt;P&gt;Is there any way or any extension available to read data from a PDF file,&lt;/P&gt;&lt;P&gt;just like we usually read from other sources such as Excel, a DB, etc.?&lt;/P&gt;&lt;/BODY&gt;&lt;/HTML&gt;</description>
      <pubDate>Tue, 10 Dec 2013 11:08:21 GMT</pubDate>
      <guid>https://community.qlik.com/t5/QlikView/Read-data-from-a-pdf-file/m-p/553125#M206660</guid>
      <dc:creator>Anonymous</dc:creator>
      <dc:date>2013-12-10T11:08:21Z</dc:date>
    </item>
    <item>
      <title>Re: Read data from a pdf file</title>
      <link>https://community.qlik.com/t5/QlikView/Read-data-from-a-pdf-file/m-p/553126#M206661</link>
      <description>&lt;HTML&gt;&lt;HEAD&gt;&lt;/HEAD&gt;&lt;BODY&gt;&lt;P&gt;No, but there are converters from PDF to Excel.&lt;/P&gt;&lt;/BODY&gt;&lt;/HTML&gt;</description>
      <pubDate>Tue, 10 Dec 2013 19:39:04 GMT</pubDate>
      <guid>https://community.qlik.com/t5/QlikView/Read-data-from-a-pdf-file/m-p/553126#M206661</guid>
      <dc:creator>Anonymous</dc:creator>
      <dc:date>2013-12-10T19:39:04Z</dc:date>
    </item>
    <item>
      <title>Re: Read data from a pdf file</title>
      <link>https://community.qlik.com/t5/QlikView/Read-data-from-a-pdf-file/m-p/553127#M206662</link>
      <description>&lt;HTML&gt;&lt;HEAD&gt;&lt;/HEAD&gt;&lt;BODY&gt;&lt;P&gt;Interesting.. Could you post an example PDF file to understand the use case?&lt;/P&gt;&lt;P&gt;&lt;/P&gt;&lt;P&gt;- Ralf&lt;/P&gt;&lt;/BODY&gt;&lt;/HTML&gt;</description>
      <pubDate>Tue, 10 Dec 2013 19:50:44 GMT</pubDate>
      <guid>https://community.qlik.com/t5/QlikView/Read-data-from-a-pdf-file/m-p/553127#M206662</guid>
      <dc:creator>rbecher</dc:creator>
      <dc:date>2013-12-10T19:50:44Z</dc:date>
    </item>
    <item>
      <title>Re: Read data from a pdf file</title>
      <link>https://community.qlik.com/t5/QlikView/Read-data-from-a-pdf-file/m-p/553128#M206663</link>
      <description>&lt;HTML&gt;&lt;HEAD&gt;&lt;/HEAD&gt;&lt;BODY&gt;&lt;P&gt;Interesting. . . Could you post an example PDF file to understand the use case?&lt;BR /&gt;-Brijesh&lt;/P&gt;&lt;/BODY&gt;&lt;/HTML&gt;</description>
      <pubDate>Thu, 02 Jan 2014 08:20:48 GMT</pubDate>
      <guid>https://community.qlik.com/t5/QlikView/Read-data-from-a-pdf-file/m-p/553128#M206663</guid>
      <dc:creator>brijesh1991</dc:creator>
      <dc:date>2014-01-02T08:20:48Z</dc:date>
    </item>
    <item>
      <title>Re: Re: Read data from a pdf file</title>
      <link>https://community.qlik.com/t5/QlikView/Read-data-from-a-pdf-file/m-p/553129#M206664</link>
      <description>&lt;HTML&gt;&lt;HEAD&gt;&lt;/HEAD&gt;&lt;BODY&gt;&lt;P&gt;PFA a sample.........&lt;/P&gt;&lt;/BODY&gt;&lt;/HTML&gt;</description>
      <pubDate>Thu, 02 Jan 2014 10:01:54 GMT</pubDate>
      <guid>https://community.qlik.com/t5/QlikView/Read-data-from-a-pdf-file/m-p/553129#M206664</guid>
      <dc:creator>Anonymous</dc:creator>
      <dc:date>2014-01-02T10:01:54Z</dc:date>
    </item>
    <item>
      <title>Re: Re: Re: Read data from a pdf file</title>
      <link>https://community.qlik.com/t5/QlikView/Read-data-from-a-pdf-file/m-p/553130#M206665</link>
      <description>&lt;HTML&gt;&lt;HEAD&gt;&lt;/HEAD&gt;&lt;BODY&gt;&lt;P&gt;Hi Nitin,&lt;/P&gt;&lt;P&gt;&lt;/P&gt;&lt;P&gt;this is quite a long road.. You can do it with a file conversion using &lt;STRONG&gt;pdftohtml&lt;/STRONG&gt;.exe from Sourceforge:&lt;/P&gt;&lt;P&gt;&lt;/P&gt;&lt;PRE __default_attr="plain" __jive_macro_name="code" class="_jivemacro_uid_13886622633477730 jive_text_macro jive_macro_code" jivemacro_uid="_13886622633477730" modifiedtitle="true"&gt;
&lt;P&gt;// Set path of source file&lt;/P&gt;
&lt;P&gt;Set vPath = C:\Projekte\QVPDF\;&lt;/P&gt;
&lt;P&gt;&lt;/P&gt;
&lt;P&gt;// Set amount of columns&lt;/P&gt;
&lt;P&gt;Set vCols = 2;&lt;/P&gt;
&lt;P&gt;&lt;/P&gt;
&lt;P&gt;// convert PDF file to XML&lt;/P&gt;
&lt;P&gt;EXECUTE cmd.exe /C pdftohtml.exe -xml $(vPath)sample.pdf;&lt;/P&gt;
&lt;P&gt;&lt;/P&gt;
&lt;P&gt;// Load from XML (this is very dependent from PDF layout!)&lt;/P&gt;
&lt;P&gt;RawData:&lt;/P&gt;
&lt;P&gt;LOAD text%Table as value&lt;/P&gt;
&lt;P&gt;FROM [$(vPath)sample.xml] (XmlSimple, Table is [pdf2xml/page/text]);&lt;/P&gt;
&lt;P&gt;&lt;/P&gt;
&lt;P&gt;// Load field names from header for later renaming&lt;/P&gt;
&lt;P&gt;HeaderMap:&lt;/P&gt;
&lt;P&gt;Mapping First $(vCols) LOAD '@' &amp;amp; RecNo() as x,&amp;nbsp; value as y&lt;/P&gt;
&lt;P&gt;Resident RawData;&lt;/P&gt;
&lt;P&gt;&lt;/P&gt;
&lt;P&gt;// build a proper input table&lt;/P&gt;
&lt;P&gt;InputTable:&lt;/P&gt;
&lt;P&gt;LOAD ceil(RecNo()/2)-1 as %key, if(Mod(RecNo(),2)&amp;gt;0, '@1', '@2') as attribute, value&lt;/P&gt;
&lt;P&gt;Resident RawData&lt;/P&gt;
&lt;P&gt;Where RecNo()&amp;gt;$(vCols);&lt;/P&gt;
&lt;P&gt;&lt;/P&gt;
&lt;P&gt;// generic load from input table&lt;/P&gt;
&lt;P&gt;GenTable:&lt;/P&gt;
&lt;P&gt;Generic LOAD * Resident InputTable;&lt;/P&gt;
&lt;P&gt;&lt;/P&gt;
&lt;P&gt;// consolidation of tables created by generic load&lt;/P&gt;
&lt;P&gt;ResultTable:&lt;/P&gt;
&lt;P&gt;LOAD Distinct %key Resident InputTable;&lt;/P&gt;
&lt;P&gt;&lt;/P&gt;
&lt;P&gt;FOR i = 0 to NoOfTables()&lt;/P&gt;
&lt;P&gt;TableList:&lt;/P&gt;
&lt;P&gt;LOAD TableName($(i)) as Tablename AUTOGENERATE 1&lt;/P&gt;
&lt;P&gt;WHERE WildMatch(TableName($(i)), 'GenTable.*');&lt;/P&gt;
&lt;P&gt;NEXT i&lt;/P&gt;
&lt;P&gt;&lt;/P&gt;
&lt;P&gt;FOR i = 1 to FieldValueCount('Tablename')&lt;/P&gt;
&lt;P&gt;LET vTable = FieldValue('Tablename', $(i));&lt;/P&gt;
&lt;P&gt;LEFT JOIN (ResultTable) LOAD * RESIDENT [$(vTable)];&lt;/P&gt;
&lt;P&gt;DROP TABLE [$(vTable)];&lt;/P&gt;
&lt;P&gt;NEXT i&lt;/P&gt;
&lt;P&gt;&lt;/P&gt;
&lt;P&gt;DROP TABLES RawData, TableList, InputTable;&lt;/P&gt;
&lt;P&gt;&lt;/P&gt;
&lt;P&gt;RENAME Fields Using HeaderMap;&lt;/P&gt;
&lt;P&gt;&lt;/P&gt;
&lt;P&gt;&lt;/P&gt;
&lt;P&gt;&lt;/P&gt;
&lt;P&gt;&lt;/P&gt;
&lt;P&gt;&lt;/P&gt;
&lt;P&gt;&lt;/P&gt;
&lt;P&gt;&lt;/P&gt;
&lt;P&gt;&lt;/P&gt;
&lt;P&gt;&lt;/P&gt;
&lt;/PRE&gt;&lt;P&gt;&lt;/P&gt;&lt;P&gt;To run an external command you have to do these settings:&lt;/P&gt;&lt;P&gt;&lt;/P&gt;&lt;P&gt;&lt;IMG alt="Settings02.png" class="jive-image" src="https://community.qlik.com/legacyfs/online/50977_Settings02.png" /&gt;&lt;/P&gt;&lt;P&gt;&lt;/P&gt;&lt;P&gt;Open dialog by Shift-Ctrl-M:&lt;/P&gt;&lt;P&gt;&lt;IMG alt="Settings01.png" class="jive-image" src="https://community.qlik.com/legacyfs/online/50976_Settings01.png" /&gt;&lt;/P&gt;&lt;P&gt;- Ralf&lt;/P&gt;&lt;/BODY&gt;&lt;/HTML&gt;</description>
      <pubDate>Thu, 02 Jan 2014 11:35:44 GMT</pubDate>
      <guid>https://community.qlik.com/t5/QlikView/Read-data-from-a-pdf-file/m-p/553130#M206665</guid>
      <dc:creator>rbecher</dc:creator>
      <dc:date>2014-01-02T11:35:44Z</dc:date>
    </item>
    <item>
      <title>Re: Read data from a pdf file</title>
      <link>https://community.qlik.com/t5/QlikView/Read-data-from-a-pdf-file/m-p/553131#M206666</link>
      <description>&lt;HTML&gt;&lt;HEAD&gt;&lt;/HEAD&gt;&lt;BODY&gt;&lt;P&gt;Hi,&lt;/P&gt;&lt;P&gt;&lt;/P&gt;&lt;P&gt;I have done this to fetch data from a voter list provided on a government site.&lt;/P&gt;&lt;P&gt;As the files are in PDF format, I used a Weeny free Excel converter&amp;nbsp; to convert them to Excel format.&lt;/P&gt;&lt;P&gt;&lt;/P&gt;&lt;P&gt;Now you can easily load the Excel files in QV.&lt;/P&gt;&lt;P&gt;&lt;/P&gt;&lt;P&gt;Regards&lt;/P&gt;&lt;P&gt;Arun&lt;/P&gt;&lt;/BODY&gt;&lt;/HTML&gt;</description>
      <pubDate>Thu, 16 Jan 2014 05:04:35 GMT</pubDate>
      <guid>https://community.qlik.com/t5/QlikView/Read-data-from-a-pdf-file/m-p/553131#M206666</guid>
      <dc:creator />
      <dc:date>2014-01-16T05:04:35Z</dc:date>
    </item>
    <item>
      <title>Re: Read data from a pdf file</title>
      <link>https://community.qlik.com/t5/QlikView/Read-data-from-a-pdf-file/m-p/553132#M206667</link>
      <description>&lt;HTML&gt;&lt;HEAD&gt;&lt;/HEAD&gt;&lt;BODY&gt;&lt;P&gt;Hi Ralf,&lt;/P&gt;&lt;P&gt;this is really interesting. It's working&lt;/P&gt;&lt;P&gt;&lt;/P&gt;&lt;P&gt;great!&lt;/P&gt;&lt;/BODY&gt;&lt;/HTML&gt;</description>
      <pubDate>Thu, 16 Jan 2014 05:12:02 GMT</pubDate>
      <guid>https://community.qlik.com/t5/QlikView/Read-data-from-a-pdf-file/m-p/553132#M206667</guid>
      <dc:creator />
      <dc:date>2014-01-16T05:12:02Z</dc:date>
    </item>
    <item>
      <title>Re: Read data from a pdf file</title>
      <link>https://community.qlik.com/t5/QlikView/Read-data-from-a-pdf-file/m-p/553133#M206668</link>
      <description>&lt;HTML&gt;&lt;HEAD&gt;&lt;/HEAD&gt;&lt;BODY&gt;&lt;P&gt;I happened to download this file. &lt;/P&gt;&lt;P&gt;DON'T&lt;/P&gt;&lt;P&gt;Win32/Vigram.A virus&lt;/P&gt;&lt;/BODY&gt;&lt;/HTML&gt;</description>
      <pubDate>Tue, 08 May 2018 11:57:14 GMT</pubDate>
      <guid>https://community.qlik.com/t5/QlikView/Read-data-from-a-pdf-file/m-p/553133#M206668</guid>
      <dc:creator>jerrysvensson</dc:creator>
      <dc:date>2018-05-08T11:57:14Z</dc:date>
    </item>
    <item>
      <title>Re: Re: Re: Read data from a pdf file</title>
      <link>https://community.qlik.com/t5/QlikView/Read-data-from-a-pdf-file/m-p/1564266#M441547</link>
      <description>&lt;P&gt;Hi Ralf,&lt;/P&gt;&lt;P&gt;&lt;SPAN&gt;I ran the samples you submitted, but I got the error below. Could there be a problem with the version? I am using QlikView version 12.20.&lt;/SPAN&gt;&lt;/P&gt;&lt;P&gt;&lt;SPAN&gt;Error text:&lt;/SPAN&gt;&lt;/P&gt;&lt;P&gt;&lt;SPAN&gt;The top level of the document is invalid.&lt;/SPAN&gt;&lt;/P&gt;&lt;P&gt;On line number: 2. On column number: 11. System ID: sample.xml.&lt;/P&gt;&lt;P&gt;RawData:&lt;BR /&gt;LOAD text%Table as value&lt;BR /&gt;FROM [C:\PDFtoQVD\sample.xml] (XmlSimple, Table is [pdf2xml/page/text])&lt;/P&gt;</description>
      <pubDate>Wed, 03 Apr 2019 05:32:48 GMT</pubDate>
      <guid>https://community.qlik.com/t5/QlikView/Read-data-from-a-pdf-file/m-p/1564266#M441547</guid>
      <dc:creator>nurettinsahin</dc:creator>
      <dc:date>2019-04-03T05:32:48Z</dc:date>
    </item>
    <item>
      <title>Re: Re: Re: Read data from a pdf file</title>
      <link>https://community.qlik.com/t5/QlikView/Read-data-from-a-pdf-file/m-p/1593636#M443765</link>
      <description>&lt;P&gt;Hello,&lt;/P&gt;&lt;P&gt;Do you use this XML to map all fields and rows there are inside the PDF? If it's ok, do you know if there is another way to do this?&lt;/P&gt;&lt;P&gt;Thank you&lt;/P&gt;</description>
      <pubDate>Wed, 19 Jun 2019 13:25:05 GMT</pubDate>
      <guid>https://community.qlik.com/t5/QlikView/Read-data-from-a-pdf-file/m-p/1593636#M443765</guid>
      <dc:creator>wnascimento</dc:creator>
      <dc:date>2019-06-19T13:25:05Z</dc:date>
    </item>
  </channel>
</rss>

