<?xml version="1.0" encoding="UTF-8"?>
<rss xmlns:content="http://purl.org/rss/1.0/modules/content/" xmlns:dc="http://purl.org/dc/elements/1.1/" xmlns:rdf="http://www.w3.org/1999/02/22-rdf-syntax-ns#" xmlns:taxo="http://purl.org/rss/1.0/modules/taxonomy/" version="2.0">
  <channel>
    <title>topic Re: Scrape website in QlikView</title>
    <link>https://community.qlik.com/t5/QlikView/Scrape-website/m-p/1023894#M346153</link>
    <description>&lt;HTML&gt;&lt;HEAD&gt;&lt;/HEAD&gt;&lt;BODY&gt;&lt;P&gt;Yes it is possible. I have done it by retrieving the entire HTML page as text. Then I use TextBetween() and other text functions to get the info I want.&lt;/P&gt;&lt;P&gt;&lt;/P&gt;&lt;P&gt;The trick is to deselect HTML as format with the Web File wizard and choose FIXED as format. Then all the HTML text-lines will be retrieved into one field.&lt;/P&gt;&lt;P&gt;&lt;/P&gt;&lt;P&gt;The load script will look like this:&lt;/P&gt;&lt;P&gt;&lt;/P&gt;&lt;PRE __default_attr="sql" __jive_macro_name="code" class="jive_macro_code _jivemacro_uid_14605421313516629 jive_text_macro" jivemacro_uid="_14605421313516629"&gt;
&lt;P&gt;ALLHTML:&lt;/P&gt;
&lt;P&gt;LOAD&lt;/P&gt;
&lt;P&gt;&amp;nbsp;&amp;nbsp;&amp;nbsp; Concat(Line, Chr(13) &amp;amp; Chr(10) , R ) AS HTML&amp;nbsp;&amp;nbsp;&amp;nbsp; // merge the table lines into a single field with linefeeds&lt;/P&gt;
&lt;P&gt;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp; // R is to get them concatenated in the right order.&lt;/P&gt;
&lt;P&gt;;&lt;/P&gt;
&lt;P&gt;LOAD&lt;/P&gt;
&lt;P&gt;&amp;nbsp;&amp;nbsp;&amp;nbsp; RecNo() AS R,&lt;/P&gt;
&lt;P&gt;&amp;nbsp;&amp;nbsp;&amp;nbsp; [@1:n] AS Line&lt;/P&gt;
&lt;P&gt;FROM&lt;/P&gt;
&lt;P&gt;&lt;SPAN&gt;&amp;nbsp;&amp;nbsp;&amp;nbsp; [&lt;/SPAN&gt;&lt;A class="jive-link-external-small" href="http://www.eurexclearing.com/clearing-en/markets-services/eurex-otc-clear/interest-rate-swaps/clearing-volume" rel="nofollow" target="_blank"&gt;http://www.eurexclearing.com/clearing-en/markets-services/eurex-otc-clear/interest-rate-swaps/clearing-volume&lt;/A&gt;&lt;SPAN&gt;]&lt;/SPAN&gt;&lt;/P&gt;
&lt;P&gt;&amp;nbsp;&amp;nbsp;&amp;nbsp; (fix, utf8, no labels, no eof);&lt;/P&gt;
&lt;/PRE&gt;&lt;P&gt;&lt;/P&gt;&lt;P&gt;If you then refer to HTML in an expression you will get this single field as the full text of the page.&lt;/P&gt;&lt;/BODY&gt;&lt;/HTML&gt;</description>
    <pubDate>Wed, 13 Apr 2016 11:23:04 GMT</pubDate>
    <dc:creator>petter</dc:creator>
    <dc:date>2016-04-13T11:23:04Z</dc:date>
    <item>
      <title>Scrape website</title>
      <link>https://community.qlik.com/t5/QlikView/Scrape-website/m-p/1023893#M346152</link>
      <description>&lt;HTML&gt;&lt;HEAD&gt;&lt;/HEAD&gt;&lt;BODY&gt;&lt;P&gt;Hi all,&lt;/P&gt;&lt;P&gt;&lt;/P&gt;&lt;P&gt;This website &lt;A href="http://www.eurexclearing.com/clearing-en/markets-services/eurex-otc-clear/interest-rate-swaps/clearing-volume" title="http://www.eurexclearing.com/clearing-en/markets-services/eurex-otc-clear/interest-rate-swaps/clearing-volume"&gt;Eurex Clearing - Clearing volume&lt;/A&gt; does not have any HTML tables but has data in lists. Is there still a way to pull this into Qlikview? Thanks. &lt;/P&gt;&lt;/BODY&gt;&lt;/HTML&gt;</description>
      <pubDate>Wed, 13 Apr 2016 07:27:37 GMT</pubDate>
      <guid>https://community.qlik.com/t5/QlikView/Scrape-website/m-p/1023893#M346152</guid>
      <dc:creator>sifatnabil</dc:creator>
      <dc:date>2016-04-13T07:27:37Z</dc:date>
    </item>
    <item>
      <title>Re: Scrape website</title>
      <link>https://community.qlik.com/t5/QlikView/Scrape-website/m-p/1023894#M346153</link>
      <description>&lt;HTML&gt;&lt;HEAD&gt;&lt;/HEAD&gt;&lt;BODY&gt;&lt;P&gt;Yes it is possible. I have done it by retrieving the entire HTML page as text. Then I use TextBetween() and other text functions to get the info I want.&lt;/P&gt;&lt;P&gt;&lt;/P&gt;&lt;P&gt;The trick is to deselect HTML as format with the Web File wizard and choose FIXED as format. Then all the HTML text-lines will be retrieved into one field.&lt;/P&gt;&lt;P&gt;&lt;/P&gt;&lt;P&gt;The load script will look like this:&lt;/P&gt;&lt;P&gt;&lt;/P&gt;&lt;PRE __default_attr="sql" __jive_macro_name="code" class="jive_macro_code _jivemacro_uid_14605421313516629 jive_text_macro" jivemacro_uid="_14605421313516629"&gt;
&lt;P&gt;ALLHTML:&lt;/P&gt;
&lt;P&gt;LOAD&lt;/P&gt;
&lt;P&gt;&amp;nbsp;&amp;nbsp;&amp;nbsp; Concat(Line, Chr(13) &amp;amp; Chr(10) , R ) AS HTML&amp;nbsp;&amp;nbsp;&amp;nbsp; // merge the table lines into a single field with linefeeds&lt;/P&gt;
&lt;P&gt;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp; // R is to get them concatenated in the right order.&lt;/P&gt;
&lt;P&gt;;&lt;/P&gt;
&lt;P&gt;LOAD&lt;/P&gt;
&lt;P&gt;&amp;nbsp;&amp;nbsp;&amp;nbsp; RecNo() AS R,&lt;/P&gt;
&lt;P&gt;&amp;nbsp;&amp;nbsp;&amp;nbsp; [@1:n] AS Line&lt;/P&gt;
&lt;P&gt;FROM&lt;/P&gt;
&lt;P&gt;&lt;SPAN&gt;&amp;nbsp;&amp;nbsp;&amp;nbsp; [&lt;/SPAN&gt;&lt;A class="jive-link-external-small" href="http://www.eurexclearing.com/clearing-en/markets-services/eurex-otc-clear/interest-rate-swaps/clearing-volume" rel="nofollow" target="_blank"&gt;http://www.eurexclearing.com/clearing-en/markets-services/eurex-otc-clear/interest-rate-swaps/clearing-volume&lt;/A&gt;&lt;SPAN&gt;]&lt;/SPAN&gt;&lt;/P&gt;
&lt;P&gt;&amp;nbsp;&amp;nbsp;&amp;nbsp; (fix, utf8, no labels, no eof);&lt;/P&gt;
&lt;/PRE&gt;&lt;P&gt;&lt;/P&gt;&lt;P&gt;If you then refer to HTML in an expression you will get this single field as the full text of the page.&lt;/P&gt;&lt;/BODY&gt;&lt;/HTML&gt;</description>
      <pubDate>Wed, 13 Apr 2016 11:23:04 GMT</pubDate>
      <guid>https://community.qlik.com/t5/QlikView/Scrape-website/m-p/1023894#M346153</guid>
      <dc:creator>petter</dc:creator>
      <dc:date>2016-04-13T11:23:04Z</dc:date>
    </item>
  </channel>
</rss>

