<?xml version="1.0" encoding="UTF-8"?>
<rss xmlns:content="http://purl.org/rss/1.0/modules/content/" xmlns:dc="http://purl.org/dc/elements/1.1/" xmlns:rdf="http://www.w3.org/1999/02/22-rdf-syntax-ns#" xmlns:taxo="http://purl.org/rss/1.0/modules/taxonomy/" version="2.0">
  <channel>
    <title>topic Dataextraction from a Webpage in QlikView</title>
    <link>https://community.qlik.com/t5/QlikView/Dataextraction-from-a-Webpage/m-p/202102#M59928</link>
    <description>&lt;HTML&gt;&lt;HEAD&gt;&lt;/HEAD&gt;&lt;BODY&gt;&lt;P&gt;Dear Experts,&lt;/P&gt;&lt;P&gt;I am trying to extract data from a webpage, so far nothing special, but I am not able to extract the data. The URL reads&lt;/P&gt;&lt;P&gt;http://en.chineseshipping.com.cn/html/ccfi.asp&lt;/P&gt;&lt;P&gt;The required data should reside in table @8, but QV extracts only the header and columns, not the values themselves (nor the dates in the header). I could not find anything in the source code of the page either. It looks as if the data are somehow generated on top of the existing webpage - does anyone have a solution for this?&lt;/P&gt;&lt;P&gt;&lt;IMG alt="error loading image" class="jive-image error-loading-image" src="https://community.qlik.com/legacyfs/online/-2362_sourceID:2362" /&gt;&lt;/P&gt;&lt;P&gt;Peter&lt;/P&gt;&lt;P&gt;&lt;/P&gt;&lt;/BODY&gt;&lt;/HTML&gt;</description>
    <pubDate>Wed, 15 Sep 2010 13:13:54 GMT</pubDate>
    <dc:creator>prieper</dc:creator>
    <dc:date>2010-09-15T13:13:54Z</dc:date>
    <item>
      <title>Dataextraction from a Webpage</title>
      <link>https://community.qlik.com/t5/QlikView/Dataextraction-from-a-Webpage/m-p/202102#M59928</link>
      <description>&lt;HTML&gt;&lt;HEAD&gt;&lt;/HEAD&gt;&lt;BODY&gt;&lt;P&gt;Dear Experts,&lt;/P&gt;&lt;P&gt;I am trying to extract data from a webpage, so far nothing special, but I am not able to extract the data. The URL reads&lt;/P&gt;&lt;P&gt;http://en.chineseshipping.com.cn/html/ccfi.asp&lt;/P&gt;&lt;P&gt;The required data should reside in table @8, but QV extracts only the header and columns, not the values themselves (nor the dates in the header). I could not find anything in the source code of the page either. It looks as if the data are somehow generated on top of the existing webpage - does anyone have a solution for this?&lt;/P&gt;&lt;P&gt;&lt;IMG alt="error loading image" class="jive-image error-loading-image" src="https://community.qlik.com/legacyfs/online/-2362_sourceID:2362" /&gt;&lt;/P&gt;&lt;P&gt;Peter&lt;/P&gt;&lt;P&gt;&lt;/P&gt;&lt;/BODY&gt;&lt;/HTML&gt;</description>
      <pubDate>Wed, 15 Sep 2010 13:13:54 GMT</pubDate>
      <guid>https://community.qlik.com/t5/QlikView/Dataextraction-from-a-Webpage/m-p/202102#M59928</guid>
      <dc:creator>prieper</dc:creator>
      <dc:date>2010-09-15T13:13:54Z</dc:date>
    </item>
    <item>
      <title>Dataextraction from a Webpage</title>
      <link>https://community.qlik.com/t5/QlikView/Dataextraction-from-a-Webpage/m-p/202103#M59929</link>
      <description>&lt;HTML&gt;&lt;HEAD&gt;&lt;/HEAD&gt;&lt;BODY&gt;&lt;P&gt;Pretty tricky one. I know developers in China are very smart.&lt;/P&gt;&lt;P&gt;I think you need to do IE automation to open the page and then save it as a text file on your hard drive. Then in QV script you need to read the text file and parse out the stuff you want. I don't know why it doesn't show contents right when you save as html, but save as text shows the numbers you are looking for.&lt;/P&gt;&lt;P&gt;Something like this should help: &lt;A href="http://www.experts-exchange.com/Programming/Languages/Visual_Basic/VB_Script/Q_22786372.html"&gt;http://www.experts-exchange.com/Programming/Languages/Visual_Basic/VB_Script/Q_22786372.html&lt;/A&gt;&lt;/P&gt;&lt;P&gt;Sorry, not a 100% solution, but may give you some ideas.&lt;/P&gt;&lt;P&gt;Rakesh&lt;/P&gt;&lt;/BODY&gt;&lt;/HTML&gt;</description>
      <pubDate>Wed, 15 Sep 2010 15:39:30 GMT</pubDate>
      <guid>https://community.qlik.com/t5/QlikView/Dataextraction-from-a-Webpage/m-p/202103#M59929</guid>
      <dc:creator>disqr_rm</dc:creator>
      <dc:date>2010-09-15T15:39:30Z</dc:date>
    </item>
    <item>
      <title>Dataextraction from a Webpage</title>
      <link>https://community.qlik.com/t5/QlikView/Dataextraction-from-a-Webpage/m-p/202104#M59930</link>
      <description>&lt;HTML&gt;&lt;HEAD&gt;&lt;/HEAD&gt;&lt;BODY&gt;&lt;P&gt;Hi Peter, looks like the actual values that appear in the table are being loaded asynchronously (note the 'I'm doing something in the background' progress wheel that displays until the table's populated) once the web page itself has loaded, hence they don't appear in the html source.&lt;/P&gt;&lt;P&gt;You may want to google around "screen scraping ajax" for pointers on how to figure out how a given site's set up to grab data asynch... (almost certainly some javascript (the 'j' in ajax) in the mix somewhere).&lt;/P&gt;&lt;P&gt;Good luck, Jason&lt;/P&gt;&lt;/BODY&gt;&lt;/HTML&gt;</description>
      <pubDate>Wed, 15 Sep 2010 16:39:20 GMT</pubDate>
      <guid>https://community.qlik.com/t5/QlikView/Dataextraction-from-a-Webpage/m-p/202104#M59930</guid>
      <dc:creator />
      <dc:date>2010-09-15T16:39:20Z</dc:date>
    </item>
    <item>
      <title>Dataextraction from a Webpage</title>
      <link>https://community.qlik.com/t5/QlikView/Dataextraction-from-a-Webpage/m-p/202105#M59931</link>
      <description>&lt;HTML&gt;&lt;HEAD&gt;&lt;/HEAD&gt;&lt;BODY&gt;&lt;P&gt;Thanks Jason,&lt;/P&gt;&lt;P&gt;played around a bit, but still looks to be pretty cumbersome.&lt;/P&gt;&lt;P&gt;++ Peter&lt;/P&gt;&lt;/BODY&gt;&lt;/HTML&gt;</description>
      <pubDate>Mon, 20 Sep 2010 10:01:30 GMT</pubDate>
      <guid>https://community.qlik.com/t5/QlikView/Dataextraction-from-a-Webpage/m-p/202105#M59931</guid>
      <dc:creator>prieper</dc:creator>
      <dc:date>2010-09-20T10:01:30Z</dc:date>
    </item>
  </channel>
</rss>

