<?xml version="1.0" encoding="UTF-8"?>
<rss xmlns:content="http://purl.org/rss/1.0/modules/content/" xmlns:dc="http://purl.org/dc/elements/1.1/" xmlns:rdf="http://www.w3.org/1999/02/22-rdf-syntax-ns#" xmlns:taxo="http://purl.org/rss/1.0/modules/taxonomy/" version="2.0">
  <channel>
    <title>topic Re: help to convert html files into text files in SAS Procedures</title>
    <link>https://communities.sas.com/t5/SAS-Procedures/help-to-convert-html-files-into-text-files/m-p/116183#M32053</link>
    <description>&lt;HTML&gt;&lt;HEAD&gt;&lt;/HEAD&gt;&lt;BODY&gt;&lt;P&gt;The html files are 10-k reports from SEC edgar. I want to convert these html files into text files. I also have url of these html files.&lt;/P&gt;&lt;/BODY&gt;&lt;/HTML&gt;</description>
    <pubDate>Wed, 16 May 2012 04:56:38 GMT</pubDate>
    <dc:creator>shalmali</dc:creator>
    <dc:date>2012-05-16T04:56:38Z</dc:date>
    <item>
      <title>help to convert html files into text files</title>
      <link>https://communities.sas.com/t5/SAS-Procedures/help-to-convert-html-files-into-text-files/m-p/116179#M32049</link>
      <description>&lt;HTML&gt;&lt;HEAD&gt;&lt;/HEAD&gt;&lt;BODY&gt;&lt;P&gt;Hello Everyone,&lt;/P&gt;&lt;P&gt;&lt;/P&gt;&lt;P&gt;I have almost 12000 html files. I want to convert these html files into text files. Is there any code to import html files in sas and convert it in to text file?&lt;/P&gt;&lt;P&gt;&lt;/P&gt;&lt;P&gt;Thank you for your time.&lt;/P&gt;&lt;/BODY&gt;&lt;/HTML&gt;</description>
      <pubDate>Wed, 16 May 2012 00:44:58 GMT</pubDate>
      <guid>https://communities.sas.com/t5/SAS-Procedures/help-to-convert-html-files-into-text-files/m-p/116179#M32049</guid>
      <dc:creator>shalmali</dc:creator>
      <dc:date>2012-05-16T00:44:58Z</dc:date>
    </item>
    <item>
      <title>Re: help to convert html files into text files</title>
      <link>https://communities.sas.com/t5/SAS-Procedures/help-to-convert-html-files-into-text-files/m-p/116180#M32050</link>
      <description>&lt;HTML&gt;&lt;HEAD&gt;&lt;/HEAD&gt;&lt;BODY&gt;&lt;P&gt;You should just search for html to text converters on the web.&amp;nbsp; Or perhaps html to xml.&lt;/P&gt;&lt;P&gt;If the format is very clean you might be able to read it with a data step.&lt;/P&gt;&lt;P&gt;You might also look into reading them into Excel and then importing into SAS from excel.&lt;/P&gt;&lt;/BODY&gt;&lt;/HTML&gt;</description>
      <pubDate>Wed, 16 May 2012 00:52:10 GMT</pubDate>
      <guid>https://communities.sas.com/t5/SAS-Procedures/help-to-convert-html-files-into-text-files/m-p/116180#M32050</guid>
      <dc:creator>Tom</dc:creator>
      <dc:date>2012-05-16T00:52:10Z</dc:date>
    </item>
    <item>
      <title>Re: help to convert html files into text files</title>
      <link>https://communities.sas.com/t5/SAS-Procedures/help-to-convert-html-files-into-text-files/m-p/116181#M32051</link>
      <description>&lt;HTML&gt;&lt;HEAD&gt;&lt;/HEAD&gt;&lt;BODY&gt;&lt;P&gt;Can you provide one as an example?&lt;/P&gt;&lt;/BODY&gt;&lt;/HTML&gt;</description>
      <pubDate>Wed, 16 May 2012 01:37:09 GMT</pubDate>
      <guid>https://communities.sas.com/t5/SAS-Procedures/help-to-convert-html-files-into-text-files/m-p/116181#M32051</guid>
      <dc:creator>art297</dc:creator>
      <dc:date>2012-05-16T01:37:09Z</dc:date>
    </item>
    <item>
      <title>Re: help to convert html files into text files</title>
      <link>https://communities.sas.com/t5/SAS-Procedures/help-to-convert-html-files-into-text-files/m-p/116182#M32052</link>
      <description>&lt;HTML&gt;&lt;HEAD&gt;&lt;/HEAD&gt;&lt;BODY&gt;&lt;P&gt;The simplest way is using OLEDB .&lt;/P&gt;&lt;P&gt;&lt;A __default_attr="116355" __jive_macro_name="message" class="jive_macro jive_macro_message" href="https://communities.sas.com/"&gt;&lt;/A&gt;&lt;/P&gt;&lt;/BODY&gt;&lt;/HTML&gt;</description>
      <pubDate>Wed, 16 May 2012 02:53:48 GMT</pubDate>
      <guid>https://communities.sas.com/t5/SAS-Procedures/help-to-convert-html-files-into-text-files/m-p/116182#M32052</guid>
      <dc:creator>Ksharp</dc:creator>
      <dc:date>2012-05-16T02:53:48Z</dc:date>
    </item>
    <item>
      <title>Re: help to convert html files into text files</title>
      <link>https://communities.sas.com/t5/SAS-Procedures/help-to-convert-html-files-into-text-files/m-p/116183#M32053</link>
      <description>&lt;HTML&gt;&lt;HEAD&gt;&lt;/HEAD&gt;&lt;BODY&gt;&lt;P&gt;The html files are 10-k reports from SEC edgar. I want to convert these html files into text files. I also have url of these html files.&lt;/P&gt;&lt;/BODY&gt;&lt;/HTML&gt;</description>
      <pubDate>Wed, 16 May 2012 04:56:38 GMT</pubDate>
      <guid>https://communities.sas.com/t5/SAS-Procedures/help-to-convert-html-files-into-text-files/m-p/116183#M32053</guid>
      <dc:creator>shalmali</dc:creator>
      <dc:date>2012-05-16T04:56:38Z</dc:date>
    </item>
    <item>
      <title>Re: help to convert html files into text files</title>
      <link>https://communities.sas.com/t5/SAS-Procedures/help-to-convert-html-files-into-text-files/m-p/116184#M32054</link>
      <description>&lt;HTML&gt;&lt;HEAD&gt;&lt;/HEAD&gt;&lt;BODY&gt;&lt;P&gt;Oh. Maybe you should firstly download all these htmls at your local PC by using PROC HTTP or filename+url .Then using the method I posted convert it into SAS Datasets ,and use proc export to export txt files.&lt;/P&gt;&lt;P&gt;It is easy. I think. &lt;img id="smileyhappy" class="emoticon emoticon-smileyhappy" src="https://communities.sas.com/i/smilies/16x16_smiley-happy.png" alt="Smiley Happy" title="Smiley Happy" /&gt;&lt;/P&gt;&lt;P&gt;&lt;/P&gt;&lt;P&gt;Ksharp&lt;/P&gt;&lt;/BODY&gt;&lt;/HTML&gt;</description>
      <pubDate>Wed, 16 May 2012 06:13:06 GMT</pubDate>
      <guid>https://communities.sas.com/t5/SAS-Procedures/help-to-convert-html-files-into-text-files/m-p/116184#M32054</guid>
      <dc:creator>Ksharp</dc:creator>
      <dc:date>2012-05-16T06:13:06Z</dc:date>
    </item>
  </channel>
</rss>

