<?xml version="1.0" encoding="UTF-8"?>
<rss xmlns:content="http://purl.org/rss/1.0/modules/content/" xmlns:dc="http://purl.org/dc/elements/1.1/" xmlns:rdf="http://www.w3.org/1999/02/22-rdf-syntax-ns#" xmlns:taxo="http://purl.org/rss/1.0/modules/taxonomy/" version="2.0">
  <channel>
    <title>topic Re: Need to extract data from pdf file in SAS Data Science</title>
    <link>https://communities.sas.com/t5/SAS-Data-Science/Need-to-extract-data-from-pdf-file/m-p/484284#M9935</link>
    <description>&lt;P&gt;Thank you for your help. In may case getting something out of the "official list" is discouraging. In any case will see what&amp;nbsp;can be done. Kind regards&lt;/P&gt;&lt;BLOCKQUOTE&gt;&lt;HR /&gt;&lt;a href="https://communities.sas.com/t5/user/viewprofilepage/user-id/45151"&gt;@RW9&lt;/a&gt;&amp;nbsp;wrote:&lt;BR /&gt;&lt;P&gt;IT are not your enemy, there will be a way of getting the required software, just ask them.&amp;nbsp; Much the same as you would need to get Adobe, or Text Miner or something else.&amp;nbsp;&amp;nbsp;&lt;/P&gt;&lt;HR /&gt;&lt;/BLOCKQUOTE&gt;&lt;P&gt;&lt;BR /&gt;&amp;nbsp;&lt;/P&gt;</description>
    <pubDate>Mon, 06 Aug 2018 07:46:59 GMT</pubDate>
    <dc:creator>marcelo_higasi</dc:creator>
    <dc:date>2018-08-06T07:46:59Z</dc:date>
    <item>
      <title>Need to extract data from pdf file</title>
      <link>https://communities.sas.com/t5/SAS-Data-Science/Need-to-extract-data-from-pdf-file/m-p/483338#M9926</link>
      <description>&lt;P&gt;Hello,&lt;/P&gt;&lt;P&gt;I need to extract data from PDF documents. Is there a way to do it using some SAS procedure or SAS coding.&lt;/P&gt;&lt;P&gt;I saw a case where R was required. Unfortunately this is not an option for me my company would not allow use of this software.&lt;/P&gt;&lt;P&gt;&amp;nbsp;&lt;/P&gt;&lt;P&gt;I saw a module called SAS® Text Miner 14.2. It seems to handle PDF but I am not sure if it requires a separate license for it.&lt;/P&gt;&lt;P&gt;&amp;nbsp;&lt;/P&gt;&lt;P&gt;Does anyone know?&lt;/P&gt;&lt;P&gt;&amp;nbsp;&lt;/P&gt;&lt;P&gt;Thank you,&lt;/P&gt;&lt;P&gt;Marcelo&lt;/P&gt;</description>
      <pubDate>Thu, 02 Aug 2018 10:37:31 GMT</pubDate>
      <guid>https://communities.sas.com/t5/SAS-Data-Science/Need-to-extract-data-from-pdf-file/m-p/483338#M9926</guid>
      <dc:creator>marcelo_higasi</dc:creator>
      <dc:date>2018-08-02T10:37:31Z</dc:date>
    </item>
    <item>
      <title>Re: Need to extract data from pdf file</title>
      <link>https://communities.sas.com/t5/SAS-Data-Science/Need-to-extract-data-from-pdf-file/m-p/483360#M9927</link>
      <description>&lt;P&gt;Yes, text miner will be a licensed product, contact SAS for pricing.&lt;/P&gt;
&lt;P&gt;Why is R not an option?&amp;nbsp; It's free, and if it does the job, use it.&lt;/P&gt;
&lt;P&gt;In normal SAS, no, there is no simple way of reading a PDF.&amp;nbsp; Extracting data from PDFs is a very complex and tricky process, and I highly recommend not going down that route.&amp;nbsp; Return to the source data, or if that is not possible, requisition some data entry.&lt;/P&gt;</description>
      <pubDate>Thu, 02 Aug 2018 12:13:04 GMT</pubDate>
      <guid>https://communities.sas.com/t5/SAS-Data-Science/Need-to-extract-data-from-pdf-file/m-p/483360#M9927</guid>
      <dc:creator>RW9</dc:creator>
      <dc:date>2018-08-02T12:13:04Z</dc:date>
    </item>
    <item>
      <title>Re: Need to extract data from pdf file</title>
      <link>https://communities.sas.com/t5/SAS-Data-Science/Need-to-extract-data-from-pdf-file/m-p/483417#M9928</link>
      <description>&lt;P&gt;Adobe Professional has the capability to transfer the text/data out and that's the easiest and most accurate method I've found. Besides using Nvivo or a text mining tool.&amp;nbsp;&lt;/P&gt;
&lt;P&gt;&amp;nbsp;&lt;/P&gt;
&lt;BLOCKQUOTE&gt;&lt;HR /&gt;&lt;a href="https://communities.sas.com/t5/user/viewprofilepage/user-id/112066"&gt;@marcelo_higasi&lt;/a&gt;&amp;nbsp;wrote:&lt;BR /&gt;
&lt;P&gt;Hello,&lt;/P&gt;
&lt;P&gt;I need to extract data from PDF documents. Is there a way to do it using some SAS procedure or SAS coding.&lt;/P&gt;
&lt;P&gt;I saw a case where R was required. Unfortunately this is not an option for me my company would not allow use of this software.&lt;/P&gt;
&lt;P&gt;&amp;nbsp;&lt;/P&gt;
&lt;P&gt;I saw a module called SAS® Text Miner 14.2. It seems to handle PDF but I am not sure if it requires a separate license for it.&lt;/P&gt;
&lt;P&gt;&amp;nbsp;&lt;/P&gt;
&lt;P&gt;Does anyone know?&lt;/P&gt;
&lt;P&gt;&amp;nbsp;&lt;/P&gt;
&lt;P&gt;Thank you,&lt;/P&gt;
&lt;P&gt;Marcelo&lt;/P&gt;
&lt;HR /&gt;&lt;/BLOCKQUOTE&gt;
&lt;P&gt;&amp;nbsp;&lt;/P&gt;</description>
      <pubDate>Thu, 02 Aug 2018 14:36:46 GMT</pubDate>
      <guid>https://communities.sas.com/t5/SAS-Data-Science/Need-to-extract-data-from-pdf-file/m-p/483417#M9928</guid>
      <dc:creator>Reeza</dc:creator>
      <dc:date>2018-08-02T14:36:46Z</dc:date>
    </item>
    <item>
      <title>Re: Need to extract data from pdf file</title>
      <link>https://communities.sas.com/t5/SAS-Data-Science/Need-to-extract-data-from-pdf-file/m-p/483652#M9929</link>
      <description>&lt;P&gt;Thank you for the quick response.&lt;/P&gt;&lt;P&gt;R is not available at my company. I will need an alternative solution.&lt;/P&gt;&lt;P&gt;Kind regards&lt;/P&gt;</description>
      <pubDate>Fri, 03 Aug 2018 02:52:23 GMT</pubDate>
      <guid>https://communities.sas.com/t5/SAS-Data-Science/Need-to-extract-data-from-pdf-file/m-p/483652#M9929</guid>
      <dc:creator>marcelo_higasi</dc:creator>
      <dc:date>2018-08-03T02:52:23Z</dc:date>
    </item>
    <item>
      <title>Re: Need to extract data from pdf file</title>
      <link>https://communities.sas.com/t5/SAS-Data-Science/Need-to-extract-data-from-pdf-file/m-p/483654#M9930</link>
      <description>&lt;P&gt;Using PDF professional seems like a possible solution. Thank&amp;nbsp;you!&lt;/P&gt;</description>
      <pubDate>Fri, 03 Aug 2018 02:54:06 GMT</pubDate>
      <guid>https://communities.sas.com/t5/SAS-Data-Science/Need-to-extract-data-from-pdf-file/m-p/483654#M9930</guid>
      <dc:creator>marcelo_higasi</dc:creator>
      <dc:date>2018-08-03T02:54:06Z</dc:date>
    </item>
    <item>
      <title>Re: Need to extract data from pdf file</title>
      <link>https://communities.sas.com/t5/SAS-Data-Science/Need-to-extract-data-from-pdf-file/m-p/483693#M9931</link>
      <description>&lt;P&gt;Put it on a pen drive, it can be portable:&lt;/P&gt;
&lt;P&gt;&lt;A href="https://sourceforge.net/projects/rportable/" target="_blank"&gt;https://sourceforge.net/projects/rportable/&lt;/A&gt;&lt;/P&gt;
&lt;P&gt;&amp;nbsp;&lt;/P&gt;</description>
      <pubDate>Fri, 03 Aug 2018 07:51:37 GMT</pubDate>
      <guid>https://communities.sas.com/t5/SAS-Data-Science/Need-to-extract-data-from-pdf-file/m-p/483693#M9931</guid>
      <dc:creator>RW9</dc:creator>
      <dc:date>2018-08-03T07:51:37Z</dc:date>
    </item>
    <item>
      <title>Re: Need to extract data from pdf file</title>
      <link>https://communities.sas.com/t5/SAS-Data-Science/Need-to-extract-data-from-pdf-file/m-p/483946#M9932</link>
      <description>&lt;P&gt;My work has all USB connections blocked. &lt;span class="lia-unicode-emoji" title=":disappointed_face:"&gt;😞&lt;/span&gt;&amp;nbsp;&lt;/P&gt;</description>
      <pubDate>Fri, 03 Aug 2018 23:32:27 GMT</pubDate>
      <guid>https://communities.sas.com/t5/SAS-Data-Science/Need-to-extract-data-from-pdf-file/m-p/483946#M9932</guid>
      <dc:creator>Reeza</dc:creator>
      <dc:date>2018-08-03T23:32:27Z</dc:date>
    </item>
    <item>
      <title>Re: Need to extract data from pdf file</title>
      <link>https://communities.sas.com/t5/SAS-Data-Science/Need-to-extract-data-from-pdf-file/m-p/484280#M9933</link>
      <description>&lt;P&gt;IT are not your enemy, there will be a way of getting the required software, just ask them.&amp;nbsp; Much the same as you would need to get Adobe, or Text Miner or something else.&amp;nbsp;&amp;nbsp;&lt;/P&gt;</description>
      <pubDate>Mon, 06 Aug 2018 07:37:15 GMT</pubDate>
      <guid>https://communities.sas.com/t5/SAS-Data-Science/Need-to-extract-data-from-pdf-file/m-p/484280#M9933</guid>
      <dc:creator>RW9</dc:creator>
      <dc:date>2018-08-06T07:37:15Z</dc:date>
    </item>
    <item>
      <title>Re: Need to extract data from pdf file</title>
      <link>https://communities.sas.com/t5/SAS-Data-Science/Need-to-extract-data-from-pdf-file/m-p/484283#M9934</link>
      <description>&lt;P&gt;My work has all USB connections blocked too! &lt;span class="lia-unicode-emoji" title=":disappointed_face:"&gt;😞&lt;/span&gt;&lt;/P&gt;&lt;BLOCKQUOTE&gt;&lt;HR /&gt;&lt;a href="https://communities.sas.com/t5/user/viewprofilepage/user-id/45151"&gt;@RW9&lt;/a&gt;&amp;nbsp;wrote:&lt;BR /&gt;&lt;P&gt;Put it on a pen drive, it can be portable:&lt;/P&gt;&lt;P&gt;&lt;A href="https://sourceforge.net/projects/rportable/" target="_blank"&gt;https://sourceforge.net/projects/rportable/&lt;/A&gt;&lt;/P&gt;&lt;P&gt;&amp;nbsp;&lt;/P&gt;&lt;HR /&gt;&lt;/BLOCKQUOTE&gt;&lt;P&gt;&amp;nbsp;&lt;/P&gt;</description>
      <pubDate>Mon, 06 Aug 2018 07:43:47 GMT</pubDate>
      <guid>https://communities.sas.com/t5/SAS-Data-Science/Need-to-extract-data-from-pdf-file/m-p/484283#M9934</guid>
      <dc:creator>marcelo_higasi</dc:creator>
      <dc:date>2018-08-06T07:43:47Z</dc:date>
    </item>
    <item>
      <title>Re: Need to extract data from pdf file</title>
      <link>https://communities.sas.com/t5/SAS-Data-Science/Need-to-extract-data-from-pdf-file/m-p/484284#M9935</link>
      <description>&lt;P&gt;Thank you for your help. In may case getting something out of the "official list" is discouraging. In any case will see what&amp;nbsp;can be done. Kind regards&lt;/P&gt;&lt;BLOCKQUOTE&gt;&lt;HR /&gt;&lt;a href="https://communities.sas.com/t5/user/viewprofilepage/user-id/45151"&gt;@RW9&lt;/a&gt;&amp;nbsp;wrote:&lt;BR /&gt;&lt;P&gt;IT are not your enemy, there will be a way of getting the required software, just ask them.&amp;nbsp; Much the same as you would need to get Adobe, or Text Miner or something else.&amp;nbsp;&amp;nbsp;&lt;/P&gt;&lt;HR /&gt;&lt;/BLOCKQUOTE&gt;&lt;P&gt;&lt;BR /&gt;&amp;nbsp;&lt;/P&gt;</description>
      <pubDate>Mon, 06 Aug 2018 07:46:59 GMT</pubDate>
      <guid>https://communities.sas.com/t5/SAS-Data-Science/Need-to-extract-data-from-pdf-file/m-p/484284#M9935</guid>
      <dc:creator>marcelo_higasi</dc:creator>
      <dc:date>2018-08-06T07:46:59Z</dc:date>
    </item>
    <item>
      <title>Re: Need to extract data from pdf file</title>
      <link>https://communities.sas.com/t5/SAS-Data-Science/Need-to-extract-data-from-pdf-file/m-p/484288#M9936</link>
      <description>&lt;P&gt;Ahh, then that is easy.&amp;nbsp; Your response would be:&lt;/P&gt;
&lt;P&gt;PDF is not a datasource, it is next to impossible to extract anything from it.&amp;nbsp; Therefore there are three options:&lt;/P&gt;
&lt;P&gt;1) Go back to source and get appropriate data&lt;/P&gt;
&lt;P&gt;2)&amp;nbsp;Assign/hire someone to data entry all the data from the pdf&lt;/P&gt;
&lt;P&gt;3) Acquire tools to do such a task&lt;/P&gt;
&lt;P&gt;&amp;nbsp;&lt;/P&gt;
&lt;P&gt;It's up to your company which they choose, but saying none of those is possible makes your end impossible.&lt;/P&gt;
&lt;P&gt;&amp;nbsp;&lt;/P&gt;</description>
      <pubDate>Mon, 06 Aug 2018 07:58:51 GMT</pubDate>
      <guid>https://communities.sas.com/t5/SAS-Data-Science/Need-to-extract-data-from-pdf-file/m-p/484288#M9936</guid>
      <dc:creator>RW9</dc:creator>
      <dc:date>2018-08-06T07:58:51Z</dc:date>
    </item>
    <item>
      <title>Re: Need to extract data from pdf file</title>
      <link>https://communities.sas.com/t5/SAS-Data-Science/Need-to-extract-data-from-pdf-file/m-p/484489#M9937</link>
      <description>Hi Marcelo,&lt;BR /&gt;&lt;BR /&gt;As far as I am aware, the pdf conversion in Text miner is based on Apache Tika (&lt;A href="https://tika.apache.org/" target="_blank"&gt;https://tika.apache.org/&lt;/A&gt;) . I would consider these as a set of (Java based) programs which help in extracting data from a number of different document formats - pdfs, ppts, doc files etc.&lt;BR /&gt;You do not need to have Text Miner specifically to access Tika - if you explore your licences and happen to notice "Document Conversion Server" among your registered products - you may still be able to call the Tika program from the location / port where document conversion server is running.&lt;BR /&gt;In any case, you always have an option of installing and calling Tika from the command line interface. (It is a pretty lightweight utility)</description>
      <pubDate>Mon, 06 Aug 2018 18:52:48 GMT</pubDate>
      <guid>https://communities.sas.com/t5/SAS-Data-Science/Need-to-extract-data-from-pdf-file/m-p/484489#M9937</guid>
      <dc:creator>SundareshS</dc:creator>
      <dc:date>2018-08-06T18:52:48Z</dc:date>
    </item>
    <item>
      <title>Re: Need to extract data from pdf file</title>
      <link>https://communities.sas.com/t5/SAS-Data-Science/Need-to-extract-data-from-pdf-file/m-p/484526#M9938</link>
      <description>&lt;P&gt;Besides PDF files, there are several types of files that SAS can read in.&amp;nbsp; You can see a full list at the following URL:&lt;BR /&gt;&lt;BR /&gt;&amp;nbsp;&amp;nbsp; &lt;A href="http://go.documentation.sas.com/?docsetId=tmref&amp;amp;docsetTarget=n1f1hnf1pk8w3in1i2h4v94rty2m.htm&amp;amp;docsetVersion=14.3&amp;amp;locale=en#p1xbvpf5z67255n1j4w868q6e4sc" target="_blank"&gt;http://go.documentation.sas.com/?docsetId=tmref&amp;amp;docsetTarget=n1f1hnf1pk8w3in1i2h4v94rty2m.htm&amp;amp;docsetVersion=14.3&amp;amp;locale=en#p1xbvpf5z67255n1j4w868q6e4sc&lt;/A&gt;&lt;/P&gt;
&lt;P&gt;&amp;nbsp;&lt;/P&gt;
&lt;P&gt;&amp;nbsp;&lt;/P&gt;</description>
      <pubDate>Mon, 06 Aug 2018 20:35:16 GMT</pubDate>
      <guid>https://communities.sas.com/t5/SAS-Data-Science/Need-to-extract-data-from-pdf-file/m-p/484526#M9938</guid>
      <dc:creator>CraigDeVault</dc:creator>
      <dc:date>2018-08-06T20:35:16Z</dc:date>
    </item>
    <item>
      <title>Re: Need to extract data from pdf file</title>
      <link>https://communities.sas.com/t5/SAS-Data-Science/Need-to-extract-data-from-pdf-file/m-p/566805#M9939</link>
      <description>&lt;P&gt;You do not need to install R on your PC. You can use it directly on a cloud platform. See the following link; it might be helpful.&amp;nbsp;&lt;/P&gt;&lt;P&gt;link:&amp;nbsp;&lt;A href="https://rstudio.cloud/" target="_self"&gt;https://rstudio.cloud/&lt;/A&gt;&lt;/P&gt;</description>
      <pubDate>Tue, 18 Jun 2019 08:04:07 GMT</pubDate>
      <guid>https://communities.sas.com/t5/SAS-Data-Science/Need-to-extract-data-from-pdf-file/m-p/566805#M9939</guid>
      <dc:creator>surajmetha55</dc:creator>
      <dc:date>2019-06-18T08:04:07Z</dc:date>
    </item>
  </channel>
</rss>

