<?xml version="1.0" encoding="UTF-8"?>
<rss xmlns:content="http://purl.org/rss/1.0/modules/content/" xmlns:dc="http://purl.org/dc/elements/1.1/" xmlns:rdf="http://www.w3.org/1999/02/22-rdf-syntax-ns#" xmlns:taxo="http://purl.org/rss/1.0/modules/taxonomy/" version="2.0">
  <channel>
    <title>topic Re: How to reduce a large time series dataset in SAS Procedures</title>
    <link>https://communities.sas.com/t5/SAS-Procedures/How-to-reduce-a-large-time-series-dataset/m-p/126216#M34676</link>
    <description>&lt;HTML&gt;&lt;HEAD&gt;&lt;/HEAD&gt;&lt;BODY&gt;&lt;P&gt;PG,&lt;/P&gt;&lt;P&gt;&lt;/P&gt;&lt;P&gt;Many thanks for this one, it worked perfectly. Apologies for the late reply, had the impression I had provided feedback&lt;/P&gt;&lt;P&gt;&lt;/P&gt;&lt;P&gt;Cheers&lt;/P&gt;&lt;P&gt;&lt;/P&gt;&lt;P&gt;Neo&lt;/P&gt;&lt;/BODY&gt;&lt;/HTML&gt;</description>
    <pubDate>Sun, 05 May 2013 10:52:13 GMT</pubDate>
    <dc:creator>machete</dc:creator>
    <dc:date>2013-05-05T10:52:13Z</dc:date>
    <item>
      <title>How to reduce a large time series dataset</title>
      <link>https://communities.sas.com/t5/SAS-Procedures/How-to-reduce-a-large-time-series-dataset/m-p/126214#M34674</link>
      <description>&lt;HTML&gt;&lt;HEAD&gt;&lt;/HEAD&gt;&lt;BODY&gt;&lt;P&gt;Dear all,&lt;/P&gt;&lt;P&gt;&lt;/P&gt;&lt;P&gt;This question partly originates from a larger problem currently addressed. For more info see below:&lt;/P&gt;&lt;P&gt;&lt;/P&gt;&lt;P&gt;&lt;A __default_attr="40685" __jive_macro_name="thread" class="jive_macro jive_macro_thread" href="https://communities.sas.com/"&gt;&lt;/A&gt;&lt;/P&gt;&lt;P&gt;&lt;/P&gt;&lt;P&gt;I have a large data set with 64 million observations containing high frequency (up to the second) data for currencies for a time period of 68 days.&lt;/P&gt;&lt;P&gt;&lt;/P&gt;&lt;P&gt;I would like to reduce this dataset to a one-minute interval, that is, to randomly pick 1 observation per minute for each currency. This should net 60x24=1440 observations per day per currency and around 100 000 (1440x68) per currency for the whole time period.&lt;/P&gt;&lt;P&gt;&lt;/P&gt;&lt;P&gt;Since I have around 10 currencies, the dataset will be reduced from 64 million to 10x100 000 = 1 million.&lt;/P&gt;&lt;P&gt;&lt;/P&gt;&lt;P&gt;Do you have any ideas on how to reduce the dataset based on my suggestion?&lt;/P&gt;&lt;P&gt;&lt;/P&gt;&lt;P&gt;I will then use this reduced dataset to overcome the computation difficulties that appear in the matching question post (see above link).&lt;/P&gt;&lt;P&gt;&lt;/P&gt;&lt;P&gt;Attached is a sample of the data set for only one currency.&lt;/P&gt;&lt;P&gt;&lt;/P&gt;&lt;P&gt;Thank you&lt;/P&gt;&lt;P&gt;&lt;/P&gt;&lt;P&gt;Best&lt;/P&gt;&lt;P&gt;&lt;/P&gt;&lt;P&gt;Neo&lt;/P&gt;&lt;/BODY&gt;&lt;/HTML&gt;</description>
      <pubDate>Sun, 03 Mar 2013 17:52:58 GMT</pubDate>
      <guid>https://communities.sas.com/t5/SAS-Procedures/How-to-reduce-a-large-time-series-dataset/m-p/126214#M34674</guid>
      <dc:creator>machete</dc:creator>
      <dc:date>2013-03-03T17:52:58Z</dc:date>
    </item>
    <item>
      <title>Re: How to reduce a large time series dataset</title>
      <link>https://communities.sas.com/t5/SAS-Procedures/How-to-reduce-a-large-time-series-dataset/m-p/126215#M34675</link>
      <description>&lt;HTML&gt;&lt;HEAD&gt;&lt;/HEAD&gt;&lt;BODY&gt;&lt;P&gt;If your full dataset is sorted by _RIC, date_G_ and time_G_, you could use surveyselect this way :&lt;/P&gt;&lt;P&gt;&lt;/P&gt;&lt;P&gt;&lt;STRONG style="font-size: 12pt; font-family: calibri, verdana, arial, sans-serif;"&gt;proc sql;&lt;/STRONG&gt;&lt;BR /&gt;&lt;STRONG style="font-size: 12pt; font-family: calibri, verdana, arial, sans-serif;"&gt;create view chfReuters3 as&lt;/STRONG&gt;&lt;BR /&gt;&lt;STRONG style="font-size: 12pt; font-family: calibri, verdana, arial, sans-serif;"&gt;select &lt;/STRONG&gt;&lt;/P&gt;&lt;P&gt;&lt;STRONG style="font-size: 12pt; font-family: calibri, verdana, arial, sans-serif;"&gt;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp; *, &lt;/STRONG&gt;&lt;/P&gt;&lt;P&gt;&lt;STRONG style="font-size: 12pt; font-family: calibri, verdana, arial, sans-serif;"&gt;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp; intnx("MINUTE", dhms(datepart(date_G_), hour(time_G_), minute(time_G_), second(time_G_)), 0) &lt;/STRONG&gt;&lt;BR /&gt;&lt;STRONG style="font-size: 12pt; font-family: calibri, verdana, arial, sans-serif;"&gt;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp; as minute format=datetime13.&lt;/STRONG&gt;&lt;BR /&gt;&lt;STRONG style="font-size: 12pt; font-family: calibri, verdana, arial, sans-serif;"&gt;from sasforum.chfReuters3;&lt;/STRONG&gt;&lt;BR /&gt;&lt;STRONG style="font-size: 12pt; font-family: calibri, verdana, arial, sans-serif;"&gt;quit;&lt;/STRONG&gt;&lt;/P&gt;&lt;P&gt;&lt;STRONG style="font-size: 12pt; font-family: calibri, verdana, arial, sans-serif;"&gt; &lt;/STRONG&gt;&lt;/P&gt;&lt;P&gt;&lt;STRONG style="font-size: 12pt; font-family: calibri, verdana, arial, sans-serif;"&gt;options nonotes; /* Prevents the printing of a note for every minute with only 1 obs */&lt;/STRONG&gt;&lt;/P&gt;&lt;P&gt;&lt;STRONG style="font-size: 12pt; font-family: calibri, verdana, arial, sans-serif;"&gt; &lt;/STRONG&gt;&lt;BR /&gt;&lt;STRONG 
style="font-size: 12pt; font-family: calibri, verdana, arial, sans-serif;"&gt;proc surveyselect data=chfReuters3 out=chfReutersMinute method=srs sampsize=1;&lt;/STRONG&gt;&lt;BR /&gt;&lt;STRONG style="font-size: 12pt; font-family: calibri, verdana, arial, sans-serif;"&gt;strata _RIC minute;&lt;/STRONG&gt;&lt;BR /&gt;&lt;STRONG style="font-size: 12pt; font-family: calibri, verdana, arial, sans-serif;"&gt;run;&lt;/STRONG&gt;&lt;/P&gt;&lt;P&gt;&lt;STRONG style="font-size: 12pt; font-family: calibri, verdana, arial, sans-serif;"&gt; &lt;/STRONG&gt;&lt;/P&gt;&lt;P&gt;&lt;STRONG style="font-size: 12pt; font-family: calibri, verdana, arial, sans-serif;"&gt;options notes;&lt;/STRONG&gt;&lt;/P&gt;&lt;P&gt;&lt;/P&gt;&lt;P&gt;PG&lt;/P&gt;&lt;/BODY&gt;&lt;/HTML&gt;</description>
      <pubDate>Sun, 03 Mar 2013 21:06:03 GMT</pubDate>
      <guid>https://communities.sas.com/t5/SAS-Procedures/How-to-reduce-a-large-time-series-dataset/m-p/126215#M34675</guid>
      <dc:creator>PGStats</dc:creator>
      <dc:date>2013-03-03T21:06:03Z</dc:date>
    </item>
    <item>
      <title>Re: How to reduce a large time series dataset</title>
      <link>https://communities.sas.com/t5/SAS-Procedures/How-to-reduce-a-large-time-series-dataset/m-p/126216#M34676</link>
      <description>&lt;HTML&gt;&lt;HEAD&gt;&lt;/HEAD&gt;&lt;BODY&gt;&lt;P&gt;PG,&lt;/P&gt;&lt;P&gt;&lt;/P&gt;&lt;P&gt;Many thanks for this one, it worked perfectly. Apologies for the late reply, had the impression I had provided feedback&lt;/P&gt;&lt;P&gt;&lt;/P&gt;&lt;P&gt;Cheers&lt;/P&gt;&lt;P&gt;&lt;/P&gt;&lt;P&gt;Neo&lt;/P&gt;&lt;/BODY&gt;&lt;/HTML&gt;</description>
      <pubDate>Sun, 05 May 2013 10:52:13 GMT</pubDate>
      <guid>https://communities.sas.com/t5/SAS-Procedures/How-to-reduce-a-large-time-series-dataset/m-p/126216#M34676</guid>
      <dc:creator>machete</dc:creator>
      <dc:date>2013-05-05T10:52:13Z</dc:date>
    </item>
  </channel>
</rss>

