<?xml version="1.0" encoding="UTF-8"?>
<rss xmlns:content="http://purl.org/rss/1.0/modules/content/" xmlns:dc="http://purl.org/dc/elements/1.1/" xmlns:rdf="http://www.w3.org/1999/02/22-rdf-syntax-ns#" xmlns:taxo="http://purl.org/rss/1.0/modules/taxonomy/" version="2.0">
  <channel>
    <title>topic Re: Parallel Data Jobs in a Process Job in SAS Data Management</title>
    <link>https://communities.sas.com/t5/SAS-Data-Management/Parallel-Data-Jobs-in-a-Process-Job/m-p/148825#M2507</link>
    <description>&lt;HTML&gt;&lt;HEAD&gt;&lt;/HEAD&gt;&lt;BODY&gt;&lt;P&gt;Feature-wise, yes. &lt;EM&gt;How&lt;/EM&gt; is application-dependent.&lt;/P&gt;&lt;/BODY&gt;&lt;/HTML&gt;</description>
    <pubDate>Wed, 22 Jan 2014 15:06:10 GMT</pubDate>
    <dc:creator>LinusH</dc:creator>
    <dc:date>2014-01-22T15:06:10Z</dc:date>
    <item>
      <title>Parallel Data Jobs in a Process Job</title>
      <link>https://communities.sas.com/t5/SAS-Data-Management/Parallel-Data-Jobs-in-a-Process-Job/m-p/148824#M2506</link>
      <description>&lt;HTML&gt;&lt;HEAD&gt;&lt;/HEAD&gt;&lt;BODY&gt;&lt;P&gt;Hi all,&lt;/P&gt;&lt;P&gt;&lt;/P&gt;&lt;P&gt;I have created one process job, which contains 15 data job so it took about 10 hours in running a job with 1.6 million data, Is it possible to run the data jobs parallel so that it can reduce the time a bit ?&lt;/P&gt;&lt;P&gt;&lt;/P&gt;&lt;P&gt;Thanks and Regards&lt;/P&gt;&lt;P&gt;Joydip Ghosh&lt;/P&gt;&lt;/BODY&gt;&lt;/HTML&gt;</description>
      <pubDate>Wed, 22 Jan 2014 07:10:01 GMT</pubDate>
      <guid>https://communities.sas.com/t5/SAS-Data-Management/Parallel-Data-Jobs-in-a-Process-Job/m-p/148824#M2506</guid>
      <dc:creator>Joydip</dc:creator>
      <dc:date>2014-01-22T07:10:01Z</dc:date>
    </item>
    <item>
      <title>Re: Parallel Data Jobs in a Process Job</title>
      <link>https://communities.sas.com/t5/SAS-Data-Management/Parallel-Data-Jobs-in-a-Process-Job/m-p/148825#M2507</link>
      <description>&lt;HTML&gt;&lt;HEAD&gt;&lt;/HEAD&gt;&lt;BODY&gt;&lt;P&gt;Feature-wise, yes. &lt;EM&gt;How&lt;/EM&gt; is application-dependent.&lt;/P&gt;&lt;/BODY&gt;&lt;/HTML&gt;</description>
      <pubDate>Wed, 22 Jan 2014 15:06:10 GMT</pubDate>
      <guid>https://communities.sas.com/t5/SAS-Data-Management/Parallel-Data-Jobs-in-a-Process-Job/m-p/148825#M2507</guid>
      <dc:creator>LinusH</dc:creator>
      <dc:date>2014-01-22T15:06:10Z</dc:date>
    </item>
    <item>
      <title>Re: Parallel Data Jobs in a Process Job</title>
      <link>https://communities.sas.com/t5/SAS-Data-Management/Parallel-Data-Jobs-in-a-Process-Job/m-p/148826#M2508</link>
      <description>&lt;HTML&gt;&lt;HEAD&gt;&lt;/HEAD&gt;&lt;BODY&gt;&lt;P&gt;To be able to help you on how, please elaborate on how your job flow is built. How many separate data streams do you have, data/job dependencies, what HW resources are available to you?&lt;/P&gt;&lt;/BODY&gt;&lt;/HTML&gt;</description>
      <pubDate>Wed, 22 Jan 2014 15:08:17 GMT</pubDate>
      <guid>https://communities.sas.com/t5/SAS-Data-Management/Parallel-Data-Jobs-in-a-Process-Job/m-p/148826#M2508</guid>
      <dc:creator>LinusH</dc:creator>
      <dc:date>2014-01-22T15:08:17Z</dc:date>
    </item>
    <item>
      <title>Re: Parallel Data Jobs in a Process Job</title>
      <link>https://communities.sas.com/t5/SAS-Data-Management/Parallel-Data-Jobs-in-a-Process-Job/m-p/148827#M2509</link>
      <description>&lt;HTML&gt;&lt;HEAD&gt;&lt;/HEAD&gt;&lt;BODY&gt;&lt;P&gt;Hi Linus,&lt;/P&gt;&lt;P&gt;&lt;/P&gt;&lt;P&gt;The job has 15 data flows all are dependent on the 1st data flow node, which creates one value, but the other 14 are independent of all others. Now it is working like after completion of 1st node, 2nd node starts, then after completion of 2nd the 3rd starts. if we can do it parallel then I think it will be fast. How can we do that, should we require, Fork or Parallel iteration node transforms.&lt;/P&gt;&lt;P&gt;&lt;/P&gt;&lt;P&gt;Thanks and Regards&lt;/P&gt;&lt;P&gt;Joydip&lt;/P&gt;&lt;/BODY&gt;&lt;/HTML&gt;</description>
      <pubDate>Wed, 22 Jan 2014 15:24:10 GMT</pubDate>
      <guid>https://communities.sas.com/t5/SAS-Data-Management/Parallel-Data-Jobs-in-a-Process-Job/m-p/148827#M2509</guid>
      <dc:creator>Joydip</dc:creator>
      <dc:date>2014-01-22T15:24:10Z</dc:date>
    </item>
    <item>
      <title>Re: Parallel Data Jobs in a Process Job</title>
      <link>https://communities.sas.com/t5/SAS-Data-Management/Parallel-Data-Jobs-in-a-Process-Job/m-p/148828#M2510</link>
      <description>&lt;HTML&gt;&lt;HEAD&gt;&lt;/HEAD&gt;&lt;BODY&gt;&lt;P&gt;If I understand you correctly, that there are 14 different jobs, then I would build job dependencies using the Schedule Manager plugin in Management Console.&lt;/P&gt;&lt;P&gt;If there are one job but with different set of input data, I would solve it using Loop-transformation in DI Studio. Parallelism is managed by setting parameters accordingly.&lt;/P&gt;&lt;/BODY&gt;&lt;/HTML&gt;</description>
      <pubDate>Wed, 22 Jan 2014 16:09:19 GMT</pubDate>
      <guid>https://communities.sas.com/t5/SAS-Data-Management/Parallel-Data-Jobs-in-a-Process-Job/m-p/148828#M2510</guid>
      <dc:creator>LinusH</dc:creator>
      <dc:date>2014-01-22T16:09:19Z</dc:date>
    </item>
    <item>
      <title>Re: Parallel Data Jobs in a Process Job</title>
      <link>https://communities.sas.com/t5/SAS-Data-Management/Parallel-Data-Jobs-in-a-Process-Job/m-p/148829#M2511</link>
      <description>&lt;HTML&gt;&lt;HEAD&gt;&lt;/HEAD&gt;&lt;BODY&gt;&lt;P&gt;Joydip,&lt;/P&gt;&lt;P&gt;You can run the first data job then link it to a Fork Node which would contain all of the other 14 data jobs. The Fork node will allow the 14 jobs to run in parallel once the first node completes.&lt;/P&gt;&lt;P&gt;&lt;/P&gt;&lt;P&gt;See attached screenshot.&lt;/P&gt;&lt;P&gt;&lt;/P&gt;&lt;P&gt;-shawn&lt;/P&gt;&lt;BR /&gt;&lt;IMG src="https://communities.sas.com/t5/image/serverpage/image-id/11724iA781C67A7416A030/image-size/large?v=1.0&amp;amp;px=600" border="0" alt="fork_node.jpg" title="fork_node.jpg" /&gt;&lt;/BODY&gt;&lt;/HTML&gt;</description>
      <pubDate>Wed, 22 Jan 2014 16:31:36 GMT</pubDate>
      <guid>https://communities.sas.com/t5/SAS-Data-Management/Parallel-Data-Jobs-in-a-Process-Job/m-p/148829#M2511</guid>
      <dc:creator>skillman</dc:creator>
      <dc:date>2014-01-22T16:31:36Z</dc:date>
    </item>
    <item>
      <title>Re: Parallel Data Jobs in a Process Job</title>
      <link>https://communities.sas.com/t5/SAS-Data-Management/Parallel-Data-Jobs-in-a-Process-Job/m-p/148830#M2512</link>
      <description>&lt;HTML&gt;&lt;HEAD&gt;&lt;/HEAD&gt;&lt;BODY&gt;&lt;P&gt;So, you work in Data Flux, that information could have been useful... &lt;span class="lia-unicode-emoji" title=":winking_face:"&gt;😉&lt;/span&gt;&lt;/P&gt;&lt;/BODY&gt;&lt;/HTML&gt;</description>
      <pubDate>Wed, 22 Jan 2014 18:51:39 GMT</pubDate>
      <guid>https://communities.sas.com/t5/SAS-Data-Management/Parallel-Data-Jobs-in-a-Process-Job/m-p/148830#M2512</guid>
      <dc:creator>LinusH</dc:creator>
      <dc:date>2014-01-22T18:51:39Z</dc:date>
    </item>
    <item>
      <title>Re: Parallel Data Jobs in a Process Job</title>
      <link>https://communities.sas.com/t5/SAS-Data-Management/Parallel-Data-Jobs-in-a-Process-Job/m-p/148831#M2513</link>
      <description>&lt;HTML&gt;&lt;HEAD&gt;&lt;/HEAD&gt;&lt;BODY&gt;&lt;P&gt;Hi Linus, Shawn,&lt;/P&gt;&lt;P&gt;&lt;/P&gt;&lt;P&gt;Thanks for the update using Fork, but we are still facing a lot of Issue, sometimes&lt;/P&gt;&lt;P&gt;a) out of memory.&lt;/P&gt;&lt;P&gt;&lt;/P&gt;&lt;P&gt;Is there any way to control the memory to be allocated.&lt;/P&gt;&lt;P&gt;&lt;/P&gt;&lt;P&gt;Secondly all our data jobs are writing the exceptions into a same table so the connection is refused by the server as two threads are trying to update the same table at same point of time and the job fails, is there any alternative way.&lt;/P&gt;&lt;P&gt;&lt;/P&gt;&lt;P&gt;All suggestions are welcome.&lt;/P&gt;&lt;P&gt;&lt;/P&gt;&lt;P&gt;Thanks and Regards&lt;/P&gt;&lt;P&gt;Joydip&lt;/P&gt;&lt;/BODY&gt;&lt;/HTML&gt;</description>
      <pubDate>Mon, 27 Jan 2014 07:50:32 GMT</pubDate>
      <guid>https://communities.sas.com/t5/SAS-Data-Management/Parallel-Data-Jobs-in-a-Process-Job/m-p/148831#M2513</guid>
      <dc:creator>Joydip</dc:creator>
      <dc:date>2014-01-27T07:50:32Z</dc:date>
    </item>
    <item>
      <title>Re: Parallel Data Jobs in a Process Job</title>
      <link>https://communities.sas.com/t5/SAS-Data-Management/Parallel-Data-Jobs-in-a-Process-Job/m-p/148832#M2514</link>
      <description>&lt;HTML&gt;&lt;HEAD&gt;&lt;/HEAD&gt;&lt;BODY&gt;&lt;P&gt;Joydip,&lt;/P&gt;&lt;P&gt;Specifically which node is failing due to memory issues? There are node specific memory tweaks you can make. Also, how much physical memory is available on the computer that is running this job? What type of table are you writing the exceptions to? It sounds like it may be a table or a database that does not allow simultaneous connections.&lt;/P&gt;&lt;P&gt;&lt;/P&gt;&lt;P&gt;-shawn&lt;/P&gt;&lt;/BODY&gt;&lt;/HTML&gt;</description>
      <pubDate>Mon, 27 Jan 2014 13:58:41 GMT</pubDate>
      <guid>https://communities.sas.com/t5/SAS-Data-Management/Parallel-Data-Jobs-in-a-Process-Job/m-p/148832#M2514</guid>
      <dc:creator>skillman</dc:creator>
      <dc:date>2014-01-27T13:58:41Z</dc:date>
    </item>
    <item>
      <title>Re: Parallel Data Jobs in a Process Job</title>
      <link>https://communities.sas.com/t5/SAS-Data-Management/Parallel-Data-Jobs-in-a-Process-Job/m-p/148833#M2515</link>
      <description>&lt;HTML&gt;&lt;HEAD&gt;&lt;/HEAD&gt;&lt;BODY&gt;&lt;P&gt;Hi Shawn,&lt;/P&gt;&lt;P&gt;&lt;/P&gt;&lt;P&gt;Thanks for your reply, My system have 2GB Ram, and the database is an sql server database, and we are writing the exceptions to the table itself we are using macros to connect to the database and then write to the exception table. We are using an expression where we are opening and closing the connection and write the details with the help of that we are writing the exceptions records to the database. and this expression node is failing due to the memory issue.&lt;/P&gt;&lt;P&gt;&lt;/P&gt;&lt;P&gt;Thanks and Regards.&lt;/P&gt;&lt;P&gt;&lt;/P&gt;&lt;P&gt;Joydip&lt;/P&gt;&lt;/BODY&gt;&lt;/HTML&gt;</description>
      <pubDate>Mon, 27 Jan 2014 14:08:29 GMT</pubDate>
      <guid>https://communities.sas.com/t5/SAS-Data-Management/Parallel-Data-Jobs-in-a-Process-Job/m-p/148833#M2515</guid>
      <dc:creator>Joydip</dc:creator>
      <dc:date>2014-01-27T14:08:29Z</dc:date>
    </item>
    <item>
      <title>Re: Parallel Data Jobs in a Process Job</title>
      <link>https://communities.sas.com/t5/SAS-Data-Management/Parallel-Data-Jobs-in-a-Process-Job/m-p/148834#M2516</link>
      <description>&lt;HTML&gt;&lt;HEAD&gt;&lt;/HEAD&gt;&lt;BODY&gt;&lt;P&gt;Joydip,&lt;/P&gt;&lt;P&gt;SQL Server uses pessimistic concurrency by default: This is stated in the official MS documentation. Have you thought about using the Data Target (Insert) node and passing the macros into it? Opening and Closing the database through an expression may be another reason the job is failing. You can control commit intervals in the Data Target (Insert) node which could help performance as well.&lt;/P&gt;&lt;P&gt;&lt;/P&gt;&lt;P&gt;&lt;/P&gt;&lt;P&gt;&lt;/P&gt;&lt;P&gt;&lt;/P&gt;&lt;P&gt;Pessimistic Concurrency&lt;/P&gt;&lt;P&gt;Default behavior: acquire locks to block access to data that another process is using.&lt;/P&gt;&lt;P&gt;&lt;/P&gt;&lt;P&gt;&lt;/P&gt;&lt;P&gt;Optimistic Concurrency&lt;/P&gt;&lt;P&gt;Assumes that there are sufficiently few conflicting data modification operations in the system that any single transaction is unlikely to modify data that another transaction is modifying.&lt;/P&gt;&lt;P&gt;&lt;/P&gt;&lt;P&gt;&lt;/P&gt;&lt;P&gt;&lt;/P&gt;&lt;P&gt;&lt;/P&gt;&lt;P&gt;Hope this helps,&lt;/P&gt;&lt;P&gt;&lt;/P&gt;&lt;P&gt;&lt;/P&gt;&lt;P&gt;-shawn&lt;/P&gt;&lt;/BODY&gt;&lt;/HTML&gt;</description>
      <pubDate>Mon, 27 Jan 2014 16:06:26 GMT</pubDate>
      <guid>https://communities.sas.com/t5/SAS-Data-Management/Parallel-Data-Jobs-in-a-Process-Job/m-p/148834#M2516</guid>
      <dc:creator>skillman</dc:creator>
      <dc:date>2014-01-27T16:06:26Z</dc:date>
    </item>
  </channel>
</rss>

