<?xml version="1.0" encoding="UTF-8"?>
<rss xmlns:content="http://purl.org/rss/1.0/modules/content/" xmlns:dc="http://purl.org/dc/elements/1.1/" xmlns:rdf="http://www.w3.org/1999/02/22-rdf-syntax-ns#" xmlns:taxo="http://purl.org/rss/1.0/modules/taxonomy/" version="2.0">
  <channel>
    <title>topic Hi, Gennady in Intel® oneAPI Math Kernel Library</title>
    <link>https://community.intel.com/t5/Intel-oneAPI-Math-Kernel-Library/Create-8-VSLStreamStatePtr-affected-MKL-quot-dtrsm-quot-s/m-p/1156111#M27587</link>
    <description>&lt;P style="font-size: 19.512px;"&gt;Hi, Gennady&lt;/P&gt;

&lt;P style="font-size: 19.512px;"&gt;Thanks for your help.&lt;/P&gt;

&lt;P style="font-size: 19.512px;"&gt;I tried&amp;nbsp;&lt;SPAN style="font-size: 12px;"&gt;&amp;nbsp;set MKL_DISABLE_FAST_MM=1, but it makes the&amp;nbsp;dtrsm calls made before &lt;/SPAN&gt;creating the 8 VSLStreamStatePtr&amp;nbsp;become as slow as the calls made after creating them.&lt;/P&gt;

&lt;P style="font-size: 19.512px;"&gt;My code is linked with google's tcmalloc, which can be found in&amp;nbsp;gperftools-gperftools-2.5.&lt;/P&gt;

&lt;P style="font-size: 19.512px;"&gt;Adding an unused map before the code helps reproduce the issue; in the original code the map is a static map.&lt;/P&gt;

&lt;P&gt;#include &amp;lt;map&amp;gt;&lt;/P&gt;

&lt;P&gt;#include &amp;lt;iostream&amp;gt;&lt;/P&gt;

&lt;P&gt;#include &amp;lt;cstring&amp;gt;&lt;/P&gt;

&lt;P&gt;#include "mkl_vsl_functions.h"&lt;/P&gt;

&lt;P&gt;#include "mkl_vsl_defines.h"&lt;/P&gt;

&lt;P&gt;#include "mkl_blas.h"&lt;/P&gt;

&lt;P&gt;#include "mkl_service.h"&lt;/P&gt;

&lt;P&gt;&amp;nbsp;&lt;/P&gt;

&lt;P&gt;class aaaValue&lt;/P&gt;

&lt;P&gt;{&lt;/P&gt;

&lt;P&gt;public:&lt;/P&gt;

&lt;P&gt;&amp;nbsp;&lt;/P&gt;

&lt;P&gt;&amp;nbsp;&amp;nbsp;&amp;nbsp; ~aaaValue()&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp; { aaa(); }&lt;/P&gt;

&lt;P&gt;private:&lt;/P&gt;

&lt;P&gt;&amp;nbsp;&lt;/P&gt;

&lt;P&gt;&amp;nbsp;&amp;nbsp;&amp;nbsp; void aaa() {&lt;/P&gt;

&lt;P&gt;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp; if (val_.sval)&lt;/P&gt;

&lt;P&gt;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp; free(val_.sval);&lt;/P&gt;

&lt;P&gt;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp; val_.sval = 0;&lt;/P&gt;

&lt;P&gt;&amp;nbsp;&amp;nbsp;&amp;nbsp; }&lt;/P&gt;

&lt;P&gt;&amp;nbsp;&lt;/P&gt;

&lt;P&gt;private:&lt;/P&gt;

&lt;P&gt;&amp;nbsp;&amp;nbsp;&amp;nbsp; union { int ival; double dval; char* sval; }&amp;nbsp;&amp;nbsp;&amp;nbsp; val_;&lt;/P&gt;

&lt;P&gt;};&lt;/P&gt;

&lt;P&gt;&amp;nbsp;&lt;/P&gt;

&lt;P&gt;&amp;nbsp;&lt;/P&gt;

&lt;P&gt;int main(int argc, const char* argv[])&lt;/P&gt;

&lt;P&gt;{&lt;/P&gt;

&lt;P&gt;&amp;nbsp;&lt;/P&gt;

&lt;P&gt;&amp;nbsp;&amp;nbsp;&amp;nbsp; std::map&amp;lt;int, aaaValue&amp;gt; Map;&lt;/P&gt;

&lt;P&gt;&amp;nbsp;&lt;/P&gt;

&lt;P&gt;&amp;nbsp;&amp;nbsp;&amp;nbsp; int MmatrixARows=26;&lt;/P&gt;

&lt;P&gt;&amp;nbsp;&amp;nbsp;&amp;nbsp; int NmatrixBColumns=3;&lt;/P&gt;

&lt;P&gt;&amp;nbsp;&amp;nbsp;&amp;nbsp; double alpha=1;&lt;/P&gt;

&lt;P&gt;&amp;nbsp;&amp;nbsp;&amp;nbsp; int ldm=29;&lt;/P&gt;

&lt;P&gt;&amp;nbsp;&amp;nbsp;&amp;nbsp; double matrixA[87]={0.00311007,-1.12899e-05,-0.000141499,-1.82698e-14,-0.000785694,-1.98974e-14,-0.000778519,-2.71811e-14,-2.29056e-14,-2.7844e-14,-2.24393e-14,-3.12059e-14,-1.26095e-14,-4.47909e-10,-7.97785e-19,-1.74566e-07,-4.15789e-10,-2.17286e-29,-1.56053e-10,-1.34911e-12,-2.19906e-27,-3.5138e-09,-1.0398e-07,-5.29274e-06,-4.9252e-07,-8.93104e-05,-3.71938e-05,-1.28896e-09,-1.17735e-07,-3.26114e-08,0.00289051,-0.000149547,-2.34128e-13,-1.92531e-13,-0.000706043,-2.17513e-13,-3.48327e-13,-0.000670723,-3.56823e-13,-2.8756e-13,-3.99905e-13,-1.61591e-13,-5.73997e-09,-2.17241e-19,-1.42301e-08,-5.32835e-09,-5.47231e-30,-8.81321e-10,-3.39771e-13,-5.53829e-28,-8.70999e-10,-2.05336e-08,-5.30965e-06,-4.83782e-07,-8.84461e-05,-3.73614e-05,-1.5481e-11,-1.15641e-07,-4.02283e-07,-4.25622e-07,0.00303418,-0.00079269,-2.05185e-13,-2.71747e-13,-2.3181e-13,-0.000797297,-3.1283e-13,-3.80276e-13,-3.06461e-13,-4.2619e-13,-1.72212e-13,-6.11725e-09,-1.91907e-19,-1.90223e-07,-5.67858e-09,-4.75132e-30,-1.02734e-09,-2.95006e-13,-4.80861e-28,-5.38704e-10,-1.5342e-08,-1.98894e-06,-6.03159e-06,-8.35693e-05,-4.29327e-05,-1.62871e-10,-1.44174e-06};&lt;/P&gt;

&lt;P&gt;&amp;nbsp;&amp;nbsp;&amp;nbsp; double matrixB_ori[87]={-1.82698e-14,-0.000785694,-1.98974e-14,-0.000778519,-2.71811e-14,-2.29056e-14,-2.7844e-14,-2.24393e-14,-3.12059e-14,-1.26095e-14,-4.47909e-10,-7.97785e-19,-1.74566e-07,-4.15789e-10,-2.17286e-29,-1.56053e-10,-1.34911e-12,-2.19906e-27,-3.5138e-09,-1.0398e-07,-5.29274e-06,-4.9252e-07,-8.93104e-05,-3.71938e-05,-1.28896e-09,-1.17735e-07,-3.26114e-08,0.00289051,-0.000149547,-2.34128e-13,-1.92531e-13,-0.000706043,-2.17513e-13,-3.48327e-13,-0.000670723,-3.56823e-13,-2.8756e-13,-3.99905e-13,-1.61591e-13,-5.73997e-09,-2.17241e-19,-1.42301e-08,-5.32835e-09,-5.47231e-30,-8.81321e-10,-3.39771e-13,-5.53829e-28,-8.70999e-10,-2.05336e-08,-5.30965e-06,-4.83782e-07,-8.84461e-05,-3.73614e-05,-1.5481e-11,-1.15641e-07,-4.02283e-07,-4.25622e-07,0.00303418,-0.00079269,-2.05185e-13,-2.71747e-13,-2.3181e-13,-0.000797297,-3.1283e-13,-3.80276e-13,-3.06461e-13,-4.2619e-13,-1.72212e-13,-6.11725e-09,-1.91907e-19,-1.90223e-07,-5.67858e-09,-4.75132e-30,-1.02734e-09,-2.95006e-13,-4.80861e-28,-5.38704e-10,-1.5342e-08,-1.98894e-06,-6.03159e-06,-8.35693e-05,-4.29327e-05,-1.62871e-10,-1.44174e-06,-1.87786e-13,-2.49161e-13,-0.00079269};&lt;/P&gt;

&lt;P&gt;&amp;nbsp;&amp;nbsp;&amp;nbsp; double matrixB[87];&lt;/P&gt;

&lt;P&gt;&amp;nbsp;&lt;/P&gt;

&lt;P&gt;&amp;nbsp;&amp;nbsp;&amp;nbsp; int sweepCount = 1e5;&lt;/P&gt;

&lt;P&gt;&amp;nbsp;&amp;nbsp;&amp;nbsp; time_t time1, time2, time3, time4;&lt;/P&gt;

&lt;P&gt;&amp;nbsp;&amp;nbsp;&amp;nbsp; time(&amp;amp;time1);&lt;/P&gt;

&lt;P&gt;&amp;nbsp;&amp;nbsp;&amp;nbsp; for(int count = 0;&amp;nbsp; count &amp;lt; sweepCount; ++count) {&lt;/P&gt;

&lt;P&gt;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;memcpy(matrixB, matrixB_ori, sizeof(double)*87);&lt;/P&gt;

&lt;P&gt;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp; dtrsm("Right", "Upper", "No transpose", "Nunit", &amp;amp;MmatrixARows, &amp;amp;NmatrixBColumns, &amp;amp;alpha, matrixA, &amp;amp;ldm, matrixB, &amp;amp;ldm);&lt;/P&gt;

&lt;P&gt;&amp;nbsp;&amp;nbsp;&amp;nbsp; }&lt;/P&gt;

&lt;P&gt;&amp;nbsp;&amp;nbsp;&amp;nbsp; time(&amp;amp;time2);&lt;/P&gt;

&lt;P&gt;&amp;nbsp;&amp;nbsp;&amp;nbsp; std::cout&amp;lt;&amp;lt;" Before new 8 VSLStreamStatePtr time: "&amp;lt;&amp;lt;difftime(time2, time1)&amp;lt;&amp;lt;std::endl;&lt;/P&gt;

&lt;P&gt;&amp;nbsp;&lt;/P&gt;

&lt;P&gt;&amp;nbsp;&amp;nbsp;&amp;nbsp; VSLStreamStatePtr&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp; ptr_[8];&lt;/P&gt;

&lt;P&gt;&amp;nbsp;&amp;nbsp;&amp;nbsp; for(int i = 0; i &amp;lt; 8; ++i) {&lt;/P&gt;

&lt;P&gt;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp; vslNewStream(&amp;amp;ptr_[i], VSL_BRNG_MT2203 + i, 1);&lt;/P&gt;

&lt;P&gt;&amp;nbsp;&amp;nbsp;&amp;nbsp; }&lt;/P&gt;

&lt;P&gt;&amp;nbsp;&lt;/P&gt;

&lt;P&gt;&amp;nbsp;&amp;nbsp;&amp;nbsp; time(&amp;amp;time3);&lt;/P&gt;

&lt;P&gt;&amp;nbsp;&amp;nbsp;&amp;nbsp; for(int count = 0;&amp;nbsp; count &amp;lt; sweepCount; ++count) {&lt;/P&gt;

&lt;P&gt;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;memcpy(matrixB, matrixB_ori, sizeof(double)*87);&lt;/P&gt;

&lt;P&gt;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp; dtrsm("Right", "Upper", "No transpose", "Nunit", &amp;amp;MmatrixARows, &amp;amp;NmatrixBColumns, &amp;amp;alpha, matrixA, &amp;amp;ldm, matrixB, &amp;amp;ldm);&lt;/P&gt;

&lt;P&gt;&amp;nbsp;&amp;nbsp;&amp;nbsp; }&lt;/P&gt;

&lt;P&gt;&amp;nbsp;&amp;nbsp;&amp;nbsp; time(&amp;amp;time4);&lt;/P&gt;

&lt;P&gt;&amp;nbsp;&amp;nbsp;&amp;nbsp; std::cout&amp;lt;&amp;lt;"After new 8 VSLStreamStatePtr time: "&amp;lt;&amp;lt;difftime(time4, time3)&amp;lt;&amp;lt;std::endl;&lt;/P&gt;

&lt;P&gt;&amp;nbsp;&lt;/P&gt;

&lt;P&gt;}&lt;/P&gt;

&lt;P style="font-size: 19.512px;"&gt;&amp;nbsp;&lt;/P&gt;

&lt;P style="font-size: 19.512px;"&gt;&amp;nbsp;&lt;/P&gt;

&lt;P style="font-size: 19.512px;"&gt;&amp;nbsp;&lt;/P&gt;

&lt;P style="font-size: 19.512px;"&gt;&amp;nbsp;&lt;/P&gt;</description>
    <pubDate>Sat, 06 Jan 2018 00:03:26 GMT</pubDate>
    <dc:creator>jian_l_1</dc:creator>
    <dc:date>2018-01-06T00:03:26Z</dc:date>
    <item>
      <title>Create 8 VSLStreamStatePtr affected MKL "dtrsm"' s performance, include test code,issue still open</title>
      <link>https://community.intel.com/t5/Intel-oneAPI-Math-Kernel-Library/Create-8-VSLStreamStatePtr-affected-MKL-quot-dtrsm-quot-s/m-p/1156103#M27579</link>
      <description>&lt;P&gt;At first I want to generate random in multythreads in the following code:&lt;/P&gt;

&lt;P style="margin-right: 0cm; margin-left: 0cm; font-size: 12pt; font-family: 宋体; color: rgb(0, 0, 0); margin-bottom: 18pt; background-image: initial; background-position: initial; background-size: initial; background-repeat: initial; background-attachment: initial; background-origin: initial; background-clip: initial;"&gt;&lt;SPAN lang="EN-US" style="font-size: 9pt; font-family: Arial, sans-serif; color: rgb(83, 87, 94);"&gt;#define nstreams 8&lt;BR /&gt;
	VSLStreamStatePtr stream[nstreams];&lt;P&gt;&lt;/P&gt;&lt;/SPAN&gt;&lt;/P&gt;

&lt;P style="margin-right: 0cm; margin-left: 0cm; font-size: 12pt; font-family: 宋体; color: rgb(0, 0, 0); margin-bottom: 18pt; background-image: initial; background-position: initial; background-size: initial; background-repeat: initial; background-attachment: initial; background-origin: initial; background-clip: initial; word-wrap: break-word;"&gt;&lt;SPAN lang="EN-US" style="font-size: 9pt; font-family: Arial, sans-serif; color: rgb(83, 87, 94);"&gt;int k;&lt;BR /&gt;
	for ( k=0; k&amp;lt; nstreams; k++ )&lt;BR /&gt;
	{&lt;BR /&gt;
	vslNewStream( &amp;amp;stream[k], VSL_BRNG_MT2203+k, seed );&lt;BR /&gt;
	}&lt;/SPAN&gt;&lt;/P&gt;

&lt;P&gt;But I found that if I create 8&amp;nbsp;VSLStreamStatePtr, the performance of other MKL functions is affected (5 times slower than normal). The affected functions are:&lt;/P&gt;

&lt;P&gt;dtrsm("Right", "Upper", "No transpose", "Nunit", ...);&lt;/P&gt;

&lt;P&gt;&amp;nbsp;&lt;/P&gt;

&lt;P&gt;&amp;nbsp;&lt;/P&gt;

&lt;DIV&gt;&amp;nbsp;&lt;/DIV&gt;</description>
      <pubDate>Mon, 13 Nov 2017 15:06:35 GMT</pubDate>
      <guid>https://community.intel.com/t5/Intel-oneAPI-Math-Kernel-Library/Create-8-VSLStreamStatePtr-affected-MKL-quot-dtrsm-quot-s/m-p/1156103#M27579</guid>
      <dc:creator>jian_l_1</dc:creator>
      <dc:date>2017-11-13T15:06:35Z</dc:date>
    </item>
    <item>
      <title>Hi jian,</title>
      <link>https://community.intel.com/t5/Intel-oneAPI-Math-Kernel-Library/Create-8-VSLStreamStatePtr-affected-MKL-quot-dtrsm-quot-s/m-p/1156104#M27580</link>
      <description>&lt;P&gt;Hi jian,&lt;/P&gt;

&lt;P&gt;Here are some questions about your issue:&lt;/P&gt;

&lt;P&gt;1. How did you test the performance? Did you enable MKL_VERBOSE to check, or write a program to measure the clock time?&lt;BR /&gt;
	2. How about your problem size for trsv, gemv and trsm? and what about your seed for random data generation? Could you please provide a reproducer (just a sample case) that we can investigate?&lt;/P&gt;

&lt;P&gt;Thanks.&lt;/P&gt;

&lt;P&gt;Best regards,&lt;BR /&gt;
	Fiona&lt;/P&gt;</description>
      <pubDate>Tue, 14 Nov 2017 02:41:57 GMT</pubDate>
      <guid>https://community.intel.com/t5/Intel-oneAPI-Math-Kernel-Library/Create-8-VSLStreamStatePtr-affected-MKL-quot-dtrsm-quot-s/m-p/1156104#M27580</guid>
      <dc:creator>Zhen_Z_Intel</dc:creator>
      <dc:date>2017-11-14T02:41:57Z</dc:date>
    </item>
    <item>
      <title>Hi, Fiona</title>
      <link>https://community.intel.com/t5/Intel-oneAPI-Math-Kernel-Library/Create-8-VSLStreamStatePtr-affected-MKL-quot-dtrsm-quot-s/m-p/1156105#M27581</link>
      <description>&lt;P&gt;Hi, Fiona&lt;/P&gt;

&lt;P&gt;Thanks for your response.&lt;/P&gt;

&lt;P&gt;I need to correct the issue description: ONLY&amp;nbsp;&lt;SPAN style="font-size: 12px; line-height: 18px;"&gt;dtrsm is affected by creating 8 new streams with&amp;nbsp;vslNewStream.&lt;/SPAN&gt;&lt;/P&gt;

&lt;P&gt;Here is test code and result in my machine:&lt;/P&gt;

&lt;P&gt;result:&lt;/P&gt;

&lt;P&gt;Before new 8 VSLStreamStatePtr time: 1&lt;/P&gt;

&lt;P&gt;After new 8 VSLStreamStatePtr time: 12&lt;/P&gt;

&lt;DIV&gt;Code (c++):&lt;/DIV&gt;

&lt;DIV&gt;&amp;nbsp;&lt;/DIV&gt;

&lt;DIV&gt;
	&lt;P&gt;#include "mkl_vsl_functions.h"&lt;/P&gt;

	&lt;P&gt;#include "mkl_vsl_defines.h"&lt;/P&gt;

	&lt;P&gt;#include "mkl_blas.h"&lt;/P&gt;

	&lt;P&gt;#include "mkl_service.h"&lt;/P&gt;

	&lt;P&gt;&amp;nbsp;&lt;/P&gt;

	&lt;P&gt;&amp;nbsp;&lt;/P&gt;

	&lt;P&gt;int MmatrixARows=26;&lt;/P&gt;

	&lt;P&gt;int NmatrixBColumns=3;&lt;/P&gt;

	&lt;P&gt;double alpha=1;&lt;/P&gt;

	&lt;P&gt;int ldm=29;&lt;/P&gt;

	&lt;P&gt;double matrixA[87]={0.00311007,-1.12899e-05,-0.000141499,-1.82698e-14,-0.000785694,-1.98974e-14,-0.000778519,-2.71811e-14,-2.29056e-14,-2.7844e-14,-2.24393e-14,-3.12059e-14,-1.26095e-14,-4.47909e-10,-7.97785e-19,-1.74566e-07,-4.15789e-10,-2.17286e-29,-1.56053e-10,-1.34911e-12,-2.19906e-27,-3.5138e-09,-1.0398e-07,-5.29274e-06,-4.9252e-07,-8.93104e-05,-3.71938e-05,-1.28896e-09,-1.17735e-07,-3.26114e-08,0.00289051,-0.000149547,-2.34128e-13,-1.92531e-13,-0.000706043,-2.17513e-13,-3.48327e-13,-0.000670723,-3.56823e-13,-2.8756e-13,-3.99905e-13,-1.61591e-13,-5.73997e-09,-2.17241e-19,-1.42301e-08,-5.32835e-09,-5.47231e-30,-8.81321e-10,-3.39771e-13,-5.53829e-28,-8.70999e-10,-2.05336e-08,-5.30965e-06,-4.83782e-07,-8.84461e-05,-3.73614e-05,-1.5481e-11,-1.15641e-07,-4.02283e-07,-4.25622e-07,0.00303418,-0.00079269,-2.05185e-13,-2.71747e-13,-2.3181e-13,-0.000797297,-3.1283e-13,-3.80276e-13,-3.06461e-13,-4.2619e-13,-1.72212e-13,-6.11725e-09,-1.91907e-19,-1.90223e-07,-5.67858e-09,-4.75132e-30,-1.02734e-09,-2.95006e-13,-4.80861e-28,-5.38704e-10,-1.5342e-08,-1.98894e-06,-6.03159e-06,-8.35693e-05,-4.29327e-05,-1.62871e-10,-1.44174e-06};&lt;/P&gt;

	&lt;P&gt;double matrixB_ori[87]={-1.82698e-14,-0.000785694,-1.98974e-14,-0.000778519,-2.71811e-14,-2.29056e-14,-2.7844e-14,-2.24393e-14,-3.12059e-14,-1.26095e-14,-4.47909e-10,-7.97785e-19,-1.74566e-07,-4.15789e-10,-2.17286e-29,-1.56053e-10,-1.34911e-12,-2.19906e-27,-3.5138e-09,-1.0398e-07,-5.29274e-06,-4.9252e-07,-8.93104e-05,-3.71938e-05,-1.28896e-09,-1.17735e-07,-3.26114e-08,0.00289051,-0.000149547,-2.34128e-13,-1.92531e-13,-0.000706043,-2.17513e-13,-3.48327e-13,-0.000670723,-3.56823e-13,-2.8756e-13,-3.99905e-13,-1.61591e-13,-5.73997e-09,-2.17241e-19,-1.42301e-08,-5.32835e-09,-5.47231e-30,-8.81321e-10,-3.39771e-13,-5.53829e-28,-8.70999e-10,-2.05336e-08,-5.30965e-06,-4.83782e-07,-8.84461e-05,-3.73614e-05,-1.5481e-11,-1.15641e-07,-4.02283e-07,-4.25622e-07,0.00303418,-0.00079269,-2.05185e-13,-2.71747e-13,-2.3181e-13,-0.000797297,-3.1283e-13,-3.80276e-13,-3.06461e-13,-4.2619e-13,-1.72212e-13,-6.11725e-09,-1.91907e-19,-1.90223e-07,-5.67858e-09,-4.75132e-30,-1.02734e-09,-2.95006e-13,-4.80861e-28,-5.38704e-10,-1.5342e-08,-1.98894e-06,-6.03159e-06,-8.35693e-05,-4.29327e-05,-1.62871e-10,-1.44174e-06,-1.87786e-13,-2.49161e-13,-0.00079269};&lt;/P&gt;

	&lt;P&gt;double matrixB[87];&lt;/P&gt;

	&lt;P&gt;&amp;nbsp;&lt;/P&gt;

	&lt;P&gt;int sweepCount = 1e6;&lt;/P&gt;

	&lt;P&gt;time_t time1, time2, time3, time4;&lt;/P&gt;

	&lt;P&gt;time(&amp;amp;time1);&lt;/P&gt;

	&lt;P&gt;for(int count = 0;&amp;nbsp; count &amp;lt; sweepCount; ++count) {&lt;/P&gt;

	&lt;P&gt;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;memcpy(matrixB, matrixB_ori, sizeof(double)*87);&lt;/P&gt;

	&lt;P&gt;&amp;nbsp;&amp;nbsp;&amp;nbsp; dtrsm("Right", "Upper", "No transpose", "Nunit", &amp;amp;MmatrixARows, &amp;amp;NmatrixBColumns, &amp;amp;alpha, matrixA, &amp;amp;ldm, matrixB, &amp;amp;ldm);&lt;/P&gt;

	&lt;P&gt;}&lt;/P&gt;

	&lt;P&gt;time(&amp;amp;time2);&lt;/P&gt;

	&lt;P&gt;std::cout&amp;lt;&amp;lt;" Before new 8 VSLStreamStatePtr time: "&amp;lt;&amp;lt;difftime(time2, time1)&amp;lt;&amp;lt;std::endl;&lt;/P&gt;

	&lt;P&gt;&amp;nbsp;&lt;/P&gt;

	&lt;P&gt;VSLStreamStatePtr&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp; &amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;ptr_[8];&lt;/P&gt;

	&lt;P&gt;for(int i = 0; i &amp;lt; 8; ++i) {&lt;/P&gt;

	&lt;P&gt;&amp;nbsp;&amp;nbsp;&amp;nbsp; vslNewStream(&amp;amp;ptr_[i], VSL_BRNG_MT2203 + i, 1);&lt;/P&gt;

	&lt;P&gt;}&lt;/P&gt;

	&lt;P&gt;&amp;nbsp;&lt;/P&gt;

	&lt;P&gt;time(&amp;amp;time3);&lt;/P&gt;

	&lt;P&gt;for(int count = 0;&amp;nbsp; count &amp;lt; sweepCount; ++count) {&lt;/P&gt;

	&lt;P&gt;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;memcpy(matrixB, matrixB_ori, sizeof(double)*87);&lt;/P&gt;

	&lt;P&gt;&amp;nbsp;&amp;nbsp;&amp;nbsp; dtrsm("Right", "Upper", "No transpose", "Nunit", &amp;amp;MmatrixARows, &amp;amp;NmatrixBColumns, &amp;amp;alpha, matrixA, &amp;amp;ldm, matrixB, &amp;amp;ldm);&lt;/P&gt;

	&lt;P&gt;}&lt;/P&gt;

	&lt;P&gt;time(&amp;amp;time4);&lt;/P&gt;

	&lt;P&gt;std::cout&amp;lt;&amp;lt;"After new 8 VSLStreamStatePtr time: "&amp;lt;&amp;lt;difftime(time4, time3)&amp;lt;&amp;lt;std::endl;&lt;/P&gt;

	&lt;P&gt;&amp;nbsp;&lt;/P&gt;

	&lt;P&gt;Thanks&lt;/P&gt;
&lt;/DIV&gt;

&lt;DIV&gt;&amp;nbsp;&lt;/DIV&gt;</description>
      <pubDate>Wed, 15 Nov 2017 02:47:32 GMT</pubDate>
      <guid>https://community.intel.com/t5/Intel-oneAPI-Math-Kernel-Library/Create-8-VSLStreamStatePtr-affected-MKL-quot-dtrsm-quot-s/m-p/1156105#M27581</guid>
      <dc:creator>jian_l_1</dc:creator>
      <dc:date>2017-11-15T02:47:32Z</dc:date>
    </item>
    <item>
      <title>Hi, Fiona</title>
      <link>https://community.intel.com/t5/Intel-oneAPI-Math-Kernel-Library/Create-8-VSLStreamStatePtr-affected-MKL-quot-dtrsm-quot-s/m-p/1156106#M27582</link>
      <description>&lt;P&gt;Hi, Fiona&lt;/P&gt;

&lt;P&gt;Can you reproduce the issue? Or do you need more detailed information about the library version and CPU?&lt;/P&gt;

&lt;P&gt;&amp;nbsp;&lt;/P&gt;

&lt;P&gt;Thanks.&amp;nbsp;&lt;/P&gt;

&lt;P&gt;&amp;nbsp;&lt;/P&gt;

&lt;P&gt;&lt;/P&gt;&lt;BLOCKQUOTE&gt;Fiona Z. (Intel) wrote:&lt;BR /&gt;&lt;P&gt;&lt;/P&gt;

&lt;P&gt;Hi jian,&lt;/P&gt;

&lt;P&gt;Here's some question about your issue:&lt;/P&gt;

&lt;P&gt;1. How did you test the performance? If you enable MKL_VERBOSE to check, or write program to get clock time?&lt;BR /&gt;
	2. How about your problem size for trsv, gemv and trsm? and what about your seed for random data generation? Could you please provide a reproducer (just a sample case) that we can investigate?&lt;/P&gt;

&lt;P&gt;Thanks.&lt;/P&gt;

&lt;P&gt;Best regards,&lt;BR /&gt;
	Fiona&lt;/P&gt;

&lt;P&gt;&lt;/P&gt;&lt;/BLOCKQUOTE&gt;&lt;P&gt;&lt;/P&gt;</description>
      <pubDate>Wed, 22 Nov 2017 08:41:14 GMT</pubDate>
      <guid>https://community.intel.com/t5/Intel-oneAPI-Math-Kernel-Library/Create-8-VSLStreamStatePtr-affected-MKL-quot-dtrsm-quot-s/m-p/1156106#M27582</guid>
      <dc:creator>jian_l_1</dc:creator>
      <dc:date>2017-11-22T08:41:14Z</dc:date>
    </item>
    <item>
      <title>Hi Jian,</title>
      <link>https://community.intel.com/t5/Intel-oneAPI-Math-Kernel-Library/Create-8-VSLStreamStatePtr-affected-MKL-quot-dtrsm-quot-s/m-p/1156107#M27583</link>
      <description>&lt;P&gt;Hi Jian,&lt;/P&gt;

&lt;P&gt;I can reproduce your problem. We are investigating, and I will give you a response soon.&lt;/P&gt;

&lt;P&gt;Best regards,&lt;BR /&gt;
	Fiona&lt;/P&gt;</description>
      <pubDate>Fri, 24 Nov 2017 12:23:58 GMT</pubDate>
      <guid>https://community.intel.com/t5/Intel-oneAPI-Math-Kernel-Library/Create-8-VSLStreamStatePtr-affected-MKL-quot-dtrsm-quot-s/m-p/1156107#M27583</guid>
      <dc:creator>Zhen_Z_Intel</dc:creator>
      <dc:date>2017-11-24T12:23:58Z</dc:date>
    </item>
    <item>
      <title>The root cause analysis shows</title>
      <link>https://community.intel.com/t5/Intel-oneAPI-Math-Kernel-Library/Create-8-VSLStreamStatePtr-affected-MKL-quot-dtrsm-quot-s/m-p/1156108#M27584</link>
      <description>&lt;P&gt;&lt;SPAN style="color: rgb(84, 84, 84); font-family: Roboto, arial, sans-serif; font-size: small;"&gt;The root cause analysis shows the problem&amp;nbsp; with internal mkl_serv_allocate() routine. The issue is escalated. We will keep you updated with the status of this issue!&lt;/SPAN&gt;&lt;/P&gt;

&lt;P&gt;&amp;nbsp;&lt;/P&gt;</description>
      <pubDate>Thu, 30 Nov 2017 08:54:26 GMT</pubDate>
      <guid>https://community.intel.com/t5/Intel-oneAPI-Math-Kernel-Library/Create-8-VSLStreamStatePtr-affected-MKL-quot-dtrsm-quot-s/m-p/1156108#M27584</guid>
      <dc:creator>Gennady_F_Intel</dc:creator>
      <dc:date>2017-11-30T08:54:26Z</dc:date>
    </item>
    <item>
      <title>Hi,Gennay</title>
      <link>https://community.intel.com/t5/Intel-oneAPI-Math-Kernel-Library/Create-8-VSLStreamStatePtr-affected-MKL-quot-dtrsm-quot-s/m-p/1156109#M27585</link>
      <description>&lt;P&gt;Hi,Gennay&lt;/P&gt;

&lt;P&gt;I am glad to hear that.&lt;SPAN style="font-size: 19.512px;"&gt;Thanks for your help.&amp;nbsp;&lt;/SPAN&gt;&lt;/P&gt;

&lt;P&gt;&lt;/P&gt;&lt;BLOCKQUOTE&gt;Gennady F. (Intel) wrote:&lt;BR /&gt;&lt;P&gt;&lt;/P&gt;

&lt;P&gt;The root cause analysis shows the problem&amp;nbsp; with internal mkl_serv_allocate() routine. The issue is escalated. We will keep you updated with the status of this issue!&lt;/P&gt;

&lt;P&gt;&amp;nbsp;&lt;/P&gt;

&lt;P&gt;&lt;/P&gt;&lt;/BLOCKQUOTE&gt;&lt;P&gt;&lt;/P&gt;</description>
      <pubDate>Sun, 10 Dec 2017 12:28:36 GMT</pubDate>
      <guid>https://community.intel.com/t5/Intel-oneAPI-Math-Kernel-Library/Create-8-VSLStreamStatePtr-affected-MKL-quot-dtrsm-quot-s/m-p/1156109#M27585</guid>
      <dc:creator>jian_l_1</dc:creator>
      <dc:date>2017-12-10T12:28:36Z</dc:date>
    </item>
    <item>
      <title>To mitigate the problem, we</title>
      <link>https://community.intel.com/t5/Intel-oneAPI-Math-Kernel-Library/Create-8-VSLStreamStatePtr-affected-MKL-quot-dtrsm-quot-s/m-p/1156110#M27586</link>
      <description>&lt;P&gt;To mitigate the problem, we may recommend&amp;nbsp;&lt;SPAN style="font-size: 1em;"&gt;set MKL_DISABLE_FAST_MM=1 to disable our memory buffering. Please refer more details into MKL's User's Guide -&amp;nbsp;&amp;nbsp;&lt;/SPAN&gt;Managing Performance and Memory&lt;/P&gt;

&lt;P&gt;&amp;nbsp;&lt;/P&gt;</description>
      <pubDate>Mon, 25 Dec 2017 15:53:33 GMT</pubDate>
      <guid>https://community.intel.com/t5/Intel-oneAPI-Math-Kernel-Library/Create-8-VSLStreamStatePtr-affected-MKL-quot-dtrsm-quot-s/m-p/1156110#M27586</guid>
      <dc:creator>Gennady_F_Intel</dc:creator>
      <dc:date>2017-12-25T15:53:33Z</dc:date>
    </item>
    <item>
      <title>Hi, Gennady</title>
      <link>https://community.intel.com/t5/Intel-oneAPI-Math-Kernel-Library/Create-8-VSLStreamStatePtr-affected-MKL-quot-dtrsm-quot-s/m-p/1156111#M27587</link>
      <description>&lt;P style="font-size: 19.512px;"&gt;Hi, Gennady&lt;/P&gt;

&lt;P style="font-size: 19.512px;"&gt;Thanks for your help.&lt;/P&gt;

&lt;P style="font-size: 19.512px;"&gt;I tried&amp;nbsp;&lt;SPAN style="font-size: 12px;"&gt;&amp;nbsp;set MKL_DISABLE_FAST_MM=1, but it makes the&amp;nbsp;dtrsm calls made before &lt;/SPAN&gt;creating the 8 VSLStreamStatePtr&amp;nbsp;become as slow as the calls made after creating them.&lt;/P&gt;

&lt;P style="font-size: 19.512px;"&gt;My code is linked with google's tcmalloc, which can be found in&amp;nbsp;gperftools-gperftools-2.5.&lt;/P&gt;

&lt;P style="font-size: 19.512px;"&gt;Adding an unused map before the code helps reproduce the issue; in the original code the map is a static map.&lt;/P&gt;

&lt;P&gt;#include &amp;lt;map&amp;gt;&lt;/P&gt;

&lt;P&gt;#include &amp;lt;iostream&amp;gt;&lt;/P&gt;

&lt;P&gt;#include &amp;lt;cstring&amp;gt;&lt;/P&gt;

&lt;P&gt;#include "mkl_vsl_functions.h"&lt;/P&gt;

&lt;P&gt;#include "mkl_vsl_defines.h"&lt;/P&gt;

&lt;P&gt;#include "mkl_blas.h"&lt;/P&gt;

&lt;P&gt;#include "mkl_service.h"&lt;/P&gt;

&lt;P&gt;&amp;nbsp;&lt;/P&gt;

&lt;P&gt;class aaaValue&lt;/P&gt;

&lt;P&gt;{&lt;/P&gt;

&lt;P&gt;public:&lt;/P&gt;

&lt;P&gt;&amp;nbsp;&lt;/P&gt;

&lt;P&gt;&amp;nbsp;&amp;nbsp;&amp;nbsp; ~aaaValue()&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp; { aaa(); }&lt;/P&gt;

&lt;P&gt;private:&lt;/P&gt;

&lt;P&gt;&amp;nbsp;&lt;/P&gt;

&lt;P&gt;&amp;nbsp;&amp;nbsp;&amp;nbsp; void aaa() {&lt;/P&gt;

&lt;P&gt;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp; if (val_.sval)&lt;/P&gt;

&lt;P&gt;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp; free(val_.sval);&lt;/P&gt;

&lt;P&gt;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp; val_.sval = 0;&lt;/P&gt;

&lt;P&gt;&amp;nbsp;&amp;nbsp;&amp;nbsp; }&lt;/P&gt;

&lt;P&gt;&amp;nbsp;&lt;/P&gt;

&lt;P&gt;private:&lt;/P&gt;

&lt;P&gt;&amp;nbsp;&amp;nbsp;&amp;nbsp; union { int ival; double dval; char* sval; }&amp;nbsp;&amp;nbsp;&amp;nbsp; val_;&lt;/P&gt;

&lt;P&gt;};&lt;/P&gt;

&lt;P&gt;&amp;nbsp;&lt;/P&gt;

&lt;P&gt;&amp;nbsp;&lt;/P&gt;

&lt;P&gt;int main(int argc, const char* argv[])&lt;/P&gt;

&lt;P&gt;{&lt;/P&gt;

&lt;P&gt;&amp;nbsp;&lt;/P&gt;

&lt;P&gt;&amp;nbsp;&amp;nbsp;&amp;nbsp; std::map&amp;lt;int, aaaValue&amp;gt; Map;&lt;/P&gt;

&lt;P&gt;&amp;nbsp;&lt;/P&gt;

&lt;P&gt;&amp;nbsp;&amp;nbsp;&amp;nbsp; int MmatrixARows=26;&lt;/P&gt;

&lt;P&gt;&amp;nbsp;&amp;nbsp;&amp;nbsp; int NmatrixBColumns=3;&lt;/P&gt;

&lt;P&gt;&amp;nbsp;&amp;nbsp;&amp;nbsp; double alpha=1;&lt;/P&gt;

&lt;P&gt;&amp;nbsp;&amp;nbsp;&amp;nbsp; int ldm=29;&lt;/P&gt;

&lt;P&gt;&amp;nbsp;&amp;nbsp;&amp;nbsp; double matrixA[87]={0.00311007,-1.12899e-05,-0.000141499,-1.82698e-14,-0.000785694,-1.98974e-14,-0.000778519,-2.71811e-14,-2.29056e-14,-2.7844e-14,-2.24393e-14,-3.12059e-14,-1.26095e-14,-4.47909e-10,-7.97785e-19,-1.74566e-07,-4.15789e-10,-2.17286e-29,-1.56053e-10,-1.34911e-12,-2.19906e-27,-3.5138e-09,-1.0398e-07,-5.29274e-06,-4.9252e-07,-8.93104e-05,-3.71938e-05,-1.28896e-09,-1.17735e-07,-3.26114e-08,0.00289051,-0.000149547,-2.34128e-13,-1.92531e-13,-0.000706043,-2.17513e-13,-3.48327e-13,-0.000670723,-3.56823e-13,-2.8756e-13,-3.99905e-13,-1.61591e-13,-5.73997e-09,-2.17241e-19,-1.42301e-08,-5.32835e-09,-5.47231e-30,-8.81321e-10,-3.39771e-13,-5.53829e-28,-8.70999e-10,-2.05336e-08,-5.30965e-06,-4.83782e-07,-8.84461e-05,-3.73614e-05,-1.5481e-11,-1.15641e-07,-4.02283e-07,-4.25622e-07,0.00303418,-0.00079269,-2.05185e-13,-2.71747e-13,-2.3181e-13,-0.000797297,-3.1283e-13,-3.80276e-13,-3.06461e-13,-4.2619e-13,-1.72212e-13,-6.11725e-09,-1.91907e-19,-1.90223e-07,-5.67858e-09,-4.75132e-30,-1.02734e-09,-2.95006e-13,-4.80861e-28,-5.38704e-10,-1.5342e-08,-1.98894e-06,-6.03159e-06,-8.35693e-05,-4.29327e-05,-1.62871e-10,-1.44174e-06};&lt;/P&gt;

&lt;P&gt;&amp;nbsp;&amp;nbsp;&amp;nbsp; double matrixB_ori[87]={-1.82698e-14,-0.000785694,-1.98974e-14,-0.000778519,-2.71811e-14,-2.29056e-14,-2.7844e-14,-2.24393e-14,-3.12059e-14,-1.26095e-14,-4.47909e-10,-7.97785e-19,-1.74566e-07,-4.15789e-10,-2.17286e-29,-1.56053e-10,-1.34911e-12,-2.19906e-27,-3.5138e-09,-1.0398e-07,-5.29274e-06,-4.9252e-07,-8.93104e-05,-3.71938e-05,-1.28896e-09,-1.17735e-07,-3.26114e-08,0.00289051,-0.000149547,-2.34128e-13,-1.92531e-13,-0.000706043,-2.17513e-13,-3.48327e-13,-0.000670723,-3.56823e-13,-2.8756e-13,-3.99905e-13,-1.61591e-13,-5.73997e-09,-2.17241e-19,-1.42301e-08,-5.32835e-09,-5.47231e-30,-8.81321e-10,-3.39771e-13,-5.53829e-28,-8.70999e-10,-2.05336e-08,-5.30965e-06,-4.83782e-07,-8.84461e-05,-3.73614e-05,-1.5481e-11,-1.15641e-07,-4.02283e-07,-4.25622e-07,0.00303418,-0.00079269,-2.05185e-13,-2.71747e-13,-2.3181e-13,-0.000797297,-3.1283e-13,-3.80276e-13,-3.06461e-13,-4.2619e-13,-1.72212e-13,-6.11725e-09,-1.91907e-19,-1.90223e-07,-5.67858e-09,-4.75132e-30,-1.02734e-09,-2.95006e-13,-4.80861e-28,-5.38704e-10,-1.5342e-08,-1.98894e-06,-6.03159e-06,-8.35693e-05,-4.29327e-05,-1.62871e-10,-1.44174e-06,-1.87786e-13,-2.49161e-13,-0.00079269};&lt;/P&gt;

&lt;P&gt;&amp;nbsp;&amp;nbsp;&amp;nbsp; double matrixB[87];&lt;/P&gt;

&lt;P&gt;&amp;nbsp;&lt;/P&gt;

&lt;P&gt;&amp;nbsp;&amp;nbsp;&amp;nbsp; int sweepCount = 1e5;&lt;/P&gt;

&lt;P&gt;&amp;nbsp;&amp;nbsp;&amp;nbsp; time_t time1, time2, time3, time4;&lt;/P&gt;

&lt;P&gt;&amp;nbsp;&amp;nbsp;&amp;nbsp; time(&amp;amp;time1);&lt;/P&gt;

&lt;P&gt;&amp;nbsp;&amp;nbsp;&amp;nbsp; for(int count = 0;&amp;nbsp; count &amp;lt; sweepCount; ++count) {&lt;/P&gt;

&lt;P&gt;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;memcpy(matrixB, matrixB_ori, sizeof(double)*87);&lt;/P&gt;

&lt;P&gt;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp; dtrsm("Right", "Upper", "No transpose", "Nunit", &amp;amp;MmatrixARows, &amp;amp;NmatrixBColumns, &amp;amp;alpha, matrixA, &amp;amp;ldm, matrixB, &amp;amp;ldm);&lt;/P&gt;

&lt;P&gt;&amp;nbsp;&amp;nbsp;&amp;nbsp; }&lt;/P&gt;

&lt;P&gt;&amp;nbsp;&amp;nbsp;&amp;nbsp; time(&amp;amp;time2);&lt;/P&gt;

&lt;P&gt;&amp;nbsp;&amp;nbsp;&amp;nbsp; std::cout&amp;lt;&amp;lt;" Before new 8 VSLStreamStatePtr time: "&amp;lt;&amp;lt;difftime(time2, time1)&amp;lt;&amp;lt;std::endl;&lt;/P&gt;

&lt;P&gt;&amp;nbsp;&lt;/P&gt;

&lt;P&gt;&amp;nbsp;&amp;nbsp;&amp;nbsp; VSLStreamStatePtr&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp; ptr_[8];&lt;/P&gt;

&lt;P&gt;&amp;nbsp;&amp;nbsp;&amp;nbsp; for(int i = 0; i &amp;lt; 8; ++i) {&lt;/P&gt;

&lt;P&gt;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp; vslNewStream(&amp;amp;ptr_[i], VSL_BRNG_MT2203 + i, 1);&lt;/P&gt;

&lt;P&gt;&amp;nbsp;&amp;nbsp;&amp;nbsp; }&lt;/P&gt;

&lt;P&gt;&amp;nbsp;&lt;/P&gt;

&lt;P&gt;&amp;nbsp;&amp;nbsp;&amp;nbsp; time(&amp;amp;time3);&lt;/P&gt;

&lt;P&gt;&amp;nbsp;&amp;nbsp;&amp;nbsp; for(int count = 0;&amp;nbsp; count &amp;lt; sweepCount; ++count) {&lt;/P&gt;

&lt;P&gt;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;memcpy(matrixB, matrixB_ori, sizeof(double)*87);&lt;/P&gt;

&lt;P&gt;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp; dtrsm("Right", "Upper", "No transpose", "Nunit", &amp;amp;MmatrixARows, &amp;amp;NmatrixBColumns, &amp;amp;alpha, matrixA, &amp;amp;ldm, matrixB, &amp;amp;ldm);&lt;/P&gt;

&lt;P&gt;&amp;nbsp;&amp;nbsp;&amp;nbsp; }&lt;/P&gt;

&lt;P&gt;&amp;nbsp;&amp;nbsp;&amp;nbsp; time(&amp;amp;time4);&lt;/P&gt;

&lt;P&gt;&amp;nbsp;&amp;nbsp;&amp;nbsp; std::cout&amp;lt;&amp;lt;"After new 8 VSLStreamStatePtr time: "&amp;lt;&amp;lt;difftime(time4, time3)&amp;lt;&amp;lt;std::endl;&lt;/P&gt;

&lt;P&gt;&amp;nbsp;&lt;/P&gt;

&lt;P&gt;}&lt;/P&gt;

&lt;P style="font-size: 19.512px;"&gt;&amp;nbsp;&lt;/P&gt;

&lt;P style="font-size: 19.512px;"&gt;&amp;nbsp;&lt;/P&gt;

&lt;P style="font-size: 19.512px;"&gt;&amp;nbsp;&lt;/P&gt;

&lt;P style="font-size: 19.512px;"&gt;&amp;nbsp;&lt;/P&gt;</description>
      <pubDate>Sat, 06 Jan 2018 00:03:26 GMT</pubDate>
      <guid>https://community.intel.com/t5/Intel-oneAPI-Math-Kernel-Library/Create-8-VSLStreamStatePtr-affected-MKL-quot-dtrsm-quot-s/m-p/1156111#M27587</guid>
      <dc:creator>jian_l_1</dc:creator>
      <dc:date>2018-01-06T00:03:26Z</dc:date>
    </item>
  </channel>
</rss>

