<?xml version="1.0" encoding="UTF-8"?>
<rss xmlns:content="http://purl.org/rss/1.0/modules/content/" xmlns:dc="http://purl.org/dc/elements/1.1/" xmlns:rdf="http://www.w3.org/1999/02/22-rdf-syntax-ns#" xmlns:taxo="http://purl.org/rss/1.0/modules/taxonomy/" version="2.0">
  <channel>
    <title>topic Re: MKL cblas_dgemm huge performance gap on intelOneAPI and Parallel Studio Studio in Intel® oneAPI Math Kernel Library</title>
    <link>https://community.intel.com/t5/Intel-oneAPI-Math-Kernel-Library/MKL-cblas-dgemm-huge-performance-gap-on-intelOneAPI-and-Parallel/m-p/1352960#M32630</link>
    <description>&lt;P&gt;Could you please share your test machine environment variables?&lt;/P&gt;
&lt;P&gt;&amp;nbsp;&lt;/P&gt;
&lt;P&gt;&amp;nbsp;&lt;/P&gt;</description>
    <pubDate>Thu, 20 Jan 2022 06:27:19 GMT</pubDate>
    <dc:creator>Rizwan1</dc:creator>
    <dc:date>2022-01-20T06:27:19Z</dc:date>
    <item>
      <title>MKL cblas_dgemm huge performance gap on intelOneAPI and Parallel Studio Studio</title>
      <link>https://community.intel.com/t5/Intel-oneAPI-Math-Kernel-Library/MKL-cblas-dgemm-huge-performance-gap-on-intelOneAPI-and-Parallel/m-p/1350748#M32563</link>
      <description>&lt;P&gt;&lt;FONT style="vertical-align: inherit;"&gt;&lt;FONT style="vertical-align: inherit;"&gt;Hi,&lt;/FONT&gt;&lt;/FONT&gt;&lt;/P&gt;
&lt;P&gt;&amp;nbsp;&lt;/P&gt;
&lt;P&gt;&lt;FONT style="vertical-align: inherit;"&gt;&lt;FONT style="vertical-align: inherit;"&gt;Previously I had tested MKL cblas_dgemm for m=n=k=10000 and found a performance of approximately 2 TFlops, but now the same test gives me a performance of around 0.8 TFlops.&lt;/FONT&gt;&lt;/FONT&gt;&lt;/P&gt;
&lt;P&gt;&amp;nbsp;&lt;/P&gt;
&lt;P&gt;&lt;FONT style="vertical-align: inherit;"&gt;&lt;FONT style="vertical-align: inherit;"&gt;Case 1:&lt;/FONT&gt;&lt;/FONT&gt;&lt;/P&gt;
&lt;P&gt;&lt;FONT style="vertical-align: inherit;"&gt;&lt;FONT style="vertical-align: inherit;"&gt;CentOS 7.2.* and Intel Parallel Studio XE&lt;/FONT&gt;&lt;/FONT&gt;&lt;/P&gt;
&lt;P&gt;&lt;FONT style="vertical-align: inherit;"&gt;&lt;FONT style="vertical-align: inherit;"&gt;MKL cblas_dgemm&lt;/FONT&gt;&lt;/FONT&gt;&lt;/P&gt;
&lt;P&gt;&lt;FONT style="vertical-align: inherit;"&gt;&lt;FONT style="vertical-align: inherit;"&gt;m=n=k=10000&lt;/FONT&gt;&lt;/FONT&gt;&lt;/P&gt;
&lt;P&gt;&lt;FONT style="vertical-align: inherit;"&gt;&lt;FONT style="vertical-align: inherit;"&gt;Performance: 1900+ GFlops&lt;/FONT&gt;&lt;/FONT&gt;&lt;/P&gt;
&lt;P&gt;&amp;nbsp;&lt;/P&gt;
&lt;P&gt;&lt;FONT style="vertical-align: inherit;"&gt;&lt;FONT style="vertical-align: inherit;"&gt;Case 2:&lt;/FONT&gt;&lt;/FONT&gt;&lt;/P&gt;
&lt;P&gt;&lt;FONT style="vertical-align: inherit;"&gt;&lt;FONT style="vertical-align: inherit;"&gt;CentOS 8.5.* and Intel OneAPI&lt;/FONT&gt;&lt;/FONT&gt;&lt;/P&gt;
&lt;P&gt;&lt;FONT style="vertical-align: inherit;"&gt;&lt;FONT style="vertical-align: inherit;"&gt;MKL cblas_dgemm&lt;/FONT&gt;&lt;/FONT&gt;&lt;/P&gt;
&lt;P&gt;&lt;FONT style="vertical-align: inherit;"&gt;&lt;FONT style="vertical-align: inherit;"&gt;m=n=k=1000&lt;/FONT&gt;&lt;/FONT&gt;&lt;/P&gt;
&lt;P&gt;&lt;FONT style="vertical-align: inherit;"&gt;&lt;FONT style="vertical-align: inherit;"&gt;Performance: 750+ GFlops&lt;/FONT&gt;&lt;/FONT&gt;&lt;/P&gt;
&lt;P&gt;&amp;nbsp;&lt;/P&gt;
&lt;P&gt;&lt;FONT style="vertical-align: inherit;"&gt;&lt;FONT style="vertical-align: inherit;"&gt;Why is there such a huge gap? &lt;/FONT&gt;&lt;FONT style="vertical-align: inherit;"&gt;Something is wrong.&lt;/FONT&gt;&lt;/FONT&gt;&lt;/P&gt;
&lt;P&gt;&lt;FONT style="vertical-align: inherit;"&gt;&lt;FONT style="vertical-align: inherit;"&gt;What is the reason?&lt;/FONT&gt;&lt;/FONT&gt;&lt;/P&gt;
&lt;P&gt;&lt;FONT style="vertical-align: inherit;"&gt;&lt;FONT style="vertical-align: inherit;"&gt;Please assist and guide&amp;nbsp;&lt;/FONT&gt;&lt;/FONT&gt;&lt;/P&gt;
&lt;P&gt;&amp;nbsp;&lt;/P&gt;</description>
      <pubDate>Wed, 12 Jan 2022 09:07:32 GMT</pubDate>
      <guid>https://community.intel.com/t5/Intel-oneAPI-Math-Kernel-Library/MKL-cblas-dgemm-huge-performance-gap-on-intelOneAPI-and-Parallel/m-p/1350748#M32563</guid>
      <dc:creator>Rizwan1</dc:creator>
      <dc:date>2022-01-12T09:07:32Z</dc:date>
    </item>
    <item>
      <title>Re:MKL cblas_dgemm huge performance gap on intelOneAPI and Parallel Studio Studio</title>
      <link>https://community.intel.com/t5/Intel-oneAPI-Math-Kernel-Library/MKL-cblas-dgemm-huge-performance-gap-on-intelOneAPI-and-Parallel/m-p/1351111#M32564</link>
      <description>&lt;P&gt;Hi,&lt;/P&gt;&lt;P&gt;&lt;BR /&gt;&lt;/P&gt;&lt;P&gt;Thanks for reaching out to us.&lt;/P&gt;&lt;P&gt;&lt;BR /&gt;&lt;/P&gt;&lt;P&gt;Could you please let us know with what versions of Intel parallel studio xe and oneAPI you have observed the differences in performance and also how did you calculate the performance (gflops) so that it would help us to investigate your issue from our end?&lt;/P&gt;&lt;P&gt;&lt;BR /&gt;&lt;/P&gt;&lt;P&gt;Regards,&lt;/P&gt;&lt;P&gt;Vidya.&lt;/P&gt;&lt;BR /&gt;</description>
      <pubDate>Thu, 13 Jan 2022 12:14:07 GMT</pubDate>
      <guid>https://community.intel.com/t5/Intel-oneAPI-Math-Kernel-Library/MKL-cblas-dgemm-huge-performance-gap-on-intelOneAPI-and-Parallel/m-p/1351111#M32564</guid>
      <dc:creator>VidyalathaB_Intel</dc:creator>
      <dc:date>2022-01-13T12:14:07Z</dc:date>
    </item>
    <item>
      <title>RE: MKL cblas_dgemm huge performance gap on intelOneAPI and Parallel Studio Studio</title>
      <link>https://community.intel.com/t5/Intel-oneAPI-Math-Kernel-Library/MKL-cblas-dgemm-huge-performance-gap-on-intelOneAPI-and-Parallel/m-p/1351338#M32567</link>
      <description>&lt;P&gt;In 2017, Intel Parallel Studio XE Update 1 was used, and the performance of cblas_dgemm was about 2+ TFlops.&lt;/P&gt;
&lt;P&gt;In the next step, I used the MKL and OpenMP libraries that came with the previous installation, and the Intel C compiler that came with HPC kit version 2021. I still got a performance of about 1.95 TFlops. This setup was on CentOS 7.2.&lt;/P&gt;
&lt;P&gt;Now I have installed CentOS 8.5 on Intel Xeon Phi 7250, the performance of cblas_dgemm is around 0.75 TFlops, which is worse than before. I have installed oneAPI through GUI Installer&lt;/P&gt;
&lt;P&gt;&amp;nbsp;&lt;/P&gt;
&lt;P&gt;&amp;nbsp;&lt;/P&gt;</description>
      <pubDate>Fri, 14 Jan 2022 00:48:00 GMT</pubDate>
      <guid>https://community.intel.com/t5/Intel-oneAPI-Math-Kernel-Library/MKL-cblas-dgemm-huge-performance-gap-on-intelOneAPI-and-Parallel/m-p/1351338#M32567</guid>
      <dc:creator>Rizwan1</dc:creator>
      <dc:date>2022-01-14T00:48:00Z</dc:date>
    </item>
    <item>
      <title>Re:MKL cblas_dgemm huge performance gap on intelOneAPI and Parallel Studio Studio</title>
      <link>https://community.intel.com/t5/Intel-oneAPI-Math-Kernel-Library/MKL-cblas-dgemm-huge-performance-gap-on-intelOneAPI-and-Parallel/m-p/1351890#M32582</link>
      <description>&lt;P&gt;Hi,&lt;/P&gt;&lt;P&gt;&lt;BR /&gt;&lt;/P&gt;&lt;P&gt;Could you please provide us with the&lt;B&gt; timings&lt;/B&gt; that you are getting for both cases?&lt;/P&gt;&lt;P&gt;&lt;BR /&gt;&lt;/P&gt;&lt;P&gt;Time taken when working with &amp;gt;&amp;gt; &lt;I&gt;In 2017, Intel Parallel Studio XE Update 1.&lt;/I&gt;&lt;/P&gt;&lt;P&gt;Time taken when working with &amp;gt;&amp;gt; &lt;I&gt;installed oneAPI through GUI Installer &lt;/I&gt;&lt;/P&gt;&lt;P&gt;&lt;BR /&gt;&lt;/P&gt;&lt;P&gt;Regards,&lt;/P&gt;&lt;P&gt;Vidya.&lt;/P&gt;&lt;BR /&gt;</description>
      <pubDate>Mon, 17 Jan 2022 09:19:50 GMT</pubDate>
      <guid>https://community.intel.com/t5/Intel-oneAPI-Math-Kernel-Library/MKL-cblas-dgemm-huge-performance-gap-on-intelOneAPI-and-Parallel/m-p/1351890#M32582</guid>
      <dc:creator>VidyalathaB_Intel</dc:creator>
      <dc:date>2022-01-17T09:19:50Z</dc:date>
    </item>
    <item>
      <title>RE: Re:MKL cblas_dgemm huge performance gap on intelOneAPI and Parallel Studio Studio</title>
      <link>https://community.intel.com/t5/Intel-oneAPI-Math-Kernel-Library/MKL-cblas-dgemm-huge-performance-gap-on-intelOneAPI-and-Parallel/m-p/1351892#M32583</link>
      <description>&lt;P class="sub_section_element_selectors"&gt;&lt;STRONG&gt;Time taken when working with &amp;gt;&amp;gt;&amp;nbsp;&lt;I&gt;In 2017, Intel Parallel Studio XE Update 1.&lt;/I&gt;&lt;/STRONG&gt;&lt;/P&gt;
&lt;P class="sub_section_element_selectors"&gt;&lt;I&gt;I can't provide the exact timing information because an other researcher work at that time. But the rough estimate is about its near October 2017.&lt;/I&gt;&lt;/P&gt;
&lt;P class="sub_section_element_selectors"&gt;&amp;nbsp;&lt;/P&gt;
&lt;P class="sub_section_element_selectors"&gt;&lt;STRONG&gt;Time taken when working with &amp;gt;&amp;gt;&amp;nbsp;&lt;I&gt;installed oneAPI through GUI Installer&lt;/I&gt;&lt;/STRONG&gt;&lt;/P&gt;
&lt;P class="sub_section_element_selectors"&gt;I have installed oneAPI just couple of days ago less that one week from the current date&lt;/P&gt;
&lt;P class="sub_section_element_selectors"&gt;&amp;nbsp;&lt;/P&gt;
&lt;P class="sub_section_element_selectors"&gt;&amp;nbsp;&lt;/P&gt;
&lt;P class="sub_section_element_selectors"&gt;Thanks&lt;/P&gt;
&lt;P class="sub_section_element_selectors"&gt;Regards&lt;/P&gt;</description>
      <pubDate>Mon, 17 Jan 2022 09:24:30 GMT</pubDate>
      <guid>https://community.intel.com/t5/Intel-oneAPI-Math-Kernel-Library/MKL-cblas-dgemm-huge-performance-gap-on-intelOneAPI-and-Parallel/m-p/1351892#M32583</guid>
      <dc:creator>Rizwan1</dc:creator>
      <dc:date>2022-01-17T09:24:30Z</dc:date>
    </item>
    <item>
      <title>Re:MKL cblas_dgemm huge performance gap on intelOneAPI and Parallel Studio Studio</title>
      <link>https://community.intel.com/t5/Intel-oneAPI-Math-Kernel-Library/MKL-cblas-dgemm-huge-performance-gap-on-intelOneAPI-and-Parallel/m-p/1351918#M32586</link>
      <description>&lt;P&gt;Hi,&lt;/P&gt;&lt;P&gt;&lt;BR /&gt;&lt;/P&gt;&lt;P&gt;Let me rephrase my question. &lt;/P&gt;&lt;P&gt;The execution time of your code with the latest oneMKL 2022 and also with MKL 2017 (if possible)?&lt;/P&gt;&lt;P&gt;&lt;BR /&gt;&lt;/P&gt;&lt;P&gt;Regards,&lt;/P&gt;&lt;P&gt;Vidya.&lt;/P&gt;&lt;BR /&gt;</description>
      <pubDate>Mon, 17 Jan 2022 11:08:03 GMT</pubDate>
      <guid>https://community.intel.com/t5/Intel-oneAPI-Math-Kernel-Library/MKL-cblas-dgemm-huge-performance-gap-on-intelOneAPI-and-Parallel/m-p/1351918#M32586</guid>
      <dc:creator>VidyalathaB_Intel</dc:creator>
      <dc:date>2022-01-17T11:08:03Z</dc:date>
    </item>
    <item>
      <title>RE: Re:MKL cblas_dgemm huge performance gap on intelOneAPI and Parallel Studio Studio</title>
      <link>https://community.intel.com/t5/Intel-oneAPI-Math-Kernel-Library/MKL-cblas-dgemm-huge-performance-gap-on-intelOneAPI-and-Parallel/m-p/1352109#M32589</link>
      <description>&lt;P&gt;For MKL2017&lt;/P&gt;
&lt;P&gt;OS: CentOS 7.2&lt;/P&gt;
&lt;P&gt;M=N=K=10000&lt;/P&gt;
&lt;P&gt;Execution Time 1.02 Seconds on&amp;nbsp; Intel Xeon Phi 7250 with&amp;nbsp;68 Cores&lt;/P&gt;
&lt;P&gt;&amp;nbsp;&lt;/P&gt;
&lt;P&gt;&amp;nbsp;&lt;/P&gt;
&lt;P&gt;For OneMKL2022&lt;/P&gt;
&lt;P&gt;OS: CentOS 8.5&lt;/P&gt;
&lt;P&gt;M=N=K=10000&lt;/P&gt;
&lt;P&gt;Execution Time 3.17 Seconds on&amp;nbsp; Intel Xeon Phi 7250 with&amp;nbsp;68 Cores&lt;/P&gt;
&lt;P&gt;&amp;nbsp;&lt;/P&gt;
&lt;P&gt;&amp;nbsp;&lt;/P&gt;
&lt;P&gt;Regards&lt;/P&gt;
&lt;P&gt;Muhammad Rizwan&lt;/P&gt;</description>
      <pubDate>Tue, 18 Jan 2022 01:19:28 GMT</pubDate>
      <guid>https://community.intel.com/t5/Intel-oneAPI-Math-Kernel-Library/MKL-cblas-dgemm-huge-performance-gap-on-intelOneAPI-and-Parallel/m-p/1352109#M32589</guid>
      <dc:creator>Rizwan1</dc:creator>
      <dc:date>2022-01-18T01:19:28Z</dc:date>
    </item>
    <item>
      <title>Re: MKL cblas_dgemm huge performance gap on intelOneAPI and Parallel Studio Studio</title>
      <link>https://community.intel.com/t5/Intel-oneAPI-Math-Kernel-Library/MKL-cblas-dgemm-huge-performance-gap-on-intelOneAPI-and-Parallel/m-p/1352292#M32598</link>
      <description>&lt;P&gt;These performance comparisons are likely to be quite variable depending on system load, number of active users, etc.&lt;/P&gt;
&lt;P&gt;&amp;nbsp;&lt;/P&gt;
&lt;P&gt;On a Windows PC with an i7-10710U (low power) NUC, here are my timing results for DGEMM with m=n=k=2000, alpha = 1, beta = 2:&lt;/P&gt;
&lt;P&gt;&amp;nbsp;&lt;/P&gt;
&lt;P&gt;&amp;nbsp;&lt;/P&gt;
&lt;TABLE border="1" width="100%"&gt;
&lt;TBODY&gt;
&lt;TR&gt;
&lt;TD width="50%"&gt;2014&lt;/TD&gt;
&lt;TD width="50%"&gt;0.445 s&lt;/TD&gt;
&lt;/TR&gt;
&lt;TR&gt;
&lt;TD width="50%"&gt;2016 U8&lt;/TD&gt;
&lt;TD width="50%"&gt;0.242&lt;/TD&gt;
&lt;/TR&gt;
&lt;TR&gt;
&lt;TD width="50%"&gt;2019.1 U3&lt;/TD&gt;
&lt;TD width="50%"&gt;0.151&lt;/TD&gt;
&lt;/TR&gt;
&lt;TR&gt;
&lt;TD width="50%"&gt;2021.5&lt;/TD&gt;
&lt;TD width="50%"&gt;0.152&lt;/TD&gt;
&lt;/TR&gt;
&lt;/TBODY&gt;
&lt;/TABLE&gt;
&lt;P&gt;&amp;nbsp;&lt;/P&gt;
&lt;P&gt;For each case, I compiled with /Qopenmp /Qxhost and ran the program three or four times. The reported times above are the best of these three or four runs.&lt;/P&gt;
&lt;P&gt;&amp;nbsp;&lt;/P&gt;
&lt;P&gt;For comparison purposes, it would be useful if you were to run the following program on your system and provide the results.&lt;/P&gt;
&lt;LI-CODE lang="fortran"&gt;program xdgemm
implicit none
integer, parameter :: N = 2000
double precision, allocatable, dimension(:,:) :: A, B, C
integer :: m,k
double precision :: alpha = 1d0, beta = 2d0
real t1,t2
!
allocate (A(N,N),B(N,N),C(N,N))
m = N
k = N
call random_number(A)
call random_number(B)
call random_number(C)
call cpu_time(t1)
call dgemm('N','N',m,n,k,alpha,A,N,B,N,beta,C,N)
call cpu_time(t2)
print *,t2-t1,' secs'
end&lt;/LI-CODE&gt;</description>
      <pubDate>Tue, 18 Jan 2022 15:55:13 GMT</pubDate>
      <guid>https://community.intel.com/t5/Intel-oneAPI-Math-Kernel-Library/MKL-cblas-dgemm-huge-performance-gap-on-intelOneAPI-and-Parallel/m-p/1352292#M32598</guid>
      <dc:creator>mecej4</dc:creator>
      <dc:date>2022-01-18T15:55:13Z</dc:date>
    </item>
    <item>
      <title>Re: MKL cblas_dgemm huge performance gap on intelOneAPI and Parallel Studio Studio</title>
      <link>https://community.intel.com/t5/Intel-oneAPI-Math-Kernel-Library/MKL-cblas-dgemm-huge-performance-gap-on-intelOneAPI-and-Parallel/m-p/1352440#M32604</link>
      <description>&lt;P&gt;Dear&lt;/P&gt;
&lt;P&gt;&amp;nbsp;&lt;/P&gt;
&lt;P&gt;Are you kidding me?&lt;/P&gt;
&lt;P&gt;I am informing issue for Linux system CentOS and highlighting totally different platform and you are sharing the script for the windows system.&lt;/P&gt;
&lt;P&gt;&amp;nbsp;&lt;/P&gt;
&lt;P&gt;Please understand the context and problem first.&lt;/P&gt;
&lt;P&gt;&amp;nbsp;&lt;/P&gt;
&lt;P&gt;&amp;nbsp;&lt;/P&gt;</description>
      <pubDate>Wed, 19 Jan 2022 00:46:42 GMT</pubDate>
      <guid>https://community.intel.com/t5/Intel-oneAPI-Math-Kernel-Library/MKL-cblas-dgemm-huge-performance-gap-on-intelOneAPI-and-Parallel/m-p/1352440#M32604</guid>
      <dc:creator>Rizwan1</dc:creator>
      <dc:date>2022-01-19T00:46:42Z</dc:date>
    </item>
    <item>
      <title>Re:MKL cblas_dgemm huge performance gap on intelOneAPI and Parallel Studio Studio</title>
      <link>https://community.intel.com/t5/Intel-oneAPI-Math-Kernel-Library/MKL-cblas-dgemm-huge-performance-gap-on-intelOneAPI-and-Parallel/m-p/1352514#M32607</link>
      <description>&lt;P&gt;Hi,&lt;/P&gt;&lt;P&gt;&lt;BR /&gt;&lt;/P&gt;&lt;P&gt;Thanks for providing the details.&lt;/P&gt;&lt;P&gt;We are looking into this issue internally, we will get back to you soon.&lt;/P&gt;&lt;P&gt;&lt;BR /&gt;&lt;/P&gt;&lt;P&gt;Regards,&lt;/P&gt;&lt;P&gt;Vidya.&lt;/P&gt;&lt;BR /&gt;</description>
      <pubDate>Wed, 19 Jan 2022 05:12:34 GMT</pubDate>
      <guid>https://community.intel.com/t5/Intel-oneAPI-Math-Kernel-Library/MKL-cblas-dgemm-huge-performance-gap-on-intelOneAPI-and-Parallel/m-p/1352514#M32607</guid>
      <dc:creator>VidyalathaB_Intel</dc:creator>
      <dc:date>2022-01-19T05:12:34Z</dc:date>
    </item>
    <item>
      <title>Re: MKL cblas_dgemm huge performance gap on intelOneAPI and Parallel Studio Studio</title>
      <link>https://community.intel.com/t5/Intel-oneAPI-Math-Kernel-Library/MKL-cblas-dgemm-huge-performance-gap-on-intelOneAPI-and-Parallel/m-p/1352572#M32609</link>
      <description>&lt;P&gt;checking the problem on RH7 ( no CentOS available right now ) with MKL 2020.0.1 (the current) and MKL 2017.0 Update 2 on Intel(R) Xeon(R) Gold 6148 CPU @ 2.40GHz ( SkyLake CPU), I see ~ the same performance on my end:&lt;/P&gt;
&lt;P&gt;MKL 2017 u2:&lt;/P&gt;
&lt;P&gt;[gfedorov@skx2 05339303]$ MKL_VERBOSE=0 ./a.out 10000&lt;/P&gt;
&lt;P&gt;&amp;nbsp;size == 10000, GFlops == 2343.43&lt;/P&gt;
&lt;P&gt;&amp;nbsp;&lt;/P&gt;
&lt;P&gt;[gfedorov@skx2 05339303]$ MKL_VERBOSE=0 ./a.out 10000&lt;/P&gt;
&lt;P&gt;&amp;nbsp;size == 10000, GFlops == 2251.49&lt;/P&gt;
&lt;P&gt;&amp;nbsp;&lt;/P&gt;
&lt;P&gt;The lscpu output, as well as both MKL_VERBOSE=1 logs, are attached for your reference.&lt;/P&gt;
&lt;P&gt;&amp;nbsp;&lt;/P&gt;
&lt;P&gt;I noticed you mentioned a Xeon Phi CPU. It should be noted that, since MKL 2022, this CPU type has been deprecated. Please check the latest Release Notes at this link: &lt;A href="https://cqpreview.intel.com/content/www/us/en/developer/articles/release-notes/onemkl-release-notes.html" target="_blank" rel="noopener"&gt;https://cqpreview.intel.com/content/www/us/en/developer/articles/release-notes/onemkl-release-notes.html&lt;/A&gt;&lt;/P&gt;
&lt;P&gt;&amp;nbsp;&lt;/P&gt;</description>
      <pubDate>Wed, 19 Jan 2022 08:08:35 GMT</pubDate>
      <guid>https://community.intel.com/t5/Intel-oneAPI-Math-Kernel-Library/MKL-cblas-dgemm-huge-performance-gap-on-intelOneAPI-and-Parallel/m-p/1352572#M32609</guid>
      <dc:creator>Gennady_F_Intel</dc:creator>
      <dc:date>2022-01-19T08:08:35Z</dc:date>
    </item>
    <item>
      <title>Re: MKL cblas_dgemm huge performance gap on intelOneAPI and Parallel Studio Studio</title>
      <link>https://community.intel.com/t5/Intel-oneAPI-Math-Kernel-Library/MKL-cblas-dgemm-huge-performance-gap-on-intelOneAPI-and-Parallel/m-p/1352587#M32611</link>
      <description>&lt;P&gt;Please share a valid URL.&lt;/P&gt;
&lt;P&gt;&amp;nbsp;&lt;/P&gt;
&lt;P&gt;&lt;span class="lia-inline-image-display-wrapper lia-image-align-inline" image-alt="Rizwan1_0-1642580904770.png" style="width: 400px;"&gt;&lt;img src="https://community.intel.com/t5/image/serverpage/image-id/25786iCC98EE8425FD3CDF/image-size/medium/is-moderation-mode/true?v=v2&amp;amp;px=400&amp;amp;whitelist-exif-data=Orientation%2CResolution%2COriginalDefaultFinalSize%2CCopyright" role="button" title="Rizwan1_0-1642580904770.png" alt="Rizwan1_0-1642580904770.png" /&gt;&lt;/span&gt;&lt;/P&gt;
&lt;P&gt;&amp;nbsp;&lt;/P&gt;
&lt;P&gt;&amp;nbsp;&lt;/P&gt;
&lt;P&gt;Thanks for the update.&lt;/P&gt;
&lt;P&gt;Please share, what version of oneAPI BaseKIT and HPCKit best fit for &lt;SPAN&gt;&amp;nbsp;Intel Xeon Phi 7250 and&amp;nbsp;&lt;/SPAN&gt;CentOS 8.5. How can I get the previous versions&lt;/P&gt;
&lt;P&gt;&amp;nbsp;&lt;/P&gt;</description>
      <pubDate>Wed, 19 Jan 2022 08:30:53 GMT</pubDate>
      <guid>https://community.intel.com/t5/Intel-oneAPI-Math-Kernel-Library/MKL-cblas-dgemm-huge-performance-gap-on-intelOneAPI-and-Parallel/m-p/1352587#M32611</guid>
      <dc:creator>Rizwan1</dc:creator>
      <dc:date>2022-01-19T08:30:53Z</dc:date>
    </item>
    <item>
      <title>Re: MKL cblas_dgemm huge performance gap on intelOneAPI and Parallel Studio Studio</title>
      <link>https://community.intel.com/t5/Intel-oneAPI-Math-Kernel-Library/MKL-cblas-dgemm-huge-performance-gap-on-intelOneAPI-and-Parallel/m-p/1352589#M32612</link>
      <description>&lt;P&gt;Could you please do me a small favour and share the a.out binary file so that I can test it on my system?&lt;/P&gt;
&lt;P&gt;&amp;nbsp;&lt;/P&gt;
&lt;P&gt;This will be a great help&amp;nbsp;&lt;/P&gt;
&lt;P&gt;&amp;nbsp;&lt;/P&gt;
&lt;P&gt;Thanks&lt;/P&gt;
&lt;P&gt;Regards&lt;/P&gt;</description>
      <pubDate>Wed, 19 Jan 2022 08:34:47 GMT</pubDate>
      <guid>https://community.intel.com/t5/Intel-oneAPI-Math-Kernel-Library/MKL-cblas-dgemm-huge-performance-gap-on-intelOneAPI-and-Parallel/m-p/1352589#M32612</guid>
      <dc:creator>Rizwan1</dc:creator>
      <dc:date>2022-01-19T08:34:47Z</dc:date>
    </item>
    <item>
      <title>Re: MKL cblas_dgemm huge performance gap on intelOneAPI and Parallel Studio Studio</title>
      <link>https://community.intel.com/t5/Intel-oneAPI-Math-Kernel-Library/MKL-cblas-dgemm-huge-performance-gap-on-intelOneAPI-and-Parallel/m-p/1352595#M32613</link>
      <description>&lt;P&gt;see the&amp;nbsp;_stat2020.log attached. This is a statically linked executable.&lt;/P&gt;
&lt;P&gt;I zipped _stat2020.out as *.log because *.out attachments are not accepted by the forum engine.&lt;/P&gt;
&lt;P&gt;the password - intelmklforum&lt;/P&gt;
&lt;P&gt;&amp;nbsp;&lt;/P&gt;
&lt;P&gt;&amp;nbsp;&lt;/P&gt;</description>
      <pubDate>Wed, 19 Jan 2022 09:01:58 GMT</pubDate>
      <guid>https://community.intel.com/t5/Intel-oneAPI-Math-Kernel-Library/MKL-cblas-dgemm-huge-performance-gap-on-intelOneAPI-and-Parallel/m-p/1352595#M32613</guid>
      <dc:creator>Gennady_F_Intel</dc:creator>
      <dc:date>2022-01-19T09:01:58Z</dc:date>
    </item>
    <item>
      <title>Re: MKL cblas_dgemm huge performance gap on intelOneAPI and Parallel Studio Studio</title>
      <link>https://community.intel.com/t5/Intel-oneAPI-Math-Kernel-Library/MKL-cblas-dgemm-huge-performance-gap-on-intelOneAPI-and-Parallel/m-p/1352596#M32614</link>
      <description>&lt;P&gt;Thanks&lt;/P&gt;</description>
      <pubDate>Wed, 19 Jan 2022 09:03:41 GMT</pubDate>
      <guid>https://community.intel.com/t5/Intel-oneAPI-Math-Kernel-Library/MKL-cblas-dgemm-huge-performance-gap-on-intelOneAPI-and-Parallel/m-p/1352596#M32614</guid>
      <dc:creator>Rizwan1</dc:creator>
      <dc:date>2022-01-19T09:03:41Z</dc:date>
    </item>
    <item>
      <title>Re: MKL cblas_dgemm huge performance gap on intelOneAPI and Parallel Studio Studio</title>
      <link>https://community.intel.com/t5/Intel-oneAPI-Math-Kernel-Library/MKL-cblas-dgemm-huge-performance-gap-on-intelOneAPI-and-Parallel/m-p/1352601#M32615</link>
      <description>&lt;P&gt;Thanks, but was this compressed in a Windows environment or a Linux environment?&lt;/P&gt;</description>
      <pubDate>Wed, 19 Jan 2022 09:19:19 GMT</pubDate>
      <guid>https://community.intel.com/t5/Intel-oneAPI-Math-Kernel-Library/MKL-cblas-dgemm-huge-performance-gap-on-intelOneAPI-and-Parallel/m-p/1352601#M32615</guid>
      <dc:creator>Rizwan1</dc:creator>
      <dc:date>2022-01-19T09:19:19Z</dc:date>
    </item>
    <item>
      <title>Re: MKL cblas_dgemm huge performance gap on intelOneAPI and Parallel Studio Studio</title>
      <link>https://community.intel.com/t5/Intel-oneAPI-Math-Kernel-Library/MKL-cblas-dgemm-huge-performance-gap-on-intelOneAPI-and-Parallel/m-p/1352607#M32616</link>
      <description>&lt;P&gt;Dear&lt;/P&gt;
&lt;P&gt;&amp;nbsp;&lt;/P&gt;
&lt;P&gt;Thanks for sharing the executable file. I executed it but I still get 762.311 GFlops on Intel Xeon Phi and CentOS 8.5.&lt;/P&gt;
&lt;P&gt;&amp;nbsp;&lt;/P&gt;
&lt;P&gt;Could you please also do me a favour? Could you please tell me the environment variables set up at your end?&lt;BR /&gt;I don't know why files that previously gave 2+ TFlops now give less than 800 GFlops.&lt;/P&gt;
&lt;P&gt;I have installed intel one API&amp;nbsp;2022.0.1&lt;/P&gt;
&lt;P&gt;&amp;nbsp;&lt;/P&gt;
&lt;P&gt;&amp;nbsp;&lt;/P&gt;</description>
      <pubDate>Wed, 19 Jan 2022 09:37:26 GMT</pubDate>
      <guid>https://community.intel.com/t5/Intel-oneAPI-Math-Kernel-Library/MKL-cblas-dgemm-huge-performance-gap-on-intelOneAPI-and-Parallel/m-p/1352607#M32616</guid>
      <dc:creator>Rizwan1</dc:creator>
      <dc:date>2022-01-19T09:37:26Z</dc:date>
    </item>
    <item>
      <title>Re: MKL cblas_dgemm huge performance gap on intelOneAPI and Parallel Studio Studio</title>
      <link>https://community.intel.com/t5/Intel-oneAPI-Math-Kernel-Library/MKL-cblas-dgemm-huge-performance-gap-on-intelOneAPI-and-Parallel/m-p/1352697#M32619</link>
      <description>&lt;P&gt;Could you run this 2022 executable with verbose mode enabled and share the output?&amp;nbsp;&lt;/P&gt;
&lt;P&gt;how to run:&amp;nbsp; MKL_VERBOSE=1&amp;nbsp; ./a.out 10000&lt;/P&gt;
&lt;P&gt;&amp;nbsp;&lt;/P&gt;</description>
      <pubDate>Wed, 19 Jan 2022 13:34:43 GMT</pubDate>
      <guid>https://community.intel.com/t5/Intel-oneAPI-Math-Kernel-Library/MKL-cblas-dgemm-huge-performance-gap-on-intelOneAPI-and-Parallel/m-p/1352697#M32619</guid>
      <dc:creator>Gennady_F_Intel</dc:creator>
      <dc:date>2022-01-19T13:34:43Z</dc:date>
    </item>
    <item>
      <title>Re: MKL cblas_dgemm huge performance gap on intelOneAPI and Parallel Studio Studio</title>
      <link>https://community.intel.com/t5/Intel-oneAPI-Math-Kernel-Library/MKL-cblas-dgemm-huge-performance-gap-on-intelOneAPI-and-Parallel/m-p/1352884#M32622</link>
      <description>&lt;P&gt;&lt;span class="lia-inline-image-display-wrapper lia-image-align-inline" image-alt="Rizwan1_0-1642639299191.png" style="width: 400px;"&gt;&lt;img src="https://community.intel.com/t5/image/serverpage/image-id/25825iA9517BA89A210D60/image-size/medium/is-moderation-mode/true?v=v2&amp;amp;px=400&amp;amp;whitelist-exif-data=Orientation%2CResolution%2COriginalDefaultFinalSize%2CCopyright" role="button" title="Rizwan1_0-1642639299191.png" alt="Rizwan1_0-1642639299191.png" /&gt;&lt;/span&gt;&lt;/P&gt;
&lt;P&gt;&amp;nbsp;&lt;/P&gt;</description>
      <pubDate>Thu, 20 Jan 2022 00:41:44 GMT</pubDate>
      <guid>https://community.intel.com/t5/Intel-oneAPI-Math-Kernel-Library/MKL-cblas-dgemm-huge-performance-gap-on-intelOneAPI-and-Parallel/m-p/1352884#M32622</guid>
      <dc:creator>Rizwan1</dc:creator>
      <dc:date>2022-01-20T00:41:44Z</dc:date>
    </item>
    <item>
      <title>Re: MKL cblas_dgemm huge performance gap on intelOneAPI and Parallel Studio Studio</title>
      <link>https://community.intel.com/t5/Intel-oneAPI-Math-Kernel-Library/MKL-cblas-dgemm-huge-performance-gap-on-intelOneAPI-and-Parallel/m-p/1352934#M32626</link>
      <description>&lt;P&gt;Ok and then link your example against MKL 2017 and run with the same MKL_VERBOSE=1 on the same machine and share the log file, please.&lt;/P&gt;</description>
      <pubDate>Thu, 20 Jan 2022 04:44:14 GMT</pubDate>
      <guid>https://community.intel.com/t5/Intel-oneAPI-Math-Kernel-Library/MKL-cblas-dgemm-huge-performance-gap-on-intelOneAPI-and-Parallel/m-p/1352934#M32626</guid>
      <dc:creator>Gennady_F_Intel</dc:creator>
      <dc:date>2022-01-20T04:44:14Z</dc:date>
    </item>
  </channel>
</rss>

