<?xml version="1.0" encoding="UTF-8"?>
<rss xmlns:content="http://purl.org/rss/1.0/modules/content/" xmlns:dc="http://purl.org/dc/elements/1.1/" xmlns:rdf="http://www.w3.org/1999/02/22-rdf-syntax-ns#" xmlns:taxo="http://purl.org/rss/1.0/modules/taxonomy/" version="2.0">
  <channel>
    <title>topic Re:CPU backend performance issues. in Intel® oneAPI DPC++/C++ Compiler</title>
    <link>https://community.intel.com/t5/Intel-oneAPI-DPC-C-Compiler/CPU-backend-performance-issues/m-p/1241700#M873</link>
    <description>&lt;P&gt;No, it is not reproducible, even with O3. Could you please share a compiler command line and other steps to reproduce?&lt;/P&gt;&lt;P&gt;What do you mean by 'which should translate to -O3 by clang-cl'?&lt;/P&gt;&lt;BR /&gt;</description>
    <pubDate>Tue, 29 Dec 2020 17:46:50 GMT</pubDate>
    <dc:creator>Alina_S_Intel</dc:creator>
    <dc:date>2020-12-29T17:46:50Z</dc:date>
    <item>
      <title>CPU backend performance issues.</title>
      <link>https://community.intel.com/t5/Intel-oneAPI-DPC-C-Compiler/CPU-backend-performance-issues/m-p/1238192#M842</link>
      <description>&lt;DIV class="lia-quilt-row lia-quilt-row-message-subject"&gt;
&lt;DIV class="lia-quilt-column lia-quilt-column-24 lia-quilt-column-single lia-quilt-column-message-subject-content"&gt;
&lt;DIV class="lia-quilt-column-alley lia-quilt-column-alley-single"&gt;
&lt;DIV class="topic-subject-wrapper"&gt;
&lt;DIV class="lia-message-subject lia-component-message-view-widget-subject"&gt;
&lt;DIV class="MessageSubject"&gt;&lt;FONT face="helvetica" color="#000000"&gt;&lt;STRONG&gt;OS&lt;/STRONG&gt;&lt;/FONT&gt;&lt;/DIV&gt;
&lt;/DIV&gt;
&lt;/DIV&gt;
&lt;/DIV&gt;
&lt;/DIV&gt;
&lt;/DIV&gt;
&lt;DIV class="lia-quilt-row lia-quilt-row-message-body"&gt;
&lt;DIV class="lia-quilt-column lia-quilt-column-24 lia-quilt-column-single lia-quilt-column-message-body-content"&gt;
&lt;DIV class="lia-quilt-column-alley lia-quilt-column-alley-single"&gt;
&lt;DIV id="bodyDisplay" class="lia-message-body lia-component-message-view-widget-body lia-component-body-signature-highlight-escalation lia-component-message-view-widget-body-signature-highlight-escalation"&gt;
&lt;DIV class="lia-message-body-content"&gt;
&lt;P class="lia-indent-padding-left-30px"&gt;&lt;FONT face="helvetica" color="#000000"&gt;Windows 10&lt;/FONT&gt;&lt;/P&gt;
&lt;P&gt;&lt;FONT face="helvetica" color="#000000"&gt;&lt;STRONG&gt;IDE&lt;/STRONG&gt;&lt;/FONT&gt;&lt;/P&gt;
&lt;P class="lia-indent-padding-left-30px"&gt;&lt;FONT face="helvetica" color="#000000"&gt;Visual Studio 2019&lt;/FONT&gt;&lt;/P&gt;
&lt;P&gt;&lt;FONT face="helvetica" color="#000000"&gt;&lt;STRONG&gt;Compiler&lt;/STRONG&gt;&lt;/FONT&gt;&lt;/P&gt;
&lt;P class="lia-indent-padding-left-30px"&gt;&lt;FONT face="helvetica" color="#000000"&gt;Intel(R) oneAPI DPC++ compiler&lt;/FONT&gt;&lt;/P&gt;
&lt;P&gt;&lt;FONT face="helvetica" color="#000000"&gt;&lt;STRONG&gt;Toolkit&lt;/STRONG&gt;&lt;/FONT&gt;&lt;/P&gt;
&lt;P class="lia-indent-padding-left-30px"&gt;&lt;FONT face="helvetica" color="#000000"&gt;oneAPI Base Toolkit version 2021.1&lt;/FONT&gt;&lt;/P&gt;
&lt;P&gt;&lt;FONT face="helvetica" color="#000000"&gt;&lt;STRONG&gt;Problem&lt;/STRONG&gt;&lt;/FONT&gt;&lt;/P&gt;
&lt;OL&gt;
&lt;LI class="lia-indent-padding-left-30px"&gt;&lt;FONT face="helvetica" color="#000000"&gt;Random&amp;nbsp;&lt;FONT face="courier new,courier"&gt;call&lt;/FONT&gt;&amp;nbsp;instructions are generated in critical loops when using&amp;nbsp;&lt;FONT face="courier new,courier"&gt;parallel_for&lt;/FONT&gt;.&lt;/FONT&gt;&lt;/LI&gt;
&lt;LI class="lia-indent-padding-left-30px"&gt;&lt;FONT face="helvetica" color="#000000"&gt;No loop optimization is applied when using&amp;nbsp;&lt;FONT face="courier new,courier"&gt;single_task&lt;/FONT&gt;.&lt;/FONT&gt;&lt;/LI&gt;
&lt;/OL&gt;
&lt;P&gt;&lt;FONT face="helvetica" color="#000000"&gt;Example program,&lt;/FONT&gt;&lt;/P&gt;
&lt;LI-CODE lang="markup"&gt;#include &amp;lt;CL/sycl.hpp&amp;gt;

#include &amp;lt;iostream&amp;gt;

namespace {

  __declspec(noinline) void add(
    float const* a, size_t a_stride,
    float const* b, size_t b_stride,
    float* c, size_t c_stride,
    size_t w, size_t h
  ) {
    for (size_t y = 0; y &amp;lt; h; ++y) {
      for (size_t x = 0; x &amp;lt; w; ++x) {
        c[y * c_stride + x] = a[y * a_stride + x] + b[y * b_stride + x];
      }
    }
  }

  __declspec(noinline) void add_single_task(
    sycl::queue&amp;amp; q,
    float const* a, size_t a_stride,
    float const* b, size_t b_stride,
    float* c, size_t c_stride,
    size_t w, size_t h
  ) {
    auto e = q.submit([&amp;amp;](sycl::handler&amp;amp; cgh) {

      cgh.single_task([=]() {
        for (size_t y = 0; y &amp;lt; h; ++y) {
          for (size_t x = 0; x &amp;lt; w; ++x) {
            c[y * c_stride + x] = a[y * a_stride + x] + b[y * b_stride + x];
          }
        }
        });
      });

    e.wait_and_throw();
  }

  __declspec(noinline) void add_parallel_for(
    sycl::queue&amp;amp; q,
    float const* a, size_t a_stride,
    float const* b, size_t b_stride,
    float* c, size_t c_stride,
    size_t w, size_t h
  ) {
    auto e = q.submit([&amp;amp;](sycl::handler&amp;amp; cgh) {

      cgh.parallel_for(sycl::range&amp;lt;2&amp;gt;(h, w), [=](sycl::id&amp;lt;2&amp;gt; index) {
        auto y = index[0];
        auto x = index[1];

        c[y * c_stride + x] = a[y * a_stride + x] + b[y * b_stride + x];
        });
      });

    e.wait_and_throw();
  }

  sycl::queue get_queue() {
    // Note:
    // Initialization of a queue is very slow.
    // Hence, we'll be caching it.
    static auto q = sycl::queue(sycl::cpu_selector());
    return q;
  }

}  // namespace

int main(int argc, char* argv[]) {
  try {
    auto q = get_queue();
  }
  catch (std::exception const&amp;amp; e) {
    std::cout &amp;lt;&amp;lt; "Queue initialization failed with " &amp;lt;&amp;lt; e.what() &amp;lt;&amp;lt; '\n';
    return -1;
  }

  try {
    constexpr auto w = size_t(1024);
    constexpr auto h = size_t(1024);

    auto a = std::vector&amp;lt;float&amp;gt;(w * h, 1);
    auto b = std::vector&amp;lt;float&amp;gt;(w * h, 2);
    auto c = std::vector&amp;lt;float&amp;gt;(w * h);

    auto q = get_queue();

    for (size_t i = 0; i &amp;lt; 30; ++i) {
      add(a.data(), w, b.data(), w, c.data(), w, w, h);
      add_single_task(q, a.data(), w, b.data(), w, c.data(), w, w, h);
      add_parallel_for(q, a.data(), w, b.data(), w, c.data(), w, w, h);
    }
  }
  catch (std::exception const&amp;amp; e) {
    std::cout &amp;lt;&amp;lt; "Add failed with " &amp;lt;&amp;lt; e.what() &amp;lt;&amp;lt; '\n';
    return -1;
  }

  return 0;
}
&lt;/LI-CODE&gt;
&lt;P&gt;&amp;nbsp;&lt;/P&gt;
&lt;P&gt;&lt;FONT face="helvetica" color="#000000"&gt;Intel Advisor reports,&lt;/FONT&gt;&lt;/P&gt;
&lt;OL&gt;
&lt;LI class="lia-indent-padding-left-30px"&gt;&lt;FONT face="helvetica" color="#000000"&gt;&lt;FONT face="courier new,courier"&gt;add_parallel_for&lt;/FONT&gt;,&lt;/FONT&gt;&lt;BR /&gt;&lt;BR /&gt;&lt;FONT face="helvetica" color="#000000"&gt;- call tree,&lt;/FONT&gt;&lt;BR /&gt;&lt;FONT face="helvetica" color="#000000"&gt;&lt;span class="lia-inline-image-display-wrapper lia-image-align-inline" image-alt="add_parallel_for_call_stack.png" style="width: 500px;"&gt;&lt;img src="https://community.intel.com/t5/image/serverpage/image-id/14172iF50DD33BC43AFA51/image-size/large/is-moderation-mode/true?v=v2&amp;amp;px=999&amp;amp;whitelist-exif-data=Orientation%2CResolution%2COriginalDefaultFinalSize%2CCopyright" role="button" title="add_parallel_for_call_stack.png" alt="add_parallel_for_call_stack.png" /&gt;&lt;/span&gt;&lt;/FONT&gt;&lt;BR /&gt;&lt;BR /&gt;&lt;FONT face="helvetica" color="#000000"&gt;- assembly,&lt;/FONT&gt;&lt;BR /&gt;&lt;FONT face="helvetica" color="#000000"&gt;&lt;span class="lia-inline-image-display-wrapper lia-image-align-inline" image-alt="add_parallel_for_assembly.png" style="width: 314px;"&gt;&lt;img src="https://community.intel.com/t5/image/serverpage/image-id/14173iCE758D8151B55D19/image-size/large/is-moderation-mode/true?v=v2&amp;amp;px=999&amp;amp;whitelist-exif-data=Orientation%2CResolution%2COriginalDefaultFinalSize%2CCopyright" role="button" title="add_parallel_for_assembly.png" alt="add_parallel_for_assembly.png" /&gt;&lt;/span&gt;&lt;/FONT&gt;&lt;BR /&gt;&lt;BR /&gt;&lt;/LI&gt;
&lt;LI class="lia-indent-padding-left-30px"&gt;&lt;FONT face="helvetica" color="#000000"&gt;&lt;FONT face="courier new,courier"&gt;add_single_task&lt;/FONT&gt;,&lt;/FONT&gt;&lt;BR /&gt;&lt;BR /&gt;&lt;FONT face="helvetica" color="#000000"&gt;- source insights,&lt;/FONT&gt;&lt;BR /&gt;&lt;FONT face="helvetica" color="#000000"&gt;&lt;span class="lia-inline-image-display-wrapper lia-image-align-inline" image-alt="add_single_task_insights.PNG" style="width: 352px;"&gt;&lt;img src="https://community.intel.com/t5/image/serverpage/image-id/14174i9A52787C9D818260/image-size/large/is-moderation-mode/true?v=v2&amp;amp;px=999&amp;amp;whitelist-exif-data=Orientation%2CResolution%2COriginalDefaultFinalSize%2CCopyright" role="button" title="add_single_task_insights.PNG" alt="add_single_task_insights.PNG" /&gt;&lt;/span&gt;&lt;/FONT&gt;&lt;/LI&gt;
&lt;/OL&gt;
&lt;P&gt;&lt;FONT face="helvetica" color="#000000"&gt;Are those call&amp;nbsp;instructions necessary and is there a way to request the AOT/JIT compiler to not generate them? And for &lt;FONT face="courier new,courier"&gt;single_task&lt;/FONT&gt;, shouldn't optimization be applied as well (I was simply interested to see how it&amp;nbsp;fares against the host compiler optimization, &lt;FONT face="courier new,courier"&gt;add&lt;/FONT&gt;)?&lt;/FONT&gt;&lt;/P&gt;
&lt;/DIV&gt;
&lt;/DIV&gt;
&lt;/DIV&gt;
&lt;/DIV&gt;
&lt;/DIV&gt;</description>
      <pubDate>Thu, 17 Dec 2020 06:57:04 GMT</pubDate>
      <guid>https://community.intel.com/t5/Intel-oneAPI-DPC-C-Compiler/CPU-backend-performance-issues/m-p/1238192#M842</guid>
      <dc:creator>ChoonHo</dc:creator>
      <dc:date>2020-12-17T06:57:04Z</dc:date>
    </item>
    <item>
      <title>Re:CPU backend performance issues.</title>
      <link>https://community.intel.com/t5/Intel-oneAPI-DPC-C-Compiler/CPU-backend-performance-issues/m-p/1239749#M855</link>
      <description>&lt;P&gt;Hi,&lt;/P&gt;&lt;P&gt;Thanks for reaching out to us!&lt;/P&gt;&lt;P&gt;We are escalating this thread to the Subject Matter Expert(SME) who will guide you further. &lt;/P&gt;&lt;P&gt;Have a Good day&lt;/P&gt;&lt;P&gt;&lt;BR /&gt;&lt;/P&gt;&lt;P&gt;Thanks &amp;amp; Regards&lt;/P&gt;&lt;P&gt;Goutham&lt;/P&gt;&lt;BR /&gt;</description>
      <pubDate>Tue, 22 Dec 2020 10:38:44 GMT</pubDate>
      <guid>https://community.intel.com/t5/Intel-oneAPI-DPC-C-Compiler/CPU-backend-performance-issues/m-p/1239749#M855</guid>
      <dc:creator>GouthamK_Intel</dc:creator>
      <dc:date>2020-12-22T10:38:44Z</dc:date>
    </item>
    <item>
      <title>Re:CPU backend performance issues.</title>
      <link>https://community.intel.com/t5/Intel-oneAPI-DPC-C-Compiler/CPU-backend-performance-issues/m-p/1240537#M861</link>
      <description>&lt;P&gt;I reproduced the second issue (No loop optimization is applied when using single_task).  Since this is a missed performance opportunity, I suppose it might be escalated as a feature request. I am presently investigating it and will get back to you shortly with an update.&lt;/P&gt;&lt;P&gt;&lt;BR /&gt;&lt;/P&gt;&lt;P&gt;However, I wasn't able to reproduce &lt;B&gt;callq &lt;/B&gt;inside add_parallel_for. Could you please share the compiler options you used? Which compiler driver, dpcpp or icx\icpx, did you use?&lt;/P&gt;&lt;BR /&gt;</description>
      <pubDate>Thu, 24 Dec 2020 13:00:19 GMT</pubDate>
      <guid>https://community.intel.com/t5/Intel-oneAPI-DPC-C-Compiler/CPU-backend-performance-issues/m-p/1240537#M861</guid>
      <dc:creator>Alina_S_Intel</dc:creator>
      <dc:date>2020-12-24T13:00:19Z</dc:date>
    </item>
    <item>
      <title>Re: Re:CPU backend performance issues.</title>
      <link>https://community.intel.com/t5/Intel-oneAPI-DPC-C-Compiler/CPU-backend-performance-issues/m-p/1241066#M864</link>
      <description>&lt;P&gt;Using default settings on release mode in Visual Studio.&lt;/P&gt;
&lt;P&gt;/O2 which should translate to -O3 by clang-cl.&lt;/P&gt;
&lt;P&gt;Was reproducible in,&lt;/P&gt;
&lt;UL&gt;
&lt;LI&gt;
&lt;P&gt;Intel(R) Core(TM) i5-7300HQ&lt;/P&gt;
&lt;/LI&gt;
&lt;LI&gt;
&lt;P&gt;Intel(R) Xeon(R) Gold 6230N&lt;/P&gt;
&lt;/LI&gt;
&lt;/UL&gt;
&lt;P&gt;&amp;nbsp;&lt;/P&gt;</description>
      <pubDate>Mon, 28 Dec 2020 01:32:29 GMT</pubDate>
      <guid>https://community.intel.com/t5/Intel-oneAPI-DPC-C-Compiler/CPU-backend-performance-issues/m-p/1241066#M864</guid>
      <dc:creator>ChoonHo</dc:creator>
      <dc:date>2020-12-28T01:32:29Z</dc:date>
    </item>
    <item>
      <title>Re: Re:CPU backend performance issues.</title>
      <link>https://community.intel.com/t5/Intel-oneAPI-DPC-C-Compiler/CPU-backend-performance-issues/m-p/1241069#M865</link>
      <description>&lt;P&gt;If it's still not reproducible, try removing the &lt;FONT face="courier new,courier"&gt;add&lt;/FONT&gt; inside main, leaving only &lt;FONT face="courier new,courier"&gt;add_single_task&lt;/FONT&gt; and &lt;FONT face="courier new,courier"&gt;add_parallel_for&lt;/FONT&gt;.&lt;/P&gt;
&lt;P&gt;&amp;nbsp;&lt;/P&gt;</description>
      <pubDate>Mon, 28 Dec 2020 01:36:32 GMT</pubDate>
      <guid>https://community.intel.com/t5/Intel-oneAPI-DPC-C-Compiler/CPU-backend-performance-issues/m-p/1241069#M865</guid>
      <dc:creator>ChoonHo</dc:creator>
      <dc:date>2020-12-28T01:36:32Z</dc:date>
    </item>
    <item>
      <title>Re:CPU backend performance issues.</title>
      <link>https://community.intel.com/t5/Intel-oneAPI-DPC-C-Compiler/CPU-backend-performance-issues/m-p/1241700#M873</link>
      <description>&lt;P&gt;No, it is not reproducible, even with O3. Could you please share a compiler command line and other steps to reproduce?&lt;/P&gt;&lt;P&gt;What do you mean by 'which should translate to -O3 by clang-cl'?&lt;/P&gt;&lt;BR /&gt;</description>
      <pubDate>Tue, 29 Dec 2020 17:46:50 GMT</pubDate>
      <guid>https://community.intel.com/t5/Intel-oneAPI-DPC-C-Compiler/CPU-backend-performance-issues/m-p/1241700#M873</guid>
      <dc:creator>Alina_S_Intel</dc:creator>
      <dc:date>2020-12-29T17:46:50Z</dc:date>
    </item>
    <item>
      <title>Re: Re:CPU backend performance issues.</title>
      <link>https://community.intel.com/t5/Intel-oneAPI-DPC-C-Compiler/CPU-backend-performance-issues/m-p/1241834#M876</link>
      <description>&lt;P&gt;Steps:&lt;/P&gt;
&lt;OL&gt;
&lt;LI&gt;Create a new project, select &lt;STRONG&gt;Empty Project&lt;/STRONG&gt;.&lt;/LI&gt;
&lt;LI&gt;Change &lt;STRONG&gt;Platform Toolset&lt;/STRONG&gt; from &lt;STRONG&gt;Visual Studio 2019 (v142)&lt;/STRONG&gt; to&amp;nbsp;&lt;STRONG&gt;Intel(R) oneAPI DPC++ Compiler&lt;/STRONG&gt;.&lt;/LI&gt;
&lt;LI&gt;Change &lt;STRONG&gt;x86&lt;/STRONG&gt; to &lt;STRONG&gt;x64&lt;/STRONG&gt; and &lt;STRONG&gt;Debug&lt;/STRONG&gt; to &lt;STRONG&gt;Release&lt;/STRONG&gt;.&lt;/LI&gt;
&lt;LI&gt;Paste the script and build.&lt;/LI&gt;
&lt;/OL&gt;
&lt;P&gt;* &lt;STRONG&gt;DPC++ Console Application&lt;/STRONG&gt; template project should work too (without having to go through steps 1 and 2).&lt;/P&gt;
&lt;P&gt;For reference, these are the arguments passed to the compiler.&lt;/P&gt;
&lt;LI-CODE lang="markup"&gt;/O2 /Zi /D "NDEBUG" /D "_CONSOLE" /D "_UNICODE" /D "UNICODE" /WX- /MD /EHsc /W1 /nologo /Fo"x64\Release\" &lt;/LI-CODE&gt;
&lt;P&gt;&amp;nbsp;&lt;/P&gt;
&lt;P&gt;As to "&lt;SPAN&gt;which should translate to -O3 by clang-cl", as seen above, I'm using /O2, which is an MSVC option, not a gcc/clang option. However, clang-cl should translate it to -O3.&lt;/SPAN&gt;&lt;/P&gt;
&lt;P&gt;&amp;nbsp;&lt;/P&gt;
&lt;P&gt;&lt;SPAN&gt;I have also attached a zipped file which contains the project and executable along with Intel Advisor's report.&lt;/SPAN&gt;&lt;/P&gt;
&lt;P&gt;&amp;nbsp;&lt;/P&gt;</description>
      <pubDate>Wed, 30 Dec 2020 01:46:00 GMT</pubDate>
      <guid>https://community.intel.com/t5/Intel-oneAPI-DPC-C-Compiler/CPU-backend-performance-issues/m-p/1241834#M876</guid>
      <dc:creator>ChoonHo</dc:creator>
      <dc:date>2020-12-30T01:46:00Z</dc:date>
    </item>
    <item>
      <title>Re:CPU backend performance issues.</title>
      <link>https://community.intel.com/t5/Intel-oneAPI-DPC-C-Compiler/CPU-backend-performance-issues/m-p/1242089#M880</link>
      <description>&lt;P&gt;Thanks for sharing!&lt;/P&gt;&lt;P&gt;&lt;BR /&gt;&lt;/P&gt;&lt;P&gt;&lt;SPAN style="font-family: Consolas, Monaco, &amp;quot;Andale Mono&amp;quot;, &amp;quot;Ubuntu Mono&amp;quot;, monospace; font-size: 14px;"&gt;/Zi&amp;nbsp;&lt;/SPAN&gt;tells the compiler to generate full debugging information, and call instructions are generated when it is enabled. Without this option, there are no callq instructions. Please note that /Zi is not recommended for use in release code. So, this is not a bug.&lt;/P&gt;&lt;P&gt;&lt;BR /&gt;&lt;/P&gt;&lt;P&gt;Also, please note that the O0-O3 options are supported by the dpcpp \ icx compilers as well.&lt;/P&gt;&lt;BR /&gt;</description>
      <pubDate>Wed, 30 Dec 2020 18:02:55 GMT</pubDate>
      <guid>https://community.intel.com/t5/Intel-oneAPI-DPC-C-Compiler/CPU-backend-performance-issues/m-p/1242089#M880</guid>
      <dc:creator>Alina_S_Intel</dc:creator>
      <dc:date>2020-12-30T18:02:55Z</dc:date>
    </item>
    <item>
      <title>Re: Re:CPU backend performance issues.</title>
      <link>https://community.intel.com/t5/Intel-oneAPI-DPC-C-Compiler/CPU-backend-performance-issues/m-p/1242230#M882</link>
      <description>&lt;P&gt;Yes, that works.&lt;/P&gt;
&lt;P&gt;And the generated assembly is much much better, see attached image.&lt;/P&gt;
&lt;P&gt;Finally, is there any way to use Intel loop directives&amp;nbsp;(&lt;A href="https://software.intel.com/content/www/us/en/develop/documentation/oneapi-fpga-optimization-guide/top/fpga-optimization-flags-attributes-pragmas-and-extensions/loop-directives.html" target="_self"&gt;FPGA loop directives&lt;/A&gt;)&amp;nbsp;for a CPU/GPU kernel, like &lt;FONT face="courier new,courier"&gt;[[intel::invdep]]&lt;/FONT&gt;?&lt;/P&gt;
&lt;P&gt;Using the same example,&lt;SPAN&gt;&lt;FONT face="courier new,courier"&gt;&amp;nbsp;c[y * c_stride + x] = a[y * a_stride + x] + b[y * b_stride + x]&lt;/FONT&gt;, I believe the optimizer detects possible memory aliasing here (&lt;FONT face="courier new,courier"&gt;y * stride&lt;/FONT&gt;), and disables other loop transformations, like loop unrolling, permutation, tiling, etc.&lt;/SPAN&gt;&lt;/P&gt;
&lt;P&gt;&amp;nbsp;&lt;/P&gt;</description>
      <pubDate>Thu, 31 Dec 2020 01:41:35 GMT</pubDate>
      <guid>https://community.intel.com/t5/Intel-oneAPI-DPC-C-Compiler/CPU-backend-performance-issues/m-p/1242230#M882</guid>
      <dc:creator>ChoonHo</dc:creator>
      <dc:date>2020-12-31T01:41:35Z</dc:date>
    </item>
    <item>
      <title>Re:CPU backend performance issues.</title>
      <link>https://community.intel.com/t5/Intel-oneAPI-DPC-C-Compiler/CPU-backend-performance-issues/m-p/1283077#M1165</link>
      <description>&lt;P&gt;Hi,&amp;nbsp;&lt;/P&gt;&lt;P&gt;Thanks for the confirmation!&lt;/P&gt;&lt;P&gt;As this issue has been resolved, we will no longer respond to this thread.&amp;nbsp;&lt;/P&gt;&lt;P&gt;If you require any additional assistance from Intel, please start a new thread.&amp;nbsp;&lt;/P&gt;&lt;P&gt;Any further interaction in this thread will be considered community only.&amp;nbsp;&lt;/P&gt;&lt;P&gt;Have a Good day.&lt;/P&gt;&lt;P&gt;&lt;BR /&gt;&lt;/P&gt;&lt;P&gt;&lt;I&gt;Thanks &amp;amp; Regards&lt;/I&gt;&lt;/P&gt;&lt;P&gt;&lt;I&gt;Goutham&lt;/I&gt;&lt;/P&gt;&lt;BR /&gt;</description>
      <pubDate>Thu, 20 May 2021 07:28:41 GMT</pubDate>
      <guid>https://community.intel.com/t5/Intel-oneAPI-DPC-C-Compiler/CPU-backend-performance-issues/m-p/1283077#M1165</guid>
      <dc:creator>GouthamK_Intel</dc:creator>
      <dc:date>2021-05-20T07:28:41Z</dc:date>
    </item>
  </channel>
</rss>

