<?xml version="1.0" encoding="UTF-8"?>
<rss xmlns:content="http://purl.org/rss/1.0/modules/content/" xmlns:dc="http://purl.org/dc/elements/1.1/" xmlns:rdf="http://www.w3.org/1999/02/22-rdf-syntax-ns#" xmlns:taxo="http://purl.org/rss/1.0/modules/taxonomy/" version="2.0">
  <channel>
    <title>topic Re:Measuring Time inside kernel on intel GPU(P630) in Intel® oneAPI DPC++/C++ Compiler</title>
    <link>https://community.intel.com/t5/Intel-oneAPI-DPC-C-Compiler/Measuring-Time-inside-kernel-on-intel-GPU-P630/m-p/1385225#M2171</link>
    <description>&lt;P&gt;Hi,&lt;/P&gt;&lt;P&gt;&lt;BR /&gt;&lt;/P&gt;&lt;P&gt;Thanks for reaching out to us.&lt;/P&gt;&lt;P&gt;&lt;BR /&gt;&lt;/P&gt;&lt;P&gt;we can measure the actual kernel execution time on the device using DPC++ built-in profiling API.&amp;nbsp;&lt;/P&gt;&lt;P&gt;&lt;BR /&gt;&lt;/P&gt;&lt;P&gt;Please refer to the below link for more details:&lt;/P&gt;&lt;P&gt;&lt;BR /&gt;&lt;/P&gt;&lt;P&gt;&lt;A href="https://www.intel.com/content/www/us/en/develop/documentation/oneapi-gpu-optimization-guide/top/kernels/kernel-launch.html" target="_blank"&gt;https://www.intel.com/content/www/us/en/develop/documentation/oneapi-gpu-optimization-guide/top/kernels/kernel-launch.html&lt;/A&gt;&lt;/P&gt;&lt;P&gt;&lt;BR /&gt;&lt;/P&gt;&lt;P&gt;Please get back to us if you face any issues with a sample reproducer.&lt;/P&gt;&lt;P&gt;&lt;BR /&gt;&lt;/P&gt;&lt;P&gt;Thanks &amp;amp; Regards,&lt;/P&gt;&lt;P&gt;Noorjahan.&lt;/P&gt;&lt;BR /&gt;</description>
    <pubDate>Wed, 18 May 2022 10:54:59 GMT</pubDate>
    <dc:creator>NoorjahanSk_Intel</dc:creator>
    <dc:date>2022-05-18T10:54:59Z</dc:date>
    <item>
      <title>Measuring Time inside kernel on intel GPU(P630)</title>
      <link>https://community.intel.com/t5/Intel-oneAPI-DPC-C-Compiler/Measuring-Time-inside-kernel-on-intel-GPU-P630/m-p/1384741#M2156</link>
      <description>&lt;P&gt;I have a fair amount of experience with GPU programming using CUDA. I used to use the clock function inside a CUDA kernel (as mentioned here) to measure the ticks of certain operations inside the kernel. I wrote a simple oneAPI kernel and tried to run it on the Intel integrated GPU. &lt;SPAN&gt;Errors are generated.&lt;/SPAN&gt;&lt;/P&gt;
&lt;LI-CODE lang="cpp"&gt;__kernel void testVecAdd(__global const int *a,__global const int *b,__global int *c,
                 __global float *t){

clock_t start = clock();

 int gid = get_global_id(0);
 c[gid] = a[gid] + b[gid];

 t[gid] = (float)(clock()-start)/CLOCKS_PER_SEC;

}&lt;/LI-CODE&gt;
&lt;P&gt;error info:&lt;/P&gt;
&lt;LI-CODE lang="bash"&gt;Native API returns: -999 (Unknown OpenCL error code) -999 (Unknown OpenCL error code)Exception caught at file:latency.cpp, line:500&lt;/LI-CODE&gt;
&lt;P&gt;&amp;nbsp;How can I fix it? Thanks.&lt;/P&gt;</description>
      <pubDate>Tue, 17 May 2022 03:29:37 GMT</pubDate>
      <guid>https://community.intel.com/t5/Intel-oneAPI-DPC-C-Compiler/Measuring-Time-inside-kernel-on-intel-GPU-P630/m-p/1384741#M2156</guid>
      <dc:creator>PcDack1</dc:creator>
      <dc:date>2022-05-17T03:29:37Z</dc:date>
    </item>
    <item>
      <title>Re:Measuring Time inside kernel on intel GPU(P630)</title>
      <link>https://community.intel.com/t5/Intel-oneAPI-DPC-C-Compiler/Measuring-Time-inside-kernel-on-intel-GPU-P630/m-p/1385225#M2171</link>
      <description>&lt;P&gt;Hi,&lt;/P&gt;&lt;P&gt;&lt;BR /&gt;&lt;/P&gt;&lt;P&gt;Thanks for reaching out to us.&lt;/P&gt;&lt;P&gt;&lt;BR /&gt;&lt;/P&gt;&lt;P&gt;we can measure the actual kernel execution time on the device using DPC++ built-in profiling API.&amp;nbsp;&lt;/P&gt;&lt;P&gt;&lt;BR /&gt;&lt;/P&gt;&lt;P&gt;Please refer to the below link for more details:&lt;/P&gt;&lt;P&gt;&lt;BR /&gt;&lt;/P&gt;&lt;P&gt;&lt;A href="https://www.intel.com/content/www/us/en/develop/documentation/oneapi-gpu-optimization-guide/top/kernels/kernel-launch.html" target="_blank"&gt;https://www.intel.com/content/www/us/en/develop/documentation/oneapi-gpu-optimization-guide/top/kernels/kernel-launch.html&lt;/A&gt;&lt;/P&gt;&lt;P&gt;&lt;BR /&gt;&lt;/P&gt;&lt;P&gt;Please get back to us if you face any issues with a sample reproducer.&lt;/P&gt;&lt;P&gt;&lt;BR /&gt;&lt;/P&gt;&lt;P&gt;Thanks &amp;amp; Regards,&lt;/P&gt;&lt;P&gt;Noorjahan.&lt;/P&gt;&lt;BR /&gt;</description>
      <pubDate>Wed, 18 May 2022 10:54:59 GMT</pubDate>
      <guid>https://community.intel.com/t5/Intel-oneAPI-DPC-C-Compiler/Measuring-Time-inside-kernel-on-intel-GPU-P630/m-p/1385225#M2171</guid>
      <dc:creator>NoorjahanSk_Intel</dc:creator>
      <dc:date>2022-05-18T10:54:59Z</dc:date>
    </item>
    <item>
      <title>Re: Measuring Time inside kernel on intel GPU(P630)</title>
      <link>https://community.intel.com/t5/Intel-oneAPI-DPC-C-Compiler/Measuring-Time-inside-kernel-on-intel-GPU-P630/m-p/1385422#M2176</link>
      <description>&lt;P&gt;Hi&amp;nbsp;&lt;SPAN&gt;Noorjahan,&lt;/SPAN&gt;&lt;/P&gt;
&lt;P&gt;&amp;nbsp;&lt;/P&gt;
&lt;P&gt;&lt;SPAN&gt;Thanks for your answer. I would like to use this &lt;A href="https://arxiv.org/pdf/1509.02308" target="_self"&gt;method&lt;/A&gt; to measure memory latency, so using a profiler tool does not seem suitable for that. Is there a tool in oneAPI to measure memory latency?&lt;/SPAN&gt;&lt;/P&gt;
&lt;P&gt;&amp;nbsp;&lt;/P&gt;
&lt;P&gt;&lt;SPAN&gt;Thanks &amp;amp; Regards,&lt;/SPAN&gt;&lt;/P&gt;
&lt;P&gt;&lt;SPAN&gt;Dack.&lt;/SPAN&gt;&lt;/P&gt;</description>
      <pubDate>Thu, 19 May 2022 00:22:31 GMT</pubDate>
      <guid>https://community.intel.com/t5/Intel-oneAPI-DPC-C-Compiler/Measuring-Time-inside-kernel-on-intel-GPU-P630/m-p/1385422#M2176</guid>
      <dc:creator>PcDack1</dc:creator>
      <dc:date>2022-05-19T00:22:31Z</dc:date>
    </item>
    <item>
      <title>Re:Measuring Time inside kernel on intel GPU(P630)</title>
      <link>https://community.intel.com/t5/Intel-oneAPI-DPC-C-Compiler/Measuring-Time-inside-kernel-on-intel-GPU-P630/m-p/1386945#M2196</link>
      <description>&lt;P&gt;Hi,&lt;/P&gt;&lt;P&gt;&lt;BR /&gt;&lt;/P&gt;&lt;P&gt;You can try using the Intel® Memory Latency Checker v3.9a tool to get memory latency.&lt;/P&gt;&lt;P&gt;&lt;BR /&gt;&lt;/P&gt;&lt;P&gt;Please refer to the below link for more details regarding the MLC tool.&lt;/P&gt;&lt;P&gt;&lt;A href="https://www.intel.com/content/www/us/en/developer/articles/tool/intelr-memory-latency-checker.html" target="_blank"&gt;https://www.intel.com/content/www/us/en/developer/articles/tool/intelr-memory-latency-checker.html&lt;/A&gt;&lt;/P&gt;&lt;P&gt;&lt;BR /&gt;&lt;/P&gt;&lt;P&gt;You can also use the VTune Profiler tool, which is included in the oneAPI Base Toolkit, to get memory latency.&lt;/P&gt;&lt;P&gt;&lt;BR /&gt;&lt;/P&gt;&lt;P&gt;Please refer to the below link for more details:&lt;/P&gt;&lt;P&gt;&lt;A href="https://www.intel.com/content/www/us/en/develop/documentation/vtune-help/top/reference/cpu-metrics-reference/memory-bound/dram-bound/memory-latency.html" target="_blank"&gt;https://www.intel.com/content/www/us/en/develop/documentation/vtune-help/top/reference/cpu-metrics-reference/memory-bound/dram-bound/memory-latency.html&lt;/A&gt;&lt;/P&gt;&lt;P&gt;&lt;BR /&gt;&lt;/P&gt;&lt;P&gt;Please let us know whether this tool matches your use case.&lt;/P&gt;&lt;P&gt;&lt;BR /&gt;&lt;/P&gt;&lt;P&gt;Thanks &amp;amp; Regards,&lt;/P&gt;&lt;P&gt;Noorjahan.&lt;/P&gt;&lt;BR /&gt;</description>
      <pubDate>Tue, 24 May 2022 10:54:04 GMT</pubDate>
      <guid>https://community.intel.com/t5/Intel-oneAPI-DPC-C-Compiler/Measuring-Time-inside-kernel-on-intel-GPU-P630/m-p/1386945#M2196</guid>
      <dc:creator>NoorjahanSk_Intel</dc:creator>
      <dc:date>2022-05-24T10:54:04Z</dc:date>
    </item>
    <item>
      <title>Re: Re:Measuring Time inside kernel on intel GPU(P630)</title>
      <link>https://community.intel.com/t5/Intel-oneAPI-DPC-C-Compiler/Measuring-Time-inside-kernel-on-intel-GPU-P630/m-p/1387519#M2207</link>
      <description>&lt;P&gt;Hi&amp;nbsp;&lt;SPAN&gt;Noorjahan,&lt;/SPAN&gt;&lt;/P&gt;
&lt;P&gt;&amp;nbsp;&lt;/P&gt;
&lt;P&gt;&lt;SPAN&gt;Thank you for your answer. First, I think the Intel® Memory Latency Checker v3.9a tool only works on the CPU, and I now want to test the GPU's memory latency. Secondly, the VTune profiler tool can only get the L3 Miss of the GPU; I can't get the L1 and L2 Miss. Does the tool exist for me to get GPUs(HD serial) L1 and L2 Miss?&lt;/SPAN&gt;&lt;/P&gt;
&lt;P&gt;&amp;nbsp;&lt;/P&gt;
&lt;P&gt;&lt;SPAN&gt;Thanks &amp;amp; Regards,&lt;/SPAN&gt;&lt;/P&gt;
&lt;P&gt;&lt;SPAN&gt;Dack.&lt;/SPAN&gt;&lt;/P&gt;</description>
      <pubDate>Thu, 26 May 2022 00:57:00 GMT</pubDate>
      <guid>https://community.intel.com/t5/Intel-oneAPI-DPC-C-Compiler/Measuring-Time-inside-kernel-on-intel-GPU-P630/m-p/1387519#M2207</guid>
      <dc:creator>PcDack1</dc:creator>
      <dc:date>2022-05-26T00:57:00Z</dc:date>
    </item>
    <item>
      <title>Re:Measuring Time inside kernel on intel GPU(P630)</title>
      <link>https://community.intel.com/t5/Intel-oneAPI-DPC-C-Compiler/Measuring-Time-inside-kernel-on-intel-GPU-P630/m-p/1390505#M2258</link>
      <description>&lt;P&gt;Hi,&lt;/P&gt;&lt;P&gt;&lt;BR /&gt;&lt;/P&gt;&lt;P&gt;We are checking with the concerned team and we will get back to you soon.&lt;/P&gt;&lt;P&gt;&lt;BR /&gt;&lt;/P&gt;&lt;P&gt;Thanks &amp;amp; Regards,&lt;/P&gt;&lt;P&gt;Noorjahan.&lt;/P&gt;&lt;BR /&gt;</description>
      <pubDate>Tue, 07 Jun 2022 06:38:44 GMT</pubDate>
      <guid>https://community.intel.com/t5/Intel-oneAPI-DPC-C-Compiler/Measuring-Time-inside-kernel-on-intel-GPU-P630/m-p/1390505#M2258</guid>
      <dc:creator>NoorjahanSk_Intel</dc:creator>
      <dc:date>2022-06-07T06:38:44Z</dc:date>
    </item>
    <item>
      <title>Re:Measuring Time inside kernel on intel GPU(P630)</title>
      <link>https://community.intel.com/t5/Intel-oneAPI-DPC-C-Compiler/Measuring-Time-inside-kernel-on-intel-GPU-P630/m-p/1393363#M2282</link>
      <description>&lt;P&gt;Hi,&lt;/P&gt;&lt;P&gt;&lt;BR /&gt;&lt;/P&gt;&lt;P&gt;&lt;EM&gt;&amp;gt;&amp;gt; Does the tool exist for me to get GPUs(HD serial) L1 and L2 Miss?&lt;/EM&gt;&lt;/P&gt;&lt;P&gt;&lt;BR /&gt;&lt;/P&gt;&lt;P&gt;In Gen9 compute architecture, the sampler/images includes L1 and L2 cache Miss and buffers include L3 cache miss.&lt;/P&gt;&lt;P&gt;You can get the L1 and L2 miss using the Vtune profiler if you use sycl images/samplers in your application.&lt;/P&gt;&lt;P&gt;&lt;BR /&gt;&lt;/P&gt;&lt;P&gt;Please refer to the below link for more details:&lt;/P&gt;&lt;P&gt;&lt;A href="https://www.intel.com/content/dam/develop/external/us/en/documents/the-compute-architecture-of-intel-processor-graphics-gen9-v1d0.pdf#page=10" target="_blank"&gt;https://www.intel.com/content/dam/develop/external/us/en/documents/the-compute-architecture-of-intel-processor-graphics-gen9-v1d0.pdf#page=10&lt;/A&gt;&lt;/P&gt;&lt;P&gt;&lt;BR /&gt;&lt;/P&gt;&lt;P&gt;Thanks &amp;amp; Regards,&lt;/P&gt;&lt;P&gt;Noorjahan.&lt;/P&gt;&lt;P&gt;&lt;BR /&gt;&lt;/P&gt;&lt;BR /&gt;</description>
      <pubDate>Fri, 17 Jun 2022 09:36:51 GMT</pubDate>
      <guid>https://community.intel.com/t5/Intel-oneAPI-DPC-C-Compiler/Measuring-Time-inside-kernel-on-intel-GPU-P630/m-p/1393363#M2282</guid>
      <dc:creator>NoorjahanSk_Intel</dc:creator>
      <dc:date>2022-06-17T09:36:51Z</dc:date>
    </item>
    <item>
      <title>Re:Measuring Time inside kernel on intel GPU(P630)</title>
      <link>https://community.intel.com/t5/Intel-oneAPI-DPC-C-Compiler/Measuring-Time-inside-kernel-on-intel-GPU-P630/m-p/1395604#M2311</link>
      <description>&lt;P&gt;Hi,&lt;/P&gt;&lt;P&gt;&lt;BR /&gt;&lt;/P&gt;&lt;P&gt;We haven't heard back from you. Could you please provide an update on your issue?&lt;/P&gt;&lt;P&gt;&lt;BR /&gt;&lt;/P&gt;&lt;P&gt;Thanks &amp;amp; Regards,&lt;/P&gt;&lt;P&gt;Noorjahan&lt;/P&gt;&lt;BR /&gt;</description>
      <pubDate>Mon, 27 Jun 2022 09:22:52 GMT</pubDate>
      <guid>https://community.intel.com/t5/Intel-oneAPI-DPC-C-Compiler/Measuring-Time-inside-kernel-on-intel-GPU-P630/m-p/1395604#M2311</guid>
      <dc:creator>NoorjahanSk_Intel</dc:creator>
      <dc:date>2022-06-27T09:22:52Z</dc:date>
    </item>
    <item>
      <title>Re:Measuring Time inside kernel on intel GPU(P630)</title>
      <link>https://community.intel.com/t5/Intel-oneAPI-DPC-C-Compiler/Measuring-Time-inside-kernel-on-intel-GPU-P630/m-p/1395610#M2312</link>
      <description>&lt;P&gt;Hi,&lt;/P&gt;&lt;P&gt;&lt;BR /&gt;&lt;/P&gt;&lt;P&gt;Thanks for accepting our solution.&lt;/P&gt;&lt;P&gt;&lt;BR /&gt;&lt;/P&gt;&lt;P&gt;As this issue has been resolved, we will no longer respond to this thread. If you need any additional information, please submit a new question.&lt;/P&gt;&lt;P&gt;&lt;BR /&gt;&lt;/P&gt;&lt;P&gt;&lt;BR /&gt;&lt;/P&gt;&lt;P&gt;Thanks &amp;amp; Regards,&lt;/P&gt;&lt;P&gt;Noorjahan.&lt;/P&gt;&lt;BR /&gt;</description>
      <pubDate>Mon, 27 Jun 2022 09:39:19 GMT</pubDate>
      <guid>https://community.intel.com/t5/Intel-oneAPI-DPC-C-Compiler/Measuring-Time-inside-kernel-on-intel-GPU-P630/m-p/1395610#M2312</guid>
      <dc:creator>NoorjahanSk_Intel</dc:creator>
      <dc:date>2022-06-27T09:39:19Z</dc:date>
    </item>
  </channel>
</rss>

