<?xml version="1.0" encoding="UTF-8"?>
<rss xmlns:content="http://purl.org/rss/1.0/modules/content/" xmlns:dc="http://purl.org/dc/elements/1.1/" xmlns:rdf="http://www.w3.org/1999/02/22-rdf-syntax-ns#" xmlns:taxo="http://purl.org/rss/1.0/modules/taxonomy/" version="2.0">
  <channel>
    <title>topic UCX ERROR with Intel MPI 2021.1.1 in Intel® MPI Library</title>
    <link>https://community.intel.com/t5/Intel-MPI-Library/UCX-ERROR-with-Intel-MPI-2021-1-1/m-p/1535715#M11039</link>
    <description>&lt;P&gt;Hello,&lt;/P&gt;&lt;P&gt;I was running MPI job on multiple nodes with Intel MPI 2021.1.1, jobs aborted due to the following error:&lt;/P&gt;&lt;P&gt;&amp;nbsp;&lt;/P&gt;&lt;P&gt;[1690463626.483072] [n148:434957:0] cma_ep.c:62 UCX ERROR process_vm_readv(pid=434958 length=42432) returned -1: No such process&lt;BR /&gt;[1690463626.521152] [n148:434969:0] cma_ep.c:62 UCX ERROR process_vm_readv(pid=434968 length=42432) returned -1: No such process&lt;BR /&gt;[1690463626.522181] [n148:434970:0] cma_ep.c:62 UCX ERROR process_vm_readv(pid=434969 length=42432) returned -1: No such process&lt;/P&gt;&lt;P&gt;&amp;nbsp;&lt;/P&gt;&lt;P&gt;===================================================================================&lt;BR /&gt;= BAD TERMINATION OF ONE OF YOUR APPLICATION PROCESSES&lt;BR /&gt;= RANK 0 PID 434942 RUNNING AT n148&lt;BR /&gt;= KILLED BY SIGNAL: 9 (Killed)&lt;BR /&gt;===================================================================================&lt;/P&gt;&lt;P&gt;===================================================================================&lt;BR /&gt;= BAD TERMINATION OF ONE OF YOUR APPLICATION PROCESSES&lt;BR /&gt;= RANK 0 PID 434942 RUNNING AT n148&lt;BR /&gt;= KILLED BY SIGNAL: 9 (Killed)&lt;BR /&gt;===================================================================================&lt;BR /&gt;...&lt;/P&gt;&lt;P&gt;&amp;nbsp;&lt;/P&gt;&lt;P&gt;Under what conditions does this error occur?&lt;/P&gt;&lt;P&gt;It is difficult to provide detailed information such as execution script, but I hope to obtain some clues for resolving this error.&lt;/P&gt;&lt;P&gt;MPI job was running on 16 nodes, and the same job was running on other nodes at the same time.&lt;/P&gt;&lt;P&gt;Information on OS, kernel, and ucx versions is below:&lt;BR /&gt;&amp;nbsp; OS: CentOS 8.4&lt;BR /&gt;&amp;nbsp; kernel: 4.18.0-305.25.1.el8_4.x86_64&lt;BR /&gt;&amp;nbsp; OFED: MLNX_OFED_LINUX-4.9-4.0.8.0&lt;BR /&gt;&amp;nbsp; UCX: 
1.8.0&lt;/P&gt;&lt;P&gt;&amp;nbsp;&lt;/P&gt;&lt;P&gt;Thanks,&lt;/P&gt;&lt;P&gt;1kan&lt;/P&gt;</description>
    <pubDate>Fri, 20 Oct 2023 02:55:50 GMT</pubDate>
    <dc:creator>1kan</dc:creator>
    <dc:date>2023-10-20T02:55:50Z</dc:date>
    <item>
      <title>UCX ERROR with Intel MPI 2021.1.1</title>
      <link>https://community.intel.com/t5/Intel-MPI-Library/UCX-ERROR-with-Intel-MPI-2021-1-1/m-p/1535715#M11039</link>
      <description>&lt;P&gt;Hello,&lt;/P&gt;&lt;P&gt;I was running MPI job on multiple nodes with Intel MPI 2021.1.1, jobs aborted due to the following error:&lt;/P&gt;&lt;P&gt;&amp;nbsp;&lt;/P&gt;&lt;P&gt;[1690463626.483072] [n148:434957:0] cma_ep.c:62 UCX ERROR process_vm_readv(pid=434958 length=42432) returned -1: No such process&lt;BR /&gt;[1690463626.521152] [n148:434969:0] cma_ep.c:62 UCX ERROR process_vm_readv(pid=434968 length=42432) returned -1: No such process&lt;BR /&gt;[1690463626.522181] [n148:434970:0] cma_ep.c:62 UCX ERROR process_vm_readv(pid=434969 length=42432) returned -1: No such process&lt;/P&gt;&lt;P&gt;&amp;nbsp;&lt;/P&gt;&lt;P&gt;===================================================================================&lt;BR /&gt;= BAD TERMINATION OF ONE OF YOUR APPLICATION PROCESSES&lt;BR /&gt;= RANK 0 PID 434942 RUNNING AT n148&lt;BR /&gt;= KILLED BY SIGNAL: 9 (Killed)&lt;BR /&gt;===================================================================================&lt;/P&gt;&lt;P&gt;===================================================================================&lt;BR /&gt;= BAD TERMINATION OF ONE OF YOUR APPLICATION PROCESSES&lt;BR /&gt;= RANK 0 PID 434942 RUNNING AT n148&lt;BR /&gt;= KILLED BY SIGNAL: 9 (Killed)&lt;BR /&gt;===================================================================================&lt;BR /&gt;...&lt;/P&gt;&lt;P&gt;&amp;nbsp;&lt;/P&gt;&lt;P&gt;Under what conditions does this error occur?&lt;/P&gt;&lt;P&gt;It is difficult to provide detailed information such as execution script, but I hope to obtain some clues for resolving this error.&lt;/P&gt;&lt;P&gt;MPI job was running on 16 nodes, and the same job was running on other nodes at the same time.&lt;/P&gt;&lt;P&gt;Information on OS, kernel, and ucx versions is below:&lt;BR /&gt;&amp;nbsp; OS: CentOS 8.4&lt;BR /&gt;&amp;nbsp; kernel: 4.18.0-305.25.1.el8_4.x86_64&lt;BR /&gt;&amp;nbsp; OFED: MLNX_OFED_LINUX-4.9-4.0.8.0&lt;BR /&gt;&amp;nbsp; UCX: 
1.8.0&lt;/P&gt;&lt;P&gt;&amp;nbsp;&lt;/P&gt;&lt;P&gt;Thanks,&lt;/P&gt;&lt;P&gt;1kan&lt;/P&gt;</description>
      <pubDate>Fri, 20 Oct 2023 02:55:50 GMT</pubDate>
      <guid>https://community.intel.com/t5/Intel-MPI-Library/UCX-ERROR-with-Intel-MPI-2021-1-1/m-p/1535715#M11039</guid>
      <dc:creator>1kan</dc:creator>
      <dc:date>2023-10-20T02:55:50Z</dc:date>
    </item>
    <item>
      <title>Re:UCX ERROR with Intel MPI 2021.1.1</title>
      <link>https://community.intel.com/t5/Intel-MPI-Library/UCX-ERROR-with-Intel-MPI-2021-1-1/m-p/1536245#M11047</link>
      <description>&lt;P&gt;Hi,&lt;/P&gt;&lt;P&gt;&lt;BR /&gt;&lt;/P&gt;&lt;P&gt;Thanks for posting in the Intel forums.&lt;/P&gt;&lt;P&gt;&lt;BR /&gt;&lt;/P&gt;&lt;P&gt;Could you please let us know whether you are facing a similar issue with the latest version of Intel oneAPI 2023.2?&lt;/P&gt;&lt;P&gt;&lt;BR /&gt;&lt;/P&gt;&lt;P&gt;Could you please try with a supported OS version? For more details, please refer to the link below.&lt;/P&gt;&lt;P&gt;&lt;BR /&gt;&lt;/P&gt;&lt;P&gt;&lt;A href="https://www.intel.com/content/www/us/en/developer/articles/system-requirements/mpi-library-system-requirements.html" target="_blank"&gt;https://www.intel.com/content/www/us/en/developer/articles/system-requirements/mpi-library-system-requirements.html&lt;/A&gt;&lt;/P&gt;&lt;P&gt;&lt;BR /&gt;&lt;/P&gt;&lt;P&gt;Please provide us with the complete debug log obtained by setting I_MPI_DEBUG=10, and also the command line you have been using.&lt;/P&gt;&lt;P&gt;&lt;BR /&gt;&lt;/P&gt;&lt;P&gt;Thanks &amp;amp; Regards&lt;/P&gt;&lt;P&gt;Shivani&lt;/P&gt;&lt;BR /&gt;</description>
      <pubDate>Mon, 23 Oct 2023 05:46:05 GMT</pubDate>
      <guid>https://community.intel.com/t5/Intel-MPI-Library/UCX-ERROR-with-Intel-MPI-2021-1-1/m-p/1536245#M11047</guid>
      <dc:creator>ShivaniK_Intel</dc:creator>
      <dc:date>2023-10-23T05:46:05Z</dc:date>
    </item>
    <item>
      <title>Re: UCX ERROR with Intel MPI 2021.1.1</title>
      <link>https://community.intel.com/t5/Intel-MPI-Library/UCX-ERROR-with-Intel-MPI-2021-1-1/m-p/1536629#M11050</link>
      <description>&lt;P&gt;&lt;SPAN&gt;Hi Shivani,&lt;/SPAN&gt;&lt;/P&gt;&lt;P&gt;&amp;nbsp;&lt;/P&gt;&lt;P&gt;Thank you for your reply.&lt;/P&gt;&lt;P&gt;Intel oneAPI 2023.2 is not installed on the system I am using.&lt;BR /&gt;I just want to run MPI jobs using Intel oneAPI 2021.1.1.&lt;BR /&gt;If you know anything about what causes this error, please let me know.&lt;/P&gt;&lt;P&gt;&amp;nbsp;&lt;/P&gt;&lt;P&gt;Thanks,&lt;/P&gt;&lt;P&gt;1kan&lt;/P&gt;</description>
      <pubDate>Tue, 24 Oct 2023 02:54:12 GMT</pubDate>
      <guid>https://community.intel.com/t5/Intel-MPI-Library/UCX-ERROR-with-Intel-MPI-2021-1-1/m-p/1536629#M11050</guid>
      <dc:creator>1kan</dc:creator>
      <dc:date>2023-10-24T02:54:12Z</dc:date>
    </item>
    <item>
      <title>Re:UCX ERROR with Intel MPI 2021.1.1</title>
      <link>https://community.intel.com/t5/Intel-MPI-Library/UCX-ERROR-with-Intel-MPI-2021-1-1/m-p/1537909#M11083</link>
      <description>&lt;P&gt;Hi,&lt;/P&gt;&lt;P&gt;&lt;BR /&gt;&lt;/P&gt;&lt;P&gt;Please provide us with the complete debug log obtained by setting I_MPI_DEBUG=10, and also the command line you have been using.&lt;/P&gt;&lt;P&gt;&lt;BR /&gt;&lt;/P&gt;&lt;P&gt;Could you please provide us with a sample reproducer and steps to reproduce the issue at our end?&lt;/P&gt;&lt;P&gt;&lt;BR /&gt;&lt;/P&gt;&lt;P&gt;Could you also please let us know whether you are able to run your application on a single node and the Intel MPI Benchmarks on multiple nodes, which will help us to investigate the issue at our end?&lt;/P&gt;&lt;P&gt;&lt;BR /&gt;&lt;/P&gt;&lt;P&gt;Thanks &amp;amp; Regards&lt;/P&gt;&lt;P&gt;Shivani&lt;/P&gt;&lt;BR /&gt;</description>
      <pubDate>Fri, 27 Oct 2023 09:28:18 GMT</pubDate>
      <guid>https://community.intel.com/t5/Intel-MPI-Library/UCX-ERROR-with-Intel-MPI-2021-1-1/m-p/1537909#M11083</guid>
      <dc:creator>ShivaniK_Intel</dc:creator>
      <dc:date>2023-10-27T09:28:18Z</dc:date>
    </item>
    <item>
      <title>Re:UCX ERROR with Intel MPI 2021.1.1</title>
      <link>https://community.intel.com/t5/Intel-MPI-Library/UCX-ERROR-with-Intel-MPI-2021-1-1/m-p/1540180#M11102</link>
      <description>&lt;P&gt;Hi,&lt;/P&gt;&lt;P&gt;&lt;BR /&gt;&lt;/P&gt;&lt;P&gt;As we did not hear back from you, could you please respond to my previous post?&lt;/P&gt;&lt;P&gt;&lt;BR /&gt;&lt;/P&gt;&lt;P&gt;Thanks &amp;amp; Regards&lt;/P&gt;&lt;P&gt;Shivani&lt;/P&gt;&lt;BR /&gt;</description>
      <pubDate>Fri, 03 Nov 2023 06:44:37 GMT</pubDate>
      <guid>https://community.intel.com/t5/Intel-MPI-Library/UCX-ERROR-with-Intel-MPI-2021-1-1/m-p/1540180#M11102</guid>
      <dc:creator>ShivaniK_Intel</dc:creator>
      <dc:date>2023-11-03T06:44:37Z</dc:date>
    </item>
    <item>
      <title>Re: Re:UCX ERROR with Intel MPI 2021.1.1</title>
      <link>https://community.intel.com/t5/Intel-MPI-Library/UCX-ERROR-with-Intel-MPI-2021-1-1/m-p/1542162#M11121</link>
      <description>&lt;P class=""&gt;&lt;SPAN class=""&gt;Hi Shivani,&lt;/SPAN&gt;&lt;/P&gt;&lt;P class=""&gt;&amp;nbsp;&lt;/P&gt;&lt;P class=""&gt;Sorry for the late reply.&lt;/P&gt;&lt;P class=""&gt;As you suggested, I would consider using Intel oneAPI 2023.2 to run MPI jobs.&lt;/P&gt;&lt;P class=""&gt;&amp;nbsp;&lt;/P&gt;&lt;P class=""&gt;Thanks,&lt;/P&gt;&lt;P class=""&gt;1kan&lt;/P&gt;</description>
      <pubDate>Thu, 09 Nov 2023 07:50:15 GMT</pubDate>
      <guid>https://community.intel.com/t5/Intel-MPI-Library/UCX-ERROR-with-Intel-MPI-2021-1-1/m-p/1542162#M11121</guid>
      <dc:creator>1kan</dc:creator>
      <dc:date>2023-11-09T07:50:15Z</dc:date>
    </item>
    <item>
      <title>Re:UCX ERROR with Intel MPI 2021.1.1</title>
      <link>https://community.intel.com/t5/Intel-MPI-Library/UCX-ERROR-with-Intel-MPI-2021-1-1/m-p/1543169#M11129</link>
      <description>&lt;P&gt;Hi,&lt;/P&gt;&lt;P&gt;&lt;BR /&gt;&lt;/P&gt;&lt;P&gt;Could you please let us know whether you are facing a similar issue with the latest version of Intel oneAPI 2023.2?&lt;/P&gt;&lt;P&gt;&lt;BR /&gt;&lt;/P&gt;&lt;P&gt;Thanks &amp;amp; Regards&lt;/P&gt;&lt;P&gt;Shivani&lt;/P&gt;&lt;P&gt;&lt;BR /&gt;&lt;/P&gt;&lt;BR /&gt;</description>
      <pubDate>Mon, 13 Nov 2023 03:12:09 GMT</pubDate>
      <guid>https://community.intel.com/t5/Intel-MPI-Library/UCX-ERROR-with-Intel-MPI-2021-1-1/m-p/1543169#M11129</guid>
      <dc:creator>ShivaniK_Intel</dc:creator>
      <dc:date>2023-11-13T03:12:09Z</dc:date>
    </item>
    <item>
      <title>Re:UCX ERROR with Intel MPI 2021.1.1</title>
      <link>https://community.intel.com/t5/Intel-MPI-Library/UCX-ERROR-with-Intel-MPI-2021-1-1/m-p/1545458#M11158</link>
      <description>&lt;P&gt;Hi,&lt;/P&gt;&lt;P&gt;&lt;BR /&gt;&lt;/P&gt;&lt;P&gt;As we did not hear back from you, could you please respond to my previous post?&lt;/P&gt;&lt;P&gt;&lt;BR /&gt;&lt;/P&gt;&lt;P&gt;Thanks &amp;amp; Regards&lt;/P&gt;&lt;P&gt;Shivani&lt;/P&gt;&lt;BR /&gt;</description>
      <pubDate>Mon, 20 Nov 2023 05:47:44 GMT</pubDate>
      <guid>https://community.intel.com/t5/Intel-MPI-Library/UCX-ERROR-with-Intel-MPI-2021-1-1/m-p/1545458#M11158</guid>
      <dc:creator>ShivaniK_Intel</dc:creator>
      <dc:date>2023-11-20T05:47:44Z</dc:date>
    </item>
    <item>
      <title>Re:UCX ERROR with Intel MPI 2021.1.1</title>
      <link>https://community.intel.com/t5/Intel-MPI-Library/UCX-ERROR-with-Intel-MPI-2021-1-1/m-p/1547633#M11188</link>
      <description>&lt;P&gt;Hi,&lt;/P&gt;&lt;P&gt;&amp;nbsp;&lt;/P&gt;&lt;P&gt;We have not heard back from you. This thread will no longer be monitored by Intel. If you need any further assistance, please post a new question.&lt;/P&gt;&lt;P&gt;&lt;BR /&gt;&lt;/P&gt;&lt;P&gt;Thanks &amp;amp; Regards&lt;/P&gt;&lt;P&gt;Shivani&lt;/P&gt;&lt;P&gt;&amp;nbsp;&lt;/P&gt;&lt;P&gt;&amp;nbsp;&lt;/P&gt;&lt;BR /&gt;</description>
      <pubDate>Mon, 27 Nov 2023 03:56:21 GMT</pubDate>
      <guid>https://community.intel.com/t5/Intel-MPI-Library/UCX-ERROR-with-Intel-MPI-2021-1-1/m-p/1547633#M11188</guid>
      <dc:creator>ShivaniK_Intel</dc:creator>
      <dc:date>2023-11-27T03:56:21Z</dc:date>
    </item>
  </channel>
</rss>

