Skip to content

Commit a88ae33

Browse files
authored
Merge pull request #3077 from jsquyres/pr/tcp-btl-make-the-output-optional
btl/tcp: direct a warning message to show_help
2 parents 4f810d5 + 5b484c9 commit a88ae33

File tree

2 files changed

+25
-7
lines changed

2 files changed

+25
-7
lines changed

opal/mca/btl/tcp/btl_tcp_proc.c

Lines changed: 9 additions & 6 deletions
Original file line numberDiff line numberDiff line change
@@ -16,7 +16,7 @@
1616
* and Technology (RIST). All rights reserved.
1717
* Copyright (c) 2015-2016 Los Alamos National Security, LLC. All rights
1818
* reserved.
19-
* Copyright (c) 2015 Cisco Systems, Inc. All rights reserved.
19+
* Copyright (c) 2015-2017 Cisco Systems, Inc. All rights reserved.
2020
* $COPYRIGHT$
2121
*
2222
* Additional copyrights may follow
@@ -41,6 +41,7 @@
4141
#include "opal/util/if.h"
4242
#include "opal/util/net.h"
4343
#include "opal/util/proc.h"
44+
#include "opal/util/show_help.h"
4445

4546
#include "btl_tcp.h"
4647
#include "btl_tcp_proc.h"
@@ -846,11 +847,13 @@ void mca_btl_tcp_proc_accept(mca_btl_tcp_proc_t* btl_proc, struct sockaddr* addr
846847
len = 1024 - strlen(addr_str);
847848
}
848849
}
849-
opal_output(0, "btl: tcp: Incoming connection from %s does not match known addresses for peer %s [hostname=%s addr=%s]. Drop !\n",
850-
opal_net_get_hostname((struct sockaddr*)addr),
851-
OPAL_NAME_PRINT(btl_proc->proc_opal->proc_name),
852-
btl_proc->proc_opal->proc_hostname,
853-
addr_str);
850+
opal_show_help("help-mpi-btl-tcp.txt", "dropped inbound connection",
851+
true, opal_process_info.nodename,
852+
getpid(),
853+
btl_proc->proc_opal->proc_hostname,
854+
OPAL_NAME_PRINT(btl_proc->proc_opal->proc_name),
855+
opal_net_get_hostname((struct sockaddr*)addr),
856+
addr_str);
854857
free(addr_str);
855858
}
856859
OPAL_THREAD_UNLOCK(&btl_proc->proc_lock);

opal/mca/btl/tcp/help-mpi-btl-tcp.txt

Lines changed: 16 additions & 1 deletion
Original file line numberDiff line numberDiff line change
@@ -1,6 +1,6 @@
11
# -*- text -*-
22
#
3-
# Copyright (c) 2009-2016 Cisco Systems, Inc. All rights reserved.
3+
# Copyright (c) 2009-2017 Cisco Systems, Inc. All rights reserved.
44
# Copyright (c) 2015-2016 The University of Tennessee and The University
55
# of Tennessee Research Foundation. All rights
66
# reserved.
@@ -85,3 +85,18 @@ or other external events.
8585
Local PID: %d
8686
Peer host: %s
8787
#
88+
[dropped inbound connection]
89+
Open MPI detected an inbound MPI TCP connection request from a peer
90+
that appears to be part of this MPI job (i.e., it identified itself as
91+
part of this Open MPI job), but it is from an IP address that is
92+
unexpected. This is highly unusual.
93+
94+
The inbound connection has been dropped, and the peer should simply
95+
try again with a different IP interface (i.e., the job should
96+
hopefully be able to continue).
97+
98+
Local host: %s
99+
Local PID: %d
100+
Peer hostname: %s (%s)
101+
Source IP of socket: %s
102+
Known IPs of peer: %s

0 commit comments

Comments
 (0)