Skip to content

Commit d03a471

Browse files
Merge pull request #20950 from danwinship/egressip-ping-errors
Improve egress IP node-offline-tracking error checking
2 parents 1a61ff2 + 7dbbfda commit d03a471

File tree

1 file changed

+16
-9
lines changed

1 file changed

+16
-9
lines changed

pkg/network/common/egressip.go

+16-9
Original file line numberDiff line numberDiff line change
@@ -3,7 +3,9 @@ package common
33
import (
44
"fmt"
55
"net"
6+
"os"
67
"sync"
8+
"syscall"
79
"time"
810

911
"github.com/golang/glog"
@@ -468,11 +470,12 @@ func (eit *EgressIPTracker) lookupNodeIP(ip string) string {
468470
return ip
469471
}
470472

471-
// Ping a node and return whether or not it is online. We do this by trying to open a TCP
472-
// connection to the "discard" service (port 9); if the node is offline, the attempt will
473-
// time out with no response (and we will return false). If the node is online then we
474-
// presumably will get a "connection refused" error; the code below assumes that anything
475-
// other than timing out indicates that the node is online.
473+
// Ping a node and return whether or not we think it is online. We do this by trying to
474+
// open a TCP connection to the "discard" service (port 9); if the node is offline, the
475+
// attempt will either time out with no response, or else return "no route to host" (and
476+
// we will return false). If the node is online then we presumably will get a "connection
477+
// refused" error; but the code below assumes that anything other than timeout or "no
478+
// route" indicates that the node is online.
476479
func (eit *EgressIPTracker) Ping(ip string, timeout time.Duration) bool {
477480
// If the caller used a public node IP, replace it with the SDN IP
478481
ip = eit.lookupNodeIP(ip)
@@ -481,11 +484,15 @@ func (eit *EgressIPTracker) Ping(ip string, timeout time.Duration) bool {
481484
if conn != nil {
482485
conn.Close()
483486
}
484-
if opErr, ok := err.(*net.OpError); ok && opErr.Timeout() {
485-
return false
486-
} else {
487-
return true
487+
if opErr, ok := err.(*net.OpError); ok {
488+
if opErr.Timeout() {
489+
return false
490+
}
491+
if sysErr, ok := opErr.Err.(*os.SyscallError); ok && sysErr.Err == syscall.EHOSTUNREACH {
492+
return false
493+
}
488494
}
495+
return true
489496
}
490497

491498
// Finds the best node to allocate the egress IP to, given the existing allocation. The

0 commit comments

Comments
 (0)