553 lines
17 KiB
Go
553 lines
17 KiB
Go
//go:build windows && cgo
|
|
|
|
package ingress
|
|
|
|
/*
|
|
#include <iphlpapi.h>
|
|
#include <icmpapi.h>
|
|
*/
|
|
import "C"
|
|
import (
|
|
"context"
|
|
"encoding/binary"
|
|
"fmt"
|
|
"net/netip"
|
|
"runtime/debug"
|
|
"syscall"
|
|
"time"
|
|
"unsafe"
|
|
|
|
"github.com/google/gopacket/layers"
|
|
"github.com/pkg/errors"
|
|
"github.com/rs/zerolog"
|
|
"go.opentelemetry.io/otel/attribute"
|
|
"golang.org/x/net/icmp"
|
|
"golang.org/x/net/ipv4"
|
|
"golang.org/x/net/ipv6"
|
|
|
|
"github.com/cloudflare/cloudflared/packet"
|
|
"github.com/cloudflare/cloudflared/tracing"
|
|
)
|
|
|
|
const (
|
|
// Value defined in https://docs.microsoft.com/en-us/windows/win32/api/winsock2/nf-winsock2-wsasocketw
|
|
AF_INET6 = 23
|
|
icmpEchoReplyCode = 0
|
|
nullParameter = uintptr(0)
|
|
)
|
|
|
|
var (
|
|
Iphlpapi = syscall.NewLazyDLL("Iphlpapi.dll")
|
|
IcmpCreateFile_proc = Iphlpapi.NewProc("IcmpCreateFile")
|
|
Icmp6CreateFile_proc = Iphlpapi.NewProc("Icmp6CreateFile")
|
|
IcmpSendEcho_proc = Iphlpapi.NewProc("IcmpSendEcho")
|
|
Icmp6SendEcho_proc = Iphlpapi.NewProc("Icmp6SendEcho2")
|
|
echoReplySize = unsafe.Sizeof(echoReply{})
|
|
echoV6ReplySize = unsafe.Sizeof(echoV6Reply{})
|
|
icmpv6ErrMessageSize = 8
|
|
ioStatusBlockSize = unsafe.Sizeof(ioStatusBlock{})
|
|
endian = binary.LittleEndian
|
|
)
|
|
|
|
// IP_STATUS code, see https://docs.microsoft.com/en-us/windows/win32/api/ipexport/ns-ipexport-icmp_echo_reply32#members
|
|
// for possible values
|
|
type ipStatus uint32
|
|
|
|
const (
|
|
success ipStatus = 0
|
|
bufTooSmall = iota + 11000
|
|
destNetUnreachable
|
|
destHostUnreachable
|
|
destProtocolUnreachable
|
|
destPortUnreachable
|
|
noResources
|
|
badOption
|
|
hwError
|
|
packetTooBig
|
|
reqTimedOut
|
|
badReq
|
|
badRoute
|
|
ttlExpiredTransit
|
|
ttlExpiredReassembly
|
|
paramProblem
|
|
sourceQuench
|
|
optionTooBig
|
|
badDestination
|
|
// Can be returned for malformed ICMP packets
|
|
generalFailure = 11050
|
|
)
|
|
|
|
// Additional IP_STATUS codes for ICMPv6 https://docs.microsoft.com/en-us/windows/win32/api/ipexport/ns-ipexport-icmpv6_echo_reply_lh#members
|
|
const (
|
|
ipv6DestUnreachable ipStatus = iota + 11040
|
|
ipv6TimeExceeded
|
|
ipv6BadHeader
|
|
ipv6UnrecognizedNextHeader
|
|
ipv6ICMPError
|
|
ipv6DestScopeMismatch
|
|
)
|
|
|
|
func (is ipStatus) String() string {
|
|
switch is {
|
|
case success:
|
|
return "Success"
|
|
case bufTooSmall:
|
|
return "The reply buffer too small"
|
|
case destNetUnreachable:
|
|
return "The destination network was unreachable"
|
|
case destHostUnreachable:
|
|
return "The destination host was unreachable"
|
|
case destProtocolUnreachable:
|
|
return "The destination protocol was unreachable"
|
|
case destPortUnreachable:
|
|
return "The destination port was unreachable"
|
|
case noResources:
|
|
return "Insufficient IP resources were available"
|
|
case badOption:
|
|
return "A bad IP option was specified"
|
|
case hwError:
|
|
return "A hardware error occurred"
|
|
case packetTooBig:
|
|
return "The packet was too big"
|
|
case reqTimedOut:
|
|
return "The request timed out"
|
|
case badReq:
|
|
return "Bad request"
|
|
case badRoute:
|
|
return "Bad route"
|
|
case ttlExpiredTransit:
|
|
return "The TTL expired in transit"
|
|
case ttlExpiredReassembly:
|
|
return "The TTL expired during fragment reassembly"
|
|
case paramProblem:
|
|
return "A parameter problem"
|
|
case sourceQuench:
|
|
return "Datagrams are arriving too fast to be processed and datagrams may have been discarded"
|
|
case optionTooBig:
|
|
return "The IP option was too big"
|
|
case badDestination:
|
|
return "Bad destination"
|
|
case ipv6DestUnreachable:
|
|
return "IPv6 destination unreachable"
|
|
case ipv6TimeExceeded:
|
|
return "IPv6 time exceeded"
|
|
case ipv6BadHeader:
|
|
return "IPv6 bad IP header"
|
|
case ipv6UnrecognizedNextHeader:
|
|
return "IPv6 unrecognized next header"
|
|
case ipv6ICMPError:
|
|
return "IPv6 ICMP error"
|
|
case ipv6DestScopeMismatch:
|
|
return "IPv6 destination scope ID mismatch"
|
|
case generalFailure:
|
|
return "The ICMP packet might be malformed"
|
|
default:
|
|
return fmt.Sprintf("Unknown ip status %d", is)
|
|
}
|
|
}
|
|
|
|
// https://docs.microsoft.com/en-us/windows/win32/api/ipexport/ns-ipexport-ip_option_information
|
|
type ipOption struct {
|
|
TTL uint8
|
|
Tos uint8
|
|
Flags uint8
|
|
OptionsSize uint8
|
|
OptionsData uintptr
|
|
}
|
|
|
|
// https://docs.microsoft.com/en-us/windows/win32/api/ipexport/ns-ipexport-icmp_echo_reply
|
|
type echoReply struct {
|
|
Address uint32
|
|
Status ipStatus
|
|
RoundTripTime uint32
|
|
DataSize uint16
|
|
Reserved uint16
|
|
// The pointer size defers between 32-bit and 64-bit platforms
|
|
DataPointer *byte
|
|
Options ipOption
|
|
}
|
|
|
|
type echoV6Reply struct {
|
|
Address ipv6AddrEx
|
|
Status ipStatus
|
|
RoundTripTime uint32
|
|
}
|
|
|
|
// https://docs.microsoft.com/en-us/windows/win32/api/ipexport/ns-ipexport-ipv6_address_ex
|
|
// All the fields are in network byte order. The memory alignment is 4 bytes
|
|
type ipv6AddrEx struct {
|
|
port uint16
|
|
// flowInfo is uint32. Because of field alignment, when we cast reply buffer to ipv6AddrEx, it starts at the 5th byte
|
|
// But looking at the raw bytes, flowInfo starts at the 3rd byte. We device flowInfo into 2 uint16 so it's aligned
|
|
flowInfoUpper uint16
|
|
flowInfoLower uint16
|
|
addr [8]uint16
|
|
scopeID uint32
|
|
}
|
|
|
|
// https://docs.microsoft.com/en-us/windows/win32/winsock/sockaddr-2
|
|
type sockAddrIn6 struct {
|
|
family int16
|
|
// Can't embed ipv6AddrEx, that changes the memory alignment
|
|
port uint16
|
|
flowInfo uint32
|
|
addr [16]byte
|
|
scopeID uint32
|
|
}
|
|
|
|
func newSockAddrIn6(addr netip.Addr) (*sockAddrIn6, error) {
|
|
if !addr.Is6() {
|
|
return nil, fmt.Errorf("%s is not IPv6", addr)
|
|
}
|
|
return &sockAddrIn6{
|
|
family: AF_INET6,
|
|
port: 10,
|
|
addr: addr.As16(),
|
|
}, nil
|
|
}
|
|
|
|
// https://docs.microsoft.com/en-us/windows-hardware/drivers/ddi/wdm/ns-wdm-_io_status_block#syntax
|
|
type ioStatusBlock struct {
|
|
// The first field is an union of NTSTATUS and PVOID. NTSTATUS is int32 while PVOID depends on the platform.
|
|
// We model it as uintptr whose size depends on if the platform is 32-bit or 64-bit
|
|
// https://docs.microsoft.com/en-us/openspecs/windows_protocols/ms-erref/596a1078-e883-4972-9bbc-49e60bebca55
|
|
statusOrPointer uintptr
|
|
information uintptr
|
|
}
|
|
|
|
type icmpProxy struct {
|
|
// An open handle that can send ICMP requests https://docs.microsoft.com/en-us/windows/win32/api/icmpapi/nf-icmpapi-icmpcreatefile
|
|
handle uintptr
|
|
// This is a ICMPv6 if srcSocketAddr is not nil
|
|
srcSocketAddr *sockAddrIn6
|
|
logger *zerolog.Logger
|
|
}
|
|
|
|
func newICMPProxy(listenIP netip.Addr, logger *zerolog.Logger, idleTimeout time.Duration) (*icmpProxy, error) {
|
|
var (
|
|
srcSocketAddr *sockAddrIn6
|
|
handle uintptr
|
|
err error
|
|
)
|
|
if listenIP.Is4() {
|
|
handle, _, err = IcmpCreateFile_proc.Call()
|
|
} else {
|
|
srcSocketAddr, err = newSockAddrIn6(listenIP)
|
|
if err != nil {
|
|
return nil, err
|
|
}
|
|
handle, _, err = Icmp6CreateFile_proc.Call()
|
|
}
|
|
// Windows procedure calls always return non-nil error constructed from the result of GetLastError.
|
|
// Caller need to inspect the primary returned value
|
|
if syscall.Handle(handle) == syscall.InvalidHandle {
|
|
return nil, errors.Wrap(err, "invalid ICMP handle")
|
|
}
|
|
return &icmpProxy{
|
|
handle: handle,
|
|
srcSocketAddr: srcSocketAddr,
|
|
logger: logger,
|
|
}, nil
|
|
}
|
|
|
|
func (ip *icmpProxy) Serve(ctx context.Context) error {
|
|
<-ctx.Done()
|
|
syscall.CloseHandle(syscall.Handle(ip.handle))
|
|
return ctx.Err()
|
|
}
|
|
|
|
// Request sends an ICMP echo request and wait for a reply or timeout.
|
|
// The async version of Win32 APIs take a callback whose memory is not garbage collected, so we use the synchronous version.
|
|
// It's possible that a slow request will block other requests, so we set the timeout to only 1s.
|
|
func (ip *icmpProxy) Request(ctx context.Context, pk *packet.ICMP, responder ICMPResponder) error {
|
|
defer func() {
|
|
if r := recover(); r != nil {
|
|
ip.logger.Error().Interface("error", r).Msgf("Recover panic from sending icmp request/response, error %s", debug.Stack())
|
|
}
|
|
}()
|
|
|
|
_, requestSpan := responder.RequestSpan(ctx, pk)
|
|
defer responder.ExportSpan()
|
|
|
|
echo, err := getICMPEcho(pk.Message)
|
|
if err != nil {
|
|
return err
|
|
}
|
|
observeICMPRequest(ip.logger, requestSpan, pk.Src.String(), pk.Dst.String(), echo.ID, echo.Seq)
|
|
|
|
resp, err := ip.icmpEchoRoundtrip(pk.Dst, echo)
|
|
if err != nil {
|
|
ip.logger.Err(err).Msg("ICMP echo roundtrip failed")
|
|
tracing.EndWithErrorStatus(requestSpan, err)
|
|
return err
|
|
}
|
|
tracing.End(requestSpan)
|
|
responder.ExportSpan()
|
|
|
|
_, replySpan := responder.ReplySpan(ctx, ip.logger)
|
|
err = ip.handleEchoReply(pk, echo, resp, responder)
|
|
if err != nil {
|
|
ip.logger.Err(err).Msg("Failed to send ICMP reply")
|
|
tracing.EndWithErrorStatus(replySpan, err)
|
|
return errors.Wrap(err, "failed to handle ICMP echo reply")
|
|
}
|
|
observeICMPReply(ip.logger, replySpan, pk.Dst.String(), echo.ID, echo.Seq)
|
|
replySpan.SetAttributes(
|
|
attribute.Int64("rtt", int64(resp.rtt())),
|
|
attribute.String("status", resp.status().String()),
|
|
)
|
|
tracing.End(replySpan)
|
|
return nil
|
|
}
|
|
|
|
func (ip *icmpProxy) handleEchoReply(request *packet.ICMP, echoReq *icmp.Echo, resp echoResp, responder ICMPResponder) error {
|
|
var replyType icmp.Type
|
|
if request.Dst.Is4() {
|
|
replyType = ipv4.ICMPTypeEchoReply
|
|
} else {
|
|
replyType = ipv6.ICMPTypeEchoReply
|
|
}
|
|
|
|
pk := packet.ICMP{
|
|
IP: &packet.IP{
|
|
Src: request.Dst,
|
|
Dst: request.Src,
|
|
Protocol: layers.IPProtocol(request.Type.Protocol()),
|
|
TTL: packet.DefaultTTL,
|
|
},
|
|
Message: &icmp.Message{
|
|
Type: replyType,
|
|
Code: icmpEchoReplyCode,
|
|
Body: &icmp.Echo{
|
|
ID: echoReq.ID,
|
|
Seq: echoReq.Seq,
|
|
Data: resp.payload(),
|
|
},
|
|
},
|
|
}
|
|
return responder.ReturnPacket(&pk)
|
|
}
|
|
|
|
func (ip *icmpProxy) icmpEchoRoundtrip(dst netip.Addr, echo *icmp.Echo) (echoResp, error) {
|
|
if dst.Is6() {
|
|
if ip.srcSocketAddr == nil {
|
|
return nil, fmt.Errorf("cannot send ICMPv6 using ICMPv4 proxy")
|
|
}
|
|
resp, err := ip.icmp6SendEcho(dst, echo)
|
|
if err != nil {
|
|
|
|
return nil, errors.Wrap(err, "failed to send/receive ICMPv6 echo")
|
|
}
|
|
return resp, nil
|
|
}
|
|
if ip.srcSocketAddr != nil {
|
|
return nil, fmt.Errorf("cannot send ICMPv4 using ICMPv6 proxy")
|
|
}
|
|
resp, err := ip.icmpSendEcho(dst, echo)
|
|
if err != nil {
|
|
return nil, errors.Wrap(err, "failed to send/receive ICMPv4 echo")
|
|
}
|
|
return resp, nil
|
|
}
|
|
|
|
/*
|
|
Wrapper to call https://docs.microsoft.com/en-us/windows/win32/api/icmpapi/nf-icmpapi-icmpsendecho
|
|
Parameters:
|
|
- IcmpHandle: Handle created by IcmpCreateFile
|
|
- DestinationAddress: IPv4 in the form of https://docs.microsoft.com/en-us/windows/win32/api/inaddr/ns-inaddr-in_addr#syntax
|
|
- RequestData: A pointer to echo data
|
|
- RequestSize: Number of bytes in buffer pointed by echo data
|
|
- RequestOptions: IP header options
|
|
- ReplyBuffer: A pointer to the buffer for echoReply, options and data
|
|
- ReplySize: Number of bytes allocated for ReplyBuffer
|
|
- Timeout: Timeout in milliseconds to wait for a reply
|
|
Returns:
|
|
- the number of replies in uint32 https://docs.microsoft.com/en-us/windows/win32/api/icmpapi/nf-icmpapi-icmpsendecho#return-value
|
|
To retain the reference allocated objects, conversion from pointer to uintptr must happen as arguments to the
|
|
syscall function
|
|
*/
|
|
func (ip *icmpProxy) icmpSendEcho(dst netip.Addr, echo *icmp.Echo) (*echoV4Resp, error) {
|
|
dataSize := len(echo.Data)
|
|
replySize := echoReplySize + uintptr(dataSize)
|
|
replyBuf := make([]byte, replySize)
|
|
noIPHeaderOption := nullParameter
|
|
inAddr, err := inAddrV4(dst)
|
|
if err != nil {
|
|
return nil, err
|
|
}
|
|
replyCount, _, err := IcmpSendEcho_proc.Call(
|
|
ip.handle,
|
|
uintptr(inAddr),
|
|
uintptr(unsafe.Pointer(&echo.Data[0])),
|
|
uintptr(dataSize),
|
|
noIPHeaderOption,
|
|
uintptr(unsafe.Pointer(&replyBuf[0])),
|
|
replySize,
|
|
icmpRequestTimeoutMs,
|
|
)
|
|
if replyCount == 0 {
|
|
// status is returned in 5th to 8th byte of reply buffer
|
|
if status, parseErr := unmarshalIPStatus(replyBuf[4:8]); parseErr == nil && status != success {
|
|
return nil, errors.Wrapf(err, "received ip status: %s", status)
|
|
}
|
|
return nil, errors.Wrap(err, "did not receive ICMP echo reply")
|
|
} else if replyCount > 1 {
|
|
ip.logger.Warn().Msgf("Received %d ICMP echo replies, only sending 1 back", replyCount)
|
|
}
|
|
return newEchoV4Resp(replyBuf)
|
|
}
|
|
|
|
// Third definition of https://docs.microsoft.com/en-us/windows/win32/api/inaddr/ns-inaddr-in_addr#syntax is address in uint32
|
|
func inAddrV4(ip netip.Addr) (uint32, error) {
|
|
if !ip.Is4() {
|
|
return 0, fmt.Errorf("%s is not IPv4", ip)
|
|
}
|
|
v4 := ip.As4()
|
|
return endian.Uint32(v4[:]), nil
|
|
}
|
|
|
|
type echoResp interface {
|
|
status() ipStatus
|
|
rtt() uint32
|
|
payload() []byte
|
|
}
|
|
|
|
type echoV4Resp struct {
|
|
reply *echoReply
|
|
data []byte
|
|
}
|
|
|
|
func (r *echoV4Resp) status() ipStatus {
|
|
return r.reply.Status
|
|
}
|
|
|
|
func (r *echoV4Resp) rtt() uint32 {
|
|
return r.reply.RoundTripTime
|
|
}
|
|
|
|
func (r *echoV4Resp) payload() []byte {
|
|
return r.data
|
|
}
|
|
|
|
func newEchoV4Resp(replyBuf []byte) (*echoV4Resp, error) {
|
|
if len(replyBuf) == 0 {
|
|
return nil, fmt.Errorf("reply buffer is empty")
|
|
}
|
|
// This is pattern 1 of https://pkg.go.dev/unsafe@master#Pointer, conversion of *replyBuf to *echoReply
|
|
// replyBuf size is larger than echoReply
|
|
reply := *(*echoReply)(unsafe.Pointer(&replyBuf[0]))
|
|
if reply.Status != success {
|
|
return nil, fmt.Errorf("status %d", reply.Status)
|
|
}
|
|
dataBufStart := len(replyBuf) - int(reply.DataSize)
|
|
if dataBufStart < int(echoReplySize) {
|
|
return nil, fmt.Errorf("reply buffer size %d is too small to hold data of size %d", len(replyBuf), int(reply.DataSize))
|
|
}
|
|
return &echoV4Resp{
|
|
reply: &reply,
|
|
data: replyBuf[dataBufStart:],
|
|
}, nil
|
|
}
|
|
|
|
/*
|
|
Wrapper to call https://docs.microsoft.com/en-us/windows/win32/api/icmpapi/nf-icmpapi-icmp6sendecho2
|
|
Parameters:
|
|
- IcmpHandle: Handle created by Icmp6CreateFile
|
|
- Event (optional): Event object to be signaled when a reply arrives
|
|
- ApcRoutine (optional): Routine to call when the calling thread is in an alertable thread and a reply arrives
|
|
- ApcContext (optional): Optional parameter to ApcRoutine
|
|
- SourceAddress: Source address of the request
|
|
- DestinationAddress: Destination address of the request
|
|
- RequestData: A pointer to echo data
|
|
- RequestSize: Number of bytes in buffer pointed by echo data
|
|
- RequestOptions (optional): A pointer to the IPv6 header options
|
|
- ReplyBuffer: A pointer to the buffer for echoReply, options and data
|
|
- ReplySize: Number of bytes allocated for ReplyBuffer
|
|
- Timeout: Timeout in milliseconds to wait for a reply
|
|
Returns:
|
|
- the number of replies in uint32
|
|
To retain the reference allocated objects, conversion from pointer to uintptr must happen as arguments to the
|
|
syscall function
|
|
*/
|
|
|
|
func (ip *icmpProxy) icmp6SendEcho(dst netip.Addr, echo *icmp.Echo) (*echoV6Resp, error) {
|
|
dstAddr, err := newSockAddrIn6(dst)
|
|
if err != nil {
|
|
return nil, err
|
|
}
|
|
dataSize := len(echo.Data)
|
|
// Reply buffer needs to be big enough to hold an echoV6Reply, echo data, 8 bytes for ICMP error message
|
|
// and ioStatusBlock
|
|
replySize := echoV6ReplySize + uintptr(dataSize) + uintptr(icmpv6ErrMessageSize) + ioStatusBlockSize
|
|
replyBuf := make([]byte, replySize)
|
|
noEvent := nullParameter
|
|
noApcRoutine := nullParameter
|
|
noAppCtx := nullParameter
|
|
noIPHeaderOption := nullParameter
|
|
replyCount, _, err := Icmp6SendEcho_proc.Call(
|
|
ip.handle,
|
|
noEvent,
|
|
noApcRoutine,
|
|
noAppCtx,
|
|
uintptr(unsafe.Pointer(ip.srcSocketAddr)),
|
|
uintptr(unsafe.Pointer(dstAddr)),
|
|
uintptr(unsafe.Pointer(&echo.Data[0])),
|
|
uintptr(dataSize),
|
|
noIPHeaderOption,
|
|
uintptr(unsafe.Pointer(&replyBuf[0])),
|
|
replySize,
|
|
icmpRequestTimeoutMs,
|
|
)
|
|
if replyCount == 0 {
|
|
// status is in the 4 bytes after ipv6AddrEx. The reply buffer size is at least size of ipv6AddrEx + 4
|
|
if status, parseErr := unmarshalIPStatus(replyBuf[unsafe.Sizeof(ipv6AddrEx{}) : unsafe.Sizeof(ipv6AddrEx{})+4]); parseErr == nil && status != success {
|
|
return nil, fmt.Errorf("received ip status: %s", status)
|
|
}
|
|
return nil, errors.Wrap(err, "did not receive ICMP echo reply")
|
|
} else if replyCount > 1 {
|
|
ip.logger.Warn().Msgf("Received %d ICMP echo replies, only sending 1 back", replyCount)
|
|
}
|
|
return newEchoV6Resp(replyBuf, dataSize)
|
|
}
|
|
|
|
type echoV6Resp struct {
|
|
reply *echoV6Reply
|
|
data []byte
|
|
}
|
|
|
|
func (r *echoV6Resp) status() ipStatus {
|
|
return r.reply.Status
|
|
}
|
|
|
|
func (r *echoV6Resp) rtt() uint32 {
|
|
return r.reply.RoundTripTime
|
|
}
|
|
|
|
func (r *echoV6Resp) payload() []byte {
|
|
return r.data
|
|
}
|
|
|
|
func newEchoV6Resp(replyBuf []byte, dataSize int) (*echoV6Resp, error) {
|
|
if len(replyBuf) == 0 {
|
|
return nil, fmt.Errorf("reply buffer is empty")
|
|
}
|
|
reply := *(*echoV6Reply)(unsafe.Pointer(&replyBuf[0]))
|
|
if reply.Status != success {
|
|
return nil, fmt.Errorf("status %d", reply.Status)
|
|
}
|
|
if uintptr(len(replyBuf)) < unsafe.Sizeof(reply)+uintptr(dataSize) {
|
|
return nil, fmt.Errorf("reply buffer size %d is too small to hold reply size %d + data size %d", len(replyBuf), echoV6ReplySize, dataSize)
|
|
}
|
|
return &echoV6Resp{
|
|
reply: &reply,
|
|
data: replyBuf[echoV6ReplySize : echoV6ReplySize+uintptr(dataSize)],
|
|
}, nil
|
|
}
|
|
|
|
func unmarshalIPStatus(replyBuf []byte) (ipStatus, error) {
|
|
if len(replyBuf) != 4 {
|
|
return 0, fmt.Errorf("ipStatus needs to be 4 bytes, got %d", len(replyBuf))
|
|
}
|
|
return ipStatus(endian.Uint32(replyBuf)), nil
|
|
}
|