blob: 4b0800dd73a2ab2a5760213dd9c77b2aaabc6a3e [file]
/*
* tcp.cpp - ip router
*
* Basilisk II (C) 1997-2008 Christian Bauer
*
* Windows platform specific code copyright (C) Lauri Pesonen
*
* This program is free software; you can redistribute it and/or modify
* it under the terms of the GNU General Public License as published by
* the Free Software Foundation; either version 2 of the License, or
* (at your option) any later version.
*
* This program is distributed in the hope that it will be useful,
* but WITHOUT ANY WARRANTY; without even the implied warranty of
* MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
* GNU General Public License for more details.
*
* You should have received a copy of the GNU General Public License
* along with this program; if not, write to the Free Software
* Foundation, Inc., 59 Temple Place, Suite 330, Boston, MA 02111-1307 USA
*/
/*
* Features implemented:
* state machine, flow control, sequence numbers, RST/SYN/FIN/ACK/PSH
*
* Features not implemented:
* oob data, urgent pointer, window sliding, some options
* "Half-Nagle" implementation is a bit weird (mac-router interface; winsock has it on by default)
*
*
* All possible tcp state machine transitions:
*
* CLOSED -> LISTEN passive open
* CLOSED -> SYN_SENT active open SYN->
*
* LISTEN -> SYN_SENT send data SYN->
* LISTEN -> SYN_RCVD ->SYN SYN+ACK->
*
* SYN_SENT -> SYN_RCVD ->SYN SYN+ACK->
* SYN_SENT -> ESTABLISHED ->SYN+ACK ACK->
* SYN_SENT -> CLOSED close/timeout
*
* SYN_RCVD -> CLOSED timeout RST->
* SYN_RCVD -> LISTEN ->RST
* SYN_RCVD -> ESTABLISHED ->ACK
* SYN_RCVD -> FINWAIT_1 close FIN->
*
* ESTABLISHED -> FINWAIT_1 close FIN->
* ESTABLISHED -> CLOSE_WAIT ->FIN ACK->
*
* CLOSE_WAIT -> LAST_ACK close FIN->
*
* LAST_ACK -> CLOSED ->ACK
*
* FINWAIT_1 -> CLOSING ->FIN ACK->
* FINWAIT_1 -> FINWAIT_2 ->ACK
* FINWAIT_1 -> TIME_WAIT ->FIN+ACK ACK->
*
* FINWAIT_2 -> TIME_WAIT ->FIN ACK->
*
* CLOSING -> TIME_WAIT ->ACK
*
* TIME_WAIT -> CLOSED timeout (2*msl)
*
*/
#include "sysdeps.h"
#include "main.h"
#include <process.h>
#include "cpu_emulation.h"
#include "ws2tcpip.h"
#include "ether_windows.h"
#include "ether.h"
#include "prefs.h"
#include "router.h"
#include "router_types.h"
#include "dynsockets.h"
#include "iphelp.h"
#include "tcp.h"
#include "dump.h"
#include "mib/interfaces.h"
#include "ftp.h"
#if DEBUG
#pragma optimize("",off)
#endif
#include "debug.h"
// If you need more, use multiple threads.
#define MAX_SOCKETS MAXIMUM_WAIT_OBJECTS
// If true, always sends the PSH tcp flag with data.
// Otherwise only when a full buffer was received.
#define PUSH_ALWAYS 0
// In milliseconds. A TCP implementation should implement
// this dynamically, adapting the timeout value to match to the
// averaged packet round-trip time.
#define RESEND_TIMEOUT 750
// Just time out incoming connections after 5 secs if Mac has no time to reply
// No backlogs.
#define SYN_FLOOD_PROTECTION_TIMEOUT 5000
const int MAX_SEGMENT_SIZE = 1460;
// Shorthands
#define ISSET(f,x) ( ((f) & (x)) != 0 )
#define ISCLEAR(f,x) ( ((f) & (x)) == 0 )
// Local aliases
#define URG tcp_flags_URG
#define ACK tcp_flags_ACK
#define PSH tcp_flags_PSH
#define RST tcp_flags_RST
#define SYN tcp_flags_SYN
#define FIN tcp_flags_FIN
// Local aliases
#define CLOSED tcp_state_closed
#define LISTEN tcp_state_listen
#define SYN_SENT tcp_state_syn_sent
#define SYN_RCVD tcp_state_syn_rcvd
#define ESTABLISHED tcp_state_established
#define CLOSE_WAIT tcp_state_close_wait
#define LAST_ACK tcp_state_last_ack
#define FINWAIT_1 tcp_state_finwait_1
#define FINWAIT_2 tcp_state_finwait_2
#define CLOSING tcp_state_closing
#define TIME_WAIT tcp_state_time_wait
// For debugging only
static const char *_tcp_state_name[] = {
"CLOSED",
"LISTEN",
"SYN_SENT",
"SYN_RCVD",
"ESTABLISHED",
"CLOSE_WAIT",
"LAST_ACK",
"FINWAIT_1",
"FINWAIT_2",
"CLOSING",
"TIME_WAIT"
};
#define STATENAME(i) _tcp_state_name[i]
static CRITICAL_SECTION tcp_section;
typedef struct {
SOCKET s;
int state;
uint32 ip_src; // "source" is the mac, dest is the remote host,
uint32 ip_dest; // no matter who opened the connection.
uint16 src_port; // all in host byte order.
uint16 dest_port;
struct sockaddr_in from; // remote host address, network byte order.
int from_len;
// note: no true windows sliding, only one buffer.
WSABUF buffers_read[1]; // data from remote host to Mac
DWORD buffer_count_read;
DWORD bytes_received;
DWORD flags_read;
WSAOVERLAPPED overlapped_read;
WSABUF buffers_write[1]; // data from Mac to remote host
DWORD buffer_count_write;
DWORD bytes_written;
DWORD flags_write;
WSAOVERLAPPED overlapped_write;
bool remote_closed; // remote will not send any more data
bool accept_more_data_from_mac; // are we ready to accept more data from mac
uint32 seq_in; // will ack this mac sequence number
uint32 seq_out; // next sequence number to mac (unless a resend is needed)
uint32 mac_ack; // mac has acked this byte count. can be used to determined when to send some more data
uint32 bytes_to_send; // total send block size
uint32 bytes_remaining_to_send; // unsent byte count
uint16 mac_window; // mac tcp receive window, slides according to the window principle
uint16 our_window; // not really used
uint16 mac_mss; // maximum segment size that mac reported at SYN handshaking
// resend info
uint32 last_seq_out; // remember last packet seq number if a resend is needed
uint32 resend_timeout; // currently set t0 0.75 secs but not updated
uint32 stream_to_mac_stalled_until; // tick count indicating resend time
DWORD time_wait; // do a graceful close after MSL*2
DWORD msl;
int child;
WSAEVENT ev; // used to signal remote-initiated close and host-initiated connect.
bool in_use;
} tcp_socket_t;
static tcp_socket_t sockets[MAX_SOCKETS];
typedef struct {
SOCKET s;
uint16 port;
uint32 ip;
uint32 iface;
bool once;
int parent;
WSAEVENT ev;
} tcp_listening_socket_t;
static tcp_listening_socket_t l_sockets[MAX_SOCKETS];
static void CALLBACK tcp_read_completion(
DWORD error,
DWORD bytes_read,
LPWSAOVERLAPPED lpOverlapped,
DWORD flags
);
static void CALLBACK tcp_write_completion(
DWORD error,
DWORD bytes_read,
LPWSAOVERLAPPED lpOverlapped,
DWORD flags
);
// socket utilities assume that the critical section has already been entered.
static void free_socket( const int t )
{
_WSAResetEvent( sockets[t].ev );
if(sockets[t].s != INVALID_SOCKET) {
_closesocket( sockets[t].s );
sockets[t].s = INVALID_SOCKET;
}
sockets[t].state = CLOSED;
sockets[t].stream_to_mac_stalled_until = 0;
sockets[t].in_use = false;
sockets[t].time_wait = 0;
// if there was an attached listening socket (ftp), close it.
int lst = sockets[t].child;
if( lst >= 0 ) {
if(l_sockets[lst].s != INVALID_SOCKET) {
D(bug(" closing listening socket %d\r\n", lst));
_closesocket( l_sockets[lst].s );
l_sockets[lst].s = INVALID_SOCKET;
}
l_sockets[lst].port = 0;
l_sockets[lst].parent = -1;
}
sockets[t].child = -1;
}
static int alloc_socket()
{
static int last_allocated_socket = -1;
int i = last_allocated_socket;
for( int j=0; j<MAX_SOCKETS; j++ ) {
if( ++i >= MAX_SOCKETS ) i = 0;
if( !sockets[i].in_use ) {
D(bug("<%d> Socket allocated\r\n", i));
last_allocated_socket = i;
sockets[i].in_use = true;
sockets[i].s = INVALID_SOCKET;
sockets[i].state = CLOSED;
sockets[i].remote_closed = false;
sockets[i].accept_more_data_from_mac = false;
sockets[i].ip_src = sockets[i].ip_dest = 0;
// sockets[i].src_port = sockets[i].dest_port = 0;
memset( &sockets[i].overlapped_read, 0, sizeof(sockets[i].overlapped_read) );
sockets[i].overlapped_read.hEvent = (HANDLE)i;
memset( &sockets[i].overlapped_write, 0, sizeof(sockets[i].overlapped_write) );
sockets[i].overlapped_write.hEvent = (HANDLE)i;
sockets[i].bytes_received = 0;
sockets[i].bytes_written = 0;
sockets[i].flags_read = 0;
sockets[i].flags_write = 0;
// sockets[i].from_len = sizeof(struct sockaddr_in);
// memset( &sockets[i].from, 0, sizeof(sockets[i].from) );
// sockets[i].from.sin_family = AF_INET;
sockets[i].buffer_count_read = 1;
sockets[i].buffers_read[0].len = MAX_SEGMENT_SIZE;
if(!sockets[i].buffers_read[0].buf) {
sockets[i].buffers_read[0].buf = new char [sockets[i].buffers_read[0].len];
}
sockets[i].buffer_count_write = 1;
sockets[i].buffers_write[0].len = MAX_SEGMENT_SIZE;
if(!sockets[i].buffers_write[0].buf) {
sockets[i].buffers_write[0].buf = new char [sockets[i].buffers_write[0].len];
}
sockets[i].mac_window = MAX_SEGMENT_SIZE; // updated for all mac datagrams
sockets[i].our_window = MAX_SEGMENT_SIZE; // should use about 8-16 kB, really
sockets[i].mac_mss = 0; // not known yet
sockets[i].time_wait = 0;
sockets[i].msl = 5000L; // The round-trip time can be hard to estimate.
sockets[i].seq_in = 0;
sockets[i].seq_out = 0x00000001;
sockets[i].mac_ack = 0;
sockets[i].stream_to_mac_stalled_until = 0;
sockets[i].resend_timeout = RESEND_TIMEOUT;
sockets[i].child = -1;
break;
}
}
if(i == MAX_SOCKETS) {
D(bug("Out of free sockets\r\n"));
i = -1;
}
return i;
}
static int alloc_new_socket( const uint16 src_port, const uint16 dest_port, const uint32 ip_dest )
{
int t = alloc_socket();
if(t >= 0) {
sockets[t].s = _socket( AF_INET, SOCK_STREAM, IPPROTO_TCP );
if(sockets[t].s == INVALID_SOCKET) {
free_socket( t );
t = -1;
} else {
sockets[t].src_port = src_port;
sockets[t].dest_port = dest_port;
sockets[t].from_len = sizeof(sockets[t].from);
memset( &sockets[t].from, 0, sockets[t].from_len );
sockets[t].from.sin_family = AF_INET;
sockets[t].from.sin_port = htons(dest_port);
sockets[t].from.sin_addr.s_addr = htonl(ip_dest);
struct sockaddr_in to;
memset( &to, 0, sizeof(to) );
to.sin_family = AF_INET;
if( _bind ( sockets[t].s, (const struct sockaddr *)&to, sizeof(to) ) == 0 ) {
D(bug("<%d> socket bound\r\n", t));
} else {
if( _WSAGetLastError() == WSAEINPROGRESS ) {
D(bug("<%d> bind: a blocking call is in progress.\r\n", t));
} else {
D(bug("<%d> bind failed with error code %d\r\n", t, _WSAGetLastError()));
}
free_socket( t );
t = -1;
}
}
}
return t;
}
static int get_socket_index( const uint16 src_port, const uint16 dest_port )
{
for( int i=0; i<MAX_SOCKETS; i++ ) {
if(sockets[i].in_use && sockets[i].src_port == src_port && sockets[i].dest_port == dest_port ) {
return i;
}
}
return -1;
}
static int get_socket_index( const uint16 src_port )
{
for( int i=0; i<MAX_SOCKETS; i++ ) {
if(sockets[i].in_use && sockets[i].src_port == src_port ) {
return i;
}
}
return -1;
}
static int find_socket( const uint16 src_port, const uint16 dest_port )
{
int i = get_socket_index( src_port, dest_port );
if( i < 0 ) {
i = get_socket_index( src_port );
if( i >= 0 ) {
if( sockets[i].s == INVALID_SOCKET ) {
D(bug("find_socket reusing slot %d...\r\n", i));
sockets[i].in_use = false;
} else {
D(bug("find_socket forcing close %d...\r\n", i));
free_socket( i );
}
i = -1;
}
}
D(bug("<%d> find_socket(%d,%d): %s\r\n", i, src_port, dest_port, i>=0 ? "found" : "not found"));
return i;
}
static int alloc_listen_socket( const uint16 port, const uint32 ip, const uint32 iface, const bool once )
{
static int last_allocated_socket = -1;
int i = last_allocated_socket;
for( int j=0; j<MAX_SOCKETS; j++ ) {
if( ++i >= MAX_SOCKETS ) i = 0;
if( l_sockets[i].port == 0 ) {
D(bug("[%d] Slot allocated for listening port %d\r\n", i, port));
l_sockets[i].port = port;
l_sockets[i].ip = ip;
l_sockets[i].iface = iface;
l_sockets[i].once = once;
l_sockets[i].parent = -1;
last_allocated_socket = i;
_WSAResetEvent( l_sockets[i].ev );
return i;
}
}
return -1;
}
static void tcp_start_listen( const int i )
{
if( l_sockets[i].port ) {
uint32 iface = l_sockets[i].iface;
D(bug("[%d] binding to interface 0x%08X\r\n", i, iface));
l_sockets[i].s = _socket( AF_INET, SOCK_STREAM, IPPROTO_TCP );
if(l_sockets[i].s != INVALID_SOCKET) {
struct sockaddr_in to;
memset( &to, 0, sizeof(to) );
to.sin_family = AF_INET;
to.sin_port = htons( l_sockets[i].port );
to.sin_addr.s_addr = htonl( iface );
if( _bind ( l_sockets[i].s, (const struct sockaddr *)&to, sizeof(to) ) == 0 )
{
D(bug("[%d] socket bound to port %d on interface 0x%08X\r\n", i, l_sockets[i].port, iface));
if( _listen( l_sockets[i].s, SOMAXCONN ) == SOCKET_ERROR ) {
D(bug("[%d] listen() failed with error code %d\r\n", i, _WSAGetLastError()));
} else {
D(bug("[%d] listening to port %d\r\n", i, l_sockets[i].port));
_WSAResetEvent( l_sockets[i].ev );
if( SOCKET_ERROR == _WSAEventSelect( l_sockets[i].s, l_sockets[i].ev, FD_ACCEPT ) ) {
D(bug("[%d] WSAEventSelect() failed with error code %d\r\n", i, _WSAGetLastError()));
}
}
} else {
D(bug("[%d] bind to port %d failed with error code %d\r\n", i, l_sockets[i].port, _WSAGetLastError()));
}
} else {
D(bug("[%d] could not create a socket for port %d, error = %d\r\n", i, l_sockets[i].port, _WSAGetLastError()));
}
}
}
static void set_ttl( const int t, const uint8 ttl )
{
int _ttl = ttl; // defensive programming, I know VCx
if(_setsockopt( sockets[t].s, IPPROTO_IP, IP_TTL, (const char *)&_ttl, sizeof(int) ) == SOCKET_ERROR ) {
D(bug("<%d> could not set ttl to %d, error=%d\r\n", t, ttl, _WSAGetLastError()));
} else {
D(bug("<%d> ttl set to %d.\r\n", t, ttl));
}
}
static void tcp_reply( const int flags, const int t )
{
int tcp_size = sizeof(tcp_t);
tcp_t *tcp = (tcp_t *)malloc( tcp_size );
if(tcp) {
memcpy( tcp->ip.mac.dest, ether_addr, 6 );
memcpy( tcp->ip.mac.src, router_mac_addr, 6 );
tcp->ip.mac.type = htons(mac_type_ip4);
tcp->ip.version = 4;
tcp->ip.header_len = 5;
tcp->ip.tos = 0;
tcp->ip.total_len = htons(tcp_size - sizeof(mac_t));
tcp->ip.ident = htons(next_ip_ident_number++);
tcp->ip.flags_n_frag_offset = 0;
tcp->ip.ttl = 128;
tcp->ip.proto = ip_proto_tcp;
tcp->ip.src = htonl(sockets[t].ip_dest);
tcp->ip.dest = htonl(sockets[t].ip_src);
make_ip4_checksum( (ip_t *)tcp );
D(bug("<%d> Reply: Seq=%d, Ack=%d\r\n", t, sockets[t].seq_out, sockets[t].seq_in));
tcp->src_port = htons(sockets[t].dest_port);
tcp->dest_port = htons(sockets[t].src_port);
tcp->seq = htonl(sockets[t].seq_out);
tcp->ack = htonl(sockets[t].seq_in);
tcp->header_len = (uint8)( 20 << 2 );
tcp->flags = flags;
tcp->window = htons( sockets[t].our_window );
tcp->urgent_ptr = 0;
make_tcp_checksum( tcp, tcp_size );
// dump_bytes( (uint8 *)tcp, tcp_size );
enqueue_packet( (uint8 *)tcp, tcp_size );
free(tcp);
}
}
static bool has_mac_read_space( const int t )
{
uint32 pending_bytes = sockets[t].seq_out - sockets[t].mac_ack;
uint32 mac_can_accept_bytes = sockets[t].mac_window - pending_bytes;
D(bug("<%d> mac_can_accept_bytes = %d\r\n", t, mac_can_accept_bytes));
// Modified Nagle, effectively disabling window sliding (which I don't support anyway):
return pending_bytes == 0;
// Use more of window bandwidth
// Enabling this would require that the buffers seq numbers are stored somewhere
// return mac_can_accept_bytes >= sockets[t].buffers_read[0].len;
}
static bool b_recfrom( const int t )
{
bool result;
if( !has_mac_read_space(t) ) {
D(bug("<%d> read stalled, mac cannot accept any more data\r\n", t));
sockets[t].stream_to_mac_stalled_until = GetTickCount() + sockets[t].resend_timeout;
return true;
}
int ret = _WSARecv(
sockets[t].s,
sockets[t].buffers_read,
sockets[t].buffer_count_read,
&sockets[t].bytes_received,
&sockets[t].flags_read,
&sockets[t].overlapped_read,
tcp_read_completion
);
if(ret == SOCKET_ERROR) {
int socket_error = _WSAGetLastError();
if(socket_error == WSA_IO_PENDING) {
D(bug("<%d> WSARecv() i/o pending\r\n", t));
result = true;
} else {
D(bug("<%d> WSARecv() returned error %d\r\n", t, socket_error));
result = false;
}
} else /*if(ret == 0) */ {
D(bug("<%d> WSARecv() ok\r\n", t));
// Completion routine call is already scheduled.
result = true;
}
return result;
}
static bool b_send( const int t )
{
int ret = _WSASend(
sockets[t].s,
sockets[t].buffers_write,
sockets[t].buffer_count_write,
&sockets[t].bytes_written,
sockets[t].flags_write,
&sockets[t].overlapped_write,
tcp_write_completion
);
bool result;
if(ret == SOCKET_ERROR) {
int socket_error = _WSAGetLastError();
if(socket_error == WSA_IO_PENDING) {
D(bug("<%d> WSASend() i/o pending\r\n", t));
result = true;
} else {
D(bug("<%d> WSASend() returned %d\r\n", t, socket_error));
result = false;
}
} else /*if(ret == 0) */ {
D(bug("<%d> WSASend() ok\r\n", t));
// Completion routine call is already scheduled.
result = true;
}
return result;
}
static void send_buffer( const int t, const bool resending )
{
if(resending) {
if(sockets[t].last_seq_out == 0) {
D(bug("<%d> resend failure\r\n", t ));
return;
}
sockets[t].seq_out = sockets[t].last_seq_out;
} else {
sockets[t].last_seq_out = sockets[t].seq_out;
}
D(bug("<%d> %s data to Mac: Seq=%d, Ack=%d\r\n", t, (resending ? "resending" : "sending"), sockets[t].seq_out, sockets[t].seq_in));
uint32 bytes_read = sockets[t].bytes_received;
if( sockets[t].mac_mss && bytes_read > sockets[t].mac_mss ) {
D(bug("<%d> impossible: %d bytes to send, Mac mss is only %d\r\n", t, sockets[t].mac_mss && bytes_read, sockets[t].mac_mss));
}
int tcp_size = sizeof(tcp_t) + bytes_read;
tcp_t *tcp = (tcp_t *)malloc( tcp_size );
if(tcp) {
// Build MAC
// memcpy( tcp->ip.mac.dest, sockets[t].mac_src, 6 );
memcpy( tcp->ip.mac.dest, ether_addr, 6 );
memcpy( tcp->ip.mac.src, router_mac_addr, 6 );
tcp->ip.mac.type = htons(mac_type_ip4);
// Build IP
tcp->ip.version = 4;
tcp->ip.header_len = 5;
tcp->ip.tos = 0;
tcp->ip.total_len = htons(sizeof(tcp_t) - sizeof(mac_t) + bytes_read); // no options
tcp->ip.ident = htons(next_ip_ident_number++);
tcp->ip.flags_n_frag_offset = 0;
tcp->ip.ttl = 128; // one hop actually!
tcp->ip.proto = ip_proto_tcp;
tcp->ip.src = htonl(sockets[t].ip_dest);
tcp->ip.dest = htonl(sockets[t].ip_src);
make_ip4_checksum( (ip_t *)tcp );
// Copy payload (used by tcp checksum)
memcpy( (char *)tcp + sizeof(tcp_t), sockets[t].buffers_read[0].buf, bytes_read );
// Build tcp
tcp->src_port = htons(sockets[t].dest_port);
tcp->dest_port = htons(sockets[t].src_port);
tcp->seq = htonl(sockets[t].seq_out);
tcp->ack = htonl(sockets[t].seq_in);
tcp->header_len = (uint8)( 20 << 2 );
#if PUSH_ALWAYS
tcp->flags = ACK|PSH;
#else
tcp->flags = (bytes_read == MAX_SEGMENT_SIZE) ? ACK : (ACK|PSH);
#endif
tcp->window = htons( sockets[t].our_window );
tcp->urgent_ptr = 0;
make_tcp_checksum( tcp, tcp_size );
sockets[t].seq_out += bytes_read;
// dump_bytes( (uint8 *)tcp, tcp_size );
enqueue_packet( (uint8 *)tcp, tcp_size );
free(tcp);
}
}
static void CALLBACK tcp_read_completion(
DWORD error,
DWORD bytes_read,
LPWSAOVERLAPPED lpOverlapped,
DWORD flags
)
{
EnterCriticalSection( &tcp_section );
const int t = (int)lpOverlapped->hEvent;
sockets[t].bytes_received = bytes_read;
D(bug("<%d> tcp_read_completion(error=%d, bytes_read=%d)\r\n", t, error, bytes_read));
D(bug("<%d> tcp_read_completion() start, old state = %s\r\n", t, STATENAME(sockets[t].state)));
if(!sockets[t].in_use) {
D(bug("<%d> ignoring canceled read\r\n", t));
} else {
if( error != 0 ) {
D(bug("<%d> resetting after read error\r\n", t));
tcp_reply( RST, t );
free_socket(t);
} else {
if(bytes_read == 0) {
_closesocket( sockets[t].s );
sockets[t].s = INVALID_SOCKET;
} else if( bytes_read > 0) {
send_buffer( t, false );
}
switch( sockets[t].state ) {
case SYN_RCVD:
if( bytes_read == 0 ) {
D(bug("<%d> Closing: SYN_RCVD -> FINWAIT_1\r\n", t));
tcp_reply( ACK|FIN, t );
sockets[t].seq_out++;
sockets[t].state = FINWAIT_1;
}
break;
case ESTABLISHED:
if( bytes_read == 0 ) {
D(bug("<%d> Closing: ESTABLISHED -> FINWAIT_1\r\n", t));
tcp_reply( ACK|FIN, t );
sockets[t].seq_out++;
sockets[t].state = FINWAIT_1;
}
break;
case LISTEN:
tcp_reply( SYN, t );
sockets[t].seq_out++;
sockets[t].state = SYN_SENT;
sockets[t].time_wait = GetTickCount() + SYN_FLOOD_PROTECTION_TIMEOUT;
D(bug("<%d> LISTEN -> SYN_SENT\r\n", t));
break;
case CLOSE_WAIT:
if( bytes_read == 0) {
tcp_reply( ACK|FIN, t );
sockets[t].seq_out++;
sockets[t].state = LAST_ACK;
D(bug("<%d> Closing: CLOSE_WAIT -> LAST_ACK\r\n", t));
if(sockets[t].remote_closed) {
// Just in case that mac gets out of sync.
_closesocket(sockets[t].s);
sockets[t].s = INVALID_SOCKET;
}
}
break;
default:
break;
}
if(!is_router_shutting_down && sockets[t].s != INVALID_SOCKET) {
if(sockets[t].state != LISTEN) {
b_recfrom(t);
}
}
}
}
LeaveCriticalSection( &tcp_section );
}
static void CALLBACK tcp_write_completion(
DWORD error,
DWORD bytes_written,
LPWSAOVERLAPPED lpOverlapped,
DWORD flags
)
{
EnterCriticalSection( &tcp_section );
const int t = (int)lpOverlapped->hEvent;
sockets[t].bytes_written = bytes_written;
sockets[t].bytes_remaining_to_send -= bytes_written;
D(bug("<%d> tcp_write_completion(error=%d, bytes_written=%d)\r\n", t, error, bytes_written));
if(!sockets[t].in_use) {
D(bug("<%d> ignoring canceled write\r\n", t));
} else {
if(is_router_shutting_down || sockets[t].s == INVALID_SOCKET) {
D(bug("<%d> is not alive for sending.\r\n", t));
} else {
if( sockets[t].bytes_remaining_to_send <= 0 ) {
D(bug("<%d> all data sent, accepting some more.\r\n", t));
sockets[t].seq_in += sockets[t].bytes_to_send;
sockets[t].bytes_to_send = sockets[t].bytes_remaining_to_send = 0; // superfluous
tcp_reply( ACK, t );
sockets[t].accept_more_data_from_mac = true;
} else {
D(bug("<%d> %d bytes (of %d total) remaining, sending.\r\n", t, sockets[t].bytes_remaining_to_send, sockets[t].bytes_to_send));
sockets[t].buffers_write[0].len = sockets[t].bytes_remaining_to_send;
char *p = sockets[t].buffers_write[0].buf;
memmove( p, &p[bytes_written], sockets[t].bytes_remaining_to_send );
if(!b_send(t)) {
} else {
}
}
}
}
LeaveCriticalSection( &tcp_section );
}
static void tcp_connect_callback( const int t )
{
D(bug("<%d> tcp_connect_callback() start, old state = %s\r\n", t, STATENAME(sockets[t].state)));
switch( sockets[t].state ) {
case LISTEN:
tcp_reply( SYN|ACK, t );
sockets[t].seq_out++;
sockets[t].state = SYN_RCVD;
D(bug("<%d> Connect: LISTEN -> SYN_RCVD\r\n", t));
break;
default:
break;
}
D(bug("<%d> tcp_connect_callback() end, new state = %s\r\n", t, STATENAME(sockets[t].state)));
}
static void tcp_accept_callback( const int lst )
{
D(bug("[%d] tcp_accept_callback()\r\n", lst));
struct sockaddr_in to;
memset( &to, 0, sizeof(to) );
to.sin_family = AF_INET;
int tolen = sizeof(to);
SOCKET s = _accept( l_sockets[lst].s, (struct sockaddr *)&to, &tolen );
if( s == INVALID_SOCKET ) {
D(bug("[%d] connection not accepted, error code %d\r\n", lst, _WSAGetLastError()));
} else {
_WSAEventSelect( s, 0, 0 );
uint16 src_port = l_sockets[lst].port;
uint16 dest_port = ntohs(to.sin_port);
uint32 ip_dest = ntohl(to.sin_addr.s_addr);
D(bug("[%d] connection accepted, local port:%d, remote %s:%d\r\n", lst, src_port, _inet_ntoa(to.sin_addr), dest_port));
if( l_sockets[lst].ip != 0 && l_sockets[lst].ip != ip_dest ) {
_closesocket( s );
D(bug("[%d] authorization failure. connection closed.\r\n", lst ));
} else {
int t = alloc_new_socket( src_port, dest_port, ip_dest );
if( t < 0 ) {
D(bug("<%d> out of slot space, connection dropped\r\n", t ));
free_socket(t);
} else {
sockets[t].s = s;
sockets[t].state = LISTEN;
sockets[t].src_port = src_port;
sockets[t].dest_port = dest_port;
sockets[t].ip_src = macos_ip_address;
sockets[t].ip_dest = ip_dest;
sockets[t].seq_out = 0x00000001;
sockets[t].seq_in = 0; // not known yet
sockets[t].mac_ack = sockets[t].seq_out; // zero out pending bytes
tcp_reply( SYN, t );
sockets[t].seq_out++;
sockets[t].state = SYN_SENT;
sockets[t].time_wait = GetTickCount() + SYN_FLOOD_PROTECTION_TIMEOUT;
D(bug("<%d> Connect: LISTEN -> SYN_SENT\r\n", t));
_WSAResetEvent( sockets[t].ev );
if( SOCKET_ERROR == _WSAEventSelect( sockets[t].s, sockets[t].ev, FD_CLOSE ) ) {
D(bug("<%d> WSAEventSelect() failed with error code %d\r\n", t, _WSAGetLastError()));
}
// No data from the remote host is needed until the connection is established.
// So don't initiate read yet.
}
}
}
}
/*
MSS is the only option I care about, and since I'm on ethernet
I already pretty much know everything needed.
AFAIK window scaling is not in effect unless both parties specify it,
and I'm not doing it.
*/
static void process_options( const int t, const uint8 *opt, int len, uint32 &mss )
{
mss = 0;
while( len > 0 ) {
switch( *opt ) {
case 0: // End of Option List
D(bug("<%d> End of Option List\r\n", t));
len = 0;
break;
case 1: // No-Operation
D(bug("<%d> No-Operation\r\n", t));
len--;
opt++;
break;
case 2: // Maximum Segment Size
{
mss = ntohs( *((uint16 *)&opt[2]) );
D(bug("<%d> Maximum Segment Size = %d\r\n", t, mss));
len -= 4;
opt += 4;
}
break;
case 3: // Window Scale
{
int wscale = opt[2];
D(bug("<%d> Window Scale = %d\r\n", t, (int)wscale));
len -= 3;
opt += 3;
}
break;
case 4: // Sack-Permitted
D(bug("<%d> Sack-Permitted option is set\r\n", t));
len -= 2;
opt += 2;
break;
case 5: // Sack
{
int sack_len = opt[1];
int hf = (sack_len-2) / 4;
D(bug("<%d> Sack, %d half-blocks\r\n", t, hf));
len -= sack_len;
opt += sack_len;
}
break;
case 8: // Time Stamps
{
int valve = ntohl( *((uint32 *)&opt[2]) );
int ereply = ntohl( *((uint32 *)&opt[6]) );
D(bug("<%d> Time Stamps, TS valve = 0x%X, TS echo reply = 0x%X\r\n", t, valve, ereply));
len -= 10;
opt += 10;
}
break;
default:
D(bug("<%d> Unknown tcp header option 0x%02x, breaking out\r\n", t, (int)*opt));
len = 0;
break;
}
}
}
void write_tcp( tcp_t *tcp, int len )
{
if(len < sizeof(tcp_t)) {
D(bug("<%d> Too small tcp packet(%d) on unknown slot, dropped\r\n", -1, len));
return;
}
uint16 src_port = ntohs(tcp->src_port);
uint16 dest_port = ntohs(tcp->dest_port);
BOOL ok = true;
BOOL handle_data = false;
BOOL initiate_read = false;
EnterCriticalSection( &tcp_section );
int t = find_socket( src_port, dest_port );
if(t < 0) {
t = alloc_new_socket( src_port, dest_port, ntohl(tcp->ip.dest) );
ok = t >= 0;
}
if(ok) {
D(bug("<%d> write_tcp %d bytes from port %d to port %d\r\n", t, len, src_port, dest_port));
} else {
D(bug("<%d> FAILED write_tcp %d bytes from port %d to port %d\r\n", t, len, src_port, dest_port));
}
if( ok && ISSET(tcp->flags,RST) ) {
D(bug("<%d> RST set, resetting socket\r\n", t));
if( sockets[t].s != INVALID_SOCKET ) {
D(bug("<%d> doing an extra shutdown (ie4)\r\n", t));
_shutdown( sockets[t].s, SD_BOTH );
}
free_socket( t );
ok = false;
}
if(ok) {
D(bug("<%d> State machine start = %s\r\n", t, STATENAME(sockets[t].state)));
// always update receive window
sockets[t].mac_window = ntohs(tcp->window);
int header_len = tcp->header_len >> 2;
int option_bytes = header_len - 20;
char *data = (char *)tcp + sizeof(tcp_t) + option_bytes;
int dlen = len - sizeof(tcp_t) - option_bytes;
if( !ISSET(tcp->flags,ACK) ) {
D(bug("<%d> ACK not set\r\n", t));
}
if( ISSET(tcp->flags,SYN) ) {
D(bug("<%d> SYN set\r\n", t));
// Note that some options are valid even if there is no SYN.
// I don't care about those however.
uint32 new_mss;
process_options( t, (uint8 *)data - option_bytes, option_bytes, new_mss );
if(new_mss) {
sockets[t].mac_mss = (int)new_mss;
if( new_mss < sockets[t].buffers_read[0].len ) {
sockets[t].buffers_read[0].len = new_mss;
}
D(bug("<%d> Max segment size set to %d\r\n", t, new_mss));
}
}
if( ISSET(tcp->flags,FIN) ) {
D(bug("<%d> FIN set\r\n", t));
}
// The sequence number Mac expects to see next time.
sockets[t].mac_ack = ntohl(tcp->ack);
D(bug("<%d> From Mac: Seq=%d, Ack=%d, window=%d, router Seq=%d\r\n", t, ntohl(tcp->seq), sockets[t].mac_ack, sockets[t].mac_window, sockets[t].seq_out));
if( sockets[t].stream_to_mac_stalled_until &&
sockets[t].mac_ack == sockets[t].seq_out &&
(sockets[t].state == ESTABLISHED || sockets[t].state == CLOSE_WAIT) )
{
if( has_mac_read_space(t) ) {
initiate_read = true;
sockets[t].stream_to_mac_stalled_until = 0;
D(bug("<%d> read resumed, mac can accept more data\r\n", t));
}
}
switch( sockets[t].state ) {
case CLOSED:
sockets[t].src_port = src_port;
sockets[t].dest_port = dest_port;
sockets[t].ip_src = ntohl(tcp->ip.src);
sockets[t].ip_dest = ntohl(tcp->ip.dest);
if( ISSET(tcp->flags,SYN) ) {
sockets[t].seq_out = 0x00000001;
sockets[t].seq_in = ntohl(tcp->seq) + 1;
_WSAResetEvent( sockets[t].ev );
if( SOCKET_ERROR == _WSAEventSelect( sockets[t].s, sockets[t].ev, FD_CONNECT | FD_CLOSE ) ) {
D(bug("<%d> WSAEventSelect() failed with error code %d\r\n", t, _WSAGetLastError()));
}
D(bug("<%d> connecting local port %d to remote %s:%d\r\n", t, src_port, _inet_ntoa(sockets[t].from.sin_addr), dest_port));
sockets[t].state = LISTEN;
if( _WSAConnect(
sockets[t].s,
(const struct sockaddr *)&sockets[t].from,
sockets[t].from_len,
NULL, NULL,
NULL, NULL
) == SOCKET_ERROR )
{
int connect_error = _WSAGetLastError();
if( connect_error == WSAEWOULDBLOCK ) {
D(bug("<%d> WSAConnect() i/o pending.\r\n", t));
} else {
D(bug("<%d> WSAConnect() failed with error %d.\r\n", t, connect_error));
}
} else {
D(bug("<%d> WSAConnect() ok.\r\n", t));
}
} else {
if( ISSET(tcp->flags,FIN) ) {
D(bug("<%d> No SYN but FIN on a closed socket.\r\n", t));
free_socket(t);
} else {
D(bug("<%d> No SYN on a closed socket. resetting.\r\n", t));
free_socket(t);
}
}
break;
case LISTEN:
// handled in connect callback
break;
case SYN_SENT:
if( ISSET(tcp->flags,SYN) && ISSET(tcp->flags,ACK) ) {
sockets[t].seq_in = ntohl(tcp->seq) + 1;
tcp_reply( ACK, t );
sockets[t].state = ESTABLISHED;
initiate_read = true;
sockets[t].accept_more_data_from_mac = true;
sockets[t].time_wait = 0;
} else if( ISSET(tcp->flags,SYN) ) {
sockets[t].seq_in = ntohl(tcp->seq) + 1;
tcp_reply( ACK|SYN, t );
sockets[t].seq_out++;
sockets[t].state = SYN_RCVD;
sockets[t].time_wait = 0;
} else if( ISSET(tcp->flags,ACK) ) {
// What was the bright idea here.
D(bug("<%d> State is SYN_SENT, but got only ACK from Mac??\r\n", t));
sockets[t].state = FINWAIT_2;
sockets[t].time_wait = 0;
}
break;
case SYN_RCVD:
if( ISSET(tcp->flags,ACK) ) {
sockets[t].state = ESTABLISHED;
handle_data = true;
initiate_read = true;
sockets[t].accept_more_data_from_mac = true;
}
break;
case ESTABLISHED:
if( ISSET(tcp->flags,FIN) ) {
sockets[t].seq_in++;
tcp_reply( ACK, t );
_shutdown( sockets[t].s, SD_SEND );
sockets[t].state = CLOSE_WAIT;
}
handle_data = true;
break;
case CLOSE_WAIT:
// handled in tcp_read_completion
break;
case LAST_ACK:
if( ISSET(tcp->flags,ACK) ) {
D(bug("<%d> LAST_ACK received, socket closed\r\n", t));
free_socket( t );
}
break;
case FINWAIT_1:
if( ISSET(tcp->flags,FIN) && ISSET(tcp->flags,ACK) ) {
sockets[t].seq_in++;
tcp_reply( ACK, t );
if(sockets[t].remote_closed) {
_closesocket(sockets[t].s);
sockets[t].s = INVALID_SOCKET;
} else {
_shutdown( sockets[t].s, SD_SEND );
}
sockets[t].state = TIME_WAIT;
sockets[t].time_wait = GetTickCount() + 2 * sockets[t].msl;
} else if( ISSET(tcp->flags,FIN) ) {
sockets[t].seq_in++;
tcp_reply( ACK, t );
if(sockets[t].remote_closed) {
_closesocket(sockets[t].s);
sockets[t].s = INVALID_SOCKET;
} else {
_shutdown( sockets[t].s, SD_SEND );
}
sockets[t].state = CLOSING;
} else if( ISSET(tcp->flags,ACK) ) {
sockets[t].state = FINWAIT_2;
}
break;
case FINWAIT_2:
if( ISSET(tcp->flags,FIN) ) {
sockets[t].seq_in++;
tcp_reply( ACK, t );
if(sockets[t].remote_closed) {
_closesocket(sockets[t].s);
sockets[t].s = INVALID_SOCKET;
} else {
_shutdown( sockets[t].s, SD_SEND );
}
sockets[t].state = TIME_WAIT;
sockets[t].time_wait = GetTickCount() + 2 * sockets[t].msl;
}
break;
case CLOSING:
if( ISSET(tcp->flags,ACK) ) {
sockets[t].state = TIME_WAIT;
sockets[t].time_wait = GetTickCount() + 2 * sockets[t].msl;
}
break;
case TIME_WAIT:
// Catching stray packets: wait MSL * 2 seconds, -> CLOSED
// Timer already set since we might not get here at all.
// I'm using exceptionally low MSL value (5 secs).
D(bug("<%d> time wait, datagram discarded\r\n", t));
break;
}
// The "t" descriptor may already be freed. However, it's safe
// to peek the state value inside the critical section.
D(bug("<%d> State machine end = %s\r\n", t, STATENAME(sockets[t].state)));
D(bug("<%d> handle_data=%d, initiate_read=%d\r\n", t, handle_data, initiate_read));
if( handle_data && dlen && sockets[t].accept_more_data_from_mac ) {
if( sockets[t].seq_in != ntohl(tcp->seq) ) {
D(bug("<%d> dropping duplicate datagram seq=%d, expected=%d\r\n", t, ntohl(tcp->seq), sockets[t].seq_in));
} else {
set_ttl( t, tcp->ip.ttl );
struct sockaddr_in to;
memset( &to, 0, sizeof(to) );
to.sin_family = AF_INET;
to.sin_port = tcp->dest_port;
to.sin_addr.s_addr = tcp->ip.dest;
D(bug("<%d> sending %d bytes to remote host\r\n", t, dlen));
sockets[t].accept_more_data_from_mac = false;
if( dlen > MAX_SEGMENT_SIZE ) {
D(bug("<%d> IMPOSSIBLE: b_send() dropped %d bytes! \r\n", t, dlen-MAX_SEGMENT_SIZE));
dlen = MAX_SEGMENT_SIZE;
}
memcpy( sockets[t].buffers_write[0].buf, data, dlen );
sockets[t].buffers_write[0].len = dlen;
sockets[t].bytes_remaining_to_send = dlen;
sockets[t].bytes_to_send = dlen;
bool send_now = false;
if( ISSET(tcp->flags,PSH) ) {
send_now = true;
} else {
// todo -- delayed send
send_now = true;
}
if(send_now) {
// Patch ftp server or client address if needed.
int lst = 1;
bool is_pasv;
uint16 ftp_data_port = 0;
if(ftp_is_ftp_port(sockets[t].src_port)) {
// Local ftp server may be entering to passive mode.
is_pasv = true;
ftp_parse_port_command(
sockets[t].buffers_write[0].buf,
dlen,
ftp_data_port,
is_pasv
);
} else if(ftp_is_ftp_port(sockets[t].dest_port)) {
// Local ftp client may be using port command.
is_pasv = false;
ftp_parse_port_command(
sockets[t].buffers_write[0].buf,
dlen,
ftp_data_port,
is_pasv
);
}
if(ftp_data_port) {
D(bug("<%d> ftp %s command detected, port %d\r\n", t, (is_pasv ? "SERVER PASV REPLY" : "CLIENT PORT"), ftp_data_port ));
// Note: for security reasons, only allow incoming connection from sockets[t].ip_dest
lst = alloc_listen_socket( ftp_data_port, sockets[t].ip_dest, 0/*iface*/, true );
if(lst < 0) {
D(bug("<%d> no more free slots\r\n", t));
} else {
// First start listening (need to know the local name later)
tcp_start_listen( lst );
// When t is closed, lst must be closed too.
sockets[t].child = lst;
l_sockets[lst].parent = t;
// Find out the local name
struct sockaddr_in name;
int namelen = sizeof(name);
memset( &name, 0, sizeof(name) );
if( _getsockname( sockets[t].s, (struct sockaddr *)&name, &namelen ) == SOCKET_ERROR ) {
D(bug("_getsockname() failed, error=%d\r\n", _WSAGetLastError() ));
}
ftp_modify_port_command(
sockets[t].buffers_write[0].buf,
dlen,
MAX_SEGMENT_SIZE,
ntohl(name.sin_addr.s_addr),
ftp_data_port,
is_pasv
);
sockets[t].buffers_write[0].len = dlen;
sockets[t].bytes_remaining_to_send = dlen;
// Do not change "bytes_to_send" field as it is used for ack calculation
}
} // end of ftp patch
if(!b_send(t)) {
// on error, close the ftp data listening socket if one was created
if(lst >= 0) {
D(bug("[%d] closing listening port %d after write error\r\n", t, l_sockets[lst].port));
_closesocket( l_sockets[lst].s );
l_sockets[lst].s = INVALID_SOCKET;
l_sockets[lst].port = 0;
l_sockets[lst].ip = 0;
l_sockets[lst].parent = -1;
sockets[t].child = -1;
}
}
}
}
}
if(initiate_read) {
if(!b_recfrom(t)) {
// post icmp error message
}
}
}
LeaveCriticalSection( &tcp_section );
}
/*
- Dispatch remote close and connect events.
- Expire time-waits.
- Handle resend timeouts.
*/
static unsigned int WINAPI tcp_connect_close_thread(void *arg)
{
WSAEVENT wait_handles[MAX_SOCKETS];
for( int i=0; i<MAX_SOCKETS; i++ ) {
wait_handles[i] = sockets[i].ev;
}
while(!is_router_shutting_down) {
DWORD ret = WaitForMultipleObjects(
MAX_SOCKETS,
wait_handles,
FALSE,
200
);
if(is_router_shutting_down) break;
EnterCriticalSection( &tcp_section );
if( ret >= WAIT_OBJECT_0 && ret < WAIT_OBJECT_0 + MAX_SOCKETS ) {
const int t = ret - WAIT_OBJECT_0;
D(bug("<%d> Event %d\r\n", t, ret));
if(sockets[t].in_use) {
WSANETWORKEVENTS what;
if( _WSAEnumNetworkEvents( sockets[t].s, sockets[t].ev, &what ) != SOCKET_ERROR ) {
if( what.lNetworkEvents & FD_CONNECT ) {
if( what.iErrorCode[FD_CONNECT_BIT] == 0 ) {
D(bug("<%d> Connect ok\r\n", t));
tcp_connect_callback(t);
} else {
D(bug("<%d> Connect error=%d\r\n", t, what.iErrorCode[FD_CONNECT_BIT]));
// Post icmp error
}
} else if( what.lNetworkEvents & FD_CLOSE ) {
if( what.iErrorCode[FD_CLOSE_BIT] == 0 ) {
D(bug("<%d> graceful close, state = %s\r\n", t, STATENAME(sockets[t].state)));
} else {
D(bug("<%d> abortive close, state = %s, code=%d\r\n", t, STATENAME(sockets[t].state), what.iErrorCode[FD_CLOSE_BIT]));
}
sockets[t].remote_closed = true;
}
} else {
int err = _WSAGetLastError();
if( err == WSAENOTSOCK ) {
D(bug("<%d> WSAEnumNetworkEvents: socket is already closed\r\n", t));
} else {
D(bug("<%d> WSAEnumNetworkEvents failed with error code %d, freeing slot\r\n", t, err));
free_socket( t );
}
}
}
_WSAResetEvent( sockets[t].ev );
} else {
static int interval = 5;
if( !--interval ) {
for( int i=0; i<MAX_SOCKETS; i++ ) {
if(sockets[i].in_use) {
DWORD tmw = sockets[i].time_wait;
DWORD stl = sockets[i].stream_to_mac_stalled_until;
if( tmw ) {
if( GetTickCount() >= tmw ) {
if( sockets[i].state == SYN_SENT ) {
/*
A very basic SYN flood protection. Note that watching
SYN_SENT instead of SYN_RCVD, because the state codes are
from the point of view of the Mac-Router interface, not Router-Remote.
*/
D(bug("<%d> SYN_SENT time-out expired\r\n", i));
} else {
D(bug("<%d> TIME_WAIT expired\r\n", i));
}
free_socket( i );
}
} else if( stl ) {
if( sockets[i].state == ESTABLISHED ) {
if( GetTickCount() >= stl ) {
D(bug("<%d> RESEND timeout expired\r\n", i));
sockets[i].stream_to_mac_stalled_until = GetTickCount() + sockets[i].resend_timeout;
send_buffer( i, true );
}
} else {
sockets[i].stream_to_mac_stalled_until = 0;
}
}
}
}
interval = 5;
}
}
LeaveCriticalSection( &tcp_section );
}
return 0;
}
static unsigned int WINAPI tcp_listen_thread(void *arg)
{
WSAEVENT wait_handles[MAX_SOCKETS];
for( int i=0; i<MAX_SOCKETS; i++ ) {
wait_handles[i] = l_sockets[i].ev;
tcp_start_listen( i );
}
while(!is_router_shutting_down) {
DWORD ret = WaitForMultipleObjects(
MAX_SOCKETS,
wait_handles,
FALSE,
200
);
if(is_router_shutting_down) break;
EnterCriticalSection( &tcp_section );
if( ret >= WAIT_OBJECT_0 && ret < WAIT_OBJECT_0 + MAX_SOCKETS ) {
const int lst = ret - WAIT_OBJECT_0;
D(bug("[%d] connection attempt to port %d\r\n", lst, l_sockets[lst].port));
WSANETWORKEVENTS what;
if( _WSAEnumNetworkEvents( l_sockets[lst].s, l_sockets[lst].ev, &what ) != SOCKET_ERROR ) {
if( what.lNetworkEvents & FD_ACCEPT ) {
if( what.iErrorCode[FD_ACCEPT_BIT] == 0 ) {
D(bug("[%d] Connect ok\r\n", lst));
tcp_accept_callback(lst);
} else {
D(bug("[%d] Connect error=%d\r\n", lst, what.iErrorCode[FD_ACCEPT_BIT]));
// Post icmp error
}
}
}
// close on errors too
if(l_sockets[lst].once) {
D(bug("[%d] once mode: closing listening socket on port %d\r\n", lst, l_sockets[lst].port));
if( _closesocket( l_sockets[lst].s ) == SOCKET_ERROR ) {
int err = _WSAGetLastError();
D(bug("[%d] close error %d\r\n", lst, err));
}
l_sockets[lst].s = INVALID_SOCKET;
l_sockets[lst].port = 0;
l_sockets[lst].ip = 0;
int t = l_sockets[lst].parent;
if( t >= 0 ) {
sockets[t].child = -1;
}
l_sockets[lst].parent = -1;
}
_WSAResetEvent( l_sockets[lst].ev );
}
LeaveCriticalSection( &tcp_section );
}
return 0;
}
/*
tcp_port=<port> [,<interface to bind>]
tcp_port=21,192.168.0.1
*/
static void init_tcp_listen_ports()
{
int32 index = 0;
const char *port_str;
while ((port_str = PrefsFindString("tcp_port", index++)) != NULL) {
uint32 iface = 0;
const char *if_str = strchr(port_str,',');
if(if_str) {
if_str++;
uint32 if_net = _inet_addr( if_str );
if(if_net == INADDR_NONE) if_net = INADDR_ANY;
iface = ntohl( if_net );
}
uint16 port = (uint16)strtoul( port_str, 0, 0 );
if( port ) {
uint32 ip = 0;
bool once = false;
alloc_listen_socket( port, ip, iface, once );
}
}
}
static HANDLE tcp_handle = 0;
static HANDLE tcp_l_handle = 0;
void init_tcp()
{
InitializeCriticalSection( &tcp_section );
for( int i=0; i<MAX_SOCKETS; i++ ) {
memset( &sockets[i], 0, sizeof(tcp_socket_t) );
sockets[i].s = INVALID_SOCKET;
sockets[i].state = CLOSED;
sockets[i].ev = _WSACreateEvent();
sockets[i].child = -1;
}
for( int i=0; i<MAX_SOCKETS; i++ ) {
memset( &l_sockets[i], 0, sizeof(tcp_listening_socket_t) );
l_sockets[i].s = INVALID_SOCKET;
l_sockets[i].ev = _WSACreateEvent();
l_sockets[i].parent = -1;
/*
l_sockets[i].port = 0;
l_sockets[i].ip = 0;
l_sockets[i].iface = 0;
l_sockets[i].once = false;
*/
}
init_tcp_listen_ports();
unsigned int tcp_tid;
tcp_handle = (HANDLE)_beginthreadex( 0, 0, tcp_connect_close_thread, 0, 0, &tcp_tid );
unsigned int tcp_l_tid;
tcp_l_handle = (HANDLE)_beginthreadex( 0, 0, tcp_listen_thread, 0, 0, &tcp_l_tid );
}
void final_tcp()
{
D(bug("closing all tcp sockets\r\n"));
for( int i=0; i<MAX_SOCKETS; i++ ) {
if(sockets[i].s != INVALID_SOCKET) {
D(bug(" closing socket %d\r\n", i));
}
free_socket( i );
if(sockets[i].buffers_write[0].buf) {
delete [] sockets[i].buffers_write[0].buf;
sockets[i].buffers_write[0].buf = 0;
}
if(sockets[i].buffers_read[0].buf) {
delete [] sockets[i].buffers_read[0].buf;
sockets[i].buffers_read[0].buf = 0;
}
}
D(bug("closing all tcp listening socket\r\n"));
for( int i=0; i<MAX_SOCKETS; i++ ) {
if(l_sockets[i].s != INVALID_SOCKET) {
D(bug(" closing listening socket %d\r\n", i));
_closesocket( l_sockets[i].s );
l_sockets[i].s = INVALID_SOCKET;
}
}
// The router module has already set the shutdown flag.
WaitForSingleObject( tcp_handle, INFINITE );
WaitForSingleObject( tcp_l_handle, INFINITE );
for( int i=0; i<MAX_SOCKETS; i++ ) {
if(sockets[i].ev != WSA_INVALID_EVENT) {
_WSACloseEvent(sockets[i].ev);
sockets[i].ev = WSA_INVALID_EVENT;
}
}
for( int i=0; i<MAX_SOCKETS; i++ ) {
if(l_sockets[i].ev != WSA_INVALID_EVENT) {
_WSACloseEvent(l_sockets[i].ev);
l_sockets[i].ev = WSA_INVALID_EVENT;
}
}
DeleteCriticalSection( &tcp_section );
}