/* * COPYRIGHT: See COPYING in the top level directory * PROJECT: ReactOS TCP/IP protocol driver * FILE: transport/tcp/tcp.c * PURPOSE: Transmission Control Protocol * PROGRAMMERS: Casper S. Hornstrup (chorns@users.sourceforge.net) * Art Yerkes (arty@users.sf.net) * REVISIONS: * CSH 01/08-2000 Created * arty 12/21/2004 Added accept */ #include "precomp.h" LONG TCP_IPIdentification = 0; static BOOLEAN TCPInitialized = FALSE; PORT_SET TCPPorts; #include "lwip/pbuf.h" #include "lwip/ip.h" #include "lwip/init.h" #include "lwip/arch.h" #include NPAGED_LOOKASIDE_LIST TdiBucketLookasideList; static IO_WORKITEM_ROUTINE DisconnectWorker; _Use_decl_annotations_ VOID NTAPI DisconnectWorker( _Unreferenced_parameter_ PDEVICE_OBJECT DeviceObject, _In_ PVOID Context ) { PCONNECTION_ENDPOINT Connection = (PCONNECTION_ENDPOINT)Context; PLIST_ENTRY Entry; PTDI_BUCKET Bucket; /* We timed out waiting for pending sends so force it to shutdown */ TCPTranslateError(LibTCPShutdown(Connection, 0, 1)); LockObject(Connection); while (!IsListEmpty(&Connection->SendRequest)) { Entry = RemoveHeadList(&Connection->SendRequest); Bucket = CONTAINING_RECORD(Entry, TDI_BUCKET, Entry); Bucket->Information = 0; Bucket->Status = STATUS_FILE_CLOSED; CompleteBucket(Connection, Bucket, FALSE); } while (!IsListEmpty(&Connection->ShutdownRequest)) { Entry = RemoveHeadList( &Connection->ShutdownRequest ); Bucket = CONTAINING_RECORD( Entry, TDI_BUCKET, Entry ); Bucket->Status = STATUS_TIMEOUT; Bucket->Information = 0; CompleteBucket(Connection, Bucket, FALSE); } UnlockObject(Connection); DereferenceObject(Connection); } VOID NTAPI DisconnectTimeoutDpc(PKDPC Dpc, PVOID DeferredContext, PVOID SystemArgument1, PVOID SystemArgument2) { PCONNECTION_ENDPOINT Connection = (PCONNECTION_ENDPOINT)DeferredContext; IoQueueWorkItem(Connection->DisconnectWorkItem, DisconnectWorker, DelayedWorkQueue, Connection); } VOID ConnectionFree(PVOID Object) { PCONNECTION_ENDPOINT Connection = (PCONNECTION_ENDPOINT)Object; KIRQL OldIrql; TI_DbgPrint(DEBUG_TCP, ("Freeing TCP Endpoint\n")); TcpipAcquireSpinLock(&ConnectionEndpointListLock, &OldIrql); RemoveEntryList(&Connection->ListEntry); TcpipReleaseSpinLock(&ConnectionEndpointListLock, OldIrql); ExDeleteResourceLite(&Connection->Resource); IoFreeWorkItem(Connection->DisconnectWorkItem); ExFreePoolWithTag( Connection, CONN_ENDPT_TAG ); } PCONNECTION_ENDPOINT TCPAllocateConnectionEndpoint( PVOID ClientContext ) { PCONNECTION_ENDPOINT Connection = (PCONNECTION_ENDPOINT) ExAllocatePoolWithTag(NonPagedPool, sizeof(CONNECTION_ENDPOINT), CONN_ENDPT_TAG); if (!Connection) return Connection; TI_DbgPrint(DEBUG_CPOINT, ("Connection point file object allocated at (0x%X).\n", Connection)); RtlZeroMemory(Connection, sizeof(CONNECTION_ENDPOINT)); /* Initialize spin lock that protects the connection endpoint file object */ ExInitializeResourceLite(&Connection->Resource); InitializeListHead(&Connection->ConnectRequest); InitializeListHead(&Connection->ListenRequest); InitializeListHead(&Connection->ReceiveRequest); InitializeListHead(&Connection->SendRequest); InitializeListHead(&Connection->ShutdownRequest); InitializeListHead(&Connection->PacketQueue); /* Initialize disconnect timer */ KeInitializeTimer(&Connection->DisconnectTimer); KeInitializeDpc(&Connection->DisconnectDpc, DisconnectTimeoutDpc, Connection); Connection->DisconnectWorkItem = IoAllocateWorkItem(TCPDeviceObject); if (!Connection->DisconnectWorkItem) { ExDeleteResourceLite(&Connection->Resource); ExFreePoolWithTag( Connection, CONN_ENDPT_TAG ); return NULL; } /* Save client context pointer */ Connection->ClientContext = ClientContext; Connection->RefCount = 1; Connection->Free = ConnectionFree; /* Add connection endpoint to global list */ ExInterlockedInsertTailList(&ConnectionEndpointListHead, &Connection->ListEntry, &ConnectionEndpointListLock); return Connection; } NTSTATUS TCPSocket( PCONNECTION_ENDPOINT Connection, UINT Family, UINT Type, UINT Proto ) { NTSTATUS Status; LockObject(Connection); TI_DbgPrint(DEBUG_TCP,("[IP, TCPSocket] Called: Connection %x, Family %d, Type %d, " "Proto %d, sizeof(CONNECTION_ENDPOINT) = %d\n", Connection, Family, Type, Proto, sizeof(CONNECTION_ENDPOINT))); Connection->SocketContext = LibTCPSocket(Connection); if (Connection->SocketContext) Status = STATUS_SUCCESS; else Status = STATUS_INSUFFICIENT_RESOURCES; UnlockObject(Connection); TI_DbgPrint(DEBUG_TCP,("[IP, TCPSocket] Leaving. Status = 0x%x\n", Status)); return Status; } NTSTATUS TCPClose( PCONNECTION_ENDPOINT Connection ) { LockObject(Connection); FlushAllQueues(Connection, STATUS_CANCELLED); UnlockObject(Connection); LibTCPClose(Connection, FALSE, TRUE); DereferenceObject(Connection); return STATUS_SUCCESS; } VOID TCPReceive(PIP_INTERFACE Interface, PIP_PACKET IPPacket) /* * FUNCTION: Receives and queues TCP data * ARGUMENTS: * IPPacket = Pointer to an IP packet that was received * NOTES: * This is the low level interface for receiving TCP data */ { TI_DbgPrint(DEBUG_TCP,("Sending packet %d (%d) to lwIP\n", IPPacket->TotalSize, IPPacket->HeaderSize)); LibIPInsertPacket(Interface->TCPContext, IPPacket->Header, IPPacket->TotalSize); } NTSTATUS TCPStartup(VOID) /* * FUNCTION: Initializes the TCP subsystem * RETURNS: * Status of operation */ { NTSTATUS Status; Status = PortsStartup(&TCPPorts, 1, 0xffff); if (!NT_SUCCESS(Status)) { return Status; } ExInitializeNPagedLookasideList(&TdiBucketLookasideList, NULL, NULL, 0, sizeof(TDI_BUCKET), TDI_BUCKET_TAG, 0); /* Initialize our IP library */ LibIPInitialize(); /* Register this protocol with IP layer */ IPRegisterProtocol(IPPROTO_TCP, TCPReceive); TCPInitialized = TRUE; return STATUS_SUCCESS; } NTSTATUS TCPShutdown(VOID) /* * FUNCTION: Shuts down the TCP subsystem * RETURNS: * Status of operation */ { if (!TCPInitialized) return STATUS_SUCCESS; ExDeleteNPagedLookasideList(&TdiBucketLookasideList); LibIPShutdown(); /* Deregister this protocol with IP layer */ IPRegisterProtocol(IPPROTO_TCP, NULL); TCPInitialized = FALSE; PortsShutdown( &TCPPorts ); return STATUS_SUCCESS; } NTSTATUS TCPTranslateError(const err_t err) { NTSTATUS Status; switch (err) { case ERR_OK: Status = STATUS_SUCCESS; return Status; //0 case ERR_MEM: Status = STATUS_INSUFFICIENT_RESOURCES; break; //-1 case ERR_BUF: Status = STATUS_BUFFER_TOO_SMALL; break; //-2 case ERR_TIMEOUT: Status = STATUS_TIMEOUT; break; // -3 case ERR_RTE: Status = STATUS_NETWORK_UNREACHABLE; break; //-4 case ERR_INPROGRESS: Status = STATUS_PENDING; return Status; //-5 case ERR_VAL: Status = STATUS_INVALID_PARAMETER; break; //-6 case ERR_WOULDBLOCK: Status = STATUS_CANT_WAIT; break; //-7 case ERR_USE: Status = STATUS_ADDRESS_ALREADY_EXISTS; break; //-8 case ERR_ISCONN: Status = STATUS_UNSUCCESSFUL; break; //-9 (FIXME) case ERR_ABRT: Status = STATUS_LOCAL_DISCONNECT; break; //-10 case ERR_RST: Status = STATUS_REMOTE_DISCONNECT; break; //-11 case ERR_CLSD: Status = STATUS_FILE_CLOSED; break; //-12 case ERR_CONN: Status = STATUS_INVALID_CONNECTION; break; //-13 case ERR_ARG: Status = STATUS_INVALID_PARAMETER; break; //-14 case ERR_IF: Status = STATUS_UNEXPECTED_NETWORK_ERROR; break; //-15 default: DbgPrint("Invalid error value: %d\n", err); ASSERT(FALSE); Status = STATUS_UNSUCCESSFUL; break; } TI_DbgPrint(DEBUG_TCP,("TCP operation failed: 0x%x (%d)\n", Status, err)); return Status; } NTSTATUS TCPConnect ( PCONNECTION_ENDPOINT Connection, PTDI_CONNECTION_INFORMATION ConnInfo, PTDI_CONNECTION_INFORMATION ReturnInfo, PTCP_COMPLETION_ROUTINE Complete, PVOID Context ) { NTSTATUS Status; ip_addr_t bindaddr, connaddr; IP_ADDRESS RemoteAddress; USHORT RemotePort; TA_IP_ADDRESS LocalAddress; PTDI_BUCKET Bucket; PNEIGHBOR_CACHE_ENTRY NCE; TI_DbgPrint(DEBUG_TCP,("[IP, TCPConnect] Called\n")); Status = AddrBuildAddress ((PTRANSPORT_ADDRESS)ConnInfo->RemoteAddress, &RemoteAddress, &RemotePort); if (!NT_SUCCESS(Status)) { TI_DbgPrint(DEBUG_TCP, ("Could not AddrBuildAddress in TCPConnect\n")); return Status; } /* Freed in TCPSocketState */ TI_DbgPrint(DEBUG_TCP, ("Connecting to address %x:%x\n", RemoteAddress.Address.IPv4Address, RemotePort)); LockObject(Connection); if (!Connection->AddressFile) { UnlockObject(Connection); return STATUS_INVALID_PARAMETER; } if (AddrIsUnspecified(&Connection->AddressFile->Address)) { if (!(NCE = RouteGetRouteToDestination(&RemoteAddress))) { UnlockObject(Connection); return STATUS_NETWORK_UNREACHABLE; } bindaddr.addr = NCE->Interface->Unicast.Address.IPv4Address; } else { bindaddr.addr = Connection->AddressFile->Address.Address.IPv4Address; } Status = TCPTranslateError(LibTCPBind(Connection, &bindaddr, Connection->AddressFile->Port)); if (!NT_SUCCESS(Status)) { UnlockObject(Connection); return Status; } /* Copy bind address into connection */ Connection->AddressFile->Address.Address.IPv4Address = bindaddr.addr; /* Check if we had an unspecified port */ if (!Connection->AddressFile->Port) { UINT AllocatedPort; /* We did, so we need to copy back the port */ Status = TCPGetSockAddress(Connection, (PTRANSPORT_ADDRESS)&LocalAddress, FALSE); if (!NT_SUCCESS(Status)) { UnlockObject(Connection); return Status; } /* Allocate the port in the port bitmap */ AllocatedPort = TCPAllocatePort(LocalAddress.Address[0].Address[0].sin_port); /* This should never fail unless all ports are in use */ if (AllocatedPort == (UINT) -1) { DbgPrint("ERR: No more ports available.\n"); UnlockObject(Connection); return STATUS_TOO_MANY_ADDRESSES; } Connection->AddressFile->Port = AllocatedPort; } connaddr.addr = RemoteAddress.Address.IPv4Address; Bucket = ExAllocateFromNPagedLookasideList(&TdiBucketLookasideList); if (!Bucket) { UnlockObject(Connection); return STATUS_NO_MEMORY; } Bucket->Request.RequestNotifyObject = (PVOID)Complete; Bucket->Request.RequestContext = Context; InsertTailList( &Connection->ConnectRequest, &Bucket->Entry ); UnlockObject(Connection); Status = TCPTranslateError(LibTCPConnect(Connection, &connaddr, RemotePort)); if (!NT_SUCCESS(Status)) { LockObject(Connection); RemoveEntryList(&Bucket->Entry); UnlockObject(Connection); ExFreeToNPagedLookasideList(&TdiBucketLookasideList, Bucket); } TI_DbgPrint(DEBUG_TCP,("[IP, TCPConnect] Leaving. Status = 0x%x\n", Status)); return Status; } NTSTATUS TCPDisconnect ( PCONNECTION_ENDPOINT Connection, UINT Flags, PLARGE_INTEGER Timeout, PTDI_CONNECTION_INFORMATION ConnInfo, PTDI_CONNECTION_INFORMATION ReturnInfo, PTCP_COMPLETION_ROUTINE Complete, PVOID Context ) { NTSTATUS Status = STATUS_INVALID_PARAMETER; PTDI_BUCKET Bucket; LARGE_INTEGER ActualTimeout; TI_DbgPrint(DEBUG_TCP,("[IP, TCPDisconnect] Called\n")); LockObject(Connection); if (Connection->SocketContext) { if (Flags & TDI_DISCONNECT_RELEASE) { if (IsListEmpty(&Connection->SendRequest)) { ReferenceObject(Connection); UnlockObject(Connection); Status = TCPTranslateError(LibTCPShutdown(Connection, 0, 1)); LockObject(Connection); DereferenceObject(Connection); } else if (Timeout && Timeout->QuadPart == 0) { FlushSendQueue(Connection, STATUS_FILE_CLOSED); ReferenceObject(Connection); UnlockObject(Connection); LibTCPShutdown(Connection, 0, 1); LockObject(Connection); DereferenceObject(Connection); Status = STATUS_TIMEOUT; } else { /* Use the timeout specified or 1 second if none was specified */ if (Timeout) { ActualTimeout = *Timeout; } else { ActualTimeout.QuadPart = -1000000; } /* We couldn't complete the request now because we need to wait for outstanding I/O */ Bucket = ExAllocateFromNPagedLookasideList(&TdiBucketLookasideList); if (!Bucket) { UnlockObject(Connection); return STATUS_NO_MEMORY; } Bucket->Request.RequestNotifyObject = (PVOID)Complete; Bucket->Request.RequestContext = Context; InsertTailList(&Connection->ShutdownRequest, &Bucket->Entry); ReferenceObject(Connection); if (KeSetTimer(&Connection->DisconnectTimer, ActualTimeout, &Connection->DisconnectDpc)) { /* Timer was already in the queue. */ DereferenceObject(Connection); } Status = STATUS_PENDING; } } if ((Flags & TDI_DISCONNECT_ABORT) || !Flags) { FlushReceiveQueue(Connection, STATUS_FILE_CLOSED); FlushSendQueue(Connection, STATUS_FILE_CLOSED); FlushShutdownQueue(Connection, STATUS_FILE_CLOSED); ReferenceObject(Connection); UnlockObject(Connection); Status = TCPTranslateError(LibTCPShutdown(Connection, 1, 1)); DereferenceObject(Connection); } else { UnlockObject(Connection); } } else { UnlockObject(Connection); /* We already got closed by the other side so just return success */ Status = STATUS_SUCCESS; } TI_DbgPrint(DEBUG_TCP,("[IP, TCPDisconnect] Leaving. Status = 0x%x\n", Status)); return Status; } NTSTATUS TCPReceiveData ( PCONNECTION_ENDPOINT Connection, PNDIS_BUFFER Buffer, ULONG ReceiveLength, PULONG BytesReceived, ULONG ReceiveFlags, PTCP_COMPLETION_ROUTINE Complete, PVOID Context ) { PTDI_BUCKET Bucket; PUCHAR DataBuffer; UINT DataLen, Received; NTSTATUS Status; TI_DbgPrint(DEBUG_TCP,("[IP, TCPReceiveData] Called for %d bytes (on socket %x)\n", ReceiveLength, Connection->SocketContext)); NdisQueryBuffer(Buffer, &DataBuffer, &DataLen); Status = LibTCPGetDataFromConnectionQueue(Connection, DataBuffer, DataLen, &Received); if (Status == STATUS_PENDING) { Bucket = ExAllocateFromNPagedLookasideList(&TdiBucketLookasideList); if (!Bucket) { TI_DbgPrint(DEBUG_TCP,("[IP, TCPReceiveData] Failed to allocate bucket\n")); return STATUS_NO_MEMORY; } Bucket->Request.RequestNotifyObject = Complete; Bucket->Request.RequestContext = Context; LockObject(Connection); InsertTailList( &Connection->ReceiveRequest, &Bucket->Entry ); UnlockObject(Connection); TI_DbgPrint(DEBUG_TCP,("[IP, TCPReceiveData] Queued read irp\n")); TI_DbgPrint(DEBUG_TCP,("[IP, TCPReceiveData] Leaving. Status = STATUS_PENDING\n")); (*BytesReceived) = 0; } else { (*BytesReceived) = Received; } return Status; } NTSTATUS TCPSendData ( PCONNECTION_ENDPOINT Connection, PCHAR BufferData, ULONG SendLength, PULONG BytesSent, ULONG Flags, PTCP_COMPLETION_ROUTINE Complete, PVOID Context ) { NTSTATUS Status; PTDI_BUCKET Bucket; ReferenceObject(Connection); TI_DbgPrint(DEBUG_TCP,("[IP, TCPSendData] Called for %d bytes (on socket %x)\n", SendLength, Connection->SocketContext)); TI_DbgPrint(DEBUG_TCP,("[IP, TCPSendData] Connection = %x\n", Connection)); TI_DbgPrint(DEBUG_TCP,("[IP, TCPSendData] Connection->SocketContext = %x\n", Connection->SocketContext)); Status = TCPTranslateError(LibTCPSend(Connection, BufferData, SendLength, BytesSent, FALSE)); TI_DbgPrint(DEBUG_TCP,("[IP, TCPSendData] Send: %x, %d\n", Status, SendLength)); /* Keep this request around ... there was no data yet */ if (Status == STATUS_PENDING) { /* Freed in TCPSocketState */ Bucket = ExAllocateFromNPagedLookasideList(&TdiBucketLookasideList); if (!Bucket) { DereferenceObject(Connection); TI_DbgPrint(DEBUG_TCP,("[IP, TCPSendData] Failed to allocate bucket\n")); return STATUS_NO_MEMORY; } Bucket->Request.RequestNotifyObject = Complete; Bucket->Request.RequestContext = Context; LockObject(Connection); InsertTailList( &Connection->SendRequest, &Bucket->Entry ); TI_DbgPrint(DEBUG_TCP,("[IP, TCPSendData] Queued write irp\n")); UnlockObject(Connection); } TI_DbgPrint(DEBUG_TCP, ("[IP, TCPSendData] Leaving. Status = %x\n", Status)); DereferenceObject(Connection); return Status; } UINT TCPAllocatePort(const UINT HintPort) { if (HintPort) { if (AllocatePort(&TCPPorts, HintPort)) return HintPort; else { TI_DbgPrint(MID_TRACE,("We got a hint port but couldn't allocate it\n")); return (UINT)-1; } } else return AllocatePortFromRange( &TCPPorts, 1024, 5000 ); } VOID TCPFreePort(const UINT Port) { DeallocatePort(&TCPPorts, Port); } NTSTATUS TCPGetSockAddress ( PCONNECTION_ENDPOINT Connection, PTRANSPORT_ADDRESS Address, BOOLEAN GetRemote ) { PTA_IP_ADDRESS AddressIP = (PTA_IP_ADDRESS)Address; ip_addr_t ipaddr; NTSTATUS Status; AddressIP->TAAddressCount = 1; AddressIP->Address[0].AddressLength = TDI_ADDRESS_LENGTH_IP; AddressIP->Address[0].AddressType = TDI_ADDRESS_TYPE_IP; LockObject(Connection); if (GetRemote) { Status = TCPTranslateError(LibTCPGetPeerName(Connection->SocketContext, &ipaddr, &AddressIP->Address[0].Address[0].sin_port)); } else { Status = TCPTranslateError(LibTCPGetHostName(Connection->SocketContext, &ipaddr, &AddressIP->Address[0].Address[0].sin_port)); } UnlockObject(Connection); AddressIP->Address[0].Address[0].in_addr = ipaddr.addr; RtlZeroMemory(&AddressIP->Address[0].Address[0].sin_zero, sizeof(AddressIP->Address[0].Address[0].sin_zero)); return Status; } BOOLEAN TCPRemoveIRP( PCONNECTION_ENDPOINT Endpoint, PIRP Irp ) { PLIST_ENTRY Entry; PLIST_ENTRY ListHead[5]; PTDI_BUCKET Bucket; UINT i = 0; BOOLEAN Found = FALSE; ListHead[0] = &Endpoint->SendRequest; ListHead[1] = &Endpoint->ReceiveRequest; ListHead[2] = &Endpoint->ConnectRequest; ListHead[3] = &Endpoint->ListenRequest; ListHead[4] = &Endpoint->ShutdownRequest; LockObject(Endpoint); for( i = 0; i < 5; i++ ) { for( Entry = ListHead[i]->Flink; Entry != ListHead[i]; Entry = Entry->Flink ) { Bucket = CONTAINING_RECORD( Entry, TDI_BUCKET, Entry ); if( Bucket->Request.RequestContext == Irp ) { RemoveEntryList( &Bucket->Entry ); ExFreeToNPagedLookasideList(&TdiBucketLookasideList, Bucket); Found = TRUE; break; } } } UnlockObject(Endpoint); return Found; } NTSTATUS TCPSetNoDelay( PCONNECTION_ENDPOINT Connection, BOOLEAN Set) { if (!Connection) return STATUS_UNSUCCESSFUL; if (Connection->SocketContext == NULL) return STATUS_UNSUCCESSFUL; LibTCPSetNoDelay(Connection->SocketContext, Set); return STATUS_SUCCESS; } NTSTATUS TCPGetSocketStatus( PCONNECTION_ENDPOINT Connection, PULONG State) { if (!Connection) return STATUS_UNSUCCESSFUL; if (Connection->SocketContext == NULL) return STATUS_UNSUCCESSFUL; LibTCPGetSocketStatus(Connection->SocketContext, State); return STATUS_SUCCESS; } /* EOF */