/* * Copyright (c) 2018-2020, Andreas Kling * All rights reserved. * * Redistribution and use in source and binary forms, with or without * modification, are permitted provided that the following conditions are met: * * 1. Redistributions of source code must retain the above copyright notice, this * list of conditions and the following disclaimer. * * 2. Redistributions in binary form must reproduce the above copyright notice, * this list of conditions and the following disclaimer in the documentation * and/or other materials provided with the distribution. * * THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND CONTRIBUTORS "AS IS" * AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE * IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE ARE * DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT HOLDER OR CONTRIBUTORS BE LIABLE * FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL * DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS OR * SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION) HOWEVER * CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY, * OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE * OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE. */ #include #include #include #include #include #include #include #include #include #include #include #include #include #include #include #include //#define IPV4_SOCKET_DEBUG namespace Kernel { Lockable>& IPv4Socket::all_sockets() { static Lockable>* s_table; if (!s_table) s_table = new Lockable>; return *s_table; } KResultOr> IPv4Socket::create(int type, int protocol) { if (type == SOCK_STREAM) return TCPSocket::create(protocol); if (type == SOCK_DGRAM) return UDPSocket::create(protocol); if (type == SOCK_RAW) return adopt(*new IPv4Socket(type, protocol)); return KResult(-EINVAL); } IPv4Socket::IPv4Socket(int type, int protocol) : Socket(AF_INET, type, protocol) { #ifdef IPV4_SOCKET_DEBUG dbg() << "IPv4Socket{" << this << "} created with type=" << type << ", protocol=" << protocol; #endif m_buffer_mode = type == SOCK_STREAM ? BufferMode::Bytes : BufferMode::Packets; if (m_buffer_mode == BufferMode::Bytes) { m_scratch_buffer = KBuffer::create_with_size(65536); } LOCKER(all_sockets().lock()); all_sockets().resource().set(this); } IPv4Socket::~IPv4Socket() { LOCKER(all_sockets().lock()); all_sockets().resource().remove(this); } void IPv4Socket::get_local_address(sockaddr* address, socklen_t* address_size) { sockaddr_in local_address = { AF_INET, htons(m_local_port), { m_local_address.to_in_addr_t() }, { 0 } }; memcpy(address, &local_address, min(static_cast(*address_size), sizeof(sockaddr_in))); *address_size = sizeof(sockaddr_in); } void IPv4Socket::get_peer_address(sockaddr* address, socklen_t* address_size) { sockaddr_in peer_address = { AF_INET, htons(m_peer_port), { m_peer_address.to_in_addr_t() }, { 0 } }; memcpy(address, &peer_address, min(static_cast(*address_size), sizeof(sockaddr_in))); *address_size = sizeof(sockaddr_in); } KResult IPv4Socket::bind(const sockaddr* user_address, socklen_t address_size) { ASSERT(setup_state() == SetupState::Unstarted); if (address_size != sizeof(sockaddr_in)) return KResult(-EINVAL); sockaddr_in address; copy_from_user(&address, user_address, sizeof(sockaddr_in)); if (address.sin_family != AF_INET) return KResult(-EINVAL); auto requested_local_port = ntohs(address.sin_port); if (!Process::current->is_superuser()) { if (requested_local_port < 1024) { dbg() << "UID " << Process::current->uid() << " attempted to bind " << class_name() << " to port " << requested_local_port; return KResult(-EACCES); } } m_local_address = IPv4Address((const u8*)&address.sin_addr.s_addr); m_local_port = requested_local_port; #ifdef IPV4_SOCKET_DEBUG dbg() << "IPv4Socket::bind " << class_name() << "{" << this << "} to " << m_local_address << ":" << m_local_port; #endif return protocol_bind(); } KResult IPv4Socket::listen(size_t backlog) { int rc = allocate_local_port_if_needed(); if (rc < 0) return KResult(-EADDRINUSE); set_backlog(backlog); m_role = Role::Listener; #ifdef IPV4_SOCKET_DEBUG dbg() << "IPv4Socket{" << this << "} listening with backlog=" << backlog; #endif return protocol_listen(); } KResult IPv4Socket::connect(FileDescription& description, const sockaddr* address, socklen_t address_size, ShouldBlock should_block) { if (address_size != sizeof(sockaddr_in)) return KResult(-EINVAL); if (address->sa_family != AF_INET) return KResult(-EINVAL); if (m_role == Role::Connected) return KResult(-EISCONN); auto& ia = *(const sockaddr_in*)address; m_peer_address = IPv4Address((const u8*)&ia.sin_addr.s_addr); m_peer_port = ntohs(ia.sin_port); return protocol_connect(description, should_block); } void IPv4Socket::attach(FileDescription&) { } void IPv4Socket::detach(FileDescription&) { } bool IPv4Socket::can_read(const FileDescription&, size_t) const { if (m_role == Role::Listener) return can_accept(); if (protocol_is_disconnected()) return true; return m_can_read; } bool IPv4Socket::can_write(const FileDescription&, size_t) const { return is_connected(); } int IPv4Socket::allocate_local_port_if_needed() { if (m_local_port) return m_local_port; int port = protocol_allocate_local_port(); if (port < 0) return port; m_local_port = (u16)port; return port; } ssize_t IPv4Socket::sendto(FileDescription&, const void* data, size_t data_length, int flags, const sockaddr* addr, socklen_t addr_length) { (void)flags; if (addr && addr_length != sizeof(sockaddr_in)) return -EINVAL; if (addr) { if (addr->sa_family != AF_INET) { klog() << "sendto: Bad address family: " << addr->sa_family << " is not AF_INET!"; return -EAFNOSUPPORT; } auto& ia = *(const sockaddr_in*)addr; m_peer_address = IPv4Address((const u8*)&ia.sin_addr.s_addr); m_peer_port = ntohs(ia.sin_port); } auto routing_decision = route_to(m_peer_address, m_local_address, bound_interface()); if (routing_decision.is_zero()) return -EHOSTUNREACH; if (m_local_address.to_u32() == 0) m_local_address = routing_decision.adapter->ipv4_address(); int rc = allocate_local_port_if_needed(); if (rc < 0) return rc; #ifdef IPV4_SOCKET_DEBUG klog() << "sendto: destination=" << m_peer_address.to_string().characters() << ":" << m_peer_port; #endif if (type() == SOCK_RAW) { routing_decision.adapter->send_ipv4(routing_decision.next_hop, m_peer_address, (IPv4Protocol)protocol(), (const u8*)data, data_length, m_ttl); return data_length; } int nsent = protocol_send(data, data_length); if (nsent > 0) Thread::current->did_ipv4_socket_write(nsent); return nsent; } ssize_t IPv4Socket::receive_byte_buffered(FileDescription& description, void* buffer, size_t buffer_length, int, sockaddr*, socklen_t*) { Locker locker(lock()); if (m_receive_buffer.is_empty()) { if (protocol_is_disconnected()) return 0; if (!description.is_blocking()) return -EAGAIN; locker.unlock(); auto res = Thread::current->block(description); locker.lock(); if (!m_can_read) { if (res != Thread::BlockResult::WokeNormally) return -EINTR; // Unblocked due to timeout. return -EAGAIN; } } ASSERT(!m_receive_buffer.is_empty()); int nreceived = m_receive_buffer.read((u8*)buffer, buffer_length); if (nreceived > 0) Thread::current->did_ipv4_socket_read((size_t)nreceived); m_can_read = !m_receive_buffer.is_empty(); return nreceived; } ssize_t IPv4Socket::receive_packet_buffered(FileDescription& description, void* buffer, size_t buffer_length, int flags, sockaddr* addr, socklen_t* addr_length) { Locker locker(lock()); ReceivedPacket packet; { if (m_receive_queue.is_empty()) { // FIXME: Shouldn't this return -ENOTCONN instead of EOF? // But if so, we still need to deliver at least one EOF read to userspace.. right? if (protocol_is_disconnected()) return 0; if (!description.is_blocking()) return -EAGAIN; } if (!m_receive_queue.is_empty()) { packet = m_receive_queue.take_first(); m_can_read = !m_receive_queue.is_empty(); #ifdef IPV4_SOCKET_DEBUG dbg() << "IPv4Socket(" << this << "): recvfrom without blocking " << packet.data.value().size() << " bytes, packets in queue: " << m_receive_queue.size_slow(); #endif } } if (!packet.data.has_value()) { if (protocol_is_disconnected()) { dbg() << "IPv4Socket{" << this << "} is protocol-disconnected, returning 0 in recvfrom!"; return 0; } locker.unlock(); auto res = Thread::current->block(description); locker.lock(); if (!m_can_read) { if (res != Thread::BlockResult::WokeNormally) return -EINTR; // Unblocked due to timeout. return -EAGAIN; } ASSERT(m_can_read); ASSERT(!m_receive_queue.is_empty()); packet = m_receive_queue.take_first(); m_can_read = !m_receive_queue.is_empty(); #ifdef IPV4_SOCKET_DEBUG dbg() << "IPv4Socket(" << this << "): recvfrom with blocking " << packet.data.value().size() << " bytes, packets in queue: " << m_receive_queue.size_slow(); #endif } ASSERT(packet.data.has_value()); auto& ipv4_packet = *(const IPv4Packet*)(packet.data.value().data()); if (addr) { #ifdef IPV4_SOCKET_DEBUG dbg() << "Incoming packet is from: " << packet.peer_address << ":" << packet.peer_port; #endif auto& ia = *(sockaddr_in*)addr; memcpy(&ia.sin_addr, &packet.peer_address, sizeof(IPv4Address)); ia.sin_port = htons(packet.peer_port); ia.sin_family = AF_INET; ASSERT(addr_length); *addr_length = sizeof(sockaddr_in); } if (type() == SOCK_RAW) { ASSERT(buffer_length >= ipv4_packet.payload_size()); memcpy(buffer, ipv4_packet.payload(), ipv4_packet.payload_size()); return ipv4_packet.payload_size(); } return protocol_receive(packet.data.value(), buffer, buffer_length, flags); } ssize_t IPv4Socket::recvfrom(FileDescription& description, void* buffer, size_t buffer_length, int flags, sockaddr* addr, socklen_t* addr_length) { if (addr_length && *addr_length < sizeof(sockaddr_in)) return -EINVAL; #ifdef IPV4_SOCKET_DEBUG klog() << "recvfrom: type=" << type() << ", local_port=" << local_port(); #endif ssize_t nreceived = 0; if (buffer_mode() == BufferMode::Bytes) nreceived = receive_byte_buffered(description, buffer, buffer_length, flags, addr, addr_length); else nreceived = receive_packet_buffered(description, buffer, buffer_length, flags, addr, addr_length); if (nreceived > 0) Thread::current->did_ipv4_socket_read(nreceived); return nreceived; } bool IPv4Socket::did_receive(const IPv4Address& source_address, u16 source_port, KBuffer&& packet) { LOCKER(lock()); if (is_shut_down_for_reading()) return false; auto packet_size = packet.size(); if (buffer_mode() == BufferMode::Bytes) { size_t space_in_receive_buffer = m_receive_buffer.space_for_writing(); if (packet_size > space_in_receive_buffer) { dbg() << "IPv4Socket(" << this << "): did_receive refusing packet since buffer is full."; ASSERT(m_can_read); return false; } int nreceived = protocol_receive(packet, m_scratch_buffer.value().data(), m_scratch_buffer.value().size(), 0); m_receive_buffer.write(m_scratch_buffer.value().data(), nreceived); m_can_read = !m_receive_buffer.is_empty(); } else { // FIXME: Maybe track the number of packets so we don't have to walk the entire packet queue to count them.. if (m_receive_queue.size_slow() > 2000) { dbg() << "IPv4Socket(" << this << "): did_receive refusing packet since queue is full."; return false; } m_receive_queue.append({ source_address, source_port, move(packet) }); m_can_read = true; } m_bytes_received += packet_size; #ifdef IPV4_SOCKET_DEBUG if (buffer_mode() == BufferMode::Bytes) dbg() << "IPv4Socket(" << this << "): did_receive " << packet_size << " bytes, total_received=" << m_bytes_received; else dbg() << "IPv4Socket(" << this << "): did_receive " << packet_size << " bytes, total_received=" << m_bytes_received << ", packets in queue: " << m_receive_queue.size_slow(); #endif return true; } String IPv4Socket::absolute_path(const FileDescription&) const { if (m_role == Role::None) return "socket"; StringBuilder builder; builder.append("socket:"); builder.appendf("%s:%d", m_local_address.to_string().characters(), m_local_port); if (m_role == Role::Accepted || m_role == Role::Connected) builder.appendf(" / %s:%d", m_peer_address.to_string().characters(), m_peer_port); switch (m_role) { case Role::Listener: builder.append(" (listening)"); break; case Role::Accepted: builder.append(" (accepted)"); break; case Role::Connected: builder.append(" (connected)"); break; case Role::Connecting: builder.append(" (connecting)"); break; default: ASSERT_NOT_REACHED(); } return builder.to_string(); } KResult IPv4Socket::setsockopt(int level, int option, const void* value, socklen_t value_size) { if (level != IPPROTO_IP) return Socket::setsockopt(level, option, value, value_size); switch (option) { case IP_TTL: if (value_size < sizeof(int)) return KResult(-EINVAL); if (*(const int*)value < 0 || *(const int*)value > 255) return KResult(-EINVAL); m_ttl = (u8) * (const int*)value; return KSuccess; default: return KResult(-ENOPROTOOPT); } } KResult IPv4Socket::getsockopt(FileDescription& description, int level, int option, void* value, socklen_t* value_size) { if (level != IPPROTO_IP) return Socket::getsockopt(description, level, option, value, value_size); switch (option) { case IP_TTL: if (*value_size < sizeof(int)) return KResult(-EINVAL); *(int*)value = m_ttl; return KSuccess; default: return KResult(-ENOPROTOOPT); } } int IPv4Socket::ioctl(FileDescription&, unsigned request, unsigned arg) { REQUIRE_PROMISE(inet); auto ioctl_route = [request, arg]() { auto* route = (rtentry*)arg; if (!Process::current->validate_read_typed(route)) return -EFAULT; char namebuf[IFNAMSIZ + 1]; memcpy(namebuf, route->rt_dev, IFNAMSIZ); namebuf[sizeof(namebuf) - 1] = '\0'; auto adapter = NetworkAdapter::lookup_by_name(namebuf); if (!adapter) return -ENODEV; switch (request) { case SIOCADDRT: if (!Process::current->is_superuser()) return -EPERM; if (route->rt_gateway.sa_family != AF_INET) return -EAFNOSUPPORT; if ((route->rt_flags & (RTF_UP | RTF_GATEWAY)) != (RTF_UP | RTF_GATEWAY)) return -EINVAL; // FIXME: Find the correct value to return adapter->set_ipv4_gateway(IPv4Address(((sockaddr_in&)route->rt_gateway).sin_addr.s_addr)); return 0; case SIOCDELRT: // FIXME: Support gateway deletion return 0; } return -EINVAL; }; auto ioctl_interface = [request, arg]() { auto* ifr = (ifreq*)arg; if (!Process::current->validate_read_typed(ifr)) return -EFAULT; char namebuf[IFNAMSIZ + 1]; memcpy(namebuf, ifr->ifr_name, IFNAMSIZ); namebuf[sizeof(namebuf) - 1] = '\0'; auto adapter = NetworkAdapter::lookup_by_name(namebuf); if (!adapter) return -ENODEV; switch (request) { case SIOCSIFADDR: if (!Process::current->is_superuser()) return -EPERM; if (ifr->ifr_addr.sa_family != AF_INET) return -EAFNOSUPPORT; adapter->set_ipv4_address(IPv4Address(((sockaddr_in&)ifr->ifr_addr).sin_addr.s_addr)); return 0; case SIOCSIFNETMASK: if (!Process::current->is_superuser()) return -EPERM; if (ifr->ifr_addr.sa_family != AF_INET) return -EAFNOSUPPORT; adapter->set_ipv4_netmask(IPv4Address(((sockaddr_in&)ifr->ifr_netmask).sin_addr.s_addr)); return 0; case SIOCGIFADDR: if (!Process::current->validate_write_typed(ifr)) return -EFAULT; ifr->ifr_addr.sa_family = AF_INET; ((sockaddr_in&)ifr->ifr_addr).sin_addr.s_addr = adapter->ipv4_address().to_u32(); return 0; case SIOCGIFHWADDR: if (!Process::current->validate_write_typed(ifr)) return -EFAULT; ifr->ifr_hwaddr.sa_family = AF_INET; { auto mac_address = adapter->mac_address(); memcpy(ifr->ifr_hwaddr.sa_data, &mac_address, sizeof(MACAddress)); } return 0; } return -EINVAL; }; switch (request) { case SIOCSIFADDR: case SIOCSIFNETMASK: case SIOCGIFADDR: case SIOCGIFHWADDR: return ioctl_interface(); case SIOCADDRT: case SIOCDELRT: return ioctl_route(); } return -EINVAL; } void IPv4Socket::close() { shutdown(SHUT_RDWR); } void IPv4Socket::shut_down_for_reading() { Socket::shut_down_for_reading(); m_can_read = true; } }