/*
 * ZeroTier One - Network Virtualization Everywhere
 * Copyright (C) 2011-2015  ZeroTier, Inc.
 *
 * This program is free software: you can redistribute it and/or modify
 * it under the terms of the GNU General Public License as published by
 * the Free Software Foundation, either version 3 of the License, or
 * (at your option) any later version.
 *
 * This program is distributed in the hope that it will be useful,
 * but WITHOUT ANY WARRANTY; without even the implied warranty of
 * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the
 * GNU General Public License for more details.
 *
 * You should have received a copy of the GNU General Public License
 * along with this program.  If not, see <http://www.gnu.org/licenses/>.
 *
 * --
 *
 * ZeroTier may be used and distributed under the terms of the GPLv3, which
 * are available at: http://www.gnu.org/licenses/gpl-3.0.html
 *
 * If you would like to embed ZeroTier into a commercial application or
 * redistribute it in a modified binary form, please contact ZeroTier Networks
 * LLC. Start here: http://www.zerotier.com/
 */

#ifdef ZT_ENABLE_NETCON

// NOTE(review): the names of these three system headers were lost from the
// file; they are restored from what the code below uses (std::find/std::sort/
// std::unique) and presumably a dlopen()-based LWIPStack -- confirm against
// version control.
#include <algorithm>
#include <utility>
#include <dlfcn.h>

#include "NetconEthernetTap.hpp"

#include "../node/Utils.hpp"
#include "../node/Node.hpp" // for //TRACE
#include "../osdep/OSUtils.hpp"
#include "../osdep/Phy.hpp"

#include "lwip/tcp_impl.h"
#include "netif/etharp.h"
#include "lwip/ip.h"
#include "lwip/ip_addr.h"
#include "lwip/ip_frag.h"

#include "LWIPStack.hpp"
#include "NetconService.hpp"
#include "Intercept.h"
#include "NetconUtilities.hpp"

// Poll interval handed to lwIP's tcp_poll() when a connection is set up.
#define APPLICATION_POLL_FREQ 1

namespace ZeroTier {

/**
 * Create the tap: derive the per-network unix socket path, load and
 * initialize the lwIP library, start listening for intercept clients on the
 * unix socket and launch the service thread.
 *
 * @throws std::runtime_error if the unix socket cannot be bound
 */
NetconEthernetTap::NetconEthernetTap(
	const char *homePath,
	const MAC &mac,
	unsigned int mtu,
	unsigned int metric,
	uint64_t nwid,
	const char *friendlyName,
	void (*handler)(void *,uint64_t,const MAC &,const MAC &,unsigned int,unsigned int,const void *,unsigned int),
	void *arg) :
	_phy(this,false,true),
	_unixListenSocket((PhySocket *)0),
	_handler(handler),
	_arg(arg),
	_nwid(nwid),
	_mac(mac),
	_homePath(homePath),
	_mtu(mtu),
	_enabled(true),
	_run(true)
{
	char sockPath[4096];
	Utils::snprintf(sockPath,sizeof(sockPath),"/tmp/.ztnc_%.16llx",(unsigned long long)nwid);
	_dev = sockPath;

	// NOTE(review): the library path is hard-coded to a developer machine.
	lwipstack = new LWIPStack("/root/dev/netcon/liblwip.so");
	// Plain `new` throws instead of returning null, so this branch cannot be
	// taken; it is kept only to preserve the original TODO.
	if(!lwipstack) // TODO double check this check
		throw std::runtime_error("unable to load lwip lib.");
	lwipstack->lwip_init();

	_unixListenSocket = _phy.unixListen(sockPath,(void *)this);
	if (!_unixListenSocket)
		throw std::runtime_error(std::string("unable to bind to ")+sockPath);
	_thread = Thread::start(this);
}

/**
 * Stop the service thread, wait for it to exit and close the listen socket.
 */
NetconEthernetTap::~NetconEthernetTap()
{
	_run = false;
	_phy.whack();
	_phy.whack();
	Thread::join(_thread);
	_phy.close(_unixListenSocket,false);
	// NOTE(review): lwipstack is never deleted here -- see the cleanup TODO at
	// the end of threadMain().
}

/** Enable or disable processing of incoming frames in put(). */
void NetconEthernetTap::setEnabled(bool en)
{
	_enabled = en;
}

/** @return true if put() currently processes frames */
bool NetconEthernetTap::enabled() const
{
	return _enabled;
}

/**
 * Add an IP to this tap's address list (kept sorted) and, for IPv4, register
 * it with the ARP responder.
 *
 * @return always true, whether or not the address was already present
 */
bool NetconEthernetTap::addIp(const InetAddress &ip)
{
	Mutex::Lock _l(_ips_m);
	if (std::find(_ips.begin(),_ips.end(),ip) == _ips.end()) {
		_ips.push_back(ip);
		std::sort(_ips.begin(),_ips.end());

		if (ip.isV4()) {
			Mutex::Lock _l2(_arp_m);
			_arp.addLocal((uint32_t)(reinterpret_cast<const struct sockaddr_in *>(&ip)->sin_addr.s_addr),_mac);
		}

		// TODO: alloc IP in LWIP
		//netif_set_addr(netif, ipaddr, netmask, gw);
	}
	return true; // TODO: what is expected?
}

/**
 * Remove an IP from this tap's address list and, for IPv4, from the ARP
 * responder.
 *
 * @return false if the address was not assigned, true otherwise
 */
bool NetconEthernetTap::removeIp(const InetAddress &ip)
{
	Mutex::Lock _l(_ips_m);
	std::vector<InetAddress>::iterator i(std::find(_ips.begin(),_ips.end(),ip));
	if (i == _ips.end())
		return false;

	_ips.erase(i);

	if (ip.isV4()) {
		Mutex::Lock _l2(_arp_m);
		_arp.remove((uint32_t)(reinterpret_cast<const struct sockaddr_in *>(&ip)->sin_addr.s_addr));
	}

	// TODO: dealloc IP from LWIP

	return true;
}

/** @return a copy of the currently assigned addresses */
std::vector<InetAddress> NetconEthernetTap::ips() const
{
	Mutex::Lock _l(_ips_m);
	return _ips;
}

/**
 * Accept an Ethernet frame from the virtual network.
 *
 * ARP frames are answered locally through the frame handler. IPv4 payloads
 * are copied into an lwIP pbuf chain; other ethertypes are ignored.
 */
void NetconEthernetTap::put(const MAC &from,const MAC &to,unsigned int etherType,const void *data,unsigned int len)
{
	fprintf(stderr, "put\n");
	if (!_enabled)
		return;

	if (etherType == ZT_ETHERTYPE_ARP) {
		char arpReplyBuf[ZT_ARP_BUF_LENGTH];
		unsigned int arpReplyLen = 0;
		MAC arpReplyDest;

		Mutex::Lock _l2(_arp_m);
		_arp.processIncomingArp(data,len,arpReplyBuf,arpReplyLen,arpReplyDest);
		if (arpReplyLen > 0)
			_handler(_arg,_nwid,_mac,from,ZT_ETHERTYPE_ARP,0,arpReplyBuf,arpReplyLen);
	}
	else if (etherType == ZT_ETHERTYPE_IPV4) {
		// Pass IPV4 packets to LWIP.
		// pbuf lengths are 16-bit; refuse anything that would be truncated.
		if (len > 0xffff) {
			fprintf(stderr, "packet dropped\n");
			return;
		}

		// Allocate a pbuf chain from the pool, sized from the frame length
		// (previously an uninitialized local shadowing `len` was used here).
		struct pbuf *p = lwipstack->pbuf_alloc(PBUF_RAW, (u16_t)len, PBUF_POOL);
		if (p != NULL) {
			// Walk the chain until the entire packet has been copied in.
			const char *bufptr = (const char *)data;
			for (struct pbuf *q = p; q != NULL; q = q->next) {
				memcpy(q->payload, bufptr, q->len);
				bufptr += q->len;
			}

			// TODO: hand the pbuf to the lwIP netif input once one exists.
			// Until then nothing else references it, so release it here
			// instead of leaking a pool buffer per packet.
			lwipstack->pbuf_free(p);
		}
		else {
			fprintf(stderr, "packet dropped\n");
		}
	}
}

/** @return the unix socket path used as this tap's device name */
std::string NetconEthernetTap::deviceName() const
{
	return _dev;
}

/** Friendly names are not supported by this tap; the call is ignored. */
void NetconEthernetTap::setFriendlyName(const char *friendlyName)
{
}

/**
 * Recompute the multicast group set (currently only the address-resolution
 * group of each assigned IP) and report the difference from the previous set.
 *
 * @param added receives groups present now but not before
 * @param removed receives groups present before but not now
 */
void NetconEthernetTap::scanMulticastGroups(std::vector<MulticastGroup> &added,std::vector<MulticastGroup> &removed)
{
	fprintf(stderr, "scanMulticastGroups\n");
	std::vector<MulticastGroup> newGroups;
	Mutex::Lock _l(_multicastGroups_m);

	// TODO: get multicast subscriptions from LWIP

	std::vector<InetAddress> allIps(ips());
	for(std::vector<InetAddress>::iterator ip(allIps.begin());ip!=allIps.end();++ip)
		newGroups.push_back(MulticastGroup::deriveMulticastGroupForAddressResolution(*ip));

	std::sort(newGroups.begin(),newGroups.end());
	// std::unique only moves duplicates to the tail; they must be erased.
	newGroups.erase(std::unique(newGroups.begin(),newGroups.end()),newGroups.end());

	for(std::vector<MulticastGroup>::iterator m(newGroups.begin());m!=newGroups.end();++m) {
		if (!std::binary_search(_multicastGroups.begin(),_multicastGroups.end(),*m))
			added.push_back(*m);
	}
	for(std::vector<MulticastGroup>::iterator m(_multicastGroups.begin());m!=_multicastGroups.end();++m) {
		if (!std::binary_search(newGroups.begin(),newGroups.end(),*m))
			removed.push_back(*m);
	}

	_multicastGroups.swap(newGroups);
}

/** @return the connection owning the given PCB across all clients, or NULL */
NetconConnection *NetconEthernetTap::getConnectionByPCB(struct tcp_pcb *pcb)
{
	for(size_t i=0; i<clients.size(); i++) {
		NetconConnection *c = clients[i]->containsPCB(pcb);
		if(c) {
			return c;
		}
	}
	return NULL;
}

/** @return the connection whose local socket has descriptor fd, or NULL */
NetconConnection *NetconEthernetTap::getConnectionByThisFD(int fd)
{
	for(size_t i=0; i<clients.size(); i++) {
		for(size_t j=0; j<clients[i]->connections.size(); j++) {
			if(_phy.getDescriptor(clients[i]->connections[j]->sock) == fd) {
				return clients[i]->connections[j];
			}
		}
	}
	return NULL;
}

/** @return the client that has a connection using the given PCB, or NULL */
NetconClient *NetconEthernetTap::getClientByPCB(struct tcp_pcb *pcb)
{
	for(size_t i=0; i<clients.size(); i++) {
		if(clients[i]->containsPCB(pcb)) {
			return clients[i];
		}
	}
	return NULL;
}

/**
 * Close every connection of a client and destroy it.
 *
 * A NULL client, or one that is not (or no longer) registered in `clients`,
 * is ignored, so a repeated close of the same client is harmless.
 */
void NetconEthernetTap::closeClient(NetconClient *client)
{
	fprintf(stderr, "closeClient\n");
	if (!client)
		return;
	if (std::find(clients.begin(),clients.end(),client) == clients.end())
		return;
	// Unregister first so lookups and re-entrant closes no longer see it.
	clients.erase(std::remove(clients.begin(),clients.end(),client),clients.end());

	NetconConnection *temp_conn;
	closeConnection(client->rpc);
	// NOTE(review): closeConnection() calls client->removeConnection(); if
	// that shrinks `connections` this index loop skips entries, and if it
	// deletes the connection the delete below is a double free -- confirm
	// against NetconClient::removeConnection().
	for(size_t i=0; i<client->connections.size(); i++) {
		temp_conn = client->connections[i];
		closeConnection(client->connections[i]);
		delete temp_conn;
	}
	delete client;
}

/**
 * Close a connection's local socket and lwIP PCB and detach it from its
 * owning client. A NULL connection is ignored.
 */
void NetconEthernetTap::closeConnection(NetconConnection *conn)
{
	fprintf(stderr, "closeConnection\n");
	if (!conn)
		return;
	NetconClient *client = conn->owner;
	_phy.close(conn->sock);
	if (conn->pcb) // the RPC connection is never given a PCB in this file
		lwipstack->tcp_close(conn->pcb);
	if (client)
		client->removeConnection(conn->sock);
}

/**
 * Service thread: drives the lwIP TCP and ARP timers and polls Phy for
 * socket events until _run is cleared.
 */
void NetconEthernetTap::threadMain()
	throw()
{
	fprintf(stderr, "starting threadMain()\n");
	static ip_addr_t ipaddr, netmask, gw;
	char ip_str[16] = {0}, nm_str[16] = {0}, gw_str[16] = {0};
	IP4_ADDR(&gw, 192,168,0,1);
	IP4_ADDR(&netmask, 255,255,255,0);
	IP4_ADDR(&ipaddr, 192,168,0,2);
	strncpy(ip_str, lwipstack->ipaddr_ntoa(&ipaddr), sizeof(ip_str));
	strncpy(nm_str, lwipstack->ipaddr_ntoa(&netmask), sizeof(nm_str));
	strncpy(gw_str, lwipstack->ipaddr_ntoa(&gw), sizeof(gw_str));

	// NOTE(review): the TCP interval is derived from the ARP constant and the
	// ARP interval from the IP constant -- confirm these are the intended
	// periods.
	unsigned long tcp_time = ARP_TMR_INTERVAL / 5000;
	unsigned long etharp_time = IP_TMR_INTERVAL / 1000;
	unsigned long prev_tcp_time = 0;
	unsigned long prev_etharp_time = 0;
	unsigned long curr_time;
	unsigned long since_tcp;
	unsigned long since_etharp;
	struct timeval tv;

	while (_run) {
		gettimeofday(&tv, NULL);
		curr_time = (unsigned long)(tv.tv_sec) * 1000 + (unsigned long)(tv.tv_usec) / 1000;
		since_tcp = curr_time - prev_tcp_time;
		since_etharp = curr_time - prev_etharp_time;
		// NOTE(review): this is the time *since* the timers last ran, not the
		// time until they are next due, and on the first pass (prev_* == 0)
		// the product does not fit in an int -- confirm the intended timeout.
		int min_time = min(since_tcp, since_etharp) * 1000; // usec

		if(since_tcp > tcp_time) {
			prev_tcp_time = curr_time+1;
			lwipstack->tcp_tmr();
		}
		if(since_etharp > etharp_time) {
			prev_etharp_time = curr_time;
			lwipstack->etharp_tmr();
		}
		fprintf(stderr, "_run\n");
		_phy.poll(min_time / 1000); // conversion from usec to millisec, TODO: double check
	}

	// TODO: cleanup -- destroy LWIP state, kill any clients, unload .so, etc.
}

/**
 * Phy callback: one end of a socket pair was closed; close the matching
 * connection if the client and connection can be found.
 */
void NetconEthernetTap::phyOnSocketPairEndpointClose(PhySocket *sock, void **uptr)
{
	fprintf(stderr, "phyOnSocketPairEndpointClose\n");
	NetconClient *client = (NetconClient*)*uptr;
	if (!client)
		return;
	closeConnection(client->getConnection(sock));
}

/**
 * Phy callback: data is readable on a socket pair. Reads it into the
 * connection's buffer after any pending bytes and tries to push the buffer
 * into lwIP.
 */
void NetconEthernetTap::phyOnSocketPairEndpointData(PhySocket *sock, void **uptr, void *buf, unsigned long n)
{
	fprintf(stderr, "phyOnSocketPairEndpointData\n");
	NetconClient *client = (NetconClient*)*uptr;
	if (!client)
		return;
	NetconConnection *c = client->getConnection(sock);
	if(c) {
		if(c->idx < DEFAULT_READ_BUFFER_SIZE) {
			int r;
			// Append at byte offset idx. The former `(&c->buf)+c->idx` advanced
			// in whole-buffer strides and pointed outside the buffer.
			if((r = read(_phy.getDescriptor(c->sock), c->buf + c->idx, DEFAULT_READ_BUFFER_SIZE-(c->idx))) > 0) {
				c->idx += r;
				handle_write(c);
			}
		}
	}
}

/** Phy callback: socket pair endpoint became writable (currently unused). */
void NetconEthernetTap::phyOnSocketPairEndpointWritable(PhySocket *sock, void **uptr)
{
	//_phy.setNotifyWritable(sock, false);
}

// Unused -- no UDP or TCP from this thread/Phy<>
void NetconEthernetTap::phyOnDatagram(PhySocket *sock,void **uptr,const struct sockaddr *from,void *data,unsigned long len) {}
void NetconEthernetTap::phyOnTcpConnect(PhySocket *sock,void **uptr,bool success) {}
void NetconEthernetTap::phyOnTcpAccept(PhySocket *sockL,PhySocket *sockN,void **uptrL,void **uptrN,const struct sockaddr *from) {}
void NetconEthernetTap::phyOnTcpClose(PhySocket *sock,void **uptr) {}
void NetconEthernetTap::phyOnTcpData(PhySocket *sock,void **uptr,void *data,unsigned long len) {}
void NetconEthernetTap::phyOnTcpWritable(PhySocket *sock,void **uptr) {}

/**
 * Phy callback: an intercept connected to the unix socket. Creates a client
 * whose RPC connection is the accepted socket, stores it as that socket's
 * user pointer and registers it in `clients`.
 */
void NetconEthernetTap::phyOnUnixAccept(PhySocket *sockL,PhySocket *sockN,void **uptrL,void **uptrN)
{
	NetconClient *newClient = new NetconClient();
	// The RPC channel is the accepted socket itself; previously the socket's
	// (still unset) user pointer was passed instead and the client was never
	// stored anywhere, so every later callback saw no client.
	newClient->rpc = newClient->addConnection(RPC, sockN);
	*uptrN = newClient;
	clients.push_back(newClient);
}

/** Phy callback: the RPC unix socket closed; tear down its client. */
void NetconEthernetTap::phyOnUnixClose(PhySocket *sock,void **uptr)
{
	fprintf(stderr, "phyOnUnixClose\n");
	NetconClient *client = (NetconClient*)*uptr;
	*uptr = NULL; // the client is about to be destroyed
	closeClient(client);
}

/**
 * Phy callback: an RPC message arrived from an intercept. The first byte
 * selects the call; the call's argument struct follows it.
 */
void NetconEthernetTap::phyOnUnixData(PhySocket *sock,void **uptr,void *data,unsigned long len)
{
	unsigned char *buf = (unsigned char*)data;
	NetconClient *client = (NetconClient*)*uptr;
	if ((!client)||(len < 1))
		return;

	// NOTE(review): `len` is not checked against the size of each argument
	// struct before it is copied out of buf -- confirm the wire format and
	// add per-message length checks.
	switch(buf[0])
	{
		case RPC_SOCKET: {
			fprintf(stderr, "RPC_SOCKET\n");
			struct socket_st socket_rpc;
			memcpy(&socket_rpc, &buf[1], sizeof(struct socket_st));
			client->tid = socket_rpc.__tid;
			handle_socket(client, &socket_rpc);
		}	break;
		case RPC_LISTEN: {
			fprintf(stderr, "RPC_LISTEN\n");
			struct listen_st listen_rpc;
			memcpy(&listen_rpc, &buf[1], sizeof(struct listen_st));
			client->tid = listen_rpc.__tid;
			handle_listen(client, &listen_rpc);
		}	break;
		case RPC_BIND: {
			fprintf(stderr, "RPC_BIND\n");
			struct bind_st bind_rpc;
			memcpy(&bind_rpc, &buf[1], sizeof(struct bind_st));
			client->tid = bind_rpc.__tid;
			handle_bind(client, &bind_rpc);
		}	break;
		case RPC_KILL_INTERCEPT:
			fprintf(stderr, "RPC_KILL_INTERCEPT\n");
			*uptr = NULL; // do not leave the socket pointing at a deleted client
			closeClient(client);
			break;
		case RPC_CONNECT: {
			fprintf(stderr, "RPC_CONNECT\n");
			struct connect_st connect_rpc;
			memcpy(&connect_rpc, &buf[1], sizeof(struct connect_st));
			client->tid = connect_rpc.__tid;
			handle_connect(client, &connect_rpc);
		}	break;
		case RPC_FD_MAP_COMPLETION:
			fprintf(stderr, "RPC_FD_MAP_COMPLETION\n");
			handle_retval(client, buf);
			break;
		default:
			break;
	}
}

/** Phy callback: RPC unix socket became writable (unused). */
void NetconEthernetTap::phyOnUnixWritable(PhySocket *sock,void **uptr)
{
}

/**
 * Send the result of an RPC back to the intercept as RPC_RETVAL followed by
 * the raw bytes of retval.
 *
 * @return bytes written (> 0) on success; 0 if the client is not waiting for
 *         a value; <= 0 on write failure, in which case the client has been
 *         closed and must not be used again by the caller
 */
int NetconEthernetTap::send_return_value(NetconClient *client, int retval)
{
	fprintf(stderr, "send_return_value\n");
	if(!client->waiting_for_retval){
		fprintf(stderr, "intercept isn't waiting for return value. Why are we here?\n");
		return 0;
	}
	// One tag byte plus the whole int. The buffer used to be 4 bytes, so the
	// memcpy below wrote one byte past its end.
	// NOTE(review): the message is now 1+sizeof(int) bytes on the wire --
	// confirm the intercept reads that many.
	char retmsg[1 + sizeof(retval)];
	memset(retmsg, '\0', sizeof(retmsg));
	retmsg[0]=RPC_RETVAL;
	memcpy(&retmsg[1], &retval, sizeof(retval));
	int n = write(_phy.getDescriptor(client->rpc->sock), retmsg, sizeof(retmsg));

	if(n > 0) {
		// signal that we've satisfied this requirement
		client->waiting_for_retval = false;
	}
	else {
		fprintf(stderr, "unable to send return value to the intercept\n");
		closeClient(client);
	}
	return n;
}

/*------------------------------------------------------------------------------
--------------------------------- LWIP callbacks -------------------------------
------------------------------------------------------------------------------*/

/** lwIP poll callback: retry flushing the connection's pending buffer. */
err_t NetconEthernetTap::nc_poll(void* arg, struct tcp_pcb *tpcb)
{
	fprintf(stderr, "nc_poll\n");
	Larg *l = (Larg*)arg;
	NetconEthernetTap *tap = l->tap;
	NetconConnection *c = tap->getConnectionByPCB(tpcb);
	if(c)
		tap->handle_write(c);
	return ERR_OK;
}

/** lwIP accept callback (not implemented yet). */
err_t NetconEthernetTap::nc_accept(void *arg, struct tcp_pcb *newpcb, err_t err)
{
	fprintf(stderr, "nc_accept\n");
	return ERR_OK;
}

/**
 * lwIP receive callback: forward received pbufs to the connection's local
 * socket. A NULL pbuf closes the connection.
 */
err_t NetconEthernetTap::nc_recved(void *arg, struct tcp_pcb *tpcb, struct pbuf *p, err_t err)
{
	fprintf(stderr, "nc_recved\n");
	Larg *l = (Larg*)arg;
	NetconEthernetTap *tap = l->tap;
	NetconConnection *c = tap->getConnectionByPCB(tpcb);

	// Check for a missing connection before touching it (c->sock used to be
	// read first).
	if(!c) {
		// Nobody will consume the data; release it so it is not leaked.
		if(p != NULL)
			tap->lwipstack->pbuf_free(p);
		return ERR_OK; // ?
	}

	int our_fd = tap->_phy.getDescriptor(c->sock);

	if(p == NULL) {
		nc_close(tpcb);
		// NOTE(review): closeConnection() also closes c->sock through Phy, so
		// this descriptor may be closed twice -- confirm and drop one.
		close(our_fd); // TODO: Check logic
		tap->closeConnection(c);
		return err;
	}

	struct pbuf *q = p; // head of the chain, freed once after the walk
	int n;
	while(p != NULL) { // Cycle through pbufs and write them to the socket
		if(p->len <= 0)
			break; // ?
		if((n = write(our_fd, p->payload, p->len)) > 0) {
			if(n < p->len) {
				fprintf(stderr, "ERROR: unable to write entire pbuf to buffer\n");
				//tap->_phy.setNotifyWritable(l->sock, true);
			}
			tap->lwipstack->tcp_recved(tpcb, n);
		}
		else {
			fprintf(stderr, "Error: No data written to intercept buffer\n");
		}
		p = p->next;
	}
	tap->lwipstack->pbuf_free(q); // free pbufs
	return ERR_OK;
}

/** lwIP error callback: close the connection tied to this callback arg. */
void NetconEthernetTap::nc_err(void *arg, err_t err)
{
	fprintf(stderr, "nc_err\n");
	Larg *l = (Larg*)arg;
	NetconEthernetTap *tap = l->tap;
	NetconConnection *c = tap->getConnectionByThisFD(tap->_phy.getDescriptor(l->sock));
	if(c) {
		tap->closeConnection(c);
	}
	else {
		fprintf(stderr, "can't locate connection object for PCB\n");
	}
}

/** Placeholder for PCB teardown; the actual teardown is commented out. */
void NetconEthernetTap::nc_close(struct tcp_pcb* tpcb)
{
	fprintf(stderr, "nc_close\n");
	//closeConnection(getConnectionByPCB(tpcb));
	/*
	lwipstack->tcp_arg(tpcb, NULL);
	lwipstack->tcp_sent(tpcb, NULL);
	lwipstack->tcp_recv(tpcb, NULL);
	lwipstack->tcp_err(tpcb, NULL);
	lwipstack->tcp_poll(tpcb, NULL, 0);
	lwipstack->tcp_close(tpcb);
	*/
}

/** Placeholder send hook; does nothing yet. */
err_t NetconEthernetTap::nc_send(struct tcp_pcb *tpcb)
{
	fprintf(stderr, "nc_send\n");
	return ERR_OK;
}

/** lwIP sent callback: data was acknowledged; nothing to do yet. */
err_t NetconEthernetTap::nc_sent(void* arg, struct tcp_pcb *tpcb, u16_t len)
{
	fprintf(stderr, "nc_sent\n");
	// The return value is an error code, not a byte count: returning `len`
	// could be read by lwIP as an arbitrary (possibly fatal) err_t.
	return ERR_OK;
}

/**
 * lwIP connected callback: report the connect() result to every client that
 * owns this PCB.
 */
err_t NetconEthernetTap::nc_connected(void *arg, struct tcp_pcb *tpcb, err_t err)
{
	fprintf(stderr, "nc_connected\n");
	Larg *l = (Larg*)arg;
	NetconEthernetTap *tap = l->tap;
	for(size_t i=0; i<tap->clients.size(); i++) {
		if(tap->clients[i]->containsPCB(tpcb)) {
			tap->send_return_value(tap->clients[i],err);
		}
	}
	return err;
}

/*------------------------------------------------------------------------------
----------------------------- RPC Handler functions ----------------------------
------------------------------------------------------------------------------*/

/**
 * RPC bind(): bind the connection's PCB to the requested port.
 * The address in the request is currently ignored in favor of 192.168.0.2.
 */
void NetconEthernetTap::handle_bind(NetconClient *client, struct bind_st *bind_rpc)
{
	// FIXME: Is this hack still needed?
	struct sockaddr_in *connaddr;
	connaddr = (struct sockaddr_in *) &bind_rpc->addr;
	int conn_port = lwipstack->ntohs(connaddr->sin_port);
	ip_addr_t conn_addr;
	IP4_ADDR(&conn_addr, 192,168,0,2);

	/*
	int ip = connaddr->sin_addr.s_addr;
	unsigned char bytes[4];
	bytes[0] = ip & 0xFF;
	bytes[1] = (ip >> 8) & 0xFF;
	bytes[2] = (ip >> 16) & 0xFF;
	bytes[3] = (ip >> 24) & 0xFF;
	"binding to: %d.%d.%d.%d", bytes[0], bytes[1], bytes[2], bytes[3]
	*/

	NetconConnection *c = client->getConnectionByTheirFD(bind_rpc->sockfd);
	if(c) {
		if(c->pcb->state == CLOSED){
			int err = lwipstack->tcp_bind(c->pcb, &conn_addr, conn_port);
			if(err != ERR_OK) {
				fprintf(stderr, "error while binding to addr/port\n");
			}
			else {
				fprintf(stderr, "bind successful\n");
			}
		}
		else {
			fprintf(stderr, "PCB not in CLOSED state. Ignoring BIND request.\n");
		}
	}
	else {
		fprintf(stderr, "can't locate connection for PCB\n");
	}
}

/**
 * RPC listen(): switch the connection's PCB to the listening state and
 * install the accept callback.
 */
void NetconEthernetTap::handle_listen(NetconClient *client, struct listen_st *listen_rpc)
{
	NetconConnection *c = client->getConnectionByTheirFD(listen_rpc->sockfd);
	if(c) {
		if(c->pcb->state == LISTEN) {
			fprintf(stderr, "PCB is already in listening state.\n");
			return;
		}
		struct tcp_pcb* listening_pcb = lwipstack->tcp_listen(c->pcb);
		if(listening_pcb != NULL) {
			c->pcb = listening_pcb;
			lwipstack->tcp_accept(listening_pcb, nc_accept);
			// NOTE(review): this Larg is never freed in this file.
			lwipstack->tcp_arg(listening_pcb, new Larg(this, c->sock));
			client->waiting_for_retval=true;
		}
		else {
			fprintf(stderr, "unable to allocate memory for new listening PCB\n");
		}
	}
	else {
		fprintf(stderr, "can't locate connection for PCB\n");
	}
}

/**
 * RPC fd-map completion: record the intercept-side descriptor for the
 * connection created by the last handle_socket().
 */
void NetconEthernetTap::handle_retval(NetconClient *client, unsigned char* buf)
{
	if(client->unmapped_conn != NULL) {
		memcpy(&(client->unmapped_conn->their_fd), &buf[1], sizeof(int));
		client->unmapped_conn = NULL;
	}
}

/**
 * RPC socket(): create a PCB and a socket pair for a new connection and pass
 * the remote end's descriptor to the intercept over the RPC channel.
 */
void NetconEthernetTap::handle_socket(NetconClient *client, struct socket_st* socket_rpc)
{
	struct tcp_pcb *pcb = lwipstack->tcp_new();
	if(pcb != NULL) {
		// Receives the remote end's descriptor from createSocketPair(); this
		// used to be a dereferenced null pointer.
		int their_fd = -1;
		NetconConnection *new_conn = client->addConnection(BUFFER, _phy.createSocketPair(their_fd, client));
		new_conn->their_fd = their_fd;
		new_conn->pcb = pcb;
		sock_fd_write(_phy.getDescriptor(client->rpc->sock), their_fd);
		client->unmapped_conn = new_conn;
	}
	else {
		fprintf(stderr, "Memory not available for new PCB\n");
	}
}

/**
 * RPC connect(): install the lwIP callbacks on the connection's PCB and
 * start connecting. The final result normally arrives in nc_connected() or
 * nc_err(); only an immediate failure is reported from here.
 */
void NetconEthernetTap::handle_connect(NetconClient *client, struct connect_st* connect_rpc)
{
	// FIXME: Parse out address information -- Probably a more elegant way to do this
	struct sockaddr_in *connaddr;
	connaddr = (struct sockaddr_in *) &connect_rpc->__addr;
	int conn_port = lwipstack->ntohs(connaddr->sin_port);
	ip_addr_t conn_addr = convert_ip((struct sockaddr_in *)&connect_rpc->__addr);

	NetconConnection *c = client->getConnectionByTheirFD(connect_rpc->__fd);

	if(c!= NULL) {
		lwipstack->tcp_sent(c->pcb, NetconEthernetTap::nc_sent); // FIXME: Move?
		lwipstack->tcp_recv(c->pcb, nc_recved);
		lwipstack->tcp_err(c->pcb, nc_err);
		lwipstack->tcp_poll(c->pcb, nc_poll, APPLICATION_POLL_FREQ);
		// NOTE(review): this Larg is never freed in this file.
		lwipstack->tcp_arg(c->pcb, new Larg(this, c->sock));

		// The intercept is waiting from this point on. The flag must be set
		// before any send_return_value() call, which refuses to send while it
		// is clear.
		client->waiting_for_retval=true;

		int err = 0;
		if((err = lwipstack->tcp_connect(c->pcb,&conn_addr,conn_port, nc_connected)) < 0)
		{
			// dwr(h->tid, "tcp_connect() = %s\n", lwiperror(err));
			// We should only return a value if failure happens immediately
			// Otherwise, we still need to wait for a callback from lwIP.
			// - This is because an ERR_OK from tcp_connect() only verifies
			//   that the SYN packet was enqueued onto the stack properly,
			//   that's it!
			// - Most instances of a retval for a connect() should happen
			//   in the nc_connected() and nc_err() callbacks!
			send_return_value(client, err);
			// send_return_value() may have closed (deleted) the client, so it
			// must not be touched after this point.
			return;
		}
		// Everything seems to be ok, but we don't have enough info to retval
	}
	else {
		fprintf(stderr, "could not locate PCB based on their fd\n");
	}
}

/**
 * Push as much of the connection's pending buffer into lwIP as the PCB's
 * send buffer allows, then shift any remainder to the front of the buffer.
 * Does nothing while the send buffer is at least 90% full.
 */
void NetconEthernetTap::handle_write(NetconConnection *c)
{
	if(c) {
		int sndbuf = c->pcb->snd_buf;
		float avail = (float)sndbuf;
		float max = (float)TCP_SND_BUF;
		float load = 1.0 - (avail / max);

		if(load >= 0.9) {
			return;
		}

		int write_allowance = sndbuf < c->idx ? sndbuf : c->idx;
		int sz;

		if(write_allowance > 0) {
			int err = lwipstack->tcp_write(c->pcb, c->buf, write_allowance, TCP_WRITE_FLAG_COPY);
			if(err != ERR_OK) {
				fprintf(stderr, "error while writing to PCB\n");
				return;
			}
			else {
				sz = (c->idx)-write_allowance;
				if(sz) {
					memmove(c->buf, (c->buf+write_allowance), sz);
				}
				c->idx -= write_allowance;
				//c->data_sent += write_allowance;
				return;
			}
		}
		else {
			fprintf(stderr, "lwIP stack full\n");
			return;
		}
	}
	else {
		fprintf(stderr, "could not locate connection for this fd\n");
	}
}

} // namespace ZeroTier

#endif // ZT_ENABLE_NETCON