You've already forked mariadb-columnstore-engine
							
							
				mirror of
				https://github.com/mariadb-corporation/mariadb-columnstore-engine.git
				synced 2025-11-03 17:13:17 +03:00 
			
		
		
		
	
		
			
				
	
	
		
			1041 lines
		
	
	
		
			25 KiB
		
	
	
	
		
			C++
		
	
	
	
	
	
			
		
		
	
	
			1041 lines
		
	
	
		
			25 KiB
		
	
	
	
		
			C++
		
	
	
	
	
	
/* Copyright (C) 2014 InfiniDB, Inc.
 | 
						|
 | 
						|
   This program is free software; you can redistribute it and/or
 | 
						|
   modify it under the terms of the GNU General Public License
 | 
						|
   as published by the Free Software Foundation; version 2 of
 | 
						|
   the License.
 | 
						|
 | 
						|
   This program is distributed in the hope that it will be useful,
 | 
						|
   but WITHOUT ANY WARRANTY; without even the implied warranty of
 | 
						|
   MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the
 | 
						|
   GNU General Public License for more details.
 | 
						|
 | 
						|
   You should have received a copy of the GNU General Public License
 | 
						|
   along with this program; if not, write to the Free Software
 | 
						|
   Foundation, Inc., 51 Franklin Street, Fifth Floor, Boston,
 | 
						|
   MA 02110-1301, USA. */
 | 
						|
 | 
						|
/*
 | 
						|
  Copyright (c) 2007 Alexander Eremin <netwhistler@gmail.com>
 | 
						|
All rights reserved.
 | 
						|
 | 
						|
Redistribution and use in source and binary forms, with or without
 | 
						|
modification, are permitted provided that the following conditions are met:
 | 
						|
 | 
						|
1. Redistributions of source code must retain the above copyright notice, this
 | 
						|
   list of conditions and the following disclaimer.
 | 
						|
2. Redistributions in binary form must reproduce the above copyright notice,
 | 
						|
   this list of conditions and the following disclaimer in the documentation
 | 
						|
   and/or other materials provided with the distribution.
 | 
						|
 | 
						|
THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND CONTRIBUTORS "AS IS" AND
 | 
						|
ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE IMPLIED
 | 
						|
WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE ARE
 | 
						|
DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT OWNER OR CONTRIBUTORS BE LIABLE FOR
 | 
						|
ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL DAMAGES
 | 
						|
(INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES;
 | 
						|
LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION) HOWEVER CAUSED AND
 | 
						|
ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT
 | 
						|
(INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE OF THIS
 | 
						|
SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
 | 
						|
 | 
						|
The views and conclusions contained in the software and documentation are those
 | 
						|
of the authors and should not be interpreted as representing official policies,
 | 
						|
either expressed or implied, of the FreeBSD Project.
 | 
						|
*/
 | 
						|
 | 
						|
#include "mcsconfig.h"
 | 
						|
 | 
						|
#include <cstdio>
 | 
						|
#include <cerrno>
 | 
						|
#if __FreeBSD__
 | 
						|
#include <sys/types.h>
 | 
						|
#include <netinet/in.h>
 | 
						|
#include <netinet/ip.h>
 | 
						|
#endif
 | 
						|
#include <sys/socket.h>
 | 
						|
#include <poll.h>
 | 
						|
#include <netinet/in.h>
 | 
						|
#include <netinet/ip_icmp.h>
 | 
						|
#include <arpa/inet.h>
 | 
						|
#include <netinet/tcp.h>
 | 
						|
#include <fcntl.h>
 | 
						|
#include <sys/ioctl.h>
 | 
						|
#include <sys/types.h>
 | 
						|
#include <sys/time.h>
 | 
						|
#include <cstring>
 | 
						|
 | 
						|
#include <stdexcept>
 | 
						|
#include <string>
 | 
						|
#include <sstream>
 | 
						|
using namespace std;
 | 
						|
 | 
						|
#include <boost/scoped_array.hpp>
 | 
						|
using boost::scoped_array;
 | 
						|
 | 
						|
#define INETSTREAMSOCKET_DLLEXPORT
 | 
						|
#include "inetstreamsocket.h"
 | 
						|
#undef INETSTREAMSOCKET_DLLEXPORT
 | 
						|
#include "bytestream.h"
 | 
						|
#include "iosocket.h"
 | 
						|
#include "socketparms.h"
 | 
						|
#include "socketclosed.h"
 | 
						|
#include "logger.h"
 | 
						|
#include "loggingid.h"
 | 
						|
#include "idbcompress.h"
 | 
						|
#include "rowgroup.h"
 | 
						|
 | 
						|
// some static functions
 | 
						|
namespace
 | 
						|
{
 | 
						|
// @bug 2441 - Retry after 512 read() error.
 | 
						|
// ERESTARTSYS (512) is a kernal I/O errno that is similar to a EINTR, except
 | 
						|
// that it is not supposed to "leak" out into the user space.   But we are
 | 
						|
// sometimes seeing "unknown error 512" error msgs in response to calls to
 | 
						|
// read(), so adding logic to retry after ERESTARTSYS the way we do for EINTR.
 | 
						|
// const int KERR_ERESTARTSYS = 512;
 | 
						|
 | 
						|
int in_cksum(unsigned short* buf, int sz)
 | 
						|
{
 | 
						|
  int nleft = sz;
 | 
						|
  int sum = 0;
 | 
						|
  unsigned short* w = buf;
 | 
						|
  unsigned short ans = 0;
 | 
						|
 | 
						|
  while (nleft > 1)
 | 
						|
  {
 | 
						|
    sum += *w++;
 | 
						|
    nleft -= 2;
 | 
						|
  }
 | 
						|
 | 
						|
  if (nleft == 1)
 | 
						|
  {
 | 
						|
    *(unsigned char*)(&ans) = *(unsigned char*)w;
 | 
						|
    sum += ans;
 | 
						|
  }
 | 
						|
 | 
						|
  sum = (sum >> 16) + (sum & 0xFFFF);
 | 
						|
  sum += (sum >> 16);
 | 
						|
  ans = ~sum;
 | 
						|
  return ans;
 | 
						|
}
 | 
						|
 | 
						|
}  // namespace
 | 
						|
 | 
						|
namespace messageqcpp
 | 
						|
{
 | 
						|
InetStreamSocket::InetStreamSocket(size_t blocksize)
 | 
						|
 : fSocketParms(PF_INET, SOCK_STREAM, IPPROTO_TCP), fBlocksize(blocksize), fSyncProto(true), fMagicBuffer(0)
 | 
						|
{
 | 
						|
  memset(&fSa, 0, sizeof(fSa));
 | 
						|
  fConnectionTimeout.tv_sec = 20;
 | 
						|
  fConnectionTimeout.tv_nsec = 0;
 | 
						|
}
 | 
						|
 | 
						|
InetStreamSocket::~InetStreamSocket() = default;
 | 
						|
 | 
						|
void InetStreamSocket::open()
 | 
						|
{
 | 
						|
  int bufferSize;
 | 
						|
  int ret;
 | 
						|
  socklen_t bufferSizeSize;
 | 
						|
 | 
						|
  if (isOpen())
 | 
						|
    throw logic_error("InetStreamSocket::open: socket is already open");
 | 
						|
 | 
						|
  int sd;
 | 
						|
  sd = ::socket(fSocketParms.domain(), fSocketParms.type(), fSocketParms.protocol());
 | 
						|
  int e = errno;
 | 
						|
 | 
						|
  if (sd < 0)
 | 
						|
  {
 | 
						|
    string msg = "InetStreamSocket::open: socket() error: ";
 | 
						|
    scoped_array<char> buf(new char[80]);
 | 
						|
#if STRERROR_R_CHAR_P
 | 
						|
    const char* p;
 | 
						|
 | 
						|
    if ((p = strerror_r(e, buf.get(), 80)) != 0)
 | 
						|
      msg += p;
 | 
						|
 | 
						|
#else
 | 
						|
    int p;
 | 
						|
 | 
						|
    if ((p = strerror_r(e, buf.get(), 80)) == 0)
 | 
						|
      msg += buf.get();
 | 
						|
 | 
						|
#endif
 | 
						|
    throw runtime_error(msg);
 | 
						|
  }
 | 
						|
 | 
						|
  /*  XXXPAT:  If we have latency problems again, try these...
 | 
						|
      bufferSizeSize = 4;
 | 
						|
      bufferSize = 512000;
 | 
						|
      setsockopt(sd, SOL_SOCKET, SO_SNDBUF, &bufferSize, bufferSizeSize);
 | 
						|
      bufferSize = 512000;
 | 
						|
      setsockopt(sd, SOL_SOCKET, SO_RCVBUF, &bufferSize, bufferSizeSize);
 | 
						|
      bufferSize = 1;
 | 
						|
      setsockopt(sd, SOL_SOCKET, SO_RCVLOWAT, &bufferSize, bufferSizeSize);
 | 
						|
      setsockopt(sd, SOL_SOCKET, SO_SNDLOWAT, &bufferSize, bufferSizeSize);
 | 
						|
  */
 | 
						|
  bufferSize = 1;
 | 
						|
  bufferSizeSize = 4;
 | 
						|
  ret = setsockopt(sd, IPPROTO_TCP, TCP_NODELAY, (const char*)&bufferSize, bufferSizeSize);
 | 
						|
 | 
						|
  if (ret < 0)
 | 
						|
  {
 | 
						|
    perror("setsockopt");
 | 
						|
    exit(1);
 | 
						|
  }
 | 
						|
 | 
						|
  bufferSize = 1;
 | 
						|
  ret = setsockopt(sd, SOL_SOCKET, SO_REUSEADDR, (const char*)&bufferSize, bufferSizeSize);
 | 
						|
 | 
						|
  if (ret < 0)
 | 
						|
  {
 | 
						|
    perror("setsockopt");
 | 
						|
    exit(1);
 | 
						|
  }
 | 
						|
 | 
						|
  fSocketParms.sd(sd);
 | 
						|
}
 | 
						|
 | 
						|
void InetStreamSocket::close()
 | 
						|
{
 | 
						|
  if (isOpen())
 | 
						|
  {
 | 
						|
    ::shutdown(fSocketParms.sd(), SHUT_RDWR);
 | 
						|
    ::close(fSocketParms.sd());
 | 
						|
    fSocketParms.sd(-1);
 | 
						|
  }
 | 
						|
}
 | 
						|
 | 
						|
// needs to be in sync with clone()
 | 
						|
void InetStreamSocket::doCopy(const InetStreamSocket& rhs)
 | 
						|
{
 | 
						|
  fBlocksize = rhs.fBlocksize;
 | 
						|
  fSocketParms = rhs.fSocketParms;
 | 
						|
  fSa = rhs.fSa;
 | 
						|
  fConnectionTimeout = rhs.fConnectionTimeout;
 | 
						|
  fSyncProto = rhs.fSyncProto;
 | 
						|
}
 | 
						|
 | 
						|
// needs to be in sync with doCopy()
 | 
						|
Socket* InetStreamSocket::clone() const
 | 
						|
{
 | 
						|
  InetStreamSocket* iss = new InetStreamSocket(fBlocksize);
 | 
						|
  iss->fSocketParms = fSocketParms;
 | 
						|
  iss->fSa = fSa;
 | 
						|
  iss->fConnectionTimeout = fConnectionTimeout;
 | 
						|
  iss->fSyncProto = fSyncProto;
 | 
						|
  return iss;
 | 
						|
}
 | 
						|
 | 
						|
InetStreamSocket::InetStreamSocket(const InetStreamSocket& rhs)
 | 
						|
{
 | 
						|
  doCopy(rhs);
 | 
						|
}
 | 
						|
 | 
						|
InetStreamSocket& InetStreamSocket::operator=(const InetStreamSocket& rhs)
 | 
						|
{
 | 
						|
  if (this != &rhs)
 | 
						|
    doCopy(rhs);
 | 
						|
 | 
						|
  return *this;
 | 
						|
}
 | 
						|
 | 
						|
/* The caller needs to know when/if the remote closes the connection or sends data.
 | 
						|
 * Returns 0 on timeout, 1 if there is data to read, 2 if the connection was dropped.
 | 
						|
 */
 | 
						|
int InetStreamSocket::pollConnection(int connectionNum, long msecs)
 | 
						|
{
 | 
						|
  struct pollfd pfd[1];
 | 
						|
  int err;
 | 
						|
 | 
						|
retry:
 | 
						|
  memset(&pfd, 0, sizeof(struct pollfd));
 | 
						|
  pfd[0].fd = connectionNum;
 | 
						|
  pfd[0].events = POLLIN;
 | 
						|
  err = poll(pfd, 1, msecs);
 | 
						|
 | 
						|
  if (err < 0)
 | 
						|
  {
 | 
						|
    int e = errno;
 | 
						|
 | 
						|
    if (e == EINTR || e == KERR_ERESTARTSYS)
 | 
						|
      goto retry;
 | 
						|
  }
 | 
						|
 | 
						|
  // Linux doesn't set POLLHUP, need add'l check for data or EOF
 | 
						|
  if (pfd[0].revents & POLLIN)
 | 
						|
  {
 | 
						|
    char buf;
 | 
						|
    err = ::recv(connectionNum, &buf, 1, MSG_PEEK);
 | 
						|
 | 
						|
    if (err == 0)
 | 
						|
      return 2;
 | 
						|
    else if (err == 1)  // there is in fact data to read
 | 
						|
      return 1;
 | 
						|
    else
 | 
						|
      return 3;
 | 
						|
  }
 | 
						|
 | 
						|
  if (err == 0)  // timeout
 | 
						|
    return 0;
 | 
						|
 | 
						|
  return 3;  // catch-all error code
 | 
						|
}
 | 
						|
 | 
						|
/* returns true when the next thing in the stream is the beginning of a new
 | 
						|
ByteStream object. */
 | 
						|
bool InetStreamSocket::readToMagic(long msecs, bool* isTimeOut, Stats* stats) const
 | 
						|
{
 | 
						|
  int err;
 | 
						|
  struct pollfd pfd[1];
 | 
						|
  uint8_t* magicBuffer8;
 | 
						|
 | 
						|
  fMagicBuffer = 0;
 | 
						|
  magicBuffer8 = reinterpret_cast<uint8_t*>(&fMagicBuffer);
 | 
						|
  pfd[0].fd = fSocketParms.sd();
 | 
						|
  pfd[0].events = POLLIN;
 | 
						|
 | 
						|
  while ((fMagicBuffer != BYTESTREAM_MAGIC) && (fMagicBuffer != COMPRESSED_BYTESTREAM_MAGIC))
 | 
						|
  {
 | 
						|
    if (msecs >= 0)
 | 
						|
    {
 | 
						|
      pfd[0].revents = 0;
 | 
						|
 | 
						|
      err = poll(pfd, 1, msecs);
 | 
						|
 | 
						|
      if (err < 0)
 | 
						|
      {
 | 
						|
        int e = errno;
 | 
						|
 | 
						|
        if (e == EINTR)
 | 
						|
        {
 | 
						|
          continue;
 | 
						|
        }
 | 
						|
 | 
						|
        if (e == KERR_ERESTARTSYS)
 | 
						|
        {
 | 
						|
          logIoError("InetStreamSocket::readToMagic(): I/O error1", e);
 | 
						|
          continue;
 | 
						|
        }
 | 
						|
 | 
						|
        ostringstream oss;
 | 
						|
        oss << "InetStreamSocket::readToMagic(): I/O error1: " << strerror(e);
 | 
						|
        throw runtime_error(oss.str());
 | 
						|
      }
 | 
						|
 | 
						|
      if (pfd[0].revents & (POLLHUP | POLLNVAL | POLLERR))
 | 
						|
      {
 | 
						|
        ostringstream oss;
 | 
						|
        oss << "InetStreamSocket::readToMagic(): I/O error1: rc-" << err << "; poll signal interrupt ( ";
 | 
						|
 | 
						|
        if (pfd[0].revents & POLLHUP)
 | 
						|
          oss << "POLLHUP ";
 | 
						|
 | 
						|
        if (pfd[0].revents & POLLNVAL)
 | 
						|
          oss << "POLLNVAL ";
 | 
						|
 | 
						|
        if (pfd[0].revents & POLLERR)
 | 
						|
          oss << "POLLERR ";
 | 
						|
 | 
						|
        oss << ")";
 | 
						|
        throw runtime_error(oss.str());
 | 
						|
      }
 | 
						|
 | 
						|
      if (err == 0)  // timeout
 | 
						|
      {
 | 
						|
        if (isTimeOut)
 | 
						|
          *isTimeOut = true;
 | 
						|
 | 
						|
        return false;
 | 
						|
      }
 | 
						|
    }
 | 
						|
 | 
						|
    fMagicBuffer = fMagicBuffer >> 8;
 | 
						|
  retry:
 | 
						|
    err = ::read(fSocketParms.sd(), &magicBuffer8[3], 1);
 | 
						|
 | 
						|
    if (err < 0)
 | 
						|
    {
 | 
						|
      int e = errno;
 | 
						|
 | 
						|
      if (e == EINTR)
 | 
						|
      {
 | 
						|
        goto retry;
 | 
						|
      }
 | 
						|
 | 
						|
      if (e == KERR_ERESTARTSYS)
 | 
						|
      {
 | 
						|
        logIoError("InetStreamSocket::readToMagic(): I/O error2.0", e);
 | 
						|
        goto retry;
 | 
						|
      }
 | 
						|
 | 
						|
      ostringstream oss;
 | 
						|
      oss << "InetStreamSocket::readToMagic(): I/O error2.1: " << "err = " << err << " e = " << e << ": "
 | 
						|
          << strerror(e);
 | 
						|
      throw runtime_error(oss.str());
 | 
						|
    }
 | 
						|
 | 
						|
    // EOF. If no timeout was specified, ByteStream() gets returned to the caller.
 | 
						|
    // If one was, throw SocketClosed.
 | 
						|
    if (err == 0)  // EOF. if a timeout was specified, ByteStream()
 | 
						|
    {
 | 
						|
      if (msecs < 0)
 | 
						|
        return false;
 | 
						|
      else
 | 
						|
        throw SocketClosed("InetStreamSocket::readToMagic: Remote is closed");
 | 
						|
    }
 | 
						|
 | 
						|
    if (stats)
 | 
						|
      stats->dataRecvd(1);
 | 
						|
  }
 | 
						|
 | 
						|
  return true;
 | 
						|
}
 | 
						|
 | 
						|
bool InetStreamSocket::readFixedSizeData(struct pollfd* pfd, uint8_t* buffer, size_t numberOfBytes,
 | 
						|
                                         const struct ::timespec* timeout, bool* isTimeOut, Stats* stats,
 | 
						|
                                         int64_t msecs) const
 | 
						|
{
 | 
						|
  size_t bytesRead = 0;
 | 
						|
  while (bytesRead < numberOfBytes)
 | 
						|
  {
 | 
						|
    ssize_t currentBytesRead;
 | 
						|
    int err;
 | 
						|
 | 
						|
    if (timeout != nullptr)
 | 
						|
    {
 | 
						|
      pfd[0].revents = 0;
 | 
						|
      err = poll(pfd, 1, msecs);
 | 
						|
 | 
						|
      if (err < 0 || pfd[0].revents & (POLLERR | POLLHUP | POLLNVAL))
 | 
						|
      {
 | 
						|
        ostringstream oss;
 | 
						|
        oss << "InetStreamSocket::read: I/O error1: " << strerror(errno);
 | 
						|
        throw runtime_error(oss.str());
 | 
						|
      }
 | 
						|
 | 
						|
      if (err == 0)  // timeout
 | 
						|
      {
 | 
						|
        if (isTimeOut)
 | 
						|
          *isTimeOut = true;
 | 
						|
 | 
						|
        logIoError("InetStreamSocket::read: timeout during first poll", 0);
 | 
						|
        return false;
 | 
						|
      }
 | 
						|
    }
 | 
						|
 | 
						|
    currentBytesRead = ::read(fSocketParms.sd(), buffer + bytesRead, numberOfBytes - bytesRead);
 | 
						|
 | 
						|
    if (currentBytesRead == 0)
 | 
						|
    {
 | 
						|
      if (timeout == nullptr)
 | 
						|
      {
 | 
						|
        logIoError("InetStreamSocket::read: timeout during first read", 0);
 | 
						|
        return false;
 | 
						|
      }
 | 
						|
      else
 | 
						|
        throw SocketClosed("InetStreamSocket::read: Remote is closed");
 | 
						|
    }
 | 
						|
 | 
						|
    if (currentBytesRead < 0)
 | 
						|
    {
 | 
						|
      err = errno;
 | 
						|
 | 
						|
      if (err == EINTR)
 | 
						|
        continue;
 | 
						|
 | 
						|
      if (err == KERR_ERESTARTSYS)
 | 
						|
      {
 | 
						|
        logIoError("InetStreamSocket::read: I/O error2", err);
 | 
						|
        continue;
 | 
						|
      }
 | 
						|
 | 
						|
      ostringstream oss;
 | 
						|
      oss << "InetStreamSocket::read: I/O error2: " << strerror(err);
 | 
						|
      throw runtime_error(oss.str());
 | 
						|
    }
 | 
						|
 | 
						|
    bytesRead += currentBytesRead;
 | 
						|
  }
 | 
						|
 | 
						|
  if (stats)
 | 
						|
    stats->dataRecvd(bytesRead);
 | 
						|
 | 
						|
  return true;
 | 
						|
}
 | 
						|
 | 
						|
const SBS InetStreamSocket::read(const struct ::timespec* timeout, bool* isTimeOut, Stats* stats) const
 | 
						|
{
 | 
						|
  int64_t msecs = -1;
 | 
						|
 | 
						|
  struct pollfd pfd[1];
 | 
						|
  pfd[0].fd = fSocketParms.sd();
 | 
						|
  pfd[0].events = POLLIN;
 | 
						|
 | 
						|
  if (timeout != nullptr)
 | 
						|
    msecs = timeout->tv_sec * 1000 + timeout->tv_nsec / 1000000;
 | 
						|
 | 
						|
  if (readToMagic(msecs, isTimeOut, stats) == false)  // indicates a timeout or EOF
 | 
						|
  {
 | 
						|
    // MCOL-480 The connector calls with timeout in a loop so that
 | 
						|
    // it can check a killed flag. This means that for a long running query,
 | 
						|
    // the following fills the warning log.
 | 
						|
    //		if (isTimeOut && *isTimeOut)
 | 
						|
    //		{
 | 
						|
    //			logIoError("InetStreamSocket::read: timeout during readToMagic", 0);
 | 
						|
    //		}
 | 
						|
    return SBS(new ByteStream(0U));
 | 
						|
  }
 | 
						|
 | 
						|
  // we need to read the 4-byte message length first.
 | 
						|
  uint32_t msglen;
 | 
						|
  if (!readFixedSizeData(pfd, reinterpret_cast<uint8_t*>(&msglen), sizeof(msglen), timeout, isTimeOut, stats,
 | 
						|
                         msecs))
 | 
						|
    return SBS(new ByteStream(0U));
 | 
						|
 | 
						|
  // Read the number of the `long strings` that are deprecated, so it should be 0
 | 
						|
  uint32_t longStringSize;
 | 
						|
  if (!readFixedSizeData(pfd, reinterpret_cast<uint8_t*>(&longStringSize), sizeof(longStringSize), timeout,
 | 
						|
                         isTimeOut, stats, msecs))
 | 
						|
    return SBS(new ByteStream(0U));
 | 
						|
  idbassert(longStringSize == 0);
 | 
						|
 | 
						|
  // Read the actual data of the `ByteStream`.
 | 
						|
  SBS res(new ByteStream(msglen));
 | 
						|
  if (!readFixedSizeData(pfd, res->getInputPtr(), msglen, timeout, isTimeOut, stats, msecs))
 | 
						|
    return SBS(new ByteStream(0U));
 | 
						|
  res->advanceInputPtr(msglen);
 | 
						|
 | 
						|
  return res;
 | 
						|
}
 | 
						|
 | 
						|
/*
 | 
						|
 * The protocol here is that we write the length of the ByteStream first, then the bytes. On the
 | 
						|
 * read side, we reverse it.
 | 
						|
 */
 | 
						|
 | 
						|
void InetStreamSocket::write(SBS msg, Stats* stats)
 | 
						|
{
 | 
						|
  write(*msg, stats);
 | 
						|
}
 | 
						|
 | 
						|
void InetStreamSocket::do_write(const ByteStream& msg, uint32_t whichMagic, Stats* stats) const
 | 
						|
{
 | 
						|
  // !!!
 | 
						|
  // !!! Reducing BS size type from 64bit down to 32 and potentially loosing data.
 | 
						|
  // !!!
 | 
						|
  uint32_t msglen = msg.length();
 | 
						|
  uint32_t magic = whichMagic;
 | 
						|
  uint32_t* realBuf;
 | 
						|
 | 
						|
  if (msglen == 0)
 | 
						|
    return;
 | 
						|
 | 
						|
  /* buf.fCurOutPtr points to the data to send; ByteStream guarantees that there
 | 
						|
     are at least 12 bytes before that for the magic & length fields */
 | 
						|
  realBuf = (uint32_t*)msg.buf();
 | 
						|
  realBuf -= 3;
 | 
						|
  realBuf[0] = magic;
 | 
						|
  realBuf[1] = msglen;
 | 
						|
  realBuf[2] = 0;
 | 
						|
 | 
						|
  try
 | 
						|
  {
 | 
						|
    auto bytesToWrite = sizeof(msglen) + sizeof(magic) + sizeof(uint32_t) + msglen;
 | 
						|
    written(fSocketParms.sd(), (const uint8_t*)realBuf, bytesToWrite);
 | 
						|
 | 
						|
    if (stats)
 | 
						|
      stats->dataSent(bytesToWrite);
 | 
						|
  }
 | 
						|
  catch (std::exception& ex)
 | 
						|
  {
 | 
						|
    string errorMsg(ex.what());
 | 
						|
    errorMsg += " -- write from " + toString();
 | 
						|
    throw runtime_error(errorMsg);
 | 
						|
  }
 | 
						|
}
 | 
						|
 | 
						|
void InetStreamSocket::write(const ByteStream& msg, Stats* stats)
 | 
						|
{
 | 
						|
  do_write(msg, BYTESTREAM_MAGIC, stats);
 | 
						|
}
 | 
						|
 | 
						|
void InetStreamSocket::write_raw(const ByteStream& msg, Stats* stats) const
 | 
						|
{
 | 
						|
  uint32_t msglen = msg.length();
 | 
						|
 | 
						|
  if (msglen == 0)
 | 
						|
    return;
 | 
						|
 | 
						|
  try
 | 
						|
  {
 | 
						|
    written(fSocketParms.sd(), msg.buf(), msglen);
 | 
						|
  }
 | 
						|
  catch (std::exception& ex)
 | 
						|
  {
 | 
						|
    string errorMsg(ex.what());
 | 
						|
    errorMsg += " -- write_raw from " + toString();
 | 
						|
    throw runtime_error(errorMsg);
 | 
						|
  }
 | 
						|
 | 
						|
  if (stats)
 | 
						|
    stats->dataSent(msglen);
 | 
						|
}
 | 
						|
 | 
						|
void InetStreamSocket::bind(const sockaddr* serv_addr)
 | 
						|
{
 | 
						|
  memcpy(&fSa, serv_addr, sizeof(sockaddr_in));
 | 
						|
 | 
						|
  if (::bind(fSocketParms.sd(), serv_addr, sizeof(sockaddr_in)) != 0)
 | 
						|
  {
 | 
						|
    int e = errno;
 | 
						|
    string msg = "InetStreamSocket::bind: bind() error: ";
 | 
						|
    scoped_array<char> buf(new char[80]);
 | 
						|
#if STRERROR_R_CHAR_P
 | 
						|
    const char* p;
 | 
						|
 | 
						|
    if ((p = strerror_r(e, buf.get(), 80)) != 0)
 | 
						|
      msg += p;
 | 
						|
 | 
						|
#else
 | 
						|
    int p;
 | 
						|
 | 
						|
    if ((p = strerror_r(e, buf.get(), 80)) == 0)
 | 
						|
      msg += buf.get();
 | 
						|
 | 
						|
#endif
 | 
						|
    throw runtime_error(msg);
 | 
						|
  }
 | 
						|
}
 | 
						|
 | 
						|
void InetStreamSocket::listen(int backlog)
 | 
						|
{
 | 
						|
  fcntl(socketParms().sd(), F_SETFD, fcntl(socketParms().sd(), F_GETFD) | FD_CLOEXEC);
 | 
						|
 | 
						|
  if (::listen(socketParms().sd(), backlog) != 0)
 | 
						|
  {
 | 
						|
    int e = errno;
 | 
						|
    string msg = "InetStreamSocket::listen: listen() error: ";
 | 
						|
    scoped_array<char> buf(new char[80]);
 | 
						|
#if STRERROR_R_CHAR_P
 | 
						|
    const char* p;
 | 
						|
 | 
						|
    if ((p = strerror_r(e, buf.get(), 80)) != 0)
 | 
						|
      msg += p;
 | 
						|
 | 
						|
#else
 | 
						|
    int p;
 | 
						|
 | 
						|
    if ((p = strerror_r(e, buf.get(), 80)) == 0)
 | 
						|
      msg += buf.get();
 | 
						|
 | 
						|
#endif
 | 
						|
    throw runtime_error(msg);
 | 
						|
  }
 | 
						|
}
 | 
						|
 | 
						|
const IOSocket InetStreamSocket::accept(const struct timespec* timeout)
 | 
						|
{
 | 
						|
  int clientfd;
 | 
						|
  long msecs = 0;
 | 
						|
 | 
						|
  IOSocket ios(new InetStreamSocket(fBlocksize));
 | 
						|
 | 
						|
  struct pollfd pfd[1];
 | 
						|
  pfd[0].fd = socketParms().sd();
 | 
						|
  pfd[0].events = POLLIN;
 | 
						|
 | 
						|
  if (timeout != nullptr)
 | 
						|
  {
 | 
						|
    msecs = timeout->tv_sec * 1000 + timeout->tv_nsec / 1000000;
 | 
						|
 | 
						|
    if (poll(pfd, 1, msecs) != 1 || (pfd[0].revents & POLLIN) == 0 ||
 | 
						|
        pfd[0].revents & (POLLERR | POLLHUP | POLLNVAL))
 | 
						|
      return ios;
 | 
						|
  }
 | 
						|
 | 
						|
  struct sockaddr sa;
 | 
						|
 | 
						|
  socklen_t sl = sizeof(sa);
 | 
						|
 | 
						|
  int e;
 | 
						|
 | 
						|
  do
 | 
						|
  {
 | 
						|
    clientfd = ::accept(socketParms().sd(), &sa, &sl);
 | 
						|
    e = errno;
 | 
						|
  } while (clientfd < 0 && (e == EINTR ||
 | 
						|
#ifdef ERESTART
 | 
						|
                            e == ERESTART ||
 | 
						|
#endif
 | 
						|
#ifdef ECONNABORTED
 | 
						|
                            e == ECONNABORTED ||
 | 
						|
#endif
 | 
						|
                            false));
 | 
						|
 | 
						|
  if (clientfd < 0)
 | 
						|
  {
 | 
						|
    string msg = "InetStreamSocket::accept: accept() error: ";
 | 
						|
    scoped_array<char> buf(new char[80]);
 | 
						|
#if STRERROR_R_CHAR_P
 | 
						|
    const char* p;
 | 
						|
 | 
						|
    if ((p = strerror_r(e, buf.get(), 80)) != 0)
 | 
						|
      msg += p;
 | 
						|
 | 
						|
#else
 | 
						|
    int p;
 | 
						|
 | 
						|
    if ((p = strerror_r(e, buf.get(), 80)) == 0)
 | 
						|
      msg += buf.get();
 | 
						|
 | 
						|
#endif
 | 
						|
    throw runtime_error(msg);
 | 
						|
  }
 | 
						|
 | 
						|
  if (fSyncProto)
 | 
						|
  {
 | 
						|
    /* send a byte to artificially synchronize with connect() on the remote */
 | 
						|
    char b = 'A';
 | 
						|
    int ret;
 | 
						|
 | 
						|
    ret = ::send(clientfd, &b, 1, 0);
 | 
						|
    e = errno;
 | 
						|
 | 
						|
    if (ret < 0)
 | 
						|
    {
 | 
						|
      ostringstream os;
 | 
						|
      char blah[80];
 | 
						|
#if STRERROR_R_CHAR_P
 | 
						|
      const char* p;
 | 
						|
 | 
						|
      if ((p = strerror_r(e, blah, 80)) != nullptr)
 | 
						|
        os << "InetStreamSocket::accept sync: " << p;
 | 
						|
 | 
						|
#else
 | 
						|
      int p;
 | 
						|
 | 
						|
      if ((p = strerror_r(e, blah, 80)) == 0)
 | 
						|
        os << "InetStreamSocket::accept sync: " << blah;
 | 
						|
 | 
						|
#endif
 | 
						|
      ::close(clientfd);
 | 
						|
      throw runtime_error(os.str());
 | 
						|
    }
 | 
						|
    else if (ret == 0)
 | 
						|
    {
 | 
						|
      ::close(clientfd);
 | 
						|
      throw runtime_error("InetStreamSocket::accept sync: got unexpected error code");
 | 
						|
    }
 | 
						|
  }
 | 
						|
 | 
						|
  SocketParms sp;
 | 
						|
  sp = ios.socketParms();
 | 
						|
  sp.sd(clientfd);
 | 
						|
  ios.socketParms(sp);
 | 
						|
  ios.sa(&sa);
 | 
						|
  return ios;
 | 
						|
}
 | 
						|
 | 
						|
void InetStreamSocket::connect(const sockaddr* serv_addr)
 | 
						|
{
 | 
						|
  memcpy(&fSa, serv_addr, sizeof(sockaddr_in));
 | 
						|
 | 
						|
  if (::connect(socketParms().sd(), serv_addr, sizeof(sockaddr_in)))
 | 
						|
  {
 | 
						|
    int e = errno;
 | 
						|
    string msg = "InetStreamSocket::connect: connect() error: ";
 | 
						|
    scoped_array<char> buf(new char[80]);
 | 
						|
#if STRERROR_R_CHAR_P
 | 
						|
    const char* p;
 | 
						|
 | 
						|
    if ((p = strerror_r(e, buf.get(), 80)) != 0)
 | 
						|
      msg += p;
 | 
						|
 | 
						|
#else
 | 
						|
    int p;
 | 
						|
 | 
						|
    if ((p = strerror_r(e, buf.get(), 80)) == 0)
 | 
						|
      msg += buf.get();
 | 
						|
 | 
						|
#endif
 | 
						|
    msg += " to: " + toString();
 | 
						|
    throw runtime_error(msg);
 | 
						|
  }
 | 
						|
 | 
						|
  if (!fSyncProto)
 | 
						|
    return;
 | 
						|
 | 
						|
  /* read a byte to artificially synchronize with accept() on the remote */
 | 
						|
  int ret = -1;
 | 
						|
  int e = EBADF;
 | 
						|
  struct pollfd pfd;
 | 
						|
 | 
						|
  long msecs = fConnectionTimeout.tv_sec * 1000 + fConnectionTimeout.tv_nsec / 1000000;
 | 
						|
 | 
						|
  do
 | 
						|
  {
 | 
						|
    pfd.fd = socketParms().sd();
 | 
						|
    pfd.revents = 0;
 | 
						|
    pfd.events = POLLIN;
 | 
						|
    ret = poll(&pfd, 1, msecs);
 | 
						|
    e = errno;
 | 
						|
  } while (ret == -1 && e == EINTR && !(pfd.revents & (POLLERR | POLLHUP | POLLNVAL)));
 | 
						|
 | 
						|
  // success
 | 
						|
  if (ret == 1)
 | 
						|
  {
 | 
						|
    char buf = '\0';
 | 
						|
    std::ignore = ::read(socketParms().sd(), &buf, 1);  // we know 1 byte is in the recv buffer
 | 
						|
    return;
 | 
						|
  }
 | 
						|
 | 
						|
  /* handle the various errors */
 | 
						|
  if (ret == 0)
 | 
						|
    throw runtime_error("InetStreamSocket::connect: connection timed out");
 | 
						|
  else if (ret == -1 && e != EINTR)
 | 
						|
  {
 | 
						|
    ostringstream os;
 | 
						|
    char blah[80];
 | 
						|
#if STRERROR_R_CHAR_P
 | 
						|
    const char* p;
 | 
						|
 | 
						|
    if ((p = strerror_r(e, blah, 80)) != nullptr)
 | 
						|
      os << "InetStreamSocket::connect: " << p;
 | 
						|
 | 
						|
#else
 | 
						|
    int p;
 | 
						|
 | 
						|
    if ((p = strerror_r(e, blah, 80)) == 0)
 | 
						|
      os << "InetStreamSocket::connect: " << blah;
 | 
						|
 | 
						|
#endif
 | 
						|
    throw runtime_error(os.str());
 | 
						|
  }
 | 
						|
  else
 | 
						|
    throw runtime_error("InetStreamSocket::connect: unknown connection error");
 | 
						|
}
 | 
						|
 | 
						|
const string InetStreamSocket::toString() const
 | 
						|
{
 | 
						|
  ostringstream oss;
 | 
						|
  char buf[INET_ADDRSTRLEN];
 | 
						|
  const SocketParms& sp = fSocketParms;
 | 
						|
  oss << "InetStreamSocket: sd: " << sp.sd()
 | 
						|
      << " inet: " << inet_ntop(AF_INET, &fSa.sin_addr, buf, INET_ADDRSTRLEN)
 | 
						|
      << " port: " << ntohs(fSa.sin_port);
 | 
						|
  return oss.str();
 | 
						|
}
 | 
						|
 | 
						|
//
 | 
						|
//  Log a Warning msg pertaining to an I/O error; Currently used to log a
 | 
						|
//  ERESTARTSYS (errno 512) condition, but could be used to log any other
 | 
						|
//  I/O error that will retried.
 | 
						|
//
 | 
						|
void InetStreamSocket::logIoError(const char* errMsg, int errNum) const
 | 
						|
{
 | 
						|
  logging::Logger logger(31);
 | 
						|
  logging::Message::Args args;
 | 
						|
  logging::LoggingID li(31);
 | 
						|
  args.add(errMsg);
 | 
						|
  args.add(strerror(errNum));
 | 
						|
  args.add(toString());
 | 
						|
 | 
						|
  logging::MsgMap msgMap;
 | 
						|
  msgMap[logging::M0071] = logging::Message(logging::M0071);
 | 
						|
  logger.msgMap(msgMap);
 | 
						|
 | 
						|
  logger.logMessage(logging::LOG_TYPE_WARNING, logging::M0071, args, li);
 | 
						|
}
 | 
						|
 | 
						|
ssize_t InetStreamSocket::written(int fd, const uint8_t* ptr, size_t nbytes) const
 | 
						|
{
 | 
						|
  size_t nleft;
 | 
						|
  ssize_t nwritten;
 | 
						|
  const char* bufp;
 | 
						|
 | 
						|
  nleft = nbytes;
 | 
						|
  bufp = reinterpret_cast<const char*>(ptr);
 | 
						|
 | 
						|
  while (nleft > 0)
 | 
						|
  {
 | 
						|
    // the O_NONBLOCK flag is not set, this is a blocking I/O.
 | 
						|
    if ((nwritten = ::write(fd, bufp, nleft)) < 0)
 | 
						|
    {
 | 
						|
      if (errno == EINTR)
 | 
						|
        nwritten = 0;
 | 
						|
      else
 | 
						|
      {
 | 
						|
        // save the error no first
 | 
						|
        int e = errno;
 | 
						|
        string errorMsg = "InetStreamSocket::write error: ";
 | 
						|
        scoped_array<char> buf(new char[80]);
 | 
						|
#if STRERROR_R_CHAR_P
 | 
						|
        const char* p;
 | 
						|
 | 
						|
        if ((p = strerror_r(e, buf.get(), 80)) != 0)
 | 
						|
          errorMsg += p;
 | 
						|
 | 
						|
#else
 | 
						|
        int p;
 | 
						|
 | 
						|
        if ((p = strerror_r(e, buf.get(), 80)) == 0)
 | 
						|
          errorMsg += buf.get();
 | 
						|
 | 
						|
#endif
 | 
						|
        throw runtime_error(errorMsg);
 | 
						|
      }
 | 
						|
    }
 | 
						|
 | 
						|
    nleft -= nwritten;
 | 
						|
    bufp += nwritten;
 | 
						|
  }
 | 
						|
 | 
						|
  return nbytes;
 | 
						|
}
 | 
						|
 | 
						|
const string InetStreamSocket::addr2String() const
 | 
						|
{
 | 
						|
  string s;
 | 
						|
  char dst[INET_ADDRSTRLEN];
 | 
						|
  s = inet_ntop(AF_INET, &fSa.sin_addr, dst, INET_ADDRSTRLEN);
 | 
						|
  return s;
 | 
						|
}
 | 
						|
 | 
						|
bool InetStreamSocket::isSameAddr(const Socket* rhs) const
 | 
						|
{
 | 
						|
  const InetStreamSocket* issp = dynamic_cast<const InetStreamSocket*>(rhs);
 | 
						|
 | 
						|
  if (!issp)
 | 
						|
    return false;
 | 
						|
 | 
						|
  return (fSa.sin_addr.s_addr == issp->fSa.sin_addr.s_addr);
 | 
						|
}
 | 
						|
bool InetStreamSocket::isSameAddr(const struct in_addr& ipv4Addr) const
 | 
						|
{
 | 
						|
  return (fSa.sin_addr.s_addr == ipv4Addr.s_addr);
 | 
						|
}
 | 
						|
 | 
						|
/*static*/
 | 
						|
int InetStreamSocket::ping(const std::string& ipaddr, const struct timespec* timeout)
 | 
						|
{
 | 
						|
  sockaddr_in pingaddr;
 | 
						|
  memset(&pingaddr, 0, sizeof(pingaddr));
 | 
						|
 | 
						|
  if (inet_aton(ipaddr.c_str(), &pingaddr.sin_addr) == 0)
 | 
						|
    return -1;
 | 
						|
 | 
						|
  long msecs = 30 * 1000;
 | 
						|
 | 
						|
  if (timeout)
 | 
						|
    msecs = timeout->tv_sec * 1000 + timeout->tv_nsec / 1000000;
 | 
						|
 | 
						|
  int pingsock;
 | 
						|
  pingsock = ::socket(PF_INET, SOCK_RAW, IPPROTO_ICMP);
 | 
						|
 | 
						|
  if (pingsock < 0)
 | 
						|
    return -1;
 | 
						|
 | 
						|
  ssize_t len = 0;
 | 
						|
  size_t pktlen = 0;
 | 
						|
  const size_t PktSize = 1024;
 | 
						|
  char pkt[PktSize];
 | 
						|
  memset(pkt, 0, PktSize);
 | 
						|
  struct icmp* pingPktPtr = reinterpret_cast<struct icmp*>(pkt);
 | 
						|
 | 
						|
  pingPktPtr->icmp_type = ICMP_ECHO;
 | 
						|
  pingPktPtr->icmp_cksum = in_cksum(reinterpret_cast<unsigned short*>(pkt), PktSize);
 | 
						|
 | 
						|
  pktlen = 56 + ICMP_MINLEN;
 | 
						|
  len = ::sendto(pingsock, pkt, pktlen, 0, reinterpret_cast<const struct sockaddr*>(&pingaddr),
 | 
						|
                 sizeof(pingaddr));
 | 
						|
 | 
						|
  if (len < 0 || static_cast<size_t>(len) != pktlen)
 | 
						|
  {
 | 
						|
    ::close(pingsock);
 | 
						|
    return -1;
 | 
						|
  }
 | 
						|
 | 
						|
  memset(pkt, 0, PktSize);
 | 
						|
  pktlen = PktSize;
 | 
						|
 | 
						|
  int pollrc = 0;
 | 
						|
  pollrc = pollConnection(pingsock, msecs);
 | 
						|
 | 
						|
  if (pollrc != 1)
 | 
						|
  {
 | 
						|
    ::close(pingsock);
 | 
						|
    return -1;
 | 
						|
  }
 | 
						|
 | 
						|
  len = ::recvfrom(pingsock, pkt, pktlen, 0, nullptr, nullptr);
 | 
						|
 | 
						|
  if (len < 76)
 | 
						|
  {
 | 
						|
    ::close(pingsock);
 | 
						|
    return -1;
 | 
						|
  }
 | 
						|
 | 
						|
  struct ip* iphdr = reinterpret_cast<struct ip*>(pkt);
 | 
						|
 | 
						|
  pingPktPtr = reinterpret_cast<struct icmp*>(pkt + (iphdr->ip_hl << 2));
 | 
						|
 | 
						|
  if (pingPktPtr->icmp_type != ICMP_ECHOREPLY)
 | 
						|
  {
 | 
						|
    ::close(pingsock);
 | 
						|
    return -1;
 | 
						|
  }
 | 
						|
 | 
						|
  ::close(pingsock);
 | 
						|
 | 
						|
  return 0;
 | 
						|
}
 | 
						|
 | 
						|
bool InetStreamSocket::isConnected() const
 | 
						|
{
 | 
						|
  int error = 0;
 | 
						|
  socklen_t len = sizeof(error);
 | 
						|
  int retval = getsockopt(fSocketParms.sd(), SOL_SOCKET, SO_ERROR, &error, &len);
 | 
						|
 | 
						|
  if (error || retval)
 | 
						|
    return false;
 | 
						|
 | 
						|
  struct pollfd pfd[1];
 | 
						|
  pfd[0].fd = fSocketParms.sd();
 | 
						|
  pfd[0].events = POLLIN;
 | 
						|
  pfd[0].revents = 0;
 | 
						|
 | 
						|
  error = poll(pfd, 1, 0);
 | 
						|
 | 
						|
  if ((error < 0) || (pfd[0].revents & (POLLHUP | POLLNVAL | POLLERR)))
 | 
						|
  {
 | 
						|
    return false;
 | 
						|
  }
 | 
						|
 | 
						|
  return true;
 | 
						|
}
 | 
						|
 | 
						|
bool InetStreamSocket::hasData() const
 | 
						|
{
 | 
						|
  int count;
 | 
						|
  char buf[1];
 | 
						|
  ssize_t retval;
 | 
						|
  ioctl(fSocketParms.sd(), FIONREAD, &count);
 | 
						|
 | 
						|
  if (count)
 | 
						|
    return true;
 | 
						|
 | 
						|
  // EAGAIN | EWOULDBLOCK means the socket is clear. Anything else is data or error
 | 
						|
  retval = recv(fSocketParms.sd(), buf, 1, MSG_DONTWAIT);
 | 
						|
 | 
						|
  if (retval & (EAGAIN | EWOULDBLOCK))
 | 
						|
    return false;
 | 
						|
 | 
						|
  return true;
 | 
						|
}
 | 
						|
 | 
						|
}  // namespace messageqcpp
 |