blob: bee9d80d65d0660f3d805869a121a3176bd03a30 [file] [log] [blame]
David Reissea2cba82009-03-30 21:35:00 +00001/*
2 * Licensed to the Apache Software Foundation (ASF) under one
3 * or more contributor license agreements. See the NOTICE file
4 * distributed with this work for additional information
5 * regarding copyright ownership. The ASF licenses this file
6 * to you under the Apache License, Version 2.0 (the
7 * "License"); you may not use this file except in compliance
8 * with the License. You may obtain a copy of the License at
9 *
10 * http://www.apache.org/licenses/LICENSE-2.0
11 *
12 * Unless required by applicable law or agreed to in writing,
13 * software distributed under the License is distributed on an
14 * "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY
15 * KIND, either express or implied. See the License for the
16 * specific language governing permissions and limitations
17 * under the License.
18 */
Mark Slee9f0c6512007-02-28 23:58:26 +000019
Roger Meier2fa9c312011-09-05 19:15:53 +000020#ifdef HAVE_CONFIG_H
Marc Slemkoe03da182006-07-21 21:32:36 +000021#include <config.h>
Roger Meier2fa9c312011-09-05 19:15:53 +000022#endif
David Reissc88eb8c2008-06-11 01:18:54 +000023#include <cstring>
24#include <sstream>
Roger Meier2fa9c312011-09-05 19:15:53 +000025#ifdef HAVE_SYS_SOCKET_H
Mark Sleee8540632006-05-30 09:24:40 +000026#include <sys/socket.h>
Roger Meier2fa9c312011-09-05 19:15:53 +000027#endif
28#ifdef HAVE_SYS_UN_H
Bryan Duxburya18364a2010-09-28 14:36:07 +000029#include <sys/un.h>
Roger Meier2fa9c312011-09-05 19:15:53 +000030#endif
31#ifdef HAVE_SYS_POLL_H
David Reiss22b18862008-04-08 06:25:45 +000032#include <sys/poll.h>
Roger Meier2fa9c312011-09-05 19:15:53 +000033#endif
Mark Sleedd564972007-08-21 02:39:57 +000034#include <sys/types.h>
Roger Meier2fa9c312011-09-05 19:15:53 +000035#ifdef HAVE_ARPA_INET_H
Mark Sleee8540632006-05-30 09:24:40 +000036#include <arpa/inet.h>
Roger Meier2fa9c312011-09-05 19:15:53 +000037#endif
38#ifdef HAVE_NETINET_IN_H
Mark Sleee8540632006-05-30 09:24:40 +000039#include <netinet/in.h>
40#include <netinet/tcp.h>
Roger Meier2fa9c312011-09-05 19:15:53 +000041#endif
42#ifdef HAVE_UNISTD_H
Mark Sleee8540632006-05-30 09:24:40 +000043#include <unistd.h>
Roger Meier2fa9c312011-09-05 19:15:53 +000044#endif
Mark Sleee8540632006-05-30 09:24:40 +000045#include <errno.h>
Mark Slee29050782006-09-29 00:12:30 +000046#include <fcntl.h>
Mark Sleee8540632006-05-30 09:24:40 +000047
Mark Slee29050782006-09-29 00:12:30 +000048#include "concurrency/Monitor.h"
Marc Slemkod42a2c22006-08-10 03:30:18 +000049#include "TSocket.h"
50#include "TTransportException.h"
Mark Sleee8540632006-05-30 09:24:40 +000051
T Jake Lucianib5e62212009-01-31 22:36:20 +000052namespace apache { namespace thrift { namespace transport {
Marc Slemko6f038a72006-08-03 18:58:09 +000053
Mark Sleee8540632006-05-30 09:24:40 +000054using namespace std;
55
/**
 * Running count of socket system calls issued by TSocket. It is bumped
 * once per recv() in TSocket::read() and once per send() in
 * TSocket::write_partial().
 */
uint32_t g_socket_syscalls = 0;
58
59/**
60 * TSocket implementation.
61 *
Mark Slee8d7e1f62006-06-07 06:48:56 +000062 */
63
Mark Slee256bdc42007-11-27 08:42:19 +000064TSocket::TSocket(string host, int port) :
Mark Slee29050782006-09-29 00:12:30 +000065 host_(host),
66 port_(port),
Bryan Duxburya18364a2010-09-28 14:36:07 +000067 path_(""),
68 socket_(-1),
69 connTimeout_(0),
70 sendTimeout_(0),
71 recvTimeout_(0),
72 lingerOn_(1),
73 lingerVal_(0),
74 noDelay_(1),
75 maxRecvRetries_(5) {
76 recvTimeval_.tv_sec = (int)(recvTimeout_/1000);
77 recvTimeval_.tv_usec = (int)((recvTimeout_%1000)*1000);
78}
79
80TSocket::TSocket(string path) :
81 host_(""),
82 port_(0),
83 path_(path),
Martin Kraemeree341cb2007-02-05 21:40:38 +000084 socket_(-1),
Mark Slee29050782006-09-29 00:12:30 +000085 connTimeout_(0),
86 sendTimeout_(0),
87 recvTimeout_(0),
88 lingerOn_(1),
89 lingerVal_(0),
Aditya Agarwale04475b2007-05-23 02:14:58 +000090 noDelay_(1),
91 maxRecvRetries_(5) {
Mark Sleeb9ff32a2006-11-16 01:00:24 +000092 recvTimeval_.tv_sec = (int)(recvTimeout_/1000);
93 recvTimeval_.tv_usec = (int)((recvTimeout_%1000)*1000);
David Reiss23248712010-10-06 17:10:08 +000094 cachedPeerAddr_.ipv4.sin_family = AF_UNSPEC;
Mark Sleee8540632006-05-30 09:24:40 +000095}
96
Mark Slee256bdc42007-11-27 08:42:19 +000097TSocket::TSocket() :
Aditya Agarwalebc99e02007-01-15 23:14:58 +000098 host_(""),
99 port_(0),
Bryan Duxburya18364a2010-09-28 14:36:07 +0000100 path_(""),
Martin Kraemeree341cb2007-02-05 21:40:38 +0000101 socket_(-1),
Aditya Agarwalebc99e02007-01-15 23:14:58 +0000102 connTimeout_(0),
103 sendTimeout_(0),
104 recvTimeout_(0),
105 lingerOn_(1),
106 lingerVal_(0),
Aditya Agarwale04475b2007-05-23 02:14:58 +0000107 noDelay_(1),
108 maxRecvRetries_(5) {
Aditya Agarwalebc99e02007-01-15 23:14:58 +0000109 recvTimeval_.tv_sec = (int)(recvTimeout_/1000);
110 recvTimeval_.tv_usec = (int)((recvTimeout_%1000)*1000);
David Reiss23248712010-10-06 17:10:08 +0000111 cachedPeerAddr_.ipv4.sin_family = AF_UNSPEC;
Aditya Agarwalebc99e02007-01-15 23:14:58 +0000112}
113
Mark Slee29050782006-09-29 00:12:30 +0000114TSocket::TSocket(int socket) :
115 host_(""),
116 port_(0),
Bryan Duxburya18364a2010-09-28 14:36:07 +0000117 path_(""),
Mark Slee29050782006-09-29 00:12:30 +0000118 socket_(socket),
119 connTimeout_(0),
120 sendTimeout_(0),
121 recvTimeout_(0),
122 lingerOn_(1),
123 lingerVal_(0),
Aditya Agarwale04475b2007-05-23 02:14:58 +0000124 noDelay_(1),
125 maxRecvRetries_(5) {
Mark Sleeb9ff32a2006-11-16 01:00:24 +0000126 recvTimeval_.tv_sec = (int)(recvTimeout_/1000);
127 recvTimeval_.tv_usec = (int)((recvTimeout_%1000)*1000);
David Reiss23248712010-10-06 17:10:08 +0000128 cachedPeerAddr_.ipv4.sin_family = AF_UNSPEC;
Mark Slee29050782006-09-29 00:12:30 +0000129}
Mark Slee256bdc42007-11-27 08:42:19 +0000130
Mark Sleee8540632006-05-30 09:24:40 +0000131TSocket::~TSocket() {
132 close();
133}
134
Mark Slee256bdc42007-11-27 08:42:19 +0000135bool TSocket::isOpen() {
136 return (socket_ >= 0);
Mark Slee8d7e1f62006-06-07 06:48:56 +0000137}
138
Mark Sleeb9ff32a2006-11-16 01:00:24 +0000139bool TSocket::peek() {
140 if (!isOpen()) {
141 return false;
142 }
143 uint8_t buf;
144 int r = recv(socket_, &buf, 1, MSG_PEEK);
145 if (r == -1) {
David Reissbc3dddb2007-08-22 23:20:24 +0000146 int errno_copy = errno;
David Reiss840e7522009-06-04 00:10:50 +0000147 #if defined __FreeBSD__ || defined __MACH__
Kevin Clark022b2242009-03-05 21:05:37 +0000148 /* shigin:
149 * freebsd returns -1 and ECONNRESET if socket was closed by
150 * the other side
151 */
152 if (errno_copy == ECONNRESET)
153 {
154 close();
155 return false;
156 }
157 #endif
David Reiss01e55c12008-07-13 22:18:51 +0000158 GlobalOutput.perror("TSocket::peek() recv() " + getSocketInfo(), errno_copy);
David Reissbc3dddb2007-08-22 23:20:24 +0000159 throw TTransportException(TTransportException::UNKNOWN, "recv()", errno_copy);
Mark Sleeb9ff32a2006-11-16 01:00:24 +0000160 }
161 return (r > 0);
162}
163
Mark Slee6d56eb92007-07-06 22:28:15 +0000164void TSocket::openConnection(struct addrinfo *res) {
Mark Sleea9848d72007-02-21 04:54:05 +0000165 if (isOpen()) {
Bryan Duxbury010f1e02010-09-02 00:56:53 +0000166 return;
Mark Sleea9848d72007-02-21 04:54:05 +0000167 }
Aditya Agarwal4529c4b2007-09-05 01:01:15 +0000168
Bryan Duxburya18364a2010-09-28 14:36:07 +0000169 if (! path_.empty()) {
170 socket_ = socket(PF_UNIX, SOCK_STREAM, IPPROTO_IP);
171 } else {
172 socket_ = socket(res->ai_family, res->ai_socktype, res->ai_protocol);
173 }
174
Mark Sleee8540632006-05-30 09:24:40 +0000175 if (socket_ == -1) {
David Reissbc3dddb2007-08-22 23:20:24 +0000176 int errno_copy = errno;
David Reiss01e55c12008-07-13 22:18:51 +0000177 GlobalOutput.perror("TSocket::open() socket() " + getSocketInfo(), errno_copy);
David Reissbc3dddb2007-08-22 23:20:24 +0000178 throw TTransportException(TTransportException::NOT_OPEN, "socket()", errno_copy);
Mark Sleee8540632006-05-30 09:24:40 +0000179 }
Mark Slee29050782006-09-29 00:12:30 +0000180
181 // Send timeout
182 if (sendTimeout_ > 0) {
183 setSendTimeout(sendTimeout_);
184 }
185
186 // Recv timeout
187 if (recvTimeout_ > 0) {
188 setRecvTimeout(recvTimeout_);
189 }
190
191 // Linger
192 setLinger(lingerOn_, lingerVal_);
193
194 // No delay
195 setNoDelay(noDelay_);
196
David Reiss1c20c872010-03-09 05:20:14 +0000197 // Uses a low min RTO if asked to.
198#ifdef TCP_LOW_MIN_RTO
199 if (getUseLowMinRto()) {
200 int one = 1;
201 setsockopt(socket_, IPPROTO_TCP, TCP_LOW_MIN_RTO, &one, sizeof(one));
202 }
203#endif
204
205
Mark Slee29050782006-09-29 00:12:30 +0000206 // Set the socket to be non blocking for connect if a timeout exists
Mark Slee256bdc42007-11-27 08:42:19 +0000207 int flags = fcntl(socket_, F_GETFL, 0);
Mark Slee29050782006-09-29 00:12:30 +0000208 if (connTimeout_ > 0) {
Mark Sleea5a783f2007-03-02 19:41:08 +0000209 if (-1 == fcntl(socket_, F_SETFL, flags | O_NONBLOCK)) {
David Reiss9b209552008-04-08 06:26:05 +0000210 int errno_copy = errno;
David Reiss01e55c12008-07-13 22:18:51 +0000211 GlobalOutput.perror("TSocket::open() fcntl() " + getSocketInfo(), errno_copy);
David Reiss9b209552008-04-08 06:26:05 +0000212 throw TTransportException(TTransportException::NOT_OPEN, "fcntl() failed", errno_copy);
Mark Sleea5a783f2007-03-02 19:41:08 +0000213 }
Mark Slee29050782006-09-29 00:12:30 +0000214 } else {
Mark Sleea5a783f2007-03-02 19:41:08 +0000215 if (-1 == fcntl(socket_, F_SETFL, flags & ~O_NONBLOCK)) {
David Reiss9b209552008-04-08 06:26:05 +0000216 int errno_copy = errno;
David Reiss01e55c12008-07-13 22:18:51 +0000217 GlobalOutput.perror("TSocket::open() fcntl " + getSocketInfo(), errno_copy);
David Reiss9b209552008-04-08 06:26:05 +0000218 throw TTransportException(TTransportException::NOT_OPEN, "fcntl() failed", errno_copy);
Mark Sleea5a783f2007-03-02 19:41:08 +0000219 }
Mark Slee29050782006-09-29 00:12:30 +0000220 }
221
Mark Sleee8540632006-05-30 09:24:40 +0000222 // Connect the socket
Bryan Duxburya18364a2010-09-28 14:36:07 +0000223 int ret;
224 if (! path_.empty()) {
225 struct sockaddr_un address;
226 socklen_t len;
227
228 if (path_.length() > sizeof(address.sun_path)) {
229 int errno_copy = errno;
230 GlobalOutput.perror("TSocket::open() Unix Domain socket path too long", errno_copy);
231 throw TTransportException(TTransportException::NOT_OPEN, " Unix Domain socket path too long");
232 }
233
234 address.sun_family = AF_UNIX;
Roger Meierd11ca5a2010-10-18 08:22:57 +0000235 snprintf(address.sun_path, sizeof(address.sun_path), "%s", path_.c_str());
Bryan Duxburya18364a2010-09-28 14:36:07 +0000236 len = sizeof(address);
237 ret = connect(socket_, (struct sockaddr *) &address, len);
238 } else {
239 ret = connect(socket_, res->ai_addr, res->ai_addrlen);
240 }
Mark Slee256bdc42007-11-27 08:42:19 +0000241
David Reiss9b209552008-04-08 06:26:05 +0000242 // success case
Mark Slee29050782006-09-29 00:12:30 +0000243 if (ret == 0) {
244 goto done;
245 }
246
247 if (errno != EINPROGRESS) {
David Reissbc3dddb2007-08-22 23:20:24 +0000248 int errno_copy = errno;
David Reiss01e55c12008-07-13 22:18:51 +0000249 GlobalOutput.perror("TSocket::open() connect() " + getSocketInfo(), errno_copy);
David Reiss9b209552008-04-08 06:26:05 +0000250 throw TTransportException(TTransportException::NOT_OPEN, "connect() failed", errno_copy);
Mark Sleee8540632006-05-30 09:24:40 +0000251 }
252
David Reiss22b18862008-04-08 06:25:45 +0000253
254 struct pollfd fds[1];
David Reissc88eb8c2008-06-11 01:18:54 +0000255 std::memset(fds, 0 , sizeof(fds));
David Reiss22b18862008-04-08 06:25:45 +0000256 fds[0].fd = socket_;
257 fds[0].events = POLLOUT;
258 ret = poll(fds, 1, connTimeout_);
Mark Slee29050782006-09-29 00:12:30 +0000259
260 if (ret > 0) {
David Reiss9b209552008-04-08 06:26:05 +0000261 // Ensure the socket is connected and that there are no errors set
Mark Slee29050782006-09-29 00:12:30 +0000262 int val;
263 socklen_t lon;
264 lon = sizeof(int);
265 int ret2 = getsockopt(socket_, SOL_SOCKET, SO_ERROR, (void *)&val, &lon);
266 if (ret2 == -1) {
David Reissbc3dddb2007-08-22 23:20:24 +0000267 int errno_copy = errno;
David Reiss01e55c12008-07-13 22:18:51 +0000268 GlobalOutput.perror("TSocket::open() getsockopt() " + getSocketInfo(), errno_copy);
David Reiss9b209552008-04-08 06:26:05 +0000269 throw TTransportException(TTransportException::NOT_OPEN, "getsockopt()", errno_copy);
Mark Slee29050782006-09-29 00:12:30 +0000270 }
David Reiss9b209552008-04-08 06:26:05 +0000271 // no errors on socket, go to town
Mark Slee29050782006-09-29 00:12:30 +0000272 if (val == 0) {
273 goto done;
274 }
David Reiss01e55c12008-07-13 22:18:51 +0000275 GlobalOutput.perror("TSocket::open() error on socket (after poll) " + getSocketInfo(), val);
David Reiss9b209552008-04-08 06:26:05 +0000276 throw TTransportException(TTransportException::NOT_OPEN, "socket open() error", val);
Mark Slee29050782006-09-29 00:12:30 +0000277 } else if (ret == 0) {
David Reiss9b209552008-04-08 06:26:05 +0000278 // socket timed out
Aditya Agarwal4529c4b2007-09-05 01:01:15 +0000279 string errStr = "TSocket::open() timed out " + getSocketInfo();
280 GlobalOutput(errStr.c_str());
David Reiss9b209552008-04-08 06:26:05 +0000281 throw TTransportException(TTransportException::NOT_OPEN, "open() timed out");
Mark Slee29050782006-09-29 00:12:30 +0000282 } else {
David Reiss9b209552008-04-08 06:26:05 +0000283 // error on poll()
David Reissbc3dddb2007-08-22 23:20:24 +0000284 int errno_copy = errno;
David Reiss01e55c12008-07-13 22:18:51 +0000285 GlobalOutput.perror("TSocket::open() poll() " + getSocketInfo(), errno_copy);
David Reiss9b209552008-04-08 06:26:05 +0000286 throw TTransportException(TTransportException::NOT_OPEN, "poll() failed", errno_copy);
Mark Slee29050782006-09-29 00:12:30 +0000287 }
288
289 done:
290 // Set socket back to normal mode (blocking)
291 fcntl(socket_, F_SETFL, flags);
David Reiss23248712010-10-06 17:10:08 +0000292
Roger Meier18f10502011-06-04 08:57:43 +0000293 if (path_.empty()) {
294 setCachedAddress(res->ai_addr, res->ai_addrlen);
295 }
Mark Sleee8540632006-05-30 09:24:40 +0000296}
297
Mark Slee6d56eb92007-07-06 22:28:15 +0000298void TSocket::open() {
299 if (isOpen()) {
Bryan Duxbury010f1e02010-09-02 00:56:53 +0000300 return;
Mark Slee6d56eb92007-07-06 22:28:15 +0000301 }
Bryan Duxburya18364a2010-09-28 14:36:07 +0000302 if (! path_.empty()) {
303 unix_open();
304 } else {
305 local_open();
306 }
307}
308
309void TSocket::unix_open(){
310 if (! path_.empty()) {
311 // Unix Domain SOcket does not need addrinfo struct, so we pass NULL
312 openConnection(NULL);
313 }
314}
315
/**
 * Resolves host_/port_ with getaddrinfo() and tries each returned address
 * in order until one connects. Does nothing if the socket is already open.
 *
 * @throws TTransportException (NOT_OPEN) if the port is outside 0..65535,
 *         if the host cannot be resolved, or - rethrown from
 *         openConnection() - if the last candidate address fails
 */
void TSocket::local_open(){
  if (isOpen()) {
    return;
  }

  // Validate port number
  if (port_ < 0 || port_ > 0xFFFF) {
    throw TTransportException(TTransportException::NOT_OPEN, "Specified port is invalid");
  }

  // The port was range-checked above, so its decimal text always fits.
  char portText[sizeof("65535")];
  sprintf(portText, "%d", port_);

  struct addrinfo hints;
  std::memset(&hints, 0, sizeof(hints));
  hints.ai_family = PF_UNSPEC;
  hints.ai_socktype = SOCK_STREAM;
  hints.ai_flags = AI_PASSIVE | AI_ADDRCONFIG;

  struct addrinfo* candidates = NULL;
  const int gaiStatus = getaddrinfo(host_.c_str(), portText, &hints, &candidates);

  if (gaiStatus != 0) {
    string errStr = "TSocket::open() getaddrinfo() " + getSocketInfo() + string(gai_strerror(gaiStatus));
    GlobalOutput(errStr.c_str());
    close();
    throw TTransportException(TTransportException::NOT_OPEN, "Could not resolve host for client socket.");
  }

  // Walk the candidate list; the first address that connects wins. A
  // failure is only propagated once there is nothing left to try.
  for (struct addrinfo* candidate = candidates; candidate != NULL; candidate = candidate->ai_next) {
    try {
      openConnection(candidate);
      break;
    } catch (TTransportException&) {
      // Drop the half-opened socket before retrying or giving up.
      close();
      if (candidate->ai_next == NULL) {
        freeaddrinfo(candidates); // cleanup on failure
        throw;
      }
    }
  }

  // Free address structure memory
  freeaddrinfo(candidates);
}
366
Mark Sleee8540632006-05-30 09:24:40 +0000367void TSocket::close() {
Martin Kraemeree341cb2007-02-05 21:40:38 +0000368 if (socket_ >= 0) {
Mark Sleee8540632006-05-30 09:24:40 +0000369 shutdown(socket_, SHUT_RDWR);
370 ::close(socket_);
371 }
Martin Kraemeree341cb2007-02-05 21:40:38 +0000372 socket_ = -1;
Mark Sleee8540632006-05-30 09:24:40 +0000373}
374
David Reiss105961d2010-10-06 17:10:17 +0000375void TSocket::setSocketFD(int socket) {
376 if (socket_ >= 0) {
377 close();
378 }
379 socket_ = socket;
380}
381
Mark Slee8d7e1f62006-06-07 06:48:56 +0000382uint32_t TSocket::read(uint8_t* buf, uint32_t len) {
Martin Kraemeree341cb2007-02-05 21:40:38 +0000383 if (socket_ < 0) {
Mark Sleef9831082007-02-20 20:59:21 +0000384 throw TTransportException(TTransportException::NOT_OPEN, "Called read on non-open socket");
Mark Slee8d7e1f62006-06-07 06:48:56 +0000385 }
Mark Sleee8540632006-05-30 09:24:40 +0000386
Aditya Agarwale04475b2007-05-23 02:14:58 +0000387 int32_t retries = 0;
388
389 // EAGAIN can be signalled both when a timeout has occurred and when
390 // the system is out of resources (an awesome undocumented feature).
391 // The following is an approximation of the time interval under which
392 // EAGAIN is taken to indicate an out of resources error.
393 uint32_t eagainThresholdMicros = 0;
394 if (recvTimeout_) {
Mark Slee256bdc42007-11-27 08:42:19 +0000395 // if a readTimeout is specified along with a max number of recv retries, then
Aditya Agarwale04475b2007-05-23 02:14:58 +0000396 // the threshold will ensure that the read timeout is not exceeded even in the
397 // case of resource errors
398 eagainThresholdMicros = (recvTimeout_*1000)/ ((maxRecvRetries_>0) ? maxRecvRetries_ : 2);
399 }
400
Mark Slee256bdc42007-11-27 08:42:19 +0000401 try_again:
Mark Slee8d7e1f62006-06-07 06:48:56 +0000402 // Read from the socket
Aditya Agarwale04475b2007-05-23 02:14:58 +0000403 struct timeval begin;
David Reiss105961d2010-10-06 17:10:17 +0000404 if (recvTimeout_ > 0) {
405 gettimeofday(&begin, NULL);
406 } else {
407 // if there is no read timeout we don't need the TOD to determine whether
408 // an EAGAIN is due to a timeout or an out-of-resource condition.
409 begin.tv_sec = begin.tv_usec = 0;
410 }
Mark Slee8d7e1f62006-06-07 06:48:56 +0000411 int got = recv(socket_, buf, len, 0);
Kevin Clark022b2242009-03-05 21:05:37 +0000412 int errno_copy = errno; //gettimeofday can change errno
Mark Slee8d7e1f62006-06-07 06:48:56 +0000413 ++g_socket_syscalls;
Aditya Agarwale04475b2007-05-23 02:14:58 +0000414
Mark Slee8d7e1f62006-06-07 06:48:56 +0000415 // Check for error on read
Mark Slee256bdc42007-11-27 08:42:19 +0000416 if (got < 0) {
Kevin Clark022b2242009-03-05 21:05:37 +0000417 if (errno_copy == EAGAIN) {
David Reiss105961d2010-10-06 17:10:17 +0000418 // if no timeout we can assume that resource exhaustion has occurred.
419 if (recvTimeout_ == 0) {
420 throw TTransportException(TTransportException::TIMED_OUT,
421 "EAGAIN (unavailable resources)");
422 }
Aditya Agarwale04475b2007-05-23 02:14:58 +0000423 // check if this is the lack of resources or timeout case
David Reissa1a15112010-03-09 05:19:54 +0000424 struct timeval end;
425 gettimeofday(&end, NULL);
426 uint32_t readElapsedMicros = (((end.tv_sec - begin.tv_sec) * 1000 * 1000)
427 + (((uint64_t)(end.tv_usec - begin.tv_usec))));
428
Aditya Agarwale04475b2007-05-23 02:14:58 +0000429 if (!eagainThresholdMicros || (readElapsedMicros < eagainThresholdMicros)) {
430 if (retries++ < maxRecvRetries_) {
431 usleep(50);
432 goto try_again;
433 } else {
Mark Slee256bdc42007-11-27 08:42:19 +0000434 throw TTransportException(TTransportException::TIMED_OUT,
Aditya Agarwale04475b2007-05-23 02:14:58 +0000435 "EAGAIN (unavailable resources)");
436 }
437 } else {
438 // infer that timeout has been hit
Mark Slee256bdc42007-11-27 08:42:19 +0000439 throw TTransportException(TTransportException::TIMED_OUT,
Aditya Agarwale04475b2007-05-23 02:14:58 +0000440 "EAGAIN (timed out)");
441 }
Mark Sleee8540632006-05-30 09:24:40 +0000442 }
Mark Slee256bdc42007-11-27 08:42:19 +0000443
Mark Slee8d7e1f62006-06-07 06:48:56 +0000444 // If interrupted, try again
Kevin Clark022b2242009-03-05 21:05:37 +0000445 if (errno_copy == EINTR && retries++ < maxRecvRetries_) {
Mark Slee8d7e1f62006-06-07 06:48:56 +0000446 goto try_again;
Mark Sleee8540632006-05-30 09:24:40 +0000447 }
Mark Slee256bdc42007-11-27 08:42:19 +0000448
David Reiss840e7522009-06-04 00:10:50 +0000449 #if defined __FreeBSD__ || defined __MACH__
Kevin Clark022b2242009-03-05 21:05:37 +0000450 if (errno_copy == ECONNRESET) {
Kevin Clark022b2242009-03-05 21:05:37 +0000451 /* shigin: freebsd doesn't follow POSIX semantic of recv and fails with
452 * ECONNRESET if peer performed shutdown
David Reiss105961d2010-10-06 17:10:17 +0000453 * edhall: eliminated close() since we do that in the destructor.
Kevin Clark022b2242009-03-05 21:05:37 +0000454 */
Kevin Clark022b2242009-03-05 21:05:37 +0000455 return 0;
David Reiss840e7522009-06-04 00:10:50 +0000456 }
457 #endif
458
459 // Now it's not a try again case, but a real probblez
460 GlobalOutput.perror("TSocket::read() recv() " + getSocketInfo(), errno_copy);
461
462 // If we disconnect with no linger time
463 if (errno_copy == ECONNRESET) {
Mark Sleef9831082007-02-20 20:59:21 +0000464 throw TTransportException(TTransportException::NOT_OPEN, "ECONNRESET");
Mark Slee8d7e1f62006-06-07 06:48:56 +0000465 }
Mark Slee256bdc42007-11-27 08:42:19 +0000466
Mark Slee8d7e1f62006-06-07 06:48:56 +0000467 // This ish isn't open
Kevin Clark022b2242009-03-05 21:05:37 +0000468 if (errno_copy == ENOTCONN) {
Mark Sleef9831082007-02-20 20:59:21 +0000469 throw TTransportException(TTransportException::NOT_OPEN, "ENOTCONN");
Mark Slee8d7e1f62006-06-07 06:48:56 +0000470 }
Mark Slee256bdc42007-11-27 08:42:19 +0000471
Mark Slee8d7e1f62006-06-07 06:48:56 +0000472 // Timed out!
Kevin Clark022b2242009-03-05 21:05:37 +0000473 if (errno_copy == ETIMEDOUT) {
Mark Sleef9831082007-02-20 20:59:21 +0000474 throw TTransportException(TTransportException::TIMED_OUT, "ETIMEDOUT");
Mark Slee8d7e1f62006-06-07 06:48:56 +0000475 }
Mark Slee256bdc42007-11-27 08:42:19 +0000476
Mark Slee8d7e1f62006-06-07 06:48:56 +0000477 // Some other error, whatevz
David Reiss01e55c12008-07-13 22:18:51 +0000478 throw TTransportException(TTransportException::UNKNOWN, "Unknown", errno_copy);
Mark Slee8d7e1f62006-06-07 06:48:56 +0000479 }
Mark Slee256bdc42007-11-27 08:42:19 +0000480
Mark Slee8d7e1f62006-06-07 06:48:56 +0000481 // The remote host has closed the socket
482 if (got == 0) {
David Reiss105961d2010-10-06 17:10:17 +0000483 // edhall: we used to call close() here, but our caller may want to deal
484 // with the socket fd and we'll close() in our destructor in any case.
Mark Slee8d7e1f62006-06-07 06:48:56 +0000485 return 0;
Mark Sleee8540632006-05-30 09:24:40 +0000486 }
Mark Slee256bdc42007-11-27 08:42:19 +0000487
Mark Sleee8540632006-05-30 09:24:40 +0000488 // Pack data into string
Mark Slee8d7e1f62006-06-07 06:48:56 +0000489 return got;
Mark Sleee8540632006-05-30 09:24:40 +0000490}
491
Mark Slee8d7e1f62006-06-07 06:48:56 +0000492void TSocket::write(const uint8_t* buf, uint32_t len) {
David Reiss105961d2010-10-06 17:10:17 +0000493 uint32_t sent = 0;
494
495 while (sent < len) {
496 uint32_t b = write_partial(buf + sent, len - sent);
497 if (b == 0) {
Bryan Duxbury97592662011-08-29 18:05:26 +0000498 // This should only happen if the timeout set with SO_SNDTIMEO expired.
499 // Raise an exception.
500 throw TTransportException(TTransportException::TIMED_OUT,
501 "send timeout expired");
David Reiss105961d2010-10-06 17:10:17 +0000502 }
503 sent += b;
504 }
505}
506
507uint32_t TSocket::write_partial(const uint8_t* buf, uint32_t len) {
Martin Kraemeree341cb2007-02-05 21:40:38 +0000508 if (socket_ < 0) {
Mark Sleef9831082007-02-20 20:59:21 +0000509 throw TTransportException(TTransportException::NOT_OPEN, "Called write on non-open socket");
Mark Slee8d7e1f62006-06-07 06:48:56 +0000510 }
511
Mark Sleee8540632006-05-30 09:24:40 +0000512 uint32_t sent = 0;
Mark Slee256bdc42007-11-27 08:42:19 +0000513
David Reiss105961d2010-10-06 17:10:17 +0000514 int flags = 0;
515#ifdef MSG_NOSIGNAL
516 // Note the use of MSG_NOSIGNAL to suppress SIGPIPE errors, instead we
517 // check for the EPIPE return condition and close the socket in that case
518 flags |= MSG_NOSIGNAL;
519#endif // ifdef MSG_NOSIGNAL
Marc Slemko9d4a3e22006-07-21 19:53:48 +0000520
David Reiss105961d2010-10-06 17:10:17 +0000521 int b = send(socket_, buf + sent, len - sent, flags);
522 ++g_socket_syscalls;
Marc Slemko9d4a3e22006-07-21 19:53:48 +0000523
David Reiss105961d2010-10-06 17:10:17 +0000524 if (b < 0) {
525 if (errno == EWOULDBLOCK || errno == EAGAIN) {
526 return 0;
527 }
Mark Sleee8540632006-05-30 09:24:40 +0000528 // Fail on a send error
David Reiss105961d2010-10-06 17:10:17 +0000529 int errno_copy = errno;
530 GlobalOutput.perror("TSocket::write_partial() send() " + getSocketInfo(), errno_copy);
David Reiss9b209552008-04-08 06:26:05 +0000531
David Reiss105961d2010-10-06 17:10:17 +0000532 if (errno_copy == EPIPE || errno_copy == ECONNRESET || errno_copy == ENOTCONN) {
533 close();
534 throw TTransportException(TTransportException::NOT_OPEN, "write() send()", errno_copy);
Mark Sleee8540632006-05-30 09:24:40 +0000535 }
Mark Slee256bdc42007-11-27 08:42:19 +0000536
David Reiss105961d2010-10-06 17:10:17 +0000537 throw TTransportException(TTransportException::UNKNOWN, "write() send()", errno_copy);
Mark Sleee8540632006-05-30 09:24:40 +0000538 }
David Reiss105961d2010-10-06 17:10:17 +0000539
540 // Fail on blocked send
541 if (b == 0) {
542 throw TTransportException(TTransportException::NOT_OPEN, "Socket send returned 0.");
543 }
544 return b;
Mark Sleee8540632006-05-30 09:24:40 +0000545}
546
dweatherford14b0ed62007-10-19 01:03:32 +0000547std::string TSocket::getHost() {
548 return host_;
549}
550
551int TSocket::getPort() {
552 return port_;
553}
554
Aditya Agarwalebc99e02007-01-15 23:14:58 +0000555void TSocket::setHost(string host) {
556 host_ = host;
557}
558
559void TSocket::setPort(int port) {
560 port_ = port;
561}
562
Mark Slee8d7e1f62006-06-07 06:48:56 +0000563void TSocket::setLinger(bool on, int linger) {
Mark Slee29050782006-09-29 00:12:30 +0000564 lingerOn_ = on;
565 lingerVal_ = linger;
Martin Kraemeree341cb2007-02-05 21:40:38 +0000566 if (socket_ < 0) {
Mark Slee8d7e1f62006-06-07 06:48:56 +0000567 return;
568 }
569
Mark Slee29050782006-09-29 00:12:30 +0000570 struct linger l = {(lingerOn_ ? 1 : 0), lingerVal_};
571 int ret = setsockopt(socket_, SOL_SOCKET, SO_LINGER, &l, sizeof(l));
572 if (ret == -1) {
David Reiss01e55c12008-07-13 22:18:51 +0000573 int errno_copy = errno; // Copy errno because we're allocating memory.
574 GlobalOutput.perror("TSocket::setLinger() setsockopt() " + getSocketInfo(), errno_copy);
Mark Sleee8540632006-05-30 09:24:40 +0000575 }
Mark Sleee8540632006-05-30 09:24:40 +0000576}
577
Mark Slee8d7e1f62006-06-07 06:48:56 +0000578void TSocket::setNoDelay(bool noDelay) {
Mark Slee29050782006-09-29 00:12:30 +0000579 noDelay_ = noDelay;
Roger Meier18f10502011-06-04 08:57:43 +0000580 if (socket_ < 0 || !path_.empty()) {
Mark Slee8d7e1f62006-06-07 06:48:56 +0000581 return;
582 }
583
Mark Sleee8540632006-05-30 09:24:40 +0000584 // Set socket to NODELAY
Mark Slee29050782006-09-29 00:12:30 +0000585 int v = noDelay_ ? 1 : 0;
586 int ret = setsockopt(socket_, IPPROTO_TCP, TCP_NODELAY, &v, sizeof(v));
587 if (ret == -1) {
David Reiss01e55c12008-07-13 22:18:51 +0000588 int errno_copy = errno; // Copy errno because we're allocating memory.
589 GlobalOutput.perror("TSocket::setNoDelay() setsockopt() " + getSocketInfo(), errno_copy);
Mark Sleee8540632006-05-30 09:24:40 +0000590 }
Mark Sleee8540632006-05-30 09:24:40 +0000591}
Mark Slee29050782006-09-29 00:12:30 +0000592
593void TSocket::setConnTimeout(int ms) {
594 connTimeout_ = ms;
595}
596
597void TSocket::setRecvTimeout(int ms) {
Aditya Agarwalc31769c2007-12-11 22:23:51 +0000598 if (ms < 0) {
599 char errBuf[512];
600 sprintf(errBuf, "TSocket::setRecvTimeout with negative input: %d\n", ms);
601 GlobalOutput(errBuf);
602 return;
603 }
Mark Slee29050782006-09-29 00:12:30 +0000604 recvTimeout_ = ms;
Aditya Agarwalc31769c2007-12-11 22:23:51 +0000605
Martin Kraemeree341cb2007-02-05 21:40:38 +0000606 if (socket_ < 0) {
Mark Slee29050782006-09-29 00:12:30 +0000607 return;
608 }
609
Aditya Agarwalc31769c2007-12-11 22:23:51 +0000610 recvTimeval_.tv_sec = (int)(recvTimeout_/1000);
611 recvTimeval_.tv_usec = (int)((recvTimeout_%1000)*1000);
612
David Reiss22b18862008-04-08 06:25:45 +0000613 // Copy because poll may modify
Mark Sleeb9ff32a2006-11-16 01:00:24 +0000614 struct timeval r = recvTimeval_;
Mark Slee29050782006-09-29 00:12:30 +0000615 int ret = setsockopt(socket_, SOL_SOCKET, SO_RCVTIMEO, &r, sizeof(r));
616 if (ret == -1) {
David Reiss01e55c12008-07-13 22:18:51 +0000617 int errno_copy = errno; // Copy errno because we're allocating memory.
618 GlobalOutput.perror("TSocket::setRecvTimeout() setsockopt() " + getSocketInfo(), errno_copy);
Mark Slee29050782006-09-29 00:12:30 +0000619 }
620}
621
622void TSocket::setSendTimeout(int ms) {
Aditya Agarwalc31769c2007-12-11 22:23:51 +0000623 if (ms < 0) {
624 char errBuf[512];
625 sprintf(errBuf, "TSocket::setSendTimeout with negative input: %d\n", ms);
626 GlobalOutput(errBuf);
627 return;
628 }
Mark Slee29050782006-09-29 00:12:30 +0000629 sendTimeout_ = ms;
Aditya Agarwalc31769c2007-12-11 22:23:51 +0000630
Martin Kraemeree341cb2007-02-05 21:40:38 +0000631 if (socket_ < 0) {
Mark Slee29050782006-09-29 00:12:30 +0000632 return;
633 }
Mark Slee256bdc42007-11-27 08:42:19 +0000634
Mark Slee29050782006-09-29 00:12:30 +0000635 struct timeval s = {(int)(sendTimeout_/1000),
636 (int)((sendTimeout_%1000)*1000)};
637 int ret = setsockopt(socket_, SOL_SOCKET, SO_SNDTIMEO, &s, sizeof(s));
638 if (ret == -1) {
David Reiss01e55c12008-07-13 22:18:51 +0000639 int errno_copy = errno; // Copy errno because we're allocating memory.
640 GlobalOutput.perror("TSocket::setSendTimeout() setsockopt() " + getSocketInfo(), errno_copy);
Mark Slee29050782006-09-29 00:12:30 +0000641 }
642}
643
Aditya Agarwale04475b2007-05-23 02:14:58 +0000644void TSocket::setMaxRecvRetries(int maxRecvRetries) {
645 maxRecvRetries_ = maxRecvRetries;
646}
647
Aditya Agarwal4529c4b2007-09-05 01:01:15 +0000648string TSocket::getSocketInfo() {
649 std::ostringstream oss;
David Reiss105961d2010-10-06 17:10:17 +0000650 if (host_.empty() || port_ == 0) {
651 oss << "<Host: " << getPeerAddress();
652 oss << " Port: " << getPeerPort() << ">";
653 } else {
654 oss << "<Host: " << host_ << " Port: " << port_ << ">";
655 }
Aditya Agarwal4529c4b2007-09-05 01:01:15 +0000656 return oss.str();
657}
658
Mark Sleeb4552922007-11-28 00:12:11 +0000659std::string TSocket::getPeerHost() {
Roger Meier18f10502011-06-04 08:57:43 +0000660 if (peerHost_.empty() && path_.empty()) {
Mark Sleeb4552922007-11-28 00:12:11 +0000661 struct sockaddr_storage addr;
David Reiss23248712010-10-06 17:10:08 +0000662 struct sockaddr* addrPtr;
663 socklen_t addrLen;
Mark Sleeb4552922007-11-28 00:12:11 +0000664
665 if (socket_ < 0) {
666 return host_;
667 }
668
David Reiss23248712010-10-06 17:10:08 +0000669 addrPtr = getCachedAddress(&addrLen);
Mark Sleeb4552922007-11-28 00:12:11 +0000670
David Reiss23248712010-10-06 17:10:08 +0000671 if (addrPtr == NULL) {
672 addrLen = sizeof(addr);
673 if (getpeername(socket_, (sockaddr*) &addr, &addrLen) != 0) {
674 return peerHost_;
675 }
676 addrPtr = (sockaddr*)&addr;
677
678 setCachedAddress(addrPtr, addrLen);
Mark Sleeb4552922007-11-28 00:12:11 +0000679 }
680
681 char clienthost[NI_MAXHOST];
682 char clientservice[NI_MAXSERV];
683
David Reiss23248712010-10-06 17:10:08 +0000684 getnameinfo((sockaddr*) addrPtr, addrLen,
Mark Sleeb4552922007-11-28 00:12:11 +0000685 clienthost, sizeof(clienthost),
686 clientservice, sizeof(clientservice), 0);
687
688 peerHost_ = clienthost;
689 }
690 return peerHost_;
691}
692
693std::string TSocket::getPeerAddress() {
Roger Meier18f10502011-06-04 08:57:43 +0000694 if (peerAddress_.empty() && path_.empty()) {
Mark Sleeb4552922007-11-28 00:12:11 +0000695 struct sockaddr_storage addr;
David Reiss23248712010-10-06 17:10:08 +0000696 struct sockaddr* addrPtr;
697 socklen_t addrLen;
Mark Sleeb4552922007-11-28 00:12:11 +0000698
699 if (socket_ < 0) {
700 return peerAddress_;
701 }
702
David Reiss23248712010-10-06 17:10:08 +0000703 addrPtr = getCachedAddress(&addrLen);
Mark Sleeb4552922007-11-28 00:12:11 +0000704
David Reiss23248712010-10-06 17:10:08 +0000705 if (addrPtr == NULL) {
706 addrLen = sizeof(addr);
707 if (getpeername(socket_, (sockaddr*) &addr, &addrLen) != 0) {
708 return peerAddress_;
709 }
710 addrPtr = (sockaddr*)&addr;
711
712 setCachedAddress(addrPtr, addrLen);
Mark Sleeb4552922007-11-28 00:12:11 +0000713 }
714
715 char clienthost[NI_MAXHOST];
716 char clientservice[NI_MAXSERV];
717
David Reiss23248712010-10-06 17:10:08 +0000718 getnameinfo(addrPtr, addrLen,
Mark Sleeb4552922007-11-28 00:12:11 +0000719 clienthost, sizeof(clienthost),
720 clientservice, sizeof(clientservice),
721 NI_NUMERICHOST|NI_NUMERICSERV);
722
723 peerAddress_ = clienthost;
724 peerPort_ = std::atoi(clientservice);
725 }
726 return peerAddress_;
727}
728
729int TSocket::getPeerPort() {
730 getPeerAddress();
731 return peerPort_;
732}
733
David Reiss23248712010-10-06 17:10:08 +0000734void TSocket::setCachedAddress(const sockaddr* addr, socklen_t len) {
Roger Meier18f10502011-06-04 08:57:43 +0000735 if (!path_.empty()) {
736 return;
737 }
738
David Reiss23248712010-10-06 17:10:08 +0000739 switch (addr->sa_family) {
740 case AF_INET:
741 if (len == sizeof(sockaddr_in)) {
742 memcpy((void*)&cachedPeerAddr_.ipv4, (void*)addr, len);
743 }
744 break;
745
746 case AF_INET6:
747 if (len == sizeof(sockaddr_in6)) {
748 memcpy((void*)&cachedPeerAddr_.ipv6, (void*)addr, len);
749 }
750 break;
751 }
752}
753
754sockaddr* TSocket::getCachedAddress(socklen_t* len) const {
755 switch (cachedPeerAddr_.ipv4.sin_family) {
756 case AF_INET:
757 *len = sizeof(sockaddr_in);
758 return (sockaddr*) &cachedPeerAddr_.ipv4;
759
760 case AF_INET6:
761 *len = sizeof(sockaddr_in6);
762 return (sockaddr*) &cachedPeerAddr_.ipv6;
763
764 default:
765 return NULL;
766 }
767}
768
David Reiss1c20c872010-03-09 05:20:14 +0000769bool TSocket::useLowMinRto_ = false;
770void TSocket::setUseLowMinRto(bool useLowMinRto) {
771 useLowMinRto_ = useLowMinRto;
772}
773bool TSocket::getUseLowMinRto() {
774 return useLowMinRto_;
775}
776
T Jake Lucianib5e62212009-01-31 22:36:20 +0000777}}} // apache::thrift::transport