blob: 3395dabdc5feb7e2540260a4b71e580b8535ca15 [file] [log] [blame]
Gavin McDonald0b75e1a2010-10-28 02:12:01 +00001/*
2 * Licensed to the Apache Software Foundation (ASF) under one
3 * or more contributor license agreements. See the NOTICE file
4 * distributed with this work for additional information
5 * regarding copyright ownership. The ASF licenses this file
6 * to you under the Apache License, Version 2.0 (the
7 * "License"); you may not use this file except in compliance
8 * with the License. You may obtain a copy of the License at
9 *
10 * http://www.apache.org/licenses/LICENSE-2.0
11 *
12 * Unless required by applicable law or agreed to in writing,
13 * software distributed under the License is distributed on an
14 * "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY
15 * KIND, either express or implied. See the License for the
16 * specific language governing permissions and limitations
17 * under the License.
18 */
19
20#include <config.h>
21#include <cstring>
22#include <sstream>
23#include <sys/socket.h>
24#include <sys/poll.h>
25#include <sys/types.h>
26#include <arpa/inet.h>
27#include <netinet/in.h>
28#include <netinet/tcp.h>
29#include <netdb.h>
30#include <unistd.h>
31#include <errno.h>
32#include <fcntl.h>
33
34#include "concurrency/Monitor.h"
35#include "TSocket.h"
36#include "TTransportException.h"
37
38namespace apache { namespace thrift { namespace transport {
39
40using namespace std;
41
// Process-wide tally of socket system calls; TSocket::read() and
// TSocket::write() bump it once per recv()/send() attempt.
uint32_t g_socket_syscalls = 0U;
44
45/**
46 * TSocket implementation.
47 *
48 */
49
50TSocket::TSocket(string host, int port) :
51 host_(host),
52 port_(port),
53 socket_(-1),
54 connTimeout_(0),
55 sendTimeout_(0),
56 recvTimeout_(0),
57 lingerOn_(1),
58 lingerVal_(0),
59 noDelay_(1),
60 maxRecvRetries_(5) {
61 recvTimeval_.tv_sec = (int)(recvTimeout_/1000);
62 recvTimeval_.tv_usec = (int)((recvTimeout_%1000)*1000);
63}
64
65TSocket::TSocket() :
66 host_(""),
67 port_(0),
68 socket_(-1),
69 connTimeout_(0),
70 sendTimeout_(0),
71 recvTimeout_(0),
72 lingerOn_(1),
73 lingerVal_(0),
74 noDelay_(1),
75 maxRecvRetries_(5) {
76 recvTimeval_.tv_sec = (int)(recvTimeout_/1000);
77 recvTimeval_.tv_usec = (int)((recvTimeout_%1000)*1000);
78}
79
80TSocket::TSocket(int socket) :
81 host_(""),
82 port_(0),
83 socket_(socket),
84 connTimeout_(0),
85 sendTimeout_(0),
86 recvTimeout_(0),
87 lingerOn_(1),
88 lingerVal_(0),
89 noDelay_(1),
90 maxRecvRetries_(5) {
91 recvTimeval_.tv_sec = (int)(recvTimeout_/1000);
92 recvTimeval_.tv_usec = (int)((recvTimeout_%1000)*1000);
93}
94
95TSocket::~TSocket() {
96 close();
97}
98
99bool TSocket::isOpen() {
100 return (socket_ >= 0);
101}
102
103bool TSocket::peek() {
104 if (!isOpen()) {
105 return false;
106 }
107 uint8_t buf;
108 int r = recv(socket_, &buf, 1, MSG_PEEK);
109 if (r == -1) {
110 int errno_copy = errno;
111 #ifdef __FreeBSD__
112 /* shigin:
113 * freebsd returns -1 and ECONNRESET if socket was closed by
114 * the other side
115 */
116 if (errno_copy == ECONNRESET)
117 {
118 close();
119 return false;
120 }
121 #endif
122 GlobalOutput.perror("TSocket::peek() recv() " + getSocketInfo(), errno_copy);
123 throw TTransportException(TTransportException::UNKNOWN, "recv()", errno_copy);
124 }
125 return (r > 0);
126}
127
128void TSocket::openConnection(struct addrinfo *res) {
129 if (isOpen()) {
130 throw TTransportException(TTransportException::ALREADY_OPEN);
131 }
132
133 socket_ = socket(res->ai_family, res->ai_socktype, res->ai_protocol);
134 if (socket_ == -1) {
135 int errno_copy = errno;
136 GlobalOutput.perror("TSocket::open() socket() " + getSocketInfo(), errno_copy);
137 throw TTransportException(TTransportException::NOT_OPEN, "socket()", errno_copy);
138 }
139
140 // Send timeout
141 if (sendTimeout_ > 0) {
142 setSendTimeout(sendTimeout_);
143 }
144
145 // Recv timeout
146 if (recvTimeout_ > 0) {
147 setRecvTimeout(recvTimeout_);
148 }
149
150 // Linger
151 setLinger(lingerOn_, lingerVal_);
152
153 // No delay
154 setNoDelay(noDelay_);
155
156 // Set the socket to be non blocking for connect if a timeout exists
157 int flags = fcntl(socket_, F_GETFL, 0);
158 if (connTimeout_ > 0) {
159 if (-1 == fcntl(socket_, F_SETFL, flags | O_NONBLOCK)) {
160 int errno_copy = errno;
161 GlobalOutput.perror("TSocket::open() fcntl() " + getSocketInfo(), errno_copy);
162 throw TTransportException(TTransportException::NOT_OPEN, "fcntl() failed", errno_copy);
163 }
164 } else {
165 if (-1 == fcntl(socket_, F_SETFL, flags & ~O_NONBLOCK)) {
166 int errno_copy = errno;
167 GlobalOutput.perror("TSocket::open() fcntl " + getSocketInfo(), errno_copy);
168 throw TTransportException(TTransportException::NOT_OPEN, "fcntl() failed", errno_copy);
169 }
170 }
171
172 // Connect the socket
173 int ret = connect(socket_, res->ai_addr, res->ai_addrlen);
174
175 // success case
176 if (ret == 0) {
177 goto done;
178 }
179
180 if (errno != EINPROGRESS) {
181 int errno_copy = errno;
182 GlobalOutput.perror("TSocket::open() connect() " + getSocketInfo(), errno_copy);
183 throw TTransportException(TTransportException::NOT_OPEN, "connect() failed", errno_copy);
184 }
185
186
187 struct pollfd fds[1];
188 std::memset(fds, 0 , sizeof(fds));
189 fds[0].fd = socket_;
190 fds[0].events = POLLOUT;
191 ret = poll(fds, 1, connTimeout_);
192
193 if (ret > 0) {
194 // Ensure the socket is connected and that there are no errors set
195 int val;
196 socklen_t lon;
197 lon = sizeof(int);
198 int ret2 = getsockopt(socket_, SOL_SOCKET, SO_ERROR, (void *)&val, &lon);
199 if (ret2 == -1) {
200 int errno_copy = errno;
201 GlobalOutput.perror("TSocket::open() getsockopt() " + getSocketInfo(), errno_copy);
202 throw TTransportException(TTransportException::NOT_OPEN, "getsockopt()", errno_copy);
203 }
204 // no errors on socket, go to town
205 if (val == 0) {
206 goto done;
207 }
208 GlobalOutput.perror("TSocket::open() error on socket (after poll) " + getSocketInfo(), val);
209 throw TTransportException(TTransportException::NOT_OPEN, "socket open() error", val);
210 } else if (ret == 0) {
211 // socket timed out
212 string errStr = "TSocket::open() timed out " + getSocketInfo();
213 GlobalOutput(errStr.c_str());
214 throw TTransportException(TTransportException::NOT_OPEN, "open() timed out");
215 } else {
216 // error on poll()
217 int errno_copy = errno;
218 GlobalOutput.perror("TSocket::open() poll() " + getSocketInfo(), errno_copy);
219 throw TTransportException(TTransportException::NOT_OPEN, "poll() failed", errno_copy);
220 }
221
222 done:
223 // Set socket back to normal mode (blocking)
224 fcntl(socket_, F_SETFL, flags);
225}
226
/**
 * Resolves host_/port_ and connects to the first address that accepts the
 * connection.
 *
 * Every address returned by getaddrinfo() is tried in order through
 * openConnection(); a failure on any but the last address is swallowed
 * after closing the half-opened socket, and the failure on the last
 * address is rethrown.
 *
 * @throws TTransportException ALREADY_OPEN if a descriptor is already
 *         held; NOT_OPEN if the port is outside 0..65535, the host cannot
 *         be resolved, or no address could be connected.
 */
void TSocket::open() {
  if (isOpen()) {
    throw TTransportException(TTransportException::ALREADY_OPEN);
  }

  // Validate port number: 65535 is the largest value a 16-bit port can
  // hold, so 65536 must be rejected as well.
  if (port_ < 0 || port_ > 65535) {
    throw TTransportException(TTransportException::NOT_OPEN, "Specified port is invalid");
  }

  struct addrinfo hints, *res, *res0;
  res = NULL;
  res0 = NULL;
  int error;
  // Large enough for any validated port plus the terminating NUL.
  char port[sizeof("65535")];
  std::memset(&hints, 0, sizeof(hints));
  hints.ai_family = PF_UNSPEC;
  hints.ai_socktype = SOCK_STREAM;
  hints.ai_flags = AI_PASSIVE | AI_ADDRCONFIG;
  sprintf(port, "%d", port_);

  error = getaddrinfo(host_.c_str(), port, &hints, &res0);

  if (error) {
    string errStr = "TSocket::open() getaddrinfo() " + getSocketInfo() + string(gai_strerror(error));
    GlobalOutput(errStr.c_str());
    close();
    throw TTransportException(TTransportException::NOT_OPEN, "Could not resolve host for client socket.");
  }

  // Cycle through all the returned addresses until one
  // connects or push the exception up.
  for (res = res0; res; res = res->ai_next) {
    try {
      openConnection(res);
      break;
    } catch (TTransportException&) {
      // Drop whatever descriptor the failed attempt left behind.
      close();
      if (!res->ai_next) {
        freeaddrinfo(res0); // cleanup on failure
        throw;
      }
    }
  }

  // Free address structure memory
  freeaddrinfo(res0);
}
277
278void TSocket::close() {
279 if (socket_ >= 0) {
280 shutdown(socket_, SHUT_RDWR);
281 ::close(socket_);
282 }
283 socket_ = -1;
284}
285
286uint32_t TSocket::read(uint8_t* buf, uint32_t len) {
287 if (socket_ < 0) {
288 throw TTransportException(TTransportException::NOT_OPEN, "Called read on non-open socket");
289 }
290
291 int32_t retries = 0;
292
293 // EAGAIN can be signalled both when a timeout has occurred and when
294 // the system is out of resources (an awesome undocumented feature).
295 // The following is an approximation of the time interval under which
296 // EAGAIN is taken to indicate an out of resources error.
297 uint32_t eagainThresholdMicros = 0;
298 if (recvTimeout_) {
299 // if a readTimeout is specified along with a max number of recv retries, then
300 // the threshold will ensure that the read timeout is not exceeded even in the
301 // case of resource errors
302 eagainThresholdMicros = (recvTimeout_*1000)/ ((maxRecvRetries_>0) ? maxRecvRetries_ : 2);
303 }
304
305 try_again:
306 // Read from the socket
307 struct timeval begin;
308 gettimeofday(&begin, NULL);
309 int got = recv(socket_, buf, len, 0);
310 int errno_copy = errno; //gettimeofday can change errno
311 struct timeval end;
312 gettimeofday(&end, NULL);
313 uint32_t readElapsedMicros = (((end.tv_sec - begin.tv_sec) * 1000 * 1000)
314 + (((uint64_t)(end.tv_usec - begin.tv_usec))));
315 ++g_socket_syscalls;
316
317 // Check for error on read
318 if (got < 0) {
319 if (errno_copy == EAGAIN) {
320 // check if this is the lack of resources or timeout case
321 if (!eagainThresholdMicros || (readElapsedMicros < eagainThresholdMicros)) {
322 if (retries++ < maxRecvRetries_) {
323 usleep(50);
324 goto try_again;
325 } else {
326 throw TTransportException(TTransportException::TIMED_OUT,
327 "EAGAIN (unavailable resources)");
328 }
329 } else {
330 // infer that timeout has been hit
331 throw TTransportException(TTransportException::TIMED_OUT,
332 "EAGAIN (timed out)");
333 }
334 }
335
336 // If interrupted, try again
337 if (errno_copy == EINTR && retries++ < maxRecvRetries_) {
338 goto try_again;
339 }
340
341 // Now it's not a try again case, but a real probblez
342 GlobalOutput.perror("TSocket::read() recv() " + getSocketInfo(), errno_copy);
343
344 // If we disconnect with no linger time
345 if (errno_copy == ECONNRESET) {
346 #ifdef __FreeBSD__
347 /* shigin: freebsd doesn't follow POSIX semantic of recv and fails with
348 * ECONNRESET if peer performed shutdown
349 */
350 close();
351 return 0;
352 #else
353 throw TTransportException(TTransportException::NOT_OPEN, "ECONNRESET");
354 #endif
355 }
356
357 // This ish isn't open
358 if (errno_copy == ENOTCONN) {
359 throw TTransportException(TTransportException::NOT_OPEN, "ENOTCONN");
360 }
361
362 // Timed out!
363 if (errno_copy == ETIMEDOUT) {
364 throw TTransportException(TTransportException::TIMED_OUT, "ETIMEDOUT");
365 }
366
367 // Some other error, whatevz
368 throw TTransportException(TTransportException::UNKNOWN, "Unknown", errno_copy);
369 }
370
371 // The remote host has closed the socket
372 if (got == 0) {
373 close();
374 return 0;
375 }
376
377 // Pack data into string
378 return got;
379}
380
381void TSocket::write(const uint8_t* buf, uint32_t len) {
382 if (socket_ < 0) {
383 throw TTransportException(TTransportException::NOT_OPEN, "Called write on non-open socket");
384 }
385
386 uint32_t sent = 0;
387
388 while (sent < len) {
389
390 int flags = 0;
391 #ifdef MSG_NOSIGNAL
392 // Note the use of MSG_NOSIGNAL to suppress SIGPIPE errors, instead we
393 // check for the EPIPE return condition and close the socket in that case
394 flags |= MSG_NOSIGNAL;
395 #endif // ifdef MSG_NOSIGNAL
396
397 int b = send(socket_, buf + sent, len - sent, flags);
398 ++g_socket_syscalls;
399
400 // Fail on a send error
401 if (b < 0) {
402 int errno_copy = errno;
403 GlobalOutput.perror("TSocket::write() send() " + getSocketInfo(), errno_copy);
404
405 if (errno == EPIPE || errno == ECONNRESET || errno == ENOTCONN) {
406 close();
407 throw TTransportException(TTransportException::NOT_OPEN, "write() send()", errno_copy);
408 }
409
410 throw TTransportException(TTransportException::UNKNOWN, "write() send()", errno_copy);
411 }
412
413 // Fail on blocked send
414 if (b == 0) {
415 throw TTransportException(TTransportException::NOT_OPEN, "Socket send returned 0.");
416 }
417 sent += b;
418 }
419}
420
421std::string TSocket::getHost() {
422 return host_;
423}
424
425int TSocket::getPort() {
426 return port_;
427}
428
429void TSocket::setHost(string host) {
430 host_ = host;
431}
432
433void TSocket::setPort(int port) {
434 port_ = port;
435}
436
437void TSocket::setLinger(bool on, int linger) {
438 lingerOn_ = on;
439 lingerVal_ = linger;
440 if (socket_ < 0) {
441 return;
442 }
443
444 struct linger l = {(lingerOn_ ? 1 : 0), lingerVal_};
445 int ret = setsockopt(socket_, SOL_SOCKET, SO_LINGER, &l, sizeof(l));
446 if (ret == -1) {
447 int errno_copy = errno; // Copy errno because we're allocating memory.
448 GlobalOutput.perror("TSocket::setLinger() setsockopt() " + getSocketInfo(), errno_copy);
449 }
450}
451
452void TSocket::setNoDelay(bool noDelay) {
453 noDelay_ = noDelay;
454 if (socket_ < 0) {
455 return;
456 }
457
458 // Set socket to NODELAY
459 int v = noDelay_ ? 1 : 0;
460 int ret = setsockopt(socket_, IPPROTO_TCP, TCP_NODELAY, &v, sizeof(v));
461 if (ret == -1) {
462 int errno_copy = errno; // Copy errno because we're allocating memory.
463 GlobalOutput.perror("TSocket::setNoDelay() setsockopt() " + getSocketInfo(), errno_copy);
464 }
465}
466
467void TSocket::setConnTimeout(int ms) {
468 connTimeout_ = ms;
469}
470
471void TSocket::setRecvTimeout(int ms) {
472 if (ms < 0) {
473 char errBuf[512];
474 sprintf(errBuf, "TSocket::setRecvTimeout with negative input: %d\n", ms);
475 GlobalOutput(errBuf);
476 return;
477 }
478 recvTimeout_ = ms;
479
480 if (socket_ < 0) {
481 return;
482 }
483
484 recvTimeval_.tv_sec = (int)(recvTimeout_/1000);
485 recvTimeval_.tv_usec = (int)((recvTimeout_%1000)*1000);
486
487 // Copy because poll may modify
488 struct timeval r = recvTimeval_;
489 int ret = setsockopt(socket_, SOL_SOCKET, SO_RCVTIMEO, &r, sizeof(r));
490 if (ret == -1) {
491 int errno_copy = errno; // Copy errno because we're allocating memory.
492 GlobalOutput.perror("TSocket::setRecvTimeout() setsockopt() " + getSocketInfo(), errno_copy);
493 }
494}
495
496void TSocket::setSendTimeout(int ms) {
497 if (ms < 0) {
498 char errBuf[512];
499 sprintf(errBuf, "TSocket::setSendTimeout with negative input: %d\n", ms);
500 GlobalOutput(errBuf);
501 return;
502 }
503 sendTimeout_ = ms;
504
505 if (socket_ < 0) {
506 return;
507 }
508
509 struct timeval s = {(int)(sendTimeout_/1000),
510 (int)((sendTimeout_%1000)*1000)};
511 int ret = setsockopt(socket_, SOL_SOCKET, SO_SNDTIMEO, &s, sizeof(s));
512 if (ret == -1) {
513 int errno_copy = errno; // Copy errno because we're allocating memory.
514 GlobalOutput.perror("TSocket::setSendTimeout() setsockopt() " + getSocketInfo(), errno_copy);
515 }
516}
517
518void TSocket::setMaxRecvRetries(int maxRecvRetries) {
519 maxRecvRetries_ = maxRecvRetries;
520}
521
522string TSocket::getSocketInfo() {
523 std::ostringstream oss;
524 oss << "<Host: " << host_ << " Port: " << port_ << ">";
525 return oss.str();
526}
527
528std::string TSocket::getPeerHost() {
529 if (peerHost_.empty()) {
530 struct sockaddr_storage addr;
531 socklen_t addrLen = sizeof(addr);
532
533 if (socket_ < 0) {
534 return host_;
535 }
536
537 int rv = getpeername(socket_, (sockaddr*) &addr, &addrLen);
538
539 if (rv != 0) {
540 return peerHost_;
541 }
542
543 char clienthost[NI_MAXHOST];
544 char clientservice[NI_MAXSERV];
545
546 getnameinfo((sockaddr*) &addr, addrLen,
547 clienthost, sizeof(clienthost),
548 clientservice, sizeof(clientservice), 0);
549
550 peerHost_ = clienthost;
551 }
552 return peerHost_;
553}
554
555std::string TSocket::getPeerAddress() {
556 if (peerAddress_.empty()) {
557 struct sockaddr_storage addr;
558 socklen_t addrLen = sizeof(addr);
559
560 if (socket_ < 0) {
561 return peerAddress_;
562 }
563
564 int rv = getpeername(socket_, (sockaddr*) &addr, &addrLen);
565
566 if (rv != 0) {
567 return peerAddress_;
568 }
569
570 char clienthost[NI_MAXHOST];
571 char clientservice[NI_MAXSERV];
572
573 getnameinfo((sockaddr*) &addr, addrLen,
574 clienthost, sizeof(clienthost),
575 clientservice, sizeof(clientservice),
576 NI_NUMERICHOST|NI_NUMERICSERV);
577
578 peerAddress_ = clienthost;
579 peerPort_ = std::atoi(clientservice);
580 }
581 return peerAddress_;
582}
583
584int TSocket::getPeerPort() {
585 getPeerAddress();
586 return peerPort_;
587}
588
589}}} // apache::thrift::transport