// Copyright (c) 2006- Facebook
// Distributed under the Thrift Software License
//
// See accompanying file LICENSE or visit the Thrift site at:
// http://developers.facebook.com/thrift/

#include <config.h>

#include <sys/socket.h>
#include <sys/select.h>
#include <arpa/inet.h>
#include <netinet/in.h>
#include <netinet/tcp.h>
#include <netdb.h>
#include <unistd.h>
#include <errno.h>
#include <fcntl.h>
#include <stdio.h>
#include <string.h>

#include "concurrency/Monitor.h"
#include "TSocket.h"
#include "TTransportException.h"
Mark Sleee8540632006-05-30 09:24:40 +000021
Marc Slemko6f038a72006-08-03 18:58:09 +000022namespace facebook { namespace thrift { namespace transport {
23
Mark Sleee8540632006-05-30 09:24:40 +000024using namespace std;
Mark Slee29050782006-09-29 00:12:30 +000025using namespace facebook::thrift::concurrency;
Mark Sleee8540632006-05-30 09:24:40 +000026
Mark Slee29050782006-09-29 00:12:30 +000027// Global var to track total socket sys calls
Mark Slee8d7e1f62006-06-07 06:48:56 +000028uint32_t g_socket_syscalls = 0;
29
30/**
31 * TSocket implementation.
32 *
33 * @author Mark Slee <mcslee@facebook.com>
34 */
35
Mark Sleee8540632006-05-30 09:24:40 +000036// Mutex to protect syscalls to netdb
Mark Slee29050782006-09-29 00:12:30 +000037static Monitor s_netdb_monitor;
Mark Sleee8540632006-05-30 09:24:40 +000038
39// TODO(mcslee): Make this an option to the socket class
40#define MAX_RECV_RETRIES 20
Mark Slee29050782006-09-29 00:12:30 +000041
42TSocket::TSocket(string host, int port) :
43 host_(host),
44 port_(port),
Martin Kraemeree341cb2007-02-05 21:40:38 +000045 socket_(-1),
Mark Slee29050782006-09-29 00:12:30 +000046 connTimeout_(0),
47 sendTimeout_(0),
48 recvTimeout_(0),
49 lingerOn_(1),
50 lingerVal_(0),
51 noDelay_(1) {
Mark Sleeb9ff32a2006-11-16 01:00:24 +000052 recvTimeval_.tv_sec = (int)(recvTimeout_/1000);
53 recvTimeval_.tv_usec = (int)((recvTimeout_%1000)*1000);
Mark Sleee8540632006-05-30 09:24:40 +000054}
55
Aditya Agarwalebc99e02007-01-15 23:14:58 +000056TSocket::TSocket() :
57 host_(""),
58 port_(0),
Martin Kraemeree341cb2007-02-05 21:40:38 +000059 socket_(-1),
Aditya Agarwalebc99e02007-01-15 23:14:58 +000060 connTimeout_(0),
61 sendTimeout_(0),
62 recvTimeout_(0),
63 lingerOn_(1),
64 lingerVal_(0),
65 noDelay_(1) {
66 recvTimeval_.tv_sec = (int)(recvTimeout_/1000);
67 recvTimeval_.tv_usec = (int)((recvTimeout_%1000)*1000);
68}
69
Mark Slee29050782006-09-29 00:12:30 +000070TSocket::TSocket(int socket) :
71 host_(""),
72 port_(0),
73 socket_(socket),
74 connTimeout_(0),
75 sendTimeout_(0),
76 recvTimeout_(0),
77 lingerOn_(1),
78 lingerVal_(0),
79 noDelay_(1) {
Mark Sleeb9ff32a2006-11-16 01:00:24 +000080 recvTimeval_.tv_sec = (int)(recvTimeout_/1000);
81 recvTimeval_.tv_usec = (int)((recvTimeout_%1000)*1000);
Mark Slee29050782006-09-29 00:12:30 +000082}
83
Mark Sleee8540632006-05-30 09:24:40 +000084TSocket::~TSocket() {
85 close();
86}
87
Mark Slee8d7e1f62006-06-07 06:48:56 +000088bool TSocket::isOpen() {
Martin Kraemeree341cb2007-02-05 21:40:38 +000089 return (socket_ >= 0);
Mark Slee8d7e1f62006-06-07 06:48:56 +000090}
91
Mark Sleeb9ff32a2006-11-16 01:00:24 +000092bool TSocket::peek() {
93 if (!isOpen()) {
94 return false;
95 }
96 uint8_t buf;
97 int r = recv(socket_, &buf, 1, MSG_PEEK);
98 if (r == -1) {
99 perror("TSocket::peek()");
100 close();
Mark Sleef9831082007-02-20 20:59:21 +0000101 throw TTransportException(TTransportException::UNKNOWN, "recv() ERROR:" + errno);
Mark Sleeb9ff32a2006-11-16 01:00:24 +0000102 }
103 return (r > 0);
104}
105
Mark Slee8d7e1f62006-06-07 06:48:56 +0000106void TSocket::open() {
Mark Sleea9848d72007-02-21 04:54:05 +0000107 if (isOpen()) {
108 throw TTransportException(TTransportException::ALREADY_OPEN);
109 }
110
Mark Sleee8540632006-05-30 09:24:40 +0000111 // Create socket
112 socket_ = socket(AF_INET, SOCK_STREAM, 0);
113 if (socket_ == -1) {
Mark Slee8d7e1f62006-06-07 06:48:56 +0000114 perror("TSocket::open() socket");
115 close();
Mark Sleef9831082007-02-20 20:59:21 +0000116 throw TTransportException(TTransportException::NOT_OPEN, "socket() ERROR:" + errno);
Mark Sleee8540632006-05-30 09:24:40 +0000117 }
Mark Slee29050782006-09-29 00:12:30 +0000118
119 // Send timeout
120 if (sendTimeout_ > 0) {
121 setSendTimeout(sendTimeout_);
122 }
123
124 // Recv timeout
125 if (recvTimeout_ > 0) {
126 setRecvTimeout(recvTimeout_);
127 }
128
129 // Linger
130 setLinger(lingerOn_, lingerVal_);
131
132 // No delay
133 setNoDelay(noDelay_);
134
Mark Slee8d7e1f62006-06-07 06:48:56 +0000135 // Lookup the hostname
Mark Sleee8540632006-05-30 09:24:40 +0000136 struct sockaddr_in addr;
137 addr.sin_family = AF_INET;
138 addr.sin_port = htons(port_);
139
Mark Sleee8540632006-05-30 09:24:40 +0000140 {
Mark Slee29050782006-09-29 00:12:30 +0000141 // Scope lock on host entry lookup
142 Synchronized s(s_netdb_monitor);
Mark Sleee8540632006-05-30 09:24:40 +0000143 struct hostent *host_entry = gethostbyname(host_.c_str());
144
145 if (host_entry == NULL) {
Mark Slee29050782006-09-29 00:12:30 +0000146 perror("TSocket: dns error: failed call to gethostbyname.");
Mark Sleee8540632006-05-30 09:24:40 +0000147 close();
Mark Sleef9831082007-02-20 20:59:21 +0000148 throw TTransportException(TTransportException::NOT_OPEN, "gethostbyname() failed");
Mark Sleee8540632006-05-30 09:24:40 +0000149 }
150
151 addr.sin_port = htons(port_);
152 memcpy(&addr.sin_addr.s_addr,
153 host_entry->h_addr_list[0],
154 host_entry->h_length);
155 }
Mark Slee29050782006-09-29 00:12:30 +0000156
157 // Set the socket to be non blocking for connect if a timeout exists
158 int flags = fcntl(socket_, F_GETFL, 0);
159 if (connTimeout_ > 0) {
160 fcntl(socket_, F_SETFL, flags | O_NONBLOCK);
161 } else {
162 fcntl(socket_, F_SETFL, flags | ~O_NONBLOCK);
163 }
164
165 // Conn timeout
166 struct timeval c = {(int)(connTimeout_/1000),
167 (int)((connTimeout_%1000)*1000)};
Mark Sleee8540632006-05-30 09:24:40 +0000168
169 // Connect the socket
170 int ret = connect(socket_, (struct sockaddr *)&addr, sizeof(addr));
171
Mark Slee29050782006-09-29 00:12:30 +0000172 if (ret == 0) {
173 goto done;
174 }
175
176 if (errno != EINPROGRESS) {
Mark Sleee8540632006-05-30 09:24:40 +0000177 close();
Mark Slee29050782006-09-29 00:12:30 +0000178 char buff[1024];
179 sprintf(buff, "TSocket::open() connect %s %d", host_.c_str(), port_);
180 perror(buff);
Mark Sleef9831082007-02-20 20:59:21 +0000181 throw TTransportException(TTransportException::NOT_OPEN, "open() ERROR: " + errno);
Mark Sleee8540632006-05-30 09:24:40 +0000182 }
183
Mark Slee29050782006-09-29 00:12:30 +0000184 fd_set fds;
185 FD_ZERO(&fds);
186 FD_SET(socket_, &fds);
187 ret = select(socket_+1, NULL, &fds, NULL, &c);
188
189 if (ret > 0) {
190 // Ensure connected
191 int val;
192 socklen_t lon;
193 lon = sizeof(int);
194 int ret2 = getsockopt(socket_, SOL_SOCKET, SO_ERROR, (void *)&val, &lon);
195 if (ret2 == -1) {
196 close();
197 perror("TSocket::open() getsockopt SO_ERROR");
Mark Sleef9831082007-02-20 20:59:21 +0000198 throw TTransportException(TTransportException::NOT_OPEN, "open() ERROR: " + errno);
Mark Slee29050782006-09-29 00:12:30 +0000199 }
200 if (val == 0) {
201 goto done;
202 }
203 close();
204 perror("TSocket::open() SO_ERROR was set");
Mark Sleef9831082007-02-20 20:59:21 +0000205 throw TTransportException(TTransportException::NOT_OPEN, "open() ERROR: " + errno);
Mark Slee29050782006-09-29 00:12:30 +0000206 } else if (ret == 0) {
207 close();
208 perror("TSocket::open() timeed out");
Mark Sleef9831082007-02-20 20:59:21 +0000209 throw TTransportException(TTransportException::NOT_OPEN, "open() ERROR: " + errno);
Mark Slee29050782006-09-29 00:12:30 +0000210 } else {
211 close();
212 perror("TSocket::open() select error");
Mark Sleef9831082007-02-20 20:59:21 +0000213 throw TTransportException(TTransportException::NOT_OPEN, "open() ERROR: " + errno);
Mark Slee29050782006-09-29 00:12:30 +0000214 }
215
216 done:
217 // Set socket back to normal mode (blocking)
218 fcntl(socket_, F_SETFL, flags);
Mark Sleee8540632006-05-30 09:24:40 +0000219}
220
221void TSocket::close() {
Martin Kraemeree341cb2007-02-05 21:40:38 +0000222 if (socket_ >= 0) {
Mark Sleee8540632006-05-30 09:24:40 +0000223 shutdown(socket_, SHUT_RDWR);
224 ::close(socket_);
225 }
Martin Kraemeree341cb2007-02-05 21:40:38 +0000226 socket_ = -1;
Mark Sleee8540632006-05-30 09:24:40 +0000227}
228
Mark Slee8d7e1f62006-06-07 06:48:56 +0000229uint32_t TSocket::read(uint8_t* buf, uint32_t len) {
Martin Kraemeree341cb2007-02-05 21:40:38 +0000230 if (socket_ < 0) {
Mark Sleef9831082007-02-20 20:59:21 +0000231 throw TTransportException(TTransportException::NOT_OPEN, "Called read on non-open socket");
Mark Slee8d7e1f62006-06-07 06:48:56 +0000232 }
Mark Sleee8540632006-05-30 09:24:40 +0000233
Mark Sleee8540632006-05-30 09:24:40 +0000234 uint32_t retries = 0;
Mark Slee8d7e1f62006-06-07 06:48:56 +0000235
236 try_again:
237 // Read from the socket
238 int got = recv(socket_, buf, len, 0);
239 ++g_socket_syscalls;
240
241 // Check for error on read
Mark Sleec4257802007-01-24 23:14:30 +0000242 if (got < 0) {
Mark Slee8d7e1f62006-06-07 06:48:56 +0000243 // If temporarily out of resources, sleep a bit and try again
244 if (errno == EAGAIN && retries++ < MAX_RECV_RETRIES) {
245 usleep(50);
246 goto try_again;
Mark Sleee8540632006-05-30 09:24:40 +0000247 }
248
Mark Slee8d7e1f62006-06-07 06:48:56 +0000249 // If interrupted, try again
250 if (errno == EINTR && retries++ < MAX_RECV_RETRIES) {
251 goto try_again;
Mark Sleee8540632006-05-30 09:24:40 +0000252 }
253
Mark Sleec4257802007-01-24 23:14:30 +0000254 // Now it's not a try again case, but a real probblez
255 perror("TSocket::read()");
256
Mark Slee8d7e1f62006-06-07 06:48:56 +0000257 // If we disconnect with no linger time
258 if (errno == ECONNRESET) {
Mark Sleef9831082007-02-20 20:59:21 +0000259 throw TTransportException(TTransportException::NOT_OPEN, "ECONNRESET");
Mark Slee8d7e1f62006-06-07 06:48:56 +0000260 }
261
262 // This ish isn't open
263 if (errno == ENOTCONN) {
Mark Sleef9831082007-02-20 20:59:21 +0000264 throw TTransportException(TTransportException::NOT_OPEN, "ENOTCONN");
Mark Slee8d7e1f62006-06-07 06:48:56 +0000265 }
266
267 // Timed out!
268 if (errno == ETIMEDOUT) {
Mark Sleef9831082007-02-20 20:59:21 +0000269 throw TTransportException(TTransportException::TIMED_OUT, "ETIMEDOUT");
Mark Slee8d7e1f62006-06-07 06:48:56 +0000270 }
271
272 // Some other error, whatevz
Mark Sleef9831082007-02-20 20:59:21 +0000273 throw TTransportException(TTransportException::UNKNOWN, "ERROR:" + errno);
Mark Slee8d7e1f62006-06-07 06:48:56 +0000274 }
275
276 // The remote host has closed the socket
277 if (got == 0) {
278 close();
279 return 0;
Mark Sleee8540632006-05-30 09:24:40 +0000280 }
281
282 // Pack data into string
Mark Slee8d7e1f62006-06-07 06:48:56 +0000283 return got;
Mark Sleee8540632006-05-30 09:24:40 +0000284}
285
Mark Slee8d7e1f62006-06-07 06:48:56 +0000286void TSocket::write(const uint8_t* buf, uint32_t len) {
Martin Kraemeree341cb2007-02-05 21:40:38 +0000287 if (socket_ < 0) {
Mark Sleef9831082007-02-20 20:59:21 +0000288 throw TTransportException(TTransportException::NOT_OPEN, "Called write on non-open socket");
Mark Slee8d7e1f62006-06-07 06:48:56 +0000289 }
290
Mark Sleee8540632006-05-30 09:24:40 +0000291 uint32_t sent = 0;
292
Mark Slee8d7e1f62006-06-07 06:48:56 +0000293 while (sent < len) {
Marc Slemko9d4a3e22006-07-21 19:53:48 +0000294
295 int flags = 0;
Mark Slee29050782006-09-29 00:12:30 +0000296 #ifdef MSG_NOSIGNAL
Mark Slee8d7e1f62006-06-07 06:48:56 +0000297 // Note the use of MSG_NOSIGNAL to suppress SIGPIPE errors, instead we
298 // check for the EPIPE return condition and close the socket in that case
Marc Slemko9d4a3e22006-07-21 19:53:48 +0000299 flags |= MSG_NOSIGNAL;
Mark Slee29050782006-09-29 00:12:30 +0000300 #endif // ifdef MSG_NOSIGNAL
Marc Slemko9d4a3e22006-07-21 19:53:48 +0000301
302 int b = send(socket_, buf + sent, len - sent, flags);
Mark Slee8d7e1f62006-06-07 06:48:56 +0000303 ++g_socket_syscalls;
304
Mark Sleee8540632006-05-30 09:24:40 +0000305 // Fail on a send error
306 if (b < 0) {
Mark Slee8d7e1f62006-06-07 06:48:56 +0000307 if (errno == EPIPE) {
308 close();
Mark Sleef9831082007-02-20 20:59:21 +0000309 throw TTransportException(TTransportException::NOT_OPEN, "EPIPE");
Mark Slee8d7e1f62006-06-07 06:48:56 +0000310 }
311
312 if (errno == ECONNRESET) {
313 close();
Mark Sleef9831082007-02-20 20:59:21 +0000314 throw TTransportException(TTransportException::NOT_OPEN, "ECONNRESET");
Mark Slee8d7e1f62006-06-07 06:48:56 +0000315 }
316
317 if (errno == ENOTCONN) {
318 close();
Mark Sleef9831082007-02-20 20:59:21 +0000319 throw TTransportException(TTransportException::NOT_OPEN, "ENOTCONN");
Mark Slee8d7e1f62006-06-07 06:48:56 +0000320 }
321
322 perror("TSocket::write() send < 0");
Mark Sleef9831082007-02-20 20:59:21 +0000323 throw TTransportException(TTransportException::UNKNOWN, "ERROR:" + errno);
Mark Sleee8540632006-05-30 09:24:40 +0000324 }
325
326 // Fail on blocked send
327 if (b == 0) {
Mark Sleef9831082007-02-20 20:59:21 +0000328 throw TTransportException(TTransportException::NOT_OPEN, "Socket send returned 0.");
Mark Sleee8540632006-05-30 09:24:40 +0000329 }
Mark Sleee8540632006-05-30 09:24:40 +0000330 sent += b;
331 }
332}
333
Aditya Agarwalebc99e02007-01-15 23:14:58 +0000334void TSocket::setHost(string host) {
335 host_ = host;
336}
337
338void TSocket::setPort(int port) {
339 port_ = port;
340}
341
Mark Slee8d7e1f62006-06-07 06:48:56 +0000342void TSocket::setLinger(bool on, int linger) {
Mark Slee29050782006-09-29 00:12:30 +0000343 lingerOn_ = on;
344 lingerVal_ = linger;
Martin Kraemeree341cb2007-02-05 21:40:38 +0000345 if (socket_ < 0) {
Mark Slee8d7e1f62006-06-07 06:48:56 +0000346 return;
347 }
348
Mark Slee29050782006-09-29 00:12:30 +0000349 struct linger l = {(lingerOn_ ? 1 : 0), lingerVal_};
350 int ret = setsockopt(socket_, SOL_SOCKET, SO_LINGER, &l, sizeof(l));
351 if (ret == -1) {
Mark Sleee8540632006-05-30 09:24:40 +0000352 perror("TSocket::setLinger()");
Mark Sleee8540632006-05-30 09:24:40 +0000353 }
Mark Sleee8540632006-05-30 09:24:40 +0000354}
355
Mark Slee8d7e1f62006-06-07 06:48:56 +0000356void TSocket::setNoDelay(bool noDelay) {
Mark Slee29050782006-09-29 00:12:30 +0000357 noDelay_ = noDelay;
Martin Kraemeree341cb2007-02-05 21:40:38 +0000358 if (socket_ < 0) {
Mark Slee8d7e1f62006-06-07 06:48:56 +0000359 return;
360 }
361
Mark Sleee8540632006-05-30 09:24:40 +0000362 // Set socket to NODELAY
Mark Slee29050782006-09-29 00:12:30 +0000363 int v = noDelay_ ? 1 : 0;
364 int ret = setsockopt(socket_, IPPROTO_TCP, TCP_NODELAY, &v, sizeof(v));
365 if (ret == -1) {
Mark Sleee8540632006-05-30 09:24:40 +0000366 perror("TSocket::setNoDelay()");
Mark Sleee8540632006-05-30 09:24:40 +0000367 }
Mark Sleee8540632006-05-30 09:24:40 +0000368}
Mark Slee29050782006-09-29 00:12:30 +0000369
370void TSocket::setConnTimeout(int ms) {
371 connTimeout_ = ms;
372}
373
374void TSocket::setRecvTimeout(int ms) {
375 recvTimeout_ = ms;
Mark Sleeb9ff32a2006-11-16 01:00:24 +0000376 recvTimeval_.tv_sec = (int)(recvTimeout_/1000);
377 recvTimeval_.tv_usec = (int)((recvTimeout_%1000)*1000);
Martin Kraemeree341cb2007-02-05 21:40:38 +0000378 if (socket_ < 0) {
Mark Slee29050782006-09-29 00:12:30 +0000379 return;
380 }
381
Mark Sleeb9ff32a2006-11-16 01:00:24 +0000382 // Copy because select may modify
383 struct timeval r = recvTimeval_;
Mark Slee29050782006-09-29 00:12:30 +0000384 int ret = setsockopt(socket_, SOL_SOCKET, SO_RCVTIMEO, &r, sizeof(r));
385 if (ret == -1) {
386 perror("TSocket::setRecvTimeout()");
387 }
388}
389
390void TSocket::setSendTimeout(int ms) {
391 sendTimeout_ = ms;
Martin Kraemeree341cb2007-02-05 21:40:38 +0000392 if (socket_ < 0) {
Mark Slee29050782006-09-29 00:12:30 +0000393 return;
394 }
395
396 struct timeval s = {(int)(sendTimeout_/1000),
397 (int)((sendTimeout_%1000)*1000)};
398 int ret = setsockopt(socket_, SOL_SOCKET, SO_SNDTIMEO, &s, sizeof(s));
399 if (ret == -1) {
400 perror("TSocket::setSendTimeout()");
401 }
402}
403
Marc Slemko6f038a72006-08-03 18:58:09 +0000404}}} // facebook::thrift::transport