Blame - contrib/fb303/TClientInfo.h - packaging/sources/thrift

blob: 9b2d284f2cbea6e5f4cd5650adb2ce15a88ec821 [file] [log] [blame]

David Reiss	2324871	2010-10-06 17:10:08 +0000	[diff] [blame]	1	/*
				2	* Licensed to the Apache Software Foundation (ASF) under one
				3	* or more contributor license agreements. See the NOTICE file
				4	* distributed with this work for additional information
				5	* regarding copyright ownership. The ASF licenses this file
				6	* to you under the Apache License, Version 2.0 (the
				7	* "License"); you may not use this file except in compliance
				8	* with the License. You may obtain a copy of the License at
				9	*
				10	* http://www.apache.org/licenses/LICENSE-2.0
				11	*
				12	* Unless required by applicable law or agreed to in writing,
				13	* software distributed under the License is distributed on an
				14	* "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY
				15	* KIND, either express or implied. See the License for the
				16	* specific language governing permissions and limitations
				17	* under the License.
				18	*/
				19
				20	#ifndef _FACEBOOK_THRIFT_SERVER_TCLIENTINFO_H_
				21	#define _FACEBOOK_THRIFT_SERVER_TCLIENTINFO_H_ 1
				22
				23	// for inet_ntop --
				24	#include <arpa/inet.h>
				25	#include <server/TServer.h>
				26	#include <transport/TSocket.h>
				27	#include <concurrency/Mutex.h>
				28
				29	namespace apache { namespace thrift { namespace server {
				30
				31	using namespace apache::thrift;
				32	using namespace apache::thrift::transport;
				33	using namespace apache::thrift::concurrency;
				34	using boost::shared_ptr;
				35	using std::string;
				36	using std::vector;
				37
				38	/**
				39	* StableVector -- a minimal vector class where growth is automatic and
				40	* vector elements never move as the vector grows. Allocates new space
				41	* as needed, but does not copy old values.
				42	*
				43	* A level vector stores a list of storage vectors containing the actual
				44	* elements. Levels are added as needed, doubling in size each time.
				45	* Locking is only done when a level is added. Access is amortized
				46	* constant time.
				47	*/
				48	template <typename T>
				49	class StableVector {
				50	/// The initial allocation as an exponent of 2
				51	static const uint32_t kInitialSizePowOf2 = 10;
				52	/// The initial allocation size
				53	static const uint32_t kInitialVectorSize = 1 << kInitialSizePowOf2;
				54	/// This bound is guaranteed not to be exceeded on 64-bit archs
				55	static const int kMaxLevels = 64;
				56
				57	/// Values are kept in one or more of these
				58	typedef vector<T> Vect;
				59	/// One or more value vectors are kept in one of these
				60	typedef vector<Vect*> LevelVector;
				61
				62	Mutex mutex_;
				63	/// current size
				64	size_t size_;
				65	_Atomic_word vectLvl_;
				66	LevelVector vects_;
				67
				68	public:
				69	/**
				70	* Constructor -- initialize the level vector and allocate the
				71	* initial storage vector
				72	*/
				73	StableVector()
				74	: size_(0)
				75	, vectLvl_(0) {
				76	vects_.reserve(kMaxLevels);
				77	Vect* storageVector(new Vect(1 << kInitialSizePowOf2));
				78	vects_.push_back(storageVector);
				79	}
				80
				81	private:
				82	/**
				83	* make sure the requested number of storage levels have been allocated.
				84	*/
				85	void expand(uint32_t level) {
				86	// we need the guard to insure that we only allocate once.
				87	Guard g(mutex_);
				88	while (level > vectLvl_) {
				89	Vect* levelVect(new Vect(1 << (vectLvl_ + kInitialSizePowOf2)));
				90	vects_.push_back(levelVect);
				91	// we need to make sure this is done after levelVect is inserted
				92	// (what we want is effectively a memory barrier here).
				93	__gnu_cxx::__atomic_add(&vectLvl_, 1);
				94	}
				95	}
				96
				97	/**
				98	* Given an index, determine which level and element of that level is
				99	* required. Grows if needed.
				100	*/
				101	void which(uint32_t n, uint32_t* vno, uint32_t* idx) {
				102	if (n >= size_) {
				103	size_ = n + 1;
				104	}
				105	if (n < kInitialVectorSize) {
				106	*idx = n;
				107	*vno = 0;
				108	} else {
				109	uint32_t upper = n >> kInitialSizePowOf2;
				110	vno = CHAR_BITsizeof(upper) - __builtin_clz(upper);
				111	idx = n - (1 << (vno + kInitialSizePowOf2 - 1));
				112	if (*vno > vectLvl_) {
				113	expand(*vno);
				114	}
				115	}
				116	}
				117
				118	public:
				119	/**
				120	* Given an index, return a reference to that element, perhaps after
				121	* allocating additional space.
				122	*
				123	* @param n a positive integer
				124	*/
				125	T& operator[](uint32_t n) {
				126	uint32_t vno;
				127	uint32_t idx;
				128	which(n, &vno, &idx);
				129	return (*vects_[vno])[idx];
				130	}
				131
				132	/**
				133	* Return the present size of the vector.
				134	*/
				135	size_t size() const { return size_; }
				136	};
				137
				138
				139	/**
				140	* This class embodies the representation of a single connection during
				141	* processing. We'll keep one of these per file descriptor in TClientInfo.
				142	*/
				143	class TClientInfoConnection {
				144	public:
				145	const static int kNameLen = 32;
				146
				147	private:
				148	typedef union IPAddrUnion {
				149	sockaddr_in ipv4;
				150	sockaddr_in6 ipv6;
				151	};
				152
				153	char call_[kNameLen]; ///< The name of the thrift call
				154	IPAddrUnion addr_; ///< The client's IP address
				155	timespec time_; ///< Time processing started
				156	uint64_t ncalls_; ///< # of calls processed
				157
				158	public:
				159	/**
				160	* Constructor; insure that no client address or thrift call name is
				161	* represented.
				162	*/
				163	TClientInfoConnection();
				164
				165	/**
				166	* A connection has been made; record its address. Since this is the
				167	* first we'll know of a connection we start the timer here as well.
				168	*/
				169	void recordAddr(const sockaddr* addr);
				170
				171	/**
				172	* Mark the address as empty/unknown.
				173	*/
				174	void eraseAddr();
				175
				176	/**
				177	* Return a string representing the present address, or NULL if none.
				178	* Copies the string into the buffer provided.
				179	*/
				180	const char* getAddr(char* buf, int len) const;
				181
				182	/**
				183	* A call has been made on this connection; record its name. Since this is
				184	* called for every thrift call processed, we also do our call count here.
				185	*/
				186	void recordCall(const char* name);
				187
				188	/**
				189	* Invoked when processing has ended to clear the call name.
				190	*/
				191	void eraseCall();
				192
				193	/**
				194	* Return as string the thrift call either currently being processed or
				195	* most recently processed if the connection is still open for additonal
				196	* calls. Returns NULL if a call hasn't been made yet or processing
				197	* has ended.
				198	*/
				199	const char* getCall() const;
				200
				201	/**
				202	* Get the timespec for the start of this connection (specifically, when
				203	* recordAddr() was first called).
				204	*/
				205	void getTime(timespec* time) const;
				206
				207	/**
				208	* Return the number of calls made on this connection.
				209	*/
				210	uint64_t getNCalls() const;
				211
				212	private:
				213	void initTime();
				214	};
				215
				216
				217	/**
				218	* Store for info about a server's clients -- specifically, the client's IP
				219	* address and the call it is executing. This information is indexed by
				220	* socket file descriptor and in the present implementation is updated
				221	* asynchronously, so it may only approximate reality.
				222	*/
				223	class TClientInfo {
				224	private:
				225	StableVector<TClientInfoConnection> info_;
				226
				227	public:
				228	/**
				229	* Return the info object for a given file descriptor. If "grow" is true
				230	* extend the info vector if required (such as for a file descriptor not seen
				231	* before). If "grow" is false and the info vector isn't large enough,
				232	* or if "fd" is negative, return NULL.
				233	*/
				234	TClientInfoConnection* getConnection(int fd, bool grow);
				235
				236	size_t size() const;
				237	};
				238
				239	/**
				240	* This derivation of TServerEventHandler encapsulates the main status vector
				241	* and provides context to the server's processing loop via overrides.
				242	* Together with TClientInfoCallHandler (derived from TProcessorEventHandler)
				243	* it integrates client info collection into the server.
				244	*/
				245	class TClientInfoServerHandler : public TServerEventHandler {
				246	private:
				247	TClientInfo clientInfo_;
				248
				249	public:
				250	/**
				251	* One of these is constructed for each open connection/descriptor and links
				252	* to both the status vector (clientInfo_) and that descriptor's entry
				253	* within it.
				254	*/
				255	struct Connect {
				256	TClientInfo* clientInfo_;
				257	TClientInfoConnection* callInfo_;
				258
				259	explicit Connect(TClientInfo* clientInfo)
				260	: clientInfo_(clientInfo)
				261	, callInfo_(NULL) {
				262	}
				263	};
				264
				265	/**
				266	* Generate processor context; we don't know what descriptor we belong to
				267	* yet -- we'll get hooked up in contextProcess().
				268	*/
				269	void* createContext(boost::shared_ptr<TProtocol> input,
				270	boost::shared_ptr<TProtocol> output);
				271
				272	/**
				273	* Mark our slot as unused and delete the context created in createContext().
				274	*/
				275	void deleteContext(void* processorContext,
				276	boost::shared_ptr<TProtocol> input,
				277	boost::shared_ptr<TProtocol> output);
				278
				279	/**
				280	* Called in the processing loop just before the server invokes the
				281	* processor itself, on the first call we establish which descriptor
				282	* we correspond to and set it to that socket's peer IP address. This
				283	* also has the side effect of initializing call counting and connection
				284	* timing. We won't know which call we're handling until the handler
				285	* first gets called in TClientInfoCallHandler::getContext().
				286	*/
				287	void processContext(void* processorContext,
				288	shared_ptr<TTransport> transport);
				289
				290	/**
				291	* Get status report for server in the form of a vector of strings.
				292	* Each active client appears as one string in the format:
				293	*
				294	* FD IPADDR CALLNAME DURATION NCALLS
				295	*
				296	* where "FD" is the file descriptor for the client's socket, "IPADDR"
				297	* is the IP address (as reported by accept()), "CALLNAME" is the
				298	* current or most recent Thrift function name, "DURATION" is the
				299	* duration of the connection, while NCALLS is the number of Thrift
				300	* calls made since the connection was made. A single space separates
				301	* fields.
				302	*/
				303	void getStatsStrings(vector<string>& result);
				304	};
				305
				306	/**
				307	* This class derives from TProcessorEventHandler to gain access to the
				308	* function name for the current Thrift call. We need two versions of
				309	* this -- TClientInfoCallStatsHandler is the other -- since in the latter
				310	* case we pass through to TFunctionStatHandler to perform Thrift call
				311	* stats.
				312	*/
				313	class TClientInfoCallHandler : public TProcessorEventHandler {
				314	public:
				315	virtual void* getContext(const char* fn_name, void* serverContext);
				316	};
				317
				318	} } } // namespace apache::thrift::server
				319
				320	#endif // !_FACEBOOK_THRIFT_SERVER_TCLIENTINFO_H_