2 * InspIRCd -- Internet Relay Chat Daemon
4 * Copyright (C) 2009 Daniel De Graaf <danieldg@inspircd.org>
5 * Copyright (C) 2007-2008 Robin Burchell <robin+git@viroteck.net>
6 * Copyright (C) 2005-2007 Craig Edwards <craigedwards@brainbox.cc>
7 * Copyright (C) 2007 Dennis Friis <peavey@inspircd.org>
9 * This file is part of InspIRCd. InspIRCd is free software: you can
10 * redistribute it and/or modify it under the terms of the GNU General Public
11 * License as published by the Free Software Foundation, version 2.
13 * This program is distributed in the hope that it will be useful, but WITHOUT
14 * ANY WARRANTY; without even the implied warranty of MERCHANTABILITY or FITNESS
15 * FOR A PARTICULAR PURPOSE. See the GNU General Public License for more
18 * You should have received a copy of the GNU General Public License
19 * along with this program. If not, see <http://www.gnu.org/licenses/>.
41 * Event mask for SocketEngine events
45 /** Do not test this socket for readability
47 FD_WANT_NO_READ = 0x1,
48 /** Give a read event at all times when reads will not block.
50 FD_WANT_POLL_READ = 0x2,
51 /** Give a read event when there is new data to read.
53 * An event MUST be sent if there is new data to be read, and the most
54 * recent read/recv() on this FD returned EAGAIN. An event MAY be sent
55 * at any time there is data to be read on the socket.
57 FD_WANT_FAST_READ = 0x4,
58 /** Give an optional read event when reads begin to unblock
60 * This state is useful if you want to leave data in the OS receive
61 * queue but not get continuous event notifications about it, because
62 * it may not require a system call to transition from FD_WANT_FAST_READ
64 FD_WANT_EDGE_READ = 0x8,
66 /** Mask for all read events */
67 FD_WANT_READ_MASK = 0x0F,
69 /** Do not test this socket for writeability
71 FD_WANT_NO_WRITE = 0x10,
72 /** Give a write event at all times when writes will not block.
74 * You probably shouldn't use this state; if it's likely that the write
75 * will not block, try it first, then use FD_WANT_FAST_WRITE if it
76 * fails. If it's likely to block (or you are using polling-style reads)
77 * then use FD_WANT_SINGLE_WRITE.
79 FD_WANT_POLL_WRITE = 0x20,
80 /** Give a write event when writes don't block any more
82 * An event MUST be sent if writes will not block, and the most recent
83 * write/send() on this FD returned EAGAIN, or connect() returned
84 * EINPROGRESS. An event MAY be sent at any time that writes will not
87 * Before calling OnEventHandler*(), a socket engine MAY change the state of
88 * the FD back to FD_WANT_EDGE_WRITE if it is simpler (for example, if a
89 * one-shot notification was registered). If further writes are needed,
90 * it is the responsibility of the event handler to change the state to
91 * one that will generate the required notifications
93 FD_WANT_FAST_WRITE = 0x40,
94 /** Give an optional write event on edge-triggered write unblock.
96 * This state is useful to avoid system calls when moving to/from
97 * FD_WANT_FAST_WRITE when writing data to a mostly-unblocked socket.
99 FD_WANT_EDGE_WRITE = 0x80,
100 /** Request a one-shot poll-style write notification. The socket will
101 * return to the FD_WANT_NO_WRITE state before OnEventHandler*() is called.
103 FD_WANT_SINGLE_WRITE = 0x100,
105 /** Mask for all write events */
106 FD_WANT_WRITE_MASK = 0x1F0,
108 /** Add a trial read. During the next DispatchEvents invocation, this
109 * will call OnEventHandlerRead() unless reads are known to be
112 FD_ADD_TRIAL_READ = 0x1000,
113 /** Assert that reads are known to block. This cancels FD_ADD_TRIAL_READ.
114 * Reset by SE before running OnEventHandlerRead().
116 FD_READ_WILL_BLOCK = 0x2000,
118 /** Add a trial write. During the next DispatchEvents invocation, this
119 * will call OnEventHandlerWrite() unless writes are known to be
122 * This could be used to group several writes together into a single
123 * send() syscall, or to ensure that writes are blocking when attempting
124 * to use FD_WANT_FAST_WRITE.
126 FD_ADD_TRIAL_WRITE = 0x4000,
127 /** Assert that writes are known to block. This cancels FD_ADD_TRIAL_WRITE.
128 * Reset by SE before running OnEventHandlerWrite().
130 FD_WRITE_WILL_BLOCK = 0x8000,
132 /** Mask for trial read/trial write */
133 FD_TRIAL_NOTE_MASK = 0x5000
136 /** This class is a basic I/O handler class.
137 * Any object which wishes to receive basic I/O events
138 * from the socketengine must derive from this class and
139 * implement the OnEventHandler*() methods. The derived class
140 * must then be added to SocketEngine using the method
141 * SocketEngine::AddFd(), after which point the derived
142 * class will receive events to its OnEventHandler*() methods.
143 * The event mask passed to SocketEngine::AddFd() determines
144 * what events the EventHandler gets notified about and with
145 * what semantics. SocketEngine::ChangeEventMask() can be
146 * called to update the event mask later. The only
147 * requirement beyond this for an event handler is that it
148 * must have a file descriptor. What this file descriptor
149 * is actually attached to is completely up to you.
151 class CoreExport EventHandler : public classbase
154 /** Private state maintained by socket engine */
157 void SetEventMask(int mask) { event_mask = mask; }
161 * All events which can be handled must have a file descriptor. This
162 * allows you to add events for sockets, fifo's, pipes, and various
163 * other forms of IPC. Do not change this while the object is
164 * registered with the SocketEngine
168 /** Get the current file descriptor
169 * @return The file descriptor of this handler
171 inline int GetFd() const { return fd; }
173 inline int GetEventMask() const { return event_mask; }
175 /** Set a new file descriptor
176 * @param FD The new file descriptor. Do not call this method without
177 * first deleting the object from the SocketEngine if you have
178 * added it to a SocketEngine instance.
188 virtual ~EventHandler() {}
190 /** Called by the socket engine in case of a read event
192 virtual void OnEventHandlerRead() = 0;
194 /** Called by the socket engine in case of a write event.
195 * The default implementation does nothing.
197 virtual void OnEventHandlerWrite();
199 /** Called by the socket engine in case of an error event.
200 * The default implementation does nothing.
201 * @param errornum Error code
203 virtual void OnEventHandlerError(int errornum);
205 friend class SocketEngine;
208 /** Provides basic file-descriptor-based I/O support.
209 * The actual socketengine class presents the
210 * same interface on all operating systems, but
211 * its private members and internal behaviour
212 * should be treated as blackboxed, and vary
213 * from system to system and upon the config
214 * settings chosen by the server admin.
216 class CoreExport SocketEngine
219 /** Socket engine statistics: count of various events, bandwidth usage
223 mutable size_t indata;
224 mutable size_t outdata;
225 mutable time_t lastempty;
227 /** Reset the byte counters and lastempty if there wasn't a reset in this second.
229 void CheckFlush() const;
232 /** Constructor, initializes member vars except indata and outdata because those are set to 0
233 * in CheckFlush() the first time Update() or GetBandwidth() is called.
235 Statistics() : lastempty(0), TotalEvents(0), ReadEvents(0), WriteEvents(0), ErrorEvents(0) { }
237 /** Update counters for network data received.
238 * This should be called after every read-type syscall.
239 * @param len_in Number of bytes received, or -1 for error, as typically
240 * returned by a read-style syscall.
242 void UpdateReadCounters(int len_in);
244 /** Update counters for network data sent.
245 * This should be called after every write-type syscall.
246 * @param len_out Number of bytes sent, or -1 for error, as typically
247 * returned by a write-style syscall.
249 void UpdateWriteCounters(int len_out);
251 /** Get data transfer statistics.
252 * @param kbitpersec_in Filled with incoming traffic in this second in kbit/s.
253 * @param kbitpersec_out Filled with outgoing traffic in this second in kbit/s.
254 * @param kbitpersec_total Filled with total traffic in this second in kbit/s.
256 void CoreExport GetBandwidth(float& kbitpersec_in, float& kbitpersec_out, float& kbitpersec_total) const;
258 unsigned long TotalEvents;
259 unsigned long ReadEvents;
260 unsigned long WriteEvents;
261 unsigned long ErrorEvents;
265 /** Reference table, contains all current handlers
267 static std::vector<EventHandler*> ref;
269 /** Current number of descriptors in the engine. */
270 static size_t CurrentSetSize;
272 /** The maximum number of descriptors in the engine. */
273 static size_t MaxSetSize;
275 /** List of handlers that want a trial read/write
277 static std::set<int> trials;
279 /** Socket engine statistics: count of various events, bandwidth usage
281 static Statistics stats;
283 /** Look up the fd limit using rlimit. */
284 static void LookupMaxFds();
286 static void OnSetEvent(EventHandler* eh, int old_mask, int new_mask);
288 /** Add an event handler to the base socket engine. AddFd(EventHandler*, int) should call this.
290 static bool AddFdRef(EventHandler* eh);
292 static void DelFdRef(EventHandler* eh);
294 template <typename T>
295 static void ResizeDouble(std::vector<T>& vect)
297 if (SocketEngine::CurrentSetSize > vect.size())
298 vect.resize(vect.size() * 2);
303 typedef iovec IOVector;
305 typedef WindowsIOVec IOVector;
309 * The constructor transparently initializes
310 * the socket engine which the ircd is using.
311 * Please note that if there is a catastrophic
312 * failure (for example, you try and enable
313 * epoll on a 2.4 linux kernel) then this
314 * function may bail back to the shell.
315 * @return void, but it is acceptable for this function to bail back to
316 * the shell or operating system on fatal error.
321 * The destructor transparently tidies up
322 * any resources used by the socket engine.
324 static void Deinit();
326 /** Add an EventHandler object to the engine. Use AddFd to add a file
327 * descriptor to the engine and have the socket engine monitor it. You
328 * must provide an object derived from EventHandler which implements
329 * the required OnEventHandler*() methods.
330 * @param eh An event handling object to add
331 * @param event_mask The initial event mask for the object
333 static bool AddFd(EventHandler* eh, int event_mask);
335 /** If you call this function and pass it an
336 * event handler, that event handler will
337 * receive the next available write event,
338 * even if the socket is a readable socket only.
339 * Developers should avoid constantly keeping
340 * an eventhandler in the writeable state,
341 * as this will consume large amounts of
343 * @param eh The event handler to change
344 * @param event_mask The changes to make to the wait state
346 static void ChangeEventMask(EventHandler* eh, int event_mask);
348 /** Returns the number of file descriptors reported by the system this program may use
349 * when it was started.
350 * @return If non-zero the number of file descriptors that the system reported that we
353 static size_t GetMaxFds() { return MaxSetSize; }
355 /** Returns the number of file descriptors being queried
356 * @return The set size
358 static size_t GetUsedFds() { return CurrentSetSize; }
360 /** Delete an event handler from the engine.
361 * This function call deletes an EventHandler
362 * from the engine. It does not report success
363 * or failure to the caller. This does not free the
364 * EventHandler pointer using delete, if this is
365 * required you must do this yourself.
366 * @param eh The event handler object to remove
368 static void DelFd(EventHandler* eh);
370 /** Returns true if a file descriptor exists in
371 * the socket engine's list.
372 * @param fd The file descriptor to look for
373 * @return True if this fd has an event handler
375 static bool HasFd(int fd);
377 /** Returns the EventHandler attached to a specific fd.
378 * If the fd isn't in the socketengine, returns NULL.
379 * @param fd The file descriptor to look for
380 * @return A pointer to the event handler, or NULL
382 static EventHandler* GetRef(int fd);
384 /** Waits for events and dispatches them to handlers. Please note that
385 * this doesn't wait long, only a couple of milliseconds. It returns the
386 * number of events which occurred during this call. This method will
387 * dispatch events to their handlers by calling their
388 * EventHandler::OnEventHandler*() methods.
389 * @return The number of events which have occurred.
391 static int DispatchEvents();
393 /** Dispatch trial reads and writes. This causes the actual socket I/O
394 * to happen when writes have been pre-buffered.
396 static void DispatchTrialWrites();
398 /** Returns true if the file descriptors in the given event handler are
399 * within sensible ranges which can be handled by the socket engine.
401 static bool BoundsCheckFd(EventHandler* eh);
403 /** Abstraction for BSD sockets accept(2).
404 * This function should emulate its namesake system call exactly.
405 * @param fd This version of the call takes an EventHandler instead of a bare file descriptor.
406 * @param addr The client IP address and port
407 * @param addrlen The size of the sockaddr parameter.
408 * @return This method should return exactly the same values as the system call it emulates.
410 static int Accept(EventHandler* fd, sockaddr *addr, socklen_t *addrlen);
412 /** Close the underlying fd of an event handler, remove it from the socket engine and set the fd to -1.
413 * @param eh The EventHandler to close.
414 * @return 0 on success, a negative value on error
416 static int Close(EventHandler* eh);
418 /** Abstraction for BSD sockets close(2).
419 * This function should emulate its namesake system call exactly.
420 * @param fd The file descriptor to close.
421 * @return This method should return exactly the same values as the system call it emulates.
423 static int Close(int fd);
425 /** Abstraction for BSD sockets send(2).
426 * This function should emulate its namesake system call exactly.
427 * @param fd This version of the call takes an EventHandler instead of a bare file descriptor.
428 * @param buf The buffer in which the data that is sent is stored.
429 * @param len The size of the buffer.
430 * @param flags A flag value that controls the sending of the data.
431 * @return This method should return exactly the same values as the system call it emulates.
433 static int Send(EventHandler* fd, const void *buf, size_t len, int flags);
435 /** Abstraction for vector write function writev().
436 * This function should emulate its namesake system call exactly.
437 * @param fd EventHandler to send data with
438 * @param iov Array of IOVectors containing the buffers to send and their lengths in the platform's
440 * @param count Number of elements in iov.
441 * @return This method should return exactly the same values as the system call it emulates.
443 static int WriteV(EventHandler* fd, const IOVector* iov, int count);
446 /** Abstraction for vector write function writev() that accepts a POSIX format iovec.
447 * This function should emulate its namesake system call exactly.
448 * @param fd EventHandler to send data with
449 * @param iov Array of iovecs containing the buffers to send and their lengths in POSIX format.
450 * @param count Number of elements in iov.
451 * @return This method should return exactly the same values as the system call it emulates.
453 static int WriteV(EventHandler* fd, const iovec* iov, int count);
456 /** Abstraction for BSD sockets recv(2).
457 * This function should emulate its namesake system call exactly.
458 * @param fd This version of the call takes an EventHandler instead of a bare file descriptor.
459 * @param buf The buffer in which the data that is read is stored.
460 * @param len The size of the buffer.
461 * @param flags A flag value that controls the reception of the data.
462 * @return This method should return exactly the same values as the system call it emulates.
464 static int Recv(EventHandler* fd, void *buf, size_t len, int flags);
466 /** Abstraction for BSD sockets recvfrom(2).
467 * This function should emulate its namesake system call exactly.
468 * @param fd This version of the call takes an EventHandler instead of a bare file descriptor.
469 * @param buf The buffer in which the data that is read is stored.
470 * @param len The size of the buffer.
471 * @param flags A flag value that controls the reception of the data.
472 * @param from The remote IP address and port.
473 * @param fromlen The size of the from parameter.
474 * @return This method should return exactly the same values as the system call it emulates.
476 static int RecvFrom(EventHandler* fd, void *buf, size_t len, int flags, sockaddr *from, socklen_t *fromlen);
478 /** Abstraction for BSD sockets sendto(2).
479 * This function should emulate its namesake system call exactly.
480 * @param fd This version of the call takes an EventHandler instead of a bare file descriptor.
481 * @param buf The buffer in which the data that is sent is stored.
482 * @param len The size of the buffer.
483 * @param flags A flag value that controls the sending of the data.
484 * @param to The remote IP address and port.
485 * @param tolen The size of the to parameter.
486 * @return This method should return exactly the same values as the system call it emulates.
488 static int SendTo(EventHandler* fd, const void *buf, size_t len, int flags, const sockaddr *to, socklen_t tolen);
490 /** Abstraction for BSD sockets connect(2).
491 * This function should emulate its namesake system call exactly.
492 * @param fd This version of the call takes an EventHandler instead of a bare file descriptor.
493 * @param serv_addr The server IP address and port.
494 * @param addrlen The size of the sockaddr parameter.
495 * @return This method should return exactly the same values as the system call it emulates.
497 static int Connect(EventHandler* fd, const sockaddr *serv_addr, socklen_t addrlen);
499 /** Make a file descriptor blocking.
500 * @param fd a file descriptor to set to blocking mode
501 * @return 0 on success, -1 on failure, errno is set appropriately.
503 static int Blocking(int fd);
505 /** Make a file descriptor nonblocking.
506 * @param fd A file descriptor to set to nonblocking mode
507 * @return 0 on success, -1 on failure, errno is set appropriately.
509 static int NonBlocking(int fd);
511 /** Abstraction for BSD sockets shutdown(2).
512 * This function should emulate its namesake system call exactly.
513 * @param fd This version of the call takes an EventHandler instead of a bare file descriptor.
514 * @param how What part of the socket to shut down
515 * @return This method should return exactly the same values as the system call it emulates.
517 static int Shutdown(EventHandler* fd, int how);
519 /** Abstraction for BSD sockets shutdown(2).
520 * This function should emulate its namesake system call exactly.
521 * @return This method should return exactly the same values as the system call it emulates.
523 static int Shutdown(int fd, int how);
525 /** Abstraction for BSD sockets bind(2).
526 * This function should emulate its namesake system call exactly.
527 * @return This method should return exactly the same values as the system call it emulates.
529 static int Bind(int fd, const irc::sockets::sockaddrs& addr);
531 /** Abstraction for BSD sockets listen(2).
532 * This function should emulate its namesake system call exactly.
533 * @return This method should return exactly the same values as the system call it emulates.
535 static int Listen(int sockfd, int backlog);
537 /** Set SO_REUSEADDR and SO_LINGER on this file descriptor
539 static void SetReuse(int sockfd);
541 /** This function is called immediately after fork().
542 * Some socket engines (notably kqueue) cannot have their
543 * handles inherited by forked processes. This method
544 * allows for the socket engine to re-create its handle
545 * after the daemon forks as the socket engine is created
546 * long BEFORE the daemon forks.
547 * @return void, but it is acceptable for this function to bail back to
548 * the shell or operating system on fatal error.
550 static void RecoverFromFork();
552 /** Get data transfer and event statistics
554 static const Statistics& GetStats() { return stats; }
556 /** Should we ignore the error in errno?
557 * Checks errno for EAGAIN/EWOULDBLOCK, or WSAGetLastError() for WSAEWOULDBLOCK
559 static bool IgnoreError();
561 /** Return the last socket related error. strerror(errno) on *nix
563 static std::string LastError();
565 /** Returns the error for the given error num, strerror(errnum) on *nix
567 static std::string GetError(int errnum);
570 inline bool SocketEngine::IgnoreError()
572 if ((errno == EAGAIN) || (errno == EWOULDBLOCK))
576 if (WSAGetLastError() == WSAEWOULDBLOCK)