1 /* +------------------------------------+
2 * | Inspire Internet Relay Chat Daemon |
3 * +------------------------------------+
5 * InspIRCd: (C) 2002-2009 InspIRCd Development Team
6 * See: http://www.inspircd.org/wiki/index.php/Credits
8 * This program is free but copyrighted software; see
9 * the file COPYING for details.
11 * ---------------------------------------------------
14 /* Contains code from Unreal IRCd + the Bynets patch ( http://www.unrealircd.com/ and http://www.bynets.org/ )
15 The original patch was made by Dmitry "Killer{R}" Kononko. ( http://killprog.com/ )
16 Changed at 2008-06-15 - 2009-02-11
17 by Chernov-Phoenix Alexey (Phoenix@RusNet) mailto:phoenix /email address separator/ pravmail.ru */
23 /* $ModDesc: Provides an ability to have non-RFC1459 nicks & support for national CASEMAPPING */
/* Nick-validation functor: a HandlerBase2<bool, const char*, size_t> whose
 * Call() is defined out of line further down in this file.
 * NOTE(review): the braces, access specifiers and the declaration of the
 * Server member that the constructor initialises are on lines that are not
 * visible in this excerpt. */
25 class lwbNickHandler : public HandlerBase2<bool, const char*, size_t>
/* Stores the given server pointer in the Server member. */
29 lwbNickHandler(InspIRCd* Srv) : Server(Srv) { }
30 virtual ~lwbNickHandler() { }
/* Takes the candidate nick and a size_t limit; returns bool. */
31 virtual bool Call(const char*, size_t);
/* File-level lookup tables, 256 bytes each, read by lwbNickHandler::Call().
 *   m_reverse_additional     - indexed by byte value; rebuilt by makereverse()
 *                              from the module table m_additional.
 *   m_additionalMB           - two-byte character ranges, 4 bytes per entry.
 *   m_additionalUtf8         - list of individual UTF-8 characters.
 *   m_additionalUtf8range    - UTF-8 start character followed by a length byte.
 *   m_additionalUtf8interval - UTF-8 start character followed by end character.
 * All but m_reverse_additional are filled by loadtables() from the charset file. */
34 /*,m_reverse_additionalUp[256];*/
35 static unsigned char m_reverse_additional[256],m_additionalMB[256],m_additionalUtf8[256],m_additionalUtf8range[256],m_additionalUtf8interval[256];
/* Checks up to cnt bytes starting at mb as UTF-8 continuation bytes; each
 * one must have the bit pattern 10xxxxxx.
 * mb  - first continuation byte (the byte after the lead byte).
 * cnt - number of continuation bytes expected.
 * The return statements are not visible in this excerpt. Callers treat -1
 * as the failure value, so presumably -1 is returned on the first mismatch
 * and a sequence length otherwise -- TODO confirm against the full file.
 * NOTE(review): nothing here knows how long the buffer behind mb is; the
 * loop relies on a non-matching byte (such as a terminating zero) to stop
 * before the end of the nick or table. */
37 char utf8checkrest(unsigned char * mb, unsigned char cnt)
39 for (unsigned char * tmp=mb; tmp<mb+cnt; tmp++)
41 /* & is faster! -- Phoenix (char & b11000000 == b10000000) */
42 if ((*tmp & 192) != 128)
/* Classifies the UTF-8 sequence starting at mb by its lead byte and hands
 * validation of the trailing bytes to utf8checkrest():
 *   110xxxxx -> 1 continuation byte
 *   1110xxxx -> 2 continuation bytes
 *   11110xxx -> 3 continuation bytes
 * The handling of any other lead byte and the fall-through return are on
 * lines not visible in this excerpt. Callers compare the result with -1 to
 * detect an invalid sequence.
 * NOTE(review): the return type is plain char, whose signedness is
 * implementation-defined. Where char is unsigned, a returned -1 becomes 255
 * after integer promotion and the (utf8size(...) != -1) tests in Call() can
 * never fail. Returning int would remove the ambiguity. */
49 char utf8size(unsigned char * mb)
55 if ((*mb & 224) == 192)
56 return utf8checkrest(mb + 1,1);
57 if ((*mb & 240) == 224)
58 return utf8checkrest(mb + 1,2);
59 if ((*mb & 248) == 240)
60 return utf8checkrest(mb + 1,3);
/* Nick validity check; the module installs an instance of this handler as
 * ServerInstance->IsNick.
 * n   - candidate nickname, NUL-terminated.
 * max - size limit. Its use, and the declaration of p (incremented once per
 *       loop step), are on lines not visible in this excerpt.
 * Each position of n is tested, in order, against the two-byte range table,
 * the 8-bit rules, and then the three UTF-8 tables (enumeration,
 * start+length ranges, start+end intervals).
 * NOTE(review): every action taken on a match or a failure (advancing i,
 * continue, return) is on lines missing from this excerpt, so the comments
 * below describe only the visible tests. */
65 /* Conditions added */
66 bool lwbNickHandler::Call(const char* n, size_t max)
72 for (const char* i = n; *i; i++, p++)
74 /* 1. Multibyte encodings support: */
75 /* 1.1. 16bit char. areas, e.g. chinese:*/
77 /* if current character is the last, we DO NOT check it against multibyte table */
78 /* if there are mbtable ranges, use ONLY them. No 8bit at all */
79 if (i[1] && m_additionalMB[0])
81 /* otherwise let's take a look at the current character and the following one */
/* Table entries are 4 bytes: low and high bound for the first byte, then low
 * and high bound for the second byte. The scan stops at an entry whose first
 * byte is zero.
 * NOTE(review): (*mb) is evaluated before the bounds test, so a completely
 * full table makes the condition read one byte past the end of the array.
 * Swapping the two operands of && would avoid that. */
83 for(unsigned char * mb = m_additionalMB; (*mb) && (mb < m_additionalMB + sizeof(m_additionalMB)); mb += 4)
/* NOTE(review): i points to plain char while mb points to unsigned char.
 * Where char is signed, nick bytes of 0x80 and above are negative after
 * promotion and can never be >= a table bound of 0x80 or above, so this
 * range test would never match such bytes. Casting i[0] and i[1] to
 * unsigned char looks like the intent -- confirm. */
85 if ( (i[0] >= mb[0]) && (i[0] <= mb[1]) && (i[1] >= mb[2]) && (i[1] <= mb[3]) )
87 /* multibyte range character found */
98 /* there are ranges, but incorrect char (8bit?) given, sorry */
102 /* 2. 8bit character support */
/* The reverse table is indexed with the byte cast to unsigned char, so any
 * byte value 0-255 is a valid index. */
103 if (((*i >= 'A') && (*i <= '}')) || m_reverse_additional[(unsigned char)*i])
104 /* "A"-"}" can occur anywhere in a nickname */
107 if ((((*i >= '0') && (*i <= '9')) || (*i == '-')) && (i > n))
108 /* "0"-"9", "-" can occur anywhere BUT the first char of a nickname */
111 /* 3.1. Check against a simple UTF-8 characters enumeration */
/* ncursize is the utf8size() result for the character at the current nick
 * position; cursize and cursize2 are assigned inside the table loops below. */
112 int cursize, cursize2, ncursize = utf8size((unsigned char *)i);
113 /* do check only if current multibyte character is valid UTF-8 only */
/* The table is a packed list of UTF-8 characters. The stride is cursize,
 * which is assigned in the loop body on the first statement.
 * NOTE(review): utf8size(mb) is evaluated before the bounds test, so the
 * condition can read at or beyond the end of the table when the table is
 * full. The same ordering appears in the 3.2 and 3.3 loops. */
117 for (unsigned char * mb = m_additionalUtf8; (utf8size(mb) != -1) && (mb < m_additionalUtf8 + sizeof(m_additionalUtf8)); mb += cursize)
119 cursize = utf8size(mb);
120 /* Size differs? Pick the next! */
121 if (cursize != ncursize)
/* Byte-wise equality of the nick character and the table character. */
124 if (!strncmp(i, (char *)mb, cursize))
135 /* 3.2. Check against an UTF-8 ranges: <start character> and <length of the range>. */
/* Each entry is a UTF-8 character followed by one length byte, hence the
 * stride of cursize + 1. */
137 for (unsigned char * mb = m_additionalUtf8range; (utf8size(mb) != -1) && (mb < m_additionalUtf8range + sizeof(m_additionalUtf8range)); mb += cursize + 1)
139 cursize = utf8size(mb);
140 /* Size differs (or lengthbyte is zero)? Pick the next! */
141 if ((cursize != ncursize) || (!mb[cursize]))
/* uright starts as a copy of the start character and is advanced below by
 * range (length byte minus one) to become the inclusive upper bound. */
144 unsigned char uright[5] = {0,0,0,0,0}, range = mb[cursize] - 1;
145 strncpy((char* ) uright, (char *) mb, cursize);
/* Add range to the encoded character, working from the last byte towards
 * the first. The branch conditions and the carry handling body are on
 * lines not visible in this excerpt. */
147 for (int temp = cursize - 1; (temp >= 0) && range; --temp)
149 /* all but the first char are 64-based */
152 char part64 = range & 63; /* i.e. % 64 */
153 /* handle carrying over */
/* 191 is 0xBF, the largest value a 10xxxxxx continuation byte can hold. */
154 if (uright[temp] + part64 - 1 > 191)
159 uright[temp] += part64;
160 range >>= 6; /* divide it on a 64 */
162 /* the first char of UTF-8 doesn't follow the rule */
165 uright[temp] += range;
/* Inclusive byte-wise comparison against the start and the computed end. */
169 if ((strncmp(i, (char *) mb, cursize) >= 0) && (strncmp(i, (char *) uright, cursize) <= 0))
180 /* 3.3. Check against an UTF-8 intervals: <start character> and <end character>. */
/* Each entry is two UTF-8 characters back to back (start, then end), so the
 * stride is the sum of both encoded lengths. */
182 for (unsigned char * mb = m_additionalUtf8interval; (utf8size(mb) != -1) && (utf8size(mb+utf8size(mb)) != -1)
183 && (mb < m_additionalUtf8interval + sizeof(m_additionalUtf8interval)); mb += (cursize+cursize2) )
185 cursize = utf8size(mb);
186 cursize2= utf8size(mb+cursize);
/* Compare only as many bytes as the shorter of the table character and the
 * nick character. */
188 int minlen = cursize > ncursize ? ncursize : cursize;
189 int minlen2 = cursize2 > ncursize ? ncursize : cursize2;
/* Here uright points at the end character inside the table itself. */
191 unsigned char* uright = mb + cursize;
193 if ((strncmp(i, (char *) mb, minlen) >= 0) && (strncmp(i, (char *) uright, minlen2) <= 0))
205 /* invalid character! abort */
209 /* too long? or not -- pointer arithmetic rocks */
/* Module that installs lwbNickHandler as the server nick validator and a
 * replacement lower-case map, both driven by tables loaded from a charset
 * file named in the nationalchars configuration section.
 * NOTE(review): braces, access specifiers and some declarations (for
 * example forcequit, and the locals n, i and buf used below) are on lines
 * not visible in this excerpt. */
214 class ModuleNationalChars : public Module
218 InspIRCd* ServerInstance;
219 lwbNickHandler* myhandler;
220 std::string charset, casemapping;
/* Per-module 256-byte tables filled by loadtables(). m_lower is also
 * published through national_case_insensitive_map. */
221 unsigned char m_additional[256], m_additionalUp[256], m_lower[256], m_upper[256];
/* Holds a copy of the IsNick caller that was active before this module. */
222 caller2<bool, const char*, size_t> * rememberer;
/* Case map pointer that was active before this module replaced it. */
224 const unsigned char * lowermap_rememberer;
/* Saves the current nick validator and case map, installs this module's
 * replacements, and attaches to the OnRehash and On005Numeric events. */
227 ModuleNationalChars(InspIRCd* Me) : Module(Me)
/* NOTE(review): sizeof(rememberer) is the size of the pointer, not of the
 * caller2 object it points to, and malloc() runs no constructor even
 * though the object is assigned through the pointer further down. No
 * matching free() is visible in this excerpt. Holding the caller2 by value
 * (or allocating it with new) would be the safer form -- confirm. */
229 rememberer = (caller2<bool, const char*, size_t> *) malloc(sizeof(rememberer));
/* Remember the active map, seed m_lower from the RFC map, then publish it. */
231 lowermap_rememberer = national_case_insensitive_map;
232 memcpy(m_lower, rfc_case_insensitive_map, 256);
233 national_case_insensitive_map = m_lower;
/* Keep the previous IsNick so the destructor can restore it. */
237 *rememberer = ServerInstance->IsNick;
238 myhandler = new lwbNickHandler(ServerInstance);
239 ServerInstance->IsNick = myhandler;
241 Implementation eventlist[] = { I_OnRehash, I_On005Numeric };
242 ServerInstance->Modules->Attach(eventlist, this, 2);
/* Rewrites the CASEMAPPING token of the 005 numeric: the literal
 * CASEMAPPING=rfc1459 in output is replaced by CASEMAPPING= followed by the
 * configured casemapping name. */
246 virtual void On005Numeric(std::string &output)
248 std::string tmp(casemapping);
249 tmp.insert(0, "CASEMAPPING=");
250 SearchAndReplace(output, std::string("CASEMAPPING=rfc1459"), tmp);
/* Re-reads the nationalchars configuration, reloads every table from the
 * charset file and then re-checks connected users.
 * NOTE(review): the second parameter name contains a pilcrow character; it
 * looks like a mangled reference parameter named parameter -- restore it
 * from the upstream file. */
253 virtual void OnRehash(User* user, const std::string ¶meter)
/* NOTE(review): allocated with new; no delete is visible in this excerpt --
 * confirm it is released, or use a stack object. */
255 ConfigReader* conf = new ConfigReader(ServerInstance);
256 charset = conf->ReadValue("nationalchars", "file", 0);
/* charset (still the bare file name here) is passed as what appears to be
 * the default value for casemapping -- TODO confirm ReadValue semantics. */
257 casemapping = conf->ReadValue("nationalchars", "casemapping", charset, 0, false);
258 charset.insert(0, "../locales/");
/* Order matters: loadtables() fills the tables in this sequence, and only a
 * failure in one of the first 5 is logged (the faillimit argument). */
259 unsigned char * tables[8] = { m_additional, m_additionalMB, m_additionalUp, m_lower, m_upper, m_additionalUtf8, m_additionalUtf8range, m_additionalUtf8interval };
260 loadtables(charset, tables, 8, 5);
261 forcequit = conf->ReadFlag("nationalchars", "forcequit", 0);
262 CheckForceQuit("National character set changed");
/* Quits, with the given message, every local user whose nick does not start
 * with a digit and is rejected by the currently installed IsNick. Any guard
 * on forcequit is on lines not visible in this excerpt.
 * NOTE(review): QuitUser() is called while iterating local_users; confirm
 * that it does not modify that vector during the loop. */
266 void CheckForceQuit(const char * message)
271 for (std::vector<User*>::iterator iter = ServerInstance->Users->local_users.begin(); iter != ServerInstance->Users->local_users.end(); ++iter)
273 /* Fix by Brain: Dont quit UID users */
275 if (!isdigit(n->nick[0]) && !ServerInstance->IsNick(n->nick.c_str(), ServerInstance->Config->Limits.NickMax))
276 ServerInstance->Users->QuitUser(n, message);
/* Restores the saved nick validator and case map, then re-checks users
 * against the restored validator. */
280 virtual ~ModuleNationalChars()
283 ServerInstance->IsNick = *rememberer;
285 national_case_insensitive_map = lowermap_rememberer;
286 CheckForceQuit("National characters module unloaded");
289 virtual Version GetVersion()
291 return Version("$Id: m_nationalchars.cpp 0 2008-12-15 14:24:12SAMT phoenix $",VF_COMMON,API_VERSION);
294 /*make an array to check against it 8bit characters a bit faster. Whether allowed or uppercase (for your needs).*/
/* Walks the byte list in from until a zero byte or cnt entries. The loop
 * body that writes into to is on a line not visible in this excerpt;
 * presumably it marks to[*n] for each listed byte -- TODO confirm. */
295 void makereverse(unsigned char * from, unsigned char * to, unsigned int cnt)
298 for(unsigned char * n=from; (*n) && ((*n)<cnt) && (n<from+cnt); n++)
302 /*so Bynets Unreal distribution stuff*/
/* Loads cnt tables from the file named filename.
 * filename  - path of the charset file.
 * tables    - array of cnt pointers to 256-byte tables, filled in order.
 * cnt       - number of tables.
 * faillimit - a non-zero result from loadtable() is logged only for table
 *             indexes below this value.
 * All tables are zeroed first and m_lower is re-seeded from the RFC map;
 * afterwards m_reverse_additional is rebuilt from m_additional. The
 * condition that triggers the missing-file log is not visible here. */
303 void loadtables(std::string filename, unsigned char ** tables, unsigned char cnt, char faillimit)
305 std::ifstream ifs(filename.c_str());
308 ServerInstance->Logs->Log("m_nationalchars",DEFAULT,"loadtables() called for missing file: %s", filename.c_str());
312 for (unsigned char n=0; n< cnt; n++)
314 memset(tables[n], 0, 256);
317 memcpy(m_lower, rfc_case_insensitive_map, 256);
319 for (unsigned char n = 0; n < cnt; n++)
321 if (loadtable(ifs, tables[n], 255) && (n < faillimit))
323 ServerInstance->Logs->Log("m_nationalchars",DEFAULT,"loadtables() called for illegal file: %s (line %d)", filename.c_str(), n+1);
328 makereverse(m_additional, m_reverse_additional, sizeof(m_additional));
/* Parses a number from t in the given base, stopping at NUL, space, CR, LF
 * or comma. Each character is lower-cased through
 * ascii_case_insensitive_map; letters are mapped to 10 and up, digits to
 * 0-9. The tests selecting those branches and the accumulation into tmp
 * are on lines not visible in this excerpt. The result type is unsigned
 * char, so values above 255 presumably wrap -- TODO confirm. */
331 unsigned char symtoi(const char *t,unsigned char base)
332 /* base = 16 for hexadecimal, 10 for decimal, 8 for octal ;) */
334 unsigned char tmp = 0, current;
335 while ((*t) && (*t !=' ') && (*t != 13) && (*t != 10) && (*t != ','))
338 current = ascii_case_insensitive_map[(unsigned char)*t];
340 current = current - 'a' + 10;
342 current = current - '0';
/* Fills chartable from text read from ifs (the read itself and the
 * declarations of buf and i are on lines not visible in this excerpt).
 * Two input forms are visible:
 *   - a leading dot followed by plain text, copied verbatim;
 *   - a list of entries separated by commas, spaces, CR or LF, each entry
 *     being a numeric code (hex with 0x prefix, two other prefixed forms
 *     parsed in base 8 and base 16, or plain decimal) or a character
 *     between single quotes, optionally preceded by a backslash.
 * maxindex bounds the table index. loadtables() treats a non-zero return
 * value as failure. */
349 int loadtable(std::ifstream &ifs , unsigned char *chartable, unsigned int maxindex)
/* Drop trailing newline characters. */
357 buf.erase(buf.find_last_not_of("\n") + 1);
359 if (buf[0] == '.') /* simple plain-text string after dot */
363 if (i > (maxindex + 1))
/* Copy starts after the leading dot. */
366 memcpy(chartable, buf.c_str() + 1, i);
370 const char * p = buf.c_str();
379 if (*p != '\'') /* decimal or hexadecimal char code */
384 /* hex with the leading "0x" */
385 chartable[i] = symtoi(p + 2, 16);
/* One-character prefix, base 8; the prefix test is not visible here. */
387 chartable[i] = symtoi(p + 1, 8);
/* One-character prefix, base 16; the prefix test is not visible here. */
392 chartable[i] = symtoi(p + 1, 16);
393 }else /* decimal form */
395 chartable[i] = symtoi(p, 10);
398 else /* plain-text char between '' */
/* A backslash after the opening quote means the character is the one
 * after the backslash. */
400 if (*(p + 1) == '\\')
402 chartable[i] = *(p + 2);
406 chartable[i] = *(p + 1);
/* First loop header skips the rest of the current entry, the second skips
 * the separators before the next one; the loop bodies are not visible. */
410 while (*p && (*p != ',') && (*p != ' ') && (*p != 13) && (*p != 10))
412 while (*p && ((*p == ',') || (*p == ' ') || (*p == 13) || (*p == 10)))
/* Module entry point: invokes the MODULE_INIT macro for ModuleNationalChars.
 * The macro is defined outside this file; presumably it emits the factory
 * the module loader looks up -- TODO confirm. */
421 MODULE_INIT(ModuleNationalChars)