src/hashcomp.cpp

   1 /*       +------------------------------------+
   2  *       | Inspire Internet Relay Chat Daemon |
   3  *       +------------------------------------+
   4  *
   5  *  InspIRCd: (C) 2002-2008 InspIRCd Development Team
   6  * See: http://www.inspircd.org/wiki/index.php/Credits
   7  *
   8  * This program is free but copyrighted software; see
   9  *            the file COPYING for details.
  10  *
  11  * ---------------------------------------------------
  12  */
  13
  14 /* $Core: libIRCDhash */
  15
  16 #include "inspircd.h"
  17 #include "hashcomp.h"
  18 #ifndef WIN32
  19 #include <ext/hash_map>
  20 #define nspace __gnu_cxx
  21 #else
  22 #include <hash_map>
  23 #define nspace stdext
  24 using stdext::hash_map;
  25 #endif
  26
  27 /******************************************************
  28  *
  29  * The hash functions of InspIRCd are the centrepoint
  30  * of the entire system. If these functions are
  31  * inefficient or wasteful, the whole program suffers
  32  * as a result. A lot of C programmers in the ircd
  33  * scene spend a lot of time debating (arguing) about
  34  * the best way to write hash functions to hash irc
  35  * nicknames, channels etc.
  36  * We are lucky as C++ developers as hash_map does
  37  * a lot of this for us. It does intelligent memory
  38  * requests, bucketing, search functions, insertion
  39  * and deletion etc. All we have to do is write some
  40  * overloaded comparison and hash value operators which
  41  * cause it to act in an irc-like way. The features we
  42  * add to the standard hash_map are:
  43  *
  44  * Case insensitivity: The hash_map will be case
  45  * insensitive.
  46  *
  47  * Scandinavian Comparisons: The characters {, } and | will
  48  * be considered the lowercase of [, ] and \.
  49  *
  50  ******************************************************/
  51
  52 /* convert a string to lowercase. Note following special circumstances
  53  * taken from RFC 1459. Many "official" server branches still hold to this
  54  * rule so i will too;
  55  *
  56  *  Because of IRC's Scandinavian origin, the characters {}| are
  57  *  considered to be the lower case equivalents of the characters []\,
  58  *  respectively. This is a critical issue when determining the
  59  *  equivalence of two nicknames.
  60  */
  61 void nspace::strlower(char *n)
  62 {
  63         if (n)
  64         {
  65                 for (char* t = n; *t; t++)
  66                         *t = lowermap[(unsigned char)*t];
  67         }
  68 }
  69
  70 #ifndef WIN32
  71 size_t nspace::hash<std::string>::operator()(const std::string &s) const
  72 #else
  73 size_t nspace::hash_compare<std::string, std::less<std::string> >::operator()(const std::string &s) const
  74 #endif
  75 {
  76         /* XXX: NO DATA COPIES! :)
  77          * The hash function here is practically
  78          * a copy of the one in STL's hash_fun.h,
  79          * only with *x replaced with lowermap[*x].
  80          * This avoids a copy to use hash<const char*>
  81          */
  82         register size_t t = 0;
  83         for (std::string::const_iterator x = s.begin(); x != s.end(); ++x) /* ++x not x++, as its faster */
  84                 t = 5 * t + lowermap[(unsigned char)*x];
  85         return t;
  86 }
  87
  88 #ifndef WIN32
  89 size_t nspace::hash<irc::string>::operator()(const irc::string &s) const
  90 #else
  91 size_t nspace::hash_compare<irc::string, std::less<irc::string> >::operator()(const irc::string &s) const
  92 #endif
  93 {
  94         register size_t t = 0;
  95         for (irc::string::const_iterator x = s.begin(); x != s.end(); ++x) /* ++x not x++, as its faster */
  96                 t = 5 * t + lowermap[(unsigned char)*x];
  97         return t;
  98 }
  99
 100 bool irc::StrHashComp::operator()(const std::string& s1, const std::string& s2) const
 101 {
 102         const unsigned char* n1 = (const unsigned char*)s1.c_str();
 103         const unsigned char* n2 = (const unsigned char*)s2.c_str();
 104         for (; *n1 && *n2; n1++, n2++)
 105                 if (lowermap[*n1] != lowermap[*n2])
 106                         return false;
 107         return (lowermap[*n1] == lowermap[*n2]);
 108 }
 109
 110 /******************************************************
 111  *
 112  * This is the implementation of our special irc::string
 113  * class which is a case-insensitive equivalent to
 114  * std::string which is not only case-insensitive but
 115  * can also do Scandinavian comparisons, e.g. { = [, etc.
 116  *
 117  * This class depends on the const array 'lowermap'.
 118  *
 119  ******************************************************/
 120
 121 bool irc::irc_char_traits::eq(char c1st, char c2nd)
 122 {
 123         return lowermap[(unsigned char)c1st] == lowermap[(unsigned char)c2nd];
 124 }
 125
 126 bool irc::irc_char_traits::ne(char c1st, char c2nd)
 127 {
 128         return lowermap[(unsigned char)c1st] != lowermap[(unsigned char)c2nd];
 129 }
 130
 131 bool irc::irc_char_traits::lt(char c1st, char c2nd)
 132 {
 133         return lowermap[(unsigned char)c1st] < lowermap[(unsigned char)c2nd];
 134 }
 135
 136 int irc::irc_char_traits::compare(const char* str1, const char* str2, size_t n)
 137 {
 138         for(unsigned int i = 0; i < n; i++)
 139         {
 140                 if(lowermap[(unsigned char)*str1] > lowermap[(unsigned char)*str2])
 141                         return 1;
 142
 143                 if(lowermap[(unsigned char)*str1] < lowermap[(unsigned char)*str2])
 144                         return -1;
 145
 146                 if(*str1 == 0 || *str2 == 0)
 147                         return 0;
 148
 149                 str1++;
 150                 str2++;
 151         }
 152         return 0;
 153 }
 154
 155 const char* irc::irc_char_traits::find(const char* s1, int  n, char c)
 156 {
 157         while(n-- > 0 && lowermap[(unsigned char)*s1] != lowermap[(unsigned char)c])
 158                 s1++;
 159         return s1;
 160 }
 161
 162 irc::tokenstream::tokenstream(const std::string &source) : tokens(source), last_pushed(false)
 163 {
 164         /* Record starting position and current position */
 165         last_starting_position = tokens.begin();
 166         n = tokens.begin();
 167 }
 168
 169 irc::tokenstream::~tokenstream()
 170 {
 171 }
 172
 173 bool irc::tokenstream::GetToken(std::string &token)
 174 {
 175         std::string::iterator lsp = last_starting_position;
 176
 177         while (n != tokens.end())
 178         {
 179                 /** Skip multi space, converting "  " into " "
 180                  */
 181                 while ((n+1 != tokens.end()) && (*n == ' ') && (*(n+1) == ' '))
 182                         n++;
 183
 184                 if ((last_pushed) && (*n == ':'))
 185                 {
 186                         /* If we find a token thats not the first and starts with :,
 187                          * this is the last token on the line
 188                          */
 189                         std::string::iterator curr = ++n;
 190                         n = tokens.end();
 191                         token = std::string(curr, tokens.end());
 192                         return true;
 193                 }
 194
 195                 last_pushed = false;
 196
 197                 if ((*n == ' ') || (n+1 == tokens.end()))
 198                 {
 199                         /* If we find a space, or end of string, this is the end of a token.
 200                          */
 201                         last_starting_position = n+1;
 202                         last_pushed = true;
 203
 204                         std::string strip(lsp, n+1 == tokens.end() ? n+1  : n++);
 205                         while ((strip.length()) && (strip.find_last_of(' ') == strip.length() - 1))
 206                                 strip.erase(strip.end() - 1);
 207
 208                         token = strip;
 209                         return !token.empty();
 210                 }
 211
 212                 n++;
 213         }
 214         token.clear();
 215         return false;
 216 }
 217
 218 bool irc::tokenstream::GetToken(irc::string &token)
 219 {
 220         std::string stdstring;
 221         bool returnval = GetToken(stdstring);
 222         token = assign(stdstring);
 223         return returnval;
 224 }
 225
 226 bool irc::tokenstream::GetToken(int &token)
 227 {
 228         std::string tok;
 229         bool returnval = GetToken(tok);
 230         token = ConvToInt(tok);
 231         return returnval;
 232 }
 233
 234 bool irc::tokenstream::GetToken(long &token)
 235 {
 236         std::string tok;
 237         bool returnval = GetToken(tok);
 238         token = ConvToInt(tok);
 239         return returnval;
 240 }
 241
 242 irc::sepstream::sepstream(const std::string &source, char seperator) : tokens(source), sep(seperator)
 243 {
 244         last_starting_position = tokens.begin();
 245         n = tokens.begin();
 246 }
 247
 248 bool irc::sepstream::GetToken(std::string &token)
 249 {
 250         std::string::iterator lsp = last_starting_position;
 251
 252         while (n != tokens.end())
 253         {
 254                 if ((*n == sep) || (n+1 == tokens.end()))
 255                 {
 256                         last_starting_position = n+1;
 257                         token = std::string(lsp, n+1 == tokens.end() ? n+1  : n++);
 258
 259                         while ((token.length()) && (token.find_last_of(sep) == token.length() - 1))
 260                                 token.erase(token.end() - 1);
 261
 262                         if (token.empty())
 263                                 n++;
 264
 265                         return n == tokens.end() ? false : true;
 266                 }
 267
 268                 n++;
 269         }
 270
 271         token = "";
 272         return false;
 273 }
 274
 275 const std::string irc::sepstream::GetRemaining()
 276 {
 277         return std::string(n, tokens.end());
 278 }
 279
 280 bool irc::sepstream::StreamEnd()
 281 {
 282         return ((n + 1) == tokens.end());
 283 }
 284
 285 irc::sepstream::~sepstream()
 286 {
 287 }
 288
 289 std::string irc::hex(const unsigned char *raw, size_t rawsz)
 290 {
 291         if (!rawsz)
 292                 return "";
 293
 294         /* EWW! This used to be using sprintf, which is WAY inefficient. -Special */
 295
 296         const char *hex = "0123456789abcdef";
 297         static char hexbuf[MAXBUF];
 298
 299         size_t i, j;
 300         for (i = 0, j = 0; j < rawsz; ++j)
 301         {
 302                 hexbuf[i++] = hex[raw[j] / 16];
 303                 hexbuf[i++] = hex[raw[j] % 16];
 304         }
 305         hexbuf[i] = 0;
 306
 307         return hexbuf;
 308 }
 309
 310 CoreExport const char* irc::Spacify(const char* n)
 311 {
 312         static char x[MAXBUF];
 313         strlcpy(x,n,MAXBUF);
 314         for (char* y = x; *y; y++)
 315                 if (*y == '_')
 316                         *y = ' ';
 317         return x;
 318 }
 319
 320
 321 irc::modestacker::modestacker(InspIRCd* Instance, bool add) : ServerInstance(Instance), adding(add)
 322 {
 323         sequence.clear();
 324         sequence.push_back("");
 325 }
 326
 327 void irc::modestacker::Push(char modeletter, const std::string &parameter)
 328 {
 329         *(sequence.begin()) += modeletter;
 330         sequence.push_back(parameter);
 331 }
 332
 333 void irc::modestacker::Push(char modeletter)
 334 {
 335         this->Push(modeletter,"");
 336 }
 337
 338 void irc::modestacker::PushPlus()
 339 {
 340         this->Push('+',"");
 341 }
 342
 343 void irc::modestacker::PushMinus()
 344 {
 345         this->Push('-',"");
 346 }
 347
 348 int irc::modestacker::GetStackedLine(std::deque<std::string> &result, int max_line_size)
 349 {
 350         if (sequence.empty())
 351         {
 352                 result.clear();
 353                 return 0;
 354         }
 355
 356         int n = 0;
 357         int size = 1; /* Account for initial +/- char */
 358         int nextsize = 0;
 359         result.clear();
 360         result.push_back(adding ? "+" : "-");
 361
 362         if (sequence.size() > 1)
 363                 nextsize = sequence[1].length() + 2;
 364
 365         while (!sequence[0].empty() && (sequence.size() > 1) && (result.size() < ServerInstance->Config->Limits.MaxModes) && ((size + nextsize) < max_line_size))
 366         {
 367                 result[0] += *(sequence[0].begin());
 368                 if (!sequence[1].empty())
 369                 {
 370                         result.push_back(sequence[1]);
 371                         size += nextsize; /* Account for mode character and whitespace */
 372                 }
 373                 sequence[0].erase(sequence[0].begin());
 374                 sequence.erase(sequence.begin() + 1);
 375
 376                 if (sequence.size() > 1)
 377                         nextsize = sequence[1].length() + 2;
 378
 379                 n++;
 380         }
 381
 382         return n;
 383 }
 384
 385 irc::stringjoiner::stringjoiner(const std::string &seperator, const std::vector<std::string> &sequence, int begin, int end)
 386 {
 387         for (int v = begin; v < end; v++)
 388                 joined.append(sequence[v]).append(seperator);
 389         joined.append(sequence[end]);
 390 }
 391
 392 irc::stringjoiner::stringjoiner(const std::string &seperator, const std::deque<std::string> &sequence, int begin, int end)
 393 {
 394         for (int v = begin; v < end; v++)
 395                 joined.append(sequence[v]).append(seperator);
 396         joined.append(sequence[end]);
 397 }
 398
 399 irc::stringjoiner::stringjoiner(const std::string &seperator, const char* const* sequence, int begin, int end)
 400 {
 401         for (int v = begin; v < end; v++)
 402                 joined.append(sequence[v]).append(seperator);
 403         joined.append(sequence[end]);
 404 }
 405
 406 std::string& irc::stringjoiner::GetJoined()
 407 {
 408         return joined;
 409 }
 410
 411 irc::portparser::portparser(const std::string &source, bool allow_overlapped) : in_range(0), range_begin(0), range_end(0), overlapped(allow_overlapped)
 412 {
 413         sep = new irc::commasepstream(source);
 414         overlap_set.clear();
 415 }
 416
 417 irc::portparser::~portparser()
 418 {
 419         delete sep;
 420 }
 421
 422 bool irc::portparser::Overlaps(long val)
 423 {
 424         if (!overlapped)
 425                 return false;
 426
 427         if (overlap_set.find(val) == overlap_set.end())
 428         {
 429                 overlap_set[val] = true;
 430                 return false;
 431         }
 432         else
 433                 return true;
 434 }
 435
 436 long irc::portparser::GetToken()
 437 {
 438         if (in_range > 0)
 439         {
 440                 in_range++;
 441                 if (in_range <= range_end)
 442                 {
 443                         if (!Overlaps(in_range))
 444                         {
 445                                 return in_range;
 446                         }
 447                         else
 448                         {
 449                                 while (((Overlaps(in_range)) && (in_range <= range_end)))
 450                                         in_range++;
 451
 452                                 if (in_range <= range_end)
 453                                         return in_range;
 454                         }
 455                 }
 456                 else
 457                         in_range = 0;
 458         }
 459
 460         std::string x;
 461         sep->GetToken(x);
 462
 463         if (x.empty())
 464                 return 0;
 465
 466         while (Overlaps(atoi(x.c_str())))
 467         {
 468                 if (!sep->GetToken(x))
 469                         return 0;
 470         }
 471
 472         std::string::size_type dash = x.rfind('-');
 473         if (dash != std::string::npos)
 474         {
 475                 std::string sbegin = x.substr(0, dash);
 476                 std::string send = x.substr(dash+1, x.length());
 477                 range_begin = atoi(sbegin.c_str());
 478                 range_end = atoi(send.c_str());
 479
 480                 if ((range_begin > 0) && (range_end > 0) && (range_begin < 65536) && (range_end < 65536) && (range_begin < range_end))
 481                 {
 482                         in_range = range_begin;
 483                         return in_range;
 484                 }
 485                 else
 486                 {
 487                         /* Assume its just the one port */
 488                         return atoi(sbegin.c_str());
 489                 }
 490         }
 491         else
 492         {
 493                 return atoi(x.c_str());
 494         }
 495 }
 496
 497 irc::dynamicbitmask::dynamicbitmask() : bits_size(4)
 498 {
 499         /* We start with 4 bytes allocated which is room
 500          * for 4 items. Something makes me doubt its worth
 501          * allocating less than 4 bytes.
 502          */
 503         bits = new unsigned char[bits_size];
 504         memset(bits, 0, bits_size);
 505 }
 506
 507 irc::dynamicbitmask::~dynamicbitmask()
 508 {
 509         /* Tidy up the entire used memory on delete */
 510         delete[] bits;
 511 }
 512
 513 irc::bitfield irc::dynamicbitmask::Allocate()
 514 {
 515         /* Yeah, this isnt too efficient, however a module or the core
 516          * should only be allocating bitfields on load, the Toggle and
 517          * Get methods are O(1) as these are called much more often.
 518          */
 519         unsigned char* freebits = this->GetFreeBits();
 520         for (unsigned char i = 0; i < bits_size; i++)
 521         {
 522                 /* Yes, this is right. You'll notice we terminate the  loop when !current_pos,
 523                  * this is because we logic shift our bit off the end of unsigned char, and its
 524                  * lost, making the loop counter 0 when we're done.
 525                  */
 526                 for (unsigned char current_pos = 1; current_pos; current_pos = current_pos << 1)
 527                 {
 528                         if (!(freebits[i] & current_pos))
 529                         {
 530                                 freebits[i] |= current_pos;
 531                                 return std::make_pair(i, current_pos);
 532                         }
 533                 }
 534         }
 535         /* We dont have any free space left, increase by one */
 536
 537         if (bits_size == 255)
 538                 /* Oh dear, cant grow it any further */
 539                 throw std::bad_alloc();
 540
 541         unsigned char old_bits_size = bits_size;
 542         bits_size++;
 543         /* Allocate new bitfield space */
 544         unsigned char* temp_bits = new unsigned char[bits_size];
 545         unsigned char* temp_freebits = new unsigned char[bits_size];
 546         /* Copy the old data in */
 547         memcpy(temp_bits, bits, old_bits_size);
 548         memcpy(temp_freebits, freebits, old_bits_size);
 549         /* Delete the old data pointers */
 550         delete[] bits;
 551         delete[] freebits;
 552         /* Swap the pointers over so now the new
 553          * pointers point to our member values
 554          */
 555         bits = temp_bits;
 556         freebits = temp_freebits;
 557         this->SetFreeBits(freebits);
 558         /* Initialize the new byte on the end of
 559          * the bitfields, pre-allocate the one bit
 560          * for this allocation
 561          */
 562         bits[old_bits_size] = 0;
 563         freebits[old_bits_size] = 1;
 564         /* We already know where we just allocated
 565          * the bitfield, so no loop needed
 566          */
 567         return std::make_pair(old_bits_size, 1);
 568 }
 569
 570 bool irc::dynamicbitmask::Deallocate(irc::bitfield &pos)
 571 {
 572         /* We dont bother to shrink the bitfield
 573          * on deallocation, the most we could do
 574          * is save one byte (!) and this would cost
 575          * us a loop (ugly O(n) stuff) so we just
 576          * clear the bit and leave the memory
 577          * claimed -- nobody will care about one
 578          * byte.
 579          */
 580         if (pos.first < bits_size)
 581         {
 582                 this->GetFreeBits()[pos.first] &= ~pos.second;
 583                 return true;
 584         }
 585         /* They gave a bitfield outside of the
 586          * length of our array. BAD programmer.
 587          */
 588         return false;
 589 }
 590
 591 void irc::dynamicbitmask::Toggle(irc::bitfield &pos, bool state)
 592 {
 593         /* Range check the value */
 594         if (pos.first < bits_size)
 595         {
 596                 if (state)
 597                         /* Set state, OR the state in */
 598                         bits[pos.first] |= pos.second;
 599                 else
 600                         /* Clear state, AND the !state out */
 601                         bits[pos.first] &= ~pos.second;
 602         }
 603 }
 604
 605 bool irc::dynamicbitmask::Get(irc::bitfield &pos)
 606 {
 607         /* Range check the value */
 608         if (pos.first < bits_size)
 609                 return (bits[pos.first] & pos.second);
 610         else
 611                 /* We can't return false, otherwise we can't
 612                  * distinguish between failure and a cleared bit!
 613                  * Our only sensible choice is to throw (ew).
 614                  */
 615                 throw ModuleException("irc::dynamicbitmask::Get(): Invalid bitfield, out of range");
 616 }
 617
 618 unsigned char irc::dynamicbitmask::GetSize()
 619 {
 620         return bits_size;
 621 }
 622