apt-pkg/contrib/strutl.cc

   1 // -*- mode: cpp; mode: fold -*-
   2 // Description                                                          /*{{{*/
   3 // $Id: strutl.cc,v 1.44 2001/06/08 05:16:39 jgg Exp $
   4 /* ######################################################################
   5
   6    String Util - Some useful string functions.
   7
   8    These have been collected from here and there to do all sorts of useful
   9    things to strings. They are useful in file parsers, URI handlers and
  10    especially in APT methods.
  11
  12    This source is placed in the Public Domain, do with it what you will
  13    It was originally written by Jason Gunthorpe <jgg@gpu.srv.ualberta.ca>
  14
  15    ##################################################################### */
  16                                                                         /*}}}*/
  17 // Includes                                                             /*{{{*/
  18 #ifdef __GNUG__
  19 #pragma implementation "apt-pkg/strutl.h"
  20 #endif
  21
  22 #include <apt-pkg/strutl.h>
  23 #include <apt-pkg/fileutl.h>
  24 #include <apt-pkg/error.h>
  25
  26 #include <apti18n.h>
  27
  28 #include <ctype.h>
  29 #include <string.h>
  30 #include <stdio.h>
  31 #include <unistd.h>
  32 #include <regex.h>
  33 #include <errno.h>
  34 #include <stdarg.h>
  35
  36 using namespace std;
  37                                                                         /*}}}*/
  38
  39 // strstrip - Remove white space from the front and back of a string    /*{{{*/
  40 // ---------------------------------------------------------------------
  41 /* This is handy to use when parsing a file. It also removes \n's left
  42    over from fgets and company */
  43 char *_strstrip(char *String)
  44 {
  45    for (;*String != 0 && (*String == ' ' || *String == '\t'); String++);
  46
  47    if (*String == 0)
  48       return String;
  49
  50    char *End = String + strlen(String) - 1;
  51    for (;End != String - 1 && (*End == ' ' || *End == '\t' || *End == '\n' ||
  52                                *End == '\r'); End--);
  53    End++;
  54    *End = 0;
  55    return String;
  56 };
  57                                                                         /*}}}*/
  58 // strtabexpand - Converts tabs into 8 spaces                           /*{{{*/
  59 // ---------------------------------------------------------------------
  60 /* */
  61 char *_strtabexpand(char *String,size_t Len)
  62 {
  63    for (char *I = String; I != I + Len && *I != 0; I++)
  64    {
  65       if (*I != '\t')
  66          continue;
  67       if (I + 8 > String + Len)
  68       {
  69          *I = 0;
  70          return String;
  71       }
  72
  73       /* Assume the start of the string is 0 and find the next 8 char
  74          division */
  75       int Len;
  76       if (String == I)
  77          Len = 1;
  78       else
  79          Len = 8 - ((String - I) % 8);
  80       Len -= 2;
  81       if (Len <= 0)
  82       {
  83          *I = ' ';
  84          continue;
  85       }
  86
  87       memmove(I + Len,I + 1,strlen(I) + 1);
  88       for (char *J = I; J + Len != I; *I = ' ', I++);
  89    }
  90    return String;
  91 }
  92                                                                         /*}}}*/
  93 // ParseQuoteWord - Parse a single word out of a string                 /*{{{*/
  94 // ---------------------------------------------------------------------
  95 /* This grabs a single word, converts any % escaped characters to their
  96    proper values and advances the pointer. Double quotes are understood
  97    and striped out as well. This is for URI/URL parsing. It also can
  98    understand [] brackets.*/
  99 bool ParseQuoteWord(const char *&String,string &Res)
 100 {
 101    // Skip leading whitespace
 102    const char *C = String;
 103    for (;*C != 0 && *C == ' '; C++);
 104    if (*C == 0)
 105       return false;
 106
 107    // Jump to the next word
 108    for (;*C != 0 && isspace(*C) == 0; C++)
 109    {
 110       if (*C == '"')
 111       {
 112          for (C++; *C != 0 && *C != '"'; C++);
 113          if (*C == 0)
 114             return false;
 115       }
 116       if (*C == '[')
 117       {
 118          for (C++; *C != 0 && *C != ']'; C++);
 119          if (*C == 0)
 120             return false;
 121       }
 122    }
 123
 124    // Now de-quote characters
 125    char Buffer[1024];
 126    char Tmp[3];
 127    const char *Start = String;
 128    char *I;
 129    for (I = Buffer; I < Buffer + sizeof(Buffer) && Start != C; I++)
 130    {
 131       if (*Start == '%' && Start + 2 < C)
 132       {
 133          Tmp[0] = Start[1];
 134          Tmp[1] = Start[2];
 135          Tmp[2] = 0;
 136          *I = (char)strtol(Tmp,0,16);
 137          Start += 3;
 138          continue;
 139       }
 140       if (*Start != '"')
 141          *I = *Start;
 142       else
 143          I--;
 144       Start++;
 145    }
 146    *I = 0;
 147    Res = Buffer;
 148
 149    // Skip ending white space
 150    for (;*C != 0 && isspace(*C) != 0; C++);
 151    String = C;
 152    return true;
 153 }
 154                                                                         /*}}}*/
 155 // ParseCWord - Parses a string like a C "" expression                  /*{{{*/
 156 // ---------------------------------------------------------------------
 157 /* This expects a series of space separated strings enclosed in ""'s.
 158    It concatenates the ""'s into a single string. */
 159 bool ParseCWord(const char *&String,string &Res)
 160 {
 161    // Skip leading whitespace
 162    const char *C = String;
 163    for (;*C != 0 && *C == ' '; C++);
 164    if (*C == 0)
 165       return false;
 166
 167    char Buffer[1024];
 168    char *Buf = Buffer;
 169    if (strlen(String) >= sizeof(Buffer))
 170        return false;
 171
 172    for (; *C != 0; C++)
 173    {
 174       if (*C == '"')
 175       {
 176          for (C++; *C != 0 && *C != '"'; C++)
 177             *Buf++ = *C;
 178
 179          if (*C == 0)
 180             return false;
 181
 182          continue;
 183       }
 184
 185       if (C != String && isspace(*C) != 0 && isspace(C[-1]) != 0)
 186          continue;
 187       if (isspace(*C) == 0)
 188          return false;
 189       *Buf++ = ' ';
 190    }
 191    *Buf = 0;
 192    Res = Buffer;
 193    String = C;
 194    return true;
 195 }
 196                                                                         /*}}}*/
 197 // QuoteString - Convert a string into quoted from                      /*{{{*/
 198 // ---------------------------------------------------------------------
 199 /* */
 200 string QuoteString(string Str,const char *Bad)
 201 {
 202    string Res;
 203    for (string::iterator I = Str.begin(); I != Str.end(); I++)
 204    {
 205       if (strchr(Bad,*I) != 0 || isprint(*I) == 0 ||
 206           *I <= 0x20 || *I >= 0x7F)
 207       {
 208          char Buf[10];
 209          sprintf(Buf,"%%%02x",(int)*I);
 210          Res += Buf;
 211       }
 212       else
 213          Res += *I;
 214    }
 215    return Res;
 216 }
 217                                                                         /*}}}*/
 218 // DeQuoteString - Convert a string from quoted from                    /*{{{*/
 219 // ---------------------------------------------------------------------
 220 /* This undoes QuoteString */
 221 string DeQuoteString(string Str)
 222 {
 223    string Res;
 224    for (string::const_iterator I = Str.begin(); I != Str.end(); I++)
 225    {
 226       if (*I == '%' && I + 2 < Str.end())
 227       {
 228          char Tmp[3];
 229          Tmp[0] = I[1];
 230          Tmp[1] = I[2];
 231          Tmp[2] = 0;
 232          Res += (char)strtol(Tmp,0,16);
 233          I += 2;
 234          continue;
 235       }
 236       else
 237          Res += *I;
 238    }
 239    return Res;
 240 }
 241
 242                                                                         /*}}}*/
 243 // SizeToStr - Convert a long into a human readable size                /*{{{*/
 244 // ---------------------------------------------------------------------
 245 /* A max of 4 digits are shown before conversion to the next highest unit.
 246    The max length of the string will be 5 chars unless the size is > 10
 247    YottaBytes (E24) */
 248 string SizeToStr(double Size)
 249 {
 250    char S[300];
 251    double ASize;
 252    if (Size >= 0)
 253       ASize = Size;
 254    else
 255       ASize = -1*Size;
 256
 257    /* bytes, KiloBytes, MegaBytes, GigaBytes, TeraBytes, PetaBytes,
 258       ExaBytes, ZettaBytes, YottaBytes */
 259    char Ext[] = {'\0','k','M','G','T','P','E','Z','Y'};
 260    int I = 0;
 261    while (I <= 8)
 262    {
 263       if (ASize < 100 && I != 0)
 264       {
 265          sprintf(S,"%.1f%c",ASize,Ext[I]);
 266          break;
 267       }
 268
 269       if (ASize < 10000)
 270       {
 271          sprintf(S,"%.0f%c",ASize,Ext[I]);
 272          break;
 273       }
 274       ASize /= 1000.0;
 275       I++;
 276    }
 277
 278    return S;
 279 }
 280                                                                         /*}}}*/
 281 // TimeToStr - Convert the time into a string                           /*{{{*/
 282 // ---------------------------------------------------------------------
 283 /* Converts a number of seconds to a hms format */
 284 string TimeToStr(unsigned long Sec)
 285 {
 286    char S[300];
 287
 288    while (1)
 289    {
 290       if (Sec > 60*60*24)
 291       {
 292          sprintf(S,"%lid %lih%lim%lis",Sec/60/60/24,(Sec/60/60) % 24,(Sec/60) % 60,Sec % 60);
 293          break;
 294       }
 295
 296       if (Sec > 60*60)
 297       {
 298          sprintf(S,"%lih%lim%lis",Sec/60/60,(Sec/60) % 60,Sec % 60);
 299          break;
 300       }
 301
 302       if (Sec > 60)
 303       {
 304          sprintf(S,"%lim%lis",Sec/60,Sec % 60);
 305          break;
 306       }
 307
 308       sprintf(S,"%lis",Sec);
 309       break;
 310    }
 311
 312    return S;
 313 }
 314                                                                         /*}}}*/
 315 // SubstVar - Substitute a string for another string                    /*{{{*/
 316 // ---------------------------------------------------------------------
 317 /* This replaces all occurances of Subst with Contents in Str. */
 318 string SubstVar(string Str,string Subst,string Contents)
 319 {
 320    string::size_type Pos = 0;
 321    string::size_type OldPos = 0;
 322    string Temp;
 323
 324    while (OldPos < Str.length() &&
 325           (Pos = Str.find(Subst,OldPos)) != string::npos)
 326    {
 327       Temp += string(Str,OldPos,Pos) + Contents;
 328       OldPos = Pos + Subst.length();
 329    }
 330
 331    if (OldPos == 0)
 332       return Str;
 333
 334    return Temp + string(Str,OldPos);
 335 }
 336
 337 string SubstVar(string Str,const struct SubstVar *Vars)
 338 {
 339    for (; Vars->Subst != 0; Vars++)
 340       Str = SubstVar(Str,Vars->Subst,*Vars->Contents);
 341    return Str;
 342 }
 343                                                                         /*}}}*/
 344 // URItoFileName - Convert the uri into a unique file name              /*{{{*/
 345 // ---------------------------------------------------------------------
 346 /* This converts a URI into a safe filename. It quotes all unsafe characters
 347    and converts / to _ and removes the scheme identifier. The resulting
 348    file name should be unique and never occur again for a different file */
 349 string URItoFileName(string URI)
 350 {
 351    // Nuke 'sensitive' items
 352    ::URI U(URI);
 353    U.User = string();
 354    U.Password = string();
 355    U.Access = "";
 356
 357    // "\x00-\x20{}|\\\\^\\[\\]<>\"\x7F-\xFF";
 358    URI = QuoteString(U,"\\|{}[]<>\"^~_=!@#$%^&*");
 359    string::iterator J = URI.begin();
 360    for (; J != URI.end(); J++)
 361       if (*J == '/')
 362          *J = '_';
 363    return URI;
 364 }
 365                                                                         /*}}}*/
 366 // Base64Encode - Base64 Encoding routine for short strings             /*{{{*/
 367 // ---------------------------------------------------------------------
 368 /* This routine performs a base64 transformation on a string. It was ripped
 369    from wget and then patched and bug fixed.
 370
 371    This spec can be found in rfc2045 */
 372 string Base64Encode(string S)
 373 {
 374    // Conversion table.
 375    static char tbl[64] = {'A','B','C','D','E','F','G','H',
 376                           'I','J','K','L','M','N','O','P',
 377                           'Q','R','S','T','U','V','W','X',
 378                           'Y','Z','a','b','c','d','e','f',
 379                           'g','h','i','j','k','l','m','n',
 380                           'o','p','q','r','s','t','u','v',
 381                           'w','x','y','z','0','1','2','3',
 382                           '4','5','6','7','8','9','+','/'};
 383
 384    // Pre-allocate some space
 385    string Final;
 386    Final.reserve((4*S.length() + 2)/3 + 2);
 387
 388    /* Transform the 3x8 bits to 4x6 bits, as required by
 389       base64.  */
 390    for (string::const_iterator I = S.begin(); I < S.end(); I += 3)
 391    {
 392       char Bits[3] = {0,0,0};
 393       Bits[0] = I[0];
 394       if (I + 1 < S.end())
 395          Bits[1] = I[1];
 396       if (I + 2 < S.end())
 397          Bits[2] = I[2];
 398
 399       Final += tbl[Bits[0] >> 2];
 400       Final += tbl[((Bits[0] & 3) << 4) + (Bits[1] >> 4)];
 401
 402       if (I + 1 >= S.end())
 403          break;
 404
 405       Final += tbl[((Bits[1] & 0xf) << 2) + (Bits[2] >> 6)];
 406
 407       if (I + 2 >= S.end())
 408          break;
 409
 410       Final += tbl[Bits[2] & 0x3f];
 411    }
 412
 413    /* Apply the padding elements, this tells how many bytes the remote
 414       end should discard */
 415    if (S.length() % 3 == 2)
 416       Final += '=';
 417    if (S.length() % 3 == 1)
 418       Final += "==";
 419
 420    return Final;
 421 }
 422                                                                         /*}}}*/
 423 // stringcmp - Arbitary string compare                                  /*{{{*/
 424 // ---------------------------------------------------------------------
 425 /* This safely compares two non-null terminated strings of arbitary
 426    length */
 427 int stringcmp(const char *A,const char *AEnd,const char *B,const char *BEnd)
 428 {
 429    for (; A != AEnd && B != BEnd; A++, B++)
 430       if (*A != *B)
 431          break;
 432
 433    if (A == AEnd && B == BEnd)
 434       return 0;
 435    if (A == AEnd)
 436       return 1;
 437    if (B == BEnd)
 438       return -1;
 439    if (*A < *B)
 440       return -1;
 441    return 1;
 442 }
 443
 444 #if __GNUC__ >= 3
 445 int stringcmp(string::const_iterator A,string::const_iterator AEnd,
 446               const char *B,const char *BEnd)
 447 {
 448    for (; A != AEnd && B != BEnd; A++, B++)
 449       if (*A != *B)
 450          break;
 451
 452    if (A == AEnd && B == BEnd)
 453       return 0;
 454    if (A == AEnd)
 455       return 1;
 456    if (B == BEnd)
 457       return -1;
 458    if (*A < *B)
 459       return -1;
 460    return 1;
 461 }
 462 int stringcmp(string::const_iterator A,string::const_iterator AEnd,
 463               string::const_iterator B,string::const_iterator BEnd)
 464 {
 465    for (; A != AEnd && B != BEnd; A++, B++)
 466       if (*A != *B)
 467          break;
 468
 469    if (A == AEnd && B == BEnd)
 470       return 0;
 471    if (A == AEnd)
 472       return 1;
 473    if (B == BEnd)
 474       return -1;
 475    if (*A < *B)
 476       return -1;
 477    return 1;
 478 }
 479 #endif
 480                                                                         /*}}}*/
 481 // stringcasecmp - Arbitary case insensitive string compare             /*{{{*/
 482 // ---------------------------------------------------------------------
 483 /* */
 484 int stringcasecmp(const char *A,const char *AEnd,const char *B,const char *BEnd)
 485 {
 486    for (; A != AEnd && B != BEnd; A++, B++)
 487       if (toupper(*A) != toupper(*B))
 488          break;
 489
 490    if (A == AEnd && B == BEnd)
 491       return 0;
 492    if (A == AEnd)
 493       return 1;
 494    if (B == BEnd)
 495       return -1;
 496    if (toupper(*A) < toupper(*B))
 497       return -1;
 498    return 1;
 499 }
 500 #if __GNUC__ >= 3
 501 int stringcasecmp(string::const_iterator A,string::const_iterator AEnd,
 502                   const char *B,const char *BEnd)
 503 {
 504    for (; A != AEnd && B != BEnd; A++, B++)
 505       if (toupper(*A) != toupper(*B))
 506          break;
 507
 508    if (A == AEnd && B == BEnd)
 509       return 0;
 510    if (A == AEnd)
 511       return 1;
 512    if (B == BEnd)
 513       return -1;
 514    if (toupper(*A) < toupper(*B))
 515       return -1;
 516    return 1;
 517 }
 518 int stringcasecmp(string::const_iterator A,string::const_iterator AEnd,
 519                   string::const_iterator B,string::const_iterator BEnd)
 520 {
 521    for (; A != AEnd && B != BEnd; A++, B++)
 522       if (toupper(*A) != toupper(*B))
 523          break;
 524
 525    if (A == AEnd && B == BEnd)
 526       return 0;
 527    if (A == AEnd)
 528       return 1;
 529    if (B == BEnd)
 530       return -1;
 531    if (toupper(*A) < toupper(*B))
 532       return -1;
 533    return 1;
 534 }
 535 #endif
 536                                                                         /*}}}*/
 537 // LookupTag - Lookup the value of a tag in a taged string              /*{{{*/
 538 // ---------------------------------------------------------------------
 539 /* The format is like those used in package files and the method
 540    communication system */
 541 string LookupTag(string Message,const char *Tag,const char *Default)
 542 {
 543    // Look for a matching tag.
 544    int Length = strlen(Tag);
 545    for (string::iterator I = Message.begin(); I + Length < Message.end(); I++)
 546    {
 547       // Found the tag
 548       if (I[Length] == ':' && stringcasecmp(I,I+Length,Tag) == 0)
 549       {
 550          // Find the end of line and strip the leading/trailing spaces
 551          string::iterator J;
 552          I += Length + 1;
 553          for (; isspace(*I) != 0 && I < Message.end(); I++);
 554          for (J = I; *J != '\n' && J < Message.end(); J++);
 555          for (; J > I && isspace(J[-1]) != 0; J--);
 556
 557          return string(I,J);
 558       }
 559
 560       for (; *I != '\n' && I < Message.end(); I++);
 561    }
 562
 563    // Failed to find a match
 564    if (Default == 0)
 565       return string();
 566    return Default;
 567 }
 568                                                                         /*}}}*/
 569 // StringToBool - Converts a string into a boolean                      /*{{{*/
 570 // ---------------------------------------------------------------------
 571 /* This inspects the string to see if it is true or if it is false and
 572    then returns the result. Several varients on true/false are checked. */
 573 int StringToBool(string Text,int Default)
 574 {
 575    char *End;
 576    int Res = strtol(Text.c_str(),&End,0);
 577    if (End != Text.c_str() && Res >= 0 && Res <= 1)
 578       return Res;
 579
 580    // Check for positives
 581    if (strcasecmp(Text.c_str(),"no") == 0 ||
 582        strcasecmp(Text.c_str(),"false") == 0 ||
 583        strcasecmp(Text.c_str(),"without") == 0 ||
 584        strcasecmp(Text.c_str(),"off") == 0 ||
 585        strcasecmp(Text.c_str(),"disable") == 0)
 586       return 0;
 587
 588    // Check for negatives
 589    if (strcasecmp(Text.c_str(),"yes") == 0 ||
 590        strcasecmp(Text.c_str(),"true") == 0 ||
 591        strcasecmp(Text.c_str(),"with") == 0 ||
 592        strcasecmp(Text.c_str(),"on") == 0 ||
 593        strcasecmp(Text.c_str(),"enable") == 0)
 594       return 1;
 595
 596    return Default;
 597 }
 598                                                                         /*}}}*/
 599 // TimeRFC1123 - Convert a time_t into RFC1123 format                   /*{{{*/
 600 // ---------------------------------------------------------------------
 601 /* This converts a time_t into a string time representation that is
 602    year 2000 complient and timezone neutral */
 603 string TimeRFC1123(time_t Date)
 604 {
 605    struct tm Conv = *gmtime(&Date);
 606    char Buf[300];
 607
 608    const char *Day[] = {"Sun","Mon","Tue","Wed","Thu","Fri","Sat"};
 609    const char *Month[] = {"Jan","Feb","Mar","Apr","May","Jun","Jul",
 610                           "Aug","Sep","Oct","Nov","Dec"};
 611
 612    sprintf(Buf,"%s, %02i %s %i %02i:%02i:%02i GMT",Day[Conv.tm_wday],
 613            Conv.tm_mday,Month[Conv.tm_mon],Conv.tm_year+1900,Conv.tm_hour,
 614            Conv.tm_min,Conv.tm_sec);
 615    return Buf;
 616 }
 617                                                                         /*}}}*/
 618 // ReadMessages - Read messages from the FD                             /*{{{*/
 619 // ---------------------------------------------------------------------
 620 /* This pulls full messages from the input FD into the message buffer.
 621    It assumes that messages will not pause during transit so no
 622    fancy buffering is used. */
 623 bool ReadMessages(int Fd, vector<string> &List)
 624 {
 625    char Buffer[4000];
 626    char *End = Buffer;
 627
 628    while (1)
 629    {
 630       int Res = read(Fd,End,sizeof(Buffer) - (End-Buffer));
 631       if (Res < 0 && errno == EINTR)
 632          continue;
 633
 634       // Process is dead, this is kind of bad..
 635       if (Res == 0)
 636          return false;
 637
 638       // No data
 639       if (Res < 0 && errno == EAGAIN)
 640          return true;
 641       if (Res < 0)
 642          return false;
 643
 644       End += Res;
 645
 646       // Look for the end of the message
 647       for (char *I = Buffer; I + 1 < End; I++)
 648       {
 649          if (I[0] != '\n' || I[1] != '\n')
 650             continue;
 651
 652          // Pull the message out
 653          string Message(Buffer,0,I-Buffer);
 654
 655          // Fix up the buffer
 656          for (; I < End && *I == '\n'; I++);
 657          End -= I-Buffer;
 658          memmove(Buffer,I,End-Buffer);
 659          I = Buffer;
 660
 661          List.push_back(Message);
 662       }
 663       if (End == Buffer)
 664          return true;
 665
 666       if (WaitFd(Fd) == false)
 667          return false;
 668    }
 669 }
 670                                                                         /*}}}*/
 671 // MonthConv - Converts a month string into a number                    /*{{{*/
 672 // ---------------------------------------------------------------------
 673 /* This was lifted from the boa webserver which lifted it from 'wn-v1.07'
 674    Made it a bit more robust with a few touppers though. */
 675 static int MonthConv(char *Month)
 676 {
 677    switch (toupper(*Month))
 678    {
 679       case 'A':
 680       return toupper(Month[1]) == 'P'?3:7;
 681       case 'D':
 682       return 11;
 683       case 'F':
 684       return 1;
 685       case 'J':
 686       if (toupper(Month[1]) == 'A')
 687          return 0;
 688       return toupper(Month[2]) == 'N'?5:6;
 689       case 'M':
 690       return toupper(Month[2]) == 'R'?2:4;
 691       case 'N':
 692       return 10;
 693       case 'O':
 694       return 9;
 695       case 'S':
 696       return 8;
 697
 698       // Pretend it is January..
 699       default:
 700       return 0;
 701    }
 702 }
 703                                                                         /*}}}*/
 704 // timegm - Internal timegm function if gnu is not available            /*{{{*/
 705 // ---------------------------------------------------------------------
 706 /* Ripped this evil little function from wget - I prefer the use of
 707    GNU timegm if possible as this technique will have interesting problems
 708    with leap seconds, timezones and other.
 709
 710    Converts struct tm to time_t, assuming the data in tm is UTC rather
 711    than local timezone (mktime assumes the latter).
 712
 713    Contributed by Roger Beeman <beeman@cisco.com>, with the help of
 714    Mark Baushke <mdb@cisco.com> and the rest of the Gurus at CISCO. */
 715 #ifndef __USE_MISC        // glib sets this
 716 static time_t timegm(struct tm *t)
 717 {
 718    time_t tl, tb;
 719
 720    tl = mktime (t);
 721    if (tl == -1)
 722       return -1;
 723    tb = mktime (gmtime (&tl));
 724    return (tl <= tb ? (tl + (tl - tb)) : (tl - (tb - tl)));
 725 }
 726 #endif
 727                                                                         /*}}}*/
 728 // StrToTime - Converts a string into a time_t                          /*{{{*/
 729 // ---------------------------------------------------------------------
 730 /* This handles all 3 populare time formats including RFC 1123, RFC 1036
 731    and the C library asctime format. It requires the GNU library function
 732    'timegm' to convert a struct tm in UTC to a time_t. For some bizzar
 733    reason the C library does not provide any such function :< This also
 734    handles the weird, but unambiguous FTP time format*/
 735 bool StrToTime(string Val,time_t &Result)
 736 {
 737    struct tm Tm;
 738    char Month[10];
 739    const char *I = Val.c_str();
 740
 741    // Skip the day of the week
 742    for (;*I != 0  && *I != ' '; I++);
 743
 744    // Handle RFC 1123 time
 745    Month[0] = 0;
 746    if (sscanf(I," %d %3s %d %d:%d:%d GMT",&Tm.tm_mday,Month,&Tm.tm_year,
 747               &Tm.tm_hour,&Tm.tm_min,&Tm.tm_sec) != 6)
 748    {
 749       // Handle RFC 1036 time
 750       if (sscanf(I," %d-%3s-%d %d:%d:%d GMT",&Tm.tm_mday,Month,
 751                  &Tm.tm_year,&Tm.tm_hour,&Tm.tm_min,&Tm.tm_sec) == 6)
 752          Tm.tm_year += 1900;
 753       else
 754       {
 755          // asctime format
 756          if (sscanf(I," %3s %d %d:%d:%d %d",Month,&Tm.tm_mday,
 757                     &Tm.tm_hour,&Tm.tm_min,&Tm.tm_sec,&Tm.tm_year) != 6)
 758          {
 759             // 'ftp' time
 760             if (sscanf(Val.c_str(),"%4d%2d%2d%2d%2d%2d",&Tm.tm_year,&Tm.tm_mon,
 761                        &Tm.tm_mday,&Tm.tm_hour,&Tm.tm_min,&Tm.tm_sec) != 6)
 762                return false;
 763             Tm.tm_mon--;
 764          }
 765       }
 766    }
 767
 768    Tm.tm_isdst = 0;
 769    if (Month[0] != 0)
 770       Tm.tm_mon = MonthConv(Month);
 771    Tm.tm_year -= 1900;
 772
 773    // Convert to local time and then to GMT
 774    Result = timegm(&Tm);
 775    return true;
 776 }
 777                                                                         /*}}}*/
 778 // StrToNum - Convert a fixed length string to a number                 /*{{{*/
 779 // ---------------------------------------------------------------------
 780 /* This is used in decoding the crazy fixed length string headers in
 781    tar and ar files. */
 782 bool StrToNum(const char *Str,unsigned long &Res,unsigned Len,unsigned Base)
 783 {
 784    char S[30];
 785    if (Len >= sizeof(S))
 786       return false;
 787    memcpy(S,Str,Len);
 788    S[Len] = 0;
 789
 790    // All spaces is a zero
 791    Res = 0;
 792    unsigned I;
 793    for (I = 0; S[I] == ' '; I++);
 794    if (S[I] == 0)
 795       return true;
 796
 797    char *End;
 798    Res = strtoul(S,&End,Base);
 799    if (End == S)
 800       return false;
 801
 802    return true;
 803 }
 804                                                                         /*}}}*/
 805 // HexDigit - Convert a hex character into an integer                   /*{{{*/
 806 // ---------------------------------------------------------------------
 807 /* Helper for Hex2Num */
 808 static int HexDigit(int c)
 809 {
 810    if (c >= '0' && c <= '9')
 811       return c - '0';
 812    if (c >= 'a' && c <= 'f')
 813       return c - 'a' + 10;
 814    if (c >= 'A' && c <= 'F')
 815       return c - 'A' + 10;
 816    return 0;
 817 }
 818                                                                         /*}}}*/
 819 // Hex2Num - Convert a long hex number into a buffer                    /*{{{*/
 820 // ---------------------------------------------------------------------
 821 /* The length of the buffer must be exactly 1/2 the length of the string. */
 822 bool Hex2Num(string Str,unsigned char *Num,unsigned int Length)
 823 {
 824    if (Str.length() != Length*2)
 825       return false;
 826
 827    // Convert each digit. We store it in the same order as the string
 828    int J = 0;
 829    for (string::const_iterator I = Str.begin(); I != Str.end();J++, I += 2)
 830    {
 831       if (isxdigit(*I) == 0 || isxdigit(I[1]) == 0)
 832          return false;
 833
 834       Num[J] = HexDigit(I[0]) << 4;
 835       Num[J] += HexDigit(I[1]);
 836    }
 837
 838    return true;
 839 }
 840                                                                         /*}}}*/
 841 // TokSplitString - Split a string up by a given token                  /*{{{*/
 842 // ---------------------------------------------------------------------
 843 /* This is intended to be a faster splitter, it does not use dynamic
 844    memories. Input is changed to insert nulls at each token location. */
 845 bool TokSplitString(char Tok,char *Input,char **List,
 846                     unsigned long ListMax)
 847 {
 848    // Strip any leading spaces
 849    char *Start = Input;
 850    char *Stop = Start + strlen(Start);
 851    for (; *Start != 0 && isspace(*Start) != 0; Start++);
 852
 853    unsigned long Count = 0;
 854    char *Pos = Start;
 855    while (Pos != Stop)
 856    {
 857       // Skip to the next Token
 858       for (; Pos != Stop && *Pos != Tok; Pos++);
 859
 860       // Back remove spaces
 861       char *End = Pos;
 862       for (; End > Start && (End[-1] == Tok || isspace(End[-1]) != 0); End--);
 863       *End = 0;
 864
 865       List[Count++] = Start;
 866       if (Count >= ListMax)
 867       {
 868          List[Count-1] = 0;
 869          return false;
 870       }
 871
 872       // Advance pos
 873       for (; Pos != Stop && (*Pos == Tok || isspace(*Pos) != 0 || *Pos == 0); Pos++);
 874       Start = Pos;
 875    }
 876
 877    List[Count] = 0;
 878    return true;
 879 }
 880                                                                         /*}}}*/
 881 // RegexChoice - Simple regex list/list matcher                         /*{{{*/
 882 // ---------------------------------------------------------------------
 883 /* */
 884 unsigned long RegexChoice(RxChoiceList *Rxs,const char **ListBegin,
 885                       const char **ListEnd)
 886 {
 887    for (RxChoiceList *R = Rxs; R->Str != 0; R++)
 888       R->Hit = false;
 889
 890    unsigned long Hits = 0;
 891    for (; ListBegin != ListEnd; ListBegin++)
 892    {
 893       // Check if the name is a regex
 894       const char *I;
 895       bool Regex = true;
 896       for (I = *ListBegin; *I != 0; I++)
 897          if (*I == '.' || *I == '?' || *I == '*' || *I == '|')
 898             break;
 899       if (*I == 0)
 900          Regex = false;
 901
 902       // Compile the regex pattern
 903       regex_t Pattern;
 904       if (Regex == true)
 905          if (regcomp(&Pattern,*ListBegin,REG_EXTENDED | REG_ICASE |
 906                      REG_NOSUB) != 0)
 907             Regex = false;
 908
 909       // Search the list
 910       bool Done = false;
 911       for (RxChoiceList *R = Rxs; R->Str != 0; R++)
 912       {
 913          if (R->Str[0] == 0)
 914             continue;
 915
 916          if (strcasecmp(R->Str,*ListBegin) != 0)
 917          {
 918             if (Regex == false)
 919                continue;
 920             if (regexec(&Pattern,R->Str,0,0,0) != 0)
 921                continue;
 922          }
 923          Done = true;
 924
 925          if (R->Hit == false)
 926             Hits++;
 927
 928          R->Hit = true;
 929       }
 930
 931       if (Regex == true)
 932          regfree(&Pattern);
 933
 934       if (Done == false)
 935          _error->Warning(_("Selection %s not found"),*ListBegin);
 936    }
 937
 938    return Hits;
 939 }
 940                                                                         /*}}}*/
 941 // ioprintf - C format string outputter to C++ iostreams                /*{{{*/
 942 // ---------------------------------------------------------------------
 943 /* This is used to make the internationalization strinc easier to translate
 944  and to allow reordering of parameters */
 945 void ioprintf(ostream &out,const char *format,...)
 946 {
 947    va_list args;
 948    va_start(args,format);
 949
 950    // sprintf the description
 951    char S[400];
 952    vsnprintf(S,sizeof(S),format,args);
 953    out << S;
 954 }
 955                                                                         /*}}}*/
 956
 957 // CheckDomainList - See if Host is in a , seperate list                /*{{{*/
 958 // ---------------------------------------------------------------------
 959 /* The domain list is a comma seperate list of domains that are suffix
 960    matched against the argument */
 961 bool CheckDomainList(string Host,string List)
 962 {
 963    string::const_iterator Start = List.begin();
 964    for (string::const_iterator Cur = List.begin(); Cur <= List.end(); Cur++)
 965    {
 966       if (Cur < List.end() && *Cur != ',')
 967          continue;
 968
 969       // Match the end of the string..
 970       if ((Host.size() >= (unsigned)(Cur - Start)) &&
 971           Cur - Start != 0 &&
 972           stringcasecmp(Host.end() - (Cur - Start),Host.end(),Start,Cur) == 0)
 973          return true;
 974
 975       Start = Cur + 1;
 976    }
 977    return false;
 978 }
 979                                                                         /*}}}*/
 980
 981 // URI::CopyFrom - Copy from an object                                  /*{{{*/
 982 // ---------------------------------------------------------------------
 983 /* This parses the URI into all of its components */
 984 void URI::CopyFrom(string U)
 985 {
 986    string::const_iterator I = U.begin();
 987
 988    // Locate the first colon, this separates the scheme
 989    for (; I < U.end() && *I != ':' ; I++);
 990    string::const_iterator FirstColon = I;
 991
 992    /* Determine if this is a host type URI with a leading double //
 993       and then search for the first single / */
 994    string::const_iterator SingleSlash = I;
 995    if (I + 3 < U.end() && I[1] == '/' && I[2] == '/')
 996       SingleSlash += 3;
 997
 998    /* Find the / indicating the end of the hostname, ignoring /'s in the
 999       square brackets */
1000    bool InBracket = false;
1001    for (; SingleSlash < U.end() && (*SingleSlash != '/' || InBracket == true); SingleSlash++)
1002    {
1003       if (*SingleSlash == '[')
1004          InBracket = true;
1005       if (InBracket == true && *SingleSlash == ']')
1006          InBracket = false;
1007    }
1008
1009    if (SingleSlash > U.end())
1010       SingleSlash = U.end();
1011
1012    // We can now write the access and path specifiers
1013    Access = string(U,0,FirstColon - U.begin());
1014    if (SingleSlash != U.end())
1015       Path = string(U,SingleSlash - U.begin());
1016    if (Path.empty() == true)
1017       Path = "/";
1018
1019    // Now we attempt to locate a user:pass@host fragment
1020    if (FirstColon[1] == '/' && FirstColon[2] == '/')
1021       FirstColon += 3;
1022    else
1023       FirstColon += 1;
1024    if (FirstColon >= U.end())
1025       return;
1026
1027    if (FirstColon > SingleSlash)
1028       FirstColon = SingleSlash;
1029
1030    // Find the colon...
1031    I = FirstColon + 1;
1032    if (I > SingleSlash)
1033       I = SingleSlash;
1034    for (; I < SingleSlash && *I != ':'; I++);
1035    string::const_iterator SecondColon = I;
1036
1037    // Search for the @ after the colon
1038    for (; I < SingleSlash && *I != '@'; I++);
1039    string::const_iterator At = I;
1040
1041    // Now write the host and user/pass
1042    if (At == SingleSlash)
1043    {
1044       if (FirstColon < SingleSlash)
1045          Host = string(U,FirstColon - U.begin(),SingleSlash - FirstColon);
1046    }
1047    else
1048    {
1049       Host = string(U,At - U.begin() + 1,SingleSlash - At - 1);
1050       User = string(U,FirstColon - U.begin(),SecondColon - FirstColon);
1051       if (SecondColon < At)
1052          Password = string(U,SecondColon - U.begin() + 1,At - SecondColon - 1);
1053    }
1054
1055    // Now we parse the RFC 2732 [] hostnames.
1056    unsigned long PortEnd = 0;
1057    InBracket = false;
1058    for (unsigned I = 0; I != Host.length();)
1059    {
1060       if (Host[I] == '[')
1061       {
1062          InBracket = true;
1063          Host.erase(I,1);
1064          continue;
1065       }
1066
1067       if (InBracket == true && Host[I] == ']')
1068       {
1069          InBracket = false;
1070          Host.erase(I,1);
1071          PortEnd = I;
1072          continue;
1073       }
1074       I++;
1075    }
1076
1077    // Tsk, weird.
1078    if (InBracket == true)
1079    {
1080       Host = string();
1081       return;
1082    }
1083
1084    // Now we parse off a port number from the hostname
1085    Port = 0;
1086    string::size_type Pos = Host.rfind(':');
1087    if (Pos == string::npos || Pos < PortEnd)
1088       return;
1089
1090    Port = atoi(string(Host,Pos+1).c_str());
1091    Host = string(Host,0,Pos);
1092 }
1093                                                                         /*}}}*/
1094 // URI::operator string - Convert the URI to a string                   /*{{{*/
1095 // ---------------------------------------------------------------------
1096 /* */
1097 URI::operator string()
1098 {
1099    string Res;
1100
1101    if (Access.empty() == false)
1102       Res = Access + ':';
1103
1104    if (Host.empty() == false)
1105    {
1106       if (Access.empty() == false)
1107          Res += "//";
1108
1109       if (User.empty() == false)
1110       {
1111          Res +=  User;
1112          if (Password.empty() == false)
1113             Res += ":" + Password;
1114          Res += "@";
1115       }
1116
1117       // Add RFC 2732 escaping characters
1118       if (Access.empty() == false &&
1119           (Host.find('/') != string::npos || Host.find(':') != string::npos))
1120          Res += '[' + Host + ']';
1121       else
1122          Res += Host;
1123
1124       if (Port != 0)
1125       {
1126          char S[30];
1127          sprintf(S,":%u",Port);
1128          Res += S;
1129       }
1130    }
1131
1132    if (Path.empty() == false)
1133    {
1134       if (Path[0] != '/')
1135          Res += "/" + Path;
1136       else
1137          Res += Path;
1138    }
1139
1140    return Res;
1141 }
1142                                                                         /*}}}*/
1143 // URI::SiteOnly - Return the schema and site for the URI               /*{{{*/
1144 // ---------------------------------------------------------------------
1145 /* */
1146 string URI::SiteOnly(string URI)
1147 {
1148    ::URI U(URI);
1149    U.User = string();
1150    U.Password = string();
1151    U.Path = string();
1152    U.Port = 0;
1153    return U;
1154 }
1155                                                                         /*}}}*/