source4/lib/util_str.c

   1 /*
   2    Unix SMB/CIFS implementation.
   3    Samba utility functions
   4
   5    Copyright (C) Andrew Tridgell 1992-2001
   6    Copyright (C) Simo Sorce      2001-2002
   7    Copyright (C) Martin Pool     2003
   8
   9    This program is free software; you can redistribute it and/or modify
  10    it under the terms of the GNU General Public License as published by
  11    the Free Software Foundation; either version 2 of the License, or
  12    (at your option) any later version.
  13
  14    This program is distributed in the hope that it will be useful,
  15    but WITHOUT ANY WARRANTY; without even the implied warranty of
  16    MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the
  17    GNU General Public License for more details.
  18
  19    You should have received a copy of the GNU General Public License
  20    along with this program; if not, write to the Free Software
  21    Foundation, Inc., 675 Mass Ave, Cambridge, MA 02139, USA.
  22 */
  23
  24 #include "includes.h"
  25 #include "system/iconv.h"
  26 #include "smb.h"
  27 #include "pstring.h"
  28 #include "lib/ldb/include/ldb.h"
  29
  30 /**
  31  * @file
  32  * @brief String utilities.
  33  **/
  34
  35 /**
  36  * Get the next token from a string, return False if none found.
  37  * Handles double-quotes.
  38  *
  39  * Based on a routine by GJC@VILLAGE.COM.
  40  * Extensively modified by Andrew.Tridgell@anu.edu.au
  41  **/
  42 BOOL next_token(const char **ptr,char *buff, const char *sep, size_t bufsize)
  43 {
  44         const char *s;
  45         BOOL quoted;
  46         size_t len=1;
  47
  48         if (!ptr)
  49                 return(False);
  50
  51         s = *ptr;
  52
  53         /* default to simple separators */
  54         if (!sep)
  55                 sep = " \t\n\r";
  56
  57         /* find the first non sep char */
  58         while (*s && strchr_m(sep,*s))
  59                 s++;
  60
  61         /* nothing left? */
  62         if (! *s)
  63                 return(False);
  64
  65         /* copy over the token */
  66         for (quoted = False; len < bufsize && *s && (quoted || !strchr_m(sep,*s)); s++) {
  67                 if (*s == '\"') {
  68                         quoted = !quoted;
  69                 } else {
  70                         len++;
  71                         *buff++ = *s;
  72                 }
  73         }
  74
  75         *ptr = (*s) ? s+1 : s;
  76         *buff = 0;
  77
  78         return(True);
  79 }
  80
  81 /**
  82  Case insensitive string compararison
  83 **/
  84 int strcasecmp_m(const char *s1, const char *s2)
  85 {
  86         codepoint_t c1=0, c2=0;
  87         size_t size1, size2;
  88
  89         while (*s1 && *s2) {
  90                 c1 = next_codepoint(s1, &size1);
  91                 c2 = next_codepoint(s2, &size2);
  92
  93                 s1 += size1;
  94                 s2 += size2;
  95
  96                 if (c1 == c2) {
  97                         continue;
  98                 }
  99
 100                 if (c1 == INVALID_CODEPOINT ||
 101                     c2 == INVALID_CODEPOINT) {
 102                         /* what else can we do?? */
 103                         return c1 - c2;
 104                 }
 105
 106                 if (toupper_w(c1) != toupper_w(c2)) {
 107                         return c1 - c2;
 108                 }
 109         }
 110
 111         return *s1 - *s2;
 112 }
 113
 114 /**
 115  * Compare 2 strings.
 116  *
 117  * @note The comparison is case-insensitive.
 118  **/
 119 BOOL strequal(const char *s1, const char *s2)
 120 {
 121         if (s1 == s2)
 122                 return(True);
 123         if (!s1 || !s2)
 124                 return(False);
 125
 126         return strcasecmp_m(s1,s2) == 0;
 127 }
 128
 129 /**
 130  Compare 2 strings (case sensitive).
 131 **/
 132 BOOL strcsequal(const char *s1,const char *s2)
 133 {
 134         if (s1 == s2)
 135                 return(True);
 136         if (!s1 || !s2)
 137                 return(False);
 138
 139         return strcmp(s1,s2) == 0;
 140 }
 141
 142
 143 /**
 144 Do a case-insensitive, whitespace-ignoring string compare.
 145 **/
 146 int strwicmp(const char *psz1, const char *psz2)
 147 {
 148         /* if BOTH strings are NULL, return TRUE, if ONE is NULL return */
 149         /* appropriate value. */
 150         if (psz1 == psz2)
 151                 return (0);
 152         else if (psz1 == NULL)
 153                 return (-1);
 154         else if (psz2 == NULL)
 155                 return (1);
 156
 157         /* sync the strings on first non-whitespace */
 158         while (1) {
 159                 while (isspace((int)*psz1))
 160                         psz1++;
 161                 while (isspace((int)*psz2))
 162                         psz2++;
 163                 if (toupper((unsigned char)*psz1) != toupper((unsigned char)*psz2)
 164                     || *psz1 == '\0'
 165                     || *psz2 == '\0')
 166                         break;
 167                 psz1++;
 168                 psz2++;
 169         }
 170         return (*psz1 - *psz2);
 171 }
 172
 173 /**
 174  String replace.
 175  NOTE: oldc and newc must be 7 bit characters
 176 **/
 177 void string_replace(char *s, char oldc, char newc)
 178 {
 179         while (*s) {
 180                 size_t size;
 181                 codepoint_t c = next_codepoint(s, &size);
 182                 if (c == oldc) {
 183                         *s = newc;
 184                 }
 185                 s += size;
 186         }
 187 }
 188
 189 /**
 190  Trim the specified elements off the front and back of a string.
 191 **/
 192 BOOL trim_string(char *s,const char *front,const char *back)
 193 {
 194         BOOL ret = False;
 195         size_t front_len;
 196         size_t back_len;
 197         size_t len;
 198
 199         /* Ignore null or empty strings. */
 200         if (!s || (s[0] == '\0'))
 201                 return False;
 202
 203         front_len       = front? strlen(front) : 0;
 204         back_len        = back? strlen(back) : 0;
 205
 206         len = strlen(s);
 207
 208         if (front_len) {
 209                 while (len && strncmp(s, front, front_len)==0) {
 210                         /* Must use memmove here as src & dest can
 211                          * easily overlap. Found by valgrind. JRA. */
 212                         memmove(s, s+front_len, (len-front_len)+1);
 213                         len -= front_len;
 214                         ret=True;
 215                 }
 216         }
 217
 218         if (back_len) {
 219                 while ((len >= back_len) && strncmp(s+len-back_len,back,back_len)==0) {
 220                         s[len-back_len]='\0';
 221                         len -= back_len;
 222                         ret=True;
 223                 }
 224         }
 225         return ret;
 226 }
 227
 228 /**
 229  Find the number of 'c' chars in a string
 230 **/
 231 size_t count_chars(const char *s, char c)
 232 {
 233         size_t count = 0;
 234
 235         while (*s) {
 236                 size_t size;
 237                 codepoint_t c2 = next_codepoint(s, &size);
 238                 if (c2 == c) count++;
 239                 s += size;
 240         }
 241
 242         return count;
 243 }
 244
 245 /**
 246  Safe string copy into a known length string. maxlength does not
 247  include the terminating zero.
 248 **/
 249 char *safe_strcpy(char *dest,const char *src, size_t maxlength)
 250 {
 251         size_t len;
 252
 253         if (!dest) {
 254                 DEBUG(0,("ERROR: NULL dest in safe_strcpy\n"));
 255                 return NULL;
 256         }
 257
 258 #ifdef DEVELOPER
 259         /* We intentionally write out at the extremity of the destination
 260          * string.  If the destination is too short (e.g. pstrcpy into mallocd
 261          * or fstring) then this should cause an error under a memory
 262          * checker. */
 263         dest[maxlength] = '\0';
 264         if (PTR_DIFF(&len, dest) > 0) {  /* check if destination is on the stack, ok if so */
 265                 log_suspicious_usage("safe_strcpy", src);
 266         }
 267 #endif
 268
 269         if (!src) {
 270                 *dest = 0;
 271                 return dest;
 272         }
 273
 274         len = strlen(src);
 275
 276         if (len > maxlength) {
 277                 DEBUG(0,("ERROR: string overflow by %u (%u - %u) in safe_strcpy [%.50s]\n",
 278                          (uint_t)(len-maxlength), (unsigned)len, (unsigned)maxlength, src));
 279                 len = maxlength;
 280         }
 281
 282         memmove(dest, src, len);
 283         dest[len] = 0;
 284         return dest;
 285 }
 286
 287 /**
 288  Safe string cat into a string. maxlength does not
 289  include the terminating zero.
 290 **/
 291 char *safe_strcat(char *dest, const char *src, size_t maxlength)
 292 {
 293         size_t src_len, dest_len;
 294
 295         if (!dest) {
 296                 DEBUG(0,("ERROR: NULL dest in safe_strcat\n"));
 297                 return NULL;
 298         }
 299
 300         if (!src)
 301                 return dest;
 302
 303 #ifdef DEVELOPER
 304         if (PTR_DIFF(&src_len, dest) > 0) {  /* check if destination is on the stack, ok if so */
 305                 log_suspicious_usage("safe_strcat", src);
 306         }
 307 #endif
 308         src_len = strlen(src);
 309         dest_len = strlen(dest);
 310
 311         if (src_len + dest_len > maxlength) {
 312                 DEBUG(0,("ERROR: string overflow by %d in safe_strcat [%.50s]\n",
 313                          (int)(src_len + dest_len - maxlength), src));
 314                 if (maxlength > dest_len) {
 315                         memcpy(&dest[dest_len], src, maxlength - dest_len);
 316                 }
 317                 dest[maxlength] = 0;
 318                 return NULL;
 319         }
 320
 321         memcpy(&dest[dest_len], src, src_len);
 322         dest[dest_len + src_len] = 0;
 323         return dest;
 324 }
 325
 326 /**
 327  Paranoid strcpy into a buffer of given length (includes terminating
 328  zero. Strips out all but 'a-Z0-9' and the character in other_safe_chars
 329  and replaces with '_'. Deliberately does *NOT* check for multibyte
 330  characters. Don't change it !
 331 **/
 332
 333 char *alpha_strcpy(char *dest, const char *src, const char *other_safe_chars, size_t maxlength)
 334 {
 335         size_t len, i;
 336
 337         if (maxlength == 0) {
 338                 /* can't fit any bytes at all! */
 339                 return NULL;
 340         }
 341
 342         if (!dest) {
 343                 DEBUG(0,("ERROR: NULL dest in alpha_strcpy\n"));
 344                 return NULL;
 345         }
 346
 347         if (!src) {
 348                 *dest = 0;
 349                 return dest;
 350         }
 351
 352         len = strlen(src);
 353         if (len >= maxlength)
 354                 len = maxlength - 1;
 355
 356         if (!other_safe_chars)
 357                 other_safe_chars = "";
 358
 359         for(i = 0; i < len; i++) {
 360                 int val = (src[i] & 0xff);
 361                 if (isupper(val) || islower(val) || isdigit(val) || strchr_m(other_safe_chars, val))
 362                         dest[i] = src[i];
 363                 else
 364                         dest[i] = '_';
 365         }
 366
 367         dest[i] = '\0';
 368
 369         return dest;
 370 }
 371
 372 /**
 373  Like strncpy but always null terminates. Make sure there is room!
 374  The variable n should always be one less than the available size.
 375 **/
 376
 377 char *StrnCpy(char *dest,const char *src,size_t n)
 378 {
 379         char *d = dest;
 380         if (!dest)
 381                 return(NULL);
 382         if (!src) {
 383                 *dest = 0;
 384                 return(dest);
 385         }
 386         while (n-- && (*d++ = *src++))
 387                 ;
 388         *d = 0;
 389         return(dest);
 390 }
 391
 392
 393 /**
 394  Routine to get hex characters and turn them into a 16 byte array.
 395  the array can be variable length, and any non-hex-numeric
 396  characters are skipped.  "0xnn" or "0Xnn" is specially catered
 397  for.
 398
 399  valid examples: "0A5D15"; "0x15, 0x49, 0xa2"; "59\ta9\te3\n"
 400
 401
 402 **/
 403 size_t strhex_to_str(char *p, size_t len, const char *strhex)
 404 {
 405         size_t i;
 406         size_t num_chars = 0;
 407         uint8_t   lonybble, hinybble;
 408         const char     *hexchars = "0123456789ABCDEF";
 409         char           *p1 = NULL, *p2 = NULL;
 410
 411         for (i = 0; i < len && strhex[i] != 0; i++) {
 412                 if (strncasecmp(hexchars, "0x", 2) == 0) {
 413                         i++; /* skip two chars */
 414                         continue;
 415                 }
 416
 417                 if (!(p1 = strchr_m(hexchars, toupper((unsigned char)strhex[i]))))
 418                         break;
 419
 420                 i++; /* next hex digit */
 421
 422                 if (!(p2 = strchr_m(hexchars, toupper((unsigned char)strhex[i]))))
 423                         break;
 424
 425                 /* get the two nybbles */
 426                 hinybble = PTR_DIFF(p1, hexchars);
 427                 lonybble = PTR_DIFF(p2, hexchars);
 428
 429                 p[num_chars] = (hinybble << 4) | lonybble;
 430                 num_chars++;
 431
 432                 p1 = NULL;
 433                 p2 = NULL;
 434         }
 435         return num_chars;
 436 }
 437
 438 DATA_BLOB strhex_to_data_blob(const char *strhex)
 439 {
 440         DATA_BLOB ret_blob = data_blob(NULL, strlen(strhex)/2+1);
 441
 442         ret_blob.length = strhex_to_str(ret_blob.data,
 443                                         strlen(strhex),
 444                                         strhex);
 445
 446         return ret_blob;
 447 }
 448
 449
 450 /**
 451  * Routine to print a buffer as HEX digits, into an allocated string.
 452  */
 453 void hex_encode(const unsigned char *buff_in, size_t len, char **out_hex_buffer)
 454 {
 455         int i;
 456         char *hex_buffer;
 457
 458         *out_hex_buffer = smb_xmalloc((len*2)+1);
 459         hex_buffer = *out_hex_buffer;
 460
 461         for (i = 0; i < len; i++)
 462                 slprintf(&hex_buffer[i*2], 3, "%02X", buff_in[i]);
 463 }
 464
 465 /**
 466  Check if a string is part of a list.
 467 **/
 468 BOOL in_list(const char *s, const char *list, BOOL casesensitive)
 469 {
 470         pstring tok;
 471         const char *p=list;
 472
 473         if (!list)
 474                 return(False);
 475
 476         while (next_token(&p,tok,LIST_SEP,sizeof(tok))) {
 477                 if (casesensitive) {
 478                         if (strcmp(tok,s) == 0)
 479                                 return(True);
 480                 } else {
 481                         if (strcasecmp_m(tok,s) == 0)
 482                                 return(True);
 483                 }
 484         }
 485         return(False);
 486 }
 487
 488 /**
 489  Set a string value, allocing the space for the string
 490 **/
 491 static BOOL string_init(char **dest,const char *src)
 492 {
 493         if (!src) src = "";
 494
 495         (*dest) = strdup(src);
 496         if ((*dest) == NULL) {
 497                 DEBUG(0,("Out of memory in string_init\n"));
 498                 return False;
 499         }
 500         return True;
 501 }
 502
 503 /**
 504  Free a string value.
 505 **/
 506 void string_free(char **s)
 507 {
 508         if (s) SAFE_FREE(*s);
 509 }
 510
 511 /**
 512  Set a string value, deallocating any existing space, and allocing the space
 513  for the string
 514 **/
 515 BOOL string_set(char **dest, const char *src)
 516 {
 517         string_free(dest);
 518         return string_init(dest,src);
 519 }
 520
 521 /**
 522  Substitute a string for a pattern in another string. Make sure there is
 523  enough room!
 524
 525  This routine looks for pattern in s and replaces it with
 526  insert. It may do multiple replacements.
 527
 528  Any of " ; ' $ or ` in the insert string are replaced with _
 529  if len==0 then the string cannot be extended. This is different from the old
 530  use of len==0 which was for no length checks to be done.
 531 **/
 532
 533 void string_sub(char *s,const char *pattern, const char *insert, size_t len)
 534 {
 535         char *p;
 536         ssize_t ls,lp,li, i;
 537
 538         if (!insert || !pattern || !*pattern || !s)
 539                 return;
 540
 541         ls = (ssize_t)strlen(s);
 542         lp = (ssize_t)strlen(pattern);
 543         li = (ssize_t)strlen(insert);
 544
 545         if (len == 0)
 546                 len = ls + 1; /* len is number of *bytes* */
 547
 548         while (lp <= ls && (p = strstr(s,pattern))) {
 549                 if (ls + (li-lp) >= len) {
 550                         DEBUG(0,("ERROR: string overflow by %d in string_sub(%.50s, %d)\n",
 551                                  (int)(ls + (li-lp) - len),
 552                                  pattern, (int)len));
 553                         break;
 554                 }
 555                 if (li != lp) {
 556                         memmove(p+li,p+lp,strlen(p+lp)+1);
 557                 }
 558                 for (i=0;i<li;i++) {
 559                         switch (insert[i]) {
 560                         case '`':
 561                         case '"':
 562                         case '\'':
 563                         case ';':
 564                         case '$':
 565                         case '%':
 566                         case '\r':
 567                         case '\n':
 568                                 p[i] = '_';
 569                                 break;
 570                         default:
 571                                 p[i] = insert[i];
 572                         }
 573                 }
 574                 s = p + li;
 575                 ls += (li-lp);
 576         }
 577 }
 578
 579
 580 /**
 581  Similar to string_sub() but allows for any character to be substituted.
 582  Use with caution!
 583  if len==0 then the string cannot be extended. This is different from the old
 584  use of len==0 which was for no length checks to be done.
 585 **/
 586
 587 void all_string_sub(char *s,const char *pattern,const char *insert, size_t len)
 588 {
 589         char *p;
 590         ssize_t ls,lp,li;
 591
 592         if (!insert || !pattern || !s)
 593                 return;
 594
 595         ls = (ssize_t)strlen(s);
 596         lp = (ssize_t)strlen(pattern);
 597         li = (ssize_t)strlen(insert);
 598
 599         if (!*pattern)
 600                 return;
 601
 602         if (len == 0)
 603                 len = ls + 1; /* len is number of *bytes* */
 604
 605         while (lp <= ls && (p = strstr(s,pattern))) {
 606                 if (ls + (li-lp) >= len) {
 607                         DEBUG(0,("ERROR: string overflow by %d in all_string_sub(%.50s, %d)\n",
 608                                  (int)(ls + (li-lp) - len),
 609                                  pattern, (int)len));
 610                         break;
 611                 }
 612                 if (li != lp) {
 613                         memmove(p+li,p+lp,strlen(p+lp)+1);
 614                 }
 615                 memcpy(p, insert, li);
 616                 s = p + li;
 617                 ls += (li-lp);
 618         }
 619 }
 620
 621
 622 /**
 623  Strchr and strrchr_m are a bit complex on general multi-byte strings.
 624 **/
 625 char *strchr_m(const char *s, char c)
 626 {
 627         /* characters below 0x3F are guaranteed to not appear in
 628            non-initial position in multi-byte charsets */
 629         if ((c & 0xC0) == 0) {
 630                 return strchr(s, c);
 631         }
 632
 633         while (*s) {
 634                 size_t size;
 635                 codepoint_t c2 = next_codepoint(s, &size);
 636                 if (c2 == c) {
 637                         return discard_const(s);
 638                 }
 639                 s += size;
 640         }
 641
 642         return NULL;
 643 }
 644
 645 char *strrchr_m(const char *s, char c)
 646 {
 647         char *ret = NULL;
 648
 649         /* characters below 0x3F are guaranteed to not appear in
 650            non-initial position in multi-byte charsets */
 651         if ((c & 0xC0) == 0) {
 652                 return strrchr(s, c);
 653         }
 654
 655         while (*s) {
 656                 size_t size;
 657                 codepoint_t c2 = next_codepoint(s, &size);
 658                 if (c2 == c) {
 659                         ret = discard_const(s);
 660                 }
 661                 s += size;
 662         }
 663
 664         return ret;
 665 }
 666
 667 /*
 668   return True if any (multi-byte) character is lower case
 669 */
 670 BOOL strhaslower(const char *string)
 671 {
 672         while (*string) {
 673                 size_t c_size;
 674                 codepoint_t s;
 675                 codepoint_t t;
 676
 677                 s = next_codepoint(string, &c_size);
 678                 string += c_size;
 679
 680                 t = toupper_w(s);
 681
 682                 if (s != t) {
 683                         return True; /* that means it has lower case chars */
 684                 }
 685         }
 686
 687         return False;
 688 }
 689
 690 /*
 691   return True if any (multi-byte) character is upper case
 692 */
 693 BOOL strhasupper(const char *string)
 694 {
 695         while (*string) {
 696                 size_t c_size;
 697                 codepoint_t s;
 698                 codepoint_t t;
 699
 700                 s = next_codepoint(string, &c_size);
 701                 string += c_size;
 702
 703                 t = tolower_w(s);
 704
 705                 if (s != t) {
 706                         return True; /* that means it has upper case chars */
 707                 }
 708         }
 709
 710         return False;
 711 }
 712
 713 /**
 714  Convert a string to lower case, allocated with talloc
 715 **/
 716 char *strlower_talloc(TALLOC_CTX *ctx, const char *src)
 717 {
 718         size_t size=0;
 719         char *dest;
 720
 721         /* this takes advantage of the fact that upper/lower can't
 722            change the length of a character by more than 1 byte */
 723         dest = talloc_size(ctx, 2*(strlen(src))+1);
 724         if (dest == NULL) {
 725                 return NULL;
 726         }
 727
 728         while (*src) {
 729                 size_t c_size;
 730                 codepoint_t c = next_codepoint(src, &c_size);
 731                 src += c_size;
 732
 733                 c = tolower_w(c);
 734
 735                 c_size = push_codepoint(dest+size, c);
 736                 if (c_size == -1) {
 737                         talloc_free(dest);
 738                         return NULL;
 739                 }
 740                 size += c_size;
 741         }
 742
 743         dest[size] = 0;
 744
 745         return dest;
 746 }
 747
 748 /**
 749  Convert a string to UPPER case, allocated with talloc
 750 **/
 751 char *strupper_talloc(TALLOC_CTX *ctx, const char *src)
 752 {
 753         size_t size=0;
 754         char *dest;
 755
 756         if (!src) {
 757                 return NULL;
 758         }
 759
 760         /* this takes advantage of the fact that upper/lower can't
 761            change the length of a character by more than 1 byte */
 762         dest = talloc_size(ctx, 2*(strlen(src))+1);
 763         if (dest == NULL) {
 764                 return NULL;
 765         }
 766
 767         while (*src) {
 768                 size_t c_size;
 769                 codepoint_t c = next_codepoint(src, &c_size);
 770                 src += c_size;
 771
 772                 c = toupper_w(c);
 773
 774                 c_size = push_codepoint(dest+size, c);
 775                 if (c_size == -1) {
 776                         talloc_free(dest);
 777                         return NULL;
 778                 }
 779                 size += c_size;
 780         }
 781
 782         dest[size] = 0;
 783
 784         return dest;
 785 }
 786
 787 /**
 788  Convert a string to lower case.
 789 **/
 790 void strlower_m(char *s)
 791 {
 792         char *d;
 793
 794         /* this is quite a common operation, so we want it to be
 795            fast. We optimise for the ascii case, knowing that all our
 796            supported multi-byte character sets are ascii-compatible
 797            (ie. they match for the first 128 chars) */
 798         while (*s && !(((uint8_t)s[0]) & 0x7F)) {
 799                 *s = tolower((uint8_t)*s);
 800                 s++;
 801         }
 802
 803         if (!*s)
 804                 return;
 805
 806         d = s;
 807
 808         while (*s) {
 809                 size_t c_size, c_size2;
 810                 codepoint_t c = next_codepoint(s, &c_size);
 811                 c_size2 = push_codepoint(d, tolower_w(c));
 812                 if (c_size2 > c_size) {
 813                         DEBUG(0,("FATAL: codepoint 0x%x (0x%x) expanded from %d to %d bytes in strlower_m\n",
 814                                  c, tolower_w(c), (int)c_size, (int)c_size2));
 815                         smb_panic("codepoint expansion in strlower_m\n");
 816                 }
 817                 s += c_size;
 818                 d += c_size2;
 819         }
 820         *d = 0;
 821 }
 822
 823 /**
 824  Convert a string to UPPER case.
 825 **/
 826 void strupper_m(char *s)
 827 {
 828         char *d;
 829
 830         /* this is quite a common operation, so we want it to be
 831            fast. We optimise for the ascii case, knowing that all our
 832            supported multi-byte character sets are ascii-compatible
 833            (ie. they match for the first 128 chars) */
 834         while (*s && !(((uint8_t)s[0]) & 0x7F)) {
 835                 *s = toupper((uint8_t)*s);
 836                 s++;
 837         }
 838
 839         if (!*s)
 840                 return;
 841
 842         d = s;
 843
 844         while (*s) {
 845                 size_t c_size, c_size2;
 846                 codepoint_t c = next_codepoint(s, &c_size);
 847                 c_size2 = push_codepoint(d, toupper_w(c));
 848                 if (c_size2 > c_size) {
 849                         DEBUG(0,("FATAL: codepoint 0x%x (0x%x) expanded from %d to %d bytes in strupper_m\n",
 850                                  c, toupper_w(c), (int)c_size, (int)c_size2));
 851                         smb_panic("codepoint expansion in strupper_m\n");
 852                 }
 853                 s += c_size;
 854                 d += c_size2;
 855         }
 856         *d = 0;
 857 }
 858
 859 /**
 860  Count the number of UCS2 characters in a string. Normally this will
 861  be the same as the number of bytes in a string for single byte strings,
 862  but will be different for multibyte.
 863 **/
 864 size_t strlen_m(const char *s)
 865 {
 866         size_t count = 0;
 867
 868         if (!s) {
 869                 return 0;
 870         }
 871
 872         while (*s && !(((uint8_t)s[0]) & 0x7F)) {
 873                 s++;
 874                 count++;
 875         }
 876
 877         if (!*s) {
 878                 return count;
 879         }
 880
 881         while (*s) {
 882                 size_t c_size;
 883                 codepoint_t c = next_codepoint(s, &c_size);
 884                 if (c < 0x10000) {
 885                         count += 1;
 886                 } else {
 887                         count += 2;
 888                 }
 889                 s += c_size;
 890         }
 891
 892         return count;
 893 }
 894
 895 /**
 896    Work out the number of multibyte chars in a string, including the NULL
 897    terminator.
 898 **/
 899 size_t strlen_m_term(const char *s)
 900 {
 901         if (!s) {
 902                 return 0;
 903         }
 904
 905         return strlen_m(s) + 1;
 906 }
 907
 908 /**
 909  Unescape a URL encoded string, in place.
 910 **/
 911
 912 void rfc1738_unescape(char *buf)
 913 {
 914         char *p=buf;
 915
 916         while ((p=strchr_m(p,'+')))
 917                 *p = ' ';
 918
 919         p = buf;
 920
 921         while (p && *p && (p=strchr_m(p,'%'))) {
 922                 int c1 = p[1];
 923                 int c2 = p[2];
 924
 925                 if (c1 >= '0' && c1 <= '9')
 926                         c1 = c1 - '0';
 927                 else if (c1 >= 'A' && c1 <= 'F')
 928                         c1 = 10 + c1 - 'A';
 929                 else if (c1 >= 'a' && c1 <= 'f')
 930                         c1 = 10 + c1 - 'a';
 931                 else {p++; continue;}
 932
 933                 if (c2 >= '0' && c2 <= '9')
 934                         c2 = c2 - '0';
 935                 else if (c2 >= 'A' && c2 <= 'F')
 936                         c2 = 10 + c2 - 'A';
 937                 else if (c2 >= 'a' && c2 <= 'f')
 938                         c2 = 10 + c2 - 'a';
 939                 else {p++; continue;}
 940
 941                 *p = (c1<<4) | c2;
 942
 943                 memmove(p+1, p+3, strlen(p+3)+1);
 944                 p++;
 945         }
 946 }
 947
 948 /**
 949  * Decode a base64 string into a DATA_BLOB - simple and slow algorithm
 950  **/
 951 DATA_BLOB base64_decode_data_blob(TALLOC_CTX *mem_ctx, const char *s)
 952 {
 953         DATA_BLOB ret = data_blob_talloc(mem_ctx, s, strlen(s)+1);
 954         ret.length = ldb_base64_decode(ret.data);
 955         return ret;
 956 }
 957
 958 /**
 959  * Decode a base64 string in-place - wrapper for the above
 960  **/
 961 void base64_decode_inplace(char *s)
 962 {
 963         ldb_base64_decode(s);
 964 }
 965
 966 /**
 967  * Encode a base64 string into a talloc()ed string caller to free.
 968  **/
 969 char *base64_encode_data_blob(TALLOC_CTX *mem_ctx, DATA_BLOB data)
 970 {
 971         return ldb_base64_encode(mem_ctx, data.data, data.length);
 972 }
 973
 974 #ifdef VALGRIND
 975 size_t valgrind_strlen(const char *s)
 976 {
 977         size_t count;
 978         for(count = 0; *s++; count++)
 979                 ;
 980         return count;
 981 }
 982 #endif
 983
 984
 985 /*
 986   format a string into length-prefixed dotted domain format, as used in NBT
 987   and in some ADS structures
 988 */
 989 const char *str_format_nbt_domain(TALLOC_CTX *mem_ctx, const char *s)
 990 {
 991         char *ret;
 992         int i;
 993         if (!s || !*s) {
 994                 return talloc_strdup(mem_ctx, "");
 995         }
 996         ret = talloc_size(mem_ctx, strlen(s)+2);
 997         if (!ret) {
 998                 return ret;
 999         }
1000
1001         memcpy(ret+1, s, strlen(s)+1);
1002         ret[0] = '.';
1003
1004         for (i=0;ret[i];i++) {
1005                 if (ret[i] == '.') {
1006                         char *p = strchr(ret+i+1, '.');
1007                         if (p) {
1008                                 ret[i] = p-(ret+i+1);
1009                         } else {
1010                                 ret[i] = strlen(ret+i+1);
1011                         }
1012                 }
1013         }
1014
1015         return ret;
1016 }
1017
1018 BOOL add_string_to_array(TALLOC_CTX *mem_ctx,
1019                          const char *str, const char ***strings, int *num)
1020 {
1021         char *dup_str = talloc_strdup(mem_ctx, str);
1022
1023         *strings = talloc_realloc(mem_ctx,
1024                                     *strings,
1025                                     const char *, ((*num)+1));
1026
1027         if ((*strings == NULL) || (dup_str == NULL))
1028                 return False;
1029
1030         (*strings)[*num] = dup_str;
1031         *num += 1;
1032
1033         return True;
1034 }
1035
1036
1037
/*
  variant of strcmp() that handles NULL ptrs

  Identical pointers (including two NULLs) compare equal.  If only s1
  is NULL the result is 1, if only s2 is NULL the result is -1;
  otherwise strcmp() decides.
*/
int strcmp_safe(const char *s1, const char *s2)
{
	if (s1 != s2) {
		if (s1 == NULL) {
			return 1;
		}
		if (s2 == NULL) {
			return -1;
		}
		return strcmp(s1, s2);
	}

	return 0;
}
1051
1052
/*******************************************************************
 Return the number of bytes occupied by a string in ASCII format.
 At most 'n' bytes of src are examined.  If a terminator is found
 within those 'n' bytes it is included in the result; otherwise the
 result is 'n'.
********************************************************************/
size_t ascii_len_n(const char *src, size_t n)
{
	size_t len = 0;

	while (len < n && src[len] != '\0') {
		len++;
	}

	/* len < n means we stopped on the terminator: count it too */
	return (len < n) ? len + 1 : len;
}
1069
1070
1071 /*******************************************************************
1072  Return a string representing a CIFS attribute for a file.
1073 ********************************************************************/
1074 char *attrib_string(TALLOC_CTX *mem_ctx, uint32_t attrib)
1075 {
1076         int i, len;
1077         const struct {
1078                 char c;
1079                 uint16_t attr;
1080         } attr_strs[] = {
1081                 {'V', FILE_ATTRIBUTE_VOLUME},
1082                 {'D', FILE_ATTRIBUTE_DIRECTORY},
1083                 {'A', FILE_ATTRIBUTE_ARCHIVE},
1084                 {'H', FILE_ATTRIBUTE_HIDDEN},
1085                 {'S', FILE_ATTRIBUTE_SYSTEM},
1086                 {'N', FILE_ATTRIBUTE_NORMAL},
1087                 {'R', FILE_ATTRIBUTE_READONLY},
1088                 {'d', FILE_ATTRIBUTE_DEVICE},
1089                 {'t', FILE_ATTRIBUTE_TEMPORARY},
1090                 {'s', FILE_ATTRIBUTE_SPARSE},
1091                 {'r', FILE_ATTRIBUTE_REPARSE_POINT},
1092                 {'c', FILE_ATTRIBUTE_COMPRESSED},
1093                 {'o', FILE_ATTRIBUTE_OFFLINE},
1094                 {'n', FILE_ATTRIBUTE_NONINDEXED},
1095                 {'e', FILE_ATTRIBUTE_ENCRYPTED}
1096         };
1097         char *ret;
1098
1099         ret = talloc_size(mem_ctx, ARRAY_SIZE(attr_strs)+1);
1100         if (!ret) {
1101                 return NULL;
1102         }
1103
1104         for (len=i=0; i<ARRAY_SIZE(attr_strs); i++) {
1105                 if (attrib & attr_strs[i].attr) {
1106                         ret[len++] = attr_strs[i].c;
1107                 }
1108         }
1109
1110         ret[len] = 0;
1111
1112         return ret;
1113 }