Fix the mess with ldb includes.

[metze/samba/wip.git] / source4 / lib / ldb / common / attrib_handlers.c
diff --git a/source4/lib/ldb/common/attrib_handlers.c b/source4/lib/ldb/common/attrib_handlers.c

index 4b6a7af1eedd6f4dc52c48b67c5623c13c31b386..80725ec04f9c5966a08964ac5e641b403c4ba2c9 100644 (file)
--- a/source4/lib/ldb/common/attrib_handlers.c
+++ b/source4/lib/ldb/common/attrib_handlers.c
@@ -10,7 +10,7 @@
     This library is free software; you can redistribute it and/or
     modify it under the terms of the GNU Lesser General Public
     License as published by the Free Software Foundation; either
-   version 2 of the License, or (at your option) any later version.
+   version 3 of the License, or (at your option) any later version.
  
     This library is distributed in the hope that it will be useful,
     but WITHOUT ANY WARRANTY; without even the implied warranty of
@@ -18,16 +18,16 @@
     Lesser General Public License for more details.
  
     You should have received a copy of the GNU Lesser General Public
-   License along with this library; if not, write to the Free Software
-   Foundation, Inc., 59 Temple Place, Suite 330, Boston, MA  02111-1307  USA
+   License along with this library; if not, see <http://www.gnu.org/licenses/>.
  */
  /*
    attribute handlers for well known attribute types, selected by syntax OID
    see rfc2252
  */
  
-#include "includes.h"
-#include "ldb/include/includes.h"
+#include "ldb_private.h"
+#include "system/locale.h"
+#include "ldb_handlers.h"
  
  /*
    default handler that just copies a ldb_val.
@@ -50,16 +50,17 @@ int ldb_handler_copy(struct ldb_context *ldb, void *mem_ctx,
    We exploit the fact that utf8 never uses the space octet except for
    the space itself
  */
-static int ldb_handler_fold(struct ldb_context *ldb, void *mem_ctx,
+int ldb_handler_fold(struct ldb_context *ldb, void *mem_ctx,
                             const struct ldb_val *in, struct ldb_val *out)
  {
         char *s, *t;
         int l;
+
         if (!in || !out || !(in->data)) {
                 return -1;
         }
  
-       out->data = (uint8_t *)ldb_casefold(ldb, mem_ctx, (const char *)(in->data));
+       out->data = (uint8_t *)ldb_casefold(ldb, mem_ctx, (const char *)(in->data), in->length);
         if (out->data == NULL) {
                 ldb_debug(ldb, LDB_DEBUG_ERROR, "ldb_handler_fold: unable to casefold string [%s]", in->data);
                 return -1;
@@ -69,7 +70,7 @@ static int ldb_handler_fold(struct ldb_context *ldb, void *mem_ctx,
         
         /* remove trailing spaces if any */
         l = strlen(s);
-       while (s[l - 1] == ' ') l--;
+       while (l > 0 && s[l - 1] == ' ') l--;
         s[l] = '\0';
         
         /* remove leading spaces if any */
@@ -104,7 +105,7 @@ static int ldb_handler_fold(struct ldb_context *ldb, void *mem_ctx,
    canonicalise a ldap Integer
    rfc2252 specifies it should be in decimal form
  */
-static int ldb_canonicalise_Integer(struct ldb_context *ldb, void *mem_ctx,
+int ldb_canonicalise_Integer(struct ldb_context *ldb, void *mem_ctx,
                                     const struct ldb_val *in, struct ldb_val *out)
  {
         char *end;
@@ -123,7 +124,7 @@ static int ldb_canonicalise_Integer(struct ldb_context *ldb, void *mem_ctx,
  /*
    compare two Integers
  */
-static int ldb_comparison_Integer(struct ldb_context *ldb, void *mem_ctx,
+int ldb_comparison_Integer(struct ldb_context *ldb, void *mem_ctx,
                                   const struct ldb_val *v1, const struct ldb_val *v2)
  {
         return strtoll((char *)v1->data, NULL, 0) - strtoll((char *)v2->data, NULL, 0);
@@ -145,39 +146,92 @@ int ldb_comparison_binary(struct ldb_context *ldb, void *mem_ctx,
    compare two case insensitive strings, ignoring multiple whitespaces
    and leading and trailing whitespaces
    see rfc2252 section 8.1
+       
+  try to optimize for the ascii case,
+  but if we find out an utf8 codepoint revert to slower but correct function
  */
-static int ldb_comparison_fold(struct ldb_context *ldb, void *mem_ctx,
+int ldb_comparison_fold(struct ldb_context *ldb, void *mem_ctx,
                                const struct ldb_val *v1, const struct ldb_val *v2)
  {
         const char *s1=(const char *)v1->data, *s2=(const char *)v2->data;
-       while (*s1 == ' ') s1++;
-       while (*s2 == ' ') s2++;
+       size_t n1 = v1->length, n2 = v2->length;
+       const char *u1, *u2;
+       char *b1, *b2;
+       int ret;
+       while (*s1 == ' ' && n1) { s1++; n1--; };
+       while (*s2 == ' ' && n2) { s2++; n2--; };
         /* TODO: make utf8 safe, possibly with helper function from application */
-       while (*s1 && *s2) {
+       while (*s1 && *s2 && n1 && n2) {
+               /* the first 127 (0x7F) chars are ascii and utf8 guarantes they
+                * never appear in multibyte sequences */
+               if (((unsigned char)s1[0]) & 0x80) goto utf8str;
+               if (((unsigned char)s2[0]) & 0x80) goto utf8str;
                 if (toupper((unsigned char)*s1) != toupper((unsigned char)*s2))
                         break;
                 if (*s1 == ' ') {
-                       while (s1[0] == s1[1]) s1++;
-                       while (s2[0] == s2[1]) s2++;
+                       while (s1[0] == s1[1] && n1) { s1++; n1--; }
+                       while (s2[0] == s2[1] && n2) { s2++; n2--; }
                 }
                 s1++; s2++;
+               n1--; n2--;
         }
         if (! (*s1 && *s2)) {
-               /* remove trailing spaces only if one of the pointers
+               /* check for trailing spaces only if one of the pointers
                  * has reached the end of the strings otherwise we
                  * can mistakenly match.
                  * ex. "domain users" <-> "domainUpdates"
                  */
-               while (*s1 == ' ') s1++;
-               while (*s2 == ' ') s2++;
+               while (*s1 == ' ') { s1++; n1--; }
+               while (*s2 == ' ') { s2++; n2--; }
+       }
+       if (n1 != n2) {
+               return n1 - n2;
         }
         return (int)(toupper(*s1)) - (int)(toupper(*s2));
+
+utf8str:
+       /* no need to recheck from the start, just from the first utf8 char found */
+       b1 = ldb_casefold(ldb, mem_ctx, s1, n1);
+       b2 = ldb_casefold(ldb, mem_ctx, s2, n2);
+
+       if (b1 && b2) {
+               /* Both strings converted correctly */
+
+               u1 = b1;
+               u2 = b2;
+       } else {
+               /* One of the strings was not UTF8, so we have no options but to do a binary compare */
+
+               u1 = s1;
+               u2 = s2;
+       }
+
+       while (*u1 & *u2) {
+               if (*u1 != *u2)
+                       break;
+               if (*u1 == ' ') {
+                       while (u1[0] == u1[1]) u1++;
+                       while (u2[0] == u2[1]) u2++;
+               }
+               u1++; u2++;
+       }
+       if (! (*u1 && *u2)) {
+               while (*u1 == ' ') u1++;
+               while (*u2 == ' ') u2++;
+       }
+       ret = (int)(*u1 - *u2);
+
+       talloc_free(b1);
+       talloc_free(b2);
+       
+       return ret;
  }
  
+
  /*
    canonicalise a attribute in DN format
  */
-static int ldb_canonicalise_dn(struct ldb_context *ldb, void *mem_ctx,
+int ldb_canonicalise_dn(struct ldb_context *ldb, void *mem_ctx,
                                const struct ldb_val *in, struct ldb_val *out)
  {
         struct ldb_dn *dn;
@@ -186,12 +240,12 @@ static int ldb_canonicalise_dn(struct ldb_context *ldb, void *mem_ctx,
         out->length = 0;
         out->data = NULL;
  
-       dn = ldb_dn_explode_casefold(ldb, (char *)in->data);
-       if (dn == NULL) {
-               return -1;
+       dn = ldb_dn_from_ldb_val(ldb, mem_ctx, in);
+       if ( ! ldb_dn_validate(dn)) {
+               return LDB_ERR_INVALID_DN_SYNTAX;
         }
  
-       out->data = (uint8_t *)ldb_dn_linearize(mem_ctx, dn);
+       out->data = (uint8_t *)ldb_dn_alloc_casefold(mem_ctx, dn);
         if (out->data == NULL) {
                 goto done;
         }
@@ -208,59 +262,32 @@ done:
  /*
    compare two dns
  */
-static int ldb_comparison_dn(struct ldb_context *ldb, void *mem_ctx,
+int ldb_comparison_dn(struct ldb_context *ldb, void *mem_ctx,
                              const struct ldb_val *v1, const struct ldb_val *v2)
  {
         struct ldb_dn *dn1 = NULL, *dn2 = NULL;
         int ret;
  
-       dn1 = ldb_dn_explode_casefold(mem_ctx, (char *)v1->data);
-       if (dn1 == NULL) return -1;
+       dn1 = ldb_dn_from_ldb_val(ldb, mem_ctx, v1);
+       if ( ! ldb_dn_validate(dn1)) return -1;
  
-       dn2 = ldb_dn_explode_casefold(mem_ctx, (char *)v2->data);
-       if (dn2 == NULL) {
+       dn2 = ldb_dn_from_ldb_val(ldb, mem_ctx, v2);
+       if ( ! ldb_dn_validate(dn2)) {
                 talloc_free(dn1);
                 return -1;
         } 
  
-       ret = ldb_dn_compare(ldb, dn1, dn2);
+       ret = ldb_dn_compare(dn1, dn2);
  
         talloc_free(dn1);
         talloc_free(dn2);
         return ret;
  }
  
-/*
-  compare two objectclasses, looking at subclasses
-*/
-static int ldb_comparison_objectclass(struct ldb_context *ldb, void *mem_ctx,
-                                     const struct ldb_val *v1, const struct ldb_val *v2)
-{
-       int ret, i;
-       const char **subclasses;
-       ret = ldb_comparison_fold(ldb, mem_ctx, v1, v2);
-       if (ret == 0) {
-               return 0;
-       }
-       subclasses = ldb_subclass_list(ldb, (char *)v1->data);
-       if (subclasses == NULL) {
-               return ret;
-       }
-       for (i=0;subclasses[i];i++) {
-               struct ldb_val vs;
-               vs.data = discard_const(subclasses[i]);
-               vs.length = strlen(subclasses[i]);
-               if (ldb_comparison_objectclass(ldb, mem_ctx, &vs, v2) == 0) {
-                       return 0;
-               }
-       }
-       return ret;
-}
-
  /*
    compare two utc time values. 1 second resolution
  */
-static int ldb_comparison_utctime(struct ldb_context *ldb, void *mem_ctx,
+int ldb_comparison_utctime(struct ldb_context *ldb, void *mem_ctx,
                                   const struct ldb_val *v1, const struct ldb_val *v2)
  {
         time_t t1, t2;
@@ -272,7 +299,7 @@ static int ldb_comparison_utctime(struct ldb_context *ldb, void *mem_ctx,
  /*
    canonicalise a utc time
  */
-static int ldb_canonicalise_utctime(struct ldb_context *ldb, void *mem_ctx,
+int ldb_canonicalise_utctime(struct ldb_context *ldb, void *mem_ctx,
                                     const struct ldb_val *in, struct ldb_val *out)
  {
         time_t t = ldb_string_to_time((char *)in->data);
@@ -287,50 +314,44 @@ static int ldb_canonicalise_utctime(struct ldb_context *ldb, void *mem_ctx,
  /*
    table of standard attribute handlers
  */
-static const struct ldb_attrib_handler ldb_standard_attribs[] = {
+static const struct ldb_schema_syntax ldb_standard_syntaxes[] = {
         { 
-               .attr            = LDB_SYNTAX_INTEGER,
-               .flags           = 0,
+               .name            = LDB_SYNTAX_INTEGER,
                 .ldif_read_fn    = ldb_handler_copy,
                 .ldif_write_fn   = ldb_handler_copy,
                 .canonicalise_fn = ldb_canonicalise_Integer,
                 .comparison_fn   = ldb_comparison_Integer
         },
         { 
-               .attr            = LDB_SYNTAX_OCTET_STRING,
-               .flags           = 0,
+               .name            = LDB_SYNTAX_OCTET_STRING,
                 .ldif_read_fn    = ldb_handler_copy,
                 .ldif_write_fn   = ldb_handler_copy,
                 .canonicalise_fn = ldb_handler_copy,
                 .comparison_fn   = ldb_comparison_binary
         },
         { 
-               .attr            = LDB_SYNTAX_DIRECTORY_STRING,
-               .flags           = 0,
+               .name            = LDB_SYNTAX_DIRECTORY_STRING,
                 .ldif_read_fn    = ldb_handler_copy,
                 .ldif_write_fn   = ldb_handler_copy,
                 .canonicalise_fn = ldb_handler_fold,
                 .comparison_fn   = ldb_comparison_fold
         },
         { 
-               .attr            = LDB_SYNTAX_DN,
-               .flags           = 0,
+               .name            = LDB_SYNTAX_DN,
                 .ldif_read_fn    = ldb_handler_copy,
                 .ldif_write_fn   = ldb_handler_copy,
                 .canonicalise_fn = ldb_canonicalise_dn,
                 .comparison_fn   = ldb_comparison_dn
         },
         { 
-               .attr            = LDB_SYNTAX_OBJECTCLASS,
-               .flags           = 0,
+               .name            = LDB_SYNTAX_OBJECTCLASS,
                 .ldif_read_fn    = ldb_handler_copy,
                 .ldif_write_fn   = ldb_handler_copy,
                 .canonicalise_fn = ldb_handler_fold,
-               .comparison_fn   = ldb_comparison_objectclass
+               .comparison_fn   = ldb_comparison_fold
         },
         { 
-               .attr            = LDB_SYNTAX_UTC_TIME,
-               .flags           = 0,
+               .name            = LDB_SYNTAX_UTC_TIME,
                 .ldif_read_fn    = ldb_handler_copy,
                 .ldif_write_fn   = ldb_handler_copy,
                 .canonicalise_fn = ldb_canonicalise_utctime,
@@ -342,17 +363,16 @@ static const struct ldb_attrib_handler ldb_standard_attribs[] = {
  /*
    return the attribute handlers for a given syntax name
  */
-const struct ldb_attrib_handler *ldb_attrib_handler_syntax(struct ldb_context *ldb,
-                                                          const char *syntax)
+const struct ldb_schema_syntax *ldb_standard_syntax_by_name(struct ldb_context *ldb,
+                                                           const char *syntax)
  {
         int i;
-       unsigned num_handlers = sizeof(ldb_standard_attribs)/sizeof(ldb_standard_attribs[0]);
+       unsigned num_handlers = sizeof(ldb_standard_syntaxes)/sizeof(ldb_standard_syntaxes[0]);
         /* TODO: should be replaced with a binary search */
         for (i=0;i<num_handlers;i++) {
-               if (strcmp(ldb_standard_attribs[i].attr, syntax) == 0) {
-                       return &ldb_standard_attribs[i];
+               if (strcmp(ldb_standard_syntaxes[i].name, syntax) == 0) {
+                       return &ldb_standard_syntaxes[i];
                 }
         }
         return NULL;
  }
-