]> git.sur5r.net Git - openldap/blob - servers/slapd/tools/sizecount.c
Very crude LDIF changes:
[openldap] / servers / slapd / tools / sizecount.c
1 #include "portable.h"
2
3 #include <stdio.h>
4
5 #include <ac/stdlib.h>
6 #include <ac/string.h>
7 #include <ac/unistd.h>
8
9 #include <ldbm.h>
10 #include <lber.h>
11 #include <ldap.h>
12 #include "portable.h"
13
/*
 * Parameters used by main() for every ldbm_open() call:
 * CACHE_SIZE is passed as the cache-size argument, MODE as the file
 * mode and DB_FLAGS as the open flags.
 */
14 #define CACHE_SIZE      1000000
15 #define MODE            0600
16 #define DB_FLAGS        (LDBM_WRCREAT|LDBM_NEWDB)
/* Length, in characters, of each substring key that main() builds. */
17 #define SUBLEN          3
18
/*
 * Word helpers defined elsewhere.  main() walks a value with
 * first_word()/next_word() and stores word_dup() and phonetic() of each
 * word it visits.
 * NOTE(review): main() passes both results to add() with freeit set, so
 * they are presumably heap-allocated -- confirm against their definitions.
 */
19 extern char     *first_word(char *);
20 extern char     *next_word(char *);
21 extern char     *word_dup(char *);
22 extern char     *phonetic(char *);
23
/* Debug levels defined elsewhere; only mentioned in main()'s commented-out code. */
24 extern int ldap_debug;
25 extern int lber_debug;
26
/*
 * Defined here but not referenced anywhere else in this file.
 * NOTE(review): presumably needed to satisfy references from the
 * libraries this tool links against -- confirm.
 */
27 int     ldap_syslog;
28 int     ldap_syslog_level;
29
/* Forward declaration; the definition follows main(). */
30 static void     add(LDBM ldbm, char *s, int *count, int *size, int freeit);
31
32 int
33 main( int argc, char **argv )
34 {
35         LDAP                    *ld;
36         LDAPMessage             *res, *e;
37         int                             i, j, k, count, len, nentries;
38         int                             vcount, wcount, pcount, scount;
39         int                             vsize, wsize, psize, ssize;
40         struct berval   **bvals;
41         char                    **vals;
42         char                    *dn, *p, *val;
43         char                    buf[SUBLEN+1];
44         LDBM                    wldbm, pldbm, sldbm;
45         static char             *attrs[] = { "cn", "nentries", NULL };
46
47 /*
48         ldap_debug = 255;
49         lber_debug = 255;
50 */
51         if ( (ld = ldap_init( "vertigo:5555", 0 )) == NULL ) {
52                 perror( "ldap_init" );
53                 exit( 1 );
54         }
55
56         if ( ldap_search( ld, "cn=index", LDAP_SCOPE_ONELEVEL, "(objectclass=*)",
57           attrs, 0 ) == -1 ) {
58                 ldap_perror( ld, "ldap_search" );
59                 exit( 1 );
60         }
61
62         printf( "attr\tdn\tnentries\tvcount\tvsize\twcount\twsize\tpcount\tpsize\tscount\tssize\n" );
63         fflush( stdout );
64         count = 0;
65         while ( ldap_result( ld, LDAP_RES_ANY, 0, NULL, &res )
66           == LDAP_RES_SEARCH_ENTRY ) {
67                 count++;
68                 e = ldap_first_entry( ld, res );
69                 dn = ldap_get_dn( ld, e );
70                 if ( (vals = ldap_get_values( ld, e, "nentries" )) != NULL ) {
71                         nentries = atoi( vals[0] );
72                         ldap_value_free( vals );
73                 } else {
74                         fprintf( stderr, "no nentries attribute for (%s)\n", dn );
75                         nentries = -1;
76                 }
77
78                 for ( i = 0; attrs[i] != NULL; i++ ) {
79                         if ( strcasecmp( attrs[i], "nentries" ) == 0 ) {
80                                 continue;
81                         }
82                         if ( (wldbm = ldbm_open( "wcount.ldbm", DB_FLAGS, MODE,
83                           CACHE_SIZE )) == NULL || (pldbm = ldbm_open( "pcount.ldbm",
84                           DB_FLAGS, MODE, CACHE_SIZE )) == NULL || (sldbm = ldbm_open(
85                           "scount.ldbm", DB_FLAGS, MODE, CACHE_SIZE )) == NULL ) {
86                                 perror( "ldbm_open" );
87                                 exit( 1 );
88                         }
89                         vcount = 0; vsize = 0;
90                         wcount = 0; wsize = 0;
91                         pcount = 0; psize = 0;
92                         scount = 0; ssize = 0;
93                         if ( (bvals = ldap_get_values_len( ld, e, attrs[i] )) != NULL ) {
94                                 for ( j = 0; bvals[j] != NULL; j++ ) {
95                                         Datum   key, data;
96                                         char    *w;
97
98                                         ldbm_datum_init( key );
99                                         ldbm_datum_init( data );
100
101                                         /* update value count */
102                                         vcount++;
103                                         vsize += bvals[j]->bv_len;
104
105                                         /* update word and phoneme counts */
106                                         for ( w = first_word( bvals[j]->bv_val ); w != NULL;
107                                           w = next_word( w ) ) {
108                                                 add( wldbm, word_dup( w ), &wcount, &wsize, 1 );
109
110                                                 add( pldbm, phonetic( w ), &pcount, &psize, 1 );
111                                         }
112
113                                         /* update substring count */
114                                         len = bvals[j]->bv_len;
115                                         val = bvals[j]->bv_val;
116                                         if ( len > SUBLEN - 2 ) {
117                                                 buf[0] = '^';
118                                                 for ( k = 0; k < SUBLEN - 1; k++ ) {
119                                                         buf[k + 1] = val[k];
120                                                 }
121                                                 buf[SUBLEN] = '\0';
122                                                 add( sldbm, buf, &scount, &ssize, 0 );
123
124                                                 p = val + len - SUBLEN + 1;
125                                                 for ( k = 0; k < SUBLEN; k++ ) {
126                                                         buf[k] = p[k];
127                                                 }
128                                                 buf[SUBLEN - 1] = '$';
129                                                 buf[SUBLEN] = '\0';
130                                                 add( sldbm, buf, &scount, &ssize, 0 );
131                                         }
132                                         for ( p = val; p < (val + len - SUBLEN + 1); p++ ) {
133                                                 for ( k = 0; k < SUBLEN; k++ ) {
134                                                         buf[k] = p[k];
135                                                 }
136                                                 buf[SUBLEN] = '\0';
137                                                 add( sldbm, buf, &scount, &ssize, 0 );
138                                         }
139                                 }
140                                 ldap_value_free_len( bvals );
141                         }
142                         printf( "%s\t%s\t%d", attrs[i], dn, nentries );
143                         printf( "\t%d\t%d", vcount, vsize );
144                         printf( "\t%d\t%d", wcount, wsize );
145                         printf( "\t%d\t%d", pcount, psize );
146                         printf( "\t%d\t%d\n", scount, ssize );
147                         fflush( stdout );
148
149                         ldbm_close( wldbm );
150                         ldbm_close( pldbm );
151                         ldbm_close( sldbm );
152                 }
153
154                 free( dn );
155                 ldap_msgfree( res );
156         }
157         printf( "%d entries\n", count );
158         fflush( stdout );
159
160         if ( ldap_result2error( ld, res, 1 ) != LDAP_SUCCESS ) {
161                 ldap_perror( ld, "ldap_result" );
162         }
163         ldap_unbind( ld );
164
165         (void) unlink( "wcount.ldbm" );
166         (void) unlink( "pcount.ldbm" );
167         (void) unlink( "scount.ldbm" );
168
169         exit( 0 );
170 }
171
172 static void
173 add(
174     LDBM        ldbm,
175     char        *s,
176     int         *count,
177     int         *size,
178     int         freeit
179 )
180 {
181         Datum   key, data;
182
183         ldbm_datum_init( key );
184         ldbm_datum_init( data );
185
186         key.dptr = s;
187         key.dsize = strlen( key.dptr ) + 1;
188         data.dptr = "";
189         data.dsize = 0;
190         if ( ldbm_store( ldbm, key, data, LDBM_INSERT ) == 0 ) {
191                 (*count)++;
192                 (*size) += strlen( key.dptr );
193         }
194         if ( freeit && ( key.dptr != NULL ) )
195                 ldbm_datum_free( ldbm, key );
196 }