/*
 * git.sur5r.net Git - openldap/blob - servers/slapd/tools/sizecount.c
 * Initial revision
 * [openldap] / servers / slapd / tools / sizecount.c
 */
#include <stdio.h>
#include <stdlib.h>
#include <string.h>
#include <strings.h>
#include <unistd.h>
#include <ldbm.h>
#include <lber.h>
#include <ldap.h>
#include "portable.h"
6
7 #define CACHE_SIZE      1000000
8 #define MODE            0600
9 #define DB_FLAGS        (LDBM_WRCREAT|LDBM_NEWDB)
10 #define SUBLEN          3
11
12 extern char     *first_word();
13 extern char     *next_word();
14 extern char     *word_dup();
15 extern char     *phonetic();
16
17 extern int ldap_debug;
18 extern int lber_debug;
19
20 int     ldap_syslog;
21 int     ldap_syslog_level;
22
23 static void     add();
24
25 main( argc, argv )
26     int         argc;
27     char        **argv;
28 {
29         LDAP                    *ld;
30         LDAPMessage             *res, *e;
31         int                             i, j, k, count, len, nentries;
32         int                             vcount, wcount, pcount, scount;
33         int                             vsize, wsize, psize, ssize;
34         struct berval   **bvals;
35         char                    **vals;
36         char                    *dn, *p, *val;
37         char                    buf[SUBLEN+1];
38         LDBM                    wldbm, pldbm, sldbm;
39         static char             *attrs[] = { "cn", "nentries", NULL };
40
41 /*
42         ldap_debug = 255;
43         lber_debug = 255;
44 */
45         if ( (ld = ldap_open( "vertigo:5555", LDAP_PORT )) == NULL ) {
46                 perror( "ldap_open" );
47                 exit( 1 );
48         }
49
50         if ( ldap_search( ld, "cn=index", LDAP_SCOPE_ONELEVEL, "(objectclass=*)",
51           attrs, 0 ) == -1 ) {
52                 ldap_perror( ld, "ldap_search" );
53                 exit( 1 );
54         }
55
56         printf( "attr\tdn\tnentries\tvcount\tvsize\twcount\twsize\tpcount\tpsize\tscount\tssize\n" );
57         fflush( stdout );
58         count = 0;
59         while ( ldap_result( ld, LDAP_RES_ANY, 0, NULL, &res )
60           == LDAP_RES_SEARCH_ENTRY ) {
61                 count++;
62                 e = ldap_first_entry( ld, res );
63                 dn = ldap_get_dn( ld, e );
64                 if ( (vals = ldap_get_values( ld, e, "nentries" )) != NULL ) {
65                         nentries = atoi( vals[0] );
66                         ldap_value_free( vals );
67                 } else {
68                         fprintf( stderr, "no nentries attribute for (%s)\n", dn );
69                         nentries = -1;
70                 }
71
72                 for ( i = 0; attrs[i] != NULL; i++ ) {
73                         if ( strcasecmp( attrs[i], "nentries" ) == 0 ) {
74                                 continue;
75                         }
76                         if ( (wldbm = ldbm_open( "wcount.ldbm", DB_FLAGS, MODE,
77                           CACHE_SIZE )) == NULL || (pldbm = ldbm_open( "pcount.ldbm",
78                           DB_FLAGS, MODE, CACHE_SIZE )) == NULL || (sldbm = ldbm_open(
79                           "scount.ldbm", DB_FLAGS, MODE, CACHE_SIZE )) == NULL ) {
80                                 perror( "ldbm_open" );
81                                 exit( 1 );
82                         }
83                         vcount = 0; vsize = 0;
84                         wcount = 0; wsize = 0;
85                         pcount = 0; psize = 0;
86                         scount = 0; ssize = 0;
87                         if ( (bvals = ldap_get_values_len( ld, e, attrs[i] )) != NULL ) {
88                                 for ( j = 0; bvals[j] != NULL; j++ ) {
89                                         Datum   key, data;
90                                         char    *w;
91
92                                         /* update value count */
93                                         vcount++;
94                                         vsize += bvals[j]->bv_len;
95
96                                         /* update word and phoneme counts */
97                                         for ( w = first_word( bvals[j]->bv_val ); w != NULL;
98                                           w = next_word( w ) ) {
99                                                 add( wldbm, word_dup( w ), &wcount, &wsize, 1 );
100
101                                                 add( pldbm, phonetic( w ), &pcount, &psize, 1 );
102                                         }
103
104                                         /* update substring count */
105                                         len = bvals[j]->bv_len;
106                                         val = bvals[j]->bv_val;
107                                         if ( len > SUBLEN - 2 ) {
108                                                 buf[0] = '^';
109                                                 for ( k = 0; k < SUBLEN - 1; k++ ) {
110                                                         buf[k + 1] = val[k];
111                                                 }
112                                                 buf[SUBLEN] = '\0';
113                                                 add( sldbm, buf, &scount, &ssize, 0 );
114
115                                                 p = val + len - SUBLEN + 1;
116                                                 for ( k = 0; k < SUBLEN; k++ ) {
117                                                         buf[k] = p[k];
118                                                 }
119                                                 buf[SUBLEN - 1] = '$';
120                                                 buf[SUBLEN] = '\0';
121                                                 add( sldbm, buf, &scount, &ssize, 0 );
122                                         }
123                                         for ( p = val; p < (val + len - SUBLEN + 1); p++ ) {
124                                                 for ( k = 0; k < SUBLEN; k++ ) {
125                                                         buf[k] = p[k];
126                                                 }
127                                                 buf[SUBLEN] = '\0';
128                                                 add( sldbm, buf, &scount, &ssize, 0 );
129                                         }
130                                 }
131                                 ldap_value_free_len( bvals );
132                         }
133                         printf( "%s\t%s\t%d", attrs[i], dn, nentries );
134                         printf( "\t%d\t%d", vcount, vsize );
135                         printf( "\t%d\t%d", wcount, wsize );
136                         printf( "\t%d\t%d", pcount, psize );
137                         printf( "\t%d\t%d\n", scount, ssize );
138                         fflush( stdout );
139
140                         ldbm_close( wldbm );
141                         ldbm_close( pldbm );
142                         ldbm_close( sldbm );
143                 }
144
145                 free( dn );
146                 ldap_msgfree( res );
147         }
148         printf( "%d entries\n", count );
149         fflush( stdout );
150
151         if ( ldap_result2error( ld, res, 1 ) != LDAP_SUCCESS ) {
152                 ldap_perror( ld, "ldap_result" );
153         }
154         ldap_unbind( ld );
155
156         (void) unlink( "wcount.ldbm" );
157         (void) unlink( "pcount.ldbm" );
158         (void) unlink( "scount.ldbm" );
159
160         exit( 0 );
161 }
162
163 static void
164 add(
165     LDBM        ldbm,
166     char        *s,
167     int         *count,
168     int         *size,
169     int         freeit
170 )
171 {
172         Datum   key, data;
173
174         key.dptr = s;
175         key.dsize = strlen( key.dptr ) + 1;
176         data.dptr = "";
177         data.dsize = 0;
178         if ( ldbm_store( ldbm, key, data, LDBM_INSERT ) == 0 ) {
179                 (*count)++;
180                 (*size) += strlen( key.dptr );
181         }
182         if ( freeit )
183                 ldbm_datum_free( ldbm, key );
184 }