diff options
Diffstat (limited to 'utility')
-rw-r--r-- | utility/Makefile.in | 49 | ||||
-rw-r--r-- | utility/ap_pcre.c | 344 | ||||
-rw-r--r-- | utility/ap_pcre.h | 178 | ||||
-rw-r--r-- | utility/config.c | 534 | ||||
-rw-r--r-- | utility/config.h | 190 | ||||
-rw-r--r-- | utility/database.c | 212 | ||||
-rw-r--r-- | utility/database.h | 25 | ||||
-rw-r--r-- | utility/logparse.c | 768 | ||||
-rw-r--r-- | utility/logparse.h | 37 | ||||
-rw-r--r-- | utility/mod_log_sql.conf | 70 | ||||
-rw-r--r-- | utility/shell.c | 342 | ||||
-rw-r--r-- | utility/shell.h | 0 | ||||
-rw-r--r-- | utility/util.c | 189 | ||||
-rw-r--r-- | utility/util.h | 26 |
14 files changed, 2964 insertions, 0 deletions
diff --git a/utility/Makefile.in b/utility/Makefile.in new file mode 100644 index 0000000..fdc3846 --- /dev/null +++ b/utility/Makefile.in | |||
@@ -0,0 +1,49 @@ | |||
1 | # @configure_input@ | ||
2 | |||
3 | top_srcdir = @top_srcdir@ | ||
4 | srcdir = @abs_srcdir@ | ||
5 | top_builddir = @top_builddir@ | ||
6 | builddir = @abs_builddir@ | ||
7 | |||
8 | LIBTOOL=@LIBTOOL@ | ||
9 | CFLAGS = -g3 -Wall -fno-strict-aliasing \ | ||
10 | @APR_INCLUDES@ @APU_INCLUDES@ @PCRE_CFLAGS@ \ | ||
11 | -I$(top_srcdir)/include | ||
12 | CPPFLAGS = @APR_CPPFLAGS@ | ||
13 | LDFLAGS = @APR_LIBTOOL@ @APU_LIBTOOL@ @PCRE_LIBS@ | ||
14 | |||
15 | ifeq (@OOO_MAINTAIN@,1) | ||
16 | CFLAGS += -Werror | ||
17 | endif | ||
18 | |||
19 | STD_DIST = Makefile.in | ||
20 | |||
21 | DISTFILES = $(STD_DIST) $(EXTRA_DIST) $(SOURCES) $(HEADERS) | ||
22 | |||
23 | SOURCES = shell.c config.c logparse.c ap_pcre.c util.c database.c | ||
24 | HEADERS = shell.h config.h logparse.h ap_pcre.h util.h database.h | ||
25 | OBJECTS = $(SOURCES:.c=.o) | ||
26 | DEPS = $(SOURCES:.c=.d) | ||
27 | TARGETS = mod_log_sql | ||
28 | |||
29 | all: $(TARGETS) | ||
30 | |||
31 | mod_log_sql: $(OBJECTS) $(HEADERS) | ||
32 | $(LIBTOOL) --tag=CC --mode=link $(CC) -o $@ $(OBJECTS) $(LDFLAGS) | ||
33 | |||
34 | %.o: %.c %.d | ||
35 | gcc -c $(CFLAGS) $(CPPFLAGS) $< -o $@ | ||
36 | %.d: %.c | ||
37 | gcc -MM $(CFLAGS) $(CPPFLAGS) $< -o $@ | ||
38 | |||
39 | -include $(DEPS) | ||
40 | |||
41 | clean: | ||
42 | $(RM) $(OBJECTS) $(TARGETS) $(DEPS) | ||
43 | |||
44 | local-dist: $(DISTFILES) | ||
45 | mkdir -p $(DESTDIR) | ||
46 | cp -dp --parents $(DISTFILES) $(DESTDIR) | ||
47 | |||
48 | Makefile: Makefile.in ../config.status | ||
49 | cd .. && ./config.status | ||
diff --git a/utility/ap_pcre.c b/utility/ap_pcre.c new file mode 100644 index 0000000..b2b9767 --- /dev/null +++ b/utility/ap_pcre.c | |||
@@ -0,0 +1,344 @@ | |||
1 | /************************************************* | ||
2 | * Perl-Compatible Regular Expressions * | ||
3 | *************************************************/ | ||
4 | |||
5 | /* | ||
6 | This is a library of functions to support regular expressions whose syntax | ||
7 | and semantics are as close as possible to those of the Perl 5 language. See | ||
8 | the file Tech.Notes for some information on the internals. | ||
9 | |||
10 | This module is a wrapper that provides a POSIX API to the underlying PCRE | ||
11 | functions. | ||
12 | |||
13 | Written by: Philip Hazel <ph10@cam.ac.uk> | ||
14 | |||
15 | Copyright (c) 1997-2004 University of Cambridge | ||
16 | |||
17 | ----------------------------------------------------------------------------- | ||
18 | Redistribution and use in source and binary forms, with or without | ||
19 | modification, are permitted provided that the following conditions are met: | ||
20 | |||
21 | * Redistributions of source code must retain the above copyright notice, | ||
22 | this list of conditions and the following disclaimer. | ||
23 | |||
24 | * Redistributions in binary form must reproduce the above copyright | ||
25 | notice, this list of conditions and the following disclaimer in the | ||
26 | documentation and/or other materials provided with the distribution. | ||
27 | |||
28 | * Neither the name of the University of Cambridge nor the names of its | ||
29 | contributors may be used to endorse or promote products derived from | ||
30 | this software without specific prior written permission. | ||
31 | |||
32 | THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND CONTRIBUTORS "AS IS" | ||
33 | AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE | ||
34 | IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE | ||
35 | ARE DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT OWNER OR CONTRIBUTORS BE | ||
36 | LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR | ||
37 | CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF | ||
38 | SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS | ||
39 | INTERRUPTION) HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN | ||
40 | CONTRACT, STRICT LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) | ||
41 | ARISING IN ANY WAY OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE | ||
42 | POSSIBILITY OF SUCH DAMAGE. | ||
43 | ----------------------------------------------------------------------------- | ||
44 | */ | ||
45 | |||
46 | #include "apr_lib.h" | ||
47 | #include "apr_strings.h" | ||
48 | #include "ap_pcre.h" | ||
49 | #include "pcre.h" | ||
50 | |||
51 | #define APR_WANT_STRFUNC | ||
52 | #include "apr_want.h" | ||
53 | |||
54 | #ifndef POSIX_MALLOC_THRESHOLD | ||
55 | #define POSIX_MALLOC_THRESHOLD (10) | ||
56 | #endif | ||
57 | |||
58 | /* Table of error strings corresponding to POSIX error codes; must be | ||
59 | * kept in synch with include/ap_regex.h's AP_REG_E* definitions. */ | ||
60 | |||
61 | static const char *const pstring[] = { | ||
62 | "", /* Dummy for value 0 */ | ||
63 | "internal error", /* AP_REG_ASSERT */ | ||
64 | "failed to get memory", /* AP_REG_ESPACE */ | ||
65 | "bad argument", /* AP_REG_INVARG */ | ||
66 | "match failed" /* AP_REG_NOMATCH */ | ||
67 | }; | ||
68 | |||
69 | apr_size_t ap_regerror(int errcode, const ap_regex_t *preg, char *errbuf, | ||
70 | apr_size_t errbuf_size) | ||
71 | { | ||
72 | const char *message, *addmessage; | ||
73 | apr_size_t length, addlength; | ||
74 | |||
75 | message | ||
76 | = (errcode >= (int)(sizeof(pstring)/sizeof(char *))) ? "unknown error code" | ||
77 | : pstring[errcode]; | ||
78 | length = strlen(message) + 1; | ||
79 | |||
80 | addmessage = " at offset "; | ||
81 | addlength | ||
82 | = (preg != NULL && (int)preg->re_erroffset != -1) ? strlen(addmessage) | ||
83 | + 6 | ||
84 | : 0; | ||
85 | |||
86 | if (errbuf_size > 0) { | ||
87 | if (addlength > 0 && errbuf_size >= length + addlength) | ||
88 | apr_snprintf(errbuf, sizeof errbuf, "%s%s%-6d", message, | ||
89 | addmessage, (int)preg->re_erroffset); | ||
90 | else { | ||
91 | strncpy(errbuf, message, errbuf_size - 1); | ||
92 | errbuf[errbuf_size-1] = 0; | ||
93 | } | ||
94 | } | ||
95 | |||
96 | return length + addlength; | ||
97 | } | ||
98 | |||
99 | /************************************************* | ||
100 | * Free store held by a regex * | ||
101 | *************************************************/ | ||
102 | |||
103 | void ap_regfree(ap_regex_t *preg) | ||
104 | { | ||
105 | (pcre_free)(preg->re_pcre); | ||
106 | } | ||
107 | |||
108 | /************************************************* | ||
109 | * Compile a regular expression * | ||
110 | *************************************************/ | ||
111 | |||
112 | /* | ||
113 | Arguments: | ||
114 | preg points to a structure for recording the compiled expression | ||
115 | pattern the pattern to compile | ||
116 | cflags compilation flags | ||
117 | |||
118 | Returns: 0 on success | ||
119 | various non-zero codes on failure | ||
120 | */ | ||
121 | |||
122 | int ap_regcomp(ap_regex_t *preg, const char *pattern, int cflags) | ||
123 | { | ||
124 | const char *errorptr; | ||
125 | int erroffset; | ||
126 | int options = 0; | ||
127 | |||
128 | if ((cflags & AP_REG_ICASE) != 0) | ||
129 | options |= PCRE_CASELESS; | ||
130 | if ((cflags & AP_REG_NEWLINE) != 0) | ||
131 | options |= PCRE_MULTILINE; | ||
132 | |||
133 | preg->re_pcre = pcre_compile(pattern, options, &errorptr, &erroffset, NULL); | ||
134 | preg->re_erroffset = erroffset; | ||
135 | |||
136 | if (preg->re_pcre == NULL) | ||
137 | return AP_REG_INVARG; | ||
138 | |||
139 | preg->re_nsub = pcre_info((const pcre *)preg->re_pcre, NULL, NULL); | ||
140 | return 0; | ||
141 | } | ||
142 | |||
143 | /************************************************* | ||
144 | * Match a regular expression * | ||
145 | *************************************************/ | ||
146 | |||
147 | /* Unfortunately, PCRE requires 3 ints of working space for each captured | ||
148 | substring, so we have to get and release working store instead of just using | ||
149 | the POSIX structures as was done in earlier releases when PCRE needed only 2 | ||
150 | ints. However, if the number of possible capturing brackets is small, use a | ||
151 | block of store on the stack, to reduce the use of malloc/free. The threshold is | ||
152 | in a macro that can be changed at configure time. */ | ||
153 | |||
154 | int ap_regexec(const ap_regex_t *preg, const char *string, apr_size_t nmatch, | ||
155 | ap_regmatch_t pmatch[], int eflags) | ||
156 | { | ||
157 | int rc; | ||
158 | int options = 0; | ||
159 | int *ovector= NULL; | ||
160 | int small_ovector[POSIX_MALLOC_THRESHOLD * 3]; | ||
161 | int allocated_ovector = 0; | ||
162 | |||
163 | if ((eflags & AP_REG_NOTBOL) != 0) | ||
164 | options |= PCRE_NOTBOL; | ||
165 | if ((eflags & AP_REG_NOTEOL) != 0) | ||
166 | options |= PCRE_NOTEOL; | ||
167 | |||
168 | ((ap_regex_t *)preg)->re_erroffset = (apr_size_t)(-1); /* Only has meaning after compile */ | ||
169 | |||
170 | if (nmatch > 0) { | ||
171 | if (nmatch <= POSIX_MALLOC_THRESHOLD) { | ||
172 | ovector = &(small_ovector[0]); | ||
173 | } else { | ||
174 | ovector = (int *)malloc(sizeof(int) * nmatch * 3); | ||
175 | if (ovector == NULL) | ||
176 | return AP_REG_ESPACE; | ||
177 | allocated_ovector = 1; | ||
178 | } | ||
179 | } | ||
180 | |||
181 | rc = pcre_exec((const pcre *)preg->re_pcre, NULL, string, | ||
182 | (int)strlen(string), 0, options, ovector, nmatch * 3); | ||
183 | |||
184 | if (rc == 0) | ||
185 | rc = nmatch; /* All captured slots were filled in */ | ||
186 | |||
187 | if (rc >= 0) { | ||
188 | apr_size_t i; | ||
189 | for (i = 0; i < (apr_size_t)rc; i++) { | ||
190 | pmatch[i].rm_so = ovector[i*2]; | ||
191 | pmatch[i].rm_eo = ovector[i*2+1]; | ||
192 | } | ||
193 | if (allocated_ovector) | ||
194 | free(ovector); | ||
195 | for (; i < nmatch; i++) | ||
196 | pmatch[i].rm_so = pmatch[i].rm_eo = -1; | ||
197 | return 0; | ||
198 | } | ||
199 | |||
200 | else { | ||
201 | if (allocated_ovector) | ||
202 | free(ovector); | ||
203 | switch (rc) { | ||
204 | case PCRE_ERROR_NOMATCH: | ||
205 | return AP_REG_NOMATCH; | ||
206 | case PCRE_ERROR_NULL: | ||
207 | return AP_REG_INVARG; | ||
208 | case PCRE_ERROR_BADOPTION: | ||
209 | return AP_REG_INVARG; | ||
210 | case PCRE_ERROR_BADMAGIC: | ||
211 | return AP_REG_INVARG; | ||
212 | case PCRE_ERROR_UNKNOWN_NODE: | ||
213 | return AP_REG_ASSERT; | ||
214 | case PCRE_ERROR_NOMEMORY: | ||
215 | return AP_REG_ESPACE; | ||
216 | #ifdef PCRE_ERROR_MATCHLIMIT | ||
217 | case PCRE_ERROR_MATCHLIMIT: return AP_REG_ESPACE; | ||
218 | #endif | ||
219 | #ifdef PCRE_ERROR_BADUTF8 | ||
220 | case PCRE_ERROR_BADUTF8: return AP_REG_INVARG; | ||
221 | #endif | ||
222 | #ifdef PCRE_ERROR_BADUTF8_OFFSET | ||
223 | case PCRE_ERROR_BADUTF8_OFFSET: return AP_REG_INVARG; | ||
224 | #endif | ||
225 | default: | ||
226 | return AP_REG_ASSERT; | ||
227 | } | ||
228 | } | ||
229 | } | ||
230 | |||
231 | /* | ||
232 | * Here's a pool-based interface to the POSIX-esque ap_regcomp(). | ||
233 | * Note that we return ap_regex_t instead of being passed one. | ||
234 | * The reason is that if you use an already-used ap_regex_t structure, | ||
235 | * the memory that you've already allocated gets forgotten, and | ||
236 | * regfree() doesn't clear it. So we don't allow it. | ||
237 | */ | ||
238 | |||
239 | static apr_status_t regex_cleanup(void *preg) | ||
240 | { | ||
241 | ap_regfree((ap_regex_t *) preg); | ||
242 | return APR_SUCCESS; | ||
243 | } | ||
244 | |||
245 | ap_regex_t *ap_pregcomp(apr_pool_t *p, const char *pattern, int cflags) | ||
246 | { | ||
247 | ap_regex_t *preg = apr_palloc(p, sizeof *preg); | ||
248 | |||
249 | if (ap_regcomp(preg, pattern, cflags)) { | ||
250 | return NULL; | ||
251 | } | ||
252 | |||
253 | apr_pool_cleanup_register(p, (void *) preg, regex_cleanup, | ||
254 | apr_pool_cleanup_null); | ||
255 | |||
256 | return preg; | ||
257 | } | ||
258 | |||
259 | void ap_pregfree(apr_pool_t *p, ap_regex_t *reg) | ||
260 | { | ||
261 | ap_regfree(reg); | ||
262 | apr_pool_cleanup_kill(p, (void *) reg, regex_cleanup); | ||
263 | } | ||
264 | |||
265 | /* This function substitutes for $0-$9, filling in regular expression | ||
266 | * submatches. Pass it the same nmatch and pmatch arguments that you | ||
267 | * passed ap_regexec(). pmatch should not be greater than the maximum number | ||
268 | * of subexpressions - i.e. one more than the re_nsub member of ap_regex_t. | ||
269 | * | ||
270 | * input should be the string with the $-expressions, source should be the | ||
271 | * string that was matched against. | ||
272 | * | ||
273 | * It returns the substituted string, or NULL on error. | ||
274 | * | ||
275 | * Parts of this code are based on Henry Spencer's regsub(), from his | ||
276 | * AT&T V8 regexp package. | ||
277 | */ | ||
278 | |||
279 | char * ap_pregsub(apr_pool_t *p, const char *input, const char *source, | ||
280 | size_t nmatch, ap_regmatch_t pmatch[]) | ||
281 | { | ||
282 | const char *src = input; | ||
283 | char *dest, *dst; | ||
284 | char c; | ||
285 | size_t no; | ||
286 | int len; | ||
287 | |||
288 | if (!source) | ||
289 | return NULL; | ||
290 | if (!nmatch) | ||
291 | return apr_pstrdup(p, src); | ||
292 | |||
293 | /* First pass, find the size */ | ||
294 | |||
295 | len = 0; | ||
296 | |||
297 | while ((c = *src++) != '\0') { | ||
298 | if (c == '&') | ||
299 | no = 0; | ||
300 | else if (c == '$' && apr_isdigit(*src)) | ||
301 | no = *src++ - '0'; | ||
302 | else | ||
303 | no = 10; | ||
304 | |||
305 | if (no> 9) { /* Ordinary character. */ | ||
306 | if (c == '\\' && (*src == '$' || *src == '&')) | ||
307 | c = *src++; | ||
308 | len++; | ||
309 | } else if (no < nmatch && pmatch[no].rm_so < pmatch[no].rm_eo) { | ||
310 | len += pmatch[no].rm_eo - pmatch[no].rm_so; | ||
311 | } | ||
312 | |||
313 | } | ||
314 | |||
315 | dest = dst = apr_pcalloc(p, len + 1); | ||
316 | |||
317 | /* Now actually fill in the string */ | ||
318 | |||
319 | src = input; | ||
320 | |||
321 | while ((c = *src++) != '\0') { | ||
322 | if (c == '&') | ||
323 | no = 0; | ||
324 | else if (c == '$' && apr_isdigit(*src)) | ||
325 | no = *src++ - '0'; | ||
326 | else | ||
327 | no = 10; | ||
328 | |||
329 | if (no> 9) { /* Ordinary character. */ | ||
330 | if (c == '\\' && (*src == '$' || *src == '&')) | ||
331 | c = *src++; | ||
332 | *dst++ = c; | ||
333 | } else if (no < nmatch && pmatch[no].rm_so < pmatch[no].rm_eo) { | ||
334 | len = pmatch[no].rm_eo - pmatch[no].rm_so; | ||
335 | memcpy(dst, source + pmatch[no].rm_so, len); | ||
336 | dst += len; | ||
337 | } | ||
338 | |||
339 | } | ||
340 | *dst = '\0'; | ||
341 | |||
342 | return dest; | ||
343 | } | ||
344 | /* End of pcreposix.c */ | ||
diff --git a/utility/ap_pcre.h b/utility/ap_pcre.h new file mode 100644 index 0000000..e817dc2 --- /dev/null +++ b/utility/ap_pcre.h | |||
@@ -0,0 +1,178 @@ | |||
1 | /* Licensed to the Apache Software Foundation (ASF) under one or more | ||
2 | * contributor license agreements. See the NOTICE file distributed with | ||
3 | * this work for additional information regarding copyright ownership. | ||
4 | * The ASF licenses this file to You under the Apache License, Version 2.0 | ||
5 | * (the "License"); you may not use this file except in compliance with | ||
6 | * the License. You may obtain a copy of the License at | ||
7 | * | ||
8 | * http://www.apache.org/licenses/LICENSE-2.0 | ||
9 | * | ||
10 | * Unless required by applicable law or agreed to in writing, software | ||
11 | * distributed under the License is distributed on an "AS IS" BASIS, | ||
12 | * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. | ||
13 | * See the License for the specific language governing permissions and | ||
14 | * limitations under the License. | ||
15 | */ | ||
16 | |||
17 | /* Derived from PCRE's pcreposix.h. | ||
18 | |||
19 | Copyright (c) 1997-2004 University of Cambridge | ||
20 | |||
21 | ----------------------------------------------------------------------------- | ||
22 | Redistribution and use in source and binary forms, with or without | ||
23 | modification, are permitted provided that the following conditions are met: | ||
24 | |||
25 | * Redistributions of source code must retain the above copyright notice, | ||
26 | this list of conditions and the following disclaimer. | ||
27 | |||
28 | * Redistributions in binary form must reproduce the above copyright | ||
29 | notice, this list of conditions and the following disclaimer in the | ||
30 | documentation and/or other materials provided with the distribution. | ||
31 | |||
32 | * Neither the name of the University of Cambridge nor the names of its | ||
33 | contributors may be used to endorse or promote products derived from | ||
34 | this software without specific prior written permission. | ||
35 | |||
36 | THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND CONTRIBUTORS "AS IS" | ||
37 | AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE | ||
38 | IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE | ||
39 | ARE DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT OWNER OR CONTRIBUTORS BE | ||
40 | LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR | ||
41 | CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF | ||
42 | SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS | ||
43 | INTERRUPTION) HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN | ||
44 | CONTRACT, STRICT LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) | ||
45 | ARISING IN ANY WAY OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE | ||
46 | POSSIBILITY OF SUCH DAMAGE. | ||
47 | ----------------------------------------------------------------------------- | ||
48 | */ | ||
49 | |||
50 | /** | ||
51 | * @file ap_regex.h | ||
52 | * @brief Apache Regex defines | ||
53 | */ | ||
54 | |||
55 | #ifndef AP_REGEX_H | ||
56 | #define AP_REGEX_H | ||
57 | |||
58 | #include "apr.h" | ||
59 | |||
60 | /* Allow for C++ users */ | ||
61 | |||
62 | #ifdef __cplusplus | ||
63 | extern "C" { | ||
64 | #endif | ||
65 | |||
66 | /* Options for ap_regexec: */ | ||
67 | |||
68 | #define AP_REG_ICASE 0x01 /** use a case-insensitive match */ | ||
69 | #define AP_REG_NEWLINE 0x02 /** don't match newlines against '.' etc */ | ||
70 | #define AP_REG_NOTBOL 0x04 /** ^ will not match against start-of-string */ | ||
71 | #define AP_REG_NOTEOL 0x08 /** $ will not match against end-of-string */ | ||
72 | |||
73 | #define AP_REG_EXTENDED (0) /** unused */ | ||
74 | #define AP_REG_NOSUB (0) /** unused */ | ||
75 | |||
76 | #define AP_MAX_REG_MATCH 10 | ||
77 | |||
78 | /* Error values: */ | ||
79 | enum { | ||
80 | AP_REG_ASSERT = 1, /** internal error ? */ | ||
81 | AP_REG_ESPACE, /** failed to get memory */ | ||
82 | AP_REG_INVARG, /** invalid argument */ | ||
83 | AP_REG_NOMATCH /** match failed */ | ||
84 | }; | ||
85 | |||
86 | /* The structure representing a compiled regular expression. */ | ||
87 | typedef struct { | ||
88 | void *re_pcre; | ||
89 | apr_size_t re_nsub; | ||
90 | apr_size_t re_erroffset; | ||
91 | } ap_regex_t; | ||
92 | |||
93 | /* The structure in which a captured offset is returned. */ | ||
94 | typedef struct { | ||
95 | int rm_so; | ||
96 | int rm_eo; | ||
97 | } ap_regmatch_t; | ||
98 | |||
99 | /* The functions */ | ||
100 | |||
101 | /** | ||
102 | * Compile a regular expression. | ||
103 | * @param preg Returned compiled regex | ||
104 | * @param regex The regular expression string | ||
105 | * @param cflags Must be zero (currently). | ||
106 | * @return Zero on success or non-zero on error | ||
107 | */ | ||
108 | int ap_regcomp(ap_regex_t *preg, const char *regex, int cflags); | ||
109 | |||
110 | /** | ||
111 | * Match a NUL-terminated string against a pre-compiled regex. | ||
112 | * @param preg The pre-compiled regex | ||
113 | * @param string The string to match | ||
114 | * @param nmatch Provide information regarding the location of any matches | ||
115 | * @param pmatch Provide information regarding the location of any matches | ||
116 | * @param eflags Bitwise OR of any of AP_REG_* flags | ||
117 | * @return 0 for successful match, #REG_NOMATCH otherwise | ||
118 | */ | ||
119 | int ap_regexec(const ap_regex_t *preg, const char *string, | ||
120 | apr_size_t nmatch, ap_regmatch_t *pmatch, int eflags); | ||
121 | |||
122 | /** | ||
123 | * Return the error code returned by regcomp or regexec into error messages | ||
124 | * @param errcode the error code returned by regexec or regcomp | ||
125 | * @param preg The precompiled regex | ||
126 | * @param errbuf A buffer to store the error in | ||
127 | * @param errbuf_size The size of the buffer | ||
128 | */ | ||
129 | apr_size_t ap_regerror(int errcode, const ap_regex_t *preg, | ||
130 | char *errbuf, apr_size_t errbuf_size); | ||
131 | |||
132 | /** Destroy a pre-compiled regex. | ||
133 | * @param preg The pre-compiled regex to free. | ||
134 | */ | ||
135 | void ap_regfree(ap_regex_t *preg); | ||
136 | |||
137 | /** | ||
138 | * Compile a regular expression to be used later | ||
139 | * @param p The pool to allocate from | ||
140 | * @param pattern the regular expression to compile | ||
141 | * @param cflags The bitwise or of one or more of the following: | ||
142 | * @li REG_EXTENDED - Use POSIX extended Regular Expressions | ||
143 | * @li REG_ICASE - Ignore case | ||
144 | * @li REG_NOSUB - Support for substring addressing of matches | ||
145 | * not required | ||
146 | * @li REG_NEWLINE - Match-any-character operators don't match new-line | ||
147 | * @return The compiled regular expression | ||
148 | */ | ||
149 | ap_regex_t * ap_pregcomp(apr_pool_t *p, const char *pattern, | ||
150 | int cflags); | ||
151 | |||
152 | /** | ||
153 | * Free the memory associated with a compiled regular expression | ||
154 | * @param p The pool the regex was allocated from | ||
155 | * @param reg The regular expression to free | ||
156 | */ | ||
157 | void ap_pregfree(apr_pool_t *p, ap_regex_t *reg); | ||
158 | |||
159 | /** | ||
160 | * After performing a successful regex match, you may use this function to | ||
161 | * perform a series of string substitutions based on subexpressions that were | ||
162 | * matched during the call to ap_regexec | ||
163 | * @param p The pool to allocate from | ||
164 | * @param input An arbitrary string containing $1 through $9. These are | ||
165 | * replaced with the corresponding matched sub-expressions | ||
166 | * @param source The string that was originally matched to the regex | ||
167 | * @param nmatch the nmatch returned from ap_pregex | ||
168 | * @param pmatch the pmatch array returned from ap_pregex | ||
169 | */ | ||
170 | char * ap_pregsub(apr_pool_t *p, const char *input, const char *source, | ||
171 | size_t nmatch, ap_regmatch_t pmatch[]); | ||
172 | |||
173 | #ifdef __cplusplus | ||
174 | } /* extern "C" */ | ||
175 | #endif | ||
176 | |||
177 | #endif /* AP_REGEX_T */ | ||
178 | |||
diff --git a/utility/config.c b/utility/config.c new file mode 100644 index 0000000..6867476 --- /dev/null +++ b/utility/config.c | |||
@@ -0,0 +1,534 @@ | |||
1 | #include "apr.h" | ||
2 | #include "apr_file_info.h" | ||
3 | #include "apr_file_io.h" | ||
4 | #include "apr_strings.h" | ||
5 | #include "apr_hash.h" | ||
6 | #include "apr_uri.h" | ||
7 | |||
8 | #include "shell.h" | ||
9 | #include "config.h" | ||
10 | #include "util.h" | ||
11 | #include "logparse.h" | ||
12 | #include "autoconfig.h" | ||
13 | |||
14 | apr_hash_t *g_config_opts; | ||
15 | |||
16 | static apr_status_t config_set_string(config_t *cfg, config_opt_t *opt, | ||
17 | int argc, const char **argv) | ||
18 | { | ||
19 | int offset = (int)(long)opt->data; | ||
20 | char **data = (char **)((void *)cfg + offset); | ||
21 | if (argc != 2) | ||
22 | return APR_EINVAL; | ||
23 | *data = apr_pstrdup(cfg->pool, argv[1]); | ||
24 | return APR_SUCCESS; | ||
25 | } | ||
26 | |||
27 | static apr_status_t config_set_file(config_t *cfg, config_opt_t *opt, | ||
28 | int argc, const char **argv) | ||
29 | { | ||
30 | int offset = (int)(long)opt->data; | ||
31 | char **data = (char **)((void *)cfg + offset); | ||
32 | if (argc != 2) | ||
33 | return APR_EINVAL; | ||
34 | apr_filepath_merge(data, NULL, argv[1], | ||
35 | APR_FILEPATH_TRUENAME, cfg->pool); | ||
36 | return APR_SUCCESS; | ||
37 | } | ||
38 | |||
39 | static apr_status_t config_set_int(config_t *cfg, config_opt_t *opt, int argc, | ||
40 | const char **argv) | ||
41 | { | ||
42 | int offset = (int)(long)opt->data; | ||
43 | int *data = (int *)((void *)cfg + offset); | ||
44 | if (argc != 2) | ||
45 | return APR_EINVAL; | ||
46 | *data = apr_atoi64(argv[1]); | ||
47 | return APR_SUCCESS; | ||
48 | } | ||
49 | |||
50 | static apr_status_t config_set_flag(config_t *cfg, config_opt_t *opt, int argc, | ||
51 | const char **argv) | ||
52 | { | ||
53 | int offset = (int)(long)opt->data; | ||
54 | int *data = (int *)((void *)cfg + offset); | ||
55 | if (argc != 2) | ||
56 | return APR_EINVAL; | ||
57 | *data = CHECK_YESNO(argv[1]); | ||
58 | return APR_SUCCESS; | ||
59 | } | ||
60 | |||
61 | static apr_status_t config_set_loglevel(config_t *cfg, config_opt_t *opt, | ||
62 | int argc, const char **argv) | ||
63 | { | ||
64 | if (argc != 2) | ||
65 | return APR_EINVAL; | ||
66 | if (!strcasecmp(argv[1], "error")) { | ||
67 | cfg->loglevel = LOGLEVEL_ERROR; | ||
68 | } else if (!strcasecmp(argv[1], "notice")) { | ||
69 | cfg->loglevel = LOGLEVEL_NOTICE; | ||
70 | } else if (!strcasecmp(argv[1], "debug")) { | ||
71 | cfg->loglevel = LOGLEVEL_DEBUG; | ||
72 | } else { | ||
73 | cfg->loglevel = LOGLEVEL_ERROR; | ||
74 | } | ||
75 | return APR_SUCCESS; | ||
76 | } | ||
77 | |||
78 | static apr_status_t config_set_inputfile(config_t *cfg, config_opt_t *opt, | ||
79 | int argc, const char **argv) | ||
80 | { | ||
81 | config_filestat_t *newp; | ||
82 | if (argc != 2) | ||
83 | return APR_EINVAL; | ||
84 | newp = (config_filestat_t *)apr_array_push(cfg->input_files); | ||
85 | char *temp; | ||
86 | apr_filepath_merge(&temp, NULL, argv[1], | ||
87 | APR_FILEPATH_TRUENAME, cfg->pool); | ||
88 | newp->fname = temp; | ||
89 | newp->result = "Not Parsed"; | ||
90 | return APR_SUCCESS; | ||
91 | } | ||
92 | |||
93 | static apr_status_t config_set_dummy(config_t *cfg, config_opt_t *opt, | ||
94 | int argc, const char **argv) | ||
95 | { | ||
96 | return APR_SUCCESS; | ||
97 | } | ||
98 | |||
99 | static apr_status_t config_set_logformat(config_t *cfg, config_opt_t *opt, | ||
100 | int argc, const char **argv) | ||
101 | { | ||
102 | config_logformat_t *format; | ||
103 | config_logformat_field_t *field; | ||
104 | |||
105 | if (argc != 4) | ||
106 | return APR_EINVAL; | ||
107 | |||
108 | format = apr_hash_get(cfg->log_formats, argv[1], APR_HASH_KEY_STRING); | ||
109 | if (!format) { | ||
110 | format = apr_palloc(cfg->pool, sizeof(config_logformat_t)); | ||
111 | format->name = apr_pstrdup(cfg->pool, argv[1]); | ||
112 | format->fields = apr_array_make(cfg->pool, 5, | ||
113 | sizeof(config_logformat_field_t)); | ||
114 | apr_hash_set(cfg->log_formats, apr_pstrdup(cfg->pool,argv[1]), APR_HASH_KEY_STRING, format); | ||
115 | } | ||
116 | field = (config_logformat_field_t *)apr_array_push(format->fields); | ||
117 | field->name = apr_pstrdup(cfg->pool, argv[2]); | ||
118 | field->datatype = apr_pstrdup(cfg->pool, argv[3]); | ||
119 | return APR_SUCCESS; | ||
120 | } | ||
121 | |||
122 | static apr_status_t config_set_output_field(config_t *cfg, config_opt_t *opt, | ||
123 | int argc, const char **argv) | ||
124 | { | ||
125 | config_output_field_t *field; | ||
126 | char *type, *size, *temp; | ||
127 | |||
128 | if (argc < 5) | ||
129 | return APR_EINVAL; | ||
130 | field = (config_output_field_t *)apr_array_push(cfg->output_fields); | ||
131 | field->field = apr_pstrdup(cfg->pool, argv[1]); | ||
132 | field->source = apr_pstrdup(cfg->pool, argv[4]); | ||
133 | field->def = apr_pstrdup(cfg->pool, argv[3]); | ||
134 | type = size = apr_pstrdup(cfg->pool, argv[2]); | ||
135 | while (*size!='\0' && *size!='(') | ||
136 | size++; | ||
137 | if (*size == '(') { | ||
138 | *size = '\0'; | ||
139 | size++; | ||
140 | temp = size; | ||
141 | while (*temp != '\0' && *temp != ')') | ||
142 | temp++; | ||
143 | *temp = '\0'; | ||
144 | field->size = apr_atoi64(size); | ||
145 | } | ||
146 | if (strcasecmp("VARCHAR", type)==0) { | ||
147 | field->datatype = LOGSQL_DATATYPE_VARCHAR; | ||
148 | } else if (strcasecmp("INT", type)==0) { | ||
149 | field->datatype = LOGSQL_DATATYPE_INT; | ||
150 | } else if (strcasecmp("CHAR", type)==0) { | ||
151 | field->datatype = LOGSQL_DATATYPE_CHAR; | ||
152 | } else if (strcasecmp("SMALLINT", type)==0) { | ||
153 | field->datatype = LOGSQL_DATATYPE_SMALLINT; | ||
154 | } else if (strcasecmp("BIGINT", type)==0) { | ||
155 | field->datatype = LOGSQL_DATATYPE_BIGINT; | ||
156 | } else { | ||
157 | return APR_EINVAL; | ||
158 | } | ||
159 | |||
160 | // Has a function | ||
161 | if (argc > 5) { | ||
162 | int i; | ||
163 | field->fname = apr_pstrdup(cfg->pool, argv[5]); | ||
164 | field->func = parser_get_func(field->fname); | ||
165 | field->args = apr_pcalloc(cfg->pool, sizeof(char *) * (argc-5+1)); | ||
166 | for (i=6; i<=argc; i++) { | ||
167 | field->args[i-6] = apr_pstrdup(cfg->pool, argv[i]); | ||
168 | } | ||
169 | } | ||
170 | |||
171 | return APR_SUCCESS; | ||
172 | } | ||
173 | |||
174 | static apr_status_t config_set_filter(config_t *cfg, config_opt_t *opt, | ||
175 | int argc, const char **argv) | ||
176 | { | ||
177 | int argn = 1; | ||
178 | config_filter_t *filter; | ||
179 | switch (opt->name[1]) { | ||
180 | case 'i': //line | ||
181 | filter = apr_array_push(cfg->linefilters); | ||
182 | break; | ||
183 | case 'r': //pre | ||
184 | filter = apr_array_push(cfg->prefilters); | ||
185 | break; | ||
186 | case 'o': //post | ||
187 | filter = apr_array_push(cfg->postfilters); | ||
188 | break; | ||
189 | } | ||
190 | |||
191 | if (opt->name[0]=='P') { // Pre or post 2-3 args | ||
192 | if (argc == 1) | ||
193 | return APR_EINVAL; | ||
194 | filter->field = apr_pstrdup(cfg->pool, argv[1]); | ||
195 | argn++; | ||
196 | } // Otherwise Line based only 1-2 args (no field) | ||
197 | if (argc <= argn) | ||
198 | return APR_EINVAL; | ||
199 | if (*argv[argn] == '+') | ||
200 | argn++; | ||
201 | if (*argv[argn] == '-') { | ||
202 | filter->negative = 1; | ||
203 | argn++; | ||
204 | } | ||
205 | if (filter->negative && argc == argn) { | ||
206 | // if no filter for negative.. that's ok.. Assume ALL | ||
207 | return APR_SUCCESS; | ||
208 | } | ||
209 | if (argc <= argn) | ||
210 | return APR_EINVAL; | ||
211 | filter->filter = apr_pstrdup(cfg->pool, argv[argn]); | ||
212 | filter->regex = ap_pregcomp(cfg->pool, filter->filter, AP_REG_EXTENDED|AP_REG_ICASE); | ||
213 | return APR_SUCCESS; | ||
214 | } | ||
215 | |||
216 | void config_dump(config_t *cfg) | ||
217 | { | ||
218 | apr_hash_index_t *hi; | ||
219 | int i; | ||
220 | config_output_field_t *fields; | ||
221 | config_filter_t *filters; | ||
222 | |||
223 | printf("ErrorLog: %s\n", cfg->errorlog); | ||
224 | printf("LogLevel: %d\n", cfg->loglevel); | ||
225 | |||
226 | printf("BadLineFile: %s\n", cfg->badlinefile); | ||
227 | printf("BadLineMax: %d\n", cfg->badlinemax); | ||
228 | |||
229 | printf("InputDir: %s\n", cfg->input_dir); | ||
230 | |||
231 | printf("Split input files: %d\n", cfg->split_enabled); | ||
232 | printf("Split output directory: %s\n", cfg->split_dir); | ||
233 | printf("Split file count: %d\n", cfg->split_count); | ||
234 | printf("Split min lines: %'d\n", cfg->split_minimum); | ||
235 | printf("Split max lines: %'d\n", cfg->split_maximum); | ||
236 | |||
237 | printf("DB Driver: %s\n", cfg->dbdriver); | ||
238 | printf("DB Params: %s\n", cfg->dbparams); | ||
239 | |||
240 | printf("Table: %s\n", cfg->table); | ||
241 | printf("Transactions: %d\n", cfg->transactions); | ||
242 | printf("MachineID: %s\n", cfg->machineid); | ||
243 | |||
244 | printf("Log formats:\n"); | ||
245 | for (hi = apr_hash_first(cfg->pool, cfg->log_formats); hi; hi | ||
246 | = apr_hash_next(hi)) { | ||
247 | config_logformat_t *format; | ||
248 | config_logformat_field_t *fields; | ||
249 | int i; | ||
250 | |||
251 | apr_hash_this(hi, NULL, NULL, (void **)&format); | ||
252 | printf(">> '%s'\n", format->name); | ||
253 | fields = (config_logformat_field_t *)format->fields->elts; | ||
254 | for (i=0; i<format->fields->nelts; i++) { | ||
255 | printf(">>>> %s:%s\n", fields[i].name, fields[i].datatype); | ||
256 | } | ||
257 | } | ||
258 | printf("Log Format: '%s'\n", cfg->logformat); | ||
259 | |||
260 | printf("Output Fields:\n"); | ||
261 | fields = (config_output_field_t *)cfg->output_fields->elts; | ||
262 | for (i=0; i<cfg->output_fields->nelts; i++) { | ||
263 | printf(">> %s %s(%d) DEFAULT '%s': %s", fields[i].field, | ||
264 | logsql_field_datatyeName(fields[i].datatype), | ||
265 | fields[i].size, fields[i].def, fields[i].source); | ||
266 | if (fields[i].func) { | ||
267 | printf(" :: %s(", fields[i].fname); | ||
268 | if (fields[i].args) { | ||
269 | int a = 0; | ||
270 | while (fields[i].args[a]) { | ||
271 | printf("%s,", fields[i].args[a]); | ||
272 | a++; | ||
273 | } | ||
274 | } | ||
275 | printf(")"); | ||
276 | } | ||
277 | printf("\n"); | ||
278 | } | ||
279 | printf("Filters:\n>> Line:\n"); | ||
280 | filters = (config_filter_t *)cfg->linefilters->elts; | ||
281 | for (i=0; i<cfg->linefilters->nelts; i++) { | ||
282 | printf(">>>> %c \"%s\" (%pp)\n",filters[i].negative ? '-':'+', | ||
283 | filters[i].filter, filters[i].regex); | ||
284 | } | ||
285 | printf(">> Pre:\n"); | ||
286 | filters = (config_filter_t *)cfg->prefilters->elts; | ||
287 | for (i=0; i<cfg->prefilters->nelts; i++) { | ||
288 | printf(">>>> %s %c \"%s\" (%pp)\n", | ||
289 | filters[i].field, filters[i].negative ? '-':'+', | ||
290 | filters[i].filter, filters[i].regex); | ||
291 | } | ||
292 | printf(">> Post:\n"); | ||
293 | filters = (config_filter_t *)cfg->postfilters->elts; | ||
294 | for (i=0; i<cfg->postfilters->nelts; i++) { | ||
295 | printf(">>>> %s %c \"%s\" (%pp)\n", | ||
296 | filters[i].field, filters[i].negative ? '-':'+', | ||
297 | filters[i].filter, filters[i].regex); | ||
298 | } | ||
299 | |||
300 | printf("DryRun: %d\n", cfg->dryrun); | ||
301 | printf("Summary: %d\n", cfg->summary); | ||
302 | } | ||
303 | |||
304 | #define config_get_option(name) apr_hash_get(g_config_opts, name, APR_HASH_KEY_STRING) | ||
305 | |||
306 | static void config_add_option(apr_pool_t *p, const char *const name, | ||
307 | const char *const help, config_func_t func, void *data) | ||
308 | { | ||
309 | config_opt_t *opt; | ||
310 | if (!g_config_opts) { | ||
311 | g_config_opts = apr_hash_make(p); | ||
312 | } | ||
313 | opt = apr_palloc(p, sizeof(config_opt_t)); | ||
314 | opt->name = name; | ||
315 | opt->help = help; | ||
316 | opt->func = func; | ||
317 | opt->data = data; | ||
318 | apr_hash_set(g_config_opts, lowerstr(p, name), APR_HASH_KEY_STRING, opt); | ||
319 | } | ||
320 | |||
321 | void config_init(apr_pool_t *p) | ||
322 | { | ||
323 | config_add_option(p, "ErrorLog", "File to log errors", config_set_file, | ||
324 | (void *)APR_OFFSETOF(config_t, errorlog)); | ||
325 | config_add_option(p, "LogLevel", "Set Log Level (error, warn, debug, quiet)", | ||
326 | config_set_loglevel, NULL); | ||
327 | |||
328 | config_add_option(p, "BadLineFile", "File to log bad log lines", config_set_file, | ||
329 | (void *)APR_OFFSETOF(config_t, badlinefile)); | ||
330 | config_add_option(p, "BadLineMax", "Max number of bad lines before aborting", | ||
331 | config_set_int, (void *)APR_OFFSETOF(config_t, badlinemax)); | ||
332 | |||
333 | |||
334 | config_add_option(p, "InputDirectory", "Directory to scan for log files", | ||
335 | config_set_file, (void *)APR_OFFSETOF(config_t, input_dir)); | ||
336 | config_add_option(p, "InputFile", "Parse only this file", | ||
337 | config_set_inputfile, NULL); | ||
338 | |||
339 | config_add_option(p, "SplitInput", | ||
340 | "Split the file into pieces, then process", | ||
341 | config_set_flag, (void *)APR_OFFSETOF(config_t, split_enabled)); | ||
342 | config_add_option(p, "SplitCount", | ||
343 | "Split the file into N number of pieces", | ||
344 | config_set_int, (void *)APR_OFFSETOF(config_t, split_count)); | ||
345 | config_add_option(p, "SplitMinLines", | ||
346 | "Each split piece will have a minumum of N lines", | ||
347 | config_set_int, (void *)APR_OFFSETOF(config_t, split_minimum)); | ||
348 | config_add_option(p, "SplitMaxLines", | ||
349 | "Each split piece will have a maximum of N lines", | ||
350 | config_set_int, (void *)APR_OFFSETOF(config_t, split_maximum)); | ||
351 | config_add_option(p, "SplitDirectory", | ||
352 | "Output directory to put intermediate split files", | ||
353 | config_set_file, (void *)APR_OFFSETOF(config_t, split_dir)); | ||
354 | |||
355 | config_add_option(p, "ThreadCount", | ||
356 | "Numer of threads to use for processing the input files", | ||
357 | config_set_int, (void *)APR_OFFSETOF(config_t, thread_count)); | ||
358 | |||
359 | config_add_option(p, "DBDDriver", "DBD Driver to use", | ||
360 | config_set_string, (void *)APR_OFFSETOF(config_t, dbdriver)); | ||
361 | config_add_option(p, "DBDParams", "DBD Connection Parameters", | ||
362 | config_set_string, (void *)APR_OFFSETOF(config_t, dbparams)); | ||
363 | config_add_option(p, "Table", "Table to import the log to", | ||
364 | config_set_string, (void *)APR_OFFSETOF(config_t, table)); | ||
365 | config_add_option(p, "UseTransactions", "Enable Transactions?", | ||
366 | config_set_flag, (void *)APR_OFFSETOF(config_t, transactions)); | ||
367 | config_add_option(p, "MachineID", "Machine ID to set", | ||
368 | config_set_string, (void *)APR_OFFSETOF(config_t, machineid)); | ||
369 | |||
370 | config_add_option(p, "LogFormatConfig", "Define input log formats", | ||
371 | config_set_logformat, NULL); | ||
372 | config_add_option(p, "LogFormat", "Use this logformat when parsing files", | ||
373 | config_set_string, (void *)APR_OFFSETOF(config_t, logformat)); | ||
374 | |||
375 | config_add_option(p, "LineFilter", | ||
376 | "A regular expression to apply to the input line", | ||
377 | config_set_filter, (void *)APR_OFFSETOF(config_t, linefilters)); | ||
378 | config_add_option(p, "PreFilter", | ||
379 | "A regular expression to apply to a specific input field", | ||
380 | config_set_filter, (void *)APR_OFFSETOF(config_t, prefilters)); | ||
381 | config_add_option(p, "PostFilter", | ||
382 | "A regular expression to apply to a specific SQL output field", | ||
383 | config_set_filter, (void *)APR_OFFSETOF(config_t, postfilters)); | ||
384 | |||
385 | config_add_option(p, "OutputField", | ||
386 | "Define output fields: field datatype source optfunc optarg...", | ||
387 | config_set_output_field, NULL); | ||
388 | |||
389 | config_add_option(p, "DryRun", "Don't perform any actual database changes", | ||
390 | config_set_flag, (void *)APR_OFFSETOF(config_t, dryrun)); | ||
391 | config_add_option(p, "Dump", "Dump Configuration and quit", | ||
392 | config_set_flag, (void *)APR_OFFSETOF(config_t, dump)); | ||
393 | config_add_option(p, "Config", "Dummy to handle config directive", | ||
394 | config_set_dummy, NULL); | ||
395 | config_add_option(p, "Summary", "Show the summary before exit?", | ||
396 | config_set_flag, (void *)APR_OFFSETOF(config_t, summary)); | ||
397 | } | ||
398 | |||
399 | config_t *config_create(apr_pool_t *p) | ||
400 | { | ||
401 | config_t *cfg; | ||
402 | apr_pool_t *sp; | ||
403 | apr_pool_create(&sp, p); | ||
404 | cfg = apr_pcalloc(sp, sizeof(config_t)); | ||
405 | cfg->pool = sp; | ||
406 | cfg->loglevel = LOGLEVEL_ERROR; | ||
407 | cfg->summary = 1; | ||
408 | cfg->transactions = 1; | ||
409 | cfg->thread_count = 0; // default zero thread (aka non-threaded) | ||
410 | cfg->split_count = 4; | ||
411 | cfg->split_minimum = 10000; | ||
412 | cfg->split_maximum = 50000; | ||
413 | cfg->input_files = apr_array_make(cfg->pool, 2, sizeof(config_filestat_t)); | ||
414 | cfg->log_formats = apr_hash_make(cfg->pool); | ||
415 | cfg->output_fields = apr_array_make(cfg->pool, 10, | ||
416 | sizeof(config_output_field_t)); | ||
417 | cfg->linefilters = apr_array_make(cfg->pool, 2, sizeof(config_filter_t)); | ||
418 | cfg->prefilters = apr_array_make(cfg->pool, 2, sizeof(config_filter_t)); | ||
419 | cfg->postfilters = apr_array_make(cfg->pool, 2, sizeof(config_filter_t)); | ||
420 | return cfg; | ||
421 | } | ||
422 | |||
423 | apr_status_t config_check(config_t *cfg) | ||
424 | { | ||
425 | apr_status_t ret = APR_SUCCESS; | ||
426 | if (!cfg->dbdriver || !cfg->dbparams) { | ||
427 | logging_log(cfg, LOGLEVEL_NOISE, "CONFIG: Database configuration is missing"); | ||
428 | ret = APR_EINVAL; | ||
429 | } | ||
430 | if (!cfg->table) { | ||
431 | logging_log(cfg, LOGLEVEL_NOISE, "CONFIG: No Log Table defined"); | ||
432 | ret = APR_EINVAL; | ||
433 | } | ||
434 | if (apr_is_empty_array(cfg->output_fields)) { | ||
435 | logging_log(cfg, LOGLEVEL_NOISE, "CONFIG: No Output Fields Defined"); | ||
436 | ret = APR_EINVAL; | ||
437 | } | ||
438 | if (apr_hash_count(cfg->log_formats)==0) { | ||
439 | logging_log(cfg, LOGLEVEL_NOISE, "CONFIG: No Input Log Formats Defined"); | ||
440 | ret = APR_EINVAL; | ||
441 | } | ||
442 | #if !defined(HAVE_APR_DBD_TRANSACTION_MODE_GET) | ||
443 | if (cfg->transactions) { | ||
444 | logging_log(cfg, LOGLEVEL_NOISE, "CONFIG: Disabling Transaction Support. Requires apr-util 1.3.0 or higher"); | ||
445 | cfg->transactions = 0; | ||
446 | } | ||
447 | #endif | ||
448 | return ret; | ||
449 | } | ||
450 | |||
451 | static int config_merge(void *rec, const char *key, const char *value) | ||
452 | { | ||
453 | config_t *cfg = (config_t *)rec; | ||
454 | |||
455 | config_opt_t *opt= config_get_option(key); | ||
456 | if (opt) { | ||
457 | const char *args[] = { | ||
458 | key, | ||
459 | value }; | ||
460 | opt->func(cfg, opt, 2, args); | ||
461 | } else { | ||
462 | logging_log(cfg, LOGLEVEL_NOISE, "Unhandled: %s\n", key); | ||
463 | } | ||
464 | return 1; | ||
465 | } | ||
466 | |||
467 | apr_status_t config_read(config_t *cfg, const char *filename, | ||
468 | apr_table_t *merge) | ||
469 | { | ||
470 | apr_finfo_t finfo; | ||
471 | apr_file_t *file; | ||
472 | apr_status_t rv, ret= APR_SUCCESS; | ||
473 | apr_pool_t *tp, *targp; | ||
474 | config_opt_t *opt; | ||
475 | char buff[1024]; | ||
476 | char *ptr; | ||
477 | char **targv; | ||
478 | int targc; | ||
479 | int line; | ||
480 | |||
481 | apr_pool_create(&tp, cfg->pool); | ||
482 | apr_pool_create(&targp, tp); | ||
483 | |||
484 | if (apr_stat(&finfo, filename, APR_FINFO_MIN, tp) != APR_SUCCESS) { | ||
485 | return APR_ENOENT; | ||
486 | } | ||
487 | rv = apr_file_open(&file, filename, APR_FOPEN_READ | APR_BUFFERED, | ||
488 | APR_OS_DEFAULT, tp); | ||
489 | if (rv != APR_SUCCESS) | ||
490 | return rv; | ||
491 | |||
492 | line = 0; | ||
493 | do { | ||
494 | rv = apr_file_gets(buff, 1024, file); | ||
495 | if (rv == APR_SUCCESS) { // we read data | ||
496 | line++; | ||
497 | |||
498 | // skip leading white space | ||
499 | for (ptr = buff; *ptr == ' ' || *ptr == '\t'; ptr++) | ||
500 | ; | ||
501 | line_chomp(ptr); | ||
502 | |||
503 | // skip comments | ||
504 | if (*ptr == '#') | ||
505 | continue; | ||
506 | if (*ptr == '\0') | ||
507 | continue; | ||
508 | apr_pool_clear(targp); | ||
509 | parser_tokenize_line(ptr, &targv, targp); | ||
510 | targc = 0; | ||
511 | while (targv[targc]) | ||
512 | targc++; | ||
513 | opt = config_get_option(lowerstr(targp,targv[0])); | ||
514 | if (opt) { | ||
515 | rv = opt->func(cfg, opt, targc, (const char **)targv); | ||
516 | if (APR_STATUS_IS_EINVAL(rv)) { | ||
517 | logging_log(cfg, LOGLEVEL_NOISE, | ||
518 | "Config Error: Invalid Arguments for %s\n\t%s\n", | ||
519 | opt->name, opt->help); | ||
520 | ret = rv; | ||
521 | } | ||
522 | } else { | ||
523 | logging_log(cfg, LOGLEVEL_NOISE, "Unhandled: %s\n", targv[0]); | ||
524 | } | ||
525 | } | ||
526 | } while (rv == APR_SUCCESS); | ||
527 | |||
528 | // Apply merges | ||
529 | apr_table_do(config_merge, (void *)cfg, merge, NULL); | ||
530 | |||
531 | apr_file_close(file); | ||
532 | apr_pool_destroy(tp); | ||
533 | return ret; | ||
534 | } | ||
diff --git a/utility/config.h b/utility/config.h new file mode 100644 index 0000000..a9bd1b5 --- /dev/null +++ b/utility/config.h | |||
@@ -0,0 +1,190 @@ | |||
1 | #ifndef CONFIG_H_ | ||
2 | #define CONFIG_H_ | ||
3 | |||
4 | #include "apr_tables.h" | ||
5 | #include "apr_hash.h" | ||
6 | #include "apr_file_io.h" | ||
7 | #include "ap_pcre.h" | ||
8 | |||
9 | typedef enum { | ||
10 | LOGLEVEL_NOISE = 0, | ||
11 | LOGLEVEL_NONE, | ||
12 | LOGLEVEL_ERROR, | ||
13 | LOGLEVEL_NOTICE, | ||
14 | LOGLEVEL_DEBUG, | ||
15 | } loglevel_e; | ||
16 | |||
17 | typedef struct config_dbd_t config_dbd_t; | ||
18 | typedef struct config_t config_t; | ||
19 | struct config_t { | ||
20 | /** the structures pool (to ease function arguments) */ | ||
21 | apr_pool_t *pool; | ||
22 | |||
23 | /** error log file */ | ||
24 | const char *errorlog; | ||
25 | /** log level */ | ||
26 | loglevel_e loglevel; | ||
27 | /** error_log */ | ||
28 | apr_file_t *errorlog_fp; | ||
29 | apr_file_t *errorlog_fperr; | ||
30 | apr_pool_t *errorlog_p; | ||
31 | |||
32 | const char *badlinefile; | ||
33 | const char *badlastfile; | ||
34 | apr_file_t *badline_fp; | ||
35 | int badline_count; | ||
36 | int badlinemax; | ||
37 | |||
38 | |||
39 | /** input directory of log files */ | ||
40 | const char *input_dir; | ||
41 | /** list of files to scan */ | ||
42 | apr_array_header_t *input_files; | ||
43 | |||
44 | /** split the input file before processing */ | ||
45 | int split_enabled; | ||
46 | /** the number of files to split each input file into */ | ||
47 | int split_count; | ||
48 | /** the minimum number of lines for each piece */ | ||
49 | int split_minimum; | ||
50 | /** the maximum number of lines for each piece */ | ||
51 | int split_maximum; | ||
52 | /** directory to put ouput split files */ | ||
53 | const char *split_dir; | ||
54 | |||
55 | /** the number of threads to run the import in */ | ||
56 | int thread_count; | ||
57 | |||
58 | /** db connection configuration */ | ||
59 | const char *dbdriver; | ||
60 | const char *dbparams; | ||
61 | |||
62 | /** Logging table */ | ||
63 | const char *table; | ||
64 | /** Use transactons */ | ||
65 | int transactions; | ||
66 | /** Machine ID */ | ||
67 | const char *machineid; | ||
68 | |||
69 | /** Log file formats */ | ||
70 | apr_hash_t *log_formats; | ||
71 | /** format to use to parse files */ | ||
72 | const char *logformat; | ||
73 | |||
74 | /** output fields */ | ||
75 | apr_array_header_t *output_fields; | ||
76 | |||
77 | /** filter configuration */ | ||
78 | apr_array_header_t *linefilters; | ||
79 | apr_array_header_t *prefilters; | ||
80 | apr_array_header_t *postfilters; | ||
81 | |||
82 | /** Dry Run */ | ||
83 | int dryrun; | ||
84 | /** dump configuration only */ | ||
85 | int dump; | ||
86 | |||
87 | /* Show the summary */ | ||
88 | int summary; | ||
89 | }; | ||
90 | |||
91 | typedef struct config_filestat_t config_filestat_t; | ||
92 | struct config_filestat_t { | ||
93 | const char *fname; | ||
94 | apr_size_t linesparsed; | ||
95 | apr_size_t lineskipped; | ||
96 | apr_size_t linesbad; | ||
97 | const char *result; | ||
98 | apr_time_t start; | ||
99 | apr_time_t stop; | ||
100 | }; | ||
101 | |||
102 | typedef struct config_logformat_t config_logformat_t; | ||
103 | struct config_logformat_t { | ||
104 | const char *name; | ||
105 | apr_array_header_t *fields; | ||
106 | }; | ||
107 | |||
108 | typedef struct config_logformat_field_t config_logformat_field_t; | ||
109 | struct config_logformat_field_t { | ||
110 | const char *name; | ||
111 | const char *datatype; | ||
112 | }; | ||
113 | |||
114 | typedef struct config_opt_t config_opt_t; | ||
115 | typedef apr_status_t (*config_func_t)(config_t *cfg, config_opt_t *opt, | ||
116 | int argc, const char **argv); | ||
117 | struct config_opt_t { | ||
118 | const char *name; | ||
119 | const char *help; | ||
120 | config_func_t func; | ||
121 | void *data; | ||
122 | }; | ||
123 | |||
124 | typedef struct config_filter_t config_filter_t; | ||
125 | struct config_filter_t { | ||
126 | const char *field; | ||
127 | const char *filter; | ||
128 | int negative; | ||
129 | ap_regex_t *regex; | ||
130 | }; | ||
131 | |||
132 | typedef enum { | ||
133 | LOGSQL_DATATYPE_INT = 0, | ||
134 | LOGSQL_DATATYPE_SMALLINT, | ||
135 | LOGSQL_DATATYPE_VARCHAR, | ||
136 | LOGSQL_DATATYPE_CHAR, | ||
137 | LOGSQL_DATATYPE_BIGINT | ||
138 | } logsql_field_datatype; | ||
139 | #define logsql_field_datatyeName(x) \ | ||
140 | (x == LOGSQL_DATATYPE_INT ? "INT" \ | ||
141 | : (x == LOGSQL_DATATYPE_SMALLINT ? "SMALLINT" \ | ||
142 | : (x == LOGSQL_DATATYPE_VARCHAR ? "VARCHAR" \ | ||
143 | : (x == LOGSQL_DATATYPE_CHAR ? "CHAR" \ | ||
144 | : (x == LOGSQL_DATATYPE_BIGINT ? "BIGINT" : "ERR"))))) | ||
145 | |||
146 | typedef struct config_output_field_t config_output_field_t; | ||
147 | |||
148 | typedef struct parser_func_t parser_func_t; | ||
149 | |||
150 | struct config_output_field_t { | ||
151 | const char *field; | ||
152 | logsql_field_datatype datatype; | ||
153 | apr_size_t size; | ||
154 | const char *def; | ||
155 | const char *source; | ||
156 | const char *fname; | ||
157 | parser_func_t *func; | ||
158 | const char **args; | ||
159 | void *data; | ||
160 | }; | ||
161 | |||
162 | #define CHECK_YESNO(c) ((!strcasecmp(c,"on") || !strcasecmp(c,"yes")) ? 1 : 0) | ||
163 | |||
164 | /** | ||
165 | * Initialize the config parser | ||
166 | */ | ||
167 | void config_init(apr_pool_t *p); | ||
168 | |||
169 | /** | ||
170 | * Dump the configuration to stdout | ||
171 | */ | ||
172 | void config_dump(config_t *cfg); | ||
173 | |||
174 | /** | ||
175 | * Checks the configuration to ensure all the required settings are set | ||
176 | */ | ||
177 | apr_status_t config_check(config_t *cfg); | ||
178 | |||
179 | /** | ||
180 | * Creates the default configuration | ||
181 | */ | ||
182 | config_t *config_create(apr_pool_t *p); | ||
183 | |||
184 | /** | ||
185 | * Read in a configuration file | ||
186 | */ | ||
187 | apr_status_t config_read(config_t *cfg, const char *filename, | ||
188 | apr_table_t *merge); | ||
189 | |||
190 | #endif /*CONFIG_H_*/ | ||
diff --git a/utility/database.c b/utility/database.c new file mode 100644 index 0000000..ff81caa --- /dev/null +++ b/utility/database.c | |||
@@ -0,0 +1,212 @@ | |||
1 | #include "database.h" | ||
2 | #include "apu.h" | ||
3 | #include "apr_dbd.h" | ||
4 | #include "apr_strings.h" | ||
5 | |||
6 | #include "util.h" | ||
7 | #include "autoconfig.h" | ||
8 | |||
9 | struct config_dbd_t { | ||
10 | const apr_dbd_driver_t *driver; | ||
11 | apr_dbd_t *dbd; | ||
12 | apr_dbd_prepared_t *stmt; | ||
13 | apr_dbd_transaction_t *txn; | ||
14 | const char **args; | ||
15 | }; | ||
16 | |||
17 | void database_init(apr_pool_t *p) | ||
18 | { | ||
19 | apr_dbd_init(p); | ||
20 | } | ||
21 | |||
22 | /** @todo split this into load and connect */ | ||
23 | apr_status_t database_connect(config_t *cfg, config_dbd_t **dbconn) | ||
24 | { | ||
25 | apr_status_t rv; | ||
26 | if (!cfg->dbdriver || !cfg->dbparams) | ||
27 | return APR_EINVAL; | ||
28 | if (!*dbconn) { | ||
29 | *dbconn = apr_pcalloc(cfg->pool, sizeof(config_dbd_t)); | ||
30 | } | ||
31 | rv = apr_dbd_get_driver(cfg->pool, cfg->dbdriver, &((*dbconn)->driver)); | ||
32 | if (rv) { | ||
33 | |||
34 | logging_log(cfg, LOGLEVEL_ERROR, | ||
35 | "DB: Could not load database driver %s. Error %s", | ||
36 | cfg->dbdriver, logging_strerror(rv)); | ||
37 | return rv; | ||
38 | } | ||
39 | |||
40 | rv = apr_dbd_open((*dbconn)->driver, cfg->pool, cfg->dbparams, | ||
41 | &((*dbconn)->dbd)); | ||
42 | if (rv) { | ||
43 | logging_log(cfg, LOGLEVEL_ERROR, | ||
44 | "DB: Could not connect to database. Error (%d)%s", rv, | ||
45 | logging_strerror(rv)); | ||
46 | return rv; | ||
47 | } | ||
48 | |||
49 | return APR_SUCCESS; | ||
50 | } | ||
51 | |||
52 | apr_status_t database_disconnect(config_dbd_t *dbconn) | ||
53 | { | ||
54 | return apr_dbd_close(dbconn->driver, dbconn->dbd); | ||
55 | } | ||
56 | |||
57 | static apr_dbd_prepared_t *database_prepare_insert(config_t *cfg, | ||
58 | config_dbd_t *dbconn, apr_pool_t *p) | ||
59 | { | ||
60 | apr_status_t rv; | ||
61 | char *sql; | ||
62 | int i, f; | ||
63 | struct iovec *vec; | ||
64 | apr_dbd_prepared_t *stmt= NULL; | ||
65 | int nfs = cfg->output_fields->nelts; | ||
66 | config_output_field_t *ofields; | ||
67 | |||
68 | ofields = (config_output_field_t *)cfg->output_fields->elts; | ||
69 | |||
70 | vec = apr_palloc(p, (nfs*2 + 5) * sizeof(struct iovec)); | ||
71 | sql = apr_palloc(p, (nfs*3)); | ||
72 | |||
73 | vec[0].iov_base = "INSERT INTO "; | ||
74 | vec[0].iov_len = 12; | ||
75 | vec[1].iov_base = (void *)cfg->table; | ||
76 | vec[1].iov_len = strlen(cfg->table); | ||
77 | vec[2].iov_base = " ("; | ||
78 | vec[2].iov_len = 2; | ||
79 | for (i=3, f=0; f<nfs; f++, i+=2) { | ||
80 | vec[i].iov_base = (void *)ofields[f].field; | ||
81 | vec[i].iov_len = strlen(vec[i].iov_base); | ||
82 | vec[i+1].iov_base = ","; | ||
83 | vec[i+1].iov_len = 1; | ||
84 | memcpy(&sql[f*3], "%s,", 3); | ||
85 | } | ||
86 | sql[nfs*3-1] = '\0'; | ||
87 | vec[i-1].iov_base = ") VALUES ("; | ||
88 | vec[i-1].iov_len = 10; | ||
89 | vec[i].iov_base = sql; | ||
90 | vec[i].iov_len = nfs*3-1; | ||
91 | vec[i+1].iov_base = ")"; | ||
92 | vec[i+1].iov_len = 1; | ||
93 | |||
94 | sql = apr_pstrcatv(p, vec, i+2, NULL); | ||
95 | |||
96 | logging_log(cfg, LOGLEVEL_DEBUG, "DB: Generated SQL: %s", sql); | ||
97 | |||
98 | rv = apr_dbd_prepare(dbconn->driver, cfg->pool, dbconn->dbd, sql, | ||
99 | "INSERT", &stmt); | ||
100 | |||
101 | if (rv) { | ||
102 | logging_log(cfg, LOGLEVEL_NOISE, | ||
103 | "DB: Unable to Prepare SQL insert: %s", apr_dbd_error( | ||
104 | dbconn->driver, dbconn->dbd, rv)); | ||
105 | return NULL; | ||
106 | } | ||
107 | return stmt; | ||
108 | } | ||
109 | |||
110 | apr_status_t database_insert(config_t *cfg, config_dbd_t *dbconn, | ||
111 | apr_pool_t *p, apr_table_t *data) | ||
112 | { | ||
113 | apr_status_t rv; | ||
114 | int f, nfs; | ||
115 | config_output_field_t *ofields; | ||
116 | ofields = (config_output_field_t *)cfg->output_fields->elts; | ||
117 | nfs = cfg->output_fields->nelts; | ||
118 | // Prepare statement | ||
119 | if (!dbconn->stmt) { | ||
120 | dbconn->stmt = database_prepare_insert(cfg, dbconn, p); | ||
121 | if (!dbconn->stmt) { | ||
122 | return APR_EINVAL; | ||
123 | } | ||
124 | dbconn->args = apr_palloc(cfg->pool, nfs * sizeof(char *)); | ||
125 | } | ||
126 | for (f=0; f<nfs; f++) { | ||
127 | dbconn->args[f] = apr_table_get(data, ofields[f].field); | ||
128 | } | ||
129 | rv = apr_dbd_pquery(dbconn->driver, p, dbconn->dbd, &f, | ||
130 | dbconn->stmt, nfs, dbconn->args); | ||
131 | if (rv) { | ||
132 | logging_log(cfg, LOGLEVEL_ERROR, "DB: Unable to Insert SQL: %s", | ||
133 | apr_dbd_error(dbconn->driver, dbconn->dbd, rv)); | ||
134 | return rv; | ||
135 | } | ||
136 | return APR_SUCCESS; | ||
137 | } | ||
138 | |||
139 | apr_status_t database_trans_start(config_t *cfg, config_dbd_t *dbconn, | ||
140 | apr_pool_t *p) | ||
141 | { | ||
142 | #if HAVE_APR_DBD_TRANSACTION_MODE_GET | ||
143 | apr_status_t rv; | ||
144 | if (!cfg->transactions) | ||
145 | return APR_SUCCESS; | ||
146 | if (dbconn->txn) { | ||
147 | logging_log(cfg, LOGLEVEL_NOISE, | ||
148 | "Transaction Already Started. Something is BROKE"); | ||
149 | return APR_EINVAL; | ||
150 | } | ||
151 | logging_log(cfg, LOGLEVEL_DEBUG, "DB: Starting Transaction"); | ||
152 | rv = apr_dbd_transaction_start(dbconn->driver, p, dbconn->dbd, | ||
153 | &dbconn->txn); | ||
154 | if (rv) | ||
155 | logging_log(cfg, LOGLEVEL_NOISE, | ||
156 | "DB: Error Starting Transaction: (%d)%s", rv, apr_dbd_error( | ||
157 | dbconn->driver, dbconn->dbd, rv)); | ||
158 | return rv; | ||
159 | #else | ||
160 | return APR_SUCCESS; | ||
161 | #endif | ||
162 | } | ||
163 | |||
164 | apr_status_t database_trans_stop(config_t *cfg, config_dbd_t *dbconn, | ||
165 | apr_pool_t *p) | ||
166 | { | ||
167 | #if HAVE_APR_DBD_TRANSACTION_MODE_GET | ||
168 | apr_status_t rv; | ||
169 | if (!cfg->transactions) | ||
170 | return APR_SUCCESS; | ||
171 | if (!dbconn->txn) { | ||
172 | logging_log(cfg, LOGLEVEL_NOISE, | ||
173 | "No Transaction Started. Something is BROKE"); | ||
174 | return APR_EINVAL; | ||
175 | } | ||
176 | logging_log(cfg, LOGLEVEL_DEBUG, "DB: Stopping Transaction"); | ||
177 | rv = apr_dbd_transaction_end(dbconn->driver, p, dbconn->txn); | ||
178 | if (rv) | ||
179 | logging_log(cfg, LOGLEVEL_NOISE, | ||
180 | "DB: Error Stopping Transaction: (%d)%s", rv, apr_dbd_error( | ||
181 | dbconn->driver, dbconn->dbd, rv)); | ||
182 | |||
183 | dbconn->txn = NULL; | ||
184 | return rv; | ||
185 | #else | ||
186 | return APR_SUCCESS; | ||
187 | #endif | ||
188 | } | ||
189 | |||
190 | apr_status_t database_trans_abort(config_t *cfg, config_dbd_t *dbconn) | ||
191 | { | ||
192 | #if HAVE_APR_DBD_TRANSACTION_MODE_GET | ||
193 | apr_status_t rv; | ||
194 | if (!cfg->transactions) | ||
195 | return APR_SUCCESS; | ||
196 | if (!dbconn->txn) { | ||
197 | logging_log(cfg, LOGLEVEL_NOISE, | ||
198 | "No Transaction Started. Something is BROKE"); | ||
199 | return APR_EINVAL; | ||
200 | } | ||
201 | logging_log(cfg, LOGLEVEL_NOTICE, "DB: Aborting Transaction"); | ||
202 | rv = apr_dbd_transaction_mode_set(dbconn->driver, dbconn->txn, | ||
203 | APR_DBD_TRANSACTION_ROLLBACK); | ||
204 | if (rv) | ||
205 | logging_log(cfg, LOGLEVEL_NOISE, | ||
206 | "DB: Error Aborting Transaction: (%d)%s", rv, apr_dbd_error( | ||
207 | dbconn->driver, dbconn->dbd, rv)); | ||
208 | return rv; | ||
209 | #else | ||
210 | return APR_SUCCESS; | ||
211 | #endif | ||
212 | } | ||
diff --git a/utility/database.h b/utility/database.h new file mode 100644 index 0000000..9797d51 --- /dev/null +++ b/utility/database.h | |||
@@ -0,0 +1,25 @@ | |||
1 | #ifndef DATABASE_H_ | ||
2 | #define DATABASE_H_ | ||
3 | |||
4 | #include "apr_pools.h" | ||
5 | |||
6 | #include "config.h" | ||
7 | |||
8 | void database_init(apr_pool_t *p); | ||
9 | |||
10 | apr_status_t database_connect(config_t *cfg, config_dbd_t **dbconn); | ||
11 | |||
12 | apr_status_t database_disconnect(config_dbd_t *dbconn); | ||
13 | |||
14 | apr_status_t database_insert(config_t *cfg, config_dbd_t *dbconn, | ||
15 | apr_pool_t *p, apr_table_t *data); | ||
16 | |||
17 | apr_status_t database_trans_start(config_t *cfg, config_dbd_t *dbconn, | ||
18 | apr_pool_t *p); | ||
19 | |||
20 | apr_status_t database_trans_stop(config_t *cfg, config_dbd_t *dbconn, | ||
21 | apr_pool_t *p); | ||
22 | |||
23 | apr_status_t database_trans_abort(config_t *cfg, config_dbd_t *dbconn); | ||
24 | |||
25 | #endif /*DATABASE_H_*/ | ||
diff --git a/utility/logparse.c b/utility/logparse.c new file mode 100644 index 0000000..1b3cc97 --- /dev/null +++ b/utility/logparse.c | |||
@@ -0,0 +1,768 @@ | |||
1 | #include "logparse.h" | ||
2 | #include "apr_file_info.h" | ||
3 | #include "apr_file_io.h" | ||
4 | #include "apr_strings.h" | ||
5 | #include "apr_time.h" | ||
6 | |||
7 | #include "time.h" | ||
8 | #include "stdlib.h" | ||
9 | |||
10 | #include "util.h" | ||
11 | #include "ap_pcre.h" | ||
12 | #include "database.h" | ||
13 | |||
14 | apr_hash_t *g_parser_funcs; | ||
15 | void **g_parser_linedata; | ||
16 | |||
17 | static apr_status_t parser_func_wrap(apr_pool_t *p, config_t *cfg, | ||
18 | config_output_field_t *field, const char *value, const char **ret) | ||
19 | { | ||
20 | if (field->args[0] && field->args[1]) { | ||
21 | struct iovec vec[3]; | ||
22 | apr_size_t len; | ||
23 | |||
24 | vec[0].iov_base = (void *)field->args[0]; | ||
25 | vec[0].iov_len = strlen(field->args[0]); | ||
26 | vec[1].iov_base = (void *)value; | ||
27 | vec[1].iov_len = strlen(value); | ||
28 | vec[2].iov_base = (void *)field->args[1]; | ||
29 | vec[2].iov_len = strlen(field->args[1]); | ||
30 | |||
31 | *ret = apr_pstrcatv(p, vec, 3, &len); | ||
32 | } else { | ||
33 | logging_log(cfg, LOGLEVEL_NOISE, "wrap requires before and after strings"); | ||
34 | return APR_EINVAL; | ||
35 | } | ||
36 | return APR_SUCCESS; | ||
37 | } | ||
38 | |||
39 | static apr_status_t parser_func_regexmatch(apr_pool_t *p, config_t *cfg, | ||
40 | config_output_field_t *field, const char *value, const char **ret) | ||
41 | { | ||
42 | struct { | ||
43 | ap_regex_t *rx; | ||
44 | const char *substr; | ||
45 | }*_data; | ||
46 | ap_regmatch_t regm[AP_MAX_REG_MATCH]; | ||
47 | // Check if a regular expression configured | ||
48 | if (!field->args[0]) | ||
49 | return APR_EINVAL; | ||
50 | if (!field->data) { | ||
51 | // pre compile the regex | ||
52 | _data = apr_palloc(cfg->pool, sizeof(ap_regex_t)+sizeof(const char *)); | ||
53 | _data->rx = ap_pregcomp(cfg->pool, field->args[0], | ||
54 | AP_REG_EXTENDED|AP_REG_ICASE); | ||
55 | if (field->args[1]) { | ||
56 | _data->substr = field->args[1]; | ||
57 | } else { | ||
58 | _data->substr = "$1"; | ||
59 | } | ||
60 | if (!_data->rx) { | ||
61 | logging_log(cfg, LOGLEVEL_NOISE, "Failed to compile regular expression"); | ||
62 | return APR_EINVAL; | ||
63 | } | ||
64 | field->data = _data; | ||
65 | } else | ||
66 | _data = field->data; | ||
67 | |||
68 | if (!ap_regexec(_data->rx, value, AP_MAX_REG_MATCH, regm, 0)) { | ||
69 | *ret = ap_pregsub(p, _data->substr, value, AP_MAX_REG_MATCH, regm); | ||
70 | } | ||
71 | logging_log(cfg, LOGLEVEL_DEBUG, "REGEX: matched %s against %s to %s", value, | ||
72 | field->args[0], *ret); | ||
73 | return APR_SUCCESS; | ||
74 | } | ||
75 | |||
76 | static apr_status_t parser_func_totimestamp(apr_pool_t *p, config_t *cfg, | ||
77 | config_output_field_t *field, const char *value, const char **ret) | ||
78 | { | ||
79 | time_t time; | ||
80 | struct tm ts; | ||
81 | |||
82 | //memset(&ts,0,sizeof(struct tm)); | ||
83 | |||
84 | strptime(value, "%d/%b/%Y:%H:%M:%S %z", &ts); | ||
85 | time = mktime(&ts); | ||
86 | |||
87 | *ret = apr_itoa(p, time); | ||
88 | return APR_SUCCESS; | ||
89 | } | ||
90 | |||
91 | static apr_status_t parser_func_machineid(apr_pool_t *p, config_t *cfg, | ||
92 | config_output_field_t *field, const char *value, const char **ret) | ||
93 | { | ||
94 | if (cfg->machineid) { | ||
95 | *ret = apr_pstrdup(p, cfg->machineid); | ||
96 | } | ||
97 | return APR_SUCCESS; | ||
98 | } | ||
99 | |||
100 | static apr_status_t parser_func_queryarg(apr_pool_t *p, config_t *cfg, | ||
101 | config_output_field_t *field, const char *value, const char **ret) | ||
102 | { | ||
103 | apr_table_t *query = parser_get_linedata(field->func); | ||
104 | |||
105 | if (!field->args[0]) { | ||
106 | logging_log(cfg, LOGLEVEL_NOISE, "queryarg requires name of query arg"); | ||
107 | return APR_EINVAL; | ||
108 | } | ||
109 | |||
110 | if (!query) { | ||
111 | char *query_beg; | ||
112 | |||
113 | query = apr_table_make(p,3); | ||
114 | |||
115 | query_beg = strchr(value, '?'); | ||
116 | // if we have a query string, rip it apart | ||
117 | if (query_beg) { | ||
118 | char *key; | ||
119 | char *value; | ||
120 | const char *delim = "&"; | ||
121 | char *query_string; | ||
122 | char *strtok_state; | ||
123 | char *query_end = strrchr(++query_beg,' '); | ||
124 | |||
125 | query_string = apr_pstrndup(p, query_beg, query_end-query_beg); | ||
126 | logging_log(cfg, LOGLEVEL_DEBUG, "QUERY: Found String %pp, %pp, %s", | ||
127 | query_beg, query_end, query_string); | ||
128 | if (field->args[1]) { | ||
129 | delim = field->args[1]; | ||
130 | } | ||
131 | key = apr_strtok(query_string, delim, &strtok_state); | ||
132 | while (key) { | ||
133 | value = strchr(key, '='); | ||
134 | if (value) { | ||
135 | *value = '\0'; /* Split the string in two */ | ||
136 | value++; /* Skip past the = */ | ||
137 | } | ||
138 | else { | ||
139 | value = "1"; | ||
140 | } | ||
141 | ap_unescape_url(key); | ||
142 | ap_unescape_url(value); | ||
143 | apr_table_set(query, key, value); | ||
144 | |||
145 | logging_log(cfg, LOGLEVEL_DEBUG, | ||
146 | "QUERY: Found arg: %s = %s", key, value); | ||
147 | |||
148 | key = apr_strtok(NULL, delim, &strtok_state); | ||
149 | } | ||
150 | } | ||
151 | parser_set_linedata(field->func,query); | ||
152 | } | ||
153 | *ret = apr_table_get(query, field->args[0]); | ||
154 | return APR_SUCCESS; | ||
155 | } | ||
156 | |||
157 | parser_func_t *parser_get_func(const char *name) | ||
158 | { | ||
159 | return apr_hash_get(g_parser_funcs, name, APR_HASH_KEY_STRING); | ||
160 | } | ||
161 | |||
162 | static void parser_add_func(apr_pool_t *p, const char *const name, | ||
163 | parser_func_f func, int id) | ||
164 | { | ||
165 | parser_func_t *s; | ||
166 | if (!g_parser_funcs) { | ||
167 | g_parser_funcs = apr_hash_make(p); | ||
168 | } | ||
169 | s = apr_palloc(p, sizeof(parser_func_t)); | ||
170 | s->func = func; | ||
171 | s->pos = id; | ||
172 | s->data = NULL; | ||
173 | s->linedata = &g_parser_linedata; | ||
174 | apr_hash_set(g_parser_funcs, lowerstr(p, name), APR_HASH_KEY_STRING, s); | ||
175 | } | ||
176 | |||
177 | void parser_init(apr_pool_t *p) | ||
178 | { | ||
179 | int i = 0; | ||
180 | parser_add_func(p, "regexmatch", parser_func_regexmatch, ++i); | ||
181 | parser_add_func(p, "totimestamp", parser_func_totimestamp, ++i); | ||
182 | parser_add_func(p, "machineid", parser_func_machineid, ++i); | ||
183 | parser_add_func(p, "queryarg", parser_func_queryarg, ++i); | ||
184 | parser_add_func(p, "wrap", parser_func_wrap, ++i); | ||
185 | g_parser_linedata = apr_pcalloc(p, sizeof(void *) * (i+1)); | ||
186 | g_parser_linedata[0] = (void *)i; | ||
187 | } | ||
188 | |||
189 | void parser_find_logs(config_t *cfg) | ||
190 | { | ||
191 | apr_pool_t *tp; | ||
192 | apr_dir_t *dir; | ||
193 | apr_finfo_t finfo; | ||
194 | config_filestat_t *newp; | ||
195 | |||
196 | logging_log(cfg, LOGLEVEL_NOTICE, "Find Log files"); | ||
197 | if (!cfg->input_dir) | ||
198 | return; | ||
199 | apr_pool_create(&tp, cfg->pool); | ||
200 | if (apr_dir_open(&dir, cfg->input_dir, tp)==APR_SUCCESS) { | ||
201 | while (apr_dir_read(&finfo, APR_FINFO_NAME | APR_FINFO_TYPE, dir) | ||
202 | == APR_SUCCESS) { | ||
203 | char *temp; | ||
204 | if (finfo.filetype == APR_DIR) | ||
205 | continue; | ||
206 | newp = (config_filestat_t *)apr_array_push(cfg->input_files); | ||
207 | newp->result = "Not Parsed"; | ||
208 | apr_filepath_merge(&temp, cfg->input_dir, finfo.name, | ||
209 | APR_FILEPATH_TRUENAME, cfg->pool); | ||
210 | newp->fname = temp; | ||
211 | } | ||
212 | apr_dir_close(dir); | ||
213 | } | ||
214 | apr_pool_destroy(tp); | ||
215 | } | ||
216 | |||
217 | #define BUFFER_SIZE (16 * 1024) | ||
218 | |||
219 | void parser_split_logs(config_t *cfg) | ||
220 | { | ||
221 | apr_pool_t *tp, *tfp; | ||
222 | apr_array_header_t *foundfiles; | ||
223 | config_filestat_t *filelist; | ||
224 | config_filestat_t *newfile; | ||
225 | apr_file_t *infile; | ||
226 | int f, l; | ||
227 | apr_status_t rv; | ||
228 | apr_finfo_t finfo; | ||
229 | char buff[BUFFER_SIZE]; | ||
230 | int linecount; | ||
231 | int piecesize; | ||
232 | |||
233 | if (!cfg->split_enabled) return; | ||
234 | if (!cfg->split_dir) { | ||
235 | logging_log(cfg, LOGLEVEL_NOISE, "SPLITTER: Missing Split Output directory"); | ||
236 | return; | ||
237 | } | ||
238 | apr_pool_create(&tp, cfg->pool); | ||
239 | apr_pool_create(&tfp, tp); | ||
240 | |||
241 | if (APR_SUCCESS != apr_stat(&finfo, cfg->split_dir, APR_FINFO_MIN, tp)) { | ||
242 | logging_log(cfg, LOGLEVEL_NOISE, "SPLITTER: Directory %s does not exist", cfg->split_dir); | ||
243 | return; | ||
244 | } | ||
245 | foundfiles = apr_array_copy(tp, cfg->input_files); | ||
246 | apr_array_clear(cfg->input_files); | ||
247 | |||
248 | filelist = (config_filestat_t *)foundfiles->elts; | ||
249 | for (f=0, l=foundfiles->nelts; f < l; f++) { | ||
250 | apr_pool_clear(tfp); | ||
251 | logging_log(cfg, LOGLEVEL_NOTICE, "SPLITTER: Begin Splitting Log File '%s'", filelist[f].fname); | ||
252 | rv = apr_file_open(&infile, filelist[f].fname, APR_FOPEN_READ, APR_OS_DEFAULT, tfp); | ||
253 | |||
254 | if (rv != APR_SUCCESS) { | ||
255 | logging_log(cfg, LOGLEVEL_NOISE, "SPLITTER: Could not open %s", filelist[f].fname); | ||
256 | return; | ||
257 | } | ||
258 | linecount = 0; | ||
259 | while (apr_file_eof(infile) == APR_SUCCESS) { | ||
260 | apr_size_t read = BUFFER_SIZE; | ||
261 | char *p; | ||
262 | apr_file_read(infile, buff, &read); | ||
263 | p = buff; | ||
264 | while ((p = memchr(p, '\n', (buff + read) - p))) { | ||
265 | ++p; | ||
266 | ++linecount; | ||
267 | } | ||
268 | } | ||
269 | // now we know how long it is. Lets split up the file | ||
270 | piecesize = linecount / cfg->split_count; | ||
271 | if (piecesize < cfg->split_minimum) | ||
272 | piecesize = cfg->split_minimum; | ||
273 | if (piecesize > cfg->split_maximum && cfg->split_maximum > 0) | ||
274 | piecesize = cfg->split_maximum; | ||
275 | if (piecesize > linecount) { | ||
276 | // File is smaller than piece size just add it back in as is | ||
277 | newfile = (config_filestat_t *)apr_array_push(cfg->input_files); | ||
278 | newfile->result = "Not Parsed"; | ||
279 | newfile->fname = filelist[f].fname; | ||
280 | } else { | ||
281 | //split apart the files | ||
282 | int cur_line = 0; | ||
283 | int file_count = 1; | ||
284 | int out_lines = 0; | ||
285 | const char *basefile, *file; | ||
286 | apr_file_t *outfile; | ||
287 | char trail[2048]; | ||
288 | apr_size_t trail_size = 0; | ||
289 | apr_size_t write; | ||
290 | apr_off_t off = 0; | ||
291 | |||
292 | apr_file_seek(infile, APR_SET, &off); | ||
293 | |||
294 | basefile = apr_pstrdup(tfp, basename(apr_pstrdup(tfp, filelist[f].fname))); | ||
295 | |||
296 | file = apr_psprintf(tfp, "%s/%s-%d", cfg->split_dir, basefile, file_count++); | ||
297 | logging_log(cfg, LOGLEVEL_NOTICE, "SPLITTER: Creating output file %s", file); | ||
298 | rv = apr_file_open(&outfile, file, APR_FOPEN_WRITE | APR_FOPEN_CREATE | APR_FOPEN_TRUNCATE, APR_OS_DEFAULT, tfp); | ||
299 | if (rv != APR_SUCCESS) { | ||
300 | logging_log(cfg, LOGLEVEL_NOISE, "SPLITTER: Could not open %s (%d)", file, rv); | ||
301 | return; | ||
302 | } | ||
303 | newfile = (config_filestat_t *)apr_array_push(cfg->input_files); | ||
304 | newfile->result = "Not Parsed"; | ||
305 | newfile->fname = apr_pstrdup(cfg->pool, file); | ||
306 | |||
307 | while (apr_file_eof(infile) == APR_SUCCESS) { | ||
308 | apr_size_t read = BUFFER_SIZE; | ||
309 | char *p, *pp, *buff_start; | ||
310 | apr_file_read(infile, buff, &read); | ||
311 | buff_start = p = pp = buff; | ||
312 | if (trail_size) { | ||
313 | p = memchr(p, '\n', (buff + read) - p); | ||
314 | if (p) { | ||
315 | //printf("Trail Line: %p, %p, %d\n", pp, p, (p - pp) + trail_size); | ||
316 | ++p; | ||
317 | pp = p; | ||
318 | ++cur_line; | ||
319 | ++out_lines; | ||
320 | // write out to file | ||
321 | apr_file_write(outfile, trail, &trail_size); | ||
322 | trail_size = 0; | ||
323 | } else { | ||
324 | if ((read + trail_size) > 2048) { | ||
325 | logging_log(cfg, LOGLEVEL_NOISE, "SPLITTER: Excessively long line %d in file %s", cur_line, filelist[f].fname); | ||
326 | exit(1); | ||
327 | } else { | ||
328 | memcpy(trail+trail_size, buff, read); | ||
329 | trail_size += read; | ||
330 | } | ||
331 | } | ||
332 | } | ||
333 | while ((p = memchr(p, '\n', (buff + read) - p))) { | ||
334 | //printf("Line: %p, %p, %d\n", pp, p, (p - pp)); | ||
335 | if (out_lines == piecesize) { | ||
336 | // Write out to file | ||
337 | write = pp - buff_start; | ||
338 | apr_file_write(outfile, buff_start, &write); | ||
339 | buff_start = pp; | ||
340 | out_lines = 0; | ||
341 | // Open new file | ||
342 | file = apr_psprintf(tfp, "%s/%s-%d", cfg->split_dir, basefile, file_count++); | ||
343 | logging_log(cfg, LOGLEVEL_NOTICE, "SPLITTER: Creating output file %s", file); | ||
344 | rv = apr_file_open(&outfile, file, APR_FOPEN_WRITE | APR_FOPEN_CREATE | APR_FOPEN_TRUNCATE, APR_OS_DEFAULT, tfp); | ||
345 | if (rv != APR_SUCCESS) { | ||
346 | logging_log(cfg, LOGLEVEL_NOISE, "SPLITTER: Could not open %s (%d)", file, rv); | ||
347 | return; | ||
348 | } | ||
349 | newfile = (config_filestat_t *)apr_array_push(cfg->input_files); | ||
350 | newfile->result = "Not Parsed"; | ||
351 | newfile->fname = apr_pstrdup(cfg->pool, file); | ||
352 | } | ||
353 | ++p; | ||
354 | pp = p; | ||
355 | ++cur_line; | ||
356 | ++out_lines; | ||
357 | } | ||
358 | // Write out to file | ||
359 | write = pp - buff_start; | ||
360 | apr_file_write(outfile, buff_start, &write); | ||
361 | |||
362 | trail_size = (buff+read) - pp; | ||
363 | if (trail_size) { | ||
364 | memcpy(trail, pp, trail_size); | ||
365 | } | ||
366 | } | ||
367 | } | ||
368 | } | ||
369 | apr_pool_destroy(tfp); | ||
370 | apr_pool_destroy(tp); | ||
371 | } | ||
372 | |||
373 | apr_status_t parser_logbadline(config_t *cfg, const char *filename, | ||
374 | const char *badline) | ||
375 | { | ||
376 | apr_status_t rv = APR_SUCCESS; | ||
377 | apr_size_t len; | ||
378 | struct iovec vec[5]; | ||
379 | |||
380 | if (cfg->badlinefile) { | ||
381 | if (!cfg->badline_fp) { | ||
382 | rv = apr_file_open(&cfg->badline_fp, cfg->badlinefile, | ||
383 | APR_FOPEN_CREATE | APR_FOPEN_WRITE | APR_FOPEN_APPEND, | ||
384 | APR_OS_DEFAULT, cfg->pool); | ||
385 | if (rv) { | ||
386 | logging_log(cfg, LOGLEVEL_NOISE, | ||
387 | "Error opening badline file %s\n", cfg->badlinefile); | ||
388 | cfg->badlinefile = NULL; | ||
389 | } | ||
390 | } | ||
391 | if (!rv) { | ||
392 | if (filename != cfg->badlastfile){ | ||
393 | char date[APR_RFC822_DATE_LEN]; | ||
394 | vec[0].iov_base = "Starting BadLines for \""; | ||
395 | vec[0].iov_len = sizeof("Starting BadLines for \"")-1; | ||
396 | vec[1].iov_base = (void *)filename; | ||
397 | vec[1].iov_len = strlen(filename); | ||
398 | vec[2].iov_base = "\" on "; | ||
399 | vec[2].iov_len = sizeof("\" on ")-1; | ||
400 | apr_rfc822_date(date, apr_time_now()); | ||
401 | vec[3].iov_base = date; | ||
402 | vec[3].iov_len = APR_RFC822_DATE_LEN-1; | ||
403 | vec[4].iov_base = "\n"; | ||
404 | vec[4].iov_len = 1; | ||
405 | apr_file_writev(cfg->badline_fp, vec,5, &len); | ||
406 | cfg->badlastfile = filename; | ||
407 | } | ||
408 | |||
409 | if ((++cfg->badline_count) > cfg->badlinemax) { | ||
410 | logging_log(cfg, LOGLEVEL_NOISE, | ||
411 | "Found more than %d bad lines (found %d)", | ||
412 | cfg->badlinemax, cfg->badline_count); | ||
413 | rv = APR_EINVAL; | ||
414 | } else { | ||
415 | vec[0].iov_base = (void *)badline; | ||
416 | vec[0].iov_len = strlen(badline); | ||
417 | vec[1].iov_base = "\n"; | ||
418 | vec[1].iov_len = 1; | ||
419 | apr_file_writev(cfg->badline_fp, vec,2, &len); | ||
420 | } | ||
421 | } | ||
422 | } | ||
423 | return rv; | ||
424 | } | ||
425 | |||
426 | /* | ||
427 | * Modified version of apr_tokenize_to_argv to add [] as quoting characters | ||
428 | * | ||
429 | * token_context: Context from which pool allocations will occur. | ||
430 | * arg_str: Input string for conversion to argv[]. | ||
431 | * argv_out: Output location. This is a pointer to an array | ||
432 | * of pointers to strings (ie. &(char *argv[]). | ||
433 | * This value will be allocated from the contexts | ||
434 | * pool and filled in with copies of the tokens | ||
435 | * found during parsing of the arg_str. | ||
436 | */ | ||
437 | apr_status_t parser_tokenize_line(const char *arg_str, char ***argv_out, | ||
438 | apr_pool_t *token_context) | ||
439 | { | ||
440 | const char *cp; | ||
441 | const char *ct; | ||
442 | char *cleaned, *dirty; | ||
443 | int escaped; | ||
444 | int isquoted, numargs = 0, argnum; | ||
445 | |||
446 | #define SKIP_WHITESPACE(cp) \ | ||
447 | for ( ; *cp == ' ' || *cp == '\t'; ) { \ | ||
448 | cp++; \ | ||
449 | }; | ||
450 | |||
451 | #define CHECK_QUOTATION(cp,isquoted) \ | ||
452 | isquoted = 0; \ | ||
453 | if (*cp == '"') { \ | ||
454 | isquoted = 1; \ | ||
455 | cp++; \ | ||
456 | } \ | ||
457 | else if (*cp == '\'') { \ | ||
458 | isquoted = 2; \ | ||
459 | cp++; \ | ||
460 | } \ | ||
461 | else if (*cp == '[') { \ | ||
462 | isquoted = 3; \ | ||
463 | cp++; \ | ||
464 | } | ||
465 | |||
466 | /* DETERMINE_NEXTSTRING: | ||
467 | * At exit, cp will point to one of the following: NULL, SPACE, TAB or QUOTE. | ||
468 | * NULL implies the argument string has been fully traversed. | ||
469 | */ | ||
470 | #define DETERMINE_NEXTSTRING(cp,isquoted) \ | ||
471 | for ( ; *cp != '\0'; cp++) { \ | ||
472 | if ( (*cp == '\\' && (*(cp+1) == ' ' || *(cp+1) == '\t' || \ | ||
473 | *(cp+1) == '"' || *(cp+1) == '\'' || \ | ||
474 | *(cp+1) == '[' || *(cp+1) == ']'))) { \ | ||
475 | cp++; \ | ||
476 | continue; \ | ||
477 | } \ | ||
478 | if ( (!isquoted && (*cp == ' ' || *cp == '\t')) \ | ||
479 | || (isquoted == 1 && *cp == '"') \ | ||
480 | || (isquoted == 2 && *cp == '\'') \ | ||
481 | || (isquoted == 3 && *cp == ']') \ | ||
482 | ) { \ | ||
483 | break; \ | ||
484 | } \ | ||
485 | } | ||
486 | |||
487 | /* REMOVE_ESCAPE_CHARS: | ||
488 | * Compresses the arg string to remove all of the '\' escape chars. | ||
489 | * The final argv strings should not have any extra escape chars in it. | ||
490 | */ | ||
491 | #define REMOVE_ESCAPE_CHARS(cleaned, dirty, escaped) \ | ||
492 | escaped = 0; \ | ||
493 | while(*dirty) { \ | ||
494 | if (!escaped && *dirty == '\\') { \ | ||
495 | escaped = 1; \ | ||
496 | } \ | ||
497 | else { \ | ||
498 | escaped = 0; \ | ||
499 | *cleaned++ = *dirty; \ | ||
500 | } \ | ||
501 | ++dirty; \ | ||
502 | } \ | ||
503 | *cleaned = 0; /* last line of macro... */ | ||
504 | |||
505 | cp = arg_str; | ||
506 | SKIP_WHITESPACE(cp); | ||
507 | ct = cp; | ||
508 | |||
509 | /* This is ugly and expensive, but if anyone wants to figure a | ||
510 | * way to support any number of args without counting and | ||
511 | * allocating, please go ahead and change the code. | ||
512 | * | ||
513 | * Must account for the trailing NULL arg. | ||
514 | */ | ||
515 | numargs = 1; | ||
516 | while (*ct != '\0') { | ||
517 | CHECK_QUOTATION(ct, isquoted) | ||
518 | ; | ||
519 | DETERMINE_NEXTSTRING(ct, isquoted); | ||
520 | if (*ct != '\0') { | ||
521 | ct++; | ||
522 | } | ||
523 | numargs++; | ||
524 | SKIP_WHITESPACE(ct); | ||
525 | } | ||
526 | *argv_out = apr_palloc(token_context, numargs * sizeof(char*)); | ||
527 | |||
528 | /* determine first argument */ | ||
529 | for (argnum = 0; argnum < (numargs-1); argnum++) { | ||
530 | SKIP_WHITESPACE(cp); | ||
531 | CHECK_QUOTATION(cp, isquoted) | ||
532 | ; | ||
533 | ct = cp; | ||
534 | DETERMINE_NEXTSTRING(cp, isquoted); | ||
535 | cp++; | ||
536 | (*argv_out)[argnum] = apr_palloc(token_context, cp - ct); | ||
537 | apr_cpystrn((*argv_out)[argnum], ct, cp - ct); | ||
538 | cleaned = dirty = (*argv_out)[argnum]; | ||
539 | REMOVE_ESCAPE_CHARS(cleaned, dirty, escaped) | ||
540 | ; | ||
541 | } | ||
542 | (*argv_out)[argnum] = NULL; | ||
543 | |||
544 | return APR_SUCCESS; | ||
545 | } | ||
546 | |||
547 | apr_status_t parser_parsefile(config_t *cfg, config_dbd_t *dbconn, | ||
548 | config_filestat_t *fstat) | ||
549 | { | ||
550 | apr_pool_t *tp, *targp; | ||
551 | apr_file_t *file; | ||
552 | apr_status_t rv; | ||
553 | char buff[2048]; | ||
554 | char readbuff[BUFFER_SIZE]; | ||
555 | char **targv; | ||
556 | int targc; | ||
557 | |||
558 | apr_pool_create(&tp, cfg->pool); | ||
559 | apr_pool_create(&targp, tp); | ||
560 | |||
561 | logging_log(cfg, LOGLEVEL_NOTICE, "PARSER: Begin Parsing Log File '%s'", fstat->fname); | ||
562 | |||
563 | rv = apr_file_open(&file, fstat->fname, APR_FOPEN_READ, APR_OS_DEFAULT, tp); | ||
564 | apr_file_buffer_set(file, readbuff, BUFFER_SIZE); | ||
565 | if (rv != APR_SUCCESS) { | ||
566 | logging_log(cfg, LOGLEVEL_NOISE, "PARSER: Could not open %s", fstat->fname); | ||
567 | return rv; | ||
568 | } | ||
569 | |||
570 | fstat->linesparsed = 0; | ||
571 | // Start Transaction | ||
572 | fstat->start = apr_time_now(); | ||
573 | if (!cfg->dryrun && database_trans_start(cfg, dbconn, tp)) { | ||
574 | fstat->result = "Database Transaction Error"; | ||
575 | fstat->stop = apr_time_now(); | ||
576 | return rv; | ||
577 | } | ||
578 | |||
579 | do { | ||
580 | rv = apr_file_gets(buff, 2048, file); | ||
581 | if (rv == APR_SUCCESS) { | ||
582 | int i,m, cont = 0; | ||
583 | config_filter_t *filters; | ||
584 | |||
585 | fstat->linesparsed++; | ||
586 | // chomp off newline | ||
587 | line_chomp(buff); | ||
588 | // Run line filters | ||
589 | for (i=0, m=cfg->linefilters->nelts, | ||
590 | filters = (config_filter_t *)cfg->linefilters->elts; | ||
591 | i<m; i++) { | ||
592 | if (!filters[i].regex || ap_regexec(filters[i].regex, buff, 0, NULL,0)==0) { | ||
593 | if (filters[i].negative) { | ||
594 | logging_log(cfg, LOGLEVEL_DEBUG, | ||
595 | "PARSER: LINEFILTER: Skipping Line %d due to Filter (%d)%s", | ||
596 | fstat->linesparsed, i, filters[i].filter); | ||
597 | fstat->lineskipped++; | ||
598 | cont = 1; | ||
599 | } else { | ||
600 | logging_log(cfg, LOGLEVEL_DEBUG, | ||
601 | "PARSER: LINEFILTER: Force Parsing Line %d due to Filter (%d)%s", | ||
602 | fstat->linesparsed, i, filters[i].filter); | ||
603 | } | ||
604 | break; | ||
605 | } | ||
606 | } | ||
607 | if (cont) continue; | ||
608 | |||
609 | apr_pool_clear(targp); | ||
610 | parser_tokenize_line(buff, &targv, targp); | ||
611 | targc = 0; | ||
612 | while (targv[targc]) | ||
613 | targc++; | ||
614 | rv = parser_processline(targp, cfg, dbconn, fstat, targv, targc); | ||
615 | if (rv != APR_SUCCESS) { | ||
616 | int i; | ||
617 | |||
618 | fstat->linesbad++; | ||
619 | rv = parser_logbadline(cfg, fstat->fname, buff); | ||
620 | if (rv) { | ||
621 | if (!cfg->dryrun) database_trans_abort(cfg, dbconn); | ||
622 | logging_log(cfg, LOGLEVEL_ERROR, "Line %d(%d): %s", fstat->linesparsed, | ||
623 | targc, buff); | ||
624 | for (i = 0; targv[i]; i++) { | ||
625 | logging_log(cfg, LOGLEVEL_ERROR, "Arg (%d): '%s'", i, | ||
626 | targv[i]); | ||
627 | } | ||
628 | } | ||
629 | } | ||
630 | } else { | ||
631 | rv = APR_SUCCESS; | ||
632 | break; | ||
633 | } | ||
634 | } while (rv == APR_SUCCESS); | ||
635 | apr_file_close(file); | ||
636 | // Finish Transaction | ||
637 | if (!cfg->dryrun && database_trans_stop(cfg, dbconn, tp)) { | ||
638 | fstat->result = apr_psprintf(cfg->pool, | ||
639 | "Input line %d, Database Transaction Error", | ||
640 | fstat->linesparsed); | ||
641 | } | ||
642 | |||
643 | apr_pool_destroy(tp); | ||
644 | logging_log(cfg, LOGLEVEL_NOTICE, | ||
645 | "PARSER: Finish Parsing Log File '%s'. Lines: (%d/%d)", | ||
646 | fstat->fname, fstat->linesparsed - fstat->lineskipped, fstat->linesparsed); | ||
647 | if (!rv) { | ||
648 | fstat->result = "File Parsed Succesfully"; | ||
649 | } | ||
650 | fstat->stop = apr_time_now(); | ||
651 | return rv; | ||
652 | } | ||
653 | |||
654 | apr_status_t parser_processline(apr_pool_t *ptemp, config_t *cfg, | ||
655 | config_dbd_t *dbconn, config_filestat_t *fstat, char **argv, int argc) | ||
656 | { | ||
657 | config_logformat_t *fmt; | ||
658 | config_logformat_field_t *ifields; | ||
659 | config_output_field_t *ofields; | ||
660 | config_filter_t *filters; | ||
661 | apr_table_t *datain; | ||
662 | apr_table_t *dataout; | ||
663 | apr_status_t rv= APR_SUCCESS; | ||
664 | int i,m; | ||
665 | |||
666 | fmt = apr_hash_get(cfg->log_formats, cfg->logformat, APR_HASH_KEY_STRING); | ||
667 | if (!fmt) { | ||
668 | logging_log(cfg, LOGLEVEL_NOISE, "PARSER: No Input Log format"); | ||
669 | return APR_EINVAL; | ||
670 | } | ||
671 | if (fmt->fields->nelts != argc) { | ||
672 | logging_log(cfg, LOGLEVEL_NOISE, | ||
673 | "PARSER: Input line field number differs from expected. Expected %d got %d.", | ||
674 | fmt->fields->nelts, argc); | ||
675 | fstat->result = apr_psprintf(cfg->pool, | ||
676 | "Input line %d is badly formatted (wrong number of fields)", | ||
677 | fstat->linesparsed); | ||
678 | return APR_EINVAL; | ||
679 | } | ||
680 | |||
681 | datain = apr_table_make(ptemp, fmt->fields->nelts); | ||
682 | dataout = apr_table_make(ptemp, cfg->output_fields->nelts); | ||
683 | |||
684 | ifields = (config_logformat_field_t *)fmt->fields->elts; | ||
685 | for (i=0; i<fmt->fields->nelts; i++) { | ||
686 | apr_table_setn(datain, ifields[i].name, argv[i]); | ||
687 | } | ||
688 | // Run Pre Filters | ||
689 | for (i=0, m=cfg->prefilters->nelts, | ||
690 | filters = (config_filter_t *)cfg->prefilters->elts; | ||
691 | i<m; i++) { | ||
692 | const char *temp = apr_table_get(datain, filters[i].field); | ||
693 | if (temp && (!filters[i].regex || ap_regexec(filters[i].regex, temp, 0, NULL,0)==0)) { | ||
694 | if (filters[i].negative) { | ||
695 | logging_log(cfg, LOGLEVEL_DEBUG, | ||
696 | "PARSER: PREFILTER: Skipping Line %d due to Filter (%d)%s", | ||
697 | fstat->linesparsed, i, filters[i].filter); | ||
698 | fstat->lineskipped++; | ||
699 | return APR_SUCCESS; | ||
700 | } else { | ||
701 | logging_log(cfg, LOGLEVEL_DEBUG, | ||
702 | "PARSER: PREFILTER: Force Parsing Line %d due to Filter (%d)%s", | ||
703 | fstat->linesparsed, i, filters[i].filter); | ||
704 | } | ||
705 | break; | ||
706 | } | ||
707 | } | ||
708 | |||
709 | ofields = (config_output_field_t *)cfg->output_fields->elts; | ||
710 | // clear out ofield function per-line data | ||
711 | memset(&g_parser_linedata[1],0,sizeof(void *)*(int)g_parser_linedata[0]); | ||
712 | // Convert input fields to output fields | ||
713 | for (i=0,m=cfg->output_fields->nelts; i<m; i++) { | ||
714 | const char *val; | ||
715 | val = apr_table_get(datain, ofields[i].source); | ||
716 | // If we can't find the source field just continue | ||
717 | if (!val && !(ofields[i].source[0]=='\0' && ofields[i].func)) { | ||
718 | apr_table_setn(dataout, ofields[i].field, ofields[i].def); | ||
719 | continue; | ||
720 | } | ||
721 | if (!ofields[i].func) { | ||
722 | apr_table_setn(dataout, ofields[i].field, val); | ||
723 | } else { | ||
724 | const char *ret= NULL; | ||
725 | rv = ((parser_func_t *)ofields[i].func)->func(ptemp, cfg, | ||
726 | &ofields[i], val, &ret); | ||
727 | if (rv) { | ||
728 | fstat->result = apr_psprintf(cfg->pool, | ||
729 | "Input line %d, Parser function %s returned error (%d)%s", | ||
730 | fstat->linesparsed, ofields[i].fname, rv, logging_strerror(rv)); | ||
731 | return rv; | ||
732 | } | ||
733 | apr_table_setn(dataout, ofields[i].field, ret ? ret : ofields[i].def); | ||
734 | } | ||
735 | } | ||
736 | |||
737 | // Run Post filters | ||
738 | for (i=0, m=cfg->postfilters->nelts, | ||
739 | filters = (config_filter_t *)cfg->postfilters->elts; | ||
740 | i<m; i++) { | ||
741 | const char *temp = apr_table_get(dataout, filters[i].field); | ||
742 | if (temp && (!filters[i].regex || ap_regexec(filters[i].regex, temp, 0, NULL,0)==0)) { | ||
743 | if (filters[i].negative) { | ||
744 | logging_log(cfg, LOGLEVEL_DEBUG, | ||
745 | "PARSER: POSTFILTER: Skipping Line %d due to Filter (%d)%s", | ||
746 | fstat->linesparsed, i, filters[i].filter); | ||
747 | fstat->lineskipped++; | ||
748 | return APR_SUCCESS; | ||
749 | } else { | ||
750 | logging_log(cfg, LOGLEVEL_DEBUG, | ||
751 | "PARSER: POSTFILTER: Force Parsing Line %d due to Filter (%d)%s", | ||
752 | fstat->linesparsed, i, filters[i].filter); | ||
753 | } | ||
754 | break; | ||
755 | } | ||
756 | } | ||
757 | |||
758 | // Process DB Query | ||
759 | if (!cfg->dryrun) { | ||
760 | rv = database_insert(cfg, dbconn, ptemp, dataout); | ||
761 | if (rv) { | ||
762 | fstat->result = apr_psprintf(cfg->pool, | ||
763 | "Input line %d, Database Error", | ||
764 | fstat->linesparsed); | ||
765 | } | ||
766 | } | ||
767 | return rv; | ||
768 | } | ||
diff --git a/utility/logparse.h b/utility/logparse.h new file mode 100644 index 0000000..7ca0958 --- /dev/null +++ b/utility/logparse.h | |||
@@ -0,0 +1,37 @@ | |||
1 | #ifndef LOGPARSE_H_ | ||
2 | #define LOGPARSE_H_ | ||
3 | |||
4 | #include "config.h" | ||
5 | |||
6 | typedef apr_status_t (*parser_func_f)(apr_pool_t *p, config_t *cfg, | ||
7 | config_output_field_t *field, const char *value, const char **ret); | ||
8 | |||
9 | struct parser_func_t { | ||
10 | parser_func_f func; | ||
11 | int pos; | ||
12 | void *data; | ||
13 | void ***linedata; | ||
14 | }; | ||
15 | |||
16 | #define parser_get_linedata(f) (*f->linedata)[f->pos] | ||
17 | |||
18 | #define parser_set_linedata(f, v) (*f->linedata)[f->pos] = v | ||
19 | |||
20 | parser_func_t *parser_get_func(const char *name); | ||
21 | |||
22 | void parser_init(apr_pool_t *p); | ||
23 | |||
24 | void parser_find_logs(config_t *cfg); | ||
25 | |||
26 | void parser_split_logs(config_t *cfg); | ||
27 | |||
28 | apr_status_t parser_tokenize_line(const char *arg_str, char ***argv_out, | ||
29 | apr_pool_t *token_context); | ||
30 | |||
31 | apr_status_t parser_parsefile(config_t *cfg, config_dbd_t *dbconn, | ||
32 | config_filestat_t *fstat); | ||
33 | |||
34 | apr_status_t parser_processline(apr_pool_t *ptemp, config_t *cfg, | ||
35 | config_dbd_t *dbconn, config_filestat_t *line, char **argv, int argc); | ||
36 | |||
37 | #endif /*LOGPARSE_H_*/ | ||
diff --git a/utility/mod_log_sql.conf b/utility/mod_log_sql.conf new file mode 100644 index 0000000..911fc18 --- /dev/null +++ b/utility/mod_log_sql.conf | |||
@@ -0,0 +1,70 @@ | |||
1 | InputDirectory ./logs | ||
2 | ErrorLog ./error_log | ||
3 | |||
4 | DBDDriver mysql | ||
5 | DBDParams "host=localhost;user=root;dbname=apache_log" | ||
6 | Table access_log | ||
7 | MachineID 7of9 | ||
8 | UseTransactions on | ||
9 | LogLevel notice | ||
10 | DryRun off | ||
11 | Summary on | ||
12 | |||
13 | SplitInput on | ||
14 | #SplitCount 4 | ||
15 | SplitMinLines 0 | ||
16 | SplitMaxLines 50000 | ||
17 | SplitDirectory ./split_temp | ||
18 | |||
19 | #ThreadCount 0 | ||
20 | |||
21 | BadLineFile ./badlines.log | ||
22 | BadLineMax 10 | ||
23 | |||
24 | LogFormatConfig CLF remhost String | ||
25 | LogFormatConfig CLF ident String | ||
26 | LogFormatConfig CLF user String | ||
27 | LogFormatConfig CLF date Date | ||
28 | LogFormatConfig CLF request String | ||
29 | LogFormatConfig CLF status Number | ||
30 | LogFormatConfig CLF bytes_sent Number | ||
31 | |||
32 | LogFormatConfig Combined remhost String | ||
33 | LogFormatConfig Combined ident String | ||
34 | LogFormatConfig Combined user String | ||
35 | LogFormatConfig Combined date Date | ||
36 | LogFormatConfig Combined request String | ||
37 | LogFormatConfig Combined status Number | ||
38 | LogFormatConfig Combined bytes_sent Number | ||
39 | LogFormatConfig Combined referer String | ||
40 | LogFormatConfig Combined agent String | ||
41 | |||
42 | LogFormat Combined | ||
43 | |||
44 | #Linefilter - "BAD" | ||
45 | #LineFilter "GOOD" | ||
46 | #LineFilter + "BETTER" | ||
47 | # the next filter ignores ALL lines | ||
48 | #LineFilter - | ||
49 | #PreFilter request - "Rebuild" | ||
50 | #PostFilter request_method "GET" | ||
51 | |||
52 | # Usage field datatype(size) default source [function [param]...] | ||
53 | OutputField bytes_sent int 0 bytes_sent | ||
54 | OutputField request_protocol varchar(10) "" request regexmatch "(HTTP/[\\d\\.]+)$" | ||
55 | OutputField remote_host varchar(50) "" remhost | ||
56 | OutputField request_method varchar(25) "" request regexmatch "^(\\w+)" | ||
57 | OutputField time_stamp int 0 date totimestamp | ||
58 | OutputField status smallint 0 status | ||
59 | OutputField request_line varchar(255) "" request | ||
60 | #OutputField request_uri varchar(255) "" request regexmatch "^\\w+ (.+) \\w+/[\\d\\.]+$" | ||
61 | OutputField remote_user varchar(50) "" user | ||
62 | OutputField remote_logname varchar(50) "" ident | ||
63 | OutputField request_time char(28) "" date wrap "[" "]" | ||
64 | #Only used for Combined log input, if standard CLF input, they are ignored | ||
65 | OutputField agent varchar(255) "" agent | ||
66 | OutputField referer varchar(255) "" referer | ||
67 | OutputField machine_id varchar(25) "" "" machineid | ||
68 | #VIZU Fields | ||
69 | OutputField poll_id int 0 request queryarg n "&;" | ||
70 | |||
diff --git a/utility/shell.c b/utility/shell.c new file mode 100644 index 0000000..1b9e890 --- /dev/null +++ b/utility/shell.c | |||
@@ -0,0 +1,342 @@ | |||
1 | #include "apr.h" | ||
2 | #include "apr_getopt.h" | ||
3 | #include "apr_tables.h" | ||
4 | |||
5 | #define APR_WANT_STDIO | ||
6 | #include "apr_want.h" | ||
7 | #include "stdlib.h" | ||
8 | |||
9 | #include "shell.h" | ||
10 | #include "config.h" | ||
11 | #include "logparse.h" | ||
12 | #include "database.h" | ||
13 | #include "util.h" | ||
14 | |||
15 | #if APR_HAS_THREADS | ||
16 | #include "apr_queue.h" | ||
17 | #include "apr_thread_pool.h" | ||
18 | |||
19 | static apr_queue_t *queue; | ||
20 | |||
21 | void run_multithreaded(config_t *cfg); | ||
22 | #endif | ||
23 | |||
24 | void run_singlethreaded(config_t *cfg); | ||
25 | |||
26 | const apr_getopt_option_t _opt_config[] = { | ||
27 | {"machineid", 'm', 1, "Machine ID for the log file"}, | ||
28 | {"transaction", 't', 1, "Use a Transaction (yes,no)"}, | ||
29 | {"logformat", 'r', 1, "Use this logformat to parse files"}, | ||
30 | {"file", 'f', 1, "Parse this single log file (input dir is NOT scanned)"}, | ||
31 | {"inputdir", 'i', 1, "Input Directory to look for log files"}, | ||
32 | {"config", 'c', 1, "Configuration file to use (default mod_log_sql.conf)"}, | ||
33 | {"dryrun", 'n', 0, "Perform a dry run (do not actually alter the databse)"}, | ||
34 | {"dump", 'd', 0, "Dump the configuration after parsing and quit"}, | ||
35 | {"loglevel", 'l', 1, "Log Level (deubg, notice, error)"}, | ||
36 | {"summary", 's', 1, "Summary (yes,no)"}, | ||
37 | {"threadcount", 'p', 1, "Set thread count (a number greater than 0)"}, | ||
38 | {"help", 'h', 0, "Show Help"}, | ||
39 | {NULL} | ||
40 | }; | ||
41 | |||
42 | void show_help(const char *prog, const apr_getopt_option_t *opts, FILE *output) | ||
43 | { | ||
44 | int ptr = 0; | ||
45 | fprintf(output, "Usage: %s [OPTIONS] [files...]\n\n", prog); | ||
46 | while (opts[ptr].optch != 0) { | ||
47 | if (opts[ptr].optch > 255) { | ||
48 | if (opts[ptr].name) { | ||
49 | fprintf(output, " --%-10s", opts[ptr].name); | ||
50 | } else { | ||
51 | fprintf(output, " "); | ||
52 | } | ||
53 | } else { | ||
54 | if (opts[ptr].name) { | ||
55 | fprintf(output, " -%c --%-10s", opts[ptr].optch, opts[ptr].name); | ||
56 | } else { | ||
57 | fprintf(output, " -%c ", opts[ptr].optch); | ||
58 | } | ||
59 | } | ||
60 | if (opts[ptr].has_arg) { | ||
61 | fprintf(output, " (arg)"); | ||
62 | } else { | ||
63 | fprintf(output, " "); | ||
64 | } | ||
65 | fprintf(output, " %s\n", opts[ptr].description); | ||
66 | ptr++; | ||
67 | } | ||
68 | } | ||
69 | |||
70 | void print_summary(config_t *cfg) { | ||
71 | config_filestat_t *fstat; | ||
72 | int i,m; | ||
73 | apr_time_t totaltime = 0; | ||
74 | apr_size_t totalparsed = 0, totalskipped = 0, totalbad = 0; | ||
75 | |||
76 | fstat = (config_filestat_t *)cfg->input_files->elts; | ||
77 | |||
78 | printf("Execution Summary\nParsed %d files\n", cfg->input_files->nelts); | ||
79 | for (i=0, m=cfg->input_files->nelts; i<m; i++) { | ||
80 | totaltime += fstat[i].stop - fstat[i].start; | ||
81 | totalparsed += fstat[i].linesparsed; | ||
82 | totalskipped += fstat[i].lineskipped; | ||
83 | totalbad += fstat[i].linesbad; | ||
84 | printf(" File: %s\n" | ||
85 | " Lines Added %'d out of %'d (Skipped %'d, Bad %'d)\n" | ||
86 | " Status: %s\n" | ||
87 | " Duration: %02"APR_TIME_T_FMT":%02"APR_TIME_T_FMT".%"APR_TIME_T_FMT" (minutes, seconds, and miliseconds)\n" | ||
88 | "\n", | ||
89 | fstat[i].fname, | ||
90 | fstat[i].linesparsed - fstat[i].lineskipped - fstat[i].linesbad, | ||
91 | fstat[i].linesparsed, | ||
92 | fstat[i].lineskipped, | ||
93 | fstat[i].linesbad, | ||
94 | fstat[i].result, | ||
95 | apr_time_sec(fstat[i].stop - fstat[i].start)/60, | ||
96 | apr_time_sec(fstat[i].stop - fstat[i].start) % 60, | ||
97 | apr_time_msec(fstat[i].stop - fstat[i].start) | ||
98 | ); | ||
99 | } | ||
100 | printf("Totals\n" | ||
101 | " Lines Added %'d out of %'d (Skipped %'d, Bad %'d)\n" | ||
102 | " Duration: %02"APR_TIME_T_FMT":%02"APR_TIME_T_FMT".%"APR_TIME_T_FMT" (minutes, seconds, and miliseconds)\n" | ||
103 | "\n", | ||
104 | totalparsed - totalskipped - totalbad, | ||
105 | totalparsed, | ||
106 | totalskipped, | ||
107 | totalbad, | ||
108 | apr_time_sec(totaltime)/60, | ||
109 | apr_time_sec(totaltime) % 60, | ||
110 | apr_time_msec(totaltime) | ||
111 | ); | ||
112 | } | ||
113 | |||
114 | int main(int argc, const char *const argv[]) | ||
115 | { | ||
116 | apr_pool_t *pool, *ptemp; | ||
117 | apr_getopt_t *opts; | ||
118 | int opt; | ||
119 | const char *opt_arg; | ||
120 | apr_status_t rv; | ||
121 | apr_table_t *args; | ||
122 | config_t *cfg; | ||
123 | |||
124 | apr_app_initialize(&argc, &argv, NULL); | ||
125 | atexit(apr_terminate); | ||
126 | |||
127 | if (apr_pool_create(&pool, NULL) != APR_SUCCESS) { | ||
128 | fprintf(stderr, "Failed to create memory pool!\n"); | ||
129 | exit(1); | ||
130 | } | ||
131 | apr_pool_create(&ptemp, NULL); | ||
132 | |||
133 | /** Iterate over command line arguments | ||
134 | * shoving args in a apr_table for processing later*/ | ||
135 | args = apr_table_make(ptemp, 5); | ||
136 | apr_table_setn(args, "config", "mod_log_sql.conf"); | ||
137 | apr_getopt_init(&opts, ptemp, argc, argv); | ||
138 | while ((rv = apr_getopt_long(opts, _opt_config, &opt, &opt_arg)) == APR_SUCCESS) { | ||
139 | switch (opt) { | ||
140 | case 'c': | ||
141 | apr_table_setn(args,"config",opt_arg); | ||
142 | break; | ||
143 | case 'd': | ||
144 | apr_table_setn(args,"dump","yes"); | ||
145 | break; | ||
146 | case 'f': | ||
147 | apr_table_setn(args,"inputfile",opt_arg); | ||
148 | break; | ||
149 | case 'h': | ||
150 | show_help(argv[0], _opt_config, stdout); | ||
151 | exit(1); | ||
152 | break; | ||
153 | case 'i': | ||
154 | apr_table_setn(args,"inputdirectory",opt_arg); | ||
155 | break; | ||
156 | case 'l': | ||
157 | apr_table_setn(args,"loglevel",opt_arg); | ||
158 | break; | ||
159 | case 'm': | ||
160 | apr_table_setn(args,"machineid",opt_arg); | ||
161 | break; | ||
162 | case 'n': | ||
163 | apr_table_setn(args,"dryrun","yes"); | ||
164 | break; | ||
165 | case 'p': | ||
166 | apr_table_setn(args,"threadcount",opt_arg); | ||
167 | break; | ||
168 | case 'r': | ||
169 | apr_table_setn(args,"logformat",opt_arg); | ||
170 | break; | ||
171 | case 's': | ||
172 | apr_table_setn(args,"summary",opt_arg); | ||
173 | break; | ||
174 | case 't': | ||
175 | apr_table_setn(args,"usetransactions",opt_arg); | ||
176 | break; | ||
177 | } | ||
178 | } | ||
179 | if (rv != APR_EOF) { | ||
180 | show_help(argv[0], _opt_config, stderr); | ||
181 | exit(1); | ||
182 | } | ||
183 | // Check if no extra args were passed | ||
184 | if (opts->ind != opts->argc) { | ||
185 | show_help(argv[0], _opt_config, stderr); | ||
186 | fprintf(stderr, "\n%s: Extra unknown arguments passed\n\n",argv[0]); | ||
187 | exit(1); | ||
188 | } | ||
189 | |||
190 | // Initialize sub systems | ||
191 | parser_init(pool); | ||
192 | config_init(pool); | ||
193 | database_init(pool); | ||
194 | // Process configuration file | ||
195 | cfg = config_create(pool); | ||
196 | // initialize STD out error log | ||
197 | logging_preinit(cfg); | ||
198 | rv = config_read(cfg, apr_table_get(args,"Config"), args); | ||
199 | apr_pool_destroy(ptemp); | ||
200 | |||
201 | // Initialize Log system AFTER we parse the configuration | ||
202 | logging_init(cfg); | ||
203 | |||
204 | if (APR_STATUS_IS_ENOENT(rv)) { | ||
205 | logging_log(cfg,LOGLEVEL_NOISE,"Could not load configuration file: %s",apr_table_get(args,"config")); | ||
206 | } else if (rv) { | ||
207 | exit(1); | ||
208 | } | ||
209 | if (cfg->dump) { | ||
210 | config_dump(cfg); | ||
211 | exit(0); | ||
212 | } | ||
213 | |||
214 | if (config_check(cfg)) { | ||
215 | logging_log(cfg,LOGLEVEL_NOISE, "Please correct the configuration"); | ||
216 | exit(1); | ||
217 | } | ||
218 | |||
219 | // Only Find files IF no filename was passed via the command line | ||
220 | if (apr_is_empty_array(cfg->input_files)) { | ||
221 | parser_find_logs(cfg); | ||
222 | } | ||
223 | if (!apr_is_empty_array(cfg->input_files)) { | ||
224 | parser_split_logs(cfg); | ||
225 | #if APR_HAS_THREADS | ||
226 | if (cfg->thread_count > 0) { | ||
227 | run_multithreaded(cfg); | ||
228 | } else { | ||
229 | #endif | ||
230 | run_singlethreaded(cfg); | ||
231 | #if APR_HAS_THREADS | ||
232 | } | ||
233 | #endif | ||
234 | } else { | ||
235 | logging_log(cfg,LOGLEVEL_NOISE,"No log files found to parse"); | ||
236 | } | ||
237 | |||
238 | if (cfg->summary) { | ||
239 | print_summary(cfg); | ||
240 | } | ||
241 | return 0; | ||
242 | } | ||
243 | |||
244 | void run_singlethreaded(config_t *cfg) | ||
245 | { | ||
246 | config_filestat_t *filelist; | ||
247 | config_dbd_t *dbconn = NULL; | ||
248 | int f, l; | ||
249 | apr_status_t rv; | ||
250 | |||
251 | if (!cfg->dryrun) { | ||
252 | if ((rv = database_connect(cfg, &dbconn))) { | ||
253 | logging_log(cfg,LOGLEVEL_NOISE, "Error Connecting to Database"); | ||
254 | exit(1); | ||
255 | } | ||
256 | } | ||
257 | |||
258 | filelist = (config_filestat_t *)cfg->input_files->elts; | ||
259 | for (f=0, l=cfg->input_files->nelts; f < l; f++) { | ||
260 | rv = parser_parsefile(cfg, dbconn, &filelist[f]); | ||
261 | if (rv) { | ||
262 | logging_log(cfg, LOGLEVEL_NOISE, | ||
263 | "Error occured parsing log files. Aborting"); | ||
264 | break; | ||
265 | } | ||
266 | } | ||
267 | |||
268 | if (!cfg->dryrun) { | ||
269 | database_disconnect(dbconn); | ||
270 | } | ||
271 | } | ||
272 | |||
273 | #if APR_HAS_THREADS | ||
274 | void * APR_THREAD_FUNC run_filethread(apr_thread_t *thd, void *data) | ||
275 | { | ||
276 | config_t *cfg = data; | ||
277 | config_dbd_t *dbconn = NULL; | ||
278 | config_filestat_t *fileentry; | ||
279 | apr_status_t rv; | ||
280 | |||
281 | if (!cfg->dryrun) { | ||
282 | if ((rv = database_connect(cfg, &dbconn))) { | ||
283 | logging_log(cfg,LOGLEVEL_NOISE, "Error Connecting to Database"); | ||
284 | return NULL; | ||
285 | } | ||
286 | } | ||
287 | |||
288 | while (1) { | ||
289 | rv = apr_queue_pop(queue, (void **)&fileentry); | ||
290 | if (rv == APR_EINTR) | ||
291 | continue; | ||
292 | if (rv == APR_EOF) | ||
293 | break; | ||
294 | rv = parser_parsefile(cfg, dbconn, fileentry); | ||
295 | if (rv) { | ||
296 | logging_log(cfg, LOGLEVEL_NOISE, | ||
297 | "Error occured parsing log file %s", fileentry->fname); | ||
298 | } | ||
299 | } | ||
300 | |||
301 | if (!cfg->dryrun) { | ||
302 | database_disconnect(dbconn); | ||
303 | } | ||
304 | return NULL; | ||
305 | } | ||
306 | |||
307 | void run_multithreaded(config_t *cfg) | ||
308 | { | ||
309 | logging_log(cfg, LOGLEVEL_NOISE, "Running Multithreaded"); | ||
310 | |||
311 | config_filestat_t *filelist; | ||
312 | int f, l; | ||
313 | apr_status_t rv; | ||
314 | apr_pool_t *tp; | ||
315 | apr_thread_pool_t *thrp; | ||
316 | unsigned int count; | ||
317 | |||
318 | apr_pool_create(&tp, cfg->pool); | ||
319 | rv = apr_queue_create(&queue, cfg->input_files->nelts, tp); | ||
320 | |||
321 | rv = apr_thread_pool_create(&thrp, 0, cfg->thread_count, tp); | ||
322 | |||
323 | //populate queue | ||
324 | filelist = (config_filestat_t *)cfg->input_files->elts; | ||
325 | for (f=0, l=cfg->input_files->nelts; f < l; f++) { | ||
326 | rv = apr_queue_push(queue, &filelist[f]); | ||
327 | } | ||
328 | // populate the worker threads | ||
329 | for (f=0; f<cfg->thread_count; f++) { | ||
330 | rv = apr_thread_pool_push(thrp, run_filethread, cfg, 0, NULL); | ||
331 | } | ||
332 | |||
333 | do { | ||
334 | apr_sleep(apr_time_from_sec(1)); | ||
335 | count = apr_queue_size(queue); | ||
336 | } while (count > 0); | ||
337 | |||
338 | rv = apr_queue_term(queue); | ||
339 | |||
340 | rv = apr_thread_pool_destroy(thrp); | ||
341 | } | ||
342 | #endif | ||
diff --git a/utility/shell.h b/utility/shell.h new file mode 100644 index 0000000..e69de29 --- /dev/null +++ b/utility/shell.h | |||
diff --git a/utility/util.c b/utility/util.c new file mode 100644 index 0000000..dcfb028 --- /dev/null +++ b/utility/util.c | |||
@@ -0,0 +1,189 @@ | |||
1 | #include "util.h" | ||
2 | #include "apr_strings.h" | ||
3 | #include "apr_lib.h" | ||
4 | #include "apr_file_io.h" | ||
5 | #include "apr_time.h" | ||
6 | |||
7 | #include "config.h" | ||
8 | |||
9 | #include <stdarg.h> | ||
10 | |||
11 | char *lowerstr(apr_pool_t *pool, const char *input) | ||
12 | { | ||
13 | char *temp; | ||
14 | char *itr; | ||
15 | temp = apr_pstrdup(pool, input); | ||
16 | for (itr=temp; *itr!='\0'; itr++) { | ||
17 | *itr = apr_tolower(*itr); | ||
18 | } | ||
19 | return temp; | ||
20 | } | ||
21 | |||
22 | void line_chomp(char *str) | ||
23 | { | ||
24 | int len; | ||
25 | // chomp off newline | ||
26 | len = strlen(str); | ||
27 | if (len) { | ||
28 | while (str[len-1] == '\r' || str[len-1] == '\n') { | ||
29 | str[len-1] = '\0'; | ||
30 | len--; | ||
31 | } | ||
32 | } | ||
33 | } | ||
34 | |||
35 | /* | ||
36 | * *** Ripped from HTTPD util.c (why are so many PORTABLE things not in APR UTIL?) | ||
37 | */ | ||
38 | static char x2c(const char *what) | ||
39 | { | ||
40 | register char digit; | ||
41 | |||
42 | digit = ((what[0] >= 'A') ? ((what[0] & 0xdf) - 'A') + 10 | ||
43 | : (what[0] - '0')); | ||
44 | digit *= 16; | ||
45 | digit += (what[1] >= 'A' ? ((what[1] & 0xdf) - 'A') + 10 | ||
46 | : (what[1] - '0')); | ||
47 | return (digit); | ||
48 | } | ||
49 | |||
50 | /* | ||
51 | * *** Ripped from HTTPD util.c (why are so many PORTABLE things not in APR UTIL?) | ||
52 | * | ||
53 | * Unescapes a URL, leaving reserved characters intact. | ||
54 | * Returns 0 on success, non-zero on error | ||
55 | * Failure is due to | ||
56 | * bad % escape returns HTTP_BAD_REQUEST | ||
57 | * | ||
58 | * decoding %00 or a forbidden character returns HTTP_NOT_FOUND | ||
59 | */ | ||
60 | static int unescape_url(char *url, const char *forbid, const char *reserved) | ||
61 | { | ||
62 | register int badesc, badpath; | ||
63 | char *x, *y; | ||
64 | |||
65 | badesc = 0; | ||
66 | badpath = 0; | ||
67 | /* Initial scan for first '%'. Don't bother writing values before | ||
68 | * seeing a '%' */ | ||
69 | y = strchr(url, '%'); | ||
70 | if (y == NULL) { | ||
71 | return APR_SUCCESS; | ||
72 | } | ||
73 | for (x = y; *y; ++x, ++y) { | ||
74 | if (*y != '%') { | ||
75 | *x = *y; | ||
76 | } | ||
77 | else { | ||
78 | if (!apr_isxdigit(*(y + 1)) || !apr_isxdigit(*(y + 2))) { | ||
79 | badesc = 1; | ||
80 | *x = '%'; | ||
81 | } | ||
82 | else { | ||
83 | char decoded; | ||
84 | decoded = x2c(y + 1); | ||
85 | if ((decoded == '\0') | ||
86 | || (forbid && strchr(forbid, decoded))) { | ||
87 | badpath = 1; | ||
88 | *x = decoded; | ||
89 | y += 2; | ||
90 | } | ||
91 | else if (reserved && strchr(reserved, decoded)) { | ||
92 | *x++ = *y++; | ||
93 | *x++ = *y++; | ||
94 | *x = *y; | ||
95 | } | ||
96 | else { | ||
97 | *x = decoded; | ||
98 | y += 2; | ||
99 | } | ||
100 | } | ||
101 | } | ||
102 | } | ||
103 | *x = '\0'; | ||
104 | if (badesc) { | ||
105 | return APR_EINVAL; | ||
106 | } | ||
107 | else if (badpath) { | ||
108 | return APR_EINVAL; | ||
109 | } | ||
110 | else { | ||
111 | return APR_SUCCESS; | ||
112 | } | ||
113 | } | ||
114 | |||
115 | /* | ||
116 | * *** Ripped from HTTPD util.c (why are so many PORTABLE things not in APR UTIL?) | ||
117 | */ | ||
118 | int ap_unescape_url(char *url) | ||
119 | { | ||
120 | /* Traditional */ | ||
121 | #ifdef CASE_BLIND_FILESYSTEM | ||
122 | return unescape_url(url, "/\\", NULL); | ||
123 | #else | ||
124 | return unescape_url(url, "/", NULL); | ||
125 | #endif | ||
126 | } | ||
127 | |||
128 | void logging_preinit(config_t *cfg) | ||
129 | { | ||
130 | apr_pool_create(&cfg->errorlog_p, cfg->pool); | ||
131 | apr_file_open_stderr(&cfg->errorlog_fperr, cfg->pool); | ||
132 | } | ||
133 | |||
134 | void logging_init(config_t *cfg) | ||
135 | { | ||
136 | apr_status_t rv; | ||
137 | if (cfg->errorlog) { | ||
138 | rv = apr_file_open(&cfg->errorlog_fp, cfg->errorlog, | ||
139 | APR_FOPEN_CREATE | APR_FOPEN_WRITE | APR_FOPEN_APPEND, | ||
140 | APR_OS_DEFAULT, | ||
141 | cfg->pool); | ||
142 | if (rv) { | ||
143 | printf("Error opening %s\n",cfg->errorlog); | ||
144 | cfg->loglevel = LOGLEVEL_NONE; | ||
145 | } | ||
146 | logging_log(cfg, LOGLEVEL_ERROR, "Log file Opened"); | ||
147 | } else { | ||
148 | cfg->loglevel = LOGLEVEL_NONE; | ||
149 | logging_log(cfg, LOGLEVEL_NOISE, "No Log file specified, disabled logging"); | ||
150 | } | ||
151 | } | ||
152 | |||
153 | const char *logging_strerror(apr_status_t rv) | ||
154 | { | ||
155 | char buff[256]; | ||
156 | return apr_strerror(rv, buff, 256); | ||
157 | } | ||
158 | |||
159 | void logging_log(config_t *cfg, loglevel_e level, const char *fmt, ...) | ||
160 | { | ||
161 | va_list ap; | ||
162 | char date[APR_RFC822_DATE_LEN]; | ||
163 | struct iovec vec[4]; | ||
164 | apr_size_t blen; | ||
165 | |||
166 | if (cfg->loglevel < level) return; | ||
167 | |||
168 | va_start(ap, fmt); | ||
169 | apr_pool_clear(cfg->errorlog_p); | ||
170 | |||
171 | apr_rfc822_date(date, apr_time_now()); | ||
172 | vec[0].iov_base = date; | ||
173 | vec[0].iov_len = APR_RFC822_DATE_LEN-1; | ||
174 | vec[1].iov_base = " "; | ||
175 | vec[1].iov_len = 2; | ||
176 | vec[2].iov_base = apr_pvsprintf(cfg->errorlog_p, fmt, ap); | ||
177 | vec[2].iov_len = strlen(vec[2].iov_base); | ||
178 | vec[3].iov_base = "\n"; | ||
179 | vec[3].iov_len = 1; | ||
180 | |||
181 | if (level == LOGLEVEL_NOISE) { | ||
182 | apr_file_writev(cfg->errorlog_fperr,&vec[2],2,&blen); | ||
183 | } | ||
184 | if (cfg->loglevel > LOGLEVEL_NONE && cfg->errorlog_fp) { | ||
185 | apr_file_writev(cfg->errorlog_fp,vec,4,&blen); | ||
186 | } | ||
187 | |||
188 | va_end(ap); | ||
189 | } | ||
diff --git a/utility/util.h b/utility/util.h new file mode 100644 index 0000000..a5a7f7e --- /dev/null +++ b/utility/util.h | |||
@@ -0,0 +1,26 @@ | |||
1 | #ifndef UTIL_H_ | ||
2 | #define UTIL_H_ | ||
3 | |||
4 | #include "apr_pools.h" | ||
5 | |||
6 | #include "config.h" | ||
7 | |||
8 | char *lowerstr(apr_pool_t *pool, const char *input); | ||
9 | |||
10 | /** | ||
11 | * Chomp new line characters off the end of the line | ||
12 | */ | ||
13 | void line_chomp(char *str); | ||
14 | |||
15 | int ap_unescape_url(char *url); | ||
16 | |||
17 | void logging_preinit(config_t *cfg); | ||
18 | |||
19 | void logging_init(config_t *cfg); | ||
20 | |||
21 | void logging_log(config_t *cfg, loglevel_e level, const char *fmt, ...) | ||
22 | __attribute__((format(printf, 3, 4))); | ||
23 | |||
24 | const char *logging_strerror(apr_status_t rv); | ||
25 | |||
26 | #endif /*UTIL_H_*/ | ||