📄 parse.c
字号:
/*** Modular Logfile Analyzer** Copyright 2000 Jan Kneschke <jan@kneschke.de>**** Homepage: http://www.kneschke.de/projekte/modlogan** This program is free software; you can redistribute it and/or modify it under the terms of the GNU General Public License as published by the Free Software Foundation; either version 2 of the License, or (at your option) any later version, and provided that the above copyright and permission notice is included with all distributed copies of this or derived software. This program is distributed in the hope that it will be useful, but WITHOUT ANY WARRANTY; without even the implied warranty of MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU General Public License for more details. You should have received a copy of the GNU General Public License along with this program; if not, write to the Free Software Foundation, Inc., 59 Temple Place - Suite 330, Boston, MA 02111-1307, USA**** $Id: parse.c,v 1.26 2001/01/11 22:34:14 jk Exp $*/#include <stdlib.h>#include <stdio.h>#include <string.h>#include <time.h>#include <ctype.h>#include <errno.h>#include "config.h"#ifdef HAVE_LIBADNS#include <adns.h>#endif#include "mlocale.h"#include "mplugins.h"#include "mrecord.h"#include "mdatatypes.h"#include "misc.h"#include "plugin_config.h"const char *short_month[] = { "Jan", "Feb", "Mar", "Apr", "May", "Jun", "Jul", "Aug", "Sep", "Oct", "Nov", "Dec", NULL};int find_os (mconfig *ext_conf, char *str) { config_input *conf = ext_conf->input; mlist *l = conf->match_os; if (!str || !l) return 0; while (*str == ' ') str++; while (l) { data_Match *data = (data_Match *)l->data; if (data && strmatch(data->match, str)) {#if 0 printf("OS found: %s\n", str);#endif return 1; } l = l->next; } return 0;}int find_ua (mconfig *ext_conf, char *str) { config_input *conf = ext_conf->input; mlist *l = conf->match_ua; if (!str || !l) return 0; while (*str == ' ') str++; while (l) { data_Match *data = (data_Match *)l->data; if (data && strmatch(data->match, str)) {#if 0 printf("UA found: %s\n", str);#endif return 1; } l = l->next; } return 0;}int parse_timestamp(mconfig *ext_conf, const char *str, mlogrec *record) {#define N 20 + 1 int ovector[3 * N], n, i; char buf[10]; struct tm tm; config_input *conf = ext_conf->input; if ((n = pcre_exec(conf->match_timestamp, conf->match_timestamp_extra, str, strlen(str), 0, 0, ovector, 3 * N)) < 0) { if (n == PCRE_ERROR_NOMATCH) { fprintf(stderr, "%s.%d: string doesn't match: %s\n", __FILE__, __LINE__, str); } else { fprintf(stderr, "%s.%d: execution error while matching: %d\n", __FILE__, __LINE__, n); } return -1; } /* everything has matched, take the different pieces and be happy :) */ pcre_copy_substring(str, ovector, n, 1, buf, sizeof(buf)); tm.tm_mday = strtol(buf, NULL, 10); pcre_copy_substring(str, ovector, n, 2, buf, sizeof(buf)); for (i = 0; short_month[i];i++) { if (!strcmp(buf, short_month[i])) { tm.tm_mon = i; } } pcre_copy_substring(str, ovector, n, 3, buf, sizeof(buf)); tm.tm_year = strtol(buf, NULL, 10)-1900; pcre_copy_substring(str, ovector, n, 4, buf, sizeof(buf)); tm.tm_hour = strtol(buf, NULL, 10); pcre_copy_substring(str, ovector, n, 5, buf, sizeof(buf)); tm.tm_min = strtol(buf, NULL, 10); pcre_copy_substring(str, ovector, n, 6, buf, sizeof(buf)); tm.tm_sec = strtol(buf, NULL, 10); record->timestamp = mktime (&tm); return 0;#undef N}int parse_useragent(mconfig *ext_conf,const char *str, mlogrec_web_extclf *record) {/* get user agent */ char *pc1 = (char *)str, *pc3, *pc2 = (char *)str, *buf_copy; buf_copy = malloc(strlen(str)+1); strcpy(buf_copy, str); if ((pc3 = strchr(pc1, '(') )) { if (strstr(pc3, "compatible")) { int finished = 0; pc1 = pc2 = (pc3+1); while (!finished) { while (*pc2 && !(*pc2 == ';' || *pc2 == ')')) pc2++; if (!*pc2) { if (ext_conf->debug_level > 0) fprintf(stderr, "%s: '%s'\n", _("the 'Useragent' field of the logfile is incorrect"),buf_copy); free(buf_copy); return -1; } else if (*pc2 == ')') { finished = 1; } while (*pc1 == ' ') pc1++; *pc2 = '\0'; if (!record->req_useragent && find_ua(ext_conf, pc1)) { record->req_useragent = malloc(pc2-pc1+1); strcpy(record->req_useragent, pc1); } else if (!record->req_useros && find_os(ext_conf, pc1)) { record->req_useros = malloc(pc2-pc1+1); strcpy(record->req_useros, pc1); } pc1 = ++pc2; } } else { int finished = 0; pc2 = pc3; *pc2 = '\0'; if (!find_ua(ext_conf, pc1)) {// printf("UA- unknown: %s\n", pc4); } record->req_useragent = malloc(pc2-pc1+1); strcpy(record->req_useragent, pc1); pc1 = pc2 = (pc3+1); while (!finished) { while (*pc2 && !(*pc2 == ';' || *pc2 == ')')) pc2++; if (!*pc2) { if (ext_conf->debug_level > 0) fprintf(stderr, "%s: '%s'\n", _("the 'Useragent' field of the logfile is incorrect"),buf_copy); free(buf_copy); return -1; } else if (*pc2 == ')') { finished = 1; } while (*pc1 == ' ') pc1++; *pc2 = '\0'; if (!record->req_useros && find_os(ext_conf, pc1)) { record->req_useros = malloc(strlen(pc1)+1); strcpy(record->req_useros, pc1); } pc1 = ++pc2; } }#if 0 if (!record->req_useragent) { printf("UA unknown: %s\n", pc4); } if (!record->req_useros) { printf("OS unknown: %s\n", pc4); }#endif } else { record->req_useragent = malloc(strlen(str)+1); strcpy(record->req_useragent, str); } free(buf_copy); return 0;}int parse_url(mconfig *ext_conf,const char *str, mlogrec_web *record) {#define N 20 + 1 int ovector[3 * N], n;#ifdef DEBUG_INPUT int i;#endif config_input *conf = ext_conf->input; const char **list; if ((n = pcre_exec(conf->match_url, conf->match_url_extra, str, strlen(str), 0, 0, ovector, 3 * N)) < 0) { if (n == PCRE_ERROR_NOMATCH) { fprintf(stderr, "%s.%d: string doesn't match: %s\n", __FILE__, __LINE__, str); } else { fprintf(stderr, "%s.%d: execution error while matching: %d\n", __FILE__, __LINE__, n); } return -1; } if (n >= 3) { /* everything has matched, take the different pieces and be happy :) */ pcre_get_substring_list(str, ovector, n, &list); record->req_method = malloc(strlen((char *)list[1])+1); strcpy(record->req_method, (char *)list[1]); record->req_url = malloc(strlen((char *)list[2])+1); strcpy(record->req_url, (char *)list[2]); if (n >= 4) { if (strlen((char *)list[4])) { record->req_getvars = malloc(strlen((char *)list[4])+1); strcpy(record->req_getvars, (char *)list[4]); } } if (n >= 6) { record->req_protocol = malloc(strlen((char *)list[6])+1); strcpy(record->req_protocol, (char *)list[6]); }#ifdef DEBUG_INPUT for (i = 0; i < n ; i++) { printf("--> %d: %s\n", i, list[i]); } fprintf(stderr, "%s.%d: %s, %s, %s, %s\n", __FILE__, __LINE__, record->req_method, record->req_url, record->req_getvars, record->req_protocol);#endif free(list); } else { fprintf(stderr, "%s.%d: Matched fields below minimum: %d\n", __FILE__, __LINE__, n); return -1; } return 0;#undef N}int parse_referrer(mconfig *ext_conf,const char *str, mlogrec_web_extclf *record) {#define N 20 + 1 int ovector[3 * N], n; config_input *conf = ext_conf->input; const char **list; if ((n = pcre_exec(conf->match_referrer, conf->match_referrer_extra, str, strlen(str), 0, 0, ovector, 3 * N)) < 0) { if (n == PCRE_ERROR_NOMATCH) { fprintf(stderr, "%s.%d: string doesn't match: %s\n", __FILE__, __LINE__, str); } else { fprintf(stderr, "%s.%d: execution error while matching: %d\n", __FILE__, __LINE__, n); } return -1; } if (n >= 2) { /* everything has matched, take the different pieces and be happy :) */ pcre_get_substring_list(str, ovector, n, &list); record->ref_url = malloc(strlen((char *)list[1])+1); strcpy(record->ref_url, (char *)list[1]); if (n > 3) { record->ref_getvars = malloc(strlen((char *)list[3])+1); strcpy(record->ref_getvars, (char *)list[3]); }#ifdef DEBUG_INPUT fprintf(stderr, "%s.%d: %s, %s\n", __FILE__, __LINE__, record->ref_url, record->ref_getvars);#endif free(list); } else { fprintf(stderr, "%s.%d: Matched fields below minimum: %d\n", __FILE__, __LINE__, n); return -1; } return 0;#undef N}int parse_record_pcre(mconfig *ext_conf, mlogrec *record, char *_buffer) {#define N 20 + 1 const char **list; int ovector[3 * N], n; config_input *conf = ext_conf->input; int endpos; mlogrec_web *recweb = NULL; record->ext_type = M_RECORD_TYPE_WEB; record->ext = mrecord_init_web(); recweb = record->ext; if (recweb == NULL) return -1; if (strncmp("format=", _buffer, 7) == 0) { fprintf(stderr, "%s.%d: detected a NetScape Server Log - perhaps it goes wrong\n", __FILE__, __LINE__); fprintf(stderr, "%s.%d: bitch the developer for real Netscape support\n", __FILE__, __LINE__); }/* parse a CLF record */ if ((n = pcre_exec(conf->match_clf, conf->match_clf_extra, _buffer, strlen(_buffer), 0, 0, ovector, 3 * N)) < 0) { if (n == PCRE_ERROR_NOMATCH) { fprintf(stderr, "%s.%d: string doesn't match: %s\n", __FILE__, __LINE__, _buffer); } else { fprintf(stderr, "%s.%d: execution error while matching: %d\n", __FILE__, __LINE__, n); } return -1; } if (n >= 7) { pcre_get_substring_list(_buffer, ovector, n, &list); recweb->req_host = malloc(strlen((char *)list[1])+1); strcpy(recweb->req_host, (char *)list[1]); recweb->req_user = malloc(strlen((char *)list[3])+1); strcpy(recweb->req_user, (char *)list[3]); if (parse_timestamp(ext_conf, list[4], record) == -1) { free(list); return -1; } if (parse_url(ext_conf, list[5], recweb) == -1) { free(list); return -1; } recweb->req_status = strtol(list[6], NULL,10); recweb->xfersize = strtol(list[7], NULL,10); free(list); } else { fprintf(stderr, "%s.%d: Matched fields below minimum: %d\n", __FILE__, __LINE__, n); return -1; } endpos = ovector[ (n-1)*2 + 1 ];/* try to get the extended log fields */ n = pcre_exec(conf->match_clf_extended, conf->match_clf_extended_extra, _buffer, strlen(_buffer), endpos, 0, ovector, 3 * N); if (n < 0 && n != PCRE_ERROR_NOMATCH) { fprintf(stderr, "%s.%d: execution error while matching: %d\n", __FILE__, __LINE__, n); return -1; } else if (n == 3) { mlogrec_web_extclf *recext; recext = mrecord_init_web_extclf(); if (recext != NULL) { pcre_get_substring_list(_buffer, ovector, n, &list);#ifdef DEBUG_INPUT fprintf(stderr, "-elf-1-> %s, %s\n", list[1],list[2]);#endif if (parse_referrer(ext_conf, list[1], recext) == -1) { mrecord_free_web_extclf(recext); free(list); return 0; } if (parse_useragent(ext_conf, list[2], recext) == -1) { mrecord_free_web_extclf(recext); free(list);
⌨️ 快捷键说明
复制代码
Ctrl + C
搜索代码
Ctrl + F
全屏模式
F11
切换主题
Ctrl + Shift + D
显示快捷键
?
增大字号
Ctrl + =
减小字号
Ctrl + -