added an import utility

This commit is contained in:
SJ 2011-12-30 15:52:59 +01:00
parent 89a83df4fb
commit 1b57459f89
11 changed files with 216 additions and 13 deletions

View File

@ -33,7 +33,7 @@ MAKE = `which make`
INSTALL = @INSTALL@ INSTALL = @INSTALL@
all: libpiler.a piler pilerconf pilerget test all: libpiler.a piler pilerconf pilerget pilerimport test
install: install-piler install: install-piler
@ -51,6 +51,9 @@ libpiler.a: $(OBJS) $(MYSQL_OBJS)
pilerget: pilerget.c cfg.o misc.o tai.o store.o attachment.o digest.o pilerget: pilerget.c cfg.o misc.o tai.o store.o attachment.o digest.o
$(CC) $(CFLAGS) $(INCDIR) $(DEFS) -o $@ $^ $(LIBS) $(LIBDIR) $(CC) $(CFLAGS) $(INCDIR) $(DEFS) -o $@ $^ $(LIBS) $(LIBDIR)
pilerimport: pilerimport.c libpiler.a
$(CC) $(CFLAGS) $(INCDIR) $(DEFS) -o $@ $^ -lpiler $(LIBS) $(LIBDIR)
pilerconf: pilerconf.c cfg.o misc.o tai.o pilerconf: pilerconf.c cfg.o misc.o tai.o
$(CC) $(CFLAGS) $(INCDIR) $(DEFS) -o $@ $^ $(LIBDIR) $(CC) $(CFLAGS) $(INCDIR) $(DEFS) -o $@ $^ $(LIBDIR)
@ -79,7 +82,7 @@ install-piler:
$(INSTALL) -m 0755 pilerget $(DESTDIR)$(bindir) $(INSTALL) -m 0755 pilerget $(DESTDIR)$(bindir)
clean: clean:
rm -f *.o *.a libpiler.so* piler pilerconf pilerget pilertest rm -f *.o *.a libpiler.so* piler pilerconf pilerget pilerimport pilertest
distclean: clean distclean: clean
rm -f Makefile rm -f Makefile

View File

@ -98,7 +98,7 @@ int store_attachments(struct session_data *sdata, struct _state *state, struct _
bind[4].buffer_type = MYSQL_TYPE_STRING; bind[4].buffer_type = MYSQL_TYPE_STRING;
bind[4].buffer = state->attachments[i].type; bind[4].buffer = state->attachments[i].type;
bind[4].is_null = 0; bind[4].is_null = 0;
len[4] = strlen(state->attachments[i].digest); bind[4].length = &len[4]; len[4] = strlen(state->attachments[i].type); bind[4].length = &len[4];
bind[5].buffer_type = MYSQL_TYPE_LONG; bind[5].buffer_type = MYSQL_TYPE_LONG;
bind[5].buffer = (char *)&(state->attachments[i].size); bind[5].buffer = (char *)&(state->attachments[i].size);

View File

@ -151,7 +151,7 @@ struct session_data {
char ttmpfile[SMALLBUFSIZE], tmpframe[SMALLBUFSIZE], tre, restored_copy; char ttmpfile[SMALLBUFSIZE], tmpframe[SMALLBUFSIZE], tre, restored_copy;
char mailfrom[SMALLBUFSIZE], rcptto[MAX_RCPT_TO][SMALLBUFSIZE], client_addr[SMALLBUFSIZE]; char mailfrom[SMALLBUFSIZE], rcptto[MAX_RCPT_TO][SMALLBUFSIZE], client_addr[SMALLBUFSIZE];
char acceptbuf[SMALLBUFSIZE]; char acceptbuf[SMALLBUFSIZE];
char whitelist[MAXBUFSIZE], blacklist[MAXBUFSIZE]; char attachments[SMALLBUFSIZE];
int fd, hdr_len, tot_len, num_of_rcpt_to, rav; int fd, hdr_len, tot_len, num_of_rcpt_to, rav;
int need_scan; int need_scan;
float __acquire, __parsed, __av, __store, __compress, __encrypt; float __acquire, __parsed, __av, __store, __compress, __encrypt;

View File

@ -117,8 +117,8 @@ int store_index_data(struct session_data *sdata, struct _state *state, uint64 id
char *subj, s[SMALLBUFSIZE]; char *subj, s[SMALLBUFSIZE];
MYSQL_STMT *stmt; MYSQL_STMT *stmt;
MYSQL_BIND bind[4]; MYSQL_BIND bind[5];
unsigned long len[4]; unsigned long len[5];
subj = state->b_subject; subj = state->b_subject;
if(*subj == ' ') subj++; if(*subj == ' ') subj++;
@ -131,7 +131,7 @@ int store_index_data(struct session_data *sdata, struct _state *state, uint64 id
} }
snprintf(s, sizeof(s)-1, "INSERT INTO %s (`id`, `from`, `to`, `subject`, `body`, `arrived`, `sent`, `size`, `attachments`) values(%llu,?,?,?,?,%ld,%ld,%d,%d)", SQL_SPHINX_TABLE, id, sdata->now, sdata->sent, sdata->tot_len, state->n_attachments); snprintf(s, sizeof(s)-1, "INSERT INTO %s (`id`, `from`, `to`, `subject`, `body`, `arrived`, `sent`, `size`, `attachments`, `attachment_types`) values(%llu,?,?,?,?,%ld,%ld,%d,%d,?)", SQL_SPHINX_TABLE, id, sdata->now, sdata->sent, sdata->tot_len, state->n_attachments);
if(mysql_stmt_prepare(stmt, s, strlen(s))){ if(mysql_stmt_prepare(stmt, s, strlen(s))){
@ -166,6 +166,11 @@ int store_index_data(struct session_data *sdata, struct _state *state, uint64 id
bind[3].is_null = 0; bind[3].is_null = 0;
len[3] = strlen(state->b_body); bind[3].length = &len[3]; len[3] = strlen(state->b_body); bind[3].length = &len[3];
bind[4].buffer_type = MYSQL_TYPE_STRING;
bind[4].buffer = sdata->attachments;
bind[4].is_null = 0;
len[4] = strlen(sdata->attachments); bind[4].length = &len[3];
if(mysql_stmt_bind_param(stmt, bind)){ if(mysql_stmt_bind_param(stmt, bind)){
syslog(LOG_PRIORITY, "%s: %s.mysql_stmt_bind_param() error: %s", sdata->ttmpfile, SQL_SPHINX_TABLE, mysql_stmt_error(stmt)); syslog(LOG_PRIORITY, "%s: %s.mysql_stmt_bind_param() error: %s", sdata->ttmpfile, SQL_SPHINX_TABLE, mysql_stmt_error(stmt));

View File

@ -18,7 +18,7 @@
struct _state parse_message(struct session_data *sdata, struct __config *cfg){ struct _state parse_message(struct session_data *sdata, struct __config *cfg){
FILE *f; FILE *f;
char buf[MAXBUFSIZE]; char *p, buf[MAXBUFSIZE];
struct _state state; struct _state state;
int i, len; int i, len;
@ -58,6 +58,11 @@ struct _state parse_message(struct session_data *sdata, struct __config *cfg){
fixupEncodedHeaderLine(state.attachments[i].filename); fixupEncodedHeaderLine(state.attachments[i].filename);
if(cfg->verbosity >= _LOG_DEBUG) syslog(LOG_PRIORITY, "%s: attachment list: i:%d, name=*%s*, type: *%s*, size: %d, int.name: %s, digest: %s", sdata->ttmpfile, i, state.attachments[i].filename, state.attachments[i].type, state.attachments[i].size, state.attachments[i].internalname, state.attachments[i].digest); if(cfg->verbosity >= _LOG_DEBUG) syslog(LOG_PRIORITY, "%s: attachment list: i:%d, name=*%s*, type: *%s*, size: %d, int.name: %s, digest: %s", sdata->ttmpfile, i, state.attachments[i].filename, state.attachments[i].type, state.attachments[i].size, state.attachments[i].internalname, state.attachments[i].digest);
p = determine_attachment_type(state.attachments[i].filename, state.attachments[i].type);
len = strlen(p);
if(strlen(sdata->attachments) < SMALLBUFSIZE-len-1) memcpy(&(sdata->attachments[strlen(sdata->attachments)]), p, len);
} }

View File

@ -27,5 +27,6 @@ void reassembleToken(char *p);
void degenerateToken(unsigned char *p); void degenerateToken(unsigned char *p);
void fixURL(char *url); void fixURL(char *url);
int extractNameFromHeaderLine(char *s, char *name, char *resultbuf); int extractNameFromHeaderLine(char *s, char *name, char *resultbuf);
char *determine_attachment_type(char *filename, char *type);
#endif /* _PARSER_H */ #endif /* _PARSER_H */

View File

@ -591,4 +591,49 @@ int extractNameFromHeaderLine(char *s, char *name, char *resultbuf){
} }
char *determine_attachment_type(char *filename, char *type){
char *p;
if(strncasecmp(type, "text/", strlen("text/")) == 0) return "text,";
if(strncasecmp(type, "image/", strlen("image/")) == 0) return "image,";
if(strncasecmp(type, "audio/", strlen("audio/")) == 0) return "audio,";
if(strncasecmp(type, "video/", strlen("video/")) == 0) return "video,";
if(strncasecmp(type, "text/x-card", strlen("text/x-card")) == 0) return "vcard,";
if(strncasecmp(type, "application/pdf", strlen("application/pdf")) == 0) return "pdf,";
if(strncasecmp(type, "application/msword", strlen("application/msword")) == 0) return "word,";
if(strncasecmp(type, "application/vnd.ms-excel", strlen("application/vnd.ms-excel")) == 0) return "excel,";
if(strncasecmp(type, "application/vnd.ms-powerpoint", strlen("application/vnd.ms-powerpoint")) == 0) return "powerpoint,";
if(strncasecmp(type, "application/x-shockwave-flash", strlen("application/x-shockwave-flash")) == 0) return "flash,";
if(strcasestr(type, "opendocument")) return "odf,";
if(strcasecmp(type, "application/octet-stream") == 0){
p = strrchr(type, '.');
if(p){
p++;
if(strncasecmp(p, "zip", 3) == 0) return "compressed,";
if(strncasecmp(p, "rar", 3) == 0) return "compressed,";
if(strncasecmp(p, "doc", 3) == 0) return "word,";
if(strncasecmp(p, "docx", 4) == 0) return "word,";
if(strncasecmp(p, "xls", 3) == 0) return "excel,";
if(strncasecmp(p, "xlsx", 4) == 0) return "excel,";
if(strncasecmp(p, "ppt", 3) == 0) return "powerpoint,";
if(strncasecmp(p, "pptx", 4) == 0) return "powerpoint,";
if(strncasecmp(p, "png", 3) == 0) return "image,";
if(strncasecmp(p, "gif", 3) == 0) return "image,";
if(strncasecmp(p, "jpg", 3) == 0) return "image,";
if(strncasecmp(p, "jpeg", 4) == 0) return "image,";
if(strncasecmp(p, "tiff", 4) == 0) return "image,";
}
}
return "other,";
}

142
src/pilerimport.c Normal file
View File

@ -0,0 +1,142 @@
/*
* pilerimport.c, SJ
*/
#include <stdio.h>
#include <stdlib.h>
#include <string.h>
#include <sys/time.h>
#include <sys/types.h>
#include <sys/stat.h>
#include <sys/stat.h>
#include <unistd.h>
#include <time.h>
#include <locale.h>
#include <syslog.h>
#include <piler.h>
int import_message(char *filename, struct session_data *sdata, struct __data *data, struct __config *cfg){
int i, rc=ERR;
char *rule;
struct stat st;
struct _state state;
if(stat(filename, &st) != 0){
printf("cannot read: %s\n", filename);
return rc;
}
create_id(&(sdata->ttmpfile[0]));
printf("a: %s\n", sdata->ttmpfile);
link(filename, sdata->ttmpfile);
sdata->num_of_rcpt_to = -1;
memset(sdata->rcptto[0], 0, SMALLBUFSIZE);
time(&(sdata->now));
sdata->sent = 0;
sdata->hdr_len = 0;
sdata->tot_len = st.st_size;
memset(sdata->attachments, 0, SMALLBUFSIZE);
snprintf(sdata->tmpframe, SMALLBUFSIZE-1, "%s.m", sdata->ttmpfile);
state = parse_message(sdata, cfg);
rule = check_againt_ruleset(data->rules, &state, st.st_size);
if(rule){
printf("discarding %s by archiving policy: %s\n", filename, rule);
rc = OK;
goto ENDE;
}
printf("message-id: %s\n", state.message_id);
printf("from: *%s*\n", state.b_from);
printf("to: *%s*\n", state.b_to);
printf("subject: *%s*\n", state.b_subject);
make_digests(sdata, cfg);
printf("hdr len: %d\n", sdata->hdr_len);
printf("body digest: %s\n", sdata->bodydigest);
for(i=1; i<=state.n_attachments; i++){
printf("i:%d, name=*%s*, type: *%s*, size: %d, int.name: %s, digest: %s\n", i, state.attachments[i].filename, state.attachments[i].type, state.attachments[i].size, state.attachments[i].internalname, state.attachments[i].digest);
}
printf("attachments:%s\n", sdata->attachments);
printf("\n\n");
rc = processMessage(sdata, &state, cfg);
ENDE:
unlink(sdata->ttmpfile);
unlink(sdata->tmpframe);
if(rc == ERR) return rc;
if(rc == ERR_EXISTS) printf("discarding duplicate message: %s\n", sdata->ttmpfile);
return OK;
}
int main(int argc, char **argv){
int rc;
struct session_data sdata;
struct __config cfg;
struct __data data;
if(argc < 2){
printf("usage: %s <message>\n", argv[0]);
exit(1);
}
cfg = read_config(CONFIG_FILE);
if(read_key(&cfg)){
printf("%s\n", ERR_READING_KEY);
return 1;
}
mysql_init(&(sdata.mysql));
mysql_options(&(sdata.mysql), MYSQL_OPT_CONNECT_TIMEOUT, (const char*)&cfg.mysql_connect_timeout);
if(mysql_real_connect(&(sdata.mysql), cfg.mysqlhost, cfg.mysqluser, cfg.mysqlpwd, cfg.mysqldb, cfg.mysqlport, cfg.mysqlsocket, 0) == 0){
printf("cant connect to mysql server\n");
return 0;
}
mysql_real_query(&(sdata.mysql), "SET NAMES utf8", strlen("SET NAMES utf8"));
mysql_real_query(&(sdata.mysql), "SET CHARACTER SET utf8", strlen("SET CHARACTER SET utf8"));
printf("locale: %s\n", setlocale(LC_MESSAGES, cfg.locale));
setlocale(LC_CTYPE, cfg.locale);
data.rules = NULL;
load_archiving_rules(&sdata, &(data.rules));
rc = import_message(argv[1], &sdata, &data, &cfg);
free_rule(data.rules);
mysql_close(&(sdata.mysql));
return 0;
}

View File

@ -502,8 +502,7 @@ void initSessionData(struct session_data *sdata){
memset(sdata->mailfrom, 0, SMALLBUFSIZE); memset(sdata->mailfrom, 0, SMALLBUFSIZE);
snprintf(sdata->client_addr, SMALLBUFSIZE-1, "null"); snprintf(sdata->client_addr, SMALLBUFSIZE-1, "null");
memset(sdata->whitelist, 0, MAXBUFSIZE); memset(sdata->attachments, 0, SMALLBUFSIZE);
memset(sdata->blacklist, 0, MAXBUFSIZE);
sdata->restored_copy = 0; sdata->restored_copy = 0;

View File

@ -62,6 +62,7 @@ int main(int argc, char **argv){
sdata.sent = 0; sdata.sent = 0;
sdata.tot_len = st.st_size; sdata.tot_len = st.st_size;
memset(sdata.rcptto[0], 0, SMALLBUFSIZE); memset(sdata.rcptto[0], 0, SMALLBUFSIZE);
memset(sdata.attachments, 0, SMALLBUFSIZE);
snprintf(sdata.ttmpfile, SMALLBUFSIZE-1, "%s", argv[1]); snprintf(sdata.ttmpfile, SMALLBUFSIZE-1, "%s", argv[1]);
snprintf(sdata.tmpframe, SMALLBUFSIZE-1, "%s.m", argv[1]); snprintf(sdata.tmpframe, SMALLBUFSIZE-1, "%s.m", argv[1]);
@ -90,6 +91,7 @@ int main(int argc, char **argv){
printf("i:%d, name=*%s*, type: *%s*, size: %d, int.name: %s, digest: %s\n", i, state.attachments[i].filename, state.attachments[i].type, state.attachments[i].size, state.attachments[i].internalname, state.attachments[i].digest); printf("i:%d, name=*%s*, type: *%s*, size: %d, int.name: %s, digest: %s\n", i, state.attachments[i].filename, state.attachments[i].type, state.attachments[i].size, state.attachments[i].internalname, state.attachments[i].digest);
} }
printf("attachments:%s\n", sdata.attachments);
printf("\n\n"); printf("\n\n");

View File

@ -1,4 +1,4 @@
create database `piler` character set 'utf8'; create database if not exists `piler` character set 'utf8';
use `piler`; use `piler`;
@ -21,6 +21,7 @@ create table if not exists `sph_index` (
`body` text, `body` text,
`size` int default '0', `size` int default '0',
`attachments` int default 0, `attachments` int default 0,
`attachment_types` text(512) default null,
primary key (`id`) primary key (`id`)
) Engine=InnoDB; ) Engine=InnoDB;
@ -121,11 +122,11 @@ drop table if exists `counter`;
create table if not exists `counter` ( create table if not exists `counter` (
`rcvd` bigint unsigned default 0, `rcvd` bigint unsigned default 0,
`virus` bigint unsigned default 0, `virus` bigint unsigned default 0,
`duplicate` bigint unsigned default 0 `duplicate` bigint unsigned default 0,
`ignore` bigint unsigned default 0 `ignore` bigint unsigned default 0
) Engine=InnoDB; ) Engine=InnoDB;
insert into `counter` values(0, 0, 0); insert into `counter` values(0, 0, 0, 0);
drop table if exists `search`; drop table if exists `search`;