piler/unit_tests/check_parser_utils.c

296 lines
14 KiB
C
Raw Normal View History

2015-11-27 12:17:19 +01:00
/*
* check_parser_utils.c, SJ
*/
#include "test.h"
2015-11-27 12:17:19 +01:00
struct date_test {
char date_str[SMALLBUFSIZE];
time_t timestamp;
};
struct name_from_header_test {
char line[SMALLBUFSIZE];
char *token;
char *expected_result;
};
struct str_pair {
char line[SMALLBUFSIZE];
char *expected_result;
};
static void test_parse_date_header(){
2016-04-05 21:10:09 +02:00
unsigned int i;
struct config cfg;
2015-11-27 12:17:19 +01:00
struct date_test date_test[] = {
{"Date: Mon, 02 Nov 2015 09:39:31 -0000", 1446457171},
{"Date: Mon, 2 Nov 2015 10:39:45 +0100", 1446457185},
{"Date: Sun, 1 Nov 2015 17:23:07 +0100 (CET)", 1446394987},
{"Date: 3 Nov 2015 15:19:30 +0100", 1446560370},
{"Date: Mon, 3 Feb 2014 13:21:07 +0100", 1391430067},
{"Date: Sat, 4 Aug 2007 13:36:52 GMT-0700", 1186256212},
{"Date: Sat, 4 Aug 07 13:36:52 GMT-0700", 1186256212},
{"Date: 16 Dec 07 20:45:52", 1197837952},
{"Date: 03 Jun 06 05:59:00 +0100", 1149307140},
{"Date: 30.06.2005 17:47:42", 1120150062},
{"Date: 03-Feb-2014 08:09:10", 1391414950},
{"Date: 13 Mar 2013 14:56:02 UTC", 1363186562}
};
cfg = read_config("test.conf");
setlocale(LC_MESSAGES, cfg.locale);
setlocale(LC_CTYPE, cfg.locale);
TEST_HEADER();
for(i=0; i<sizeof(date_test)/sizeof(struct date_test); i++){
time_t delta = parse_date_header(date_test[i].date_str) - date_test[i].timestamp;
ASSERT(delta <= 3600 && delta >= -3600, date_test[i].date_str);
2015-11-27 12:17:19 +01:00
}
TEST_FOOTER();
2015-11-27 12:17:19 +01:00
}
static void test_extractNameFromHeaderLine(){
2016-04-05 21:10:09 +02:00
unsigned int i;
2015-11-27 12:17:19 +01:00
char resultbuf[SMALLBUFSIZE];
struct name_from_header_test name_from_header_test[] = {
{"Content-Type: text/plain; charset=UTF-8", "charset", "UTF-8"},
{"Content-Type: text/plain; charset=\"utf-8\"", "charset", "utf-8"},
{"Content-Type: text/plain; charset=us-ascii", "charset", "us-ascii"},
{"Content-Type: text/plain; charset=\"iso-8859-2\"", "charset", "iso-8859-2"},
{"Content-Type: text/calendar; method=REQUEST; charset=\"utf-8\"", "charset", "utf-8"},
{"Content-Type: text/plain; charset=\"utf-8\"; format=flowed", "charset", "utf-8"},
{"Content-Type: text/calendar; charset=\"utf-8\"; method=CANCEL", "charset", "utf-8"},
{"Content-Type: text/plain; format=flowed; charset=\"US-ASCII\"", "charset", "US-ASCII"},
{"Content-Type: text/plain; charset=\"UTF-8\"; format=flowed", "charset", "UTF-8"},
{"Content-Type: multipart/alternative; charset=\"UTF-8\"; boundary=\"b1_8c387891290303ff3c6ca75c8e238b54\"", "charset", "UTF-8"},
{"Content-Type: TEXT/PLAIN; format=flowed; charset=US-ASCII", "charset", "US-ASCII"},
{"Content-Type: message/delivery-status; name=\"Delivery report\"", "name", "Delivery report"},
{"Content-Disposition: attachment; filename=\"Delivery report\"; size=1193;", "name", "Delivery report"},
{"Content-Disposition: attachment; filename=\"AAAAA_ABC_150924.xls\"", "name", "AAAAA_ABC_150924.xls"},
{"Content-Type: image/jpeg; name=\"image001.jpg\"", "name", "image001.jpg"},
{"Content-Disposition: inline; filename=\"image001.jpg\"; size=5403;", "name", "image001.jpg"},
{"Content-Type: application/octet-stream; name=xxxxxDrRestoreGUI.log", "name", "xxxxxDrRestoreGUI.log"},
{"Content-Disposition: inline; filename=\"Legjobb_Munkahely_Felmeres_2012.jpg\"", "name", "Legjobb_Munkahely_Felmeres_2012.jpg"},
{"Content-Type: image/png; name=\"=?iso-8859-2?Q?N=E9vtelen.png?=\"", "name", "Névtelen.png"},
{"Content-Type: application/msword; name=", "name", ""},
{"Content-Disposition: attachment; filename=", "name", ""},
{"Content-Disposition: attachment; filename=\"NDA - Suto - 20151109.pdf\";", "name", "NDA - Suto - 20151109.pdf"},
{"Content-Type: image/png; name=\"Screenshot from 2015-11-10 10:07:13.png\"", "name", "Screenshot from 2015-11-10 10:07:13.png"},
{"Content-Disposition: attachment; filename=\"zzzzz Email Examples.zip\";", "name", "zzzzz Email Examples.zip"},
{"Content-Type: application/msword; name*=\"iso-8859-1''Einverst%E4ndniserkl%E4rung_Kids-PKW_Familienname.doc\"", "name", "Einverständniserklärung_Kids-PKW_Familienname.doc"},
{"Content-Type: application/msword; name*= \"iso-8859-1''Einverst%E4ndniserkl%E4rung_Kids-PKW_Familienname.doc\"", "name", "Einverständniserklärung_Kids-PKW_Familienname.doc"},
// This one sucks, and I don't think it's a proper definition
{"Content-Type: application/msword; filename*=utf-8''P;LAN%20Holden%204.docx;filename=\"P;LAN Holden 4.docx\"", "name", "P"},
// Adding quotes makes it acceptable to the parser
{"Content-Type: application/msword; filename*=\"utf-8''P;LAN%20Holden%204.docx\";filename=\"P;LAN Holden 4.docx\"", "name", "P;LAN Holden 4.docx"},
{"Content-Type: null; name=\"toDev-Netengineering.png\"", "name", "toDev-Netengineering.png"},
{"Content-Type: null; name=\"toDev-name-Netengineering.png\"", "name", "toDev-name-Netengineering.png"},
{"Content-Type: null; name*=\"iso-8859-1''toDev-Netengineering.png\"", "name", "toDev-Netengineering.png"},
{"Content-Type: null; name*=\"iso-8859-1''toDev-name-Netengineering.png\"", "name", "toDev-name-Netengineering.png"},
{"Content-Type: null; name*=\"iso-8859-1''toDevnameNetengineering.png\"", "name", "toDevnameNetengineering.png"},
{"Content-Type: null; name*=\"iso-8859-1''toDev-namE-Netengineering.png\"", "name", "toDev-namE-Netengineering.png"},
2015-11-27 12:17:19 +01:00
{"foo: bar; title=Economy", "title", "Economy"},
{"foo: bar; title=\"US-$ rates\"", "title", "US-$ rates"},
{"foo: bar; title*=iso-8859-1'en'%A3%20rates", "title", "£ rates"},
{"foo: bar; title*=UTF-8''%c2%a3%20and%20%e2%82%ac%20rates", "title", "£ and € rates"},
2015-11-27 12:17:19 +01:00
};
TEST_HEADER();
2015-11-27 12:17:19 +01:00
for(i=0; i<sizeof(name_from_header_test)/sizeof(struct name_from_header_test); i++){
extractNameFromHeaderLine(name_from_header_test[i].line, name_from_header_test[i].token, resultbuf, SMALLBUFSIZE);
ASSERT(strcmp(resultbuf, name_from_header_test[i].expected_result) == 0, name_from_header_test[i].expected_result);
2015-11-27 12:17:19 +01:00
}
TEST_FOOTER();
2015-11-27 12:17:19 +01:00
}
static void test_fixupEncodedHeaderLine(){
2016-04-05 21:10:09 +02:00
unsigned int i;
2015-11-27 12:17:19 +01:00
char buf[SMALLBUFSIZE];
struct str_pair pair[] = {
{"=?utf-8?Q?Tanjoubi,_azaz_sz=C3=BClet=C3=A9snap!_10_=C3=A9ves_az_I_Love_Su?= =?utf-8?Q?shi!?=", "Tanjoubi, azaz születésnap! 10 éves az I Love Sushi!"},
2015-11-27 12:17:19 +01:00
{"=?UTF-8?Q?IAM:_N2YPF_-_#1_Request_new_privilege?=", "IAM: N2YPF - #1 Request new privilege"},
{"=?UTF-8?B?SG9neWFuIMOtcmp1bmsgcGFuYXN6bGV2ZWxldD8=?=", "Hogyan írjunk panaszlevelet?"},
{"Re: [Bitbucket] Issue #627: ldap user can't login (jsuto/piler)", "Re: [Bitbucket] Issue #627: ldap user can't login (jsuto/piler)"},
{"=?iso-8859-2?Q?RE:_test.aaa.fu_z=F3na?=", "RE: test.aaa.fu zóna"},
{"=?iso-8859-2?Q?V=E1ltoz=E1s_az_IT_szervezetben_/_Personal_changes_in_the_?=", "Változás az IT szervezetben / Personal changes in the "},
{"Re: AAAmil /29 UZ736363", "Re: AAAmil /29 UZ736363"},
2015-11-27 12:17:19 +01:00
{"=?UTF-8?Q?[JIRA]_Created:_(HUDSS-196)_T=C5=B1zfal_?=", "[JIRA] Created: (HUDSS-196) Tűzfal "},
{"=?iso-8859-2?Q?RE:_Baptista_Szeretetszolg=E1lat?=", "RE: Baptista Szeretetszolgálat"},
{"=?iso-8859-2?B?SXR0IGF6IE1OQiBuYWd5IGRvYuFzYTogaXNt6XQgYmVsZW55+mxuYWsgYSBoaXRlbGV66XNiZSAoMjAxNS4xMS4wMy4gLSBzakBhY3RzLmh1KQ==?=", "Itt az MNB nagy dobása: ismét belenyúlnak a hitelezésbe (2015.11.03. - sj@acts.hu)"},
{"=?UTF-8?B?TGludXggQURNSU4gaG96esOhZsOpcsOpc2Vr?=", "Linux ADMIN hozzáférések"},
{"Burn 14 Calories a Minute with This Workout!", "Burn 14 Calories a Minute with This Workout!"},
{"=?utf-8?Q?Help=20Net=20Security=20Newsletter=20=2D=20=20November=203rd=202015?=", "Help Net Security Newsletter - November 3rd 2015"},
{"=?ISO-8859-2?Q?Re=3A_kimen=F5_levelez=E9si_probl=E9ma_-_cscs=40aaaaa=2Efu?=", "Re: kimenő levelezési probléma - cscs@aaaaa.fu"},
{"Re: cccc@aaa.fu - e-mail =?UTF-8?B?a8OpcmTDqXM=?=", "Re: cccc@aaa.fu - e-mail kérdés"},
{"=?WINDOWS-1250?Q?<AZ-17226/1-2015>=20www.xxxxx.com=20new=20virtual=20?=", "<AZ-17226/1-2015> www.xxxxx.com new virtual "},
{"Re: FW: =?ISO-8859-2?Q?Sopron-Gy=F5r_optikai_sz=E1l_probl=E9?=", "Re: FW: Sopron-Győr optikai szál problé"},
{"=?UTF-8?Q?Megh=C3=ADv=C3=B3=20a=20Pulzus=20felm=C3=A9r=C3=A9sre=20/=20Inv?= =?UTF-8?Q?itation=20to=20the=20Pulse=20Survey?=", "Meghívó a Pulzus felmérésre / Invitation to the Pulse Survey"},
2015-11-27 12:17:19 +01:00
{"=?iso-8859-2?Q?vhost_l=E9trehoz=E1sa?=", "vhost létrehozása"},
{"Re: MAIL =?UTF-8?B?U1pPTEfDgUxUQVTDgVMgSElCQSAgIEdUUzogOTE1NDUyMQ==?=", "Re: MAIL SZOLGÁLTATÁS HIBA GTS: 9154521"},
{"[spam???] Better Sex. Better Body. Better Life.", "[spam???] Better Sex. Better Body. Better Life."},
2015-11-27 12:17:19 +01:00
{"1gy2tt. V3l4d. M5sk6nt", "1gy2tt. V3l4d. M5sk6nt"},
{"=?iso-8859-2?B?03Jp4XNpIG1lZ2xlcGV06XMsIG5pbmNzIHT2YmIgbWVudHPpZyBBbWVyaWthIHN64W3hcmEgKDIwMTUuMTEuMDYuIC0gc2pAYWN0cy5odSk=?=", "Óriási meglepetés, nincs több mentség Amerika számára (2015.11.06. - sj@acts.hu)"},
{"=?utf-8?B?Rlc6IEVtYWlsIGZvZ2Fkw6FzaSBoaWJh?=", "FW: Email fogadási hiba"},
{"=?ISO-8859-15?Q?RE=3A_FW=3A_K=E9rd=E9s?=", "RE: FW: Kérdés"},
{"=?iso-8859-2?Q?RE:_spam_tilt=E1s?=", "RE: spam tiltás"},
{"Subject: Administrator has responded to your request for 'Cloud Operations", "Subject: Administrator has responded to your request for 'Cloud Operations"},
{"Subject: =?GB2312?B?VFYgYmFjayBLSVQgc3RyaXAgcmYgcmVtb3RlIENvbnRyb2wgIFVTRDUuNS9TRVQ=?=", "Subject: TV back KIT strip rf remote Control USD5.5/SET"},
{"Subject: =?UTF-8?Q?Ha_rossz_a_k=C3=B6z=C3=A9rzete?=", "Subject: Ha rossz a közérzete"},
{"Subject: =?UTF-8?B?SsOhdHNzeiBhIHZpbMOhZyBsZWdixZFrZXrFsWJiIGxvdHTDs2rDoW4gSU5HWUVO?=", "Subject: Játssz a világ legbőkezűbb lottóján INGYEN"},
{"Subject: =?UTF-8?B?w5Zua29ybcOhbnl6YXRpIGFkYXRiw6F6aXMgMiwzIEZ0IC8gZGIgw6Fyb24=?=", "Subject: Önkormányzati adatbázis 2,3 Ft / db áron"},
{"Subject: =?UTF-8?Q?Experience=20a=20Crazy=20Reward=20Delivered=20to=20you?=", "Subject: Experience a Crazy Reward Delivered to you"},
{"Subject: =?windows-1251?B?ze7i7uPu5O3o5SDv7uTg8OroIOTr/yDC4Pjo?=", "Subject: Новогодние подарки для Ваши"},
{"Subject: =?utf-8?Q?Divatos,_=C3=BCde_sz=C3=ADneinek_k=C3=B6sz=C3=B6nhet=C5=91en_el?=", "Subject: Divatos, üde színeinek köszönhetően el"},
{"=?gb2312?B?yc/Gz76pIC0gw7/fTMir0bKy6YjzuOYgKDIwMTcxMDMwLTMxKSBHQlcgUG9k?==?gb2312?Q?ium_&_Basement.docx?=", "上葡京 - 每週全巡查報告 (20171030-31) GBW Podium & Basement.docx"},
{"Subject: =?UTF-8?Q?=E2=98=85_JubiDu!Versandkost?= =?UTF-8?Q?enfrei-Verl=C3=A4ngerung!=E2=98=85?=", "Subject: ★ JubiDu!Versandkostenfrei-Verlängerung!★"},
{"Happy New Year! =?utf-8?q?=F0=9F=8E=86?=", "Happy New Year! 🎆"},
2015-11-27 12:17:19 +01:00
};
TEST_HEADER();
2015-11-27 12:17:19 +01:00
for(i=0; i<sizeof(pair)/sizeof(struct str_pair); i++){
snprintf(buf, sizeof(buf)-1, "%s", pair[i].line);
fixupEncodedHeaderLine(buf, sizeof(buf)-1);
ASSERT(strcmp(buf, pair[i].expected_result) == 0, pair[i].expected_result);
2015-11-27 12:17:19 +01:00
}
TEST_FOOTER();
2015-11-27 12:17:19 +01:00
}
static void test_translateLine(){
2016-04-05 21:10:09 +02:00
unsigned int i;
2015-11-27 12:17:19 +01:00
char buf[SMALLBUFSIZE];
struct parser_state state;
struct str_pair pair[] = {
{"From: \"'user@domain'\"", "From user@domain "},
{"From: \"''user@domain'\"", "From 'user@domain "},
{"From: \"''user'@domain'\"", "From 'user'@domain "},
{"From: \"'user'@domain'\"", "From user'@domain "},
{"From: Mike D'Amaaaaa <mike@aaa.fu>", "From Mike D'Amaaaaa mike@aaa.fu "},
{"From: VMware Technical Support <webform@vmware.com>", "From VMware Technical Support webform@vmware.com "}
/*
* TODO: we need many more tests here
*/
};
TEST_HEADER();
2015-11-27 12:17:19 +01:00
for(i=0; i<sizeof(pair)/sizeof(struct str_pair); i++){
init_state(&state);
state.message_state = MSG_FROM;
state.is_header = 1;
snprintf(buf, sizeof(buf)-1, "%s", pair[i].line);
translateLine((unsigned char*)buf, &state);
ASSERT(strcmp(buf, pair[i].expected_result) == 0, pair[i].expected_result);
2015-11-27 12:17:19 +01:00
}
TEST_FOOTER();
2015-11-27 12:17:19 +01:00
}
static void test_fixURL(){
2016-04-05 21:10:09 +02:00
unsigned int i;
2015-11-27 12:17:19 +01:00
char buf[SMALLBUFSIZE];
struct str_pair pair[] = {
{"http://www.aaa.fu", "__URL__wwwXaaaXfu "},
{"http://www.aaa.fu/", "__URL__wwwXaaaXfu "},
{"http://www.aaa.fu/ahaha", "__URL__wwwXaaaXfu "},
{"http://www.aaa.fu/bbb/ccc", "__URL__wwwXaaaXfu "},
{"http://www.aaa.fu/ahahah/aiaiai?url=http://iii.oo/", "__URL__wwwXaaaXfu "},
{"https://www.aaa.fu/", "__URL__wwwXaaaXfu "}
};
TEST_HEADER();
2015-11-27 12:17:19 +01:00
for(i=0; i<sizeof(pair)/sizeof(struct str_pair); i++){
snprintf(buf, sizeof(buf)-1, "%s", pair[i].line);
fixURL(buf, sizeof(buf)-1);
ASSERT(strcmp(buf, pair[i].expected_result) == 0, pair[i].expected_result);
2015-11-27 12:17:19 +01:00
}
TEST_FOOTER();
2015-11-27 12:17:19 +01:00
}
static void test_degenerateToken(){
2016-04-05 21:10:09 +02:00
unsigned int i;
2015-11-27 12:17:19 +01:00
char buf[SMALLBUFSIZE];
struct str_pair pair[] = {
{"Hello", "Hello"},
{"Hello!", "Hello"},
{"Hello!!", "Hello"},
{"Hello!!!", "Hello"},
{"Hello?", "Hello"},
{"Hello??", "Hello"},
{"Hello???", "Hello"},
{"Hello.", "Hello"},
{"Hello..", "Hello"},
{"Hello...", "Hello"}
};
TEST_HEADER();
2015-11-27 12:17:19 +01:00
for(i=0; i<sizeof(pair)/sizeof(struct str_pair); i++){
snprintf(buf, sizeof(buf)-1, "%s", pair[i].line);
degenerateToken((unsigned char*)buf);
ASSERT(strcmp(buf, pair[i].expected_result) == 0, pair[i].expected_result);
2015-11-27 12:17:19 +01:00
}
TEST_FOOTER();
2015-11-27 12:17:19 +01:00
}
/*
other functions to test in the future:
- int extract_boundary(char *p, struct parser_state *state)
- void fix_email_address_for_sphinx(char *s)
- void reassembleToken(char *p)
*/
int main(){
test_parse_date_header();
test_extractNameFromHeaderLine();
test_fixupEncodedHeaderLine();
test_translateLine();
test_fixURL();
test_degenerateToken();
return 0;
}