Sophie

Sophie

distrib > Mandriva > 2010.0 > i586 > media > contrib-release > by-pkgid > ced98ca62eed61aa32c12cb3eb98f8ed > files > 1

perl-Mail-SpamAssassin-Plugin-ocrtext-3.2-3mdv2010.0.noarch.rpm

# Settings consumed by the ocrtext plugin.
# Location of the gocr executable.
gocr_path	/usr/bin/gocr
# Directory for the pnm tools (presumably the netpbm converters -- verify against the plugin).
pnmtools_path	/usr/bin
# NOTE(review): the meaning of this value is defined by the plugin, not by this
# file; presumably a score threshold or default -- confirm in the plugin source.
ocrtext_dscore	15

# Semicolon-separated word list. Some entries carry a "::<number>" suffix
# (only 0 and 0.1 occur here); presumably a per-word weight that replaces a
# default -- TODO confirm against the plugin source.
ocrtext_words	realtime;alert;actquick;announce;headline;charts;increase;below;rating;takeoff;resource;ready::0.1;profit;news::0.1;wallstreet;free::0;pick::0.1;breaking;explosive;strong;spotlight;watch;symbol;stock;investor;offer;international;company;money::0;million;thousand;loose;buy;price::0.1;trade;worldtrade;target::0.1;higher;banking;service;recommendation;viagra;soma::0.1;cialis::0.1;xanax;valium;meridia::0.1;zanaflex;levitra;herbal::0.1;medicine;doctor;pills;legal;penis::0;erection::0.1;supplement;medication;weightloss;growth;drugs;pharmacy;prescription;click::0.1;here::0;software;kunde;volksbank;sparkasse;master;degree;bachelor;diploma;removal;visit;browser;readmore;type::0.1;cheap;shipping;quality;sideeffects;size::0.1;focused;replica::0.1;sale::0.1;bags::0.1;development;technology;expect;long-term;quick::0.1;afford;tradeout;compensate

# Second word list, holding a single entry.
# NOTE(review): how it differs from ocrtext_words is not shown here -- check the plugin documentation.
ocrtext_pwords	information

# Entry-point rule: binds OCRTEXT to the plugin's ocrtext_check() eval and
# assigns it priority 100.
body      OCRTEXT  eval:ocrtext_check()
priority  OCRTEXT  100

#
# Image validation rules (GIF/PNG/JPEG).
#
# Every rule in this group is bound to the same eval, ocrtext_eval(); nothing
# in this file tells them apart, so which one hits is presumably decided
# inside the plugin -- verify against the plugin source.
#
body      SPAMPIC_FORGED_CT  eval:ocrtext_eval()
describe  SPAMPIC_FORGED_CT  Forged content-type in mime header
score     SPAMPIC_FORGED_CT  3.000

body      SPAMPIC_SUSPECT    eval:ocrtext_eval()
describe  SPAMPIC_SUSPECT    Suspect image found
score     SPAMPIC_SUSPECT    0.900

body      GIFANIM_SUSPECT    eval:ocrtext_eval()
describe  GIFANIM_SUSPECT    Suspect animated gif found
score     GIFANIM_SUSPECT    2.500

body      SPAMPIC_UNKNOWN    eval:ocrtext_eval()
describe  SPAMPIC_UNKNOWN    Failed to read image header
score     SPAMPIC_UNKNOWN    2.000

body      SPAMPIC_NONSTD     eval:ocrtext_eval()
describe  SPAMPIC_NONSTD     Non standard image header
score     SPAMPIC_NONSTD     0.200

body      SPAMPIC_BROKEN     eval:ocrtext_eval()
describe  SPAMPIC_BROKEN     Contains damaged image
score     SPAMPIC_BROKEN     1.500

# Three rules sharing one description; only the score differs, rising from
# 0.500 to 1.500. All three are referenced by the SPAMPIC_MULTI_* meta rules.
body      SPAMPIC_ALPHA_1  eval:ocrtext_eval()
describe  SPAMPIC_ALPHA_1  Image contains many alphanumeric chars
score     SPAMPIC_ALPHA_1  0.500

body      SPAMPIC_ALPHA_2  eval:ocrtext_eval()
describe  SPAMPIC_ALPHA_2  Image contains many alphanumeric chars
score     SPAMPIC_ALPHA_2  1.000

body      SPAMPIC_ALPHA_3  eval:ocrtext_eval()
describe  SPAMPIC_ALPHA_3  Image contains many alphanumeric chars
score     SPAMPIC_ALPHA_3  1.500

# Helper sub-rules with no describe/score of their own; each one is used as a
# term in the SPAMPIC_MULTI_* meta rules.
#   __SPAMPIC_COUNT_2 .. _7 : bound to ocrtext_eval() like the other rules
#   __HAVE_CID              : raw-body match for src=cid: (optionally quoted)
body     __SPAMPIC_COUNT_2  eval:ocrtext_eval()
body     __SPAMPIC_COUNT_3  eval:ocrtext_eval()
body     __SPAMPIC_COUNT_4  eval:ocrtext_eval()
body     __SPAMPIC_COUNT_5  eval:ocrtext_eval()
body     __SPAMPIC_COUNT_6  eval:ocrtext_eval()
body     __SPAMPIC_COUNT_7  eval:ocrtext_eval()
rawbody  __HAVE_CID         /src=["']?cid:/i

# Low-score marker rule for the single-picture case.
body      ONE_PICTURE  eval:ocrtext_eval()
describe  ONE_PICTURE  Single picture
score     ONE_PICTURE  0.100

#
# Multiple inline pictures without text are very suspicious.
#
# Each SPAMPIC_MULTI_n adds up four terms and requires the sum to equal 4,
# i.e. (provided every term evaluates to 0 or 1) all four must hold:
#   1. the matching __SPAMPIC_COUNT_* sub-rule,
#   2. any one of the HTML_IMAGE_ONLY_* rules,
#   3. __HAVE_CID,
#   4. any one of IMPPYZOR_CHECK, SPAMPIC_WORDS_1 or SPAMPIC_ALPHA_1..3.
# HTML_IMAGE_ONLY_* and IMPPYZOR_CHECK are not defined in this file.
# Scores rise with the picture count, from 1.000 up to 5.000.
#
meta      SPAMPIC_MULTI_1  (__SPAMPIC_COUNT_2 + (HTML_IMAGE_ONLY_04 || HTML_IMAGE_ONLY_08 || HTML_IMAGE_ONLY_12 || HTML_IMAGE_ONLY_16 || HTML_IMAGE_ONLY_20 || HTML_IMAGE_ONLY_24 || HTML_IMAGE_ONLY_28 || HTML_IMAGE_ONLY_32) + __HAVE_CID + (IMPPYZOR_CHECK || SPAMPIC_WORDS_1 || SPAMPIC_ALPHA_1 || SPAMPIC_ALPHA_2 || SPAMPIC_ALPHA_3) == 4)
describe  SPAMPIC_MULTI_1  Contains inline pics (2)
score     SPAMPIC_MULTI_1  1.000

meta      SPAMPIC_MULTI_2  (__SPAMPIC_COUNT_3 + (HTML_IMAGE_ONLY_04 || HTML_IMAGE_ONLY_08 || HTML_IMAGE_ONLY_12 || HTML_IMAGE_ONLY_16 || HTML_IMAGE_ONLY_20 || HTML_IMAGE_ONLY_24 || HTML_IMAGE_ONLY_28 || HTML_IMAGE_ONLY_32) + __HAVE_CID + (IMPPYZOR_CHECK || SPAMPIC_WORDS_1 || SPAMPIC_ALPHA_1 || SPAMPIC_ALPHA_2 || SPAMPIC_ALPHA_3) == 4)
describe  SPAMPIC_MULTI_2  Contains inline pics (3)
score     SPAMPIC_MULTI_2  2.000

meta      SPAMPIC_MULTI_3  (__SPAMPIC_COUNT_4 + (HTML_IMAGE_ONLY_04 || HTML_IMAGE_ONLY_08 || HTML_IMAGE_ONLY_12 || HTML_IMAGE_ONLY_16 || HTML_IMAGE_ONLY_20 || HTML_IMAGE_ONLY_24 || HTML_IMAGE_ONLY_28 || HTML_IMAGE_ONLY_32) + __HAVE_CID + (IMPPYZOR_CHECK || SPAMPIC_WORDS_1 || SPAMPIC_ALPHA_1 || SPAMPIC_ALPHA_2 || SPAMPIC_ALPHA_3) == 4)
describe  SPAMPIC_MULTI_3  Contains inline pics (4)
score     SPAMPIC_MULTI_3  2.500

meta      SPAMPIC_MULTI_4  (__SPAMPIC_COUNT_5 + (HTML_IMAGE_ONLY_04 || HTML_IMAGE_ONLY_08 || HTML_IMAGE_ONLY_12 || HTML_IMAGE_ONLY_16 || HTML_IMAGE_ONLY_20 || HTML_IMAGE_ONLY_24 || HTML_IMAGE_ONLY_28 || HTML_IMAGE_ONLY_32) + __HAVE_CID + (IMPPYZOR_CHECK || SPAMPIC_WORDS_1 || SPAMPIC_ALPHA_1 || SPAMPIC_ALPHA_2 || SPAMPIC_ALPHA_3) == 4)
describe  SPAMPIC_MULTI_4  Contains inline pics (5)
score     SPAMPIC_MULTI_4  3.000

meta      SPAMPIC_MULTI_5  (__SPAMPIC_COUNT_6 + (HTML_IMAGE_ONLY_04 || HTML_IMAGE_ONLY_08 || HTML_IMAGE_ONLY_12 || HTML_IMAGE_ONLY_16 || HTML_IMAGE_ONLY_20 || HTML_IMAGE_ONLY_24 || HTML_IMAGE_ONLY_28 || HTML_IMAGE_ONLY_32) + __HAVE_CID + (IMPPYZOR_CHECK || SPAMPIC_WORDS_1 || SPAMPIC_ALPHA_1 || SPAMPIC_ALPHA_2 || SPAMPIC_ALPHA_3) == 4)
describe  SPAMPIC_MULTI_5  Contains inline pics (6)
score     SPAMPIC_MULTI_5  4.000

meta      SPAMPIC_MULTI_6  (__SPAMPIC_COUNT_7 + (HTML_IMAGE_ONLY_04 || HTML_IMAGE_ONLY_08 || HTML_IMAGE_ONLY_12 || HTML_IMAGE_ONLY_16 || HTML_IMAGE_ONLY_20 || HTML_IMAGE_ONLY_24 || HTML_IMAGE_ONLY_28 || HTML_IMAGE_ONLY_32) + __HAVE_CID + (IMPPYZOR_CHECK || SPAMPIC_WORDS_1 || SPAMPIC_ALPHA_1 || SPAMPIC_ALPHA_2 || SPAMPIC_ALPHA_3) == 4)
describe  SPAMPIC_MULTI_6  Contains inline pics (7+)
score     SPAMPIC_MULTI_6  5.000



#
# Summary of the OCR scan results.
#
# Five levels, all bound to ocrtext_eval(); the score rises from 1.500 at
# level 1 to 12.000 at level 5+. SPAMPIC_WORDS_1 is additionally used as a
# term in the SPAMPIC_MULTI_* meta rules.
#
body      SPAMPIC_WORDS_1  eval:ocrtext_eval()
describe  SPAMPIC_WORDS_1  Contains inline spam picture (1)
score     SPAMPIC_WORDS_1  1.500

body      SPAMPIC_WORDS_2  eval:ocrtext_eval()
describe  SPAMPIC_WORDS_2  Contains inline spam picture (2)
score     SPAMPIC_WORDS_2  4.000

body      SPAMPIC_WORDS_3  eval:ocrtext_eval()
describe  SPAMPIC_WORDS_3  Contains inline spam picture (3)
score     SPAMPIC_WORDS_3  6.000

body      SPAMPIC_WORDS_4  eval:ocrtext_eval()
describe  SPAMPIC_WORDS_4  Contains inline spam picture (4)
score     SPAMPIC_WORDS_4  9.000

body      SPAMPIC_WORDS_5  eval:ocrtext_eval()
describe  SPAMPIC_WORDS_5  Contains inline spam picture (5+)
score     SPAMPIC_WORDS_5  12.000