Dan,

Friday, March 12, 2004, 9:56:40 PM, you wrote:

> http://bugzilla.spamassassin.org/show_bug.cgi?id=2843

> ------- Additional Comments From [EMAIL PROTECTED]  2004-03-12 21:56 -------
> Bob?

Yes, I have sent my CLA to Apache, and yes, I'm the author of those rules
listed below in the bug submission (I've removed those rules of which I
am not the author; also shown below are my current or recent personal
corpus results): 

RM_fw_LeadingPrep     -- 267s/3h of 106585 corpus (86917s/19668h) 03/08/04
RM_ft_Noname          -- 1287s/3h of 106585 corpus (86917s/19668h) 03/08/04
RM_sp_CopyDVD         -- 85s/0h of 100793 corpus (82099s/18694h) 02/21/04
RM_sp_FreePPV         -- 41s/0h of 100793 corpus (82099s/18694h) 02/21/04
RM_spd_Money          -- 102s/1h of 97268 corpus (79437s/17831h) 01/24/04
RM_spd_WorthCash      -- 350s/0h of 97268 corpus (79437s/17831h) 01/24/04
RM_swd_investors      -- 119s/0h of 97268 corpus (79437s/17831h) 01/24/04
RM_swd_Paying         -- 229s/4h of 97268 corpus (79437s/17831h) 01/24/04
RM_swt_ConsWord6      -- 863s/0h of 97268 corpus (79437s/17831h) 01/24/04
CMO_RM_swt_Masked05   -- 807s/3h of 97268 corpus (79437s/17831h) 01/24/04
CMO_RM_swt_Masked06   -- 153s/0h of 97268 corpus (79437s/17831h) 01/24/04
CMO_RM_swt_Masked07   -- 88s/0h of 97268 corpus (79437s/17831h) 01/24/04
RM_swt_Masked19       -- 368s/0h of 97268 corpus (79437s/17831h) 01/24/04
CMO_RM_swt_Masked19   -- 358s/0h of 97268 corpus (79437s/17831h) 01/24/04
RM_sl_LettersNums     -- 94s/0h of 100793 corpus (82099s/18694h) 02/21/04
RM_sl_RandomLetters2a -- 852s/3h of 97268 corpus (79437s/17831h) 01/24/04
RM_sl_RandomLetters2b -- 158s/0h of 100793 corpus (82099s/18694h) 02/21/04
RM_sl_RandomLetters3a -- 122s/2h of 97268 corpus (79437s/17831h) 01/24/04
RM_sl_RandomLetters3b -- 113s/0h of 97268 corpus (79437s/17831h) 01/24/04
RM_sl_RandomLetters3c -- 364s/2h of 97268 corpus (79437s/17831h) 01/24/04
RM_sl_RandomLetters4a -- 239s/0h of 97268 corpus (79437s/17831h) 01/24/04
RM_sl_RandomLetters5a -- 473s/0h of 97268 corpus (79437s/17831h) 01/24/04
RM_sl_RandomCons6a    -- 661s/0h of 97268 corpus (79437s/17831h) 01/24/04
RM_sl_RandomCons7a    -- 628s/2h of 97268 corpus (79437s/17831h) 01/24/04
RM_st_LongSubject     -- 214s/0h of 97268 corpus (79437s/17831h) 01/24/04
RM_hr_HeloSender      -- 144s/3h of 97268 corpus (79437s/17831h) 01/24/04
RM_hr_VirtuaComBr     -- 104s/0h of 97268 corpus (79437s/17831h) 01/24/04
RM_hr_telesp          -- 442s/0h of 97268 corpus (79437s/17831h) 01/24/04
RM_hxl_ForgedIndy     -- 93s/0h of 106585 corpus (86917s/19668h) 03/08/04
RM_hx_JLH             -- 458s/0h of 97268 corpus (79437s/17831h) 01/24/04
RM_h_tracking         -- 289s/0h of 97268 corpus (79437s/17831h) 01/24/04

also:

CMO_RM_sw_boost which I've since replaced with
# Obfuscated "boost" in the Subject: each letter also accepts look-alike
# characters/byte sequences, with at most one separator character between
# letters. The leading negative lookahead rejects the plain word "boost".
header    RM_sw_boosto1          Subject =~ /(?!\bboost\b)(?:\b[b8]|\B(?:[\xDF]|\xCE\x92|\xCE\xB2|\xD0\x92|\xD0\xB2))[\x01-\x2F\\\^_`\|\x7F-\xA1\xA4-\xA8\xAB-\xAD\xAF-\xB1\xB4\xB7-\xBB\xBF\xF7]?(?:[o0\*\xB0\xBA\xD8\xF8\xD2-\xD6\xF2-\xF6]|\(\)|\[\]|\xC5[\x8C-\x91]|\xC6[\xA0-\xA1]|\xC7[\x91-\x92]|\xC7[\xBE-\xBF]|\xCE\x8C|\xCE\x98|\xCE\x9F|\xCE\xB8|\xCE\xBF|\xCF\x8C|\xD0\x9E|\xD0\xBE|\xD5\x95)[\x01-\x2F\\\^_`\|\x7F-\xA1\xA4-\xA8\xAB-\xAD\xAF-\xB1\xB4\xB7-\xBB\xBF\xF7]?(?:[o0\*\xB0\xBA\xD8\xF8\xD2-\xD6\xF2-\xF6]|\(\)|\[\]|\xC5[\x8C-\x91]|\xC6[\xA0-\xA1]|\xC7[\x91-\x92]|\xC7[\xBE-\xBF]|\xCE\x8C|\xCE\x98|\xCE\x9F|\xCE\xB8|\xCE\xBF|\xCF\x8C|\xD0\x9E|\xD0\xBE|\xD5\x95)[\x01-\x2F\\\^_`\|\x7F-\xA1\xA4-\xA8\xAB-\xAD\xAF-\xB1\xB4\xB7-\xBB\xBF\xF7]?(?:[s5\$\xA7]|\xC5[\x9A-\xA1]|\xD0\x85|\xD1\x95|\xD5\x8F)[\x01-\x2F\\\^_`\|\x7F-\xA1\xA4-\xA8\xAB-\xAD\xAF-\xB1\xB4\xB7-\xBB\xBF\xF7]?(?:t\b|(?:[\+]|\xC5[\xA2-\xA7]|\xCE\xA4|\xCF\x84|\xD0\xA2|\xD1\x82)\B)/i
describe  RM_sw_boosto1          boost in Subject
score     RM_sw_boosto1          8.500  # type=obfu - 20s/0h of 97268 corpus (79437s/17831h) 01/24/04
# Loose obfuscation check: the letters b-o-o-s-t as one word with at most one
# arbitrary character between letters; the plain word "boost" is excluded.
header    RM_sw_boosto2          Subject =~ /(?!\bboost\b)\bb.?o.?o.?s.?t\b/i
describe  RM_sw_boosto2          boost in Subject
score     RM_sw_boosto2          4.500  # type=obfu - 2s/0h of 91714 corpus (74113s/17601h) 01/24/04
                                        # Note: boost itself, w/o obfu, matches INCREASE_SOMETHING

CMO_RM_sw_Forever which I've since replaced with
# Case-insensitive match for "forever" anywhere in the Subject.
header    RM_sw_Forever          Subject =~ /forever/i
describe  RM_sw_Forever          Forever in Subject
score     RM_sw_Forever          2.410  # 141s/0h of 97268 corpus (79437s/17831h) 01/24/04

CMO_RM_sw_Proven which I've since replaced with
# Case-insensitive match for the whole word "proven" in the Subject.
header    RM_sw_Proven           Subject =~ /\bproven\b/i
describe  RM_sw_Proven           Proven in Subject
score     RM_sw_Proven           2.290  # 129s/0h of 97268 corpus (79437s/17831h) 01/24/04
# Obfuscated "proven" in the Subject: each letter also accepts look-alike
# characters/byte sequences, with at most one separator character between
# letters. The leading negative lookahead rejects the plain word "proven".
# The "v" alternation previously ended in `\xCE\xBD]`; the unmatched `]` was a
# required literal, so that alternative could only match when followed by "]".
header    RM_sw_Proveno1         Subject =~ /(?!\bproven\b)(?:\bp|\B(?:[\xDE]|\xCE\xA1|\xCF\x81|\xD0\xA0|\xD1\x80))[\x01-\x2F\\\^_`\|\x7F-\xA1\xA4-\xA8\xAB-\xAD\xAF-\xB1\xB4\xB7-\xBB\xBF\xF7]?(?:[r\xAE]|\xC5[\x94-\x99]|\xD1\x93)[\x01-\x2F\\\^_`\|\x7F-\xA1\xA4-\xA8\xAB-\xAD\xAF-\xB1\xB4\xB7-\xBB\xBF\xF7]?(?:[o0\*\xB0\xBA\xD8\xF8\xD2-\xD6\xF2-\xF6]|\(\)|\[\]|\xC5[\x8C-\x91]|\xC6[\xA0-\xA1]|\xC7[\x91-\x92]|\xC7[\xBE-\xBF]|\xCE\x8C|\xCE\x98|\xCE\x9F|\xCE\xB8|\xCE\xBF|\xCF\x8C|\xD0\x9E|\xD0\xBE|\xD5\x95)[\x01-\x2F\\\^_`\|\x7F-\xA1\xA4-\xA8\xAB-\xAD\xAF-\xB1\xB4\xB7-\xBB\xBF\xF7]?(?:[vu]|\\\/|\xCE\xBD)[\x01-\x2F\\\^_`\|\x7F-\xA1\xA4-\xA8\xAB-\xAD\xAF-\xB1\xB4\xB7-\xBB\xBF\xF7]?(?:[e3\*\xC8-\xCB\xE8-\xEB]|\xC4[\x92-\x9B]|\xCE\x88|\xCE\x95|\xCE\xA3|\xCE\xAD|\xCE\xB5|\xD0\x81|\xD0\x95|\xD0\xB5|\xD1\x91)[\x01-\x2F\\\^_`\|\x7F-\xA1\xA4-\xA8\xAB-\xAD\xAF-\xB1\xB4\xB7-\xBB\xBF\xF7]?(?:n\b|(?:[\xD1\xF1]|\|\\\||\xC5[\x83-\x8B]|\xCE\x9D|\xCE\xA0|\xCE\xAE|\xCE\xB7|\xD5\xB2|\xD5\xB8)\B)/i
describe  RM_sw_Proveno1         Proven in Subject
score     RM_sw_Proveno1         8.500  # type=obfu - 17s/0h of 91714 corpus (74113s/17601h) 01/24/04
# Loose obfuscation check: the letters p-r-o-v-e-n as one word with at most one
# arbitrary character between letters; the plain word "proven" is excluded.
header    RM_sw_Proveno2         Subject =~ /(?!\bproven\b)\bp.?r.?o.?v.?e.?n\b/i
describe  RM_sw_Proveno2         Proven in Subject
score     RM_sw_Proveno2         4.500  # type=obfu - 0s/0h of 91714 corpus (74113s/17601h) 01/24/04

CMO_RM_swd_debt which I've since replaced with
# Case-insensitive match for the whole word "debt" in the Subject.
header    RM_swd_debt           Subject =~ /\bdebt\b/i
describe  RM_swd_debt           Subject mentions debt with anti-spam avoidance techniques
score     RM_swd_debt           3.000  # 609s/0h of 97268 corpus (79437s/17831h) 01/24/04
# Obfuscated "debt" in the Subject: each letter also accepts look-alike
# characters/byte sequences, with at most one separator character between
# letters. The leading negative lookahead rejects the plain word "debt".
header    RM_swd_debto1         Subject =~ /(?!\bdebt\b)(?:\bd|\B(?:[\xD0]|\xC4[\x8E-\x91]))[\x01-\x2F\\\^_`\|\x7F-\xA1\xA4-\xA8\xAB-\xAD\xAF-\xB1\xB4\xB7-\xBB\xBF\xF7]?(?:[e3\*\xC8-\xCB\xE8-\xEB]|\xC4[\x92-\x9B]|\xCE\x88|\xCE\x95|\xCE\xA3|\xCE\xAD|\xCE\xB5|\xD0\x81|\xD0\x95|\xD0\xB5|\xD1\x91)[\x01-\x2F\\\^_`\|\x7F-\xA1\xA4-\xA8\xAB-\xAD\xAF-\xB1\xB4\xB7-\xBB\xBF\xF7]?(?:[b8\xDF]|\xCE\x92|\xCE\xB2|\xD0\x92|\xD0\xB2)[\x01-\x2F\\\^_`\|\x7F-\xA1\xA4-\xA8\xAB-\xAD\xAF-\xB1\xB4\xB7-\xBB\xBF\xF7]?(?:t\b|(?:[\+]|\xC5[\xA2-\xA7]|\xCE\xA4|\xCF\x84|\xD0\xA2|\xD1\x82)\B)/i
describe  RM_swd_debto1         Subject mentions debt with anti-spam avoidance techniques
score     RM_swd_debto1         4.500  # type=obfu - 9s/0h of 100793 corpus (82099s/18694h) 02/21/04
                                       # max: 12s/0h of 91714 corpus (74113s/17601h) 01/24/04
# Loose obfuscation check: the letters d-e-b-t as one word with at most one
# arbitrary character between letters; the plain words "debt" and "debit"
# are excluded by the lookahead.
header    RM_swd_debto2         Subject =~ /(?!\bdebi?t\b)\bd.?e.?b.?t\b/i
describe  RM_swd_debto2         Subject mentions debt with anti-spam avoidance techniques
score     RM_swd_debto2         8.500  # type=obfu -- 17s/0h of 91714 corpus (74113s/17601h) 01/24/04

CMO_RM_swm_DrugsV which I've since replaced with
# Obfuscated "viagra" in the Subject: a few fixed misspellings, a loose
# one-character-gap form, and a look-alike-character form; the leading
# negative lookahead rejects the plain word.
# NOTE(review): this copy of the pattern is damaged and must not be used as-is.
# The literal text "[EMAIL PROTECTED]" appears twice where the "a" character
# class used to be (presumably the archive's address masking; the original
# characters cannot be recovered from this message), and the rule is wrapped
# across several lines. Restore it from the author's own copy.
# NOTE(review): `\xC4[\x9C-\xA3]]` in the "g" alternation ends in what looks
# like a stray `]` (it would be matched as a literal) -- confirm with the author.
header    RM_swm_Drug28          Subject =~ 
/(?!viagra)(?:Viarga|Vagira|Virgaa|v.?i.?a.?g.?r.?a|(?:\b[vu]|\B(?:\\\/|\xCE\xBD))[\x01-\x2F\\\^_`\|\x7F-\xA1\xA4-\xA8\xAB-\xAD\xAF-\xB1\xB4\xB7-\xBB\xBF\xF7]?(?:[il1:\|\*\xCC-\xCF\xEC-\xEF\xA6]|\xC4[\xA8-\xB0]|\xC4\xBA|\xC4\xBC|\xC4\xBE|\xC5\x80|\xC5\x82|\xC7[\x8F-\x90]|\xD0[\x86-\x87]|\xD1[\x96-\x97]|\xCE\x8A|\xCE\x90|\xCE\x99|\xCE\xAA|\xCE\xAF|\xCE\xB9|\xCF\x8A)[\x01-\x2F\\\^_`\|\x7F-\xA1\xA4-\xA8\xAB-\xAD\xAF-\xB1\xB4\xB7-\xBB\xBF\xF7]?(?:[EMAIL
 
PROTECTED]|\/\\|\xC4[\x80-\x85]|\xC7[\x8D-\x8E]|\xC7[\xBA-\xBB]|\xCE\x86|\xCE\x91|\xCE\x94|\xCE\x9B|\xCE\xAC|\xCE\xB1|\xD0\x90|\xD0\xB0)[\x01-\x2F\\\^_`\|\x7F-\xA1\xA4-\xA8\xAB-\xAD\xAF-\xB1\xB4\xB7-\xBB\xBF\xF7]?(?:[g6]|\xC4[\x9C-\xA3]])[\x01-\x2F\\\^_`\|\x7F-\xA1\xA4-\xA8\xAB-\xAD\xAF-\xB1\xB4\xB7-\xBB\xBF\xF7]?(?:[r\xAE]|\xC5[\x94-\x99]|\xD1\x93)[\x01-\x2F\\\^_`\|\x7F-\xA1\xA4-\xA8\xAB-\xAD\xAF-\xB1\xB4\xB7-\xBB\xBF\xF7]?(?:[a4]\b|(?:[EMAIL
 
PROTECTED]|\/\\|\xC4[\x80-\x85]|\xC7[\x8D-\x8E]|\xC7[\xBA-\xBB]|\xCE\x86|\xCE\x91|\xCE\x94|\xCE\x9B|\xCE\xAC|\xCE\xB1|\xD0\x90|\xD0\xB0)\B))/i
describe  RM_swm_Drug28          Subject mentions known spam subject
score     RM_swm_Drug28          18.00  # type=obfu - 3668s/0h of 106571 corpus 
(87322s/19249h) 02/22/04
                                        # non-obfuscated rule is distrib 
SUBJ_VIAGRA

CMO_RM_swm_Medication
# Case-insensitive match for "medication" anywhere in the Subject.
header    RM_swm_Medication      Subject =~ /medication/i
describe  RM_swm_Medication      Subject mentions medication
score     RM_swm_Medication      3.000  # 830s/1h of 97268 corpus (79437s/17831h) 01/24/04
                                        # ham: personal medication info
# Obfuscated "medication" in the Subject: each letter also accepts look-alike
# characters/byte sequences, with at most one separator character between
# letters; the leading negative lookahead rejects the plain word.
# NOTE(review): this copy of the pattern is damaged and must not be used as-is.
# The literal text "[EMAIL PROTECTED]" appears where the "a" character class
# used to be (presumably the archive's address masking; the original characters
# cannot be recovered from this message), and the rule is wrapped across
# several lines. Restore it from the author's own copy.
# NOTE(review): `\xD0\xBC])` in the "m" alternation ends in what looks like a
# stray `]` (it would be matched as a literal) -- confirm with the author.
header    RM_swm_Medicationo1    Subject =~ 
/(?!medication)(?:m|rn|\/V\\|\/\\\/\\|\xCE\x9C|\xD0\x9C|\xD0\xBC])[\x01-\x2F\\\^_`\|\x7F-\xA1\xA4-\xA8\xAB-\xAD\xAF-\xB1\xB4\xB7-\xBB\xBF\xF7]?(?:[e3\*\xC8-\xCB\xE8-\xEB]|\xC4[\x92-\x9B]|\xCE\x88|\xCE\x95|\xCE\xA3|\xCE\xAD|\xCE\xB5|\xD0\x81|\xD0\x95|\xD0\xB5|\xD1\x91)[\x01-\x2F\\\^_`\|\x7F-\xA1\xA4-\xA8\xAB-\xAD\xAF-\xB1\xB4\xB7-\xBB\xBF\xF7]?(?:[d\xD0]|\xC4[\x8E-\x91])[\x01-\x2F\\\^_`\|\x7F-\xA1\xA4-\xA8\xAB-\xAD\xAF-\xB1\xB4\xB7-\xBB\xBF\xF7]?(?:[il1:\|\*\xCC-\xCF\xEC-\xEF\xA6]|\xC4[\xA8-\xB0]|\xC4\xBA|\xC4\xBC|\xC4\xBE|\xC5\x80|\xC5\x82|\xC7[\x8F-\x90]|\xD0[\x86-\x87]|\xD1[\x96-\x97]|\xCE\x8A|\xCE\x90|\xCE\x99|\xCE\xAA|\xCE\xAF|\xCE\xB9|\xCF\x8A)[\x01-\x2F\\\^_`\|\x7F-\xA1\xA4-\xA8\xAB-\xAD\xAF-\xB1\xB4\xB7-\xBB\xBF\xF7]?(?:[c\*\xC7\xE7\xA2\xA9]|\xC4[\x86-\x8D]|\xD0\xA1|\xD1\x81)[\x01-\x2F\\\^_`\|\x7F-\xA1\xA4-\xA8\xAB-\xAD\xAF-\xB1\xB4\xB7-\xBB\xBF\xF7]?(?:[EMAIL
 
PROTECTED]|\/\\|\xC4[\x80-\x85]|\xC7[\x8D-\x8E]|\xC7[\xBA-\xBB]|\xCE\x86|\xCE\x91|\xCE\x94|\xCE\x9B|\xCE\xAC|\xCE\xB1|\xD0\x90|\xD0\xB0)[\x01-\x2F\\\^_`\|\x7F-\xA1\xA4-\xA8\xAB-\xAD\xAF-\xB1\xB4\xB7-\xBB\xBF\xF7]?(?:[t\+]|\xC5[\xA2-\xA7]|\xCE\xA4|\xCF\x84|\xD0\xA2|\xD1\x82)[\x01-\x2F\\\^_`\|\x7F-\xA1\xA4-\xA8\xAB-\xAD\xAF-\xB1\xB4\xB7-\xBB\xBF\xF7]?(?:[il1:\|\*\xCC-\xCF\xEC-\xEF\xA6]|\xC4[\xA8-\xB0]|\xC4\xBA|\xC4\xBC|\xC4\xBE|\xC5\x80|\xC5\x82|\xC7[\x8F-\x90]|\xD0[\x86-\x87]|\xD1[\x96-\x97]|\xCE\x8A|\xCE\x90|\xCE\x99|\xCE\xAA|\xCE\xAF|\xCE\xB9|\xCF\x8A)[\x01-\x2F\\\^_`\|\x7F-\xA1\xA4-\xA8\xAB-\xAD\xAF-\xB1\xB4\xB7-\xBB\xBF\xF7]?(?:[o0\*\xB0\xBA\xD8\xF8\xD2-\xD6\xF2-\xF6]|\(\)|\[\]|\xC5[\x8C-\x91]|\xC6[\xA0-\xA1]|\xC7[\x91-\x92]|\xC7[\xBE-\xBF]|\xCE\x8C|\xCE\x98|\xCE\x9F|\xCE\xB8|\xCE\xBF|\xCF\x8C|\xD0\x9E|\xD0\xBE|\xD5\x95)[\x01-\x2F\\\^_`\|\x7F-\xA1\xA4-\xA8\xAB-\xAD\xAF-\xB1\xB4\xB7-\xBB\xBF\xF7]?(?:[n\xD1\xF1]|\|\\\||\xC5[\x83-\x8B]|\xCE\x9D|\xCE\xA0|\xCE\xAE|\xCE\xB7|\xD5\xB2|\xD5\xB8)/i
describe  RM_swm_Medicationo1    Subject mentions medication
score     RM_swm_Medicationo1    18.00  # type=obfu - 161s/0h of 97268 corpus 
(79437s/17831h) 01/24/04
# Loose obfuscation check: the letters of "medication" with at most one
# arbitrary character between letters; the plain word is excluded.
header    RM_swm_Medicationo2    Subject =~ /(?!medication)m.?e.?d.?i.?c.?a.?t.?i.?o.?n/i
describe  RM_swm_Medicationo2    Subject mentions medication
score     RM_swm_Medicationo2    8.500  # type=obfu - 28s/0h of 91714 corpus (74113s/17601h) 01/24/04

CMO_RM_swm_Younger
# Case-insensitive match for the whole word "younger" in the Subject.
header    RM_swm_Younger         Subject =~ /\bYOUNGER\b/i
describe  RM_swm_Younger         Younger in Subject
score     RM_swm_Younger         2.710  # 171s/0h of 97268 corpus (79437s/17831h) 01/24/04
# Obfuscated "younger" in the Subject: each letter also accepts look-alike
# characters/byte sequences, with at most one separator character between
# letters. The leading negative lookahead rejects the plain word "younger".
# The "g" alternation previously ended in `\xC4[\x9C-\xA3]]`; the unmatched `]`
# was a required literal, so that alternative could only match when followed by "]".
header    RM_swm_Youngero1       Subject =~ /(?!\bYOUNGER\b)(?:\by|\B(?:[\xA5\xDD\xFD]|\xC5[\xB6-\xB8]|\xCE\x8E|\xCE\xA5|\xCE\xA8|\xCE\xAB|\xCE\xB3|\xD0\xA3|\xD1\x83|\xD1\x9E|\xD2[\xAE-\xB1]))[\x01-\x2F\\\^_`\|\x7F-\xA1\xA4-\xA8\xAB-\xAD\xAF-\xB1\xB4\xB7-\xBB\xBF\xF7]?(?:[o0\*\xB0\xBA\xD8\xF8\xD2-\xD6\xF2-\xF6]|\(\)|\[\]|\xC5[\x8C-\x91]|\xC6[\xA0-\xA1]|\xC7[\x91-\x92]|\xC7[\xBE-\xBF]|\xCE\x8C|\xCE\x98|\xCE\x9F|\xCE\xB8|\xCE\xBF|\xCF\x8C|\xD0\x9E|\xD0\xBE|\xD5\x95)[\x01-\x2F\\\^_`\|\x7F-\xA1\xA4-\xA8\xAB-\xAD\xAF-\xB1\xB4\xB7-\xBB\xBF\xF7]?(?:[uv\*\xB5\xD9-\xDC\xF9-\xFC]|\xC5[\xA8-\xB3]|\xC6[\xAF-\xB0]|\xC7[\x93-\x9C]|\xCE\xB0|\xCE\xBC|\xCF\x8B|\xCF\x8D|\xD4\xB1|\xD5\x84|\xD5\x8D)[\x01-\x2F\\\^_`\|\x7F-\xA1\xA4-\xA8\xAB-\xAD\xAF-\xB1\xB4\xB7-\xBB\xBF\xF7]?(?:[n\xD1\xF1]|\|\\\||\xC5[\x83-\x8B]|\xCE\x9D|\xCE\xA0|\xCE\xAE|\xCE\xB7|\xD5\xB2|\xD5\xB8)[\x01-\x2F\\\^_`\|\x7F-\xA1\xA4-\xA8\xAB-\xAD\xAF-\xB1\xB4\xB7-\xBB\xBF\xF7]?(?:[g6]|\xC4[\x9C-\xA3])[\x01-\x2F\\\^_`\|\x7F-\xA1\xA4-\xA8\xAB-\xAD\xAF-\xB1\xB4\xB7-\xBB\xBF\xF7]?(?:[e3\*\xC8-\xCB\xE8-\xEB]|\xC4[\x92-\x9B]|\xCE\x88|\xCE\x95|\xCE\xA3|\xCE\xAD|\xCE\xB5|\xD0\x81|\xD0\x95|\xD0\xB5|\xD1\x91)[\x01-\x2F\\\^_`\|\x7F-\xA1\xA4-\xA8\xAB-\xAD\xAF-\xB1\xB4\xB7-\xBB\xBF\xF7]?(?:r\b|(?:[\xAE]|\xC5[\x94-\x99]|\xD1\x93)\B)/i
describe  RM_swm_Youngero1       Younger in Subject
score     RM_swm_Youngero1       8.500  # type=obfu - 16s/0h of 91714 corpus (74113s/17601h) 01/24/04
# Loose obfuscation check: the letters y-o-u-n-g-e-r as one word with at most
# one arbitrary character between letters; the plain word is excluded.
header    RM_swm_Youngero2       Subject =~ /(?!\bYOUNGER\b)\by.?o.?u.?n.?g.?e.?r\b/i
describe  RM_swm_Youngero2       Younger in Subject
score     RM_swm_Youngero2       8.500  # type=obfu - 29s/0h of 97268 corpus (79437s/17831h) 01/24/04

Also, here is a new rule for your consideration:

# Fires when the X-Originating-IP header contains 1-8 characters, a literal
# dot, 1-4 characters, and then "IP" (case-insensitive).
header    RM_hxo_OriginatingIP   X-Originating-IP =~ /.{1,8}\..{1,4}IP/i
describe  RM_hxo_OriginatingIP   header points to probable spammer
score     RM_hxo_OriginatingIP   4.500  # type=spamp - 4347s/0h of 97268 corpus (79437s/17831h) 01/24/04

Bob Menschel

Reply via email to