01: // The contents of this file are subject to the Mozilla Public License Version
02: // 1.1
03: //(the "License"); you may not use this file except in compliance with the
04: //License. You may obtain a copy of the License at http://www.mozilla.org/MPL/
05: //
06: //Software distributed under the License is distributed on an "AS IS" basis,
07: //WITHOUT WARRANTY OF ANY KIND, either express or implied. See the License
08: //for the specific language governing rights and
09: //limitations under the License.
10: //
11: //The Original Code is "The Columba Project"
12: //
13: //The Initial Developers of the Original Code are Frederik Dietz and Timo
14: // Stich.
15: //Portions created by Frederik Dietz and Timo Stich are Copyright (C) 2003.
16: //
17: //All Rights Reserved.
18: package org.columba.mail.spam.rules;
19:
20: import org.columba.mail.folder.IMailbox;
21: import org.columba.ristretto.message.Header;
22:
23: /**
24: * Search for multiple whitespaces in Subject.
25: * <p>
26: * Example: "Buy this sdf675sv758"
27: * <p>
28: * See the random characters add the end.
29: *
30: * @author fdietz
31: *
32: */
33: public class SubjectWhitespaceRule extends AbstractRule {
34:
35: public SubjectWhitespaceRule() {
36: super ("SubjectWhitespaceRule");
37: }
38:
39: /**
40: * @see org.columba.mail.spam.rules.Rule#score(IMailbox, java.lang.Object)
41: */
42: public float score(IMailbox folder, Object uid) throws Exception {
43: Header header = folder.getHeaderFields(uid,
44: new String[] { "Subject" });
45: String subject = header.get("Subject");
46: if (subject == null)
47: return NEARLY_ZERO;
48: if (subject.length() == 0)
49: return NEARLY_ZERO;
50:
51: int count = 0;
52: boolean whitespace = false;
53: for (int i = 0; i < subject.length(); i++) {
54: char ch = subject.charAt(i);
55:
56: if (ch == ' ') {
57: // whitespace detected
58:
59: // if already detected before
60: if (whitespace)
61: count++;
62:
63: whitespace = true;
64: } else {
65: whitespace = false;
66: }
67: }
68:
69: // check for at least 10 whitespaces
70: if (count > 10)
71: return MAX_PROBABILITY;
72:
73: return NEARLY_ZERO;
74: }
75: }
|