View Javadoc

1   /*
2    * ====================================================================
3    * 
4    * The Apache Software License, Version 1.1
5    *
6    * Copyright (c) 2003 Nick Lothian. All rights reserved.
7    *
8    * Redistribution and use in source and binary forms, with or without
9    * modification, are permitted provided that the following conditions
10   * are met:
11   *
12   * 1. Redistributions of source code must retain the above copyright
13   *    notice, this list of conditions and the following disclaimer. 
14   *
15   * 2. Redistributions in binary form must reproduce the above copyright
16   *    notice, this list of conditions and the following disclaimer in
17   *    the documentation and/or other materials provided with the
18   *    distribution.
19   *
20   * 3. The end-user documentation included with the redistribution, if
21   *    any, must include the following acknowlegement:  
22   *       "This product includes software developed by the 
23   *        developers of Classifier4J (http://classifier4j.sf.net/)."
24   *    Alternately, this acknowlegement may appear in the software itself,
25   *    if and wherever such third-party acknowlegements normally appear.
26   *
27   * 4. The name "Classifier4J" must not be used to endorse or promote 
28   *    products derived from this software without prior written 
29   *    permission. For written permission, please contact   
30   *    http://sourceforge.net/users/nicklothian/.
31   *
32   * 5. Products derived from this software may not be called 
33   *    "Classifier4J", nor may "Classifier4J" appear in their names 
34   *    without prior written permission. For written permission, please 
35   *    contact http://sourceforge.net/users/nicklothian/.
36   *
37   * THIS SOFTWARE IS PROVIDED ``AS IS'' AND ANY EXPRESSED OR IMPLIED
38   * WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE IMPLIED WARRANTIES
39   * OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE ARE
40   * DISCLAIMED.  IN NO EVENT SHALL THE APACHE SOFTWARE FOUNDATION OR
41   * ITS CONTRIBUTORS BE LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL,
42   * SPECIAL, EXEMPLARY, OR CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT
43   * LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES; LOSS OF
44   * USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION) HOWEVER CAUSED AND
45   * ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY,
46   * OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT
47   * OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF
48   * SUCH DAMAGE.
49   * ====================================================================
50   */
51  
52  package net.sf.classifier4J.bayesian;
53  
54  import java.io.Serializable;
55  import java.util.Collection;
56  import java.util.HashMap;
57  import java.util.Map;
58  
59  /***
60   *
61   * @author Nick Lothian
62   * @author Peter Leschev
63   *  
64   */
65  public class SimpleWordsDataSource implements IWordsDataSource, Serializable {
66  
67      private Map words = new HashMap();
68  
69      public void setWordProbability(WordProbability wp) {
70          words.put(wp.getWord(), wp);
71      }
72  
73      /***
74       * @see net.sf.classifier4J.bayesian.IWordsDataSource#getWordProbability(java.lang.String)
75       */
76      public WordProbability getWordProbability(String word) {
77          if (words.containsKey(word)) {
78              return (WordProbability) words.get(word);
79          } else {
80              return null;
81          }
82      }
83  
84      public Collection getAll() {
85          return words.values();
86      }
87  
88      /***
89       * @see net.sf.classifier4J.bayesian.IWordsDataSource#addMatch(java.lang.String)
90       */
91      public void addMatch(String word) {
92          WordProbability wp = (WordProbability) words.get(word);
93          if (wp == null) {
94              wp = new WordProbability(word, 1, 0);
95          } else {
96              wp.setMatchingCount(wp.getMatchingCount() + 1);
97          }
98          setWordProbability(wp);
99      }
100 
101     /***
102      * @see net.sf.classifier4J.bayesian.IWordsDataSource#addNonMatch(java.lang.String)
103      */
104     public void addNonMatch(String word) {
105         WordProbability wp = (WordProbability) words.get(word);
106         if (wp == null) {
107             wp = new WordProbability(word, 0, 1);
108         } else {
109             wp.setNonMatchingCount(wp.getNonMatchingCount() + 1);
110         }
111         setWordProbability(wp);
112     }
113 
114 }