summaryrefslogtreecommitdiffstats
path: root/src/de/fhswf/in/inf/java1/aufgabe9/WordCount.java
blob: a6d90eff998c2c4b41fbe34960152cedc2b8c018 (plain)
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
129
130
131
132
133
/**
 * 
 */
package de.fhswf.in.inf.java1.aufgabe9;

import java.io.BufferedReader;
import java.io.File;
import java.io.FileReader;
import java.io.IOException;
import java.util.Collections;
import java.util.Locale;
import java.util.Map.Entry;
import java.util.Set;
import java.util.TreeMap;
import java.util.regex.Pattern;

/**
 * Counts how often each word occurs in a text file.
 * <p>
 * A word is a maximal run of alphabetic characters and digits; every other
 * character acts as a separator. Words are folded to lower case before they
 * are counted, so counting and lookup are case-insensitive.
 *
 * @author $Author: $
 * @version $Revision: $, $Date: $ UTC
 */
public class WordCount
{

   /**
    * Matches a run of characters that are neither alphabetic nor digits,
    * i.e. everything that separates two words. Compiled once instead of once
    * per line.
    */
   private static final Pattern WORD_SEPARATOR = Pattern
         .compile("[^\\p{IsAlphabetic}\\p{Digit}]+");

   /**
    * Maps each lower-cased word of the last file read to its number of
    * occurrences. A TreeMap keeps the words sorted for {@link #toString()}
    * and {@link #getWords()}.
    */
   private final TreeMap<String, Integer> wordMap = new TreeMap<>();

   /**
    * Creates a counter without any counted words.
    */
   public WordCount()
   {

   }

   /**
    * Reads a file and counts its words, replacing the counts of any file
    * read before.
    * <p>
    * An {@link IOException} is not propagated; its stack trace is printed to
    * {@code System.err}. If the file cannot be opened, the previous counts
    * are kept. If reading fails part-way, the counts gathered up to that
    * point remain.
    *
    * @param file
    *           The file to be read.
    */
   public final void readFile(File file)
   {
      // FileReader decodes the file with the JVM's default charset.
      try (BufferedReader f = new BufferedReader(new FileReader(file)))
      {
         // Only reached once the file has been opened successfully.
         wordMap.clear();

         String line;
         while ((line = f.readLine()) != null)
         {
            for (String word : WORD_SEPARATOR.split(line))
            {
               // Split creates empty String, if first char is a split char.
               if (!word.isEmpty())
               {
                  String key = normalize(word);
                  Integer count = wordMap.get(key);
                  wordMap.put(key, count == null ? 1 : count + 1);
               }
            }
         }
      }
      catch (IOException e)
      {
         e.printStackTrace(System.err);
      }
   }

   /**
    * Folds a word to the form used as map key.
    * <p>
    * Uses {@link Locale#ROOT} so the result does not depend on the default
    * locale (with a Turkish default locale "I" would otherwise become a
    * dotless "i").
    *
    * @param word
    *           The word to fold, must not be null.
    * @return The lower-cased word.
    */
   private static String normalize(String word)
   {
      return word.toLowerCase(Locale.ROOT);
   }

   /**
    * Lists all counted words in ascending order, one {@code word = count}
    * pair per line.
    *
    * @return The formatted counts; an empty String if nothing was counted.
    * @see java.lang.Object#toString()
    */
   @Override
   public final String toString()
   {
      StringBuilder ret = new StringBuilder();

      for (Entry<String, Integer> mapping : wordMap.entrySet())
      {
         ret.append(mapping.getKey()).append(" = ")
               .append(mapping.getValue()).append("\n");
      }

      return ret.toString();
   }

   /**
    * Returns all words from the file.
    *
    * @return An unmodifiable, sorted view of the lower-cased words from the
    *         file.
    */
   public final Set<String> getWords()
   {
      return Collections.unmodifiableSet(wordMap.keySet());
   }

   /**
    * Returns the count of a word in the file read last.
    * <p>
    * The lookup ignores case, matching the way words are counted.
    *
    * @param word
    *           The word to be looked up.
    * @return The number of occurrences of the word, 0 if it does not occur.
    * @throws IllegalArgumentException
    *            If word is null or empty.
    */
   public final int getCount(String word)
   {
      if (word == null)
      {
         throw new IllegalArgumentException("Word must be a valid referece.");
      }
      if (word.isEmpty())
      {
         throw new IllegalArgumentException("The word can't be empty.");
      }

      // Keys are stored normalized, so the query has to be normalized too.
      Integer count = wordMap.get(normalize(word));
      return count == null ? 0 : count;
   }

}