Skip to content

Commit

Permalink
Add Bags of words
Browse files Browse the repository at this point in the history
  • Loading branch information
jjroman committed Jan 31, 2013
1 parent 36eac56 commit 9f7e5b3
Show file tree
Hide file tree
Showing 2 changed files with 59 additions and 1 deletion.
58 changes: 58 additions & 0 deletions src/main/java/sem2/iwi/nlp/BagOfWords.java
Original file line number Diff line number Diff line change
@@ -0,0 +1,58 @@
/*
* To change this template, choose Tools | Templates
* and open the template in the editor.
*/
package sem2.iwi.nlp;

import java.util.ArrayList;
import java.util.HashMap;
import java.util.List;
import java.util.concurrent.atomic.AtomicInteger;

/**
*
* @author jjroman
*/
public class BagOfWords {

private ArrayList<HashMap<String, AtomicInteger>> alhmsacBags = new ArrayList<>();
private ArrayList<AtomicInteger> alaiNoOfWords = new ArrayList<>();

public void addNewBag(List<String> listOfTweets) {
HashMap<String, AtomicInteger> hm = new HashMap<>();
AtomicInteger ai = new AtomicInteger(0);
for (String string : listOfTweets) {
List<String> ls = Stemmer.getWordsOnlyForTags(string, "NN", "VB");
for (String string1 : ls) {
ai.incrementAndGet();
if (hm.containsKey(string1)) {
hm.get(string1).incrementAndGet();
} else {
hm.put(string1, new AtomicInteger(1));
}
}
}
alaiNoOfWords.add(ai);
alhmsacBags.add(hm);
}

public ArrayList<Integer> scoreAgainsAll(String twit) {
ArrayList<Integer> retVal = new ArrayList<>();
for (int i = 0; i < alhmsacBags.size(); i++) {
retVal.add(scoreAgainstSpecific(twit, i));
}
return retVal;
}

public Integer scoreAgainstSpecific(String twit, Integer i) {
HashMap<String, AtomicInteger> hm = alhmsacBags.get(i);
Integer score = 0;
List<String> twitWords = Stemmer.getWordsOnlyForTags(twit, "NN", "VB");
for (String string : twitWords) {
if(hm.containsKey(string)){
score += hm.get(string).get();
}
}
return score;
}
}
2 changes: 1 addition & 1 deletion src/main/java/sem2/iwi/nlp/Stemmer.java
Original file line number Diff line number Diff line change
Expand Up @@ -33,7 +33,7 @@ public static void main(String[] args) {

}

private static ArrayList<String> getWordsOnlyForTags(String forPosTagging, String... tags) {
public static ArrayList<String> getWordsOnlyForTags(String forPosTagging, String... tags) {
ArrayList<String> retVal = new ArrayList<>();

try {
Expand Down

0 comments on commit 9f7e5b3

Please sign in to comment.