Skip to content

Commit

Permalink
Merge pull request #74 from Amit223/Amit-31-12
Browse files (browse the repository at this point in the history)
Fixed a runtime problem in the indexer
  • Loading branch information
Amit223 authored Dec 31, 2018
2 parents 30985ef + 4df0e67 commit c220e85
Showing 1 changed file with 11 additions and 13 deletions.
24 changes: 11 additions & 13 deletions src/main/java/Indexer.java
Original file line number | Diff line number | Diff line change
Expand Up @@ -183,7 +183,6 @@ public void Index(Map<String,Integer> terms,Vector<Integer> locations,String nam
int maxtf=0;
if(terms.values()!=null&&terms.values().size()>0)
maxtf=getMaxTf(terms.values());
int lineNumDocs=_AtomicNumlineDocs.get();
String line;
Iterator<String>termsKeys=keys.iterator();
StringBuilder entities=new StringBuilder();
Expand All @@ -203,14 +202,17 @@ public void Index(Map<String,Integer> terms,Vector<Integer> locations,String nam
line="X\n";
}
//entities+docs:writing part
int lineNumDocs;
docMutex.lock();
writeToDocumentsAndEntitiesList(nameOfDoc,cityOfDoc,maxtf,terms.size(),numOfWords,language,line); //
lineNumDocs=_AtomicNumlineDocs.get();
docMutex.unlock();

entities=new StringBuilder();//to memory
_AtomicNumlineDocs.getAndAdd(1);
_AtomicNumlineEntities.addAndGet(1);

if(_numOfFiles.get()%10000==0){
if(_numOfFiles.get()%5000==0){
writeDocsAndEntitiesToFile();
}

Expand Down Expand Up @@ -325,9 +327,8 @@ public boolean loadDictionaryToMemory() {
dictionary = new HashMap<>();
BufferedReader bufferedReader = new BufferedReader(new FileReader(_path + "/" + _toStem + "Dictionary.txt"));
String line = bufferedReader.readLine();
String[] lines = line.split("=");
for (int i = 0; i < lines.length; i++) {
String[] pair = lines[i].split("--->");
while (line!=null&&!line.equals("")) {
String[] pair = line.split("--->");
if (pair.length == 2) {
String[] values = pair[1].split("&");
int df = Integer.parseInt(values[0].substring(1, values[0].length()));
Expand All @@ -338,8 +339,8 @@ public boolean loadDictionaryToMemory() {
vector.add(tf);
vector.add(ptr);
dictionary.put(pair[0], vector);
lines[i]="";
}
line=bufferedReader.readLine();
}
bufferedReader.close();
} catch (FileNotFoundException e) {
Expand Down Expand Up @@ -370,13 +371,10 @@ public void loadDictionaryToFile(){
if(dictionary.get(key).size()==3){
pointer=dictionary.get(key).elementAt(2);
}
stringBuilder.append(key + "--->{" + dictionary.get(key).elementAt(0) + "&" + dictionary.get(key).elementAt(1)
+ "&" + pointer + "}=");
if (i % 5000 == 0){
writer.write(stringBuilder.toString());
stringBuilder.setLength(0);

}
String line=(key + "--->{" + dictionary.get(key).elementAt(0) + "&" + dictionary.get(key).elementAt(1)
+ "&" + pointer + "}");
writer.write(line);
writer.newLine();
i++;
}
writer.write(stringBuilder.toString());
Expand Down

0 comments on commit c220e85

Please sign in to comment.