public class MultiDocumentHandler extends Object
Modifier and Type | Field and Description |
---|---|
private cern.colt.list.DoubleArrayList[] |
allscores |
private double |
degree |
private Object[] |
itemNames |
private ArrayList<String>[] |
parsedDocuments |
private ArrayList<String> |
resultdoc |
private ArrayList<String> |
resultfilenames |
private cern.colt.list.DoubleArrayList |
resultscores |
private static String |
WORD_DELIMITER |
Constructor and Description |
---|
MultiDocumentHandler(Object[] items,
ArrayList<String>[] parsedDoc) |
Modifier and Type | Method and Description |
---|---|
(package private) void |
compareDocuments(int d1,
int d2) |
(package private) double |
computeSimilarity(String sent,
String sent2) |
void |
createAllResults(double threshold) |
(package private) void |
find_similarities(double degr)
Identifies sentence similarity across documents; numdoc sets the minimum number of documents in which a similar
sentence occurs; degree sets the similarity degree.
|
ArrayList<String> |
getResultDocs() |
ArrayList<String> |
getResultFileNames() |
cern.colt.list.DoubleArrayList |
getResultScores() |
void |
removeRedundancy(ArrayList<String> resultd,
cern.colt.list.DoubleArrayList resultsc,
ArrayList<String> resultfile) |
(package private) void |
storeScores(cern.colt.list.DoubleArrayList[] scores) |
private static final String WORD_DELIMITER
private cern.colt.list.DoubleArrayList[] allscores
private cern.colt.list.DoubleArrayList resultscores
private double degree
private Object[] itemNames
public void createAllResults(double threshold)
public void removeRedundancy(ArrayList<String> resultd, cern.colt.list.DoubleArrayList resultsc, ArrayList<String> resultfile)
public cern.colt.list.DoubleArrayList getResultScores()
void find_similarities(double degr)
void compareDocuments(int d1, int d2)
void storeScores(cern.colt.list.DoubleArrayList[] scores)