at.tuwien.ifs.somtoolbox.summarisation.output
Class MultiDocumentHandler

java.lang.Object
  extended by at.tuwien.ifs.somtoolbox.summarisation.output.MultiDocumentHandler

public class MultiDocumentHandler
extends Object

Version:
$Id: MultiDocumentHandler.java 3589 2010-05-21 10:42:01Z mayer $
Author:
Julius Penaranda

Field Summary
private  cern.colt.list.DoubleArrayList[] allscores
           
private  double degree
           
private  Object[] itemNames
           
private  ArrayList<String>[] parsedDocuments
           
private  ArrayList<String> resultdoc
           
private  ArrayList<String> resultfilenames
           
private  cern.colt.list.DoubleArrayList resultscores
           
private static String WORD_DELIMITER
           
 
Constructor Summary
MultiDocumentHandler(Object[] items, ArrayList<String>[] parsedDoc)
           
 
Method Summary
(package private)  void compareDocuments(int d1, int d2)
           
(package private)  double computeSimilarity(String sent, String sent2)
           
 void createAllResults(double threshold)
           
(package private)  void find_similarities(double degr)
          Identifies sentence similarity across documents; degr sets the similarity degree. (The original description also mentions numdoc, the minimum number of documents in which a similar sentence must occur, but the current signature has no such parameter.)
 ArrayList<String> getResultDocs()
           
 ArrayList<String> getResultFileNames()
           
 cern.colt.list.DoubleArrayList getResultScores()
           
 void removeRedundancy(ArrayList<String> resultd, cern.colt.list.DoubleArrayList resultsc, ArrayList<String> resultfile)
           
(package private)  void storeScores(cern.colt.list.DoubleArrayList[] scores)
           
 
Methods inherited from class java.lang.Object
clone, equals, finalize, getClass, hashCode, notify, notifyAll, toString, wait, wait, wait
 

Field Detail

WORD_DELIMITER

private static final String WORD_DELIMITER
See Also:
Constant Field Values

parsedDocuments

private ArrayList<String>[] parsedDocuments

allscores

private cern.colt.list.DoubleArrayList[] allscores

resultdoc

private ArrayList<String> resultdoc

resultfilenames

private ArrayList<String> resultfilenames

resultscores

private cern.colt.list.DoubleArrayList resultscores

degree

private double degree

itemNames

private Object[] itemNames
Constructor Detail

MultiDocumentHandler

MultiDocumentHandler(Object[] items,
                     ArrayList<String>[] parsedDoc)
Method Detail

createAllResults

public void createAllResults(double threshold)

removeRedundancy

public void removeRedundancy(ArrayList<String> resultd,
                             cern.colt.list.DoubleArrayList resultsc,
                             ArrayList<String> resultfile)

getResultDocs

public ArrayList<String> getResultDocs()

getResultScores

public cern.colt.list.DoubleArrayList getResultScores()

getResultFileNames

public ArrayList<String> getResultFileNames()

find_similarities

void find_similarities(double degr)
Identifies sentence similarity across documents; degr sets the similarity degree. (The original description also mentions numdoc, the minimum number of documents in which a similar sentence must occur, but the current signature has no such parameter.)


compareDocuments

void compareDocuments(int d1,
                      int d2)

computeSimilarity

double computeSimilarity(String sent,
                         String sent2)

storeScores

void storeScores(cern.colt.list.DoubleArrayList[] scores)