at.tuwien.ifs.somtoolbox.summarisation.parser
Class SentenceParser
java.lang.Object
at.tuwien.ifs.somtoolbox.summarisation.parser.SentenceParser
public class SentenceParser
- extends java.lang.Object
- Version:
- $Id: SentenceParser.java 3590 2010-05-21 10:43:45Z mayer $
- Author:
- Julius Penaranda
Method Summary |
(package private) java.lang.String |
delete_tags(java.lang.String line)
deletes tags within a Web document |
void |
find_parse_Document(java.lang.String name)
|
java.lang.String |
findSentence(java.lang.String line,
java.util.ArrayList<java.lang.String> parseddoc)
finds a sentence within the String and adds it to parseddoc |
java.util.ArrayList<java.lang.String> |
getFileNames()
|
java.util.ArrayList<java.lang.String>[] |
getParsedDocuments()
|
private java.util.ArrayList<java.lang.String> |
parseDocument(java.io.File document)
|
void |
setFileNamePrefix(java.lang.String fnprefix)
|
Methods inherited from class java.lang.Object |
clone, equals, finalize, getClass, hashCode, notify, notifyAll, toString, wait, wait, wait |
prefix
private java.lang.String prefix
parsedDocuments
public java.util.ArrayList<java.lang.String>[] parsedDocuments
numDocs
private int numDocs
filenames
private java.util.ArrayList<java.lang.String> filenames
headtextparser
private HeadlineTextParser headtextparser
docparser
private DocumentParser docparser
SentenceParser
public SentenceParser(java.lang.Object[] itemNames)
setFileNamePrefix
public void setFileNamePrefix(java.lang.String fnprefix)
find_parse_Document
public void find_parse_Document(java.lang.String name)
parseDocument
private java.util.ArrayList<java.lang.String> parseDocument(java.io.File document)
throws java.io.IOException
- Throws:
java.io.IOException
findSentence
public java.lang.String findSentence(java.lang.String line,
java.util.ArrayList<java.lang.String> parseddoc)
- finds a sentence within the String and adds it to parseddoc
delete_tags
java.lang.String delete_tags(java.lang.String line)
- deletes tags within a Web document
- Parameters:
line
- String
- Returns:
- String
getParsedDocuments
public java.util.ArrayList<java.lang.String>[] getParsedDocuments()
getFileNames
public java.util.ArrayList<java.lang.String> getFileNames()