at.tuwien.ifs.somtoolbox.summarisation.parser
Class SentenceParser

java.lang.Object
  extended by at.tuwien.ifs.somtoolbox.summarisation.parser.SentenceParser

public class SentenceParser
extends java.lang.Object

Version:
$Id: SentenceParser.java 3590 2010-05-21 10:43:45Z mayer $
Author:
Julius Penaranda

Field Summary
private  DocumentParser docparser
           
private  java.util.ArrayList<java.lang.String> filenames
           
private  HeadlineTextParser headtextparser
           
private  int numDocs
           
 java.util.ArrayList<java.lang.String>[] parsedDocuments
           
private  java.lang.String prefix
           
 
Constructor Summary
SentenceParser(java.lang.Object[] itemNames)
           
 
Method Summary
(package private)  java.lang.String delete_tags(java.lang.String line)
          Deletes tags within a Web document.
 void find_parse_Document(java.lang.String name)
           
 java.lang.String findSentence(java.lang.String line, java.util.ArrayList<java.lang.String> parseddoc)
          Finds a sentence within the given String and adds it to parseddoc.
 java.util.ArrayList<java.lang.String> getFileNames()
           
 java.util.ArrayList<java.lang.String>[] getParsedDocuments()
           
private  java.util.ArrayList<java.lang.String> parseDocument(java.io.File document)
           
 void setFileNamePrefix(java.lang.String fnprefix)
           
 
Methods inherited from class java.lang.Object
clone, equals, finalize, getClass, hashCode, notify, notifyAll, toString, wait, wait, wait
 

Field Detail

prefix

private java.lang.String prefix

parsedDocuments

public java.util.ArrayList<java.lang.String>[] parsedDocuments

numDocs

private int numDocs

filenames

private java.util.ArrayList<java.lang.String> filenames

headtextparser

private HeadlineTextParser headtextparser

docparser

private DocumentParser docparser
Constructor Detail

SentenceParser

public SentenceParser(java.lang.Object[] itemNames)
Method Detail

setFileNamePrefix

public void setFileNamePrefix(java.lang.String fnprefix)

find_parse_Document

public void find_parse_Document(java.lang.String name)

parseDocument

private java.util.ArrayList<java.lang.String> parseDocument(java.io.File document)
                                                     throws java.io.IOException
Throws:
java.io.IOException

findSentence

public java.lang.String findSentence(java.lang.String line,
                                     java.util.ArrayList<java.lang.String> parseddoc)
Finds a sentence within the given String and adds it to parseddoc.


delete_tags

java.lang.String delete_tags(java.lang.String line)
Deletes tags within a Web document.

Parameters:
line - the String from which tags are deleted
Returns:
String

getParsedDocuments

public java.util.ArrayList<java.lang.String>[] getParsedDocuments()

getFileNames

public java.util.ArrayList<java.lang.String> getFileNames()