public abstract class AbstractDocumentFactory extends java.lang.Object implements IDocumentFactory
Modifier and Type | Class and Description |
---|---|
static class |
AbstractDocumentFactory.Cache<T>
Cache of objects (by sentence index)
|
Modifier and Type | Field and Description |
---|---|
protected AbstractDocumentFactory.Cache<edu.stanford.nlp.trees.GrammaticalStructure> |
grammaticalStructures
Grammatical structure cache
|
protected Language |
language
Language
|
protected AbstractDocumentFactory.Cache<edu.stanford.nlp.trees.Tree> |
parseTrees
Parse tree cache
|
protected RelationDependentsDirectFactory |
relationDependentsDirectFactory
Relation dependents factory
|
private static boolean |
relationDependentsFromGrammaticalStructure
Build relation dependents from GrammaticalStructure
|
private java.util.List<SentenceSegment> |
sentenceSegments
Sentence segments
|
private static boolean |
stanfordMode
XML mode (Stanford|GrammarScope)
|
protected java.lang.String |
text
Text
|
protected AbstractDocumentFactory.Cache<java.util.List<Token>> |
tokens
Tokens
|
protected java.util.Map<TypedDependencyMode,AbstractDocumentFactory.Cache<java.util.Collection<edu.stanford.nlp.trees.TypedDependency>>> |
typedDependencies
Typed dependency cache
|
protected java.util.Map<TypedDependencyMode,AbstractDocumentFactory.Cache<java.util.Collection<edu.stanford.nlp.trees.TypedDependency>>> |
typedDependencies2
Typed dependency cache (workflow 2)
|
private java.util.List<WordSegment> |
wordSegments
Word segments
|
static XMLPrinter |
xMLPrinter
XML printer
|
Constructor and Description |
---|
AbstractDocumentFactory(Language language)
Constructor
|
Modifier and Type | Method and Description |
---|---|
private static java.lang.String |
coreferencesToString(Coreferences coreferences,
boolean isXml)
Coreferences to string
|
private static java.lang.String |
entailmentsToString(java.util.List<Entailment> entailments,
boolean isXml)
Entailments to string
|
private static java.util.List<WordSegment> |
flatten(java.util.List<java.util.List<WordSegment>> sentenceWordSegments)
Flatten hierarchical list of per-sentence word segments
|
AAnalysis |
getAnalysis(int sentenceIdx)
Get (sentence) analysis artifact
|
ACoreferences |
getCoreferences()
Get coreferences artifact
|
java.util.List<Entailment> |
getEntailments(int sentenceIdx)
Get entailments
|
AGrammaticalStructure |
getGrammaticalStructure(int sentenceIdx)
Get grammatical structure artifact
|
ANamedEntities |
getNamedEntities(int sentenceIdx)
Get named entities artifact
|
AParseTree |
getParseTree(int sentenceIdx)
Get parse artifact
|
APartsOfSpeech |
getPoses(int sentenceIdx)
Get parts-of-speech artifact
|
ARelationDependents |
getRelationDependents(int sentenceIdx)
Get relation dependents artifact
|
java.lang.String |
getReport(int sentenceIdx,
boolean xMLFlag)
Get (sentence) analysis string
|
java.lang.String[] |
getReports(int sentenceIdx,
boolean xMLFlag)
Get (sentence) analysis strings
|
protected abstract Segmentation |
getSegmentation()
Get segmentation
|
ASemanticGraph |
getSemanticGraph(int sentenceIdx,
TypedDependencyProvider provider,
TypedDependencyMode mode)
Get semantic graph artifact
|
java.util.Map<TypedDependencyProvider,java.util.Map<TypedDependencyMode,ASemanticGraph>> |
getSemanticGraphs(int sentenceIdx)
Get semantic graph artifacts
|
int |
getSentenceCount()
Get sentence count
|
java.util.List<SentenceSegment> |
getSentences()
Get sentences
|
Sentiment |
getSentiment(int sentenceIdx)
Get sentiment
|
private static Segment |
getSpan(java.util.List<? extends Segment> segments)
Span
|
protected abstract Coreferences |
getStanfordCoreferences()
Get coreferences
|
protected abstract java.util.List<Entailment> |
getStanfordEntailments(int sentenceIdx)
Get entailments
|
protected abstract edu.stanford.nlp.trees.GrammaticalStructure |
getStanfordGrammaticalStructure(int sentenceIdx)
Get grammatical structure
|
protected abstract java.util.List<NamedEntity> |
getStanfordNamedEntities(int sentenceIdx)
Get named entities
|
protected abstract edu.stanford.nlp.trees.Tree |
getStanfordParseTree(int sentenceIdx)
Get parse tree
|
protected abstract edu.stanford.nlp.semgraph.SemanticGraph |
getStanfordSemanticGraph(int sentenceIdx,
TypedDependencyMode mode)
Get semantic graph
|
protected abstract edu.stanford.nlp.semgraph.SemanticGraph |
getStanfordSemanticGraph2(int sentenceIdx,
TypedDependencyMode mode)
Get semantic graph (workflow 2)
|
protected abstract Sentiment |
getStanfordSentiment(int sentenceIdx)
Get sentiment
|
protected abstract java.util.List<Triple> |
getStanfordTriples(int sentenceIdx)
Get triples
|
protected abstract java.util.Collection<edu.stanford.nlp.trees.TypedDependency> |
getStanfordTypedDependencies(int sentenceIdx,
TypedDependencyMode mode)
Get typed dependencies
|
protected abstract java.util.Collection<edu.stanford.nlp.trees.TypedDependency> |
getStanfordTypedDependencies2(int sentenceIdx,
TypedDependencyMode mode)
Get typed dependencies (workflow 2)
|
abstract TypedDependencyMode[] |
getSupportedModes()
Get supported typed dependency modes
|
abstract TypedDependencyProvider[] |
getSupportedProviders()
Get supported typed dependency providers
|
java.lang.String |
getText()
Get text
|
ATextAnalysis |
getTextAnalysis(TypedDependencyProvider provider,
TypedDependencyMode mode)
Get text analysis
|
java.lang.String |
getTextReport(TypedDependencyProvider provider,
TypedDependencyMode mode,
boolean xMLModeFlag)
Get text report
|
java.lang.String[] |
getTextReports(TypedDependencyProvider provider,
TypedDependencyMode mode,
boolean xMLModeFlag)
Get text reports
|
abstract java.util.List<Token> |
getTokens(int sentenceIdx)
Get tokens
|
java.util.List<Triple> |
getTriples(int sentenceIdx)
Get triples
|
java.util.Map<TypedDependencyProvider,java.util.Map<TypedDependencyMode,ATypedDependencies>> |
getTypedDependencies(int sentenceIdx)
Get typed dependencies artifact
|
ATypedDependencies |
getTypedDependencies(int sentenceIdx,
TypedDependencyProvider provider,
TypedDependencyMode mode)
Get typed dependencies artifact
|
java.util.List<WordSegment> |
getWords()
Get words
|
private static java.lang.String |
grammaticalStructureToString(edu.stanford.nlp.trees.GrammaticalStructure grammaticalStructure,
boolean isXml)
Grammatical structure to string
|
private static java.util.List<SentenceSegment> |
groupToSentence(java.util.List<java.util.List<WordSegment>> sentenceWordSegments)
Make sentence segments and map : returns (list of segments, segment to list of words map)
|
boolean |
init(java.lang.String text)
Init processing
|
private java.util.Map<TypedDependencyMode,edu.stanford.nlp.semgraph.SemanticGraph> |
makeSemanticGraphs(int sentenceIdx)
Make semantic graphs
|
private java.util.Map<TypedDependencyMode,edu.stanford.nlp.semgraph.SemanticGraph> |
makeSemanticGraphs2(int sentenceIdx)
Make semantic graphs (workflow 2)
|
private java.util.Map<TypedDependencyMode,java.util.Collection<edu.stanford.nlp.trees.TypedDependency>> |
makeTypedDependencies(int sentenceIdx)
Make typed dependencies
|
private java.util.Map<TypedDependencyMode,java.util.Collection<edu.stanford.nlp.trees.TypedDependency>> |
makeTypedDependencies2(int sentenceIdx)
Make typed dependencies (workflow 2)
|
private static java.lang.String |
namedEntitiesToString(java.util.List<NamedEntity> namedEntities,
java.lang.String sentenceString,
SentenceSegment sentenceSegment,
boolean isXml)
Named entities to string
|
private static java.lang.String |
semanticGraphsToString(java.util.Map<TypedDependencyMode,edu.stanford.nlp.semgraph.SemanticGraph> semanticGraphs,
TypedDependencyProvider provider,
boolean isXml)
Semantic graphs to string
|
private static java.lang.String |
sentimentToString(Sentiment sentiment,
boolean isXml)
Sentiment to string
|
private static java.lang.String |
tokensToString(java.util.List<Token> tokens,
java.lang.String tokenizer,
boolean isXml)
Tokens to string
|
private static java.lang.String |
treeToString(edu.stanford.nlp.trees.Tree parseTree,
boolean isXml)
Parse tree to string
|
private static java.lang.String |
triplesToString(java.util.List<Triple> triples,
boolean isXml)
Triples to string
|
private static java.lang.String |
typedDependenciesToString(java.util.Map<TypedDependencyMode,java.util.Collection<edu.stanford.nlp.trees.TypedDependency>> typedDependencies,
TypedDependencyProvider provider,
boolean isXML)
Typed dependencies to string
|
private static final boolean stanfordMode
private static final boolean relationDependentsFromGrammaticalStructure
public static final XMLPrinter xMLPrinter
protected final Language language
protected java.lang.String text
private java.util.List<WordSegment> wordSegments
private java.util.List<SentenceSegment> sentenceSegments
protected final RelationDependentsDirectFactory relationDependentsDirectFactory
protected final AbstractDocumentFactory.Cache<java.util.List<Token>> tokens
protected final AbstractDocumentFactory.Cache<edu.stanford.nlp.trees.Tree> parseTrees
protected final AbstractDocumentFactory.Cache<edu.stanford.nlp.trees.GrammaticalStructure> grammaticalStructures
protected final java.util.Map<TypedDependencyMode,AbstractDocumentFactory.Cache<java.util.Collection<edu.stanford.nlp.trees.TypedDependency>>> typedDependencies
protected final java.util.Map<TypedDependencyMode,AbstractDocumentFactory.Cache<java.util.Collection<edu.stanford.nlp.trees.TypedDependency>>> typedDependencies2
public AbstractDocumentFactory(Language language)
language
- language
public boolean init(java.lang.String text)
IDocumentFactory
init
in interface IDocumentFactory
text
- input text
protected abstract Segmentation getSegmentation() throws java.lang.RuntimeException
java.lang.RuntimeException
- exception
public abstract java.util.List<Token> getTokens(int sentenceIdx) throws java.lang.RuntimeException
getTokens
in interface IDocumentFactoryService
sentenceIdx
- sentence index
java.lang.RuntimeException
- exception
protected abstract edu.stanford.nlp.trees.Tree getStanfordParseTree(int sentenceIdx) throws java.lang.RuntimeException
sentenceIdx
- sentence index
java.lang.RuntimeException
- exception
protected abstract edu.stanford.nlp.trees.GrammaticalStructure getStanfordGrammaticalStructure(int sentenceIdx) throws java.lang.RuntimeException
sentenceIdx
- sentence index
java.lang.RuntimeException
protected abstract java.util.Collection<edu.stanford.nlp.trees.TypedDependency> getStanfordTypedDependencies(int sentenceIdx, TypedDependencyMode mode) throws java.lang.RuntimeException
sentenceIdx
- sentence index
mode
- typed dependency mode
java.lang.RuntimeException
- exception
protected abstract java.util.Collection<edu.stanford.nlp.trees.TypedDependency> getStanfordTypedDependencies2(int sentenceIdx, TypedDependencyMode mode) throws java.lang.RuntimeException
sentenceIdx
- sentence index
mode
- typed dependency mode
java.lang.RuntimeException
- exception
protected abstract edu.stanford.nlp.semgraph.SemanticGraph getStanfordSemanticGraph(int sentenceIdx, TypedDependencyMode mode) throws java.lang.RuntimeException
sentenceIdx
- sentence index
mode
- typed dependency mode
java.lang.RuntimeException
protected abstract edu.stanford.nlp.semgraph.SemanticGraph getStanfordSemanticGraph2(int sentenceIdx, TypedDependencyMode mode) throws java.lang.RuntimeException
sentenceIdx
- sentence index
mode
- typed dependency mode
java.lang.RuntimeException
public abstract TypedDependencyProvider[] getSupportedProviders() throws java.lang.RuntimeException
getSupportedProviders
in interface IDocumentFactoryService
java.lang.RuntimeException
- exception
public abstract TypedDependencyMode[] getSupportedModes() throws java.lang.RuntimeException
getSupportedModes
in interface IDocumentFactoryService
java.lang.RuntimeException
- exception
protected abstract java.util.List<NamedEntity> getStanfordNamedEntities(int sentenceIdx) throws java.lang.RuntimeException
sentenceIdx
- sentence index
java.lang.RuntimeException
- exception
protected abstract Sentiment getStanfordSentiment(int sentenceIdx)
sentenceIdx
- sentence index
protected abstract java.util.List<Entailment> getStanfordEntailments(int sentenceIdx)
sentenceIdx
- sentence index
protected abstract java.util.List<Triple> getStanfordTriples(int sentenceIdx)
sentenceIdx
- sentence index
protected abstract Coreferences getStanfordCoreferences() throws java.lang.RuntimeException
java.lang.RuntimeException
public java.lang.String getText() throws java.lang.RuntimeException
IDocumentFactoryService
getText
in interface IDocumentFactoryService
java.lang.RuntimeException
public java.util.List<SentenceSegment> getSentences() throws java.lang.RuntimeException
IDocumentFactoryService
getSentences
in interface IDocumentFactoryService
java.lang.RuntimeException
public int getSentenceCount() throws java.lang.RuntimeException
IDocumentFactoryService
getSentenceCount
in interface IDocumentFactoryService
java.lang.RuntimeException
public java.util.List<WordSegment> getWords() throws java.lang.RuntimeException
IDocumentFactoryService
getWords
in interface IDocumentFactoryService
java.lang.RuntimeException
private static java.util.List<SentenceSegment> groupToSentence(java.util.List<java.util.List<WordSegment>> sentenceWordSegments)
sentenceWordSegments
- list of sentences
private static java.util.List<WordSegment> flatten(java.util.List<java.util.List<WordSegment>> sentenceWordSegments)
sentenceWordSegments
- hierarchical list of per-sentence word segments
private static Segment getSpan(java.util.List<? extends Segment> segments)
segments
- segments
public AParseTree getParseTree(int sentenceIdx) throws java.lang.RuntimeException
IDocumentFactoryService
getParseTree
in interface IDocumentFactoryService
sentenceIdx
- sentence index
java.lang.RuntimeException
public APartsOfSpeech getPoses(int sentenceIdx) throws java.lang.RuntimeException
IDocumentFactoryService
getPoses
in interface IDocumentFactoryService
sentenceIdx
- sentence index
java.lang.RuntimeException
public AGrammaticalStructure getGrammaticalStructure(int sentenceIdx) throws java.lang.RuntimeException
IDocumentFactoryService
getGrammaticalStructure
in interface IDocumentFactoryService
sentenceIdx
- sentence index
java.lang.RuntimeException
public ARelationDependents getRelationDependents(int sentenceIdx) throws java.lang.RuntimeException
getRelationDependents
in interface IDocumentFactoryService
sentenceIdx
- sentence index
java.lang.RuntimeException
public ATypedDependencies getTypedDependencies(int sentenceIdx, TypedDependencyProvider provider, TypedDependencyMode mode) throws java.lang.RuntimeException
IDocumentFactoryService
getTypedDependencies
in interface IDocumentFactoryService
sentenceIdx
- sentence index
provider
- typed dependency provider
mode
- typed dependency mode
java.lang.RuntimeException
public java.util.Map<TypedDependencyProvider,java.util.Map<TypedDependencyMode,ATypedDependencies>> getTypedDependencies(int sentenceIdx) throws java.lang.RuntimeException
IDocumentFactoryService
getTypedDependencies
in interface IDocumentFactoryService
sentenceIdx
- sentence index
java.lang.RuntimeException
public ASemanticGraph getSemanticGraph(int sentenceIdx, TypedDependencyProvider provider, TypedDependencyMode mode) throws java.lang.RuntimeException
IDocumentFactoryService
getSemanticGraph
in interface IDocumentFactoryService
sentenceIdx
- sentence index
provider
- typed dependency provider
mode
- typed dependency mode
java.lang.RuntimeException
public java.util.Map<TypedDependencyProvider,java.util.Map<TypedDependencyMode,ASemanticGraph>> getSemanticGraphs(int sentenceIdx) throws java.lang.RuntimeException
IDocumentFactoryService
getSemanticGraphs
in interface IDocumentFactoryService
sentenceIdx
- sentence index
java.lang.RuntimeException
public ANamedEntities getNamedEntities(int sentenceIdx) throws java.lang.RuntimeException
IDocumentFactoryService
getNamedEntities
in interface IDocumentFactoryService
sentenceIdx
- sentence index
java.lang.RuntimeException
public Sentiment getSentiment(int sentenceIdx) throws java.lang.RuntimeException
IDocumentFactoryService
getSentiment
in interface IDocumentFactoryService
sentenceIdx
- sentence index
java.lang.RuntimeException
public java.util.List<Entailment> getEntailments(int sentenceIdx)
IDocumentFactoryService
getEntailments
in interface IDocumentFactoryService
sentenceIdx
- sentence index
public java.util.List<Triple> getTriples(int sentenceIdx)
IDocumentFactoryService
getTriples
in interface IDocumentFactoryService
sentenceIdx
- sentence index
public ACoreferences getCoreferences() throws java.lang.RuntimeException
IDocumentFactoryService
getCoreferences
in interface IDocumentFactoryService
java.lang.RuntimeException
public ATextAnalysis getTextAnalysis(TypedDependencyProvider provider, TypedDependencyMode mode) throws java.lang.RuntimeException
IDocumentFactoryService
getTextAnalysis
in interface IDocumentFactoryService
provider
- provider
mode
- mode
java.lang.RuntimeException
public AAnalysis getAnalysis(int sentenceIdx) throws java.lang.RuntimeException
IDocumentFactoryService
getAnalysis
in interface IDocumentFactoryService
sentenceIdx
- sentence index
java.lang.RuntimeException
private java.util.Map<TypedDependencyMode,java.util.Collection<edu.stanford.nlp.trees.TypedDependency>> makeTypedDependencies(int sentenceIdx)
sentenceIdx
- sentence index
private java.util.Map<TypedDependencyMode,java.util.Collection<edu.stanford.nlp.trees.TypedDependency>> makeTypedDependencies2(int sentenceIdx)
sentenceIdx
- sentence index
private java.util.Map<TypedDependencyMode,edu.stanford.nlp.semgraph.SemanticGraph> makeSemanticGraphs(int sentenceIdx)
sentenceIdx
- sentence index
private java.util.Map<TypedDependencyMode,edu.stanford.nlp.semgraph.SemanticGraph> makeSemanticGraphs2(int sentenceIdx)
sentenceIdx
- sentence index
public java.lang.String[] getReports(int sentenceIdx, boolean xMLFlag) throws java.lang.RuntimeException
IDocumentFactoryService
getReports
in interface IDocumentFactoryService
sentenceIdx
- sentence index
xMLFlag
- XML format requested
java.lang.RuntimeException
public java.lang.String getReport(int sentenceIdx, boolean xMLFlag) throws java.lang.RuntimeException
IDocumentFactoryService
getReport
in interface IDocumentFactoryService
sentenceIdx
- sentence index
xMLFlag
- XML format requested
java.lang.RuntimeException
public java.lang.String getTextReport(TypedDependencyProvider provider, TypedDependencyMode mode, boolean xMLModeFlag) throws java.lang.RuntimeException
getTextReport
in interface IDocumentFactoryService
provider
- typed dependency provider
mode
- typed dependency mode
xMLModeFlag
- xml form
java.lang.RuntimeException
- exception
public java.lang.String[] getTextReports(TypedDependencyProvider provider, TypedDependencyMode mode, boolean xMLModeFlag) throws java.lang.RuntimeException
getTextReports
in interface IDocumentFactoryService
provider
- typed dependency provider
mode
- typed dependency mode
xMLModeFlag
- xml form
java.lang.RuntimeException
- exception
private static java.lang.String tokensToString(java.util.List<Token> tokens, java.lang.String tokenizer, boolean isXml)
tokens
- tokens
tokenizer
- tokenizer
isXml
- xml format
private static java.lang.String treeToString(edu.stanford.nlp.trees.Tree parseTree, boolean isXml)
parseTree
- parse tree
isXml
- xml format
private static java.lang.String grammaticalStructureToString(edu.stanford.nlp.trees.GrammaticalStructure grammaticalStructure, boolean isXml)
grammaticalStructure
- grammatical structure
isXml
- xml format
private static java.lang.String typedDependenciesToString(java.util.Map<TypedDependencyMode,java.util.Collection<edu.stanford.nlp.trees.TypedDependency>> typedDependencies, TypedDependencyProvider provider, boolean isXML)
typedDependencies
- typed dependencies
isXML
- xml format
provider
- provider
private static java.lang.String semanticGraphsToString(java.util.Map<TypedDependencyMode,edu.stanford.nlp.semgraph.SemanticGraph> semanticGraphs, TypedDependencyProvider provider, boolean isXml)
semanticGraphs
- semantic graphs
provider
- provider
isXml
- xml format
private static java.lang.String namedEntitiesToString(java.util.List<NamedEntity> namedEntities, java.lang.String sentenceString, SentenceSegment sentenceSegment, boolean isXml)
namedEntities
- named entities
sentenceString
- sentence string
sentenceSegment
- sentence segment
isXml
- xml format
private static java.lang.String sentimentToString(Sentiment sentiment, boolean isXml)
sentiment
- sentiment
isXml
- xml format
private static java.lang.String entailmentsToString(java.util.List<Entailment> entailments, boolean isXml)
entailments
- entailments
isXml
- xml format
private static java.lang.String triplesToString(java.util.List<Triple> triples, boolean isXml)
triples
- triples
isXml
- xml format
private static java.lang.String coreferencesToString(Coreferences coreferences, boolean isXml)
coreferences
- coreferences
isXml
- xml format