6 package de.uni_hamburg.corpora;
9 import java.util.Collection;
12 import java.io.IOException;
13 import java.net.MalformedURLException;
14 import java.net.URISyntaxException;
15 import java.util.ArrayList;
16 import org.exmaralda.partitureditor.jexmaralda.JexmaraldaException;
17 import org.jdom.JDOMException;
18 import org.jdom.xpath.XPath;
19 import org.xml.sax.SAXException;
// Per-kind collections of the corpus contents. Each one starts out empty and
// is filled by the constructors or replaced wholesale through its setter.
// The element type is spelled out on every initializer (matching cdc below)
// so that no raw ArrayList is assigned to a parameterized Collection.
28 Collection<Metadata> metadata =
new ArrayList<Metadata>();
30 Collection<ContentData> contentdata =
new ArrayList<ContentData>();
31 Collection<Recording> recording =
new ArrayList<Recording>();
32 Collection<AdditionalData> additionaldata =
new ArrayList<AdditionalData>();
33 Collection<AnnotationSpecification> annotationspecification =
new ArrayList<AnnotationSpecification>();
34 Collection<ConfigParameters> configparameters =
new ArrayList<ConfigParameters>();
// NOTE(review): cmdidata is the only field in this group declared private;
// confirm whether the others are meant to stay package-visible.
35 private Collection<CmdiData> cmdidata =
new ArrayList<CmdiData>();
36 Collection<BasicTranscriptionData> basictranscriptiondata =
new ArrayList<BasicTranscriptionData>();
37 Collection<SegmentedTranscriptionData> segmentedtranscriptiondata =
new ArrayList<SegmentedTranscriptionData>();
// General collection of CorpusData objects; the Coma-based constructor checks
// it with contains() before processing an object.
40 Collection<CorpusData> cdc =
new ArrayList<CorpusData>();
/**
 * Creates a corpus from a Coma document and a collection of CorpusData classes.
 *
 * The visible part walks over the URLs in {@code urllist} and files each
 * resulting object into the per-kind collections according to its runtime type.
 *
 * NOTE(review): parts of this constructor are not shown here, including where
 * {@code urllist}, {@code cddd} and {@code cd} come from. Presumably the URLs
 * are the files referenced by {@code coma} and each one is read into a
 * CorpusData restricted to the classes in {@code clcds} - TODO confirm.
 *
 * NOTE(review): the throws clause names MalformedURLException three times;
 * listing it once is sufficient.
 *
 * @param coma  the Coma document the corpus is built from
 * @param clcds the CorpusData classes passed in by the caller
 */
51 public Corpus(
ComaData coma, Collection<Class<? extends CorpusData>> clcds) throws MalformedURLException, MalformedURLException, MalformedURLException, SAXException, JexmaraldaException, URISyntaxException, IOException, ClassNotFoundException, JDOMException {
61 for (URL url : urllist) {
// Only continue with an object that exists and that cdc does not hold yet.
63 if (cddd != null && !cdc.contains(cddd)) {
// Sort the object into the collection(s) for its kind.
71 if (cd instanceof ContentData) {
72 contentdata.add((ContentData) cd);
// NOTE(review): the two casts below fail with ClassCastException unless cd
// really has that type; presumably each is guarded by an instanceof check on
// a line not shown here - TODO confirm.
74 basictranscriptiondata.add((BasicTranscriptionData) cd);
76 segmentedtranscriptiondata.add((SegmentedTranscriptionData) cd);
78 }
else if (cd instanceof Recording) {
79 recording.add((Recording) cd);
80 }
else if (cd instanceof AdditionalData) {
81 additionaldata.add((AdditionalData) cd);
82 }
else if (cd instanceof Metadata) {
84 metadata.add((Metadata) cd);
// NOTE(review): as above, the CmdiData cast presumably sits behind a guard
// that is not shown here - TODO confirm.
86 cmdidata.add((CmdiData) cd);
87 }
else if (cd instanceof AnnotationSpecification) {
88 annotationspecification.add((AnnotationSpecification) cd);
89 }
else if (cd instanceof ConfigParameters) {
90 configparameters.add((ConfigParameters) cd);
/**
 * Creates a corpus from CorpusData objects that already exist.
 *
 * The visible chain files an object {@code cd} into exactly one per-kind
 * collection: the first matching {@code instanceof} test wins.
 *
 * NOTE(review): the statement that introduces {@code cd} is not shown here;
 * presumably it iterates over {@code cdc} - TODO confirm.
 *
 * NOTE(review): the throws clause names MalformedURLException three times;
 * listing it once is sufficient.
 *
 * @param cdc the CorpusData objects to build the corpus from
 */
98 public Corpus(Collection<CorpusData> cdc)
throws MalformedURLException, MalformedURLException, MalformedURLException, SAXException, JexmaraldaException {
// NOTE(review): unlike the Coma-based constructor, nothing in this chain adds
// to basictranscriptiondata or segmentedtranscriptiondata - confirm whether
// that is intended.
100 if (cd instanceof ContentData) {
101 contentdata.add((ContentData) cd);
102 }
else if (cd instanceof Recording) {
103 recording.add((Recording) cd);
104 }
else if (cd instanceof AdditionalData) {
105 additionaldata.add((AdditionalData) cd);
106 }
else if (cd instanceof Metadata) {
107 metadata.add((Metadata) cd);
108 }
else if (cd instanceof AnnotationSpecification) {
109 annotationspecification.add((AnnotationSpecification) cd);
110 }
else if (cd instanceof ConfigParameters) {
111 configparameters.add((ConfigParameters) cd);
112 }
// NOTE(review): this branch is tested after the Metadata branch. If CmdiData
// is a kind of Metadata (the Coma-based constructor adds to cmdidata inside
// its Metadata branch), it can never be reached - verify the type hierarchy.
else if (cd instanceof
CmdiData) {
113 cmdidata.add((CmdiData) cd);
136 return additionaldata;
140 return annotationspecification;
144 return configparameters;
152 return basictranscriptiondata;
156 return segmentedtranscriptiondata;
164 this.metadata = metadata;
168 this.contentdata = contentdata;
172 this.recording = recording;
176 this.additionaldata = additionaldata;
180 this.annotationspecification = annotationspecification;
184 this.configparameters = configparameters;
187 public void setCdc(Collection<CorpusData> cdc) {
192 this.cmdidata = cmdidata;
196 this.basictranscriptiondata = basictranscriptions;
200 this.segmentedtranscriptiondata = segmentedtranscriptions;
204 this.comadata = coma;
208 return basedirectory;
/**
 * Reports a corpus-wide total read from the Coma document, as a decimal string.
 *
 * Evaluates an XPath {@code sum()} over every
 * {@code Transcription/Description/Key} element whose {@code Name} attribute
 * is {@code # HIAT:u}, using the object returned by {@code comadata.getJdom()}
 * as context. Presumably these keys hold per-transcription utterance counts -
 * TODO confirm against the Coma schema.
 *
 * @return the sum, cut down to an {@code int} and rendered as a string
 * @throws JDOMException declared for the XPath calls made here
 */
220 String getCorpusSentenceNumber()
throws JDOMException {
221 XPath xpath = XPath.newInstance(
"sum(//Transcription/Description/Key[@Name = '# HIAT:u'])");
// The cast requires the XPath result to be a Double; any other result fails
// at runtime.
222 double DoubleValue = (double) xpath.selectSingleNode(comadata.
getJdom());
// Narrowing cast: any fractional part is dropped (rounds toward zero).
223 int IntValue = (int) DoubleValue;
224 return "" + IntValue;
/**
 * Reports a count read from the Coma document, as a decimal string.
 *
 * Evaluates an XPath {@code count()} over every
 * {@code Transcription/Description/Key} element whose {@code Name} attribute
 * is {@code segmented} and whose text is {@code false}, using the object
 * returned by {@code comadata.getJdom()} as context. Presumably there is one
 * such key per non-segmented transcription - TODO confirm.
 *
 * @return the count rendered as a string
 * @throws JDOMException declared for the XPath calls made here
 */
227 String getCorpusTranscriptionNumber()
throws JDOMException {
228 XPath xpath = XPath.newInstance(
"count(//Transcription/Description/Key[@Name = 'segmented' and text() = 'false'])");
// The cast requires the XPath result to be a Double; any other result fails
// at runtime.
229 double DoubleValue = (double) xpath.selectSingleNode(comadata.
getJdom());
// count() yields a whole number, so this cast only changes the type.
230 int IntValue = (int) DoubleValue;
231 return "" + IntValue;
/**
 * Reports how many {@code Speaker} elements the Coma document contains, as a
 * decimal string.
 *
 * Evaluates the XPath {@code count(//Speaker)} using the object returned by
 * {@code comadata.getJdom()} as context.
 *
 * @return the count rendered as a string
 * @throws JDOMException declared for the XPath calls made here
 */
234 String getCorpusSpeakerNumber()
throws JDOMException {
235 XPath xpath = XPath.newInstance(
"count(//Speaker)");
// The cast requires the XPath result to be a Double; any other result fails
// at runtime.
236 double DoubleValue = (double) xpath.selectSingleNode(comadata.
getJdom());
// count() yields a whole number, so this cast only changes the type.
237 int IntValue = (int) DoubleValue;
238 return "" + IntValue;
/**
 * Reports how many {@code Communication} elements the Coma document contains,
 * as a decimal string.
 *
 * Evaluates the XPath {@code count(//Communication)} using the object returned
 * by {@code comadata.getJdom()} as context.
 *
 * @return the count rendered as a string
 * @throws JDOMException declared for the XPath calls made here
 */
241 String getCorpusCommunicationNumber()
throws JDOMException {
242 XPath xpath = XPath.newInstance(
"count(//Communication)");
// The cast requires the XPath result to be a Double; any other result fails
// at runtime.
243 double DoubleValue = (double) xpath.selectSingleNode(comadata.
getJdom());
// count() yields a whole number, so this cast only changes the type.
244 int IntValue = (int) DoubleValue;
245 return "" + IntValue;
/**
 * Reports a corpus-wide total read from the Coma document, as a decimal string.
 *
 * Evaluates an XPath {@code sum()} over every
 * {@code Transcription/Description/Key} element whose {@code Name} attribute
 * is {@code # HIAT:w}, using the object returned by {@code comadata.getJdom()}
 * as context. Presumably these keys hold per-transcription word counts -
 * TODO confirm against the Coma schema.
 *
 * @return the sum, cut down to an {@code int} and rendered as a string
 * @throws JDOMException declared for the XPath calls made here
 */
248 String getCorpusWords()
throws JDOMException {
249 XPath xpath = XPath.newInstance(
"sum(//Transcription/Description/Key[@Name = '# HIAT:w'])");
// The cast requires the XPath result to be a Double; any other result fails
// at runtime.
250 double DoubleValue = (double) xpath.selectSingleNode(comadata.
getJdom());
// Narrowing cast: any fractional part is dropped (rounds toward zero).
251 int IntValue = (int) DoubleValue;
252 return "" + IntValue;
void setRecording(Collection< Recording > recording)
Collection< URL > getReferencedCorpusDataURLs()
void setConfigparameters(Collection< ConfigParameters > configparameters)
Collection< ContentData > getContentdata()
Collection< Metadata > getMetadata()
void setCdc(Collection< CorpusData > cdc)
Collection< AnnotationSpecification > getAnnotationspecification()
void setCorpusName(String s)
Corpus(Collection< CorpusData > cdc)
void setAdditionaldata(Collection< AdditionalData > additionaldata)
Collection< CorpusData > getCorpusData()
void setContentdata(Collection< ContentData > contentdata)
CorpusData readFileURL(URL url, Collection< Class<?extends CorpusData >> clcds)
Collection< AdditionalData > getAdditionaldata()
Corpus(ComaData coma, Collection< Class<?extends CorpusData >> clcds)
Collection< CmdiData > getCmdidata()
Collection< ConfigParameters > getConfigparameters()
Collection< Recording > getRecording()
void setMetadata(Collection< Metadata > metadata)
void setBasicTranscriptionData(Collection< BasicTranscriptionData > basictranscriptions)
Collection< BasicTranscriptionData > getBasicTranscriptionData()
void setCmdidata(Collection< CmdiData > cmdidata)
Collection< SegmentedTranscriptionData > getSegmentedTranscriptionData()
void setSegmentedTranscriptionData(Collection< SegmentedTranscriptionData > segmentedtranscriptions)
void setAnnotationspecification(Collection< AnnotationSpecification > annotationspecification)
void setComaData(ComaData coma)