6 package de.uni_hamburg.corpora;
9 import java.io.IOException;
11 import java.net.URISyntaxException;
13 import java.nio.file.Files;
14 import java.nio.file.Paths;
15 import java.util.Collection;
16 import java.util.logging.Level;
17 import java.util.logging.Logger;
18 import javax.xml.parsers.ParserConfigurationException;
19 import javax.xml.transform.TransformerException;
20 import javax.xml.xpath.XPathExpressionException;
21 import org.apache.commons.io.FilenameUtils;
22 import org.jdom.Document;
23 import org.jdom.JDOMException;
24 import org.jdom.input.SAXBuilder;
25 import org.xml.sax.SAXException;
35 String originalstring;
38 String filenamewithoutending;
// Parse the resource at url into a JDOM document and keep it in jdom.
// NOTE(review): the builder is used with its default configuration; if url can
// point at untrusted XML, DTD/external-entity handling should be checked - confirm.
47 SAXBuilder builder =
new SAXBuilder();
48 jdom = builder.build(url);
// Keep the raw file content, decoded as UTF-8, next to the parsed tree.
// NOTE(review): Paths.get(URI) only resolves URIs whose scheme has an installed
// file-system provider (e.g. file:); for other schemes it throws an unchecked
// exception that none of the catch clauses below handle - confirm url is always
// a local file.
49 originalstring =
new String(Files.readAllBytes(Paths.get(url.toURI())),
"UTF-8");
// Derive the containing location: a path ending in "/" is resolved against ".."
// (one level up), any other path against "." (the directory holding the file).
50 URI uri = url.toURI();
51 URI parentURI = uri.getPath().endsWith(
"/") ? uri.resolve(
"..") : uri.resolve(
".");
52 parenturl = parentURI.toURL();
// File name with and without its extension, both taken from the URL path.
53 filename = FilenameUtils.getName(url.getPath());
54 filenamewithoutending = FilenameUtils.getBaseName(url.getPath());
55 }
catch (JDOMException ex) {
// All three handlers do the same thing: log the exception at SEVERE with no
// message text. Nothing is rethrown in the lines visible here, so any field not
// yet assigned above keeps its previous value after a failure.
// NOTE(review): confirm callers tolerate a partially initialised object.
56 Logger.getLogger(
CmdiData.class.getName()).log(Level.SEVERE, null, ex);
57 }
catch (IOException ex) {
58 Logger.getLogger(
CmdiData.class.getName()).log(Level.SEVERE, null, ex);
59 }
catch (URISyntaxException ex) {
60 Logger.getLogger(
CmdiData.class.getName()).log(Level.SEVERE, null, ex);
/**
 * Returns the saveable string form of this data, which is exactly the result
 * of {@code toPrettyPrintedXML()}.
 *
 * The checked exceptions in the throws clause match the ones declared by
 * {@code toPrettyPrintedXML()}; this method adds no handling of its own.
 *
 * @return the string returned by {@code toPrettyPrintedXML()}
 */
70 public String
toSaveableString() throws TransformerException, ParserConfigurationException, SAXException, IOException, XPathExpressionException {
71 return toPrettyPrintedXML();
76 return originalstring;
79 private String toPrettyPrintedXML()
throws TransformerException, ParserConfigurationException, SAXException, IOException, XPathExpressionException {
83 return prettyCorpusData;
88 originalstring = newUnformattedString;
128 return filenamewithoutending;
133 filenamewithoutending = s;
138 throw new UnsupportedOperationException(
"Not supported yet.");
Collection< URL > getReferencedCorpusDataURLs()
void setFilenameWithoutFileEnding(String s)
void setJdom(Document doc)
String indent(String xml, String suppressedElements)
void setFilename(String s)
void updateUnformattedString(String newUnformattedString)
String toUnformattedString()
String toSaveableString()
void setParentURL(URL url)
String getFilenameWithoutFileEnding()