From 1f1ae852cc030c48c58b1f4ca3fbf15c9c4ef588 Mon Sep 17 00:00:00 2001 From: Slava Krauchanka Date: Tue, 11 Dec 2018 14:29:42 +0100 Subject: [PATCH] using a local entity resolver, if possible --- src/main/java/be/ugent/rml/records/XML.java | 22 +++++++++++++++++++++ 1 file changed, 22 insertions(+) diff --git a/src/main/java/be/ugent/rml/records/XML.java b/src/main/java/be/ugent/rml/records/XML.java index 52130df0..fef1cf50 100644 --- a/src/main/java/be/ugent/rml/records/XML.java +++ b/src/main/java/be/ugent/rml/records/XML.java @@ -16,8 +16,28 @@ import java.util.ArrayList; import java.util.List; +import org.xml.sax.EntityResolver; +import org.xml.sax.InputSource; +import org.xml.sax.SAXException; + public class XML extends IteratorFormat { + // Avoid downloading external DTDs (and entities) found in XMLs, + // if those files can be found in the classpath. + public class LocalEntityResolver implements EntityResolver { + @Override + public InputSource resolveEntity(String publicId, String systemId) + throws SAXException, IOException { + String fileName = systemId.substring(systemId.lastIndexOf("/") + 1); + if (getClass().getClassLoader().getResource(fileName) != null) { + return new InputSource(getClass().getClassLoader().getResourceAsStream(fileName)); + } else { + // if a local file is not found, use the default behaviour + return null; + } + } + } + protected String getContentType() { return "application/xml"; } @@ -28,7 +48,9 @@ List _get(InputStream stream, String iterator) throws IOException { try { DocumentBuilderFactory builderFactory = DocumentBuilderFactory.newInstance(); + builderFactory.setValidating(false); DocumentBuilder builder = builderFactory.newDocumentBuilder(); + builder.setEntityResolver(new LocalEntityResolver()); Document xmlDocument = builder.parse(stream); XPath xPath = XPathFactory.newInstance().newXPath();