Skip to content
Snippets Groups Projects
Commit 8ce09901 authored by Thorsten Vitt's avatar Thorsten Vitt
Browse files

Extracted a stylesheet manager

parent ef2ec502
No related branches found
No related tags found
No related merge requests found
......@@ -36,7 +36,7 @@
* The abstract base class for all aggregators/exporters. This tries to capture
* all behavior common to the various format specific exporters, and it tries to
* provide sensible defaults so code complexity for the implementers is reduced.
*
*
* <p>These are the typical steps:</p>
* <ol>
* <li>The exporter is instantiated using one of the constructors and configured
......@@ -53,7 +53,7 @@
* {@link #write(java.io.OutputStream)} method, which is called on-demand when
* the client tries to read the body part of the response.</li>
* </ol>
*
*
* Implementors will typically call at least the following configuration methods:
* <ul>
* <li>{@link #setMediaType(String)} to set the response's content type
......@@ -65,7 +65,7 @@
* <li>extend {@link #createResponse()} to setup the response any further
* </ul>
*
*
*
* @author vitt
*/
public abstract class AbstractExporter implements StreamingOutput {
......@@ -106,7 +106,7 @@ public String getTitle() {
return title;
}
public void setTitle(String title) {
public void setTitle(final String title) {
this.title = title;
}
......@@ -114,7 +114,7 @@ public String getFileExtension() {
return fileExtension;
}
public void setFileExtension(String fileExtension) {
public void setFileExtension(final String fileExtension) {
this.fileExtension = fileExtension;
}
......@@ -122,7 +122,7 @@ public Disposition getDisposition() {
return disposition;
}
public void setDisposition(Disposition disposition) {
public void setDisposition(final Disposition disposition) {
this.disposition = disposition;
}
......@@ -130,7 +130,8 @@ public void setDisposition(Disposition disposition) {
public AbstractExporter(final ITextGridRep repository,
final Request request, final String uriList) {
super();
Preconditions.checkArgument(repository != null, "non-null repository argument required");
stopwatch = new Stopwatch();
stopwatch.start();
this.repository = repository;
......@@ -164,7 +165,7 @@ protected ObjectType[] getRootObjects() throws MetadataParseFault,
* root input. {@link AbstractExporter}'s implementation delegates to
* {@link #getContentBasket()} or {@link #getContentSimple()}, depending on
* the request type.
*
*
* @throws IllegalStateException
* if not supported.
*/
......@@ -178,7 +179,7 @@ protected TGOSupplier<InputStream> getContent() {
/**
* Constructs a single virtual object representing the root objects. Clients
* who need this functionality must override.
*
*
* @throws IllegalStateException
* if not supported.
*/
......@@ -190,11 +191,11 @@ protected TGOSupplier<InputStream> getContentBasket() {
/**
* Returns a {@link TGOSupplier} with content and metadata in case only one
* object has been requested.
*
*
* This method may cause a TG-crud READ request that is left open after the
* metadata part until content data is requested from the supplier's input
* stream.
*
*
* @throws IllegalStateException
* when more than one root object is requested
*/
......@@ -227,7 +228,7 @@ public AbstractExporter sid(final String sid) {
/**
* Returns a last modified date suitable for use in HTTP requests.
*
*
* Implementers may override or extend.
*/
protected Date getLastModified() throws MetadataParseFault,
......@@ -239,10 +240,10 @@ protected Date getLastModified() throws MetadataParseFault,
/**
* Checks whether we can stop exporting and return 304 Not Modified instead.
*
*
* The {@link AbstractExporter} implementation simply checks the results of
* {@link #getLastModified()}.
*
*
* @return a configured {@link ResponseBuilder} when the content is not
* modified, <code>null</code> when the request should be fulfilled
* normally.
......@@ -250,7 +251,7 @@ protected Date getLastModified() throws MetadataParseFault,
protected final ResponseBuilder evaluatePreconditions()
throws MetadataParseFault, ObjectNotFoundFault, IoFault, AuthFault {
ResponseBuilder builder = request == null ? null
final ResponseBuilder builder = request == null ? null
: doEvaluatePreconditions();
if (builder == null) {
this.responseBuilder = Response.ok();
......@@ -276,13 +277,13 @@ protected ResponseBuilder doEvaluatePreconditions()
* generating a real response and can just return
* <code>304 Not Modified</code> instead, allowing the client to serve the
* request from its local cache.
*
*
* <p>
* This runs {@link #evaluatePreconditions()}, if necessary. Clients who
* wish to influence this behaviour should override
* {@link #doEvaluatePreconditions()}.
* </p>
*
*
* @see #evaluatePreconditions()
* @see {@link #doEvaluatePreconditions()}
*/
......@@ -308,7 +309,7 @@ protected ResponseBuilder getResponseBuilder() throws MetadataParseFault,
/**
* Configures caching parameters into the current response builder.
*
*
* @see #getResponseBuilder()
* @see #createResponse()
*/
......@@ -321,7 +322,7 @@ protected void configureCache() throws MetadataParseFault,
/**
* Configures the content-disposition header, which contains the
* content-disposition and a suggested filename.
*
*
* @see #setDisposition(Disposition)
* @see #setTitle(String)
* @see #setFileExtension(String)
......@@ -357,8 +358,17 @@ public String getMediaType() {
return mediaType;
}
public void setMediaType(String mediaType) {
public void setMediaType(final String mediaType) {
this.mediaType = mediaType;
}
@Override
protected void finalize() throws Throwable {
if (stopwatch.isRunning())
stopwatch.stop();
super.finalize();
}
}
\ No newline at end of file
package info.textgrid.services.aggregator.html;
import info.textgrid.namespaces.metadata.core._2010.ObjectType;
import info.textgrid.namespaces.middleware.tgcrud.services.tgcrudservice.AuthFault;
import info.textgrid.namespaces.middleware.tgcrud.services.tgcrudservice.IoFault;
import info.textgrid.namespaces.middleware.tgcrud.services.tgcrudservice.MetadataParseFault;
import info.textgrid.namespaces.middleware.tgcrud.services.tgcrudservice.ObjectNotFoundFault;
import info.textgrid.namespaces.middleware.tgcrud.services.tgcrudservice.ProtocolNotImplementedFault;
import info.textgrid.services.aggregator.ITextGridRep;
import info.textgrid.services.aggregator.ITextGridRep.TGOSupplier;
import info.textgrid.services.aggregator.TextGridRepProvider;
import java.io.IOException;
import java.io.InputStream;
import java.net.MalformedURLException;
import java.net.URI;
import java.net.URL;
import java.text.MessageFormat;
import java.util.concurrent.ExecutionException;
import java.util.logging.Level;
import java.util.logging.Logger;
import javax.servlet.ServletContext;
......@@ -30,188 +23,34 @@
import javax.ws.rs.core.Context;
import javax.ws.rs.core.Request;
import javax.ws.rs.core.Response;
import javax.xml.transform.stream.StreamSource;
import net.sf.saxon.s9api.Processor;
import net.sf.saxon.s9api.SaxonApiException;
import net.sf.saxon.s9api.XsltCompiler;
import net.sf.saxon.s9api.XsltExecutable;
import org.apache.cxf.jaxrs.model.wadl.Description;
import com.google.common.base.Optional;
import com.google.common.cache.Cache;
import com.google.common.cache.CacheBuilder;
import com.google.common.cache.CacheLoader;
import com.google.common.cache.RemovalListener;
import com.google.common.cache.RemovalNotification;
@Path("/html")
@Description("Creates an HTML representation of the given TEI document, or aggregation of TEI documents. This is currently extremely experimental and probably broken.")
@Description("Creates an HTML representation of the given TEI document, or aggregation of TEI documents.")
public class HTML {
private static final String TO_HTML_XSL = "/WEB-INF/stylesheets/db2xhtml.xsl";
private static final String EXTRACT_BODY_XSL = "/WEB-INF/stylesheets/extractbody.xsl";
ITextGridRep repository = TextGridRepProvider.getInstance();
final Logger logger = Logger
.getLogger("info.textgrid.services.aggregator.html.HTML");
private XsltExecutable toHtml;
private XsltExecutable extractBody;
final Processor xsltProcessor;
@Context
private ServletContext servlet;
private Cache<URI, XsltExecutable> stylesheets;
XsltExecutable getToHtml() {
if (toHtml == null) {
try {
final URL stylesheet = servlet.getResource(TO_HTML_XSL);
final XsltCompiler xsltCompiler = xsltProcessor
.newXsltCompiler();
toHtml = xsltCompiler.compile(new StreamSource(stylesheet
.toString()));
} catch (final MalformedURLException e) {
throw new IllegalStateException(e);
} catch (final SaxonApiException e) {
throw new IllegalStateException(e);
}
}
return toHtml;
}
@Context ServletContext servlet;
XsltExecutable getExtractBody() {
if (extractBody == null) {
try {
URL stylesheet;
stylesheet = servlet.getResource(EXTRACT_BODY_XSL);
extractBody = xsltProcessor.newXsltCompiler().compile(
new StreamSource(stylesheet.toString()));
} catch (final MalformedURLException e) {
throw new IllegalStateException(e);
} catch (final SaxonApiException e) {
throw new IllegalStateException(e);
}
}
return extractBody;
}
private StylesheetManager stylesheetManager;
public HTML(final ITextGridRep repository) throws IOException {
this.repository = repository;
xsltProcessor = new Processor(false);
xsltProcessor.getUnderlyingConfiguration().setURIResolver(
new TGUriResolver(repository));
// xsltProcessor.getUnderlyingConfiguration().setAllowExternalFunctions(
// false); // we run external stylesheets
xsltProcessor.getUnderlyingConfiguration().setCompileWithTracing(true);
stylesheets = CacheBuilder.newBuilder().maximumSize(50).softValues()
.removalListener(new RemovalListener<URI, XsltExecutable>() {
@Override
public void onRemoval(
final RemovalNotification<URI, XsltExecutable> notification) {
logger.info(MessageFormat
.format("Removed stylesheet {0} from cache, reason: {1}",
notification.getKey(),
notification.getCause()));
}
}).build(new CacheLoader<URI, XsltExecutable>() {
@Override
public XsltExecutable load(final URI url) throws Exception {
final XsltCompiler compiler = xsltProcessor
.newXsltCompiler();
try {
final XsltExecutable executable = compiler
.compile(new StreamSource(url.toString()));
logger.log(Level.INFO,
"Successfully loaded stylesheet {0}", url);
return executable;
} catch (final Exception e) {
logger.log(Level.SEVERE, MessageFormat.format(
"Failed to load stylesheet {0}", url), e);
throw e;
}
}
});
public StylesheetManager getStylesheetManager() {
if (stylesheetManager == null)
stylesheetManager = new StylesheetManager(servlet, repository);
return stylesheetManager;
}
/**
* Returns an appropriate stylesheet for the given URI.
*
* Basically, we try the following options in order:
* <ol>
* <li>The stylesheet is cached -> return the cached version.
* <li>The stylesheet is public or external -> load & cache it.
* <li>The stylesheet is non-public TextGrid internal -> load & do not cache
* it.
* </ol>
*
* @param uri
* the URI of the stylesheet to load
* @param sid
* the session ID to use, if present
* @param forceLoad
* do not use a cached version even if present.
* @throws IOException
* if an error occurs reading the stylesheet.
* @throws SaxonApiException
* if saxon fails to compile the stylesheet.
*/
protected XsltExecutable getStylesheet(final URI uri,
final Optional<String> sid, final boolean forceLoad)
throws SaxonApiException, IOException {
XsltExecutable executable = null;
// (1) try cached version, if it exists
if (!forceLoad) {
executable = stylesheets.getIfPresent(uri);
}
if (executable == null) {
final XsltCompiler compiler = xsltProcessor.newXsltCompiler();
if (TGUriResolver.isResolveable(uri)) {
// (2/3) it's a TextGrid object, load it from TG-crud.
final TGOSupplier<InputStream> xsltSupplier = repository.read(
uri, sid.orNull());
executable = compiler.compile(new StreamSource(xsltSupplier
.getInput(), uri.toString()));
if (isPublic(xsltSupplier.getMetadata())) {
// (2) it's public -> we can cache it.
stylesheets.put(uri, executable);
logger.log(Level.INFO, "Cached public stylesheet {0}", uri);
} else {
logger.log(Level.INFO, "Loaded private stylesheet {0}", uri);
}
} else {
// (2) it's non-TextGrid -- load & cache it.
executable = compiler.compile(new StreamSource(uri.toString()));
stylesheets.put(uri, executable);
logger.log(Level.INFO, "Cached external stylesheet {0}", uri);
}
} else {
logger.log(Level.INFO, "Reusing cached stylesheed {0}", uri);
}
return executable;
}
private static boolean isPublic(final ObjectType metadata) {
try {
return metadata.getGeneric().getGenerated().getAvailability()
.contains("public");
} catch (final NullPointerException e) {
return false;
}
public HTML(final ITextGridRep repository) throws IOException {
this.repository = repository;
}
@GET
......@@ -233,7 +72,7 @@ public Response get(
logger.fine("HTML called for root objects: " + uriList);
final HTMLWriter writer = new HTMLWriter(this, uriList, xsluri,
final HTMLWriter writer = new HTMLWriter(repository, getStylesheetManager(), uriList, xsluri,
refreshStylesheet, pi, embedded, css, sid, mediaType, request);
return writer.createResponse().build();
}
......
......@@ -6,6 +6,7 @@
import info.textgrid.namespaces.middleware.tgcrud.services.tgcrudservice.MetadataParseFault;
import info.textgrid.namespaces.middleware.tgcrud.services.tgcrudservice.ObjectNotFoundFault;
import info.textgrid.namespaces.middleware.tgcrud.services.tgcrudservice.ProtocolNotImplementedFault;
import info.textgrid.services.aggregator.ITextGridRep;
import java.io.IOException;
import java.io.OutputStream;
......@@ -70,6 +71,8 @@
*
*/
public class HTMLWriter extends CorpusBasedExporter implements StreamingOutput {
private static final URI TO_HTML_XSL = URI.create("/WEB-INF/stylesheets/db2xhtml.xsl");
private static final URI EXTRACT_BODY_XSL = URI.create("/WEB-INF/stylesheets/extractbody.xsl");
private Optional<URI> explicitStylesheetURI = Optional.absent();
private boolean refreshStylesheet = false;
......@@ -86,29 +89,29 @@ public class HTMLWriter extends CorpusBasedExporter implements StreamingOutput {
private Optional<String> requestedMediaType;
protected final HTML service;
private Source source;
private StylesheetManager stylesheetManager;
// Constructor and configuration
public HTMLWriter(final HTML service, final String rootURIs, final Request request) {
super(service.repository, request, rootURIs);
public HTMLWriter(final ITextGridRep repository, final StylesheetManager stylesheetManager, final String rootURIs, final Request request) {
super(repository, request, rootURIs);
logger.log(Level.INFO, "Starting HTML export for {0}", rootURIs);
this.service = service;
this.stylesheetManager = stylesheetManager;
setDisposition(Disposition.INLINE);
setFileExtension("html");
setMediaType(MediaType.TEXT_HTML);
}
public HTMLWriter(final HTML service, final String rootURIs,
public HTMLWriter(final ITextGridRep repository, final StylesheetManager stylesheetManager, final String rootURIs,
final URI stylesheetURI, final boolean refreshStylesheet,
final boolean readStylesheetPI, final boolean embedded,
final URI css, final String sid, final String mediaType,
final Request request) {
this(service, rootURIs, request);
this(repository, stylesheetManager, rootURIs, request);
this.explicitStylesheetURI = Optional.fromNullable(stylesheetURI);
this.refreshStylesheet = refreshStylesheet;
......@@ -163,15 +166,15 @@ private XsltExecutable getStylesheet() throws SaxonApiException,
IOException {
if (explicitStylesheetURI.isPresent()) {
actualStylesheetLabel = explicitStylesheetURI.get().toString() + " (explicit)";
return service.getStylesheet(explicitStylesheetURI.get(), sid,
refreshStylesheet);
return stylesheetManager.getStylesheet(explicitStylesheetURI.get(), sid,
refreshStylesheet, false);
} else if (associatedStylesheetURI.isPresent()) {
actualStylesheetLabel = associatedStylesheetURI.get().toString() + " (associated)";
return service.getStylesheet(associatedStylesheetURI.get(), sid,
refreshStylesheet);
return stylesheetManager.getStylesheet(associatedStylesheetURI.get(), sid,
refreshStylesheet, false);
} else {
actualStylesheetLabel = "(internal)";
return service.getToHtml();
return stylesheetManager.getStylesheet(TO_HTML_XSL, sid, false, true);
}
}
......@@ -223,9 +226,9 @@ public void write(final OutputStream out) throws IOException,
WebApplicationException {
try {
logger.log(Level.INFO, MessageFormat.format("Ready for transformation of {0} after {1}", rootURIs, stopwatch.toString()));
final Serializer serializer = service.xsltProcessor.newSerializer(out);
final Serializer serializer = stylesheetManager.xsltProcessor.newSerializer(out);
if (embedded) {
final XsltTransformer extractBody = service.getExtractBody().load();
final XsltTransformer extractBody = stylesheetManager.getStylesheet(EXTRACT_BODY_XSL, sid, false, true).load();
extractBody.setDestination(serializer);
getTransformer().setDestination(extractBody);
} else {
......
package info.textgrid.services.aggregator.html;
import info.textgrid.namespaces.metadata.core._2010.ObjectType;
import info.textgrid.services.aggregator.ITextGridRep;
import info.textgrid.services.aggregator.ITextGridRep.TGOSupplier;
import java.io.IOException;
import java.io.InputStream;
import java.net.MalformedURLException;
import java.net.URI;
import java.net.URL;
import java.text.MessageFormat;
import java.util.Set;
import java.util.logging.Level;
import java.util.logging.Logger;
import javax.servlet.ServletContext;
import javax.xml.transform.stream.StreamSource;
import net.sf.saxon.s9api.Processor;
import net.sf.saxon.s9api.SaxonApiException;
import net.sf.saxon.s9api.XsltCompiler;
import net.sf.saxon.s9api.XsltExecutable;
import com.google.common.base.Optional;
import com.google.common.cache.Cache;
import com.google.common.cache.CacheBuilder;
import com.google.common.cache.CacheLoader;
import com.google.common.cache.RemovalListener;
import com.google.common.cache.RemovalNotification;
import com.google.common.cache.Weigher;
import com.google.common.collect.Sets;
/**
* Manages and caches XSLT stylesheets across service calls, also maintains
* processor policies etc. All stylesheets invoked throughout the service should
* be invoked through the manager's {@link #getStylesheet(URI, Optional, boolean, boolean)} method.
*/
public class StylesheetManager {
private static final Logger logger = Logger
.getLogger(StylesheetManager.class.getCanonicalName());
public final Processor xsltProcessor;
private Cache<URI, XsltExecutable> stylesheets;
private ITextGridRep repository;
private ServletContext servlet;
private Set<URI> importantStylesheets = Sets.newHashSet();
/**
* Initializes a stylesheet manager.
*
* @param servlet
* The servlet context, used for retrieving internal stylesheets.
* @param repository
* The TextGridRep instance, used for retrieving textgrid
* stylesheets.
*/
public StylesheetManager(final ServletContext servlet,
final ITextGridRep repository) {
this.servlet = servlet;
this.repository = repository;
xsltProcessor = new Processor(false);
xsltProcessor.getUnderlyingConfiguration().setURIResolver(
new TGUriResolver(repository));
// xsltProcessor.getUnderlyingConfiguration().setAllowExternalFunctions(
// false); // we run external stylesheets
xsltProcessor.getUnderlyingConfiguration().setCompileWithTracing(true);
stylesheets = CacheBuilder.newBuilder().recordStats()
.maximumWeight(200).weigher(new Weigher<URI, XsltExecutable>() {
@Override
public int weigh(final URI key, final XsltExecutable value) {
return importantStylesheets.contains(key) ? 1 : 10;
}
}).removalListener(new RemovalListener<URI, XsltExecutable>() {
@Override
public void onRemoval(
final RemovalNotification<URI, XsltExecutable> notification) {
logger.info(MessageFormat
.format("Removed stylesheet {0} from cache, reason: {1}",
notification.getKey(),
notification.getCause()));
logger.info(stylesheets.stats().toString());
}
}).build(new CacheLoader<URI, XsltExecutable>() {
@Override
public XsltExecutable load(final URI url) throws Exception {
final XsltCompiler compiler = xsltProcessor
.newXsltCompiler();
try {
final XsltExecutable executable = compiler
.compile(new StreamSource(url.toString()));
logger.log(Level.INFO,
"Successfully loaded stylesheet {0}", url);
return executable;
} catch (final Exception e) {
logger.log(Level.SEVERE, MessageFormat.format(
"Failed to load stylesheet {0}", url), e);
throw e;
}
}
});
}
/**
* Returns an appropriate stylesheet for the given URI.
*
* Basically, we try the following options in order:
* <ol>
* <li>The stylesheet is cached -> return the cached version.
* <li>The stylesheet is public or external -> load & cache it.
* <li>The stylesheet is non-public TextGrid internal -> load & do not cache
* it.
* </ol>
*
* @param uri
* the URI of the stylesheet to load
* @param sid
* the session ID to use, if present
* @param forceLoad
* do not use a cached version even if present.
* @param frequentlyUsed
* if <code>true</code>, this stylesheet will be less likely
* evicted.
* @throws IOException
* if an error occurs reading the stylesheet.
* @throws SaxonApiException
* if saxon fails to compile the stylesheet.
*/
protected XsltExecutable getStylesheet(final URI uri,
final Optional<String> sid, final boolean forceLoad,
final boolean frequentlyUsed) throws SaxonApiException, IOException {
XsltExecutable executable = null;
// (1) try cached version, if it exists
if (!forceLoad) {
executable = stylesheets.getIfPresent(uri);
}
if (executable == null) {
if (frequentlyUsed)
importantStylesheets.add(uri);
final XsltCompiler compiler = xsltProcessor.newXsltCompiler();
// (2) it's internal, load & cache it from the servlet
if (uri.getScheme() == null || uri.getScheme() == "file") {
final URL resource = resolveInternalPath(uri.getPath());
executable = compiler.compile(new StreamSource(resource.openStream(), resource.toExternalForm()));
stylesheets.put(uri, executable);
logger.log(Level.INFO, "Cached internal stylesheet {0}", resource);
} else if (TGUriResolver.isResolveable(uri)) {
// (3/4) it's a TextGrid object, load it from TG-crud.
final TGOSupplier<InputStream> xsltSupplier = repository.read(
uri, sid.orNull());
executable = compiler.compile(new StreamSource(xsltSupplier
.getInput(), uri.toString()));
if (isPublic(xsltSupplier.getMetadata())) {
// (3) it's public -> we can cache it.
stylesheets.put(uri, executable);
logger.log(Level.INFO, "Cached public stylesheet {0}", uri);
} else {
// (4) it's private -> no caching
logger.log(Level.INFO, "Loaded private stylesheet {0}", uri);
}
} else {
// (2) it's non-TextGrid -- load & cache it.
executable = compiler.compile(new StreamSource(uri.toString()));
stylesheets.put(uri, executable);
logger.log(Level.INFO, "Cached external stylesheet {0}", uri);
}
} else {
logger.log(Level.INFO, "Reusing cached stylesheed {0}", uri);
}
return executable;
}
private URL resolveInternalPath(final String path) throws MalformedURLException {
URL stylesheet;
if (servlet == null) {
logger.info("No servlet context, trying fallback property");
final String dir = System.getProperty("webapp.directory");
if (dir == null)
throw new IllegalStateException(
"Could not find stylesheet: Neither ServletContext nor fallback property webapp.directory have been defined.");
stylesheet = new URL("file://" + dir + path);
} else {
stylesheet = servlet.getResource(path);
}
logger.fine("Resolved internal stylesheet: " + stylesheet.toExternalForm());
return stylesheet;
}
private static boolean isPublic(final ObjectType metadata) {
try {
return metadata.getGeneric().getGenerated().getAvailability()
.contains("public");
} catch (final NullPointerException e) {
return false;
}
}
@Override
protected void finalize() throws Throwable {
if (stylesheets != null)
logger.log(Level.INFO, "Shutting down stylesheet manager. Stats: {0}", stylesheets.stats());
super.finalize();
}
}
\ No newline at end of file
0% Loading or .
You are about to add 0 people to the discussion. Proceed with caution.
Finish editing this message first!
Please register or to comment