The Android Open Source Project | 8e35f3c | 2009-03-03 19:30:52 -0800 | [diff] [blame^] | 1 | /* |
| 2 | * This file is part of the XSL implementation. |
| 3 | * |
| 4 | * Copyright (C) 2004, 2005, 2006, 2007, 2008 Apple, Inc. All rights reserved. |
| 5 | * Copyright (C) 2005, 2006 Alexey Proskuryakov <ap@webkit.org> |
| 6 | * |
| 7 | * This library is free software; you can redistribute it and/or |
| 8 | * modify it under the terms of the GNU Library General Public |
| 9 | * License as published by the Free Software Foundation; either |
| 10 | * version 2 of the License, or (at your option) any later version. |
| 11 | * |
| 12 | * This library is distributed in the hope that it will be useful, |
| 13 | * but WITHOUT ANY WARRANTY; without even the implied warranty of |
| 14 | * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU |
| 15 | * Library General Public License for more details. |
| 16 | * |
| 17 | * You should have received a copy of the GNU Library General Public License |
| 18 | * along with this library; see the file COPYING.LIB. If not, write to |
| 19 | * the Free Software Foundation, Inc., 51 Franklin Street, Fifth Floor, |
| 20 | * Boston, MA 02110-1301, USA. |
| 21 | */ |
| 22 | |
| 23 | #include "config.h" |
| 24 | |
| 25 | #if ENABLE(XSLT) |
| 26 | |
| 27 | #include "XSLTProcessor.h" |
| 28 | |
| 29 | #include "CString.h" |
| 30 | #include "Console.h" |
| 31 | #include "DOMImplementation.h" |
| 32 | #include "DOMWindow.h" |
| 33 | #include "DocLoader.h" |
| 34 | #include "DocumentFragment.h" |
| 35 | #include "Frame.h" |
| 36 | #include "FrameLoader.h" |
| 37 | #include "FrameView.h" |
| 38 | #include "HTMLDocument.h" |
| 39 | #include "HTMLTokenizer.h" |
| 40 | #include "Page.h" |
| 41 | #include "ResourceError.h" |
| 42 | #include "ResourceHandle.h" |
| 43 | #include "ResourceRequest.h" |
| 44 | #include "ResourceResponse.h" |
| 45 | #include "Text.h" |
| 46 | #include "TextResourceDecoder.h" |
| 47 | #include "XMLTokenizer.h" |
| 48 | #include "XSLTExtensions.h" |
| 49 | #include "XSLTUnicodeSort.h" |
| 50 | #include "loader.h" |
| 51 | #include "markup.h" |
| 52 | #include <libxslt/imports.h> |
| 53 | #include <libxslt/variables.h> |
| 54 | #include <libxslt/xsltutils.h> |
| 55 | #include <wtf/Assertions.h> |
| 56 | #include <wtf/Platform.h> |
| 57 | #include <wtf/Vector.h> |
| 58 | #if PLATFORM(MAC) |
| 59 | #include "SoftLinking.h" |
| 60 | #endif |
| 61 | |
| 62 | #if PLATFORM(MAC) |
| 63 | SOFT_LINK_LIBRARY(libxslt); |
| 64 | SOFT_LINK(libxslt, xsltFreeStylesheet, void, (xsltStylesheetPtr sheet), (sheet)) |
| 65 | SOFT_LINK(libxslt, xsltFreeTransformContext, void, (xsltTransformContextPtr ctxt), (ctxt)) |
| 66 | SOFT_LINK(libxslt, xsltNewTransformContext, xsltTransformContextPtr, (xsltStylesheetPtr style, xmlDocPtr doc), (style, doc)) |
| 67 | SOFT_LINK(libxslt, xsltApplyStylesheetUser, xmlDocPtr, (xsltStylesheetPtr style, xmlDocPtr doc, const char** params, const char* output, FILE* profile, xsltTransformContextPtr userCtxt), (style, doc, params, output, profile, userCtxt)) |
| 68 | SOFT_LINK(libxslt, xsltQuoteUserParams, int, (xsltTransformContextPtr ctxt, const char** params), (ctxt, params)) |
| 69 | SOFT_LINK(libxslt, xsltSetCtxtSortFunc, void, (xsltTransformContextPtr ctxt, xsltSortFunc handler), (ctxt, handler)) |
| 70 | SOFT_LINK(libxslt, xsltSetLoaderFunc, void, (xsltDocLoaderFunc f), (f)) |
| 71 | SOFT_LINK(libxslt, xsltSaveResultTo, int, (xmlOutputBufferPtr buf, xmlDocPtr result, xsltStylesheetPtr style), (buf, result, style)) |
| 72 | SOFT_LINK(libxslt, xsltNextImport, xsltStylesheetPtr, (xsltStylesheetPtr style), (style)) |
| 73 | #endif |
| 74 | |
| 75 | namespace WebCore { |
| 76 | |
| 77 | void XSLTProcessor::genericErrorFunc(void* userData, const char* msg, ...) |
| 78 | { |
| 79 | // It would be nice to do something with this error message. |
| 80 | } |
| 81 | |
| 82 | void XSLTProcessor::parseErrorFunc(void* userData, xmlError* error) |
| 83 | { |
| 84 | Console* console = static_cast<Console*>(userData); |
| 85 | if (!console) |
| 86 | return; |
| 87 | |
| 88 | MessageLevel level; |
| 89 | switch (error->level) { |
| 90 | case XML_ERR_NONE: |
| 91 | level = TipMessageLevel; |
| 92 | break; |
| 93 | case XML_ERR_WARNING: |
| 94 | level = WarningMessageLevel; |
| 95 | break; |
| 96 | case XML_ERR_ERROR: |
| 97 | case XML_ERR_FATAL: |
| 98 | default: |
| 99 | level = ErrorMessageLevel; |
| 100 | break; |
| 101 | } |
| 102 | |
| 103 | console->addMessage(XMLMessageSource, level, error->message, error->line, error->file); |
| 104 | } |
| 105 | |
| 106 | // FIXME: There seems to be no way to control the ctxt pointer for loading here, thus we have globals. |
| 107 | static XSLTProcessor* globalProcessor = 0; |
| 108 | static DocLoader* globalDocLoader = 0; |
| 109 | static xmlDocPtr docLoaderFunc(const xmlChar* uri, |
| 110 | xmlDictPtr dict, |
| 111 | int options, |
| 112 | void* ctxt, |
| 113 | xsltLoadType type) |
| 114 | { |
| 115 | if (!globalProcessor) |
| 116 | return 0; |
| 117 | |
| 118 | switch (type) { |
| 119 | case XSLT_LOAD_DOCUMENT: { |
| 120 | xsltTransformContextPtr context = (xsltTransformContextPtr)ctxt; |
| 121 | xmlChar* base = xmlNodeGetBase(context->document->doc, context->node); |
| 122 | KURL url(KURL(reinterpret_cast<const char*>(base)), reinterpret_cast<const char*>(uri)); |
| 123 | xmlFree(base); |
| 124 | ResourceError error; |
| 125 | ResourceResponse response; |
| 126 | |
| 127 | Vector<char> data; |
| 128 | |
| 129 | bool requestAllowed = globalDocLoader->frame() && globalDocLoader->doc()->securityOrigin()->canRequest(url); |
| 130 | if (requestAllowed) { |
| 131 | globalDocLoader->frame()->loader()->loadResourceSynchronously(url, error, response, data); |
| 132 | requestAllowed = globalDocLoader->doc()->securityOrigin()->canRequest(response.url()); |
| 133 | } |
| 134 | if (!requestAllowed) { |
| 135 | data.clear(); |
| 136 | globalDocLoader->printAccessDeniedMessage(url); |
| 137 | } |
| 138 | |
| 139 | Console* console = 0; |
| 140 | if (Frame* frame = globalProcessor->xslStylesheet()->ownerDocument()->frame()) |
| 141 | console = frame->domWindow()->console(); |
| 142 | xmlSetStructuredErrorFunc(console, XSLTProcessor::parseErrorFunc); |
| 143 | xmlSetGenericErrorFunc(console, XSLTProcessor::genericErrorFunc); |
| 144 | |
| 145 | // We don't specify an encoding here. Neither Gecko nor WinIE respects |
| 146 | // the encoding specified in the HTTP headers. |
| 147 | xmlDocPtr doc = xmlReadMemory(data.data(), data.size(), (const char*)uri, 0, options); |
| 148 | |
| 149 | xmlSetStructuredErrorFunc(0, 0); |
| 150 | xmlSetGenericErrorFunc(0, 0); |
| 151 | |
| 152 | return doc; |
| 153 | } |
| 154 | case XSLT_LOAD_STYLESHEET: |
| 155 | return globalProcessor->xslStylesheet()->locateStylesheetSubResource(((xsltStylesheetPtr)ctxt)->doc, uri); |
| 156 | default: |
| 157 | break; |
| 158 | } |
| 159 | |
| 160 | return 0; |
| 161 | } |
| 162 | |
| 163 | static inline void setXSLTLoadCallBack(xsltDocLoaderFunc func, XSLTProcessor* processor, DocLoader* loader) |
| 164 | { |
| 165 | xsltSetLoaderFunc(func); |
| 166 | globalProcessor = processor; |
| 167 | globalDocLoader = loader; |
| 168 | } |
| 169 | |
| 170 | static int writeToVector(void* context, const char* buffer, int len) |
| 171 | { |
| 172 | Vector<UChar>& resultOutput = *static_cast<Vector<UChar>*>(context); |
| 173 | String decodedChunk = String::fromUTF8(buffer, len); |
| 174 | resultOutput.append(decodedChunk.characters(), decodedChunk.length()); |
| 175 | return len; |
| 176 | } |
| 177 | |
| 178 | static bool saveResultToString(xmlDocPtr resultDoc, xsltStylesheetPtr sheet, String& resultString) |
| 179 | { |
| 180 | xmlOutputBufferPtr outputBuf = xmlAllocOutputBuffer(0); |
| 181 | if (!outputBuf) |
| 182 | return false; |
| 183 | |
| 184 | Vector<UChar> resultVector; |
| 185 | outputBuf->context = &resultVector; |
| 186 | outputBuf->writecallback = writeToVector; |
| 187 | |
| 188 | int retval = xsltSaveResultTo(outputBuf, resultDoc, sheet); |
| 189 | xmlOutputBufferClose(outputBuf); |
| 190 | if (retval < 0) |
| 191 | return false; |
| 192 | |
| 193 | // Workaround for <http://bugzilla.gnome.org/show_bug.cgi?id=495668>: libxslt appends an extra line feed to the result. |
| 194 | if (resultVector.size() > 0 && resultVector[resultVector.size() - 1] == '\n') |
| 195 | resultVector.removeLast(); |
| 196 | |
| 197 | resultString = String::adopt(resultVector); |
| 198 | |
| 199 | return true; |
| 200 | } |
| 201 | |
| 202 | static inline void transformTextStringToXHTMLDocumentString(String& text) |
| 203 | { |
| 204 | // Modify the output so that it is a well-formed XHTML document with a <pre> tag enclosing the text. |
| 205 | text.replace('&', "&"); |
| 206 | text.replace('<', "<"); |
| 207 | text = "<?xml version=\"1.0\" encoding=\"UTF-8\"?>\n" |
| 208 | "<!DOCTYPE html PUBLIC \"-//W3C//DTD XHTML 1.0 Strict//EN\" \"http://www.w3.org/TR/xhtml1/DTD/xhtml1-strict.dtd\">\n" |
| 209 | "<html xmlns=\"http://www.w3.org/1999/xhtml\">\n" |
| 210 | "<head><title/></head>\n" |
| 211 | "<body>\n" |
| 212 | "<pre>" + text + "</pre>\n" |
| 213 | "</body>\n" |
| 214 | "</html>\n"; |
| 215 | } |
| 216 | |
| 217 | static const char** xsltParamArrayFromParameterMap(XSLTProcessor::ParameterMap& parameters) |
| 218 | { |
| 219 | if (parameters.isEmpty()) |
| 220 | return 0; |
| 221 | |
| 222 | const char** parameterArray = (const char**)fastMalloc(((parameters.size() * 2) + 1) * sizeof(char*)); |
| 223 | |
| 224 | XSLTProcessor::ParameterMap::iterator end = parameters.end(); |
| 225 | unsigned index = 0; |
| 226 | for (XSLTProcessor::ParameterMap::iterator it = parameters.begin(); it != end; ++it) { |
| 227 | parameterArray[index++] = strdup(it->first.utf8().data()); |
| 228 | parameterArray[index++] = strdup(it->second.utf8().data()); |
| 229 | } |
| 230 | parameterArray[index] = 0; |
| 231 | |
| 232 | return parameterArray; |
| 233 | } |
| 234 | |
| 235 | static void freeXsltParamArray(const char** params) |
| 236 | { |
| 237 | const char** temp = params; |
| 238 | if (!params) |
| 239 | return; |
| 240 | |
| 241 | while (*temp) { |
| 242 | free((void*)*(temp++)); // strdup returns malloc'd blocks, so we have to use free() here |
| 243 | free((void*)*(temp++)); |
| 244 | } |
| 245 | fastFree(params); |
| 246 | } |
| 247 | |
| 248 | |
| 249 | PassRefPtr<Document> XSLTProcessor::createDocumentFromSource(const String& sourceString, |
| 250 | const String& sourceEncoding, const String& sourceMIMEType, Node* sourceNode, Frame* frame) |
| 251 | { |
| 252 | RefPtr<Document> ownerDocument = sourceNode->document(); |
| 253 | bool sourceIsDocument = (sourceNode == ownerDocument.get()); |
| 254 | String documentSource = sourceString; |
| 255 | |
| 256 | RefPtr<Document> result; |
| 257 | if (sourceMIMEType == "text/plain") { |
| 258 | result = ownerDocument->implementation()->createDocument(frame); |
| 259 | transformTextStringToXHTMLDocumentString(documentSource); |
| 260 | } else |
| 261 | result = ownerDocument->implementation()->createDocument(sourceMIMEType, frame, false); |
| 262 | |
| 263 | // Before parsing, we need to save & detach the old document and get the new document |
| 264 | // in place. We have to do this only if we're rendering the result document. |
| 265 | if (frame) { |
| 266 | if (FrameView* view = frame->view()) |
| 267 | view->clear(); |
| 268 | result->setTransformSourceDocument(frame->document()); |
| 269 | frame->setDocument(result); |
| 270 | } |
| 271 | |
| 272 | if (sourceIsDocument) |
| 273 | result->setURL(ownerDocument->url()); |
| 274 | result->open(); |
| 275 | |
| 276 | RefPtr<TextResourceDecoder> decoder = TextResourceDecoder::create(sourceMIMEType); |
| 277 | decoder->setEncoding(sourceEncoding.isEmpty() ? UTF8Encoding() : TextEncoding(sourceEncoding), TextResourceDecoder::EncodingFromXMLHeader); |
| 278 | result->setDecoder(decoder.release()); |
| 279 | |
| 280 | result->write(documentSource); |
| 281 | result->finishParsing(); |
| 282 | result->close(); |
| 283 | |
| 284 | return result.release(); |
| 285 | } |
| 286 | |
| 287 | static inline RefPtr<DocumentFragment> createFragmentFromSource(const String& sourceString, const String& sourceMIMEType, Node* sourceNode, Document* outputDoc) |
| 288 | { |
| 289 | RefPtr<DocumentFragment> fragment = new DocumentFragment(outputDoc); |
| 290 | |
| 291 | if (sourceMIMEType == "text/html") |
| 292 | parseHTMLDocumentFragment(sourceString, fragment.get()); |
| 293 | else if (sourceMIMEType == "text/plain") |
| 294 | fragment->addChild(new Text(outputDoc, sourceString)); |
| 295 | else { |
| 296 | bool successfulParse = parseXMLDocumentFragment(sourceString, fragment.get(), outputDoc->documentElement()); |
| 297 | if (!successfulParse) |
| 298 | return 0; |
| 299 | } |
| 300 | |
| 301 | // FIXME: Do we need to mess with URLs here? |
| 302 | |
| 303 | return fragment; |
| 304 | } |
| 305 | |
| 306 | static xsltStylesheetPtr xsltStylesheetPointer(RefPtr<XSLStyleSheet>& cachedStylesheet, Node* stylesheetRootNode) |
| 307 | { |
| 308 | if (!cachedStylesheet && stylesheetRootNode) { |
| 309 | cachedStylesheet = XSLStyleSheet::create(stylesheetRootNode->parent() ? stylesheetRootNode->parent() : stylesheetRootNode, |
| 310 | stylesheetRootNode->document()->url().string()); |
| 311 | cachedStylesheet->parseString(createMarkup(stylesheetRootNode)); |
| 312 | } |
| 313 | |
| 314 | if (!cachedStylesheet || !cachedStylesheet->document()) |
| 315 | return 0; |
| 316 | |
| 317 | return cachedStylesheet->compileStyleSheet(); |
| 318 | } |
| 319 | |
| 320 | static inline xmlDocPtr xmlDocPtrFromNode(Node* sourceNode, bool& shouldDelete) |
| 321 | { |
| 322 | RefPtr<Document> ownerDocument = sourceNode->document(); |
| 323 | bool sourceIsDocument = (sourceNode == ownerDocument.get()); |
| 324 | |
| 325 | xmlDocPtr sourceDoc = 0; |
| 326 | if (sourceIsDocument) |
| 327 | sourceDoc = (xmlDocPtr)ownerDocument->transformSource(); |
| 328 | if (!sourceDoc) { |
| 329 | sourceDoc = (xmlDocPtr)xmlDocPtrForString(ownerDocument->docLoader(), createMarkup(sourceNode), |
| 330 | sourceIsDocument ? ownerDocument->url().string() : String()); |
| 331 | shouldDelete = (sourceDoc != 0); |
| 332 | } |
| 333 | return sourceDoc; |
| 334 | } |
| 335 | |
| 336 | static inline String resultMIMEType(xmlDocPtr resultDoc, xsltStylesheetPtr sheet) |
| 337 | { |
| 338 | // There are three types of output we need to be able to deal with: |
| 339 | // HTML (create an HTML document), XML (create an XML document), |
| 340 | // and text (wrap in a <pre> and create an XML document). |
| 341 | |
| 342 | const xmlChar* resultType = 0; |
| 343 | XSLT_GET_IMPORT_PTR(resultType, sheet, method); |
| 344 | if (resultType == 0 && resultDoc->type == XML_HTML_DOCUMENT_NODE) |
| 345 | resultType = (const xmlChar*)"html"; |
| 346 | |
| 347 | if (xmlStrEqual(resultType, (const xmlChar*)"html")) |
| 348 | return "text/html"; |
| 349 | else if (xmlStrEqual(resultType, (const xmlChar*)"text")) |
| 350 | return "text/plain"; |
| 351 | |
| 352 | return "application/xml"; |
| 353 | } |
| 354 | |
| 355 | bool XSLTProcessor::transformToString(Node* sourceNode, String& mimeType, String& resultString, String& resultEncoding) |
| 356 | { |
| 357 | RefPtr<Document> ownerDocument = sourceNode->document(); |
| 358 | |
| 359 | setXSLTLoadCallBack(docLoaderFunc, this, ownerDocument->docLoader()); |
| 360 | xsltStylesheetPtr sheet = xsltStylesheetPointer(m_stylesheet, m_stylesheetRootNode.get()); |
| 361 | if (!sheet) { |
| 362 | setXSLTLoadCallBack(0, 0, 0); |
| 363 | return false; |
| 364 | } |
| 365 | m_stylesheet->clearDocuments(); |
| 366 | |
| 367 | xmlChar* origMethod = sheet->method; |
| 368 | if (!origMethod && mimeType == "text/html") |
| 369 | sheet->method = (xmlChar*)"html"; |
| 370 | |
| 371 | bool success = false; |
| 372 | bool shouldFreeSourceDoc = false; |
| 373 | if (xmlDocPtr sourceDoc = xmlDocPtrFromNode(sourceNode, shouldFreeSourceDoc)) { |
| 374 | // The XML declaration would prevent parsing the result as a fragment, and it's not needed even for documents, |
| 375 | // as the result of this function is always immediately parsed. |
| 376 | sheet->omitXmlDeclaration = true; |
| 377 | |
| 378 | xsltTransformContextPtr transformContext = xsltNewTransformContext(sheet, sourceDoc); |
| 379 | registerXSLTExtensions(transformContext); |
| 380 | |
| 381 | // <http://bugs.webkit.org/show_bug.cgi?id=16077>: XSLT processor <xsl:sort> algorithm only compares by code point |
| 382 | xsltSetCtxtSortFunc(transformContext, xsltUnicodeSortFunction); |
| 383 | |
| 384 | // This is a workaround for a bug in libxslt. |
| 385 | // The bug has been fixed in version 1.1.13, so once we ship that this can be removed. |
| 386 | if (transformContext->globalVars == NULL) |
| 387 | transformContext->globalVars = xmlHashCreate(20); |
| 388 | |
| 389 | const char** params = xsltParamArrayFromParameterMap(m_parameters); |
| 390 | xsltQuoteUserParams(transformContext, params); |
| 391 | xmlDocPtr resultDoc = xsltApplyStylesheetUser(sheet, sourceDoc, 0, 0, 0, transformContext); |
| 392 | |
| 393 | xsltFreeTransformContext(transformContext); |
| 394 | freeXsltParamArray(params); |
| 395 | |
| 396 | if (shouldFreeSourceDoc) |
| 397 | xmlFreeDoc(sourceDoc); |
| 398 | |
| 399 | if (success = saveResultToString(resultDoc, sheet, resultString)) { |
| 400 | mimeType = resultMIMEType(resultDoc, sheet); |
| 401 | resultEncoding = (char*)resultDoc->encoding; |
| 402 | } |
| 403 | xmlFreeDoc(resultDoc); |
| 404 | } |
| 405 | |
| 406 | sheet->method = origMethod; |
| 407 | setXSLTLoadCallBack(0, 0, 0); |
| 408 | xsltFreeStylesheet(sheet); |
| 409 | m_stylesheet = 0; |
| 410 | |
| 411 | return success; |
| 412 | } |
| 413 | |
| 414 | PassRefPtr<Document> XSLTProcessor::transformToDocument(Node* sourceNode) |
| 415 | { |
| 416 | String resultMIMEType; |
| 417 | String resultString; |
| 418 | String resultEncoding; |
| 419 | if (!transformToString(sourceNode, resultMIMEType, resultString, resultEncoding)) |
| 420 | return 0; |
| 421 | return createDocumentFromSource(resultString, resultEncoding, resultMIMEType, sourceNode, 0); |
| 422 | } |
| 423 | |
| 424 | PassRefPtr<DocumentFragment> XSLTProcessor::transformToFragment(Node* sourceNode, Document* outputDoc) |
| 425 | { |
| 426 | String resultMIMEType; |
| 427 | String resultString; |
| 428 | String resultEncoding; |
| 429 | |
| 430 | // If the output document is HTML, default to HTML method. |
| 431 | if (outputDoc->isHTMLDocument()) |
| 432 | resultMIMEType = "text/html"; |
| 433 | |
| 434 | if (!transformToString(sourceNode, resultMIMEType, resultString, resultEncoding)) |
| 435 | return 0; |
| 436 | return createFragmentFromSource(resultString, resultMIMEType, sourceNode, outputDoc); |
| 437 | } |
| 438 | |
| 439 | void XSLTProcessor::setParameter(const String& namespaceURI, const String& localName, const String& value) |
| 440 | { |
| 441 | // FIXME: namespace support? |
| 442 | // should make a QualifiedName here but we'd have to expose the impl |
| 443 | m_parameters.set(localName, value); |
| 444 | } |
| 445 | |
| 446 | String XSLTProcessor::getParameter(const String& namespaceURI, const String& localName) const |
| 447 | { |
| 448 | // FIXME: namespace support? |
| 449 | // should make a QualifiedName here but we'd have to expose the impl |
| 450 | return m_parameters.get(localName); |
| 451 | } |
| 452 | |
| 453 | void XSLTProcessor::removeParameter(const String& namespaceURI, const String& localName) |
| 454 | { |
| 455 | // FIXME: namespace support? |
| 456 | m_parameters.remove(localName); |
| 457 | } |
| 458 | |
| 459 | } // namespace WebCore |
| 460 | |
| 461 | #endif // ENABLE(XSLT) |