/** * Copyright (C) 1999 Lars Knoll (knoll@kde.org) * (C) 1999 Antti Koivisto (koivisto@kde.org) * Copyright (C) 2003, 2004, 2005, 2006, 2007 Apple Inc. All rights reserved. * * This library is free software; you can redistribute it and/or * modify it under the terms of the GNU Library General Public * License as published by the Free Software Foundation; either * version 2 of the License, or (at your option) any later version. * * This library is distributed in the hope that it will be useful, * but WITHOUT ANY WARRANTY; without even the implied warranty of * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU * Library General Public License for more details. * * You should have received a copy of the GNU Library General Public License * along with this library; see the file COPYING.LIB. If not, write to * the Free Software Foundation, Inc., 51 Franklin Street, Fifth Floor, * Boston, MA 02110-1301, USA. * * Portions are Copyright (C) 2002 Netscape Communications Corporation. * Other contributors: David Baron * * This library is free software; you can redistribute it and/or * modify it under the terms of the GNU Lesser General Public * License as published by the Free Software Foundation; either * version 2.1 of the License, or (at your option) any later version. * * This library is distributed in the hope that it will be useful, * but WITHOUT ANY WARRANTY; without even the implied warranty of * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU * Lesser General Public License for more details. * * You should have received a copy of the GNU Lesser General Public * License along with this library; if not, write to the Free Software * Foundation, Inc., 51 Franklin Street, Fifth Floor, Boston, MA 02110-1301 USA * * Alternatively, the document type parsing portions of this file may be used * under the terms of either the Mozilla Public License Version 1.1, found at * http://www.mozilla.org/MPL/ (the "MPL") or the GNU General Public * License Version 2.0, found at http://www.fsf.org/copyleft/gpl.html * (the "GPL"), in which case the provisions of the MPL or the GPL are * applicable instead of those above. If you wish to allow use of your * version of this file only under the terms of one of those two * licenses (the MPL or the GPL) and not to allow others to use your * version of this file under the LGPL, indicate your decision by * deleting the provisions above and replace them with the notice and * other provisions required by the MPL or the GPL, as the case may be. * If you do not delete the provisions above, a recipient may use your * version of this file under any of the LGPL, the MPL or the GPL. */ #include "config.h" #include "HTMLDocument.h" #include "CSSPropertyNames.h" #include "CSSStyleSelector.h" #include "CString.h" #include "CookieJar.h" #include "DocumentLoader.h" #include "DocumentType.h" #include "ExceptionCode.h" #include "Frame.h" #include "FrameLoader.h" #include "FrameView.h" #include "HTMLBodyElement.h" #include "HTMLElement.h" #include "HTMLElementFactory.h" #include "HTMLNames.h" #include "HTMLTokenizer.h" #include "InspectorController.h" #include "KURL.h" #include "Page.h" #include "DocTypeStrings.cpp" namespace WebCore { using namespace HTMLNames; HTMLDocument::HTMLDocument(DOMImplementation* implementation, Frame* frame) : Document(implementation, frame) { clearXMLVersion(); } HTMLDocument::~HTMLDocument() { } int HTMLDocument::width() { updateLayoutIgnorePendingStylesheets(); FrameView* frameView = view(); return frameView ? frameView->contentsWidth() : 0; } int HTMLDocument::height() { updateLayoutIgnorePendingStylesheets(); FrameView* frameView = view(); return frameView ? frameView->contentsHeight() : 0; } String HTMLDocument::dir() { HTMLElement* b = body(); if (!b) return String(); return b->dir(); } void HTMLDocument::setDir(const String& value) { HTMLElement* b = body(); if (b) b->setDir(value); } String HTMLDocument::designMode() const { return inDesignMode() ? "on" : "off"; } void HTMLDocument::setDesignMode(const String& value) { InheritedBool mode; if (equalIgnoringCase(value, "on")) mode = on; else if (equalIgnoringCase(value, "off")) mode = off; else mode = inherit; Document::setDesignMode(mode); } String HTMLDocument::compatMode() const { return inCompatMode() ? "BackCompat" : "CSS1Compat"; } String HTMLDocument::bgColor() { HTMLElement* b = body(); HTMLBodyElement* bodyElement = (b && b->hasTagName(bodyTag)) ? static_cast(b) : 0; if (!bodyElement) return String(); return bodyElement->bgColor(); } void HTMLDocument::setBgColor(const String& value) { HTMLElement* b = body(); HTMLBodyElement* bodyElement = (b && b->hasTagName(bodyTag)) ? static_cast(b) : 0; if (bodyElement) bodyElement->setBgColor(value); } String HTMLDocument::fgColor() { HTMLElement* b = body(); HTMLBodyElement* bodyElement = (b && b->hasTagName(bodyTag)) ? static_cast(b) : 0; if (!bodyElement) return String(); return bodyElement->text(); } void HTMLDocument::setFgColor(const String& value) { HTMLElement* b = body(); HTMLBodyElement* bodyElement = (b && b->hasTagName(bodyTag)) ? static_cast(b) : 0; if (bodyElement) bodyElement->setText(value); } String HTMLDocument::alinkColor() { HTMLElement* b = body(); HTMLBodyElement* bodyElement = (b && b->hasTagName(bodyTag)) ? static_cast(b) : 0; if (!bodyElement) return String(); return bodyElement->aLink(); } void HTMLDocument::setAlinkColor(const String& value) { HTMLElement* b = body(); HTMLBodyElement* bodyElement = (b && b->hasTagName(bodyTag)) ? static_cast(b) : 0; if (bodyElement) { // This check is a bit silly, but some benchmarks like to set the // document's link colors over and over to the same value and we // don't want to incur a style update each time. if (bodyElement->aLink() != value) bodyElement->setALink(value); } } String HTMLDocument::linkColor() { HTMLElement* b = body(); HTMLBodyElement* bodyElement = (b && b->hasTagName(bodyTag)) ? static_cast(b) : 0; if (!bodyElement) return String(); return bodyElement->link(); } void HTMLDocument::setLinkColor(const String& value) { HTMLElement* b = body(); HTMLBodyElement* bodyElement = (b && b->hasTagName(bodyTag)) ? static_cast(b) : 0; if (bodyElement) { // This check is a bit silly, but some benchmarks like to set the // document's link colors over and over to the same value and we // don't want to incur a style update each time. if (bodyElement->link() != value) bodyElement->setLink(value); } } String HTMLDocument::vlinkColor() { HTMLElement* b = body(); HTMLBodyElement* bodyElement = (b && b->hasTagName(bodyTag)) ? static_cast(b) : 0; if (!bodyElement) return String(); return bodyElement->vLink(); } void HTMLDocument::setVlinkColor(const String& value) { HTMLElement* b = body(); HTMLBodyElement* bodyElement = (b && b->hasTagName(bodyTag)) ? static_cast(b) : 0; if (bodyElement) { // This check is a bit silly, but some benchmarks like to set the // document's link colors over and over to the same value and we // don't want to incur a style update each time. if (bodyElement->vLink() != value) bodyElement->setVLink(value); } } void HTMLDocument::captureEvents() { } void HTMLDocument::releaseEvents() { } Tokenizer *HTMLDocument::createTokenizer() { bool reportErrors = true; return new HTMLTokenizer(this, reportErrors); } // -------------------------------------------------------------------------- // not part of the DOM // -------------------------------------------------------------------------- bool HTMLDocument::childAllowed(Node *newChild) { return newChild->hasTagName(htmlTag) || newChild->isCommentNode(); } PassRefPtr HTMLDocument::createElement(const String &name, ExceptionCode& ec) { String lowerName(name.lower()); if (!isValidName(lowerName)) { ec = INVALID_CHARACTER_ERR; return 0; } return HTMLElementFactory::createHTMLElement(AtomicString(lowerName), this, 0, false); } static void addItemToMap(HTMLDocument::NameCountMap& map, const String& name) { if (name.length() == 0) return; HTMLDocument::NameCountMap::iterator it = map.find(name.impl()); if (it == map.end()) map.set(name.impl(), 1); else ++(it->second); } static void removeItemFromMap(HTMLDocument::NameCountMap& map, const String& name) { if (name.length() == 0) return; HTMLDocument::NameCountMap::iterator it = map.find(name.impl()); if (it == map.end()) return; int oldVal = it->second; ASSERT(oldVal != 0); int newVal = oldVal - 1; if (newVal == 0) map.remove(it); else it->second = newVal; } void HTMLDocument::addNamedItem(const String& name) { addItemToMap(namedItemCounts, name); } void HTMLDocument::removeNamedItem(const String &name) { removeItemFromMap(namedItemCounts, name); } bool HTMLDocument::hasNamedItem(const String& name) { return namedItemCounts.get(name.impl()) != 0; } void HTMLDocument::addDocExtraNamedItem(const String& name) { addItemToMap(docExtraNamedItemCounts, name); } void HTMLDocument::removeDocExtraNamedItem(const String& name) { removeItemFromMap(docExtraNamedItemCounts, name); } bool HTMLDocument::hasDocExtraNamedItem(const String& name) { return docExtraNamedItemCounts.get(name.impl()) != 0; } const int PARSEMODE_HAVE_DOCTYPE = (1<<0); const int PARSEMODE_HAVE_PUBLIC_ID = (1<<1); const int PARSEMODE_HAVE_SYSTEM_ID = (1<<2); const int PARSEMODE_HAVE_INTERNAL = (1<<3); static int parseDocTypePart(const String& buffer, int index) { while (true) { UChar ch = buffer[index]; if (ch == ' ' || ch == '\t' || ch == '\n' || ch == '\r') ++index; else if (ch == '-') { int tmpIndex=index; if (buffer[index+1] == '-' && ((tmpIndex=buffer.find("--", index+2)) != -1)) index = tmpIndex+2; else return index; } else return index; } } static bool containsString(const char* str, const String& buffer, int offset) { String startString(str); if (offset + startString.length() > buffer.length()) return false; String bufferString = buffer.substring(offset, startString.length()).lower(); String lowerStart = startString.lower(); return bufferString.startsWith(lowerStart); } static bool parseDocTypeDeclaration(const String& buffer, int* resultFlags, String& name, String& publicID, String& systemID) { bool haveDocType = false; *resultFlags = 0; // Skip through any comments and processing instructions. int index = 0; do { index = buffer.find('<', index); if (index == -1) break; UChar nextChar = buffer[index+1]; if (nextChar == '!') { if (containsString("doctype", buffer, index+2)) { haveDocType = true; index += 9; // Skip "', index); } else if (nextChar == '?') index = buffer.find('>', index); else break; } while (index != -1); if (!haveDocType) return true; *resultFlags |= PARSEMODE_HAVE_DOCTYPE; index = parseDocTypePart(buffer, index); if (!containsString("html", buffer, index)) return false; name = buffer.substring(index, 4); index = parseDocTypePart(buffer, index+4); bool hasPublic = containsString("public", buffer, index); if (hasPublic) { index = parseDocTypePart(buffer, index+6); // We've read ') { // Public identifier present, but no system identifier. // Do nothing. Note that this is the most common // case. } else if (next == '\"' || next == '\'') { // We have a system identifier. *resultFlags |= PARSEMODE_HAVE_SYSTEM_ID; int systemIDStart = index+1; int systemIDEnd = buffer.find(next, systemIDStart); if (systemIDEnd == -1) return false; systemID = buffer.substring(systemIDStart, systemIDEnd - systemIDStart); } else if (next == '[') { // We found an internal subset. *resultFlags |= PARSEMODE_HAVE_INTERNAL; } else return false; // Something's wrong. // We need to trim whitespace off the public identifier. publicID = buffer.substring(publicIDStart, publicIDEnd - publicIDStart); publicID = publicID.stripWhiteSpace(); *resultFlags |= PARSEMODE_HAVE_PUBLIC_ID; } else { if (containsString("system", buffer, index)) { // Doctype has a system ID but no public ID *resultFlags |= PARSEMODE_HAVE_SYSTEM_ID; index = parseDocTypePart(buffer, index+6); UChar next = buffer[index]; if (next != '\"' && next != '\'') return false; int systemIDStart = index+1; int systemIDEnd = buffer.find(next, systemIDStart); if (systemIDEnd == -1) return false; systemID = buffer.substring(systemIDStart, systemIDEnd - systemIDStart); index = parseDocTypePart(buffer, systemIDEnd+1); } UChar nextChar = buffer[index]; if (nextChar == '[') *resultFlags |= PARSEMODE_HAVE_INTERNAL; else if (nextChar != '>') return false; } return true; } void HTMLDocument::determineParseMode(const String& str) { // This code more or less mimics Mozilla's implementation (specifically the // doctype parsing implemented by David Baron in Mozilla's nsParser.cpp). // // There are three possible parse modes: // COMPAT - quirks mode emulates WinIE // and NS4. CSS parsing is also relaxed in this mode, e.g., unit types can // be omitted from numbers. // ALMOST STRICT - This mode is identical to strict mode // except for its treatment of line-height in the inline box model. For // now (until the inline box model is re-written), this mode is identical // to STANDARDS mode. // STRICT - no quirks apply. Web pages will obey the specifications to // the letter. String name, systemID, publicID; int resultFlags = 0; if (parseDocTypeDeclaration(str, &resultFlags, name, publicID, systemID)) { if (resultFlags & PARSEMODE_HAVE_DOCTYPE) setDocType(new DocumentType(this, name, publicID, systemID)); if (!(resultFlags & PARSEMODE_HAVE_DOCTYPE)) { // No doctype found at all. Default to quirks mode and Html4. setParseMode(Compat); setHTMLMode(Html4); } else if ((resultFlags & PARSEMODE_HAVE_INTERNAL) || !(resultFlags & PARSEMODE_HAVE_PUBLIC_ID)) { // Internal subsets always denote full standards, as does // a doctype without a public ID. setParseMode(Strict); setHTMLMode(Html4); } else { // We have to check a list of public IDs to see what we // should do. String lowerPubID = publicID.lower(); CString pubIDStr = lowerPubID.latin1(); // Look up the entry in our gperf-generated table. const PubIDInfo* doctypeEntry = findDoctypeEntry(pubIDStr.data(), pubIDStr.length()); if (!doctypeEntry) { // The DOCTYPE is not in the list. Assume strict mode. setParseMode(Strict); setHTMLMode(Html4); return; } switch ((resultFlags & PARSEMODE_HAVE_SYSTEM_ID) ? doctypeEntry->mode_if_sysid : doctypeEntry->mode_if_no_sysid) { case PubIDInfo::eQuirks3: setParseMode(Compat); setHTMLMode(Html3); break; case PubIDInfo::eQuirks: setParseMode(Compat); setHTMLMode(Html4); break; case PubIDInfo::eAlmostStandards: setParseMode(AlmostStrict); setHTMLMode(Html4); break; default: ASSERT(false); } } } else { // Malformed doctype implies quirks mode. setParseMode(Compat); setHTMLMode(Html3); } styleSelector()->strictParsing = !inCompatMode(); } }