/* -*- Mode: C++; tab-width: 2; indent-tabs-mode: nil; c-basic-offset: 2 -*- */ /* ***** BEGIN LICENSE BLOCK ***** * Version: MPL 1.1/GPL 2.0/LGPL 2.1 * * The contents of this file are subject to the Mozilla Public License Version * 1.1 (the "License"); you may not use this file except in compliance with * the License. You may obtain a copy of the License at * http://www.mozilla.org/MPL/ * * Software distributed under the License is distributed on an "AS IS" basis, * WITHOUT WARRANTY OF ANY KIND, either express or implied. See the License * for the specific language governing rights and limitations under the * License. * * The Original Code is mozilla.org code. * * The Initial Developer of the Original Code is * Netscape Communications Corporation. * Portions created by the Initial Developer are Copyright (C) 1998 * the Initial Developer. All Rights Reserved. * * Contributor(s): * * Alternatively, the contents of this file may be used under the terms of * either the GNU General Public License Version 2 or later (the "GPL"), or * the GNU Lesser General Public License Version 2.1 or later (the "LGPL"), * in which case the provisions of the GPL or the LGPL are applicable instead * of those above. If you wish to allow use of your version of this file only * under the terms of either the GPL or the LGPL, and not to allow others to * use your version of this file under the terms of the MPL, indicate your * decision by deleting the provisions above and replace them with the notice * and other provisions required by the GPL or the LGPL. If you do not delete * the provisions above, a recipient may use your version of this file under * the terms of any one of the MPL, the GPL or the LGPL. * * ***** END LICENSE BLOCK ***** */ /* * Base class for the XML and HTML content sinks, which construct a * DOM based on information from the parser. */ #include "nsContentSink.h" #include "nsIScriptLoader.h" #include "nsIDocument.h" #include "nsICSSLoader.h" #include "nsStyleConsts.h" #include "nsStyleLinkElement.h" #include "nsINodeInfo.h" #include "nsIDocShell.h" #include "nsIDocShellTreeItem.h" #include "nsCPrefetchService.h" #include "nsIURI.h" #include "nsNetUtil.h" #include "nsIHttpChannel.h" #include "nsIContent.h" #include "nsIScriptElement.h" #include "nsIParser.h" #include "nsContentErrors.h" #include "nsIPresShell.h" #include "nsPresContext.h" #include "nsIViewManager.h" #include "nsIScrollableView.h" #include "nsIContentViewer.h" #include "nsIAtom.h" #include "nsHTMLAtoms.h" #include "nsIDOMWindowInternal.h" #include "nsIPrincipal.h" #include "nsIScriptGlobalObject.h" #include "nsNetCID.h" #include "nsICookieService.h" #include "nsIPrompt.h" #include "nsServiceManagerUtils.h" #include "nsContentUtils.h" #include "nsParserUtils.h" #include "nsCRT.h" #include "nsEscape.h" #include "nsWeakReference.h" #include "nsUnicharUtils.h" #include "nsNodeInfoManager.h" #ifdef ALLOW_ASYNCH_STYLE_SHEETS const PRBool kBlockByDefault = PR_FALSE; #else const PRBool kBlockByDefault = PR_TRUE; #endif class nsScriptLoaderObserverProxy : public nsIScriptLoaderObserver { public: nsScriptLoaderObserverProxy(nsIScriptLoaderObserver* aInner) : mInner(do_GetWeakReference(aInner)) { } virtual ~nsScriptLoaderObserverProxy() { } NS_DECL_ISUPPORTS NS_DECL_NSISCRIPTLOADEROBSERVER nsWeakPtr mInner; }; NS_IMPL_ISUPPORTS1(nsScriptLoaderObserverProxy, nsIScriptLoaderObserver) NS_IMETHODIMP nsScriptLoaderObserverProxy::ScriptAvailable(nsresult aResult, nsIScriptElement *aElement, PRBool aIsInline, PRBool aWasPending, nsIURI *aURI, PRInt32 aLineNo, const nsAString & aScript) { nsCOMPtr inner = do_QueryReferent(mInner); if (inner) { return inner->ScriptAvailable(aResult, aElement, aIsInline, aWasPending, aURI, aLineNo, aScript); } return NS_OK; } NS_IMETHODIMP nsScriptLoaderObserverProxy::ScriptEvaluated(nsresult aResult, nsIScriptElement *aElement, PRBool aIsInline, PRBool aWasPending) { nsCOMPtr inner = do_QueryReferent(mInner); if (inner) { return inner->ScriptEvaluated(aResult, aElement, aIsInline, aWasPending); } return NS_OK; } NS_IMPL_ISUPPORTS3(nsContentSink, nsICSSLoaderObserver, nsISupportsWeakReference, nsIScriptLoaderObserver) nsContentSink::nsContentSink() : mNeedToBlockParser(PR_FALSE) { } nsContentSink::~nsContentSink() { } nsresult nsContentSink::Init(nsIDocument* aDoc, nsIURI* aURI, nsISupports* aContainer, nsIChannel* aChannel) { NS_PRECONDITION(aDoc, "null ptr"); NS_PRECONDITION(aURI, "null ptr"); if (!aDoc || !aURI) { return NS_ERROR_NULL_POINTER; } mDocument = aDoc; mDocumentURI = aURI; mDocumentBaseURI = aURI; mDocShell = do_QueryInterface(aContainer); // use this to avoid a circular reference sink->document->scriptloader->sink nsCOMPtr proxy = new nsScriptLoaderObserverProxy(this); NS_ENSURE_TRUE(proxy, NS_ERROR_OUT_OF_MEMORY); nsIScriptLoader *loader = mDocument->GetScriptLoader(); NS_ENSURE_TRUE(loader, NS_ERROR_FAILURE); nsresult rv = loader->AddObserver(proxy); NS_ENSURE_SUCCESS(rv, rv); mCSSLoader = aDoc->CSSLoader(); ProcessHTTPHeaders(aChannel); mNodeInfoManager = aDoc->NodeInfoManager(); return NS_OK; } NS_IMETHODIMP nsContentSink::StyleSheetLoaded(nsICSSStyleSheet* aSheet, PRBool aWasAlternate, nsresult aStatus) { return NS_OK; } NS_IMETHODIMP nsContentSink::ScriptAvailable(nsresult aResult, nsIScriptElement *aElement, PRBool aIsInline, PRBool aWasPending, nsIURI *aURI, PRInt32 aLineNo, const nsAString& aScript) { PRUint32 count = mScriptElements.Count(); if (count == 0) { return NS_OK; } // Check if this is the element we were waiting for if (aElement != mScriptElements[count - 1]) { return NS_OK; } if (mParser && !mParser->IsParserEnabled()) { // make sure to unblock the parser before evaluating the script, // we must unblock the parser even if loading the script failed or // if the script was empty, if we don't, the parser will never be // unblocked. mParser->UnblockParser(); } // Mark the current script as loaded mNeedToBlockParser = PR_FALSE; if (NS_SUCCEEDED(aResult) && aResult != NS_CONTENT_SCRIPT_IS_EVENTHANDLER) { PreEvaluateScript(); } else { mScriptElements.RemoveObjectAt(count - 1); if (mParser && aWasPending && aResult != NS_BINDING_ABORTED) { // Loading external script failed!. So, resume parsing since the parser // got blocked when loading external script. See // http://bugzilla.mozilla.org/show_bug.cgi?id=94903. // // XXX We don't resume parsing if we get NS_BINDING_ABORTED from the // script load, assuming that that error code means that the user // stopped the load through some action (like clicking a link). See // http://bugzilla.mozilla.org/show_bug.cgi?id=243392. mParser->ContinueInterruptedParsing(); } } return NS_OK; } NS_IMETHODIMP nsContentSink::ScriptEvaluated(nsresult aResult, nsIScriptElement *aElement, PRBool aIsInline, PRBool aWasPending) { // Check if this is the element we were waiting for PRInt32 count = mScriptElements.Count(); if (count == 0) { return NS_OK; } if (aElement != mScriptElements[count - 1]) { return NS_OK; } // Pop the script element stack mScriptElements.RemoveObjectAt(count - 1); if (NS_SUCCEEDED(aResult)) { PostEvaluateScript(aElement); } if (mParser && mParser->IsParserEnabled() && aWasPending) { mParser->ContinueInterruptedParsing(); } return NS_OK; } nsresult nsContentSink::ProcessHTTPHeaders(nsIChannel* aChannel) { nsCOMPtr httpchannel(do_QueryInterface(aChannel)); if (!httpchannel) { return NS_OK; } // Note that the only header we care about is the "link" header, since we // have all the infrastructure for kicking off stylesheet loads. nsCAutoString linkHeader; nsresult rv = httpchannel->GetResponseHeader(NS_LITERAL_CSTRING("link"), linkHeader); if (NS_SUCCEEDED(rv) && !linkHeader.IsEmpty()) { ProcessHeaderData(nsHTMLAtoms::link, NS_ConvertASCIItoUTF16(linkHeader)); } return NS_OK; } nsresult nsContentSink::ProcessHeaderData(nsIAtom* aHeader, const nsAString& aValue, nsIContent* aContent) { nsresult rv = NS_OK; // necko doesn't process headers coming in from the parser mDocument->SetHeaderData(aHeader, aValue); if (aHeader == nsHTMLAtoms::setcookie) { // Note: Necko already handles cookies set via the channel. We can't just // call SetCookie on the channel because we want to do some security checks // here and want to use the prompt associated to our current window, not // the window where the channel was dispatched. nsCOMPtr cookieServ = do_GetService(NS_COOKIESERVICE_CONTRACTID, &rv); if (NS_FAILED(rv)) { return rv; } // Get a URI from the document principal // We use the original codebase in case the codebase was changed // by SetDomain // Note that a non-codebase principal (eg the system principal) will return // a null URI. nsCOMPtr codebaseURI; rv = mDocument->NodePrincipal()->GetURI(getter_AddRefs(codebaseURI)); NS_ENSURE_TRUE(codebaseURI, rv); nsCOMPtr prompt; nsCOMPtr window (do_QueryInterface(mDocument->GetScriptGlobalObject())); if (window) { window->GetPrompter(getter_AddRefs(prompt)); } nsCOMPtr channel; if (mParser) { mParser->GetChannel(getter_AddRefs(channel)); } rv = cookieServ->SetCookieString(codebaseURI, prompt, NS_ConvertUTF16toUTF8(aValue).get(), channel); if (NS_FAILED(rv)) { return rv; } } else if (aHeader == nsHTMLAtoms::link) { rv = ProcessLinkHeader(aContent, aValue); } else if (aHeader == nsHTMLAtoms::msthemecompatible) { // Disable theming for the presshell if the value is no. // XXXbz don't we want to support this as an HTTP header too? nsAutoString value(aValue); if (value.LowerCaseEqualsLiteral("no")) { nsIPresShell* shell = mDocument->GetShellAt(0); if (shell) { shell->DisableThemeSupport(); } } } // Don't report "refresh" headers back to necko, since our document handles // them else if (aHeader != nsHTMLAtoms::refresh && mParser) { // we also need to report back HTTP-EQUIV headers to the channel // so that it can process things like pragma: no-cache or other // cache-control headers. Ideally this should also be the way for // cookies to be set! But we'll worry about that in the next // iteration nsCOMPtr channel; if (NS_SUCCEEDED(mParser->GetChannel(getter_AddRefs(channel)))) { nsCOMPtr httpChannel(do_QueryInterface(channel)); if (httpChannel) { const char* header; (void)aHeader->GetUTF8String(&header); (void)httpChannel->SetResponseHeader(nsDependentCString(header), NS_ConvertUTF16toUTF8(aValue), PR_TRUE); } } } return rv; } static const PRUnichar kSemiCh = PRUnichar(';'); static const PRUnichar kCommaCh = PRUnichar(','); static const PRUnichar kEqualsCh = PRUnichar('='); static const PRUnichar kLessThanCh = PRUnichar('<'); static const PRUnichar kGreaterThanCh = PRUnichar('>'); nsresult nsContentSink::ProcessLinkHeader(nsIContent* aElement, const nsAString& aLinkData) { nsresult rv = NS_OK; // parse link content and call process style link nsAutoString href; nsAutoString rel; nsAutoString title; nsAutoString type; nsAutoString media; PRBool didBlock = PR_FALSE; // copy to work buffer nsAutoString stringList(aLinkData); // put an extra null at the end stringList.Append(kNullCh); PRUnichar* start = stringList.BeginWriting(); PRUnichar* end = start; PRUnichar* last = start; PRUnichar endCh; while (*start != kNullCh) { // skip leading space while ((*start != kNullCh) && nsCRT::IsAsciiSpace(*start)) { ++start; } end = start; last = end - 1; // look for semicolon or comma while (*end != kNullCh && *end != kSemiCh && *end != kCommaCh) { PRUnichar ch = *end; if (ch == kApostrophe || ch == kQuote || ch == kLessThanCh) { // quoted string PRUnichar quote = *end; if (quote == kLessThanCh) { quote = kGreaterThanCh; } PRUnichar* closeQuote = (end + 1); // seek closing quote while (*closeQuote != kNullCh && quote != *closeQuote) { ++closeQuote; } if (quote == *closeQuote) { // found closer // skip to close quote end = closeQuote; last = end - 1; ch = *(end + 1); if (ch != kNullCh && ch != kSemiCh && ch != kCommaCh) { // end string here *(++end) = kNullCh; ch = *(end + 1); // keep going until semi or comma while (ch != kNullCh && ch != kSemiCh && ch != kCommaCh) { ++end; ch = *end; } } } } ++end; ++last; } endCh = *end; // end string here *end = kNullCh; if (start < end) { if ((*start == kLessThanCh) && (*last == kGreaterThanCh)) { *last = kNullCh; if (href.IsEmpty()) { // first one wins href = (start + 1); href.StripWhitespace(); } } else { PRUnichar* equals = start; while ((*equals != kNullCh) && (*equals != kEqualsCh)) { equals++; } if (*equals != kNullCh) { *equals = kNullCh; nsAutoString attr(start); attr.StripWhitespace(); PRUnichar* value = ++equals; while (nsCRT::IsAsciiSpace(*value)) { value++; } if (((*value == kApostrophe) || (*value == kQuote)) && (*value == *last)) { *last = kNullCh; value++; } if (attr.LowerCaseEqualsLiteral("rel")) { if (rel.IsEmpty()) { rel = value; rel.CompressWhitespace(); } } else if (attr.LowerCaseEqualsLiteral("title")) { if (title.IsEmpty()) { title = value; title.CompressWhitespace(); } } else if (attr.LowerCaseEqualsLiteral("type")) { if (type.IsEmpty()) { type = value; type.StripWhitespace(); } } else if (attr.LowerCaseEqualsLiteral("media")) { if (media.IsEmpty()) { media = value; // HTML4.0 spec is inconsistent, make it case INSENSITIVE ToLowerCase(media); } } } } } if (endCh == kCommaCh) { // hit a comma, process what we've got so far if (!href.IsEmpty() && !rel.IsEmpty()) { rv = ProcessLink(aElement, href, rel, title, type, media); if (rv == NS_ERROR_HTMLPARSER_BLOCK) { didBlock = PR_TRUE; } } href.Truncate(); rel.Truncate(); title.Truncate(); type.Truncate(); media.Truncate(); } start = ++end; } if (!href.IsEmpty() && !rel.IsEmpty()) { rv = ProcessLink(aElement, href, rel, title, type, media); if (NS_SUCCEEDED(rv) && didBlock) { rv = NS_ERROR_HTMLPARSER_BLOCK; } } return rv; } nsresult nsContentSink::ProcessLink(nsIContent* aElement, const nsSubstring& aHref, const nsSubstring& aRel, const nsSubstring& aTitle, const nsSubstring& aType, const nsSubstring& aMedia) { // XXX seems overkill to generate this string array nsStringArray linkTypes; nsStyleLinkElement::ParseLinkTypes(aRel, linkTypes); PRBool hasPrefetch = (linkTypes.IndexOf(NS_LITERAL_STRING("prefetch")) != -1); // prefetch href if relation is "next" or "prefetch" if (hasPrefetch || linkTypes.IndexOf(NS_LITERAL_STRING("next")) != -1) { PrefetchHref(aHref, hasPrefetch); } // is it a stylesheet link? if (linkTypes.IndexOf(NS_LITERAL_STRING("stylesheet")) == -1) { return NS_OK; } PRBool isAlternate = linkTypes.IndexOf(NS_LITERAL_STRING("alternate")) != -1; return ProcessStyleLink(aElement, aHref, isAlternate, aTitle, aType, aMedia); } nsresult nsContentSink::ProcessStyleLink(nsIContent* aElement, const nsSubstring& aHref, PRBool aAlternate, const nsSubstring& aTitle, const nsSubstring& aType, const nsSubstring& aMedia) { if (aAlternate && aTitle.IsEmpty()) { // alternates must have title return without error, for now return NS_OK; } nsAutoString mimeType; nsAutoString params; nsParserUtils::SplitMimeType(aType, mimeType, params); // see bug 18817 if (!mimeType.IsEmpty() && !mimeType.LowerCaseEqualsLiteral("text/css")) { // Unknown stylesheet language return NS_OK; } nsCOMPtr url; nsresult rv = NS_NewURI(getter_AddRefs(url), aHref, nsnull, mDocumentBaseURI); if (NS_FAILED(rv)) { // The URI is bad, move along, don't propagate the error (for now) return NS_OK; } nsIParser* parser = nsnull; if (kBlockByDefault) { parser = mParser; } PRBool isAlternate; rv = mCSSLoader->LoadStyleLink(aElement, url, aTitle, aMedia, aAlternate, parser, this, &isAlternate); if (NS_SUCCEEDED(rv) && parser && !isAlternate) { rv = NS_ERROR_HTMLPARSER_BLOCK; } return rv; } nsresult nsContentSink::ProcessMETATag(nsIContent* aContent) { NS_ASSERTION(aContent, "missing base-element"); nsresult rv = NS_OK; // set any HTTP-EQUIV data into document's header data as well as url nsAutoString header; aContent->GetAttr(kNameSpaceID_None, nsHTMLAtoms::httpEquiv, header); if (!header.IsEmpty()) { nsAutoString result; aContent->GetAttr(kNameSpaceID_None, nsHTMLAtoms::content, result); if (!result.IsEmpty()) { ToLowerCase(header); nsCOMPtr fieldAtom(do_GetAtom(header)); rv = ProcessHeaderData(fieldAtom, result, aContent); } } return rv; } void nsContentSink::PrefetchHref(const nsAString &aHref, PRBool aExplicit) { // // SECURITY CHECK: disable prefetching from mailnews! // // walk up the docshell tree to see if any containing // docshell are of type MAIL. // if (!mDocShell) return; nsCOMPtr docshell = mDocShell; nsCOMPtr treeItem, parentItem; do { PRUint32 appType = 0; nsresult rv = docshell->GetAppType(&appType); if (NS_FAILED(rv) || appType == nsIDocShell::APP_TYPE_MAIL) return; // do not prefetch from mailnews if (treeItem = do_QueryInterface(docshell)) { treeItem->GetParent(getter_AddRefs(parentItem)); if (parentItem) { treeItem = parentItem; docshell = do_QueryInterface(treeItem); if (!docshell) { NS_ERROR("cannot get a docshell from a treeItem!"); return; } } } } while (parentItem); // OK, we passed the security check... nsCOMPtr prefetchService(do_GetService(NS_PREFETCHSERVICE_CONTRACTID)); if (prefetchService) { // construct URI using document charset const nsACString &charset = mDocument->GetDocumentCharacterSet(); nsCOMPtr uri; NS_NewURI(getter_AddRefs(uri), aHref, charset.IsEmpty() ? nsnull : PromiseFlatCString(charset).get(), mDocumentBaseURI); if (uri) { prefetchService->PrefetchURI(uri, mDocumentURI, aExplicit); } } } PRBool nsContentSink::ScrollToRef(PRBool aReallyScroll) { if (mRef.IsEmpty()) { return PR_FALSE; } PRBool didScroll = PR_FALSE; char* tmpstr = ToNewCString(mRef); if (!tmpstr) { return PR_FALSE; } nsUnescape(tmpstr); nsCAutoString unescapedRef; unescapedRef.Assign(tmpstr); nsMemory::Free(tmpstr); nsresult rv = NS_ERROR_FAILURE; // We assume that the bytes are in UTF-8, as it says in the spec: // http://www.w3.org/TR/html4/appendix/notes.html#h-B.2.1 NS_ConvertUTF8toUTF16 ref(unescapedRef); PRInt32 i, ns = mDocument->GetNumberOfShells(); for (i = 0; i < ns; i++) { nsIPresShell* shell = mDocument->GetShellAt(i); if (shell) { // Check an empty string which might be caused by the UTF-8 conversion if (!ref.IsEmpty()) { // Note that GoToAnchor will handle flushing layout as needed. rv = shell->GoToAnchor(ref, aReallyScroll); } else { rv = NS_ERROR_FAILURE; } // If UTF-8 URI failed then try to assume the string as a // document's charset. if (NS_FAILED(rv)) { const nsACString &docCharset = mDocument->GetDocumentCharacterSet(); rv = nsContentUtils::ConvertStringFromCharset(docCharset, unescapedRef, ref); if (NS_SUCCEEDED(rv) && !ref.IsEmpty()) rv = shell->GoToAnchor(ref, aReallyScroll); } if (NS_SUCCEEDED(rv)) { didScroll = PR_TRUE; } } } return didScroll; } nsresult nsContentSink::RefreshIfEnabled(nsIViewManager* vm) { if (!vm) { return NS_OK; } NS_ENSURE_TRUE(mDocShell, NS_ERROR_FAILURE); nsCOMPtr contentViewer; mDocShell->GetContentViewer(getter_AddRefs(contentViewer)); if (contentViewer) { PRBool enabled; contentViewer->GetEnableRendering(&enabled); if (enabled) { vm->EnableRefresh(NS_VMREFRESH_IMMEDIATE); } } return NS_OK; } void nsContentSink::StartLayout(PRBool aIsFrameset) { PRUint32 i, ns = mDocument->GetNumberOfShells(); for (i = 0; i < ns; i++) { nsIPresShell *shell = mDocument->GetShellAt(i); if (shell) { // Make sure we don't call InitialReflow() for a shell that has // already called it. This can happen when the layout frame for // an iframe is constructed *between* the Embed() call for the // docshell in the iframe, and the content sink's call to OpenBody(). // (Bug 153815) PRBool didInitialReflow = PR_FALSE; shell->GetDidInitialReflow(&didInitialReflow); if (didInitialReflow) { // XXX: The assumption here is that if something already // called InitialReflow() on this shell, it also did some of // the setup below, so we do nothing and just move on to the // next shell in the list. continue; } // Make shell an observer for next time shell->BeginObservingDocument(); // Resize-reflow this time nsRect r = shell->GetPresContext()->GetVisibleArea(); nsresult rv = shell->InitialReflow(r.width, r.height); if (NS_FAILED(rv)) { return; } // Now trigger a refresh RefreshIfEnabled(shell->GetViewManager()); } } // If the document we are loading has a reference or it is a // frameset document, disable the scroll bars on the views. if (mDocumentURI) { nsCAutoString ref; // Since all URI's that pass through here aren't URL's we can't // rely on the nsIURI implementation for providing a way for // finding the 'ref' part of the URI, we'll haveto revert to // string routines for finding the data past '#' mDocumentURI->GetSpec(ref); nsReadingIterator start, end; ref.BeginReading(start); ref.EndReading(end); if (FindCharInReadable('#', start, end)) { ++start; // Skip over the '#' mRef = Substring(start, end); } } }