/* -*- Mode: C++; tab-width: 2; indent-tabs-mode: nil; c-basic-offset: 2 -*- */ /* * The contents of this file are subject to the Netscape Public * License Version 1.1 (the "License"); you may not use this file * except in compliance with the License. You may obtain a copy of * the License at http://www.mozilla.org/NPL/ * * Software distributed under the License is distributed on an "AS * IS" basis, WITHOUT WARRANTY OF ANY KIND, either express or * implied. See the License for the specific language governing * rights and limitations under the License. * * The Original Code is mozilla.org code. * * The Initial Developer of the Original Code is Netscape * Communications Corporation. Portions created by Netscape are * Copyright (C) 1998 Netscape Communications Corporation. All * Rights Reserved. * * Contributor(s): */ /** * MODULE NOTES: * @update gess 4/8/98 * * */ #ifdef RAPTOR_PERF_METRICS # define START_TIMER() \ if(mParser) mParser->mParseTime.Start(PR_FALSE); \ if(mParser) mParser->mDTDTime.Start(PR_FALSE); # define STOP_TIMER() \ if(mParser) mParser->mParseTime.Stop(); \ if(mParser) mParser->mDTDTime.Stop(); #else # define STOP_TIMER() # define START_TIMER() #endif #include "nsIDTDDebug.h" #include "nsViewSourceHTML.h" #include "nsCRT.h" #include "nsParser.h" #include "nsScanner.h" #include "nsIParser.h" #include "nsTokenHandler.h" #include "nsDTDUtils.h" #include "nsIContentSink.h" #include "nsIHTMLContentSink.h" #include "nsHTMLTokenizer.h" #include "prenv.h" //this is here for debug reasons... #include "prtypes.h" //this is here for debug reasons... #include "prio.h" #include "plstr.h" #ifdef XP_PC #include //this is here for debug reasons... 
#endif #include "prmem.h" #ifdef RAPTOR_PERF_METRICS #include "stopwatch.h" Stopwatch vsTimer; #endif static NS_DEFINE_IID(kISupportsIID, NS_ISUPPORTS_IID); static NS_DEFINE_IID(kIDTDIID, NS_IDTD_IID); static NS_DEFINE_IID(kClassIID, NS_VIEWSOURCE_HTML_IID); static CTokenRecycler* gTokenRecycler=0; //#define rickgdebug #ifdef rickgdebug #include fstream* gDumpFile=0; #endif /** * This method gets called as part of our COM-like interfaces. * Its purpose is to create an interface to parser object * of some type. * * @update gess 4/8/98 * @param nsIID id of object to discover * @param aInstancePtr ptr to newly discovered interface * @return NS_xxx result code */ nsresult CViewSourceHTML::QueryInterface(const nsIID& aIID, void** aInstancePtr) { if (NULL == aInstancePtr) { return NS_ERROR_NULL_POINTER; } if(aIID.Equals(kISupportsIID)) { //do IUnknown... *aInstancePtr = (nsIDTD*)(this); } else if(aIID.Equals(kIDTDIID)) { //do IParser base class... *aInstancePtr = (nsIDTD*)(this); } else if(aIID.Equals(kClassIID)) { //do this class... *aInstancePtr = (CViewSourceHTML*)(this); } else { *aInstancePtr=0; return NS_NOINTERFACE; } NS_ADDREF_THIS(); return NS_OK; } /** * This method is defined in nsIParser. It is used to * cause the COM-like construction of an nsParser. 
* * @update gess 4/8/98 * @param nsIParser** ptr to newly instantiated parser * @return NS_xxx error result */ NS_HTMLPARS nsresult NS_NewViewSourceHTML(nsIDTD** aInstancePtrResult) { CViewSourceHTML* it = new CViewSourceHTML(); if (it == 0) { return NS_ERROR_OUT_OF_MEMORY; } return it->QueryInterface(kClassIID, (void **) aInstancePtrResult); } NS_IMPL_ADDREF(CViewSourceHTML) NS_IMPL_RELEASE(CViewSourceHTML) /******************************************** ********************************************/ class CIndirectTextToken : public CTextToken { public: CIndirectTextToken() : CTextToken() { mIndirectString=0; } void SetIndirectString(const nsString& aString) { mIndirectString=&aString; } virtual nsString& GetStringValueXXX(void){ return (nsString&)*mIndirectString; } const nsString* mIndirectString; }; /******************************************************************* Now define the CSharedVSCOntext class... *******************************************************************/ class CSharedVSContext { public: CSharedVSContext() : mEndNode(), mStartNode(), mTokenNode(), mITextToken(), mITextNode(&mITextToken), mTextToken(), mTextNode(&mTextToken){ } ~CSharedVSContext() { } static CSharedVSContext& GetSharedContext() { static CSharedVSContext gSharedVSContext; return gSharedVSContext; } nsCParserNode mEndNode; nsCParserNode mStartNode; nsCParserNode mTokenNode; CIndirectTextToken mITextToken; nsCParserNode mITextNode; CTextToken mTextToken; nsCParserNode mTextNode; }; /** * Default constructor * * @update gess 4/9/98 * @param * @return */ CViewSourceHTML::CViewSourceHTML() : nsIDTD(), mStartTag("start"), mEndTag("end"), mCommentTag("comment"), mCDATATag("cdata"), mDocTypeTag("doctype"), mPITag("pi"), mEntityTag("entity"), mText("txt"), mKey("key"), mValue("val") { NS_INIT_REFCNT(); mParser=0; mSink=0; mLineNumber=0; mTokenizer=0; mIsText=PR_FALSE; #ifdef rickgdebug gDumpFile = new fstream("c:/temp/viewsource.xml",ios::trunc); #endif } /** * Default destructor * * 
@update gess 4/9/98 * @param * @return */ CViewSourceHTML::~CViewSourceHTML(){ mParser=0; //just to prove we destructed... NS_IF_RELEASE(mTokenizer); } /** * * @update gess1/8/99 * @param * @return */ const nsIID& CViewSourceHTML::GetMostDerivedIID(void) const{ return kClassIID; } /** * Call this method if you want the DTD to construct a fresh * instance of itself. * @update gess7/23/98 * @param * @return */ nsresult CViewSourceHTML::CreateNewInstance(nsIDTD** aInstancePtrResult){ return NS_NewViewSourceHTML(aInstancePtrResult); } /** * This method is called to determine if the given DTD can parse * a document in a given source-type. * NOTE: Parsing always assumes that the end result will involve * storing the result in the main content model. * @update gess6/24/98 * @param * @return TRUE if this DTD can satisfy the request; FALSE otherwise. */ eAutoDetectResult CViewSourceHTML::CanParse(nsString& aContentType, nsString& aCommand, nsString& aBuffer, PRInt32 aVersion) { eAutoDetectResult result=eUnknownDetect; if(aContentType.Equals(kPlainTextContentType) || aContentType.Equals(kTextCSSContentType)) { result=eValidDetect; } else if(aCommand.Equals(kViewSourceCommand)) { if(aContentType.Equals(kXMLTextContentType) || aContentType.Equals(kRDFTextContentType) || aContentType.Equals(kHTMLTextContentType) || aContentType.Equals(kPlainTextContentType) || aContentType.Equals(kXULTextContentType)) { result=ePrimaryDetect; } } return result; } /** * * @update gess5/18/98 * @param * @return */ NS_IMETHODIMP CViewSourceHTML::WillBuildModel(nsString& aFilename,PRBool aNotifySink, nsString& aSourceType,eParseMode aParseMode, nsString& aCommand,nsIContentSink* aSink){ nsresult result=NS_OK; #ifdef RAPTOR_PERF_METRICS vsTimer.Reset(); NS_START_STOPWATCH(vsTimer); #endif STOP_TIMER(); mSink=(nsIXMLContentSink*)aSink; if((aNotifySink) && (mSink)) { static const char* theHeader=""; CToken ssToken(theHeader); nsCParserNode ssNode(&ssToken); result= mSink->AddCharacterData(ssNode); 
#ifdef rickgdebug (*gDumpFile) << theHeader << endl; (*gDumpFile) << "" << endl; #endif //now let's automatically open the root container... CToken theToken("viewsource"); nsCParserNode theNode(&theToken,0); CAttributeToken theAttr("xmlns","http://www.mozilla.org/viewsource"); theNode.AddAttribute(&theAttr); mSink->OpenContainer(theNode); } mIsText=((!aCommand.Equals(kViewSourceCommand)) || (aSourceType.Equals(kPlainTextContentType))); mLineNumber=0; result = mSink->WillBuildModel(); START_TIMER(); return result; } /** * The parser uses a code sandwich to wrap the parsing process. Before * the process begins, WillBuildModel() is called. Afterwards the parser * calls DidBuildModel(). * @update gess5/18/98 * @param aFilename is the name of the file being parsed. * @return error code (almost always 0) */ NS_IMETHODIMP CViewSourceHTML::BuildModel(nsIParser* aParser,nsITokenizer* aTokenizer,nsITokenObserver* anObserver,nsIContentSink* aSink) { nsresult result=NS_OK; if(aTokenizer && aParser) { nsITokenizer* oldTokenizer=mTokenizer; mTokenizer=aTokenizer; gTokenRecycler=(CTokenRecycler*)mTokenizer->GetTokenRecycler(); if(gTokenRecycler) { while(NS_SUCCEEDED(result)){ CToken* theToken=mTokenizer->PopToken(); if(theToken) { result=HandleToken(theToken,aParser); if(NS_SUCCEEDED(result)) { gTokenRecycler->RecycleToken(theToken); } else if(NS_ERROR_HTMLPARSER_BLOCK!=result){ mTokenizer->PushTokenFront(theToken); } // theRootDTD->Verify(kEmptyString,aParser); } else break; }//while } mTokenizer=oldTokenizer; } else result=NS_ERROR_HTMLPARSER_BADTOKENIZER; return result; } /** * * @update gess5/18/98 * @param * @return */ NS_IMETHODIMP CViewSourceHTML::DidBuildModel(nsresult anErrorCode,PRBool aNotifySink,nsIParser* aParser,nsIContentSink* aSink){ nsresult result= NS_OK; //ADD CODE HERE TO CLOSE OPEN CONTAINERS... 
if(aParser){ mParser=(nsParser*)aParser; //debug XXX STOP_TIMER(); mSink=(nsIXMLContentSink*)aParser->GetContentSink(); if((aNotifySink) && (mSink)) { //now let's automatically auto-opened containers... #ifdef rickgdebug if(gDumpFile){ (*gDumpFile) << "" << endl; gDumpFile->close(); delete gDumpFile; } #endif if(!mIsText) { //now let's automatically close the root container... CToken theToken("viewsource"); nsCParserNode theNode(&theToken,0); mSink->CloseContainer(theNode); } result = mSink->DidBuildModel(1); } START_TIMER(); } #ifdef RAPTOR_PERF_METRICS NS_STOP_STOPWATCH(vsTimer); printf("viewsource timer: "); vsTimer.Print(); printf("\n"); #endif return result; } /** * * @update gess8/4/98 * @param * @return */ nsITokenRecycler* CViewSourceHTML::GetTokenRecycler(void){ nsITokenizer* theTokenizer=0; nsresult result=GetTokenizer(theTokenizer); if (NS_SUCCEEDED(result)) { return theTokenizer->GetTokenRecycler(); } return 0; } /** * Use this id you want to stop the building content model * --------------[ Sets DTD to STOP mode ]---------------- * It's recommended to use this method in accordance with * the parser's terminate() method. * * @update harishd 07/22/99 * @param * @return */ nsresult CViewSourceHTML::Terminate(void) { return NS_ERROR_HTMLPARSER_STOPPARSING; } /** * Retrieve the preferred tokenizer for use by this DTD. 
* @update gess12/28/98 * @param none * @return ptr to tokenizer */ nsresult CViewSourceHTML::GetTokenizer(nsITokenizer*& aTokenizer) { nsresult result=NS_OK; if(!mTokenizer) { result=NS_NewHTMLTokenizer(&mTokenizer,eParseMode_quirks,mIsText); } aTokenizer=mTokenizer; return result; } /** * * @update gess5/18/98 * @param * @return */ NS_IMETHODIMP CViewSourceHTML::WillResumeParse(void){ nsresult result = NS_OK; if(mSink) { result = mSink->WillResume(); } return result; } /** * * @update gess5/18/98 * @param * @return */ NS_IMETHODIMP CViewSourceHTML::WillInterruptParse(void){ nsresult result = NS_OK; if(mSink) { result = mSink->WillInterrupt(); } return result; } /** * Called by the parser to initiate dtd verification of the * internal context stack. * @update gess 7/23/98 * @param * @return */ PRBool CViewSourceHTML::Verify(nsString& aURLRef,nsIParser* aParser) { PRBool result=PR_TRUE; mParser=(nsParser*)aParser; return result; } /** * Called by the parser to enable/disable dtd verification of the * internal context stack. * @update gess 7/23/98 * @param * @return */ void CViewSourceHTML::SetVerification(PRBool aEnabled){ } /** * This method is called to determine whether or not a tag * of one type can contain a tag of another type. * * @update gess 3/25/98 * @param aParent -- int tag of parent container * @param aChild -- int tag of child container * @return PR_TRUE if parent can contain child */ PRBool CViewSourceHTML::CanContain(PRInt32 aParent,PRInt32 aChild) const{ PRBool result=PR_TRUE; return result; } /** * Give rest of world access to our tag enums, so that CanContain(), etc, * become useful. 
*/
// Not implemented by this DTD: always returns NS_ERROR_NOT_IMPLEMENTED.
NS_IMETHODIMP CViewSourceHTML::StringTagToIntTag(nsString &aTag, PRInt32* aIntTag) const {
  return NS_ERROR_NOT_IMPLEMENTED;
}

// Not implemented by this DTD: always returns NS_ERROR_NOT_IMPLEMENTED.
NS_IMETHODIMP CViewSourceHTML::IntTagToStringTag(PRInt32 aIntTag, nsString& aTag) const {
  return NS_ERROR_NOT_IMPLEMENTED;
}

// Not implemented by this DTD: always returns NS_ERROR_NOT_IMPLEMENTED.
NS_IMETHODIMP CViewSourceHTML::ConvertEntityToUnicode(const nsString& aEntity, PRInt32* aUnicode) const {
  return NS_ERROR_NOT_IMPLEMENTED;
}

/**
 *  This method gets called to determine whether a given
 *  tag is itself a container
 *
 *  @update  gess 3/25/98
 *  @param   aTag -- tag to test for containership (ignored)
 *  @return  always PR_TRUE in this DTD
 */
PRBool CViewSourceHTML::IsContainer(PRInt32 aTag) const{
  PRBool result=PR_TRUE;
  return result;
}

/**
 *  This method gets called when a tag needs to be sent out
 *
 *  NOTE(review): this copy of the file is damaged from the while() below
 *  onwards. The remainder of WriteText() and the opening of the following
 *  function (the one that peeks attribute tokens from mTokenizer --
 *  presumably WriteAttributes(), which WriteTag() calls) are missing. The
 *  damaged text is reproduced exactly as found; restore it from the
 *  upstream source before building.
 *
 *  @update  gess 3/25/98
 *  @param
 *  @return  result status
 */
nsresult WriteText(const nsString& aTextString,nsIContentSink& aSink,PRBool aPreserveSpace,PRBool aPlainText,CSharedVSContext& aContext) {
  nsresult result=NS_OK;

  // The shared text token's string is emptied before use.
  nsString& temp=aContext.mTextToken.GetStringValueXXX();
  temp.Truncate();

  PRInt32 theEnd=aTextString.Length();
  PRInt32 theTextOffset=0;
  PRInt32 theOffset=-1; //aTextString.FindCharInSet("\t\n\r ",theStartOffset);
  PRInt32 theSpaces=0;
  PRUnichar theChar=0;
  PRUnichar theNextChar=0;

  // NOTE(review): damaged span starts here (see the comment above).
  while(++theOffsetPeekToken();
      if(theToken) {
        eHTMLTokenTypes theType=eHTMLTokenTypes(theToken->GetTokenType());
        if(eToken_attribute==theType){
          mTokenizer->PopToken(); //pop it for real...
          theContext.mTokenNode.AddAttribute(theToken); //and add it to the node.

          // The attribute's key is emitted as its own "key" element.
          CAttributeToken* theAttrToken=(CAttributeToken*)theToken;
          CToken theKeyToken(theAttrToken->GetKey());
          result=WriteTag(mKey,&theKeyToken,0,PR_FALSE);
          nsString& theValue=theToken->GetStringValueXXX();
          // NOTE(review): the condition below is damaged in this copy of the
          // file; reproduced as found.
          if((0mHasEqualWithoutValue)){
            result=WriteTag(mValue,theToken,0,PR_FALSE);
          }
        }
      }
      else return kEOF;
    }
  }
  return result;
}

/**
 *  This method gets called when a tag needs to be sent out
 *
 *  Opens a container named theXMLTagName on the sink, adds the string
 *  value of aToken as a leaf (through the shared indirect text node),
 *  writes attrCount attributes if any, then closes the container.
 *  mSink is used without a null check.
 *
 *  @update  gess 3/25/98
 *  @param   theXMLTagName -- name of the wrapping element
 *  @param   aToken -- token whose string value is emitted
 *  @param   attrCount -- number of attributes to write; 0 for none
 *  @param   aNewlineRequired -- only referenced by the rickgdebug dump code
 *  @return  result of WriteAttributes() when attrCount is non-zero,
 *           otherwise NS_OK
 */
nsresult CViewSourceHTML::WriteTag(nsString &theXMLTagName,CToken* aToken,PRInt32 attrCount,PRBool aNewlineRequired) {
  static nsString theString("");  // not referenced anywhere in this function

  nsresult result=NS_OK;

  CSharedVSContext& theContext=CSharedVSContext::GetSharedContext();

  CToken theTagToken(theXMLTagName);
  theContext.mStartNode.Init(&theTagToken,mLineNumber);

  STOP_TIMER();

  mSink->OpenContainer(theContext.mStartNode); //emit ...

  START_TIMER();

#ifdef rickgdebug
  // NOTE(review): the dump code below is damaged in this copy of the file
  // (part of the statement after "(*gDumpFile)<" is missing); reproduced
  // as found.
  if(aNewlineRequired) {
    (*gDumpFile)<"; cstr.Assign(aToken->GetStringValueXXX());
  if('<'==cstr.First()) {
    cstr.Cut(0,2);
    cstr.Truncate(cstr.Length()-1);
  }
  (*gDumpFile) << cstr;
#endif

  // The shared text token only points at the token's string; no copy is made.
  theContext.mITextToken.SetIndirectString(aToken->GetStringValueXXX()); //now emit the tag name...

  STOP_TIMER();

  mSink->AddLeaf(theContext.mITextNode);

  START_TIMER();

  if(attrCount){
    result=WriteAttributes(attrCount);
  }

  STOP_TIMER();

  theContext.mEndNode.Init(&theTagToken,mLineNumber);
  mSink->CloseContainer(theContext.mEndNode); //emit ...

  START_TIMER();

#ifdef rickgdebug
  cstr.Assign(theXMLTagName);
  (*gDumpFile) << "";
#endif

  return result;
}

/**
 *  This method gets called when a tag needs to be sent out
 *
 *  Same as the CToken* overload, except that the leaf text is taken
 *  directly from aText.
 *
 *  @update  gess 3/25/98
 *  @param   theXMLTagName -- name of the wrapping element
 *  @param   aText -- text to emit inside the element
 *  @param   attrCount -- number of attributes to write; 0 for none
 *  @param   aNewlineRequired -- only referenced by the rickgdebug dump code
 *  @return  result of WriteAttributes() when attrCount is non-zero,
 *           otherwise NS_OK
 */
nsresult CViewSourceHTML::WriteTag(nsString &theXMLTagName,nsString & aText,PRInt32 attrCount,PRBool aNewlineRequired) {
  static nsString theString("");  // not referenced anywhere in this function

  nsresult result=NS_OK;

  CSharedVSContext& theContext=CSharedVSContext::GetSharedContext();

  CToken theTagToken(theXMLTagName);
  theContext.mStartNode.Init(&theTagToken,mLineNumber);

  STOP_TIMER();

  mSink->OpenContainer(theContext.mStartNode); //emit ...

  START_TIMER();

#ifdef rickgdebug
  // NOTE(review): the dump code below is damaged in this copy of the file
  // (part of the statement after "(*gDumpFile)<" is missing); reproduced
  // as found.
  if(aNewlineRequired) {
    (*gDumpFile)<"; cstr.Assign(aText);
  (*gDumpFile) << cstr;
#endif

  // The shared text token only points at aText; no copy is made.
  theContext.mITextToken.SetIndirectString(aText); //now emit the tag name...

  STOP_TIMER();

  mSink->AddLeaf(theContext.mITextNode);

  START_TIMER();

  if(attrCount){
    result=WriteAttributes(attrCount);
  }

  theContext.mEndNode.Init(&theTagToken,mLineNumber);

  STOP_TIMER();

  mSink->CloseContainer(theContext.mEndNode); //emit ...
START_TIMER(); #ifdef rickgdebug cstr.Assign(theXMLTagName); (*gDumpFile) << ""; #endif return result; } /** * * @update gess 3/25/98 * @param aToken -- token object to be put into content model * @return 0 if all is well; non-zero is an error */ NS_IMETHODIMP CViewSourceHTML::HandleToken(CToken* aToken,nsIParser* aParser) { nsresult result=NS_OK; CHTMLToken* theToken= (CHTMLToken*)(aToken); eHTMLTokenTypes theType= (eHTMLTokenTypes)theToken->GetTokenType(); mParser=(nsParser*)aParser; mSink=(nsIXMLContentSink*)aParser->GetContentSink(); CSharedVSContext& theContext=CSharedVSContext::GetSharedContext(); theContext.mTokenNode.Init(theToken,mLineNumber); switch(theType) { case eToken_start: result=WriteTag(mStartTag,aToken,aToken->GetAttributeCount(),PR_TRUE); if((!mIsText) && mParser && (NS_OK==result)) { CObserverService* theService=mParser->GetObserverService(); if(theService) { CParserContext* pc=mParser->PeekContext(); void* theDocID=(pc)? pc->mKey:0; eHTMLTags theTag=(eHTMLTags)theToken->GetTypeID(); result=theService->Notify(theTag,theContext.mTokenNode,(PRUint32)theDocID,kViewSourceCommand,mParser); } } theContext.mTokenNode.Init(0,0,gTokenRecycler); //now recycle. 
break; case eToken_end: result=WriteTag(mEndTag,aToken,0,PR_TRUE); break; case eToken_cdatasection: { nsString& theStr=aToken->GetStringValueXXX(); theStr.Insert(""); result=WriteTag(mCDATATag,aToken,0,PR_TRUE); } break; case eToken_comment: result=WriteTag(mCommentTag,aToken,0,PR_TRUE); break; case eToken_doctypeDecl: result=WriteTag(mDocTypeTag,aToken,0,PR_TRUE); break; case eToken_newline: mLineNumber++; case eToken_whitespace: case eToken_text: result=WriteTag(mText,aToken,0,PR_FALSE); break; case eToken_entity: { nsAutoString theStr; nsString& theEntity=aToken->GetStringValueXXX(); if(!theEntity.EqualsIgnoreCase("XI",2)) { PRUnichar theChar=theEntity.CharAt(0); if((nsString::IsDigit(theChar)) || ('X'==theChar) || ('x'==theChar)){ theStr.Append("#"); } theStr.Append(theEntity); } result=WriteTag(mEntityTag,theStr,0,PR_FALSE); } break; case eToken_instruction: result=WriteTag(mPITag,aToken,0,PR_TRUE); default: result=NS_OK; }//switch while(theContext.mTokenNode.PopAttributeToken()){ //dump the attributes since they're on the stack... } return result; } /** * This method causes all tokens to be dispatched to the given tag handler. * * @update gess 3/25/98 * @param aHandler -- object to receive subsequent tokens... * @return error code (usually 0) */ nsresult CViewSourceHTML::CaptureTokenPump(nsITagHandler* aHandler) { nsresult result=NS_OK; return result; } /** * This method releases the token-pump capture obtained in CaptureTokenPump() * * @update gess 3/25/98 * @param aHandler -- object that received tokens... * @return error code (usually 0) */ nsresult CViewSourceHTML::ReleaseTokenPump(nsITagHandler* aHandler){ nsresult result=NS_OK; return result; }