1998-04-13 20:24:54 +00:00
|
|
|
/* -*- Mode: C++; tab-width: 2; indent-tabs-mode: nil; c-basic-offset: 2 -*- */
|
|
|
|
/*
|
|
|
|
* The contents of this file are subject to the Netscape Public License
|
|
|
|
* Version 1.0 (the "NPL"); you may not use this file except in
|
|
|
|
* compliance with the NPL. You may obtain a copy of the NPL at
|
|
|
|
* http://www.mozilla.org/NPL/
|
|
|
|
*
|
|
|
|
* Software distributed under the NPL is distributed on an "AS IS" basis,
|
|
|
|
* WITHOUT WARRANTY OF ANY KIND, either express or implied. See the NPL
|
|
|
|
* for the specific language governing rights and limitations under the
|
|
|
|
* NPL.
|
|
|
|
*
|
|
|
|
* The Initial Developer of this code under the NPL is Netscape
|
|
|
|
* Communications Corporation. Portions created by Netscape are
|
|
|
|
* Copyright (C) 1998 Netscape Communications Corporation. All Rights
|
|
|
|
* Reserved.
|
|
|
|
*/
|
|
|
|
#include "nsIRobotSink.h"
|
|
|
|
#include "nsIRobotSinkObserver.h"
|
|
|
|
#include "nsIParserNode.h"
|
1999-01-09 01:19:49 +00:00
|
|
|
#include "nsIParser.h"
|
1998-04-13 20:24:54 +00:00
|
|
|
#include "nsString.h"
|
|
|
|
#include "nsIURL.h"
|
|
|
|
#include "nsCRT.h"
|
|
|
|
#include "nsVoidArray.h"
|
|
|
|
class nsIDocument;
|
|
|
|
|
|
|
|
// TODO
|
|
|
|
// - add in base tag support
|
|
|
|
// - get links from other sources:
|
|
|
|
// - LINK tag
|
|
|
|
// - STYLE SRC
|
|
|
|
// - IMG SRC
|
|
|
|
// - LAYER SRC
|
|
|
|
|
|
|
|
static NS_DEFINE_IID(kISupportsIID, NS_ISUPPORTS_IID);
|
1998-07-15 22:30:39 +00:00
|
|
|
static NS_DEFINE_IID(kIHTMLContentSinkIID, NS_IHTML_CONTENT_SINK_IID);
|
1998-04-13 20:24:54 +00:00
|
|
|
static NS_DEFINE_IID(kIRobotSinkIID, NS_IROBOTSINK_IID);
|
|
|
|
|
|
|
|
class RobotSink : public nsIRobotSink {
|
|
|
|
public:
|
|
|
|
RobotSink();
|
|
|
|
~RobotSink();
|
|
|
|
|
|
|
|
void* operator new(size_t size) {
|
|
|
|
void* rv = ::operator new(size);
|
|
|
|
nsCRT::zero(rv, size);
|
|
|
|
return (void*) rv;
|
|
|
|
}
|
|
|
|
|
|
|
|
// nsISupports
|
|
|
|
NS_DECL_ISUPPORTS
|
|
|
|
|
|
|
|
// nsIHTMLContentSink
|
1998-07-15 22:30:39 +00:00
|
|
|
NS_IMETHOD SetTitle(const nsString& aValue);
|
|
|
|
NS_IMETHOD OpenHTML(const nsIParserNode& aNode);
|
|
|
|
NS_IMETHOD CloseHTML(const nsIParserNode& aNode);
|
|
|
|
NS_IMETHOD OpenHead(const nsIParserNode& aNode);
|
|
|
|
NS_IMETHOD CloseHead(const nsIParserNode& aNode);
|
|
|
|
NS_IMETHOD OpenBody(const nsIParserNode& aNode);
|
|
|
|
NS_IMETHOD CloseBody(const nsIParserNode& aNode);
|
|
|
|
NS_IMETHOD OpenForm(const nsIParserNode& aNode);
|
|
|
|
NS_IMETHOD CloseForm(const nsIParserNode& aNode);
|
|
|
|
NS_IMETHOD OpenMap(const nsIParserNode& aNode);
|
|
|
|
NS_IMETHOD CloseMap(const nsIParserNode& aNode);
|
|
|
|
NS_IMETHOD OpenFrameset(const nsIParserNode& aNode);
|
|
|
|
NS_IMETHOD CloseFrameset(const nsIParserNode& aNode);
|
|
|
|
NS_IMETHOD OpenContainer(const nsIParserNode& aNode);
|
|
|
|
NS_IMETHOD CloseContainer(const nsIParserNode& aNode);
|
1998-11-11 22:04:42 +00:00
|
|
|
NS_IMETHOD NotifyError(nsresult aErrorResult);
|
1998-07-15 22:30:39 +00:00
|
|
|
NS_IMETHOD CloseTopmostContainer();
|
|
|
|
NS_IMETHOD AddLeaf(const nsIParserNode& aNode);
|
1998-11-10 04:20:40 +00:00
|
|
|
NS_IMETHOD AddComment(const nsIParserNode& aNode);
|
|
|
|
NS_IMETHOD AddProcessingInstruction(const nsIParserNode& aNode);
|
1998-07-15 22:30:39 +00:00
|
|
|
NS_IMETHOD WillBuildModel(void) { return NS_OK; }
|
|
|
|
NS_IMETHOD DidBuildModel(PRInt32 aQualityLevel) { return NS_OK; }
|
|
|
|
NS_IMETHOD WillInterrupt(void) { return NS_OK; }
|
|
|
|
NS_IMETHOD WillResume(void) { return NS_OK; }
|
1998-12-11 17:02:37 +00:00
|
|
|
NS_IMETHOD SetParser(nsIParser* aParser) { return NS_OK; }
|
1998-04-13 20:24:54 +00:00
|
|
|
|
|
|
|
// nsIRobotSink
|
|
|
|
NS_IMETHOD Init(nsIURL* aDocumentURL);
|
|
|
|
NS_IMETHOD AddObserver(nsIRobotSinkObserver* aObserver);
|
|
|
|
NS_IMETHOD RemoveObserver(nsIRobotSinkObserver* aObserver);
|
|
|
|
|
|
|
|
void ProcessLink(const nsString& aLink);
|
|
|
|
|
|
|
|
protected:
|
|
|
|
nsIURL* mDocumentURL;
|
|
|
|
nsVoidArray mObservers;
|
|
|
|
};
|
|
|
|
|
|
|
|
/**
 * Creates a new RobotSink and returns its nsIRobotSink interface.
 *
 * @param aInstancePtrResult receives the new sink (already AddRef'd by
 *        QueryInterface) on success
 * @return NS_ERROR_NULL_POINTER if aInstancePtrResult is null,
 *         NS_ERROR_OUT_OF_MEMORY if the sink could not be allocated,
 *         otherwise the result of QueryInterface
 */
nsresult NS_NewRobotSink(nsIRobotSink** aInstancePtrResult)
{
  if (nsnull == aInstancePtrResult) {
    return NS_ERROR_NULL_POINTER;
  }

  RobotSink* it = new RobotSink();
  // Do not call through a null pointer when the allocation failed.
  if (nsnull == it) {
    return NS_ERROR_OUT_OF_MEMORY;
  }
  return it->QueryInterface(kIRobotSinkIID, (void**) aInstancePtrResult);
}
|
|
|
|
|
|
|
|
/**
 * Performs no explicit initialisation. Instances created through
 * RobotSink::operator new live in zero-filled storage, and mObservers is
 * default-constructed.
 */
RobotSink::RobotSink() {
}
|
|
|
|
|
|
|
|
/**
 * Drops the reference on the document URL (if any) and then the
 * reference held on each registered observer, in registration order.
 */
RobotSink::~RobotSink() {
  NS_IF_RELEASE(mDocumentURL);

  PRInt32 count = mObservers.Count();
  PRInt32 index = 0;
  while (index < count) {
    nsIRobotSinkObserver* observer =
      (nsIRobotSinkObserver*) mObservers.ElementAt(index);
    NS_RELEASE(observer);
    ++index;
  }
}
|
|
|
|
|
|
|
|
// Reference-counting implementation for RobotSink (AddRef / Release),
// supplied by the nsISupports helper macros.
NS_IMPL_ADDREF(RobotSink)
NS_IMPL_RELEASE(RobotSink)
|
|
|
|
|
|
|
|
/**
 * Returns an AddRef'd pointer to this object for the interfaces it
 * supports: nsIRobotSink, nsIHTMLContentSink and nsISupports.
 *
 * @param aIID the interface being requested
 * @param aInstancePtr receives the interface pointer; set to null when
 *        the interface is not supported
 * @return NS_OK on success, NS_ERROR_NULL_POINTER if aInstancePtr is
 *         null, NS_NOINTERFACE for any other interface ID
 */
NS_IMETHODIMP RobotSink::QueryInterface(REFNSIID aIID, void** aInstancePtr)
{
  if (NULL == aInstancePtr) {
    return NS_ERROR_NULL_POINTER;
  }

  if (aIID.Equals(kIRobotSinkIID) || aIID.Equals(kIHTMLContentSinkIID)) {
    *aInstancePtr = (void*) this;
    AddRef();
    return NS_OK;
  }
  if (aIID.Equals(kISupportsIID)) {
    *aInstancePtr = (void*) ((nsISupports*)this);
    AddRef();
    return NS_OK;
  }

  // Never leave the caller's pointer holding a stale or garbage value.
  *aInstancePtr = nsnull;
  return NS_NOINTERFACE;
}
|
|
|
|
|
1998-07-15 22:30:39 +00:00
|
|
|
/** Document title notification: ignored, always returns NS_OK. */
NS_IMETHODIMP RobotSink::SetTitle(const nsString& aValue) {
  return NS_OK;
}
|
|
|
|
|
1998-07-15 22:30:39 +00:00
|
|
|
/** HTML element opened: ignored, always returns NS_OK. */
NS_IMETHODIMP RobotSink::OpenHTML(const nsIParserNode& aNode) {
  return NS_OK;
}
|
|
|
|
|
1998-07-15 22:30:39 +00:00
|
|
|
/** HTML element closed: ignored, always returns NS_OK. */
NS_IMETHODIMP RobotSink::CloseHTML(const nsIParserNode& aNode) {
  return NS_OK;
}
|
|
|
|
|
1998-07-15 22:30:39 +00:00
|
|
|
/** HEAD element opened: ignored, always returns NS_OK. */
NS_IMETHODIMP RobotSink::OpenHead(const nsIParserNode& aNode) {
  return NS_OK;
}
|
|
|
|
|
1998-07-15 22:30:39 +00:00
|
|
|
/** HEAD element closed: ignored, always returns NS_OK. */
NS_IMETHODIMP RobotSink::CloseHead(const nsIParserNode& aNode) {
  return NS_OK;
}
|
|
|
|
|
1998-07-15 22:30:39 +00:00
|
|
|
/** BODY element opened: ignored, always returns NS_OK. */
NS_IMETHODIMP RobotSink::OpenBody(const nsIParserNode& aNode) {
  return NS_OK;
}
|
|
|
|
|
1998-07-15 22:30:39 +00:00
|
|
|
/** BODY element closed: ignored, always returns NS_OK. */
NS_IMETHODIMP RobotSink::CloseBody(const nsIParserNode& aNode) {
  return NS_OK;
}
|
|
|
|
|
1998-07-15 22:30:39 +00:00
|
|
|
/** FORM element opened: ignored, always returns NS_OK. */
NS_IMETHODIMP RobotSink::OpenForm(const nsIParserNode& aNode) {
  return NS_OK;
}
|
|
|
|
|
1998-07-15 22:30:39 +00:00
|
|
|
/** FORM element closed: ignored, always returns NS_OK. */
NS_IMETHODIMP RobotSink::CloseForm(const nsIParserNode& aNode) {
  return NS_OK;
}
|
|
|
|
|
1998-07-15 22:30:39 +00:00
|
|
|
/** MAP element opened: ignored, always returns NS_OK. */
NS_IMETHODIMP RobotSink::OpenMap(const nsIParserNode& aNode) {
  return NS_OK;
}
|
|
|
|
|
1998-07-15 22:30:39 +00:00
|
|
|
/** MAP element closed: ignored, always returns NS_OK. */
NS_IMETHODIMP RobotSink::CloseMap(const nsIParserNode& aNode) {
  return NS_OK;
}
|
|
|
|
|
|
|
|
/** FRAMESET element opened: ignored, always returns NS_OK. */
NS_IMETHODIMP RobotSink::OpenFrameset(const nsIParserNode& aNode) {
  return NS_OK;
}
|
|
|
|
|
|
|
|
/** FRAMESET element closed: ignored, always returns NS_OK. */
NS_IMETHODIMP RobotSink::CloseFrameset(const nsIParserNode& aNode) {
  return NS_OK;
}
|
|
|
|
|
|
|
|
/**
 * Called when the parser opens a container element. For anchor ("a")
 * tags, every HREF attribute value is stripped of one pair of matching
 * surrounding quotes and passed to ProcessLink. All other tags are
 * ignored.
 *
 * @param aNode the parser node describing the opened tag
 * @return NS_OK always
 */
NS_IMETHODIMP RobotSink::OpenContainer(const nsIParserNode& aNode)
{
  // Tag and attribute names are compared in lower case.
  nsAutoString tmp(aNode.GetText());
  tmp.ToLowerCase();
  if (!tmp.Equals("a")) {
    return NS_OK;
  }

  nsAutoString k, v;
  PRInt32 ac = aNode.GetAttributeCount();
  for (PRInt32 i = 0; i < ac; i++) {
    // Get lower-cased key
    const nsString& key = aNode.GetKeyAt(i);
    k.Truncate();
    k.Append(key);
    k.ToLowerCase();
    if (!k.Equals("href")) {
      continue;
    }

    // Get value and remove mandatory quotes
    v.Truncate();
    v.Append(aNode.GetValueAt(i));

    // Only look at the first/last character when there is one; an empty
    // value is passed through unchanged.
    if (v.Length() > 0) {
      PRUnichar first = v.First();
      if (((first == '"') || (first == '\'')) && (v.Last() == first)) {
        v.Cut(0, 1);
        // The value may have been a single quote character, in which
        // case nothing is left to trim from the end.
        PRInt32 pos = v.Length() - 1;
        if (pos >= 0) {
          v.Cut(pos, 1);
        }
      }
      // Mismatched quotes - leave them in
    }
    ProcessLink(v);
  }
  return NS_OK;
}
|
|
|
|
|
1998-07-15 22:30:39 +00:00
|
|
|
/** Container element closed: ignored, always returns NS_OK. */
NS_IMETHODIMP RobotSink::CloseContainer(const nsIParserNode& aNode) {
  return NS_OK;
}
|
|
|
|
|
1998-07-15 22:30:39 +00:00
|
|
|
/** Topmost container closed: ignored, always returns NS_OK. */
NS_IMETHODIMP RobotSink::CloseTopmostContainer() {
  return NS_OK;
}
|
|
|
|
|
1998-07-15 22:30:39 +00:00
|
|
|
/** Leaf node added: ignored, always returns NS_OK. */
NS_IMETHODIMP RobotSink::AddLeaf(const nsIParserNode& aNode) {
  return NS_OK;
}
|
|
|
|
|
1998-11-11 22:04:42 +00:00
|
|
|
/** Parser error notification: ignored, always returns NS_OK. */
NS_IMETHODIMP RobotSink::NotifyError(nsresult aErrorResult) {
  return NS_OK;
}
|
|
|
|
|
1998-11-10 04:20:40 +00:00
|
|
|
/**
|
|
|
|
* This gets called by the parsing system when we find a comment
|
|
|
|
* @update gess11/9/98
|
|
|
|
* @param aNode contains a comment token
|
|
|
|
* @return error code
|
|
|
|
*/
|
|
|
|
NS_IMETHODIMP RobotSink::AddComment(const nsIParserNode& aNode) {
|
|
|
|
nsresult result= NS_OK;
|
|
|
|
return result;
|
|
|
|
}
|
|
|
|
|
|
|
|
/**
|
|
|
|
* This gets called by the parsing system when we find a PI
|
|
|
|
* @update gess11/9/98
|
|
|
|
* @param aNode contains a comment token
|
|
|
|
* @return error code
|
|
|
|
*/
|
|
|
|
NS_IMETHODIMP RobotSink::AddProcessingInstruction(const nsIParserNode& aNode) {
|
|
|
|
nsresult result= NS_OK;
|
|
|
|
return result;
|
|
|
|
}
|
|
|
|
|
1998-04-13 20:24:54 +00:00
|
|
|
/**
 * Sets the URL of the document being parsed; ProcessLink resolves links
 * against it. Any previously held URL is released.
 *
 * @param aDocumentURL the document URL; may be null, in which case
 *        links are passed to observers unresolved
 * @return NS_OK always
 */
NS_IMETHODIMP RobotSink::Init(nsIURL* aDocumentURL)
{
  // Take the new reference before dropping the old one: if the caller
  // passes the URL we already hold, releasing first could destroy it
  // before it is AddRef'd again.
  NS_IF_ADDREF(aDocumentURL);
  NS_IF_RELEASE(mDocumentURL);
  mDocumentURL = aDocumentURL;
  return NS_OK;
}
|
|
|
|
|
|
|
|
/**
 * Registers an observer to be told about every link found. The sink
 * holds one reference on the observer for each successful registration.
 *
 * @param aObserver the observer to add; must not be null
 * @return NS_OK on success, NS_ERROR_NULL_POINTER if aObserver is null,
 *         NS_ERROR_OUT_OF_MEMORY if it could not be appended to the list
 */
NS_IMETHODIMP RobotSink::AddObserver(nsIRobotSinkObserver* aObserver)
{
  // A null entry would be AddRef'd here and later called and released
  // through a null pointer.
  if (nsnull == aObserver) {
    return NS_ERROR_NULL_POINTER;
  }
  if (mObservers.AppendElement(aObserver)) {
    NS_ADDREF(aObserver);
    return NS_OK;
  }
  return NS_ERROR_OUT_OF_MEMORY;
}
|
|
|
|
|
|
|
|
/**
 * Unregisters an observer. When the observer was in the list, the
 * reference held on it is released. Removing an observer that is not
 * registered is currently not reported as an error.
 *
 * @param aObserver the observer to remove
 * @return NS_OK always
 */
NS_IMETHODIMP RobotSink::RemoveObserver(nsIRobotSinkObserver* aObserver) {
  if (!mObservers.RemoveElement(aObserver)) {
    //XXX return NS_ERROR_NOT_FOUND;
    return NS_OK;
  }
  NS_RELEASE(aObserver);
  return NS_OK;
}
|
|
|
|
|
|
|
|
void RobotSink::ProcessLink(const nsString& aLink)
|
|
|
|
{
|
|
|
|
nsAutoString absURLSpec(aLink);
|
|
|
|
|
|
|
|
// Make link absolute
|
|
|
|
// XXX base tag handling
|
|
|
|
nsIURL* docURL = mDocumentURL;
|
|
|
|
if (nsnull != docURL) {
|
|
|
|
nsIURL* absurl;
|
1998-12-16 05:40:20 +00:00
|
|
|
nsresult rv = NS_NewURL(&absurl, aLink, docURL);
|
1998-04-13 20:24:54 +00:00
|
|
|
if (NS_OK == rv) {
|
|
|
|
absURLSpec.Truncate();
|
1998-12-16 05:40:20 +00:00
|
|
|
PRUnichar* str;
|
|
|
|
absurl->ToString(&str);
|
|
|
|
absURLSpec = str;
|
1998-04-13 20:24:54 +00:00
|
|
|
NS_RELEASE(absurl);
|
1998-12-16 05:40:20 +00:00
|
|
|
delete str;
|
1998-04-13 20:24:54 +00:00
|
|
|
}
|
|
|
|
}
|
|
|
|
|
|
|
|
// Now give link to robot observers
|
|
|
|
PRInt32 i, n = mObservers.Count();
|
|
|
|
for (i = 0; i < n; i++) {
|
|
|
|
nsIRobotSinkObserver* cop = (nsIRobotSinkObserver*)mObservers.ElementAt(i);
|
|
|
|
cop->ProcessLink(absURLSpec);
|
|
|
|
}
|
|
|
|
}
|
1998-05-28 00:21:34 +00:00
|
|
|
|