Files
tubestation/htmlparser/tests/grabpage/grabpage.cpp
dougt@netscape.com a70fce6f87 Revising nsIChannel to allow for overlapped i/o. This consists of three parts:
1. Factoring nsIChannel into a protocol-specific part, the nsIChannel, and a socket-specific part, the nsITransport.
2. Derive the nsIChannel from a nsIRequest.
3. Changes the notification system from necko and the URILoader to pass the nsIRequest interface instead of the nsIChannel interface.

This goal stems from wanting to be able to have active AsyncRead and AsyncWrite operations on nsSocketTransport.
This is desired because it would greatly simplify the task of maintaining persistent/reusable socket connections
for FTP, HTTP, and Imap (and potentially other protocols).  The problem with the existing nsIChannel interface is
that it does not allow one to selectively suspend just one of the read or write operations while keeping the other active.

The full details of the change are written up in the netlib newsgroup.

r=darin@netscape.com
sr=rpotts@netscape.com
2001-02-10 00:16:26 +00:00

286 lines
6.1 KiB
C++

/* -*- Mode: C++; tab-width: 2; indent-tabs-mode: nil; c-basic-offset: 2 -*-
*
* The contents of this file are subject to the Netscape Public
* License Version 1.1 (the "License"); you may not use this file
* except in compliance with the License. You may obtain a copy of
* the License at http://www.mozilla.org/NPL/
*
* Software distributed under the License is distributed on an "AS
* IS" basis, WITHOUT WARRANTY OF ANY KIND, either express or
* implied. See the License for the specific language governing
* rights and limitations under the License.
*
* The Original Code is Mozilla Communicator client code.
*
* The Initial Developer of the Original Code is Netscape Communications
* Corporation. Portions created by Netscape are
* Copyright (C) 1998 Netscape Communications Corporation. All
* Rights Reserved.
*
* Contributor(s):
*/
#include "nsIStreamListener.h"
#include "nsIInputStream.h"
#include "nsIURL.h"
#include "nsIIOService.h"
#include "nsIChannel.h"
// Class ID constant used by PageGrabber::Grab to look up the I/O service.
static NS_DEFINE_CID(kIOServiceCID, NS_IOSERVICE_CID);
#include "nsString.h"
#include "nsCRT.h"
#include "prprf.h"
#ifdef XP_PC
#include <windows.h>
#include <sys/types.h>
#include <sys/stat.h>
#endif
#ifdef XP_UNIX
#include <sys/types.h>
#include <sys/stat.h>
#endif
// Interface ID constant passed to NS_IMPL_ISUPPORTS for StreamToFile.
NS_DEFINE_IID(kIStreamListenerIID, NS_ISTREAMLISTENER_IID);
// Stream listener that copies the data it is handed into a C stdio FILE
// and records completion / error state so a caller can poll for the end
// of the load. The FILE given to the constructor is closed by the
// destructor.
class StreamToFile : public nsIStreamListener {
public:
// fp is the destination stream; it may be null, in which case incoming
// data is read and discarded.
StreamToFile(FILE* fp);
NS_DECL_ISUPPORTS
// Notification callbacks. Only OnDataAvailable and OnStopRequest do any
// work in this class; the remaining ones return 0 without acting.
NS_IMETHOD GetBindInfo(nsIURI* aURL);
NS_IMETHOD OnProgress(nsIURI* aURL, PRInt32 Progress, PRInt32 ProgressMax);
NS_IMETHOD OnStatus(nsIURI* aURL, const nsString& aMsg);
NS_IMETHOD OnStartRequest(nsIURI* aURL, const char *aContentType);
NS_IMETHOD OnDataAvailable(nsIURI* aURL, nsIInputStream *pIStream, PRInt32 length);
NS_IMETHOD OnStopRequest(nsIURI* aURL, PRInt32 status, const nsString& aMsg);
// True once OnStopRequest has been called.
PRBool IsDone() const { return mDone; }
// True if an error was recorded during the load (OnStopRequest records
// one when it receives a non-zero status).
PRBool HaveError() const { return mError; }
protected:
// Protected destructor; closes mFile when it is non-null.
~StreamToFile();
PRBool mDone;   // load finished flag
PRBool mError;  // load failed flag
FILE* mFile;    // destination stream, may be null
};
// Creates a listener that writes into fp. The listener starts out as
// "not done, no error"; fp is remembered as-is and may be null.
StreamToFile::StreamToFile(FILE* fp)
  : mDone(PR_FALSE),
    mError(PR_FALSE),
    mFile(fp)
{
  NS_INIT_REFCNT();
}
// Supplies the nsISupports implementation for StreamToFile, keyed on the
// stream-listener interface ID defined above.
NS_IMPL_ISUPPORTS(StreamToFile,kIStreamListenerIID)
// Closes the destination stream, if one was supplied.
StreamToFile::~StreamToFile()
{
  if (nsnull == mFile) {
    return;
  }
  fclose(mFile);
}
// No-op callback: ignores aURL and reports success.
NS_IMETHODIMP
StreamToFile::GetBindInfo(nsIURI* aURL)
{
  return NS_OK;
}
// No-op callback: progress figures are ignored and success is reported.
NS_IMETHODIMP
StreamToFile::OnProgress(nsIURI* aURL, PRInt32 Progress, PRInt32 ProgressMax)
{
  return NS_OK;
}
// No-op callback: the status message is ignored and success is reported.
NS_IMETHODIMP
StreamToFile::OnStatus(nsIURI* aURL, const nsString& aMsg)
{
  return NS_OK;
}
// No-op callback: the content type is ignored and success is reported.
NS_IMETHODIMP
StreamToFile::OnStartRequest(nsIURI* aURL, const char *aContentType)
{
  return NS_OK;
}
// Drains pIStream and appends everything read to mFile.
//
// Data is pulled in chunks of up to 4000 bytes until a read reports zero
// bytes. When mFile is null the data is still consumed but discarded.
//
// Returns NS_OK once the stream is drained. If a read fails, its error
// code is returned; if the file write comes up short, NS_ERROR_FAILURE is
// returned. In both failure cases mError is set so HaveError() reports it.
//
// aURL and length are not used.
NS_IMETHODIMP
StreamToFile::OnDataAvailable(nsIURI* aURL, nsIInputStream *pIStream,
                              PRInt32 length)
{
  char buffer[4000];
  PRUint32 len = 0;
  do {
    // Reset each round so a Read() that fails without touching the
    // out-parameter can never leave a stale or uninitialized count behind.
    len = 0;
    nsresult err = pIStream->Read(buffer, 0, sizeof(buffer), &len);
    if (NS_FAILED(err)) {
      mError = PR_TRUE;
      return err;
    }
    if ((nsnull != mFile) && (len > 0)) {
      if (fwrite(buffer, 1, len, mFile) != len) {
        // Short write (disk full, I/O error, ...): stop instead of
        // silently producing a truncated file.
        mError = PR_TRUE;
        return NS_ERROR_FAILURE;
      }
    }
  } while (len > 0);
  return NS_OK;
}
// Marks the load as finished. A non-zero status additionally flags the
// load as failed; aURL and aMsg are ignored.
NS_IMETHODIMP
StreamToFile::OnStopRequest(nsIURI* aURL, PRInt32 status, const nsString& aMsg)
{
  const PRBool failed = (status != 0);
  if (failed) {
    mError = PR_TRUE;
  }
  mDone = PR_TRUE;
  return NS_OK;
}
//----------------------------------------------------------------------
// This could turn into a handy utility someday...
// Fetches a URL and stores its contents in a numbered file inside a
// target directory.
class PageGrabber {
public:
PageGrabber();
~PageGrabber();
// NOTE(review): the macro name suggests heap instances are zero-filled by
// a class-specific operator new; confirm before stack-allocating this class.
NS_DECL_AND_IMPL_ZEROING_OPERATOR_NEW
// Stores aDirectory as the output directory, adding a trailing '/' when
// it does not already end with one.
nsresult Init(const nsString& aDirectory);
// Loads aURL and writes it to the file named by NextFile("html").
nsresult Grab(const nsString& aURL);
protected:
// Returns a newly allocated path, inside mDirectory, of a file for which
// stat() fails; advances mFileNum as a side effect.
char* NextFile(const char* aExtension);
nsString mDirectory;  // output directory, ends with '/'
PRInt32 mFileNum;     // number used for the next candidate file name
};
// Creates a grabber whose file numbering starts at 0.
//
// mFileNum is initialized explicitly so the object is well-defined no
// matter how its storage was obtained, rather than depending on the
// allocator having cleared the memory beforehand.
PageGrabber::PageGrabber()
  : mFileNum(0)
{
}
// Nothing to tear down explicitly; members clean up after themselves.
PageGrabber::~PageGrabber() {}
// Records the output directory for later Grab() calls.
//
// aDirectory is copied into mDirectory; a '/' is appended unless the
// given string already ends in one. Always returns NS_OK.
nsresult
PageGrabber::Init(const nsString& aDirectory)
{
  const PRBool endsWithSlash = (aDirectory.Last() == '/');
  mDirectory = aDirectory;
  if (!endsWithSlash) {
    mDirectory.Append('/');
  }
  return NS_OK;
}
// Picks the path of the next output file.
//
// Candidate names have the form "<mDirectory>NNNNNNNN.<aExtension>", where
// NNNNNNNN is mFileNum zero-padded to eight digits. A candidate is
// accepted as soon as stat() fails on it; mFileNum is then advanced by one
// for the next call. If stat() succeeds, mFileNum is advanced by 100 and
// the search continues.
//
// Returns a new[]-allocated C string that the caller must release with
// delete [], or nsnull if the string could not be allocated.
//
// NOTE(review): any stat() failure is treated as "file does not exist",
// including failures such as permission errors.
char*
PageGrabber::NextFile(const char* aExtension)
{
  char* cname = nsnull;
  nsAutoString name;
  for (;;) {
    name.Truncate();
    name.Append(mDirectory);
    char fileName[20];
    PR_snprintf(fileName, sizeof(fileName), "%08d.%s", mFileNum, aExtension);
    name.Append(fileName);

    cname = name.ToNewCString();
    if (nsnull == cname) {
      // Allocation failed; never hand a null path to stat().
      break;
    }

    // See if the file already exists; if it does, advance mFileNum by 100
    // and try again.
    struct stat sb;
    if (stat(cname, &sb) < 0) {
      mFileNum++;
      break;
    }
    mFileNum += 100;
    delete [] cname;
    cname = nsnull;
  }
  return cname;
}
// Downloads aURL into the next free "NNNNNNNN.html" file of the output
// directory.
//
// Steps: choose the file name, open it for binary writing, obtain the I/O
// service, create a channel for aURL, and start an asynchronous load that
// feeds a StreamToFile listener. On XP_PC the Windows message queue is
// pumped until the listener reports completion.
//
// Returns NS_OK on success. Failures from the I/O service lookup,
// NewChannel or AsyncOpen are returned unchanged. For compatibility with
// existing callers, NS_ERROR_OUT_OF_MEMORY is still the code used when the
// output file cannot be opened or the listener reports an error, as well
// as for real allocation failures.
//
// Ownership: the path string is freed here; the FILE is closed here until
// it has been handed to the StreamToFile, whose destructor closes it
// afterwards.
nsresult
PageGrabber::Grab(const nsString& aURL)
{
  char* cname = NextFile("html");
  if (nsnull == cname) {
    return NS_ERROR_OUT_OF_MEMORY;
  }
  FILE* fp = fopen(cname, "wb");
  if (nsnull == fp) {
    delete [] cname;
    return NS_ERROR_OUT_OF_MEMORY;
  }
  printf("Copying ");
  fputs(aURL, stdout);
  printf(" to %s\n", cname);
  // The path is only needed for opening and reporting; release it now so
  // no later return path can leak it.
  delete [] cname;
  cname = nsnull;

  // NS_WITH_SERVICE declares ioService itself and reports through rv, so
  // it is used as a statement, not as the right-hand side of an assignment.
  nsresult rv;
  NS_WITH_SERVICE(nsIIOService, ioService, kIOServiceCID, &rv);
  if (NS_FAILED(rv)) {
    fclose(fp);
    return rv;
  }

  nsIChannel *channel = nsnull;
  // XXX NECKO what verb? what eventSinkGetter?
  rv = ioService->NewChannel("load", aURL, nsnull, nsnull, &channel);
  if (NS_FAILED(rv)) {
    fclose(fp);
    return rv;
  }

  // Start the URL load...
  StreamToFile* copier = new StreamToFile(fp);
  if (nsnull == copier) {
    fclose(fp);
    NS_IF_RELEASE(channel);
    return NS_ERROR_OUT_OF_MEMORY;
  }
  NS_ADDREF(copier);  // from here on the copier owns (and will close) fp

  rv = channel->AsyncOpen(copier, nsnull);
  if (NS_OK != rv) {
    NS_RELEASE(copier);
    NS_IF_RELEASE(channel);
    return rv;
  }

  // Enter the message pump to allow the URL load to proceed.
#ifdef XP_PC
  MSG msg;
  while ( !copier->IsDone() ) {
    if (PeekMessage(&msg, NULL, 0, 0, PM_REMOVE)) {
      TranslateMessage(&msg);
      DispatchMessage(&msg);
    }
  }
#endif

  PRBool error = copier->HaveError();
  NS_RELEASE(copier);
  NS_IF_RELEASE(channel);
  return error ? NS_ERROR_OUT_OF_MEMORY : NS_OK;
}
//----------------------------------------------------------------------
int
main(int argc, char **argv)
{
nsString url_address;
if (argc != 3) {
fprintf(stderr, "Usage: grabpage url directory\n");
return -1;
}
PageGrabber* grabber = new PageGrabber();
if(grabber) {
grabber->Init(argv[2]);
if (NS_OK != grabber->Grab(argv[1])) {
return -1;
}
}
return 0;
}