gecko-dev/htmlparser/tests/grabpage/grabpage.cpp

301 строка
7.0 KiB
C++

/* -*- Mode: C++; tab-width: 2; indent-tabs-mode: nil; c-basic-offset: 2 -*- */
/* ***** BEGIN LICENSE BLOCK *****
* Version: NPL 1.1/GPL 2.0/LGPL 2.1
*
* The contents of this file are subject to the Netscape Public License
* Version 1.1 (the "License"); you may not use this file except in
* compliance with the License. You may obtain a copy of the License at
* http://www.mozilla.org/NPL/
*
* Software distributed under the License is distributed on an "AS IS" basis,
* WITHOUT WARRANTY OF ANY KIND, either express or implied. See the License
* for the specific language governing rights and limitations under the
* License.
*
* The Original Code is Mozilla Communicator client code.
*
* The Initial Developer of the Original Code is
* Netscape Communications Corporation.
* Portions created by the Initial Developer are Copyright (C) 1998
* the Initial Developer. All Rights Reserved.
*
* Contributor(s):
*
*
* Alternatively, the contents of this file may be used under the terms of
* either the GNU General Public License Version 2 or later (the "GPL"), or
* the GNU Lesser General Public License Version 2.1 or later (the "LGPL"),
* in which case the provisions of the GPL or the LGPL are applicable instead
* of those above. If you wish to allow use of your version of this file only
* under the terms of either the GPL or the LGPL, and not to allow others to
* use your version of this file under the terms of the NPL, indicate your
* decision by deleting the provisions above and replace them with the notice
* and other provisions required by the GPL or the LGPL. If you do not delete
* the provisions above, a recipient may use your version of this file under
* the terms of any one of the NPL, the GPL or the LGPL.
*
* ***** END LICENSE BLOCK ***** */
#include "nsIStreamListener.h"
#include "nsIInputStream.h"
#include "nsIURL.h"
#include "nsIIOService.h"
#include "nsIChannel.h"
static NS_DEFINE_CID(kIOServiceCID, NS_IOSERVICE_CID);
#include "nsString.h"
#include "nsReadableUtils.h"
#include "nsCRT.h"
#include "prprf.h"
#ifdef XP_PC
#include <windows.h>
#include <sys/types.h>
#include <sys/stat.h>
#endif
#ifdef XP_UNIX
#include <sys/types.h>
#include <sys/stat.h>
#endif
class StreamToFile : public nsIStreamListener {
public:
StreamToFile(FILE* fp);
NS_DECL_ISUPPORTS
NS_IMETHOD GetBindInfo(nsIURI* aURL);
NS_IMETHOD OnProgress(nsIURI* aURL, PRInt32 Progress, PRInt32 ProgressMax);
NS_IMETHOD OnStatus(nsIURI* aURL, const nsString& aMsg);
NS_IMETHOD OnStartRequest(nsIURI* aURL, const char *aContentType);
NS_IMETHOD OnDataAvailable(nsIURI* aURL, nsIInputStream *pIStream, PRInt32 length);
NS_IMETHOD OnStopRequest(nsIURI* aURL, PRInt32 status, const nsString& aMsg);
PRBool IsDone() const { return mDone; }
PRBool HaveError() const { return mError; }
protected:
~StreamToFile();
PRBool mDone;
PRBool mError;
FILE* mFile;
};
StreamToFile::StreamToFile(FILE* fp)
{
NS_INIT_REFCNT();
mDone = PR_FALSE;
mError = PR_FALSE;
mFile = fp;
}
NS_IMPL_ISUPPORTS1(StreamToFile, nsIStreamListener)
StreamToFile::~StreamToFile()
{
if (nsnull != mFile) {
fclose(mFile);
}
}
NS_IMETHODIMP
StreamToFile::GetBindInfo(nsIURI* aURL)
{
return 0;
}
NS_IMETHODIMP
StreamToFile::OnProgress(nsIURI* aURL, PRInt32 Progress, PRInt32 ProgressMax)
{
return 0;
}
NS_IMETHODIMP
StreamToFile::OnStatus(nsIURI* aURL, const nsString& aMsg)
{
return 0;
}
NS_IMETHODIMP
StreamToFile::OnStartRequest(nsIURI* aURL, const char *aContentType)
{
return 0;
}
NS_IMETHODIMP
StreamToFile::OnDataAvailable(nsIURI* aURL, nsIInputStream *pIStream,
PRInt32 length)
{
PRUint32 len;
do {
char buffer[4000];
nsresult err = pIStream->Read(buffer, 0, sizeof(buffer), &len);
if (NS_SUCCEEDED(err)) {
if (nsnull != mFile) {
fwrite(buffer, 1, len, mFile);
}
}
} while (len > 0);
return 0;
}
NS_IMETHODIMP
StreamToFile::OnStopRequest(nsIURI* aURL, PRInt32 status, const nsString& aMsg)
{
mDone = PR_TRUE;
if (0 != status) {
mError = PR_TRUE;
}
return 0;
}
//----------------------------------------------------------------------
// This could turn into a handy utility someday...
class PageGrabber {
public:
PageGrabber();
~PageGrabber();
NS_DECL_AND_IMPL_ZEROING_OPERATOR_NEW
nsresult Init(const nsString& aDirectory);
nsresult Grab(const nsString& aURL);
protected:
char* NextFile(const char* aExtension);
nsString mDirectory;
PRInt32 mFileNum;
};
PageGrabber::PageGrabber()
{
}
PageGrabber::~PageGrabber()
{
}
nsresult
PageGrabber::Init(const nsString& aDirectory)
{
mDirectory = aDirectory;
if (aDirectory.Last() != '/') {
mDirectory.Append('/');
}
return NS_OK;
}
char*
PageGrabber::NextFile(const char* aExtension)
{
char* cname = nsnull;
nsAutoString name;
for (;;) {
name.Truncate();
name.Append(mDirectory);
char fileName[20];
PR_snprintf(fileName, sizeof(fileName), "%08d.%s", mFileNum, aExtension);
name.Append(fileName);
// See if file already exists; if it does advance mFileNum by 100 and
// try again.
cname = ToNewCString(name);
struct stat sb;
int s = stat(cname, &sb);
if (s < 0) {
mFileNum++;
break;
}
else {
mFileNum += 100;
delete [] cname;
}
}
return cname;
}
nsresult
PageGrabber::Grab(const nsString& aURL)
{
char* cname = NextFile("html");
if (nsnull == cname) {
return NS_ERROR_OUT_OF_MEMORY;
}
FILE* fp = fopen(cname, "wb");
if (nsnull == fp) {
return NS_ERROR_OUT_OF_MEMORY;
}
printf("Copying ");
fputs(aURL, stdout);
printf(" to %s\n", cname);
// Create the URL object...
nsIURI* url = NULL;
nsresult rv;
rv = nsCOMPtr<nsIIOService> ioService(do_GetService(kIOServiceCID, &rv));
if (NS_FAILED(rv)) return rv;
nsIChannel *channel = nsnull;
// XXX NECKO what verb? what eventSinkGetter?
rv = ioService->NewChannel("load", aURL, nsnull, nsnull, &channel);
if (NS_FAILED(rv)) return rv;
// Start the URL load...
StreamToFile* copier = new StreamToFile(fp);
if(copier) {
NS_ADDREF(copier);
rv = channel->AsyncOpen(copier, nsnull);
if (NS_OK != rv) {
NS_RELEASE(copier);
NS_RELEASE(url);
return rv;
}
// Enter the message pump to allow the URL load to proceed.
#ifdef XP_PC
MSG msg;
while ( !copier->IsDone() ) {
if (PeekMessage(&msg, NULL, 0, 0, PM_REMOVE)) {
TranslateMessage(&msg);
DispatchMessage(&msg);
}
}
#endif
PRBool error = copier->HaveError();
NS_RELEASE(copier);
}
NS_RELEASE(url);
return error ? NS_ERROR_OUT_OF_MEMORY : NS_OK;
}
//----------------------------------------------------------------------
int
main(int argc, char **argv)
{
nsString url_address;
if (argc != 3) {
fprintf(stderr, "Usage: grabpage url directory\n");
return -1;
}
PageGrabber* grabber = new PageGrabber();
if(grabber) {
grabber->Init(argv[2]);
if (NS_OK != grabber->Grab(argv[1])) {
return -1;
}
}
return 0;
}