Let me know if the attached patch works for you--it seemed to work in my
minimal testing just now.
-Geoff
Index: htdig/Retriever.cc
===================================================================
RCS file: /opt/htdig/cvs/htdig3/htdig/Retriever.cc,v
retrieving revision 1.72.2.40
diff -c -3 -p -r1.72.2.40 Retriever.cc
*** htdig/Retriever.cc 2000/10/10 03:15:36 1.72.2.40
--- htdig/Retriever.cc 2000/10/31 04:39:43
*************** Retriever::got_redirect(const char *new_
*** 1629,1635 ****
delete localRobotsFile;
}
server->push(url.get(), ref->DocHopCount(), base->get(),
! IsLocalURL(url.get()));
String temp = url.get();
visited.Add(temp, 0);
--- 1629,1635 ----
delete localRobotsFile;
}
server->push(url.get(), ref->DocHopCount(), base->get(),
! IsLocalURL(url.get()), 0);
String temp = url.get();
visited.Add(temp, 0);
Index: htdig/Server.cc
===================================================================
RCS file: /opt/htdig/cvs/htdig3/htdig/Server.cc,v
retrieving revision 1.17.2.17
diff -c -3 -p -r1.17.2.17 Server.cc
*** htdig/Server.cc 2000/10/20 03:40:56 1.17.2.17
--- htdig/Server.cc 2000/10/31 04:39:44
*************** void Server::robotstxt(Document &doc)
*** 294,302 ****
//*****************************************************************************
! // void Server::push(String &path, int hopcount, char *referer, int local)
//
! void Server::push(const String &path, int hopcount, const String &referer, int local)
{
if (_bad_server && !local)
return;
--- 294,303 ----
//*****************************************************************************
! // void Server::push(String &path, int hopcount, char *referer, int local, int newDoc)
//
! void Server::push(const String &path, int hopcount, const String &referer,
! int local, int newDoc)
{
if (_bad_server && !local)
return;
*************** void Server::push(const String &path, in
*** 309,316 ****
return;
}
! // We use -1 as no limit
! if (_max_documents != -1 &&
_documents >= _max_documents)
{
if (debug>2) // Hey! we only want to get max_docs
--- 310,318 ----
return;
}
! // We use -1 as no limit, but we also don't want
! // to forbid redirects from old places
! if (_max_documents != -1 && newDoc &&
_documents >= _max_documents)
{
if (debug>2) // Hey! we only want to get max_docs
*************** void Server::push(const String &path, in
*** 325,331 ****
ref->SetReferer(referer);
_paths.Add(ref);
! _documents++;
// cout << "***** pushing '" << path << "' with '" << referer << "'\n";
}
--- 327,334 ----
ref->SetReferer(referer);
_paths.Add(ref);
! if (newDoc)
! _documents++;
// cout << "***** pushing '" << path << "' with '" << referer << "'\n";
}
Index: htdig/Server.h
===================================================================
RCS file: /opt/htdig/cvs/htdig3/htdig/Server.h,v
retrieving revision 1.9.2.10
diff -c -3 -p -r1.9.2.10 Server.h
*** htdig/Server.h 2000/10/20 03:40:56 1.9.2.10
--- htdig/Server.h 2000/10/31 04:39:45
*************** public:
*** 61,67 ****
// if it's down, it simply will not be added
//
void push(const String &path, int hopcount, const String &referer,
! int local = 0);
//
// Return the next URL from the queue for this server.
--- 61,67 ----
// if it's down, it simply will not be added
//
void push(const String &path, int hopcount, const String &referer,
! int local = 0, int newDoc = 1);
//
// Return the next URL from the queue for this server.
------------------------------------
To unsubscribe from the htdig3-dev mailing list, send a message to
[EMAIL PROTECTED]
You will receive a message to confirm this.