Here are three site files I've been learning with, all for news sources
local to the San Francisco Bay Area:

# Site file for the BayArea.com local news front page.
# NOTE(review): the per-key remarks below describe what the patterns
# literally contain; exact key semantics should be confirmed against the
# Sitescooper site-file documentation.
URL:  http://www.bayarea.com/news/
Name: BayArea.com News
Description: local news for the SF Bay Area from BayArea.com
AuthorName: Bill Janssen
AuthorEmail: [EMAIL PROTECTED]
Levels: 2
# Story links: anything under www.bayarea.com.
StoryURL:  http://www.bayarea.com/.*
ContentsCachable: 0
# Contents page is delimited by the <!--Date--> comment and the next <CENTER>.
ContentsStart: <!--Date-->
ContentsEnd: <CENTER>
# Story pages are delimited by the SNML headline/body markers.
StoryStart: <SNML_HEADLINES>
StoryEnd: </SNML_BODY>
# Insert a page heading and a "(from <url>)" source note immediately before
# the first "<I><B>Last updated</B>" marker. The substitution is kept on a
# single line: the mailed copy had been hard-wrapped in the middle of the
# replacement text, which embedded a stray line break in the output.
ContentsHTMLPreProcess: {
  s,(<I><B>Last updated</B>),<H1>SF Bay Area News</H1><br><i>(from http://www.bayarea.com/news/)</i><br>$1,s;
}


# Site file for the SFGate.com news front page.
# NOTE(review): the per-key remarks below describe what the patterns
# literally contain; exact key semantics should be confirmed against the
# Sitescooper site-file documentation.
URL:  http://www.sfgate.com/news/
Name: SFGate.com News
Description: SF Bay Area news stories from sfgate.com (Chronicle/Examiner/KRON)
AuthorName: Bill Janssen
AuthorEmail: [EMAIL PROTECTED]
Levels: 2
# Two story link patterns: CGI-served articles and the Bay City News directory.
StoryURL:  http://www.sfgate.com/cgi-bin/article.cgi.*
StoryURL:  http://www.sfgate.com/news/baycitynews/.*
ContentsCachable: 0
# The asterisks in the page's HTML marker comments are backslash-escaped so
# they match literally rather than acting as regex quantifiers.
ContentsStart: <!-- \*\*\*\*\*\*\*\* BEGIN STEW \*\*\*\*\*\*\*\*\*\*\* -->
ContentsEnd: <!-- END STORIES SCRIPT \*\*\*\*\*\*\*\*\*\*\*\*\*\*\*\*\*\* -->
StoryStart: <!-- BEGIN HEADLINE NESTED TABLE -->
StoryEnd: <!-- \*\*\*\*\* END OF BIG TABLE \*\*\*\*\* -->
# Prepend a heading and a source note to the start of the contents HTML.
# The substitution is kept on a single line: the mailed copy had been
# hard-wrapped in the middle of the replacement text.
ContentsHTMLPreProcess: {
  s/^/<H1>News from SFGate\.com<\/H1><br><i>(from SF Chronicle, SF Examiner, KRON, AP, SF Gate sources)<\/i><br>/gs;
}
# Loosen fixed-size table layout in story HTML: drop a numeric WIDTH= that
# directly follows "<TABLE ", and drop numeric WIDTH= and NOWRAP attributes
# found inside <TD ...> tags.
StoryPostProcess: {
        s/<TABLE WIDTH=[0-9]*/<TABLE/gm;
        s/<TD([^>]*)WIDTH=[0-9]*/<TD$1/gm;
        s/<TD([^>]*)NOWRAP/<TD$1/gm;
}


# Site file for the San Francisco Chronicle Food section article list.
# NOTE(review): the per-key remarks below describe what the patterns
# literally contain; exact key semantics should be confirmed against the
# Sitescooper site-file documentation.
URL:  http://www.sfgate.com/cgi-bin/article-list.cgi?key=FD&directory=Food
Name: SF Chronicle Food
Description: San Francisco Chronicle Food section (published Wednesdays)
AuthorName: Bill Janssen
AuthorEmail: [EMAIL PROTECTED]
Levels: 2
# Story links: CGI-served articles on sfgate.com.
StoryURL:  http://www.sfgate.com/cgi-bin/article.cgi.*
# Image pattern matching the Chronicle brand graphic (chronicle.gif) under
# any host/prefix.
ImageURL: .*/templates/brands/chronicle/images/chronicle\.gif
ContentsCachable: 0
# The asterisks in the page's HTML marker comments are backslash-escaped so
# they match literally rather than acting as regex quantifiers.
ContentsStart: <!--END HEADLINE MODULE-->
ContentsEnd: <!-- \*\*\*\*\* END OF BIG TABLE \*\*\*\*\* -->
StoryStart: <!-- BEGIN HEADLINE NESTED TABLE -->
StoryEnd: <!-- \*\*\*\*\* END OF BIG TABLE \*\*\*\*\* -->
# Prepend a section heading to the start of the contents HTML.
ContentsHTMLPreProcess: {
  s,^,<H1>SF Chronicle Food Section</H1>,s;
}
# Loosen fixed-size table layout in story HTML: drop a numeric WIDTH= that
# directly follows "<TABLE ", and drop numeric WIDTH= and NOWRAP attributes
# found inside <TD ...> tags.
StoryPostProcess: {
        s/<TABLE WIDTH=[0-9]*/<TABLE/gm;
        s/<TD([^>]*)WIDTH=[0-9]*/<TD$1/gm;
        s/<TD([^>]*)NOWRAP/<TD$1/gm;
}
_______________________________________________
Sitescooper-talk mailing list
[EMAIL PROTECTED]
http://lists.sourceforge.net/mailman/listinfo/sitescooper-talk

Reply via email to