Changes between Version 3 and Version 4 of Swish-e

Show
Ignore:
Timestamp:
09/07/08 22:22:53 (16 years ago)
Author:
tianxc (IP: 192.168.192.144)
Comment:

--

Legend:

Unmodified
Added
Removed
Modified
  • Swish-e

    v3 v4  
    1919    email       => 'tianxc@ihep.ac.cn', 
    2020    base_url    => 'http://dayabay.ihep.ac.cn/', 
     21    test_url    => sub {  $_[0]->path !~ /\.(?:gif|jpeg|png|gz|root)$/i }, 
    2122    delay_sec   => '1', 
    22     max_depth   => '1', 
    23     credentials => 'username:password' 
     23    max_depth   => 'username:password' 
    2424); 
    2525 
     
    2727    email       => 'tianxc@ihep.ac.cn', 
    2828    base_url    => 'http://dayabay.bnl.gov/private/documents/', 
     29    test_url    => sub {  $_[0]->path !~ /\.(?:gif|jpeg|png|gz|root)$/i }, 
    2930    delay_sec   => '1', 
    3031    max_depth   => '1', 
     
    3536    email       => 'tianxc@ihep.ac.cn', 
    3637    base_url    => 'http://dayabay.ihep.ac.cn/cgi-bin/DocDB/ListBy?alldocs=1', 
     38    test_url    => sub {  $_[0]->path !~ /\.(?:gif|jpeg|png|gz|root)$/i }, 
    3739    delay_sec   => '1', 
    3840    max_depth   => '1', 
     
    4345    email       => 'tianxc@ihep.ac.cn', 
    4446    base_url    => 'http://dayabay.ihep.ac.cn/cgi-bin/EngDB/ListBy?alldocs=1', 
     47    test_url    => sub {  $_[0]->path !~ /\.(?:gif|jpeg|png|gz|root)$/i }, 
    4548    delay_sec   => '1', 
    4649    max_depth   => '1', 
     
    5154    email       => 'tianxc@ihep.ac.cn', 
    5255    base_url    => 'http://dayabay.ihep.ac.cn/internal/', 
     56    test_url    => sub {  $_[0]->path !~ /\.(?:gif|jpeg|png|gz|root)$/i }, 
    5357    delay_sec   => '1', 
    5458    max_depth   => '1', 
     
    5963    email       => 'tianxc@ihep.ac.cn', 
    6064    base_url    => 'https://wiki.bnl.gov/dayabay/index.php?title=Main_Page', 
     65    test_url    => sub {  $_[0]->path !~ /\.(?:gif|jpeg|png|gz|root)$/i }, 
    6166    delay_sec   => '1', 
    6267    max_depth   => '2', 
     
    6671    email       => 'tianxc@ihep.ac.cn', 
    6772    base_url    => 'https://wiki.bnl.gov/dayabay-private/index.php?title=Main_Page', 
     73    test_url    => sub {  $_[0]->path !~ /\.(?:gif|jpeg|png|gz|root)$/i }, 
    6874    delay_sec   => '1', 
    6975    max_depth   => '2', 
     
    7379my %repository  = ( 
    7480    email       => 'tianxc@ihep.ac.cn', 
    75     base_url    => 'http://dayabay.ihep.ac.cn/tracs/dybsvn/browser/', 
     81    base_url    => 'http://dayabay.ihep.ac.cn/svn/dybsvn', 
     82    test_url    => sub {  $_[0]->path !~ /\.(?:gif|jpeg|png|gz|root|pdf|ps)$/i }, 
    7683    delay_sec   => '1', 
    7784    max_depth   => '10', 
     
    8289    email       => 'tianxc@ihep.ac.cn', 
    8390    base_url    => 'http://dayabay.ihep.ac.cn/tracs/dybsvn', 
     91    test_url    => sub {  $_[0]->path !~ /\.(?:gif|jpeg|png|gz|root)$/i }, 
    8492    delay_sec   => '1', 
    8593    max_depth   => '2', 
     
    123131 
    124132== Troubleshooting == 
     133   * External program failed to return required headers Path-Name (Swish-e 2.4.5) 
     134{{{                                                                               
     135Warning: document 'http://dayabay.ihep.ac.cn/svn/dybsvn/data/trunk/SimuAlg/output/neutron.output' has no content 
     136Warning: document 'http://dayabay.ihep.ac.cn/svn/dybsvn/db/trunk/DatabaseMaintenance/dict/dict.h' has no content 
     137Warning: document 'http://dayabay.ihep.ac.cn/svn/dybsvn/db/trunk/DatabaseMaintenance/dict/dict.xml' has no content 
     138Warning: document 'http://dayabay.ihep.ac.cn/svn/dybsvn/db/trunk/Util/src/Singleton.cc' has no content 
     139Warning: document 'http://dayabay.ihep.ac.cn/svn/dybsvn/dybgaudi/trunk/Control/DybCommon/ChangeLog' has no content 
     140Warning: document 'http://dayabay.ihep.ac.cn/svn/dybsvn/gaudi/trunk/Gaudi/options/empty.opts' has no content 
     141External Program found: /home/tianxc/local/lib/swish-e/spider.pl 
     142 
     143Warning: Unknown header line: 's' from program spider.pl 
     144 
     145Warning: Unknown header line: '//--------------------------------------------------------------' from program spider.pl 
     146 
     147Warning: Unknown header line: 'ApplicationMgr.EvtMax   = 1;' from program spider.pl 
     148 
     149Warning: Unknown header line: 'ApplicationMgr.EvtSel  = "NONE";' from program spider.pl 
     150err: External program failed to return required headers Path-Name: 
     151}}} 
     152   In spider.pl (see http://swish-e.org/archive/2007-03/11360.html), change: 
    125153{{{ 
    126 Warning: Unknown header line: 'h-Name: http://www.xxx.xxx/xx.htm' from program spider.pl 
    127 err: External program failed to return required headers Path-Name:. 
     154my $bytecount = length pack 'C0a*', $$content; 
    128155}}} 
    129    *  my $bytecount = length($$content); 
    130    * see http://swish-e.org/archive/2007-03/11360.html 
     156to: 
    131157{{{ 
    132 HTTP authorization with password protected Trac/mediawiki  
     158my $bytecount = length($$content); 
    133159}}} 
     160 
     161   * HTTP authorization with password-protected Trac/MediaWiki  
     162