okay, enough

git-svn-id: file:///svn/phpbb/trunk@8222 89ea8834-ac86-4346-8a33-228a782c2dd0
This commit is contained in:
Henry Sudhof 2007-11-01 13:01:41 +00:00
parent 5f37327568
commit ce8be416d8

View file

@ -23,66 +23,66 @@ $auth->acl($user->data);
$user->setup(); $user->setup();
$bots = array( $bots = array(
'AdsBot [Google]', 'AdsBot [Google]' => array('AdsBot-Google', ''),
'Alexa [Bot]', 'Alexa [Bot]' => array('ia_archiver', ''),
'Alta Vista [Bot]', 'Alta Vista [Bot]' => array('Scooter/', ''),
'Ask Jeeves [Bot]', 'Ask Jeeves [Bot]' => array('Ask Jeeves', ''),
'Baidu [Spider]', 'Baidu [Spider]' => array('Baiduspider+(', ''),
'Exabot [Bot]', 'Exabot [Bot]' => array('Exabot/', ''),
'FAST Enterprise [Crawler]', 'FAST Enterprise [Crawler]' => array('FAST Enterprise Crawler', ''),
'FAST WebCrawler [Crawler]', 'FAST WebCrawler [Crawler]' => array('FAST-WebCrawler/', ''),
'Francis [Bot]', 'Francis [Bot]' => array('http://www.neomo.de/', ''),
'Gigabot [Bot]', 'Gigabot [Bot]' => array('Gigabot/', ''),
'Google Adsense [Bot]', 'Google Adsense [Bot]' => array('Mediapartners-Google', ''),
'Google Desktop', 'Google Desktop' => array('Google Desktop', ''),
'Google Feedfetcher', 'Google Feedfetcher' => array('Feedfetcher-Google', ''),
'Google [Bot]', 'Google [Bot]' => array('Googlebot', ''),
'Heise IT-Markt [Crawler]', 'Heise IT-Markt [Crawler]' => array('heise-IT-Markt-Crawler', ''),
'Heritrix [Crawler]', 'Heritrix [Crawler]' => array('heritrix/1.', ''),
'IBM Research [Bot]', 'IBM Research [Bot]' => array('ibm.com/cs/crawler', ''),
'ICCrawler - ICjobs', 'ICCrawler - ICjobs' => array('ICCrawler - ICjobs', ''),
'ichiro [Crawler]', 'ichiro [Crawler]' => array('ichiro/2', ''),
'Majestic-12 [Bot]', 'Majestic-12 [Bot]' => array('MJ12bot/', ''),
'Metager [Bot]', 'Metager [Bot]' => array('MetagerBot/', ''),
'MSN NewsBlogs', 'MSN NewsBlogs' => array('msnbot-NewsBlogs/', ''),
'MSN [Bot]', 'MSN [Bot]' => array('msnbot/', ''),
'MSNbot Media', 'MSNbot Media' => array('msnbot-media/', ''),
'NG-Search [Bot]', 'NG-Search [Bot]' => array('NG-Search/', ''),
'Nutch [Bot]', 'Nutch [Bot]' => array('http://lucene.apache.org/nutch/', ''),
'Nutch/CVS [Bot]', 'Nutch/CVS [Bot]' => array('NutchCVS/', ''),
'OmniExplorer [Bot]', 'OmniExplorer [Bot]' => array('OmniExplorer_Bot/', ''),
'Online link [Validator]', 'Online link [Validator]' => array('online link validator', ''),
'psbot [Picsearch]', 'psbot [Picsearch]' => array('psbot/0', ''),
'Seekport [Bot]', 'Seekport [Bot]' => array('Seekbot/', ''),
'Sensis [Crawler]', 'Sensis [Crawler]' => array('Sensis Web Crawler', ''),
'SEO Crawler', 'SEO Crawler' => array('SEO search Crawler/', ''),
'Seoma [Crawler]', 'Seoma [Crawler]' => array('Seoma [SEO Crawler]', ''),
'SEOSearch [Crawler]', 'SEOSearch [Crawler]' => array('SEOsearch/', ''),
'Snappy [Bot]', 'Snappy [Bot]' => array('Snappy/1.1 ( http://www.urltrends.com/ )', ''),
'Steeler [Crawler]', 'Steeler [Crawler]' => array('http://www.tkl.iis.u-tokyo.ac.jp/~crawler/', ''),
'Synoo [Bot]', 'Synoo [Bot]' => array('SynooBot/', ''),
'Telekom [Bot]', 'Telekom [Bot]' => array('crawleradmin.t-info@telekom.de', ''),
'TurnitinBot [Bot]', 'TurnitinBot [Bot]' => array('TurnitinBot/', ''),
'Voyager [Bot]', 'Voyager [Bot]' => array('voyager/1.0', ''),
'W3 [Sitesearch]', 'W3 [Sitesearch]' => array('W3 SiteSearch Crawler', ''),
'W3C [Linkcheck]', 'W3C [Linkcheck]' => array('W3C-checklink/', ''),
'W3C [Validator]', 'W3C [Validator]' => array('W3C_*Validator', ''),
'WiseNut [Bot]', 'WiseNut [Bot]' => array('http://www.WISEnutbot.com', ''),
'YaCy [Bot]', 'YaCy [Bot]' => array('yacybot', ''),
'Yahoo MMCrawler [Bot]', 'Yahoo MMCrawler [Bot]' => array('Yahoo-MMCrawler/', ''),
'Yahoo Slurp [Bot]', 'Yahoo Slurp [Bot]' => array('Yahoo! DE Slurp', ''),
'Yahoo [Bot]', 'Yahoo [Bot]' => array('Yahoo! Slurp', ''),
'YahooSeeker [Bot]', 'YahooSeeker [Bot]' => array('YahooSeeker/', ''),
); );
$bot_ids = array(); $bot_ids = array();
user_get_id_name($bot_ids, $bots, USER_IGNORE); user_get_id_name($bot_ids, array_keys($bots), USER_IGNORE);
foreach($bot_ids as $bot) foreach($bot_ids as $bot)
{ {
user_delete('remove', $bot); user_delete('remove', $bot);
} }
// Done // Done
add_bots(); add_bots($bots);
echo 'done'; echo 'done';
@ -92,7 +92,7 @@ echo 'done';
* If you are converting bots this function should not be called * If you are converting bots this function should not be called
* @todo We might want to look at sharing the bot list between the install code and this code for consistency * @todo We might want to look at sharing the bot list between the install code and this code for consistency
*/ */
function add_bots() function add_bots($bots)
{ {
global $db, $config; global $db, $config;
@ -113,58 +113,7 @@ function add_bots()
} }
$bots = array(
'AdsBot [Google]' => array('AdsBot-Google', ''),
'Alexa [Bot]' => array('ia_archiver', ''),
'Alta Vista [Bot]' => array('Scooter/', ''),
'Ask Jeeves [Bot]' => array('Ask Jeeves', ''),
'Baidu [Spider]' => array('Baiduspider+(', ''),
'Exabot [Bot]' => array('Exabot/', ''),
'FAST Enterprise [Crawler]' => array('FAST Enterprise Crawler', ''),
'FAST WebCrawler [Crawler]' => array('FAST-WebCrawler/', ''),
'Francis [Bot]' => array('http://www.neomo.de/', ''),
'Gigabot [Bot]' => array('Gigabot/', ''),
'Google Adsense [Bot]' => array('Mediapartners-Google', ''),
'Google Desktop' => array('Google Desktop', ''),
'Google Feedfetcher' => array('Feedfetcher-Google', ''),
'Google [Bot]' => array('Googlebot', ''),
'Heise IT-Markt [Crawler]' => array('heise-IT-Markt-Crawler', ''),
'Heritrix [Crawler]' => array('heritrix/1.', ''),
'IBM Research [Bot]' => array('ibm.com/cs/crawler', ''),
'ICCrawler - ICjobs' => array('ICCrawler - ICjobs', ''),
'ichiro [Crawler]' => array('ichiro/2', ''),
'Majestic-12 [Bot]' => array('MJ12bot/', ''),
'Metager [Bot]' => array('MetagerBot/', ''),
'MSN NewsBlogs' => array('msnbot-NewsBlogs/', ''),
'MSN [Bot]' => array('msnbot/', ''),
'MSNbot Media' => array('msnbot-media/', ''),
'NG-Search [Bot]' => array('NG-Search/', ''),
'Nutch [Bot]' => array('http://lucene.apache.org/nutch/', ''),
'Nutch/CVS [Bot]' => array('NutchCVS/', ''),
'OmniExplorer [Bot]' => array('OmniExplorer_Bot/', ''),
'Online link [Validator]' => array('online link validator', ''),
'psbot [Picsearch]' => array('psbot/0', ''),
'Seekport [Bot]' => array('Seekbot/', ''),
'Sensis [Crawler]' => array('Sensis Web Crawler', ''),
'SEO Crawler' => array('SEO search Crawler/', ''),
'Seoma [Crawler]' => array('Seoma [SEO Crawler]', ''),
'SEOSearch [Crawler]' => array('SEOsearch/', ''),
'Snappy [Bot]' => array('Snappy/1.1 ( http://www.urltrends.com/ )', ''),
'Steeler [Crawler]' => array('http://www.tkl.iis.u-tokyo.ac.jp/~crawler/', ''),
'Synoo [Bot]' => array('SynooBot/', ''),
'Telekom [Bot]' => array('crawleradmin.t-info@telekom.de', ''),
'TurnitinBot [Bot]' => array('TurnitinBot/', ''),
'Voyager [Bot]' => array('voyager/1.0', ''),
'W3 [Sitesearch]' => array('W3 SiteSearch Crawler', ''),
'W3C [Linkcheck]' => array('W3C-checklink/', ''),
'W3C [Validator]' => array('W3C_*Validator', ''),
'WiseNut [Bot]' => array('http://www.WISEnutbot.com', ''),
'YaCy [Bot]' => array('yacybot', ''),
'Yahoo MMCrawler [Bot]' => array('Yahoo-MMCrawler/', ''),
'Yahoo Slurp [Bot]' => array('Yahoo! DE Slurp', ''),
'Yahoo [Bot]' => array('Yahoo! Slurp', ''),
'YahooSeeker [Bot]' => array('YahooSeeker/', ''),
);
foreach ($bots as $bot_name => $bot_ary) foreach ($bots as $bot_name => $bot_ary)