Commit | Line | Data |
---|---|---|
25ab2d04 MW |
1 | <?xml version="1.0" encoding="UTF-8"?> |
2 | <data xmlns="http://www.woltlab.com" xmlns:xsi="http://www.w3.org/2001/XMLSchema-instance" xsi:schemaLocation="http://www.woltlab.com http://www.woltlab.com/XSD/maelstrom/spiderList.xsd"> | |
3 | <spider ident="ABCdatos"> | |
4 | <name>ABCdatos BotLink</name> | |
5 | <url>http://www.robotstxt.org/wc/active/html/abcdatos.html</url> | |
6 | </spider> | |
9581146e PM |
7 | <spider ident="AbraveSpider"> |
8 | <name>Abrave</name> | |
9 | <url>http://robot.abrave.co.uk/</url> | |
10 | </spider> | |
25ab2d04 MW |
11 | <spider ident="abot/"> |
12 | <name>abot</name> | |
13 | <url>http://www.abot.com/</url> | |
14 | </spider> | |
15 | <spider ident="Accelatech RSSCrawler"> | |
16 | <name>Accelatech</name> | |
17 | </spider> | |
18 | <spider ident="Accoona-AI-Agent"> | |
19 | <name>Accoona</name> | |
20 | <url>http://accoona.com/about/about_accoona.jsp</url> | |
21 | </spider> | |
22 | <spider ident="aconon Index"> | |
23 | <name>aconon Index (raubfische.de)</name> | |
24 | </spider> | |
25 | <spider ident="AcoonBot"> | |
26 | <name>Acoon</name> | |
27 | <url>http://www.acoon.de/robot.asp</url> | |
28 | </spider> | |
29 | <spider ident="Ahoy!"> | |
30 | <name>Ahoy!</name> | |
31 | <url>http://www.robotstxt.org/wc/active/html/ahoythehomepagefinder.html</url> | |
32 | </spider> | |
33 | <spider ident="AhrefsBot"> | |
34 | <name>Ahrefs</name> | |
35 | <url>http://ahrefs.com/robot/</url> | |
36 | </spider> | |
37 | <spider ident="AlkalineBOT"> | |
38 | <name>Alkaline</name> | |
39 | <url>http://www.robotstxt.org/wc/active/html/Alkaline.html</url> | |
40 | </spider> | |
f55aa1aa P |
41 | <spider ident="AlexaBOT"> |
42 | <name>Alexa</name> | |
43 | <url>http://www.alexa.com/help/webmasters</url> | |
44 | </spider> | |
25ab2d04 MW |
45 | <spider ident="http://www.almaden.ibm.com/cs/crawler"> |
46 | <name>Almaden Crawler</name> | |
47 | <url>http://www.almaden.ibm.com/cs/crawler/</url> | |
48 | </spider> | |
49 | <spider ident="EMC Spider"> | |
50 | <name>ananzi</name> | |
51 | </spider> | |
52 | <spider ident="Anthill"> | |
53 | <name>Anthill</name> | |
54 | <url>http://www.robotstxt.org/wc/active/html/anthill.html</url> | |
55 | </spider> | |
56 | <spider ident="Aport"> | |
57 | <name>Aport</name> | |
58 | <url>http://www.aport.ru/</url> | |
59 | </spider> | |
60 | <spider ident="AppleSyndication"> | |
61 | <name>Apple</name> | |
62 | </spider> | |
63 | <spider ident="Arachnophilia"> | |
64 | <name>Arachnophilia</name> | |
65 | <url>http://www.robotstxt.org/wc/active/html/arachnophilia.html</url> | |
66 | </spider> | |
67 | <spider ident="Araneo"> | |
68 | <name>Araneo</name> | |
69 | <url>http://www.robotstxt.org/wc/active/html/araneo.html</url> | |
70 | </spider> | |
71 | <spider ident="ArchitextSpider"> | |
72 | <name>ArchitextSpider</name> | |
73 | <url>http://www.robotstxt.org/wc/active/html/architext.html</url> | |
74 | </spider> | |
89b52a1a | 75 | <spider ident="archive.org_bot"> |
25ab2d04 | 76 | <name>Archive.org</name> |
89b52a1a | 77 | <url>https://archive.org/details/archive.org_bot</url> |
25ab2d04 MW |
78 | </spider> |
79 | <spider ident="arks/1.0"> | |
80 | <name>arks</name> | |
81 | <url>http://www.robotstxt.org/wc/active/html/arks.html</url> | |
82 | </spider> | |
83 | <spider ident="ASpider"> | |
84 | <name>ASpider</name> | |
85 | <url>http://www.robotstxt.org/wc/active/html/aspider.html</url> | |
86 | </spider> | |
87 | <spider ident="ATN_Worldwide"> | |
88 | <name>ATN Worldwide</name> | |
89 | <url>http://www.robotstxt.org/wc/active/html/atn.txt.html</url> | |
90 | </spider> | |
91 | <spider ident="Atomz"> | |
92 | <name>Atomz.com</name> | |
93 | <url>http://www.robotstxt.org/wc/active/html/atomz.html</url> | |
94 | </spider> | |
95 | <spider ident="AURESYS"> | |
96 | <name>AURESYS</name> | |
97 | <url>http://www.robotstxt.org/wc/active/html/auresys.html</url> | |
98 | </spider> | |
99 | <spider ident="BackRub"> | |
100 | <name>BackRub</name> | |
101 | <url>http://www.robotstxt.org/wc/active/html/backrub.html</url> | |
102 | </spider> | |
103 | <spider ident="Baiduspider"> | |
104 | <name>Baiduspider</name> | |
105 | <url>http://www.baidu.com/search/spider.htm</url> | |
106 | </spider> | |
107 | <spider ident="bbot"> | |
108 | <name>BBot</name> | |
109 | <url>http://www.robotstxt.org/wc/active/html/bbot.html</url> | |
110 | </spider> | |
111 | <spider ident="BecomeBot"> | |
112 | <name>BecomeBot</name> | |
113 | <url>http://www.become.com/webmasters.html</url> | |
114 | </spider> | |
115 | <spider ident="Big Brother"> | |
116 | <name>Big Brother</name> | |
117 | <url>http://www.robotstxt.org/wc/active/html/bigbrother.html</url> | |
118 | </spider> | |
119 | <spider ident="BigmirSpider"> | |
120 | <name>Bigmir</name> | |
121 | <url>http://www.bigmir.net/</url> | |
122 | </spider> | |
123 | <spider ident="bingbot"> | |
124 | <name>Bing</name> | |
125 | <url>http://www.bing.com/bingbot.htm</url> | |
126 | </spider> | |
127 | <spider ident="Bitacle bot"> | |
128 | <name>Bitacle</name> | |
129 | <url>http://bitacle.org/</url> | |
130 | </spider> | |
131 | <spider ident="Biz360 Spider"> | |
132 | <name>Biz</name> | |
133 | <url>http://www.biz360.com</url> | |
134 | </spider> | |
135 | <spider ident="Bjaaland"> | |
136 | <name>Bjaaland</name> | |
137 | <url>http://www.robotstxt.org/wc/active/html/bjaaland.html</url> | |
138 | </spider> | |
139 | <spider ident="BlackWidow"> | |
140 | <name>BlackWidow</name> | |
141 | <url>http://www.robotstxt.org/wc/active/html/blackwidow.html</url> | |
142 | </spider> | |
b730b757 MW |
143 | <spider ident="BLEXBot"> |
144 | <name>BLEXBot</name> | |
145 | <url>http://webmeup.com/crawler.html</url> | |
146 | </spider> | |
25ab2d04 MW |
147 | <spider ident="BlogCrawler by Xango"> |
148 | <name>BlogCrawler</name> | |
149 | </spider> | |
150 | <spider ident="blogdb"> | |
151 | <name>BlogDb</name> | |
152 | <url>http://blogdb.jp</url> | |
153 | </spider> | |
154 | <spider ident="blog search engine by BlogFan.ORG"> | |
155 | <name>BlogFan</name> | |
156 | <url>http://www.blogfan.org</url> | |
157 | </spider> | |
158 | <spider ident="Bloglines"> | |
159 | <name>Bloglines</name> | |
160 | <url>http://www.bloglines.com</url> | |
161 | </spider> | |
162 | <spider ident="BlogPulse (ISSpider-3.0)"> | |
163 | <name>BlogPulse</name> | |
164 | </spider> | |
165 | <spider ident="BlogSearch"> | |
166 | <name>BlogSearch</name> | |
167 | <url>http://www.icerocket.com</url> | |
168 | </spider> | |
169 | <spider ident="BlogsNowBot"> | |
170 | <name>BlogsNow</name> | |
171 | <url>http://www.blogsnow.com/</url> | |
172 | </spider> | |
173 | <spider ident="BlogStreetBot"> | |
174 | <name>BlogStreetBot</name> | |
175 | <url>http://www.blogstreet.com/</url> | |
176 | </spider> | |
177 | <spider ident="Bulkfeeds"> | |
178 | <name>Bulkfeeds</name> | |
179 | <url>http://bulkfeeds.net</url> | |
180 | </spider> | |
181 | <spider ident="BoardPulse"> | |
182 | <name>BoardPulse</name> | |
183 | <url>http://www.boardpulse.com/</url> | |
184 | </spider> | |
185 | <spider ident="BoardReader"> | |
186 | <name>BoardReader</name> | |
187 | <url>http://www.boardreader.com/aboutus.asp</url> | |
188 | </spider> | |
189 | <spider ident="BoardViewer"> | |
190 | <name>BoardViewer</name> | |
191 | <url>http://www.boardviewer.com/</url> | |
192 | </spider> | |
193 | <spider ident="boitho.com-robot"> | |
194 | <name>Boitho</name> | |
195 | <url>http://www.boitho.com/bot.html</url> | |
196 | </spider> | |
197 | <spider ident="borg-bot"> | |
198 | <name>Borg-Bot</name> | |
199 | <url>http://www.robotstxt.org/wc/active/html/borg-bot.html</url> | |
200 | </spider> | |
201 | <spider ident="BSpider"> | |
202 | <name>BSpider</name> | |
203 | <url>http://www.robotstxt.org/wc/active/html/bspider.html</url> | |
204 | </spider> | |
205 | <spider ident="CACTVS Chemistry Spider"> | |
206 | <name>CACTVS Chemistry</name> | |
207 | </spider> | |
208 | <spider ident="Calif"> | |
209 | <name>Calif</name> | |
210 | </spider> | |
211 | <spider ident="CaRP/3.6Evolution"> | |
212 | <name>CaRP</name> | |
213 | <url>http://www.biz360.com</url> | |
214 | </spider> | |
215 | <spider ident="Checkbot"> | |
216 | <name>Checkbot</name> | |
217 | </spider> | |
218 | <spider ident="ChristCrawler.com"> | |
219 | <name>ChristCrawler.com</name> | |
220 | </spider> | |
221 | <spider ident="www.cienciaficcion.net"> | |
222 | <name>cIeNcIaFiCcIoN.nEt</name> | |
223 | </spider> | |
224 | <spider ident="CipinetBot"> | |
225 | <name>Cipinet</name> | |
226 | <url>http://www.cipinet.com/bot.html</url> | |
227 | </spider> | |
228 | <spider ident="CJNetworkQuality"> | |
229 | <name>CJNetworkQuality</name> | |
230 | <url>http://www.cj.com/networkquality/</url> | |
231 | </spider> | |
232 | <spider ident="CMC/0.01"> | |
233 | <name>CMC/0.01</name> | |
234 | </spider> | |
235 | <spider ident="ColdFusion"> | |
236 | <name>ColdFusion</name> | |
237 | </spider> | |
238 | <spider ident="combine"> | |
239 | <name>Combine System</name> | |
240 | </spider> | |
241 | <spider ident="Crawler (cometsearch@cometsystems.com)"> | |
242 | <name>cometsystems.com</name> | |
243 | </spider> | |
244 | <spider ident="ComputingSite Robi/1.0"> | |
245 | <name>ComputingSite Robi/1.0</name> | |
246 | </spider> | |
247 | <spider ident="conceptbot"> | |
248 | <name>Conceptbot</name> | |
249 | </spider> | |
250 | <spider ident="Cooby.de Crawler"> | |
251 | <name>Cooby.de Crawler</name> | |
252 | </spider> | |
253 | <spider ident="CoolBot"> | |
254 | <name>CoolBot</name> | |
255 | </spider> | |
256 | <spider ident="Cusco"> | |
257 | <name>Cusco</name> | |
258 | </spider> | |
259 | <spider ident="CyberSpyder"> | |
260 | <name>CyberSpyder</name> | |
261 | </spider> | |
262 | <spider ident="daypopbot"> | |
263 | <name>daypop</name> | |
264 | </spider> | |
265 | <spider ident="DesertRealm.com"> | |
266 | <name>Desert Realm</name> | |
267 | </spider> | |
268 | <spider ident="Deweb"> | |
269 | <name>DeWeb(c)</name> | |
270 | </spider> | |
271 | <spider ident="Die Blinde Kuh"> | |
272 | <name>Die Blinde Kuh</name> | |
273 | <url>http://www.robotstxt.org/wc/active/html/blindekuh.html</url> | |
274 | </spider> | |
275 | <spider ident="dienstspider"> | |
276 | <name>DienstSpider</name> | |
277 | </spider> | |
278 | <spider ident="Digger/1.0 JDK/1.3.0"> | |
279 | <name>Digger</name> | |
280 | </spider> | |
281 | <spider ident="Digimarc WebReader"> | |
282 | <name>Digimarc MarcSpider</name> | |
283 | </spider> | |
284 | <spider ident="Digimarc CGIReader"> | |
285 | <name>Digimarc Marcspider/CGI</name> | |
286 | </spider> | |
287 | <spider ident="DIIbot"> | |
288 | <name>Digital Integrity Robot</name> | |
289 | </spider> | |
290 | <spider ident="grabber"> | |
291 | <name>Direct Hit Grabber</name> | |
292 | </spider> | |
293 | <spider ident="discobot"> | |
294 | <name>Discovery</name> | |
295 | <url>http://discoveryengine.com/discobot.html</url> | |
296 | </spider> | |
297 | <spider ident="DNAbot/1.0"> | |
298 | <name>DNAbot</name> | |
299 | </spider> | |
300 | <spider ident="DragonBot/1.0 libwww/5.0"> | |
301 | <name>DragonBot</name> | |
302 | </spider> | |
303 | <spider ident="DWCP/2.0"> | |
304 | <name>DWCP (Dridus' Web Cataloging Project)</name> | |
305 | </spider> | |
306 | <spider ident="e-SocietyRobot"> | |
307 | <name>e-Society</name> | |
308 | <url>http://www.yama.info.waseda.ac.jp/~yamana/es/index_eng.htm</url> | |
309 | </spider> | |
310 | <spider ident="exactseek-pagereaper"> | |
311 | <name>exactseek-page</name> | |
312 | </spider> | |
313 | <spider ident="EbiNess/0.01a"> | |
314 | <name>EbiNess</name> | |
315 | </spider> | |
316 | <spider ident="edgeio-retriever"> | |
317 | <name>Edgeio</name> | |
318 | <url>http://www.edgeio.com</url> | |
319 | </spider> | |
320 | <spider ident="EIT-Link-Verifier-Robot/0.2"> | |
321 | <name>EIT Link Verifier Robot</name> | |
322 | </spider> | |
323 | <spider ident="elfinbot"> | |
324 | <name>ELFINBOT</name> | |
325 | </spider> | |
326 | <spider ident="Emacs-w3/v[0-9\.]+"> | |
327 | <name>Emacs-w3 Search Engine</name> | |
328 | </spider> | |
329 | <spider ident="esther"> | |
330 | <name>Esther</name> | |
331 | </spider> | |
332 | <spider ident="EuripBot/"> | |
333 | <name>EuripBot</name> | |
334 | </spider> | |
335 | <spider ident="Evliya Celebi"> | |
336 | <name>Evliya Celebi</name> | |
337 | </spider> | |
338 | <spider ident="ExactSeek_Spider"> | |
339 | <name>ExactSeek_Spider</name> | |
340 | <url>http://www.askjeevs.com</url> | |
341 | </spider> | |
342 | <spider ident="NG/2.0"> | |
343 | <name>ExaLead</name> | |
344 | <url>http://botspotter.net/bs-389.html</url> | |
345 | </spider> | |
346 | <spider ident="ExaBot"> | |
347 | <name>ExaLead Beta</name> | |
348 | <url>http://beta.exalead.com/search/C=0/2p=Help.7</url> | |
349 | </spider> | |
f55aa1aa P |
350 | <spider ident="ExaLead"> |
351 | <name>ExaLead</name> | |
352 | <url>http://www.exalead.com/search</url> | |
353 | </spider> | |
25ab2d04 MW |
354 | <spider ident="facebookexternalhit"> |
355 | <name>Facebook</name> | |
356 | <url>http://www.facebook.com/externalhit_uatext.php</url> | |
357 | </spider> | |
358 | <spider ident="fast-webcrawler"> | |
359 | <name>FAST / AlltheWeb</name> | |
360 | <url>http://help.yahoo.com/help/us/ysearch/slurp/index.html</url> | |
361 | </spider> | |
362 | <spider ident="FastCrawler"> | |
363 | <name>FastCrawler</name> | |
364 | </spider> | |
365 | <spider ident="Feed24.com"> | |
366 | <name>Feed24</name> | |
367 | <url>http://www.feed24.com</url> | |
368 | </spider> | |
369 | <spider ident="FeedBlitz"> | |
370 | <name>FeedBlitz</name> | |
371 | <url>http://www.feedblitz.com</url> | |
372 | </spider> | |
373 | <spider ident="FeedBurner"> | |
374 | <name>FeedBurner</name> | |
375 | <url>http://www.FeedBurner.com</url> | |
376 | </spider> | |
7a944c3f MW |
377 | <spider ident="Feedly"> |
378 | <name>Feedly</name> | |
379 | <url>http://www.feedly.com/fetcher.html</url> | |
380 | </spider> | |
25ab2d04 MW |
381 | <spider ident="Feedfetcher-Google"> |
382 | <name>FeedFetcher-Google</name> | |
383 | <url>http://www.google.com/feedfetcher.html</url> | |
384 | </spider> | |
385 | <spider ident="UniversalFeedParser"> | |
386 | <name>FeedParser</name> | |
387 | <url>http://www.feedparser.org</url> | |
388 | </spider> | |
389 | <spider ident="Feedster Crawler"> | |
390 | <name>Feedster</name> | |
391 | <url>http://www.feedstermedia.com/</url> | |
392 | </spider> | |
393 | <spider ident="FEHLSTART Superspider"> | |
394 | <name>FEHLSTART</name> | |
395 | </spider> | |
396 | <spider ident="FelixIDE"> | |
397 | <name>Felix IDE</name> | |
398 | </spider> | |
399 | <spider ident="ESIRover"> | |
400 | <name>FetchRover</name> | |
401 | </spider> | |
402 | <spider ident="fido"> | |
403 | <name>fido</name> | |
404 | </spider> | |
405 | <spider ident="findlinks"> | |
406 | <name>FindLinks</name> | |
407 | <url>http://wortschatz.uni-leipzig.de/findlinks/</url> | |
408 | </spider> | |
409 | <spider ident="FindoryBot"> | |
410 | <name>Findory</name> | |
411 | <url>http://www.findory.com</url> | |
412 | </spider> | |
413 | <spider ident="Fish-Search-Robot"> | |
414 | <name>Fish search</name> | |
415 | </spider> | |
416 | <spider ident="Mozilla/4.0 (compatible: FDSE robot)"> | |
417 | <name>Fluid Dynamics</name> | |
418 | </spider> | |
419 | <spider ident="fouineur.9bit.qc.ca"> | |
420 | <name>Fouineur</name> | |
421 | </spider> | |
422 | <spider ident="Freecrawl"> | |
423 | <name>Freecrawl</name> | |
424 | </spider> | |
425 | <spider ident="FunnelWeb"> | |
426 | <name>FunnelWeb</name> | |
427 | </spider> | |
428 | <spider ident="GaisBot"> | |
429 | <name>Gais</name> | |
430 | <url>http://gais.cs.ccu.edu.tw/robot.php</url> | |
431 | </spider> | |
432 | <spider ident="gamekitbot"> | |
433 | <name>GAMEKIT</name> | |
434 | <url>http://www.uchoose.de/crawler/gamekitbot/</url> | |
435 | </spider> | |
436 | <spider ident="gammaSpider"> | |
437 | <name>gammaSpider</name> | |
438 | </spider> | |
439 | <spider ident="gazz"> | |
440 | <name>gazz</name> | |
441 | </spider> | |
442 | <spider ident="gcreep"> | |
443 | <name>GCreep</name> | |
444 | </spider> | |
445 | <spider ident="genieBot"> | |
446 | <name>genieBot</name> | |
447 | <url>http://64.5.245.11/faq/faq.html</url> | |
448 | </spider> | |
449 | <spider ident="geourl"> | |
450 | <name>GeoURL</name> | |
451 | <url>http://geourl.org/bot.html</url> | |
452 | </spider> | |
453 | <spider ident="GetterroboPlus"> | |
454 | <name>GetterroboPlus Puu</name> | |
455 | </spider> | |
456 | <spider ident="GetURL.rexx"> | |
457 | <name>GetURL</name> | |
458 | </spider> | |
459 | <spider ident="Gigabot"> | |
460 | <name>Gigabot</name> | |
461 | <url>http://www.gigablast.com/spider.html</url> | |
462 | </spider> | |
463 | <spider ident="Girafabot"> | |
464 | <name>Girafabot</name> | |
465 | <url>http://www.girafa.com/</url> | |
466 | </spider> | |
467 | <spider ident="Goku"> | |
468 | <name>Goku</name> | |
469 | <url>http://goku.ru/bot.htm; bot@goku.ru</url> | |
470 | </spider> | |
471 | <spider ident="Golem"> | |
472 | <name>Golem</name> | |
473 | </spider> | |
474 | <spider ident="gonzo"> | |
475 | <name>Gonzo</name> | |
476 | </spider> | |
477 | <spider ident="Googlebot/"> | |
478 | <name>Google</name> | |
479 | <url>http://www.google.com/bot.html</url> | |
480 | </spider> | |
481 | <spider ident="Mediapartners-Google"> | |
482 | <name>Google AdSense</name> | |
483 | <url>https://www.google.com/adsense/faq</url> | |
484 | </spider> | |
485 | <spider ident="Googlebot-Image"> | |
486 | <name>Googlebot-Image</name> | |
487 | <url>http://www.googlebot.com/bot.html</url> | |
488 | </spider> | |
489 | <spider ident="Googlebot-Mobile"> | |
490 | <name>Googlebot-Mobile</name> | |
491 | <url>http://www.google.com/bot.html</url> | |
492 | </spider> | |
493 | <spider ident="Gpostbot"> | |
494 | <name>Gpostbot</name> | |
495 | <url>http://www.gpost.info/help.php?c=bot</url> | |
496 | </spider> | |
497 | <spider ident="griffon"> | |
498 | <name>Griffon</name> | |
499 | </spider> | |
500 | <spider ident="Gromit"> | |
501 | <name>Gromit</name> | |
502 | </spider> | |
503 | <spider ident="http://grub.org"> | |
504 | <name>Grub Client</name> | |
505 | </spider> | |
506 | <spider ident="Gulper Web Bot"> | |
507 | <name>Gulper Bot</name> | |
508 | </spider> | |
509 | <spider ident="havIndex"> | |
510 | <name>havIndex</name> | |
511 | </spider> | |
512 | <spider ident="HeinrichderMiragoRobot"> | |
513 | <name>HeinrichderMiragoRobot</name> | |
514 | </spider> | |
515 | <spider ident="HenryTheMiragoRobot"> | |
516 | <name>HenryTheMiragoRobot</name> | |
517 | </spider> | |
518 | <spider ident="heritrix"> | |
519 | <name>Heritrix</name> | |
520 | <url>http://www.worio.com</url> | |
521 | </spider> | |
522 | <spider ident="HKU WWW Robot"> | |
523 | <name>HKU WWW Octopus</name> | |
524 | </spider> | |
525 | <spider ident="HolyCowDude"> | |
526 | <name>HolyCowDude</name> | |
527 | <url>http://www.holycowdude.com/spider.htm</url> | |
528 | </spider> | |
9581146e PM |
529 | <spider ident="HomeTags"> |
530 | <name>HomeTags</name> | |
531 | <url>http://www.hometags.nl/bot</url> | |
532 | </spider> | |
25ab2d04 MW |
533 | <spider ident="Hometown"> |
534 | <name>Hometown</name> | |
535 | </spider> | |
536 | <spider ident="htdig"> | |
537 | <name>ht://Dig</name> | |
538 | </spider> | |
539 | <spider ident="AITCSRobot"> | |
540 | <name>HTML Index</name> | |
541 | </spider> | |
542 | <spider ident="HTMLgobble"> | |
543 | <name>HTMLgobble</name> | |
544 | </spider> | |
545 | <spider ident="I Robot"> | |
546 | <name>I, Robot</name> | |
547 | </spider> | |
548 | <spider ident="iajaBot"> | |
549 | <name>iajaBot</name> | |
550 | </spider> | |
551 | <spider ident="IBM_Planetwide"> | |
552 | <name>IBM_Planetwide</name> | |
553 | </spider> | |
554 | <spider ident="+http://www.icerocket.com/"> | |
555 | <name>IceRocket</name> | |
556 | <url>http://www.icerocket.com/</url> | |
557 | </spider> | |
558 | <spider ident="ichiro"> | |
559 | <name>ichiro</name> | |
560 | </spider> | |
561 | <spider ident="IlTrovatore-Setaccio"> | |
562 | <name>IlTrovatore-Setaccio</name> | |
563 | <url>http://www.iltrovatore.it/aiuto/faq.html</url> | |
564 | </spider> | |
565 | <spider ident="image.kapsi.net"> | |
566 | <name>image.kapsi.net</name> | |
567 | </spider> | |
568 | <spider ident="Mozilla 3.01 PBWF (Win95)"> | |
569 | <name>Imagelock</name> | |
570 | </spider> | |
571 | <spider ident="IncyWincy"> | |
572 | <name>IncyWincy</name> | |
573 | </spider> | |
574 | <spider ident="Informant"> | |
575 | <name>Informant</name> | |
576 | </spider> | |
577 | <spider ident="InfoSeek Robot"> | |
578 | <name>InfoSeek Robot 1.0</name> | |
579 | </spider> | |
580 | <spider ident="Infoseek Sidewinder"> | |
581 | <name>Infoseek Sidewinder</name> | |
582 | </spider> | |
583 | <spider ident="InfoSpiders"> | |
584 | <name>InfoSpiders</name> | |
585 | </spider> | |
586 | <spider ident="INGRID"> | |
587 | <name>Ingrid</name> | |
588 | </spider> | |
589 | <spider ident="slurp@inktomi"> | |
590 | <name>Inktomi</name> | |
591 | </spider> | |
592 | <spider ident="Insitor"> | |
593 | <name>Insitor</name> | |
594 | <url>http://www.insitor.de/</url> | |
595 | </spider> | |
596 | <spider ident="inspectorwww"> | |
597 | <name>Inspector Web</name> | |
598 | </spider> | |
599 | <spider ident="IAGENT"> | |
600 | <name>IntelliAgent</name> | |
601 | </spider> | |
602 | <spider ident="Intelliseek"> | |
603 | <name>Intelliseek</name> | |
604 | <url>http://www.intelliseek.com/</url> | |
605 | </spider> | |
606 | <spider ident="Internet Cruiser Robot"> | |
607 | <name>Internet Cruiser</name> | |
608 | </spider> | |
609 | <spider ident="internetseer"> | |
610 | <name>Internet Seer</name> | |
611 | </spider> | |
612 | <spider ident="sharp-info-agent"> | |
613 | <name>Internet Shinchakubin</name> | |
614 | </spider> | |
615 | <spider ident="InternetLinkAgent"> | |
616 | <name>InternetLinkAgent</name> | |
617 | </spider> | |
618 | <spider ident="IRLbot"> | |
619 | <name>IRL Crawler</name> | |
620 | <url>http://irl.cs.tamu.edu/crawler</url> | |
621 | </spider> | |
622 | <spider ident="Iron33"> | |
623 | <name>Iron33</name> | |
624 | </spider> | |
625 | <spider ident="IsraeliSearch"> | |
626 | <name>Israeli-search</name> | |
627 | </spider> | |
628 | <spider ident="itchBot"> | |
629 | <name>itch</name> | |
630 | <url>http://www.itch.com/infoforwebmasters.html</url> | |
631 | </spider> | |
632 | <spider ident="JavaBee"> | |
633 | <name>JavaBee</name> | |
634 | </spider> | |
635 | <spider ident="JBot"> | |
636 | <name>JBot</name> | |
637 | </spider> | |
638 | <spider ident="JCrawler"> | |
639 | <name>JCrawler</name> | |
640 | </spider> | |
641 | <spider ident="JetBot"> | |
642 | <name>JetEye</name> | |
643 | <url>http://www.jeteye.com/jetbot.html</url> | |
644 | </spider> | |
645 | <spider ident="JoBo"> | |
646 | <name>JoBo</name> | |
647 | </spider> | |
648 | <spider ident="Jobot"> | |
649 | <name>Jobot</name> | |
650 | </spider> | |
651 | <spider ident="jobs.de"> | |
652 | <name>Jobs.de</name> | |
653 | <url>http://www.jobs.de/</url> | |
654 | </spider> | |
655 | <spider ident="JoeBot"> | |
656 | <name>JoeBot</name> | |
657 | </spider> | |
658 | <spider ident="jumpstation"> | |
659 | <name>JumpStation</name> | |
660 | </spider> | |
661 | <spider ident="Katipo"> | |
662 | <name>Katipo</name> | |
663 | </spider> | |
664 | <spider ident="KDD-Explorer"> | |
665 | <name>KDD-Explorer</name> | |
666 | </spider> | |
667 | <spider ident="KIT-Fireball"> | |
668 | <name>KIT-Fireball</name> | |
669 | </spider> | |
670 | <spider ident="KO_Yappo_Robot"> | |
671 | <name>KO_Yappo_Robot</name> | |
672 | </spider> | |
673 | <spider ident="LabelGrab"> | |
674 | <name>LabelGrabber</name> | |
675 | </spider> | |
676 | <spider ident="larbin"> | |
677 | <name>larbin</name> | |
678 | </spider> | |
679 | <spider ident="legs"> | |
680 | <name>legs</name> | |
681 | </spider> | |
682 | <spider ident="LinkScan Server"> | |
683 | <name>LinkScan</name> | |
684 | </spider> | |
685 | <spider ident="LinkWalker"> | |
686 | <name>LinkWalker</name> | |
687 | </spider> | |
f55aa1aa P |
688 | <spider ident="Linguee Bot"> |
689 | <name>Linguee</name> | |
690 | <url>http://www.linguee.com/bot</url> | |
691 | </spider> | |
25ab2d04 MW |
692 | <spider ident="livedoorCheckers/"> |
693 | <name>livedoorCheckers</name> | |
694 | </spider> | |
695 | <spider ident="Lockon"> | |
696 | <name>Lockon</name> | |
697 | </spider> | |
698 | <spider ident="logo.gif crawler"> | |
699 | <name>logo.gif</name> | |
700 | </spider> | |
701 | <spider ident="Lycos"> | |
702 | <name>Lycos</name> | |
703 | </spider> | |
704 | <spider ident="Magpie"> | |
705 | <name>Magpie</name> | |
706 | </spider> | |
707 | <spider ident="MJ12bot"> | |
708 | <name>Majestics MJ12bot</name> | |
709 | </spider> | |
710 | <spider ident="Mammoth"> | |
711 | <name>Mammoth</name> | |
712 | <url>http://www.sli-systems.com</url> | |
713 | </spider> | |
714 | <spider ident="Marvin"> | |
715 | <name>Marvin</name> | |
716 | </spider> | |
717 | <spider ident="marvin/infoseek"> | |
718 | <name>marvin/infoseek</name> | |
719 | </spider> | |
720 | <spider ident="M/3.8"> | |
721 | <name>Mattie</name> | |
722 | </spider> | |
723 | <spider ident="MediaFox"> | |
724 | <name>MediaFox</name> | |
725 | </spider> | |
d9cc31f0 SG |
726 | <spider ident="memorybot"> |
727 | <name>Memorybot</name> | |
728 | <url>http://archivethe.net/en/index.php/about/internet_memory1</url> | |
729 | </spider> | |
25ab2d04 MW |
730 | <spider ident="mercator"> |
731 | <name>Mercator</name> | |
732 | <url>http://research.compaq.com/SRC/mercator/</url> | |
733 | </spider> | |
734 | <spider ident="MerzScope"> | |
735 | <name>MerzScope</name> | |
736 | </spider> | |
737 | <spider ident="METASpider"> | |
738 | <name>META</name> | |
739 | <url>http://www.meta.com.ua/</url> | |
740 | </spider> | |
741 | <spider ident="MetaGer-LinkChecker"> | |
742 | <name>MetaGer</name> | |
743 | </spider> | |
744 | <spider ident="MindCrawler"> | |
745 | <name>MindCrawler</name> | |
746 | </spider> | |
747 | <spider ident="Miva"> | |
748 | <name>Miva</name> | |
749 | </spider> | |
750 | <spider ident="UdmSearch"> | |
751 | <name>mnoGoSearch</name> | |
752 | </spider> | |
753 | <spider ident="moget"> | |
754 | <name>moget</name> | |
755 | </spider> | |
756 | <spider ident="MOMspider"> | |
757 | <name>MOMspider</name> | |
758 | </spider> | |
759 | <spider ident="Monster"> | |
760 | <name>Monster</name> | |
761 | </spider> | |
762 | <spider ident="Moreoverbot"> | |
763 | <name>Moreover</name> | |
764 | <url>http://www.moreover.com</url> | |
765 | </spider> | |
766 | <spider ident="msnbot"> | |
767 | <name>MSNBot</name> | |
768 | <url>http://search.msn.com/msnbot.htm</url> | |
769 | </spider> | |
770 | <spider ident="MSRBOT"> | |
771 | <name>MSRBOT</name> | |
772 | <url>http://research.microsoft.com/research/sv/msrbot/</url> | |
773 | </spider> | |
774 | <spider ident="MuscatFerret"> | |
775 | <name>Muscat Ferret</name> | |
776 | </spider> | |
777 | <spider ident="MwdSearch"> | |
778 | <name>Mwd.Search</name> | |
779 | </spider> | |
780 | <spider ident="NPBot"> | |
781 | <name>NameProtect</name> | |
782 | </spider> | |
783 | <spider ident="NaverBot"> | |
784 | <name>NaverBot</name> | |
785 | <url>http://www.spidermatic.com/en/robot-spider/20</url> | |
52bb0ca4 | 786 | </spider> |
6a3fbb36 | 787 | <spider ident="NDSpider"> |
52bb0ca4 | 788 | <name>NDSpider</name> |
25ab2d04 MW |
789 | </spider> |
790 | <spider ident="NEC-MeshExplorer"> | |
791 | <name>NEC-MeshExplorer</name> | |
792 | </spider> | |
793 | <spider ident="Nederland.zoek"> | |
794 | <name>Nederland.zoek</name> | |
795 | </spider> | |
89b52a1a MW |
796 | <spider ident="NerdyBot"> |
797 | <name>NerdyBot</name> | |
798 | <url>http://nerdybot.com/</url> | |
799 | </spider> | |
25ab2d04 MW |
800 | <spider ident="NetCarta CyberPilot Pro"> |
801 | <name>NetCarta WebMap</name> | |
802 | </spider> | |
803 | <spider ident="Netcraft"> | |
804 | <name>Netcraft Web Server Survey</name> | |
805 | <url>http://news.netcraft.com/</url> | |
806 | </spider> | |
807 | <spider ident="NetMechanic"> | |
808 | <name>NetMechanic</name> | |
809 | </spider> | |
810 | <spider ident="NetScoop"> | |
811 | <name>NetScoop</name> | |
812 | </spider> | |
813 | <spider ident="newscan-online"> | |
814 | <name>newscan-online</name> | |
815 | </spider> | |
816 | <spider ident="NextGenSearchBot 1"> | |
817 | <name>NextGenSearchBot</name> | |
818 | <url>http://www.zoominfo.com/NextGenSearchBot</url> | |
819 | </spider> | |
820 | <spider ident="NHSEWalker"> | |
821 | <name>NHSE Web Forager</name> | |
822 | </spider> | |
823 | <spider ident="NIF"> | |
824 | <name>NIF</name> | |
825 | <url>http://www.newsisfree.com/robot.php</url> | |
826 | </spider> | |
827 | <spider ident="NimbleCrawler"> | |
828 | <name>NimbleCrawler</name> | |
829 | <url>http://www.healthline.com/aboutus.jsp</url> | |
830 | </spider> | |
831 | <spider ident="Nomad"> | |
832 | <name>Nomad</name> | |
833 | </spider> | |
834 | <spider ident="Norbert the Spider"> | |
835 | <name>Norbert</name> | |
836 | <url>http://www.Burf.com</url> | |
837 | </spider> | |
838 | <spider ident="Gulliver"> | |
839 | <name>Northern Light</name> | |
840 | </spider> | |
841 | <spider ident="explorersearch"> | |
842 | <name>nzexplorer</name> | |
843 | </spider> | |
844 | <spider ident="Occam"> | |
845 | <name>Occam</name> | |
846 | </spider> | |
847 | <spider ident="Ocelli"> | |
848 | <name>Ocelli</name> | |
849 | <url>http://www.globalspec.com/Ocelli</url> | |
850 | </spider> | |
851 | <spider ident="Online24-Bot"> | |
852 | <name>Online24-Bot</name> | |
853 | </spider> | |
854 | <spider ident="Openbot"> | |
855 | <name>Openbot</name> | |
856 | <url>http://www.openfind.com.tw/robot.html</url> | |
857 | </spider> | |
858 | <spider ident="Openfind"> | |
859 | <name>Openfind data gatherer</name> | |
860 | </spider> | |
861 | <spider ident="Orbsearch"> | |
862 | <name>Orb Search</name> | |
863 | </spider> | |
864 | <spider ident="PackRat"> | |
865 | <name>Pack Rat</name> | |
866 | </spider> | |
867 | <spider ident="PageBoy"> | |
868 | <name>PageBoy</name> | |
869 | </spider> | |
870 | <spider ident="ParaSite"> | |
871 | <name>ParaSite</name> | |
872 | </spider> | |
873 | <spider ident="Patric"> | |
874 | <name>Patric</name> | |
875 | </spider> | |
876 | <spider ident="PEGASUS"> | |
877 | <name>pegasus</name> | |
878 | </spider> | |
879 | <spider ident="PerlCrawler/1.0 Xavatoria/2.0"> | |
880 | <name>PerlCrawler 1.0</name> | |
881 | </spider> | |
882 | <spider ident="PGP-KA"> | |
883 | <name>PGP Key Agent</name> | |
884 | </spider> | |
885 | <spider ident="Duppies"> | |
886 | <name>Phantom</name> | |
887 | </spider> | |
888 | <spider ident="phpdig"> | |
889 | <name>PhpDig</name> | |
890 | </spider> | |
891 | <spider ident="PiltdownMan"> | |
892 | <name>PiltdownMan</name> | |
893 | </spider> | |
894 | <spider ident="Pimptrain's robot"> | |
895 | <name>Pimptrain.com's</name> | |
896 | </spider> | |
897 | <spider ident="pingalink"> | |
898 | <name>PingALink</name> | |
899 | </spider> | |
900 | <spider ident="Pioneer"> | |
901 | <name>Pioneer</name> | |
902 | </spider> | |
903 | <spider ident="PluckFeedCrawler"> | |
904 | <name>Pluck</name> | |
905 | <url>http://www.pluck.com</url> | |
906 | </spider> | |
907 | <spider ident="PlumtreeWebAccessor"> | |
908 | <name>PlumtreeWebAccessor</name> | |
909 | </spider> | |
910 | <spider ident="PodNova"> | |
911 | <name>PodNova</name> | |
912 | <url>http://www.podnova.com</url> | |
913 | </spider> | |
914 | <spider ident="Pompos"> | |
915 | <name>Pompos</name> | |
916 | <url>http://dir.com/pompos.html</url> | |
917 | </spider> | |
918 | <spider ident="Poppi"> | |
919 | <name>Poppi</name> | |
920 | </spider> | |
921 | <spider ident="gestaltIconoclast"> | |
922 | <name>Popular Iconoclast</name> | |
923 | </spider> | |
924 | <spider ident="PortalJuice.com"> | |
925 | <name>Portal Juice</name> | |
926 | </spider> | |
927 | <spider ident="PortalBSpider"> | |
928 | <name>PortalB Spider</name> | |
929 | </spider> | |
f55aa1aa P |
930 | <spider ident="Qualidator"> |
931 | <name>Qualidator</name> | |
932 | <url>http://www.qualidator.com/Web/de/Support/FAQ_OnlineTestStatistiken.htm</url> | |
933 | </spider> | |
25ab2d04 MW |
934 | <spider ident="www.kolinka.com"> |
935 | <name>Project Kolinka Forum Search</name> | |
936 | <url>http://www.kolinka.com/</url> | |
937 | </spider> | |
938 | <spider ident="psbot"> | |
939 | <name>psbot</name> | |
940 | </spider> | |
941 | <spider ident="Qango.com Web Directory"> | |
942 | <name>Qango</name> | |
943 | <url>http://www.qango.com</url> | |
944 | </spider> | |
f55aa1aa P |
945 | <spider ident="SBSearch"> |
946 | <name>SecretSearchEngineLabs.com</name> | |
947 | <url>http://www.secretsearchenginelabs.com/secret-web-crawler.php</url> | |
948 | </spider> | |
25ab2d04 MW |
949 | <spider ident="StackRambler"> |
950 | <name>Rambler</name> | |
951 | <url>http://www.rambler.ru/</url> | |
952 | </spider> | |
953 | <spider ident="Raven"> | |
954 | <name>Raven Search</name> | |
955 | </spider> | |
956 | <spider ident="Resume Robot"> | |
957 | <name>Resume Robot</name> | |
958 | </spider> | |
959 | <spider ident="Road Runner: ImageScape Robot"> | |
960 | <name>Road Runner: The ImageScape Robot</name> | |
961 | </spider> | |
962 | <spider ident="RHCS"> | |
963 | <name>RoadHouse Crawling System</name> | |
964 | </spider> | |
965 | <spider ident="Robbie"> | |
966 | <name>Robbie the Robot</name> | |
967 | </spider> | |
968 | <spider ident="RoboCrawl"> | |
969 | <name>RoboCrawl</name> | |
970 | </spider> | |
971 | <spider ident="Robofox"> | |
972 | <name>RoboFox</name> | |
973 | </spider> | |
974 | <spider ident="Robot du CRIM 1.0a"> | |
975 | <name>Robot Francoroute</name> | |
976 | </spider> | |
977 | <spider ident="Robozilla"> | |
978 | <name>Robozilla</name> | |
979 | </spider> | |
980 | <spider ident="Roverbot"> | |
981 | <name>Roverbot</name> | |
982 | </spider> | |
983 | <spider ident="RSS-SPIDER"> | |
984 | <name>RSS Feed Seeker</name> | |
985 | <url>http://www.rss-spider.com/fsb.php</url> | |
986 | </spider> | |
987 | <spider ident="RuLeS"> | |
988 | <name>RuLeS</name> | |
989 | </spider> | |
9581146e PM |
990 | <spider ident="RyzeCrawler"> |
991 | <name>RyzeCrawler</name> | |
992 | <url>http://www.domain2day.nl/crawler/</url> | |
993 | </spider> | |
25ab2d04 MW |
994 | <spider ident="SafetyNet Robot"> |
995 | <name>SafetyNet</name> | |
996 | </spider> | |
997 | <spider ident="SBIder"> | |
998 | <name>SBIder</name> | |
999 | <url>http://www.sitesell.com/sbider.html</url> | |
1000 | </spider> | |
1001 | <spider ident="Scharia"> | |
1002 | <name>Scharia</name> | |
1003 | </spider> | |
1004 | <spider ident="Science-Index"> | |
1005 | <name>Science-Index</name> | |
1006 | </spider> | |
1007 | <spider ident="Scooter"> | |
1008 | <name>Scooter</name> | |
1009 | </spider> | |
1010 | <spider ident="SearchNZ"> | |
1011 | <name>SearchNZ</name> | |
1012 | <url>http://www.searchnz.co.nz/</url> | |
1013 | </spider> | |
1014 | <spider ident="searchprocess"> | |
1015 | <name>SearchProcess</name> | |
1016 | </spider> | |
1017 | <spider ident="SearchmetricsBot"> | |
1018 | <name>SearchmetricsBot</name> | |
1019 | <url>http://www.searchmetrics.com/en/searchmetrics-bot/</url> | |
1020 | </spider> | |
1021 | <spider ident="Seekbot"> | |
1022 | <name>Seekbot</name> | |
1023 | <url>http://www.seekbot.net/bot.html</url> | |
1024 | </spider> | |
1025 | <spider ident="Senrigan"> | |
1026 | <name>Senrigan</name> | |
1027 | </spider> | |
1028 | <spider ident="Sensis Web Crawler"> | |
1029 | <name>Sensis Web Crawler</name> | |
1030 | <url>http://www.sensis.com.au/help.do</url> | |
1031 | </spider> | |
1032 | <spider ident="SG-Scout"> | |
1033 | <name>SG-Scout</name> | |
1034 | </spider> | |
1035 | <spider ident="Shagseeker"> | |
1036 | <name>ShagSeeker</name> | |
1037 | </spider> | |
1038 | <spider ident="Shai'Hulud"> | |
1039 | <name>Shai'Hulud</name> | |
1040 | </spider> | |
1041 | <spider ident="SimBot/1.0"> | |
1042 | <name>Simmany Robot Ver1.0</name> | |
1043 | </spider> | |
1044 | <spider ident="ssearcher100"> | |
1045 | <name>Site Searcher</name> | |
1046 | </spider> | |
1047 | <spider ident="Site Valet"> | |
1048 | <name>Site Valet</name> | |
1049 | </spider> | |
1050 | <spider ident="http://www.site-list.net"> | |
1051 | <name>Site-List</name> | |
1052 | <url>http://www.site-list.net</url> | |
1053 | </spider> | |
1054 | <spider ident="SiteTech-Rover"> | |
1055 | <name>SiteTech-Rover</name> | |
1056 | </spider> | |
1057 | <spider ident="+SitiDi.net/SitiDiBot/"> | |
1058 | <name>SitiDi.net/SitiDiBot</name> | |
1059 | </spider> | |
1060 | <spider ident="aWapClient"> | |
1061 | <name>Skymob.com</name> | |
1062 | </spider> | |
1063 | <spider ident="SLCrawler"> | |
1064 | <name>SLCrawler</name> | |
1065 | </spider> | |
1066 | <spider ident="Sleek Spider"> | |
1067 | <name>Sleek</name> | |
1068 | </spider> | |
1069 | <spider ident="ESISmartSpider"> | |
1070 | <name>Smart Spider</name> | |
1071 | </spider> | |
1072 | <spider ident="Snapbot"> | |
1073 | <name>Snapbot</name> | |
1074 | <url>http://www.snap.com/</url> | |
1075 | </spider> | |
1076 | <spider ident="Snooper"> | |
1077 | <name>Snooper</name> | |
1078 | </spider> | |
1079 | <spider ident="sohu-search"> | |
1080 | <name>sohu-search</name> | |
1081 | </spider> | |
1082 | <spider ident="Solbot"> | |
1083 | <name>Solbot</name> | |
1084 | </spider> | |
1085 | <spider ident="Speedy Spider"> | |
1086 | <name>Speedy Spider</name> | |
1087 | <url>http://www.entireweb.com/about/search_tech/speedyspider/</url> | |
1088 | </spider> | |
1089 | <spider ident="Sphere Scout"> | |
1090 | <name>Sphere</name> | |
1091 | </spider> | |
1092 | <spider ident="Sphider2"> | |
1093 | <name>Sphider</name> | |
1094 | </spider> | |
1095 | <spider ident="SpiderBot"> | |
1096 | <name>SpiderBot</name> | |
1097 | </spider> | |
1098 | <spider ident="spiderline"> | |
1099 | <name>Spiderline Crawler</name> | |
1100 | </spider> | |
1101 | <spider ident="SpiderMan"> | |
1102 | <name>SpiderMan</name> | |
1103 | </spider> | |
1104 | <spider ident="SpiderView"> | |
1105 | <name>SpiderView(tm)</name> | |
1106 | </spider> | |
1107 | <spider ident="mouse.house"> | |
1108 | <name>spider_monkey</name> | |
1109 | </spider> | |
1110 | <spider ident="suke"> | |
1111 | <name>Suke</name> | |
1112 | </spider> | |
1113 | <spider ident="suntek"> | |
1114 | <name>suntek search engine</name> | |
1115 | </spider> | |
1116 | <spider ident="Szukacz"> | |
1117 | <name>Szukacz</name> | |
1118 | <url>http://www.szukacz.pl/html/RobotEnglishVersion.html</url> | |
1119 | </spider> | |
1120 | <spider ident="T-H-U-N-D-E-R-S-T-O-N-E"> | |
1121 | <name>T-H-U-N-D-E-R-S-T-O-N-E</name> | |
1122 | </spider> | |
f55aa1aa P |
1123 | <spider ident="TinEye Crawler"> |
1124 | <name>TinEye</name> | |
1125 | <url>http://tineye.com/crawler.html</url> | |
1126 | </spider> | |
25ab2d04 MW |
1127 | <spider ident="Black Widow"> |
1128 | <name>TACH Black Widow</name> | |
1129 | </spider> | |
1130 | <spider ident="Tarantula"> | |
1131 | <name>Tarantula</name> | |
1132 | </spider> | |
1133 | <spider ident="tarspider"> | |
1134 | <name>tarspider</name> | |
1135 | </spider> | |
1136 | <spider ident="dlw3robot"> | |
1137 | <name>Tcl W3 Robot</name> | |
1138 | </spider> | |
1139 | <spider ident="TechBOT"> | |
1140 | <name>TechBOT</name> | |
1141 | </spider> | |
1142 | <spider ident="Technoratibot"> | |
1143 | <name>Technorati</name> | |
1144 | <url>http://technorati.com/about/</url> | |
1145 | </spider> | |
1146 | <spider ident="Templeton"> | |
1147 | <name>Templeton</name> | |
1148 | </spider> | |
1149 | <spider ident="teoma"> | |
1150 | <name>Teoma/Ask Jeeves</name> | |
1151 | <url>http://sp.teoma.com/docs/teoma/about/</url> | |
1152 | </spider> | |
1153 | <spider ident="JubiiRobot"> | |
1154 | <name>The Jubii</name> | |
1155 | </spider> | |
1156 | <spider ident="NorthStar"> | |
1157 | <name>The NorthStar Robot</name> | |
1158 | </spider> | |
1159 | <spider ident="w3index"> | |
1160 | <name>The NWI Robot</name> | |
1161 | </spider> | |
1162 | <spider ident="Peregrinator-Mathematics"> | |
1163 | <name>The Peregrinator</name> | |
1164 | </spider> | |
1165 | <spider ident="thumbshots-de-Bot"> | |
1166 | <name>thumbshots-de-Bot</name> | |
1167 | </spider> | |
1168 | <spider ident="TITAN"> | |
1169 | <name>TITAN</name> | |
1170 | </spider> | |
1171 | <spider ident="TitIn"> | |
1172 | <name>TitIn</name> | |
1173 | </spider> | |
1174 | <spider ident="TLSpider"> | |
1175 | <name>TLSpider</name> | |
1176 | </spider> | |
1177 | <spider ident="TMCrawler"> | |
1178 | <name>TMCrawler</name> | |
1179 | </spider> | |
1180 | <spider ident="trendictionbot"> | |
1181 | <name>Trendiction-Bot</name> | |
1182 | <url>http://www.trendiction.com/bot</url> | |
1183 | </spider> | |
1184 | <spider ident="slysearch"> | |
1185 | <name>Turnitin.com</name> | |
1186 | <url>http://www.turnitin.com/static/products_services/search_engines.html</url> | |
1187 | </spider> | |
1188 | <spider ident="TurnitinBot/"> | |
1189 | <name>TurnitinBot</name> | |
1190 | </spider> | |
1191 | <spider ident="TurtleScanner"> | |
1192 | <name>Turtle</name> | |
1193 | <url>http://www.turtle.ru/</url> | |
1194 | </spider> | |
9581146e PM |
1195 | <spider ident="TwengaBot"> |
1196 | <name>Twenga</name> | |
1197 | <url>http://www.twenga.com/bot.html</url> | |
1198 | </spider> | |
25ab2d04 MW |
1199 | <spider ident="Twiceler"> |
1200 | <name>Twiceler</name> | |
1201 | <url>http://www.cuill.com/twiceler/robot.html</url> | |
1202 | </spider> | |
1203 | <spider ident="UCSD-Crawler"> | |
1204 | <name>UCSD Crawl</name> | |
1205 | </spider> | |
1206 | <spider ident="UMBC-memeta-Bot"> | |
1207 | <name>UMBC</name> | |
1208 | </spider> | |
1209 | <spider ident="unisterbot"> | |
1210 | <name>Unister</name> | |
1211 | </spider> | |
1212 | <spider ident="Unpartisan"> | |
1213 | <name>Unpartisan</name> | |
1214 | <url>http://www.unpartisan.com</url> | |
1215 | </spider> | |
1216 | <spider ident="urlck"> | |
1217 | <name>URL Check</name> | |
1218 | </spider> | |
1219 | <spider ident="URL Spider Pro"> | |
1220 | <name>URL Spider Pro</name> | |
1221 | </spider> | |
1222 | <spider ident="Valkyrie"> | |
1223 | <name>Valkyrie</name> | |
1224 | </spider> | |
1225 | <spider ident="Verticrawl"> | |
1226 | <name>Verticrawl</name> | |
1227 | </spider> | |
1228 | <spider ident="Victoria"> | |
1229 | <name>Victoria</name> | |
1230 | </spider> | |
1231 | <spider ident="vision-search"> | |
1232 | <name>vision-search</name> | |
1233 | </spider> | |
1234 | <spider ident="VoilaBot"> | |
1235 | <name>VoilaBot</name> | |
1236 | <url>http://www.voila.com/</url> | |
1237 | </spider> | |
9581146e PM |
1238 | <spider ident="VisBot"> |
1239 | <name>VisBot</name> | |
1240 | <url>http://www.visvo.com/webmasters.html</url> | |
1241 | </spider> | |
25ab2d04 MW |
1242 | <spider ident="Voyager"> |
1243 | <name>Voyager</name> | |
1244 | </spider> | |
1245 | <spider ident="VWbot_K"> | |
1246 | <name>VWbot</name> | |
1247 | </spider> | |
1248 | <spider ident="W3M2"> | |
1249 | <name>W3M2</name> | |
1250 | </spider> | |
1251 | <spider ident="w3mir"> | |
1252 | <name>w3mir</name> | |
1253 | </spider> | |
1254 | <spider ident="w@pSpider"> | |
1255 | <name>w@pSpider</name> | |
1256 | </spider> | |
1257 | <spider ident="appie"> | |
1258 | <name>Walhello appie</name> | |
1259 | <url>http://www.robotstxt.org/wc/active/html/appie.html</url> | |
1260 | </spider> | |
1261 | <spider ident="CrawlPaper"> | |
1262 | <name>WallPaper</name> | |
1263 | </spider> | |
1264 | <spider ident="root"> | |
1265 | <name>Web Core / Roots</name> | |
1266 | </spider> | |
f55aa1aa P |
1267 | <spider ident="WBSearchBot"> |
1268 | <name>Ware Bay</name> | |
1269 | <url>http://www.warebay.com/bot.html</url> | |
1270 | </spider> | |
25ab2d04 MW |
1271 | <spider ident="WebMoose"> |
1272 | <name>Web Moose</name> | |
1273 | </spider> | |
1274 | <spider ident="WebBandit"> | |
1275 | <name>WebBandit</name> | |
1276 | </spider> | |
1277 | <spider ident="WebCatcher"> | |
1278 | <name>WebCatcher</name> | |
1279 | </spider> | |
1280 | <spider ident="Webclipping"> | |
1281 | <name>Webclipping</name> | |
1282 | </spider> | |
1283 | <spider ident="WebCopy"> | |
1284 | <name>WebCopy</name> | |
1285 | </spider> | |
1286 | <spider ident="WebFetcher"> | |
1287 | <name>webfetcher</name> | |
1288 | </spider> | |
1289 | <spider ident="weblayers"> | |
1290 | <name>weblayers</name> | |
1291 | </spider> | |
1292 | <spider ident="WebLinker"> | |
1293 | <name>WebLinker</name> | |
1294 | </spider> | |
1295 | <spider ident="wlm"> | |
1296 | <name>Weblog Monitor</name> | |
1297 | </spider> | |
1298 | <spider ident="WebQuest"> | |
1299 | <name>WebQuest</name> | |
1300 | </spider> | |
1301 | <spider ident="WebReaper"> | |
1302 | <name>WebReaper</name> | |
1303 | </spider> | |
1304 | <spider ident="webs@recruit.co.jp"> | |
1305 | <name>webs</name> | |
1306 | </spider> | |
1307 | <spider ident="websearchbench"> | |
1308 | <name>WebSearchBench</name> | |
1309 | <url>http://websearchbench.cs.uni-dortmund.de/</url> | |
1310 | </spider> | |
1311 | <spider ident="WOLP"> | |
1312 | <name>WebStolperer</name> | |
1313 | </spider> | |
1314 | <spider ident="webvac"> | |
1315 | <name>WebVac</name> | |
1316 | </spider> | |
1317 | <spider ident="webwalk"> | |
1318 | <name>webwalk</name> | |
1319 | </spider> | |
1320 | <spider ident="WebWalker"> | |
1321 | <name>WebWalker</name> | |
1322 | </spider> | |
1323 | <spider ident="WebWatch"> | |
1324 | <name>WebWatch</name> | |
52bb0ca4 | 1325 | </spider> |
6a3fbb36 | 1326 | <spider ident="WebZinger"> |
52bb0ca4 | 1327 | <name>WebZinger</name> |
25ab2d04 MW |
1328 | </spider> |
1329 | <spider ident="whatUseek_winona"> | |
1330 | <name>whatUseek Winona</name> | |
52bb0ca4 | 1331 | </spider> |
6a3fbb36 | 1332 | <spider ident="WhoWhere Robot"> |
52bb0ca4 P |
1333 | <name>WhoWhere Robot</name> |
1334 | <url>http://www.whowhere.com</url> | |
25ab2d04 MW |
1335 | </spider> |
1336 | <spider ident="SurveyBot"> | |
1337 | <name>Whois Source</name> | |
1338 | <url>http://www.whois.sc/info/webmasters/surveybot.html</url> | |
1339 | </spider> | |
1340 | <spider ident="Hazel's Ferret Web hopper"> | |
1341 | <name>Wild Ferret Web Hopper</name> | |
1342 | </spider> | |
1343 | <spider ident="WinHTTP"> | |
1344 | <name>WinHTTP</name> | |
1345 | </spider> | |
1346 | <spider ident="wired-digital-newsbot"> | |
1347 | <name>Wired Digital</name> | |
1348 | </spider> | |
1349 | <spider ident="zyborg"> | |
1350 | <name>WiseNut</name> | |
1351 | </spider> | |
1352 | <spider ident="OmniExplorer_Bot"> | |
1353 | <name>WorldIndexer</name> | |
1354 | <url>http://www.omni-explorer.com</url> | |
1355 | </spider> | |
1356 | <spider ident="WWWC"> | |
1357 | <name>WWWC</name> | |
1358 | </spider> | |
1359 | <spider ident="WWWeasel Robot"> | |
1360 | <name>WWWeasel Robot</name> | |
1361 | </spider> | |
1362 | <spider ident="wwwster"> | |
1363 | <name>wwwster</name> | |
1364 | </spider> | |
1365 | <spider ident="WWWWanderer"> | |
1366 | <name>WWWWanderer</name> | |
1367 | </spider> | |
1368 | <spider ident="TECOMAC-Crawler"> | |
1369 | <name>X-Crawler</name> | |
1370 | </spider> | |
1371 | <spider ident="XGET"> | |
1372 | <name>XGET</name> | |
1373 | </spider> | |
1374 | <spider ident="cosmos"> | |
1375 | <name>XYLEME Robot</name> | |
1376 | </spider> | |
1377 | <spider ident="yacybot"> | |
1378 | <name>YaCy-Bot</name> | |
1379 | <url>http://yacy.net/yacy/bot.html</url> | |
1380 | </spider> | |
1381 | <spider ident="YahooYSMcm"> | |
1382 | <name>Yahoo Publisher Network</name> | |
1383 | <url>http://publisher.yahoo.com/</url> | |
1384 | </spider> | |
1385 | <spider ident="Yahoo-Blogs"> | |
1386 | <name>Yahoo-Blogs</name> | |
1387 | <url>http://help.yahoo.com/help/us/ysearch/crawling/crawling-02.html</url> | |
1388 | </spider> | |
1389 | <spider ident="Yahoo Pipes"> | |
1390 | <name>Yahoo Pipes</name> | |
1391 | </spider> | |
1392 | <spider ident="Yahoo! Slurp"> | |
1393 | <name>Yahoo! Slurp</name> | |
1394 | <url>http://help.yahoo.com/help/us/ysearch/slurp</url> | |
1395 | </spider> | |
1396 | <spider ident="Yahoo-VerticalCrawler"> | |
1397 | <name>Yahoo-VerticalCrawler</name> | |
1398 | </spider> | |
1399 | <spider ident="YahooFeedSeeker"> | |
1400 | <name>YahooFeedSeeker</name> | |
1401 | <url>http://my.yahoo.com/s/publishers.html</url> | |
1402 | </spider> | |
1403 | <spider ident="Yandex"> | |
1404 | <name>Yandex</name> | |
1405 | <url>http://www.yandex.ru/</url> | |
1406 | </spider> | |
1407 | <spider ident="zeus"> | |
1408 | <name>Zeus Internet Marketing</name> | |
1409 | <url>http://www.cyber-robotics.com/</url> | |
1410 | </spider> | |
1411 | <spider ident="http://www.zorkk.com"> | |
1412 | <name>Zork</name> | |
1413 | <url>http://www.zorkk.com</url> | |
1414 | </spider> | |
f55aa1aa P |
1415 | <spider ident="Zookabot"> |
1416 | <name>Zookabot</name> | |
1417 | <url>http://zookabot.com/</url> | |
1418 | </spider> | |
52bb0ca4 | 1419 | </data> |