Commit | Line | Data |
---|---|---|
25ab2d04 MW |
1 | <?xml version="1.0" encoding="UTF-8"?> |
2 | <data xmlns="http://www.woltlab.com" xmlns:xsi="http://www.w3.org/2001/XMLSchema-instance" xsi:schemaLocation="http://www.woltlab.com http://www.woltlab.com/XSD/maelstrom/spiderList.xsd"> | |
3 | <spider ident="ABCdatos"> | |
4 | <name>ABCdatos BotLink</name> | |
5 | <url>http://www.robotstxt.org/wc/active/html/abcdatos.html</url> | |
6 | </spider> | |
7 | <spider ident="abot/"> | |
8 | <name>abot</name> | |
9 | <url>http://www.abot.com/</url> | |
10 | </spider> | |
11 | <spider ident="Accelatech RSSCrawler"> | |
12 | <name>Accelatech</name> | |
13 | </spider> | |
14 | <spider ident="Accoona-AI-Agent"> | |
15 | <name>Accoona</name> | |
16 | <url>http://accoona.com/about/about_accoona.jsp</url> | |
17 | </spider> | |
18 | <spider ident="aconon Index"> | |
19 | <name>aconon Index (raubfische.de)</name> | |
20 | </spider> | |
21 | <spider ident="AcoonBot"> | |
22 | <name>Acoon</name> | |
23 | <url>http://www.acoon.de/robot.asp</url> | |
24 | </spider> | |
25 | <spider ident="Ahoy!"> | |
26 | <name>Ahoy!</name> | |
27 | <url>http://www.robotstxt.org/wc/active/html/ahoythehomepagefinder.html</url> | |
28 | </spider> | |
29 | <spider ident="AhrefsBot"> | |
30 | <name>Ahrefs</name> | |
31 | <url>http://ahrefs.com/robot/</url> | |
32 | </spider> | |
33 | <spider ident="AlkalineBOT"> | |
34 | <name>Alkaline</name> | |
35 | <url>http://www.robotstxt.org/wc/active/html/Alkaline.html</url> | |
36 | </spider> | |
37 | <spider ident="http://www.almaden.ibm.com/cs/crawler"> | |
38 | <name>Almaden Crawler</name> | |
39 | <url>http://www.almaden.ibm.com/cs/crawler/</url> | |
40 | </spider> | |
41 | <spider ident="EMC Spider"> | |
42 | <name>ananzi</name> | |
43 | </spider> | |
44 | <spider ident="Anthill"> | |
45 | <name>Anthill</name> | |
46 | <url>http://www.robotstxt.org/wc/active/html/anthill.html</url> | |
47 | </spider> | |
48 | <spider ident="Aport"> | |
49 | <name>Aport</name> | |
50 | <url>http://www.aport.ru/</url> | |
51 | </spider> | |
52 | <spider ident="AppleSyndication"> | |
53 | <name>Apple</name> | |
54 | </spider> | |
55 | <spider ident="Arachnophilia"> | |
56 | <name>Arachnophilia</name> | |
57 | <url>http://www.robotstxt.org/wc/active/html/arachnophilia.html</url> | |
58 | </spider> | |
59 | <spider ident="Araneo"> | |
60 | <name>Araneo</name> | |
61 | <url>http://www.robotstxt.org/wc/active/html/araneo.html</url> | |
62 | </spider> | |
63 | <spider ident="ArchitextSpider"> | |
64 | <name>ArchitextSpider</name> | |
65 | <url>http://www.robotstxt.org/wc/active/html/architext.html</url> | |
66 | </spider> | |
67 | <spider ident="ia_archiver"> | |
68 | <name>Archive.org</name> | |
69 | <url>http://www.archive.org/about/exclude.php</url> | |
70 | </spider> | |
71 | <spider ident="arks/1.0"> | |
72 | <name>arks</name> | |
73 | <url>http://www.robotstxt.org/wc/active/html/arks.html</url> | |
74 | </spider> | |
75 | <spider ident="ASpider"> | |
76 | <name>ASpider</name> | |
77 | <url>http://www.robotstxt.org/wc/active/html/aspider.html</url> | |
78 | </spider> | |
79 | <spider ident="ATN_Worldwide"> | |
80 | <name>ATN Worldwide</name> | |
81 | <url>http://www.robotstxt.org/wc/active/html/atn.txt.html</url> | |
82 | </spider> | |
83 | <spider ident="Atomz"> | |
84 | <name>Atomz.com</name> | |
85 | <url>http://www.robotstxt.org/wc/active/html/atomz.html</url> | |
86 | </spider> | |
87 | <spider ident="AURESYS"> | |
88 | <name>AURESYS</name> | |
89 | <url>http://www.robotstxt.org/wc/active/html/auresys.html</url> | |
90 | </spider> | |
91 | <spider ident="BackRub"> | |
92 | <name>BackRub</name> | |
93 | <url>http://www.robotstxt.org/wc/active/html/backrub.html</url> | |
94 | </spider> | |
95 | <spider ident="Baiduspider"> | |
96 | <name>Baiduspider</name> | |
97 | <url>http://www.baidu.com/search/spider.htm</url> | |
98 | </spider> | |
99 | <spider ident="bbot"> | |
100 | <name>BBot</name> | |
101 | <url>http://www.robotstxt.org/wc/active/html/bbot.html</url> | |
102 | </spider> | |
103 | <spider ident="BecomeBot"> | |
104 | <name>BecomeBot</name> | |
105 | <url>http://www.become.com/webmasters.html</url> | |
106 | </spider> | |
107 | <spider ident="Big Brother"> | |
108 | <name>Big Brother</name> | |
109 | <url>http://www.robotstxt.org/wc/active/html/bigbrother.html</url> | |
110 | </spider> | |
111 | <spider ident="BigmirSpider"> | |
112 | <name>Bigmir</name> | |
113 | <url>http://www.bigmir.net/</url> | |
114 | </spider> | |
115 | <spider ident="bingbot"> | |
116 | <name>Bing</name> | |
117 | <url>http://www.bing.com/bingbot.htm</url> | |
118 | </spider> | |
119 | <spider ident="Bitacle bot"> | |
120 | <name>Bitacle</name> | |
121 | <url>http://bitacle.org/</url> | |
122 | </spider> | |
123 | <spider ident="Biz360 Spider"> | |
124 | <name>Biz360</name> | |
125 | <url>http://www.biz360.com</url> | |
126 | </spider> | |
127 | <spider ident="Bjaaland"> | |
128 | <name>Bjaaland</name> | |
129 | <url>http://www.robotstxt.org/wc/active/html/bjaaland.html</url> | |
130 | </spider> | |
131 | <spider ident="BlackWidow"> | |
132 | <name>BlackWidow</name> | |
133 | <url>http://www.robotstxt.org/wc/active/html/blackwidow.html</url> | |
134 | </spider> | |
b730b757 MW |
135 | <spider ident="BLEXBot"> |
136 | <name>BLEXBot</name> | |
137 | <url>http://webmeup.com/crawler.html</url> | |
138 | </spider> | |
25ab2d04 MW |
139 | <spider ident="BlogCrawler by Xango"> |
140 | <name>BlogCrawler</name> | |
141 | </spider> | |
142 | <spider ident="blogdb"> | |
143 | <name>BlogDb</name> | |
144 | <url>http://blogdb.jp</url> | |
145 | </spider> | |
146 | <spider ident="blog search engine by BlogFan.ORG"> | |
147 | <name>BlogFan</name> | |
148 | <url>http://www.blogfan.org</url> | |
149 | </spider> | |
150 | <spider ident="Bloglines"> | |
151 | <name>Bloglines</name> | |
152 | <url>http://www.bloglines.com</url> | |
153 | </spider> | |
154 | <spider ident="BlogPulse (ISSpider-3.0)"> | |
155 | <name>BlogPulse</name> | |
156 | </spider> | |
157 | <spider ident="BlogSearch"> | |
158 | <name>BlogSearch</name> | |
159 | <url>http://www.icerocket.com</url> | |
160 | </spider> | |
161 | <spider ident="BlogsNowBot"> | |
162 | <name>BlogsNow</name> | |
163 | <url>http://www.blogsnow.com/</url> | |
164 | </spider> | |
165 | <spider ident="BlogStreetBot"> | |
166 | <name>BlogStreetBot</name> | |
167 | <url>http://www.blogstreet.com/</url> | |
168 | </spider> | |
169 | <spider ident="Bulkfeeds"> | |
170 | <name>Bulkfeeds</name> | |
171 | <url>http://bulkfeeds.net</url> | |
172 | </spider> | |
173 | <spider ident="BoardPulse"> | |
174 | <name>BoardPulse</name> | |
175 | <url>http://www.boardpulse.com/</url> | |
176 | </spider> | |
177 | <spider ident="BoardReader"> | |
178 | <name>BoardReader</name> | |
179 | <url>http://www.boardreader.com/aboutus.asp</url> | |
180 | </spider> | |
181 | <spider ident="BoardViewer"> | |
182 | <name>BoardViewer</name> | |
183 | <url>http://www.boardviewer.com/</url> | |
184 | </spider> | |
185 | <spider ident="boitho.com-robot"> | |
186 | <name>Boitho</name> | |
187 | <url>http://www.boitho.com/bot.html</url> | |
188 | </spider> | |
189 | <spider ident="borg-bot"> | |
190 | <name>Borg-Bot</name> | |
191 | <url>http://www.robotstxt.org/wc/active/html/borg-bot.html</url> | |
192 | </spider> | |
193 | <spider ident="BSpider"> | |
194 | <name>BSpider</name> | |
195 | <url>http://www.robotstxt.org/wc/active/html/bspider.html</url> | |
196 | </spider> | |
197 | <spider ident="CACTVS Chemistry Spider"> | |
198 | <name>CACTVS Chemistry</name> | |
199 | </spider> | |
200 | <spider ident="Calif"> | |
201 | <name>Calif</name> | |
202 | </spider> | |
203 | <spider ident="CaRP/3.6Evolution"> | |
204 | <name>CaRP</name> | |
205 | <url>http://www.biz360.com</url> | |
206 | </spider> | |
207 | <spider ident="Checkbot"> | |
208 | <name>Checkbot</name> | |
209 | </spider> | |
210 | <spider ident="ChristCrawler.com"> | |
211 | <name>ChristCrawler.com</name> | |
212 | </spider> | |
213 | <spider ident="www.cienciaficcion.net"> | |
214 | <name>cIeNcIaFiCcIoN.nEt</name> | |
215 | </spider> | |
216 | <spider ident="CipinetBot"> | |
217 | <name>Cipinet</name> | |
218 | <url>http://www.cipinet.com/bot.html</url> | |
219 | </spider> | |
220 | <spider ident="CJNetworkQuality"> | |
221 | <name>CJNetworkQuality</name> | |
222 | <url>http://www.cj.com/networkquality/</url> | |
223 | </spider> | |
224 | <spider ident="CMC/0.01"> | |
225 | <name>CMC/0.01</name> | |
226 | </spider> | |
227 | <spider ident="ColdFusion"> | |
228 | <name>ColdFusion</name> | |
229 | </spider> | |
230 | <spider ident="combine"> | |
231 | <name>Combine System</name> | |
232 | </spider> | |
233 | <spider ident="Crawler (cometsearch@cometsystems.com)"> | |
234 | <name>cometsystems.com</name> | |
235 | </spider> | |
236 | <spider ident="ComputingSite Robi/1.0"> | |
237 | <name>ComputingSite Robi/1.0</name> | |
238 | </spider> | |
239 | <spider ident="conceptbot"> | |
240 | <name>Conceptbot</name> | |
241 | </spider> | |
242 | <spider ident="Cooby.de Crawler"> | |
243 | <name>Cooby.de Crawler</name> | |
244 | </spider> | |
245 | <spider ident="CoolBot"> | |
246 | <name>CoolBot</name> | |
247 | </spider> | |
248 | <spider ident="Cusco"> | |
249 | <name>Cusco</name> | |
250 | </spider> | |
251 | <spider ident="CyberSpyder"> | |
252 | <name>CyberSpyder</name> | |
253 | </spider> | |
254 | <spider ident="daypopbot"> | |
255 | <name>daypop</name> | |
256 | </spider> | |
257 | <spider ident="DesertRealm.com"> | |
258 | <name>Desert Realm</name> | |
259 | </spider> | |
260 | <spider ident="Deweb"> | |
261 | <name>DeWeb(c)</name> | |
262 | </spider> | |
263 | <spider ident="Die Blinde Kuh"> | |
264 | <name>Die Blinde Kuh</name> | |
265 | <url>http://www.robotstxt.org/wc/active/html/blindekuh.html</url> | |
266 | </spider> | |
267 | <spider ident="dienstspider"> | |
268 | <name>DienstSpider</name> | |
269 | </spider> | |
270 | <spider ident="Digger/1.0 JDK/1.3.0"> | |
271 | <name>Digger</name> | |
272 | </spider> | |
273 | <spider ident="Digimarc WebReader"> | |
274 | <name>Digimarc MarcSpider</name> | |
275 | </spider> | |
276 | <spider ident="Digimarc CGIReader"> | |
277 | <name>Digimarc Marcspider/CGI</name> | |
278 | </spider> | |
279 | <spider ident="DIIbot"> | |
280 | <name>Digital Integrity Robot</name> | |
281 | </spider> | |
282 | <spider ident="grabber"> | |
283 | <name>Direct Hit Grabber</name> | |
284 | </spider> | |
285 | <spider ident="discobot"> | |
286 | <name>Discovery</name> | |
287 | <url>http://discoveryengine.com/discobot.html</url> | |
288 | </spider> | |
289 | <spider ident="DNAbot/1.0"> | |
290 | <name>DNAbot</name> | |
291 | </spider> | |
292 | <spider ident="DragonBot/1.0 libwww/5.0"> | |
293 | <name>DragonBot</name> | |
294 | </spider> | |
295 | <spider ident="DWCP/2.0"> | |
296 | <name>DWCP (Dridus' Web Cataloging Project)</name> | |
297 | </spider> | |
298 | <spider ident="e-SocietyRobot"> | |
299 | <name>e-Society</name> | |
300 | <url>http://www.yama.info.waseda.ac.jp/~yamana/es/index_eng.htm</url> | |
301 | </spider> | |
302 | <spider ident="exactseek-pagereaper"> | |
303 | <name>exactseek-pagereaper</name> | |
304 | </spider> | |
305 | <spider ident="EbiNess/0.01a"> | |
306 | <name>EbiNess</name> | |
307 | </spider> | |
308 | <spider ident="edgeio-retriever"> | |
309 | <name>Edgeio</name> | |
310 | <url>http://www.edgeio.com</url> | |
311 | </spider> | |
312 | <spider ident="EIT-Link-Verifier-Robot/0.2"> | |
313 | <name>EIT Link Verifier Robot</name> | |
314 | </spider> | |
315 | <spider ident="elfinbot"> | |
316 | <name>ELFINBOT</name> | |
317 | </spider> | |
318 | <spider ident="Emacs-w3/v[0-9\.]+"> | |
319 | <name>Emacs-w3 Search Engine</name> | |
320 | </spider> | |
321 | <spider ident="esther"> | |
322 | <name>Esther</name> | |
323 | </spider> | |
324 | <spider ident="EuripBot/"> | |
325 | <name>EuripBot</name> | |
326 | </spider> | |
327 | <spider ident="Evliya Celebi"> | |
328 | <name>Evliya Celebi</name> | |
329 | </spider> | |
330 | <spider ident="ExactSeek_Spider"> | |
331 | <name>ExactSeek_Spider</name> | |
332 | <url>http://www.askjeevs.com</url> | |
333 | </spider> | |
334 | <spider ident="NG/2.0"> | |
335 | <name>ExaLead</name> | |
336 | <url>http://botspotter.net/bs-389.html</url> | |
337 | </spider> | |
338 | <spider ident="ExaBot"> | |
339 | <name>ExaLead Beta</name> | |
340 | <url>http://beta.exalead.com/search/C=0/2p=Help.7</url> | |
341 | </spider> | |
342 | <spider ident="facebookexternalhit"> | |
343 | <name>Facebook</name> | |
344 | <url>http://www.facebook.com/externalhit_uatext.php</url> | |
345 | </spider> | |
346 | <spider ident="fast-webcrawler"> | |
347 | <name>FAST / AlltheWeb</name> | |
348 | <url>http://help.yahoo.com/help/us/ysearch/slurp/index.html</url> | |
349 | </spider> | |
350 | <spider ident="FastCrawler"> | |
351 | <name>FastCrawler</name> | |
352 | </spider> | |
353 | <spider ident="Feed24.com"> | |
354 | <name>Feed24</name> | |
355 | <url>http://www.feed24.com</url> | |
356 | </spider> | |
357 | <spider ident="FeedBlitz"> | |
358 | <name>FeedBlitz</name> | |
359 | <url>http://www.feedblitz.com</url> | |
360 | </spider> | |
361 | <spider ident="FeedBurner"> | |
362 | <name>FeedBurner</name> | |
363 | <url>http://www.FeedBurner.com</url> | |
364 | </spider> | |
365 | <spider ident="Feedfetcher-Google"> | |
366 | <name>FeedFetcher-Google</name> | |
367 | <url>http://www.google.com/feedfetcher.html</url> | |
368 | </spider> | |
369 | <spider ident="UniversalFeedParser"> | |
370 | <name>FeedParser</name> | |
371 | <url>http://www.feedparser.org</url> | |
372 | </spider> | |
373 | <spider ident="Feedster Crawler"> | |
374 | <name>Feedster</name> | |
375 | <url>http://www.feedstermedia.com/</url> | |
376 | </spider> | |
377 | <spider ident="FEHLSTART Superspider"> | |
378 | <name>FEHLSTART</name> | |
379 | </spider> | |
380 | <spider ident="FelixIDE"> | |
381 | <name>Felix IDE</name> | |
382 | </spider> | |
383 | <spider ident="ESIRover"> | |
384 | <name>FetchRover</name> | |
385 | </spider> | |
386 | <spider ident="fido"> | |
387 | <name>fido</name> | |
388 | </spider> | |
389 | <spider ident="findlinks"> | |
390 | <name>FindLinks</name> | |
391 | <url>http://wortschatz.uni-leipzig.de/findlinks/</url> | |
392 | </spider> | |
393 | <spider ident="FindoryBot"> | |
394 | <name>Findory</name> | |
395 | <url>http://www.findory.com</url> | |
396 | </spider> | |
397 | <spider ident="Fish-Search-Robot"> | |
398 | <name>Fish search</name> | |
399 | </spider> | |
400 | <spider ident="Mozilla/4.0 (compatible: FDSE robot)"> | |
401 | <name>Fluid Dynamics</name> | |
402 | </spider> | |
403 | <spider ident="fouineur.9bit.qc.ca"> | |
404 | <name>Fouineur</name> | |
405 | </spider> | |
406 | <spider ident="Freecrawl"> | |
407 | <name>Freecrawl</name> | |
408 | </spider> | |
409 | <spider ident="FunnelWeb"> | |
410 | <name>FunnelWeb</name> | |
411 | </spider> | |
412 | <spider ident="GaisBot"> | |
413 | <name>Gais</name> | |
414 | <url>http://gais.cs.ccu.edu.tw/robot.php</url> | |
415 | </spider> | |
416 | <spider ident="gamekitbot"> | |
417 | <name>GAMEKIT</name> | |
418 | <url>http://www.uchoose.de/crawler/gamekitbot/</url> | |
419 | </spider> | |
420 | <spider ident="gammaSpider"> | |
421 | <name>gammaSpider</name> | |
422 | </spider> | |
423 | <spider ident="gazz"> | |
424 | <name>gazz</name> | |
425 | </spider> | |
426 | <spider ident="gcreep"> | |
427 | <name>GCreep</name> | |
428 | </spider> | |
429 | <spider ident="genieBot"> | |
430 | <name>genieBot</name> | |
431 | <url>http://64.5.245.11/faq/faq.html</url> | |
432 | </spider> | |
433 | <spider ident="geourl"> | |
434 | <name>GeoURL</name> | |
435 | <url>http://geourl.org/bot.html</url> | |
436 | </spider> | |
437 | <spider ident="GetterroboPlus"> | |
438 | <name>GetterroboPlus Puu</name> | |
439 | </spider> | |
440 | <spider ident="GetURL.rexx"> | |
441 | <name>GetURL</name> | |
442 | </spider> | |
443 | <spider ident="Gigabot"> | |
444 | <name>Gigabot</name> | |
445 | <url>http://www.gigablast.com/spider.html</url> | |
446 | </spider> | |
447 | <spider ident="Girafabot"> | |
448 | <name>Girafabot</name> | |
449 | <url>http://www.girafa.com/</url> | |
450 | </spider> | |
451 | <spider ident="Goku"> | |
452 | <name>Goku</name> | |
453 | <url>http://goku.ru/bot.htm</url> | |
454 | </spider> | |
455 | <spider ident="Golem"> | |
456 | <name>Golem</name> | |
457 | </spider> | |
458 | <spider ident="gonzo"> | |
459 | <name>Gonzo</name> | |
460 | </spider> | |
461 | <spider ident="Googlebot/"> | |
462 | <name>Google</name> | |
463 | <url>http://www.google.com/bot.html</url> | |
464 | </spider> | |
465 | <spider ident="Mediapartners-Google"> | |
466 | <name>Google AdSense</name> | |
467 | <url>https://www.google.com/adsense/faq</url> | |
468 | </spider> | |
469 | <spider ident="Googlebot-Image"> | |
470 | <name>Googlebot-Image</name> | |
471 | <url>http://www.googlebot.com/bot.html</url> | |
472 | </spider> | |
473 | <spider ident="Googlebot-Mobile"> | |
474 | <name>Googlebot-Mobile</name> | |
475 | <url>http://www.google.com/bot.html</url> | |
476 | </spider> | |
477 | <spider ident="Gpostbot"> | |
478 | <name>Gpostbot</name> | |
479 | <url>http://www.gpost.info/help.php?c=bot</url> | |
480 | </spider> | |
481 | <spider ident="griffon"> | |
482 | <name>Griffon</name> | |
483 | </spider> | |
484 | <spider ident="Gromit"> | |
485 | <name>Gromit</name> | |
486 | </spider> | |
487 | <spider ident="http://grub.org"> | |
488 | <name>Grub Client</name> | |
489 | </spider> | |
490 | <spider ident="Gulper Web Bot"> | |
491 | <name>Gulper Bot</name> | |
492 | </spider> | |
493 | <spider ident="havIndex"> | |
494 | <name>havIndex</name> | |
495 | </spider> | |
496 | <spider ident="HeinrichderMiragoRobot"> | |
497 | <name>HeinrichderMiragoRobot</name> | |
498 | </spider> | |
499 | <spider ident="HenryTheMiragoRobot"> | |
500 | <name>HenryTheMiragoRobot</name> | |
501 | </spider> | |
502 | <spider ident="heritrix"> | |
503 | <name>Heritrix</name> | |
504 | <url>http://www.worio.com</url> | |
505 | </spider> | |
506 | <spider ident="HKU WWW Robot"> | |
507 | <name>HKU WWW Octopus</name> | |
508 | </spider> | |
509 | <spider ident="HolyCowDude"> | |
510 | <name>HolyCowDude</name> | |
511 | <url>http://www.holycowdude.com/spider.htm</url> | |
512 | </spider> | |
513 | <spider ident="Hometown"> | |
514 | <name>Hometown</name> | |
515 | </spider> | |
516 | <spider ident="htdig"> | |
517 | <name>ht://Dig</name> | |
518 | </spider> | |
519 | <spider ident="AITCSRobot"> | |
520 | <name>HTML Index</name> | |
521 | </spider> | |
522 | <spider ident="HTMLgobble"> | |
523 | <name>HTMLgobble</name> | |
524 | </spider> | |
525 | <spider ident="I Robot"> | |
526 | <name>I, Robot</name> | |
527 | </spider> | |
528 | <spider ident="iajaBot"> | |
529 | <name>iajaBot</name> | |
530 | </spider> | |
531 | <spider ident="IBM_Planetwide"> | |
532 | <name>IBM_Planetwide</name> | |
533 | </spider> | |
534 | <spider ident="+http://www.icerocket.com/"> | |
535 | <name>IceRocket</name> | |
536 | <url>http://www.icerocket.com/</url> | |
537 | </spider> | |
538 | <spider ident="ichiro"> | |
539 | <name>ichiro</name> | |
540 | </spider> | |
541 | <spider ident="IlTrovatore-Setaccio"> | |
542 | <name>IlTrovatore-Setaccio</name> | |
543 | <url>http://www.iltrovatore.it/aiuto/faq.html</url> | |
544 | </spider> | |
545 | <spider ident="image.kapsi.net"> | |
546 | <name>image.kapsi.net</name> | |
547 | </spider> | |
548 | <spider ident="Mozilla 3.01 PBWF (Win95)"> | |
549 | <name>Imagelock</name> | |
550 | </spider> | |
551 | <spider ident="IncyWincy"> | |
552 | <name>IncyWincy</name> | |
553 | </spider> | |
554 | <spider ident="Informant"> | |
555 | <name>Informant</name> | |
556 | </spider> | |
557 | <spider ident="InfoSeek Robot"> | |
558 | <name>InfoSeek Robot 1.0</name> | |
559 | </spider> | |
560 | <spider ident="Infoseek Sidewinder"> | |
561 | <name>Infoseek Sidewinder</name> | |
562 | </spider> | |
563 | <spider ident="InfoSpiders"> | |
564 | <name>InfoSpiders</name> | |
565 | </spider> | |
566 | <spider ident="INGRID"> | |
567 | <name>Ingrid</name> | |
568 | </spider> | |
569 | <spider ident="slurp@inktomi"> | |
570 | <name>Inktomi</name> | |
571 | </spider> | |
572 | <spider ident="Insitor"> | |
573 | <name>Insitor</name> | |
574 | <url>http://www.insitor.de/</url> | |
575 | </spider> | |
576 | <spider ident="inspectorwww"> | |
577 | <name>Inspector Web</name> | |
578 | </spider> | |
579 | <spider ident="IAGENT"> | |
580 | <name>IntelliAgent</name> | |
581 | </spider> | |
582 | <spider ident="Intelliseek"> | |
583 | <name>Intelliseek</name> | |
584 | <url>http://www.intelliseek.com/</url> | |
585 | </spider> | |
586 | <spider ident="Internet Cruiser Robot"> | |
587 | <name>Internet Cruiser</name> | |
588 | </spider> | |
589 | <spider ident="internetseer"> | |
590 | <name>Internet Seer</name> | |
591 | </spider> | |
592 | <spider ident="sharp-info-agent"> | |
593 | <name>Internet Shinchakubin</name> | |
594 | </spider> | |
595 | <spider ident="InternetLinkAgent"> | |
596 | <name>InternetLinkAgent</name> | |
597 | </spider> | |
598 | <spider ident="IRLbot"> | |
599 | <name>IRL Crawler</name> | |
600 | <url>http://irl.cs.tamu.edu/crawler</url> | |
601 | </spider> | |
602 | <spider ident="Iron33"> | |
603 | <name>Iron33</name> | |
604 | </spider> | |
605 | <spider ident="IsraeliSearch"> | |
606 | <name>Israeli-search</name> | |
607 | </spider> | |
608 | <spider ident="itchBot"> | |
609 | <name>itch</name> | |
610 | <url>http://www.itch.com/infoforwebmasters.html</url> | |
611 | </spider> | |
612 | <spider ident="JavaBee"> | |
613 | <name>JavaBee</name> | |
614 | </spider> | |
615 | <spider ident="JBot"> | |
616 | <name>JBot</name> | |
617 | </spider> | |
618 | <spider ident="JCrawler"> | |
619 | <name>JCrawler</name> | |
620 | </spider> | |
621 | <spider ident="JetBot"> | |
622 | <name>JetEye</name> | |
623 | <url>http://www.jeteye.com/jetbot.html</url> | |
624 | </spider> | |
625 | <spider ident="JoBo"> | |
626 | <name>JoBo</name> | |
627 | </spider> | |
628 | <spider ident="Jobot"> | |
629 | <name>Jobot</name> | |
630 | </spider> | |
631 | <spider ident="jobs.de"> | |
632 | <name>Jobs.de</name> | |
633 | <url>http://www.jobs.de/</url> | |
634 | </spider> | |
635 | <spider ident="JoeBot"> | |
636 | <name>JoeBot</name> | |
637 | </spider> | |
638 | <spider ident="jumpstation"> | |
639 | <name>JumpStation</name> | |
640 | </spider> | |
641 | <spider ident="Katipo"> | |
642 | <name>Katipo</name> | |
643 | </spider> | |
644 | <spider ident="KDD-Explorer"> | |
645 | <name>KDD-Explorer</name> | |
646 | </spider> | |
647 | <spider ident="KIT-Fireball"> | |
648 | <name>KIT-Fireball</name> | |
649 | </spider> | |
650 | <spider ident="KO_Yappo_Robot"> | |
651 | <name>KO_Yappo_Robot</name> | |
652 | </spider> | |
653 | <spider ident="LabelGrab"> | |
654 | <name>LabelGrabber</name> | |
655 | </spider> | |
656 | <spider ident="larbin"> | |
657 | <name>larbin</name> | |
658 | </spider> | |
659 | <spider ident="legs"> | |
660 | <name>legs</name> | |
661 | </spider> | |
662 | <spider ident="LinkScan Server"> | |
663 | <name>LinkScan</name> | |
664 | </spider> | |
665 | <spider ident="LinkWalker"> | |
666 | <name>LinkWalker</name> | |
667 | </spider> | |
668 | <spider ident="livedoorCheckers/"> | |
669 | <name>livedoorCheckers</name> | |
670 | </spider> | |
671 | <spider ident="Lockon"> | |
672 | <name>Lockon</name> | |
673 | </spider> | |
674 | <spider ident="logo.gif crawler"> | |
675 | <name>logo.gif</name> | |
676 | </spider> | |
677 | <spider ident="Lycos"> | |
678 | <name>Lycos</name> | |
679 | </spider> | |
680 | <spider ident="Magpie"> | |
681 | <name>Magpie</name> | |
682 | </spider> | |
683 | <spider ident="MJ12bot"> | |
684 | <name>Majestics MJ12bot</name> | |
685 | </spider> | |
686 | <spider ident="Mammoth"> | |
687 | <name>Mammoth</name> | |
688 | <url>http://www.sli-systems.com</url> | |
689 | </spider> | |
690 | <spider ident="Marvin"> | |
691 | <name>Marvin</name> | |
692 | </spider> | |
693 | <spider ident="marvin/infoseek"> | |
694 | <name>marvin/infoseek</name> | |
695 | </spider> | |
696 | <spider ident="M/3.8"> | |
697 | <name>Mattie</name> | |
698 | </spider> | |
699 | <spider ident="MediaFox"> | |
700 | <name>MediaFox</name> | |
701 | </spider> | |
702 | <spider ident="mercator"> | |
703 | <name>Mercator</name> | |
704 | <url>http://research.compaq.com/SRC/mercator/</url> | |
705 | </spider> | |
706 | <spider ident="MerzScope"> | |
707 | <name>MerzScope</name> | |
708 | </spider> | |
709 | <spider ident="METASpider"> | |
710 | <name>META</name> | |
711 | <url>http://www.meta.com.ua/</url> | |
712 | </spider> | |
713 | <spider ident="MetaGer-LinkChecker"> | |
714 | <name>MetaGer</name> | |
715 | </spider> | |
716 | <spider ident="MindCrawler"> | |
717 | <name>MindCrawler</name> | |
718 | </spider> | |
719 | <spider ident="Miva"> | |
720 | <name>Miva</name> | |
721 | </spider> | |
722 | <spider ident="UdmSearch"> | |
723 | <name>mnoGoSearch</name> | |
724 | </spider> | |
725 | <spider ident="moget"> | |
726 | <name>moget</name> | |
727 | </spider> | |
728 | <spider ident="MOMspider"> | |
729 | <name>MOMspider</name> | |
730 | </spider> | |
731 | <spider ident="Monster"> | |
732 | <name>Monster</name> | |
733 | </spider> | |
734 | <spider ident="Moreoverbot"> | |
735 | <name>Moreover</name> | |
736 | <url>http://www.moreover.com</url> | |
737 | </spider> | |
738 | <spider ident="msnbot"> | |
739 | <name>MSNBot</name> | |
740 | <url>http://search.msn.com/msnbot.htm</url> | |
741 | </spider> | |
742 | <spider ident="MSRBOT"> | |
743 | <name>MSRBOT</name> | |
744 | <url>http://research.microsoft.com/research/sv/msrbot/</url> | |
745 | </spider> | |
746 | <spider ident="MuscatFerret"> | |
747 | <name>Muscat Ferret</name> | |
748 | </spider> | |
749 | <spider ident="MwdSearch"> | |
750 | <name>Mwd.Search</name> | |
751 | </spider> | |
752 | <spider ident="NPBot"> | |
753 | <name>NameProtect</name> | |
754 | </spider> | |
755 | <spider ident="NaverBot"> | |
756 | <name>NaverBot</name> | |
757 | <url>http://www.spidermatic.com/en/robot-spider/20</url> | |
758 | </spider> | |
759 | <spider ident="NEC-MeshExplorer"> | |
760 | <name>NEC-MeshExplorer</name> | |
761 | </spider> | |
762 | <spider ident="Nederland.zoek"> | |
763 | <name>Nederland.zoek</name> | |
764 | </spider> | |
765 | <spider ident="NetCarta CyberPilot Pro"> | |
766 | <name>NetCarta WebMap</name> | |
767 | </spider> | |
768 | <spider ident="Netcraft"> | |
769 | <name>Netcraft Web Server Survey</name> | |
770 | <url>http://news.netcraft.com/</url> | |
771 | </spider> | |
772 | <spider ident="NetMechanic"> | |
773 | <name>NetMechanic</name> | |
774 | </spider> | |
775 | <spider ident="NetScoop"> | |
776 | <name>NetScoop</name> | |
777 | </spider> | |
778 | <spider ident="newscan-online"> | |
779 | <name>newscan-online</name> | |
780 | </spider> | |
781 | <spider ident="NextGenSearchBot 1"> | |
782 | <name>NextGenSearchBot</name> | |
783 | <url>http://www.zoominfo.com/NextGenSearchBot</url> | |
784 | </spider> | |
785 | <spider ident="NHSEWalker"> | |
786 | <name>NHSE Web Forager</name> | |
787 | </spider> | |
788 | <spider ident="NIF"> | |
789 | <name>NIF</name> | |
790 | <url>http://www.newsisfree.com/robot.php</url> | |
791 | </spider> | |
792 | <spider ident="NimbleCrawler"> | |
793 | <name>NimbleCrawler</name> | |
794 | <url>http://www.healthline.com/aboutus.jsp</url> | |
795 | </spider> | |
796 | <spider ident="Nomad"> | |
797 | <name>Nomad</name> | |
798 | </spider> | |
799 | <spider ident="Norbert the Spider"> | |
800 | <name>Norbert</name> | |
801 | <url>http://www.Burf.com</url> | |
802 | </spider> | |
803 | <spider ident="Gulliver"> | |
804 | <name>Northern Light</name> | |
805 | </spider> | |
806 | <spider ident="explorersearch"> | |
807 | <name>nzexplorer</name> | |
808 | </spider> | |
809 | <spider ident="Occam"> | |
810 | <name>Occam</name> | |
811 | </spider> | |
812 | <spider ident="Ocelli"> | |
813 | <name>Ocelli</name> | |
814 | <url>http://www.globalspec.com/Ocelli</url> | |
815 | </spider> | |
816 | <spider ident="Online24-Bot"> | |
817 | <name>Online24-Bot</name> | |
818 | </spider> | |
819 | <spider ident="Openbot"> | |
820 | <name>Openbot</name> | |
821 | <url>http://www.openfind.com.tw/robot.html</url> | |
822 | </spider> | |
823 | <spider ident="Openfind"> | |
824 | <name>Openfind data gatherer</name> | |
825 | </spider> | |
826 | <spider ident="Orbsearch"> | |
827 | <name>Orb Search</name> | |
828 | </spider> | |
829 | <spider ident="PackRat"> | |
830 | <name>Pack Rat</name> | |
831 | </spider> | |
832 | <spider ident="PageBoy"> | |
833 | <name>PageBoy</name> | |
834 | </spider> | |
835 | <spider ident="ParaSite"> | |
836 | <name>ParaSite</name> | |
837 | </spider> | |
838 | <spider ident="Patric"> | |
839 | <name>Patric</name> | |
840 | </spider> | |
841 | <spider ident="PEGASUS"> | |
842 | <name>pegasus</name> | |
843 | </spider> | |
844 | <spider ident="PerlCrawler/1.0 Xavatoria/2.0"> | |
845 | <name>PerlCrawler 1.0</name> | |
846 | </spider> | |
847 | <spider ident="PGP-KA"> | |
848 | <name>PGP Key Agent</name> | |
849 | </spider> | |
850 | <spider ident="Duppies"> | |
851 | <name>Phantom</name> | |
852 | </spider> | |
853 | <spider ident="phpdig"> | |
854 | <name>PhpDig</name> | |
855 | </spider> | |
856 | <spider ident="PiltdownMan"> | |
857 | <name>PiltdownMan</name> | |
858 | </spider> | |
859 | <spider ident="Pimptrain's robot"> | |
860 | <name>Pimptrain.com's</name> | |
861 | </spider> | |
862 | <spider ident="pingalink"> | |
863 | <name>PingALink</name> | |
864 | </spider> | |
865 | <spider ident="Pioneer"> | |
866 | <name>Pioneer</name> | |
867 | </spider> | |
868 | <spider ident="PluckFeedCrawler"> | |
869 | <name>Pluck</name> | |
870 | <url>http://www.pluck.com</url> | |
871 | </spider> | |
872 | <spider ident="PlumtreeWebAccessor"> | |
873 | <name>PlumtreeWebAccessor</name> | |
874 | </spider> | |
875 | <spider ident="PodNova"> | |
876 | <name>PodNova</name> | |
877 | <url>http://www.podnova.com</url> | |
878 | </spider> | |
879 | <spider ident="Pompos"> | |
880 | <name>Pompos</name> | |
881 | <url>http://dir.com/pompos.html</url> | |
882 | </spider> | |
883 | <spider ident="Poppi"> | |
884 | <name>Poppi</name> | |
885 | </spider> | |
886 | <spider ident="gestaltIconoclast"> | |
887 | <name>Popular Iconoclast</name> | |
888 | </spider> | |
889 | <spider ident="PortalJuice.com"> | |
890 | <name>Portal Juice</name> | |
891 | </spider> | |
892 | <spider ident="PortalBSpider"> | |
893 | <name>PortalB Spider</name> | |
894 | </spider> | |
895 | <spider ident="www.kolinka.com"> | |
896 | <name>Project Kolinka Forum Search</name> | |
897 | <url>http://www.kolinka.com/</url> | |
898 | </spider> | |
899 | <spider ident="psbot"> | |
900 | <name>psbot</name> | |
901 | </spider> | |
902 | <spider ident="Qango.com Web Directory"> | |
903 | <name>Qango</name> | |
904 | <url>http://www.qango.com</url> | |
905 | </spider> | |
906 | <spider ident="StackRambler"> | |
907 | <name>Rambler</name> | |
908 | <url>http://www.rambler.ru/</url> | |
909 | </spider> | |
910 | <spider ident="Raven"> | |
911 | <name>Raven Search</name> | |
912 | </spider> | |
913 | <spider ident="Resume Robot"> | |
914 | <name>Resume Robot</name> | |
915 | </spider> | |
916 | <spider ident="Road Runner: ImageScape Robot"> | |
917 | <name>Road Runner: The ImageScape Robot</name> | |
918 | </spider> | |
919 | <spider ident="RHCS"> | |
920 | <name>RoadHouse Crawling System</name> | |
921 | </spider> | |
922 | <spider ident="Robbie"> | |
923 | <name>Robbie the Robot</name> | |
924 | </spider> | |
925 | <spider ident="RoboCrawl"> | |
926 | <name>RoboCrawl</name> | |
927 | </spider> | |
928 | <spider ident="Robofox"> | |
929 | <name>RoboFox</name> | |
930 | </spider> | |
931 | <spider ident="Robot du CRIM 1.0a"> | |
932 | <name>Robot Francoroute</name> | |
933 | </spider> | |
934 | <spider ident="Robozilla"> | |
935 | <name>Robozilla</name> | |
936 | </spider> | |
937 | <spider ident="Roverbot"> | |
938 | <name>Roverbot</name> | |
939 | </spider> | |
940 | <spider ident="RSS-SPIDER"> | |
941 | <name>RSS Feed Seeker</name> | |
942 | <url>http://www.rss-spider.com/fsb.php</url> | |
943 | </spider> | |
944 | <spider ident="RuLeS"> | |
945 | <name>RuLeS</name> | |
946 | </spider> | |
947 | <spider ident="SafetyNet Robot"> | |
948 | <name>SafetyNet</name> | |
949 | </spider> | |
950 | <spider ident="SBIder"> | |
951 | <name>SBIder.</name> | |
952 | <url>http://www.sitesell.com/sbider.html</url> | |
953 | </spider> | |
954 | <spider ident="Scharia"> | |
955 | <name>Scharia</name> | |
956 | </spider> | |
957 | <spider ident="Science-Index"> | |
958 | <name>Science-Index</name> | |
959 | </spider> | |
960 | <spider ident="Scooter"> | |
961 | <name>Scooter</name> | |
962 | </spider> | |
963 | <spider ident="SearchNZ"> | |
964 | <name>SearchNZ</name> | |
965 | <url>http://www.searchnz.co.nz/</url> | |
966 | </spider> | |
967 | <spider ident="searchprocess"> | |
968 | <name>SearchProcess</name> | |
969 | </spider> | |
970 | <spider ident="SearchmetricsBot"> | |
971 | <name>SearchmetricsBot</name> | |
972 | <url>http://www.searchmetrics.com/en/searchmetrics-bot/</url> | |
973 | </spider> | |
974 | <spider ident="Seekbot"> | |
975 | <name>Seekbot</name> | |
976 | <url>http://www.seekbot.net/bot.html</url> | |
977 | </spider> | |
978 | <spider ident="Senrigan"> | |
979 | <name>Senrigan</name> | |
980 | </spider> | |
981 | <spider ident="Sensis Web Crawler"> | |
982 | <name>Sensis Web Crawler</name> | |
983 | <url>http://www.sensis.com.au/help.do</url> | |
984 | </spider> | |
985 | <spider ident="SG-Scout"> | |
986 | <name>SG-Scout</name> | |
987 | </spider> | |
988 | <spider ident="Shagseeker"> | |
989 | <name>ShagSeeker</name> | |
990 | </spider> | |
991 | <spider ident="Shai'Hulud"> | |
992 | <name>Shai'Hulud</name> | |
993 | </spider> | |
994 | <spider ident="SimBot/1.0"> | |
995 | <name>Simmany Robot Ver1.0</name> | |
996 | </spider> | |
997 | <spider ident="ssearcher100"> | |
998 | <name>Site Searcher</name> | |
999 | </spider> | |
1000 | <spider ident="Site Valet"> | |
1001 | <name>Site Valet</name> | |
1002 | </spider> | |
1003 | <spider ident="http://www.site-list.net"> | |
1004 | <name>Site-List</name> | |
1005 | <url>http://www.site-list.net</url> | |
1006 | </spider> | |
1007 | <spider ident="SiteTech-Rover"> | |
1008 | <name>SiteTech-Rover</name> | |
1009 | </spider> | |
1010 | <spider ident="+SitiDi.net/SitiDiBot/"> | |
1011 | <name>SitiDi.net/SitiDiBot</name> | |
1012 | </spider> | |
1013 | <spider ident="aWapClient"> | |
1014 | <name>Skymob.com</name> | |
1015 | </spider> | |
1016 | <spider ident="SLCrawler"> | |
1017 | <name>SLCrawler</name> | |
1018 | </spider> | |
1019 | <spider ident="Sleek Spider"> | |
1020 | <name>Sleek</name> | |
1021 | </spider> | |
1022 | <spider ident="ESISmartSpider"> | |
1023 | <name>Smart Spider</name> | |
1024 | </spider> | |
1025 | <spider ident="Snapbot"> | |
1026 | <name>Snapbot</name> | |
1027 | <url>http://www.snap.com/</url> | |
1028 | </spider> | |
1029 | <spider ident="Snooper"> | |
1030 | <name>Snooper</name> | |
1031 | </spider> | |
1032 | <spider ident="sohu-search"> | |
1033 | <name>sohu-search</name> | |
1034 | </spider> | |
1035 | <spider ident="Solbot"> | |
1036 | <name>Solbot</name> | |
1037 | </spider> | |
1038 | <spider ident="Speedy Spider"> | |
1039 | <name>Speedy Spider</name> | |
1040 | <url>http://www.entireweb.com/about/search_tech/speedyspider/</url> | |
1041 | </spider> | |
1042 | <spider ident="Sphere Scout"> | |
1043 | <name>Sphere</name> | |
1044 | </spider> | |
1045 | <spider ident="Sphider2"> | |
1046 | <name>Sphider</name> | |
1047 | </spider> | |
1048 | <spider ident="SpiderBot"> | |
1049 | <name>SpiderBot</name> | |
1050 | </spider> | |
1051 | <spider ident="spiderline"> | |
1052 | <name>Spiderline Crawler</name> | |
1053 | </spider> | |
1054 | <spider ident="SpiderMan"> | |
1055 | <name>SpiderMan</name> | |
1056 | </spider> | |
1057 | <spider ident="SpiderView"> | |
1058 | <name>SpiderView(tm)</name> | |
1059 | </spider> | |
1060 | <spider ident="mouse.house"> | |
1061 | <name>spider_monkey</name> | |
1062 | </spider> | |
1063 | <spider ident="suke"> | |
1064 | <name>Suke</name> | |
1065 | </spider> | |
1066 | <spider ident="suntek"> | |
1067 | <name>suntek search engine</name> | |
1068 | </spider> | |
1069 | <spider ident="Szukacz"> | |
1070 | <name>Szukacz</name> | |
1071 | <url>http://www.szukacz.pl/html/RobotEnglishVersion.html</url> | |
1072 | </spider> | |
1073 | <spider ident="T-H-U-N-D-E-R-S-T-O-N-E"> | |
1074 | <name>T-H-U-N-D-E-R-S-T-O-N-E</name> | |
1075 | </spider> | |
1076 | <spider ident="Black Widow"> | |
1077 | <name>TACH Black Widow</name> | |
1078 | </spider> | |
1079 | <spider ident="Tarantula"> | |
1080 | <name>Tarantula</name> | |
1081 | </spider> | |
1082 | <spider ident="tarspider"> | |
1083 | <name>tarspider</name> | |
1084 | </spider> | |
1085 | <spider ident="dlw3robot"> | |
1086 | <name>Tcl W3 Robot</name> | |
1087 | </spider> | |
1088 | <spider ident="TechBOT"> | |
1089 | <name>TechBOT</name> | |
1090 | </spider> | |
1091 | <spider ident="Technoratibot"> | |
1092 | <name>Technorati</name> | |
1093 | <url>http://technorati.com/about/</url> | |
1094 | </spider> | |
1095 | <spider ident="Templeton"> | |
1096 | <name>Templeton</name> | |
1097 | </spider> | |
1098 | <spider ident="teoma"> | |
1099 | <name>Teoma/Ask Jeeves</name> | |
1100 | <url>http://sp.teoma.com/docs/teoma/about/</url> | |
1101 | </spider> | |
1102 | <spider ident="JubiiRobot"> | |
1103 | <name>The Jubii</name> | |
1104 | </spider> | |
1105 | <spider ident="NorthStar"> | |
1106 | <name>The NorthStar Robot</name> | |
1107 | </spider> | |
1108 | <spider ident="w3index"> | |
1109 | <name>The NWI Robot</name> | |
1110 | </spider> | |
1111 | <spider ident="Peregrinator-Mathematics"> | |
1112 | <name>The Peregrinator</name> | |
1113 | </spider> | |
1114 | <spider ident="thumbshots-de-Bot"> | |
1115 | <name>thumbshots-de-Bot</name> | |
1116 | </spider> | |
1117 | <spider ident="TITAN"> | |
1118 | <name>TITAN</name> | |
1119 | </spider> | |
1120 | <spider ident="TitIn"> | |
1121 | <name>TitIn</name> | |
1122 | </spider> | |
1123 | <spider ident="TLSpider"> | |
1124 | <name>TLSpider</name> | |
1125 | </spider> | |
1126 | <spider ident="TMCrawler"> | |
1127 | <name>TMCrawler</name> | |
1128 | </spider> | |
1129 | <spider ident="trendictionbot"> | |
1130 | <name>Trendiction-Bot</name> | |
1131 | <url>http://www.trendiction.com/bot</url> | |
1132 | </spider> | |
1133 | <spider ident="slysearch"> | |
1134 | <name>Turnitin.com</name> | |
1135 | <url>http://www.turnitin.com/static/products_services/search_engines.html</url> | |
1136 | </spider> | |
1137 | <spider ident="TurnitinBot/"> | |
1138 | <name>TurnitinBot</name> | |
1139 | </spider> | |
1140 | <spider ident="TurtleScanner"> | |
1141 | <name>Turtle</name> | |
1142 | <url>http://www.turtle.ru/</url> | |
1143 | </spider> | |
1144 | <spider ident="Twiceler"> | |
1145 | <name>Twiceler</name> | |
1146 | <url>http://www.cuill.com/twiceler/robot.html</url> | |
1147 | </spider> | |
1148 | <spider ident="UCSD-Crawler"> | |
1149 | <name>UCSD Crawl</name> | |
1150 | </spider> | |
1151 | <spider ident="UMBC-memeta-Bot"> | |
1152 | <name>UMBC</name> | |
1153 | </spider> | |
1154 | <spider ident="unisterbot"> | |
1155 | <name>Unister</name> | |
1156 | </spider> | |
1157 | <spider ident="Unpartisan"> | |
1158 | <name>Unpartisan</name> | |
1159 | <url>http://www.unpartisan.com</url> | |
1160 | </spider> | |
1161 | <spider ident="urlck"> | |
1162 | <name>URL Check</name> | |
1163 | </spider> | |
1164 | <spider ident="URL Spider Pro"> | |
1165 | <name>URL Spider Pro</name> | |
1166 | </spider> | |
1167 | <spider ident="Valkyrie"> | |
1168 | <name>Valkyrie</name> | |
1169 | </spider> | |
1170 | <spider ident="Verticrawl"> | |
1171 | <name>Verticrawl</name> | |
1172 | </spider> | |
1173 | <spider ident="Victoria"> | |
1174 | <name>Victoria</name> | |
1175 | </spider> | |
1176 | <spider ident="vision-search"> | |
1177 | <name>vision-search</name> | |
1178 | </spider> | |
1179 | <spider ident="VoilaBot"> | |
1180 | <name>VoilaBot</name> | |
1181 | <url>http://www.voila.com/</url> | |
1182 | </spider> | |
1183 | <spider ident="Voyager"> | |
1184 | <name>Voyager</name> | |
1185 | </spider> | |
1186 | <spider ident="VWbot_K"> | |
1187 | <name>VWbot</name> | |
1188 | </spider> | |
1189 | <spider ident="W3M2"> | |
1190 | <name>W3M2</name> | |
1191 | </spider> | |
1192 | <spider ident="w3mir"> | |
1193 | <name>w3mir</name> | |
1194 | </spider> | |
1195 | <spider ident="w@pSpider"> | |
1196 | <name>w@pSpider</name> | |
1197 | </spider> | |
1198 | <spider ident="appie"> | |
1199 | <name>Walhello appie</name> | |
1200 | <url>http://www.robotstxt.org/wc/active/html/appie.html</url> | |
1201 | </spider> | |
1202 | <spider ident="CrawlPaper"> | |
1203 | <name>WallPaper</name> | |
1204 | </spider> | |
1205 | <spider ident="root"> | |
1206 | <name>Web Core / Roots</name> | |
1207 | </spider> | |
1208 | <spider ident="WebMoose"> | |
1209 | <name>Web Moose</name> | |
1210 | </spider> | |
1211 | <spider ident="WebBandit"> | |
1212 | <name>WebBandit</name> | |
1213 | </spider> | |
1214 | <spider ident="WebCatcher"> | |
1215 | <name>WebCatcher</name> | |
1216 | </spider> | |
1217 | <spider ident="Webclipping"> | |
1218 | <name>Webclipping</name> | |
1219 | </spider> | |
1220 | <spider ident="WebCopy"> | |
1221 | <name>WebCopy</name> | |
1222 | </spider> | |
1223 | <spider ident="WebFetcher"> | |
1224 | <name>webfetcher</name> | |
1225 | </spider> | |
1226 | <spider ident="weblayers"> | |
1227 | <name>weblayers</name> | |
1228 | </spider> | |
1229 | <spider ident="WebLinker"> | |
1230 | <name>WebLinker</name> | |
1231 | </spider> | |
1232 | <spider ident="wlm"> | |
1233 | <name>Weblog Monitor</name> | |
1234 | </spider> | |
1235 | <spider ident="WebQuest"> | |
1236 | <name>WebQuest</name> | |
1237 | </spider> | |
1238 | <spider ident="WebReaper"> | |
1239 | <name>WebReaper</name> | |
1240 | </spider> | |
1241 | <spider ident="webs@recruit.co.jp"> | |
1242 | <name>webs</name> | |
1243 | </spider> | |
1244 | <spider ident="websearchbench"> | |
1245 | <name>WebSearchBench</name> | |
1246 | <url>http://websearchbench.cs.uni-dortmund.de/</url> | |
1247 | </spider> | |
1248 | <spider ident="WOLP"> | |
1249 | <name>WebStolperer</name> | |
1250 | </spider> | |
1251 | <spider ident="webvac"> | |
1252 | <name>WebVac</name> | |
1253 | </spider> | |
1254 | <spider ident="webwalk"> | |
1255 | <name>webwalk</name> | |
1256 | </spider> | |
1257 | <spider ident="WebWalker"> | |
1258 | <name>WebWalker</name> | |
1259 | </spider> | |
1260 | <spider ident="WebWatch"> | |
1261 | <name>WebWatch</name> | |
1262 | </spider> | |
1263 | <spider ident="whatUseek_winona"> | |
1264 | <name>whatUseek Winona</name> | |
1265 | </spider> | |
1266 | <spider ident="SurveyBot"> | |
1267 | <name>Whois Source</name> | |
1268 | <url>http://www.whois.sc/info/webmasters/surveybot.html</url> | |
1269 | </spider> | |
1270 | <spider ident="Hazel's Ferret Web hopper"> | |
1271 | <name>Wild Ferret Web Hopper</name> | |
1272 | </spider> | |
1273 | <spider ident="WinHTTP"> | |
1274 | <name>WinHTTP</name> | |
1275 | </spider> | |
1276 | <spider ident="wired-digital-newsbot"> | |
1277 | <name>Wired Digital</name> | |
1278 | </spider> | |
1279 | <spider ident="zyborg"> | |
1280 | <name>WiseNut</name> | |
1281 | </spider> | |
1282 | <spider ident="OmniExplorer_Bot"> | |
1283 | <name>WorldIndexer</name> | |
1284 | <url>http://www.omni-explorer.com</url> | |
1285 | </spider> | |
1286 | <spider ident="WWWC"> | |
1287 | <name>WWWC</name> | |
1288 | </spider> | |
1289 | <spider ident="WWWeasel Robot"> | |
1290 | <name>WWWeasel Robot</name> | |
1291 | </spider> | |
1292 | <spider ident="wwwster"> | |
1293 | <name>wwwster</name> | |
1294 | </spider> | |
1295 | <spider ident="WWWWanderer"> | |
1296 | <name>WWWWanderer</name> | |
1297 | </spider> | |
1298 | <spider ident="TECOMAC-Crawler"> | |
1299 | <name>X-Crawler</name> | |
1300 | </spider> | |
1301 | <spider ident="XGET"> | |
1302 | <name>XGET</name> | |
1303 | </spider> | |
1304 | <spider ident="cosmos"> | |
1305 | <name>XYLEME Robot</name> | |
1306 | </spider> | |
1307 | <spider ident="yacybot"> | |
1308 | <name>YaCy-Bot</name> | |
1309 | <url>http://yacy.net/yacy/bot.html</url> | |
1310 | </spider> | |
1311 | <spider ident="YahooYSMcm"> | |
1312 | <name>Yahoo Publisher Network</name> | |
1313 | <url>http://publisher.yahoo.com/</url> | |
1314 | </spider> | |
1315 | <spider ident="Yahoo-Blogs"> | |
1316 | <name>Yahoo-Blogs</name> | |
1317 | <url>http://help.yahoo.com/help/us/ysearch/crawling/crawling-02.html</url> | |
1318 | </spider> | |
1319 | <spider ident="Yahoo Pipes"> | |
1320 | <name>Yahoo Pipes</name> | |
1321 | </spider> | |
1322 | <spider ident="Yahoo! Slurp"> | |
1323 | <name>Yahoo! Slurp</name> | |
1324 | <url>http://help.yahoo.com/help/us/ysearch/slurp</url> | |
1325 | </spider> | |
1326 | <spider ident="Yahoo-VerticalCrawler"> | |
1327 | <name>Yahoo-VerticalCrawler</name> | |
1328 | </spider> | |
1329 | <spider ident="YahooFeedSeeker"> | |
1330 | <name>YahooFeedSeeker</name> | |
1331 | <url>http://my.yahoo.com/s/publishers.html</url> | |
1332 | </spider> | |
1333 | <spider ident="Yandex"> | |
1334 | <name>Yandex</name> | |
1335 | <url>http://www.yandex.ru/</url> | |
1336 | </spider> | |
1337 | <spider ident="zeus"> | |
1338 | <name>Zeus Internet Marketing</name> | |
1339 | <url>http://www.cyber-robotics.com/</url> | |
1340 | </spider> | |
1341 | <spider ident="http://www.zorkk.com"> | |
1342 | <name>Zork</name> | |
1343 | <url>http://www.zorkk.com</url> | |
1344 | </spider> | |
835ff3c7 | 1345 | </data> |