Subversion Repositories javautils

Rev

View as "text/xml" | Blame | Last modification | View Log | RSS feed

  1. <?xml version="1.0"?>
  2. <user-agents>
  3. <user-agent>
  4. <ID>id_a_f_3</ID>
  5. <String>!Susie (http://www.sync2it.com/susie)</String>
  6. <Description>Sync2It bookmark management &amp; clustering engine</Description>
  7. <Type>C R</Type>
  8. <Comment></Comment>
  9. <Link1>http://www.sync2it.com</Link1>
  10. <Link2></Link2>
  11. </user-agent>
  12. <user-agent>
  13. <ID>id_a_f_6</ID>
  14. <String>&lt;a href='http://www.unchaos.com/'> UnChaos &lt;/a> From Chaos To Order Hybrid Web Search Engine.(vadim_gonchar@unchaos.com)</String>
  15. <Description>UnCHAOS search robot</Description>
  16. <Type>R</Type>
  17. <Comment>Site is dead</Comment>
  18. <Link1>http://www.unchaos.com/</Link1>
  19. <Link2></Link2>
  20. </user-agent>
  21. <user-agent>
  22. <ID>id_a_f_7</ID>
  23. <String>&lt;a href='http://www.unchaos.com/'> UnChaos Bot Hybrid Web Search Engine. &lt;/a> (vadim_gonchar@unchaos.com)</String>
  24. <Description>UnCHAOS search robot</Description>
  25. <Type>R</Type>
  26. <Comment>Site is dead</Comment>
  27. <Link1>http://www.unchaos.com/</Link1>
  28. <Link2></Link2>
  29. </user-agent>
  30. <user-agent>
  31. <ID>id_a_f_8</ID>
  32. <String>&lt;b> UnChaosBot From Chaos To Order UnChaos Hybrid Web Search Engine at www.unchaos.com &lt;/b> (info@unchaos.com)</String>
  33. <Description>UnCHAOS search robot</Description>
  34. <Type>R</Type>
  35. <Comment>Site is dead</Comment>
  36. <Link1>http://www.unchaos.com/</Link1>
  37. <Link2></Link2>
  38. </user-agent>
  39. <user-agent>
  40. <ID>id_a_f_9</ID>
  41. <String>&lt;http://www.sygol.com/> http://www.sygol.com</String>
  42. <Description>Sygol Search (Italy) robot</Description>
  43. <Type>R</Type>
  44. <Comment>s.also SygolBot</Comment>
  45. <Link1>http://www.sygol.com/</Link1>
  46. <Link2></Link2>
  47. </user-agent>
  48. <user-agent>
  49. <ID>id_a_f_4</ID>
  50. <String>( Robots.txt Validator http://www.searchengineworld.com/cgi-bin/robotcheck.cgi )</String>
  51. <Description>SearchEngineWorld's robots.txt validator</Description>
  52. <Type>C</Type>
  53. <Comment>Service is no longer available</Comment>
  54. <Link1>http://www.searchengineworld.com/cgi-bin/robotcheck.cgi</Link1>
  55. <Link2></Link2>
  56. </user-agent>
  57. <user-agent>
  58. <ID>id_a_f_171105_1</ID>
  59. <String>(DreamPassport/3.0; isao/MyDiGiRabi)</String>
  60. <Description>DreamCast DreamPassport browser</Description>
  61. <Type>B</Type>
  62. <Comment></Comment>
  63. <Link1>http://www.dricas.com/dp/</Link1>
  64. <Link2></Link2>
  65. </user-agent>
  66. <user-agent>
  67. <ID>id_a_f_290606_1</ID>
  68. <String>(Privoxy/1.0)</String>
  69. <Description>Privoxy web proxy</Description>
  70. <Type>P</Type>
  71. <Comment>s.also Privoxy/3.0 (Anonymous)</Comment>
  72. <Link1>http://www.privoxy.org/</Link1>
  73. <Link2></Link2>
  74. </user-agent>
  75. <user-agent>
  76. <ID>id_a_f_230507_1</ID>
  77. <String>*/Nutch-0.9-dev</String>
  78. <Description>Unknown Yahoo robot</Description>
  79. <Type>R</Type>
  80. <Comment>123.113.184.2xx</Comment>
  81. <Link1>http://www.yahoo.com</Link1>
  82. <Link2></Link2>
  83. </user-agent>
  84. <user-agent>
  85. <ID>id_a_f_5</ID>
  86. <String>+SitiDi.net/SitiDiBot/1.0 (+Have Good Day)</String>
  87. <Description>SitiDi.net search (Germany) robot</Description>
  88. <Type>R</Type>
  89. <Comment></Comment>
  90. <Link1>http://www.sitidi.net/</Link1>
  91. <Link2></Link2>
  92. </user-agent>
  93. <user-agent>
  94. <ID>id_a_f_1</ID>
  95. <String>-DIE-KRAEHE- META-SEARCH-ENGINE/1.1 http://www.die-kraehe.de</String>
  96. <Description>Die Kraehe Meta-Search-Engine (Germany) link checking</Description>
  97. <Type>R</Type>
  98. <Comment></Comment>
  99. <Link1>http://www.die-kraehe.de</Link1>
  100. <Link2></Link2>
  101. </user-agent>
  102. <user-agent>
  103. <ID>id_a_f_060206_1</ID>
  104. <String>123spider-Bot (Version: 1.02, powered by www.123spider.de</String>
  105. <Description>123spider.de (Germany) web directory link checking</Description>
  106. <Type>C</Type>
  107. <Comment></Comment>
  108. <Link1>http://www.123spider.de/</Link1>
  109. <Link2></Link2>
  110. </user-agent>
  111. <user-agent>
  112. <ID>id_a_f_180806_1</ID>
  113. <String>192.comAgent</String>
  114. <Description>192.com - UK web directory</Description>
  115. <Type>R</Type>
  116. <Comment>217.160.75.2xx</Comment>
  117. <Link1>http://www.192.com/</Link1>
  118. <Link2></Link2>
  119. </user-agent>
  120. <user-agent>
  121. <ID>id_a_f_060606_1</ID>
  122. <String>1st ZipCommander (Net) - http://www.zipcommander.com/</String>
  123. <Description>1st ZipCommander Net - IE based browser</Description>
  124. <Type>B</Type>
  125. <Comment></Comment>
  126. <Link1>http://www.zipcommander.com/</Link1>
  127. <Link2></Link2>
  128. </user-agent>
  129. <user-agent>
  130. <ID>id_a_f_10</ID>
  131. <String>2Bone_LinkChecker/1.0 libwww-perl/5.64</String>
  132. <Description>2Bone online link checker</Description>
  133. <Type>C</Type>
  134. <Comment></Comment>
  135. <Link1>http://www.2bone.com/links/linkchecker.shtml</Link1>
  136. <Link2></Link2>
  137. </user-agent>
  138. <user-agent>
  139. <ID>id_a_f_11</ID>
  140. <String>4anything.com LinkChecker v2.0</String>
  141. <Description>4Anything robot</Description>
  142. <Type>R</Type>
  143. <Comment></Comment>
  144. <Link1>http://www.4anything.com</Link1>
  145. <Link2></Link2>
  146. </user-agent>
  147. <user-agent>
  148. <ID>id_a_f_110207_1</ID>
  149. <String>8484 Boston Project v 1.0</String>
  150. <Description>Unknown guestbook spamming or harvesting tool from diff. IPs</Description>
  151. <Type>S</Type>
  152. <Comment>s. various honey pot sites</Comment>
  153. <Link1>http://www.projecthoneypot.org/bsh_X19tb2RlPWdsb2JhbCZfX2J5PWMmY3RyeT11cyZ1YWc9ODQ4NCtCb3N0b24rUHJvamVjdCt2KzEuMA..</Link1>
  154. <Link2></Link2>
  155. </user-agent>
  156. <user-agent>
  157. <ID>id_a_f_2</ID>
  158. <String>:robot/1.0 (linux) ( admin e-mail: undefined http://www.neofonie.de/loesungen/search/robot.html )</String>
  159. <Description>neofonie search robot Germany</Description>
  160. <Type>R</Type>
  161. <Comment></Comment>
  162. <Link1>http://www.neofonie.de/loesungen/search/</Link1>
  163. <Link2></Link2>
  164. </user-agent>
  165. <user-agent>
  166. <ID>id_a_f_12</ID>
  167. <String>A-Online Search</String>
  168. <Description>A-Online.at robot - now Jet2Web Search</Description>
  169. <Type>R</Type>
  170. <Comment></Comment>
  171. <Link1>http://www.jet2web.net/portal</Link1>
  172. <Link2></Link2>
  173. </user-agent>
  174. <user-agent>
  175. <ID>id_a_f_090707_1</ID>
  176. <String>A1 Keyword Research/1.0.2 (+http://www.micro-sys.dk/products/keyword-research/) miggibot/2007.03.27</String>
  177. <Description>A1 Keyword Research - search engine and keyword optimization software</Description>
  178. <Type>C</Type>
  179. <Comment></Comment>
  180. <Link1>http://www.micro-sys.dk/products/keyword-research/</Link1>
  181. <Link2></Link2>
  182. </user-agent>
  183. <user-agent>
  184. <ID>id_a_f_100906_1</ID>
  185. <String>A1 Sitemap Generator/1.0 (+http://www.micro-sys.dk/products/sitemap-generator/) miggibot/2006.01.24</String>
  186. <Description>MiggiBot website crawler engine - A1 Sitemap Generator</Description>
  187. <Type>R</Type>
  188. <Comment></Comment>
  189. <Link1>http://www.micro-sys.dk/products/sitemap-generator/</Link1>
  190. <Link2>http://www.micro-sys.dk/developer/miggibot/</Link2>
  191. </user-agent>
  192. <user-agent>
  193. <ID>id_a_f_250408_2</ID>
  194. <String>aardvark-crawler</String>
  195. <Description>Aardvark web crawler for Sun's Blog recommendations</Description>
  196. <Type>R</Type>
  197. <Comment>192.9.71.7x</Comment>
  198. <Link1>http://blogs.sun.com/plamere/</Link1>
  199. <Link2></Link2>
  200. </user-agent>
  201. <user-agent>
  202. <ID>id_a_f_13</ID>
  203. <String>AbachoBOT</String>
  204. <Description>Abacho / Crawler.de robot</Description>
  205. <Type>R</Type>
  206. <Comment></Comment>
  207. <Link1>http://www.abacho.com</Link1>
  208. <Link2></Link2>
  209. </user-agent>
  210. <user-agent>
  211. <ID>id_a_f_14</ID>
  212. <String>AbachoBOT (Mozilla compatible)</String>
  213. <Description>Abacho / Crawler.de robot</Description>
  214. <Type>R</Type>
  215. <Comment></Comment>
  216. <Link1>http://www.abacho.com</Link1>
  217. <Link2></Link2>
  218. </user-agent>
  219. <user-agent>
  220. <ID>id_a_f_15</ID>
  221. <String>ABCdatos BotLink/5.xx.xxx#BBL</String>
  222. <Description>ABCdatos - Castilian program &amp; tutorial directory</Description>
  223. <Type>R</Type>
  224. <Comment></Comment>
  225. <Link1>http://www.abcdatos.com</Link1>
  226. <Link2></Link2>
  227. </user-agent>
  228. <user-agent>
  229. <ID>id_a_f_16</ID>
  230. <String>Aberja Checkomat</String>
  231. <Description>Aberja Hybridsuchmaschine (Germany) link checking</Description>
  232. <Type>R</Type>
  233. <Comment></Comment>
  234. <Link1>http://www.aberja.de</Link1>
  235. <Link2></Link2>
  236. </user-agent>
  237. <user-agent>
  238. <ID>id_a_f_17</ID>
  239. <String>abot/0.1 (abot; http://www.abot.com; abot@abot.com)</String>
  240. <Description>Nameprotect copyright search robot (24.177.134.x)</Description>
  241. <Type>R</Type>
  242. <Comment>s. also - np/0.1_(np;_http://www.nameprotect.com... - aipbot/1.0 (aipbot; http://www.aipbot.com...</Comment>
  243. <Link1>http://www.nameprotect.com/</Link1>
  244. <Link2></Link2>
  245. </user-agent>
  246. <user-agent>
  247. <ID>id_a_f_18</ID>
  248. <String>About/0.1libwww-perl/5.47</String>
  249. <Description>About robot</Description>
  250. <Type>R</Type>
  251. <Comment></Comment>
  252. <Link1>http://www.about.com</Link1>
  253. <Link2></Link2>
  254. </user-agent>
  255. <user-agent>
  256. <ID>id_a_f_051206_3</ID>
  257. <String>Accelatech RSSCrawler/0.4</String>
  258. <Description>Accela Technology RSS feed crawler</Description>
  259. <Type>R</Type>
  260. <Comment>125.100.242.2xx</Comment>
  261. <Link1>http://www.accelatech.com/</Link1>
  262. <Link2></Link2>
  263. </user-agent>
  264. <user-agent>
  265. <ID>id_a_f_19</ID>
  266. <String>accoona</String>
  267. <Description>Accoona Search robot</Description>
  268. <Type>R</Type>
  269. <Comment>65.17.255.xx</Comment>
  270. <Link1>http://www.accoona.com</Link1>
  271. <Link2></Link2>
  272. </user-agent>
  273. <user-agent>
  274. <ID>id_a_f_20</ID>
  275. <String>Accoona-AI-Agent/1.1.1 (crawler at accoona dot com)</String>
  276. <Description>Accoona Search robot</Description>
  277. <Type>R</Type>
  278. <Comment>65.17.255.xx</Comment>
  279. <Link1>http://www.accoona.com</Link1>
  280. <Link2></Link2>
  281. </user-agent>
  282. <user-agent>
  283. <ID>id_a_f_140906_3</ID>
  284. <String>Accoona-AI-Agent/1.1.2 (aicrawler at accoonabot dot com)</String>
  285. <Description>Accoona Search robot</Description>
  286. <Type>R</Type>
  287. <Comment>65.17.255.xx</Comment>
  288. <Link1>http://www.accoona.com</Link1>
  289. <Link2></Link2>
  290. </user-agent>
  291. <user-agent>
  292. <ID>id_a_f_21</ID>
  293. <String>Ace Explorer</String>
  294. <Description>Ace Explorer - IE based browser</Description>
  295. <Type>B</Type>
  296. <Comment></Comment>
  297. <Link1>http://www.aceexplorer.com</Link1>
  298. <Link2></Link2>
  299. </user-agent>
  300. <user-agent>
  301. <ID>id_a_f_280806_1</ID>
  302. <String>Ack (http://www.ackerm.com/)</String>
  303. <Description>Ackerm search robot</Description>
  304. <Type>R</Type>
  305. <Comment>64.74.153.xx</Comment>
  306. <Link1>http://www.ackerm.com/</Link1>
  307. <Link2></Link2>
  308. </user-agent>
  309. <user-agent>
  310. <ID>id_a_f_22</ID>
  311. <String>AcoiRobot</String>
  312. <Description>Acoi picture finder robot</Description>
  313. <Type>R</Type>
  314. <Comment></Comment>
  315. <Link1>http://monetdb.cwi.nl/acoi/projects.html</Link1>
  316. <Link2></Link2>
  317. </user-agent>
  318. <user-agent>
  319. <ID>id_a_f_23</ID>
  320. <String>Acoon Robot v1.50.001</String>
  321. <Description>Acoon.de search (Germany) robot</Description>
  322. <Type>R</Type>
  323. <Comment>80.237.153.10x</Comment>
  324. <Link1>http://www.acoon.de</Link1>
  325. <Link2></Link2>
  326. </user-agent>
  327. <user-agent>
  328. <ID>id_a_f_24</ID>
  329. <String>Acoon Robot v1.52 (http://www.acoon.de)</String>
  330. <Description>Acoon.de search (Germany) robot</Description>
  331. <Type>R</Type>
  332. <Comment>80.237.153.10x</Comment>
  333. <Link1>http://www.acoon.de</Link1>
  334. <Link2></Link2>
  335. </user-agent>
  336. <user-agent>
  337. <ID>id_a_f_100508_1</ID>
  338. <String>Acoon-Robot 4.0.x.[xx] (http://www.acoon.de)</String>
  339. <Description>Acoon.de search (Germany) robot</Description>
  340. <Type>R</Type>
  341. <Comment>80.237.209.xx</Comment>
  342. <Link1>http://www.acoon.de</Link1>
  343. <Link2></Link2>
  344. </user-agent>
  345. <user-agent>
  346. <ID>id_a_f_010108_1</ID>
  347. <String>Acoon-Robot v3.xx (http://www.acoon.de and http://www.acoon.com)</String>
  348. <Description>Acoon.de search (Germany) robot</Description>
  349. <Type>R</Type>
  350. <Comment>80.237.153.10x</Comment>
  351. <Link1>http://www.acoon.de</Link1>
  352. <Link2></Link2>
  353. </user-agent>
  354. <user-agent>
  355. <ID>id_a_f_110507_1</ID>
  356. <String>Acorn/Nutch-0.9 (Non-Profit Search Engine; acorn.isara.org; acorn at isara dot org)</String>
  357. <Description>Acorn Search Project</Description>
  358. <Type>R</Type>
  359. <Comment>124.157.145.1xx</Comment>
  360. <Link1>http://acorn.no-ip.org/</Link1>
  361. <Link2></Link2>
  362. </user-agent>
  363. <user-agent>
  364. <ID>id_a_f_25</ID>
  365. <String>ActiveBookmark 1.x</String>
  366. <Description>LibMaster.com Active Bookmark HTML page creator</Description>
  367. <Type>C B</Type>
  368. <Comment></Comment>
  369. <Link1>http://www.libmaster.com/software.php</Link1>
  370. <Link2></Link2>
  371. </user-agent>
  372. <user-agent>
  373. <ID>id_a_f_060806_2</ID>
  374. <String>Activeworlds</String>
  375. <Description>Activeworlds 3D homepage browser</Description>
  376. <Type>B</Type>
  377. <Comment></Comment>
  378. <Link1>http://www.activeworlds.com</Link1>
  379. <Link2></Link2>
  380. </user-agent>
  381. <user-agent>
  382. <ID>id_a_f_26</ID>
  383. <String>ActiveWorlds/3.xx (xxx)</String>
  384. <Description>Activeworlds 3D homepage browser</Description>
  385. <Type>B</Type>
  386. <Comment></Comment>
  387. <Link1>http://www.activeworlds.com</Link1>
  388. <Link2></Link2>
  389. </user-agent>
  390. <user-agent>
  391. <ID>id_a_f_27</ID>
  392. <String>Ad Muncher v4.xx.x</String>
  393. <Description>Ad Muncher - banner killer</Description>
  394. <Type>P</Type>
  395. <Comment></Comment>
  396. <Link1>http://www.admuncher.com/</Link1>
  397. <Link2></Link2>
  398. </user-agent>
  399. <user-agent>
  400. <ID>id_a_f_28</ID>
  401. <String>Ad Muncher v4x Build xxxxx</String>
  402. <Description>Ad Muncher - banner killer</Description>
  403. <Type>P</Type>
  404. <Comment></Comment>
  405. <Link1>http://www.admuncher.com/</Link1>
  406. <Link2></Link2>
  407. </user-agent>
  408. <user-agent>
  409. <ID>id_a_f_061006_1</ID>
  410. <String>Adaxas Spider (http://www.adaxas.net/)</String>
  411. <Description>website directory adaxas link checking</Description>
  412. <Type>C</Type>
  413. <Comment>85.10.199.xx</Comment>
  414. <Link1>http://www.adaxas.net/</Link1>
  415. <Link2></Link2>
  416. </user-agent>
  417. <user-agent>
  418. <ID>id_a_f_29</ID>
  419. <String>Advanced Browser (http://www.avantbrowser.com)</String>
  420. <Description>Avant Browser - IE based browser</Description>
  421. <Type>B</Type>
  422. <Comment></Comment>
  423. <Link1>http://www.avantbrowser.com</Link1>
  424. <Link2></Link2>
  425. </user-agent>
  426. <user-agent>
  427. <ID>id_a_f_30</ID>
  428. <String>AESOP_com_SpiderMan</String>
  429. <Description>Aesop robot</Description>
  430. <Type>R</Type>
  431. <Comment></Comment>
  432. <Link1>http://www.aesop.com</Link1>
  433. <Link2></Link2>
  434. </user-agent>
  435. <user-agent>
  436. <ID>id_a_f_31</ID>
  437. <String>agadine/1.x.x (+http://www.agada.de)</String>
  438. <Description>Agada search (Germany) robot</Description>
  439. <Type>R</Type>
  440. <Comment>s. also Mozilla/4.0 (agadine3.0)</Comment>
  441. <Link1>http://www.agada.de</Link1>
  442. <Link2></Link2>
  443. </user-agent>
  444. <user-agent>
  445. <ID>id_a_f_32</ID>
  446. <String>Agent-SharewarePlazaFileCheckBot/2.0+(+http://www.SharewarePlaza.com)</String>
  447. <Description>SharewarePlaza link checking</Description>
  448. <Type>R</Type>
  449. <Comment></Comment>
  450. <Link1>http://www.sharewareplaza.com</Link1>
  451. <Link2></Link2>
  452. </user-agent>
  453. <user-agent>
  454. <ID>id_a_f_33</ID>
  455. <String>AgentName/0.1 libwww-perl/5.48</String>
  456. <Description>Linkomatic submission verifier</Description>
  457. <Type>R</Type>
  458. <Comment></Comment>
  459. <Link1>http://www.linkomatic.com/</Link1>
  460. <Link2></Link2>
  461. </user-agent>
  462. <user-agent>
  463. <ID>id_a_f_34</ID>
  464. <String>AIBOT/2.1 By +(www.21seek.com A Real artificial intelligence search engine China)</String>
  465. <Description>21seek.com (China) robot (218.17.90.xxx)</Description>
  466. <Type>R</Type>
  467. <Comment></Comment>
  468. <Link1>http://www.21seek.com</Link1>
  469. <Link2></Link2>
  470. </user-agent>
  471. <user-agent>
  472. <ID>id_a_f_130807_1</ID>
  473. <String>AideRSS/1.0 (aiderss.com)</String>
  474. <Description>AideRss - Postrank RSS and Blog filtering</Description>
  475. <Type>C</Type>
  476. <Comment>72.44.35.2xx</Comment>
  477. <Link1>http://www.aiderss.com/</Link1>
  478. <Link2></Link2>
  479. </user-agent>
  480. <user-agent>
  481. <ID>id_a_f_35</ID>
  482. <String>aipbot/1.0 (aipbot; http://www.aipbot.com; aipbot@aipbot.com)</String>
  483. <Description>Nameprotect copyright search robot (24.177.134.x)</Description>
  484. <Type>R</Type>
  485. <Comment>s. also - np/0.1_(np;_http://www.nameprotect.com... - abot/0.1 (abot; http://www.abot.com...</Comment>
  486. <Link1>http://www.nameprotect.com/</Link1>
  487. <Link2></Link2>
  488. </user-agent>
  489. <user-agent>
  490. <ID>id_a_f_36</ID>
  491. <String>aipbot/2-beta (aipbot dev; http://aipbot.com; aipbot@aipbot.com)</String>
  492. <Description>Nameprotect copyright search robot (24.177.134.x)</Description>
  493. <Type>R</Type>
  494. <Comment>s. also - np/0.1_(np;_http://www.nameprotect.com... - abot/0.1 (abot; http://www.abot.com...</Comment>
  495. <Link1>http://www.nameprotect.com/</Link1>
  496. <Link2></Link2>
  497. </user-agent>
  498. <user-agent>
  499. <ID>id_a_f_291108_1</ID>
  500. <String>Akregator/1.2.9; librss/remnants</String>
  501. <Description>Akregator news feed reader for KDE</Description>
  502. <Type>B</Type>
  503. <Comment></Comment>
  504. <Link1>http://akregator.kde.org/</Link1>
  505. <Link2></Link2>
  506. </user-agent>
  507. <user-agent>
  508. <ID>id_a_f_37</ID>
  509. <String>Aladin/3.324</String>
  510. <Description>Aladin robot</Description>
  511. <Type>R</Type>
  512. <Comment></Comment>
  513. <Link1>http://www.aladin.de</Link1>
  514. <Link2></Link2>
  515. </user-agent>
  516. <user-agent>
  517. <ID>id_a_f_180408_1</ID>
  518. <String>Alcatel-BG3/1.0 UP.Browser/5.0.3.1.2</String>
  519. <Description>Phone.com UP.Browser for mobiles on Alcatel cellphone</Description>
  520. <Type>B</Type>
  521. <Comment></Comment>
  522. <Link1>http://www.openwave.com</Link1>
  523. <Link2></Link2>
  524. </user-agent>
  525. <user-agent>
  526. <ID>id_a_f_38</ID>
  527. <String>Aleksika Spider/1.0 (+http://www.aleksika.com/)</String>
  528. <Description>Aleksika Danmark - Search engine optimization spider</Description>
  529. <Type>R</Type>
  530. <Comment></Comment>
  531. <Link1>http://www.aleksika.com</Link1>
  532. <Link2></Link2>
  533. </user-agent>
  534. <user-agent>
  535. <ID>id_a_f_291108_2</ID>
  536. <String>AlertInfo 2.0 (Powered by Newsbrain)</String>
  537. <Description>Alertinfo - French version of Feedreader 3.xx</Description>
  538. <Type>B</Type>
  539. <Comment></Comment>
  540. <Link1>http://www.feedreader.com/</Link1>
  541. <Link2>http://www.geste.fr/alertinfo/home.html</Link2>
  542. </user-agent>
  543. <user-agent>
  544. <ID>id_a_f_39</ID>
  545. <String>AlkalineBOT/1.3</String>
  546. <Description>Vestris robot</Description>
  547. <Type>R</Type>
  548. <Comment></Comment>
  549. <Link1>http://alkaline.vestris.com/</Link1>
  550. <Link2></Link2>
  551. </user-agent>
  552. <user-agent>
  553. <ID>id_a_f_40</ID>
  554. <String>AlkalineBOT/1.4 (1.4.0326.0 RTM)</String>
  555. <Description>Vestris robot</Description>
  556. <Type>R</Type>
  557. <Comment></Comment>
  558. <Link1>http://alkaline.vestris.com/</Link1>
  559. <Link2></Link2>
  560. </user-agent>
  561. <user-agent>
  562. <ID>id_a_f_41</ID>
  563. <String>Allesklar/0.1 libwww-perl/5.46</String>
  564. <Description>Allesklar.de robot</Description>
  565. <Type>R</Type>
  566. <Comment></Comment>
  567. <Link1>http://www.allesklar.de</Link1>
  568. <Link2></Link2>
  569. </user-agent>
  570. <user-agent>
  571. <ID>id_a_f_42</ID>
  572. <String>Alligator 1.31 (www.nearsoftware.com)</String>
  573. <Description>Alligator download manager</Description>
  574. <Type>D</Type>
  575. <Comment></Comment>
  576. <Link1>http://www.nearsoftware.com</Link1>
  577. <Link2></Link2>
  578. </user-agent>
  579. <user-agent>
  580. <ID>id_a_f_011108_1</ID>
  581. <String>Allrati/1.1 (+)</String>
  582. <Description>Unknown robot from Allrati.com</Description>
  583. <Type>R</Type>
  584. <Comment>67.205.96.xxx/67.205.104.xx</Comment>
  585. <Link1>http://www.allrati.com/</Link1>
  586. <Link2></Link2>
  587. </user-agent>
  588. <user-agent>
  589. <ID>id_a_f_43</ID>
  590. <String>AltaVista Intranet V2.0 AVS EVAL search@freeit.com</String>
  591. <Description>Altavista robot</Description>
  592. <Type>R</Type>
  593. <Comment></Comment>
  594. <Link1>http://www.altavista.com</Link1>
  595. <Link2></Link2>
  596. </user-agent>
  597. <user-agent>
  598. <ID>id_a_f_44</ID>
  599. <String>AltaVista Intranet V2.0 Compaq Altavista Eval sveand@altavista.net</String>
  600. <Description>Altavista robot</Description>
  601. <Type>R</Type>
  602. <Comment></Comment>
  603. <Link1>http://www.altavista.com</Link1>
  604. <Link2></Link2>
  605. </user-agent>
  606. <user-agent>
  607. <ID>id_a_f_45</ID>
  608. <String>AltaVista Intranet V2.0 evreka.com crawler@evreka.com</String>
  609. <Description>Altavista robot</Description>
  610. <Type>R</Type>
  611. <Comment></Comment>
  612. <Link1>http://www.altavista.com</Link1>
  613. <Link2></Link2>
  614. </user-agent>
  615. <user-agent>
  616. <ID>id_a_f_46</ID>
  617. <String>AltaVista V2.0B crawler@evreka.com</String>
  618. <Description>Altavista robot</Description>
  619. <Type>R</Type>
  620. <Comment></Comment>
  621. <Link1>http://www.altavista.com</Link1>
  622. <Link2></Link2>
  623. </user-agent>
  624. <user-agent>
  625. <ID>id_a_f_280209_1</ID>
  626. <String>amaya/x.xx libwww/x.x.x</String>
  627. <Description>Amaya - W3C's Editor/Browser</Description>
  628. <Type>B</Type>
  629. <Comment></Comment>
  630. <Link1>http://www.w3.org/Amaya/</Link1>
  631. <Link2></Link2>
  632. </user-agent>
  633. <user-agent>
  634. <ID>id_a_f_47</ID>
  635. <String>AmfibiBOT</String>
  636. <Description>Amfibi Search robot</Description>
  637. <Type>R</Type>
  638. <Comment>64.111.217.9x</Comment>
  639. <Link1>http://www.amfibi.com/</Link1>
  640. <Link2></Link2>
  641. </user-agent>
  642. <user-agent>
  643. <ID>id_a_f_48</ID>
  644. <String>Amfibibot/0.06 (Amfibi Web Search; http://www.amfibi.com; agent@amfibi.com)</String>
  645. <Description>Amfibi Search robot</Description>
  646. <Type>R</Type>
  647. <Comment>64.111.217.9x</Comment>
  648. <Link1>http://www.amfibi.com/</Link1>
  649. <Link2></Link2>
  650. </user-agent>
  651. <user-agent>
  652. <ID>id_a_f_141105_2</ID>
  653. <String>Amfibibot/0.07 (Amfibi Robot; http://www.amfibi.com; agent@amfibi.com)</String>
  654. <Description>Amfibi Search robot</Description>
  655. <Type>R</Type>
  656. <Comment>64.111.217.9x</Comment>
  657. <Link1>http://www.amfibi.com/</Link1>
  658. <Link2></Link2>
  659. </user-agent>
  660. <user-agent>
  661. <ID>id_a_f_49</ID>
  662. <String>amibot</String>
  663. <Description>amibot - Amidalla search engine robot (62.241.33.xx)</Description>
  664. <Type>R</Type>
  665. <Comment>s. also libwww-perl/5.65</Comment>
  666. <Link1>http://www.amidalla.com/</Link1>
  667. <Link2></Link2>
  668. </user-agent>
  669. <user-agent>
  670. <ID>id_a_f_50</ID>
  671. <String>Amiga-AWeb/3.4.167SE</String>
  672. <Description>AWeb Amiga browser</Description>
  673. <Type>B</Type>
  674. <Comment></Comment>
  675. <Link1>http://www.amitrix.com/aweb.html</Link1>
  676. <Link2></Link2>
  677. </user-agent>
  678. <user-agent>
  679. <ID>id_a_f_51</ID>
  680. <String>AmigaVoyager/3.4.4 (MorphOS/PPC native)</String>
  681. <Description>Voyager - Amiga browser</Description>
  682. <Type>B</Type>
  683. <Comment></Comment>
  684. <Link1>http://www.vapor.com/voyager/</Link1>
  685. <Link2></Link2>
  686. </user-agent>
  687. <user-agent>
  688. <ID>id_a_f_091205_1</ID>
  689. <String>AmiTCP Miami (AmigaOS 2.04)</String>
  690. <Description>Amiga Miami TCP Stack</Description>
  691. <Type></Type>
  692. <Comment></Comment>
  693. <Link1>http://home.ptd.net/~strdustr/amirc/Netware.html</Link1>
  694. <Link2></Link2>
  695. </user-agent>
  696. <user-agent>
  697. <ID>id_a_f_210608_1</ID>
  698. <String>Amoi 8512/R21.0 NF-Browser/3.3</String>
  699. <Description>NF embedded browser on Amoi's Skypephone</Description>
  700. <Type>B</Type>
  701. <Comment></Comment>
  702. <Link1>http://3skypephone.com/</Link1>
  703. <Link2></Link2>
  704. </user-agent>
  705. <user-agent>
  706. <ID>id_a_f_190206_3</ID>
  707. <String>amzn_assoc</String>
  708. <Description>Amazon.com robot for checking their affiliate sites</Description>
  709. <Type>C</Type>
  710. <Comment>s. also aranhabot</Comment>
  711. <Link1></Link1>
  712. <Link2></Link2>
  713. </user-agent>
  714. <user-agent>
  715. <ID>id_a_f_52</ID>
  716. <String>AnnoMille spider 0.1 alpha - http://www.annomille.it</String>
  717. <Description>Annomille Italian historical oriented robot</Description>
  718. <Type>R</Type>
  719. <Comment></Comment>
  720. <Link1>http://www.annomille.it</Link1>
  721. <Link2></Link2>
  722. </user-agent>
  723. <user-agent>
  724. <ID>id_a_f_53</ID>
  725. <String>annotate_google; http://ponderer.org/download/annotate_google.user.js</String>
  726. <Description>annotate Google - Firefox extension for annotating Google search results</Description>
  727. <Type>B</Type>
  728. <Comment></Comment>
  729. <Link1>http://ponderer.org/annotate_google</Link1>
  730. <Link2></Link2>
  731. </user-agent>
  732. <user-agent>
  733. <ID>id_a_f_54</ID>
  734. <String>Anonymized by ProxyOS: http://www.megaproxy.com</String>
  735. <Description>Megaproxy user</Description>
  736. <Type>P</Type>
  737. <Comment></Comment>
  738. <Link1>http://www.megaproxy.com</Link1>
  739. <Link2></Link2>
  740. </user-agent>
  741. <user-agent>
  742. <ID>id_a_f_55</ID>
  743. <String>Anonymizer/1.1</String>
  744. <Description>faked user agent</Description>
  745. <Type></Type>
  746. <Comment></Comment>
  747. <Link1></Link1>
  748. <Link2></Link2>
  749. </user-agent>
  750. <user-agent>
  751. <ID>id_a_f_56</ID>
  752. <String>AnswerBus (http://www.answerbus.com/)</String>
  753. <Description>AnswerBus natural language search using COLLATE technology</Description>
  754. <Type>R</Type>
  755. <Comment></Comment>
  756. <Link1>http://www.answerbus.com</Link1>
  757. <Link2>http://collate.dfki.de/kurzdarstellung.html</Link2>
  758. </user-agent>
  759. <user-agent>
  760. <ID>id_a_f_57</ID>
  761. <String>AnswerChase PROve x.0</String>
  762. <Description>AnswerChase search tool</Description>
  763. <Type></Type>
  764. <Comment></Comment>
  765. <Link1>http://www.answerchase.com</Link1>
  766. <Link2></Link2>
  767. </user-agent>
  768. <user-agent>
  769. <ID>id_a_f_58</ID>
  770. <String>AnswerChase x.0</String>
  771. <Description>AnswerChase search tool</Description>
  772. <Type></Type>
  773. <Comment></Comment>
  774. <Link1>http://www.answerchase.com</Link1>
  775. <Link2></Link2>
  776. </user-agent>
  777. <user-agent>
  778. <ID>id_a_f_59</ID>
  779. <String>ANTFresco/x.xx</String>
  780. <Description>ANT Fresco Browser</Description>
  781. <Type>B</Type>
  782. <Comment>s. also Mozilla/x.xx (compatible; ANTFresco....)</Comment>
  783. <Link1>http://www.antlimited.com/products/fresco.htm</Link1>
  784. <Link2></Link2>
  785. </user-agent>
  786. <user-agent>
  787. <ID>id_a_f_60</ID>
  788. <String>antibot-V1.1.5/i586-linux-2.2</String>
  789. <Description>Antibot (discontinued) robot</Description>
  790. <Type>R</Type>
  791. <Comment></Comment>
  792. <Link1>http://www.antidot.net</Link1>
  793. <Link2></Link2>
  794. </user-agent>
  795. <user-agent>
  796. <ID>id_a_f_61</ID>
  797. <String>AnzwersCrawl/2.0 (anzwerscrawl@anzwers.com.au;Engine)</String>
  798. <Description>Anzwers (Yahoo) Australia robot</Description>
  799. <Type>R</Type>
  800. <Comment></Comment>
  801. <Link1>http://au.anzwers.yahoo.com/</Link1>
  802. <Link2></Link2>
  803. </user-agent>
  804. <user-agent>
  805. <ID>id_a_f_030206_1</ID>
  806. <String>Apexoo Spider 1.x</String>
  807. <Description>Apexoo Search spider</Description>
  808. <Type>R</Type>
  809. <Comment>216.240.143.xx</Comment>
  810. <Link1>http://www.apexoo.com/</Link1>
  811. <Link2></Link2>
  812. </user-agent>
  813. <user-agent>
  814. <ID>id_a_f_62</ID>
  815. <String>Aplix HTTP/1.0.1</String>
  816. <Description>JavaOS app. for SEGA Saturn Internet and Sanyo Internet-TV</Description>
  817. <Type>B</Type>
  818. <Comment></Comment>
  819. <Link1></Link1>
  820. <Link2></Link2>
  821. </user-agent>
  822. <user-agent>
  823. <ID>id_a_f_63</ID>
  824. <String>Aplix_SANYO_browser/1.x (Japanese)</String>
  825. <Description>JavaOS app. for Sanyo Internet-TV</Description>
  826. <Type>B</Type>
  827. <Comment></Comment>
  828. <Link1></Link1>
  829. <Link2></Link2>
  830. </user-agent>
  831. <user-agent>
  832. <ID>id_a_f_64</ID>
  833. <String>Aplix_SEGASATURN_browser/1.x (Japanese)</String>
  834. <Description>JavaOS app. for SEGA Saturn Internet</Description>
  835. <Type>B</Type>
  836. <Comment></Comment>
  837. <Link1></Link1>
  838. <Link2></Link2>
  839. </user-agent>
  840. <user-agent>
  841. <ID>id_a_f_65</ID>
  842. <String>Aport</String>
  843. <Description>Aport robot</Description>
  844. <Type>R</Type>
  845. <Comment></Comment>
  846. <Link1>http://www.aport.ru</Link1>
  847. <Link2></Link2>
  848. </user-agent>
  849. <user-agent>
  850. <ID>id_a_f_66</ID>
  851. <String>appie 1.1 (www.walhello.com)</String>
  852. <Description>Walhello Internet Search robot</Description>
  853. <Type>R</Type>
  854. <Comment></Comment>
  855. <Link1>http://www.walhello.com</Link1>
  856. <Link2></Link2>
  857. </user-agent>
  858. <user-agent>
  859. <ID>id_a_f_140608_1</ID>
  860. <String>Apple iPhone v1.1.4 CoreMedia v1.0.0.4A102</String>
  861. <Description>CoreMedia player on Apple iPhone</Description>
  862. <Type>B</Type>
  863. <Comment></Comment>
  864. <Link1>http://www.apple.com/iphone/</Link1>
  865. <Link2></Link2>
  866. </user-agent>
  867. <user-agent>
  868. <ID>id_a_f_070209_1</ID>
  869. <String>Apple-PubSub/65.1.1</String>
  870. <Description>PubSub - Mac OS X utility for managing RSS/Atom subscriptions via the PubSub framework</Description>
  871. <Type>B</Type>
  872. <Comment></Comment>
  873. <Link1>http://developer.apple.com/documentation/Darwin/Reference/ManPages/man1/pubsub.1.html</Link1>
  874. <Link2></Link2>
  875. </user-agent>
  876. <user-agent>
  877. <ID>id_a_f_120707_1</ID>
  878. <String>ArabyBot (compatible; Mozilla/5.0; GoogleBot; FAST Crawler 6.4; http://www.araby.com;)</String>
  879. <Description>Araby search - Arabia</Description>
  880. <Type>R</Type>
  881. <Comment>209.85.31.2xx</Comment>
  882. <Link1>http://www.araby.com/</Link1>
  883. <Link2></Link2>
  884. </user-agent>
  885. <user-agent>
  886. <ID>id_a_f_260608_1</ID>
  887. <String>ArachBot</String>
  888. <Description>Covac Arachnid Web Crawler</Description>
  889. <Type>R</Type>
  890. <Comment>s.also Covac TexAs Arachbot</Comment>
  891. <Link1>http://www.covac-software.com/</Link1>
  892. <Link2></Link2>
  893. </user-agent>
  894. <user-agent>
  895. <ID>id_a_f_67</ID>
  896. <String>Arachnoidea (arachnoidea@euroseek.com)</String>
  897. <Description>Euroseek spider</Description>
  898. <Type>R</Type>
  899. <Comment></Comment>
  900. <Link1>http://www.euroseek.com</Link1>
  901. <Link2></Link2>
  902. </user-agent>
  903. <user-agent>
  904. <ID>id_a_f_190206_2</ID>
  905. <String>aranhabot</String>
  906. <Description>Amazon.com robot for checking their affiliate sites</Description>
  907. <Type>C</Type>
  908. <Comment>s. also amzn_assoc</Comment>
  909. <Link1></Link1>
  910. <Link2></Link2>
  911. </user-agent>
  912. <user-agent>
  913. <ID>id_a_f_68</ID>
  914. <String>ArchitextSpider</String>
  915. <Description>Excite spider</Description>
  916. <Type>R</Type>
  917. <Comment></Comment>
  918. <Link1>http://www.excite.com</Link1>
  919. <Link2></Link2>
  920. </user-agent>
  921. <user-agent>
  922. <ID>id_a_f_69</ID>
  923. <String>archive.org_bot</String>
  924. <Description>Heritrix - The Internet Archive's open-source crawler (207.241.225.2xx)</Description>
  925. <Type>R</Type>
  926. <Comment>s.also - InternetArchive/0.8-dev - Mozilla/5.0 (compatible;archive.org_bot/...</Comment>
  927. <Link1>http://www.archive.org/</Link1>
  928. <Link2></Link2>
  929. </user-agent>
  930. <user-agent>
  931. <ID>id_a_f_70</ID>
  932. <String>Argus/1.1 (Nutch; http://www.simpy.com/bot.html; feedback at simpy dot com)</String>
  933. <Description>Simpy Bookmarklet crawler (69.55.233.xx)</Description>
  934. <Type>C</Type>
  935. <Comment>s. also Simpy</Comment>
  936. <Link1>http://www.simpy.com/</Link1>
  937. <Link2></Link2>
  938. </user-agent>
  939. <user-agent>
  940. <ID>id_a_f_031205_1</ID>
  941. <String>Arikus_Spider</String>
  942. <Description>Arikus inContext search engine software</Description>
  943. <Type>R</Type>
  944. <Comment></Comment>
  945. <Link1>http://www.arikus.com/inContext-enterprise.html</Link1>
  946. <Link2></Link2>
  947. </user-agent>
  948. <user-agent>
  949. <ID>id_a_f_210208_1</ID>
  950. <String>Arquivo-web-crawler  (compatible; heritrix/1.12.1 +http://arquivo-web.fccn.pt)</String>
  951. <Description>Tomba project: the Portuguese web archive</Description>
  952. <Type>R</Type>
  953. <Comment>193.136.192.xx</Comment>
  954. <Link1>http://arquivo-web.fccn.pt/</Link1>
  955. <Link2>http://arquivo-web.fccn.pt/crawler?set_language=en</Link2>
  956. </user-agent>
  957. <user-agent>
  958. <ID>id_a_f_251007_1</ID>
  959. <String>ASAHA Search Engine Turkey V.001 (http://www.asaha.com/)</String>
  960. <Description>Asaha search robot (Turkey)</Description>
  961. <Type>R</Type>
  962. <Comment>62.68.194.2xx</Comment>
  963. <Link1>http://www.asaha.com/</Link1>
  964. <Link2></Link2>
  965. </user-agent>
  966. <user-agent>
  967. <ID>id_a_f_71</ID>
  968. <String>Asahina-Antenna/1.x</String>
  969. <Description>ASAHINA Antenna information detecting agent</Description>
  970. <Type>R</Type>
  971. <Comment></Comment>
  972. <Link1>http://masshy.fastwave.gr.jp/hina/release/</Link1>
  973. <Link2></Link2>
  974. </user-agent>
  975. <user-agent>
  976. <ID>id_a_f_72</ID>
  977. <String>Asahina-Antenna/1.x (libhina.pl/x.x ; libtime.pl/x.x)</String>
  978. <Description>ASAHINA Antenna information detecting agent</Description>
  979. <Type>R</Type>
  980. <Comment></Comment>
  981. <Link1>http://masshy.fastwave.gr.jp/hina/release/</Link1>
  982. <Link2></Link2>
  983. </user-agent>
  984. <user-agent>
  985. <ID>id_a_f_73</ID>
  986. <String>ask.24x.info</String>
  987. <Description>Ask 24x Info robot</Description>
  988. <Type>R</Type>
  989. <Comment></Comment>
  990. <Link1>http://ask.24x.info/</Link1>
  991. <Link2></Link2>
  992. </user-agent>
  993. <user-agent>
  994. <ID>id_a_f_74</ID>
  995. <String>AskAboutOil/0.06-rcp (Nutch; http://www.nutch.org/docs/en/bot.html; nutch-agent@askaboutoil.com)</String>
  996. <Description>Ask About Oil - Petroleum related search (24.227.212.xxx) using Nutch</Description>
  997. <Type>R</Type>
  998. <Comment></Comment>
  999. <Link1>http://askaboutoil.com/search.jsp</Link1>
  1000. <Link2>http://www.nutch.org</Link2>
  1001. </user-agent>
  1002. <user-agent>
  1003. <ID>id_a_f_120806_1</ID>
  1004. <String>asked/Nutch-0.8 (web crawler; http://asked.jp; epicurus at gmail dot com)</String>
  1005. <Description>askEd! / Inferret search (Japan) robot using Nutch</Description>
  1006. <Type>R</Type>
  1007. <Comment>131.112.125.1xx</Comment>
  1008. <Link1>http://asked.jp/</Link1>
  1009. <Link2></Link2>
  1010. </user-agent>
  1011. <user-agent>
  1012. <ID>id_a_f_75</ID>
  1013. <String>ASPSeek/1.2.5</String>
  1014. <Description>ASPSeek search engine software -Yahoo-Inc. / Telecom Canada robot </Description>
  1015. <Type>R</Type>
  1016. <Comment></Comment>
  1017. <Link1>http://www.aspseek.org</Link1>
  1018. <Link2></Link2>
  1019. </user-agent>
  1020. <user-agent>
  1021. <ID>id_a_f_76</ID>
  1022. <String>ASPseek/1.2.9d</String>
  1023. <Description>Swsoft.net robot using Aspseek</Description>
  1024. <Type>R</Type>
  1025. <Comment></Comment>
  1026. <Link1>http://www.aspseek.com</Link1>
  1027. <Link2></Link2>
  1028. </user-agent>
  1029. <user-agent>
  1030. <ID>id_a_f_77</ID>
  1031. <String>ASPSeek/1.2.x</String>
  1032. <Description>ASPSeek search engine software</Description>
  1033. <Type>R</Type>
  1034. <Comment></Comment>
  1035. <Link1>http://www.aspseek.org</Link1>
  1036. <Link2></Link2>
  1037. </user-agent>
  1038. <user-agent>
  1039. <ID>id_a_f_78</ID>
  1040. <String>ASPSeek/1.2.xa</String>
  1041. <Description>ASPSeek search engine software</Description>
  1042. <Type>R</Type>
  1043. <Comment></Comment>
  1044. <Link1>http://www.aspseek.org</Link1>
  1045. <Link2></Link2>
  1046. </user-agent>
  1047. <user-agent>
  1048. <ID>id_a_f_79</ID>
  1049. <String>ASPseek/1.2.xx</String>
  1050. <Description>ASPSeek search engine software</Description>
  1051. <Type>R</Type>
  1052. <Comment></Comment>
  1053. <Link1>http://www.aspseek.org</Link1>
  1054. <Link2></Link2>
  1055. </user-agent>
  1056. <user-agent>
  1057. <ID>id_a_f_80</ID>
  1058. <String>ASPSeek/1.2.xxpre</String>
  1059. <Description>ASPSeek search engine software</Description>
  1060. <Type>R</Type>
  1061. <Comment></Comment>
  1062. <Link1>http://www.aspseek.org</Link1>
  1063. <Link2></Link2>
  1064. </user-agent>
  1065. <user-agent>
  1066. <ID>id_a_f_81</ID>
  1067. <String>ASSORT/0.10</String>
  1068. <Description>Associative Sort robot</Description>
  1069. <Type>R</Type>
  1070. <Comment>site is down</Comment>
  1071. <Link1>http://pcmath126.unice.fr/assort-robot.html</Link1>
  1072. <Link2></Link2>
  1073. </user-agent>
  1074. <user-agent>
  1075. <ID>id_a_f_82</ID>
  1076. <String>asterias/2.0</String>
  1077. <Description>Singingfish media spider (64.12.186.2xx) via AOL search</Description>
  1078. <Type>R</Type>
  1079. <Comment>s. also Mozilla/4.0 (compatible; MSIE 6.0 compatible; Asterias Crawler ...</Comment>
  1080. <Link1>http://search.singingfish.com/sfw/home.jsp</Link1>
  1081. <Link2></Link2>
  1082. </user-agent>
  1083. <user-agent>
  1084. <ID>id_a_f_83</ID>
  1085. <String>AtlocalBot/1.1 +(http://www.atlocal.com/local-web-site-owner.html)</String>
  1086. <Description>Atlocal local business search robot</Description>
  1087. <Type>R</Type>
  1088. <Comment></Comment>
  1089. <Link1>http://www.atlocal.com/</Link1>
  1090. <Link2></Link2>
  1091. </user-agent>
  1092. <user-agent>
  1093. <ID>id_a_f_041207_2</ID>
  1094. <String>Atomic_Email_Hunter/4.0</String>
  1095. <Description>Atomic Email Hunter email extracting and harvesting</Description>
  1096. <Type>S</Type>
  1097. <Comment></Comment>
  1098. <Link1></Link1>
  1099. <Link2></Link2>
  1100. </user-agent>
  1101. <user-agent>
  1102. <ID>id_a_f_84</ID>
  1103. <String>Atomz/1.0</String>
  1104. <Description>Atomz robot</Description>
  1105. <Type>R</Type>
  1106. <Comment></Comment>
  1107. <Link1>http://www.atomz.com</Link1>
  1108. <Link2></Link2>
  1109. </user-agent>
  1110. <user-agent>
  1111. <ID>id_a_f_85</ID>
  1112. <String>atSpider/1.0</String>
  1113. <Description>atSpider (ceased) email harvester / spambot</Description>
  1114. <Type>S</Type>
  1115. <Comment></Comment>
  1116. <Link1></Link1>
  1117. <Link2></Link2>
  1118. </user-agent>
  1119. <user-agent>
  1120. <ID>id_a_f_060707_1</ID>
  1121. <String>Attentio/Nutch-0.9-dev (Attentio's beta blog crawler; www.attentio.com; info@attentio.com)</String>
  1122. <Description>Attentio social media monitoring and analysing </Description>
  1123. <Type>R</Type>
  1124. <Comment>85.88.35.xx</Comment>
  1125. <Link1>http://www.attentio.com/</Link1>
  1126. <Link2></Link2>
  1127. </user-agent>
  1128. <user-agent>
  1129. <ID>id_a_f_231105_2</ID>
  1130. <String>AU-MIC/2.0 MMP/2.0</String>
  1131. <Description>Samsung SPH-A660 phone with Sprint software</Description>
  1132. <Type>B</Type>
  1133. <Comment></Comment>
  1134. <Link1>http://www1.sprintpcs.com/explore/showcase/Showcase.jsp?scTopic=pcsVision</Link1>
  1135. <Link2></Link2>
  1136. </user-agent>
  1137. <user-agent>
  1138. <ID>id_a_f_240208_1</ID>
  1139. <String>AUDIOVOX-SMT5600</String>
  1140. <Description>Audiovox SMT5600 (AT&#38;T) Smartphone mobile phone browser</Description>
  1141. <Type>B</Type>
  1142. <Comment></Comment>
  1143. <Link1>http://www.audiovox.com/</Link1>
  1144. <Link2>http://www.audiovox.com/manuals/owners/SMT%205600%20QSG%209-7%20FINAL.pdf</Link2>
  1145. </user-agent>
  1146. <user-agent>
  1147. <ID>id_a_f_86</ID>
  1148. <String>augurfind</String>
  1149. <Description>Augurnet Swiss (was www.augurnet.ch) search robot</Description>
  1150. <Type>R</Type>
  1151. <Comment></Comment>
  1152. <Link1></Link1>
  1153. <Link2></Link2>
  1154. </user-agent>
  1155. <user-agent>
  1156. <ID>id_a_f_87</ID>
  1157. <String>augurnfind V-1.x</String>
  1158. <Description>Augurnet Swiss (was www.augurnet.ch) search robot</Description>
  1159. <Type>R</Type>
  1160. <Comment></Comment>
  1161. <Link1></Link1>
  1162. <Link2></Link2>
  1163. </user-agent>
  1164. <user-agent>
  1165. <ID>id_a_f_88</ID>
  1166. <String>autoemailspider</String>
  1167. <Description>Auto Email Pro Email harvester</Description>
  1168. <Type>S</Type>
  1169. <Comment>was http://autoemailspider.com - site is dead</Comment>
  1170. <Link1></Link1>
  1171. <Link2></Link2>
  1172. </user-agent>
  1173. <user-agent>
  1174. <ID>id_a_f_89</ID>
  1175. <String>autohttp</String>
  1176. <Description>Linkscan tool from Elsop</Description>
  1177. <Type>C</Type>
  1178. <Comment>s. Linkscan/x ?</Comment>
  1179. <Link1>http://www.elsop.com/linkscan/</Link1>
  1180. <Link2></Link2>
  1181. </user-agent>
  1182. <user-agent>
  1183. <ID>id_a_f_050208_1</ID>
  1184. <String>autowebdir 1.1 (www.autowebdir.com)</String>
  1185. <Description>Autowebdir - The Automatically Generated Web Directory</Description>
  1186. <Type>R</Type>
  1187. <Comment>84.104.43.x</Comment>
  1188. <Link1>http://www.autowebdir.com/</Link1>
  1189. <Link2></Link2>
  1190. </user-agent>
  1191. <user-agent>
  1192. <ID>id_a_f_90</ID>
  1193. <String>AV Fetch 1.0</String>
  1194. <Description>Altavista robot ??</Description>
  1195. <Type>R</Type>
  1196. <Comment></Comment>
  1197. <Link1>http://www.altavista.com/</Link1>
  1198. <Link2></Link2>
  1199. </user-agent>
  1200. <user-agent>
  1201. <ID>id_a_f_91</ID>
  1202. <String>Avant Browser (http://www.avantbrowser.com)</String>
  1203. <Description>Avant Browser - IE based browser</Description>
  1204. <Type>B</Type>
  1205. <Comment></Comment>
  1206. <Link1>http://www.avantbrowser.com</Link1>
  1207. <Link2></Link2>
  1208. </user-agent>
  1209. <user-agent>
  1210. <ID>id_a_f_92</ID>
  1211. <String>AVSearch-1.0(peter.turney@nrc.ca)</String>
  1212. <Description>National Research Council Canada robot</Description>
  1213. <Type>R</Type>
  1214. <Comment></Comment>
  1215. <Link1>http://www.nrc-cnrc.gc.ca/main_e.html</Link1>
  1216. <Link2></Link2>
  1217. </user-agent>
  1218. <user-agent>
  1219. <ID>id_a_f_93</ID>
  1220. <String>AVSearch-2.0-fusionIdx-14-CompetitorWebSites</String>
  1221. <Description>Unknown robot from 205.203.108.xx (telerate.com)</Description>
  1222. <Type></Type>
  1223. <Comment></Comment>
  1224. <Link1></Link1>
  1225. <Link2></Link2>
  1226. </user-agent>
  1227. <user-agent>
  1228. <ID>id_a_f_94</ID>
  1229. <String>AVSearch-3.0(AltaVista/AVC)</String>
  1230. <Description>Altavista robot</Description>
  1231. <Type>R</Type>
  1232. <Comment></Comment>
  1233. <Link1>http://www.altavista.com/</Link1>
  1234. <Link2></Link2>
  1235. </user-agent>
  1236. <user-agent>
  1237. <ID>id_a_f_95</ID>
  1238. <String>AWeb</String>
  1239. <Description>AWeb Amiga browser</Description>
  1240. <Type>B</Type>
  1241. <Comment></Comment>
  1242. <Link1>http://aweb.sunsite.dk/</Link1>
  1243. <Link2></Link2>
  1244. </user-agent>
  1245. <user-agent>
  1246. <ID>id_a_f_96</ID>
  1247. <String>axadine/ (Axadine Crawler; http://www.axada.de/; )</String>
  1248. <Description>Axada search Germany robot</Description>
  1249. <Type>R</Type>
  1250. <Comment></Comment>
  1251. <Link1>http://www.axada.de</Link1>
  1252. <Link2></Link2>
  1253. </user-agent>
  1254. <user-agent>
  1255. <ID>id_a_f_97</ID>
  1256. <String>AxmoRobot - Crawling your site for better indexing on www.axmo.com search engine.</String>
  1257. <Description>Axmo search robot</Description>
  1258. <Type>R</Type>
  1259. <Comment></Comment>
  1260. <Link1>http://www.axmo.com</Link1>
  1261. <Link2></Link2>
  1262. </user-agent>
  1263. <user-agent>
  1264. <ID>id_a_f_250306_1</ID>
  1265. <String>Azureus 2.x.x.x</String>
  1266. <Description>Azureus Java BitTorrent Client</Description>
  1267. <Type>D</Type>
  1268. <Comment></Comment>
  1269. <Link1>http://azureus.sourceforge.net/</Link1>
  1270. <Link2></Link2>
  1271. </user-agent>
  1272. <user-agent>
  1273. <ID>id_a_f_131208_1</ID>
  1274. <String>BabalooSpider/1.3 (BabalooSpider; http://www.babaloo.si; spider@babaloo.si)</String>
  1275. <Description>Babaloo search robot (Slovenia)</Description>
  1276. <Type>R</Type>
  1277. <Comment>84.255.237.2xx</Comment>
  1278. <Link1>http://www.babaloo.si/</Link1>
  1279. <Link2></Link2>
  1280. </user-agent>
  1281. <user-agent>
  1282. <ID>id_a_f_98</ID>
  1283. <String>BaboomBot/1.x.x (+http://www.baboom.us)</String>
  1284. <Description>BaBoom Web Portal (ODP) robot (66.98.254.xx)</Description>
  1285. <Type>R</Type>
  1286. <Comment></Comment>
  1287. <Link1>http://www.baboom.us</Link1>
  1288. <Link2></Link2>
  1289. </user-agent>
  1290. <user-agent>
  1291. <ID>id_a_f_050406_1</ID>
  1292. <String>BackStreet Browser 3.x</String>
  1293. <Description>BackStreet Browser - Offline browser / website downloader</Description>
  1294. <Type>D</Type>
  1295. <Comment></Comment>
  1296. <Link1>http://www.spadixbd.com/backstreet/</Link1>
  1297. <Link2></Link2>
  1298. </user-agent>
  1299. <user-agent>
  1300. <ID>id_a_f_140508_1</ID>
  1301. <String>BaiduImagespider+(+http://www.baidu.jp/search/s308.html)</String>
  1302. <Description>Baidu search (Japan) image crawler</Description>
  1303. <Type>R</Type>
  1304. <Comment>119.63.193.94.[x]xx</Comment>
  1305. <Link1>http://www.baidu.jp/</Link1>
  1306. <Link2></Link2>
  1307. </user-agent>
  1308. <user-agent>
  1309. <ID>id_a_f_99</ID>
  1310. <String>BaiDuSpider</String>
  1311. <Description>Baidu spidering engine - used by diff. IPs</Description>
  1312. <Type>R</Type>
  1313. <Comment></Comment>
  1314. <Link1>http://www.baidu.com</Link1>
  1315. <Link2></Link2>
  1316. </user-agent>
  1317. <user-agent>
  1318. <ID>id_a_f_080608_1</ID>
  1319. <String>Baiduspider+(+http://help.baidu.jp/system/05.html)</String>
  1320. <Description>Baidu spidering engine - used by diff. IPs</Description>
  1321. <Type>R</Type>
  1322. <Comment></Comment>
  1323. <Link1>http://www.baidu.com</Link1>
  1324. <Link2></Link2>
  1325. </user-agent>
  1326. <user-agent>
  1327. <ID>id_a_f_100</ID>
  1328. <String>Baiduspider+(+http://www.baidu.com/search/spider.htm)</String>
  1329. <Description>Baidu spidering engine - used by diff. IPs</Description>
  1330. <Type>R</Type>
  1331. <Comment></Comment>
  1332. <Link1>http://www.baidu.com</Link1>
  1333. <Link2></Link2>
  1334. </user-agent>
  1335. <user-agent>
  1336. <ID>id_a_f_080407_1</ID>
  1337. <String>Baiduspider+(+http://www.baidu.com/search/spider_jp.html)</String>
  1338. <Description>Baidu search (Japan) crawler</Description>
  1339. <Type>R</Type>
  1340. <Comment>119.63.193.[x]xx</Comment>
  1341. <Link1>http://www.baidu.jp</Link1>
  1342. <Link2></Link2>
  1343. </user-agent>
  1344. <user-agent>
  1345. <ID>id_a_f_031107_1</ID>
  1346. <String>Balihoo/Nutch-1.0-dev (Crawler for Balihoo.com search engine - obeys robots.txt and robots meta tags ; http://balihoo.com/index.aspx; robot at balihoo dot com)</String>
  1347. <Description>Balihoo - Vertical search engine crawler (beta)</Description>
  1348. <Type>R</Type>
  1349. <Comment></Comment>
  1350. <Link1>http://www.balihoo.com/</Link1>
  1351. <Link2>http://www.balihoo.com/pdfs/BalihooFactSheet.pdf</Link2>
  1352. </user-agent>
  1353. <user-agent>
  1354. <ID>id_a_f_101</ID>
  1355. <String>BanBots/1.2 (spider@banbots.com)</String>
  1356. <Description>Project BanBots Perl script robot</Description>
  1357. <Type>C</Type>
  1358. <Comment>s. also Mozilla/5.0 (compatible; BanBots/2.0b..</Comment>
  1359. <Link1>http://www.banbots.com/</Link1>
  1360. <Link2></Link2>
  1361. </user-agent>
  1362. <user-agent>
  1363. <ID>id_a_f_140506_3</ID>
  1364. <String>Barca/2.0.xxxx</String>
  1365. <Description>Barca Pro email &amp; PIM software</Description>
  1366. <Type>B</Type>
  1367. <Comment></Comment>
  1368. <Link1>http://www.pocosystems.com/home/index.php?option=com_content&amp;task=view&amp;id=105&amp;Itemid=54</Link1>
  1369. <Link2></Link2>
  1370. </user-agent>
  1371. <user-agent>
  1372. <ID>id_a_f_120206_2</ID>
  1373. <String>BarcaPro/1.4.xxxx</String>
  1374. <Description>Barca Pro email &amp; PIM software</Description>
  1375. <Type>B</Type>
  1376. <Comment></Comment>
  1377. <Link1>http://www.pocosystems.com/home/index.php?option=com_content&amp;task=view&amp;id=105&amp;Itemid=54</Link1>
  1378. <Link2></Link2>
  1379. </user-agent>
  1380. <user-agent>
  1381. <ID>id_a_f_102</ID>
  1382. <String>BarraHomeCrawler (albertof@barrahome.org)</String>
  1383. <Description>Barrahome crawler</Description>
  1384. <Type>R</Type>
  1385. <Comment>64.246.56.xx</Comment>
  1386. <Link1>http://www.barrahome.org</Link1>
  1387. <Link2></Link2>
  1388. </user-agent>
  1389. <user-agent>
  1390. <ID>id_a_f_011006_1</ID>
  1391. <String>bCentral Billing Post-Process</String>
  1392. <Description>Unknown user agent from Microsoft</Description>
  1393. <Type></Type>
  1394. <Comment>204.71.191.1xx</Comment>
  1395. <Link1></Link1>
  1396. <Link2></Link2>
  1397. </user-agent>
  1398. <user-agent>
  1399. <ID>id_a_f_103</ID>
  1400. <String>bdcindexer_2.6.2 (research@bdc)</String>
  1401. <Description>Business.com robot</Description>
  1402. <Type>R</Type>
  1403. <Comment>208.144.233.xxx</Comment>
  1404. <Link1>http://www.business.com</Link1>
  1405. <Link2></Link2>
  1406. </user-agent>
  1407. <user-agent>
  1408. <ID>id_a_f_104</ID>
  1409. <String>BDFetch</String>
  1410. <Description>Brandimensions Brand Protection robot</Description>
  1411. <Type>R</Type>
  1412. <Comment></Comment>
  1413. <Link1>http://www.brandimensions.com/</Link1>
  1414. <Link2></Link2>
  1415. </user-agent>
  1416. <user-agent>
  1417. <ID>id_a_f_105</ID>
  1418. <String>BDNcentral Crawler v2.3 [en] (http://www.bdncentral.com/robot.html) (X11; I; Linux 2.0.44 i686)</String>
  1419. <Description>Bdncentral Sitesearch robot</Description>
  1420. <Type>R</Type>
  1421. <Comment></Comment>
  1422. <Link1>http://www.bdncentral.com</Link1>
  1423. <Link2></Link2>
  1424. </user-agent>
  1425. <user-agent>
  1426. <ID>id_a_f_111205_3</ID>
  1427. <String>BeamMachine/0.5 (dead link remover of www.beammachine.net)</String>
  1428. <Description>beammachine web directory (Germany) link checking</Description>
  1429. <Type>R C</Type>
  1430. <Comment></Comment>
  1431. <Link1>http://www.beammachine.net/de/</Link1>
  1432. <Link2></Link2>
  1433. </user-agent>
  1434. <user-agent>
  1435. <ID>id_a_f_106</ID>
  1436. <String>beautybot/1.0 (+http://www.uchoose.de/crawler/beautybot/)</String>
  1437. <Description>Beauty robot for Cosmoty - German beauty and wellness search</Description>
  1438. <Type>R</Type>
  1439. <Comment></Comment>
  1440. <Link1>http://www.cosmoty.de</Link1>
  1441. <Link2>http://www.uchoose.de/Projekte/Lifestyle/beauty/</Link2>
  1442. </user-agent>
  1443. <user-agent>
  1444. <ID>id_a_f_230406_1</ID>
  1445. <String>BebopBot/2.5.1 ( crawler http://www.apassion4jazz.net/bebopbot.html )</String>
  1446. <Description>A Passion for Jazz music related search robot</Description>
  1447. <Type>R</Type>
  1448. <Comment>68.6.204.2xx</Comment>
  1449. <Link1>http://www.apassion4jazz.net/</Link1>
  1450. <Link2></Link2>
  1451. </user-agent>
  1452. <user-agent>
  1453. <ID>id_a_f_107</ID>
  1454. <String>BeebwareDirectory/v0.01</String>
  1455. <Description>Linkchecker Beebware (site is down) web directory link checking</Description>
  1456. <Type>C</Type>
  1457. <Comment></Comment>
  1458. <Link1>http://directory.beebware.co.uk</Link1>
  1459. <Link2></Link2>
  1460. </user-agent>
  1461. <user-agent>
  1462. <ID>id_a_f_108</ID>
  1463. <String>Big Brother (http://pauillac.inria.fr/~fpottier/)</String>
  1464. <Description>Big Brother link checking tool</Description>
  1465. <Type>C</Type>
  1466. <Comment></Comment>
  1467. <Link1>http://pauillac.inria.fr</Link1>
  1468. <Link2></Link2>
  1469. </user-agent>
  1470. <user-agent>
  1471. <ID>id_a_f_130606_1</ID>
  1472. <String>Big Fish v1.0</String>
  1473. <Description>GoonGee.com link popularity checking</Description>
  1474. <Type>C</Type>
  1475. <Comment>216.89.111.x</Comment>
  1476. <Link1>http://www.goongee.com/big-fish/</Link1>
  1477. <Link2></Link2>
  1478. </user-agent>
  1479. <user-agent>
  1480. <ID>id_a_f_109</ID>
  1481. <String>BigBrother/1.6e</String>
  1482. <Description>BB4 network monitoring</Description>
  1483. <Type>C</Type>
  1484. <Comment></Comment>
  1485. <Link1>http://www.bb4.com</Link1>
  1486. <Link2></Link2>
  1487. </user-agent>
  1488. <user-agent>
  1489. <ID>id_a_f_110</ID>
  1490. <String>BigCliqueBOT/1.03-dev (bigclicbot; http://www.bigclique.com; bot@bigclique.com)</String>
  1491. <Description>BigClique Search robot</Description>
  1492. <Type>R</Type>
  1493. <Comment></Comment>
  1494. <Link1>http://www.bigclique.com</Link1>
  1495. <Link2></Link2>
  1496. </user-agent>
  1497. <user-agent>
  1498. <ID>id_a_f_080206_4</ID>
  1499. <String>BIGLOTRON (Beta 2;GNU/Linux)</String>
  1500. <Description>Biglotron search (France) robot</Description>
  1501. <Type>R</Type>
  1502. <Comment></Comment>
  1503. <Link1>http://www.biglotron.com/</Link1>
  1504. <Link2></Link2>
  1505. </user-agent>
  1506. <user-agent>
  1507. <ID>id_a_f_171106_2</ID>
  1508. <String>Bigsearch.ca/Nutch-x.x-dev (Bigsearch.ca Internet Spider; http://www.bigsearch.ca/; info@enhancededge.com)</String>
  1509. <Description>Bigsearch.ca search robot</Description>
  1510. <Type>R</Type>
  1511. <Comment>72.0.207.1xx</Comment>
  1512. <Link1>http://www.bigsearch.ca/</Link1>
  1513. <Link2></Link2>
  1514. </user-agent>
  1515. <user-agent>
  1516. <ID>id_a_f_111</ID>
  1517. <String>Bilbo/2.3b-UNIX</String>
  1518. <Description>Bilbo - web frontend for the Nessus Security Scanner</Description>
  1519. <Type>C</Type>
  1520. <Comment></Comment>
  1521. <Link1>http://home.broadpark.no/%7Etnilsen-1/Linux/Bilbo_-_Nessus_WEB/bilbo_-_nessus_web.html</Link1>
  1522. <Link2></Link2>
  1523. </user-agent>
  1524. <user-agent>
  1525. <ID>id_a_f_170806_1</ID>
  1526. <String>BilgiBetaBot/0.8-dev (bilgi.com (Beta) ; http://lucene.apache.org/nutch/bot.html; nutch-agent@lucene.apache.org)</String>
  1527. <Description>Bilgi.com (Beta) search robot - Turkey</Description>
  1528. <Type>R</Type>
  1529. <Comment>212.156.230.2xx</Comment>
  1530. <Link1>http://www.bilgi.com/</Link1>
  1531. <Link2></Link2>
  1532. </user-agent>
  1533. <user-agent>
  1534. <ID>id_a_f_080607_1</ID>
  1535. <String>BilgiBot/1.0(beta) (http://www.bilgi.com/; bilgi at bilgi dot com)</String>
  1536. <Description>Bilgi.com (Beta) search robot - Turkey</Description>
  1537. <Type>R</Type>
  1538. <Comment>212.156.230.2xx</Comment>
  1539. <Link1>http://www.bilgi.com/</Link1>
  1540. <Link2></Link2>
  1541. </user-agent>
  1542. <user-agent>
  1543. <ID>id_a_f_112</ID>
  1544. <String>billbot wjj@cs.cmu.edu</String>
  1545. <Description>Carnegie Mellon School robot/link checking ?</Description>
  1546. <Type>C</Type>
  1547. <Comment></Comment>
  1548. <Link1>http://www.cs.cmu.edu</Link1>
  1549. <Link2></Link2>
  1550. </user-agent>
  1551. <user-agent>
  1552. <ID>id_a_f_050206_3</ID>
  1553. <String>Bitacle bot/1.1</String>
  1554. <Description>Bitacle Blog Search Archive robot</Description>
  1555. <Type>R</Type>
  1556. <Comment></Comment>
  1557. <Link1>http://bitacle.org/</Link1>
  1558. <Link2></Link2>
  1559. </user-agent>
  1560. <user-agent>
  1561. <ID>id_a_f_050206_2</ID>
  1562. <String>Bitacle Robot (V:1.0;) (http://www.bitacle.com)</String>
  1563. <Description>Bitacle Blog Search Archive robot</Description>
  1564. <Type>R</Type>
  1565. <Comment></Comment>
  1566. <Link1>http://bitacle.org/</Link1>
  1567. <Link2></Link2>
  1568. </user-agent>
  1569. <user-agent>
  1570. <ID>id_a_f_113</ID>
  1571. <String>Biyubi/x.x (Sistema Fenix; G11; Familia Toledo; es-mx)</String>
  1572. <Description>Biyubi Navigator - Mexican browser for Fenix OS</Description>
  1573. <Type>B</Type>
  1574. <Comment></Comment>
  1575. <Link1>http://www.biyubi.com</Link1>
  1576. <Link2></Link2>
  1577. </user-agent>
  1578. <user-agent>
  1579. <ID>id_a_f_114</ID>
  1580. <String>BlackBerry7520/4.0.0 Profile/MIDP-2.0 Configuration/CLDC-1.1 UP.Browser/5.0.3.3 UP.Link/5.1.2.12 (Google WAP Proxy/1.0)</String>
  1581. <Description>Blackberry Wireless Internet browser via Google WAP Proxy</Description>
  1582. <Type>B P</Type>
  1583. <Comment></Comment>
  1584. <Link1>http://www.blackberry.com/products/service/web.shtml</Link1>
  1585. <Link2>http://www.openwave.com</Link2>
  1586. </user-agent>
  1587. <user-agent>
  1588. <ID>id_a_f_115</ID>
  1589. <String>BlackWidow</String>
  1590. <Description>FS Consulting (was www.fsconsult.net) Black Widow web crawler</Description>
  1591. <Type>R</Type>
  1592. <Comment></Comment>
  1593. <Link1></Link1>
  1594. <Link2></Link2>
  1595. </user-agent>
  1596. <user-agent>
  1597. <ID>id_a_f_010306_1</ID>
  1598. <String>BlackWidow</String>
  1599. <Description>BlackWidow web site scanner / downloading tool</Description>
  1600. <Type>D</Type>
  1601. <Comment></Comment>
  1602. <Link1>http://www.softbytelabs.com/BlackWidow</Link1>
  1603. <Link2></Link2>
  1604. </user-agent>
  1605. <user-agent>
  1606. <ID>id_a_f_116</ID>
  1607. <String>Blaiz-Bee/1.0 (+http://www.blaiz.net)</String>
  1608. <Description>Blaiz Enterprises RawGrunt search</Description>
  1609. <Type>R</Type>
  1610. <Comment>203.87.123.1xx</Comment>
  1611. <Link1>http://www.rawgrunt.com/</Link1>
  1612. <Link2>http://www.blaiz.net</Link2>
  1613. </user-agent>
  1614. <user-agent>
  1615. <ID>id_a_f_160307_1</ID>
  1616. <String>Blaiz-Bee/2.00.8222 (BE Internet Search Engine http://www.rawgrunt.com)</String>
  1617. <Description>Blaiz Enterprises RawGrunt search</Description>
  1618. <Type>R</Type>
  1619. <Comment>203.87.123.1xx</Comment>
  1620. <Link1>http://www.rawgrunt.com/</Link1>
  1621. <Link2>http://www.blaiz.net</Link2>
  1622. </user-agent>
  1623. <user-agent>
  1624. <ID>id_a_f_240706_1</ID>
  1625. <String>Blaiz-Bee/2.00.xxxx (+http://www.blaiz.net)</String>
  1626. <Description>Blaiz Enterprises RawGrunt search</Description>
  1627. <Type>R</Type>
  1628. <Comment>203.87.123.1xx</Comment>
  1629. <Link1>http://www.rawgrunt.com/</Link1>
  1630. <Link2>http://www.blaiz.net</Link2>
  1631. </user-agent>
  1632. <user-agent>
  1633. <ID>id_a_f_117</ID>
  1634. <String>BlitzBOT@tricus.net</String>
  1635. <Description>Blitzsuche Germany robot</Description>
  1636. <Type>R</Type>
  1637. <Comment></Comment>
  1638. <Link1>http://blitzsuche.rp-online.de/</Link1>
  1639. <Link2></Link2>
  1640. </user-agent>
  1641. <user-agent>
  1642. <ID>id_a_f_118</ID>
  1643. <String>BlitzBOT@tricus.net (Mozilla compatible)</String>
  1644. <Description>Blitzsuche Germany robot</Description>
  1645. <Type>R</Type>
  1646. <Comment></Comment>
  1647. <Link1>http://blitzsuche.rp-online.de/</Link1>
  1648. <Link2></Link2>
  1649. </user-agent>
  1650. <user-agent>
  1651. <ID>id_a_f_090307_1</ID>
  1652. <String>BlockNote.Net</String>
  1653. <Description>BlockNote web page editor</Description>
  1654. <Type>B</Type>
  1655. <Comment></Comment>
  1656. <Link1>http://blocknote.net/</Link1>
  1657. <Link2></Link2>
  1658. </user-agent>
  1659. <user-agent>
  1660. <ID>id_a_f_119</ID>
  1661. <String>BlogBot/1.x</String>
  1662. <Description>blogdex robot from MIT.edu</Description>
  1663. <Type>R</Type>
  1664. <Comment></Comment>
  1665. <Link1>http://blogdex.media.mit.edu/</Link1>
  1666. <Link2></Link2>
  1667. </user-agent>
  1668. <user-agent>
  1669. <ID>id_a_f_071206_1</ID>
  1670. <String>BlogBridge 2.13 (http://www.blogbridge.com/)</String>
  1671. <Description>BlogBridge RSS reader</Description>
  1672. <Type>B</Type>
  1673. <Comment></Comment>
  1674. <Link1>http://www.blogbridge.com/</Link1>
  1675. <Link2></Link2>
  1676. </user-agent>
  1677. <user-agent>
  1678. <ID>id_a_f_120</ID>
  1679. <String>Bloglines Title Fetch/1.0 (http://www.bloglines.com)</String>
  1680. <Description>Bloglines article search</Description>
  1681. <Type>R</Type>
  1682. <Comment>65.214.44.xx</Comment>
  1683. <Link1>http://www.bloglines.com</Link1>
  1684. <Link2></Link2>
  1685. </user-agent>
  1686. <user-agent>
  1687. <ID>id_a_f_250907_1</ID>
  1688. <String>Bloglines-Images/0.1 (http://www.bloglines.com)</String>
  1689. <Description>Bloglines graphics crawler</Description>
  1690. <Type>R</Type>
  1691. <Comment>65.214.44.xx</Comment>
  1692. <Link1>http://www.bloglines.com</Link1>
  1693. <Link2></Link2>
  1694. </user-agent>
  1695. <user-agent>
  1696. <ID>id_a_f_011108_2</ID>
  1697. <String>Bloglines/3.1 (http://www.bloglines.com)</String>
  1698. <Description>Bloglines news crawler</Description>
  1699. <Type>R</Type>
  1700. <Comment>65.214.44.xx</Comment>
  1701. <Link1>http://www.bloglines.com</Link1>
  1702. <Link2></Link2>
  1703. </user-agent>
  1704. <user-agent>
  1705. <ID>id_a_f_071206_2</ID>
  1706. <String>BlogMap (http://www.feedmap.net)</String>
  1707. <Description>FeedMap / BlogMap geo coding service</Description>
  1708. <Type>C</Type>
  1709. <Comment></Comment>
  1710. <Link1>http://www.feedmap.net/BlogMap/</Link1>
  1711. <Link2></Link2>
  1712. </user-agent>
  1713. <user-agent>
  1714. <ID>id_a_f_121</ID>
  1715. <String>Blogpulse (info@blogpulse.com)</String>
  1716. <Description>Intelliseek's BlogPulse blog search</Description>
  1717. <Type>R</Type>
  1718. <Comment>64.158.138.xx</Comment>
  1719. <Link1>http://www.blogpulse.com</Link1>
  1720. <Link2></Link2>
  1721. </user-agent>
  1722. <user-agent>
  1723. <ID>id_a_f_050208_2</ID>
  1724. <String>BlogPulseLive (support@blogpulse.com)</String>
  1725. <Description>Intelliseek's BlogPulse blog search</Description>
  1726. <Type>R</Type>
  1727. <Comment>64.158.138.xx</Comment>
  1728. <Link1>http://www.blogpulse.com</Link1>
  1729. <Link2></Link2>
  1730. </user-agent>
  1731. <user-agent>
  1732. <ID>id_a_f_161206_2</ID>
  1733. <String>BlogSearch/1.x +http://www.icerocket.com/</String>
  1734. <Description>IceRocket Web search robot</Description>
  1735. <Type>R</Type>
  1736. <Comment>s. also BlogzIce ...</Comment>
  1737. <Link1>http://www.icerocket.com</Link1>
  1738. <Link2></Link2>
  1739. </user-agent>
  1740. <user-agent>
  1741. <ID>id_a_f_020707_1</ID>
  1742. <String>blogsearchbot-pumpkin-3</String>
  1743. <Description>Art of Computing blog search project</Description>
  1744. <Type>R</Type>
  1745. <Comment>88.198.44.2xx</Comment>
  1746. <Link1>http://artofcomputing.net/blog/?p=4</Link1>
  1747. <Link2></Link2>
  1748. </user-agent>
  1749. <user-agent>
  1750. <ID>id_a_f_241205_1</ID>
  1751. <String>BlogsNowBot&#44; V 2.01 (+http://www.blogsnow.com/)</String>
  1752. <Description>BlogsNow realtime link tracker robot</Description>
  1753. <Type>R</Type>
  1754. <Comment></Comment>
  1755. <Link1>http://www.blogsnow.com/</Link1>
  1756. <Link2></Link2>
  1757. </user-agent>
  1758. <user-agent>
  1759. <ID>id_a_f_261107_1</ID>
  1760. <String>BlogVibeBot-v1.1 (spider@blogvibe.nl)</String>
  1761. <Description>BlogVibe news and Blog crawler (Netherlands)</Description>
  1762. <Type>R</Type>
  1763. <Comment>212.61.21.xx</Comment>
  1764. <Link1>http://www.blogvibe.nl</Link1>
  1765. <Link2></Link2>
  1766. </user-agent>
  1767. <user-agent>
  1768. <ID>id_a_f_122</ID>
  1769. <String>blogWatcher_Spider/0.1 (http://www.lr.pi.titech.ac.jp/blogWatcher/)</String>
  1770. <Description>blogWatcher robot from Okumura Group Tokyo (131.112.182.xxx)</Description>
  1771. <Type>R</Type>
  1772. <Comment></Comment>
  1773. <Link1>http://www.lr.pi.titech.ac.jp</Link1>
  1774. <Link2></Link2>
  1775. </user-agent>
  1776. <user-agent>
  1777. <ID>id_a_f_123</ID>
  1778. <String>BlogzIce/1.0 (+http://icerocket.com; rhodes@icerocket.com)</String>
  1779. <Description>IceRocket Web search robot</Description>
  1780. <Type>R</Type>
  1781. <Comment>s. also BlogSearch ...</Comment>
  1782. <Link1>http://www.icerocket.com</Link1>
  1783. <Link2></Link2>
  1784. </user-agent>
  1785. <user-agent>
  1786. <ID>id_a_f_124</ID>
  1787. <String>BlogzIce/1.0 +http://www.icerocket.com/</String>
  1788. <Description>IceRocket Web search robot</Description>
  1789. <Type>R</Type>
  1790. <Comment>s. also BlogSearch ...</Comment>
  1791. <Link1>http://www.icerocket.com</Link1>
  1792. <Link2></Link2>
  1793. </user-agent>
  1794. <user-agent>
  1795. <ID>id_a_f_310108_1</ID>
  1796. <String>BloobyBot</String>
  1797. <Description>Blooby search (beta) robot</Description>
  1798. <Type>R</Type>
  1799. <Comment>206.166.206.18x</Comment>
  1800. <Link1>http://www.blooby.com/</Link1>
  1801. <Link2></Link2>
  1802. </user-agent>
  1803. <user-agent>
  1804. <ID>id_a_f_270507_1</ID>
  1805. <String>Bloodhound/Nutch-0.9 (Testing Crawler for Research - obeys robots.txt and robots meta tags ; http://balihoo.com/index.aspx; robot at balihoo dot com)</String>
  1806. <Description>Balihoo - Search Engine for Advertising Media</Description>
  1807. <Type>R</Type>
  1808. <Comment>204.228.230.xx</Comment>
  1809. <Link1>http://balihoo.com/</Link1>
  1810. <Link2></Link2>
  1811. </user-agent>
  1812. <user-agent>
  1813. <ID>id_a_f_125</ID>
  1814. <String>bluefish 0.6 HTML editor</String>
  1815. <Description>Bluefish HTML-editor for Linux</Description>
  1816. <Type>B</Type>
  1817. <Comment></Comment>
  1818. <Link1>http://bluefish.openoffice.nl/</Link1>
  1819. <Link2></Link2>
  1820. </user-agent>
  1821. <user-agent>
  1822. <ID>id_a_f_126</ID>
  1823. <String>BMCLIENT</String>
  1824. <Description>Part of ButtMan remote access tool</Description>
  1825. <Type></Type>
  1826. <Comment>seems to be a Trojan - see link</Comment>
  1827. <Link1>http://www.glocksoft.com/trojan_list/ButtMan.htm</Link1>
  1828. <Link2></Link2>
  1829. </user-agent>
  1830. <user-agent>
  1831. <ID>id_a_f_120506_1</ID>
  1832. <String>BMLAUNCHER</String>
  1833. <Description>Bookmark Express bookmark manager</Description>
  1834. <Type>C</Type>
  1835. <Comment>Website is dead - was:</Comment>
  1836. <Link1>http://www.bookmarkexpress.com/</Link1>
  1837. <Link2></Link2>
  1838. </user-agent>
  1839. <user-agent>
  1840. <ID>id_a_f_127</ID>
  1841. <String>Bobby/4.0.x RPT-HTTPClient/0.3-3E</String>
  1842. <Description>Bobby web accessibility desktop testing tool</Description>
  1843. <Type>C</Type>
  1844. <Comment></Comment>
  1845. <Link1>http://bobby.watchfire.com/bobby/html/en/index.jsp</Link1>
  1846. <Link2></Link2>
  1847. </user-agent>
  1848. <user-agent>
  1849. <ID>id_a_f_128</ID>
  1850. <String>boitho.com-dc/0.xx (http://www.boitho.com/dcbot.html)</String>
  1851. <Description>Boitho search (Norway) robot via 80.202.212.xx / 80.80.111.xx</Description>
  1852. <Type>R</Type>
  1853. <Comment></Comment>
  1854. <Link1>http://www.boitho.com</Link1>
  1855. <Link2></Link2>
  1856. </user-agent>
  1857. <user-agent>
  1858. <ID>id_a_f_129</ID>
  1859. <String>boitho.com-robot/1.x</String>
  1860. <Description>Boitho search (Norway) robot via 80.202.212.xx / 80.80.111.xx</Description>
  1861. <Type>R</Type>
  1862. <Comment></Comment>
  1863. <Link1>http://www.boitho.com</Link1>
  1864. <Link2></Link2>
  1865. </user-agent>
  1866. <user-agent>
  1867. <ID>id_a_f_130</ID>
  1868. <String>boitho.com-robot/1.x (http://www.boitho.com/bot.html)</String>
  1869. <Description>Boitho search (Norway) robot via 80.202.212.xx / 80.80.111.xx</Description>
  1870. <Type>R</Type>
  1871. <Comment></Comment>
  1872. <Link1>http://www.boitho.com</Link1>
  1873. <Link2></Link2>
  1874. </user-agent>
  1875. <user-agent>
  1876. <ID>id_a_f_060806_1</ID>
  1877. <String>Bookdog/x.x</String>
  1878. <Description>Bookdog - Mac bookmark manager</Description>
  1879. <Type>C</Type>
  1880. <Comment></Comment>
  1881. <Link1>http://www.sheepsystems.com/bookdog/</Link1>
  1882. <Link2></Link2>
  1883. </user-agent>
  1884. <user-agent>
  1885. <ID>id_a_f_131</ID>
  1886. <String>Bookmark Buddy bookmark checker (http://www.bookmarkbuddy.net/)</String>
  1887. <Description>Bookmark Buddy - favorite bookmark manager </Description>
  1888. <Type>C</Type>
  1889. <Comment></Comment>
  1890. <Link1>http://www.bookmarkbuddy.net</Link1>
  1891. <Link2></Link2>
  1892. </user-agent>
  1893. <user-agent>
  1894. <ID>id_a_f_132</ID>
  1895. <String>Bookmark Renewal Check Agent [http://www.bookmark.ne.jp/]</String>
  1896. <Description>Favourites managing program</Description>
  1897. <Type>C</Type>
  1898. <Comment></Comment>
  1899. <Link1>http://www.bookmark.ne.jp</Link1>
  1900. <Link2></Link2>
  1901. </user-agent>
  1902. <user-agent>
  1903. <ID>id_a_f_230807_1</ID>
  1904. <String>Bookmark Renewal Check Agent [http://www.bookmark.ne.jp/] (Version 2.0beta)</String>
  1905. <Description>Favourites managing program</Description>
  1906. <Type>C</Type>
  1907. <Comment></Comment>
  1908. <Link1>http://www.bookmark.ne.jp</Link1>
  1909. <Link2></Link2>
  1910. </user-agent>
  1911. <user-agent>
  1912. <ID>id_a_f_300408_1</ID>
  1913. <String>BookmarkBase(2/;http://bookmarkbase.com)</String>
  1914. <Description>Bookmark Base bookmark manager</Description>
  1915. <Type>C</Type>
  1916. <Comment></Comment>
  1917. <Link1>http://www.bookmarkbase.com/</Link1>
  1918. <Link2></Link2>
  1919. </user-agent>
  1920. <user-agent>
  1921. <ID>id_a_f_133</ID>
  1922. <String>Bot mailto:craftbot@yahoo.com</String>
  1923. <Description>cybercity.fr user robot / faked user agent ?</Description>
  1924. <Type></Type>
  1925. <Comment></Comment>
  1926. <Link1></Link1>
  1927. <Link2></Link2>
  1928. </user-agent>
  1929. <user-agent>
  1930. <ID>id_a_f_160308_1</ID>
  1931. <String>BPImageWalker/2.0 (www.bdbrandprotect.com)</String>
  1932. <Description>BD-Brandprotect copyright infringement crawler</Description>
  1933. <Type>R</Type>
  1934. <Comment>72.14.164.1xx</Comment>
  1935. <Link1>http://www.bdbrandprotect.com/</Link1>
  1936. <Link2>http://www.bdbrandprotect.com/solutions_5.html</Link2>
  1937. </user-agent>
  1938. <user-agent>
  1939. <ID>id_a_f_134</ID>
  1940. <String>BravoBrian bstop.bravobrian.it</String>
  1941. <Description>BravoBrian bSTOP parental control</Description>
  1942. <Type>P R</Type>
  1943. <Comment> s. also BStop</Comment>
  1944. <Link1>http://bstop.bravobrian.it/</Link1>
  1945. <Link2></Link2>
  1946. </user-agent>
  1947. <user-agent>
  1948. <ID>id_a_f_135</ID>
  1949. <String>BravoBrian SpiderEngine MarcoPolo</String>
  1950. <Description>Robot for BravoBrian bSTOP</Description>
  1951. <Type>R</Type>
  1952. <Comment> s. also BStop</Comment>
  1953. <Link1>http://bstop.bravobrian.it/</Link1>
  1954. <Link2></Link2>
  1955. </user-agent>
  1956. <user-agent>
  1957. <ID>id_a_f_220508_1</ID>
  1958. <String>BrightCrawler (http://www.brightcloud.com/brightcrawler.asp)</String>
  1959. <Description>BrightCloud web filtering for classifying websites</Description>
  1960. <Type>P R</Type>
  1961. <Comment></Comment>
  1962. <Link1>http://www.brightcloud.com/brightcrawler.asp</Link1>
  1963. <Link2></Link2>
  1964. </user-agent>
  1965. <user-agent>
  1966. <ID>id_a_f_136</ID>
  1967. <String>BruinBot (+http://webarchive.cs.ucla.edu/bruinbot.html) </String>
  1968. <Description>Webarchive Project Bruinbot crawler</Description>
  1969. <Type>R</Type>
  1970. <Comment></Comment>
  1971. <Link1>http://webarchive.cs.ucla.edu</Link1>
  1972. <Link2></Link2>
  1973. </user-agent>
  1974. <user-agent>
  1975. <ID>id_a_f_137</ID>
  1976. <String>BSDSeek/1.0</String>
  1977. <Description>Inktomi (Hotbot-Lycos NBCi) robot</Description>
  1978. <Type>R</Type>
  1979. <Comment></Comment>
  1980. <Link1>http://www.inktomi.com/</Link1>
  1981. <Link2></Link2>
  1982. </user-agent>
  1983. <user-agent>
  1984. <ID>id_a_f_138</ID>
  1985. <String>BStop.BravoBrian.it Agent Detector</String>
  1986. <Description>BravoBrian bSTOP parental control</Description>
  1987. <Type>P R</Type>
  1988. <Comment>s. also BravoBrian ..</Comment>
  1989. <Link1>http://bstop.bravobrian.it/</Link1>
  1990. <Link2></Link2>
  1991. </user-agent>
  1992. <user-agent>
  1993. <ID>id_a_f_139</ID>
  1994. <String>BTbot/0.x (+http://www.btbot.com/btbot.html)</String>
  1995. <Description>BitTorrent Search Engine btbot robot</Description>
  1996. <Type>R</Type>
  1997. <Comment></Comment>
  1998. <Link1>http://www.btbot.com</Link1>
  1999. <Link2></Link2>
  2000. </user-agent>
  2001. <user-agent>
  2002. <ID>id_a_f_300408_2</ID>
  2003. <String>BTWebClient/180B(9704)</String>
  2004. <Description>&#181;Torrent BitTorrent Client</Description>
  2005. <Type>D</Type>
  2006. <Comment></Comment>
  2007. <Link1>http://www.utorrent.com/</Link1>
  2008. <Link2></Link2>
  2009. </user-agent>
  2010. <user-agent>
  2011. <ID>id_a_f_080407_2</ID>
  2012. <String>BuildCMS crawler (http://www.buildcms.com/crawler)</String>
  2013. <Description>BuildCMS crawler - market monitoring project of BuildCMS</Description>
  2014. <Type>R</Type>
  2015. <Comment>194.24.253.xx</Comment>
  2016. <Link1>http://www.buildcms.com/index.php</Link1>
  2017. <Link2>http://www.buildcms.com/about_us/crawler</Link2>
  2018. </user-agent>
  2019. <user-agent>
  2020. <ID>id_a_f_051206_4</ID>
  2021. <String>Bulkfeeds/r1752 (http://bulkfeeds.net/)</String>
  2022. <Description>Bulkfeeds: RSS directory link checking</Description>
  2023. <Type>C</Type>
  2024. <Comment>202.181.96.2xx</Comment>
  2025. <Link1>http://bulkfeeds.net/</Link1>
  2026. <Link2></Link2>
  2027. </user-agent>
  2028. <user-agent>
  2029. <ID>id_a_f_140</ID>
  2030. <String>BullsEye</String>
  2031. <Description>BullsEye/Intelliseek robot</Description>
  2032. <Type>R</Type>
  2033. <Comment></Comment>
  2034. <Link1>http://www.intelliseek.com/be/bullseye.htm</Link1>
  2035. <Link2></Link2>
  2036. </user-agent>
  2037. <user-agent>
  2038. <ID>id_a_f_141</ID>
  2039. <String>bumblebee@relevare.com</String>
  2040. <Description>Relevare Portal software robot</Description>
  2041. <Type>R</Type>
  2042. <Comment></Comment>
  2043. <Link1>http://www.relevare.com</Link1>
  2044. <Link2></Link2>
  2045. </user-agent>
  2046. <user-agent>
  2047. <ID>id_a_f_142</ID>
  2048. <String>BunnySlippers</String>
  2049. <Description>Microsoft server information robot (see link)</Description>
  2050. <Type>C</Type>
  2051. <Comment></Comment>
  2052. <Link1>http://www.webmasterworld.com/forum11/841.htm</Link1>
  2053. <Link2></Link2>
  2054. </user-agent>
  2055. <user-agent>
  2056. <ID>id_a_f_070606_1</ID>
  2057. <String>BurstFindCrawler/1.1 (crawler.burstfind.com; http://crawler.burstfind.com; crawler@burstfind.com)</String>
  2058. <Description>BurstFind search crawler (64.34.172.xx)</Description>
  2059. <Type>R</Type>
  2060. <Comment></Comment>
  2061. <Link1>http://www.burstfind.com/</Link1>
  2062. <Link2></Link2>
  2063. </user-agent>
  2064. <user-agent>
  2065. <ID>id_a_f_143</ID>
  2066. <String>Buscaplus Robi/1.0 (http://www.buscaplus.com/robi/)</String>
  2067. <Description>Buscaplus (Spain) robot</Description>
  2068. <Type>R</Type>
  2069. <Comment></Comment>
  2070. <Link1>http://www.buscaplus.com</Link1>
  2071. <Link2></Link2>
  2072. </user-agent>
  2073. <user-agent>
  2074. <ID>id_a_f_050807_2</ID>
  2075. <String>BW-C-2.0</String>
  2076. <Description>Logitech Desktop Managers (LDM) Backweb (BW) update check</Description>
  2077. <Type>D</Type>
  2078. <Comment></Comment>
  2079. <Link1>http://www.logitech.com/index.cfm/494/3041&amp;cl=de&#44;de</Link1>
  2080. <Link2></Link2>
  2081. </user-agent>
  2082. <user-agent>
  2083. <ID>id_a_f_140508_2</ID>
  2084. <String>bwh3_user_agent</String>
  2085. <Description>Basic Web Hacking 3 fake user-agent from Hellbound Hackers challenges</Description>
  2086. <Type>S</Type>
  2087. <Comment></Comment>
  2088. <Link1>http://www.hellboundhackers.org/forum/_basic_web_hacking_3-7-6960_0.html</Link1>
  2089. <Link2>http://vuau.wordpress.com/2008/03/12/hbh-basic-web-3-switch-user-agent/</Link2>
  2090. </user-agent>
  2091. <user-agent>
  2092. <ID>id_a_f_140508_3</ID>
  2093. <String>Cabot/Nutch-0.9 (Amfibi's web-crawling robot; http://www.amfibi.com/cabot/; agent@amfibi.com)</String>
  2094. <Description>Amfibi Search robot</Description>
  2095. <Type>R</Type>
  2096. <Comment>64.111.217.9x</Comment>
  2097. <Link1>http://www.amfibi.com/</Link1>
  2098. <Link2></Link2>
  2099. </user-agent>
  2100. <user-agent>
  2101. <ID>id_a_f_280508_1</ID>
  2102. <String>Cabot/Nutch-1.0-dev (Amfibi's web-crawling robot; http://www.amfibi.com/cabot/; agent@amfibi.com)</String>
  2103. <Description>Amfibi Search robot</Description>
  2104. <Type>R</Type>
  2105. <Comment>64.111.217.9x</Comment>
  2106. <Link1>http://www.amfibi.com/</Link1>
  2107. <Link2></Link2>
  2108. </user-agent>
  2109. <user-agent>
  2110. <ID>id_a_f_140506_4</ID>
  2111. <String>CamelHttpStream/1.0</String>
  2112. <Description>Evolution integrated mail solution Camel TCP stream class</Description>
  2113. <Type></Type>
  2114. <Comment></Comment>
  2115. <Link1>http://www.gnome.org/projects/evolution/</Link1>
  2116. <Link2>http://go-evolution.org/Camel.Stream</Link2>
  2117. </user-agent>
  2118. <user-agent>
  2119. <ID>id_a_f_144</ID>
  2120. <String>Cancer Information and Support International;</String>
  2121. <Description>Some user agent</Description>
  2122. <Type></Type>
  2123. <Comment></Comment>
  2124. <Link1></Link1>
  2125. <Link2></Link2>
  2126. </user-agent>
  2127. <user-agent>
  2128. <ID>id_a_f_110206_1</ID>
  2129. <String>carleson/1.0</String>
  2130. <Description>Cosmix project crawler (204.14.48.x / 38.113.234.xxx)</Description>
  2131. <Type>R</Type>
  2132. <Comment>s. also - voyager/1.x - cfetch/1.x</Comment>
  2133. <Link1>http://www.cosmixcorp.com/</Link1>
  2134. <Link2></Link2>
  2135. </user-agent>
  2136. <user-agent>
  2137. <ID>id_a_f_145</ID>
  2138. <String>Carnegie_Mellon_University_Research_WebBOT-->PLEASE READ-->http://www.andrew.cmu.edu/~brgordon/webbot/index.html http://www.andrew.cmu.edu/~brgordon/webbot/index.html</String>
  2139. <Description>Carnegie Mellon University WebBOT</Description>
  2140. <Type>R</Type>
  2141. <Comment></Comment>
  2142. <Link1>http://www.andrew.cmu.edu</Link1>
  2143. <Link2></Link2>
  2144. </user-agent>
  2145. <user-agent>
  2146. <ID>id_a_f_146</ID>
  2147. <String>Carnegie_Mellon_University_WebCrawler http://www.andrew.cmu.edu/~brgordon/webbot/index.html</String>
  2148. <Description>Carnegie Mellon University WebBOT</Description>
  2149. <Type>R</Type>
  2150. <Comment></Comment>
  2151. <Link1>http://www.andrew.cmu.edu</Link1>
  2152. <Link2></Link2>
  2153. </user-agent>
  2154. <user-agent>
  2155. <ID>id_a_f_170206_1</ID>
  2156. <String>Catall Spider</String>
  2157. <Description>Catall.de search &amp; web directory (Germany)</Description>
  2158. <Type>R</Type>
  2159. <Comment></Comment>
  2160. <Link1>http://www.catall.de/</Link1>
  2161. <Link2></Link2>
  2162. </user-agent>
  2163. <user-agent>
  2164. <ID>id_a_f_130807_3</ID>
  2165. <String>CazoodleBot/CazoodleBot-0.1 (CazoodleBot Crawler; http://www.cazoodle.com/cazoodlebot; cazoodlebot@cazoodle.com)</String>
  2166. <Description>UIUC's Cazoodle search based on MetaQuerier</Description>
  2167. <Type>R</Type>
  2168. <Comment>72.36.94.1xx</Comment>
  2169. <Link1>http://www.cazoodle.com/</Link1>
  2170. <Link2>http://metaquerier.cs.uiuc.edu/</Link2>
  2171. </user-agent>
  2172. <user-agent>
  2173. <ID>id_a_f_290308_1</ID>
  2174. <String>CCBot/1.0 (+http://www.commoncrawl.org/bot.html)</String>
  2175. <Description>CommonCrawl Foundation search crawler</Description>
  2176. <Type>R</Type>
  2177. <Comment>38.103.63.1[6-8]</Comment>
  2178. <Link1>http://www.commoncrawl.org/faq.htm</Link1>
  2179. <Link2></Link2>
  2180. </user-agent>
  2181. <user-agent>
  2182. <ID>id_a_f_147</ID>
  2183. <String>ccubee/x.x</String>
  2184. <Description>Empyreum Ccubee (Czech) search engine solution</Description>
  2185. <Type>R</Type>
  2186. <Comment></Comment>
  2187. <Link1>http://empyreum.com/technologies/ccubee</Link1>
  2188. <Link2></Link2>
  2189. </user-agent>
  2190. <user-agent>
  2191. <ID>id_a_f_010108_2</ID>
  2192. <String>CDR/1.7.1 Simulator/0.7(+http://timewe.net) Profile/MIDP-1.0 Configuration/CLDC-1.0</String>
  2193. <Description>Timewe mobile browser (WAP) simulator (Japan)</Description>
  2194. <Type>B</Type>
  2195. <Comment>61.142.xx.x[xx]</Comment>
  2196. <Link1>http://timewe.net/</Link1>
  2197. <Link2></Link2>
  2198. </user-agent>
  2199. <user-agent>
  2200. <ID>id_a_f_291105_6</ID>
  2201. <String>CE-Preload</String>
  2202. <Description>Cisco Content Engine</Description>
  2203. <Type>P</Type>
  2204. <Comment></Comment>
  2205. <Link1>http://www.cisco.com/en/US/products/hw/contnetw/index.html</Link1>
  2206. <Link2></Link2>
  2207. </user-agent>
  2208. <user-agent>
  2209. <ID>id_a_f_100408_4</ID>
  2210. <String>CentiverseBot</String>
  2211. <Description>Nordic semantic search engine</Description>
  2212. <Type>C</Type>
  2213. <Comment>87.72.214.9x</Comment>
  2214. <Link1>http://www.centiverse-project.net/post/Educating-the-bots.aspx</Link1>
  2215. <Link2></Link2>
  2216. </user-agent>
  2217. <user-agent>
  2218. <ID>id_a_f_180408_2</ID>
  2219. <String>CentiverseBot - investigator</String>
  2220. <Description>Nordic semantic search engine</Description>
  2221. <Type>C</Type>
  2222. <Comment>87.72.214.9x</Comment>
  2223. <Link1>http://www.centiverse-project.net/post/Educating-the-bots.aspx</Link1>
  2224. <Link2></Link2>
  2225. </user-agent>
  2226. <user-agent>
  2227. <ID>id_a_f_180408_3</ID>
  2228. <String>CentiverseBot/3.0 (http://www.centiverse-project.net)</String>
  2229. <Description>Nordic semantic search engine</Description>
  2230. <Type>C</Type>
  2231. <Comment>87.72.214.9x</Comment>
  2232. <Link1>http://www.centiverse-project.net/post/Educating-the-bots.aspx</Link1>
  2233. <Link2></Link2>
  2234. </user-agent>
  2235. <user-agent>
  2236. <ID>id_a_f_148</ID>
  2237. <String>Ceramic Tile Installation Guide (http://www.floorstransformed.com)</String>
  2238. <Description>Floorstransformed.com robot (link checking ??)</Description>
  2239. <Type>R</Type>
  2240. <Comment></Comment>
  2241. <Link1>http://www.floorstransformed.com</Link1>
  2242. <Link2></Link2>
  2243. </user-agent>
  2244. <user-agent>
  2245. <ID>id_a_f_131208_2</ID>
  2246. <String>CERN-LineMode/2.15</String>
  2247. <Description>CERN Line Mode Browser</Description>
  2248. <Type>B</Type>
  2249. <Comment></Comment>
  2250. <Link1>http://www.w3.org/LineMode/</Link1>
  2251. <Link2></Link2>
  2252. </user-agent>
  2253. <user-agent>
  2254. <ID>id_a_f_149</ID>
  2255. <String>cfetch/1.0</String>
  2256. <Description>Cosmix project crawler (204.14.48.x / 38.113.234.xxx)</Description>
  2257. <Type>R</Type>
  2258. <Comment>s. also - voyager/1.x - carleson/1.x</Comment>
  2259. <Link1>http://www.cosmixcorp.com</Link1>
  2260. <Link2></Link2>
  2261. </user-agent>
  2262. <user-agent>
  2263. <ID>id_a_f_150</ID>
  2264. <String>CFNetwork/x.x</String>
  2265. <Description>Mac OS X CoreFoundation CFNetwork API</Description>
  2266. <Type></Type>
  2267. <Comment></Comment>
  2268. <Link1>http://www.cocoadev.com/index.pl?CFNetwork</Link1>
  2269. <Link2></Link2>
  2270. </user-agent>
  2271. <user-agent>
  2272. <ID>id_a_f_151</ID>
  2273. <String>cg-eye interactive</String>
  2274. <Description>cg-eye CGI checker</Description>
  2275. <Type>C</Type>
  2276. <Comment></Comment>
  2277. <Link1>http://www.htmlhelp.com</Link1>
  2278. <Link2></Link2>
  2279. </user-agent>
  2280. <user-agent>
  2281. <ID>id_a_f_152</ID>
  2282. <String>Charon/1.x (Amiga)</String>
  2283. <Description>Charon Amiga download manager</Description>
  2284. <Type>D</Type>
  2285. <Comment></Comment>
  2286. <Link1>http://tesla.rcub.bg.ac.yu/%7Eantony/Charon/</Link1>
  2287. <Link2></Link2>
  2288. </user-agent>
  2289. <user-agent>
  2290. <ID>id_a_f_131208_3</ID>
  2291. <String>Chat Catcher/1.0</String>
  2292. <Description>Chat Catcher blog monitoring robot</Description>
  2293. <Type>C</Type>
  2294. <Comment>69.80.208.2xx</Comment>
  2295. <Link1>http://chatcatcher.com/cc/</Link1>
  2296. <Link2></Link2>
  2297. </user-agent>
  2298. <user-agent>
  2299. <ID>id_a_f_153</ID>
  2300. <String>Checkbot/1.xx LWP/5.xx</String>
  2301. <Description>Checkbot link validation</Description>
  2302. <Type>C</Type>
  2303. <Comment></Comment>
  2304. <Link1>http://degraaff.org/checkbot/</Link1>
  2305. <Link2></Link2>
  2306. </user-agent>
  2307. <user-agent>
  2308. <ID>id_a_f_154</ID>
  2309. <String>CheckLinks/1.x.x</String>
  2310. <Description>Checklinks - Perl link checker</Description>
  2311. <Type>C</Type>
  2312. <Comment></Comment>
  2313. <Link1>http://www.jmarshall.com</Link1>
  2314. <Link2></Link2>
  2315. </user-agent>
  2316. <user-agent>
  2317. <ID>id_a_f_155</ID>
  2318. <String>CheckUrl</String>
  2319. <Description>NTL user agent</Description>
  2320. <Type></Type>
  2321. <Comment></Comment>
  2322. <Link1>http://www.ntl.com</Link1>
  2323. <Link2></Link2>
  2324. </user-agent>
  2325. <user-agent>
  2326. <ID>id_a_f_156</ID>
  2327. <String>CheckWeb</String>
  2328. <Description>CheckWeb link validation</Description>
  2329. <Type>C</Type>
  2330. <Comment></Comment>
  2331. <Link1>http://p.duby.free.fr/chkweb.htm</Link1>
  2332. <Link2></Link2>
  2333. </user-agent>
  2334. <user-agent>
  2335. <ID>id_a_f_030206_2</ID>
  2336. <String>Chilkat/1.0.0 (+http://www.chilkatsoft.com/ChilkatHttpUA.asp)</String>
  2337. <Description>Chilkat HTTP component user-agent</Description>
  2338. <Type></Type>
  2339. <Comment></Comment>
  2340. <Link1>http://www.chilkatsoft.com/HttpDotNet.asp</Link1>
  2341. <Link2></Link2>
  2342. </user-agent>
  2343. <user-agent>
  2344. <ID>id_a_f_230506_1</ID>
  2345. <String>China Local Browse 2.6</String>
  2346. <Description>Unknown spam bot from telekom.com.my (218.111.83.xxx)</Description>
  2347. <Type>S</Type>
  2348. <Comment>see link:</Comment>
  2349. <Link1>http://linuxreviews.org/webdesign/602_Apache_Webalizer/</Link1>
  2350. <Link2></Link2>
  2351. </user-agent>
  2352. <user-agent>
  2353. <ID>id_a_f_170408_2</ID>
  2354. <String>Chitika ContentHit 1.0</String>
  2355. <Description>Chitika Inc. Blog advertising</Description>
  2356. <Type>C</Type>
  2357. <Comment>67.15.219.[x]x</Comment>
  2358. <Link1>http://chitika.com/</Link1>
  2359. <Link2></Link2>
  2360. </user-agent>
  2361. <user-agent>
  2362. <ID>id_a_f_157</ID>
  2363. <String>ChristCRAWLER 2.0</String>
  2364. <Description>Christcentral.com Christcrawler (was www.christcrawler.com)</Description>
  2365. <Type>R</Type>
  2366. <Comment>- s. also Mozilla/4.0 (compatible; ChristCrawler..)</Comment>
  2367. <Link1></Link1>
  2368. <Link2></Link2>
  2369. </user-agent>
  2370. <user-agent>
  2371. <ID>id_a_f_010607_2</ID>
  2372. <String>CHttpClient by Open Text Corporation</String>
  2373. <Description>CHttpClient - C++ class using WinInet</Description>
  2374. <Type></Type>
  2375. <Comment></Comment>
  2376. <Link1>http://www.codeproject.com/library/lyoulhttpclient.asp</Link1>
  2377. <Link2></Link2>
  2378. </user-agent>
  2379. <user-agent>
  2380. <ID>id_a_f_158</ID>
  2381. <String>CipinetBot (http://www.cipinet.com/bot.html)</String>
  2382. <Description>CipinetBot -Cipinet Search Engine Web Crawler</Description>
  2383. <Type>R</Type>
  2384. <Comment></Comment>
  2385. <Link1>http://www.cipinet.com</Link1>
  2386. <Link2></Link2>
  2387. </user-agent>
  2388. <user-agent>
  2389. <ID>id_a_f_130108_1</ID>
  2390. <String>Cityreview Robot (+http://www.cityreview.org/crawler/)</String>
  2391. <Description>Cityreview regional search (Germany) link checking</Description>
  2392. <Type>C</Type>
  2393. <Comment>88.198.212.5x</Comment>
  2394. <Link1>http://www.cityreview.de/</Link1>
  2395. <Link2>http://www.cityreview.org/crawler/</Link2>
  2396. </user-agent>
  2397. <user-agent>
  2398. <ID>id_a_f_159</ID>
  2399. <String>CJ Spider/</String>
  2400. <Description>Commission Junction link checking spider</Description>
  2401. <Type>C</Type>
  2402. <Comment></Comment>
  2403. <Link1>http://www.cj.com/</Link1>
  2404. <Link2></Link2>
  2405. </user-agent>
  2406. <user-agent>
  2407. <ID>id_a_f_050606_1</ID>
  2408. <String>CJB.NET Proxy</String>
  2409. <Description>CJB Net anonymous socks proxy service (216.194.70.x)</Description>
  2410. <Type>P</Type>
  2411. <Comment></Comment>
  2412. <Link1>http://proxy.cjb.net/</Link1>
  2413. <Link2></Link2>
  2414. </user-agent>
  2415. <user-agent>
  2416. <ID>id_a_f_160</ID>
  2417. <String>ClariaBot/1.0</String>
  2418. <Description>Claria (ex Gator) SearchScout robot (64.152.73.xx)</Description>
  2419. <Type>R</Type>
  2420. <Comment>s. also Diamond</Comment>
  2421. <Link1>http://www.searchscout.com</Link1>
  2422. <Link2></Link2>
  2423. </user-agent>
  2424. <user-agent>
  2425. <ID>id_a_f_161</ID>
  2426. <String>Claymont.com</String>
  2427. <Description>Claymont Search robot</Description>
  2428. <Type>R</Type>
  2429. <Comment></Comment>
  2430. <Link1>http://www.claymont.com</Link1>
  2431. <Link2></Link2>
  2432. </user-agent>
  2433. <user-agent>
  2434. <ID>id_a_f_100307_1</ID>
  2435. <String>CloakDetect/0.9 (+http://fulltext.seznam.cz/)</String>
  2436. <Description>Seznam Search (Czech Republic) robot</Description>
  2437. <Type>R</Type>
  2438. <Comment>212.80.76.xx</Comment>
  2439. <Link1>http://www.seznam.cz/</Link1>
  2440. <Link2></Link2>
  2441. </user-agent>
  2442. <user-agent>
  2443. <ID>id_a_f_162</ID>
  2444. <String>Clushbot/2.x (+http://www.clush.com/bot.html)</String>
  2445. <Description>Clush clustered search robot</Description>
  2446. <Type>R</Type>
  2447. <Comment></Comment>
  2448. <Link1>http://www.clush.com</Link1>
  2449. <Link2></Link2>
  2450. </user-agent>
  2451. <user-agent>
  2452. <ID>id_a_f_163</ID>
  2453. <String>Clushbot/3.x-BinaryFury (+http://www.clush.com/bot.html)</String>
  2454. <Description>Clush clustered search robot</Description>
  2455. <Type>R</Type>
  2456. <Comment></Comment>
  2457. <Link1>http://www.clush.com</Link1>
  2458. <Link2></Link2>
  2459. </user-agent>
  2460. <user-agent>
  2461. <ID>id_a_f_164</ID>
  2462. <String>Clushbot/3.xx-Ajax (+http://www.clush.com/bot.html)</String>
  2463. <Description>Clush clustered search robot</Description>
  2464. <Type>R</Type>
  2465. <Comment></Comment>
  2466. <Link1>http://www.clush.com</Link1>
  2467. <Link2></Link2>
  2468. </user-agent>
  2469. <user-agent>
  2470. <ID>id_a_f_165</ID>
  2471. <String>Clushbot/3.xx-Hector (+http://www.clush.com/bot.html)</String>
  2472. <Description>Clush clustered search robot</Description>
  2473. <Type>R</Type>
  2474. <Comment></Comment>
  2475. <Link1>http://www.clush.com</Link1>
  2476. <Link2></Link2>
  2477. </user-agent>
  2478. <user-agent>
  2479. <ID>id_a_f_166</ID>
  2480. <String>Clushbot/3.xx-Peleus (+http://www.clush.com/bot.html)</String>
  2481. <Description>Clush clustered search robot</Description>
  2482. <Type>R</Type>
  2483. <Comment></Comment>
  2484. <Link1>http://www.clush.com</Link1>
  2485. <Link2></Link2>
  2486. </user-agent>
  2487. <user-agent>
  2488. <ID>id_a_f_070506_1</ID>
  2489. <String>COAST WebMaster Pro/4.x.x.xx (Windows NT)</String>
  2490. <Description>COAST Webmaster - Web management and maintenance software</Description>
  2491. <Type>C</Type>
  2492. <Comment></Comment>
  2493. <Link1>http://www.extablish.com/cwm.htm</Link1>
  2494. <Link2></Link2>
  2495. </user-agent>
  2496. <user-agent>
  2497. <ID>id_a_f_150306_1</ID>
  2498. <String>CoBITSProbe</String>
  2499. <Description>Proposed Content-Based Image Tracking System (CoBITS) P2P crawler</Description>
  2500. <Type>R C</Type>
  2501. <Comment></Comment>
  2502. <Link1>http://www.iis.sinica.edu.tw/~hungchi/CBIT/</Link1>
  2503. <Link2></Link2>
  2504. </user-agent>
  2505. <user-agent>
  2506. <ID>id_a_f_167</ID>
  2507. <String>Cocoal.icio.us/1.0 (v36) (Mac OS X; http://www.scifihifi.com/cocoalicious)</String>
  2508. <Description>Cocoa del.icio.us (social bookmarks manager) client for Mac OS X</Description>
  2509. <Type>C</Type>
  2510. <Comment></Comment>
  2511. <Link1>http://www.scifihifi.com</Link1>
  2512. <Link2></Link2>
  2513. </user-agent>
  2514. <user-agent>
  2515. <ID>id_a_f_070209_2</ID>
  2516. <String>Cogentbot/1.X (+http://www.cogentsoftwaresolutions.com/bot.html)</String>
  2517. <Description>Cogent Search Bot from Cogent Software Solutions for unknown purposes</Description>
  2518. <Type>R</Type>
  2519. <Comment>72.81.252.9x</Comment>
  2520. <Link1>http://www.cogentsoftwaresolutions.com/bot.html</Link1>
  2521. <Link2></Link2>
  2522. </user-agent>
  2523. <user-agent>
  2524. <ID>id_a_f_168</ID>
  2525. <String>ColdFusion</String>
  2526. <Description>Cold Fusion server used by various IPs i.e.: - NetWORLD web catalogue link checking</Description>
  2527. <Type>P C</Type>
  2528. <Comment></Comment>
  2529. <Link1>http://www.networld.com</Link1>
  2530. <Link2>http://www.macromedia.com/software/coldfusion/</Link2>
  2531. </user-agent>
  2532. <user-agent>
  2533. <ID>id_a_f_169</ID>
  2534. <String>ColdFusion (BookmarkTracker.com)</String>
  2535. <Description>Cold Fusion server used by Bookmark Tracker - online favourites management</Description>
  2536. <Type>C</Type>
  2537. <Comment></Comment>
  2538. <Link1>http://www.bookmarktracker.com</Link1>
  2539. <Link2>http://www.macromedia.com/software/coldfusion/</Link2>
  2540. </user-agent>
  2541. <user-agent>
  2542. <ID>id_a_f_170</ID>
  2543. <String>collage.cgi/1.xx</String>
  2544. <Description>WebCollage Syndicator graphics crawler/collector</Description>
  2545. <Type>R D</Type>
  2546. <Comment></Comment>
  2547. <Link1>http://www.webcollage.com</Link1>
  2548. <Link2></Link2>
  2549. </user-agent>
  2550. <user-agent>
  2551. <ID>id_a_f_171</ID>
  2552. <String>combine/0.0</String>
  2553. <Description>Combine harvesting &amp; indexing robot</Description>
  2554. <Type>R</Type>
  2555. <Comment>130.235.4.xx</Comment>
  2556. <Link1>http://combine.it.lth.se/</Link1>
  2557. <Link2></Link2>
  2558. </user-agent>
  2559. <user-agent>
  2560. <ID>id_a_f_080406_1</ID>
  2561. <String>Combine/2.0 http://combine.it.lth.se/</String>
  2562. <Description>Combine harvesting &amp; indexing robot</Description>
  2563. <Type>R</Type>
  2564. <Comment>130.235.4.xx</Comment>
  2565. <Link1>http://combine.it.lth.se/</Link1>
  2566. <Link2></Link2>
  2567. </user-agent>
  2568. <user-agent>
  2569. <ID>id_a_f_160807_1</ID>
  2570. <String>Combine/3 http://combine.it.lth.se/</String>
  2571. <Description>Combine harvesting &amp; indexing robot</Description>
  2572. <Type>R</Type>
  2573. <Comment>130.235.4.xx</Comment>
  2574. <Link1>http://combine.it.lth.se/</Link1>
  2575. <Link2></Link2>
  2576. </user-agent>
  2577. <user-agent>
  2578. <ID>id_a_f_172</ID>
  2579. <String>Combine/x.0</String>
  2580. <Description>Combine harvesting &amp; indexing robot</Description>
  2581. <Type>R</Type>
  2582. <Comment>130.235.4.xx</Comment>
  2583. <Link1>http://combine.it.lth.se/</Link1>
  2584. <Link2></Link2>
  2585. </user-agent>
  2586. <user-agent>
  2587. <ID>id_a_f_280606_3</ID>
  2588. <String>cometrics-bot&#44; http://www.cometrics.de</String>
  2589. <Description>cometrics Web Content Mining solution - Germany</Description>
  2590. <Type>R</Type>
  2591. <Comment></Comment>
  2592. <Link1>http://www.cometrics.de/</Link1>
  2593. <Link2></Link2>
  2594. </user-agent>
  2595. <user-agent>
  2596. <ID>id_a_f_173</ID>
  2597. <String>Commerce Browser Center</String>
  2598. <Description>Wildsoft Germany (closed) Internet client system user-agent (was www.oskarweb.de)</Description>
  2599. <Type>B</Type>
  2600. <Comment></Comment>
  2601. <Link1></Link1>
  2602. <Link2></Link2>
  2603. </user-agent>
  2604. <user-agent>
  2605. <ID>id_a_f_240107_1</ID>
  2606. <String>complex_network_group/Nutch-0.9-dev (discovering the structure of the world-wide-web; http://cantor.ee.ucla.edu/~networks/crawl; nimakhaj@gmail.com)</String>
  2607. <Description>UCLA Complex Networks Groups Complex Network Analysis</Description>
  2608. <Type>C</Type>
  2609. <Comment>216.182.233.1xx</Comment>
  2610. <Link1>http://cantor.ee.ucla.edu/~networks/</Link1>
  2611. <Link2></Link2>
  2612. </user-agent>
  2613. <user-agent>
  2614. <ID>id_a_f_174</ID>
  2615. <String>Computer_and_Automation_Research_Institute_Crawler crawler@ilab.sztaki.hu</String>
  2616. <Description>Hungarian Academy of Sciences data mining search</Description>
  2617. <Type>R</Type>
  2618. <Comment></Comment>
  2619. <Link1>http://www.ilab.sztaki.hu/websearch/</Link1>
  2620. <Link2></Link2>
  2621. </user-agent>
  2622. <user-agent>
  2623. <ID>id_a_f_010406_2</ID>
  2624. <String>Comrite/0.7.1 (Nutch; http://lucene.apache.org/nutch/bot.html; nutch-agent@lucene.apache.org)</String>
  2625. <Description>ComRite Chinese Search Engine for Oversea Web Sites (69.248.26.xx)</Description>
  2626. <Type>R</Type>
  2627. <Comment>powered by Nutch</Comment>
  2628. <Link1>http://www.comrite.com/</Link1>
  2629. <Link2>http://meidong.comrite.com/</Link2>
  2630. </user-agent>
  2631. <user-agent>
  2632. <ID>id_a_f_175</ID>
  2633. <String>Contact</String>
  2634. <Description>unknown</Description>
  2635. <Type></Type>
  2636. <Comment></Comment>
  2637. <Link1></Link1>
  2638. <Link2></Link2>
  2639. </user-agent>
  2640. <user-agent>
  2641. <ID>id_a_f_200307_1</ID>
  2642. <String>ContactBot/0.2</String>
  2643. <Description>Probably E-Mail harvesting robot - same as LMQueueBot</Description>
  2644. <Type>S</Type>
  2645. <Comment>64.124.152.xx</Comment>
  2646. <Link1></Link1>
  2647. <Link2></Link2>
  2648. </user-agent>
  2649. <user-agent>
  2650. <ID>id_a_f_291105_7</ID>
  2651. <String>ContentSmartz</String>
  2652. <Description>ContentSmartz e-mail harvesting tools</Description>
  2653. <Type>S</Type>
  2654. <Comment></Comment>
  2655. <Link1></Link1>
  2656. <Link2></Link2>
  2657. </user-agent>
  2658. <user-agent>
  2659. <ID>id_a_f_176</ID>
  2660. <String>contype</String>
  2661. <Description>Internet Explorer versions 4.x and 5 plugin content</Description>
  2662. <Type>B</Type>
  2663. <Comment>NOT Contype mime type management Perl script</Comment>
  2664. <Link1>http://support.microsoft.com/default.aspx?scid=kb;en-us;293792</Link1>
  2665. <Link2></Link2>
  2666. </user-agent>
  2667. <user-agent>
  2668. <ID>id_a_f_177</ID>
  2669. <String>Convera Internet Spider V6.x</String>
  2670. <Description>Converas RetrievalWare Internet Spider (63.241.61.x)</Description>
  2671. <Type>R</Type>
  2672. <Comment> s. also - infoConveraCrawler... - CrawlConvera ...</Comment>
  2673. <Link1>http://www.convera.com</Link1>
  2674. <Link2></Link2>
  2675. </user-agent>
  2676. <user-agent>
  2677. <ID>id_a_f_178</ID>
  2678. <String>ConveraCrawler/0.2</String>
  2679. <Description>Converas RetrievalWare Internet Spider (63.241.61.x)</Description>
  2680. <Type>R</Type>
  2681. <Comment> s. also - infoConveraCrawler... - CrawlConvera ...</Comment>
  2682. <Link1>http://www.convera.com</Link1>
  2683. <Link2></Link2>
  2684. </user-agent>
  2685. <user-agent>
  2686. <ID>id_a_f_051205_1</ID>
  2687. <String>ConveraCrawler/0.9d (+http://www.authoritativeweb.com/crawl)</String>
  2688. <Description>Converas RetrievalWare Internet Spider (63.241.61.x)</Description>
  2689. <Type>R</Type>
  2690. <Comment> s. also - infoConveraCrawler... - CrawlConvera ...</Comment>
  2691. <Link1>http://www.convera.com/</Link1>
  2692. <Link2></Link2>
  2693. </user-agent>
  2694. <user-agent>
  2695. <ID>id_a_f_179</ID>
  2696. <String>ConveraMultiMediaCrawler/0.1 (+http://www.authoritativeweb.com/crawl)</String>
  2697. <Description>Converas RetrievalWare Internet Spider (63.241.61.x)</Description>
  2698. <Type>R</Type>
  2699. <Comment> s. also - infoConveraCrawler... - CrawlConvera ...</Comment>
  2700. <Link1>http://www.convera.com</Link1>
  2701. <Link2></Link2>
  2702. </user-agent>
  2703. <user-agent>
  2704. <ID>id_a_f_180</ID>
  2705. <String>CoolBot</String>
  2706. <Description>Suchmaschine21 (Germany) robot</Description>
  2707. <Type>R</Type>
  2708. <Comment></Comment>
  2709. <Link1>http://www.suchmaschine21.de/</Link1>
  2710. <Link2></Link2>
  2711. </user-agent>
  2712. <user-agent>
  2713. <ID>id_a_f_030110_2</ID>
  2714. <String>Cooliris/1.5 CFNetwork/459 Darwin/10.0.0d3</String>
  2715. <Description>Cooliris photo and video browser</Description>
  2716. <Type>B</Type>
  2717. <Comment></Comment>
  2718. <Link1>http://www.cooliris.com/</Link1>
  2719. <Link2></Link2>
  2720. </user-agent>
  2721. <user-agent>
  2722. <ID>id_a_f_040406_1</ID>
  2723. <String>CoralWebPrx/0.1.1x (See http://coralcdn.org/)</String>
  2724. <Description>Coral Content Distribution Network</Description>
  2725. <Type>P C</Type>
  2726. <Comment></Comment>
  2727. <Link1>http://coralcdn.org/</Link1>
  2728. <Link2></Link2>
  2729. </user-agent>
  2730. <user-agent>
  2731. <ID>id_a_f_181</ID>
  2732. <String>cosmos/0.8_(robot@xyleme.com)</String>
  2733. <Description>Xyleme SA France robot</Description>
  2734. <Type>R</Type>
  2735. <Comment></Comment>
  2736. <Link1>http://www.xyleme.com/en/index.jsp</Link1>
  2737. <Link2></Link2>
  2738. </user-agent>
  2739. <user-agent>
  2740. <ID>id_a_f_182</ID>
  2741. <String>cosmos/0.9_(robot@xyleme.com)</String>
  2742. <Description>Xyleme SA France robot</Description>
  2743. <Type>R</Type>
  2744. <Comment></Comment>
  2745. <Link1>http://www.xyleme.com/en/index.jsp</Link1>
  2746. <Link2></Link2>
  2747. </user-agent>
  2748. <user-agent>
  2749. <ID>id_a_f_040607_1</ID>
  2750. <String>CoteoNutchCrawler/Nutch-0.9 (info [at] coteo [dot] com)</String>
  2751. <Description>Coteo.com - local French directory link checking</Description>
  2752. <Type>C</Type>
  2753. <Comment></Comment>
  2754. <Link1>http://www.coteo.com/</Link1>
  2755. <Link2></Link2>
  2756. </user-agent>
  2757. <user-agent>
  2758. <ID>id_a_f_030206_3</ID>
  2759. <String>CougarSearch/0.x (+http://www.cougarsearch.com/faq.shtml)</String>
  2760. <Description>Cougarsearch.com robot</Description>
  2761. <Type>R</Type>
  2762. <Comment></Comment>
  2763. <Link1>http://www.cougarsearch.com/</Link1>
  2764. <Link2></Link2>
  2765. </user-agent>
  2766. <user-agent>
  2767. <ID>id_a_f_280408_2</ID>
  2768. <String>Covac TexAs Arachbot</String>
  2769. <Description>Covac Arachnid Web Crawler</Description>
  2770. <Type>R</Type>
  2771. <Comment>s.also ArachBot</Comment>
  2772. <Link1>http://www.covac-software.com/</Link1>
  2773. <Link2></Link2>
  2774. </user-agent>
  2775. <user-agent>
  2776. <ID>id_a_f_211208_1</ID>
  2777. <String>CoverScout%203/3.0.1 CFNetwork/339.5 Darwin/9.5.0 (i386) (iMac5&#44;1)</String>
  2778. <Description>CoverScout for iTunes - CD cover search tool</Description>
  2779. <Type>B</Type>
  2780. <Comment></Comment>
  2781. <Link1>http://www.equinux.com/de/products/coverscout/index.html</Link1>
  2782. <Link2></Link2>
  2783. </user-agent>
  2784. <user-agent>
  2785. <ID>id_a_f_183</ID>
  2786. <String>Cowbot-0.1 (NHN Corp. / +82-2-3011-1954 / nhnbot@naver.com)</String>
  2787. <Description>Naver Japan / Korea robot</Description>
  2788. <Type>R</Type>
  2789. <Comment> s. also Python-urllib/1.15 -  nabot -  NaverBot &amp; dloader</Comment>
  2790. <Link1>http://www.naver.co.jp</Link1>
  2791. <Link2></Link2>
  2792. </user-agent>
  2793. <user-agent>
  2794. <ID>id_a_f_184</ID>
  2795. <String>Cowbot-0.1.x (NHN Corp. / +82-2-3011-1954 / nhnbot@naver.com)</String>
  2796. <Description>Naver Japan / Korea robot</Description>
  2797. <Type>R</Type>
  2798. <Comment> s. also Python-urllib/1.15 -  nabot -  NaverBot &amp; dloader</Comment>
  2799. <Link1>http://www.naver.co.jp</Link1>
  2800. <Link2></Link2>
  2801. </user-agent>
  2802. <user-agent>
  2803. <ID>id_a_f_185</ID>
  2804. <String>CrawlConvera0.1 (CrawlConvera@yahoo.com)</String>
  2805. <Description>Converas RetrievalWare Internet Spider</Description>
  2806. <Type>R</Type>
  2807. <Comment>s. also - Convera Internet Spider .. - infoConveraCrawler...</Comment>
  2808. <Link1>http://www.convera.com</Link1>
  2809. <Link2></Link2>
  2810. </user-agent>
  2811. <user-agent>
  2812. <ID>id_a_f_186</ID>
  2813. <String>Crawler</String>
  2814. <Description>unknown robot via Level3.net</Description>
  2815. <Type></Type>
  2816. <Comment></Comment>
  2817. <Link1></Link1>
  2818. <Link2></Link2>
  2819. </user-agent>
  2820. <user-agent>
  2821. <ID>id_a_f_187</ID>
  2822. <String>Crawler (cometsearch@cometsystems.com)</String>
  2823. <Description>Cometsystems Comet Search robot via Findwhat (now Miva)</Description>
  2824. <Type>R</Type>
  2825. <Comment></Comment>
  2826. <Link1>http://www.cometsystems.com</Link1>
  2827. <Link2>http://www.miva.com/</Link2>
  2828. </user-agent>
  2829. <user-agent>
  2830. <ID>id_a_f_188</ID>
  2831. <String>Crawler admin@crawler.de</String>
  2832. <Description>Crawler.de / Abacho robot</Description>
  2833. <Type>R</Type>
  2834. <Comment></Comment>
  2835. <Link1>http://www.crawler.de</Link1>
  2836. <Link2>http://www.abacho.de/</Link2>
  2837. </user-agent>
  2838. <user-agent>
  2839. <ID>id_a_f_189</ID>
  2840. <String>Crawler V 0.2.x admin@crawler.de</String>
  2841. <Description>Crawler.de / Abacho robot</Description>
  2842. <Type>R</Type>
  2843. <Comment></Comment>
  2844. <Link1>http://www.crawler.de</Link1>
  2845. <Link2>http://www.abacho.de/</Link2>
  2846. </user-agent>
  2847. <user-agent>
  2848. <ID>id_a_f_190</ID>
  2849. <String>crawler@alexa.com</String>
  2850. <Description>Alexa crawler</Description>
  2851. <Type>R</Type>
  2852. <Comment></Comment>
  2853. <Link1>http://www.alexa.com</Link1>
  2854. <Link2></Link2>
  2855. </user-agent>
  2856. <user-agent>
  2857. <ID>id_a_f_191</ID>
  2858. <String>CrawlerBoy Pinpoint.com</String>
  2859. <Description>Pinpoint WAP search robot</Description>
  2860. <Type>R</Type>
  2861. <Comment></Comment>
  2862. <Link1>http://www.pinpoint.com</Link1>
  2863. <Link2></Link2>
  2864. </user-agent>
  2865. <user-agent>
  2866. <ID>id_a_f_130506_1</ID>
  2867. <String>Crawllybot/0.1 (Crawllybot; +http://www.crawlly.com; crawler@crawlly.com)</String>
  2868. <Description>Crawlly Beta search - Germany (72.232.194.2xx)</Description>
  2869. <Type>R</Type>
  2870. <Comment>powered by Nutch</Comment>
  2871. <Link1>http://www.crawlly.com/</Link1>
  2872. <Link2></Link2>
  2873. </user-agent>
  2874. <user-agent>
  2875. <ID>id_a_f_192</ID>
  2876. <String>CreativeCommons/0.06-dev (Nutch; http://www.nutch.org/docs/en/bot.html; nutch-agent@lists.sourceforge.net)</String>
  2877. <Description>Creative Commons using Nutch open source robot</Description>
  2878. <Type>R</Type>
  2879. <Comment></Comment>
  2880. <Link1>http://www.nutch.org</Link1>
  2881. <Link2></Link2>
  2882. </user-agent>
  2883. <user-agent>
  2884. <ID>id_a_f_030110_3</ID>
  2885. <String>Cricket-A100/1.0 UP.Browser/6.3.0.7 (GUI) MMP/2.0</String>
  2886. <Description>Cricket A100 cell phone browser</Description>
  2887. <Type>B</Type>
  2888. <Comment></Comment>
  2889. <Link1>http://www.mycricket.com/cell-phones/details/Cricket-A100</Link1>
  2890. <Link2></Link2>
  2891. </user-agent>
  2892. <user-agent>
  2893. <ID>id_a_f_193</ID>
  2894. <String>CrocCrawler vx.3 [en] (http://www.croccrawler.com) (X11; I; Linux 2.0.44 i686)</String>
  2895. <Description>Croccrawler robot</Description>
  2896. <Type>R</Type>
  2897. <Comment></Comment>
  2898. <Link1>http://www.croccrawler.com</Link1>
  2899. <Link2></Link2>
  2900. </user-agent>
  2901. <user-agent>
  2902. <ID>id_a_f_090306_2</ID>
  2903. <String>csci_b659/0.13</String>
  2904. <Description>Web mining project from CSCI 659 (computer science course) at Indiana University</Description>
  2905. <Type>R</Type>
  2906. <Comment></Comment>
  2907. <Link1>http://informatics.indiana.edu/fil/Class/b659/</Link1>
  2908. <Link2></Link2>
  2909. </user-agent>
  2910. <user-agent>
  2911. <ID>id_a_f_180906_1</ID>
  2912. <String>CSE HTML Validator Professional (http://www.htmlvalidator.com/)</String>
  2913. <Description>CSE HTML Validator for Windows</Description>
  2914. <Type>C</Type>
  2915. <Comment></Comment>
  2916. <Link1>http://www.htmlvalidator.com/</Link1>
  2917. <Link2></Link2>
  2918. </user-agent>
  2919. <user-agent>
  2920. <ID>id_a_f_194</ID>
  2921. <String>Cuam Ver0.050bx</String>
  2922. <Description>Cuam - IE based browser</Description>
  2923. <Type>B</Type>
  2924. <Comment>site is dead</Comment>
  2925. <Link1>http://cuam.virtualave.net</Link1>
  2926. <Link2></Link2>
  2927. </user-agent>
  2928. <user-agent>
  2929. <ID>id_a_f_195</ID>
  2930. <String>Cuasarbot/0.9b http://www.cuasar.com/spider_beta/ </String>
  2931. <Description>Cuasar (Spain) music / ringtone search spider</Description>
  2932. <Type>R</Type>
  2933. <Comment></Comment>
  2934. <Link1>http://www.cuasar.com</Link1>
  2935. <Link2></Link2>
  2936. </user-agent>
  2937. <user-agent>
  2938. <ID>id_a_f_196</ID>
  2939. <String>curl/7.10.x (i386-redhat-linux-gnu) libcurl/7.10.x OpenSSL/0.9.7a ipv6 zlib/1.1.4</String>
  2940. <Description>Curl file transferring tool</Description>
  2941. <Type>D</Type>
  2942. <Comment></Comment>
  2943. <Link1>http://curl.haxx.se/</Link1>
  2944. <Link2></Link2>
  2945. </user-agent>
  2946. <user-agent>
  2947. <ID>id_a_f_197</ID>
  2948. <String>curl/7.7.x (i386--freebsd4.3) libcurl 7.7.x (SSL 0.9.6) (ipv6 enabled)</String>
  2949. <Description>Curl file transferring tool</Description>
  2950. <Type>D</Type>
  2951. <Comment></Comment>
  2952. <Link1>http://curl.haxx.se/</Link1>
  2953. <Link2></Link2>
  2954. </user-agent>
  2955. <user-agent>
  2956. <ID>id_a_f_198</ID>
  2957. <String>curl/7.8 (i686-pc-linux-gnu) libcurl 7.8 (OpenSSL 0.9.6)</String>
  2958. <Description>Curl file transferring tool</Description>
  2959. <Type>D</Type>
  2960. <Comment></Comment>
  2961. <Link1>http://curl.haxx.se/</Link1>
  2962. <Link2></Link2>
  2963. </user-agent>
  2964. <user-agent>
  2965. <ID>id_a_f_199</ID>
  2966. <String>curl/7.9.x (win32) libcurl 7.9.x</String>
  2967. <Description>Curl file transferring tool</Description>
  2968. <Type>D</Type>
  2969. <Comment></Comment>
  2970. <Link1>http://curl.haxx.se/</Link1>
  2971. <Link2></Link2>
  2972. </user-agent>
  2973. <user-agent>
  2974. <ID>id_a_f_200</ID>
  2975. <String>CurryGuide SiteScan 1.1</String>
  2976. <Description>CurryGuide UK link check robot</Description>
  2977. <Type>R</Type>
  2978. <Comment></Comment>
  2979. <Link1>http://uk.curryguide.com/</Link1>
  2980. <Link2></Link2>
  2981. </user-agent>
  2982. <user-agent>
  2983. <ID>id_a_f_201</ID>
  2984. <String>Custo x.x (www.netwu.com)</String>
  2985. <Description>Custo web site spidering tool (link checking)</Description>
  2986. <Type>C</Type>
  2987. <Comment>s. also - - Mozilla/5.0 (compatible; Custo 3...</Comment>
  2988. <Link1>http://www.netwu.com</Link1>
  2989. <Link2></Link2>
  2990. </user-agent>
  2991. <user-agent>
  2992. <ID>id_a_f_202</ID>
  2993. <String>Custom Spider www.bisnisseek.com /1.0</String>
  2994. <Description>Bisnisseek (was www.bisnisseek.com) robot</Description>
  2995. <Type>R</Type>
  2996. <Comment></Comment>
  2997. <Link1></Link1>
  2998. <Link2></Link2>
  2999. </user-agent>
  3000. <user-agent>
  3001. <ID>id_a_f_203</ID>
  3002. <String>Cyberdog/2.0 (Macintosh; 68k)</String>
  3003. <Description>Cyberdog Mac Browser (was www.cyberdog.org)</Description>
  3004. <Type>B</Type>
  3005. <Comment></Comment>
  3006. <Link1></Link1>
  3007. <Link2></Link2>
  3008. </user-agent>
  3009. <user-agent>
  3010. <ID>id_a_f_260608_2</ID>
  3011. <String>CyberPatrol SiteCat Webbot (http://www.cyberpatrol.com/cyberpatrolcrawler.asp)</String>
  3012. <Description>CyberPatrol LLC robot for web filtering software</Description>
  3013. <Type>R</Type>
  3014. <Comment>38.103.17.16x</Comment>
  3015. <Link1>http://www.cyberpatrol.com/cyberpatrolcrawler.asp</Link1>
  3016. <Link2></Link2>
  3017. </user-agent>
  3018. <user-agent>
  3019. <ID>id_a_f_204</ID>
  3020. <String>CyberSpyder Link Test/2.1.12 (admin@mspennyworth.com)</String>
  3021. <Description>CyberSpyder Link Test software</Description>
  3022. <Type>C</Type>
  3023. <Comment></Comment>
  3024. <Link1>http://www.cyberspyder.com/cslnkts1.html</Link1>
  3025. <Link2></Link2>
  3026. </user-agent>
  3027. <user-agent>
  3028. <ID>id_a_f_205</ID>
  3029. <String>CydralSpider/1.x (Cydral Web Image Search; http://www.cydral.com)</String>
  3030. <Description>Cydral image &amp; site search spider</Description>
  3031. <Type>R</Type>
  3032. <Comment></Comment>
  3033. <Link1>http://www.cydral.com</Link1>
  3034. <Link2></Link2>
  3035. </user-agent>
  3036. <user-agent>
  3037. <ID>id_a_f_060508_1</ID>
  3038. <String>CydralSpider/3.0 (Cydral Image Search; http://www.cydral.com)</String>
  3039. <Description>Cydral image &amp; site search spider</Description>
  3040. <Type>R</Type>
  3041. <Comment></Comment>
  3042. <Link1>http://www.cydral.com</Link1>
  3043. <Link2></Link2>
  3044. </user-agent>
  3045. <user-agent>
  3046. <ID>id_a_f_206</ID>
  3047. <String>DA 3.5 (www.lidan.com)</String>
  3048. <Description>Downloadaccelerator download manager</Description>
  3049. <Type>D</Type>
  3050. <Comment></Comment>
  3051. <Link1>http://www.downloadaccelerator.com</Link1>
  3052. <Link2></Link2>
  3053. </user-agent>
  3054. <user-agent>
  3055. <ID>id_a_f_207</ID>
  3056. <String>DA 4.0</String>
  3057. <Description>Downloadaccelerator download manager</Description>
  3058. <Type>D</Type>
  3059. <Comment></Comment>
  3060. <Link1>http://www.downloadaccelerator.com</Link1>
  3061. <Link2></Link2>
  3062. </user-agent>
  3063. <user-agent>
  3064. <ID>id_a_f_208</ID>
  3065. <String>DA 4.0 (www.downloadaccelerator.com)</String>
  3066. <Description>Downloadaccelerator download manager</Description>
  3067. <Type>D</Type>
  3068. <Comment></Comment>
  3069. <Link1>http://www.downloadaccelerator.com</Link1>
  3070. <Link2></Link2>
  3071. </user-agent>
  3072. <user-agent>
  3073. <ID>id_a_f_209</ID>
  3074. <String>DA 5.0</String>
  3075. <Description>Downloadaccelerator download manager</Description>
  3076. <Type>D</Type>
  3077. <Comment></Comment>
  3078. <Link1>http://www.downloadaccelerator.com</Link1>
  3079. <Link2></Link2>
  3080. </user-agent>
  3081. <user-agent>
  3082. <ID>id_a_f_210</ID>
  3083. <String>DA 7.0</String>
  3084. <Description>Downloadaccelerator download manager</Description>
  3085. <Type>D</Type>
  3086. <Comment></Comment>
  3087. <Link1>http://www.downloadaccelerator.com</Link1>
  3088. <Link2></Link2>
  3089. </user-agent>
  3090. <user-agent>
  3091. <ID>id_a_f_070209_3</ID>
  3092. <String>DAP x.x</String>
  3093. <Description>Download Accelerator Plus download manager</Description>
  3094. <Type>D</Type>
  3095. <Comment></Comment>
  3096. <Link1>http://www.speedbit.com/</Link1>
  3097. <Link2></Link2>
  3098. </user-agent>
  3099. <user-agent>
  3100. <ID>id_a_f_211</ID>
  3101. <String>Dart Communications PowerTCP</String>
  3102. <Description>PowerTCP ActiveX control tool</Description>
  3103. <Type></Type>
  3104. <Comment></Comment>
  3105. <Link1>http://www.dart.com</Link1>
  3106. <Link2></Link2>
  3107. </user-agent>
  3108. <user-agent>
  3109. <ID>id_a_f_212</ID>
  3110. <String>DataCha0s/2.0</String>
  3111. <Description>Unknown bot from Kornet Korea (218.149.129.xxx) scans for Perl Awstats</Description>
  3112. <Type>S</Type>
  3113. <Comment></Comment>
  3114. <Link1></Link1>
  3115. <Link2></Link2>
  3116. </user-agent>
  3117. <user-agent>
  3118. <ID>id_a_f_101106_1</ID>
  3119. <String>DataCha0s/2.0</String>
  3120. <Description>Unknown UA looking for Awstats Perl components</Description>
  3121. <Type>S</Type>
  3122. <Comment>from various IPs</Comment>
  3123. <Link1></Link1>
  3124. <Link2></Link2>
  3125. </user-agent>
  3126. <user-agent>
  3127. <ID>id_a_f_213</ID>
  3128. <String>DataFountains/DMOZ Downloader</String>
  3129. <Description>INFOMINE/iVia Scholarly Internet Resource Collections robot</Description>
  3130. <Type>R</Type>
  3131. <Comment>138.23.85.xx</Comment>
  3132. <Link1>http://infomine.ucr.edu/</Link1>
  3133. <Link2>http://ivia.ucr.edu/useragents.shtml</Link2>
  3134. </user-agent>
  3135. <user-agent>
  3136. <ID>id_a_f_040307_1</ID>
  3137. <String>DataFountains/Dmoz Downloader (http://ivia.ucr.edu/useragents.shtml)</String>
  3138. <Description>INFOMINE/iVia Scholarly Internet Resource Collections robot</Description>
  3139. <Type>R</Type>
  3140. <Comment>138.23.85.xx</Comment>
  3141. <Link1>http://infomine.ucr.edu/</Link1>
  3142. <Link2>http://ivia.ucr.edu/useragents.shtml</Link2>
  3143. </user-agent>
  3144. <user-agent>
  3145. <ID>id_a_f_110307_1</ID>
  3146. <String>DataFountains/DMOZ Feature Vector Corpus Creator (http://ivia.ucr.edu/useragents.shtml)</String>
  3147. <Description>INFOMINE/iVia Scholarly Internet Resource Collections robot</Description>
  3148. <Type>R</Type>
  3149. <Comment>138.23.85.xx</Comment>
  3150. <Link1>http://infomine.ucr.edu/</Link1>
  3151. <Link2>http://ivia.ucr.edu/useragents.shtml</Link2>
  3152. </user-agent>
  3153. <user-agent>
  3154. <ID>id_a_f_050907_1</ID>
  3155. <String>DataparkSearch/4.47 (+http://dataparksearch.org/bot)</String>
  3156. <Description>DataparkSearch open source search engine</Description>
  3157. <Type>R</Type>
  3158. <Comment></Comment>
  3159. <Link1>http://www.dataparksearch.org</Link1>
  3160. <Link2></Link2>
  3161. </user-agent>
  3162. <user-agent>
  3163. <ID>id_a_f_214</ID>
  3164. <String>DataparkSearch/4.xx (http://www.dataparksearch.org/)</String>
  3165. <Description>DataparkSearch open source search engine</Description>
  3166. <Type>R</Type>
  3167. <Comment></Comment>
  3168. <Link1>http://www.dataparksearch.org</Link1>
  3169. <Link2></Link2>
  3170. </user-agent>
  3171. <user-agent>
  3172. <ID>id_a_f_080206_1</ID>
  3173. <String>DataSpear/1.0 (Spider; http://www.dataspear.com/spider.html; spider@dataspear.com)</String>
  3174. <Description>DataSpear Directory robot (24.109.29.xx)</Description>
  3175. <Type>R</Type>
  3176. <Comment></Comment>
  3177. <Link1>http://www.dataspear.com/</Link1>
  3178. <Link2></Link2>
  3179. </user-agent>
  3180. <user-agent>
  3181. <ID>id_a_f_215</ID>
  3182. <String>DataSpearSpiderBot/0.2 (DataSpear Spider Bot; http://dssb.dataspear.com/bot.html; dssb@dataspear.com)</String>
  3183. <Description>DataSpear Directory robot (24.109.29.xx)</Description>
  3184. <Type>R</Type>
  3185. <Comment></Comment>
  3186. <Link1>http://www.dataspear.com/</Link1>
  3187. <Link2></Link2>
  3188. </user-agent>
  3189. <user-agent>
  3190. <ID>id_a_f_161105_1</ID>
  3191. <String>DatenBot( http://www.sicher-durchs-netz.de/bot.html)</String>
  3192. <Description>Sicher-durchs-Netz German security related search (62.75.220.xxx)</Description>
  3193. <Type>R</Type>
  3194. <Comment></Comment>
  3195. <Link1>http://www.sicher-durchs-netz.de/suche</Link1>
  3196. <Link2></Link2>
  3197. </user-agent>
  3198. <user-agent>
  3199. <ID>id_a_f_216</ID>
  3200. <String>DaviesBot/1.7 (www.wholeweb.net)</String>
  3201. <Description>Wholeweb robot</Description>
  3202. <Type>R</Type>
  3203. <Comment>site is closed</Comment>
  3204. <Link1>http://www.wholeweb.net</Link1>
  3205. <Link2></Link2>
  3206. </user-agent>
  3207. <user-agent>
  3208. <ID>id_a_f_217</ID>
  3209. <String>daypopbot/0.x</String>
  3210. <Description>Daypop blog - weblog - online mag search spider</Description>
  3211. <Type>R</Type>
  3212. <Comment></Comment>
  3213. <Link1>http://www.daypop.com/info/about.htm</Link1>
  3214. <Link2></Link2>
  3215. </user-agent>
  3216. <user-agent>
  3217. <ID>id_a_f_218</ID>
  3218. <String>dbDig(http://www.prairielandconsulting.com)</String>
  3219. <Description>dbDig search engine</Description>
  3220. <Type>R</Type>
  3221. <Comment></Comment>
  3222. <Link1>http://www.prairielandconsulting.com</Link1>
  3223. <Link2></Link2>
  3224. </user-agent>
  3225. <user-agent>
  3226. <ID>id_a_f_219</ID>
  3227. <String>DBrowse 1.4b</String>
  3228. <Description>Some site scanning tool via diff. IPs i.e.: - wanweb.net (208.6.163.xxx) - cox.net (68.4.xxx.xxx)</Description>
  3229. <Type>S</Type>
  3230. <Comment>UA sometimes - DSurf15a 01 - DBrowse 1.4d</Comment>
  3231. <Link1></Link1>
  3232. <Link2></Link2>
  3233. </user-agent>
  3234. <user-agent>
  3235. <ID>id_a_f_220</ID>
  3236. <String>DBrowse 1.4d</String>
  3237. <Description>Some site scanning tool via diff. IPs i.e.: - pacbell.net (67.112.xxx.xxx)</Description>
  3238. <Type>S</Type>
  3239. <Comment>see also DSurf15a 01 - DBrowse 1.4b</Comment>
  3240. <Link1></Link1>
  3241. <Link2></Link2>
  3242. </user-agent>
  3243. <user-agent>
  3244. <ID>id_a_f_221</ID>
  3245. <String>DC-Sakura/x.xx</String>
  3246. <Description>DC-Sakura download manager</Description>
  3247. <Type>D</Type>
  3248. <Comment></Comment>
  3249. <Link1>http://www.dc-sakura.com/</Link1>
  3250. <Link2></Link2>
  3251. </user-agent>
  3252. <user-agent>
  3253. <ID>id_a_f_222</ID>
  3254. <String>dCSbot/1.1</String>
  3255. <Description>unknown divine/Openmarket.com robot</Description>
  3256. <Type>R</Type>
  3257. <Comment></Comment>
  3258. <Link1>http://www.openmarket.com/</Link1>
  3259. <Link2></Link2>
  3260. </user-agent>
  3261. <user-agent>
  3262. <ID>id_a_f_223</ID>
  3263. <String>DDD</String>
  3264. <Description>some (website) downloading tool</Description>
  3265. <Type>D</Type>
  3266. <Comment></Comment>
  3267. <Link1></Link1>
  3268. <Link2></Link2>
  3269. </user-agent>
  3270. <user-agent>
  3271. <ID>id_a_f_224</ID>
  3272. <String>dds explorer v1.0 beta</String>
  3273. <Description>Unknown user agent</Description>
  3274. <Type></Type>
  3275. <Comment></Comment>
  3276. <Link1></Link1>
  3277. <Link2></Link2>
  3278. </user-agent>
  3279. <user-agent>
  3280. <ID>id_a_f_225</ID>
  3281. <String>de.searchengine.comBot 1.2 (http://de.searchengine.com/spider)</String>
  3282. <Description>Searchengine.com (Germany) submission checking / robot (84.73.57.xx)</Description>
  3283. <Type>R</Type>
  3284. <Comment></Comment>
  3285. <Link1>http://de.searchengine.com</Link1>
  3286. <Link2></Link2>
  3287. </user-agent>
  3288. <user-agent>
  3289. <ID>id_a_f_226</ID>
  3290. <String>DeadLinkCheck/0.4.0 libwww-perl/5.xx</String>
  3291. <Description>DLC Perl HTTP link checking</Description>
  3292. <Type>C</Type>
  3293. <Comment></Comment>
  3294. <Link1>http://dlc.sourceforge.net/</Link1>
  3295. <Link2></Link2>
  3296. </user-agent>
  3297. <user-agent>
  3298. <ID>id_a_f_111206_3</ID>
  3299. <String>Deep Link Calculator v1.0</String>
  3300. <Description>Sootle Web Directory deep link checker</Description>
  3301. <Type>C</Type>
  3302. <Comment>216.89.111.x</Comment>
  3303. <Link1>http://directory.sootle.com/deep-links/</Link1>
  3304. <Link2></Link2>
  3305. </user-agent>
  3306. <user-agent>
  3307. <ID>id_a_f_227</ID>
  3308. <String>deepak-USC/ISI</String>
  3309. <Description>deepak-USC/ISI robot from USC/Information Science Institute</Description>
  3310. <Type>R</Type>
  3311. <Comment></Comment>
  3312. <Link1>http://www.isi.edu/%7Eravichan/deepak-usc-isi.html</Link1>
  3313. <Link2>http://www.isi.edu/</Link2>
  3314. </user-agent>
  3315. <user-agent>
  3316. <ID>id_a_f_228</ID>
  3317. <String>DeepIndex</String>
  3318. <Description>Deepindex robot</Description>
  3319. <Type>R</Type>
  3320. <Comment></Comment>
  3321. <Link1>http://www.deepindex.net/utilisateurs.php?referral=deepindex</Link1>
  3322. <Link2></Link2>
  3323. </user-agent>
  3324. <user-agent>
  3325. <ID>id_a_f_229</ID>
  3326. <String>DeepIndex ( http://www.zetbot.com )</String>
  3327. <Description>Zetbot search Belgium (213.41.128.xx) using Deepindex robot</Description>
  3328. <Type>R</Type>
  3329. <Comment></Comment>
  3330. <Link1>http://www.zetbot.com/</Link1>
  3331. <Link2>http://www.deepindex.net/utilisateurs.php?referral=deepindex</Link2>
  3332. </user-agent>
  3333. <user-agent>
  3334. <ID>id_a_f_230</ID>
  3335. <String>DeepIndex (www.en.deepindex.com)</String>
  3336. <Description>Deepindex robot</Description>
  3337. <Type>R</Type>
  3338. <Comment></Comment>
  3339. <Link1>http://www.deepindex.net/utilisateurs.php?referral=deepindex</Link1>
  3340. <Link2></Link2>
  3341. </user-agent>
  3342. <user-agent>
  3343. <ID>id_a_f_231</ID>
  3344. <String>DeepIndexer.ca</String>
  3345. <Description>Deepindex robot (via Paragon.net Canada)</Description>
  3346. <Type>R</Type>
  3347. <Comment></Comment>
  3348. <Link1>http://www.deepindex.net/utilisateurs.php?referral=deepindex</Link1>
  3349. <Link2></Link2>
  3350. </user-agent>
  3351. <user-agent>
  3352. <ID>id_a_f_011006_2</ID>
  3353. <String>del.icio.us-thumbnails/1.0 Mozilla/5.0 (compatible; Konqueror/3.4; FreeBSD) KHTML/3.4.2 (like Gecko)</String>
  3354. <Description>del.icio.us picture robot for thumbnail preview via Yahoo</Description>
  3355. <Type>D</Type>
  3356. <Comment>66.94.237.1xx</Comment>
  3357. <Link1>http://del.icio.us/</Link1>
  3358. <Link2></Link2>
  3359. </user-agent>
  3360. <user-agent>
  3361. <ID>id_a_f_250106_1</ID>
  3362. <String>DeleGate/9.0.5-fix1</String>
  3363. <Description>DeleGate application level gateway / proxy server</Description>
  3364. <Type>P</Type>
  3365. <Comment></Comment>
  3366. <Link1>http://www.delegate.org/delegate/</Link1>
  3367. <Link2></Link2>
  3368. </user-agent>
  3369. <user-agent>
  3370. <ID>id_a_f_232</ID>
  3371. <String>Demo Bot DOT 16b</String>
  3372. <Description>Some site scanning tool from 217.34.59.xxx (btopenworld.com)</Description>
  3373. <Type>S</Type>
  3374. <Comment></Comment>
  3375. <Link1></Link1>
  3376. <Link2></Link2>
  3377. </user-agent>
  3378. <user-agent>
  3379. <ID>id_a_f_233</ID>
  3380. <String>Demo Bot Z 16b</String>
  3381. <Description>Some site scanning tool from 68.154.96.xx (bellsouth.net)</Description>
  3382. <Type>S</Type>
  3383. <Comment>appears also as - MFC Foundation Class Library - Full Web Bot 0516B</Comment>
  3384. <Link1></Link1>
  3385. <Link2></Link2>
  3386. </user-agent>
  3387. <user-agent>
  3388. <ID>id_a_f_234</ID>
  3389. <String>Denmex websearch (http://search.denmex.com)</String>
  3390. <Description>Denmex Websearch robot/link checking</Description>
  3391. <Type>R</Type>
  3392. <Comment></Comment>
  3393. <Link1>http://search.denmex.com</Link1>
  3394. <Link2></Link2>
  3395. </user-agent>
  3396. <user-agent>
  3397. <ID>id_a_f_235</ID>
  3398. <String>Der gro&#223;e BilderSauger 2.00u</String>
  3399. <Description>DataBecker Bilder Sauger (discontinued) web graphics downloader</Description>
  3400. <Type>D</Type>
  3401. <Comment></Comment>
  3402. <Link1>http://www.databecker.de</Link1>
  3403. <Link2></Link2>
  3404. </user-agent>
  3405. <user-agent>
  3406. <ID>id_a_f_230206_1</ID>
  3407. <String>dev-spider2.searchpsider.com/1.3b</String>
  3408. <Description>Searchspider.com robot (72.245.225.xxx)</Description>
  3409. <Type>R</Type>
  3410. <Comment></Comment>
  3411. <Link1>http://www.searchspider.com/</Link1>
  3412. <Link2></Link2>
  3413. </user-agent>
  3414. <user-agent>
  3415. <ID>id_a_f_236</ID>
  3416. <String>DevComponents.com HtmlDocument Object</String>
  3417. <Description>DevComponents HTMLDocument Class Library for Visual Studio.net</Description>
  3418. <Type></Type>
  3419. <Comment></Comment>
  3420. <Link1>http://www.devcomponents.com</Link1>
  3421. <Link2></Link2>
  3422. </user-agent>
  3423. <user-agent>
  3424. <ID>id_a_f_237</ID>
  3425. <String>DiaGem/1.1 (http://www.skyrocket.gr.jp/diagem.html)</String>
  3426. <Description>DiaGem Japan web crawler</Description>
  3427. <Type>R</Type>
  3428. <Comment>(site is offline)</Comment>
  3429. <Link1>http://www.skyrocket.gr.jp</Link1>
  3430. <Link2></Link2>
  3431. </user-agent>
  3432. <user-agent>
  3433. <ID>id_a_f_238</ID>
  3434. <String>Diamond/x.0</String>
  3435. <Description>Claria (ex Gator) SearchScout robot (64.152.73.xx)</Description>
  3436. <Type>R</Type>
  3437. <Comment>s. also Claria</Comment>
  3438. <Link1>http://www.searchscout.com</Link1>
  3439. <Link2></Link2>
  3440. </user-agent>
  3441. <user-agent>
  3442. <ID>id_a_f_239</ID>
  3443. <String>DiamondBot</String>
  3444. <Description>Claria (ex Gator) SearchScout robot (64.152.73.xx)</Description>
  3445. <Type>R</Type>
  3446. <Comment>s. also Claria</Comment>
  3447. <Link1>http://www.searchscout.com</Link1>
  3448. <Link2></Link2>
  3449. </user-agent>
  3450. <user-agent>
  3451. <ID>id_a_f_240</ID>
  3452. <String>Digger/1.0 JDK/1.3.0rc3</String>
  3453. <Description>Diggit! robot</Description>
  3454. <Type>R</Type>
  3455. <Comment></Comment>
  3456. <Link1>http://www.diggit.com</Link1>
  3457. <Link2></Link2>
  3458. </user-agent>
  3459. <user-agent>
  3460. <ID>id_a_f_241</ID>
  3461. <String>DigOut4U</String>
  3462. <Description>OpenPortal4U robot</Description>
  3463. <Type>R</Type>
  3464. <Comment></Comment>
  3465. <Link1>http://www.arisem.com</Link1>
  3466. <Link2></Link2>
  3467. </user-agent>
  3468. <user-agent>
  3469. <ID>id_a_f_242</ID>
  3470. <String>DIIbot/1.2</String>
  3471. <Description>Findsame.com (site is offline) / Digital-Integrity robot</Description>
  3472. <Type>R</Type>
  3473. <Comment></Comment>
  3474. <Link1>http://www.digital-integrity.com/</Link1>
  3475. <Link2></Link2>
  3476. </user-agent>
  3477. <user-agent>
  3478. <ID>id_a_f_100206_1</ID>
  3479. <String>Dillo/0.8.5-i18n-misc</String>
  3480. <Description>Dillo Web Browser</Description>
  3481. <Type>B</Type>
  3482. <Comment></Comment>
  3483. <Link1>http://www.dillo.org/</Link1>
  3484. <Link2></Link2>
  3485. </user-agent>
  3486. <user-agent>
  3487. <ID>id_a_f_243</ID>
  3488. <String>Dillo/0.x.x</String>
  3489. <Description>Dillo Web Browser</Description>
  3490. <Type>B</Type>
  3491. <Comment></Comment>
  3492. <Link1>http://www.dillo.org/</Link1>
  3493. <Link2></Link2>
  3494. </user-agent>
  3495. <user-agent>
  3496. <ID>id_a_f_100109_1</ID>
  3497. <String>disastrous/1.0.5 (running with Python 2.5.1; http://www.bortzmeyer.org/disastrous.html; archangel77@del.icio.us)</String>
  3498. <Description>disastrous - a del.icio.us link checker based on Python</Description>
  3499. <Type>C</Type>
  3500. <Comment></Comment>
  3501. <Link1>http://www.bortzmeyer.org/disastrous.html</Link1>
  3502. <Link2></Link2>
  3503. </user-agent>
  3504. <user-agent>
  3505. <ID>id_a_f_140306_1</ID>
  3506. <String>DISCo Pump x.x</String>
  3507. <Description>DISCo Pump offline browser / website ripper</Description>
  3508. <Type>D</Type>
  3509. <Comment>No active homepage</Comment>
  3510. <Link1>http://www.arssoft.com/</Link1>
  3511. <Link2>http://www.filetransit.com/view.php?id=3870</Link2>
  3512. </user-agent>
  3513. <user-agent>
  3514. <ID>id_a_f_300907_1</ID>
  3515. <String>disco/Nutch-0.9 (experimental crawler; www.discoveryengine.com; disco-crawl@discoveryengine.com)</String>
  3516. <Description>Unknown robot from Discovery Engine Corp.</Description>
  3517. <Type>R</Type>
  3518. <Comment>208.96.54.xx</Comment>
  3519. <Link1>http://www.discoveryengine.com/</Link1>
  3520. <Link2></Link2>
  3521. </user-agent>
  3522. <user-agent>
  3523. <ID>id_a_f_300907_2</ID>
  3524. <String>disco/Nutch-1.0-dev (experimental crawler; www.discoveryengine.com; disco-crawl@discoveryengine.com)</String>
  3525. <Description>Unknown robot from Discovery Engine Corp.</Description>
  3526. <Type>R</Type>
  3527. <Comment>208.96.54.xx</Comment>
  3528. <Link1>http://www.discoveryengine.com/</Link1>
  3529. <Link2></Link2>
  3530. </user-agent>
  3531. <user-agent>
  3532. <ID>id_a_f_244</ID>
  3533. <String>DittoSpyder</String>
  3534. <Description>Ditto picture search robot</Description>
  3535. <Type>R</Type>
  3536. <Comment></Comment>
  3537. <Link1>http://www.ditto.com</Link1>
  3538. <Link2></Link2>
  3539. </user-agent>
  3540. <user-agent>
  3541. <ID>id_a_f_245</ID>
  3542. <String>dlman</String>
  3543. <Description>some download agent</Description>
  3544. <Type>D</Type>
  3545. <Comment>Wildsoft Surfer</Comment>
  3546. <Link1></Link1>
  3547. <Link2></Link2>
  3548. </user-agent>
  3549. <user-agent>
  3550. <ID>id_a_f_246</ID>
  3551. <String>dloader(NaverRobot)/1.0</String>
  3552. <Description>Naver Japan / Korea robot</Description>
  3553. <Type>R</Type>
  3554. <Comment>s. also Python-urllib/1.15 - nabot - NaverBot &amp; Cowbot</Comment>
  3555. <Link1>http://www.naver.co.jp</Link1>
  3556. <Link2></Link2>
  3557. </user-agent>
  3558. <user-agent>
  3559. <ID>id_a_f_100408_1</ID>
  3560. <String>DNSRight.com WebBot Link Ckeck Tool. Report abuse to: dnsr@dnsright.com</String>
  3561. <Description>DNS Right - Online DNS tools</Description>
  3562. <Type>C</Type>
  3563. <Comment>203.161.71.17x</Comment>
  3564. <Link1>http://www.dnsright.com/</Link1>
  3565. <Link2></Link2>
  3566. </user-agent>
  3567. <user-agent>
  3568. <ID>id_a_f_247</ID>
  3569. <String>DoCoMo/1.0/Nxxxi/c10</String>
  3570. <Description>NTT DoCoMo (Japan) robot</Description>
  3571. <Type>R</Type>
  3572. <Comment></Comment>
  3573. <Link1>http://www.nttdocomo.co.jp/</Link1>
  3574. <Link2></Link2>
  3575. </user-agent>
  3576. <user-agent>
  3577. <ID>id_a_f_248</ID>
  3578. <String>DoCoMo/1.0/Nxxxi/c10/TB</String>
  3579. <Description>NTT DoCoMo (Japan) robot</Description>
  3580. <Type>R</Type>
  3581. <Comment></Comment>
  3582. <Link1>http://www.nttdocomo.co.jp/</Link1>
  3583. <Link2></Link2>
  3584. </user-agent>
  3585. <user-agent>
  3586. <ID>id_a_f_249</ID>
  3587. <String>DoCoMo/1.0/P502i/c10 (Google CHTML Proxy/1.0)</String>
  3588. <Description>Google (216.239.39.x) proxy server</Description>
  3589. <Type>P</Type>
  3590. <Comment></Comment>
  3591. <Link1></Link1>
  3592. <Link2></Link2>
  3593. </user-agent>
  3594. <user-agent>
  3595. <ID>id_a_f_250</ID>
  3596. <String>DoCoMo/2.0 P900iV(c100;TB;W24H11) </String>
  3597. <Description>NTT DoCoMo (Japan) robot</Description>
  3598. <Type>R</Type>
  3599. <Comment></Comment>
  3600. <Link1>http://www.nttdocomo.co.jp/</Link1>
  3601. <Link2></Link2>
  3602. </user-agent>
  3603. <user-agent>
  3604. <ID>id_a_f_141205_1</ID>
  3605. <String>DoCoMo/2.0 SH901iS(c100;TB;W24H12)&#44;gzip(gfe) (via translate.google.com)</String>
  3606. <Description>NTT DoCoMo (Japan) proxy server (210.136.161.1xx)</Description>
  3607. <Type>P</Type>
  3608. <Comment></Comment>
  3609. <Link1>http://www.nttdocomo.co.jp/</Link1>
  3610. <Link2></Link2>
  3611. </user-agent>
  3612. <user-agent>
  3613. <ID>id_a_f_081207_1</ID>
  3614. <String>DoCoMo/2.0 SH902i (compatible; Y!J-SRD/1.0; http://help.yahoo.co.jp/help/jp/search/indexing/indexing-27.html)</String>
  3615. <Description>Yahoo Search Japan robot (203.216.197.xxx)</Description>
  3616. <Type>R</Type>
  3617. <Comment>s. also Y!J-SRD/1.0</Comment>
  3618. <Link1>http://www.yahoo.co.jp/</Link1>
  3619. <Link2></Link2>
  3620. </user-agent>
  3621. <user-agent>
  3622. <ID>id_a_f_271006_3</ID>
  3623. <String>DoCoMo/2.0/SO502i (compatible; Y!J-SRD/1.0; http://help.yahoo.co.jp/help/jp/search/indexing/indexing-27.html)</String>
  3624. <Description>Yahoo Search Japan robot (203.216.197.xxx)</Description>
  3625. <Type>R</Type>
  3626. <Comment>s. also Y!J-SRD/1.0</Comment>
  3627. <Link1>http://www.yahoo.co.jp/</Link1>
  3628. <Link2></Link2>
  3629. </user-agent>
  3630. <user-agent>
  3631. <ID>id_a_f_251</ID>
  3632. <String>DocZilla/1.0 (Windows; U; WinNT4.0; en-US; rv:1.0.0) Gecko/20020804</String>
  3633. <Description>DocZilla - Mozilla-based SGML/XML/HTML- browser</Description>
  3634. <Type>B</Type>
  3635. <Comment></Comment>
  3636. <Link1>http://www.doczilla.com</Link1>
  3637. <Link2></Link2>
  3638. </user-agent>
  3639. <user-agent>
  3640. <ID>id_a_f_210607_1</ID>
  3641. <String>dodgebot/experimental</String>
  3642. <Description>unknown robot from AGMLAB Information Technologies (Information retrieval system ?)</Description>
  3643. <Type>R</Type>
  3644. <Comment>212.174.130.1xx</Comment>
  3645. <Link1>http://www.agmlab.com/agmlab_eng.html</Link1>
  3646. <Link2></Link2>
  3647. </user-agent>
  3648. <user-agent>
  3649. <ID>id_a_f_180606_1</ID>
  3650. <String>DonutP; Windows98SE</String>
  3651. <Description>Donut P - Japanese IE based browser</Description>
  3652. <Type>B</Type>
  3653. <Comment></Comment>
  3654. <Link1>http://donutp.com/</Link1>
  3655. <Link2></Link2>
  3656. </user-agent>
  3657. <user-agent>
  3658. <ID>id_a_f_250907_2</ID>
  3659. <String>Doubanbot/1.0 (bot@douban.com http://www.douban.com)</String>
  3660. <Description>Unknown robot from douban search (China) - maybe image crawling</Description>
  3661. <Type></Type>
  3662. <Comment>59.151.41.xx</Comment>
  3663. <Link1>http://www.douban.com/</Link1>
  3664. <Link2></Link2>
  3665. </user-agent>
  3666. <user-agent>
  3667. <ID>id_a_f_252</ID>
  3668. <String>Download Demon/3.x.x.x</String>
  3669. <Description>Download Demon/Netzip download manager</Description>
  3670. <Type>D</Type>
  3671. <Comment></Comment>
  3672. <Link1>http://www.netzip.com</Link1>
  3673. <Link2></Link2>
  3674. </user-agent>
  3675. <user-agent>
  3676. <ID>id_a_f_191105_4</ID>
  3677. <String>Download Druid 2.x</String>
  3678. <Description>Download Druid IE plugin download manager</Description>
  3679. <Type>D</Type>
  3680. <Comment></Comment>
  3681. <Link1>http://www.xemico.com/druid/index.html</Link1>
  3682. <Link2></Link2>
  3683. </user-agent>
  3684. <user-agent>
  3685. <ID>id_a_f_253</ID>
  3686. <String>Download Express 1.0</String>
  3687. <Description>Download Express download manager</Description>
  3688. <Type>D</Type>
  3689. <Comment></Comment>
  3690. <Link1>http://www.metaproducts.com</Link1>
  3691. <Link2></Link2>
  3692. </user-agent>
  3693. <user-agent>
  3694. <ID>id_a_f_254</ID>
  3695. <String>Download Master</String>
  3696. <Description>Download Master download manager</Description>
  3697. <Type>D</Type>
  3698. <Comment></Comment>
  3699. <Link1>http://www.westbyte.com/dm/index.phtml</Link1>
  3700. <Link2></Link2>
  3701. </user-agent>
  3702. <user-agent>
  3703. <ID>id_a_f_191105_5</ID>
  3704. <String>Download Ninja 3.0</String>
  3705. <Description>Download Ninja download manager (Japan)</Description>
  3706. <Type>D</Type>
  3707. <Comment></Comment>
  3708. <Link1>http://www.h-fd.org/mkro/mt/archives/2002/09/download_ninja_1.html</Link1>
  3709. <Link2></Link2>
  3710. </user-agent>
  3711. <user-agent>
  3712. <ID>id_a_f_255</ID>
  3713. <String>Download Wonder</String>
  3714. <Description>Download Wonder download manager</Description>
  3715. <Type>D</Type>
  3716. <Comment></Comment>
  3717. <Link1>http://www.forty.com</Link1>
  3718. <Link2></Link2>
  3719. </user-agent>
  3720. <user-agent>
  3721. <ID>id_a_f_256</ID>
  3722. <String>Download-Tipp Linkcheck (http://download-tipp.de/)</String>
  3723. <Description>Download-Tipp Germany link checking</Description>
  3724. <Type>R</Type>
  3725. <Comment></Comment>
  3726. <Link1>http://download-tipp.de/</Link1>
  3727. <Link2></Link2>
  3728. </user-agent>
  3729. <user-agent>
  3730. <ID>id_a_f_257</ID>
  3731. <String>Download.exe(1.1) (+http://www.sql-und-xml.de/freeware-tools/)</String>
  3732. <Description>download.exe .NET based downloading tool</Description>
  3733. <Type>D</Type>
  3734. <Comment></Comment>
  3735. <Link1>http://www.sql-und-xml.de/freeware-tools/</Link1>
  3736. <Link2></Link2>
  3737. </user-agent>
  3738. <user-agent>
  3739. <ID>id_a_f_300907_3</ID>
  3740. <String>DownloadDirect.1.0</String>
  3741. <Description>Download Direct download manager</Description>
  3742. <Type>D</Type>
  3743. <Comment></Comment>
  3744. <Link1>http://senbit.com/</Link1>
  3745. <Link2></Link2>
  3746. </user-agent>
  3747. <user-agent>
  3748. <ID>id_a_f_258</ID>
  3749. <String>Dr.Web (R) online scanner: http://online.drweb.com/</String>
  3750. <Description>Dr.WEB online virus scanner</Description>
  3751. <Type></Type>
  3752. <Comment></Comment>
  3753. <Link1>http://online.drweb.com</Link1>
  3754. <Link2></Link2>
  3755. </user-agent>
  3756. <user-agent>
  3757. <ID>id_a_f_259</ID>
  3758. <String>Dragonfly File Reader</String>
  3759. <Description>Dragonfly CMS - Open Source content management system</Description>
  3760. <Type>B</Type>
  3761. <Comment></Comment>
  3762. <Link1>http://www.cpgnuke.com</Link1>
  3763. <Link2></Link2>
  3764. </user-agent>
  3765. <user-agent>
  3766. <ID>id_a_f_260</ID>
  3767. <String>Drecombot/1.0 (http://career.drecom.jp/bot.html)</String>
  3768. <Description>Drecom Japan (210.233.67.xxx) - Blog search ??</Description>
  3769. <Type>R</Type>
  3770. <Comment></Comment>
  3771. <Link1>http://www.drecom.co.jp</Link1>
  3772. <Link2></Link2>
  3773. </user-agent>
  3774. <user-agent>
  3775. <ID>id_a_f_3090906_1</ID>
  3776. <String>Drupal (+http://drupal.org/)</String>
  3777. <Description>Drupal - open source content management platform</Description>
  3778. <Type>C</Type>
  3779. <Comment></Comment>
  3780. <Link1>http://drupal.org/</Link1>
  3781. <Link2></Link2>
  3782. </user-agent>
  3783. <user-agent>
  3784. <ID>id_a_f_261</ID>
  3785. <String>DSurf15a 01</String>
  3786. <Description>Some site scanning tool via diff. IPs i.e.: - cox.net (68.5.xxx.xxx) - pacbell.net (64.16x.xxx.xxx)</Description>
  3787. <Type>S</Type>
  3788. <Comment>DBrowse 1.4d</Comment>
  3789. <Link1></Link1>
  3790. <Link2></Link2>
  3791. </user-agent>
  3792. <user-agent>
  3793. <ID>id_a_f_262</ID>
  3794. <String>DSurf15a 71</String>
  3795. <Description>Some site scanning tool via diff. IPs i.e.: - cox.net (68.4.xxx.xxx)</Description>
  3796. <Type>S</Type>
  3797. <Comment>TRPMFHXE</Comment>
  3798. <Link1></Link1>
  3799. <Link2></Link2>
  3800. </user-agent>
  3801. <user-agent>
  3802. <ID>id_a_f_263</ID>
  3803. <String>DSurf15a 81</String>
  3804. <Description>Some site scanning tool via diff. IPs i.e.: - verizon.net (4.47.xxx.xxx)</Description>
  3805. <Type>S</Type>
  3806. <Comment>WFRIKXVNFL</Comment>
  3807. <Link1></Link1>
  3808. <Link2></Link2>
  3809. </user-agent>
  3810. <user-agent>
  3811. <ID>id_a_f_264</ID>
  3812. <String>DSurf15a VA</String>
  3813. <Description>Some site scanning tool via diff. IPs i.e.: - eastlink.ca (24.222.xxx.xxx) - cogeco.net (216.221.8x.xxx)</Description>
  3814. <Type>S</Type>
  3815. <Comment></Comment>
  3816. <Link1></Link1>
  3817. <Link2></Link2>
  3818. </user-agent>
  3819. <user-agent>
  3820. <ID>id_a_f_020506_2</ID>
  3821. <String>DTAAgent</String>
  3822. <Description>DTAAgent Java object for data collecting</Description>
  3823. <Type>R D</Type>
  3824. <Comment></Comment>
  3825. <Link1>http://www.ibr.cs.tu-bs.de/courses/ss00/sep-vs/gruppe1/jdoc/DTA/agent/DTAAgent.html</Link1>
  3826. <Link2></Link2>
  3827. </user-agent>
  3828. <user-agent>
  3829. <ID>id_a_f_265</ID>
  3830. <String>dtSearchSpider</String>
  3831. <Description>dt Search Spider software</Description>
  3832. <Type>R</Type>
  3833. <Comment></Comment>
  3834. <Link1>http://www.dtsearch.com/spider.html</Link1>
  3835. <Link2></Link2>
  3836. </user-agent>
  3837. <user-agent>
  3838. <ID>id_a_f_266</ID>
  3839. <String>Dual Proxy</String>
  3840. <Description>Fourelle Venturi proxy server</Description>
  3841. <Type>P</Type>
  3842. <Comment></Comment>
  3843. <Link1>http://www.fourelle.com/news/articles/148457.htm</Link1>
  3844. <Link2></Link2>
  3845. </user-agent>
  3846. <user-agent>
  3847. <ID>id_a_f_290308_2</ID>
  3848. <String>DuckDuckBot/1.0; (+http://duckduckgo.com/duckduckbot.html)</String>
  3849. <Description>Duck Duck Go search crawler</Description>
  3850. <Type>R</Type>
  3851. <Comment>72.94.249.34</Comment>
  3852. <Link1>http://duckduckgo.com/</Link1>
  3853. <Link2>http://duckduckgo.com/duckduckbot.html</Link2>
  3854. </user-agent>
  3855. <user-agent>
  3856. <ID>id_a_f_267</ID>
  3857. <String>Dumbot(version 0.1 beta - dumbfind.com)</String>
  3858. <Description>DumbFind.com robot</Description>
  3859. <Type>R</Type>
  3860. <Comment></Comment>
  3861. <Link1>http://www.dumbfind.com</Link1>
  3862. <Link2></Link2>
  3863. </user-agent>
  3864. <user-agent>
  3865. <ID>id_a_f_268</ID>
  3866. <String>Dumbot(version 0.1 beta - http://www.dumbfind.com/dumbot.html)</String>
  3867. <Description>DumbFind.com robot</Description>
  3868. <Type>R</Type>
  3869. <Comment></Comment>
  3870. <Link1>http://www.dumbfind.com</Link1>
  3871. <Link2></Link2>
  3872. </user-agent>
  3873. <user-agent>
  3874. <ID>id_a_f_269</ID>
  3875. <String>Dumbot(version 0.1 beta)</String>
  3876. <Description>DumbFind.com robot</Description>
  3877. <Type>R</Type>
  3878. <Comment></Comment>
  3879. <Link1>http://www.dumbfind.com</Link1>
  3880. <Link2></Link2>
  3881. </user-agent>
  3882. <user-agent>
  3883. <ID>id_a_f_270</ID>
  3884. <String>e-sense 1.0 ea(www.vigiltech.com/esensedisclaim.html)</String>
  3885. <Description>Vigiltech e-Sense user research robot (website is offline)</Description>
  3886. <Type>R</Type>
  3887. <Comment></Comment>
  3888. <Link1></Link1>
  3889. <Link2></Link2>
  3890. </user-agent>
  3891. <user-agent>
  3892. <ID>id_a_f_271</ID>
  3893. <String>e-SocietyRobot(http://www.yama.info.waseda.ac.jp/~yamana/es/)</String>
  3894. <Description>e-Society Project (Japan) crawler (133.9.238.xx)</Description>
  3895. <Type>R</Type>
  3896. <Comment></Comment>
  3897. <Link1>http://www.yama.info.waseda.ac.jp</Link1>
  3898. <Link2></Link2>
  3899. </user-agent>
  3900. <user-agent>
  3901. <ID>id_a_f_280108_1</ID>
  3902. <String>eApolloBot/2.0 (compatible; heritrix/2.0.0-SNAPSHOT-20071024.170148 +http://www.eapollo-opto.com)</String>
  3903. <Description>Global Opto's eApollo Flash based search engine - Taiwan</Description>
  3904. <Type>R</Type>
  3905. <Comment></Comment>
  3906. <Link1>http://www.eapollo.com/eaSE.jsp?language=eng</Link1>
  3907. <Link2>http://www.global-opto.com/</Link2>
  3908. </user-agent>
  3909. <user-agent>
  3910. <ID>id_a_f_272</ID>
  3911. <String>EARTHCOM.info/1.x [www.earthcom.info]</String>
  3912. <Description>Earthcom (Czech Republic) search robot (194.108.39.xx)</Description>
  3913. <Type>R</Type>
  3914. <Comment>s. also Mozilla/5.0 (compatible; EARTHCOM.info/2.01 ...</Comment>
  3915. <Link1>http://www.earthcom.info</Link1>
  3916. <Link2></Link2>
  3917. </user-agent>
  3918. <user-agent>
  3919. <ID>id_a_f_273</ID>
  3920. <String>EARTHCOM.info/1.xbeta [www.earthcom.info]</String>
  3921. <Description>Earthcom (Czech Republic) search robot (194.108.39.xx)</Description>
  3922. <Type>R</Type>
  3923. <Comment>s. also Mozilla/5.0 (compatible; EARTHCOM.info/2.01 ...</Comment>
  3924. <Link1>http://www.earthcom.info</Link1>
  3925. <Link2></Link2>
  3926. </user-agent>
  3927. <user-agent>
  3928. <ID>id_a_f_274</ID>
  3929. <String>EasyDL/3.xx</String>
  3930. <Description>Keywen Encyclopedia Bot</Description>
  3931. <Type>R</Type>
  3932. <Comment></Comment>
  3933. <Link1>http://keywen.com/Encyclopedia/Bot/</Link1>
  3934. <Link2></Link2>
  3935. </user-agent>
  3936. <user-agent>
  3937. <ID>id_a_f_275</ID>
  3938. <String>EasyDL/3.xx http://keywen.com/Encyclopedia/Bot</String>
  3939. <Description>Keywen Encyclopedia Bot</Description>
  3940. <Type>R</Type>
  3941. <Comment></Comment>
  3942. <Link1>http://keywen.com/Encyclopedia/Bot/</Link1>
  3943. <Link2></Link2>
  3944. </user-agent>
  3945. <user-agent>
  3946. <ID>id_a_f_276</ID>
  3947. <String>EBrowse 1.4b</String>
  3948. <Description>Some site scanning tool via diff. IPs i.e.: - swbell.net (65.66.xxx.xxx)</Description>
  3949. <Type>S</Type>
  3950. <Comment></Comment>
  3951. <Link1></Link1>
  3952. <Link2></Link2>
  3953. </user-agent>
  3954. <user-agent>
  3955. <ID>id_a_f_277</ID>
  3956. <String>eCatch/3.0</String>
  3957. <Description>eCatch (now Wysigot) offline browser</Description>
  3958. <Type>B D</Type>
  3959. <Comment></Comment>
  3960. <Link1>http://www.ecatch.com</Link1>
  3961. <Link2></Link2>
  3962. </user-agent>
  3963. <user-agent>
  3964. <ID>id_a_f_278</ID>
  3965. <String>EchO!/2.0</String>
  3966. <Description>Echo.fr robot</Description>
  3967. <Type>R</Type>
  3968. <Comment></Comment>
  3969. <Link1>http://echo.fr/</Link1>
  3970. <Link2></Link2>
  3971. </user-agent>
  3972. <user-agent>
  3973. <ID>id_a_f_279</ID>
  3974. <String>Educate Search VxB</String>
  3975. <Description>Some site scanning tool via diff. IPs i.e.: - cox.net (68.4.xxx.xxx)</Description>
  3976. <Type>S</Type>
  3977. <Comment>s. also DSurf - 66.118.1xx.xxx (sagonet.com) - see also Full Web Bot - Industry Program 1.0.5</Comment>
  3978. <Link1></Link1>
  3979. <Link2></Link2>
  3980. </user-agent>
  3981. <user-agent>
  3982. <ID>id_a_f_280</ID>
  3983. <String>egothor/3.0a (+http://www.xdefine.org/robot.html)</String>
  3984. <Description>Xdefine text search engine robot - based on Egothor open source crawler</Description>
  3985. <Type>R</Type>
  3986. <Comment></Comment>
  3987. <Link1>http://www.xdefine.com/</Link1>
  3988. <Link2>http://www.egothor.org/</Link2>
  3989. </user-agent>
  3990. <user-agent>
  3991. <ID>id_a_f_281</ID>
  3992. <String>EgotoBot/4.8 (+http://www.egoto.com/about.htm)</String>
  3993. <Description>Egoto Search robot</Description>
  3994. <Type>R</Type>
  3995. <Comment></Comment>
  3996. <Link1>http://www.egoto.com</Link1>
  3997. <Link2></Link2>
  3998. </user-agent>
  3999. <user-agent>
  4000. <ID>id_a_f_211105_1</ID>
  4001. <String>ejupiter.com</String>
  4002. <Description>eJupiter search robot (206.191.49.xx)</Description>
  4003. <Type>R</Type>
  4004. <Comment></Comment>
  4005. <Link1>http://search.ejupiter.com/</Link1>
  4006. <Link2></Link2>
  4007. </user-agent>
  4008. <user-agent>
  4009. <ID>id_a_f_282</ID>
  4010. <String>EldoS TimelyWeb/3.x</String>
  4011. <Description>TimelyWeb web page monitoring tool</Description>
  4012. <Type>C</Type>
  4013. <Comment>s. also TimelyWeb/...</Comment>
  4014. <Link1>http://www.eldos.org/timelyweb/timelyweb.html</Link1>
  4015. <Link2></Link2>
  4016. </user-agent>
  4017. <user-agent>
  4018. <ID>id_a_f_283</ID>
  4019. <String>elfbot/1.0 (+http://www.uchoose.de/crawler/elfbot/)</String>
  4020. <Description>Elftales crawler for uChoose theme based search (Germany)</Description>
  4021. <Type>R</Type>
  4022. <Comment></Comment>
  4023. <Link1>http://www.uchoose.de</Link1>
  4024. <Link2></Link2>
  4025. </user-agent>
  4026. <user-agent>
  4027. <ID>id_a_f_300707_1</ID>
  4028. <String>ELI/20070402:2.0 (DAUM RSS Robot&#44; Daum Communications Corp.; +http://ws.daum.net/aboutkr.html)</String>
  4029. <Description>DAUMOA - RSS search robot of Daum</Description>
  4030. <Type>R</Type>
  4031. <Comment>211.115.109.1xx</Comment>
  4032. <Link1>http://ws.daum.net/abouten.html</Link1>
  4033. <Link2></Link2>
  4034. </user-agent>
  4035. <user-agent>
  4036. <ID>id_a_f_284</ID>
  4037. <String>ELinks (0.x.x; Linux 2.4.20 i586; 132x60)</String>
  4038. <Description>ELinks text mode browser</Description>
  4039. <Type>B</Type>
  4040. <Comment></Comment>
  4041. <Link1>http://elinks.or.cz/</Link1>
  4042. <Link2></Link2>
  4043. </user-agent>
  4044. <user-agent>
  4045. <ID>id_a_f_285</ID>
  4046. <String>ELinks/0.x.x (textmode; NetBSD 1.6.2 sparc; 132x43)</String>
  4047. <Description>ELinks text mode browser</Description>
  4048. <Type>B</Type>
  4049. <Comment></Comment>
  4050. <Link1>http://elinks.or.cz/</Link1>
  4051. <Link2></Link2>
  4052. </user-agent>
  4053. <user-agent>
  4054. <ID>id_a_f_286</ID>
  4055. <String>EmailSiphon</String>
  4056. <Description>Sonic E-mail collector</Description>
  4057. <Type>S</Type>
  4058. <Comment></Comment>
  4059. <Link1>http://www.americaint.com/superstore/elist.html</Link1>
  4060. <Link2></Link2>
  4061. </user-agent>
  4062. <user-agent>
  4063. <ID>id_a_f_220508_2</ID>
  4064. <String>EmailSpider</String>
  4065. <Description>EmailSpider E-mail harvesting  software</Description>
  4066. <Type>S</Type>
  4067. <Comment></Comment>
  4068. <Link1>http://www.emailspider.net/index.php?kat=11</Link1>
  4069. <Link2></Link2>
  4070. </user-agent>
  4071. <user-agent>
  4072. <ID>id_a_f_287</ID>
  4073. <String>EmailWolf 1.00</String>
  4074. <Description>Trellian EMailWolf E-mail collector</Description>
  4075. <Type>S</Type>
  4076. <Comment></Comment>
  4077. <Link1>http://www.trellian.com</Link1>
  4078. <Link2></Link2>
  4079. </user-agent>
  4080. <user-agent>
  4081. <ID>id_a_f_288</ID>
  4082. <String>EmeraldShield.com WebBot</String>
  4083. <Description>EmeraldShield spam and web filtration services</Description>
  4084. <Type>P R</Type>
  4085. <Comment></Comment>
  4086. <Link1>http://www.emeraldshield.com</Link1>
  4087. <Link2></Link2>
  4088. </user-agent>
  4089. <user-agent>
  4090. <ID>id_a_f_289</ID>
  4091. <String>EmeraldShield.com WebBot (http://www.emeraldshield.com/webbot.aspx)</String>
  4092. <Description>EmeraldShield spam and web filtration services</Description>
  4093. <Type>P R</Type>
  4094. <Comment></Comment>
  4095. <Link1>http://www.emeraldshield.com</Link1>
  4096. <Link2></Link2>
  4097. </user-agent>
  4098. <user-agent>
  4099. <ID>id_a_f_070606_2</ID>
  4100. <String>EMPAS_ROBOT</String>
  4101. <Description>Empas search Korea robot (220.95.22x.xxx)</Description>
  4102. <Type>R</Type>
  4103. <Comment></Comment>
  4104. <Link1>http://www.empas.com/</Link1>
  4105. <Link2></Link2>
  4106. </user-agent>
  4107. <user-agent>
  4108. <ID>id_a_f_280208_1</ID>
  4109. <String>EnaBot/1.x (http://www.enaball.com/crawler.html)</String>
  4110. <Description>Enabot - Enaball semantic search project crawler</Description>
  4111. <Type>R</Type>
  4112. <Comment></Comment>
  4113. <Link1>http://www.enaball.com/crawler.html</Link1>
  4114. <Link2></Link2>
  4115. </user-agent>
  4116. <user-agent>
  4117. <ID>id_a_f_110506_4</ID>
  4118. <String>endo/1.0 (Mac OS X; ppc i386; http://kula.jp/endo)</String>
  4119. <Description>endo - Mac news site and blog aggregator</Description>
  4120. <Type>B</Type>
  4121. <Comment></Comment>
  4122. <Link1>http://kula.jp/software/endo/</Link1>
  4123. <Link2></Link2>
  4124. </user-agent>
  4125. <user-agent>
  4126. <ID>id_a_f_290</ID>
  4127. <String>Enfish Tracker</String>
  4128. <Description>Enfish Personal search tool</Description>
  4129. <Type>R</Type>
  4130. <Comment></Comment>
  4131. <Link1>http://www.enfish.com</Link1>
  4132. <Link2></Link2>
  4133. </user-agent>
  4134. <user-agent>
  4135. <ID>id_a_f_291</ID>
  4136. <String>Enterprise_Search/1.0</String>
  4137. <Description>Enterprise Search engine software (64.202.165.xxx)</Description>
  4138. <Type>R</Type>
  4139. <Comment> s. also - ES.NET_Crawler - InnerpriseBot</Comment>
  4140. <Link1>http://www.innerprise.net</Link1>
  4141. <Link2></Link2>
  4142. </user-agent>
  4143. <user-agent>
  4144. <ID>id_a_f_292</ID>
  4145. <String>Enterprise_Search/1.0.xxx</String>
  4146. <Description>Enterprise Search engine software (64.202.165.xxx)</Description>
  4147. <Type>R</Type>
  4148. <Comment> s. also - ES.NET_Crawler - InnerpriseBot</Comment>
  4149. <Link1>http://www.innerprise.net</Link1>
  4150. <Link2></Link2>
  4151. </user-agent>
  4152. <user-agent>
  4153. <ID>id_a_f_293</ID>
  4154. <String>Enterprise_Search/1.00.xxx;MSSQL (http://www.innerprise.net/es-spider.asp)</String>
  4155. <Description>Enterprise Search engine software (64.202.165.xxx)</Description>
  4156. <Type>R</Type>
  4157. <Comment> s. also - ES.NET_Crawler - InnerpriseBot</Comment>
  4158. <Link1>http://www.innerprise.net</Link1>
  4159. <Link2></Link2>
  4160. </user-agent>
  4161. <user-agent>
  4162. <ID>id_a_f_230706_1</ID>
  4163. <String>envolk/1.7 (+http://www.envolk.com/envolkspiderinfo.php)</String>
  4164. <Description>Envolk Web Search robot</Description>
  4165. <Type>R</Type>
  4166. <Comment>70.169.191.x</Comment>
  4167. <Link1>http://www.envolk.com/</Link1>
  4168. <Link2></Link2>
  4169. </user-agent>
  4170. <user-agent>
  4171. <ID>id_a_f_294</ID>
  4172. <String>envolk[ITS]spider/1.6(+http://www.envolk.com/envolkspider.html)</String>
  4173. <Description>Envolk Web Search robot</Description>
  4174. <Type>R</Type>
  4175. <Comment>70.169.191.x</Comment>
  4176. <Link1>http://www.envolk.com/</Link1>
  4177. <Link2></Link2>
  4178. </user-agent>
  4179. <user-agent>
  4180. <ID>id_a_f_295</ID>
  4181. <String>EroCrawler</String>
  4182. <Description>EroCrawler adult search robot</Description>
  4183. <Type>R</Type>
  4184. <Comment></Comment>
  4185. <Link1>http://www.erocrawler.com</Link1>
  4186. <Link2></Link2>
  4187. </user-agent>
  4188. <user-agent>
  4189. <ID>id_a_f_296</ID>
  4190. <String>ES.NET_Crawler/2.0 (http://search.innerprise.net/)</String>
  4191. <Description>Enterprise Search engine software (64.202.165.xxx)</Description>
  4192. <Type>R</Type>
  4193. <Comment>s. also - Enterprise_Search - InnerpriseBot</Comment>
  4194. <Link1>http://search.innerprise.net</Link1>
  4195. <Link2></Link2>
  4196. </user-agent>
  4197. <user-agent>
  4198. <ID>id_a_f_297</ID>
  4199. <String>eseek-larbin_2.6.2 (crawler@exactseek.com)</String>
  4200. <Description>ExactSEEK (Jayde Online) robot</Description>
  4201. <Type>R</Type>
  4202. <Comment>see also ExactSeek Crawler / eseek-larbin / exactseek.com</Comment>
  4203. <Link1>http://www.exactseek.com</Link1>
  4204. <Link2></Link2>
  4205. </user-agent>
  4206. <user-agent>
  4207. <ID>id_a_f_298</ID>
  4208. <String>ESISmartSpider</String>
  4209. <Description>ESI Smart-Spider toolkit</Description>
  4210. <Type>R</Type>
  4211. <Comment></Comment>
  4212. <Link1>http://www.smart-spider.com/</Link1>
  4213. <Link2></Link2>
  4214. </user-agent>
  4215. <user-agent>
  4216. <ID>id_a_f_299</ID>
  4217. <String>eStyleSearch 4 (compatible; MSIE 6.0; Windows NT 5.0)</String>
  4218. <Description>e-Style ISP search (Russia) robot (217.174.103.xxx)</Description>
  4219. <Type>R</Type>
  4220. <Comment></Comment>
  4221. <Link1>http://www.e-styleisp.ru/</Link1>
  4222. <Link2></Link2>
  4223. </user-agent>
  4224. <user-agent>
  4225. <ID>id_a_f_300</ID>
  4226. <String>ESurf15a 15</String>
  4227. <Description>Some site scanning tool via diff. IPs</Description>
  4228. <Type>S</Type>
  4229. <Comment>s. also DSurf - PBrowse ...</Comment>
  4230. <Link1></Link1>
  4231. <Link2></Link2>
  4232. </user-agent>
  4233. <user-agent>
  4234. <ID>id_a_f_301</ID>
  4235. <String>EuripBot/0.x (+http://www.eurip.com) GetFile</String>
  4236. <Description>Eurip.com - European Internet Portal robot</Description>
  4237. <Type>R</Type>
  4238. <Comment></Comment>
  4239. <Link1>http://www.eurip.com</Link1>
  4240. <Link2></Link2>
  4241. </user-agent>
  4242. <user-agent>
  4243. <ID>id_a_f_302</ID>
  4244. <String>EuripBot/0.x (+http://www.eurip.com) GetRobots</String>
  4245. <Description>Eurip.com - European Internet Portal robot</Description>
  4246. <Type>R</Type>
  4247. <Comment></Comment>
  4248. <Link1>http://www.eurip.com</Link1>
  4249. <Link2></Link2>
  4250. </user-agent>
  4251. <user-agent>
  4252. <ID>id_a_f_303</ID>
  4253. <String>EuripBot/0.x (+http://www.eurip.com) PreCheck</String>
  4254. <Description>Eurip.com - European Internet Portal robot</Description>
  4255. <Type>R</Type>
  4256. <Comment></Comment>
  4257. <Link1>http://www.eurip.com</Link1>
  4258. <Link2></Link2>
  4259. </user-agent>
  4260. <user-agent>
  4261. <ID>id_a_f_220508_3</ID>
  4262. <String>Eurobot/1.0 (http://www.ayell.eu)</String>
  4263. <Description>Ayell Euronet business directory robot</Description>
  4264. <Type>R</Type>
  4265. <Comment></Comment>
  4266. <Link1>http://www.ayell.eu/</Link1>
  4267. <Link2></Link2>
  4268. </user-agent>
  4269. <user-agent>
  4270. <ID>id_a_f_030206_4</ID>
  4271. <String>EvaalSE - bot@evaal.com</String>
  4272. <Description>Evaal Search Engine robot</Description>
  4273. <Type>R</Type>
  4274. <Comment>based on Nutch</Comment>
  4275. <Link1>http://www.evaal.com/</Link1>
  4276. <Link2>http://search.evaal.com/en/about.html</Link2>
  4277. </user-agent>
  4278. <user-agent>
  4279. <ID>id_a_f_304</ID>
  4280. <String>eventax/1.3 (eventax; http://www.eventax.de/; info@eventax.de)</String>
  4281. <Description>Eventax event search (Germany)</Description>
  4282. <Type>R</Type>
  4283. <Comment></Comment>
  4284. <Link1>http://www.eventax.de</Link1>
  4285. <Link2></Link2>
  4286. </user-agent>
  4287. <user-agent>
  4288. <ID>id_a_f_291205_1</ID>
  4289. <String>Everest-Vulcan Inc./0.1 (R&amp;D project; host=e-1-24; http://everest.vulcan.com/crawlerhelp)</String>
  4290. <Description>Vulcan Inc. Everest crawler (in development)</Description>
  4291. <Type>R</Type>
  4292. <Comment></Comment>
  4293. <Link1>http://www.vulcan.com/</Link1>
  4294. <Link2></Link2>
  4295. </user-agent>
  4296. <user-agent>
  4297. <ID>id_a_f_305</ID>
  4298. <String>Everest-Vulcan Inc./0.1 (R&amp;D project; http://everest.vulcan.com/crawlerhelp)</String>
  4299. <Description>Vulcan Inc. Everest crawler (in development)</Description>
  4300. <Type>R</Type>
  4301. <Comment></Comment>
  4302. <Link1>http://www.vulcan.com/</Link1>
  4303. <Link2></Link2>
  4304. </user-agent>
  4305. <user-agent>
  4306. <ID>id_a_f_050406_2</ID>
  4307. <String>Exabot-Images/1.0</String>
  4308. <Description>Exalead Websearch image crawler (193.47.80.xx)</Description>
  4309. <Type>R</Type>
  4310. <Comment>Exabot-Images only requests robots.txt - image crawling under UA NG/4.0.1229</Comment>
  4311. <Link1>http://www.exalead.com/search</Link1>
  4312. <Link2></Link2>
  4313. </user-agent>
  4314. <user-agent>
  4315. <ID>id_a_f_211206_1</ID>
  4316. <String>Exabot-Test/1.0</String>
  4317. <Description>Exalead (France) search robot (193.47.80.xx)</Description>
  4318. <Type>R</Type>
  4319. <Comment>s. Harvest-NG/1.0.2 and Exalead NG...</Comment>
  4320. <Link1>http://www.exabot.com/</Link1>
  4321. <Link2></Link2>
  4322. </user-agent>
  4323. <user-agent>
  4324. <ID>id_a_f_190106_1</ID>
  4325. <String>Exabot/2.0</String>
  4326. <Description>Exalead (France) search robot (193.47.80.xx)</Description>
  4327. <Type>R</Type>
  4328. <Comment>s. Harvest-NG/1.0.2 and Exalead NG...</Comment>
  4329. <Link1>http://www.exabot.com/</Link1>
  4330. <Link2></Link2>
  4331. </user-agent>
  4332. <user-agent>
  4333. <ID>id_a_f_211206_2</ID>
  4334. <String>Exabot/3.0</String>
  4335. <Description>Exalead (France) search robot (193.47.80.xx)</Description>
  4336. <Type>R</Type>
  4337. <Comment>s. Harvest-NG/1.0.2 and Exalead NG...</Comment>
  4338. <Link1>http://www.exabot.com/</Link1>
  4339. <Link2></Link2>
  4340. </user-agent>
  4341. <user-agent>
  4342. <ID>id_a_f_306</ID>
  4343. <String>ExactSearch</String>
  4344. <Description>eXact Search Bar for IE</Description>
  4345. <Type>B</Type>
  4346. <Comment></Comment>
  4347. <Link1>http://www.exactsearchbar.com/exact04</Link1>
  4348. <Link2></Link2>
  4349. </user-agent>
  4350. <user-agent>
  4351. <ID>id_a_f_307</ID>
  4352. <String>ExactSeek Crawler/0.1</String>
  4353. <Description>ExactSEEK (Jayde Online) robot</Description>
  4354. <Type>R</Type>
  4355. <Comment>see also eseek-larbin / exactseek.com</Comment>
  4356. <Link1>http://www.exactseek.com</Link1>
  4357. <Link2></Link2>
  4358. </user-agent>
  4359. <user-agent>
  4360. <ID>id_a_f_308</ID>
  4361. <String>exactseek-crawler-2.63 (crawler@exactseek.com)</String>
  4362. <Description>ExactSEEK (Jayde Online) robot</Description>
  4363. <Type>R</Type>
  4364. <Comment>see also eseek-larbin / exactseek.com</Comment>
  4365. <Link1>http://www.exactseek.com</Link1>
  4366. <Link2></Link2>
  4367. </user-agent>
  4368. <user-agent>
  4369. <ID>id_a_f_309</ID>
  4370. <String>exactseek-pagereaper-2.63 (crawler@exactseek.com)</String>
  4371. <Description>ExactSEEK (Jayde Online) robot</Description>
  4372. <Type>R</Type>
  4373. <Comment>see also eseek-larbin / exactseek.com</Comment>
  4374. <Link1>http://www.exactseek.com</Link1>
  4375. <Link2></Link2>
  4376. </user-agent>
  4377. <user-agent>
  4378. <ID>id_a_f_050606_2</ID>
  4379. <String>exactseek.com</String>
  4380. <Description>ExactSEEK (Jayde Online) robot (69.9.181.1xx)</Description>
  4381. <Type>R</Type>
  4382. <Comment>see also eseek-larbin</Comment>
  4383. <Link1>http://www.exactseek.com</Link1>
  4384. <Link2></Link2>
  4385. </user-agent>
  4386. <user-agent>
  4387. <ID>id_a_f_310</ID>
  4388. <String>Exalead NG/MimeLive Client (convert/http/0.120)</String>
  4389. <Description>Exalead (France) search robot (193.47.80.xx)</Description>
  4390. <Type>R</Type>
  4391. <Comment>s. Harvest-NG/1.0.2 and NG/1.0</Comment>
  4392. <Link1>http://www.exabot.com</Link1>
  4393. <Link2></Link2>
  4394. </user-agent>
  4395. <user-agent>
  4396. <ID>id_a_f_311</ID>
  4397. <String>Excalibur Internet Spider V6.5.4</String>
  4398. <Description>Excalibur (now Convera) spider software</Description>
  4399. <Type>R</Type>
  4400. <Comment></Comment>
  4401. <Link1>http://www.excalib.com</Link1>
  4402. <Link2></Link2>
  4403. </user-agent>
  4404. <user-agent>
  4405. <ID>id_a_f_191206_1</ID>
  4406. <String>Execrawl/1.0 (Execrawl; http://www.execrawl.com/; bot@execrawl.com)</String>
  4407. <Description>Execrawl software search using nutch</Description>
  4408. <Type>R</Type>
  4409. <Comment>72.36.179.1xx</Comment>
  4410. <Link1>http://www.execrawl.com/</Link1>
  4411. <Link2></Link2>
  4412. </user-agent>
  4413. <user-agent>
  4414. <ID>id_a_f_060608_1</ID>
  4415. <String>exooba crawler/exooba crawler (crawler for exooba.com; http://www.exooba.com/; info at exooba dot com)</String>
  4416. <Description>exooba crawler for exooba search pre-alpha development</Description>
  4417. <Type>R</Type>
  4418. <Comment>216.195.184.xx</Comment>
  4419. <Link1>http://www.exooba.com/</Link1>
  4420. <Link2></Link2>
  4421. </user-agent>
  4422. <user-agent>
  4423. <ID>id_a_f_060608_2</ID>
  4424. <String>exooba/exooba crawler (exooba; exooba)</String>
  4425. <Description>exooba crawler for exooba search pre-alpha development</Description>
  4426. <Type>R</Type>
  4427. <Comment>216.195.184.xx</Comment>
  4428. <Link1>http://www.exooba.com/</Link1>
  4429. <Link2></Link2>
  4430. </user-agent>
  4431. <user-agent>
  4432. <ID>id_a_f_312</ID>
  4433. <String>ExperimentalHenrytheMiragoRobot</String>
  4434. <Description>Mirago UK Robot</Description>
  4435. <Type>R</Type>
  4436. <Comment></Comment>
  4437. <Link1>http://www.mirago.co.uk</Link1>
  4438. <Link2></Link2>
  4439. </user-agent>
  4440. <user-agent>
  4441. <ID>id_a_f_313</ID>
  4442. <String>Expired Domain Sleuth</String>
  4443. <Description>Expired Domain Sleuth domain name tool</Description>
  4444. <Type>R C</Type>
  4445. <Comment></Comment>
  4446. <Link1>http://expireddomainsleuth.com/</Link1>
  4447. <Link2></Link2>
  4448. </user-agent>
  4449. <user-agent>
  4450. <ID>id_a_f_314</ID>
  4451. <String>Express WebPictures (www.express-soft.com)</String>
  4452. <Description>Express Web Pictures image browser</Description>
  4453. <Type>B D</Type>
  4454. <Comment></Comment>
  4455. <Link1>http://www.express-soft.com/</Link1>
  4456. <Link2></Link2>
  4457. </user-agent>
  4458. <user-agent>
  4459. <ID>id_a_f_315</ID>
  4460. <String>ExtractorPro</String>
  4461. <Description>Extractor Pro e-mail collector</Description>
  4462. <Type>S</Type>
  4463. <Comment></Comment>
  4464. <Link1>http://www.extractorpro.com</Link1>
  4465. <Link2></Link2>
  4466. </user-agent>
  4467. <user-agent>
  4468. <ID>id_a_f_170106_1</ID>
  4469. <String>Extreme Picture Finder</String>
  4470. <Description>Exisoftware image grabber and downloading tool</Description>
  4471. <Type>D</Type>
  4472. <Comment></Comment>
  4473. <Link1>http://www.exisoftware.com/picture_finder/</Link1>
  4474. <Link2></Link2>
  4475. </user-agent>
  4476. <user-agent>
  4477. <ID>id_a_f_316</ID>
  4478. <String>EyeCatcher (Download-tipp.de)/1.0</String>
  4479. <Description>Download-Tipp Germany robot</Description>
  4480. <Type>R</Type>
  4481. <Comment></Comment>
  4482. <Link1>http://download-tipp.de</Link1>
  4483. <Link2></Link2>
  4484. </user-agent>
  4485. <user-agent>
  4486. <ID>id_a_f_091006_1</ID>
  4487. <String>Factbot 1.09 (see http://www.factbites.com/webmasters.php)</String>
  4488. <Description>Factbites search robot</Description>
  4489. <Type>R</Type>
  4490. <Comment>70.86.159.1xx</Comment>
  4491. <Link1>http://www.factbites.com/</Link1>
  4492. <Link2></Link2>
  4493. </user-agent>
  4494. <user-agent>
  4495. <ID>id_a_f_220906_1</ID>
  4496. <String>factbot : http://www.factbites.com/robots</String>
  4497. <Description>Factbites search robot</Description>
  4498. <Type>R</Type>
  4499. <Comment>70.86.159.1xx</Comment>
  4500. <Link1>http://www.factbites.com/</Link1>
  4501. <Link2></Link2>
  4502. </user-agent>
  4503. <user-agent>
  4504. <ID>id_a_f_221006_1</ID>
  4505. <String>FaEdit/2.0.x</String>
  4506. <Description>FaEdit Professional - Japanese bookmark manager</Description>
  4507. <Type>C</Type>
  4508. <Comment></Comment>
  4509. <Link1>https://sw.vector.co.jp/swreg/step1.reserve?srno=SR040433&amp;site=y</Link1>
  4510. <Link2></Link2>
  4511. </user-agent>
  4512. <user-agent>
  4513. <ID>id_a_f_317</ID>
  4514. <String>FairAd Client</String>
  4515. <Description>FairAd user</Description>
  4516. <Type>P</Type>
  4517. <Comment></Comment>
  4518. <Link1>http://www.fairad.de</Link1>
  4519. <Link2></Link2>
  4520. </user-agent>
  4521. <user-agent>
  4522. <ID>id_a_f_051206_1</ID>
  4523. <String>FANGCrawl/0.01</String>
  4524. <Description>Safe-t.net web filtering service</Description>
  4525. <Type>P</Type>
  4526. <Comment>63.167.160.1xx</Comment>
  4527. <Link1>http://www.safe-t.net/</Link1>
  4528. <Link2></Link2>
  4529. </user-agent>
  4530. <user-agent>
  4531. <ID>id_a_f_210206_1</ID>
  4532. <String>FARK.com link verifier</String>
  4533. <Description>Drew Curtis' FARK.com link checking</Description>
  4534. <Type>C</Type>
  4535. <Comment></Comment>
  4536. <Link1>http://www.fark.com/</Link1>
  4537. <Link2></Link2>
  4538. </user-agent>
  4539. <user-agent>
  4540. <ID>id_a_f_318</ID>
  4541. <String>Fast Crawler Gold Edition</String>
  4542. <Description>Fast/Alltheweb crawler (66.151.181.xx)</Description>
  4543. <Type>R</Type>
  4544. <Comment></Comment>
  4545. <Link1>http://www.alltheweb.com</Link1>
  4546. <Link2></Link2>
  4547. </user-agent>
  4548. <user-agent>
  4549. <ID>id_a_f_319</ID>
  4550. <String>FAST Enterprise Crawler 6 (Experimental)</String>
  4551. <Description>Fast/Alltheweb crawler (66.151.181.xx)</Description>
  4552. <Type>R</Type>
  4553. <Comment></Comment>
  4554. <Link1>http://www.alltheweb.com</Link1>
  4555. <Link2></Link2>
  4556. </user-agent>
  4557. <user-agent>
  4558. <ID>id_a_f_040206_1</ID>
  4559. <String>FAST Enterprise Crawler 6 / Scirus scirus-crawler@fast.no; http://www.scirus.com/srsapp/contactus/</String>
  4560. <Description>Fast Enterprise Crawler (66.151.181.xx) for Scirus scientific information search</Description>
  4561. <Type>R</Type>
  4562. <Comment></Comment>
  4563. <Link1>http://www.scirus.com/srsapp/</Link1>
  4564. <Link2>http://www.alltheweb.com</Link2>
  4565. </user-agent>
  4566. <user-agent>
  4567. <ID>id_a_f_320</ID>
  4568. <String>FAST Enterprise Crawler 6 used by Cobra Development (admin@fastsearch.com)</String>
  4569. <Description>Fast/Alltheweb crawler (66.151.181.xx)</Description>
  4570. <Type>R</Type>
  4571. <Comment></Comment>
  4572. <Link1>http://www.alltheweb.com</Link1>
  4573. <Link2></Link2>
  4574. </user-agent>
  4575. <user-agent>
  4576. <ID>id_a_f_070507_1</ID>
  4577. <String>FAST Enterprise Crawler 6 used by Comperio AS (sts@comperio.no)</String>
  4578. <Description>Comperio Web Miner based on Fast ESP</Description>
  4579. <Type>R</Type>
  4580. <Comment></Comment>
  4581. <Link1>http://www.comperio.no/index.php?option=com_content&amp;task=blogcategory&amp;id=7&amp;Itemid=27</Link1>
  4582. <Link2></Link2>
  4583. </user-agent>
  4584. <user-agent>
  4585. <ID>id_a_f_321</ID>
  4586. <String>FAST Enterprise Crawler 6 used by FAST (FAST)</String>
  4587. <Description>Fast/Alltheweb crawler (66.151.181.xx)</Description>
  4588. <Type>R</Type>
  4589. <Comment></Comment>
  4590. <Link1>http://www.alltheweb.com</Link1>
  4591. <Link2></Link2>
  4592. </user-agent>
  4593. <user-agent>
  4594. <ID>id_a_f_161106_1</ID>
  4595. <String>FAST Enterprise Crawler 6 used by Pages Jaunes (pvincent@pagesjaunes.fr)</String>
  4596. <Description>Pages Jaunes business search (France) robot using Fast Enterprise Crawler</Description>
  4597. <Type>R</Type>
  4598. <Comment>193.252.242.xx</Comment>
  4599. <Link1>http://www.pagesjaunes.fr/</Link1>
  4600. <Link2></Link2>
  4601. </user-agent>
  4602. <user-agent>
  4603. <ID>id_a_f_322</ID>
  4604. <String>FAST Enterprise Crawler 6 used by Sensis.com.au Web Crawler (search_comments\at\sensis\dot\com\dot\au)</String>
  4605. <Description>Fast/Alltheweb crawler for Sensis.com.au Australian search (66.151.181.xx)</Description>
  4606. <Type>R</Type>
  4607. <Comment></Comment>
  4608. <Link1>http://www.sensis.com.au/</Link1>
  4609. <Link2>http://www.alltheweb.com</Link2>
  4610. </user-agent>
  4611. <user-agent>
  4612. <ID>id_a_f_251007_2</ID>
  4613. <String>FAST Enterprise Crawler 6 used by Singapore Press Holdings (crawler@sphsearch.sg)</String>
  4614. <Description>SPH Search - Singapore related search using Fast crawler</Description>
  4615. <Type>R</Type>
  4616. <Comment>202.176.220.xx</Comment>
  4617. <Link1>http://www.sphsearch.sg/</Link1>
  4618. <Link2></Link2>
  4619. </user-agent>
  4620. <user-agent>
  4621. <ID>id_a_f_280606_2</ID>
  4622. <String>FAST Enterprise Crawler 6 used by WWU (wardi@uni-muenster.de)</String>
  4623. <Description>FAST Enterprise Crawler  used by WWU (University of Muenster - Germany)</Description>
  4624. <Type>C</Type>
  4625. <Comment>128.176.188.2xx</Comment>
  4626. <Link1>http://www.uni-muenster.de/en/index.html</Link1>
  4627. <Link2>http://www.alltheweb.com</Link2>
  4628. </user-agent>
  4629. <user-agent>
  4630. <ID>id_a_f_323</ID>
  4631. <String>FAST Enterprise Crawler/6 (www.fastsearch.com)</String>
  4632. <Description>Fast/Alltheweb crawler (66.151.181.xx)</Description>
  4633. <Type>R</Type>
  4634. <Comment></Comment>
  4635. <Link1>http://www.alltheweb.com</Link1>
  4636. <Link2></Link2>
  4637. </user-agent>
  4638. <user-agent>
  4639. <ID>id_a_f_324</ID>
  4640. <String>FAST Enterprise Crawler/6.4 (helpdesk at fast.no)</String>
  4641. <Description>Fast/Alltheweb crawler (66.151.181.xx)</Description>
  4642. <Type>R</Type>
  4643. <Comment></Comment>
  4644. <Link1>http://www.alltheweb.com</Link1>
  4645. <Link2></Link2>
  4646. </user-agent>
  4647. <user-agent>
  4648. <ID>id_a_f_325</ID>
  4649. <String>FAST FirstPage retriever (compatible; MSIE 5.5; Mozilla/4.0)</String>
  4650. <Description>Fast/Alltheweb crawler (66.151.181.xx)</Description>
  4651. <Type>R</Type>
  4652. <Comment></Comment>
  4653. <Link1>http://www.alltheweb.com</Link1>
  4654. <Link2></Link2>
  4655. </user-agent>
  4656. <user-agent>
  4657. <ID>id_a_f_326</ID>
  4658. <String>FAST MetaWeb Crawler (helpdesk at fastsearch dot com)</String>
  4659. <Description>Fast/Alltheweb crawler (66.151.181.xx)</Description>
  4660. <Type>R</Type>
  4661. <Comment></Comment>
  4662. <Link1>http://www.alltheweb.com</Link1>
  4663. <Link2></Link2>
  4664. </user-agent>
  4665. <user-agent>
  4666. <ID>id_a_f_327</ID>
  4667. <String>Fast PartnerSite Crawler</String>
  4668. <Description>Fast/Alltheweb crawler (66.151.181.xx)</Description>
  4669. <Type>R</Type>
  4670. <Comment></Comment>
  4671. <Link1>http://www.alltheweb.com</Link1>
  4672. <Link2></Link2>
  4673. </user-agent>
  4674. <user-agent>
  4675. <ID>id_a_f_328</ID>
  4676. <String>FAST-WebCrawler/2.2.10 (Multimedia Search) (crawler@fast.no; http://www.fast.no/faq/faqfastwebsearch/faqfastwebcrawler.html)</String>
  4677. <Description>Fast/Alltheweb multimedia crawler</Description>
  4678. <Type>R</Type>
  4679. <Comment>see also Yahoo-MMCrawler/3.x</Comment>
  4680. <Link1>http://www.alltheweb.com</Link1>
  4681. <Link2></Link2>
  4682. </user-agent>
  4683. <user-agent>
  4684. <ID>id_a_f_329</ID>
  4685. <String>FAST-WebCrawler/2.2.6 (crawler@fast.no; http://www.fast.no/faq/faqfastwebsearch/faqfastwebcrawler.html)</String>
  4686. <Description>Fast/Alltheweb crawler</Description>
  4687. <Type>R</Type>
  4688. <Comment></Comment>
  4689. <Link1>http://www.alltheweb.com</Link1>
  4690. <Link2></Link2>
  4691. </user-agent>
  4692. <user-agent>
  4693. <ID>id_a_f_330</ID>
  4694. <String>FAST-WebCrawler/2.2.7 (crawler@fast.no; http://www.fast.no/faq/faqfastwebsearch/faqfastwebcrawler.html)http://www.fast.no</String>
  4695. <Description>Fast/Alltheweb crawler</Description>
  4696. <Type>R</Type>
  4697. <Comment></Comment>
  4698. <Link1>http://www.alltheweb.com</Link1>
  4699. <Link2></Link2>
  4700. </user-agent>
  4701. <user-agent>
  4702. <ID>id_a_f_331</ID>
  4703. <String>FAST-WebCrawler/2.2.8 (crawler@fast.no; http://www.fast.no/faq/faqfastwebsearch/faqfastwebcrawler.html)http://www.fast.no</String>
  4704. <Description>Fast/Alltheweb crawler</Description>
  4705. <Type>R</Type>
  4706. <Comment></Comment>
  4707. <Link1>http://www.alltheweb.com</Link1>
  4708. <Link2></Link2>
  4709. </user-agent>
  4710. <user-agent>
  4711. <ID>id_a_f_332</ID>
  4712. <String>FAST-WebCrawler/3.2 test</String>
  4713. <Description>Fast/Alltheweb crawler</Description>
  4714. <Type>R</Type>
  4715. <Comment></Comment>
  4716. <Link1>http://www.alltheweb.com</Link1>
  4717. <Link2></Link2>
  4718. </user-agent>
  4719. <user-agent>
  4720. <ID>id_a_f_333</ID>
  4721. <String>FAST-WebCrawler/3.3 (crawler@fast.no; http://fast.no/support.php?c=faqs/crawler)</String>
  4722. <Description>Fast/Alltheweb crawler</Description>
  4723. <Type>R</Type>
  4724. <Comment></Comment>
  4725. <Link1>http://www.alltheweb.com</Link1>
  4726. <Link2></Link2>
  4727. </user-agent>
  4728. <user-agent>
  4729. <ID>id_a_f_334</ID>
  4730. <String>FAST-WebCrawler/3.4/Nirvana (crawler@fast.no; http://fast.no/support.php?c=faqs/crawler)</String>
  4731. <Description>Fast/Alltheweb crawler</Description>
  4732. <Type>R</Type>
  4733. <Comment></Comment>
  4734. <Link1>http://www.alltheweb.com</Link1>
  4735. <Link2></Link2>
  4736. </user-agent>
  4737. <user-agent>
  4738. <ID>id_a_f_335</ID>
  4739. <String>FAST-WebCrawler/3.4/PartnerSite (crawler@fast.no; http://fast.no/support.php?c=faqs/crawler)</String>
  4740. <Description>Fast/Alltheweb crawler</Description>
  4741. <Type>R</Type>
  4742. <Comment></Comment>
  4743. <Link1>http://www.alltheweb.com</Link1>
  4744. <Link2></Link2>
  4745. </user-agent>
  4746. <user-agent>
  4747. <ID>id_a_f_336</ID>
  4748. <String>FAST-WebCrawler/3.5 (atw-crawler at fast dot no; http://fast.no/support.php?c=faqs/crawler)</String>
  4749. <Description>Fast/Alltheweb crawler</Description>
  4750. <Type>R</Type>
  4751. <Comment></Comment>
  4752. <Link1>http://www.alltheweb.com</Link1>
  4753. <Link2></Link2>
  4754. </user-agent>
  4755. <user-agent>
  4756. <ID>id_a_f_337</ID>
  4757. <String>FAST-WebCrawler/3.6 (atw-crawler at fast dot no; http://fast.no/support/crawler.asp)</String>
  4758. <Description>Fast/Alltheweb crawler</Description>
  4759. <Type>R</Type>
  4760. <Comment></Comment>
  4761. <Link1>http://www.alltheweb.com</Link1>
  4762. <Link2></Link2>
  4763. </user-agent>
  4764. <user-agent>
  4765. <ID>id_a_f_338</ID>
  4766. <String>FAST-WebCrawler/3.6/FirstPage (crawler@fast.no; http://fast.no/support.php?c=faqs/crawler)</String>
  4767. <Description>Fast/Alltheweb crawler</Description>
  4768. <Type>R</Type>
  4769. <Comment></Comment>
  4770. <Link1>http://www.alltheweb.com</Link1>
  4771. <Link2></Link2>
  4772. </user-agent>
  4773. <user-agent>
  4774. <ID>id_a_f_339</ID>
  4775. <String>FAST-WebCrawler/3.7 (atw-crawler at fast dot no; http://fast.no/support/crawler.asp)</String>
  4776. <Description>Fast/Alltheweb crawler</Description>
  4777. <Type>R</Type>
  4778. <Comment></Comment>
  4779. <Link1>http://www.alltheweb.com</Link1>
  4780. <Link2></Link2>
  4781. </user-agent>
  4782. <user-agent>
  4783. <ID>id_a_f_340</ID>
  4784. <String>FAST-WebCrawler/3.7/FirstPage (atw-crawler at fast dot no;http://fast.no/support/crawler.asp)</String>
  4785. <Description>Fast/Alltheweb crawler</Description>
  4786. <Type>R</Type>
  4787. <Comment></Comment>
  4788. <Link1>http://www.alltheweb.com</Link1>
  4789. <Link2></Link2>
  4790. </user-agent>
  4791. <user-agent>
  4792. <ID>id_a_f_341</ID>
  4793. <String>FAST-WebCrawler/3.8 (atw-crawler at fast dot no; http://fast.no/support/crawler.asp)</String>
  4794. <Description>Fast/Alltheweb crawler</Description>
  4795. <Type>R</Type>
  4796. <Comment></Comment>
  4797. <Link1>http://www.alltheweb.com</Link1>
  4798. <Link2></Link2>
  4799. </user-agent>
  4800. <user-agent>
  4801. <ID>id_a_f_342</ID>
  4802. <String>FAST-WebCrawler/3.8/Fresh (atw-crawler at fast dot no; http://fast.no/support/crawler.asp)</String>
  4803. <Description>Fast/Alltheweb crawler</Description>
  4804. <Type>R</Type>
  4805. <Comment></Comment>
  4806. <Link1>http://www.alltheweb.com</Link1>
  4807. <Link2></Link2>
  4808. </user-agent>
  4809. <user-agent>
  4810. <ID>id_a_f_343</ID>
  4811. <String>FAST-WebCrawler/3.x Multimedia</String>
  4812. <Description>Fast/Alltheweb multimedia crawler</Description>
  4813. <Type>R</Type>
  4814. <Comment>see also Yahoo-MMCrawler/3.x</Comment>
  4815. <Link1>http://www.alltheweb.com</Link1>
  4816. <Link2></Link2>
  4817. </user-agent>
  4818. <user-agent>
  4819. <ID>id_a_f_344</ID>
  4820. <String>FAST-WebCrawler/3.x Multimedia (mm dash crawler at fast dot no)</String>
  4821. <Description>Fast/Alltheweb multimedia crawler</Description>
  4822. <Type>R</Type>
  4823. <Comment>see also Yahoo-MMCrawler/3.x</Comment>
  4824. <Link1>http://www.alltheweb.com</Link1>
  4825. <Link2></Link2>
  4826. </user-agent>
  4827. <user-agent>
  4828. <ID>id_a_f_121205_2</ID>
  4829. <String>fastbot crawler beta 2.0 (+http://www.fastbot.de)</String>
  4830. <Description>Fastbot search Germany crawler (80.252.104.1xx)</Description>
  4831. <Type>R</Type>
  4832. <Comment></Comment>
  4833. <Link1>http://www.fastbot.de/</Link1>
  4834. <Link2></Link2>
  4835. </user-agent>
  4836. <user-agent>
  4837. <ID>id_a_f_345</ID>
  4838. <String>FastBug http://www.ay-up.com</String>
  4839. <Description>Ay-Up geo sync search robot</Description>
  4840. <Type>R</Type>
  4841. <Comment></Comment>
  4842. <Link1>http://www.ay-up.com</Link1>
  4843. <Link2></Link2>
  4844. </user-agent>
  4845. <user-agent>
  4846. <ID>id_a_f_346</ID>
  4847. <String>FastCrawler 3.0.1 (crawler@1klik.dk)</String>
  4848. <Description>Fast/Alltheweb crawler (66.151.181.xx)</Description>
  4849. <Type>R</Type>
  4850. <Comment></Comment>
  4851. <Link1>http://www.alltheweb.com</Link1>
  4852. <Link2></Link2>
  4853. </user-agent>
  4854. <user-agent>
  4855. <ID>id_a_f_347</ID>
  4856. <String>FastSearch Web Crawler for Verizon SuperPages (kevin.watters@fastsearch.com)</String>
  4857. <Description>Fast/Alltheweb crawler used by SuperPages.com</Description>
  4858. <Type>R</Type>
  4859. <Comment></Comment>
  4860. <Link1>http://www.superpages.com</Link1>
  4861. <Link2>http://www.alltheweb.com</Link2>
  4862. </user-agent>
  4863. <user-agent>
  4864. <ID>id_a_f_170408_3</ID>
  4865. <String>Favcollector/2.0 (info@favcollector.com http://www.favcollector.com/)</String>
  4866. <Description>Favcollector Favicon collecting robot</Description>
  4867. <Type>R</Type>
  4868. <Comment>66.207.217.13x</Comment>
  4869. <Link1>http://www.favcollector.com/</Link1>
  4870. <Link2></Link2>
  4871. </user-agent>
  4872. <user-agent>
  4873. <ID>id_a_f_161006_1</ID>
  4874. <String>FavIconizer</String>
  4875. <Description>FavIconizer - IE favorites icons refreshing tool</Description>
  4876. <Type>D</Type>
  4877. <Comment></Comment>
  4878. <Link1>http://www.codeproject.com/tools/faviconizer.asp</Link1>
  4879. <Link2></Link2>
  4880. </user-agent>
  4881. <user-agent>
  4882. <ID>id_a_f_151206_1</ID>
  4883. <String>favo.eu crawler/0.6 (http://www.favo.eu)</String>
  4884. <Description>favo.eu (Germany) search robot</Description>
  4885. <Type>R</Type>
  4886. <Comment>84.19.186.1xx</Comment>
  4887. <Link1>http://www.favo.eu/</Link1>
  4888. <Link2></Link2>
  4889. </user-agent>
  4890. <user-agent>
  4891. <ID>id_a_f_348</ID>
  4892. <String>FavOrg</String>
  4893. <Description>ZD's FavOrg favourites managing program</Description>
  4894. <Type>C</Type>
  4895. <Comment></Comment>
  4896. <Link1>http://www.pcmag.com/article2/0&#44;4149&#44;108438&#44;00.asp</Link1>
  4897. <Link2></Link2>
  4898. </user-agent>
  4899. <user-agent>
  4900. <ID>id_a_f_260108_1</ID>
  4901. <String>Favorites Checking (http://campulka.net)</String>
  4902. <Description>Campulka.net Favorites checking tool</Description>
  4903. <Type>C</Type>
  4904. <Comment></Comment>
  4905. <Link1>http://campulka.net/?dir=Utility</Link1>
  4906. <Link2></Link2>
  4907. </user-agent>
  4908. <user-agent>
  4909. <ID>id_a_f_349</ID>
  4910. <String>Favorites Sweeper v.2.03</String>
  4911. <Description>Favorites Sweeper bookmark checker</Description>
  4912. <Type>C</Type>
  4913. <Comment></Comment>
  4914. <Link1>http://www.manitoolssoftware.cjb.net</Link1>
  4915. <Link2></Link2>
  4916. </user-agent>
  4917. <user-agent>
  4918. <ID>id_a_f_350</ID>
  4919. <String>Faxobot/1.0</String>
  4920. <Description>FaXo Search robot (69.152.89.xx)</Description>
  4921. <Type>R</Type>
  4922. <Comment></Comment>
  4923. <Link1>http://www.faxo.com</Link1>
  4924. <Link2></Link2>
  4925. </user-agent>
  4926. <user-agent>
  4927. <ID>id_a_f_351</ID>
  4928. <String>FDM 1.x</String>
  4929. <Description>Free Download Manager (FDM) download accelerator </Description>
  4930. <Type>D</Type>
  4931. <Comment></Comment>
  4932. <Link1>http://www.freedownloadmanager.org</Link1>
  4933. <Link2></Link2>
  4934. </user-agent>
  4935. <user-agent>
  4936. <ID>id_a_f_180207_1</ID>
  4937. <String>FDM 2.x</String>
  4938. <Description>Free Download Manager (FDM) download accelerator </Description>
  4939. <Type>D</Type>
  4940. <Comment></Comment>
  4941. <Link1>http://www.freedownloadmanager.org</Link1>
  4942. <Link2></Link2>
  4943. </user-agent>
  4944. <user-agent>
  4945. <ID>id_a_f_352</ID>
  4946. <String>Feed Seeker Bot (RSS Feed Seeker http://www.MyNewFavoriteThing.com/fsb.php)</String>
  4947. <Description>RSS Feed Seeker bot (68.225.95.2xx)</Description>
  4948. <Type>R</Type>
  4949. <Comment></Comment>
  4950. <Link1>http://www.MyNewFavoriteThing.com</Link1>
  4951. <Link2></Link2>
  4952. </user-agent>
  4953. <user-agent>
  4954. <ID>id_a_f_241206_1</ID>
  4955. <String>Feed24.com</String>
  4956. <Description>Feed24 news feed and blog search</Description>
  4957. <Type>R</Type>
  4958. <Comment>194.105.139.2xx</Comment>
  4959. <Link1>http://www.feed24.com/</Link1>
  4960. <Link2></Link2>
  4961. </user-agent>
  4962. <user-agent>
  4963. <ID>id_a_f_050306_1</ID>
  4964. <String>Feed::Find/0.0x</String>
  4965. <Description>Feed::Find - Syndication feed (RSS/Atom) auto-discovery</Description>
  4966. <Type>D</Type>
  4967. <Comment></Comment>
  4968. <Link1>http://search.cpan.org/~btrott/Feed-Find-0.06/lib/Feed/Find.pm</Link1>
  4969. <Link2></Link2>
  4970. </user-agent>
  4971. <user-agent>
  4972. <ID>id_a_f_250707_1</ID>
  4973. <String>Feedable/0.1 (compatible; MSIE 6.0; Windows NT 5.1)</String>
  4974. <Description>Feedable beta web based RSS service</Description>
  4975. <Type>B</Type>
  4976. <Comment>64.27.19.25x</Comment>
  4977. <Link1>http://reader.feedable.com/</Link1>
  4978. <Link2></Link2>
  4979. </user-agent>
  4980. <user-agent>
  4981. <ID>id_a_f_230406_2</ID>
  4982. <String>FeedChecker/0.01</String>
  4983. <Description>Unknown robot from the University of Tokyo (157.82.157.xx)</Description>
  4984. <Type>R</Type>
  4985. <Comment>reads robots.txt</Comment>
  4986. <Link1>http://www.u-tokyo.ac.jp/index_e.html</Link1>
  4987. <Link2></Link2>
  4988. </user-agent>
  4989. <user-agent>
  4990. <ID>id_a_f_140608_2</ID>
  4991. <String>FeedDemon/2.7 (http://www.newsgator.com/; Microsoft Windows XP)</String>
  4992. <Description>FeedDemon RSS reader</Description>
  4993. <Type>B</Type>
  4994. <Comment></Comment>
  4995. <Link1>http://www.newsgator.com/individuals/feeddemon/</Link1>
  4996. <Link2></Link2>
  4997. </user-agent>
  4998. <user-agent>
  4999. <ID>id_a_f_160308_2</ID>
  5000. <String>Feedfetcher-Google-iGoogleGadgets; (+http://www.google.com/feedfetcher.html)</String>
  5001. <Description>Google news feed fetcher for iGoogle gadgets</Description>
  5002. <Type>C</Type>
  5003. <Comment>72.14.[1-2]xx.[X]xx</Comment>
  5004. <Link1>http://www.google.com/feedfetcher.html</Link1>
  5005. <Link2></Link2>
  5006. </user-agent>
  5007. <user-agent>
  5008. <ID>id_a_f_010906_1</ID>
  5009. <String>Feedfetcher-Google; (+http://www.google.com/feedfetcher.html)</String>
  5010. <Description>Google Feedfetcher - RSS and Atom feed crawler</Description>
  5011. <Type>R</Type>
  5012. <Comment>72.14.199.x[xx]</Comment>
  5013. <Link1>http://www.google.com/feedfetcher.html</Link1>
  5014. <Link2></Link2>
  5015. </user-agent>
  5016. <user-agent>
  5017. <ID>id_a_f_010307_1</ID>
  5018. <String>FeedForAll rss2html.php v2</String>
  5019. <Description>FeedForAll RSS feed robot</Description>
  5020. <Type>C</Type>
  5021. <Comment>216.92.192.1xx</Comment>
  5022. <Link1>http://www.feedforall.com/</Link1>
  5023. <Link2></Link2>
  5024. </user-agent>
  5025. <user-agent>
  5026. <ID>id_a_f_010308_1</ID>
  5027. <String>FeedHub FeedDiscovery/1.0 (http://www.feedhub.com)</String>
  5028. <Description>FeedHub news feed personalization engine powered by mSpoke</Description>
  5029. <Type>R</Type>
  5030. <Comment>216.134.194.xx</Comment>
  5031. <Link1>http://www.feedhub.com/</Link1>
  5032. <Link2>http://www.mspoke.com/</Link2>
  5033. </user-agent>
  5034. <user-agent>
  5035. <ID>id_a_f_060608_3</ID>
  5036. <String>FeedHub MetaDataFetcher/1.0 (http://www.feedhub.com)</String>
  5037. <Description>FeedHub news feed personalization engine powered by mSpoke</Description>
  5038. <Type>R</Type>
  5039. <Comment>216.134.194.xx</Comment>
  5040. <Link1>http://www.feedhub.com/</Link1>
  5041. <Link2>http://www.mspoke.com/</Link2>
  5042. </user-agent>
  5043. <user-agent>
  5044. <ID>id_a_f_260608_3</ID>
  5045. <String>Feedjit Favicon Crawler 1.0</String>
  5046. <Description>Feedjit news feed service favicon crawler</Description>
  5047. <Type>R</Type>
  5048. <Comment>69.46.36.x</Comment>
  5049. <Link1>http://feedjit.com/</Link1>
  5050. <Link2></Link2>
  5051. </user-agent>
  5052. <user-agent>
  5053. <ID>id_a_f_150108_1</ID>
  5054. <String>Feedreader 3.xx (Powered by Newsbrain)</String>
  5055. <Description>Newsbrain Feedreader3</Description>
  5056. <Type>B</Type>
  5057. <Comment></Comment>
  5058. <Link1>http://www.feedreader.com/</Link1>
  5059. <Link2></Link2>
  5060. </user-agent>
  5061. <user-agent>
  5062. <ID>id_a_f_281106_3</ID>
  5063. <String>Feedshow/x.0 (http://www.feedshow.com; 1 subscriber)</String>
  5064. <Description>FeedShow online RSS feed reader</Description>
  5065. <Type>B</Type>
  5066. <Comment></Comment>
  5067. <Link1>http://www.feedshow.com/</Link1>
  5068. <Link2></Link2>
  5069. </user-agent>
  5070. <user-agent>
  5071. <ID>id_a_f_051206_2</ID>
  5072. <String>FeedshowOnline (http://www.feedshow.com)</String>
  5073. <Description>FeedShow online RSS feed reader</Description>
  5074. <Type>B</Type>
  5075. <Comment></Comment>
  5076. <Link1>http://www.feedshow.com/</Link1>
  5077. <Link2></Link2>
  5078. </user-agent>
  5079. <user-agent>
  5080. <ID>id_a_f_021206_1</ID>
  5081. <String>Feedster Crawler/3.0; Feedster&#44; Inc.</String>
  5082. <Description>Feedster RSS feed search</Description>
  5083. <Type>R</Type>
  5084. <Comment>64.95.116.x[x]</Comment>
  5085. <Link1>http://www.feedster.com/</Link1>
  5086. <Link2></Link2>
  5087. </user-agent>
  5088. <user-agent>
  5089. <ID>id_a_f_040207_1</ID>
  5090. <String>FeedZcollector v1.x (Platinum) http://www.feeds4all.com/feedzcollector</String>
  5091. <Description>FeedZcollector - Feed (RSS&#44; ATOM and RDF) capturing software</Description>
  5092. <Type>B</Type>
  5093. <Comment></Comment>
  5094. <Link1>http://www.feeds4all.com/feedzcollector/</Link1>
  5095. <Link2></Link2>
  5096. </user-agent>
  5097. <user-agent>
  5098. <ID>id_a_f_353</ID>
  5099. <String>Felix - Mixcat Crawler (+http://mixcat.com)</String>
  5100. <Description>MixCat robot</Description>
  5101. <Type>R</Type>
  5102. <Comment>s. also Morris</Comment>
  5103. <Link1>http://mixcat.com</Link1>
  5104. <Link2></Link2>
  5105. </user-agent>
  5106. <user-agent>
  5107. <ID>id_a_f_354</ID>
  5108. <String>fetch libfetch/2.0</String>
  5109. <Description>FreeBSD download tool</Description>
  5110. <Type>D</Type>
  5111. <Comment></Comment>
  5112. <Link1></Link1>
  5113. <Link2></Link2>
  5114. </user-agent>
  5115. <user-agent>
  5116. <ID>id_a_f_355</ID>
  5117. <String>FFC Trap Door Spider</String>
  5118. <Description>Frequent Finders spider via Sitefusion.com</Description>
  5119. <Type>R</Type>
  5120. <Comment></Comment>
  5121. <Link1>http://www.frequentfinders.com</Link1>
  5122. <Link2></Link2>
  5123. </user-agent>
  5124. <user-agent>
  5125. <ID>id_a_f_356</ID>
  5126. <String>Filangy/0.01-beta (Filangy; http://www.nutch.org/docs/en/bot.html; filangy-agent@filangy.com)</String>
  5127. <Description>Filangy search and bookmark service</Description>
  5128. <Type>R C</Type>
  5129. <Comment></Comment>
  5130. <Link1>http://www.filangy.com</Link1>
  5131. <Link2></Link2>
  5132. </user-agent>
  5133. <user-agent>
  5134. <ID>id_a_f_357</ID>
  5135. <String>Filangy/1.0x (Filangy; http://www.filangy.com/filangyinfo.jsp?inc=robots.jsp; filangy-agent@filangy.com)</String>
  5136. <Description>Filangy search and bookmark service</Description>
  5137. <Type>R C</Type>
  5138. <Comment></Comment>
  5139. <Link1>http://www.filangy.com</Link1>
  5140. <Link2></Link2>
  5141. </user-agent>
  5142. <user-agent>
  5143. <ID>id_a_f_358</ID>
  5144. <String>Filangy/1.0x (Filangy; http://www.nutch.org/docs/en/bot.html; filangy-agent@filangy.com)</String>
  5145. <Description>Filangy search and bookmark service</Description>
  5146. <Type>R C</Type>
  5147. <Comment></Comment>
  5148. <Link1>http://www.filangy.com</Link1>
  5149. <Link2></Link2>
  5150. </user-agent>
  5151. <user-agent>
  5152. <ID>id_a_f_359</ID>
  5153. <String>fileboost.net/1.0 (+http://www.fileboost.net)</String>
  5154. <Description>File Boost Network link checking</Description>
  5155. <Type>R C</Type>
  5156. <Comment></Comment>
  5157. <Link1>http://www.fileboost.net</Link1>
  5158. <Link2></Link2>
  5159. </user-agent>
  5160. <user-agent>
  5161. <ID>id_a_f_360</ID>
  5162. <String>FileHound x.x</String>
  5163. <Description>FileHound download manager</Description>
  5164. <Type>D</Type>
  5165. <Comment></Comment>
  5166. <Link1>http://www.allabout.com</Link1>
  5167. <Link2></Link2>
  5168. </user-agent>
  5169. <user-agent>
  5170. <ID>id_a_f_180208_1</ID>
  5171. <String>Filtrbox/1.0</String>
  5172. <Description>filtrbox media content (news) monitoring</Description>
  5173. <Type>R</Type>
  5174. <Comment>72.47.203.8x</Comment>
  5175. <Link1>http://www.filtrbox.com/</Link1>
  5176. <Link2></Link2>
  5177. </user-agent>
  5178. <user-agent>
  5179. <ID>id_a_f_361</ID>
  5180. <String>FindAnISP.com_ISP_Finder_v99a</String>
  5181. <Description>Find An ISP robot</Description>
  5182. <Type>R C</Type>
  5183. <Comment>site is down</Comment>
  5184. <Link1>http://www.findanisp.com/</Link1>
  5185. <Link2></Link2>
  5186. </user-agent>
  5187. <user-agent>
  5188. <ID>id_a_f_141205_2</ID>
  5189. <String>Findexa Crawler (http://www.findexa.no/gulesider/article26548.ece)</String>
  5190. <Description>Yelo.no business search (Norway) via Findexa</Description>
  5191. <Type>R</Type>
  5192. <Comment></Comment>
  5193. <Link1>http://www.findexa.no/english/article27709.ece</Link1>
  5194. <Link2></Link2>
  5195. </user-agent>
  5196. <user-agent>
  5197. <ID>id_a_f_362</ID>
  5198. <String>findlinks/x.xxx (+http://wortschatz.uni-leipzig.de/findlinks/) </String>
  5199. <Description>NextLinks - German vocabulary and hyperlink search</Description>
  5200. <Type>R</Type>
  5201. <Comment></Comment>
  5202. <Link1>http://wortschatz.uni-leipzig.de/nextlinks/findlinks.html</Link1>
  5203. <Link2></Link2>
  5204. </user-agent>
  5205. <user-agent>
  5206. <ID>id_a_f_363</ID>
  5207. <String>FineBot</String>
  5208. <Description>Finesearch robot</Description>
  5209. <Type>R</Type>
  5210. <Comment></Comment>
  5211. <Link1>http://www.finesearch.com</Link1>
  5212. <Link2></Link2>
  5213. </user-agent>
  5214. <user-agent>
  5215. <ID>id_a_f_080306_1</ID>
  5216. <String>Finjan-prefetch</String>
  5217. <Description>Finjan Vital Security Web Appliance security solution</Description>
  5218. <Type>P</Type>
  5219. <Comment></Comment>
  5220. <Link1>http://www.finjan.com/</Link1>
  5221. <Link2></Link2>
  5222. </user-agent>
  5223. <user-agent>
  5224. <ID>id_a_f_364</ID>
  5225. <String>Firefly/1.0</String>
  5226. <Description>Fireball.de robot</Description>
  5227. <Type>R</Type>
  5228. <Comment></Comment>
  5229. <Link1>http://www.fireball.de</Link1>
  5230. <Link2></Link2>
  5231. </user-agent>
  5232. <user-agent>
  5233. <ID>id_a_f_365</ID>
  5234. <String>Firefly/1.0 (compatible; Mozilla 4.0; MSIE 5.5)</String>
  5235. <Description>Fireball.de robot</Description>
  5236. <Type>R</Type>
  5237. <Comment></Comment>
  5238. <Link1>http://www.fireball.de</Link1>
  5239. <Link2></Link2>
  5240. </user-agent>
  5241. <user-agent>
  5242. <ID>id_a_f_210906_1</ID>
  5243. <String>Firefox (kastaneta03@hotmail.com)</String>
  5244. <Description>Unknown robot from Czech Technical University Prague (147.32.141.xx)</Description>
  5245. <Type>R</Type>
  5246. <Comment>reads robots.txt</Comment>
  5247. <Link1>http://www.cvut.cz/</Link1>
  5248. <Link2></Link2>
  5249. </user-agent>
  5250. <user-agent>
  5251. <ID>id_a_f_190306_2</ID>
  5252. <String>Firefox_1.0.6 (kasparek@naparek.cz)</String>
  5253. <Description>Unknown robot from Czech Technical University Prague (147.32.141.xx)</Description>
  5254. <Type>R</Type>
  5255. <Comment>reads robots.txt</Comment>
  5256. <Link1>http://www.cvut.cz/</Link1>
  5257. <Link2></Link2>
  5258. </user-agent>
  5259. <user-agent>
  5260. <ID>id_a_f_366</ID>
  5261. <String>FirstGov.gov Search - POC:firstgov.webmasters@gsa.gov</String>
  5262. <Description>AT&amp;T/Fast Search robot for FirstGov (U.S.Government) portal</Description>
  5263. <Type>R</Type>
  5264. <Comment></Comment>
  5265. <Link1>http://www.firstgov.gov</Link1>
  5266. <Link2></Link2>
  5267. </user-agent>
  5268. <user-agent>
  5269. <ID>id_a_f_367</ID>
  5270. <String>firstsbot</String>
  5271. <Description>Firstsfind Germany robot / link checking</Description>
  5272. <Type>R</Type>
  5273. <Comment></Comment>
  5274. <Link1>http://www.firstsfind.de</Link1>
  5275. <Link2></Link2>
  5276. </user-agent>
  5277. <user-agent>
  5278. <ID>id_a_f_020906_1</ID>
  5279. <String>Flapbot/0.7.2 (Flaptor Crawler; http://www.flaptor.com; crawler at flaptor period com)</String>
  5280. <Description>Flaptor information retrieval solutions robot</Description>
  5281. <Type>R</Type>
  5282. <Comment></Comment>
  5283. <Link1>http://www.flaptor.com/index.htm</Link1>
  5284. <Link2></Link2>
  5285. </user-agent>
  5286. <user-agent>
  5287. <ID>id_a_f_368</ID>
  5288. <String>FlashGet</String>
  5289. <Description>JetCar/FlashGet download manager</Description>
  5290. <Type>D</Type>
  5291. <Comment></Comment>
  5292. <Link1>http://www.amazesoft.com</Link1>
  5293. <Link2></Link2>
  5294. </user-agent>
  5295. <user-agent>
  5296. <ID>id_a_f_161205_1</ID>
  5297. <String>FLATARTS_FAVICO</String>
  5298. <Description>FlatArts Favorites Icon Tool</Description>
  5299. <Type>C D</Type>
  5300. <Comment></Comment>
  5301. <Link1>http://flatarts.jp/contents/software/information.php?name=rico</Link1>
  5302. <Link2></Link2>
  5303. </user-agent>
  5304. <user-agent>
  5305. <ID>id_a_f_100308_1</ID>
  5306. <String>Flexum spider</String>
  5307. <Description>Flexum.ru search service</Description>
  5308. <Type>R</Type>
  5309. <Comment>81.176.76.93</Comment>
  5310. <Link1>http://www.flexum.ru/</Link1>
  5311. <Link2></Link2>
  5312. </user-agent>
  5313. <user-agent>
  5314. <ID>id_a_f_280508_2</ID>
  5315. <String>Flexum/2.0</String>
  5316. <Description>Flexum.ru search service</Description>
  5317. <Type>R</Type>
  5318. <Comment>81.176.76.93</Comment>
  5319. <Link1>http://www.flexum.ru/</Link1>
  5320. <Link2></Link2>
  5321. </user-agent>
  5322. <user-agent>
  5323. <ID>id_a_f_369</ID>
  5324. <String>FlickBot 2.0 RPT-HTTPClient/0.3-3</String>
  5325. <Description>DivX.com Movie Find robot</Description>
  5326. <Type>R</Type>
  5327. <Comment></Comment>
  5328. <Link1>http://www.divx.com</Link1>
  5329. <Link2></Link2>
  5330. </user-agent>
  5331. <user-agent>
  5332. <ID>id_a_f_370</ID>
  5333. <String>flunky</String>
  5334. <Description>Metacarta / Cogent robot</Description>
  5335. <Type>R</Type>
  5336. <Comment></Comment>
  5337. <Link1>http://www.metacarta.com</Link1>
  5338. <Link2></Link2>
  5339. </user-agent>
  5340. <user-agent>
  5341. <ID>id_a_f_371</ID>
  5342. <String>fly/6.01 libwww/4.0D</String>
  5343. <Description>unknown</Description>
  5344. <Type></Type>
  5345. <Comment></Comment>
  5346. <Link1></Link1>
  5347. <Link2></Link2>
  5348. </user-agent>
  5349. <user-agent>
  5350. <ID>id_a_f_110107_1</ID>
  5351. <String>flyindex.net 1.0/http://www.flyindex.net</String>
  5352. <Description>FLY Index Metasearch link checking</Description>
  5353. <Type>C</Type>
  5354. <Comment>62.141.52.2xx</Comment>
  5355. <Link1>http://www.flyindex.net/</Link1>
  5356. <Link2></Link2>
  5357. </user-agent>
  5358. <user-agent>
  5359. <ID>id_a_f_021108_1</ID>
  5360. <String>FnooleBot/2.5.2 (+http://www.fnoole.com/addurl.html)</String>
  5361. <Description>Fnoole news crawler</Description>
  5362. <Type>R</Type>
  5363. <Comment>209.205.65.9x</Comment>
  5364. <Link1>http://www.fnoole.com/</Link1>
  5365. <Link2></Link2>
  5366. </user-agent>
  5367. <user-agent>
  5368. <ID>id_a_f_372</ID>
  5369. <String>FocusedSampler/1.0</String>
  5370. <Description>IBM's Almaden Research robot</Description>
  5371. <Type>R</Type>
  5372. <Comment> s. also: - - WFARC</Comment>
  5373. <Link1>http://www.almaden.ibm.com</Link1>
  5374. <Link2></Link2>
  5375. </user-agent>
  5376. <user-agent>
  5377. <ID>id_a_f_080108_1</ID>
  5378. <String>Folkd.com Spider/0.1 beta 1 (www.folkd.com)</String>
  5379. <Description>folkd.com social search robot</Description>
  5380. <Type>R</Type>
  5381. <Comment>212.227.95.3x</Comment>
  5382. <Link1>http://www.folkd.com/</Link1>
  5383. <Link2></Link2>
  5384. </user-agent>
  5385. <user-agent>
  5386. <ID>id_a_f_070209_4</ID>
  5387. <String>FollowSite Bot ( http://www.followsite.com/bot.html )</String>
  5388. <Description>FollowSite robot - website monitoring</Description>
  5389. <Type>C</Type>
  5390. <Comment>77.232.77.13x</Comment>
  5391. <Link1>http://www.followsite.com/bot.html</Link1>
  5392. <Link2></Link2>
  5393. </user-agent>
  5394. <user-agent>
  5395. <ID>id_a_f_140209_1</ID>
  5396. <String>FollowSite.com ( http://www.followsite.com/b.html )</String>
  5397. <Description>FollowSite robot - website monitoring</Description>
  5398. <Type>C</Type>
  5399. <Comment>77.232.77.13x</Comment>
  5400. <Link1>http://www.followsite.com/bot.html</Link1>
  5401. <Link2></Link2>
  5402. </user-agent>
  5403. <user-agent>
  5404. <ID>id_a_f_141105_1</ID>
  5405. <String>Fooky.com/ScorpionBot/ScoutOut; http://www.fooky.com/scorpionbots</String>
  5406. <Description>Fooky search Scorpionbots robot (65.12.170.xxx)</Description>
  5407. <Type>R</Type>
  5408. <Comment></Comment>
  5409. <Link1>http://www.fooky.com/</Link1>
  5410. <Link2></Link2>
  5411. </user-agent>
  5412. <user-agent>
  5413. <ID>id_a_f_373</ID>
  5414. <String>Francis/1.0 (francis@neomo.de http://www.neomo.de/)</String>
  5415. <Description>Neomo Search (Germany) robot (85.10.197.1xx)</Description>
  5416. <Type>R</Type>
  5417. <Comment></Comment>
  5418. <Link1>http://www.neomo.de</Link1>
  5419. <Link2></Link2>
  5420. </user-agent>
  5421. <user-agent>
  5422. <ID>id_a_f_374</ID>
  5423. <String>Franklin Locator 1.8</String>
  5424. <Description>Some spam bot</Description>
  5425. <Type>S</Type>
  5426. <Comment></Comment>
  5427. <Link1></Link1>
  5428. <Link2></Link2>
  5429. </user-agent>
  5430. <user-agent>
  5431. <ID>id_a_f_110506_1</ID>
  5432. <String>free-downloads.net download-link validator /0.1</String>
  5433. <Description>Free Downloads shareware directory link checking</Description>
  5434. <Type>C</Type>
  5435. <Comment></Comment>
  5436. <Link1>http://www.free-downloads.net/</Link1>
  5437. <Link2></Link2>
  5438. </user-agent>
  5439. <user-agent>
  5440. <ID>id_a_f_375</ID>
  5441. <String>FreeFind.com-SiteSearchEngine/1.0 (http://freefind.com; spiderinfo@freefind.com)</String>
  5442. <Description>FreeFind.com robot</Description>
  5443. <Type>R</Type>
  5444. <Comment></Comment>
  5445. <Link1>http://freefind.com</Link1>
  5446. <Link2></Link2>
  5447. </user-agent>
  5448. <user-agent>
  5449. <ID>id_a_f_221008_2</ID>
  5450. <String>Frelicbot/1.0 +http://www.frelic.com/</String>
  5451. <Description>Frelics backlink checking bot (beta)</Description>
  5452. <Type>C</Type>
  5453. <Comment></Comment>
  5454. <Link1>http://www.frelic.com/</Link1>
  5455. <Link2></Link2>
  5456. </user-agent>
  5457. <user-agent>
  5458. <ID>id_a_f_376</ID>
  5459. <String>FreshDownload/x.xx</String>
  5460. <Description>Fresh Download download manager</Description>
  5461. <Type>D</Type>
  5462. <Comment></Comment>
  5463. <Link1>http://www.freshdevices.com</Link1>
  5464. <Link2></Link2>
  5465. </user-agent>
  5466. <user-agent>
  5467. <ID>id_a_f_230306_2</ID>
  5468. <String>FreshNotes crawler&lt; report problems to crawler-at-freshnotes-dot-com</String>
  5469. <Description>FreshNotes - music related artist search (72.3.225.xx)</Description>
  5470. <Type>R</Type>
  5471. <Comment></Comment>
  5472. <Link1>http://freshnotes.com/fn/</Link1>
  5473. <Link2></Link2>
  5474. </user-agent>
  5475. <user-agent>
  5476. <ID>id_a_f_377</ID>
  5477. <String>FSurf15a 01</String>
  5478. <Description>Some site scanning tool via diff. IPs</Description>
  5479. <Type>S</Type>
  5480. <Comment>s. also DSurf -  PBrowse ...</Comment>
  5481. <Link1></Link1>
  5482. <Link2></Link2>
  5483. </user-agent>
  5484. <user-agent>
  5485. <ID>id_a_f_070209_5</ID>
  5486. <String>FTB-Bot http://www.findthebest.co.uk/</String>
  5487. <Description>Find the Best search robot</Description>
  5488. <Type>R</Type>
  5489. <Comment>83.105.71.16x</Comment>
  5490. <Link1>http://www.findthebest.co.uk/</Link1>
  5491. <Link2></Link2>
  5492. </user-agent>
  5493. <user-agent>
  5494. <ID>id_a_f_378</ID>
  5495. <String>Full Web Bot 0416B</String>
  5496. <Description>Some site scanning tool from diff. IPs i.e.: - 66.28.240.xx (cogentco.com) - 68.5.174.xx (cox.net)</Description>
  5497. <Type>S</Type>
  5498. <Comment></Comment>
  5499. <Link1></Link1>
  5500. <Link2></Link2>
  5501. </user-agent>
  5502. <user-agent>
  5503. <ID>id_a_f_379</ID>
  5504. <String>Full Web Bot 0516B</String>
  5505. <Description>Some site scanning tool i.e. from - 68.154.96.xx (bellsouth.net)</Description>
  5506. <Type>S</Type>
  5507. <Comment>appears also as MFC Foundation Class Library &amp; Demo Bot Z 16b - 66.118.1xx.xxx (sagonet.com) - s. also Educate Search VxB - Industry Program 1.0.5</Comment>
  5508. <Link1></Link1>
  5509. <Link2></Link2>
  5510. </user-agent>
  5511. <user-agent>
  5512. <ID>id_a_f_380</ID>
  5513. <String>Full Web Bot 2816B</String>
  5514. <Description>Some site scanning tool from 66.255.6.xxx (uslec.com)</Description>
  5515. <Type>S</Type>
  5516. <Comment></Comment>
  5517. <Link1></Link1>
  5518. <Link2></Link2>
  5519. </user-agent>
  5520. <user-agent>
  5521. <ID>id_a_f_190807_1</ID>
  5522. <String>FuseBulb.Com</String>
  5523. <Description>FuseBulb search</Description>
  5524. <Type>R</Type>
  5525. <Comment>208.109.126.1xx</Comment>
  5526. <Link1>http://www.fusebulb.com/</Link1>
  5527. <Link2></Link2>
  5528. </user-agent>
  5529. <user-agent>
  5530. <ID>id_a_f_381</ID>
  5531. <String>FyberSpider (+http://www.fybersearch.com/fyberspider.php)</String>
  5532. <Description>FyberSearch FyberSpider robot</Description>
  5533. <Type>R</Type>
  5534. <Comment></Comment>
  5535. <Link1>http://www.fybersearch.com</Link1>
  5536. <Link2></Link2>
  5537. </user-agent>
  5538. <user-agent>
  5539. <ID>id_g_m_382</ID>
  5540. <String>Gagglebot</String>
  5541. <Description>Some user from bbnplanet.net (4.63.218.2xx) using an Innerprise robot tool</Description>
  5542. <Type>R C ?</Type>
  5543. <Comment></Comment>
  5544. <Link1>http://www.innerprise.net</Link1>
  5545. <Link2></Link2>
  5546. </user-agent>
  5547. <user-agent>
  5548. <ID>id_g_m_383</ID>
  5549. <String>GAIS Robot/1.0B2</String>
  5550. <Description>Seed Search robot</Description>
  5551. <Type>R</Type>
  5552. <Comment></Comment>
  5553. <Link1>http://www.seed.net.tw</Link1>
  5554. <Link2></Link2>
  5555. </user-agent>
  5556. <user-agent>
  5557. <ID>id_g_m_384</ID>
  5558. <String>Gaisbot/3.0 (indexer@gais.cs.ccu.edu.tw; http://gais.cs.ccu.edu.tw/robot.php)</String>
  5559. <Description>Gaislab Taiwan robot</Description>
  5560. <Type>R</Type>
  5561. <Comment>140.123.100.x</Comment>
  5562. <Link1>http://gais.cs.ccu.edu.tw</Link1>
  5563. <Link2></Link2>
  5564. </user-agent>
  5565. <user-agent>
  5566. <ID>id_g_m_160706_1</ID>
  5567. <String>Gaisbot/3.0+(robot06@gais.cs.ccu.edu.tw;+http://gais.cs.ccu.edu.tw/robot.php)</String>
  5568. <Description>Gaislab Taiwan robot</Description>
  5569. <Type>R</Type>
  5570. <Comment>140.123.100.x</Comment>
  5571. <Link1>http://gais.cs.ccu.edu.tw</Link1>
  5572. <Link2></Link2>
  5573. </user-agent>
  5574. <user-agent>
  5575. <ID>id_g_m_385</ID>
  5576. <String>GalaxyBot/1.0 (http://www.galaxy.com/galaxybot.html)</String>
  5577. <Description>Galaxy robot (63.121.41.xxx)</Description>
  5578. <Type>R</Type>
  5579. <Comment> s. also Mozilla/4.0 (compatible; MSIE 5.0; www.galaxy.com....)</Comment>
  5580. <Link1>http://www.galaxy.com</Link1>
  5581. <Link2></Link2>
  5582. </user-agent>
  5583. <user-agent>
  5584. <ID>id_g_m_130407_2</ID>
  5585. <String>Gallent Search Spider v1.4 Robot 2 (http://robot.GallentSearch.com)</String>
  5586. <Description>Gallent Search directory (UK)</Description>
  5587. <Type>R</Type>
  5588. <Comment>88.208.223.xx</Comment>
  5589. <Link1>http://www.gallent.co.uk/</Link1>
  5590. <Link2>http://robot.gallentsearch.com/</Link2>
  5591. </user-agent>
  5592. <user-agent>
  5593. <ID>id_g_m_010107_1</ID>
  5594. <String>gamekitbot/1.0 (+http://www.uchoose.de/crawler/gamekitbot/)</String>
  5595. <Description>Gamekit game search engine - Germany</Description>
  5596. <Type>R</Type>
  5597. <Comment>80.65.45.xx</Comment>
  5598. <Link1>http://www.gamekit.de/</Link1>
  5599. <Link2></Link2>
  5600. </user-agent>
  5601. <user-agent>
  5602. <ID>id_g_m_386</ID>
  5603. <String>Gamespy_Arcade</String>
  5604. <Description>GameSpyHTTP/1.0</Description>
  5605. <Type>D</Type>
  5606. <Comment>GameSpy Arcade download manager (FilePlanet)</Comment>
  5607. <Link1>http://www.gamespyarcade.com/features/</Link1>
  5608. <Link2></Link2>
  5609. </user-agent>
  5610. <user-agent>
  5611. <ID>id_g_m_387</ID>
  5612. <String>GammaSpider/1.0</String>
  5613. <Description>GammaWare GammaSpider</Description>
  5614. <Type>R</Type>
  5615. <Comment></Comment>
  5616. <Link1>http://www.gammasite.com</Link1>
  5617. <Link2></Link2>
  5618. </user-agent>
  5619. <user-agent>
  5620. <ID>id_g_m_388</ID>
  5621. <String>gazz/x.x (gazz@nttrd.com)</String>
  5622. <Description>nttrd.com / Infobee.ne.jp robot</Description>
  5623. <Type>R</Type>
  5624. <Comment></Comment>
  5625. <Link1></Link1>
  5626. <Link2></Link2>
  5627. </user-agent>
  5628. <user-agent>
  5629. <ID>id_g_m_389</ID>
  5630. <String>geckobot</String>
  5631. <Description>Geckobot user robot</Description>
  5632. <Type></Type>
  5633. <Comment>no active website</Comment>
  5634. <Link1>http://www.geckobot.com/</Link1>
  5635. <Link2></Link2>
  5636. </user-agent>
  5637. <user-agent>
  5638. <ID>id_g_m_280406_1</ID>
  5639. <String>Generic Mobile Phone (compatible; Googlebot-Mobile/2.1; +http://www.google.com/bot.html)</String>
  5640. <Description>Google Mobile Search crawler</Description>
  5641. <Type>R P</Type>
  5642. <Comment>66.249.72.1xx</Comment>
  5643. <Link1>http://www.google.com/mobile/formats.html</Link1>
  5644. <Link2></Link2>
  5645. </user-agent>
  5646. <user-agent>
  5647. <ID>id_g_m_390</ID>
  5648. <String>generic_crawler/01.0217/</String>
  5649. <Description>Unknown robot from Carnegie Mellon University (128.2.211.xxx)</Description>
  5650. <Type>R</Type>
  5651. <Comment></Comment>
  5652. <Link1>http://www.cmu.edu</Link1>
  5653. <Link2></Link2>
  5654. </user-agent>
  5655. <user-agent>
  5656. <ID>id_g_m_100109_2</ID>
  5657. <String>GenesisBrowser (HTTP 1.1; 0.9; XP SP2; .NET CLR 2.0.50727)</String>
  5658. <Description>Lunascape Genesis browser</Description>
  5659. <Type>B</Type>
  5660. <Comment></Comment>
  5661. <Link1>http://www.lunascape.tv/</Link1>
  5662. <Link2></Link2>
  5663. </user-agent>
  5664. <user-agent>
  5665. <ID>id_g_m_231205_1</ID>
  5666. <String>genieBot (http://64.5.245.11/faq/faq.html)</String>
  5667. <Description>GenieKnows.com search</Description>
  5668. <Type>R</Type>
  5669. <Comment> s. also: - larbin_2.6.3 (wgao@genieknows.com)</Comment>
  5670. <Link1>http://www.genieknows.com/</Link1>
  5671. <Link2></Link2>
  5672. </user-agent>
  5673. <user-agent>
  5674. <ID>id_g_m_391</ID>
  5675. <String>geniebot wgao@genieknows.com</String>
  5676. <Description>GenieKnows.com search</Description>
  5677. <Type>R</Type>
  5678. <Comment> s. also: - larbin_2.6.3 (wgao@genieknows.com)</Comment>
  5679. <Link1>http://www.genieknows.com/</Link1>
  5680. <Link2></Link2>
  5681. </user-agent>
  5682. <user-agent>
  5683. <ID>id_g_m_050606_3</ID>
  5684. <String>GeoBot/1.0</String>
  5685. <Description>Unknown robot from wavepath.com (65.254.33.1xx)</Description>
  5686. <Type></Type>
  5687. <Comment>no active website</Comment>
  5688. <Link1></Link1>
  5689. <Link2></Link2>
  5690. </user-agent>
  5691. <user-agent>
  5692. <ID>id_g_m_392</ID>
  5693. <String>GeonaBot 1.x; http://www.geona.com/</String>
  5694. <Description>Geona Search robot / link checking</Description>
  5695. <Type>R</Type>
  5696. <Comment></Comment>
  5697. <Link1>http://www.geona.com</Link1>
  5698. <Link2></Link2>
  5699. </user-agent>
  5700. <user-agent>
  5701. <ID>id_g_m_160206_3</ID>
  5702. <String>geourl/2.0b2</String>
  5703. <Description>GeoURL ICBM Address Server - a location-to-URL reverse directory</Description>
  5704. <Type>C</Type>
  5705. <Comment></Comment>
  5706. <Link1>http://geourl.org/</Link1>
  5707. <Link2></Link2>
  5708. </user-agent>
  5709. <user-agent>
  5710. <ID>id_g_m_160206_2</ID>
  5711. <String>GeoURLBot 1.0 (http://geourl.org)</String>
  5712. <Description>GeoURL ICBM Address Server - a location-to-URL reverse directory</Description>
  5713. <Type>C</Type>
  5714. <Comment></Comment>
  5715. <Link1>http://geourl.org/</Link1>
  5716. <Link2></Link2>
  5717. </user-agent>
  5718. <user-agent>
  5719. <ID>id_g_m_393</ID>
  5720. <String>GetBot</String>
  5721. <Description>Getbot web downloading tool / site grabber</Description>
  5722. <Type>D</Type>
  5723. <Comment></Comment>
  5724. <Link1>http://www.getbot.com</Link1>
  5725. <Link2></Link2>
  5726. </user-agent>
  5727. <user-agent>
  5728. <ID>id_g_m_394</ID>
  5729. <String>GetRight/3.x.x</String>
  5730. <Description>GetRight download manager</Description>
  5731. <Type>D</Type>
  5732. <Comment></Comment>
  5733. <Link1>http://www.getright.com</Link1>
  5734. <Link2></Link2>
  5735. </user-agent>
  5736. <user-agent>
  5737. <ID>id_g_m_395</ID>
  5738. <String>GetRight/4.5xx</String>
  5739. <Description>GetRight download manager</Description>
  5740. <Type>D</Type>
  5741. <Comment></Comment>
  5742. <Link1>http://www.getright.com</Link1>
  5743. <Link2></Link2>
  5744. </user-agent>
  5745. <user-agent>
  5746. <ID>id_g_m_396</ID>
  5747. <String>GetRight/4.x</String>
  5748. <Description>GetRight download manager</Description>
  5749. <Type>D</Type>
  5750. <Comment></Comment>
  5751. <Link1>http://www.getright.com</Link1>
  5752. <Link2></Link2>
  5753. </user-agent>
  5754. <user-agent>
  5755. <ID>id_g_m_397</ID>
  5756. <String>GetRight/4.x[a-e]</String>
  5757. <Description>GetRight download manager</Description>
  5758. <Type>D</Type>
  5759. <Comment></Comment>
  5760. <Link1>http://www.getright.com</Link1>
  5761. <Link2></Link2>
  5762. </user-agent>
  5763. <user-agent>
  5764. <ID>id_g_m_260807_1</ID>
  5765. <String>GetRight/6.1 (Pro)</String>
  5766. <Description>GetRight download manager</Description>
  5767. <Type>D</Type>
  5768. <Comment></Comment>
  5769. <Link1>http://www.getright.com</Link1>
  5770. <Link2></Link2>
  5771. </user-agent>
  5772. <user-agent>
  5773. <ID>id_g_m_398</ID>
  5774. <String>GetRightPro/6.0beta2</String>
  5775. <Description>GetRight download manager</Description>
  5776. <Type>D</Type>
  5777. <Comment></Comment>
  5778. <Link1>http://www.getright.com</Link1>
  5779. <Link2></Link2>
  5780. </user-agent>
  5781. <user-agent>
  5782. <ID>id_g_m_170706_3</ID>
  5783. <String>GetWeb/0.1 libwww-perl/5.16</String>
  5784. <Description>GetWeb - web page to email service</Description>
  5785. <Type>D</Type>
  5786. <Comment>216.204.133.xxx</Comment>
  5787. <Link1>http://www.healthnet.org/getweb.php</Link1>
  5788. <Link2></Link2>
  5789. </user-agent>
  5790. <user-agent>
  5791. <ID>id_g_m_399</ID>
  5792. <String>GhostRouteHunter/20021130 (https://www.sixxs.net/tools/grh/; info@sixxs.net)</String>
  5793. <Description>Sixxs Ghost Route Hunter</Description>
  5794. <Type>C</Type>
  5795. <Comment></Comment>
  5796. <Link1>http://www.sixxs.net/tools/grh/</Link1>
  5797. <Link2></Link2>
  5798. </user-agent>
  5799. <user-agent>
  5800. <ID>id_g_m_400</ID>
  5801. <String>gigabaz/3.1x (baz@gigabaz.com; http://gigabaz.com/gigabaz/)</String>
  5802. <Description>GigaBaz Brainbot (Germany) robot</Description>
  5803. <Type>R</Type>
  5804. <Comment> s. also - MicroBaz</Comment>
  5805. <Link1>http://gigabaz.com</Link1>
  5806. <Link2></Link2>
  5807. </user-agent>
  5808. <user-agent>
  5809. <ID>id_g_m_401</ID>
  5810. <String>Gigabot/2.0 (gigablast.com)</String>
  5811. <Description>Gigablast robot (64.62.168.xx)</Description>
  5812. <Type>R</Type>
  5813. <Comment></Comment>
  5814. <Link1>http://www.gigablast.com</Link1>
  5815. <Link2></Link2>
  5816. </user-agent>
  5817. <user-agent>
  5818. <ID>id_g_m_140106_1</ID>
  5819. <String>Gigabot/2.0/gigablast.com/spider.html</String>
  5820. <Description>Gigablast robot</Description>
  5821. <Type>R</Type>
  5822. <Comment>comes from 64.62.168.xx AND 66.154.102.xx</Comment>
  5823. <Link1>http://www.gigablast.com</Link1>
  5824. <Link2></Link2>
  5825. </user-agent>
  5826. <user-agent>
  5827. <ID>id_g_m_170506_1</ID>
  5828. <String>Gigabot/2.0; http://www.gigablast.com/spider.html</String>
  5829. <Description>Gigablast robot</Description>
  5830. <Type>R</Type>
  5831. <Comment>comes from 64.62.168.xx AND 66.154.102.xx</Comment>
  5832. <Link1>http://www.gigablast.com</Link1>
  5833. <Link2></Link2>
  5834. </user-agent>
  5835. <user-agent>
  5836. <ID>id_g_m_190507_1</ID>
  5837. <String>Gigabot/2.0att</String>
  5838. <Description>Gigablast robot</Description>
  5839. <Type>R</Type>
  5840. <Comment>66.231.188.1xx</Comment>
  5841. <Link1>http://www.gigablast.com</Link1>
  5842. <Link2></Link2>
  5843. </user-agent>
  5844. <user-agent>
  5845. <ID>id_g_m_230508_1</ID>
  5846. <String>Gigabot/3.0 (http://www.gigablast.com/spider.html)</String>
  5847. <Description>Gigablast robot</Description>
  5848. <Type>R</Type>
  5849. <Comment>66.231.18x.[x]xx</Comment>
  5850. <Link1>http://www.gigablast.com</Link1>
  5851. <Link2></Link2>
  5852. </user-agent>
  5853. <user-agent>
  5854. <ID>id_g_m_402</ID>
  5855. <String>Gigabot/x.0</String>
  5856. <Description>Gigablast robot (64.62.168.xx)</Description>
  5857. <Type>R</Type>
  5858. <Comment></Comment>
  5859. <Link1>http://www.gigablast.com</Link1>
  5860. <Link2></Link2>
  5861. </user-agent>
  5862. <user-agent>
  5863. <ID>id_g_m_403</ID>
  5864. <String>GigabotSiteSearch/2.0 (sitesearch.gigablast.com)</String>
  5865. <Description>Gigablast robot (64.62.168.xx)</Description>
  5866. <Type>R</Type>
  5867. <Comment></Comment>
  5868. <Link1>http://www.gigablast.com</Link1>
  5869. <Link2></Link2>
  5870. </user-agent>
  5871. <user-agent>
  5872. <ID>id_g_m_404</ID>
  5873. <String>GNODSPIDER (www.gnod.net)</String>
  5874. <Description>www.gnod.net spider</Description>
  5875. <Type>R</Type>
  5876. <Comment></Comment>
  5877. <Link1>http://www.gnod.net</Link1>
  5878. <Link2></Link2>
  5879. </user-agent>
  5880. <user-agent>
  5881. <ID>id_g_m_406</ID>
  5882. <String>Go!Zilla 3.x (www.gozilla.com)</String>
  5883. <Description>Go!Zilla download manager</Description>
  5884. <Type>D</Type>
  5885. <Comment></Comment>
  5886. <Link1>http://www.gozilla.com</Link1>
  5887. <Link2></Link2>
  5888. </user-agent>
  5889. <user-agent>
  5890. <ID>id_g_m_407</ID>
  5891. <String>Go!Zilla/4.x.x.xx</String>
  5892. <Description>Go!Zilla download manager</Description>
  5893. <Type>D</Type>
  5894. <Comment></Comment>
  5895. <Link1>http://www.gozilla.com</Link1>
  5896. <Link2></Link2>
  5897. </user-agent>
  5898. <user-agent>
  5899. <ID>id_g_m_405</ID>
  5900. <String>Go-Ahead-Got-It/1.1</String>
  5901. <Description>GotIt web accelerator (discontinued)</Description>
  5902. <Type>P D</Type>
  5903. <Comment></Comment>
  5904. <Link1></Link1>
  5905. <Link2></Link2>
  5906. </user-agent>
  5907. <user-agent>
  5908. <ID>id_g_m_408</ID>
  5909. <String>Goblin/0.9 (http://www.goguides.org/)</String>
  5910. <Description>GoGuides.Org (195.226.137.xx) robot</Description>
  5911. <Type>R</Type>
  5912. <Comment></Comment>
  5913. <Link1>http://www.goguides.org/goblin-info.html</Link1>
  5914. <Link2></Link2>
  5915. </user-agent>
  5916. <user-agent>
  5917. <ID>id_g_m_409</ID>
  5918. <String>Goblin/0.9.x (http://www.goguides.org/goblin-info.html)</String>
  5919. <Description>GoGuides.Org (195.226.137.xx) robot</Description>
  5920. <Type>R</Type>
  5921. <Comment></Comment>
  5922. <Link1>http://www.goguides.org/goblin-info.html</Link1>
  5923. <Link2></Link2>
  5924. </user-agent>
  5925. <user-agent>
  5926. <ID>id_g_m_410</ID>
  5927. <String>GoForIt.com</String>
  5928. <Description>GoForIt Search robot</Description>
  5929. <Type>R</Type>
  5930. <Comment>208.109.236.xx</Comment>
  5931. <Link1>http://www.goforit.com</Link1>
  5932. <Link2></Link2>
  5933. </user-agent>
  5934. <user-agent>
  5935. <ID>id_g_m_411</ID>
  5936. <String>GOFORITBOT ( http://www.goforit.com/about/ )</String>
  5937. <Description>GoForIt Search robot</Description>
  5938. <Type>R</Type>
  5939. <Comment>208.109.236.xx</Comment>
  5940. <Link1>http://www.goforit.com</Link1>
  5941. <Link2></Link2>
  5942. </user-agent>
  5943. <user-agent>
  5944. <ID>id_g_m_020306_1</ID>
  5945. <String>GoGuides.Org Link Check</String>
  5946. <Description>GoGuides.org directory &amp; search link checking</Description>
  5947. <Type>C</Type>
  5948. <Comment></Comment>
  5949. <Link1>http://www.goguides.org/</Link1>
  5950. <Link2></Link2>
  5951. </user-agent>
  5952. <user-agent>
  5953. <ID>id_g_m_230207_2</ID>
  5954. <String>GoldenFeed Spider 1.0 (http://www.goldenfeed.com)</String>
  5955. <Description>GoldenFeed.com - RSS search engine</Description>
  5956. <Type>C</Type>
  5957. <Comment>74.52.41.1xx</Comment>
  5958. <Link1>http://www.goldenfeed.com/</Link1>
  5959. <Link2></Link2>
  5960. </user-agent>
  5961. <user-agent>
  5962. <ID>id_g_m_412</ID>
  5963. <String>Goldfire Server</String>
  5964. <Description>Invention Machines Goldfire Server</Description>
  5965. <Type>P</Type>
  5966. <Comment></Comment>
  5967. <Link1>http://www.invention-machine.com/custsupport/GFR_install.cfm</Link1>
  5968. <Link2></Link2>
  5969. </user-agent>
  5970. <user-agent>
  5971. <ID>id_g_m_041006_1</ID>
  5972. <String>gonzo1[P] +http://www.suchen.de/popups/faq.jsp</String>
  5973. <Description>suchen.de German local search robot</Description>
  5974. <Type>R</Type>
  5975. <Comment>212.34.185.xx</Comment>
  5976. <Link1>http://www.suchen.de/</Link1>
  5977. <Link2></Link2>
  5978. </user-agent>
  5979. <user-agent>
  5980. <ID>id_g_m_130108_2</ID>
  5981. <String>gonzo2[P] +http://www.suchen.de/faq.html</String>
  5982. <Description>suchen.de German local search robot</Description>
  5983. <Type>R</Type>
  5984. <Comment>212.34.185.xx</Comment>
  5985. <Link1>http://www.suchen.de/</Link1>
  5986. <Link2></Link2>
  5987. </user-agent>
  5988. <user-agent>
  5989. <ID>id_g_m_413</ID>
  5990. <String>Goofer/0.2</String>
  5991. <Description>Some private robot (Wanadoo.fr client)</Description>
  5992. <Type>R</Type>
  5993. <Comment></Comment>
  5994. <Link1></Link1>
  5995. <Link2></Link2>
  5996. </user-agent>
  5997. <user-agent>
  5998. <ID>id_g_m_300606_1</ID>
  5999. <String>Google Talk</String>
  6000. <Description>Google instant messenger</Description>
  6001. <Type>B</Type>
  6002. <Comment></Comment>
  6003. <Link1>http://www.google.com/talk/</Link1>
  6004. <Link2></Link2>
  6005. </user-agent>
  6006. <user-agent>
  6007. <ID>id_g_m_414</ID>
  6008. <String>googlebot (larbin2.6.0@unspecified.mail)</String>
  6009. <Description>Packard Bell Net user robot (*not* Google)</Description>
  6010. <Type></Type>
  6011. <Comment></Comment>
  6012. <Link1></Link1>
  6013. <Link2></Link2>
  6014. </user-agent>
  6015. <user-agent>
  6016. <ID>id_g_m_050106_1</ID>
  6017. <String>Googlebot-Image/1.0</String>
  6018. <Description>Google image crawler (66.249.72.xxx)</Description>
  6019. <Type>R</Type>
  6020. <Comment></Comment>
  6021. <Link1>http://www.google.com</Link1>
  6022. <Link2></Link2>
  6023. </user-agent>
  6024. <user-agent>
  6025. <ID>id_g_m_415</ID>
  6026. <String>Googlebot-Image/1.0 ( http://www.googlebot.com/bot.html)</String>
  6027. <Description>Google image crawler (66.249.72.xxx)</Description>
  6028. <Type>R</Type>
  6029. <Comment></Comment>
  6030. <Link1>http://www.google.com</Link1>
  6031. <Link2></Link2>
  6032. </user-agent>
  6033. <user-agent>
  6034. <ID>id_g_m_416</ID>
  6035. <String>Googlebot/2.1 ( http://www.google.com/bot.html)</String>
  6036. <Description>Google robot 66.249.64.XXX</Description>
  6037. <Type>R</Type>
  6038. <Comment> s. also: - Mozilla/4.0 (MobilePhone SCP ... - Mozilla/5.0 (compatible; Googlebot/2.1...</Comment>
  6039. <Link1>http://www.google.com</Link1>
  6040. <Link2></Link2>
  6041. </user-agent>
  6042. <user-agent>
  6043. <ID>id_g_m_417</ID>
  6044. <String>Googlebot/2.1 ( http://www.googlebot.com/bot.html)</String>
  6045. <Description>Google robot 66.249.64.XXX</Description>
  6046. <Type>R</Type>
  6047. <Comment></Comment>
  6048. <Link1>http://www.google.com</Link1>
  6049. <Link2></Link2>
  6050. </user-agent>
  6051. <user-agent>
  6052. <ID>id_g_m_418</ID>
  6053. <String>Googlebot/Test ( http://www.googlebot.com/bot.html)</String>
  6054. <Description>Google robot 66.249.64.XXX</Description>
  6055. <Type>R</Type>
  6056. <Comment></Comment>
  6057. <Link1>http://www.google.com</Link1>
  6058. <Link2></Link2>
  6059. </user-agent>
  6060. <user-agent>
  6061. <ID>id_g_m_280209_2</ID>
  6062. <String>Gordon's Spider/Nutch-0.9 (http://www.sharethis.com; gordon@sharethis.com)</String>
  6063. <Description>ShareThis social networking service via Amazon Web Services</Description>
  6064. <Type>C</Type>
  6065. <Comment>174.129.242.x</Comment>
  6066. <Link1>http://sharethis.com/</Link1>
  6067. <Link2>http://www.amazonaws.com/</Link2>
  6068. </user-agent>
  6069. <user-agent>
  6070. <ID>id_g_m_419</ID>
  6071. <String>GrapeFX/0.3 libwww/5.4.0</String>
  6072. <Description>Grapeshot web search system API</Description>
  6073. <Type>R</Type>
  6074. <Comment></Comment>
  6075. <Link1>http://www.grapeshot.co.uk/html/Index.html</Link1>
  6076. <Link2></Link2>
  6077. </user-agent>
  6078. <user-agent>
  6079. <ID>id_g_m_300907_4</ID>
  6080. <String>great-plains-web-spider/flatlandbot (Flatland Industries Web Spider; http://www.flatlandindustries.com/flatlandbot.php; jason@flatlandindustries.com)</String>
  6081. <Description>Flatland Industries vertical search solution</Description>
  6082. <Type>R</Type>
  6083. <Comment>74.62.161.xx</Comment>
  6084. <Link1>http://www.flatlandindustries.com/</Link1>
  6085. <Link2>http://www.flatlandindustries.com/flatlandbot.php</Link2>
  6086. </user-agent>
  6087. <user-agent>
  6088. <ID>id_g_m_250707_2</ID>
  6089. <String>GreatNews/1.0</String>
  6090. <Description>GreatNews 1.0 Beta RSS reader</Description>
  6091. <Type>B</Type>
  6092. <Comment></Comment>
  6093. <Link1>http://www.curiostudio.com/</Link1>
  6094. <Link2></Link2>
  6095. </user-agent>
  6096. <user-agent>
  6097. <ID>id_g_m_170207_2</ID>
  6098. <String>GreenBrowser</String>
  6099. <Description>GreenBrowser - IE based browser (China)</Description>
  6100. <Type>B</Type>
  6101. <Comment></Comment>
  6102. <Link1>http://www.morequick.com/indexen.htm</Link1>
  6103. <Link2></Link2>
  6104. </user-agent>
  6105. <user-agent>
  6106. <ID>id_g_m_100307_2</ID>
  6107. <String>gridwell (http://search.gridwell.com)</String>
  6108. <Description>search gridwell favicon display</Description>
  6109. <Type>D</Type>
  6110. <Comment>212.227.127.xx</Comment>
  6111. <Link1>http://search.gridwell.com/</Link1>
  6112. <Link2></Link2>
  6113. </user-agent>
  6114. <user-agent>
  6115. <ID>id_g_m_420</ID>
  6116. <String>GrigorBot 0.8 (http://www.grigor.biz/bot.html)</String>
  6117. <Description>Grigor Search bot</Description>
  6118. <Type>R</Type>
  6119. <Comment></Comment>
  6120. <Link1>http://www.grigor.biz</Link1>
  6121. <Link2></Link2>
  6122. </user-agent>
  6123. <user-agent>
  6124. <ID>id_g_m_161206_1</ID>
  6125. <String>Gromit/1.0</String>
  6126. <Description>Australasian Legal Information Institute (AustLII) robot</Description>
  6127. <Type>R</Type>
  6128. <Comment></Comment>
  6129. <Link1>http://www.austlii.edu.au/</Link1>
  6130. <Link2>http://www2.austlii.edu.au/~dan/gromit/</Link2>
  6131. </user-agent>
  6132. <user-agent>
  6133. <ID>id_g_m_421</ID>
  6134. <String>grub crawler(http://www.grub.org)</String>
  6135. <Description>Grub open source crawler</Description>
  6136. <Type>R</Type>
  6137. <Comment></Comment>
  6138. <Link1>http://www.grub.org</Link1>
  6139. <Link2></Link2>
  6140. </user-agent>
  6141. <user-agent>
  6142. <ID>id_g_m_422</ID>
  6143. <String>grub-client</String>
  6144. <Description>Grub open source crawler</Description>
  6145. <Type>R</Type>
  6146. <Comment></Comment>
  6147. <Link1>http://www.grub.org</Link1>
  6148. <Link2></Link2>
  6149. </user-agent>
  6150. <user-agent>
  6151. <ID>id_g_m_423</ID>
  6152. <String>gsa-crawler (Enterprise; GID-01422; jplastiras@google.com)</String>
  6153. <Description>Google Search Appliance robot (216.239.xx.xx)</Description>
  6154. <Type>R</Type>
  6155. <Comment></Comment>
  6156. <Link1>http://www.google.com/enterprise/gsa/</Link1>
  6157. <Link2></Link2>
  6158. </user-agent>
  6159. <user-agent>
  6160. <ID>id_g_m_424</ID>
  6161. <String>gsa-crawler (Enterprise; GID-01742;gsatesting@rediffmail.com)</String>
  6162. <Description>Google Search Appliance robot (216.239.xx.xx)</Description>
  6163. <Type>R</Type>
  6164. <Comment></Comment>
  6165. <Link1>http://www.google.com/enterprise/gsa/</Link1>
  6166. <Link2></Link2>
  6167. </user-agent>
  6168. <user-agent>
  6169. <ID>id_g_m_060506_1</ID>
  6170. <String>gsa-crawler (Enterprise; GIX-02057; dm@enhesa.com)</String>
  6171. <Description>Google Enterprise Search Appliance used by Enhesa (212.35.100.1xx)</Description>
  6172. <Type>R</Type>
  6173. <Comment></Comment>
  6174. <Link1>http://www.enhesa.com/enhesa/en/default.asp</Link1>
  6175. <Link2>http://www.google.com/enterprise/gsa/</Link2>
  6176. </user-agent>
  6177. <user-agent>
  6178. <ID>id_g_m_311205_1</ID>
  6179. <String>gsa-crawler (Enterprise; GIX-03519; cknuetter@stubhub.com)</String>
  6180. <Description>Google Enterprise Search Appliance used by IBM (129.41.20.1xx)</Description>
  6181. <Type>R</Type>
  6182. <Comment></Comment>
  6183. <Link1>http://www.google.com/enterprise/gsa/</Link1>
  6184. <Link2></Link2>
  6185. </user-agent>
  6186. <user-agent>
  6187. <ID>id_g_m_425</ID>
  6188. <String>gsa-crawler (Enterprise; GIX-0xxxx; enterprise-training@google.com)</String>
  6189. <Description>Google Search Appliance robot (216.239.xx.xx)</Description>
  6190. <Type>R</Type>
  6191. <Comment></Comment>
  6192. <Link1>http://www.google.com/enterprise/gsa/</Link1>
  6193. <Link2></Link2>
  6194. </user-agent>
  6195. <user-agent>
  6196. <ID>id_g_m_081006_1</ID>
  6197. <String>GSiteCrawler/v1.xx rev. xxx (http://gsitecrawler.com/)</String>
  6198. <Description>GSiteCrawler - Google sitemap generator for Windows</Description>
  6199. <Type>C</Type>
  6200. <Comment></Comment>
  6201. <Link1>http://gsitecrawler.com/</Link1>
  6202. <Link2></Link2>
  6203. </user-agent>
  6204. <user-agent>
  6205. <ID>id_g_m_260207_1</ID>
  6206. <String>Guestbook Auto Submitter</String>
  6207. <Description>Guestbook spamming tool</Description>
  6208. <Type>S</Type>
  6209. <Comment></Comment>
  6210. <Link1></Link1>
  6211. <Link2></Link2>
  6212. </user-agent>
  6213. <user-agent>
  6214. <ID>id_g_m_426</ID>
  6215. <String>Gulliver/1.3</String>
  6216. <Description>Northernlight robot</Description>
  6217. <Type>R</Type>
  6218. <Comment></Comment>
  6219. <Link1>http://www.northernlight.com</Link1>
  6220. <Link2></Link2>
  6221. </user-agent>
  6222. <user-agent>
  6223. <ID>id_g_m_427</ID>
  6224. <String>Gulper Web Bot 0.2.4 (www.ecsl.cs.sunysb.edu/~maxim/cgi-bin/Link/GulperBot)</String>
  6225. <Description>Yuntis Collaborative Web Resource Categorization and Ranking Project robot</Description>
  6226. <Type>R</Type>
  6227. <Comment></Comment>
  6228. <Link1>http://www.ecsl.cs.sunysb.edu/yuntis/</Link1>
  6229. <Link2></Link2>
  6230. </user-agent>
  6231. <user-agent>
  6232. <ID>id_g_m_140907_1</ID>
  6233. <String>Gungho/0.08004 (http://code.google.com/p/gungho-crawler/wiki/Index)</String>
  6234. <Description>Gungho - Extensible web crawler written in Perl by Google Code</Description>
  6235. <Type>R</Type>
  6236. <Comment></Comment>
  6237. <Link1>http://code.google.com/p/gungho-crawler/wiki/Index</Link1>
  6238. <Link2></Link2>
  6239. </user-agent>
  6240. <user-agent>
  6241. <ID>id_g_m_211106_1</ID>
  6242. <String>GurujiBot/1.0 (+http://www.guruji.com/WebmasterFAQ.html)</String>
  6243. <Description>guruji : the Indian search engine robot</Description>
  6244. <Type>R</Type>
  6245. <Comment>209.128.80.1xx / 72.20.109.xx</Comment>
  6246. <Link1>http://www.guruji.com/</Link1>
  6247. <Link2></Link2>
  6248. </user-agent>
  6249. <user-agent>
  6250. <ID>id_g_m_100508_2</ID>
  6251. <String>GurujiImageBot/1.0 (+http://www.guruji.com/en/WebmasterFAQ.html)</String>
  6252. <Description>guruji : the Indian search engine picture crawler</Description>
  6253. <Type>R</Type>
  6254. <Comment>72.20.109.xx</Comment>
  6255. <Link1>http://www.guruji.com/</Link1>
  6256. <Link2></Link2>
  6257. </user-agent>
  6258. <user-agent>
  6259. <ID>id_g_m_291108_3</ID>
  6260. <String>Haier-T10C/1.0 iPanel/2.0 WAP2.0 (compatible; UP.Browser/6.2.2.4; UPG1; UP/4.0; Embedded)</String>
  6261. <Description>Openwave Mobile Browser on Haier T10C mobile</Description>
  6262. <Type>B</Type>
  6263. <Comment></Comment>
  6264. <Link1>http://www.openwave.com</Link1>
  6265. <Link2></Link2>
  6266. </user-agent>
  6267. <user-agent>
  6268. <ID>id_g_m_171105_5</ID>
  6269. <String>HappyFunBot/1.1</String>
  6270. <Description>Happy Fun Search robot</Description>
  6271. <Type>R</Type>
  6272. <Comment></Comment>
  6273. <Link1>http://www.happyfunsearch.com/bot.html</Link1>
  6274. <Link2></Link2>
  6275. </user-agent>
  6276. <user-agent>
  6277. <ID>id_g_m_428</ID>
  6278. <String>Harvest-NG/1.0.2</String>
  6279. <Description>Harvest-NG web crawler used by search.yahoo.com</Description>
  6280. <Type>R</Type>
  6281. <Comment>see also Exalead NG and NG/1.0</Comment>
  6282. <Link1>http://search.yahoo.com</Link1>
  6283. <Link2></Link2>
  6284. </user-agent>
  6285. <user-agent>
  6286. <ID>id_g_m_429</ID>
  6287. <String>Haste/0.12 (HOME: http://haste.kytoon.com/)</String>
  6288. <Description>Haste - web mapping and monitoring system</Description>
  6289. <Type>R C</Type>
  6290. <Comment>site is closed</Comment>
  6291. <Link1>http://haste.kytoon.com</Link1>
  6292. <Link2></Link2>
  6293. </user-agent>
  6294. <user-agent>
  6295. <ID>id_g_m_430</ID>
  6296. <String>Hatena Antenna/0.4 (http://a.hatena.ne.jp/help#robot)</String>
  6297. <Description>Hatena::Antenna Japan robot</Description>
  6298. <Type>R</Type>
  6299. <Comment>221.186.146.xx</Comment>
  6300. <Link1>http://a.hatena.ne.jp</Link1>
  6301. <Link2></Link2>
  6302. </user-agent>
  6303. <user-agent>
  6304. <ID>id_g_m_110606_2</ID>
  6305. <String>Hatena Mobile Gateway/1.0</String>
  6306. <Description>Hatena Japan proxy for handheld/mobile clients</Description>
  6307. <Type>P</Type>
  6308. <Comment>221.186.146.xx</Comment>
  6309. <Link1>http://www.hatena.ne.jp/</Link1>
  6310. <Link2></Link2>
  6311. </user-agent>
  6312. <user-agent>
  6313. <ID>id_g_m_431</ID>
  6314. <String>Hatena Pagetitle Agent/1.0</String>
  6315. <Description>Hatena Japan robot</Description>
  6316. <Type>R</Type>
  6317. <Comment>221.186.146.xx</Comment>
  6318. <Link1>http://www.hatena.ne.jp</Link1>
  6319. <Link2></Link2>
  6320. </user-agent>
  6321. <user-agent>
  6322. <ID>id_g_m_240207_1</ID>
  6323. <String>Hatena RSS/0.3 (http://r.hatena.ne.jp)</String>
  6324. <Description>Hatena Japan RSS feed robot</Description>
  6325. <Type>R</Type>
  6326. <Comment>221.186.146.xx</Comment>
  6327. <Link1>http://www.hatena.ne.jp</Link1>
  6328. <Link2></Link2>
  6329. </user-agent>
  6330. <user-agent>
  6331. <ID>id_g_m_110606_1</ID>
  6332. <String>HatenaScreenshot/1.0 (checker)</String>
  6333. <Description>Hatena::Diary (Japan) web page screenshot robot</Description>
  6334. <Type>R D</Type>
  6335. <Comment>221.186.146.xx</Comment>
  6336. <Link1>http://www.hatena.ne.jp/</Link1>
  6337. <Link2></Link2>
  6338. </user-agent>
  6339. <user-agent>
  6340. <ID>id_g_m_120108_1</ID>
  6341. <String>hbtronix.spider.2 -- http://hbtronix.de/spider.php</String>
  6342. <Description>hbtronix.spider - Domain name spider (Germany)</Description>
  6343. <Type>R</Type>
  6344. <Comment>89.110.157.*</Comment>
  6345. <Link1>http://hbtronix.de/spider.php</Link1>
  6346. <Link2></Link2>
  6347. </user-agent>
  6348. <user-agent>
  6349. <ID>id_g_m_432</ID>
  6350. <String>HeinrichderMiragoRobot</String>
  6351. <Description>Mirago Germany robot</Description>
  6352. <Type>R</Type>
  6353. <Comment></Comment>
  6354. <Link1>http://www.mirago.de/</Link1>
  6355. <Link2></Link2>
  6356. </user-agent>
  6357. <user-agent>
  6358. <ID>id_g_m_433</ID>
  6359. <String>HeinrichderMiragoRobot (http://www.miragorobot.com/scripts/deinfo.asp)</String>
  6360. <Description>Mirago Germany robot</Description>
  6361. <Type>R</Type>
  6362. <Comment></Comment>
  6363. <Link1>http://www.mirago.de/</Link1>
  6364. <Link2></Link2>
  6365. </user-agent>
  6366. <user-agent>
  6367. <ID>id_g_m_434</ID>
  6368. <String>Helix/1.x ( http://www.sitesearch.ca/helix/)</String>
  6369. <Description>Helix - The SiteSearch (Canada) web crawler</Description>
  6370. <Type>R</Type>
  6371. <Comment></Comment>
  6372. <Link1>http://www.sitesearch.ca</Link1>
  6373. <Link2></Link2>
  6374. </user-agent>
  6375. <user-agent>
  6376. <ID>id_g_m_080206_3</ID>
  6377. <String>HenriLeRobotMirago (http://www.miragorobot.com/scripts/frinfo.asp)</String>
  6378. <Description>Mirago France robot</Description>
  6379. <Type>R</Type>
  6380. <Comment></Comment>
  6381. <Link1>http://www.mirago.fr/</Link1>
  6382. <Link2></Link2>
  6383. </user-agent>
  6384. <user-agent>
  6385. <ID>id_g_m_435</ID>
  6386. <String>HenrytheMiragoRobot</String>
  6387. <Description>Mirago search (UK) robot</Description>
  6388. <Type>R</Type>
  6389. <Comment>217.154.245.2xx</Comment>
  6390. <Link1>http://www.mirago.co.uk</Link1>
  6391. <Link2></Link2>
  6392. </user-agent>
  6393. <user-agent>
  6394. <ID>id_g_m_060806_3</ID>
  6395. <String>HenryTheMiragoRobot (http://www.miragorobot.com/scripts/mrinfo.asp)</String>
  6396. <Description>Mirago search (UK) robot</Description>
  6397. <Type>R</Type>
  6398. <Comment>217.154.245.2xx</Comment>
  6399. <Link1>http://www.mirago.co.uk</Link1>
  6400. <Link2></Link2>
  6401. </user-agent>
  6402. <user-agent>
  6403. <ID>id_g_m_436</ID>
  6404. <String>hgrepurl/1.0</String>
  6405. <Description>O'Reilly's Perl LWP example client program from Web Client Programming with Perl</Description>
  6406. <Type></Type>
  6407. <Comment></Comment>
  6408. <Link1></Link1>
  6409. <Link2></Link2>
  6410. </user-agent>
  6411. <user-agent>
  6412. <ID>id_g_m_437</ID>
  6413. <String>Hi! I'm CsCrawler my homepage: http://www.kde.cs.uni-kassel.de/lehre/ss2005/googlespam/crawler.html RPT-HTTPClient/0.3-3</String>
  6414. <Description>University of Kassel Germany CsCrawler using the HTTPClient library</Description>
  6415. <Type>R</Type>
  6416. <Comment></Comment>
  6417. <Link1>http://www.kde.cs.uni-kassel.de/lehre/ss2005/googlespam/crawler.html</Link1>
  6418. <Link2>http://www.innovation.ch/java/HTTPClient/</Link2>
  6419. </user-agent>
  6420. <user-agent>
  6421. <ID>id_g_m_438</ID>
  6422. <String>HiDownload</String>
  6423. <Description>HiDownload download manager</Description>
  6424. <Type>D</Type>
  6425. <Comment></Comment>
  6426. <Link1>http://www.streamingstar.com/hidownload.htm</Link1>
  6427. <Link2></Link2>
  6428. </user-agent>
  6429. <user-agent>
  6430. <ID>id_g_m_439</ID>
  6431. <String>Hippias/0.9 Beta</String>
  6432. <Description>Hippias robot</Description>
  6433. <Type>R</Type>
  6434. <Comment>site is offline</Comment>
  6435. <Link1>http://hippias.evansville.edu</Link1>
  6436. <Link2></Link2>
  6437. </user-agent>
  6438. <user-agent>
  6439. <ID>id_g_m_440</ID>
  6440. <String>HitList</String>
  6441. <Description>Pilot Hitlist web analytics solution</Description>
  6442. <Type>R</Type>
  6443. <Comment></Comment>
  6444. <Link1>http://www.pilotsoftware.com/products_solutions/hitlist.html</Link1>
  6445. <Link2></Link2>
  6446. </user-agent>
  6447. <user-agent>
  6448. <ID>id_g_m_441</ID>
  6449. <String>Hitwise Spider v1.0 http://www.hitwise.com</String>
  6450. <Description>Hitwise spider</Description>
  6451. <Type>R</Type>
  6452. <Comment></Comment>
  6453. <Link1>http://www.hitwise.com</Link1>
  6454. <Link2></Link2>
  6455. </user-agent>
  6456. <user-agent>
  6457. <ID>id_g_m_442</ID>
  6458. <String>HLoader</String>
  6459. <Description>diff. IPs / unknown services</Description>
  6460. <Type></Type>
  6461. <Comment> i.e.: - 204.95.207.xxx user agent ? - 66.27.113.xx link checking ?</Comment>
  6462. <Link1></Link1>
  6463. <Link2></Link2>
  6464. </user-agent>
  6465. <user-agent>
  6466. <ID>id_g_m_040907_1</ID>
  6467. <String>holmes/3.11 (http://morfeo.centrum.cz/bot)</String>
  6468. <Description>Morfeo / Centrum Search (Czech Republic) robot from 65.102.46.xxx</Description>
  6469. <Type>R</Type>
  6470. <Comment></Comment>
  6471. <Link1>http://morfeo.centrum.cz/</Link1>
  6472. <Link2></Link2>
  6473. </user-agent>
  6474. <user-agent>
  6475. <ID>id_g_m_220906_2</ID>
  6476. <String>holmes/3.9 (onet.pl)</String>
  6477. <Description>Onet.pl (Poland) search robot</Description>
  6478. <Type>R</Type>
  6479. <Comment>213.180.137.xx</Comment>
  6480. <Link1>http://szukaj.onet.pl/</Link1>
  6481. <Link2></Link2>
  6482. </user-agent>
  6483. <user-agent>
  6484. <ID>id_g_m_181006_1</ID>
  6485. <String>holmes/3.xx (OnetSzukaj/5.0; +http://szukaj.onet.pl)</String>
  6486. <Description>Onet.pl (Poland) search robot</Description>
  6487. <Type>R</Type>
  6488. <Comment>213.180.137.xx</Comment>
  6489. <Link1>http://szukaj.onet.pl/</Link1>
  6490. <Link2></Link2>
  6491. </user-agent>
  6492. <user-agent>
  6493. <ID>id_g_m_443</ID>
  6494. <String>holmes/x.x</String>
  6495. <Description>Morfeo / Centrum Search (Czech Republic) robot from 65.102.46.xxx</Description>
  6496. <Type>R</Type>
  6497. <Comment></Comment>
  6498. <Link1>http://morfeo.centrum.cz/</Link1>
  6499. <Link2></Link2>
  6500. </user-agent>
  6501. <user-agent>
  6502. <ID>id_g_m_021108_2</ID>
  6503. <String>HolmesBot (http://holmes.ge)</String>
  6504. <Description>Holmes search robot (Georgia)</Description>
  6505. <Type>R</Type>
  6506. <Comment>77.92.229.3x</Comment>
  6507. <Link1>http://holmes.ge/</Link1>
  6508. <Link2></Link2>
  6509. </user-agent>
  6510. <user-agent>
  6511. <ID>id_g_m_444</ID>
  6512. <String>HomePageSearch(hpsearch.uni-trier.de)</String>
  6513. <Description>HomePageSearch robot</Description>
  6514. <Type>R</Type>
  6515. <Comment></Comment>
  6516. <Link1>http://hpsearch.uni-trier.de/</Link1>
  6517. <Link2></Link2>
  6518. </user-agent>
  6519. <user-agent>
  6520. <ID>id_g_m_445</ID>
  6521. <String>Homerbot: www.homerweb.com</String>
  6522. <Description>Homerweb search robot</Description>
  6523. <Type>R</Type>
  6524. <Comment></Comment>
  6525. <Link1>http://www.homerweb.com</Link1>
  6526. <Link2></Link2>
  6527. </user-agent>
  6528. <user-agent>
  6529. <ID>id_g_m_220606_1</ID>
  6530. <String>Honda-Search/0.7.2 (Nutch; http://lucene.apache.org/nutch/bot.html; search@honda-search.com)</String>
  6531. <Description>Honda-Search.com - Honda cars related search robot</Description>
  6532. <Type>R</Type>
  6533. <Comment>69.16.227.1xx</Comment>
  6534. <Link1>http://www.honda-search.com/</Link1>
  6535. <Link2></Link2>
  6536. </user-agent>
  6537. <user-agent>
  6538. <ID>id_g_m_090206_1</ID>
  6539. <String>HooWWWer/2.1.3 (debugging run) (+http://cosco.hiit.fi/search/hoowwwer/ | mailto:crawler-info&lt;at>hiit.fi)</String>
  6540. <Description>HooWWWer - Next Generation Information Retrieval robot</Description>
  6541. <Type>R</Type>
  6542. <Comment></Comment>
  6543. <Link1>http://cosco.hiit.fi</Link1>
  6544. <Link2></Link2>
  6545. </user-agent>
  6546. <user-agent>
  6547. <ID>id_g_m_446</ID>
  6548. <String>HooWWWer/2.1.x ( http://cosco.hiit.fi/search/hoowwwer/ | mailto:crawler-info&lt;at>hiit.fi)</String>
  6549. <Description>HooWWWer - Next Generation Information Retrieval robot (128.214.112.xx)</Description>
  6550. <Type>R</Type>
  6551. <Comment></Comment>
  6552. <Link1>http://cosco.hiit.fi/</Link1>
  6553. <Link2></Link2>
  6554. </user-agent>
  6555. <user-agent>
  6556. <ID>id_g_m_447</ID>
  6557. <String>HotJava/1.0.1/JRE1.1.x</String>
  6558. <Description>HotJava browser plus HTML Component 1.1.x</Description>
  6559. <Type>B</Type>
  6560. <Comment></Comment>
  6561. <Link1></Link1>
  6562. <Link2></Link2>
  6563. </user-agent>
  6564. <user-agent>
  6565. <ID>id_g_m_448</ID>
  6566. <String>Hotzonu/x.0</String>
  6567. <Description>Hotzonu - Japanese BBS reader client</Description>
  6568. <Type>B</Type>
  6569. <Comment></Comment>
  6570. <Link1>http://hotzonu.hp.infoseek.co.jp/</Link1>
  6571. <Link2></Link2>
  6572. </user-agent>
  6573. <user-agent>
  6574. <ID>id_g_m_040507_1</ID>
  6575. <String>HPL/Nutch-0.9 -</String>
  6576. <Description>Unknown robot from HP Labs</Description>
  6577. <Type>R</Type>
  6578. <Comment>15.203.249.12x</Comment>
  6579. <Link1>http://hpl.hp.com/</Link1>
  6580. <Link2></Link2>
  6581. </user-agent>
  6582. <user-agent>
  6583. <ID>id_g_m_449</ID>
  6584. <String>htdig/3.1.6 (http://computerorgs.com)</String>
  6585. <Description>COMPUTERorgs.com robot (205.134.190.xxx) using htdig</Description>
  6586. <Type>R</Type>
  6587. <Comment></Comment>
  6588. <Link1>http://www.computerorgs.com/</Link1>
  6589. <Link2>http://www.htdig.org</Link2>
  6590. </user-agent>
  6591. <user-agent>
  6592. <ID>id_g_m_210106_1</ID>
  6593. <String>htdig/3.1.6 (unconfigured@htdig.searchengine.maintainer)</String>
  6594. <Description>htdig used by the Academie de Toulouse</Description>
  6595. <Type>R</Type>
  6596. <Comment>reads robots.txt</Comment>
  6597. <Link1>http://www.ac-toulouse.fr/html/_.php</Link1>
  6598. <Link2>http://www.htdig.org</Link2>
  6599. </user-agent>
  6600. <user-agent>
  6601. <ID>id_g_m_450</ID>
  6602. <String>htdig/3.1.x (root@localhost)</String>
  6603. <Description>htdig search tool</Description>
  6604. <Type>R</Type>
  6605. <Comment></Comment>
  6606. <Link1>http://www.htdig.org</Link1>
  6607. <Link2></Link2>
  6608. </user-agent>
  6609. <user-agent>
  6610. <ID>id_g_m_451</ID>
  6611. <String>Html Link Validator (www.lithopssoft.com)</String>
  6612. <Description>Lithops Software link validation tool</Description>
  6613. <Type>C</Type>
  6614. <Comment></Comment>
  6615. <Link1>http://www.lithopssoft.com</Link1>
  6616. <Link2></Link2>
  6617. </user-agent>
  6618. <user-agent>
  6619. <ID>id_g_m_110506_3</ID>
  6620. <String>HTML2JPG Blackbox&#44; http://www.html2jpg.com</String>
  6621. <Description>HTML2JPG webpage to image converter</Description>
  6622. <Type>D</Type>
  6623. <Comment></Comment>
  6624. <Link1>http://www.html2jpg.com</Link1>
  6625. <Link2></Link2>
  6626. </user-agent>
  6627. <user-agent>
  6628. <ID>id_g_m_452</ID>
  6629. <String>HTML2JPG Enterprise</String>
  6630. <Description>HTML2JPG webpage to image converter</Description>
  6631. <Type>D</Type>
  6632. <Comment></Comment>
  6633. <Link1>http://www.html2jpg.com</Link1>
  6634. <Link2></Link2>
  6635. </user-agent>
  6636. <user-agent>
  6637. <ID>id_g_m_101205_1</ID>
  6638. <String>HTMLParser/1.x</String>
  6639. <Description>HTML Parser Java library to parse HTML</Description>
  6640. <Type>D</Type>
  6641. <Comment></Comment>
  6642. <Link1>http://sourceforge.net/projects/htmlparser</Link1>
  6643. <Link2></Link2>
  6644. </user-agent>
  6645. <user-agent>
  6646. <ID>id_g_m_071006_1</ID>
  6647. <String>HTTP Retriever</String>
  6648. <Description>PHP HTTP client to access Web servers</Description>
  6649. <Type>D</Type>
  6650. <Comment></Comment>
  6651. <Link1>http://code.blitzaffe.com/pages/home/</Link1>
  6652. <Link2></Link2>
  6653. </user-agent>
  6654. <user-agent>
  6655. <ID>id_g_m_240306_1</ID>
  6656. <String>http://Anonymouse.org/ (Unix)</String>
  6657. <Description>Anonymous web proxy service</Description>
  6658. <Type>P</Type>
  6659. <Comment></Comment>
  6660. <Link1>http://anonymouse.org/</Link1>
  6661. <Link2></Link2>
  6662. </user-agent>
  6663. <user-agent>
  6664. <ID>id_g_m_453</ID>
  6665. <String>http://Ask.24x.Info/ (http://narres.it/)</String>
  6666. <Description>Ask 24x Info (Germany) DMOZ related robot</Description>
  6667. <Type>R</Type>
  6668. <Comment></Comment>
  6669. <Link1>http://narres.it</Link1>
  6670. <Link2></Link2>
  6671. </user-agent>
  6672. <user-agent>
  6673. <ID>id_g_m_070209_6</ID>
  6674. <String>http://hilfe.acont.de/bot.html ACONTBOT</String>
  6675. <Description>ACONTBOT - Acont search Germany robot</Description>
  6676. <Type>R</Type>
  6677. <Comment>82.149.246.2x</Comment>
  6678. <Link1>http://acont.de/</Link1>
  6679. <Link2>http://hilfe.acont.de/bot.html</Link2>
  6680. </user-agent>
  6681. <user-agent>
  6682. <ID>id_g_m_230408_1</ID>
  6683. <String>http://OzySoftware.com/Index.html</String>
  6684. <Description>OzySoftware.com software directory link checking</Description>
  6685. <Type>C</Type>
  6686. <Comment>202.173.141.x</Comment>
  6687. <Link1>http://ozysoftware.com/index.html</Link1>
  6688. <Link2></Link2>
  6689. </user-agent>
  6690. <user-agent>
  6691. <ID>id_g_m_454</ID>
  6692. <String>http://www.almaden.ibm.com/cs/crawler</String>
  6693. <Description>IBM's Almaden Research robot</Description>
  6694. <Type>R</Type>
  6695. <Comment> s. also: - FocusedSampler - WFARC</Comment>
  6696. <Link1>http://www.almaden.ibm.com</Link1>
  6697. <Link2></Link2>
  6698. </user-agent>
  6699. <user-agent>
  6700. <ID>id_g_m_455</ID>
  6701. <String>http://www.almaden.ibm.com/cs/crawler [rc1.wf.ibm.com]</String>
  6702. <Description>IBM's Almaden Research robot</Description>
  6703. <Type>R</Type>
  6704. <Comment></Comment>
  6705. <Link1>http://www.almaden.ibm.com</Link1>
  6706. <Link2></Link2>
  6707. </user-agent>
  6708. <user-agent>
  6709. <ID>id_g_m_456</ID>
  6710. <String>http://www.almaden.ibm.com/cs/crawler [wf216]</String>
  6711. <Description>IBM's Almaden Research robot</Description>
  6712. <Type>R</Type>
  6713. <Comment></Comment>
  6714. <Link1>http://www.almaden.ibm.com</Link1>
  6715. <Link2></Link2>
  6716. </user-agent>
  6717. <user-agent>
  6718. <ID>id_g_m_271105_4</ID>
  6719. <String>http://www.istarthere.com_spider@istarthere.com</String>
  6720. <Description>Istarthere.com search robot</Description>
  6721. <Type>R</Type>
  6722. <Comment></Comment>
  6723. <Link1>http://www.istarthere.com/</Link1>
  6724. <Link2></Link2>
  6725. </user-agent>
  6726. <user-agent>
  6727. <ID>id_g_m_070106_1</ID>
  6728. <String>http://www.monogol.de</String>
  6729. <Description>Monogol - German open source search engine project (195.226.167.1xx)</Description>
  6730. <Type>R</Type>
  6731. <Comment></Comment>
  6732. <Link1>http://www.monogol.de/</Link1>
  6733. <Link2></Link2>
  6734. </user-agent>
  6735. <user-agent>
  6736. <ID>id_g_m_060806_4</ID>
  6737. <String>http://www.trendtech.dk/spider.asp)</String>
  6738. <Description>TrendTech Search Engine (Denmark) robot</Description>
  6739. <Type>R</Type>
  6740. <Comment>87.104.18.xx</Comment>
  6741. <Link1>http://www.trendtech.dk/</Link1>
  6742. <Link2></Link2>
  6743. </user-agent>
  6744. <user-agent>
  6745. <ID>id_g_m_290106_1</ID>
  6746. <String>HTTP::Lite/2.x.x</String>
  6747. <Description>HTTP::Lite - Standalone Perl module for retrieving HTTP documents</Description>
  6748. <Type>D</Type>
  6749. <Comment></Comment>
  6750. <Link1>http://www.toybox.ca/http-lite/</Link1>
  6751. <Link2></Link2>
  6752. </user-agent>
  6753. <user-agent>
  6754. <ID>id_g_m_050108_1</ID>
  6755. <String>HTTPEyes</String>
  6756. <Description>HTTPEyes - Web proxy cache</Description>
  6757. <Type>P</Type>
  6758. <Comment></Comment>
  6759. <Link1>http://bachue.com/httpeyes/</Link1>
  6760. <Link2></Link2>
  6761. </user-agent>
  6762. <user-agent>
  6763. <ID>id_g_m_457</ID>
  6764. <String>HTTPResume v. 1.x</String>
  6765. <Description>HTTPResume Amiga download manager</Description>
  6766. <Type>D</Type>
  6767. <Comment></Comment>
  6768. <Link1>http://tesla.rcub.bg.ac.yu/%7Eantony/HTTPResume/</Link1>
  6769. <Link2></Link2>
  6770. </user-agent>
  6771. <user-agent>
  6772. <ID>id_g_m_031107_2</ID>
  6773. <String>httpunit/1.5</String>
  6774. <Description>HttpUnit - Java test code for emulating browser behaviour</Description>
  6775. <Type>B</Type>
  6776. <Comment></Comment>
  6777. <Link1>http://httpunit.sourceforge.net/</Link1>
  6778. <Link2></Link2>
  6779. </user-agent>
  6780. <user-agent>
  6781. <ID>id_g_m_090306_1</ID>
  6782. <String>httpunit/1.x</String>
  6783. <Description>HttpUnit - Java browser behavior simulation tool</Description>
  6784. <Type>B</Type>
  6785. <Comment></Comment>
  6786. <Link1>http://httpunit.sourceforge.net/</Link1>
  6787. <Link2></Link2>
  6788. </user-agent>
  6789. <user-agent>
  6790. <ID>id_g_m_010807_1</ID>
  6791. <String>Hybrid/1.2 [en] (OS Independent)</String>
  6792. <Description>Hybrid Share mono C#/Gtk# application for file sharing</Description>
  6793. <Type></Type>
  6794. <Comment></Comment>
  6795. <Link1>http://hybrid-share.sourceforge.net/index.php</Link1>
  6796. <Link2></Link2>
  6797. </user-agent>
  6798. <user-agent>
  6799. <ID>id_g_m_300507_1</ID>
  6800. <String>HyperEstraier/1.x.xx</String>
  6801. <Description>Hyper Estraier full-text search system</Description>
  6802. <Type>D</Type>
  6803. <Comment></Comment>
  6804. <Link1>http://hyperestraier.sourceforge.net/</Link1>
  6805. <Link2></Link2>
  6806. </user-agent>
  6807. <user-agent>
  6808. <ID>id_g_m_170906_1</ID>
  6809. <String>i1searchbot/2.0 (i1search web crawler; http://www.i1search.com; crawler@i1search.com)</String>
  6810. <Description>i1search robot</Description>
  6811. <Type>R</Type>
  6812. <Comment>65.111.164.1xx</Comment>
  6813. <Link1>http://www.i1search.com/</Link1>
  6814. <Link2></Link2>
  6815. </user-agent>
  6816. <user-agent>
  6817. <ID>id_g_m_461</ID>
  6818. <String>IAArchiver-1.0</String>
  6819. <Description>Alexa / The Internet Archive (209.237.238.1xx)</Description>
  6820. <Type>R</Type>
  6821. <Comment></Comment>
  6822. <Link1>http://www.alexa.com</Link1>
  6823. <Link2></Link2>
  6824. </user-agent>
  6825. <user-agent>
  6826. <ID>id_g_m_091205_2</ID>
  6827. <String>iaskspider</String>
  6828. <Description>Unknown robot (reads robots.txt) from chinatelecom (219.142.78.xx)</Description>
  6829. <Type></Type>
  6830. <Comment>Not from iask.com.cn - s. also Mozilla/5.0 (compatible; iaskspider/1.0 ..</Comment>
  6831. <Link1></Link1>
  6832. <Link2></Link2>
  6833. </user-agent>
  6834. <user-agent>
  6835. <ID>id_g_m_111106_1</ID>
  6836. <String>iaskspider2 (iask@staff.sina.com.cn)</String>
  6837. <Description>Iask search / Sina portal robot (China)</Description>
  6838. <Type>R</Type>
  6839. <Comment>202.106.184.xxx</Comment>
  6840. <Link1>http://iask.com/</Link1>
  6841. <Link2>http://english.sina.com/index.html</Link2>
  6842. </user-agent>
  6843. <user-agent>
  6844. <ID>id_g_m_458</ID>
  6845. <String>ia_archiver</String>
  6846. <Description>Alexa / The Internet Archive (209.237.238.1xx)</Description>
  6847. <Type>R</Type>
  6848. <Comment></Comment>
  6849. <Link1>http://www.alexa.com</Link1>
  6850. <Link2></Link2>
  6851. </user-agent>
  6852. <user-agent>
  6853. <ID>id_g_m_459</ID>
  6854. <String>ia_archiver-web.archive.org</String>
  6855. <Description>Alexa / The Internet Archive (209.237.238.1xx)</Description>
  6856. <Type>R</Type>
  6857. <Comment></Comment>
  6858. <Link1>http://www.alexa.com</Link1>
  6859. <Link2></Link2>
  6860. </user-agent>
  6861. <user-agent>
  6862. <ID>id_g_m_460</ID>
  6863. <String>ia_archiver/1.6</String>
  6864. <Description>Alexa / The Internet Archive (209.237.238.1xx)</Description>
  6865. <Type>R</Type>
  6866. <Comment></Comment>
  6867. <Link1>http://www.alexa.com</Link1>
  6868. <Link2></Link2>
  6869. </user-agent>
  6870. <user-agent>
  6871. <ID>id_g_m_462</ID>
  6872. <String>IBrowse/2.2 (AmigaOS 3.5)</String>
  6873. <Description>IOSpirit iBrowse Amiga Browser</Description>
  6874. <Type>B</Type>
  6875. <Comment>was Hisoft (http://www.hisoft.co.uk)</Comment>
  6876. <Link1>http://amiga.iospirit.de/</Link1>
  6877. <Link2></Link2>
  6878. </user-agent>
  6879. <user-agent>
  6880. <ID>id_g_m_463</ID>
  6881. <String>IBrowse/2.2 (Windows 3.1)</String>
  6882. <Description>IOSpirit iBrowse Amiga Browser</Description>
  6883. <Type>B</Type>
  6884. <Comment>was Hisoft (http://www.hisoft.co.uk)</Comment>
  6885. <Link1>http://amiga.iospirit.de/</Link1>
  6886. <Link2></Link2>
  6887. </user-agent>
  6888. <user-agent>
  6889. <ID>id_g_m_464</ID>
  6890. <String>iCab/2.5.2 (Macintosh; I; PPC)</String>
  6891. <Description>iCab MAC Web browser</Description>
  6892. <Type>B</Type>
  6893. <Comment></Comment>
  6894. <Link1>http://www.icab.de</Link1>
  6895. <Link2></Link2>
  6896. </user-agent>
  6897. <user-agent>
  6898. <ID>id_g_m_110207_2</ID>
  6899. <String>ICC-Crawler(Mozilla-compatible; http://kc.nict.go.jp/icc/crawl.html; icc-crawl(at)ml(dot)nict(dot)go(dot)jp)</String>
  6900. <Description>Knowledge Clustered Group ICC-Crawler (University of Tokyo - Japan)</Description>
  6901. <Type>R</Type>
  6902. <Comment>202.180.34.1xx</Comment>
  6903. <Link1>http://kc.nict.go.jp/icc/crawl.html</Link1>
  6904. <Link2></Link2>
  6905. </user-agent>
  6906. <user-agent>
  6907. <ID>id_g_m_250607_1</ID>
  6908. <String>ICC-Crawler(Mozilla-compatible;http://kc.nict.go.jp/icc/crawl.html;icc-crawl-contact(at)ml(dot)nict(dot)go(dot)jp)</String>
  6909. <Description>Knowledge Clustered Group ICC-Crawler (University of Tokyo - Japan)</Description>
  6910. <Type>R</Type>
  6911. <Comment>202.180.34.1xx</Comment>
  6912. <Link1>http://kc.nict.go.jp/icc/crawl.html</Link1>
  6913. <Link2></Link2>
  6914. </user-agent>
  6915. <user-agent>
  6916. <ID>id_g_m_465</ID>
  6917. <String>iCCrawler (http://www.iccenter.net)</String>
  6918. <Description>ICJobs - Intelligence Competence Center (Germany) robot</Description>
  6919. <Type>R</Type>
  6920. <Comment>212.227.76.xx</Comment>
  6921. <Link1>http://www.iccenter.net</Link1>
  6922. <Link2></Link2>
  6923. </user-agent>
  6924. <user-agent>
  6925. <ID>id_g_m_121006_1</ID>
  6926. <String>ICCrawler - ICjobs (http://www.icjobs.de/bot.htm)</String>
  6927. <Description>ICJobs - Intelligence Competence Center (Germany) robot</Description>
  6928. <Type>R</Type>
  6929. <Comment>212.227.76.xx</Comment>
  6930. <Link1>http://www.iccenter.net</Link1>
  6931. <Link2></Link2>
  6932. </user-agent>
  6933. <user-agent>
  6934. <ID>id_g_m_466</ID>
  6935. <String>ICE Browser/5.05 (Java 1.4.0; Windows 2000 5.0 x86)</String>
  6936. <Description>ICE Java browser</Description>
  6937. <Type>B</Type>
  6938. <Comment></Comment>
  6939. <Link1>http://www.ii.uib.no/~alexey/jb/</Link1>
  6940. <Link2></Link2>
  6941. </user-agent>
  6942. <user-agent>
  6943. <ID>id_g_m_040206_2</ID>
  6944. <String>ichiro/x.0 (http://help.goo.ne.jp/door/crawler.html)</String>
  6945. <Description>Goo Japan / Inktomi robot (210.173.179.xx)</Description>
  6946. <Type>R</Type>
  6947. <Comment> s. also moget / mogimogi</Comment>
  6948. <Link1>http://www.goo.ne.jp</Link1>
  6949. <Link2></Link2>
  6950. </user-agent>
  6951. <user-agent>
  6952. <ID>id_g_m_468</ID>
  6953. <String>ichiro/x.0 (ichiro@nttr.co.jp)</String>
  6954. <Description>Goo Japan / Inktomi robot (210.173.179.xx)</Description>
  6955. <Type>R</Type>
  6956. <Comment> s. also moget / mogimogi</Comment>
  6957. <Link1>http://www.goo.ne.jp</Link1>
  6958. <Link2></Link2>
  6959. </user-agent>
  6960. <user-agent>
  6961. <ID>id_g_m_469</ID>
  6962. <String>IconSurf/2.0 favicon finder (see http://iconsurf.com/robot.html)</String>
  6963. <Description>Iconsurf.com - Visual Surf Engine / favicon finder</Description>
  6964. <Type>R</Type>
  6965. <Comment></Comment>
  6966. <Link1>http://iconsurf.com</Link1>
  6967. <Link2></Link2>
  6968. </user-agent>
  6969. <user-agent>
  6970. <ID>id_g_m_470</ID>
  6971. <String>IconSurf/2.0 favicon monitor (see http://iconsurf.com/robot.html)</String>
  6972. <Description>Iconsurf.com - Visual Surf Engine / favicon finder</Description>
  6973. <Type>R</Type>
  6974. <Comment></Comment>
  6975. <Link1>http://iconsurf.com</Link1>
  6976. <Link2></Link2>
  6977. </user-agent>
  6978. <user-agent>
  6979. <ID>id_g_m_471</ID>
  6980. <String>ICOO Loader v.x.x.x</String>
  6981. <Description>icooLoader download manager</Description>
  6982. <Type>D</Type>
  6983. <Comment></Comment>
  6984. <Link1>http://www.icoonet.com</Link1>
  6985. <Link2></Link2>
  6986. </user-agent>
  6987. <user-agent>
  6988. <ID>id_g_m_472</ID>
  6989. <String>ICRA_label_spider/x.0</String>
  6990. <Description>ICRA (Internet Content Rating Association) label spider</Description>
  6991. <Type>R</Type>
  6992. <Comment></Comment>
  6993. <Link1>http://www.icra.org</Link1>
  6994. <Link2></Link2>
  6995. </user-agent>
  6996. <user-agent>
  6997. <ID>id_g_m_473</ID>
  6998. <String>icsbot-0.1</String>
  6999. <Description>ICS Robot Search Engine (International Christian School of Seoul)</Description>
  7000. <Type>R</Type>
  7001. <Comment></Comment>
  7002. <Link1>http://icseoul.org/</Link1>
  7003. <Link2></Link2>
  7004. </user-agent>
  7005. <user-agent>
  7006. <ID>id_g_m_260306_1</ID>
  7007. <String>IDA</String>
  7008. <Description>Internet Download Accelerator</Description>
  7009. <Type>D</Type>
  7010. <Comment></Comment>
  7011. <Link1>http://www.westbyte.com/ida/</Link1>
  7012. <Link2></Link2>
  7013. </user-agent>
  7014. <user-agent>
  7015. <ID>id_g_m_474</ID>
  7016. <String>ideare - SignSite/1.x</String>
  7017. <Description>Janas (Ideare.com / Tiscali.it) robot</Description>
  7018. <Type>R</Type>
  7019. <Comment></Comment>
  7020. <Link1></Link1>
  7021. <Link2></Link2>
  7022. </user-agent>
  7023. <user-agent>
  7024. <ID>id_g_m_200806_1</ID>
  7025. <String>iearthworm/1.0&#44; iearthworm@yahoo.com.cn</String>
  7026. <Description>Unknown UA from Yahoo China</Description>
  7027. <Type></Type>
  7028. <Comment>202.165.105.x</Comment>
  7029. <Link1></Link1>
  7030. <Link2></Link2>
  7031. </user-agent>
  7032. <user-agent>
  7033. <ID>id_g_m_475</ID>
  7034. <String>IEFav172Free</String>
  7035. <Description>Some bookmark manager</Description>
  7036. <Type>C</Type>
  7037. <Comment> possibly Visit URL ??</Comment>
  7038. <Link1>http://www.lodz.pdi.net/%7Eeristic/free/index.html</Link1>
  7039. <Link2></Link2>
  7040. </user-agent>
  7041. <user-agent>
  7042. <ID>id_g_m_060608_4</ID>
  7043. <String>iFeed.jp/2.0 (www.psychedelix.com/agents/agents.rss; 0 subscribers)</String>
  7044. <Description>iFeed.jp - online rss aggregator (in development)</Description>
  7045. <Type>R</Type>
  7046. <Comment>67.15.2[3-4][X].xxx</Comment>
  7047. <Link1>http://www.ifeed.jp/</Link1>
  7048. <Link2></Link2>
  7049. </user-agent>
  7050. <user-agent>
  7051. <ID>id_g_m_281207_1</ID>
  7052. <String>igdeSpyder (compatible; igde.ru; +http://igde.ru/doc/tech.html)</String>
  7053. <Description>Igde search (Russia) robot</Description>
  7054. <Type>R</Type>
  7055. <Comment>87.118.118.12x</Comment>
  7056. <Link1>http://igde.ru/</Link1>
  7057. <Link2></Link2>
  7058. </user-agent>
  7059. <user-agent>
  7060. <ID>id_g_m_476</ID>
  7061. <String>iGetter/1.x (Macintosh;G;PPC)</String>
  7062. <Description>iGetter download manager</Description>
  7063. <Type>D</Type>
  7064. <Comment></Comment>
  7065. <Link1>http://www.igetter.net</Link1>
  7066. <Link2></Link2>
  7067. </user-agent>
  7068. <user-agent>
  7069. <ID>id_g_m_477</ID>
  7070. <String>iGetter/2 (Macintosh; U; PPC Mac OS X; en)</String>
  7071. <Description>iGetter download manager</Description>
  7072. <Type>D</Type>
  7073. <Comment></Comment>
  7074. <Link1>http://www.igetter.net</Link1>
  7075. <Link2></Link2>
  7076. </user-agent>
  7077. <user-agent>
  7078. <ID>id_g_m_120507_1</ID>
  7079. <String>IIITBOT/1.1 (Indian Language Web Search Engine; http://webkhoj.iiit.net; pvvpr at iiit dot ac dot in)</String>
  7080. <Description>Webkhoj - Indian language search engine</Description>
  7081. <Type>R</Type>
  7082. <Comment>196.12.53.xx</Comment>
  7083. <Link1>http://webkhoj.iiit.net/</Link1>
  7084. <Link2></Link2>
  7085. </user-agent>
  7086. <user-agent>
  7087. <ID>id_g_m_040607_2</ID>
  7088. <String>ilial/Nutch-0.9 (Ilial&#44; Inc. is a Los Angeles based Internet startup company. For more information please visit http://www.ilial.com/crawler; http://www.ilial.com/crawler; crawl@ilial.com)</String>
  7089. <Description>Ilial Knowledge Search robot</Description>
  7090. <Type>R</Type>
  7091. <Comment>72.44.58.2xx</Comment>
  7092. <Link1>http://www.ilial.com/crawler/</Link1>
  7093. <Link2></Link2>
  7094. </user-agent>
  7095. <user-agent>
  7096. <ID>id_g_m_290906_1</ID>
  7097. <String>ilial/Nutch-0.9-dev</String>
  7098. <Description>Unknown robot from UCLA using Nutch</Description>
  7099. <Type>R</Type>
  7100. <Comment>164.67.195.xx</Comment>
  7101. <Link1>http://www.ucla.edu/</Link1>
  7102. <Link2>http://lucene.apache.org/nutch/</Link2>
  7103. </user-agent>
  7104. <user-agent>
  7105. <ID>id_g_m_270806_1</ID>
  7106. <String>IlseBot/1.x</String>
  7107. <Description>Ilse Netherlands robot (62.69.178.xx)</Description>
  7108. <Type>R</Type>
  7109. <Comment>s. also INGRID/3.0 .. / Mozilla/3.0 (INGRID/3.0 ..</Comment>
  7110. <Link1>http://www.ilse.nl/</Link1>
  7111. <Link2></Link2>
  7112. </user-agent>
  7113. <user-agent>
  7114. <ID>id_g_m_478</ID>
  7115. <String>IlTrovatore-Setaccio ( http://www.iltrovatore.it)</String>
  7116. <Description>Il Trovatore - Italian search engine robot</Description>
  7117. <Type>R</Type>
  7118. <Comment>213.215.201.2xx</Comment>
  7119. <Link1>http://www.iltrovatore.it</Link1>
  7120. <Link2></Link2>
  7121. </user-agent>
  7122. <user-agent>
  7123. <ID>id_g_m_479</ID>
  7124. <String>Iltrovatore-Setaccio/0.3-dev (Indexing; http://www.iltrovatore.it/bot.html; info@iltrovatore.it)</String>
  7125. <Description>Il Trovatore - Italian search engine robot</Description>
  7126. <Type>R</Type>
  7127. <Comment>213.215.201.2xx</Comment>
  7128. <Link1>http://www.iltrovatore.it</Link1>
  7129. <Link2></Link2>
  7130. </user-agent>
  7131. <user-agent>
  7132. <ID>id_g_m_480</ID>
  7133. <String>IlTrovatore-Setaccio/1.2 ( http://www.iltrovatore.it/aiuto/faq.html)</String>
  7134. <Description>Il Trovatore - Italian search engine robot</Description>
  7135. <Type>R</Type>
  7136. <Comment>213.215.201.2xx</Comment>
  7137. <Link1>http://www.iltrovatore.it</Link1>
  7138. <Link2></Link2>
  7139. </user-agent>
  7140. <user-agent>
  7141. <ID>id_g_m_481</ID>
  7142. <String>Iltrovatore-Setaccio/1.2 (It-bot; http://www.iltrovatore.it/bot.html; info@iltrovatore.it)</String>
  7143. <Description>Il Trovatore - Italian search engine robot</Description>
  7144. <Type>R</Type>
  7145. <Comment>213.215.201.2xx</Comment>
  7146. <Link1>http://www.iltrovatore.it</Link1>
  7147. <Link2></Link2>
  7148. </user-agent>
  7149. <user-agent>
  7150. <ID>id_g_m_482</ID>
  7151. <String>iltrovatore-setaccio/1.2-dev (spidering; http://www.iltrovatore.it/aiuto/.....)</String>
  7152. <Description>Il Trovatore - Italian search engine robot</Description>
  7153. <Type>R</Type>
  7154. <Comment>213.215.201.2xx</Comment>
  7155. <Link1>http://www.iltrovatore.it</Link1>
  7156. <Link2></Link2>
  7157. </user-agent>
  7158. <user-agent>
  7159. <ID>id_g_m_040506_1</ID>
  7160. <String>IlTrovatore/1.2 (IlTrovatore; http://www.iltrovatore.it/bot.html; bot@iltrovatore.it)</String>
  7161. <Description>Il Trovatore - Italian search engine robot</Description>
  7162. <Type>R</Type>
  7163. <Comment>213.215.201.2xx</Comment>
  7164. <Link1>http://www.iltrovatore.it</Link1>
  7165. <Link2></Link2>
  7166. </user-agent>
  7167. <user-agent>
  7168. <ID>id_g_m_060107_2</ID>
  7169. <String>ImageVisu/v4.x.x</String>
  7170. <Description>ImageVisu image and graphics viewer - display files from the Web (HTTP and ECWP)</Description>
  7171. <Type>B</Type>
  7172. <Comment></Comment>
  7173. <Link1>http://geovisu.free.fr/imagvisu/english/</Link1>
  7174. <Link2></Link2>
  7175. </user-agent>
  7176. <user-agent>
  7177. <ID>id_g_m_080907_1</ID>
  7178. <String>ImageWalker/2.0 (www.bdbrandprotect.com)</String>
  7179. <Description>BD-Brandprotect copyright infringement crawler</Description>
  7180. <Type>R</Type>
  7181. <Comment>72.14.164.1xx</Comment>
  7182. <Link1>http://www.bdbrandprotect.com/</Link1>
  7183. <Link2>http://www.bdbrandprotect.com/solutions_5.html</Link2>
  7184. </user-agent>
  7185. <user-agent>
  7186. <ID>id_g_m_110306_1</ID>
  7187. <String>Incutio HttpClient v0.x</String>
  7188. <Description>HttpClient - a PHP Web Client Class</Description>
  7189. <Type></Type>
  7190. <Comment></Comment>
  7191. <Link1>http://scripts.incutio.com/httpclient/index.php</Link1>
  7192. <Link2></Link2>
  7193. </user-agent>
  7194. <user-agent>
  7195. <ID>id_g_m_483</ID>
  7196. <String>IncyWincy data gatherer(webmaster@loopimprovements.com</String>
  7197. <Description>IncyWincy search engine using DMOZ Open Directory database</Description>
  7198. <Type>R</Type>
  7199. <Comment></Comment>
  7200. <Link1>http://www.loopimprovements.com</Link1>
  7201. <Link2></Link2>
  7202. </user-agent>
  7203. <user-agent>
  7204. <ID>id_g_m_484</ID>
  7205. <String>IncyWincy page crawler(webmaster@loopimprovements.com</String>
  7206. <Description>IncyWincy search engine using DMOZ Open Directory database</Description>
  7207. <Type>R</Type>
  7208. <Comment></Comment>
  7209. <Link1>http://www.loopimprovements.com</Link1>
  7210. <Link2></Link2>
  7211. </user-agent>
  7212. <user-agent>
  7213. <ID>id_g_m_485</ID>
  7214. <String>IncyWincy(http://www.look.com)</String>
  7215. <Description>Look.com robot using IncyWincy search engine</Description>
  7216. <Type>R</Type>
  7217. <Comment></Comment>
  7218. <Link1>http://www.loopimprovements.com</Link1>
  7219. <Link2></Link2>
  7220. </user-agent>
  7221. <user-agent>
  7222. <ID>id_g_m_486</ID>
  7223. <String>IncyWincy(http://www.loopimprovements.com/robot.html)</String>
  7224. <Description>IncyWincy search engine using DMOZ Open Directory database</Description>
  7225. <Type>R</Type>
  7226. <Comment></Comment>
  7227. <Link1>http://www.loopimprovements.com</Link1>
  7228. <Link2></Link2>
  7229. </user-agent>
  7230. <user-agent>
  7231. <ID>id_g_m_487</ID>
  7232. <String>IncyWincy/2.1(loopimprovements.com/robot.html)</String>
  7233. <Description>IncyWincy search engine using DMOZ Open Directory database</Description>
  7234. <Type>R</Type>
  7235. <Comment></Comment>
  7236. <Link1>http://www.loopimprovements.com</Link1>
  7237. <Link2></Link2>
  7238. </user-agent>
  7239. <user-agent>
  7240. <ID>id_g_m_488</ID>
  7241. <String>IndexTheWeb.com Crawler7</String>
  7242. <Description>Index the Web (69.57.134.xx) crawler</Description>
  7243. <Type>R</Type>
  7244. <Comment></Comment>
  7245. <Link1>http://www.indextheweb.com/</Link1>
  7246. <Link2></Link2>
  7247. </user-agent>
  7248. <user-agent>
  7249. <ID>id_g_m_489</ID>
  7250. <String>Industry Program 1.0.x</String>
  7251. <Description>Spam bot from diff. IPs</Description>
  7252. <Type>S</Type>
  7253. <Comment>see also Educate Search VxB - Full Web Bot</Comment>
  7254. <Link1></Link1>
  7255. <Link2></Link2>
  7256. </user-agent>
  7257. <user-agent>
  7258. <ID>id_g_m_490</ID>
  7259. <String>Inet library</String>
  7260. <Description>Inet Library Resource Center robot</Description>
  7261. <Type>R</Type>
  7262. <Comment></Comment>
  7263. <Link1>http://www.inetlibrary.com</Link1>
  7264. <Link2></Link2>
  7265. </user-agent>
  7266. <user-agent>
  7267. <ID>id_g_m_491</ID>
  7268. <String>InetURL/1.0</String>
  7269. <Description>InetURL IVM (phone software) plugin for web server access ?</Description>
  7270. <Type></Type>
  7271. <Comment></Comment>
  7272. <Link1>http://www.nch.com.au/ivm/plugins.html</Link1>
  7273. <Link2></Link2>
  7274. </user-agent>
  7275. <user-agent>
  7276. <ID>id_g_m_270607_1</ID>
  7277. <String>info@pubblisito.com- (http://www.pubblisito.com) il Sud dei Motori di Ricerca</String>
  7278. <Description>Pubblisito.com search - Italia</Description>
  7279. <Type>R</Type>
  7280. <Comment>88.149.164.2xx</Comment>
  7281. <Link1>http://www.pubblisito.com/search/</Link1>
  7282. <Link2></Link2>
  7283. </user-agent>
  7284. <user-agent>
  7285. <ID>id_g_m_211208_2</ID>
  7286. <String>Infoaxe./Nutch-0.9</String>
  7287. <Description>Infoaxe - search history and bookmark service</Description>
  7288. <Type>C</Type>
  7289. <Comment>75.126.48.17x</Comment>
  7290. <Link1>http://www.infoaxe.com/</Link1>
  7291. <Link2></Link2>
  7292. </user-agent>
  7293. <user-agent>
  7294. <ID>id_g_m_492</ID>
  7295. <String>infoConveraCrawler/0.8 ( http://www.authoritativeweb.com/crawl)</String>
  7296. <Description>Convera's RetrievalWare Internet Spider (63.241.61.x)</Description>
  7297. <Type>R S ?</Type>
  7298. <Comment>s.also - Convera... Maybe does guestbook / forum spamming s. here http://www.webmasterworld.com/forum11/2871.htm</Comment>
  7299. <Link1>http://www.convera.com/Products/</Link1>
  7300. <Link2></Link2>
  7301. </user-agent>
  7302. <user-agent>
  7303. <ID>id_g_m_493</ID>
  7304. <String>InfoFly/1.0 (http://www.versions-project.org/)</String>
  7305. <Description>Versions-project.org Ingelin spider</Description>
  7306. <Type>R</Type>
  7307. <Comment></Comment>
  7308. <Link1>http://www.versions-project.org/</Link1>
  7309. <Link2></Link2>
  7310. </user-agent>
  7311. <user-agent>
  7312. <ID>id_g_m_494</ID>
  7313. <String>InfoLink/1.x</String>
  7314. <Description>InfoLink link checking tool</Description>
  7315. <Type>C</Type>
  7316. <Comment></Comment>
  7317. <Link1>http://www.biggbyte.com/biggbyte3/index.html</Link1>
  7318. <Link2></Link2>
  7319. </user-agent>
  7320. <user-agent>
  7321. <ID>id_g_m_495</ID>
  7322. <String>INFOMINE/8.0 Adders</String>
  7323. <Description>INFOMINE Scholarly Internet Resource Collection crawler</Description>
  7324. <Type>R</Type>
  7325. <Comment></Comment>
  7326. <Link1>http://infomine.ucr.edu</Link1>
  7327. <Link2></Link2>
  7328. </user-agent>
  7329. <user-agent>
  7330. <ID>id_g_m_496</ID>
  7331. <String>INFOMINE/8.0 RemoteServices</String>
  7332. <Description>INFOMINE Scholarly Internet Resource Collection crawler</Description>
  7333. <Type>R</Type>
  7334. <Comment></Comment>
  7335. <Link1>http://infomine.ucr.edu</Link1>
  7336. <Link2></Link2>
  7337. </user-agent>
  7338. <user-agent>
  7339. <ID>id_g_m_497</ID>
  7340. <String>INFOMINE/8.0 VLCrawler (http://infomine.ucr.edu/useragents)</String>
  7341. <Description>INFOMINE Scholarly Internet Resource Collection crawler</Description>
  7342. <Type>R</Type>
  7343. <Comment></Comment>
  7344. <Link1>http://infomine.ucr.edu</Link1>
  7345. <Link2></Link2>
  7346. </user-agent>
  7347. <user-agent>
  7348. <ID>id_g_m_498</ID>
  7349. <String>InfoNaviRobot(F107)</String>
  7350. <Description>164.71.1.1xx jp.co.fujitsu.t2 Robot</Description>
  7351. <Type>R</Type>
  7352. <Comment></Comment>
  7353. <Link1></Link1>
  7354. <Link2></Link2>
  7355. </user-agent>
  7356. <user-agent>
  7357. <ID>id_g_m_499</ID>
  7358. <String>InfoSeek Sidewinder/0.9</String>
  7359. <Description>Infoseek robot</Description>
  7360. <Type>R</Type>
  7361. <Comment></Comment>
  7362. <Link1>http://www.infoseek.com</Link1>
  7363. <Link2></Link2>
  7364. </user-agent>
  7365. <user-agent>
  7366. <ID>id_g_m_500</ID>
  7367. <String>InfoSeek Sidewinder/1.0A</String>
  7368. <Description>Infoseek robot</Description>
  7369. <Type>R</Type>
  7370. <Comment></Comment>
  7371. <Link1>http://www.infoseek.com</Link1>
  7372. <Link2></Link2>
  7373. </user-agent>
  7374. <user-agent>
  7375. <ID>id_g_m_501</ID>
  7376. <String>InfoSeek Sidewinder/1.1A</String>
  7377. <Description>Infoseek robot</Description>
  7378. <Type>R</Type>
  7379. <Comment></Comment>
  7380. <Link1>http://www.infoseek.com</Link1>
  7381. <Link2></Link2>
  7382. </user-agent>
  7383. <user-agent>
  7384. <ID>id_g_m_502</ID>
  7385. <String>Infoseek SideWinder/1.45 (Compatible; MSIE 10.0; UNIX)</String>
  7386. <Description>Infoseek robot</Description>
  7387. <Type>R</Type>
  7388. <Comment></Comment>
  7389. <Link1>http://www.infoseek.com</Link1>
  7390. <Link2></Link2>
  7391. </user-agent>
  7392. <user-agent>
  7393. <ID>id_g_m_503</ID>
  7394. <String>Infoseek SideWinder/2.0B (Linux 2.4 i686)</String>
  7395. <Description>Infoseek Japan robot</Description>
  7396. <Type>R</Type>
  7397. <Comment>210.148.160.1xx</Comment>
  7398. <Link1>http://www.infoseek.com</Link1>
  7399. <Link2></Link2>
  7400. </user-agent>
  7401. <user-agent>
  7402. <ID>id_g_m_504</ID>
  7403. <String>INGRID/3.0 MT (webcrawler@NOSPAMexperimental.net; http://webmaster.ilse.nl/jsp/webmaster.jsp)</String>
  7404. <Description>Ilse Netherlands robot (62.69.178.xx)</Description>
  7405. <Type>R</Type>
  7406. <Comment> s.also - Mozilla/3.0 (INGRID/3.0 .. / IlseBot/1.0 ..</Comment>
  7407. <Link1>http://www.ilse.nl/</Link1>
  7408. <Link2></Link2>
  7409. </user-agent>
  7410. <user-agent>
  7411. <ID>id_g_m_505</ID>
  7412. <String>Inktomi Search</String>
  7413. <Description>Inktomi (Hotbot-Lycos NBCi etc.) robot</Description>
  7414. <Type>R</Type>
  7415. <Comment></Comment>
  7416. <Link1>http://www.inktomi.com/</Link1>
  7417. <Link2></Link2>
  7418. </user-agent>
  7419. <user-agent>
  7420. <ID>id_g_m_506</ID>
  7421. <String>InnerpriseBot/1.0 (http://www.innerprise.com/)</String>
  7422. <Description>Enterprise Search engine software (64.202.165.xxx) </Description>
  7423. <Type>R</Type>
  7424. <Comment>s. also - Enterprise_Search - ES.NET_Crawler</Comment>
  7425. <Link1>http://www.innerprise.net</Link1>
  7426. <Link2></Link2>
  7427. </user-agent>
  7428. <user-agent>
  7429. <ID>id_g_m_111205_4</ID>
  7430. <String>Insitor.com search and find world wide!</String>
  7431. <Description>Insitor Search robot (80.67.20.1xx)</Description>
  7432. <Type>R</Type>
  7433. <Comment>s. also Insitornaut</Comment>
  7434. <Link1>http://www.insitor.com/</Link1>
  7435. <Link2></Link2>
  7436. </user-agent>
  7437. <user-agent>
  7438. <ID>id_g_m_121205_3</ID>
  7439. <String>Insitornaut</String>
  7440. <Description>Insitor Search robot (80.67.20.1xx)</Description>
  7441. <Type>R</Type>
  7442. <Comment>s. also Insitor.com</Comment>
  7443. <Link1>http://www.insitor.com/</Link1>
  7444. <Link2></Link2>
  7445. </user-agent>
  7446. <user-agent>
  7447. <ID>id_g_m_507</ID>
  7448. <String>InstallShield DigitalWizard</String>
  7449. <Description>download manager</Description>
  7450. <Type>D</Type>
  7451. <Comment></Comment>
  7452. <Link1></Link1>
  7453. <Link2></Link2>
  7454. </user-agent>
  7455. <user-agent>
  7456. <ID>id_g_m_200308_1</ID>
  7457. <String>integrity/1.6</String>
  7458. <Description>Integrity - website broken link checker for Mac OS X</Description>
  7459. <Type>C</Type>
  7460. <Comment></Comment>
  7461. <Link1>http://peacockmedia.co.uk/index.php/products/7-products/4-integrity</Link1>
  7462. <Link2></Link2>
  7463. </user-agent>
  7464. <user-agent>
  7465. <ID>id_g_m_010907_1</ID>
  7466. <String>Intelix/0.x (cs; http://www.microton.cz/intelix/; microton@@microton.cz)</String>
  7467. <Description>Microton Intelix robot for Eurotran translation software ?</Description>
  7468. <Type>D</Type>
  7469. <Comment></Comment>
  7470. <Link1>http://www.microton.cz/intelix/</Link1>
  7471. <Link2></Link2>
  7472. </user-agent>
  7473. <user-agent>
  7474. <ID>id_g_m_508</ID>
  7475. <String>Interarchy/x.x.x (InterarchyCrawler)</String>
  7476. <Description>Interarchy file transfer software - SFTP/FTP client for Mac OS X</Description>
  7477. <Type>D</Type>
  7478. <Comment></Comment>
  7479. <Link1>http://www.interarchy.com</Link1>
  7480. <Link2></Link2>
  7481. </user-agent>
  7482. <user-agent>
  7483. <ID>id_g_m_509</ID>
  7484. <String>Internet Ninja x.0</String>
  7485. <Description>Dream Train (Japan) Internet search robot</Description>
  7486. <Type>R</Type>
  7487. <Comment></Comment>
  7488. <Link1>http://www.dti.ne.jp</Link1>
  7489. <Link2></Link2>
  7490. </user-agent>
  7491. <user-agent>
  7492. <ID>id_g_m_510</ID>
  7493. <String>InternetArchive/0.8-dev(Nutch;http://lucene.apache.org/nutch/bot.html;nutch-agent@lucene.apache</String>
  7494. <Description>Heritrix - The Internet Archive's open-source crawler based on Nutch (207.241.225.2xx)</Description>
  7495. <Type>R</Type>
  7496. <Comment>s.also - archive.org_bot - Mozilla/5.0 (compatible;archive.org_bot/...</Comment>
  7497. <Link1>http://www.archive.org/</Link1>
  7498. <Link2>http://lucene.apache.org</Link2>
  7499. </user-agent>
  7500. <user-agent>
  7501. <ID>id_g_m_511</ID>
  7502. <String>InternetLinkAgent/3.1</String>
  7503. <Description>Internet Link Agent - link checking tool</Description>
  7504. <Type>C</Type>
  7505. <Comment></Comment>
  7506. <Link1>http://www.osk.3web.ne.jp/~goronyan/winprg/sub.shtml</Link1>
  7507. <Link2></Link2>
  7508. </user-agent>
  7509. <user-agent>
  7510. <ID>id_g_m_512</ID>
  7511. <String>InternetSeer.com</String>
  7512. <Description>Internetseer Web site monitoring / Claymont robot</Description>
  7513. <Type>R</Type>
  7514. <Comment></Comment>
  7515. <Link1>http://www.internetseer.com</Link1>
  7516. <Link2></Link2>
  7517. </user-agent>
  7518. <user-agent>
  7519. <ID>id_g_m_513</ID>
  7520. <String>intraVnews/1.x</String>
  7521. <Description>intraVNews - Feed reader &amp; RSS aggregator for Outlook</Description>
  7522. <Type>B</Type>
  7523. <Comment></Comment>
  7524. <Link1>http://www.intravnews.com</Link1>
  7525. <Link2></Link2>
  7526. </user-agent>
  7527. <user-agent>
  7528. <ID>id_g_m_061208_1</ID>
  7529. <String>IOI/2.0 (ISC Open Index crawler; http://index.isc.org/; bot@index.isc.org)</String>
  7530. <Description>Internet Open Index crawler using Nutch</Description>
  7531. <Type>R</Type>
  7532. <Comment>149.20.54.1xx</Comment>
  7533. <Link1>http://index.isc.org/</Link1>
  7534. <Link2>http://www.nutch.org</Link2>
  7535. </user-agent>
  7536. <user-agent>
  7537. <ID>id_g_m_514</ID>
  7538. <String>IP*Works! V5 HTTP/S Component - by /n software - www.nsoftware.com</String>
  7539. <Description>IP*Works! HTTP Component</Description>
  7540. <Type></Type>
  7541. <Comment></Comment>
  7542. <Link1>http://www.nsoftware.com/products/controls/?ctl=HTTP</Link1>
  7543. <Link2></Link2>
  7544. </user-agent>
  7545. <user-agent>
  7546. <ID>id_g_m_515</ID>
  7547. <String>http://www.ip2location.com</String>
  7548. <Description>IP2Location - Reverse lookup geographical data and ISP by IP</Description>
  7549. <Type>R C</Type>
  7550. <Comment></Comment>
  7551. <Link1>http://www.ip2location.com</Link1>
  7552. <Link2></Link2>
  7553. </user-agent>
  7554. <user-agent>
  7555. <ID>id_g_m_270106_1</ID>
  7556. <String>IP2MapBot/1.1 &lt;a href=http://www.ip2map.com>http://www.ip2map.com&lt;/a></String>
  7557. <Description>IP2Map - geographical IP mapping</Description>
  7558. <Type>R C</Type>
  7559. <Comment></Comment>
  7560. <Link1>http://www.ip2map.com/</Link1>
  7561. <Link2></Link2>
  7562. </user-agent>
  7563. <user-agent>
  7564. <ID>id_g_m_516</ID>
  7565. <String>IPiumBot laurion(dot)com</String>
  7566. <Description>Laurion's Ipium robot</Description>
  7567. <Type>R</Type>
  7568. <Comment></Comment>
  7569. <Link1>http://www.laurion.com</Link1>
  7570. <Link2></Link2>
  7571. </user-agent>
  7572. <user-agent>
  7573. <ID>id_g_m_517</ID>
  7574. <String>IpselonBot/0.xx-beta (Ipselon; http://www.ipselon.com; ipselonbot@ipselon.com)</String>
  7575. <Description>Ipselon Web Search robot</Description>
  7576. <Type>R</Type>
  7577. <Comment></Comment>
  7578. <Link1>http://www.ipselon.com</Link1>
  7579. <Link2></Link2>
  7580. </user-agent>
  7581. <user-agent>
  7582. <ID>id_g_m_518</ID>
  7583. <String>Iria/1.xxa</String>
  7584. <Description>Iria download manager</Description>
  7585. <Type>D</Type>
  7586. <Comment></Comment>
  7587. <Link1>http://www5.tok2.com/home/koteturamu/soft/iria.htm</Link1>
  7588. <Link2></Link2>
  7589. </user-agent>
  7590. <user-agent>
  7591. <ID>id_g_m_519</ID>
  7592. <String>IRLbot/1.0 ( http://irl.cs.tamu.edu/crawler)</String>
  7593. <Description>IRL-crawler - Texas A&amp;M University research project crawler</Description>
  7594. <Type>R</Type>
  7595. <Comment>128.194.135.xx</Comment>
  7596. <Link1>http://irl.cs.tamu.edu</Link1>
  7597. <Link2></Link2>
  7598. </user-agent>
  7599. <user-agent>
  7600. <ID>id_g_m_240308_4</ID>
  7601. <String>IRLbot/3.0 (compatible; MSIE 6.0; http://irl.cs.tamu.edu/crawler/)</String>
  7602. <Description>IRL-crawler - Texas A&amp;M University research project crawler</Description>
  7603. <Type>R</Type>
  7604. <Comment>128.194.135.xx</Comment>
  7605. <Link1>http://irl.cs.tamu.edu</Link1>
  7606. <Link2></Link2>
  7607. </user-agent>
  7608. <user-agent>
  7609. <ID>id_g_m_520</ID>
  7610. <String>IrssiUrlLog/0.2</String>
  7611. <Description>url_log - Irssi Perl url grabber</Description>
  7612. <Type></Type>
  7613. <Comment></Comment>
  7614. <Link1>http://www.irssi.org/scripts/html/url_log.pl.html</Link1>
  7615. <Link2></Link2>
  7616. </user-agent>
  7617. <user-agent>
  7618. <ID>id_g_m_521</ID>
  7619. <String>Irvine/1.x.x</String>
  7620. <Description>Irvine downloading tool</Description>
  7621. <Type>D</Type>
  7622. <Comment></Comment>
  7623. <Link1>http://hp.vector.co.jp/authors/VA024591/</Link1>
  7624. <Link2></Link2>
  7625. </user-agent>
  7626. <user-agent>
  7627. <ID>id_g_m_140506_1</ID>
  7628. <String>ISC Systems iRc Search 2.1</String>
  7629. <Description>Unknown spambot / harvester from diff. IPs</Description>
  7630. <Type>S</Type>
  7631. <Comment></Comment>
  7632. <Link1>http://www.projecthoneypot.org/ip_inspector.php?iph=978231e229521680d11cb93f32de0fa1</Link1>
  7633. <Link2></Link2>
  7634. </user-agent>
  7635. <user-agent>
  7636. <ID>id_g_m_030106_1</ID>
  7637. <String>iSiloX/4.xx Windows/32</String>
  7638. <Description>iSiloX document converter for iSilo reader</Description>
  7639. <Type>B</Type>
  7640. <Comment></Comment>
  7641. <Link1>http://www.isilox.com/</Link1>
  7642. <Link2></Link2>
  7643. </user-agent>
  7644. <user-agent>
  7645. <ID>id_g_m_522</ID>
  7646. <String>isurf (tszhu@canada.com)</String>
  7647. <Description>Unknown University of Alberta link-checking ?</Description>
  7648. <Type>C</Type>
  7649. <Comment></Comment>
  7650. <Link1>http://www.ualberta.ca</Link1>
  7651. <Link2></Link2>
  7652. </user-agent>
  7653. <user-agent>
  7654. <ID>id_g_m_150408_5</ID>
  7655. <String>iTunes/x.x.x</String>
  7656. <Description>iTunes UA name used to access and decrypt the iTunes music store pages</Description>
  7657. <Type>B</Type>
  7658. <Comment></Comment>
  7659. <Link1>http://www.apple.com/itunes/</Link1>
  7660. <Link2></Link2>
  7661. </user-agent>
  7662. <user-agent>
  7663. <ID>id_g_m_523</ID>
  7664. <String>IUPUI Research Bot v 1.9a</String>
  7665. <Description>Some spam bot from 66.139.78.xx(x)</Description>
  7666. <Type>S</Type>
  7667. <Comment></Comment>
  7668. <Link1></Link1>
  7669. <Link2></Link2>
  7670. </user-agent>
  7671. <user-agent>
  7672. <ID>id_g_m_280906_1</ID>
  7673. <String>iVia Page Fetcher (http://ivia.ucr.edu/useragents.shtml)</String>
  7674. <Description>iVia robot - Open source Internet portal &amp; virtual library system software</Description>
  7675. <Type>D</Type>
  7676. <Comment></Comment>
  7677. <Link1>http://ivia.ucr.edu/</Link1>
  7678. <Link2></Link2>
  7679. </user-agent>
  7680. <user-agent>
  7681. <ID>id_g_m_524</ID>
  7682. <String>iVia/4.0 CanonizeUrl (http://infomine.ucr.edu/iVia/useragents.shtml</String>
  7683. <Description>iVia robot - Open source Internet portal &amp; virtual library system software</Description>
  7684. <Type>D</Type>
  7685. <Comment></Comment>
  7686. <Link1>http://ivia.ucr.edu/</Link1>
  7687. <Link2></Link2>
  7688. </user-agent>
  7689. <user-agent>
  7690. <ID>id_g_m_180707_1</ID>
  7691. <String>IWAgent/ 1.0 - www.brandprotect.com</String>
  7692. <Description>BD BrandProtect - brand&#44; company or trademarks online monitoring</Description>
  7693. <Type>R</Type>
  7694. <Comment>72.14.164.1xx</Comment>
  7695. <Link1>http://www.brandprotect.com/</Link1>
  7696. <Link2></Link2>
  7697. </user-agent>
  7698. <user-agent>
  7699. <ID>id_g_m_525</ID>
  7700. <String>J-PHONE/3.0/J-SH07</String>
  7701. <Description>Proxy message from jp-q.ne.jp</Description>
  7702. <Type>P</Type>
  7703. <Comment></Comment>
  7704. <Link1></Link1>
  7705. <Link2></Link2>
  7706. </user-agent>
  7707. <user-agent>
  7708. <ID>id_g_m_526</ID>
  7709. <String>Jabot/6.x (http://odin.ingrid.org/)</String>
  7710. <Description>ODIN Directory Japan robot (163.138.95.xx)</Description>
  7711. <Type>R</Type>
  7712. <Comment></Comment>
  7713. <Link1>http://www.ingrid.org</Link1>
  7714. <Link2></Link2>
  7715. </user-agent>
  7716. <user-agent>
  7717. <ID>id_g_m_527</ID>
  7718. <String>Jabot/7.x.x (http://odin.ingrid.org/)</String>
  7719. <Description>ODIN Directory Japan robot (163.138.95.xx)</Description>
  7720. <Type>R</Type>
  7721. <Comment></Comment>
  7722. <Link1>http://www.ingrid.org</Link1>
  7723. <Link2></Link2>
  7724. </user-agent>
  7725. <user-agent>
  7726. <ID>id_g_m_528</ID>
  7727. <String>Jack</String>
  7728. <Description>German Domanova (offline since Feb.02) robot</Description>
  7729. <Type>R</Type>
  7730. <Comment></Comment>
  7731. <Link1></Link1>
  7732. <Link2></Link2>
  7733. </user-agent>
  7734. <user-agent>
  7735. <ID>id_g_m_529</ID>
  7736. <String>Jakarta Commons-HttpClient/2.0xxx</String>
  7737. <Description>Jakarta Commons (Java based) HTTP client</Description>
  7738. <Type>B</Type>
  7739. <Comment></Comment>
  7740. <Link1>http://jakarta.apache.org/commons/httpclient/</Link1>
  7741. <Link2></Link2>
  7742. </user-agent>
  7743. <user-agent>
  7744. <ID>id_g_m_530</ID>
  7745. <String>Jakarta Commons-HttpClient/3.0-rcx</String>
  7746. <Description>Jakarta Commons (Java based) HTTP client</Description>
  7747. <Type>B</Type>
  7748. <Comment></Comment>
  7749. <Link1>http://jakarta.apache.org/commons/httpclient/</Link1>
  7750. <Link2></Link2>
  7751. </user-agent>
  7752. <user-agent>
  7753. <ID>id_g_m_240306_3</ID>
  7754. <String>Jambot/0.1.x (Jambot; http://www.jambot.com/blog; crawler@jambot.com)</String>
  7755. <Description>JamBot search robot (70.146.82.xx)</Description>
  7756. <Type>R</Type>
  7757. <Comment></Comment>
  7758. <Link1>http://www.jambot.com/</Link1>
  7759. <Link2></Link2>
  7760. </user-agent>
  7761. <user-agent>
  7762. <ID>id_g_m_130108_1</ID>
  7763. <String>Jambot/0.2.1 (Jambot; http://www.jambot.com/blog/static.php?page=webmaster-robot; crawler@jambot.com)</String>
  7764. <Description>JamBot search robot</Description>
  7765. <Type>R</Type>
  7766. <Comment>70.146.82.xx</Comment>
  7767. <Link1>http://www.jambot.com/</Link1>
  7768. <Link2></Link2>
  7769. </user-agent>
  7770. <user-agent>
  7771. <ID>id_g_m_531</ID>
  7772. <String>Java 1.1</String>
  7773. <Description>Java VM</Description>
  7774. <Type></Type>
  7775. <Comment></Comment>
  7776. <Link1>http://java.sun.com/</Link1>
  7777. <Link2></Link2>
  7778. </user-agent>
  7779. <user-agent>
  7780. <ID>id_g_m_532</ID>
  7781. <String>Java/1.4.1_01</String>
  7782. <Description>Java VM</Description>
  7783. <Type>R B D</Type>
  7784. <Comment> used as robot from 194.203.40.xx</Comment>
  7785. <Link1>http://java.sun.com/</Link1>
  7786. <Link2></Link2>
  7787. </user-agent>
  7788. <user-agent>
  7789. <ID>id_g_m_533</ID>
  7790. <String>Java1.0.21.0</String>
  7791. <Description>Java VM</Description>
  7792. <Type>B</Type>
  7793. <Comment></Comment>
  7794. <Link1>http://java.sun.com/</Link1>
  7795. <Link2></Link2>
  7796. </user-agent>
  7797. <user-agent>
  7798. <ID>id_g_m_534</ID>
  7799. <String>Java1.1.xx.x</String>
  7800. <Description>Java VM</Description>
  7801. <Type></Type>
  7802. <Comment></Comment>
  7803. <Link1>http://java.sun.com/</Link1>
  7804. <Link2></Link2>
  7805. </user-agent>
  7806. <user-agent>
  7807. <ID>id_g_m_535</ID>
  7808. <String>Java1.3.0rc1</String>
  7809. <Description>Java VM</Description>
  7810. <Type></Type>
  7811. <Comment></Comment>
  7812. <Link1>http://java.sun.com/</Link1>
  7813. <Link2></Link2>
  7814. </user-agent>
  7815. <user-agent>
  7816. <ID>id_g_m_536</ID>
  7817. <String>Java1.3.x</String>
  7818. <Description>Java VM</Description>
  7819. <Type></Type>
  7820. <Comment></Comment>
  7821. <Link1>http://java.sun.com/</Link1>
  7822. <Link2></Link2>
  7823. </user-agent>
  7824. <user-agent>
  7825. <ID>id_g_m_537</ID>
  7826. <String>Java1.4.0</String>
  7827. <Description>Java VM</Description>
  7828. <Type>R B D</Type>
  7829. <Comment>used by diff. IPs for various purposes i.e.: - Dortmund University Java based robot - Roadrunner.net (66.108.xxx.xxx) user robot in conjunction w. RPT-HTTPClient/0.3-3</Comment>
  7830. <Link1>http://java.sun.com/</Link1>
  7831. <Link2>http://www.informatik.uni-dortmund.DE</Link2>
  7832. </user-agent>
  7833. <user-agent>
  7834. <ID>id_g_m_538</ID>
  7835. <String>Jayde Crawler. http://www.jayde.com</String>
  7836. <Description>Jayde B2B Search robot (66.28.139.xx)</Description>
  7837. <Type>R</Type>
  7838. <Comment></Comment>
  7839. <Link1>http://www.jayde.com</Link1>
  7840. <Link2></Link2>
  7841. </user-agent>
  7842. <user-agent>
  7843. <ID>id_g_m_539</ID>
  7844. <String>JBH Agent 2.0</String>
  7845. <Description>some site downloading tool ? via 61.77.51.xxx</Description>
  7846. <Type>D</Type>
  7847. <Comment></Comment>
  7848. <Link1></Link1>
  7849. <Link2></Link2>
  7850. </user-agent>
  7851. <user-agent>
  7852. <ID>id_g_m_540</ID>
  7853. <String>jBrowser/J2ME Profile/MIDP-1.0 Configuration/CLDC-1.0 (Google WAP Proxy/1.0)</String>
  7854. <Description>WAP 2.0 / jBrowser for handhelds</Description>
  7855. <Type>B</Type>
  7856. <Comment></Comment>
  7857. <Link1>http://www.jataayusoft.com/DbWAPHH.htm</Link1>
  7858. <Link2></Link2>
  7859. </user-agent>
  7860. <user-agent>
  7861. <ID>id_g_m_541</ID>
  7862. <String>JCheckLinks/0.1 RPT-HTTPClient/0.3-1</String>
  7863. <Description>JCheckLinks Java hyperlink validator</Description>
  7864. <Type>C</Type>
  7865. <Comment></Comment>
  7866. <Link1>http://web.purplefrog.com/%7Ethoth/jchecklinks/</Link1>
  7867. <Link2></Link2>
  7868. </user-agent>
  7869. <user-agent>
  7870. <ID>id_g_m_542</ID>
  7871. <String>JDK/1.1</String>
  7872. <Description>Java Development Kit</Description>
  7873. <Type></Type>
  7874. <Comment></Comment>
  7875. <Link1>http://developers.sun.com/index.html</Link1>
  7876. <Link2></Link2>
  7877. </user-agent>
  7878. <user-agent>
  7879. <ID>id_g_m_543</ID>
  7880. <String>Jeode/1.x.x</String>
  7881. <Description>Insignia's Jeode (PDA) Java platform</Description>
  7882. <Type>B</Type>
  7883. <Comment></Comment>
  7884. <Link1>http://www.insignia.com/content/products/jvmProducts.shtml</Link1>
  7885. <Link2></Link2>
  7886. </user-agent>
  7887. <user-agent>
  7888. <ID>id_g_m_544</ID>
  7889. <String>Jetbot/1.0</String>
  7890. <Description>JetEye Search robot (64.62.142.xxx / 64.71.144.xxx)</Description>
  7891. <Type>R</Type>
  7892. <Comment></Comment>
  7893. <Link1>http://www.jeteye.com</Link1>
  7894. <Link2></Link2>
  7895. </user-agent>
  7896. <user-agent>
  7897. <ID>id_g_m_545</ID>
  7898. <String>JetBrains Omea Reader 1.0.x (http://www.jetbrains.com/omea_reader/)</String>
  7899. <Description>Omea RSS -  Atom - newsgroups web page reader </Description>
  7900. <Type>B</Type>
  7901. <Comment></Comment>
  7902. <Link1>http://www.jetbrains.com/omea_reader/</Link1>
  7903. <Link2></Link2>
  7904. </user-agent>
  7905. <user-agent>
  7906. <ID>id_g_m_546</ID>
  7907. <String>JetBrains Omea Reader 2.0 Release Candidate 1 (http://www.jetbrains.com/omea_reader/)</String>
  7908. <Description>Omea RSS -  Atom - newsgroups web page reader </Description>
  7909. <Type>B</Type>
  7910. <Comment></Comment>
  7911. <Link1>http://www.jetbrains.com/omea_reader/</Link1>
  7912. <Link2></Link2>
  7913. </user-agent>
  7914. <user-agent>
  7915. <ID>id_g_m_547</ID>
  7916. <String>JetCar</String>
  7917. <Description>JetCar / Flashget download manager</Description>
  7918. <Type>D</Type>
  7919. <Comment></Comment>
  7920. <Link1>http://www.amazesoft.com</Link1>
  7921. <Link2></Link2>
  7922. </user-agent>
  7923. <user-agent>
  7924. <ID>id_g_m_548</ID>
  7925. <String>Jigsaw/2.2.x W3C_CSS_Validator_JFouffa/2.0</String>
  7926. <Description>Jigsaw - W3C's CSS Validator Server</Description>
  7927. <Type>C</Type>
  7928. <Comment></Comment>
  7929. <Link1>http://jigsaw.w3.org/css-validator/validator-uri.html</Link1>
  7930. <Link2></Link2>
  7931. </user-agent>
  7932. <user-agent>
  7933. <ID>id_g_m_550</ID>
  7934. <String>JoBo/1.x (http://www.matuschek.net/jobo.html)</String>
  7935. <Description>Jobo website downloading program</Description>
  7936. <Type>D B</Type>
  7937. <Comment></Comment>
  7938. <Link1>http://www.matuschek.net/software/jobo/index.html</Link1>
  7939. <Link2></Link2>
  7940. </user-agent>
  7941. <user-agent>
  7942. <ID>id_g_m_549</ID>
  7943. <String>JoBo/@JOBO_VERSION@(http://www.matuschek.net/jobo.html)</String>
  7944. <Description>Jobo website downloading program</Description>
  7945. <Type>D B</Type>
  7946. <Comment></Comment>
  7947. <Link1>http://www.matuschek.net/software/jobo/index.html</Link1>
  7948. <Link2></Link2>
  7949. </user-agent>
  7950. <user-agent>
  7951. <ID>id_g_m_551</ID>
  7952. <String>JobSpider_BA/1.1</String>
  7953. <Description>Finacialbot.com - German (213.61.218.xx) job search JobRoboter</Description>
  7954. <Type>R</Type>
  7955. <Comment></Comment>
  7956. <Link1>http://www.finbot.com/jr1.html</Link1>
  7957. <Link2></Link2>
  7958. </user-agent>
  7959. <user-agent>
  7960. <ID>id_g_m_552</ID>
  7961. <String>JOC Web Spider</String>
  7962. <Description>Jocsoft Web Spider - website downloading tool</Description>
  7963. <Type>D B</Type>
  7964. <Comment></Comment>
  7965. <Link1>http://www.jocsoft.com/jws/index.htm</Link1>
  7966. <Link2></Link2>
  7967. </user-agent>
  7968. <user-agent>
  7969. <ID>id_g_m_051206_5</ID>
  7970. <String>JordoMedia/1.0 RSS File Reader (http://www.jordomedia.com)</String>
  7971. <Description>Jordo Media RSS / Atom feed directory link checking</Description>
  7972. <Type>C</Type>
  7973. <Comment>216.227.208.1xx</Comment>
  7974. <Link1>http://www.jordomedia.com/</Link1>
  7975. <Link2></Link2>
  7976. </user-agent>
  7977. <user-agent>
  7978. <ID>id_g_m_090206_2</ID>
  7979. <String>Journster [alpha] (http://journster.com/)</String>
  7980. <Description>Journster.com RSS/Atom aggregator</Description>
  7981. <Type>C</Type>
  7982. <Comment></Comment>
  7983. <Link1>http://beta.journster.com/</Link1>
  7984. <Link2></Link2>
  7985. </user-agent>
  7986. <user-agent>
  7987. <ID>id_g_m_090206_3</ID>
  7988. <String>Journster.com RSS/Atom aggregator 0.5 (http://www.journster.com/bot.phtml)</String>
  7989. <Description>Journster.com RSS/Atom aggregator</Description>
  7990. <Type>C</Type>
  7991. <Comment></Comment>
  7992. <Link1>http://beta.journster.com/</Link1>
  7993. <Link2></Link2>
  7994. </user-agent>
  7995. <user-agent>
  7996. <ID>id_g_m_553</ID>
  7997. <String>JRTS Check Favorites Utility</String>
  7998. <Description>Check Favorites bookmark checking</Description>
  7999. <Type>C</Type>
  8000. <Comment></Comment>
  8001. <Link1>http://www.jrtwine.com/Products/CheckFavs/</Link1>
  8002. <Link2></Link2>
  8003. </user-agent>
  8004. <user-agent>
  8005. <ID>id_g_m_554</ID>
  8006. <String>JRTwine Software Check Favorites Utility</String>
  8007. <Description>Check Favorites bookmark checking</Description>
  8008. <Type>C</Type>
  8009. <Comment></Comment>
  8010. <Link1>http://www.jrtwine.com/Products/CheckFavs/</Link1>
  8011. <Link2></Link2>
  8012. </user-agent>
  8013. <user-agent>
  8014. <ID>id_g_m_555</ID>
  8015. <String>Jyxobot/x</String>
  8016. <Description>Jyxo search (Czech Republic) robot (212.71.128.xx)</Description>
  8017. <Type>R</Type>
  8018. <Comment></Comment>
  8019. <Link1>http://jyxo.cz/</Link1>
  8020. <Link2></Link2>
  8021. </user-agent>
  8022. <user-agent>
  8023. <ID>id_g_m_556</ID>
  8024. <String>K-Meleon/0.6 (Windows; U; Windows NT 5.1; en-US; rv:0.9.5) Gecko/20011011</String>
  8025. <Description>K-Meleon browser - Windows XP</Description>
  8026. <Type>B</Type>
  8027. <Comment></Comment>
  8028. <Link1>http://kmeleon.sourceforge.net/</Link1>
  8029. <Link2></Link2>
  8030. </user-agent>
  8031. <user-agent>
  8032. <ID>id_g_m_557</ID>
  8033. <String>k2spider</String>
  8034. <Description>Verity K2 Spider ( Network search software)</Description>
  8035. <Type>R</Type>
  8036. <Comment></Comment>
  8037. <Link1>http://www.verity.com/products/pdf/MK0368a_K2_Spider.pdf</Link1>
  8038. <Link2></Link2>
  8039. </user-agent>
  8040. <user-agent>
  8041. <ID>id_g_m_010108_3</ID>
  8042. <String>KAIST AITrc Crawler</String>
  8043. <Description>Unknown robot from AITrc (Advanced Information Technology Research Center) - Korea</Description>
  8044. <Type>R</Type>
  8045. <Comment>143.248.134.22x</Comment>
  8046. <Link1>http://aitrc.kaist.ac.kr/english/</Link1>
  8047. <Link2></Link2>
  8048. </user-agent>
  8049. <user-agent>
  8050. <ID>id_g_m_010506_1</ID>
  8051. <String>KakleBot - www.kakle.com/0.1 (KakleBot - www.kakle.com; http:// www.kakle.com/bot.html; support@kakle.com)</String>
  8052. <Description>Kakle ranked metasearch robot</Description>
  8053. <Type>R</Type>
  8054. <Comment>216.139.221.1xx</Comment>
  8055. <Link1>http://www.kakle.com/</Link1>
  8056. <Link2></Link2>
  8057. </user-agent>
  8058. <user-agent>
  8059. <ID>id_g_m_250408_3</ID>
  8060. <String>kalooga/kalooga-4.0-dev-datahouse (Kalooga; http://www.kalooga.com; info@kalooga.com)</String>
  8061. <Description>Kalooga image crawler</Description>
  8062. <Type>R</Type>
  8063. <Comment>195.210.57.1xx</Comment>
  8064. <Link1>http://www.kalooga.com/</Link1>
  8065. <Link2></Link2>
  8066. </user-agent>
  8067. <user-agent>
  8068. <ID>id_g_m_011108_3</ID>
  8069. <String>kalooga/KaloogaBot (Kalooga; http://www.kalooga.com/info.html?page=crawler; crawler@kalooga.com)</String>
  8070. <Description>Kalooga image crawler</Description>
  8071. <Type>R</Type>
  8072. <Comment>195.210.57.1xx</Comment>
  8073. <Link1>http://www.kalooga.com/</Link1>
  8074. <Link2></Link2>
  8075. </user-agent>
  8076. <user-agent>
  8077. <ID>id_g_m_558</ID>
  8078. <String>Kapere (http://www.kapere.com)</String>
  8079. <Description>Kapere site grabber / web downloader</Description>
  8080. <Type>D</Type>
  8081. <Comment></Comment>
  8082. <Link1>http://www.kapere.com</Link1>
  8083. <Link2></Link2>
  8084. </user-agent>
  8085. <user-agent>
  8086. <ID>id_g_m_090807_1</ID>
  8087. <String>Kazehakase/0.x.x.[x]</String>
  8088. <Description>Kazehakase - Gecko based browser (Japan)</Description>
  8089. <Type>B</Type>
  8090. <Comment></Comment>
  8091. <Link1>http://kazehakase.sourceforge.jp/</Link1>
  8092. <Link2></Link2>
  8093. </user-agent>
  8094. <user-agent>
  8095. <ID>id_g_m_559</ID>
  8096. <String>KDDI-SN22 UP.Browser/6.0.7 (GUI) MMP/1.1 (Google WAP Proxy/1.0)</String>
  8097. <Description>Openwave UP.Browser for mobiles via Google WAP Proxy (216.239.33.x)</Description>
  8098. <Type>P</Type>
  8099. <Comment></Comment>
  8100. <Link1>http://www.openwave.com</Link1>
  8101. <Link2></Link2>
  8102. </user-agent>
  8103. <user-agent>
  8104. <ID>id_g_m_561</ID>
  8105. <String>Kenjin Spider</String>
  8106. <Description>Kenjin Spider search agent</Description>
  8107. <Type>R</Type>
  8108. <Comment></Comment>
  8109. <Link1>http://www.kenjin.ne.jp</Link1>
  8110. <Link2></Link2>
  8111. </user-agent>
  8112. <user-agent>
  8113. <ID>id_g_m_562</ID>
  8114. <String>Kevin http://dznet.com/kevin/</String>
  8115. <Description>Dznet.com Kevin crawler (link checking ?) via 68.39.148.xx (nj.comcast.net)</Description>
  8116. <Type>R</Type>
  8117. <Comment></Comment>
  8118. <Link1>http://www.dznet.com</Link1>
  8119. <Link2></Link2>
  8120. </user-agent>
  8121. <user-agent>
  8122. <ID>id_g_m_563</ID>
  8123. <String>Kevin http://websitealert.net/kevin/</String>
  8124. <Description>Website Alert's Kevin crawler (website monitoring) via 68.39.148.xx (nj.comcast.net)</Description>
  8125. <Type>R</Type>
  8126. <Comment></Comment>
  8127. <Link1>http://www.websitealert.net</Link1>
  8128. <Link2></Link2>
  8129. </user-agent>
  8130. <user-agent>
  8131. <ID>id_g_m_560</ID>
  8132. <String>KE_1.0/2.0 libwww/5.2.8</String>
  8133. <Description>Voila.fr robot</Description>
  8134. <Type>R</Type>
  8135. <Comment></Comment>
  8136. <Link1>http://www.voila.fr</Link1>
  8137. <Link2></Link2>
  8138. </user-agent>
  8139. <user-agent>
  8140. <ID>id_g_m_301105_5</ID>
  8141. <String>KFSW-Bot (Version: 1.01 powered by KFSW www.kfsw.de)</String>
  8142. <Description>Some Perl search script from KFSW (Germany)</Description>
  8143. <Type>R</Type>
  8144. <Comment></Comment>
  8145. <Link1>http://www.kfsw.de/</Link1>
  8146. <Link2></Link2>
  8147. </user-agent>
  8148. <user-agent>
  8149. <ID>id_g_m_100206_4</ID>
  8150. <String>kinja-imagebot (http://www.kinja.com/)</String>
  8151. <Description>kinja weblog search robot</Description>
  8152. <Type>R</Type>
  8153. <Comment></Comment>
  8154. <Link1>http://www.kinja.com/</Link1>
  8155. <Link2></Link2>
  8156. </user-agent>
  8157. <user-agent>
  8158. <ID>id_g_m_100206_3</ID>
  8159. <String>kinjabot (http://www.kinja.com)</String>
  8160. <Description>kinja weblog search robot</Description>
  8161. <Type>R</Type>
  8162. <Comment></Comment>
  8163. <Link1>http://www.kinja.com/</Link1>
  8164. <Link2></Link2>
  8165. </user-agent>
  8166. <user-agent>
  8167. <ID>id_g_m_564</ID>
  8168. <String>KIT-Fireball/2.0</String>
  8169. <Description>Fireball search (Germany) robot</Description>
  8170. <Type>R</Type>
  8171. <Comment></Comment>
  8172. <Link1>http://www.fireball.de</Link1>
  8173. <Link2></Link2>
  8174. </user-agent>
  8175. <user-agent>
  8176. <ID>id_g_m_565</ID>
  8177. <String>KIT-Fireball/2.0 (compatible; Mozilla 4.0; MSIE 5.5)</String>
  8178. <Description>Fireball search (Germany) robot</Description>
  8179. <Type>R</Type>
  8180. <Comment></Comment>
  8181. <Link1>http://www.fireball.de</Link1>
  8182. <Link2></Link2>
  8183. </user-agent>
  8184. <user-agent>
  8185. <ID>id_g_m_566</ID>
  8186. <String>Klondike/1.50 (WSP Win32) (Google WAP Proxy/1.0)</String>
  8187. <Description>Klondike WAP Browser</Description>
  8188. <Type>B</Type>
  8189. <Comment></Comment>
  8190. <Link1>http://www.apachesoftware.com</Link1>
  8191. <Link2></Link2>
  8192. </user-agent>
  8193. <user-agent>
  8194. <ID>id_g_m_567</ID>
  8195. <String>KnowItAll(knowitall@cs.washington.edu)</String>
  8196. <Description>University of Washington KnowItAll - web information extraction</Description>
  8197. <Type>R</Type>
  8198. <Comment></Comment>
  8199. <Link1>http://www.cs.washington.edu</Link1>
  8200. <Link2></Link2>
  8201. </user-agent>
  8202. <user-agent>
  8203. <ID>id_g_m_568</ID>
  8204. <String>Knowledge.com/0.x</String>
  8205. <Description>The knowledge.com (ODP) directory robot</Description>
  8206. <Type>R</Type>
  8207. <Comment></Comment>
  8208. <Link1>http://www.knowledge.com</Link1>
  8209. <Link2></Link2>
  8210. </user-agent>
  8211. <user-agent>
  8212. <ID>id_g_m_569</ID>
  8213. <String>Kontiki Client x.xx</String>
  8214. <Description>Kontiki Client download manager</Description>
  8215. <Type>D</Type>
  8216. <Comment></Comment>
  8217. <Link1>http://www.kontiki.com/client/userhelp_f.shtml</Link1>
  8218. <Link2></Link2>
  8219. </user-agent>
  8220. <user-agent>
  8221. <ID>id_g_m_280406_2</ID>
  8222. <String>Krugle/Krugle&#44;Nutch/0.8+ (Krugle web crawler; http://www.krugle.com/crawler/info.html; webcrawler@krugle.com)</String>
  8223. <Description>Krugle source code search engine for developers (64.71.164.1xx) </Description>
  8224. <Type>R</Type>
  8225. <Comment>powered by Nutch</Comment>
  8226. <Link1>http://www.krugle.com/</Link1>
  8227. <Link2></Link2>
  8228. </user-agent>
  8229. <user-agent>
  8230. <ID>id_g_m_180606_2</ID>
  8231. <String>KSbot/1.0 (KnowledgeStorm crawler; http://www.knowledgestorm.com/resources/content/crawler/index.html; crawleradmin@knowledgestorm.com)</String>
  8232. <Description>KnowledgeStorm technology industry crawler for Findtech.com</Description>
  8233. <Type>R</Type>
  8234. <Comment>12.129.110.xx</Comment>
  8235. <Link1>http://www.findtech.com/</Link1>
  8236. <Link2>http://www.knowledgestorm.com/resources/content/crawler/index.html</Link2>
  8237. </user-agent>
  8238. <user-agent>
  8239. <ID>id_g_m_570</ID>
  8240. <String>kuloko-bot/0.x</String>
  8241. <Description>Kuloko contextual search robot</Description>
  8242. <Type>R</Type>
  8243. <Comment></Comment>
  8244. <Link1>http://www.kuloko.com/</Link1>
  8245. <Link2></Link2>
  8246. </user-agent>
  8247. <user-agent>
  8248. <ID>id_g_m_571</ID>
  8249. <String>kulokobot www.kuloko.com kuloko@backweave.com</String>
  8250. <Description>Kuloko contextual search robot</Description>
  8251. <Type>R</Type>
  8252. <Comment></Comment>
  8253. <Link1>http://www.kuloko.com</Link1>
  8254. <Link2></Link2>
  8255. </user-agent>
  8256. <user-agent>
  8257. <ID>id_g_m_572</ID>
  8258. <String>kulturarw3/0.1</String>
  8259. <Description>National Library of Sweden Heritage Project robot</Description>
  8260. <Type>R</Type>
  8261. <Comment></Comment>
  8262. <Link1>http://www.kb.se/ENG/kbstart.htm</Link1>
  8263. <Link2></Link2>
  8264. </user-agent>
  8265. <user-agent>
  8266. <ID>id_g_m_301105_2</ID>
  8267. <String>KummHttp/1.1 (compatible; KummClient; Linux rulez)</String>
  8268. <Description>Link or server checking from Sanoma Budapest (195.70.35.xxx)</Description>
  8269. <Type>C R</Type>
  8270. <Comment>Sanoma also runs some web-portals i.e. http://www.startlap.com/</Comment>
  8271. <Link1>http://sanomabp.hu/</Link1>
  8272. <Link2></Link2>
  8273. </user-agent>
  8274. <user-agent>
  8275. <ID>id_g_m_280209_3</ID>
  8276. <String>KWC-KX9/1109 UP.Browser/6.2.3.9.g.1.107 (GUI) MMP/2.0 UP.Link/6.3.0.0.0</String>
  8277. <Description>UP.Browser for mobiles on Kyocera KWC-KX9 cellphone</Description>
  8278. <Type>B</Type>
  8279. <Comment></Comment>
  8280. <Link1>http://www.openwave.com</Link1>
  8281. <Link2></Link2>
  8282. </user-agent>
  8283. <user-agent>
  8284. <ID>id_g_m_211208_3</ID>
  8285. <String>Labrador/0.2; http://ir.dcs.gla.ac.uk/labrador; craigm@dcs.gla.ac.uk</String>
  8286. <Description>TREC Blog Track - Blog and news feed crawler</Description>
  8287. <Type>R</Type>
  8288. <Comment>130.209.241.2xx</Comment>
  8289. <Link1>http://ir.dcs.gla.ac.uk/wiki/TREC-Blog</Link1>
  8290. <Link2></Link2>
  8291. </user-agent>
  8292. <user-agent>
  8293. <ID>id_g_m_573</ID>
  8294. <String>Lachesis</String>
  8295. <Description>Intel's Lachesis web site response time monitoring tool</Description>
  8296. <Type>C</Type>
  8297. <Comment></Comment>
  8298. <Link1>ftp://ftp.imag.fr/pub/labo-LSR/DRAKKAR/internet-performance/lachesis/</Link1>
  8299. <Link2></Link2>
  8300. </user-agent>
  8301. <user-agent>
  8302. <ID>id_g_m_140406_1</ID>
  8303. <String>lanshanbot/1.0</String>
  8304. <Description>Unknown robot from Eastern Network China (202.96.51.1xx)</Description>
  8305. <Type></Type>
  8306. <Comment>reads robots.txt</Comment>
  8307. <Link1></Link1>
  8308. <Link2></Link2>
  8309. </user-agent>
  8310. <user-agent>
  8311. <ID>id_g_m_021206_2</ID>
  8312. <String>lanshanbot/1.0 (+http://search.msn.com/msnbot.htm)</String>
  8313. <Description>Unknown robot from Eastern Network China (202.96.51.1xx)</Description>
  8314. <Type></Type>
  8315. <Comment>reads robots.txt</Comment>
  8316. <Link1></Link1>
  8317. <Link2></Link2>
  8318. </user-agent>
  8319. <user-agent>
  8320. <ID>id_g_m_271105_1</ID>
  8321. <String>LapozzBot/1.4 ( http://robot.lapozz.com)</String>
  8322. <Description>Lapozz search (Hungary) robot (82.131.195.xx)</Description>
  8323. <Type>R</Type>
  8324. <Comment></Comment>
  8325. <Link1>http://www.lapozz.com/</Link1>
  8326. <Link2></Link2>
  8327. </user-agent>
  8328. <user-agent>
  8329. <ID>id_g_m_280508_3</ID>
  8330. <String>LapozzBot/1.5 (+http://robot.lapozz.hu)</String>
  8331. <Description>Lapozz search (Hungary) robot (82.131.195.xx)</Description>
  8332. <Type>R</Type>
  8333. <Comment></Comment>
  8334. <Link1>http://www.lapozz.com/</Link1>
  8335. <Link2></Link2>
  8336. </user-agent>
  8337. <user-agent>
  8338. <ID>id_g_m_574</ID>
  8339. <String>larbin (samualt9@bigfoot.com)</String>
  8340. <Description>Larbin indexer used as Metacarta.com (66.28.xx.xxx) robot</Description>
  8341. <Type>R</Type>
  8342. <Comment></Comment>
  8343. <Link1>http://www.metacarta.com/</Link1>
  8344. <Link2>http://larbin.sourceforge.net/index-eng.html</Link2>
  8345. </user-agent>
  8346. <user-agent>
  8347. <ID>id_g_m_592</ID>
  8348. <String>LARBIN-EXPERIMENTAL (efp@gmx.net)</String>
  8349. <Description>Unknown robot from 66.230.140.xx (argon.oxeo.com)</Description>
  8350. <Type>S</Type>
  8351. <Comment>maybe an e-mail collector - see also Mozilla/4.0 efp@gmx.net</Comment>
  8352. <Link1></Link1>
  8353. <Link2></Link2>
  8354. </user-agent>
  8355. <user-agent>
  8356. <ID>id_g_m_575</ID>
  8357. <String>larbin_2.1.1 larbin2.1.1@somewhere.com</String>
  8358. <Description>Larbin indexer used by Mitsubishi Electric Research Labs</Description>
  8359. <Type>R</Type>
  8360. <Comment></Comment>
  8361. <Link1>http://www.merl.com</Link1>
  8362. <Link2>http://larbin.sourceforge.net/index-eng.html</Link2>
  8363. </user-agent>
  8364. <user-agent>
  8365. <ID>id_g_m_576</ID>
  8366. <String>larbin_2.2.0 (crawl@compete.com)</String>
  8367. <Description>Larbin indexer used as Compete.com crawler</Description>
  8368. <Type>R</Type>
  8369. <Comment></Comment>
  8370. <Link1>http://www.compete.com</Link1>
  8371. <Link2>http://larbin.sourceforge.net/index-eng.html</Link2>
  8372. </user-agent>
  8373. <user-agent>
  8374. <ID>id_g_m_577</ID>
  8375. <String>larbin_2.2.1_de_Viennot (Laurent.Viennot@inria.fr)</String>
  8376. <Description>Larbin indexer used as Inria robot</Description>
  8377. <Type>R</Type>
  8378. <Comment></Comment>
  8379. <Link1>http://www.inria.fr/index.en.html</Link1>
  8380. <Link2>http://larbin.sourceforge.net/index-eng.html</Link2>
  8381. </user-agent>
  8382. <user-agent>
  8383. <ID>id_g_m_578</ID>
  8384. <String>larbin_2.2.2 (sugayama@lab7.kuis.kyoto-u.ac.jp)</String>
  8385. <Description>Larbin indexer used as Kyoto University robot</Description>
  8386. <Type>R</Type>
  8387. <Comment></Comment>
  8388. <Link1>http://www.kyoto-u.ac.jp/</Link1>
  8389. <Link2>http://larbin.sourceforge.net/index-eng.html</Link2>
  8390. </user-agent>
  8391. <user-agent>
  8392. <ID>id_g_m_579</ID>
  8393. <String>larbin_2.2.2_guillaume (guillaume@liafa.jussieu.fr)</String>
  8394. <Description>Larbin indexer used as Inria robot</Description>
  8395. <Type>R</Type>
  8396. <Comment></Comment>
  8397. <Link1>http://www.inria.fr/index.en.html</Link1>
  8398. <Link2>http://larbin.sourceforge.net/index-eng.html</Link2>
  8399. </user-agent>
  8400. <user-agent>
  8401. <ID>id_g_m_581</ID>
  8402. <String>larbin_2.6.0 (larbin2.6.0@unspecified.mail)</String>
  8403. <Description>Larbin indexer used by an unknown dsl.net client</Description>
  8404. <Type>R</Type>
  8405. <Comment></Comment>
  8406. <Link1>http://larbin.sourceforge.net/index-eng.html</Link1>
  8407. <Link2></Link2>
  8408. </user-agent>
  8409. <user-agent>
  8410. <ID>id_g_m_582</ID>
  8411. <String>larbin_2.6.1 (larbin2.6.1@unspecified.mail)</String>
  8412. <Description>Larbin indexer used by diff. IPs / services</Description>
  8413. <Type>R</Type>
  8414. <Comment> ie.: -Central Host Inc. (client) robot ? - Colt Net France robot</Comment>
  8415. <Link1>http://www.centralhost.com</Link1>
  8416. <Link2>http://larbin.sourceforge.net/index-eng.html</Link2>
  8417. </user-agent>
  8418. <user-agent>
  8419. <ID>id_g_m_583</ID>
  8420. <String>larbin_2.6.2 (hamasaki@grad.nii.ac.jp)</String>
  8421. <Description>Larbin indexer used by National Institute of Informatics (NII/Japan)</Description>
  8422. <Type>R</Type>
  8423. <Comment></Comment>
  8424. <Link1>http://www.nii.ac.jp</Link1>
  8425. <Link2>http://larbin.sourceforge.net/index-eng.html</Link2>
  8426. </user-agent>
  8427. <user-agent>
  8428. <ID>id_g_m_584</ID>
  8429. <String>larbin_2.6.2 (larbin2.6.2@unspecified.mail)</String>
  8430. <Description>Larbin indexer used by diff. IPs</Description>
  8431. <Type>R</Type>
  8432. <Comment></Comment>
  8433. <Link1>http://larbin.sourceforge.net/index-eng.html</Link1>
  8434. <Link2></Link2>
  8435. </user-agent>
  8436. <user-agent>
  8437. <ID>id_g_m_585</ID>
  8438. <String>larbin_2.6.2 (listonATccDOTgatechDOTedu)</String>
  8439. <Description>Larbin indexer used as robot by Georgia Institute of Technology http://www.gatech.edu/</Description>
  8440. <Type>R</Type>
  8441. <Comment></Comment>
  8442. <Link1>http://www.gatech.edu</Link1>
  8443. <Link2>http://larbin.sourceforge.net/index-eng.html</Link2>
  8444. </user-agent>
  8445. <user-agent>
  8446. <ID>id_g_m_586</ID>
  8447. <String>larbin_2.6.2 (pimenas@systems.tuc.gr)</String>
  8448. <Description>Larbin indexer used by Technical University of Crete</Description>
  8449. <Type>R</Type>
  8450. <Comment></Comment>
  8451. <Link1>http://www.systems.tuc.gr</Link1>
  8452. <Link2>http://larbin.sourceforge.net/index-eng.html</Link2>
  8453. </user-agent>
  8454. <user-agent>
  8455. <ID>id_g_m_587</ID>
  8456. <String>larbin_2.6.2 (tom@lemurconsulting.com)</String>
  8457. <Description>Larbin indexer used as Lemur Consulting robot</Description>
  8458. <Type>R</Type>
  8459. <Comment></Comment>
  8460. <Link1>http://www.lemurconsulting.com</Link1>
  8461. <Link2>http://larbin.sourceforge.net/index-eng.html</Link2>
  8462. </user-agent>
  8463. <user-agent>
  8464. <ID>id_g_m_588</ID>
  8465. <String>larbin_2.6.2 (vitalbox1@hotmail.com)</String>
  8466. <Description>Larbin indexer used as robot via cloud9.net (168.100.192.xxx)</Description>
  8467. <Type>R</Type>
  8468. <Comment></Comment>
  8469. <Link1>http://larbin.sourceforge.net/index-eng.html</Link1>
  8470. <Link2></Link2>
  8471. </user-agent>
  8472. <user-agent>
  8473. <ID>id_g_m_261205_1</ID>
  8474. <String>larbin_2.6.3 (ltaa_web_crawler@groupes.epfl.ch)</String>
  8475. <Description>Unknown robot from EPFL Lausanne Switzerland (128.178.155.1xx)</Description>
  8476. <Type>R</Type>
  8477. <Comment>reads robots.txt</Comment>
  8478. <Link1>http://www.epfl.ch/Eindex.html</Link1>
  8479. <Link2></Link2>
  8480. </user-agent>
  8481. <user-agent>
  8482. <ID>id_g_m_589</ID>
  8483. <String>larbin_2.6.3 (wgao@genieknows.com)</String>
  8484. <Description>Larbin indexer used by GenieKnows.com search</Description>
  8485. <Type>R</Type>
  8486. <Comment> s. also: - geniebot wgao@genieknows.com</Comment>
  8487. <Link1>http://www.genieknows.com</Link1>
  8488. <Link2>http://larbin.sourceforge.net/index-eng.html</Link2>
  8489. </user-agent>
  8490. <user-agent>
  8491. <ID>id_g_m_590</ID>
  8492. <String>larbin_2.6.3_for_(http://cosco.hiit.fi/search/) tsilande@hiit.fi</String>
  8493. <Description>Larbin indexer used by Next Generation Information Retrieval (NGIR)</Description>
  8494. <Type>R</Type>
  8495. <Comment></Comment>
  8496. <Link1>http://cosco.hiit.fi</Link1>
  8497. <Link2>http://larbin.sourceforge.net/index-eng.html</Link2>
  8498. </user-agent>
  8499. <user-agent>
  8500. <ID>id_g_m_580</ID>
  8501. <String>larbin_2.6_basileocaml (basile.starynkevitch@cea.fr)</String>
  8502. <Description>Larbin indexer used by CEA / DCom Rechercher</Description>
  8503. <Type>R</Type>
  8504. <Comment></Comment>
  8505. <Link1>http://www.cea.fr</Link1>
  8506. <Link2>http://larbin.sourceforge.net/index-eng.html</Link2>
  8507. </user-agent>
  8508. <user-agent>
  8509. <ID>id_g_m_591</ID>
  8510. <String>larbin_devel (http://pauillac.inria.fr/~ailleret/prog/larbin/)</String>
  8511. <Description>Larbin indexer used as Inria robot</Description>
  8512. <Type>R</Type>
  8513. <Comment></Comment>
  8514. <Link1>http://pauillac.inria.fr</Link1>
  8515. <Link2>http://larbin.sourceforge.net/index-eng.html</Link2>
  8516. </user-agent>
  8517. <user-agent>
  8518. <ID>id_g_m_160807_2</ID>
  8519. <String>lawinfo-crawler/Nutch-0.9-dev (Crawler for lawinfo.com pages; http://www.lawinfo.com; webmaster@lawinfo.com)</String>
  8520. <Description>LawInfo - Lawyer and attorney directory</Description>
  8521. <Type>R</Type>
  8522. <Comment>216.86.137.xx</Comment>
  8523. <Link1>http://www.lawinfo.com/</Link1>
  8524. <Link2></Link2>
  8525. </user-agent>
  8526. <user-agent>
  8527. <ID>id_g_m_020506_3</ID>
  8528. <String>lc/$ROADS::Version libwww-perl/5.00</String>
  8529. <Description>ROADS - Perl web based subject based gateway tool</Description>
  8530. <Type></Type>
  8531. <Comment></Comment>
  8532. <Link1>http://roads.opensource.ac.uk/</Link1>
  8533. <Link2></Link2>
  8534. </user-agent>
  8535. <user-agent>
  8536. <ID>id_g_m_593</ID>
  8537. <String>lcabotAccept: */*</String>
  8538. <Description>unknown robot via MTT.ca / Aliant.ca</Description>
  8539. <Type></Type>
  8540. <Comment>142.177.168.xxx</Comment>
  8541. <Link1></Link1>
  8542. <Link2></Link2>
  8543. </user-agent>
  8544. <user-agent>
  8545. <ID>id_g_m_140408_1</ID>
  8546. <String>LeapTag/0.8.1.beta081.r3750 (compatible; Mozilla 4.0; MSIE 5.5; robot@yoriwa.com)</String>
  8547. <Description>LeapTag news reader and content discovery tool</Description>
  8548. <Type>B</Type>
  8549. <Comment></Comment>
  8550. <Link1>http://www.leaptag.com/</Link1>
  8551. <Link2></Link2>
  8552. </user-agent>
  8553. <user-agent>
  8554. <ID>id_g_m_594</ID>
  8555. <String>LECodeChecker/3.0 libgetdoc/1.0</String>
  8556. <Description>Linkexchange crawler</Description>
  8557. <Type>R</Type>
  8558. <Comment></Comment>
  8559. <Link1>http://www.linkexchange.com</Link1>
  8560. <Link2></Link2>
  8561. </user-agent>
  8562. <user-agent>
  8563. <ID>id_g_m_595</ID>
  8564. <String>LeechGet 200x (www.leechget.de)</String>
  8565. <Description>Leechget download manager</Description>
  8566. <Type>D</Type>
  8567. <Comment></Comment>
  8568. <Link1>http://www.leechget.de</Link1>
  8569. <Link2></Link2>
  8570. </user-agent>
  8571. <user-agent>
  8572. <ID>id_g_m_596</ID>
  8573. <String>LEIA/2.90</String>
  8574. <Description>Gseek.com (site is offline) robot</Description>
  8575. <Type>R</Type>
  8576. <Comment></Comment>
  8577. <Link1></Link1>
  8578. <Link2></Link2>
  8579. </user-agent>
  8580. <user-agent>
  8581. <ID>id_g_m_597</ID>
  8582. <String>LEIA/3.01pr (LEIAcrawler; [SNIP])</String>
  8583. <Description>Gseek.com (site is offline) robot</Description>
  8584. <Type>R</Type>
  8585. <Comment></Comment>
  8586. <Link1></Link1>
  8587. <Link2></Link2>
  8588. </user-agent>
  8589. <user-agent>
  8590. <ID>id_g_m_210106_2</ID>
  8591. <String>LetsCrawl.com/1.0 +http://letscrawl.com/</String>
  8592. <Description>Maybe logfile spamming for Lets crawl! search (Germany)</Description>
  8593. <Type>S</Type>
  8594. <Comment>website has no function</Comment>
  8595. <Link1>http://letscrawl.com/</Link1>
  8596. <Link2></Link2>
  8597. </user-agent>
  8598. <user-agent>
  8599. <ID>id_g_m_598</ID>
  8600. <String>LexiBot/1.00</String>
  8601. <Description>Lexibot (exMataHari) search software</Description>
  8602. <Type>R</Type>
  8603. <Comment></Comment>
  8604. <Link1>http://www.lexibot.com/index.asp</Link1>
  8605. <Link2></Link2>
  8606. </user-agent>
  8607. <user-agent>
  8608. <ID>id_g_m_140209_2</ID>
  8609. <String>LG-LX260 POLARIS-LX260/2.0 MMP/2.0 Profile/MIDP-2.0 Configuration/CLDC-1.1</String>
  8610. <Description>Polaris mobile browser on LG LX 260 Sprint Rumor phone</Description>
  8611. <Type>B</Type>
  8612. <Comment></Comment>
  8613. <Link1>http://www.infraware.co.kr/eng/01_product/product10.asp</Link1>
  8614. <Link2></Link2>
  8615. </user-agent>
  8616. <user-agent>
  8617. <ID>id_g_m_599</ID>
  8618. <String>LG/U8138/v1.0</String>
  8619. <Description>LG 8138 Mobile Phone browser</Description>
  8620. <Type>B</Type>
  8621. <Comment></Comment>
  8622. <Link1></Link1>
  8623. <Link2></Link2>
  8624. </user-agent>
  8625. <user-agent>
  8626. <ID>id_g_m_600</ID>
  8627. <String>Libby_1.1/libwww-perl/5.47</String>
  8628. <Description>About.com robot</Description>
  8629. <Type>R</Type>
  8630. <Comment></Comment>
  8631. <Link1>http://www.about.com/</Link1>
  8632. <Link2></Link2>
  8633. </user-agent>
  8634. <user-agent>
  8635. <ID>id_g_m_100306_1</ID>
  8636. <String>libcurl-agent/1.0</String>
  8637. <Description>libcurl's (multiprotocol file transfer library) standard user-agent name</Description>
  8638. <Type>D</Type>
  8639. <Comment></Comment>
  8640. <Link1>http://curl.haxx.se/libcurl/</Link1>
  8641. <Link2></Link2>
  8642. </user-agent>
  8643. <user-agent>
  8644. <ID>id_g_m_080507_1</ID>
  8645. <String>LibertyW (+http://www.lw01.com)</String>
  8646. <Description>LibertyW search for mobile (France)</Description>
  8647. <Type>R</Type>
  8648. <Comment>213.251.135.2xx</Comment>
  8649. <Link1>http://www.lw01.com/en/</Link1>
  8650. <Link2></Link2>
  8651. </user-agent>
  8652. <user-agent>
  8653. <ID>id_g_m_601</ID>
  8654. <String>libWeb/clsHTTP -- hiongun@kt.co.kr</String>
  8655. <Description>Korea Telecom Search robot</Description>
  8656. <Type>R</Type>
  8657. <Comment></Comment>
  8658. <Link1>http://www.kt.co.kr/kt_home/eng/index.jsp</Link1>
  8659. <Link2></Link2>
  8660. </user-agent>
  8661. <user-agent>
  8662. <ID>id_g_m_602</ID>
  8663. <String>libwww-perl/5.41</String>
  8664. <Description>CMP United Media robot</Description>
  8665. <Type>R</Type>
  8666. <Comment></Comment>
  8667. <Link1>http://www.cmpnet.com</Link1>
  8668. <Link2></Link2>
  8669. </user-agent>
  8670. <user-agent>
  8671. <ID>id_g_m_603</ID>
  8672. <String>libwww-perl/5.45</String>
  8673. <Description>SplatSearch robot (207.44.142.xx)</Description>
  8674. <Type>R</Type>
  8675. <Comment></Comment>
  8676. <Link1>http://www.splatsearch.com</Link1>
  8677. <Link2></Link2>
  8678. </user-agent>
  8679. <user-agent>
  8680. <ID>id_g_m_604</ID>
  8681. <String>libwww-perl/5.48</String>
  8682. <Description>Alexa robot</Description>
  8683. <Type>R</Type>
  8684. <Comment></Comment>
  8685. <Link1>http://www.alexa.com</Link1>
  8686. <Link2></Link2>
  8687. </user-agent>
  8688. <user-agent>
  8689. <ID>id_g_m_605</ID>
  8690. <String>libwww-perl/5.50</String>
  8691. <Description>diff. IPs / services</Description>
  8692. <Type>R C P</Type>
  8693. <Comment> ie.: - secure-netz.de link checking (in conjunction w. LWP::Simple/5.50) -N2H2 Internet filtering</Comment>
  8694. <Link1>http://www.n2h2.com</Link1>
  8695. <Link2></Link2>
  8696. </user-agent>
  8697. <user-agent>
  8698. <ID>id_g_m_606</ID>
  8699. <String>libwww-perl/5.52 FP/2.1</String>
  8700. <Description>Fast Search robot</Description>
  8701. <Type>R</Type>
  8702. <Comment></Comment>
  8703. <Link1>http://www.alltheweb.com</Link1>
  8704. <Link2></Link2>
  8705. </user-agent>
  8706. <user-agent>
  8707. <ID>id_g_m_607</ID>
  8708. <String>libwww-perl/5.52 FP/4.0</String>
  8709. <Description>Fast Search robot</Description>
  8710. <Type>R</Type>
  8711. <Comment></Comment>
  8712. <Link1>http://www.alltheweb.com</Link1>
  8713. <Link2></Link2>
  8714. </user-agent>
  8715. <user-agent>
  8716. <ID>id_g_m_608</ID>
  8717. <String>libwww-perl/5.53</String>
  8718. <Description>diff. IPs / services</Description>
  8719. <Type>R C P</Type>
  8720. <Comment> ie.: -iPrism Web filtering software - softclub.net link checking</Comment>
  8721. <Link1>http://www.stbernard.com/default.asp</Link1>
  8722. <Link2></Link2>
  8723. </user-agent>
  8724. <user-agent>
  8725. <ID>id_g_m_609</ID>
  8726. <String>libwww-perl/5.63</String>
  8727. <Description>Profile for You internet profiling (?)</Description>
  8728. <Type>R C</Type>
  8729. <Comment></Comment>
  8730. <Link1>http://www.profile4u.com</Link1>
  8731. <Link2></Link2>
  8732. </user-agent>
  8733. <user-agent>
  8734. <ID>id_g_m_610</ID>
  8735. <String>libwww-perl/5.64</String>
  8736. <Description>unknown link checking from Wanadoo.fr (193.253.33.xxx)</Description>
  8737. <Type>R C</Type>
  8738. <Comment></Comment>
  8739. <Link1></Link1>
  8740. <Link2></Link2>
  8741. </user-agent>
  8742. <user-agent>
  8743. <ID>id_g_m_611</ID>
  8744. <String>libwww-perl/5.65</String>
  8745. <Description>Amidalla search engine robot (62.241.33.xx)</Description>
  8746. <Type>R</Type>
  8747. <Comment> s. also amibot</Comment>
  8748. <Link1>http://www.amidalla.com</Link1>
  8749. <Link2></Link2>
  8750. </user-agent>
  8751. <user-agent>
  8752. <ID>id_g_m_612</ID>
  8753. <String>libwww-perl/5.800</String>
  8754. <Description>SplatSearch robot (72.36.210.xx)</Description>
  8755. <Type>R</Type>
  8756. <Comment></Comment>
  8757. <Link1>http://www.splatsearch.com/</Link1>
  8758. <Link2></Link2>
  8759. </user-agent>
  8760. <user-agent>
  8761. <ID>id_g_m_613</ID>
  8762. <String>libwww/5.3.2</String>
  8763. <Description>Mediater Rechercher robot</Description>
  8764. <Type>R</Type>
  8765. <Comment></Comment>
  8766. <Link1>http://www.mediater.net</Link1>
  8767. <Link2></Link2>
  8768. </user-agent>
  8769. <user-agent>
  8770. <ID>id_g_m_160206_1</ID>
  8771. <String>Liferea/0.x.x (Linux; en_US.UTF-8; http://liferea.sf.net/)</String>
  8772. <Description>Liferea - Linux feed reader</Description>
  8773. <Type>B</Type>
  8774. <Comment></Comment>
  8775. <Link1>http://liferea.sourceforge.net/</Link1>
  8776. <Link2></Link2>
  8777. </user-agent>
  8778. <user-agent>
  8779. <ID>id_g_m_140508_4</ID>
  8780. <String>Liferea/1.x.x (Linux; es_ES.UTF-8; http://liferea.sf.net/)</String>
  8781. <Description>Liferea (Linux Feed Reader) news aggregator for Unix and Linux</Description>
  8782. <Type>B</Type>
  8783. <Comment></Comment>
  8784. <Link1>http://liferea.sourceforge.net/</Link1>
  8785. <Link2></Link2>
  8786. </user-agent>
  8787. <user-agent>
  8788. <ID>id_g_m_614</ID>
  8789. <String>LightningDownload/1.0beta2</String>
  8790. <Description>Lightning Download manager</Description>
  8791. <Type>D</Type>
  8792. <Comment></Comment>
  8793. <Link1>http://www.lightningdownload.com</Link1>
  8794. <Link2></Link2>
  8795. </user-agent>
  8796. <user-agent>
  8797. <ID>id_g_m_615</ID>
  8798. <String>LightningDownload/1.x.x</String>
  8799. <Description>Lightning Download manager</Description>
  8800. <Type>D</Type>
  8801. <Comment></Comment>
  8802. <Link1>http://www.lightningdownload.com</Link1>
  8803. <Link2></Link2>
  8804. </user-agent>
  8805. <user-agent>
  8806. <ID>id_g_m_616</ID>
  8807. <String>LightningDownload/1.x.x [Accelerated x]</String>
  8808. <Description>Lightning Download manager</Description>
  8809. <Type>D</Type>
  8810. <Comment></Comment>
  8811. <Link1>http://www.lightningdownload.com</Link1>
  8812. <Link2></Link2>
  8813. </user-agent>
  8814. <user-agent>
  8815. <ID>id_g_m_131207_1</ID>
  8816. <String>LijitSpider/Nutch-0.9 (Reports crawler; http://www.lijit.com/; info(a)lijit(d)com)</String>
  8817. <Description>Lijit blog search spider</Description>
  8818. <Type>R</Type>
  8819. <Comment>216.24.131.1xx</Comment>
  8820. <Link1>http://www.lijit.com/</Link1>
  8821. <Link2></Link2>
  8822. </user-agent>
  8823. <user-agent>
  8824. <ID>id_g_m_617</ID>
  8825. <String>Lincoln State Web Browser</String>
  8826. <Description>Some spam bot</Description>
  8827. <Type>S</Type>
  8828. <Comment>s. this Guestbook http://www.donotenter.com/guestbook/gbook.html</Comment>
  8829. <Link1>http://www.donotenter.com/guestbook/gbook.html</Link1>
  8830. <Link2></Link2>
  8831. </user-agent>
  8832. <user-agent>
  8833. <ID>id_g_m_618</ID>
  8834. <String>Link Valet Online 1.x</String>
  8835. <Description>Link Valet online link checking</Description>
  8836. <Type>C</Type>
  8837. <Comment></Comment>
  8838. <Link1>http://www.htmlhelp.com</Link1>
  8839. <Link2></Link2>
  8840. </user-agent>
  8841. <user-agent>
  8842. <ID>id_g_m_620</ID>
  8843. <String>LinkAlarm/2.x</String>
  8844. <Description>Linkalarm link validation</Description>
  8845. <Type>C</Type>
  8846. <Comment></Comment>
  8847. <Link1>http://www.linkalarm.com</Link1>
  8848. <Link2></Link2>
  8849. </user-agent>
  8850. <user-agent>
  8851. <ID>id_g_m_621</ID>
  8852. <String>Linkbot</String>
  8853. <Description>Linkbot Pro link checking software</Description>
  8854. <Type>C</Type>
  8855. <Comment></Comment>
  8856. <Link1>http://www.watchfire.com</Link1>
  8857. <Link2></Link2>
  8858. </user-agent>
  8859. <user-agent>
  8860. <ID>id_g_m_622</ID>
  8861. <String>linkbot</String>
  8862. <Description>Rpsoft 2000 Site-Crawler</Description>
  8863. <Type>R</Type>
  8864. <Comment></Comment>
  8865. <Link1>http://www.rpsoft2000.com/rps-site-crawler.htm</Link1>
  8866. <Link2></Link2>
  8867. </user-agent>
  8868. <user-agent>
  8869. <ID>id_g_m_623</ID>
  8870. <String>Linkbot x.0</String>
  8871. <Description>Linkbot Pro link checking software</Description>
  8872. <Type>C</Type>
  8873. <Comment></Comment>
  8874. <Link1>http://www.watchfire.com</Link1>
  8875. <Link2></Link2>
  8876. </user-agent>
  8877. <user-agent>
  8878. <ID>id_g_m_624</ID>
  8879. <String>LinkCheck (linkcheck@inter7.com http://www.inter7.com/linkcheck)</String>
  8880. <Description>Linkcheck - linkchecking tool for Unix/Linux</Description>
  8881. <Type>C</Type>
  8882. <Comment></Comment>
  8883. <Link1>http://www.inter7.com</Link1>
  8884. <Link2></Link2>
  8885. </user-agent>
  8886. <user-agent>
  8887. <ID>id_g_m_625</ID>
  8888. <String>LinkLint-checkonly/2.x.x</String>
  8889. <Description>Linklint - Perl html link checker</Description>
  8890. <Type>C</Type>
  8891. <Comment></Comment>
  8892. <Link1>http://www.linklint.org</Link1>
  8893. <Link2></Link2>
  8894. </user-agent>
  8895. <user-agent>
  8896. <ID>id_g_m_626</ID>
  8897. <String>LinkLint-spider/2.x.x</String>
  8898. <Description>Linklint - Perl html link checker</Description>
  8899. <Type>C</Type>
  8900. <Comment></Comment>
  8901. <Link1>http://www.linklint.org</Link1>
  8902. <Link2></Link2>
  8903. </user-agent>
  8904. <user-agent>
  8905. <ID>id_g_m_627</ID>
  8906. <String>linknzbot</String>
  8907. <Description>Linknz - The Kiwi Search Engine (New Zealand)</Description>
  8908. <Type>R</Type>
  8909. <Comment></Comment>
  8910. <Link1>http://www.linknz.co.nz</Link1>
  8911. <Link2></Link2>
  8912. </user-agent>
  8913. <user-agent>
  8914. <ID>id_g_m_280606_1</ID>
  8915. <String>LinkPimpin v1.0</String>
  8916. <Description>Link-Pimp web directory link checking</Description>
  8917. <Type>C</Type>
  8918. <Comment>216.89.111.x</Comment>
  8919. <Link1>http://www.link-pimp.com/</Link1>
  8920. <Link2></Link2>
  8921. </user-agent>
  8922. <user-agent>
  8923. <ID>id_g_m_628</ID>
  8924. <String>LinkProver 2.1</String>
  8925. <Description>TafWeb link checking program</Description>
  8926. <Type>C</Type>
  8927. <Comment></Comment>
  8928. <Link1>http://www.tafweb.com</Link1>
  8929. <Link2></Link2>
  8930. </user-agent>
  8931. <user-agent>
  8932. <ID>id_g_m_630</ID>
  8933. <String>Links (0.9x; Linux 2.4.7-10 i686)</String>
  8934. <Description>Links text browser for Unix &amp; OS/2</Description>
  8935. <Type>B</Type>
  8936. <Comment></Comment>
  8937. <Link1>http://artax.karlin.mff.cuni.cz/%7Emikulas/links/</Link1>
  8938. <Link2></Link2>
  8939. </user-agent>
  8940. <user-agent>
  8941. <ID>id_g_m_631</ID>
  8942. <String>Links (0.9xpre12; Linux 2.2.14-5.0 i686; 80x24)</String>
  8943. <Description>Links text browser for Unix &amp; OS/2</Description>
  8944. <Type>B</Type>
  8945. <Comment></Comment>
  8946. <Link1>http://artax.karlin.mff.cuni.cz/%7Emikulas/links/</Link1>
  8947. <Link2></Link2>
  8948. </user-agent>
  8949. <user-agent>
  8950. <ID>id_g_m_632</ID>
  8951. <String>Links (2.xpre7; Linux 2.4.18 i586; x)</String>
  8952. <Description>Links text browser for Unix &amp; OS/2</Description>
  8953. <Type>B</Type>
  8954. <Comment></Comment>
  8955. <Link1>http://artax.karlin.mff.cuni.cz/%7Emikulas/links/</Link1>
  8956. <Link2></Link2>
  8957. </user-agent>
  8958. <user-agent>
  8959. <ID>id_g_m_629</ID>
  8960. <String>Links - http://gossamer-threads.com/scripts/links/</String>
  8961. <Description>Links SQL directory management program</Description>
  8962. <Type>C</Type>
  8963. <Comment></Comment>
  8964. <Link1>http://gossamer-threads.com/scripts/links/</Link1>
  8965. <Link2></Link2>
  8966. </user-agent>
  8967. <user-agent>
  8968. <ID>id_g_m_633</ID>
  8969. <String>Links 2.0 (http://gossamer-threads.com/scripts/links/)</String>
  8970. <Description>Links SQL directory management program</Description>
  8971. <Type>R</Type>
  8972. <Comment></Comment>
  8973. <Link1>http://gossamer-threads.com/scripts/links/</Link1>
  8974. <Link2></Link2>
  8975. </user-agent>
  8976. <user-agent>
  8977. <ID>id_g_m_634</ID>
  8978. <String>Links SQL (http://gossamer-threads.com/scripts/links-sql/)</String>
  8979. <Description>Links SQL directory management program</Description>
  8980. <Type>R</Type>
  8981. <Comment></Comment>
  8982. <Link1>http://gossamer-threads.com/scripts/links-sql/</Link1>
  8983. <Link2></Link2>
  8984. </user-agent>
  8985. <user-agent>
  8986. <ID>id_g_m_280406_3</ID>
  8987. <String>Links4US-Crawler&#44; (+http://links4us.com/)</String>
  8988. <Description>Links4us ODP based directory link checking</Description>
  8989. <Type>C</Type>
  8990. <Comment>209.190.5.2xx</Comment>
  8991. <Link1>http://links4us.com/</Link1>
  8992. <Link2></Link2>
  8993. </user-agent>
  8994. <user-agent>
  8995. <ID>id_g_m_635</ID>
  8996. <String>LinkScan/11.0beta2 Unix</String>
  8997. <Description>Shareware robot from Elsop.com (used by Indiafocus/Indiainfo and others)</Description>
  8998. <Type>R</Type>
  8999. <Comment></Comment>
  9000. <Link1>http://www.elsop.com</Link1>
  9001. <Link2>http://indiafocus.indiainfo.com/</Link2>
  9002. </user-agent>
  9003. <user-agent>
  9004. <ID>id_g_m_636</ID>
  9005. <String>LinkScan/9.0g Unix</String>
  9006. <Description>Shareware robot from Elsop.com (used by Indiafocus/Indiainfo and others)</Description>
  9007. <Type>R</Type>
  9008. <Comment></Comment>
  9009. <Link1>http://www.elsop.com</Link1>
  9010. <Link2>http://indiafocus.indiainfo.com/</Link2>
  9011. </user-agent>
  9012. <user-agent>
  9013. <ID>id_g_m_637</ID>
  9014. <String>LinkScan/x.x Unix</String>
  9015. <Description>Shareware robot from Elsop.com</Description>
  9016. <Type>R</Type>
  9017. <Comment></Comment>
  9018. <Link1>http://www.elsop.com</Link1>
  9019. <Link2></Link2>
  9020. </user-agent>
  9021. <user-agent>
  9022. <ID>id_g_m_638</ID>
  9023. <String>LinksManager.com (http://linksmanager.com/linkchecker.html)</String>
  9024. <Description>Linksmanager bookmark checking</Description>
  9025. <Type>C</Type>
  9026. <Comment>s.also Mozilla/5.0 (compatible; LinksManager.com_bot...</Comment>
  9027. <Link1>http://linksmanager.com/linkchecker.html</Link1>
  9028. <Link2></Link2>
  9029. </user-agent>
  9030. <user-agent>
  9031. <ID>id_g_m_639</ID>
  9032. <String>LinkSonar/1.35</String>
  9033. <Description>LinkSonar (Japan) link checking tool</Description>
  9034. <Type>C</Type>
  9035. <Comment></Comment>
  9036. <Link1>http://hp.vector.co.jp/authors/VA014575/chicchi/linksonar/readme.html</Link1>
  9037. <Link2></Link2>
  9038. </user-agent>
  9039. <user-agent>
  9040. <ID>id_g_m_640</ID>
  9041. <String>LinkSweeper/1.x</String>
  9042. <Description>Left Side Software's LinkSweeper (ceased) bookmark utility</Description>
  9043. <Type>C</Type>
  9044. <Comment></Comment>
  9045. <Link1>http://www.lss.com.au/lss/lss_main.htm</Link1>
  9046. <Link2></Link2>
  9047. </user-agent>
  9048. <user-agent>
  9049. <ID>id_g_m_641</ID>
  9050. <String>LinkWalker</String>
  9051. <Description>Seventwentyfour link checking robot</Description>
  9052. <Type>C</Type>
  9053. <Comment></Comment>
  9054. <Link1>http://www.seventwentyfour.com</Link1>
  9055. <Link2></Link2>
  9056. </user-agent>
  9057. <user-agent>
  9058. <ID>id_g_m_619</ID>
  9059. <String>link_check3.plx libwww-perl/5.65</String>
  9060. <Description>link check 3 - Perl HTML link checker (from Perl for Web Site Management)</Description>
  9061. <Type>C</Type>
  9062. <Comment></Comment>
  9063. <Link1>http://www.elanus.net/cgi/examples.cgi/view/ex_1102.txt</Link1>
  9064. <Link2></Link2>
  9065. </user-agent>
  9066. <user-agent>
  9067. <ID>id_g_m_642</ID>
  9068. <String>ListBidBot (freelance job spider http://listbid.com)&lt;a href=http://listbid.com>Freelance&lt;/a></String>
  9069. <Description>Listbid.com / Directnic.com link checking ?</Description>
  9070. <Type>R C</Type>
  9071. <Comment></Comment>
  9072. <Link1>http://listbid.com</Link1>
  9073. <Link2></Link2>
  9074. </user-agent>
  9075. <user-agent>
  9076. <ID>id_g_m_031107_3</ID>
  9077. <String>LiveTrans/Nutch-0.9 (maintainer: cobain at iis dot sinica dot edu dot tw; http://wkd.iis.sinica.edu.tw/LiveTrans/)</String>
  9078. <Description>WKD Lab: LiveTrans - Online query and terminology translation service</Description>
  9079. <Type>R</Type>
  9080. <Comment>140.109.19.1xx</Comment>
  9081. <Link1>http://wkd.iis.sinica.edu.tw/LiveTrans/</Link1>
  9082. <Link2></Link2>
  9083. </user-agent>
  9084. <user-agent>
  9085. <ID>id_g_m_643</ID>
  9086. <String>Llaut/1.0 (http://mnm.uib.es/~gallir/llaut/bot.html)</String>
  9087. <Description>llaut robot - Universitat de les Illes Balears (Spain)</Description>
  9088. <Type>R</Type>
  9089. <Comment></Comment>
  9090. <Link1>http://mnm.uib.es</Link1>
  9091. <Link2></Link2>
  9092. </user-agent>
  9093. <user-agent>
  9094. <ID>id_g_m_200307_2</ID>
  9095. <String>LMQueueBot/0.2</String>
  9096. <Description>E-Mail harvesting robot - same as ContactBot</Description>
  9097. <Type>S</Type>
  9098. <Comment>64.124.152.xx</Comment>
  9099. <Link1></Link1>
  9100. <Link2></Link2>
  9101. </user-agent>
  9102. <user-agent>
  9103. <ID>id_g_m_644</ID>
  9104. <String>lmspider (lmspider@scansoft.com)</String>
  9105. <Description>lmspider from Scansoft (192.133.61.xx) - Web text collector</Description>
  9106. <Type>R</Type>
  9107. <Comment>see here</Comment>
  9108. <Link1>http://www.kahunaburger.com/blog/archives/000117.html</Link1>
  9109. <Link2></Link2>
  9110. </user-agent>
  9111. <user-agent>
  9112. <ID>id_g_m_645</ID>
  9113. <String>LNSpiderguy</String>
  9114. <Description>Lexis-Nexis robot</Description>
  9115. <Type>R</Type>
  9116. <Comment></Comment>
  9117. <Link1>http://www.lexis-nexis.com/</Link1>
  9118. <Link2></Link2>
  9119. </user-agent>
  9120. <user-agent>
  9121. <ID>id_g_m_300106_4</ID>
  9122. <String>LocalBot/1.0 ( http://www.localbot.co.uk/)</String>
  9123. <Description>LocalBot company information collector</Description>
  9124. <Type>R</Type>
  9125. <Comment></Comment>
  9126. <Link1>http://www.localbot.co.uk/</Link1>
  9127. <Link2></Link2>
  9128. </user-agent>
  9129. <user-agent>
  9130. <ID>id_g_m_646</ID>
  9131. <String>LocalcomBot/1.2.x ( http://www.local.com/bot.htm)</String>
  9132. <Description>Local.com local search robot (216.52.252.xxx)</Description>
  9133. <Type>R</Type>
  9134. <Comment></Comment>
  9135. <Link1>http://www.local.com/</Link1>
  9136. <Link2></Link2>
  9137. </user-agent>
  9138. <user-agent>
  9139. <ID>id_g_m_647</ID>
  9140. <String>Lockstep Spider/1.0</String>
  9141. <Description>Lockstep (website content protection tool) user agent</Description>
  9142. <Type>R</Type>
  9143. <Comment></Comment>
  9144. <Link1>http://www.lockstep.com</Link1>
  9145. <Link2></Link2>
  9146. </user-agent>
  9147. <user-agent>
  9148. <ID>id_g_m_648</ID>
  9149. <String>Look.com</String>
  9150. <Description>GlobalQueue spider (64.40.105.xxx)</Description>
  9151. <Type>R</Type>
  9152. <Comment></Comment>
  9153. <Link1>http://www.multi-mode.com/</Link1>
  9154. <Link2></Link2>
  9155. </user-agent>
  9156. <user-agent>
  9157. <ID>id_g_m_649</ID>
  9158. <String>Lotus-Notes/4.5 ( Windows-NT )</String>
  9159. <Description>Lotus Notes browser</Description>
  9160. <Type>B</Type>
  9161. <Comment></Comment>
  9162. <Link1></Link1>
  9163. <Link2></Link2>
  9164. </user-agent>
  9165. <user-agent>
  9166. <ID>id_g_m_650</ID>
  9167. <String>LotusDiscovery/x.0 (compatible; Mozilla 4.0; MSIE 4.01; Windows NT)</String>
  9168. <Description>IBM Lotus Discovery Server</Description>
  9169. <Type></Type>
  9170. <Comment></Comment>
  9171. <Link1>http://www-142.ibm.com/software/sw-lotus/products/product3.nsf/wdocs/644012e0434859b585256ec9006d37b8</Link1>
  9172. <Link2></Link2>
  9173. </user-agent>
  9174. <user-agent>
  9175. <ID>id_g_m_051207_1</ID>
  9176. <String>Lovel as 1.0 ( +http://www.everatom.com)</String>
  9177. <Description>Everatom.com song lyrics search</Description>
  9178. <Type>R</Type>
  9179. <Comment>80.91.191.2xx</Comment>
  9180. <Link1>http://www.everatom.com</Link1>
  9181. <Link2></Link2>
  9182. </user-agent>
  9183. <user-agent>
  9184. <ID>id_g_m_100308_2</ID>
  9185. <String>LTI/LemurProject Nutch Spider/Nutch-1.0-dev (lti crawler for CMU; http://www.lti.cs.cmu.edu; changkuk at cmu dot edu)</String>
  9186. <Description>LTI - The Lemur Toolkit for Language Modeling and Information Retrieval via Yahoo</Description>
  9187. <Type>R</Type>
  9188. <Comment>68.180.139.12x</Comment>
  9189. <Link1>http://www.lemurproject.org/</Link1>
  9190. <Link2>http://www.yahoo.com/</Link2>
  9191. </user-agent>
  9192. <user-agent>
  9193. <ID>id_g_m_050208_3</ID>
  9194. <String>LTI/LemurProject Nutch Spider/Nutch-1.0-dev (Research spider using Nutch; http://www.lemurproject.org; mhoy@cs.cmu.edu)</String>
  9195. <Description>LTI - The Lemur Toolkit for Language Modeling and Information Retrieval via Yahoo</Description>
  9196. <Type>R</Type>
  9197. <Comment>68.180.139.12x</Comment>
  9198. <Link1>http://www.lemurproject.org/</Link1>
  9199. <Link2>http://www.yahoo.com/</Link2>
  9200. </user-agent>
  9201. <user-agent>
  9202. <ID>id_g_m_651</ID>
  9203. <String>luchs.at URL checker</String>
  9204. <Description>Luchs.at (Linux Wiki) link checking</Description>
  9205. <Type>C</Type>
  9206. <Comment></Comment>
  9207. <Link1>http://web.luchs.at/information/linkchecker.php</Link1>
  9208. <Link2></Link2>
  9209. </user-agent>
  9210. <user-agent>
  9211. <ID>id_g_m_090106_1</ID>
  9212. <String>Lunascape</String>
  9213. <Description>Lunascape IE based browser (Japan)</Description>
  9214. <Type>B</Type>
  9215. <Comment>s. also Mozilla/4.0 (... Lunascape ...)</Comment>
  9216. <Link1>http://www2.lunascape.jp/index.aspx</Link1>
  9217. <Link2></Link2>
  9218. </user-agent>
  9219. <user-agent>
  9220. <ID>id_g_m_652</ID>
  9221. <String>lwp-trivial/1.32</String>
  9222. <Description>Ultimate Search / Smartdesk (no website) robot</Description>
  9223. <Type>R</Type>
  9224. <Comment></Comment>
  9225. <Link1></Link1>
  9226. <Link2></Link2>
  9227. </user-agent>
  9228. <user-agent>
  9229. <ID>id_g_m_653</ID>
  9230. <String>lwp-trivial/1.34</String>
  9231. <Description>Search4free robot</Description>
  9232. <Type>R</Type>
  9233. <Comment></Comment>
  9234. <Link1>http://www.search4free.com</Link1>
  9235. <Link2></Link2>
  9236. </user-agent>
  9237. <user-agent>
  9238. <ID>id_g_m_654</ID>
  9239. <String>lwp-trivial/1.34</String>
  9240. <Description>Search4free robot</Description>
  9241. <Type>R</Type>
  9242. <Comment></Comment>
  9243. <Link1>http://www.search4free.com</Link1>
  9244. <Link2></Link2>
  9245. </user-agent>
  9246. <user-agent>
  9247. <ID>id_g_m_656</ID>
  9248. <String>lwp-trivial/1.35</String>
  9249. <Description>Expert HTML online source viewer</Description>
  9250. <Type>B</Type>
  9251. <Comment></Comment>
  9252. <Link1>http://www.expert-html.com/</Link1>
  9253. <Link2></Link2>
  9254. </user-agent>
  9255. <user-agent>
  9256. <ID>id_g_m_655</ID>
  9257. <String>lwp-trivial/1.35</String>
  9258. <Description>Expert HTML online source viewer</Description>
  9259. <Type>B</Type>
  9260. <Comment></Comment>
  9261. <Link1>http://www.expert-html.com/</Link1>
  9262. <Link2></Link2>
  9263. </user-agent>
  9264. <user-agent>
  9265. <ID>id_g_m_657</ID>
  9266. <String>LWP::Simple/5.22</String>
  9267. <Description>Perl LWP:Collective module</Description>
  9268. <Type>R</Type>
  9269. <Comment></Comment>
  9270. <Link1>http://www.thatrobotsite.com</Link1>
  9271. <Link2></Link2>
  9272. </user-agent>
  9273. <user-agent>
  9274. <ID>id_g_m_658</ID>
  9275. <String>LWP::Simple/5.36</String>
  9276. <Description>Perl LWP:Collective module</Description>
  9277. <Type>R</Type>
  9278. <Comment></Comment>
  9279. <Link1>http://www.thatrobotsite.com</Link1>
  9280. <Link2></Link2>
  9281. </user-agent>
  9282. <user-agent>
  9283. <ID>id_g_m_659</ID>
  9284. <String>LWP::Simple/5.48</String>
  9285. <Description>Perl LWP:Collective module - Linkomatic robot</Description>
  9286. <Type>R</Type>
  9287. <Comment></Comment>
  9288. <Link1>http://www.linkomatic.com/</Link1>
  9289. <Link2>http://www.thatrobotsite.com</Link2>
  9290. </user-agent>
  9291. <user-agent>
  9292. <ID>id_g_m_660</ID>
  9293. <String>LWP::Simple/5.50</String>
  9294. <Description>Perl LWP:Collective module - secure-netz.de link checking (in conjunction w. libwww-perl/5.50)</Description>
  9295. <Type>R</Type>
  9296. <Comment></Comment>
  9297. <Link1>http://www.secure-netz.de</Link1>
  9298. <Link2>http://www.thatrobotsite.com</Link2>
  9299. </user-agent>
  9300. <user-agent>
  9301. <ID>id_g_m_661</ID>
  9302. <String>LWP::Simple/5.51</String>
  9303. <Description>Perl LWP:Collective module - Inktomi (62.253.64.x) robot</Description>
  9304. <Type>R</Type>
  9305. <Comment></Comment>
  9306. <Link1>http://www.inktomi.com/</Link1>
  9307. <Link2>http://www.thatrobotsite.com</Link2>
  9308. </user-agent>
  9309. <user-agent>
  9310. <ID>id_g_m_662</ID>
  9311. <String>LWP::Simple/5.53</String>
  9312. <Description>Perl LWP:Collective module - Only.com </Description>
  9313. <Type>R</Type>
  9314. <Comment>in conjunction w. Spida/0.1</Comment>
  9315. <Link1>http://www.only.com</Link1>
  9316. <Link2>http://www.thatrobotsite.com</Link2>
  9317. </user-agent>
  9318. <user-agent>
  9319. <ID>id_g_m_663</ID>
  9320. <String>LWP::Simple/5.63</String>
  9321. <Description>Perl LWP:Collective module</Description>
  9322. <Type>R</Type>
  9323. <Comment></Comment>
  9324. <Link1>http://www.thatrobotsite.com</Link1>
  9325. <Link2></Link2>
  9326. </user-agent>
  9327. <user-agent>
  9328. <ID>id_g_m_291105_3</ID>
  9329. <String>LWP::Simple/5.803</String>
  9330. <Description>ThePlanet/jaja-jak-globusy.com Google Adsense refferer spam bot from 70.85.116.* / 70.84.128.xxx / 70.85.193.xxx</Description>
  9331. <Type>S</Type>
  9332. <Comment>appears also as Poirot - Mozilla/4.76 [en] (Win98; U) - Mozilla/4.0 (compatible; MSIE 6.0; Windows NT 5.1)</Comment>
  9333. <Link1>http://spamhuntress.com/wiki/Manila_Industries</Link1>
  9334. <Link2></Link2>
  9335. </user-agent>
  9336. <user-agent>
  9337. <ID>id_g_m_664</ID>
  9338. <String>Lycos_Spider_(modspider)</String>
  9339. <Description>Lycos spider</Description>
  9340. <Type>R</Type>
  9341. <Comment></Comment>
  9342. <Link1>http://www.lycos.com</Link1>
  9343. <Link2></Link2>
  9344. </user-agent>
  9345. <user-agent>
  9346. <ID>id_g_m_665</ID>
  9347. <String>Lycos_Spider_(T-Rex)</String>
  9348. <Description>Lycos spider</Description>
  9349. <Type>R</Type>
  9350. <Comment></Comment>
  9351. <Link1>http://www.lycos.com</Link1>
  9352. <Link2></Link2>
  9353. </user-agent>
  9354. <user-agent>
  9355. <ID>id_g_m_200308_2</ID>
  9356. <String>Lynx/2-4-2 (Bobcat/0.5 [DOS] Jp Beta04)</String>
  9357. <Description>Bobcat - Text and Lynx based DOS browser</Description>
  9358. <Type>B</Type>
  9359. <Comment></Comment>
  9360. <Link1>http://www.fdisk.com/doslynx/bobcat.htm</Link1>
  9361. <Link2></Link2>
  9362. </user-agent>
  9363. <user-agent>
  9364. <ID>id_g_m_666</ID>
  9365. <String>Lynx/2.6 libwww-FM/2.14</String>
  9366. <Description>Lynx 2.x text mode browser</Description>
  9367. <Type>B</Type>
  9368. <Comment></Comment>
  9369. <Link1>http://lynx.browser.org/</Link1>
  9370. <Link2></Link2>
  9371. </user-agent>
  9372. <user-agent>
  9373. <ID>id_g_m_180108_1</ID>
  9374. <String>Lynx/2.8 (;http://seebot.org)</String>
  9375. <Description>seebot.org online service - uses lynx browser for crawlers view of web pages</Description>
  9376. <Type>B</Type>
  9377. <Comment>208.113.176.x[xx]</Comment>
  9378. <Link1>http://seebot.org/</Link1>
  9379. <Link2></Link2>
  9380. </user-agent>
  9381. <user-agent>
  9382. <ID>id_g_m_667</ID>
  9383. <String>Lynx/2.8.3dev.9 libwww-FM/2.14 SSL-MM/1.4.1 OpenSSL/0.9.6</String>
  9384. <Description>Lynx 2.x text mode browser</Description>
  9385. <Type>B</Type>
  9386. <Comment></Comment>
  9387. <Link1>http://lynx.browser.org/</Link1>
  9388. <Link2></Link2>
  9389. </user-agent>
  9390. <user-agent>
  9391. <ID>id_g_m_668</ID>
  9392. <String>Lynx/2.8.4rel.1 libwww-FM/2.14 SSL-MM/1.4.1 OpenSSL/0.9.6c (human-guided@lerly.net)</String>
  9393. <Description>Lynx 2.x text mode browser used as robot via cogentco.com</Description>
  9394. <Type>R</Type>
  9395. <Comment></Comment>
  9396. <Link1></Link1>
  9397. <Link2></Link2>
  9398. </user-agent>
  9399. <user-agent>
  9400. <ID>id_g_m_669</ID>
  9401. <String>Mac Finder 1.0.xx</String>
  9402. <Description>Some spam bot</Description>
  9403. <Type>S</Type>
  9404. <Comment></Comment>
  9405. <Link1>http://www.kloth.net/internet/badbots.php</Link1>
  9406. <Link2></Link2>
  9407. </user-agent>
  9408. <user-agent>
  9409. <ID>id_g_m_670</ID>
  9410. <String>Mackster( http://www.ukwizz.com )</String>
  9411. <Description>UKWizz search robot</Description>
  9412. <Type>R</Type>
  9413. <Comment>s. also UKWizz/Nutch</Comment>
  9414. <Link1>http://www.ukwizz.com</Link1>
  9415. <Link2></Link2>
  9416. </user-agent>
  9417. <user-agent>
  9418. <ID>id_g_m_671</ID>
  9419. <String>Mag-Net</String>
  9420. <Description>Wind.it client user-agent ?</Description>
  9421. <Type></Type>
  9422. <Comment></Comment>
  9423. <Link1></Link1>
  9424. <Link2></Link2>
  9425. </user-agent>
  9426. <user-agent>
  9427. <ID>id_g_m_180606_3</ID>
  9428. <String>MagicWML/1.0 (forcewml)</String>
  9429. <Description>All Magic/Wap wml service for mobile devices</Description>
  9430. <Type>P</Type>
  9431. <Comment></Comment>
  9432. <Link1>http://allmagic3.com/wap/</Link1>
  9433. <Link2></Link2>
  9434. </user-agent>
  9435. <user-agent>
  9436. <ID>id_g_m_061206_1</ID>
  9437. <String>MagpieRSS/0.7x (+http://magpierss.sf.net)</String>
  9438. <Description>Magpie RSS - PHP RSS Parser</Description>
  9439. <Type>B</Type>
  9440. <Comment></Comment>
  9441. <Link1>http://magpierss.sourceforge.net/</Link1>
  9442. <Link2></Link2>
  9443. </user-agent>
  9444. <user-agent>
  9445. <ID>id_g_m_030308_1</ID>
  9446. <String>Mahiti.Com/Mahiti Crawler-1.0 (Mahiti.Com; http://mahiti.com ; mahiti.com)</String>
  9447. <Description>Mahiti.com India search crawler</Description>
  9448. <Type>R</Type>
  9449. <Comment>72.167.143.1x</Comment>
  9450. <Link1>http://mahiti.com/</Link1>
  9451. <Link2></Link2>
  9452. </user-agent>
  9453. <user-agent>
  9454. <ID>id_g_m_020707_2</ID>
  9455. <String>Mail.Ru/1.0</String>
  9456. <Description>Mail.ru search</Description>
  9457. <Type>R</Type>
  9458. <Comment>194.186.55.2xx</Comment>
  9459. <Link1>http://www.mail.ru/</Link1>
  9460. <Link2></Link2>
  9461. </user-agent>
  9462. <user-agent>
  9463. <ID>id_g_m_672</ID>
  9464. <String>mailto:webcraft@bea.com</String>
  9465. <Description>Unknown Bea robot</Description>
  9466. <Type>R</Type>
  9467. <Comment></Comment>
  9468. <Link1>http://www.beasys.com</Link1>
  9469. <Link2></Link2>
  9470. </user-agent>
  9471. <user-agent>
  9472. <ID>id_g_m_673</ID>
  9473. <String>mammoth/1.0 ( http://www.sli-systems.com/)</String>
  9474. <Description>SLI Systems mammoth robot</Description>
  9475. <Type>R</Type>
  9476. <Comment>s. also Mozilla/5.0 (+http://www.sli-systems.com/) Mammoth/0.1</Comment>
  9477. <Link1>http://www.sli-systems.com/</Link1>
  9478. <Link2>http://www.tenspider.com/business-blog/more.php?id=A45_0_1_0_M</Link2>
  9479. </user-agent>
  9480. <user-agent>
  9481. <ID>id_g_m_674</ID>
  9482. <String>MantraAgent</String>
  9483. <Description>Looksmart robot</Description>
  9484. <Type>R</Type>
  9485. <Comment></Comment>
  9486. <Link1>http://www.looksmart.com</Link1>
  9487. <Link2></Link2>
  9488. </user-agent>
  9489. <user-agent>
  9490. <ID>id_g_m_675</ID>
  9491. <String>MapoftheInternet.com ( http://MapoftheInternet.com)</String>
  9492. <Description>Map of the Internet visual search engine index robot</Description>
  9493. <Type>R</Type>
  9494. <Comment></Comment>
  9495. <Link1>http://MapoftheInternet.com</Link1>
  9496. <Link2></Link2>
  9497. </user-agent>
  9498. <user-agent>
  9499. <ID>id_g_m_676</ID>
  9500. <String>Mariner/5.1b [de] (Win95; I ;Kolibri gncwebbot)</String>
  9501. <Description>Kolibri.de robot</Description>
  9502. <Type>R</Type>
  9503. <Comment></Comment>
  9504. <Link1>http://www.kolibri.de</Link1>
  9505. <Link2></Link2>
  9506. </user-agent>
  9507. <user-agent>
  9508. <ID>id_g_m_677</ID>
  9509. <String>Marketwave Hit List</String>
  9510. <Description>Pilot Hitlist web site analysis</Description>
  9511. <Type>R</Type>
  9512. <Comment></Comment>
  9513. <Link1>http://www.marketwave.com/products_solutions/hitlist.html</Link1>
  9514. <Link2></Link2>
  9515. </user-agent>
  9516. <user-agent>
  9517. <ID>id_g_m_678</ID>
  9518. <String>Martini</String>
  9519. <Description>Looksmart directory page analysis</Description>
  9520. <Type>R</Type>
  9521. <Comment></Comment>
  9522. <Link1>http://www.looksmart.com</Link1>
  9523. <Link2></Link2>
  9524. </user-agent>
  9525. <user-agent>
  9526. <ID>id_g_m_679</ID>
  9527. <String>MARTINI</String>
  9528. <Description>Looksmart directory page analysis</Description>
  9529. <Type>R</Type>
  9530. <Comment></Comment>
  9531. <Link1>http://www.looksmart.com</Link1>
  9532. <Link2></Link2>
  9533. </user-agent>
  9534. <user-agent>
  9535. <ID>id_g_m_680</ID>
  9536. <String>Marvin v0.3</String>
  9537. <Description>Marvin Medhunt robot</Description>
  9538. <Type>R</Type>
  9539. <Comment></Comment>
  9540. <Link1>http://www.hon.ch/MedHunt/Marvin.html</Link1>
  9541. <Link2></Link2>
  9542. </user-agent>
  9543. <user-agent>
  9544. <ID>id_g_m_270606_1</ID>
  9545. <String>MaSagool/1.0 (MaSagool; http://sagool.jp/; info@sagool.jp)</String>
  9546. <Description>Sagool search Japan robot</Description>
  9547. <Type>R</Type>
  9548. <Comment>124.32.246.xx</Comment>
  9549. <Link1>http://sagool.jp/</Link1>
  9550. <Link2></Link2>
  9551. </user-agent>
  9552. <user-agent>
  9553. <ID>id_g_m_681</ID>
  9554. <String>Mass Downloader 2.x</String>
  9555. <Description>Mass Downloader download manager</Description>
  9556. <Type>D</Type>
  9557. <Comment></Comment>
  9558. <Link1>http://www.metaproducts.com</Link1>
  9559. <Link2></Link2>
  9560. </user-agent>
  9561. <user-agent>
  9562. <ID>id_g_m_682</ID>
  9563. <String>MasterSeek</String>
  9564. <Description>Masterseek (Scandinavia) Beta business search ?</Description>
  9565. <Type>R</Type>
  9566. <Comment></Comment>
  9567. <Link1>http://www.masterseek.com</Link1>
  9568. <Link2></Link2>
  9569. </user-agent>
  9570. <user-agent>
  9571. <ID>id_g_m_683</ID>
  9572. <String>Mata Hari/2.00 </String>
  9573. <Description>Lexibot (exMataHari) search software</Description>
  9574. <Type>R</Type>
  9575. <Comment></Comment>
  9576. <Link1>http://www.lexibot.com</Link1>
  9577. <Link2></Link2>
  9578. </user-agent>
  9579. <user-agent>
  9580. <ID>id_g_m_684</ID>
  9581. <String>Matrix S.p.A. - FAST Enterprise Crawler 6 (Unknown admin e-mail address)</String>
  9582. <Description>Virgilio Italy robot (212.48.11.xxx) using Fast Enterprise Search</Description>
  9583. <Type>R</Type>
  9584. <Comment></Comment>
  9585. <Link1>http://www.virgilio.it</Link1>
  9586. <Link2></Link2>
  9587. </user-agent>
  9588. <user-agent>
  9589. <ID>id_g_m_685</ID>
  9590. <String>maxomobot/dev-20051201 (maxomo; http://67.102.134.34:4047/MAXOMO/MAXOMObot.html; maxomobot@maxomo.com)</String>
  9591. <Description>Maxomo multimedia search robot</Description>
  9592. <Type>R</Type>
  9593. <Comment></Comment>
  9594. <Link1>http://www.maxomo.com</Link1>
  9595. <Link2></Link2>
  9596. </user-agent>
  9597. <user-agent>
  9598. <ID>id_g_m_686</ID>
  9599. <String>McBot/5.001 (windows; U; NT4.0; en-us)</String>
  9600. <Description>Unknown robot from McAfee Austria (80.123.144.xx)</Description>
  9601. <Type></Type>
  9602. <Comment></Comment>
  9603. <Link1></Link1>
  9604. <Link2></Link2>
  9605. </user-agent>
  9606. <user-agent>
  9607. <ID>id_g_m_290108_1</ID>
  9608. <String>MDbot/1.0 (+http://www.megadownload.net/bot.html)</String>
  9609. <Description>MegaDownload files search robot</Description>
  9610. <Type>R</Type>
  9611. <Comment>91.121.83.19x</Comment>
  9612. <Link1>http://www.megadownload.net/</Link1>
  9613. <Link2>http://www.megadownload.net/bot.html</Link2>
  9614. </user-agent>
  9615. <user-agent>
  9616. <ID>id_g_m_170306_1</ID>
  9617. <String>Media Player Classic</String>
  9618. <Description>Substitute for Windows Media Player</Description>
  9619. <Type>B</Type>
  9620. <Comment></Comment>
  9621. <Link1>http://sourceforge.net/projects/guliverkli/</Link1>
  9622. <Link2></Link2>
  9623. </user-agent>
  9624. <user-agent>
  9625. <ID>id_g_m_687</ID>
  9626. <String>MediaCrawler-1.0 (Experimental)</String>
  9627. <Description>Media Find crawler</Description>
  9628. <Type>R</Type>
  9629. <Comment></Comment>
  9630. <Link1>http://www.mediacrawler.de</Link1>
  9631. <Link2></Link2>
  9632. </user-agent>
  9633. <user-agent>
  9634. <ID>id_g_m_688</ID>
  9635. <String>Mediapartners-Google/2.1 ( http://www.googlebot.com/bot.html)</String>
  9636. <Description>Google AdSense robot</Description>
  9637. <Type>R</Type>
  9638. <Comment></Comment>
  9639. <Link1>http://www.google.com/ads/</Link1>
  9640. <Link2></Link2>
  9641. </user-agent>
  9642. <user-agent>
  9643. <ID>id_g_m_689</ID>
  9644. <String>MediaSearch/0.1</String>
  9645. <Description>WWW.fi Media Search</Description>
  9646. <Type>R</Type>
  9647. <Comment></Comment>
  9648. <Link1>http://www.fi/haku/</Link1>
  9649. <Link2></Link2>
  9650. </user-agent>
  9651. <user-agent>
  9652. <ID>id_g_m_690</ID>
  9653. <String>MegaSheep v1.0 (www.searchuk.com internet sheep)</String>
  9654. <Description>Search UK robot</Description>
  9655. <Type>R</Type>
  9656. <Comment></Comment>
  9657. <Link1>http://www.searchuk.com</Link1>
  9658. <Link2></Link2>
  9659. </user-agent>
  9660. <user-agent>
  9661. <ID>id_g_m_131107_1</ID>
  9662. <String>Megite2.0 (http://www.megite.com)</String>
  9663. <Description>Megite web2.0 RSS and news service software</Description>
  9664. <Type>R</Type>
  9665. <Comment></Comment>
  9666. <Link1>http://www.megite.com/</Link1>
  9667. <Link2></Link2>
  9668. </user-agent>
  9669. <user-agent>
  9670. <ID>id_g_m_691</ID>
  9671. <String>Mercator-1.x</String>
  9672. <Description>Mercator crawler software (used by Altavista)</Description>
  9673. <Type>R</Type>
  9674. <Comment></Comment>
  9675. <Link1>http://www.research.compaq.com</Link1>
  9676. <Link2></Link2>
  9677. </user-agent>
  9678. <user-agent>
  9679. <ID>id_g_m_692</ID>
  9680. <String>Mercator-2.0</String>
  9681. <Description>Mercator crawler software (used by Altavista)</Description>
  9682. <Type>R</Type>
  9683. <Comment></Comment>
  9684. <Link1>http://www.research.compaq.com</Link1>
  9685. <Link2></Link2>
  9686. </user-agent>
  9687. <user-agent>
  9688. <ID>id_g_m_693</ID>
  9689. <String>Mercator-Scrub-1.1</String>
  9690. <Description>Mercator crawler software (used by Altavista)</Description>
  9691. <Type>R</Type>
  9692. <Comment></Comment>
  9693. <Link1>http://www.research.compaq.com</Link1>
  9694. <Link2></Link2>
  9695. </user-agent>
  9696. <user-agent>
  9697. <ID>id_g_m_070207_1</ID>
  9698. <String>Metaeuro Web Crawler/0.2 (MetaEuro Web Search Clustering Engine; http://www.metaeuro.com; crawler at metaeuro dot com)</String>
  9699. <Description>MetaEuro.com Clustering Web Search Engine crawler</Description>
  9700. <Type>R</Type>
  9701. <Comment>83.97.31.1xx</Comment>
  9702. <Link1>http://www.metaeuro.com/</Link1>
  9703. <Link2></Link2>
  9704. </user-agent>
  9705. <user-agent>
  9706. <ID>id_g_m_694</ID>
  9707. <String>MetaGer-LinkChecker</String>
  9708. <Description>MetaGer search robot (Germany)</Description>
  9709. <Type>R</Type>
  9710. <Comment>130.75.2.xx</Comment>
  9711. <Link1>http://www.metager.de/</Link1>
  9712. <Link2></Link2>
  9713. </user-agent>
  9714. <user-agent>
  9715. <ID>id_g_m_270706_1</ID>
  9716. <String>MetagerBot/0.8-dev (MetagerBot; http://metager.de;  )</String>
  9717. <Description>MetaGer search robot (Germany)</Description>
  9718. <Type>R</Type>
  9719. <Comment>130.75.2.xx</Comment>
  9720. <Link1>http://www.metager.de/</Link1>
  9721. <Link2></Link2>
  9722. </user-agent>
  9723. <user-agent>
  9724. <ID>id_g_m_060307_1</ID>
  9725. <String>MetaGer_PreChecker0.1</String>
  9726. <Description>MetaGer search robot (Germany)</Description>
  9727. <Type>R</Type>
  9728. <Comment>130.75.2.xx</Comment>
  9729. <Link1>http://www.metager.de/</Link1>
  9730. <Link2></Link2>
  9731. </user-agent>
  9732. <user-agent>
  9733. <ID>id_g_m_695</ID>
  9734. <String>MetaProducts Download Express/1.x</String>
  9735. <Description>Download Express download manager</Description>
  9736. <Type>D</Type>
  9737. <Comment></Comment>
  9738. <Link1>http://www.metaproducts.com</Link1>
  9739. <Link2></Link2>
  9740. </user-agent>
  9741. <user-agent>
  9742. <ID>id_g_m_696</ID>
  9743. <String>Metaspinner/0.01 (Metaspinner; http://www.meta-spinner.de/; support@meta-spinner.de/)</String>
  9744. <Description>Metaspinner search robot - Germany</Description>
  9745. <Type>R</Type>
  9746. <Comment></Comment>
  9747. <Link1>http://www.meta-spinner.de/</Link1>
  9748. <Link2></Link2>
  9749. </user-agent>
  9750. <user-agent>
  9751. <ID>id_g_m_300407_1</ID>
  9752. <String>metatagsdir/0.7 (+http://metatagsdir.com/directory/)</String>
  9753. <Description>Metatagsdir.com directory index spider</Description>
  9754. <Type>R</Type>
  9755. <Comment>206.196.111.2xx</Comment>
  9756. <Link1>http://metatagsdir.com/directory/</Link1>
  9757. <Link2></Link2>
  9758. </user-agent>
  9759. <user-agent>
  9760. <ID>id_g_m_697</ID>
  9761. <String>MFC Foundation Class Library 4.0</String>
  9762. <Description>Microsoft Foundation Class Library - i.e. used for e-mail harvesting from 68.154.96.xx (bellsouth.net)</Description>
  9763. <Type>S</Type>
  9764. <Comment>appears also as Full Web Bot 0516B or Demo Bot Z 16b</Comment>
  9765. <Link1></Link1>
  9766. <Link2></Link2>
  9767. </user-agent>
  9768. <user-agent>
  9769. <ID>id_g_m_698</ID>
  9770. <String>MFC_Tear_Sample</String>
  9771. <Description>Microsoft.com user agent</Description>
  9772. <Type></Type>
  9773. <Comment></Comment>
  9774. <Link1></Link1>
  9775. <Link2></Link2>
  9776. </user-agent>
  9777. <user-agent>
  9778. <ID>id_g_m_699</ID>
  9779. <String>MFHttpScan</String>
  9780. <Description>Advanced Site Crawler web site ripper and extractor</Description>
  9781. <Type>D</Type>
  9782. <Comment></Comment>
  9783. <Link1>http://www.innovative.go.ro/sitecrawler/index.htm</Link1>
  9784. <Link2></Link2>
  9785. </user-agent>
  9786. <user-agent>
  9787. <ID>id_g_m_700</ID>
  9788. <String>MicroBaz</String>
  9789. <Description>GigaBaz Brainbot (Germany) robot (213.139.152.xx)</Description>
  9790. <Type>R</Type>
  9791. <Comment> s. also - gigabaz/3.1x ...</Comment>
  9792. <Link1>http://brainbot.com//site3</Link1>
  9793. <Link2></Link2>
  9794. </user-agent>
  9795. <user-agent>
  9796. <ID>id_g_m_701</ID>
  9797. <String>Microsoft Data Access Internet Publishing Provider Cache Manager</String>
  9798. <Description>MS Office 2000 acting as WebDAV client</Description>
  9799. <Type>B P</Type>
  9800. <Comment></Comment>
  9801. <Link1></Link1>
  9802. <Link2></Link2>
  9803. </user-agent>
  9804. <user-agent>
  9805. <ID>id_g_m_702</ID>
  9806. <String>Microsoft Data Access Internet Publishing Provider DAV</String>
  9807. <Description>MS Office 2000 acting as WebDAV client</Description>
  9808. <Type>B</Type>
  9809. <Comment></Comment>
  9810. <Link1></Link1>
  9811. <Link2></Link2>
  9812. </user-agent>
  9813. <user-agent>
  9814. <ID>id_g_m_704</ID>
  9815. <String>Microsoft Data Access Internet Publishing Provider Protocol Discovery</String>
  9816. <Description>Server probe for data access operations using MS Frontpage with OPTION header</Description>
  9817. <Type>B C</Type>
  9818. <Comment></Comment>
  9819. <Link1></Link1>
  9820. <Link2></Link2>
  9821. </user-agent>
  9822. <user-agent>
  9823. <ID>id_g_m_703</ID>
  9824. <String>Microsoft Data Access Internet Publishing Provider Protocol Discovery</String>
  9825. <Description>MS Office 2000 acting as WebDAV client</Description>
  9826. <Type>B C</Type>
  9827. <Comment></Comment>
  9828. <Link1></Link1>
  9829. <Link2></Link2>
  9830. </user-agent>
  9831. <user-agent>
  9832. <ID>id_g_m_190807_2</ID>
  9833. <String>Microsoft Log Parser 2.2</String>
  9834. <Description>Microsoft Log Parser text query tool</Description>
  9835. <Type>D</Type>
  9836. <Comment></Comment>
  9837. <Link1>http://www.microsoft.com/technet/scriptcenter/tools/logparser/default.mspx</Link1>
  9838. <Link2></Link2>
  9839. </user-agent>
  9840. <user-agent>
  9841. <ID>id_g_m_180306_1</ID>
  9842. <String>Microsoft Small Business Indexer</String>
  9843. <Description>MS Small Business Server content indexer</Description>
  9844. <Type>R</Type>
  9845. <Comment>Indexing from Microsoft: 204.71.191.xx</Comment>
  9846. <Link1>http://www.microsoft.com/windowsserver2003/sbs/default.mspx</Link1>
  9847. <Link2></Link2>
  9848. </user-agent>
  9849. <user-agent>
  9850. <ID>id_g_m_705</ID>
  9851. <String>Microsoft URL Control - 6.00.8xxx</String>
  9852. <Description>user agent looks for form-mail components (spam-bot)</Description>
  9853. <Type>S</Type>
  9854. <Comment></Comment>
  9855. <Link1></Link1>
  9856. <Link2></Link2>
  9857. </user-agent>
  9858. <user-agent>
  9859. <ID>id_g_m_707</ID>
  9860. <String>MicrosoftPrototypeCrawler (How's my crawling? mailto:newbiecrawler@hotmail.com)</String>
  9861. <Description>Unknown robot from Microsoft.com (131.107.163.xx)</Description>
  9862. <Type>R</Type>
  9863. <Comment></Comment>
  9864. <Link1></Link1>
  9865. <Link2></Link2>
  9866. </user-agent>
  9867. <user-agent>
  9868. <ID>id_g_m_706</ID>
  9869. <String>Microsoft_Internet_Explorer_5.00.438 (fjones@isd.net)</String>
  9870. <Description>Secure Computing SmartFilterWhere  / Bess web filter (192.55.214.xx)</Description>
  9871. <Type>P</Type>
  9872. <Comment></Comment>
  9873. <Link1>http://www.securecomputing.com/index.cfm?skey=22</Link1>
  9874. <Link2></Link2>
  9875. </user-agent>
  9876. <user-agent>
  9877. <ID>id_g_m_708</ID>
  9878. <String>MIIxpc/4.2</String>
  9879. <Description>xpc-mii.net HTTP server message</Description>
  9880. <Type>P</Type>
  9881. <Comment></Comment>
  9882. <Link1></Link1>
  9883. <Link2></Link2>
  9884. </user-agent>
  9885. <user-agent>
  9886. <ID>id_g_m_130807_2</ID>
  9887. <String>Mindjet MindManager</String>
  9888. <Description>The Mindjet blog MindManager category</Description>
  9889. <Type>D</Type>
  9890. <Comment>80.229.1xx</Comment>
  9891. <Link1>http://blog.mindjet.com/category/mindjet/mindmanager/</Link1>
  9892. <Link2></Link2>
  9893. </user-agent>
  9894. <user-agent>
  9895. <ID>id_g_m_709</ID>
  9896. <String>minibot</String>
  9897. <Description>unknown robot via Korea Telecom (211.218.xxx.xxx)</Description>
  9898. <Type></Type>
  9899. <Comment></Comment>
  9900. <Link1></Link1>
  9901. <Link2></Link2>
  9902. </user-agent>
  9903. <user-agent>
  9904. <ID>id_g_m_110506_2</ID>
  9905. <String>miniRank/1.6 (Website ranking; www.minirank.com; robot)</String>
  9906. <Description>mini- Rank website popularity tool</Description>
  9907. <Type>C</Type>
  9908. <Comment>64.230.71.2xx</Comment>
  9909. <Link1>http://www.minirank.com/</Link1>
  9910. <Link2></Link2>
  9911. </user-agent>
  9912. <user-agent>
  9913. <ID>id_g_m_710</ID>
  9914. <String>MiracleAlphaTest</String>
  9915. <Description>unknown robot via nec.co.jp Telecom (210.143.35.xx)</Description>
  9916. <Type></Type>
  9917. <Comment></Comment>
  9918. <Link1></Link1>
  9919. <Link2></Link2>
  9920. </user-agent>
  9921. <user-agent>
  9922. <ID>id_g_m_711</ID>
  9923. <String>Missauga Locate 1.0.0</String>
  9924. <Description>Some spam bot</Description>
  9925. <Type>S</Type>
  9926. <Comment></Comment>
  9927. <Link1>http://www.neilgunton.com/spambot_trap/appendix/</Link1>
  9928. <Link2></Link2>
  9929. </user-agent>
  9930. <user-agent>
  9931. <ID>id_g_m_712</ID>
  9932. <String>Missigua Locator 1.9</String>
  9933. <Description>Some spam bot</Description>
  9934. <Type>S</Type>
  9935. <Comment></Comment>
  9936. <Link1>http://www.neilgunton.com/spambot_trap/appendix/</Link1>
  9937. <Link2></Link2>
  9938. </user-agent>
  9939. <user-agent>
  9940. <ID>id_g_m_713</ID>
  9941. <String>Missouri College Browse</String>
  9942. <Description>Some spam bot</Description>
  9943. <Type>S</Type>
  9944. <Comment></Comment>
  9945. <Link1></Link1>
  9946. <Link2></Link2>
  9947. </user-agent>
  9948. <user-agent>
  9949. <ID>id_g_m_714</ID>
  9950. <String>Mister Pix II 2.02a</String>
  9951. <Description>Mister PiX picture finding software</Description>
  9952. <Type>D R</Type>
  9953. <Comment></Comment>
  9954. <Link1>http://www.mister-pix.com/</Link1>
  9955. <Link2></Link2>
  9956. </user-agent>
  9957. <user-agent>
  9958. <ID>id_g_m_715</ID>
  9959. <String>Mister PiX version.dll</String>
  9960. <Description>Mister PiX  picture finding software</Description>
  9961. <Type>D R</Type>
  9962. <Comment></Comment>
  9963. <Link1>http://www.mister-pix.com/</Link1>
  9964. <Link2></Link2>
  9965. </user-agent>
  9966. <user-agent>
  9967. <ID>id_g_m_110206_3</ID>
  9968. <String>Misterbot-Nutch/0.7.1 (Misterbot-Nutch; http://www.misterbot.fr; admin@misterbot.fr)</String>
  9969. <Description>Misterbot search France robot</Description>
  9970. <Type>R</Type>
  9971. <Comment></Comment>
  9972. <Link1>http://www.misterbot.fr/</Link1>
  9973. <Link2></Link2>
  9974. </user-agent>
  9975. <user-agent>
  9976. <ID>id_g_m_716</ID>
  9977. <String>Miva (AlgoFeedback@miva.com)</String>
  9978. <Description>Miva / ex Findwhat.com search robot (66.150.55.2xx)</Description>
  9979. <Type>R</Type>
  9980. <Comment></Comment>
  9981. <Link1>http://www.miva.com/</Link1>
  9982. <Link2></Link2>
  9983. </user-agent>
  9984. <user-agent>
  9985. <ID>id_g_m_141105_2</ID>
  9986. <String>Mizzu Labs 2.2</String>
  9987. <Description>Some spam bot from Jasmine Internet - Bangkok (203.147.0.xx)</Description>
  9988. <Type>S</Type>
  9989. <Comment>s. link </Comment>
  9990. <Link1>http://www.projecthoneypot.org/ip_inspector.php?iph=7bc2eae614063a45b0e1d0786dbe6a2e</Link1>
  9991. <Link2></Link2>
  9992. </user-agent>
  9993. <user-agent>
  9994. <ID>id_g_m_080706_3</ID>
  9995. <String>MJ12bot/vx.x.x (http://majestic12.co.uk/bot.php?+)</String>
  9996. <Description>Majestic-12 DSearch MJ12bot (Experimental distributed crawler)</Description>
  9997. <Type>R</Type>
  9998. <Comment></Comment>
  9999. <Link1>http://www.majestic12.co.uk/projects/dsearch/</Link1>
  10000. <Link2></Link2>
  10001. </user-agent>
  10002. <user-agent>
  10003. <ID>id_g_m_717</ID>
  10004. <String>MJ12bot/vx.x.x (http://www.majestic12.co.uk/projects/dsearch/mj12bot.php)</String>
  10005. <Description>Majestic-12 DSearch MJ12bot (Experimental distributed crawler)</Description>
  10006. <Type>R</Type>
  10007. <Comment></Comment>
  10008. <Link1>http://www.majestic12.co.uk/projects/dsearch/mj12bot.php</Link1>
  10009. <Link2></Link2>
  10010. </user-agent>
  10011. <user-agent>
  10012. <ID>id_g_m_200108_1</ID>
  10013. <String>MJBot (SEO assessment)</String>
  10014. <Description>MJB SEO Club MJBot</Description>
  10015. <Type>R</Type>
  10016. <Comment>217.8.248.19x</Comment>
  10017. <Link1>http://www.mjbdata.com/information/</Link1>
  10018. <Link2></Link2>
  10019. </user-agent>
  10020. <user-agent>
  10021. <ID>id_g_m_030308_2</ID>
  10022. <String>MLBot (www.metadatalabs.com)</String>
  10023. <Description>MLBot - metadata labs web crawler for building a media index (beta)</Description>
  10024. <Type>R</Type>
  10025. <Comment></Comment>
  10026. <Link1>http://www.metadatalabs.com/</Link1>
  10027. <Link2></Link2>
  10028. </user-agent>
  10029. <user-agent>
  10030. <ID>id_g_m_718</ID>
  10031. <String>MnogoSearch/3.2.xx</String>
  10032. <Description>mnoGoSearch (ex UdmSearch) software robot</Description>
  10033. <Type>R</Type>
  10034. <Comment></Comment>
  10035. <Link1>http://mnogosearch.org/</Link1>
  10036. <Link2></Link2>
  10037. </user-agent>
  10038. <user-agent>
  10039. <ID>id_g_m_260306_3</ID>
  10040. <String>Mo College 1.9</String>
  10041. <Description>Unknown bad bot - maybe guestbook spamming or email harvesting</Description>
  10042. <Type>S</Type>
  10043. <Comment>see link:</Comment>
  10044. <Link1>http://www.kloth.net/internet/badbots.php</Link1>
  10045. <Link2></Link2>
  10046. </user-agent>
  10047. <user-agent>
  10048. <ID>id_g_m_719</ID>
  10049. <String>moget/x.x (moget@goo.ne.jp)</String>
  10050. <Description>Goo Japan / Inktomi robot (210.173.179.xx)</Description>
  10051. <Type>R</Type>
  10052. <Comment>s. also ichiro</Comment>
  10053. <Link1>http://www.goo.ne.jp</Link1>
  10054. <Link2></Link2>
  10055. </user-agent>
  10056. <user-agent>
  10057. <ID>id_g_m_720</ID>
  10058. <String>mogimogi/1.0</String>
  10059. <Description>Goo Japan / Inktomi robot (210.173.179.xx)</Description>
  10060. <Type>R</Type>
  10061. <Comment>s. also ichiro</Comment>
  10062. <Link1>http://www.goo.ne.jp</Link1>
  10063. <Link2></Link2>
  10064. </user-agent>
  10065. <user-agent>
  10066. <ID>id_g_m_721</ID>
  10067. <String>moiNAG 0.02</String>
  10068. <Description>moiNag - net.art generator</Description>
  10069. <Type>R D</Type>
  10070. <Comment></Comment>
  10071. <Link1>http://soundwarez.org/generator/moiNAG/</Link1>
  10072. <Link2></Link2>
  10073. </user-agent>
  10074. <user-agent>
  10075. <ID>id_g_m_722</ID>
  10076. <String>MojeekBot/0.x (archi; http://www.mojeek.com/bot.html)</String>
  10077. <Description>Mojeek Search Preview robot (217.155.205.xx)</Description>
  10078. <Type>R</Type>
  10079. <Comment>s.also Mozilla/5.0 (compatible; MojeekBot/2.0 ...</Comment>
  10080. <Link1>http://www.mojeek.com</Link1>
  10081. <Link2></Link2>
  10082. </user-agent>
  10083. <user-agent>
  10084. <ID>id_g_m_150407_1</ID>
  10085. <String>monkeyagent</String>
  10086. <Description>Greasemonkey Firefox extension</Description>
  10087. <Type>D</Type>
  10088. <Comment></Comment>
  10089. <Link1>http://www.greasespot.net/</Link1>
  10090. <Link2>http://diveintogreasemonkey.org/install/what-is-greasemonkey.html</Link2>
  10091. </user-agent>
  10092. <user-agent>
  10093. <ID>id_g_m_090106_2</ID>
  10094. <String>MoonBrowser (version 0.41 Beta4)</String>
  10095. <Description>Moonbrowser - IE based browser (Japan)</Description>
  10096. <Type>B</Type>
  10097. <Comment></Comment>
  10098. <Link1>http://www.geocities.co.jp/SiliconValley-Cupertino/8986/</Link1>
  10099. <Link2></Link2>
  10100. </user-agent>
  10101. <user-agent>
  10102. <ID>id_g_m_010307_2</ID>
  10103. <String>Moreoverbot/x.00 (+http://www.moreover.com)</String>
  10104. <Description>Moreover / FeedDirect RSS feed robot</Description>
  10105. <Type>C</Type>
  10106. <Comment>72.13.32.x</Comment>
  10107. <Link1>http://w.moreover.com/</Link1>
  10108. <Link2>http://www.feeddirect.com/</Link2>
  10109. </user-agent>
  10110. <user-agent>
  10111. <ID>id_g_m_723</ID>
  10112. <String>Morris - Mixcat Crawler ( http://mixcat.com)</String>
  10113. <Description>MixCat robot s. also Felix</Description>
  10114. <Type>R</Type>
  10115. <Comment></Comment>
  10116. <Link1>http://mixcat.com</Link1>
  10117. <Link2></Link2>
  10118. </user-agent>
  10119. <user-agent>
  10120. <ID>id_g_m_100206_2</ID>
  10121. <String>Motoricerca-Robots.txt-Checker/1.0 (http://tool.motoricerca.info/robots-checker.phtml)</String>
  10122. <Description>Robots.txt online checker</Description>
  10123. <Type>C</Type>
  10124. <Comment></Comment>
  10125. <Link1>http://tool.motoricerca.info/robots-checker.phtml</Link1>
  10126. <Link2></Link2>
  10127. </user-agent>
  10128. <user-agent>
  10129. <ID>id_g_m_240108_1</ID>
  10130. <String>Motorola-V3m Obigo</String>
  10131. <Description>Obigo WAP browser for mobiles on Motorola V3</Description>
  10132. <Type>B</Type>
  10133. <Comment></Comment>
  10134. <Link1>http://www.obigo.com/</Link1>
  10135. <Link2>http://en.wikipedia.org/wiki/Obigo_Browser</Link2>
  10136. </user-agent>
  10137. <user-agent>
  10138. <ID>id_g_m_724</ID>
  10139. <String>Mouse-House/7.4 (spider_monkey spider info at www.mobrien.com/sm.shtml)</String>
  10140. <Description>MPRM Group Ltd. Spider Monkey robot</Description>
  10141. <Type>R</Type>
  10142. <Comment></Comment>
  10143. <Link1>http://www.spidermonkey.ca/sm.shtml</Link1>
  10144. <Link2></Link2>
  10145. </user-agent>
  10146. <user-agent>
  10147. <ID>id_g_m_725</ID>
  10148. <String>MovableType/x.x</String>
  10149. <Description>Movable Type  web-based personal publishing system</Description>
  10150. <Type>B</Type>
  10151. <Comment></Comment>
  10152. <Link1>http://www.movabletype.org</Link1>
  10153. <Link2></Link2>
  10154. </user-agent>
  10155. <user-agent>
  10156. <ID>id_g_m_726</ID>
  10157. <String>mozDex/0.xx-dev (mozDex; http://www.mozdex.com/en/bot.html; spider@mozdex.com)</String>
  10158. <Description>Mozdex Open search engine spider (65.98.100.2xx)</Description>
  10159. <Type>R</Type>
  10160. <Comment></Comment>
  10161. <Link1>http://www.mozdex.com/</Link1>
  10162. <Link2></Link2>
  10163. </user-agent>
  10164. <user-agent>
  10165. <ID>id_g_m_727</ID>
  10166. <String>Mozi!</String>
  10167. <Description>Bell Nexxia / Sympatico Canada user robot &amp; spoofed referer from diff. IPs</Description>
  10168. <Type></Type>
  10169. <Comment></Comment>
  10170. <Link1></Link1>
  10171. <Link2></Link2>
  10172. </user-agent>
  10173. <user-agent>
  10174. <ID>id_moz_728</ID>
  10175. <String>Mozilla</String>
  10176. <Description>Unknown robots from diff. IPs</Description>
  10177. <Type></Type>
  10178. <Comment></Comment>
  10179. <Link1></Link1>
  10180. <Link2></Link2>
  10181. </user-agent>
  10182. <user-agent>
  10183. <ID>id_moz_100109_3</ID>
  10184. <String>Mozilla (libwhisker/2.4)</String>
  10185. <Description>libwhisker - HTTP client and utility - Perl library</Description>
  10186. <Type></Type>
  10187. <Comment></Comment>
  10188. <Link1>http://www.wiretrip.net/rfp/lw.asp</Link1>
  10189. <Link2></Link2>
  10190. </user-agent>
  10191. <user-agent>
  10192. <ID>id_moz_729</ID>
  10193. <String>Mozilla (Mozilla@somewhere.com)</String>
  10194. <Description>http://www.somewhere.com robot</Description>
  10195. <Type>R</Type>
  10196. <Comment></Comment>
  10197. <Link1>http://www.somewhere.com</Link1>
  10198. <Link2></Link2>
  10199. </user-agent>
  10200. <user-agent>
  10201. <ID>id_moz_041007_1</ID>
  10202. <String>Mozilla 4.0(compatible; BotSeer/1.0; +http://botseer.ist.psu.edu)</String>
  10203. <Description>BotSeer search engine for robots.txt</Description>
  10204. <Type>R</Type>
  10205. <Comment>130.203.154.2xx</Comment>
  10206. <Link1>http://botseer.ist.psu.edu/</Link1>
  10207. <Link2>http://botseer.ist.psu.edu/about.html</Link2>
  10208. </user-agent>
  10209. <user-agent>
  10210. <ID>id_moz_731</ID>
  10211. <String>Mozilla/1.1 (compatible; MSPIE 2.0; Windows CE)</String>
  10212. <Description>PDA Pocket IE 2.x Windows CE</Description>
  10213. <Type>B</Type>
  10214. <Comment></Comment>
  10215. <Link1></Link1>
  10216. <Link2></Link2>
  10217. </user-agent>
  10218. <user-agent>
  10219. <ID>id_moz_732</ID>
  10220. <String>Mozilla/1.10 [en] (Compatible; RISC OS 3.70; Oregano 1.10)</String>
  10221. <Description>Oregano browser for RISC OS</Description>
  10222. <Type>B</Type>
  10223. <Comment></Comment>
  10224. <Link1>http://www.crashnet.org.uk</Link1>
  10225. <Link2></Link2>
  10226. </user-agent>
  10227. <user-agent>
  10228. <ID>id_moz_730</ID>
  10229. <String>Mozilla/1.22 (compatible; MSIE 2.0d; Windows NT)</String>
  10230. <Description>IE 2.x WinNT</Description>
  10231. <Type>B</Type>
  10232. <Comment></Comment>
  10233. <Link1></Link1>
  10234. <Link2></Link2>
  10235. </user-agent>
  10236. <user-agent>
  10237. <ID>id_moz_733</ID>
  10238. <String>Mozilla/1.22 (compatible; MSIE 5.01; PalmOS 3.0) EudoraWeb 2</String>
  10239. <Description>EudoraWeb 2.0 browser (Eudora Internet Suite) for PalmOS</Description>
  10240. <Type>B</Type>
  10241. <Comment></Comment>
  10242. <Link1>http://www.eudora.com/products/unsupported/internetsuite/</Link1>
  10243. <Link2></Link2>
  10244. </user-agent>
  10245. <user-agent>
  10246. <ID>id_moz_1552</ID>
  10247. <String>Mozilla/2.0</String>
  10248. <Description>Dummy user agent - i.e. used by Namo Web Editor</Description>
  10249. <Type>B</Type>
  10250. <Comment></Comment>
  10251. <Link1>http://www.namo.com/</Link1>
  10252. <Link2></Link2>
  10253. </user-agent>
  10254. <user-agent>
  10255. <ID>id_moz_734</ID>
  10256. <String>Mozilla/2.0 (compatible; AOL 3.0; Mac_PowerPC)</String>
  10257. <Description>AOL Mac</Description>
  10258. <Type>B</Type>
  10259. <Comment></Comment>
  10260. <Link1></Link1>
  10261. <Link2></Link2>
  10262. </user-agent>
  10263. <user-agent>
  10264. <ID>id_moz_735</ID>
  10265. <String>Mozilla/2.0 (Compatible; AOL-IWENG 3.0; Win16)</String>
  10266. <Description>AOL Win 3.x</Description>
  10267. <Type>B</Type>
  10268. <Comment></Comment>
  10269. <Link1></Link1>
  10270. <Link2></Link2>
  10271. </user-agent>
  10272. <user-agent>
  10273. <ID>id_moz_736</ID>
  10274. <String>Mozilla/2.0 (compatible; Ask Jeeves)</String>
  10275. <Description>Ask Jeeves /Teoma robot</Description>
  10276. <Type>R</Type>
  10277. <Comment> 65.214.45.[x]xx</Comment>
  10278. <Link1>http://sp.ask.com</Link1>
  10279. <Link2></Link2>
  10280. </user-agent>
  10281. <user-agent>
  10282. <ID>id_moz_040707_2</ID>
  10283. <String>Mozilla/2.0 (compatible; Ask Jeeves/Teoma)</String>
  10284. <Description>Ask Jeeves /Teoma robot</Description>
  10285. <Type>R</Type>
  10286. <Comment>65.214.45.[x]xx</Comment>
  10287. <Link1>http://sp.ask.com</Link1>
  10288. <Link2></Link2>
  10289. </user-agent>
  10290. <user-agent>
  10291. <ID>id_moz_160506_3</ID>
  10292. <String>Mozilla/2.0 (compatible; Ask Jeeves/Teoma; http://about.ask.com/en/docs/about/webmasters.shtml) </String>
  10293. <Description>Ask Jeeves /Teoma robot</Description>
  10294. <Type>R</Type>
  10295. <Comment> 65.214.45.[x]xx</Comment>
  10296. <Link1>http://sp.ask.com</Link1>
  10297. <Link2></Link2>
  10298. </user-agent>
  10299. <user-agent>
  10300. <ID>id_moz_737</ID>
  10301. <String>Mozilla/2.0 (compatible; Ask Jeeves/Teoma; http://sp.ask.com/docs/about/tech_crawling.html)</String>
  10302. <Description>Ask Jeeves /Teoma robot</Description>
  10303. <Type>R</Type>
  10304. <Comment> 65.214.45.[x]xx</Comment>
  10305. <Link1>http://sp.ask.com</Link1>
  10306. <Link2></Link2>
  10307. </user-agent>
  10308. <user-agent>
  10309. <ID>id_moz_738</ID>
  10310. <String>Mozilla/2.0 (compatible; EZResult -- Internet Search Engine)</String>
  10311. <Description>Direct Hit Robot</Description>
  10312. <Type>R</Type>
  10313. <Comment></Comment>
  10314. <Link1>http://www.directhit.com</Link1>
  10315. <Link2></Link2>
  10316. </user-agent>
  10317. <user-agent>
  10318. <ID>id_moz_739</ID>
  10319. <String>Mozilla/2.0 (compatible; MS FrontPage x.0)</String>
  10320. <Description>MS Frontpage x.x web editor</Description>
  10321. <Type>B</Type>
  10322. <Comment></Comment>
  10323. <Link1></Link1>
  10324. <Link2></Link2>
  10325. </user-agent>
  10326. <user-agent>
  10327. <ID>id_moz_740</ID>
  10328. <String>Mozilla/2.0 (compatible; MSIE 2.1; Mac_PowerPC)</String>
  10329. <Description>IE 2.x Mac Power PC</Description>
  10330. <Type>B</Type>
  10331. <Comment></Comment>
  10332. <Link1></Link1>
  10333. <Link2></Link2>
  10334. </user-agent>
  10335. <user-agent>
  10336. <ID>id_moz_743</ID>
  10337. <String>Mozilla/2.0 (compatible; MSIE 3.02; Update a; AK; Windows NT)</String>
  10338. <Description>IE 3.x WinNT</Description>
  10339. <Type>B</Type>
  10340. <Comment></Comment>
  10341. <Link1></Link1>
  10342. <Link2></Link2>
  10343. </user-agent>
  10344. <user-agent>
  10345. <ID>id_moz_744</ID>
  10346. <String>Mozilla/2.0 (compatible; MSIE 3.02; Update a; AOL 3.0; Windows 95)</String>
  10347. <Description>IE 3.x AOL Win95</Description>
  10348. <Type>B</Type>
  10349. <Comment></Comment>
  10350. <Link1></Link1>
  10351. <Link2></Link2>
  10352. </user-agent>
  10353. <user-agent>
  10354. <ID>id_moz_741</ID>
  10355. <String>Mozilla/2.0 (compatible; MSIE 3.0; AK; Windows 95)</String>
  10356. <Description>IE 3.x Win95</Description>
  10357. <Type>B</Type>
  10358. <Comment></Comment>
  10359. <Link1></Link1>
  10360. <Link2></Link2>
  10361. </user-agent>
  10362. <user-agent>
  10363. <ID>id_moz_742</ID>
  10364. <String>Mozilla/2.0 (compatible; MSIE 3.0; Windows 3.1)</String>
  10365. <Description>IE 3.x Win 3.1</Description>
  10366. <Type>B</Type>
  10367. <Comment></Comment>
  10368. <Link1></Link1>
  10369. <Link2></Link2>
  10370. </user-agent>
  10371. <user-agent>
  10372. <ID>id_moz_745</ID>
  10373. <String>Mozilla/2.0 (compatible; MSIE 3.0B; Win32)</String>
  10374. <Description>IE 3.x WinXP</Description>
  10375. <Type>B</Type>
  10376. <Comment></Comment>
  10377. <Link1></Link1>
  10378. <Link2></Link2>
  10379. </user-agent>
  10380. <user-agent>
  10381. <ID>id_moz_746</ID>
  10382. <String>Mozilla/2.0 (compatible; NEWT ActiveX; Win32)</String>
  10383. <Description>Borland Delphi .OCX component used by WebCollector email harvester</Description>
  10384. <Type>S</Type>
  10385. <Comment></Comment>
  10386. <Link1></Link1>
  10387. <Link2></Link2>
  10388. </user-agent>
  10389. <user-agent>
  10390. <ID>id_moz_747</ID>
  10391. <String>Mozilla/2.0 (compatible; T-H-U-N-D-E-R-S-T-O-N-E)</String>
  10392. <Description>Thunderstone's Webinator Web indexing program</Description>
  10393. <Type>R</Type>
  10394. <Comment></Comment>
  10395. <Link1>http://www.thunderstone.com/texis/site/pages/Products.html</Link1>
  10396. <Link2></Link2>
  10397. </user-agent>
  10398. <user-agent>
  10399. <ID>id_moz_748</ID>
  10400. <String>Mozilla/2.0 compatible; Check&amp;Get 1.1x (Windows 98)</String>
  10401. <Description>Check&amp;Get bookmark and link checking tool</Description>
  10402. <Type>C</Type>
  10403. <Comment></Comment>
  10404. <Link1>http://www.activeurls.com</Link1>
  10405. <Link2></Link2>
  10406. </user-agent>
  10407. <user-agent>
  10408. <ID>id_moz_749</ID>
  10409. <String>Mozilla/2.01 (Win16; I)</String>
  10410. <Description>Netscape 2.x Win3.x International</Description>
  10411. <Type>B</Type>
  10412. <Comment></Comment>
  10413. <Link1></Link1>
  10414. <Link2></Link2>
  10415. </user-agent>
  10416. <user-agent>
  10417. <ID>id_moz_750</ID>
  10418. <String>Mozilla/2.02Gold (Win95; I)</String>
  10419. <Description>Netscape 2.x Gold Win95</Description>
  10420. <Type>B</Type>
  10421. <Comment></Comment>
  10422. <Link1></Link1>
  10423. <Link2></Link2>
  10424. </user-agent>
  10425. <user-agent>
  10426. <ID>id_moz_771</ID>
  10427. <String>Mozilla/3.0 (compatible)</String>
  10428. <Description>Faked user agent for diff. purposes i.e.: - some download manager - E-mail harvesting</Description>
  10429. <Type>S D</Type>
  10430. <Comment></Comment>
  10431. <Link1></Link1>
  10432. <Link2></Link2>
  10433. </user-agent>
  10434. <user-agent>
  10435. <ID>id_moz_751</ID>
  10436. <String>Mozilla/3.0 (compatible; AvantGo 3.2)</String>
  10437. <Description>AvantGo PDA browser</Description>
  10438. <Type>B</Type>
  10439. <Comment></Comment>
  10440. <Link1>http://avantgo.com/products/solutions/sfa.html</Link1>
  10441. <Link2></Link2>
  10442. </user-agent>
  10443. <user-agent>
  10444. <ID>id_moz_752</ID>
  10445. <String>Mozilla/3.0 (compatible; Fluffy the spider; http://www.searchhippo.com/; info@searchhippo.com)</String>
  10446. <Description>Searchhippo robot</Description>
  10447. <Type>R</Type>
  10448. <Comment></Comment>
  10449. <Link1>http://www.searchhippo.com</Link1>
  10450. <Link2></Link2>
  10451. </user-agent>
  10452. <user-agent>
  10453. <ID>id_moz_753</ID>
  10454. <String>Mozilla/3.0 (compatible; HP Web PrintSmart 04b0 1.0.1.34)</String>
  10455. <Description>HP Web PrintSmart (discontinued) - web page printing software</Description>
  10456. <Type>B D</Type>
  10457. <Comment></Comment>
  10458. <Link1></Link1>
  10459. <Link2></Link2>
  10460. </user-agent>
  10461. <user-agent>
  10462. <ID>id_moz_754</ID>
  10463. <String>Mozilla/3.0 (compatible; Indy Library)</String>
  10464. <Description>Internet Direct Library for Borland (often used as e-mail address collector and mass mailing tool)</Description>
  10465. <Type>S</Type>
  10466. <Comment></Comment>
  10467. <Link1>http://forge.novell.com/modules/xfmod/project/?indy-net</Link1>
  10468. <Link2>http://www.indyproject.org/</Link2>
  10469. </user-agent>
  10470. <user-agent>
  10471. <ID>id_moz_755</ID>
  10472. <String>Mozilla/3.0 (compatible; Linkman)</String>
  10473. <Description>Outertechs Linkman bookmark tool</Description>
  10474. <Type>C</Type>
  10475. <Comment></Comment>
  10476. <Link1>http://www.outertech.com</Link1>
  10477. <Link2></Link2>
  10478. </user-agent>
  10479. <user-agent>
  10480. <ID>id_moz_757</ID>
  10481. <String>Mozilla/3.0 (compatible; MuscatFerret/1.5.4; claude@euroferret.com)</String>
  10482. <Description>Euroferret robot</Description>
  10483. <Type>R</Type>
  10484. <Comment></Comment>
  10485. <Link1>http://www.euroferret.com</Link1>
  10486. <Link2></Link2>
  10487. </user-agent>
  10488. <user-agent>
  10489. <ID>id_moz_756</ID>
  10490. <String>Mozilla/3.0 (compatible; MuscatFerret/1.5; olly@muscat.co.uk)</String>
  10491. <Description>Euroferret robot</Description>
  10492. <Type>R</Type>
  10493. <Comment></Comment>
  10494. <Link1>http://www.euroferret.com</Link1>
  10495. <Link2></Link2>
  10496. </user-agent>
  10497. <user-agent>
  10498. <ID>id_moz_758</ID>
  10499. <String>Mozilla/3.0 (compatible; MuscatFerret/1.6.x; claude@euroferret.com)</String>
  10500. <Description>Euroferret robot</Description>
  10501. <Type>R</Type>
  10502. <Comment></Comment>
  10503. <Link1>http://www.euroferret.com</Link1>
  10504. <Link2></Link2>
  10505. </user-agent>
  10506. <user-agent>
  10507. <ID>id_moz_759</ID>
  10508. <String>Mozilla/3.0 (compatible; netart generator/1.0; libwww-perl/5.64)</String>
  10509. <Description>Netart Generator  - script generated random websites</Description>
  10510. <Type>R D</Type>
  10511. <Comment></Comment>
  10512. <Link1>http://www.obn.org/generator/</Link1>
  10513. <Link2></Link2>
  10514. </user-agent>
  10515. <user-agent>
  10516. <ID>id_moz_760</ID>
  10517. <String>Mozilla/3.0 (compatible; NetPositive/2.2)</String>
  10518. <Description>NetPositive BEOS browser</Description>
  10519. <Type>B</Type>
  10520. <Comment></Comment>
  10521. <Link1>http://www.tunetrackersystems.com/bedocs/documentation/User's%20Guide/03_network/Network07_NetPositive.html</Link1>
  10522. <Link2></Link2>
  10523. </user-agent>
  10524. <user-agent>
  10525. <ID>id_moz_761</ID>
  10526. <String>Mozilla/3.0 (compatible; Opera/3.0; Windows 3.1) v3.1</String>
  10527. <Description>Opera 3.x Win3.x</Description>
  10528. <Type>B</Type>
  10529. <Comment></Comment>
  10530. <Link1></Link1>
  10531. <Link2></Link2>
  10532. </user-agent>
  10533. <user-agent>
  10534. <ID>id_moz_762</ID>
  10535. <String>Mozilla/3.0 (compatible; Opera/3.0; Windows 95/NT4) 3.2</String>
  10536. <Description>Opera 3.x Win95/NT</Description>
  10537. <Type>B</Type>
  10538. <Comment></Comment>
  10539. <Link1></Link1>
  10540. <Link2></Link2>
  10541. </user-agent>
  10542. <user-agent>
  10543. <ID>id_moz_763</ID>
  10544. <String>Mozilla/3.0 (compatible; PerMan Surfer 3.0; Win95)</String>
  10545. <Description>Perman Surfer  bookmark tool</Description>
  10546. <Type>C</Type>
  10547. <Comment></Comment>
  10548. <Link1>http://www.bug.co.jp/nami-nori/</Link1>
  10549. <Link2></Link2>
  10550. </user-agent>
  10551. <user-agent>
  10552. <ID>id_moz_764</ID>
  10553. <String>Mozilla/3.0 (compatible; REL Software Web Link Validator 2.x)</String>
  10554. <Description>Web Link Validator link validation software</Description>
  10555. <Type>C</Type>
  10556. <Comment></Comment>
  10557. <Link1>http://www.relsoftware.com</Link1>
  10558. <Link2></Link2>
  10559. </user-agent>
  10560. <user-agent>
  10561. <ID>id_moz_765</ID>
  10562. <String>Mozilla/3.0 (compatible; scan4mail (advanced version) http://www.peterspages.net/?scan4mail)</String>
  10563. <Description>Scan4Mail online mail extraction service</Description>
  10564. <Type>S</Type>
  10565. <Comment></Comment>
  10566. <Link1>http://www.peterspages.net</Link1>
  10567. <Link2></Link2>
  10568. </user-agent>
  10569. <user-agent>
  10570. <ID>id_moz_220606_2</ID>
  10571. <String>Mozilla/3.0 (compatible; ScollSpider; http://www.webwobot.com)</String>
  10572. <Description>WebWobot UK search engine robot (82.43.129.2xx)</Description>
  10573. <Type>R</Type>
  10574. <Comment>s. also ScollSpider</Comment>
  10575. <Link1>http://www.webwobot.com/</Link1>
  10576. <Link2></Link2>
  10577. </user-agent>
  10578. <user-agent>
  10579. <ID>id_moz_766</ID>
  10580. <String>Mozilla/3.0 (compatible; Web Link Validator 2.x)Web Link Validator http://www.relsoftware.com/ link validation software</String>
  10581. <Description>Web Link Validator link validation software</Description>
  10582. <Type>C</Type>
  10583. <Comment></Comment>
  10584. <Link1>http://www.relsoftware.com</Link1>
  10585. <Link2></Link2>
  10586. </user-agent>
  10587. <user-agent>
  10588. <ID>id_moz_767</ID>
  10589. <String>Mozilla/3.0 (compatible; WebCapture x.x; Auto; Windows)</String>
  10590. <Description>Xelios Web Capture (now Wysigot) website downloading tool (Discontinued)</Description>
  10591. <Type>D</Type>
  10592. <Comment></Comment>
  10593. <Link1>http://www.xelios.com/</Link1>
  10594. <Link2>http://www.wysigot.com/int/about.html</Link2>
  10595. </user-agent>
  10596. <user-agent>
  10597. <ID>id_moz_768</ID>
  10598. <String>Mozilla/3.0 (compatible; Webinator-DEV01.home.iprospect.com/2.56)</String>
  10599. <Description>Iprospect search engine positioning using Thunderstone's Webinator</Description>
  10600. <Type>R</Type>
  10601. <Comment></Comment>
  10602. <Link1>http://www.iprospect.com</Link1>
  10603. <Link2>http://www.thunderstone.com/texis/site/pages/Products.html</Link2>
  10604. </user-agent>
  10605. <user-agent>
  10606. <ID>id_moz_769</ID>
  10607. <String>Mozilla/3.0 (compatible; Webinator-indexer.cyberalert.com/2.56)</String>
  10608. <Description>CyberAlert's Media Monitor using Thunderstone's Webinator</Description>
  10609. <Type>R</Type>
  10610. <Comment></Comment>
  10611. <Link1>http://www.cyberalert.com</Link1>
  10612. <Link2>http://www.thunderstone.com/texis/site/pages/Products.html</Link2>
  10613. </user-agent>
  10614. <user-agent>
  10615. <ID>id_moz_770</ID>
  10616. <String>Mozilla/3.0 (Compatible;Viking/1.8)</String>
  10617. <Description>Viking server user/client</Description>
  10618. <Type>P</Type>
  10619. <Comment></Comment>
  10620. <Link1>http://www.robtex.com</Link1>
  10621. <Link2></Link2>
  10622. </user-agent>
  10623. <user-agent>
  10624. <ID>id_moz_772</ID>
  10625. <String>Mozilla/3.0 (DreamPassport/3.0)</String>
  10626. <Description>One of DC-Sakuras download manager user-agent names</Description>
  10627. <Type>D</Type>
  10628. <Comment></Comment>
  10629. <Link1>http://www.dc-sakura.com</Link1>
  10630. <Link2></Link2>
  10631. </user-agent>
  10632. <user-agent>
  10633. <ID>id_moz_773</ID>
  10634. <String>Mozilla/3.0 (INGRID/3.0 MT; webcrawler@NOSPAMexperimental.net; http://aanmelden.ilse.nl/?aanmeld_mode=webhints)</String>
  10635. <Description>Ilse Netherlands robot (62.69.178.xx)</Description>
  10636. <Type>R</Type>
  10637. <Comment>s. also - INGRID/3.0 .. / IlseBot/1.0 ..</Comment>
  10638. <Link1>http://www.ilse.nl/</Link1>
  10639. <Link2></Link2>
  10640. </user-agent>
  10641. <user-agent>
  10642. <ID>id_moz_774</ID>
  10643. <String>Mozilla/3.0 (Liberate DTV 1.1)</String>
  10644. <Description>Liberate DTV server suite / TV-emulator</Description>
  10645. <Type>B P</Type>
  10646. <Comment></Comment>
  10647. <Link1>http://www.liberate.com</Link1>
  10648. <Link2></Link2>
  10649. </user-agent>
  10650. <user-agent>
  10651. <ID>id_moz_775</ID>
  10652. <String>Mozilla/3.0 (Planetweb/2.100 JS SSL US; Dreamcast US)</String>
  10653. <Description>Planetweb 2.1 Browser (discontinued) for Dreamcast</Description>
  10654. <Type>B</Type>
  10655. <Comment></Comment>
  10656. <Link1>http://www.planetweb.com</Link1>
  10657. <Link2></Link2>
  10658. </user-agent>
  10659. <user-agent>
  10660. <ID>id_moz_776</ID>
  10661. <String>Mozilla/3.0 (Slurp.so/Goo; slurp@inktomi.com; http://www.inktomi.com/slurp.html)</String>
  10662. <Description>http://www.goo.ne.jp /Inktomi robot</Description>
  10663. <Type>R</Type>
  10664. <Comment></Comment>
  10665. <Link1>http://www.goo.ne.jp</Link1>
  10666. <Link2></Link2>
  10667. </user-agent>
  10668. <user-agent>
  10669. <ID>id_moz_777</ID>
  10670. <String>Mozilla/3.0 (Slurp/cat; slurp@inktomi.com; http://www.inktomi.com/slurp.html)</String>
  10671. <Description>Inktomi (Hotbot-Lycos-NBCi) robot - 72.30.61.xx(x)</Description>
  10672. <Type>R</Type>
  10673. <Comment>s. also Slurpy Verifier ...</Comment>
  10674. <Link1>http://www.inktomi.com/</Link1>
  10675. <Link2></Link2>
  10676. </user-agent>
  10677. <user-agent>
  10678. <ID>id_moz_778</ID>
  10679. <String>Mozilla/3.0 (Slurp/si; slurp@inktomi.com; http://www.inktomi.com/slurp.html)</String>
  10680. <Description>Inktomi (Hotbot-Lycos-NBCi) robot - 72.30.61.xx(x)</Description>
  10681. <Type>R</Type>
  10682. <Comment>s. also Slurpy Verifier ...</Comment>
  10683. <Link1>http://www.inktomi.com/</Link1>
  10684. <Link2></Link2>
  10685. </user-agent>
  10686. <user-agent>
  10687. <ID>id_moz_779</ID>
  10688. <String>Mozilla/3.0 (Vagabondo/1.1 MT; webcrawler@NOSPAMwise-guys.nl; http://webagent.wise-guys.nl/)</String>
  10689. <Description>WiseGuys robot Netherlands - 82.94.216.2</Description>
  10690. <Type>R</Type>
  10691. <Comment>s. also Vagabondo</Comment>
  10692. <Link1>http://www.wise-guys.nl/Contact/index.php?botselected=webagents&amp;lang=uk</Link1>
  10693. <Link2></Link2>
  10694. </user-agent>
  10695. <user-agent>
  10696. <ID>id_moz_780</ID>
  10697. <String>Mozilla/3.0 (Vagabondo/1.x MT; webagent@wise-guys.nl; http://webagent.wise-guys.nl/)</String>
  10698. <Description>WiseGuys robot Netherlands - 82.94.216.2</Description>
  10699. <Type>R</Type>
  10700. <Comment>s. also Vagabondo</Comment>
  10701. <Link1>http://www.wise-guys.nl/Contact/index.php?botselected=webagents&amp;lang=uk</Link1>
  10702. <Link2></Link2>
  10703. </user-agent>
  10704. <user-agent>
  10705. <ID>id_moz_781</ID>
  10706. <String>Mozilla/3.0 (Vagabondo/2.0 MT; webcrawler@NOSPAMexperimental.net; http://aanmelden.ilse.nl/?aanmeld_mode=webhints)</String>
  10707. <Description>Ilse Netherlands robot</Description>
  10708. <Type>R</Type>
  10709. <Comment></Comment>
  10710. <Link1>http://www.ilse.nl</Link1>
  10711. <Link2></Link2>
  10712. </user-agent>
  10713. <user-agent>
  10714. <ID>id_moz_782</ID>
  10715. <String>Mozilla/3.0 (Vagabondo/2.0 MT; webcrawler@NOSPAMwise-guys.nl; http://webagent.wise-guys.nl/)</String>
  10716. <Description>WiseGuys robot Netherlands - 82.94.216.2</Description>
  10717. <Type>R</Type>
  10718. <Comment>s. also Vagabondo</Comment>
  10719. <Link1>http://www.wise-guys.nl/Contact/index.php?botselected=webagents&amp;lang=uk</Link1>
  10720. <Link2></Link2>
  10721. </user-agent>
  10722. <user-agent>
  10723. <ID>id_moz_783</ID>
  10724. <String>Mozilla/3.0 (Win16; I)</String>
  10725. <Description>Netscape 3.x Win3.x</Description>
  10726. <Type>B</Type>
  10727. <Comment></Comment>
  10728. <Link1></Link1>
  10729. <Link2></Link2>
  10730. </user-agent>
  10731. <user-agent>
  10732. <ID>id_moz_784</ID>
  10733. <String>Mozilla/3.0 (Win95; I)</String>
  10734. <Description>Netscape 3.x Win95</Description>
  10735. <Type>B</Type>
  10736. <Comment></Comment>
  10737. <Link1></Link1>
  10738. <Link2></Link2>
  10739. </user-agent>
  10740. <user-agent>
  10741. <ID>id_moz_785</ID>
  10742. <String>Mozilla/3.0 (WinNT; I)</String>
  10743. <Description>Netscape 3.x WinNT</Description>
  10744. <Type>B</Type>
  10745. <Comment></Comment>
  10746. <Link1></Link1>
  10747. <Link2></Link2>
  10748. </user-agent>
  10749. <user-agent>
  10750. <ID>id_moz_786</ID>
  10751. <String>Mozilla/3.0 (WorldGate Gazelle 3.5.1 build 11; FreeBSD2.2.8-STABLE)</String>
  10752. <Description>Netscape 3.x FreeBSD</Description>
  10753. <Type>B</Type>
  10754. <Comment></Comment>
  10755. <Link1></Link1>
  10756. <Link2></Link2>
  10757. </user-agent>
  10758. <user-agent>
  10759. <ID>id_moz_787</ID>
  10760. <String>Mozilla/3.0 (X11; I; OSF1 V4.0 alpha)</String>
  10761. <Description>Netscape 3.x OSF1 V4.0 alpha </Description>
  10762. <Type>B</Type>
  10763. <Comment></Comment>
  10764. <Link1></Link1>
  10765. <Link2></Link2>
  10766. </user-agent>
  10767. <user-agent>
  10768. <ID>id_moz_788</ID>
  10769. <String>Mozilla/3.0 NAVIO_AOLTV (11; 13; Philips; PH200; 1; R2.0C36_AOL.0110OPTIK; R2.0.0139d_OPTIK)</String>
  10770. <Description>AOL Web TV</Description>
  10771. <Type>B</Type>
  10772. <Comment></Comment>
  10773. <Link1></Link1>
  10774. <Link2></Link2>
  10775. </user-agent>
  10776. <user-agent>
  10777. <ID>id_moz_789</ID>
  10778. <String>Mozilla/3.0 WebTV/1.2 (compatible; MSIE 2.0)</String>
  10779. <Description>WebTV</Description>
  10780. <Type>B</Type>
  10781. <Comment></Comment>
  10782. <Link1></Link1>
  10783. <Link2></Link2>
  10784. </user-agent>
  10785. <user-agent>
  10786. <ID>id_moz_790</ID>
  10787. <String>Mozilla/3.01 (compatible; AmigaVoyager/2.95; AmigaOS/MC680x0)</String>
  10788. <Description>Amiga Voyager Browser Amiga</Description>
  10789. <Type>B</Type>
  10790. <Comment></Comment>
  10791. <Link1></Link1>
  10792. <Link2></Link2>
  10793. </user-agent>
  10794. <user-agent>
  10795. <ID>id_moz_791</ID>
  10796. <String>Mozilla/3.01 (Compatible; Links2Go Similarity Engine)</String>
  10797. <Description>Links2Go robot</Description>
  10798. <Type>R</Type>
  10799. <Comment></Comment>
  10800. <Link1>http://www.links2go.com</Link1>
  10801. <Link2></Link2>
  10802. </user-agent>
  10803. <user-agent>
  10804. <ID>id_moz_792</ID>
  10805. <String>Mozilla/3.01 (compatible; Netbox/3.5 R92; Linux 2.2)</String>
  10806. <Description>Netgem Netbox cable modem TV Box Linux</Description>
  10807. <Type>B</Type>
  10808. <Comment></Comment>
  10809. <Link1>http://www.netgem.com</Link1>
  10810. <Link2></Link2>
  10811. </user-agent>
  10812. <user-agent>
  10813. <ID>id_moz_793</ID>
  10814. <String>Mozilla/3.01-C-MACOS8 (Macintosh; I; PPC)</String>
  10815. <Description>Netscape 3.x Mac</Description>
  10816. <Type>B</Type>
  10817. <Comment></Comment>
  10818. <Link1></Link1>
  10819. <Link2></Link2>
  10820. </user-agent>
  10821. <user-agent>
  10822. <ID>id_moz_794</ID>
  10823. <String>Mozilla/3.01Gold (X11; I; Linux 2.0.32 i486)</String>
  10824. <Description>Netscape 3.x Linux</Description>
  10825. <Type>B</Type>
  10826. <Comment></Comment>
  10827. <Link1></Link1>
  10828. <Link2></Link2>
  10829. </user-agent>
  10830. <user-agent>
  10831. <ID>id_moz_795</ID>
  10832. <String>Mozilla/3.01Gold (X11; I; SunOS 5.5.1 sun4m)</String>
  10833. <Description>Netscape 3.x SunOS</Description>
  10834. <Type>B</Type>
  10835. <Comment></Comment>
  10836. <Link1></Link1>
  10837. <Link2></Link2>
  10838. </user-agent>
  10839. <user-agent>
  10840. <ID>id_moz_796</ID>
  10841. <String>Mozilla/3.01SGoldC-SGI (X11; I; IRIX 6.3 IP32)</String>
  10842. <Description>Netscape 3.x Irix</Description>
  10843. <Type>B</Type>
  10844. <Comment></Comment>
  10845. <Link1></Link1>
  10846. <Link2></Link2>
  10847. </user-agent>
  10848. <user-agent>
  10849. <ID>id_moz_797</ID>
  10850. <String>Mozilla/3.04 (compatible; ANTFresco/2.13; RISC OS 4.02)</String>
  10851. <Description>ANT Fresco Browser Risc OS</Description>
  10852. <Type>B</Type>
  10853. <Comment></Comment>
  10854. <Link1>http://www.antlimited.com</Link1>
  10855. <Link2></Link2>
  10856. </user-agent>
  10857. <user-agent>
  10858. <ID>id_moz_798</ID>
  10859. <String>Mozilla/3.04 (compatible; NCBrowser/2.35; ANTFresco/2.17; RISC OS-NC 5.13 Laz1UK1309)</String>
  10860. <Description>NCBrowser ANT Fresco Browser Risc OS</Description>
  10861. <Type>B</Type>
  10862. <Comment></Comment>
  10863. <Link1>http://www.antlimited.com</Link1>
  10864. <Link2></Link2>
  10865. </user-agent>
  10866. <user-agent>
  10867. <ID>id_moz_281106_1</ID>
  10868. <String>Mozilla/3.04 (compatible;QNX Voyager 2.03B ;Photon)</String>
  10869. <Description>QNX OS Voyager embedded browser</Description>
  10870. <Type>B</Type>
  10871. <Comment></Comment>
  10872. <Link1>http://www.qnx.com/products/browsers/</Link1>
  10873. <Link2></Link2>
  10874. </user-agent>
  10875. <user-agent>
  10876. <ID>id_moz_799</ID>
  10877. <String>Mozilla/3.x (I-Opener 1.1; Netpliance)</String>
  10878. <Description>I-Opener (was www.netpliance.com/) web PC</Description>
  10879. <Type>B</Type>
  10880. <Comment></Comment>
  10881. <Link1></Link1>
  10882. <Link2></Link2>
  10883. </user-agent>
  10884. <user-agent>
  10885. <ID>id_moz_100406_3</ID>
  10886. <String>Mozilla/4.0</String>
  10887. <Description>Yahoo Mindset: Intent-driven Search (66.228.182.1xx)</Description>
  10888. <Type>R</Type>
  10889. <Comment>s. also Yahoo! Mindset</Comment>
  10890. <Link1>http://mindset.research.yahoo.com/</Link1>
  10891. <Link2></Link2>
  10892. </user-agent>
  10893. <user-agent>
  10894. <ID>id_moz_800</ID>
  10895. <String>Mozilla/4.0 (agadine3.0) www.agada.de</String>
  10896. <Description>Agada search (Germany) robot</Description>
  10897. <Type>R</Type>
  10898. <Comment>s. also agadine/1.x.x</Comment>
  10899. <Link1>http://www.agada.de</Link1>
  10900. <Link2></Link2>
  10901. </user-agent>
  10902. <user-agent>
  10903. <ID>id_moz_290406_1</ID>
  10904. <String>Mozilla/4.0 (Compatible); URLBase 6</String>
  10905. <Description>URLBase 6 bookmark manager</Description>
  10906. <Type>C</Type>
  10907. <Comment>s. also URLBase/6.x</Comment>
  10908. <Link1>http://www.terriadev.com/products/urlbase/</Link1>
  10909. <Link2></Link2>
  10910. </user-agent>
  10911. <user-agent>
  10912. <ID>id_moz_895</ID>
  10913. <String>Mozilla/4.0 (compatible: AstraSpider V.2.1 : astrafind.com)</String>
  10914. <Description>Astrafind! adult search robot (66.98.252.xx)</Description>
  10915. <Type>R</Type>
  10916. <Comment></Comment>
  10917. <Link1>http://www.astrafind.com</Link1>
  10918. <Link2></Link2>
  10919. </user-agent>
  10920. <user-agent>
  10921. <ID>id_moz_021205_1</ID>
  10922. <String>Mozilla/4.0 (compatible;  Vagabondo/2.2; webcrawler at wise-guys dot nl; http://webagent.wise-guys.nl/)</String>
  10923. <Description>WiseGuys robot Netherland - 82.94.216.2</Description>
  10924. <Type>R</Type>
  10925. <Comment>s.also - Mozilla/3.0 (Vagabondo... - Vagabondo..</Comment>
  10926. <Link1>http://www.wise-guys.nl/Contact/index.php?botselected=webagents&amp;lang=uk</Link1>
  10927. <Link2></Link2>
  10928. </user-agent>
  10929. <user-agent>
  10930. <ID>id_moz_240906_1</ID>
  10931. <String>Mozilla/4.0 (compatible;  Vagabondo/4.0Beta; webcrawler at wise-guys dot nl; http://webagent.wise-guys.nl/)</String>
  10932. <Description>WiseGuys robot Netherland - 82.94.216.2</Description>
  10933. <Type>R</Type>
  10934. <Comment>s.also - Mozilla/3.0 (Vagabondo... - Vagabondo..</Comment>
  10935. <Link1>http://www.wise-guys.nl/Contact/index.php?botselected=webagents&amp;lang=uk</Link1>
  10936. <Link2></Link2>
  10937. </user-agent>
  10938. <user-agent>
  10939. <ID>id_moz_100208_1</ID>
  10940. <String>Mozilla/4.0 (compatible; &lt;a href=http://www.reget.com>ReGet Deluxe 5.1&lt;/a>; Windows NT 5.1)</String>
  10941. <Description>ReGet Deluxe! download manager</Description>
  10942. <Type>D</Type>
  10943. <Comment></Comment>
  10944. <Link1>http://deluxe.reget.com/en/</Link1>
  10945. <Link2></Link2>
  10946. </user-agent>
  10947. <user-agent>
  10948. <ID>id_moz_801</ID>
  10949. <String>Mozilla/4.0 (compatible; Advanced Email Extractor v2.xx)</String>
  10950. <Description>Advanced Email Extractor e-mail collector (spam bot)</Description>
  10951. <Type>S</Type>
  10952. <Comment></Comment>
  10953. <Link1>http://www.mailutilities.com</Link1>
  10954. <Link2></Link2>
  10955. </user-agent>
  10956. <user-agent>
  10957. <ID>id_moz_802</ID>
  10958. <String>Mozilla/4.0 (compatible; Arachmo)</String>
  10959. <Description>Arachmo Spider - web site file extraction tool</Description>
  10960. <Type>D</Type>
  10961. <Comment></Comment>
  10962. <Link1>http://bbbearchan.hp.infoseek.co.jp/</Link1>
  10963. <Link2></Link2>
  10964. </user-agent>
  10965. <user-agent>
  10966. <ID>id_moz_804</ID>
  10967. <String>Mozilla/4.0 (compatible; BorderManager 3.0)</String>
  10968. <Description>Novell Border Manager security suite</Description>
  10969. <Type>P</Type>
  10970. <Comment></Comment>
  10971. <Link1></Link1>
  10972. <Link2></Link2>
  10973. </user-agent>
  10974. <user-agent>
  10975. <ID>id_moz_090807_3</ID>
  10976. <String>Mozilla/4.0 (compatible; BOTW Spider; +http://botw.org)</String>
  10977. <Description>Best of the Web directory link checking</Description>
  10978. <Type>C</Type>
  10979. <Comment>209.11.177.1xx</Comment>
  10980. <Link1>http://botw.org/</Link1>
  10981. <Link2></Link2>
  10982. </user-agent>
  10983. <user-agent>
  10984. <ID>id_moz_803</ID>
  10985. <String>Mozilla/4.0 (compatible; B_L_I_T_Z_B_O_T)</String>
  10986. <Description>Blitzsuche Germany robot</Description>
  10987. <Type>R</Type>
  10988. <Comment>s. BlitzBOT@tricus.net</Comment>
  10989. <Link1>http://blitzsuche.rp-online.de/</Link1>
  10990. <Link2></Link2>
  10991. </user-agent>
  10992. <user-agent>
  10993. <ID>id_moz_805</ID>
  10994. <String>Mozilla/4.0 (compatible; Cerberian Drtrs Version-3.2-Build-0)</String>
  10995. <Description>Content Control from Blue Coat</Description>
  10996. <Type>P</Type>
  10997. <Comment></Comment>
  10998. <Link1>http://www.cerberian.com</Link1>
  10999. <Link2></Link2>
  11000. </user-agent>
  11001. <user-agent>
  11002. <ID>id_moz_080706_1</ID>
  11003. <String>Mozilla/4.0 (compatible; Check&amp;Get 3.0; Windows NT)</String>
  11004. <Description>Check&amp;Get bookmark manager&#44; web change monitor and archiver</Description>
  11005. <Type>C</Type>
  11006. <Comment></Comment>
  11007. <Link1>http://activeurls.com/en/</Link1>
  11008. <Link2></Link2>
  11009. </user-agent>
  11010. <user-agent>
  11011. <ID>id_moz_806</ID>
  11012. <String>Mozilla/4.0 (compatible; ChristCrawler.com ChristCrawler@ChristCENTRAL.com)</String>
  11013. <Description>Christcentral.com Christcrawler (was www.christcrawler.com)</Description>
  11014. <Type>R</Type>
  11015. <Comment>s.also ChristCRAWLER</Comment>
  11016. <Link1></Link1>
  11017. <Link2></Link2>
  11018. </user-agent>
  11019. <user-agent>
  11020. <ID>id_moz_301105_4</ID>
  11021. <String>Mozilla/4.0 (compatible; crawlx&#44; crawler@trd.overture.com)</String>
  11022. <Description>Yahoo Search Marketing crawler (68.142.211.1xx)</Description>
  11023. <Type>R</Type>
  11024. <Comment></Comment>
  11025. <Link1>http://www.content.overture.com/d/</Link1>
  11026. <Link2></Link2>
  11027. </user-agent>
  11028. <user-agent>
  11029. <ID>id_moz_011207_1</ID>
  11030. <String>Mozilla/4.0 (compatible; DAUMOA-video; +http://ws.daum.net/aboutkr.html)</String>
  11031. <Description>DAUMOA - Daum search Korea robot (211.115.109.xxx)</Description>
  11032. <Type>R</Type>
  11033. <Comment>s. also RaBot</Comment>
  11034. <Link1>http://www.daum.net/</Link1>
  11035. <Link2>http://ws.daum.net/abouten.html</Link2>
  11036. </user-agent>
  11037. <user-agent>
  11038. <ID>id_moz_131206_1</ID>
  11039. <String>Mozilla/4.0 (compatible; DepSpid/5.0x; +http://about.depspid.net)</String>
  11040. <Description>DepSpid distributed web crawler for link dependencies</Description>
  11041. <Type>C</Type>
  11042. <Comment></Comment>
  11043. <Link1>http://depspid.net/</Link1>
  11044. <Link2>http://about.depspid.net/</Link2>
  11045. </user-agent>
  11046. <user-agent>
  11047. <ID>id_moz_807</ID>
  11048. <String>Mozilla/4.0 (compatible; DnloadMage 1.0)</String>
  11049. <Description>Download Mage download manager</Description>
  11050. <Type>D</Type>
  11051. <Comment></Comment>
  11052. <Link1>http://www.dlmage.com</Link1>
  11053. <Link2></Link2>
  11054. </user-agent>
  11055. <user-agent>
  11056. <ID>id_moz_808</ID>
  11057. <String>Mozilla/4.0 (compatible; FastCrawler3 support-fastcrawler3@fast.no)</String>
  11058. <Description>Fast/Alltheweb crawler</Description>
  11059. <Type>R</Type>
  11060. <Comment></Comment>
  11061. <Link1>http://www.alltheweb.com</Link1>
  11062. <Link2></Link2>
  11063. </user-agent>
  11064. <user-agent>
  11065. <ID>id_moz_809</ID>
  11066. <String>Mozilla/4.0 (compatible; FDSE robot)</String>
  11067. <Description>Fluid Dynamics Search Engine (FDSE) robot used by Abadoor.de</Description>
  11068. <Type>R</Type>
  11069. <Comment></Comment>
  11070. <Link1>http://www.xav.com/scripts/search/</Link1>
  11071. <Link2>http://www.abadoor.de/</Link2>
  11072. </user-agent>
  11073. <user-agent>
  11074. <ID>id_moz_161105_2</ID>
  11075. <String>Mozilla/4.0 (compatible; GPU p2p crawler http://gpu.sourceforge.net/search_engine.php)</String>
  11076. <Description>GPU Distributed Search Engine crawler</Description>
  11077. <Type>R</Type>
  11078. <Comment></Comment>
  11079. <Link1>http://gpu.sourceforge.net/search_engine.php</Link1>
  11080. <Link2></Link2>
  11081. </user-agent>
  11082. <user-agent>
  11083. <ID>id_moz_810</ID>
  11084. <String>Mozilla/4.0 (compatible; grub-client-0.2.x; Crawl your stuff with http://grub.org)</String>
  11085. <Description>Grub open source crawler</Description>
  11086. <Type>R</Type>
  11087. <Comment></Comment>
  11088. <Link1>http://www.grub.org</Link1>
  11089. <Link2></Link2>
  11090. </user-agent>
  11091. <user-agent>
  11092. <ID>id_moz_811</ID>
  11093. <String>Mozilla/4.0 (compatible; grub-client-0.3.x; Crawl your own stuff with http://grub.org)</String>
  11094. <Description>Grub open source crawler</Description>
  11095. <Type>R</Type>
  11096. <Comment></Comment>
  11097. <Link1>http://www.grub.org</Link1>
  11098. <Link2></Link2>
  11099. </user-agent>
  11100. <user-agent>
  11101. <ID>id_moz_812</ID>
  11102. <String>Mozilla/4.0 (compatible; grub-client-2.x)</String>
  11103. <Description>Grub open source crawler used by Looksmart ( 64.241.242.xx)</Description>
  11104. <Type>R</Type>
  11105. <Comment></Comment>
  11106. <Link1>http://www.grub.org</Link1>
  11107. <Link2></Link2>
  11108. </user-agent>
  11109. <user-agent>
  11110. <ID>id_moz_261205_2</ID>
  11111. <String>Mozilla/4.0 (compatible; ibisBrowser)</String>
  11112. <Description>ibisBrowser Japanese mobile browser</Description>
  11113. <Type>B</Type>
  11114. <Comment></Comment>
  11115. <Link1>http://www.ibis.ne.jp/products/ibisBrowser/index.html</Link1>
  11116. <Link2></Link2>
  11117. </user-agent>
  11118. <user-agent>
  11119. <ID>id_moz_813</ID>
  11120. <String>Mozilla/4.0 (compatible; ICS 1.2.xxx)</String>
  11121. <Description>Novell iChain Cool Solutions caching</Description>
  11122. <Type>P</Type>
  11123. <Comment></Comment>
  11124. <Link1>http://www.novell.com</Link1>
  11125. <Link2></Link2>
  11126. </user-agent>
  11127. <user-agent>
  11128. <ID>id_moz_220206_1</ID>
  11129. <String>Mozilla/4.0 (compatible; IE-Favorites-Check-0.5)</String>
  11130. <Description>IE Favorites Check - Bookmark manager</Description>
  11131. <Type>C</Type>
  11132. <Comment></Comment>
  11133. <Link1>http://secure.sintraweb.net/public/soft/iefc/</Link1>
  11134. <Link2></Link2>
  11135. </user-agent>
  11136. <user-agent>
  11137. <ID>id_moz_814</ID>
  11138. <String>Mozilla/4.0 (compatible; Iplexx Spider/1.0 http://www.iplexx.at)</String>
  11139. <Description>Iplexx Austria (webhosting company) logfile spamming bot</Description>
  11140. <Type>S</Type>
  11141. <Comment></Comment>
  11142. <Link1>http://www.iplexx.at</Link1>
  11143. <Link2></Link2>
  11144. </user-agent>
  11145. <user-agent>
  11146. <ID>id_moz_020208_1</ID>
  11147. <String>Mozilla/4.0 (compatible; KeepNI web site monitor)</String>
  11148. <Description>KeepNi Monitors - Web site monitoring / link checking tool</Description>
  11149. <Type>C</Type>
  11150. <Comment></Comment>
  11151. <Link1>http://www.keepni.com/</Link1>
  11152. <Link2></Link2>
  11153. </user-agent>
  11154. <user-agent>
  11155. <ID>id_moz_815</ID>
  11156. <String>Mozilla/4.0 (compatible; Link Utility; http://net-promoter.com)</String>
  11157. <Description>NetPromoter Link Utility link checking tool</Description>
  11158. <Type>C</Type>
  11159. <Comment>s. also - Mozilla/4.0 (compatible; NetPromoter Spider ...</Comment>
  11160. <Link1>http://www.net-promoter.com/</Link1>
  11161. <Link2></Link2>
  11162. </user-agent>
  11163. <user-agent>
  11164. <ID>id_moz_816</ID>
  11165. <String>Mozilla/4.0 (compatible; Lotus-Notes/5.0; Windows-NT)</String>
  11166. <Description>Lotus Notes 5.0 browser</Description>
  11167. <Type>B</Type>
  11168. <Comment></Comment>
  11169. <Link1>http://www-10.lotus.com/ldd/whatisnotes#Release%205.0%3A%20Web%20integration%20by%20d</Link1>
  11170. <Link2></Link2>
  11171. </user-agent>
  11172. <user-agent>
  11173. <ID>id_moz_819</ID>
  11174. <String>Mozilla/4.0 (compatible; MSIE 4.01; AOL 4.0; Windows 98)</String>
  11175. <Description>IE 4.x AOL Win98</Description>
  11176. <Type>B</Type>
  11177. <Comment></Comment>
  11178. <Link1></Link1>
  11179. <Link2></Link2>
  11180. </user-agent>
  11181. <user-agent>
  11182. <ID>id_moz_820</ID>
  11183. <String>Mozilla/4.0 (compatible; MSIE 4.01; Mac_PowerPC)</String>
  11184. <Description>IE 4.x Mac Power PC</Description>
  11185. <Type>B</Type>
  11186. <Comment></Comment>
  11187. <Link1></Link1>
  11188. <Link2></Link2>
  11189. </user-agent>
  11190. <user-agent>
  11191. <ID>id_moz_821</ID>
  11192. <String>Mozilla/4.0 (compatible; MSIE 4.01; MSIECrawler; Windows 95)</String>
  11193. <Description>Internet Explorer 4.0 URL check</Description>
  11194. <Type>B C</Type>
  11195. <Comment></Comment>
  11196. <Link1></Link1>
  11197. <Link2></Link2>
  11198. </user-agent>
  11199. <user-agent>
  11200. <ID>id_moz_090506_1</ID>
  11201. <String>Mozilla/4.0 (compatible; MSIE 4.01; Vonna.com b o t)</String>
  11202. <Description>Vonna search robot</Description>
  11203. <Type>R</Type>
  11204. <Comment></Comment>
  11205. <Link1>http://www.vonna.com/</Link1>
  11206. <Link2></Link2>
  11207. </user-agent>
  11208. <user-agent>
  11209. <ID>id_moz_822</ID>
  11210. <String>Mozilla/4.0 (compatible; MSIE 4.01; Windows 95)</String>
  11211. <Description>IE 4.x Win95</Description>
  11212. <Type>B</Type>
  11213. <Comment></Comment>
  11214. <Link1></Link1>
  11215. <Link2></Link2>
  11216. </user-agent>
  11217. <user-agent>
  11218. <ID>id_moz_823</ID>
  11219. <String>Mozilla/4.0 (compatible; MSIE 4.01; Windows CE; MSN Companion 2.0; 800x600; Compaq)</String>
  11220. <Description>IE PDA Browser Windows CE</Description>
  11221. <Type>B</Type>
  11222. <Comment></Comment>
  11223. <Link1></Link1>
  11224. <Link2></Link2>
  11225. </user-agent>
  11226. <user-agent>
  11227. <ID>id_moz_100109_4</ID>
  11228. <String>Mozilla/4.0 (compatible; MSIE 4.01; Windows CE; PPC; 240x320; SPV M700; OpVer 19.123.2.733) OrangeBot-Mobile 2008.0 (mobilesearch.support@orange-ftgroup.com)</String>
  11229. <Description>Orange France robot for mobiles</Description>
  11230. <Type>R</Type>
  11231. <Comment>81.52.143.xx</Comment>
  11232. <Link1>http://www.orange.com/en_EN/</Link1>
  11233. <Link2></Link2>
  11234. </user-agent>
  11235. <user-agent>
  11236. <ID>id_moz_010308_2</ID>
  11237. <String>Mozilla/4.0 (compatible; MSIE 4.01; Windows CE; PPS; 240x320)</String>
  11238. <Description>IE for Windows CE on a PocketPC (HP iPAQ)</Description>
  11239. <Type>B</Type>
  11240. <Comment></Comment>
  11241. <Link1>http://www.hp.com/</Link1>
  11242. <Link2></Link2>
  11243. </user-agent>
  11244. <user-agent>
  11245. <ID>id_moz_824</ID>
  11246. <String>Mozilla/4.0 (compatible; MSIE 4.01; Windows NT Windows CE)</String>
  11247. <Description>IE PDA Browser Windows CE</Description>
  11248. <Type>B</Type>
  11249. <Comment></Comment>
  11250. <Link1></Link1>
  11251. <Link2></Link2>
  11252. </user-agent>
  11253. <user-agent>
  11254. <ID>id_moz_826</ID>
  11255. <String>Mozilla/4.0 (compatible; MSIE 4.01; Windows NT)</String>
  11256. <Description>IE 4.x WinNT</Description>
  11257. <Type>B</Type>
  11258. <Comment></Comment>
  11259. <Link1></Link1>
  11260. <Link2></Link2>
  11261. </user-agent>
  11262. <user-agent>
  11263. <ID>id_moz_825</ID>
  11264. <String>Mozilla/4.0 (compatible; MSIE 4.01; Windows NT; MS Search 4.0 Robot) Microsoft</String>
  11265. <Description>diff. IPs / services i.e.: - Microsoft server information robot (see link) - Okanagan Internet Junction web filter (robot)</Description>
  11266. <Type></Type>
  11267. <Comment></Comment>
  11268. <Link1>http://www.webmasterworld.com/forum11/841.htm</Link1>
  11269. <Link2>http://www.junction.net/</Link2>
  11270. </user-agent>
  11271. <user-agent>
  11272. <ID>id_moz_010406_3</ID>
  11273. <String>Mozilla/4.0 (compatible; MSIE 4.0; Windows NT; Site Server 3.0 Robot) ACR</String>
  11274. <Description>Unknown robot from American College of Radiology (ACR) running MS Site Server</Description>
  11275. <Type>R C</Type>
  11276. <Comment>208.236.180.xx</Comment>
  11277. <Link1>http://www.acr.org/s_acr/index.asp</Link1>
  11278. <Link2>http://www.microsoft.com/commerceserver/default.mspx</Link2>
  11279. </user-agent>
  11280. <user-agent>
  11281. <ID>id_moz_817</ID>
  11282. <String>Mozilla/4.0 (compatible; MSIE 4.0; Windows NT; Site Server 3.0 Robot) Indonesia Interactive</String>
  11283. <Description>Indonesia Interactive Web-portal robot on MS Site Server</Description>
  11284. <Type>R</Type>
  11285. <Comment></Comment>
  11286. <Link1>http://www.i-2.co.id/</Link1>
  11287. <Link2>http://www.microsoft.com/commerceserver/default.mspx</Link2>
  11288. </user-agent>
  11289. <user-agent>
  11290. <ID>id_moz_818</ID>
  11291. <String>Mozilla/4.0 (compatible; MSIE 4.0; Windows NT; Site Server 3.0 Robot) WebQuest Designs</String>
  11292. <Description>Webquestdesigns hosting</Description>
  11293. <Type></Type>
  11294. <Comment></Comment>
  11295. <Link1>http://www.webquestdesigns.com</Link1>
  11296. <Link2></Link2>
  11297. </user-agent>
  11298. <user-agent>
  11299. <ID>id_moz_841</ID>
  11300. <String>Mozilla/4.0 (compatible; MSIE 5.01; Windows 95) via &lt;B>Avirt Gateway Server&lt;/B> v4.0</String>
  11301. <Description>Avirt Gateway proxy server</Description>
  11302. <Type>P</Type>
  11303. <Comment></Comment>
  11304. <Link1>http://www.avirt.com/products/gateway.html</Link1>
  11305. <Link2></Link2>
  11306. </user-agent>
  11307. <user-agent>
  11308. <ID>id_moz_843</ID>
  11309. <String>Mozilla/4.0 (compatible; MSIE 5.01; Windows NT 5.0) (samualt9@bigfoot.com)</String>
  11310. <Description>Metacarta.com (66.28.xx.xxx) robot</Description>
  11311. <Type>R</Type>
  11312. <Comment>s. Larbin....</Comment>
  11313. <Link1>http://www.metacarta.com/</Link1>
  11314. <Link2></Link2>
  11315. </user-agent>
  11316. <user-agent>
  11317. <ID>id_moz_842</ID>
  11318. <String>Mozilla/4.0 (compatible; MSIE 5.01; Windows NT 5.0; NetCaptor 6.5.0RC1)</String>
  11319. <Description>NetCaptor IE browser addon</Description>
  11320. <Type>B</Type>
  11321. <Comment></Comment>
  11322. <Link1>http://www.netcaptor.com</Link1>
  11323. <Link2></Link2>
  11324. </user-agent>
  11325. <user-agent>
  11326. <ID>id_moz_827</ID>
  11327. <String>Mozilla/4.0 (compatible; MSIE 5.0; AOL 5.0; Windows 95; DigExt; Gateway2000; sureseeker.com)</String>
  11328. <Description>IE 5.x AOL Win95 Sureseeker search plugin</Description>
  11329. <Type>B</Type>
  11330. <Comment></Comment>
  11331. <Link1>http://www.sureseeker.com</Link1>
  11332. <Link2></Link2>
  11333. </user-agent>
  11334. <user-agent>
  11335. <ID>id_moz_828</ID>
  11336. <String>Mozilla/4.0 (compatible; MSIE 5.0; Mac_PowerPC; AtHome021)</String>
  11337. <Description>IE 5.x Mac PowerPC AtHome user</Description>
  11338. <Type>B</Type>
  11339. <Comment></Comment>
  11340. <Link1></Link1>
  11341. <Link2></Link2>
  11342. </user-agent>
  11343. <user-agent>
  11344. <ID>id_moz_829</ID>
  11345. <String>Mozilla/4.0 (compatible; MSIE 5.0; NetNose-Crawler 2.0; A New Search Experience: http://www.netnose.com)</String>
  11346. <Description>www.netnose.com crawler</Description>
  11347. <Type>R</Type>
  11348. <Comment>parked domain</Comment>
  11349. <Link1>http://www.netnose.com/</Link1>
  11350. <Link2></Link2>
  11351. </user-agent>
  11352. <user-agent>
  11353. <ID>id_moz_830</ID>
  11354. <String>Mozilla/4.0 (compatible; MSIE 5.0; Win32) via proxy gateway CERN-HTTPD/3.0 libwww/2.17</String>
  11355. <Description>WinXP via CERN httpd proxy server </Description>
  11356. <Type>P</Type>
  11357. <Comment></Comment>
  11358. <Link1>http://www.w3.org</Link1>
  11359. <Link2></Link2>
  11360. </user-agent>
  11361. <user-agent>
  11362. <ID>id_moz_831</ID>
  11363. <String>Mozilla/4.0 (compatible; MSIE 5.0; Windows 95) TrueRobot; 1.5</String>
  11364. <Description>Echo.com robot</Description>
  11365. <Type>R</Type>
  11366. <Comment></Comment>
  11367. <Link1>http://www.echo.com</Link1>
  11368. <Link2></Link2>
  11369. </user-agent>
  11370. <user-agent>
  11371. <ID>id_moz_832</ID>
  11372. <String>Mozilla/4.0 (compatible; MSIE 5.0; Windows 95) VoilaBot BETA 1.2 (http://www.voila.com/)</String>
  11373. <Description>Voila.fr robot</Description>
  11374. <Type>R</Type>
  11375. <Comment></Comment>
  11376. <Link1>http://www.voila.fr</Link1>
  11377. <Link2></Link2>
  11378. </user-agent>
  11379. <user-agent>
  11380. <ID>id_moz_833</ID>
  11381. <String>Mozilla/4.0 (compatible; MSIE 5.0; Windows 95) VoilaBot; 1.6</String>
  11382. <Description>Voila.fr robot</Description>
  11383. <Type>R</Type>
  11384. <Comment></Comment>
  11385. <Link1>http://www.voila.fr</Link1>
  11386. <Link2></Link2>
  11387. </user-agent>
  11388. <user-agent>
  11389. <ID>id_moz_835</ID>
  11390. <String>Mozilla/4.0 (compatible; MSIE 5.0; Windows ME) Opera 5.11 [en]</String>
  11391. <Description>WinME Opera 5.x</Description>
  11392. <Type>B</Type>
  11393. <Comment></Comment>
  11394. <Link1></Link1>
  11395. <Link2></Link2>
  11396. </user-agent>
  11397. <user-agent>
  11398. <ID>id_moz_834</ID>
  11399. <String>Mozilla/4.0 (compatible; MSIE 5.0; Windows ME; Link Checker 2.x.xx http://www.kyosoft.com)</String>
  11400. <Description>Kyosoft's Link Checker</Description>
  11401. <Type>C</Type>
  11402. <Comment></Comment>
  11403. <Link1>http://www.kyosoft.com</Link1>
  11404. <Link2></Link2>
  11405. </user-agent>
  11406. <user-agent>
  11407. <ID>id_moz_836</ID>
  11408. <String>Mozilla/4.0 (compatible; MSIE 5.0; Windows NT; DigExt; DTS Agent</String>
  11409. <Description>Beijing Express Email Address Extractor via DHCP Data Transport Services (DTS)</Description>
  11410. <Type>S</Type>
  11411. <Comment>site is closed</Comment>
  11412. <Link1>http://www.zstools.com</Link1>
  11413. <Link2>http://esupport.ca.com/index.html?/public/dto_transportit/infodocs/dto1013.asp</Link2>
  11414. </user-agent>
  11415. <user-agent>
  11416. <ID>id_moz_837</ID>
  11417. <String>Mozilla/4.0 (compatible; MSIE 5.0; Windows NT; Girafabot; girafabot at girafa dot com; http://www.girafa.com)</String>
  11418. <Description>Girafa (browser plug-in) robot</Description>
  11419. <Type>B R</Type>
  11420. <Comment></Comment>
  11421. <Link1>http://www.girafa.com</Link1>
  11422. <Link2></Link2>
  11423. </user-agent>
  11424. <user-agent>
  11425. <ID>id_moz_838</ID>
  11426. <String>Mozilla/4.0 (compatible; MSIE 5.0; www.galaxy.com; www.psychedelix.com)</String>
  11427. <Description>Galaxy robot (63.121.41.xxx) </Description>
  11428. <Type>R</Type>
  11429. <Comment>s. also GalaxyBot..</Comment>
  11430. <Link1>http://www.galaxy.com/</Link1>
  11431. <Link2></Link2>
  11432. </user-agent>
  11433. <user-agent>
  11434. <ID>id_moz_839</ID>
  11435. <String>Mozilla/4.0 (compatible; MSIE 5.0; www.galaxy.com; www.psychedelix.com/; http://www.galaxy.com/info/crawler.html)</String>
  11436. <Description>Galaxy robot (63.121.41.xxx)</Description>
  11437. <Type>R</Type>
  11438. <Comment>s. also GalaxyBot..</Comment>
  11439. <Link1>http://www.galaxy.com/</Link1>
  11440. <Link2></Link2>
  11441. </user-agent>
  11442. <user-agent>
  11443. <ID>id_moz_840</ID>
  11444. <String>Mozilla/4.0 (compatible; MSIE 5.0; YANDEX)</String>
  11445. <Description>Yandex Search Russia link checking (213.180.206.2xx)</Description>
  11446. <Type>R</Type>
  11447. <Comment>s. also Yandex/1...</Comment>
  11448. <Link1>http://www.yandex.ru</Link1>
  11449. <Link2></Link2>
  11450. </user-agent>
  11451. <user-agent>
  11452. <ID>id_moz_844</ID>
  11453. <String>Mozilla/4.0 (compatible; MSIE 5.5; AOL 4.0; Windows 98; GoBeez (www.gobeez.com))</String>
  11454. <Description>Gobeez starting page plugin</Description>
  11455. <Type>C</Type>
  11456. <Comment>site is offline</Comment>
  11457. <Link1>http://www.gobeez.com/</Link1>
  11458. <Link2></Link2>
  11459. </user-agent>
  11460. <user-agent>
  11461. <ID>id_moz_845</ID>
  11462. <String>Mozilla/4.0 (compatible; MSIE 5.5; Windows 95; Transmission Segment; Hotbar 2.0)</String>
  11463. <Description>IE 5.5 Win95 Hotbar plug-in</Description>
  11464. <Type></Type>
  11465. <Comment></Comment>
  11466. <Link1>http://hotbar.com/install/firstvisit.asp</Link1>
  11467. <Link2></Link2>
  11468. </user-agent>
  11469. <user-agent>
  11470. <ID>id_moz_846</ID>
  11471. <String>Mozilla/4.0 (compatible; MSIE 5.5; Windows 98; Crazy Browser 1.x.x)</String>
  11472. <Description>Crazy Browser - IE based tabbed Browser</Description>
  11473. <Type>B</Type>
  11474. <Comment></Comment>
  11475. <Link1>http://www.crazybrowser.com</Link1>
  11476. <Link2></Link2>
  11477. </user-agent>
  11478. <user-agent>
  11479. <ID>id_moz_847</ID>
  11480. <String>Mozilla/4.0 (compatible; MSIE 5.5; Windows 98; KITV4.7 Wanadoo)</String>
  11481. <Description>Wanadoo Internet services</Description>
  11482. <Type>B</Type>
  11483. <Comment></Comment>
  11484. <Link1></Link1>
  11485. <Link2></Link2>
  11486. </user-agent>
  11487. <user-agent>
  11488. <ID>id_moz_848</ID>
  11489. <String>Mozilla/4.0 (compatible; MSIE 5.5; Windows 98; SAFEXPLORER TL)</String>
  11490. <Description>Safexplorer (safexplorer.com - site is offline) kids browser</Description>
  11491. <Type>B</Type>
  11492. <Comment></Comment>
  11493. <Link1></Link1>
  11494. <Link2></Link2>
  11495. </user-agent>
  11496. <user-agent>
  11497. <ID>id_moz_849</ID>
  11498. <String>Mozilla/4.0 (compatible; MSIE 5.5; Windows 98; SYMPA; Katiesoft 7; SimulBrowse 3.0)</String>
  11499. <Description>Katiesoft Scroll (ex www.katiesoft.com now discarded) &amp; SimulBrowse (ex www.simulbrowse.com now dead) IE browser plugins</Description>
  11500. <Type>B</Type>
  11501. <Comment></Comment>
  11502. <Link1></Link1>
  11503. <Link2></Link2>
  11504. </user-agent>
  11505. <user-agent>
  11506. <ID>id_moz_850</ID>
  11507. <String>Mozilla/4.0 (compatible; MSIE 5.5; Windows 98; Win 9x 4.90; BTinternet V8.1)</String>
  11508. <Description>Windows ME BTOpenworld Internet services</Description>
  11509. <Type>B</Type>
  11510. <Comment></Comment>
  11511. <Link1></Link1>
  11512. <Link2></Link2>
  11513. </user-agent>
  11514. <user-agent>
  11515. <ID>id_moz_851</ID>
  11516. <String>Mozilla/4.0 (compatible; MSIE 5.5; Windows 98; Win 9x 4.90; MSIECrawler)</String>
  11517. <Description>Windows ME Internet Explorer URL check</Description>
  11518. <Type>B C</Type>
  11519. <Comment></Comment>
  11520. <Link1></Link1>
  11521. <Link2></Link2>
  11522. </user-agent>
  11523. <user-agent>
  11524. <ID>id_moz_852</ID>
  11525. <String>Mozilla/4.0 (compatible; MSIE 5.5; Windows NT 4.0; obot)</String>
  11526. <Description>Cobion Germany Brand Protection Services robot</Description>
  11527. <Type>R</Type>
  11528. <Comment></Comment>
  11529. <Link1>http://www.cobion.com</Link1>
  11530. <Link2></Link2>
  11531. </user-agent>
  11532. <user-agent>
  11533. <ID>id_moz_853</ID>
  11534. <String>Mozilla/4.0 (compatible; MSIE 5.5; Windows NT 4.0; QXW03018)</String>
  11535. <Description>Cobion Germany Brand Protection Services robot</Description>
  11536. <Type>R</Type>
  11537. <Comment></Comment>
  11538. <Link1>http://www.cobion.com</Link1>
  11539. <Link2></Link2>
  11540. </user-agent>
  11541. <user-agent>
  11542. <ID>id_moz_858</ID>
  11543. <String>Mozilla/4.0 (compatible; MSIE 5.5; Windows NT 5.0) Active Cache Request</String>
  11544. <Description>IE 5.5 Win2000 / user agent</Description>
  11545. <Type>B</Type>
  11546. <Comment></Comment>
  11547. <Link1></Link1>
  11548. <Link2></Link2>
  11549. </user-agent>
  11550. <user-agent>
  11551. <ID>id_moz_859</ID>
  11552. <String>Mozilla/4.0 (compatible; MSIE 5.5; Windows NT 5.0) Fetch API Request</String>
  11553. <Description>Maybe: - MS Internet Security &amp; Acceleration Server (ISA) cache refreshing request (see link) or - IE 5.5 Win2000 probably with some (website) API request component (see 2nd link) - suspected as email-harvester / site scanning tool (see http://www.byte.com/documents/s=493/byt20010208s0001/index.htm</Description>
  11554. <Type>P S ?</Type>
  11555. <Comment></Comment>
  11556. <Link1>http://groups.google.com/groups?hl=en&amp;lr=&amp;ie=UTF-8&amp;safe=off&amp;threadm=uGoenyodBHA.1472%40tkmsftngp07&amp;rnum=1&amp;prev=/groups%3Fq%3DFetch%2BAPI%26hl%3Den%26lr%3D%26ie%3DUTF-8%26safe%3Doff%26selm%3DuGoenyodBHA.1472%2540tkmsftngp07%26rnum%3D1</Link1>
  11557. <Link2>http://groups.google.de/groups?q=%22fetch+api+request%22&amp;hl=de&amp;lr=&amp;ie=UTF-8&amp;oe=UTF-8&amp;selm=3CAD577B.C29BA3B2%40execpc.com&amp;rnum=2</Link2>
  11558. </user-agent>
  11559. <user-agent>
  11560. <ID>id_moz_854</ID>
  11561. <String>Mozilla/4.0 (compatible; MSIE 5.5; Windows NT 5.0; .NET CLR 1.0.3705)</String>
  11562. <Description>IE 5.5 Win2000 with MS.NET SDK</Description>
  11563. <Type>B</Type>
  11564. <Comment></Comment>
  11565. <Link1></Link1>
  11566. <Link2></Link2>
  11567. </user-agent>
  11568. <user-agent>
  11569. <ID>id_moz_855</ID>
  11570. <String>Mozilla/4.0 (compatible; MSIE 5.5; Windows NT 5.0; AIRF)</String>
  11571. <Description>IE 5.5 Win2000 / user agent w. AI RoboForm (AIRF) password manager</Description>
  11572. <Type>B</Type>
  11573. <Comment></Comment>
  11574. <Link1>http://www.roboform.com</Link1>
  11575. <Link2></Link2>
  11576. </user-agent>
  11577. <user-agent>
  11578. <ID>id_moz_856</ID>
  11579. <String>Mozilla/4.0 (compatible; MSIE 5.5; Windows NT 5.0; AspTear 1.5)</String>
  11580. <Description>AspTear URL fetching program component / Download32.com spider</Description>
  11581. <Type>R D</Type>
  11582. <Comment></Comment>
  11583. <Link1>http://www.alphasierrapapa.com/IisDev/Components/AspTear/</Link1>
  11584. <Link2>http://www.download32.com</Link2>
  11585. </user-agent>
  11586. <user-agent>
  11587. <ID>id_moz_857</ID>
  11588. <String>Mozilla/4.0 (compatible; MSIE 5.5; Windows NT 5.0; N_o_k_i_a)</String>
  11589. <Description>Nokia.com network</Description>
  11590. <Type>B</Type>
  11591. <Comment></Comment>
  11592. <Link1></Link1>
  11593. <Link2></Link2>
  11594. </user-agent>
  11595. <user-agent>
  11596. <ID>id_moz_051102_1</ID>
  11597. <String>Mozilla/4.0 (compatible; MSIE 5.5; Windows NT 5.0; T312461) RPT-HTTPClient/0.3-3E</String>
  11598. <Description>Unknown Object Sciences Corp. robot using the HTTPClient</Description>
  11599. <Type></Type>
  11600. <Comment></Comment>
  11601. <Link1>http://www.objectsciences.com</Link1>
  11602. <Link2>http://www.innovation.ch/java/HTTPClient/</Link2>
  11603. </user-agent>
  11604. <user-agent>
  11605. <ID>id_moz_060406_2</ID>
  11606. <String>Mozilla/4.0 (compatible; MSIE 6.0 compatible; Asterias Crawler v4; +http://www.singingfish.com/help/spider.html; webmaster@singingfish.com); SpiderThread  Revision: 3.10</String>
  11607. <Description>Singingfish media spider (64.12.186.2xx) via AOL search</Description>
  11608. <Type>R</Type>
  11609. <Comment>s. also asterias/2.0</Comment>
  11610. <Link1>http://search.singingfish.com/sfw/home.jsp</Link1>
  11611. <Link2></Link2>
  11612. </user-agent>
  11613. <user-agent>
  11614. <ID>id_moz_200108_2</ID>
  11615. <String>Mozilla/4.0 (compatible; MSIE 6.0; AOL 9.0; Windows 98; .NET CLR 1.1.4322; MEGAUPLOAD 2.0)</String>
  11616. <Description>Megaupload Mega Manager - Download manager toolbar for IE</Description>
  11617. <Type>D</Type>
  11618. <Comment></Comment>
  11619. <Link1>http://www.megaupload.com/manager/de/</Link1>
  11620. <Link2></Link2>
  11621. </user-agent>
  11622. <user-agent>
  11623. <ID>id_moz_010106_1</ID>
  11624. <String>Mozilla/4.0 (compatible; MSIE 6.0; AOL 9.0; Windows NT 5.1; SV1; HbTools 4.7.2)</String>
  11625. <Description>Hotbar IE graphical skin</Description>
  11626. <Type>B</Type>
  11627. <Comment>Adware / Spyware component</Comment>
  11628. <Link1>http://hotbar.com/Installation/Browsing/WhatIs/Hotbar.htm</Link1>
  11629. <Link2></Link2>
  11630. </user-agent>
  11631. <user-agent>
  11632. <ID>id_moz_860</ID>
  11633. <String>Mozilla/4.0 (compatible; MSIE 6.0; MSIE 5.5; Windows NT 5.1) Skampy/0.9.x [en]</String>
  11634. <Description>Skaffe.com directory link checker</Description>
  11635. <Type>R</Type>
  11636. <Comment>s. also Skampy</Comment>
  11637. <Link1>http://www.skaffe.com</Link1>
  11638. <Link2></Link2>
  11639. </user-agent>
  11640. <user-agent>
  11641. <ID>id_moz_100606_1</ID>
  11642. <String>Mozilla/4.0 (compatible; MSIE 6.0; TargetSeek/1.0; +http://www.targetgroups.net/TargetSeek.html)</String>
  11643. <Description>TargetSeek Crawler concerning electronics industry product announcements</Description>
  11644. <Type>R</Type>
  11645. <Comment>71.161.205.2xx</Comment>
  11646. <Link1>http://www.targetgroups.net/TargetSeek.html</Link1>
  11647. <Link2></Link2>
  11648. </user-agent>
  11649. <user-agent>
  11650. <ID>id_moz_861</ID>
  11651. <String>Mozilla/4.0 (compatible; MSIE 6.0; Win32) WebWasher 3.0</String>
  11652. <Description>IE 6.0 WebWasher ad filter</Description>
  11653. <Type>B P</Type>
  11654. <Comment></Comment>
  11655. <Link1>http://www.webwasher.com</Link1>
  11656. <Link2></Link2>
  11657. </user-agent>
  11658. <user-agent>
  11659. <ID>id_moz_864</ID>
  11660. <String>Mozilla/4.0 (compatible; MSIE 6.0; Windows 98) REL Software Web Link Validator 2.x)</String>
  11661. <Description>Web Link Validator link validation software</Description>
  11662. <Type>C</Type>
  11663. <Comment></Comment>
  11664. <Link1>http://www.relsoftware.com</Link1>
  11665. <Link2></Link2>
  11666. </user-agent>
  11667. <user-agent>
  11668. <ID>id_moz_865</ID>
  11669. <String>Mozilla/4.0 (compatible; MSIE 6.0; Windows 98) Web Link Validator 2.x)</String>
  11670. <Description>Web Link Validator link validation software</Description>
  11671. <Type>C</Type>
  11672. <Comment></Comment>
  11673. <Link1>http://www.relsoftware.com</Link1>
  11674. <Link2></Link2>
  11675. </user-agent>
  11676. <user-agent>
  11677. <ID>id_moz_862</ID>
  11678. <String>Mozilla/4.0 (compatible; MSIE 6.0; Windows 98; Net M@nager V3.02 - www.vinn.com.au)</String>
  11679. <Description>IE 6.0 Netmanager IE add-on</Description>
  11680. <Type>B</Type>
  11681. <Comment></Comment>
  11682. <Link1>http://www.vinn.com.au</Link1>
  11683. <Link2></Link2>
  11684. </user-agent>
  11685. <user-agent>
  11686. <ID>id_moz_290306_1</ID>
  11687. <String>Mozilla/4.0 (compatible; MSIE 6.0; Windows 98; support@illumit.com; http://www.illumit.com/Products/weblight/)</String>
  11688. <Description>WebLight web analyzer &amp; link checker</Description>
  11689. <Type>C</Type>
  11690. <Comment>s. also WebLight/4.x.x ...</Comment>
  11691. <Link1>http://www.illumit.com/Products/weblight/</Link1>
  11692. <Link2></Link2>
  11693. </user-agent>
  11694. <user-agent>
  11695. <ID>id_moz_863</ID>
  11696. <String>Mozilla/4.0 (compatible; MSIE 6.0; Windows 98; Win 9x 4.90; http://www.Abolimba.de)</String>
  11697. <Description>Abolimba Multibrowser - IE based browser</Description>
  11698. <Type>C</Type>
  11699. <Comment></Comment>
  11700. <Link1>http://www.autag.com</Link1>
  11701. <Link2></Link2>
  11702. </user-agent>
  11703. <user-agent>
  11704. <ID>id_moz_866</ID>
  11705. <String>Mozilla/4.0 (compatible; MSIE 6.0; Windows NT 5.0; .NET CLR 1.1.4322; Lunascape 2.1.3)</String>
  11706. <Description>Lunascape IE based browser (Japan)</Description>
  11707. <Type>B</Type>
  11708. <Comment>s. also Lunascape</Comment>
  11709. <Link1>http://www2.lunascape.jp/index.aspx</Link1>
  11710. <Link2></Link2>
  11711. </user-agent>
  11712. <user-agent>
  11713. <ID>id_moz_290708_4</ID>
  11714. <String>Mozilla/4.0 (compatible; MSIE 6.0; Windows NT 5.0; Google Wireless Transcoder;)</String>
  11715. <Description>Google wireless transcoder (GWT) proxy for rewriting websites for mobiles</Description>
  11716. <Type>P</Type>
  11717. <Comment>209.85.136.xxx</Comment>
  11718. <Link1>http://www.google.com/gwt/n</Link1>
  11719. <Link2></Link2>
  11720. </user-agent>
  11721. <user-agent>
  11722. <ID>id_moz_150906_1</ID>
  11723. <String>Mozilla/4.0 (compatible; MSIE 6.0; Windows NT 5.0; ODP entries t_st; http://tuezilla.de/t_st-odp-entries-agent.html)</String>
  11724. <Description>T&#252;zilla (Germany) - ODP link checking using Robozilla</Description>
  11725. <Type>R</Type>
  11726. <Comment>81.169.154.xx</Comment>
  11727. <Link1>http://tuezilla.de</Link1>
  11728. <Link2>http://dmoz.org/profiles/robozilla.html</Link2>
  11729. </user-agent>
  11730. <user-agent>
  11731. <ID>id_moz_867</ID>
  11732. <String>Mozilla/4.0 (compatible; MSIE 6.0; Windows NT 5.0; ODP links test; http://tuezilla.de/test-odp-links-agent.html)</String>
  11733. <Description>T&#252;zilla (Germany) - ODP link checking using Robozilla</Description>
  11734. <Type>R</Type>
  11735. <Comment>81.169.154.xx</Comment>
  11736. <Link1>http://tuezilla.de</Link1>
  11737. <Link2>http://dmoz.org/profiles/robozilla.html</Link2>
  11738. </user-agent>
  11739. <user-agent>
  11740. <ID>id_moz_080606_1</ID>
  11741. <String>Mozilla/4.0 (compatible; MSIE 6.0; Windows NT 5.0; ZoomSpider.net bot; .NET CLR 1.1.4322)</String>
  11742. <Description>ZoomSpider.Net indexing robot for several directories</Description>
  11743. <Type>R</Type>
  11744. <Comment>70.94.232.2xx</Comment>
  11745. <Link1>http://www.zoomspider.net/</Link1>
  11746. <Link2></Link2>
  11747. </user-agent>
  11748. <user-agent>
  11749. <ID>id_moz_882</ID>
  11750. <String>Mozilla/4.0 (compatible; MSIE 6.0; Windows NT 5.1) (dns_admin@c-a-s-h.com)</String>
  11751. <Description>unknown robot from 64.246.44.xx</Description>
  11752. <Type></Type>
  11753. <Comment></Comment>
  11754. <Link1></Link1>
  11755. <Link2></Link2>
  11756. </user-agent>
  11757. <user-agent>
  11758. <ID>id_moz_280408_1</ID>
  11759. <String>Mozilla/4.0 (compatible; MSIE 6.0; Windows NT 5.1; Covac UPPS Cathan 1.2.5;)</String>
  11760. <Description>Covac Software UPPS (Universal PHP Proxy Server) - free public proxy server</Description>
  11761. <Type>P</Type>
  11762. <Comment></Comment>
  11763. <Link1>http://www.covac-software.com/proxy/</Link1>
  11764. <Link2></Link2>
  11765. </user-agent>
  11766. <user-agent>
  11767. <ID>id_moz_160406_1</ID>
  11768. <String>Mozilla/4.0 (compatible; MSIE 6.0; Windows NT 5.1; Crayon Crawler; snprtz|T04056566514940; (R1 1.5))</String>
  11769. <Description>GetNetWise Crayon Crawler web filter</Description>
  11770. <Type>P</Type>
  11771. <Comment></Comment>
  11772. <Link1>http://kids.getnetwise.org/tools/tool_info.php?tool_id=931919301.7202</Link1>
  11773. <Link2></Link2>
  11774. </user-agent>
  11775. <user-agent>
  11776. <ID>id_moz_868</ID>
  11777. <String>Mozilla/4.0 (compatible; MSIE 6.0; Windows NT 5.1; Deepnet Explorer)</String>
  11778. <Description>Deepnet Explorer - IE based browser</Description>
  11779. <Type>B</Type>
  11780. <Comment></Comment>
  11781. <Link1>http://deepnetexplorer.com/</Link1>
  11782. <Link2></Link2>
  11783. </user-agent>
  11784. <user-agent>
  11785. <ID>id_moz_869</ID>
  11786. <String>Mozilla/4.0 (compatible; MSIE 6.0; Windows NT 5.1; heritrix/1.3.0 http://www.cs.washington.edu/research/networking/websys/)</String>
  11787. <Description>Heritrix Internet Archive's open-source web project used by Analysis Projects at UW</Description>
  11788. <Type>R</Type>
  11789. <Comment></Comment>
  11790. <Link1>http://crawler.archive.org/</Link1>
  11791. <Link2>http://www.cs.washington.edu/research/networking/websys/</Link2>
  11792. </user-agent>
  11793. <user-agent>
  11794. <ID>id_moz_870</ID>
  11795. <String>Mozilla/4.0 (compatible; MSIE 6.0; Windows NT 5.1; Hotbar 3.0)</String>
  11796. <Description>IE 6x WinXP Hotbar plug-in</Description>
  11797. <Type>B</Type>
  11798. <Comment></Comment>
  11799. <Link1>http://hotbar.com/install/firstvisit.asp</Link1>
  11800. <Link2></Link2>
  11801. </user-agent>
  11802. <user-agent>
  11803. <ID>id_moz_871</ID>
  11804. <String>Mozilla/4.0 (compatible; MSIE 6.0; Windows NT 5.1; iOpus-I-M)</String>
  11805. <Description>IE 6x WinXP iOpus Internet Macros - Internet-based macro recorder </Description>
  11806. <Type>B</Type>
  11807. <Comment></Comment>
  11808. <Link1>http://www.iopus.com</Link1>
  11809. <Link2></Link2>
  11810. </user-agent>
  11811. <user-agent>
  11812. <ID>id_moz_872</ID>
  11813. <String>Mozilla/4.0 (compatible; MSIE 6.0; Windows NT 5.1; iRider 2.21.1108; FDM)</String>
  11814. <Description>iRider - IE based browser / Free Download Manager (FDM)</Description>
  11815. <Type>D</Type>
  11816. <Comment></Comment>
  11817. <Link1>http://www.irider.com/irider/index.htm</Link1>
  11818. <Link2>http://www.freedownloadmanager.org/</Link2>
  11819. </user-agent>
  11820. <user-agent>
  11821. <ID>id_moz_873</ID>
  11822. <String>Mozilla/4.0 (compatible; MSIE 6.0; Windows NT 5.1; KKman3.0)</String>
  11823. <Description>KKman http://www.kkman.com/ - Japanese IE based browser</Description>
  11824. <Type>B</Type>
  11825. <Comment></Comment>
  11826. <Link1>http://www.kkman.com</Link1>
  11827. <Link2></Link2>
  11828. </user-agent>
  11829. <user-agent>
  11830. <ID>id_moz_874</ID>
  11831. <String>Mozilla/4.0 (compatible; MSIE 6.0; Windows NT 5.1; MathPlayer2.0)</String>
  11832. <Description>IE 6x WinXP MathPlayer mathematical notation plugin </Description>
  11833. <Type>B</Type>
  11834. <Comment></Comment>
  11835. <Link1>http://www.mathtype.com/en/products/mathplayer/</Link1>
  11836. <Link2></Link2>
  11837. </user-agent>
  11838. <user-agent>
  11839. <ID>id_moz_875</ID>
  11840. <String>Mozilla/4.0 (compatible; MSIE 6.0; Windows NT 5.1; Maxthon) </String>
  11841. <Description>Maxthon (ex MyIE2) - IE based browser</Description>
  11842. <Type>B</Type>
  11843. <Comment></Comment>
  11844. <Link1>http://www.maxthon.com</Link1>
  11845. <Link2></Link2>
  11846. </user-agent>
  11847. <user-agent>
  11848. <ID>id_moz_876</ID>
  11849. <String>Mozilla/4.0 (compatible; MSIE 6.0; Windows NT 5.1; PeoplePal 3.0; MSIECrawler)</String>
  11850. <Description>IE 6x WinXP peoplepc online PeoplePal IE toolbar</Description>
  11851. <Type>B</Type>
  11852. <Comment></Comment>
  11853. <Link1>http://home.vfw-online.com/peoplepal/default.asp</Link1>
  11854. <Link2></Link2>
  11855. </user-agent>
  11856. <user-agent>
  11857. <ID>id_moz_877</ID>
  11858. <String>Mozilla/4.0 (compatible; MSIE 6.0; Windows NT 5.1; Q312461; IOpener Release 1.1.04)</String>
  11859. <Description>IE 6x WinXP / I-Opener (was www.netpliance.com/) web PC</Description>
  11860. <Type>B</Type>
  11861. <Comment></Comment>
  11862. <Link1></Link1>
  11863. <Link2></Link2>
  11864. </user-agent>
  11865. <user-agent>
  11866. <ID>id_moz_050307_1</ID>
  11867. <String>Mozilla/4.0 (compatible; MSIE 6.0; Windows NT 5.1; QihooBot 1.0  qihoobot@qihoo.net)</String>
  11868. <Description>Qihoo search (China) robot</Description>
  11869. <Type>R</Type>
  11870. <Comment>220.181.34.1xx</Comment>
  11871. <Link1>http://www.qihoo.com/</Link1>
  11872. <Link2></Link2>
  11873. </user-agent>
  11874. <user-agent>
  11875. <ID>id_moz_070306_1</ID>
  11876. <String>Mozilla/4.0 (compatible; MSIE 6.0; Windows NT 5.1; SIMBAR Enabled; InfoPath.1)</String>
  11877. <Description>SimBar IE toolbar for accessing The Sims sites / Infopath IE form &amp; spreadsheet plugin</Description>
  11878. <Type>B</Type>
  11879. <Comment></Comment>
  11880. <Link1>http://www.simstools.com/simbar.php</Link1>
  11881. <Link2>http://office.microsoft.com/en-us/fx010857921033.aspx</Link2>
  11882. </user-agent>
  11883. <user-agent>
  11884. <ID>id_moz_878</ID>
  11885. <String>Mozilla/4.0 (compatible; MSIE 6.0; Windows NT 5.1; StumbleUpon.com 1.760; .NET CLR 1.1.4322)</String>
  11886. <Description>IE 6x WinXP Stumble Upon IE toolbar</Description>
  11887. <Type>B</Type>
  11888. <Comment></Comment>
  11889. <Link1>http://www.stumbleupon.com</Link1>
  11890. <Link2></Link2>
  11891. </user-agent>
  11892. <user-agent>
  11893. <ID>id_moz_150807_1</ID>
  11894. <String>Mozilla/4.0 (compatible; MSIE 6.0; Windows NT 5.1; SV1;  Embedded Web Browser from: http://bsalsa.com/; MSIECrawler)</String>
  11895. <Description>Bsalsa Productions embedded web browser package for Borland Delphi</Description>
  11896. <Type>B</Type>
  11897. <Comment></Comment>
  11898. <Link1>http://bsalsa.com/product.html</Link1>
  11899. <Link2></Link2>
  11900. </user-agent>
  11901. <user-agent>
  11902. <ID>id_moz_030807_2</ID>
  11903. <String>Mozilla/4.0 (compatible; MSIE 6.0; Windows NT 5.1; SV1;  http://www.changedetection.com/bot.html )</String>
  11904. <Description>ChangeDetection robot for web page monitoring</Description>
  11905. <Type>C</Type>
  11906. <Comment>68.166.223.x</Comment>
  11907. <Link1>http://www.changedetection.com/</Link1>
  11908. <Link2>http://www.changedetection.com/bot.html</Link2>
  11909. </user-agent>
  11910. <user-agent>
  11911. <ID>id_moz_879</ID>
  11912. <String>Mozilla/4.0 (compatible; MSIE 6.0; Windows NT 5.1; SV1; .NET CLR 1.1.4322)</String>
  11913. <Description>IE 6x WinXP also used by WebSite Pro HTML editor</Description>
  11914. <Type>B</Type>
  11915. <Comment></Comment>
  11916. <Link1>http://www.gtpcc.org/gtpcc/websitepro.htm</Link1>
  11917. <Link2></Link2>
  11918. </user-agent>
  11919. <user-agent>
  11920. <ID>id_moz_880</ID>
  11921. <String>Mozilla/4.0 (compatible; MSIE 6.0; Windows NT 5.1; SV1; DX-Browser 5.0.0.0)</String>
  11922. <Description>DX-Browser - German IE based browser</Description>
  11923. <Type>B</Type>
  11924. <Comment>was http://www.dx-soft.net/ (expired)</Comment>
  11925. <Link1>http://www.zdnet.de/downloads/prg/t/p/deDCTP-wc.html</Link1>
  11926. <Link2></Link2>
  11927. </user-agent>
  11928. <user-agent>
  11929. <ID>id_moz_271006_1</ID>
  11930. <String>Mozilla/4.0 (compatible; MSIE 6.0; Windows NT 5.1; SV1; FunWebProducts; ezPeer+ v1.0 Beta (0.4.1.98); ezPeer+ v1.0 (0.5.0.00); .NET CLR 1.1.4322; MSIECrawler)</String>
  11931. <Description>ezPeer+ P2P IE addon</Description>
  11932. <Type>B</Type>
  11933. <Comment></Comment>
  11934. <Link1>http://web.ezpeer.com/</Link1>
  11935. <Link2></Link2>
  11936. </user-agent>
  11937. <user-agent>
  11938. <ID>id_moz_881</ID>
  11939. <String>Mozilla/4.0 (compatible; MSIE 6.0; Windows NT 5.1; SV1; IBP; .NET CLR 1.1.4322)</String>
  11940. <Description>Axandra IBP website promotion software ?</Description>
  11941. <Type>C B</Type>
  11942. <Comment></Comment>
  11943. <Link1>http://www.axandra-web-site-promotion-software-tool.com/index.htm</Link1>
  11944. <Link2></Link2>
  11945. </user-agent>
  11946. <user-agent>
  11947. <ID>id_moz_290606_3</ID>
  11948. <String>Mozilla/4.0 (compatible; MSIE 6.0; Windows NT 5.1; SV1; MRA 4.3 (build 01218))</String>
  11949. <Description>MRA = Mail.ru Agent - Instant Messenger / VoIP</Description>
  11950. <Type>B</Type>
  11951. <Comment></Comment>
  11952. <Link1>http://agent.mail.ru/</Link1>
  11953. <Link2></Link2>
  11954. </user-agent>
  11955. <user-agent>
  11956. <ID>id_moz_883</ID>
  11957. <String>Mozilla/4.0 (compatible; MSIE 6.0; Windows NT; MS Search 4.0 Robot)</String>
  11958. <Description>MSN Search robot (207.46.89.xx)</Description>
  11959. <Type>R</Type>
  11960. <Comment>s. also: - MSNBOT</Comment>
  11961. <Link1></Link1>
  11962. <Link2></Link2>
  11963. </user-agent>
  11964. <user-agent>
  11965. <ID>id_moz_170207_3</ID>
  11966. <String>Mozilla/4.0 (compatible; MSIE 7.0; Win32) Link Commander 4.0</String>
  11967. <Description>Link Commander bookmark manager</Description>
  11968. <Type>C</Type>
  11969. <Comment></Comment>
  11970. <Link1>http://www.resortlabs.com/bookmark-manager/linkcommander.php</Link1>
  11971. <Link2></Link2>
  11972. </user-agent>
  11973. <user-agent>
  11974. <ID>id_moz_170706_2</ID>
  11975. <String>Mozilla/4.0 (compatible; MSIE 7.0; Windows NT 5.1; bgft)</String>
  11976. <Description>IE 7.0 - WinXP</Description>
  11977. <Type>B</Type>
  11978. <Comment></Comment>
  11979. <Link1>http://www.microsoft.com/windows/ie/default.mspx</Link1>
  11980. <Link2></Link2>
  11981. </user-agent>
  11982. <user-agent>
  11983. <ID>id_moz_080209_1</ID>
  11984. <String>Mozilla/4.0 (compatible; MSIE 7.0; Windows NT 5.1; GTB5; User-agent: Mozilla/4.0 (compatible; MSIE 6.0; Windows NT 5.1; SV1; http://bsalsa.com) ; .NET CLR 2.0.50727)</String>
  11985. <Description>GTB = Google Toolbar Internet Explorer add-on</Description>
  11986. <Type>B</Type>
  11987. <Comment></Comment>
  11988. <Link1>http://toolbar.google.com/T4/index.html</Link1>
  11989. <Link2></Link2>
  11990. </user-agent>
  11991. <user-agent>
  11992. <ID>id_moz_080209_2</ID>
  11993. <String>Mozilla/4.0 (compatible; MSIE 7.0; Windows NT 6.1; Trident/4.0; SLCC2; .NET CLR 2.0.50727; .NET CLR 3.5.30729; .NET CLR 3.0.30729; Media Center PC 6.0; Tablet PC 2.0)</String>
  11994. <Description>MSIE 7.0 *and* Trident token used by Internet Explorer 8 in compatibility view mode</Description>
  11995. <Type>B</Type>
  11996. <Comment></Comment>
  11997. <Link1>http://blogs.msdn.com/ie/archive/2009/01/09/the-internet-explorer-8-user-agent-string-updated-edition.aspx</Link1>
  11998. <Link2></Link2>
  11999. </user-agent>
  12000. <user-agent>
  12001. <ID>id_moz_080209_3</ID>
  12002. <String>Mozilla/4.0 (compatible; MSIE 8.0; Windows NT 5.1; Trident/4.0; .NET CLR 2.0.50727; .NET CLR 1.1.4322; .NET CLR 3.0.04506.30; .NET CLR 3.0.04506.648)</String>
  12003. <Description>Internet Explorer 8</Description>
  12004. <Type>B</Type>
  12005. <Comment></Comment>
  12006. <Link1>http://www.microsoft.com/windows/internet-explorer/beta/default.aspx</Link1>
  12007. <Link2></Link2>
  12008. </user-agent>
  12009. <user-agent>
  12010. <ID>id_moz_150408_4</ID>
  12011. <String>Mozilla/4.0 (compatible; MSIE 8.0; Windows NT 6.0)</String>
  12012. <Description>IE 8.0 (beta) on Win Vista</Description>
  12013. <Type>B</Type>
  12014. <Comment></Comment>
  12015. <Link1>http://www.microsoft.com/windows/products/winfamily/ie/ie8/default.mspx</Link1>
  12016. <Link2></Link2>
  12017. </user-agent>
  12018. <user-agent>
  12019. <ID>id_moz_030110_1</ID>
  12020. <String>Mozilla/4.0 (compatible; MSIE 8.0; Windows NT 6.0; Trident/4.0; Orange 8.0; GTB6.3; Mozilla/4.0 (compatible; MSIE 6.0; Windows NT 5.1; SV1) ;  Embedded Web Browser from: http://bsalsa.com/; SLCC1; .NET CLR 2.0.50727; .NET CLR 3.5.30729; .NET CLR 3.0.30618; OfficeLiveConnector.1.3; OfficeLivePatch.1.3)</String>
  12021. <Description>Bsalsa embedded browser</Description>
  12022. <Type>B</Type>
  12023. <Comment></Comment>
  12024. <Link1>http://bsalsa.com/</Link1>
  12025. <Link2></Link2>
  12026. </user-agent>
  12027. <user-agent>
  12028. <ID>id_moz_010108_4</ID>
  12029. <String>Mozilla/4.0 (compatible; MSIE enviable; DAUMOA 2.0; DAUM Web Robot; Daum Communications Corp.&#44; Korea; +http://ws.daum.net/aboutkr.html)</String>
  12030. <Description>DAUMOA - Daum search Korea robot (211.115.109.xxx)</Description>
  12031. <Type>R</Type>
  12032. <Comment>s. also RaBot</Comment>
  12033. <Link1>http://www.daum.net/</Link1>
  12034. <Link2>http://ws.daum.net/abouten.html</Link2>
  12035. </user-agent>
  12036. <user-agent>
  12037. <ID>id_moz_311206_1</ID>
  12038. <String>Mozilla/4.0 (compatible; MSIE is not me; DAUMOA/1.0.1; DAUM Web Robot; Daum Communications Corp.&#44; Korea)</String>
  12039. <Description>DAUMOA - Daum search Korea robot (211.115.109.xxx)</Description>
  12040. <Type>R</Type>
  12041. <Comment>s. also RaBot</Comment>
  12042. <Link1>http://www.daum.net/</Link1>
  12043. <Link2></Link2>
  12044. </user-agent>
  12045. <user-agent>
  12046. <ID>id_moz_281106_2</ID>
  12047. <String>Mozilla/4.0 (compatible; NaverBot/1.0; http://help.naver.com/delete_main.asp)</String>
  12048. <Description>Naver Search Korea Naverbot</Description>
  12049. <Type>R</Type>
  12050. <Comment></Comment>
  12051. <Link1>http://www.naver.com/</Link1>
  12052. <Link2></Link2>
  12053. </user-agent>
  12054. <user-agent>
  12055. <ID>id_moz_884</ID>
  12056. <String>Mozilla/4.0 (compatible; Netcraft Web Server Survey)</String>
  12057. <Description>Netcraft webserver info</Description>
  12058. <Type>R C</Type>
  12059. <Comment></Comment>
  12060. <Link1>http://www.netcraft.com</Link1>
  12061. <Link2></Link2>
  12062. </user-agent>
  12063. <user-agent>
  12064. <ID>id_moz_885</ID>
  12065. <String>Mozilla/4.0 (compatible; NetPromoter Spider;http://www.net-promoter.com/)</String>
  12066. <Description>NetPromoter Link Utility link checking tool </Description>
  12067. <Type>C</Type>
  12068. <Comment>s. also - Mozilla/4.0 (compatible; Link Utility ...</Comment>
  12069. <Link1>http://www.net-promoter.com/</Link1>
  12070. <Link2></Link2>
  12071. </user-agent>
  12072. <user-agent>
  12073. <ID>id_moz_886</ID>
  12074. <String>Mozilla/4.0 (compatible; Opera/3.0; Windows 4.10) 3.51 [en]</String>
  12075. <Description>Opera 3.x WinNT</Description>
  12076. <Type>B</Type>
  12077. <Comment></Comment>
  12078. <Link1></Link1>
  12079. <Link2></Link2>
  12080. </user-agent>
  12081. <user-agent>
  12082. <ID>id_moz_887</ID>
  12083. <String>Mozilla/4.0 (compatible; Powermarks/3.5; Windows 95/98/2000/NT)</String>
  12084. <Description>Powermarks bookmark manager</Description>
  12085. <Type>C</Type>
  12086. <Comment></Comment>
  12087. <Link1>http://www.kaylon.com</Link1>
  12088. <Link2></Link2>
  12089. </user-agent>
  12090. <user-agent>
  12091. <ID>id_moz_230607_1</ID>
  12092. <String>Mozilla/4.0 (compatible; RSS Popper)</String>
  12093. <Description>RSS Popper - MS Outlook RSS reader plugin</Description>
  12094. <Type>B</Type>
  12095. <Comment></Comment>
  12096. <Link1>http://rsspopper.unknown/2004/10/home.html</Link1>
  12097. <Link2></Link2>
  12098. </user-agent>
  12099. <user-agent>
  12100. <ID>id_moz_888</ID>
  12101. <String>Mozilla/4.0 (compatible; SiteKiosk 4.0; MSIE 5.0; Windows 98; SiteCoach 1.0)</String>
  12102. <Description>SiteKiosk public terminal browser</Description>
  12103. <Type>B</Type>
  12104. <Comment></Comment>
  12105. <Link1>http://www.sitekiosk.com</Link1>
  12106. <Link2></Link2>
  12107. </user-agent>
  12108. <user-agent>
  12109. <ID>id_moz_889</ID>
  12110. <String>Mozilla/4.0 (compatible; SpeedySpider; www.entireweb.com)</String>
  12111. <Description>Entireweb Search Speedyspider (62.13.25.xxx)</Description>
  12112. <Type>R</Type>
  12113. <Comment>s. also Worldlight</Comment>
  12114. <Link1>http://www.entireweb.com</Link1>
  12115. <Link2></Link2>
  12116. </user-agent>
  12117. <user-agent>
  12118. <ID>id_moz_890</ID>
  12119. <String>Mozilla/4.0 (compatible; SPENG)</String>
  12120. <Description>SiteProbe - website status checking</Description>
  12121. <Type>R C</Type>
  12122. <Comment></Comment>
  12123. <Link1>http://www.siteprobe.com</Link1>
  12124. <Link2></Link2>
  12125. </user-agent>
  12126. <user-agent>
  12127. <ID>id_moz_891</ID>
  12128. <String>Mozilla/4.0 (compatible; SuperCleaner 2.xx; Windows 98)</String>
  12129. <Description>Super Cleaner privacy tool (bookmark checking)</Description>
  12130. <Type>C</Type>
  12131. <Comment></Comment>
  12132. <Link1>http://www.southbaypc.com/SuperCleaner/</Link1>
  12133. <Link2></Link2>
  12134. </user-agent>
  12135. <user-agent>
  12136. <ID>id_moz_020406_1</ID>
  12137. <String>Mozilla/4.0 (compatible; Synapse)</String>
  12138. <Description>Synapse - Apache web service for processing XML documents</Description>
  12139. <Type>P</Type>
  12140. <Comment></Comment>
  12141. <Link1>http://wiki.apache.org/incubator/SynapseProposal</Link1>
  12142. <Link2></Link2>
  12143. </user-agent>
  12144. <user-agent>
  12145. <ID>id_moz_150207_1</ID>
  12146. <String>Mozilla/4.0 (compatible; WebCapture 3.0; Windows)</String>
  12147. <Description>Web2PDF - Adobe Acrobat plugin for site traversal and other services for the Web Capture feature</Description>
  12148. <Type>D</Type>
  12149. <Comment></Comment>
  12150. <Link1></Link1>
  12151. <Link2></Link2>
  12152. </user-agent>
  12153. <user-agent>
  12154. <ID>id_moz_892</ID>
  12155. <String>Mozilla/4.0 (compatible; Win32; WinHttp.WinHttpRequest.5)</String>
  12156. <Description>Windows HTTP Services (WinHTTP / XML-parser)</Description>
  12157. <Type></Type>
  12158. <Comment></Comment>
  12159. <Link1></Link1>
  12160. <Link2></Link2>
  12161. </user-agent>
  12162. <user-agent>
  12163. <ID>id_moz_170108_1</ID>
  12164. <String>Mozilla/4.0 (compatible; WSN Links)</String>
  12165. <Description>WSN Links PHP directory software</Description>
  12166. <Type>C</Type>
  12167. <Comment></Comment>
  12168. <Link1>http://scripts.webmastersite.net/wsnlinks/</Link1>
  12169. <Link2></Link2>
  12170. </user-agent>
  12171. <user-agent>
  12172. <ID>id_moz_111205_6</ID>
  12173. <String>Mozilla/4.0 (compatible; www.euro-directory.com; urlchecker1.0)</String>
  12174. <Description>Euro Directory (German / Austrian) directory link checking</Description>
  12175. <Type>R C</Type>
  12176. <Comment></Comment>
  12177. <Link1>http://www.euro-directory.com/</Link1>
  12178. <Link2></Link2>
  12179. </user-agent>
  12180. <user-agent>
  12181. <ID>id_moz_893</ID>
  12182. <String>Mozilla/4.0 (compatible; www.galaxy.com)</String>
  12183. <Description>Galaxy robot</Description>
  12184. <Type>R</Type>
  12185. <Comment></Comment>
  12186. <Link1>http://www.galaxy.com</Link1>
  12187. <Link2></Link2>
  12188. </user-agent>
  12189. <user-agent>
  12190. <ID>id_moz_894</ID>
  12191. <String>Mozilla/4.0 (compatible; www.linkguard.com Linkguard Online 1.0; Windows NT)</String>
  12192. <Description>Linkguard.com link validation (service is offline)</Description>
  12193. <Type>C</Type>
  12194. <Comment></Comment>
  12195. <Link1></Link1>
  12196. <Link2></Link2>
  12197. </user-agent>
  12198. <user-agent>
  12199. <ID>id_moz_240106_1</ID>
  12200. <String>Mozilla/4.0 (compatible; Y!J; for robot study; keyoshid)</String>
  12201. <Description>Yahoo Search Japan robot (203.141.52.)</Description>
  12202. <Type>R</Type>
  12203. <Comment>s. also Y!J-BSC/1.0...</Comment>
  12204. <Link1>http://www.yahoo.co.jp/</Link1>
  12205. <Link2></Link2>
  12206. </user-agent>
  12207. <user-agent>
  12208. <ID>id_moz_170706_1</ID>
  12209. <String>Mozilla/4.0 (compatible; Yahoo Japan; for robot study; kasugiya)</String>
  12210. <Description>Yahoo Japan robot (202.93.76.xx)</Description>
  12211. <Type>R</Type>
  12212. <Comment></Comment>
  12213. <Link1>http://www.yahoo.co.jp/</Link1>
  12214. <Link2></Link2>
  12215. </user-agent>
  12216. <user-agent>
  12217. <ID>id_moz_210207_1</ID>
  12218. <String>Mozilla/4.0 (compatible;MSIE 6.0; Windows NT 5.0; H010818)</String>
  12219. <Description>Faked IE id string used by DeepTrawl link checking tool</Description>
  12220. <Type>C</Type>
  12221. <Comment></Comment>
  12222. <Link1>http://deeptrawl.com/</Link1>
  12223. <Link2></Link2>
  12224. </user-agent>
  12225. <user-agent>
  12226. <ID>id_moz_896</ID>
  12227. <String>Mozilla/4.0 (fantomBrowser)</String>
  12228. <Description>spoofed referer by Fantomaster (Multiblocker) anonymity products</Description>
  12229. <Type>P</Type>
  12230. <Comment></Comment>
  12231. <Link1>http://fantomaster.com</Link1>
  12232. <Link2>http://multiblocker.com/home.html</Link2>
  12233. </user-agent>
  12234. <user-agent>
  12235. <ID>id_moz_897</ID>
  12236. <String>Mozilla/4.0 (fantomCrew Browser)</String>
  12237. <Description>spoofed referer by Fantomaster (Multiblocker) anonymity products</Description>
  12238. <Type>P</Type>
  12239. <Comment></Comment>
  12240. <Link1>http://fantomaster.com</Link1>
  12241. <Link2>http://multiblocker.com/home.html</Link2>
  12242. </user-agent>
  12243. <user-agent>
  12244. <ID>id_moz_898</ID>
  12245. <String>Mozilla/4.0 (hhjhj@yahoo.com)</String>
  12246. <Description>unknown robot from - 64.57.223.40 - 66.28.233.xxx (cogentco.com)</Description>
  12247. <Type></Type>
  12248. <Comment></Comment>
  12249. <Link1></Link1>
  12250. <Link2></Link2>
  12251. </user-agent>
  12252. <user-agent>
  12253. <ID>id_moz_899</ID>
  12254. <String>Mozilla/4.0 (JemmaTheTourist;http://www.activtourist.com)</String>
  12255. <Description>Activtourist Jemma spider</Description>
  12256. <Type>R</Type>
  12257. <Comment></Comment>
  12258. <Link1>http://www.activtourist.com</Link1>
  12259. <Link2></Link2>
  12260. </user-agent>
  12261. <user-agent>
  12262. <ID>id_moz_900</ID>
  12263. <String>Mozilla/4.0 (MobilePhone PM-8200/US/1.0) NetFront/3.x MMP/2.0</String>
  12264. <Description>NetFront (v3.x) for Pocket PC (here on Sanyo PM-8200 cell phone)</Description>
  12265. <Type>B</Type>
  12266. <Comment></Comment>
  12267. <Link1>http://nfppc.access.co.jp/english/</Link1>
  12268. <Link2></Link2>
  12269. </user-agent>
  12270. <user-agent>
  12271. <ID>id_moz_901</ID>
  12272. <String>Mozilla/4.0 (MobilePhone SCP-5500/US/1.0) NetFront/3.0 MMP/2.0 (compatible; Googlebot/2.1; http://www.google.com/bot.html)</String>
  12273. <Description>Google robot from 66.249.66.xxx </Description>
  12274. <Type>R</Type>
  12275. <Comment>s. also: - Googlebot - Mozilla/5.0 (compatible; Googlebot/2.1...</Comment>
  12276. <Link1>http://www.google.com</Link1>
  12277. <Link2></Link2>
  12278. </user-agent>
  12279. <user-agent>
  12280. <ID>id_moz_902</ID>
  12281. <String>Mozilla/4.0 (MobilePhone SCP-5500/US/1.0) NetFront/3.0 MMP/2.0 FAKE (compatible; Googlebot/2.1; http://www.google.com/bot.html)</String>
  12282. <Description>Google robot from 66.249.66.xxx </Description>
  12283. <Type>R</Type>
  12284. <Comment>s. also: - Googlebot - Mozilla/5.0 (compatible; Googlebot/2.1...</Comment>
  12285. <Link1>http://www.google.com</Link1>
  12286. <Link2></Link2>
  12287. </user-agent>
  12288. <user-agent>
  12289. <ID>id_moz_081106_1</ID>
  12290. <String>Mozilla/4.0 (Mozilla; http://www.mozilla.org/docs/en/bot.html; master@mozilla.com)</String>
  12291. <Description>Unknown robot from Mozilla.org</Description>
  12292. <Type>R</Type>
  12293. <Comment>63.209.222.xx</Comment>
  12294. <Link1>http://www.mozilla.org/</Link1>
  12295. <Link2></Link2>
  12296. </user-agent>
  12297. <user-agent>
  12298. <ID>id_moz_903</ID>
  12299. <String>Mozilla/4.0 (Sleek Spider/1.2)</String>
  12300. <Description>ASI - Any Search Info robot</Description>
  12301. <Type>R</Type>
  12302. <Comment></Comment>
  12303. <Link1>http://search-info.com/</Link1>
  12304. <Link2></Link2>
  12305. </user-agent>
  12306. <user-agent>
  12307. <ID>id_moz_170406_1</ID>
  12308. <String>Mozilla/4.0 compatible FurlBot/Furl Search 2.0 (FurlBot; http://www.furl.net; wn.furlbot@looksmart.net)</String>
  12309. <Description>Furl (Looksmart) online bookmark tool robot</Description>
  12310. <Type>R</Type>
  12311. <Comment>64.242.88.xx</Comment>
  12312. <Link1>http://www.furl.net/</Link1>
  12313. <Link2></Link2>
  12314. </user-agent>
  12315. <user-agent>
  12316. <ID>id_moz_905</ID>
  12317. <String>Mozilla/4.0 compatible ZyBorg/1.0 (wn.zyborg@looksmart.net; http://www.WISEnutbot.com)</String>
  12318. <Description>Wisenut robot</Description>
  12319. <Type>R</Type>
  12320. <Comment></Comment>
  12321. <Link1>http://www.wisenut.com/</Link1>
  12322. <Link2></Link2>
  12323. </user-agent>
  12324. <user-agent>
  12325. <ID>id_moz_906</ID>
  12326. <String>Mozilla/4.0 compatible ZyBorg/1.0 (ZyBorg@WISEnutbot.com; http://www.WISEnutbot.com)</String>
  12327. <Description>Wisenut robot</Description>
  12328. <Type>R</Type>
  12329. <Comment></Comment>
  12330. <Link1>http://www.wisenut.com/</Link1>
  12331. <Link2></Link2>
  12332. </user-agent>
  12333. <user-agent>
  12334. <ID>id_moz_907</ID>
  12335. <String>Mozilla/4.0 compatible ZyBorg/1.0 Dead Link Checker (wn.zyborg@looksmart.net; http://www.WISEnutbot.com)</String>
  12336. <Description>Wisenut robot</Description>
  12337. <Type>R</Type>
  12338. <Comment></Comment>
  12339. <Link1>http://www.wisenut.com/</Link1>
  12340. <Link2></Link2>
  12341. </user-agent>
  12342. <user-agent>
  12343. <ID>id_moz_908</ID>
  12344. <String>Mozilla/4.0 compatible ZyBorg/1.0 for Homepage (ZyBorg@WISEnutbot.com; http://www.WISEnutbot.com)</String>
  12345. <Description>Wisenut robot</Description>
  12346. <Type>R</Type>
  12347. <Comment></Comment>
  12348. <Link1>http://www.wisenut.com/</Link1>
  12349. <Link2></Link2>
  12350. </user-agent>
  12351. <user-agent>
  12352. <ID>id_moz_909</ID>
  12353. <String>Mozilla/4.0 efp@gmx.net</String>
  12354. <Description>Unknown robot from 66.230.140.xx (argon.oxeo.com) maybe an e-mail collector</Description>
  12355. <Type>S</Type>
  12356. <Comment>see also LARBIN-EXPERIMENTAL</Comment>
  12357. <Link1></Link1>
  12358. <Link2></Link2>
  12359. </user-agent>
  12360. <user-agent>
  12361. <ID>id_moz_910</ID>
  12362. <String>Mozilla/4.0 WebTV/2.6 (compatible; MSIE 4.0)</String>
  12363. <Description>WebTV</Description>
  12364. <Type>B</Type>
  12365. <Comment></Comment>
  12366. <Link1></Link1>
  12367. <Link2></Link2>
  12368. </user-agent>
  12369. <user-agent>
  12370. <ID>id_moz_904</ID>
  12371. <String>Mozilla/4.0 [en] (Ask Jeeves Corporate Spider)</String>
  12372. <Description>Ask / Ask Jeeves robot</Description>
  12373. <Type>R</Type>
  12374. <Comment></Comment>
  12375. <Link1>http://www.Ask.com</Link1>
  12376. <Link2></Link2>
  12377. </user-agent>
  12378. <user-agent>
  12379. <ID>id_moz_913</ID>
  12380. <String>Mozilla/4.0(compatible; Zealbot 1.0)</String>
  12381. <Description>LookSmart spider</Description>
  12382. <Type>R</Type>
  12383. <Comment></Comment>
  12384. <Link1>http://www.looksmart.com</Link1>
  12385. <Link2></Link2>
  12386. </user-agent>
  12387. <user-agent>
  12388. <ID>id_moz_290807_1</ID>
  12389. <String>Mozilla/4.01 (compatible; NORAD National Defence Network)</String>
  12390. <Description>HideMe - Web based anonymous proxy server service</Description>
  12391. <Type>P</Type>
  12392. <Comment></Comment>
  12393. <Link1>http://www.hideme.biz/</Link1>
  12394. <Link2>http://www.cnn.com/TECH/computing/9901/25/hacktracts.idg/index.html</Link2>
  12395. </user-agent>
  12396. <user-agent>
  12397. <ID>id_moz_914</ID>
  12398. <String>Mozilla/4.01 [en](Win95;I)</String>
  12399. <Description>Some download manager spoofing Netscape 4.01</Description>
  12400. <Type>D</Type>
  12401. <Comment></Comment>
  12402. <Link1></Link1>
  12403. <Link2></Link2>
  12404. </user-agent>
  12405. <user-agent>
  12406. <ID>id_moz_915</ID>
  12407. <String>Mozilla/4.02 [en] (X11; I; SunOS 5.6 sun4u)</String>
  12408. <Description>Netscape 4.x SunOS 5.6</Description>
  12409. <Type>B</Type>
  12410. <Comment></Comment>
  12411. <Link1></Link1>
  12412. <Link2></Link2>
  12413. </user-agent>
  12414. <user-agent>
  12415. <ID>id_moz_161105_3</ID>
  12416. <String>Mozilla/4.04 (compatible; Dulance bot; +http://www.dulance.com/bot.jsp)</String>
  12417. <Description>Dulance Bot - Dulance automated price comparison engine</Description>
  12418. <Type>R</Type>
  12419. <Comment></Comment>
  12420. <Link1>http://www.dulance.com/</Link1>
  12421. <Link2></Link2>
  12422. </user-agent>
  12423. <user-agent>
  12424. <ID>id_moz_916</ID>
  12425. <String>Mozilla/4.04 [en] (X11; I; HP-UX B.10.20 9000/712)</String>
  12426. <Description>Netscape 4.x HP-Unix</Description>
  12427. <Type>B</Type>
  12428. <Comment></Comment>
  12429. <Link1></Link1>
  12430. <Link2></Link2>
  12431. </user-agent>
  12432. <user-agent>
  12433. <ID>id_moz_917</ID>
  12434. <String>Mozilla/4.04 [en] (X11; I; IRIX 5.3 IP22)</String>
  12435. <Description>Netscape 4.x IRIX</Description>
  12436. <Type>B</Type>
  12437. <Comment></Comment>
  12438. <Link1></Link1>
  12439. <Link2></Link2>
  12440. </user-agent>
  12441. <user-agent>
  12442. <ID>id_moz_918</ID>
  12443. <String>Mozilla/4.05 (Macintosh; I; 68K Nav)</String>
  12444. <Description>Netscape 4.x Macintosh 68k</Description>
  12445. <Type>B</Type>
  12446. <Comment></Comment>
  12447. <Link1></Link1>
  12448. <Link2></Link2>
  12449. </user-agent>
  12450. <user-agent>
  12451. <ID>id_moz_919</ID>
  12452. <String>Mozilla/4.05 (Macintosh; I; PPC Nav)</String>
  12453. <Description>Netscape 4.x Macintosh PowerPC</Description>
  12454. <Type>B</Type>
  12455. <Comment></Comment>
  12456. <Link1></Link1>
  12457. <Link2></Link2>
  12458. </user-agent>
  12459. <user-agent>
  12460. <ID>id_moz_920</ID>
  12461. <String>Mozilla/4.05 [en] (X11; I; SunOS 4.1.4 sun4m)</String>
  12462. <Description>Netscape 4.x SunOS 4.1.4</Description>
  12463. <Type>B</Type>
  12464. <Comment></Comment>
  12465. <Link1></Link1>
  12466. <Link2></Link2>
  12467. </user-agent>
  12468. <user-agent>
  12469. <ID>id_moz_921</ID>
  12470. <String>Mozilla/4.08 [en] (Win98; U ;Nav)</String>
  12471. <Description>Version 4.08 [en]-98306</Description>
  12472. <Type>Someone copied the help function in the referrer field ?</Type>
  12473. <Comment></Comment>
  12474. <Link1></Link1>
  12475. <Link2></Link2>
  12476. </user-agent>
  12477. <user-agent>
  12478. <ID>id_moz_922</ID>
  12479. <String>Mozilla/4.08 [en] (WinNT; U)</String>
  12480. <Description>Netscape 4.x WinNT</Description>
  12481. <Type>B</Type>
  12482. <Comment></Comment>
  12483. <Link1></Link1>
  12484. <Link2></Link2>
  12485. </user-agent>
  12486. <user-agent>
  12487. <ID>id_moz_911</ID>
  12488. <String>Mozilla/4.0_(compatible;_MSIE_5.0;_Windows_95)_TrueRobot/1.4 libwww/5.2.8</String>
  12489. <Description>Echo.com robot</Description>
  12490. <Type>R</Type>
  12491. <Comment></Comment>
  12492. <Link1>http://www.echo.com</Link1>
  12493. <Link2></Link2>
  12494. </user-agent>
  12495. <user-agent>
  12496. <ID>id_moz_912</ID>
  12497. <String>Mozilla/4.0_(compatible;_MSIE_5.0;_Windows_95)_VoilaBot/1.6 libwww/5.3.2</String>
  12498. <Description>Voila.fr robot</Description>
  12499. <Type>R</Type>
  12500. <Comment></Comment>
  12501. <Link1>http://www.voila.fr</Link1>
  12502. <Link2></Link2>
  12503. </user-agent>
  12504. <user-agent>
  12505. <ID>id_moz_923</ID>
  12506. <String>Mozilla/4.5 (compatible; HTTrack 3.0x; Windows 98)</String>
  12507. <Description>HTTrack Offline Browser</Description>
  12508. <Type>B D</Type>
  12509. <Comment></Comment>
  12510. <Link1>http://www.httrack.com/</Link1>
  12511. <Link2></Link2>
  12512. </user-agent>
  12513. <user-agent>
  12514. <ID>id_moz_924</ID>
  12515. <String>Mozilla/4.5 (compatible; iCab 2.5.3; Macintosh; I; PPC)</String>
  12516. <Description>iCab MAC Web browser MAC Power PC</Description>
  12517. <Type>B</Type>
  12518. <Comment></Comment>
  12519. <Link1>http://www.icab.de</Link1>
  12520. <Link2></Link2>
  12521. </user-agent>
  12522. <user-agent>
  12523. <ID>id_moz_925</ID>
  12524. <String>Mozilla/4.5 (compatible; OmniWeb/4.0.5; Mac_PowerPC)</String>
  12525. <Description>OmniWeb 4.x.x Mac browser</Description>
  12526. <Type>B</Type>
  12527. <Comment></Comment>
  12528. <Link1>http://www.omnigroup.com</Link1>
  12529. <Link2></Link2>
  12530. </user-agent>
  12531. <user-agent>
  12532. <ID>id_moz_926</ID>
  12533. <String>Mozilla/4.5 (compatible; OmniWeb/4.1-beta-1; Mac_PowerPC)</String>
  12534. <Description>OmniWeb 4.x.x Mac browser</Description>
  12535. <Type>B</Type>
  12536. <Comment></Comment>
  12537. <Link1>http://www.omnigroup.com</Link1>
  12538. <Link2></Link2>
  12539. </user-agent>
  12540. <user-agent>
  12541. <ID>id_moz_928</ID>
  12542. <String>Mozilla/4.5 RPT-HTTPClient/0.3-2</String>
  12543. <Description>different IPs using the HTTPClient library (mostly link checking)</Description>
  12544. <Type>C R</Type>
  12545. <Comment></Comment>
  12546. <Link1>http://www.innovation.ch</Link1>
  12547. <Link2></Link2>
  12548. </user-agent>
  12549. <user-agent>
  12550. <ID>id_moz_927</ID>
  12551. <String>Mozilla/4.5 [en]C-CCK-MCD {RuralNet} (Win98; I)</String>
  12552. <Description>RuralNet Internet Services</Description>
  12553. <Type>B</Type>
  12554. <Comment></Comment>
  12555. <Link1>http://www.ruralnet.net.au</Link1>
  12556. <Link2></Link2>
  12557. </user-agent>
  12558. <user-agent>
  12559. <ID>id_moz_929</ID>
  12560. <String>Mozilla/4.5b1 [en] (X11; I; Linux 2.0.35 i586)</String>
  12561. <Description>Netscape 4.x Linux</Description>
  12562. <Type>B</Type>
  12563. <Comment></Comment>
  12564. <Link1></Link1>
  12565. <Link2></Link2>
  12566. </user-agent>
  12567. <user-agent>
  12568. <ID>id_moz_301105_3</ID>
  12569. <String>Mozilla/4.6 [en] (http://www.cnet.com/)</String>
  12570. <Description>Cnet robot for Search.com (216.239.114.xx)</Description>
  12571. <Type>R</Type>
  12572. <Comment></Comment>
  12573. <Link1>http://www.search.com/</Link1>
  12574. <Link2>http://www.cnet.com/</Link2>
  12575. </user-agent>
  12576. <user-agent>
  12577. <ID>id_moz_930</ID>
  12578. <String>Mozilla/4.61 [de] (OS/2; I)</String>
  12579. <Description>Netscape 4.x OS/2</Description>
  12580. <Type>B</Type>
  12581. <Comment></Comment>
  12582. <Link1></Link1>
  12583. <Link2></Link2>
  12584. </user-agent>
  12585. <user-agent>
  12586. <ID>id_moz_931</ID>
  12587. <String>Mozilla/4.61 [en] (X11; U; ) - BrowseX (2.0.0 Windows)</String>
  12588. <Description>BrowseX cross-platform browser</Description>
  12589. <Type>B</Type>
  12590. <Comment></Comment>
  12591. <Link1>http://browsex.com/</Link1>
  12592. <Link2></Link2>
  12593. </user-agent>
  12594. <user-agent>
  12595. <ID>id_moz_932</ID>
  12596. <String>Mozilla/4.7</String>
  12597. <Description>Nameprotect (12.148.196.128 - 12.148.196.255) snoopbot</Description>
  12598. <Type>R</Type>
  12599. <Comment></Comment>
  12600. <Link1>http://www.nameprotect.com</Link1>
  12601. <Link2></Link2>
  12602. </user-agent>
  12603. <user-agent>
  12604. <ID>id_moz_933</ID>
  12605. <String>Mozilla/4.7 (compatible; http://eidetica.com/spider)</String>
  12606. <Description>Eidetica search and text mining spider</Description>
  12607. <Type>R</Type>
  12608. <Comment></Comment>
  12609. <Link1>http://eidetica.com/</Link1>
  12610. <Link2></Link2>
  12611. </user-agent>
  12612. <user-agent>
  12613. <ID>id_moz_934</ID>
  12614. <String>Mozilla/4.7 (compatible; Intelliseek; http://www.intelliseek.com)</String>
  12615. <Description>Intelliseek (64.158.138.xx) robot</Description>
  12616. <Type>R</Type>
  12617. <Comment></Comment>
  12618. <Link1>http://www.intelliseek.com</Link1>
  12619. <Link2></Link2>
  12620. </user-agent>
  12621. <user-agent>
  12622. <ID>id_moz_935</ID>
  12623. <String>Mozilla/4.7 (compatible; OffByOne; Windows 98) Webster Pro V3.2</String>
  12624. <Description>OffByOne Browser</Description>
  12625. <Type>B</Type>
  12626. <Comment></Comment>
  12627. <Link1>http://www.offbyone.com</Link1>
  12628. <Link2></Link2>
  12629. </user-agent>
  12630. <user-agent>
  12631. <ID>id_moz_937</ID>
  12632. <String>Mozilla/4.7 (compatible; Whizbang)</String>
  12633. <Description>WhizBang! Labs information extraction robot</Description>
  12634. <Type>R</Type>
  12635. <Comment>closed since May 2002</Comment>
  12636. <Link1>http://www.whizbang.com</Link1>
  12637. <Link2></Link2>
  12638. </user-agent>
  12639. <user-agent>
  12640. <ID>id_moz_936</ID>
  12641. <String>Mozilla/4.7 (compatible; WhizBang; http://www.whizbang.com/crawler)</String>
  12642. <Description>WhizBang! Labs information extraction robot</Description>
  12643. <Type>R</Type>
  12644. <Comment>closed since May 2002</Comment>
  12645. <Link1>http://www.whizbang.com</Link1>
  12646. <Link2></Link2>
  12647. </user-agent>
  12648. <user-agent>
  12649. <ID>id_moz_938</ID>
  12650. <String>Mozilla/4.7 [en](BecomeBot@exava.com)</String>
  12651. <Description>BecomeBot - Become.com shopping search (64.124.85.xx(x))</Description>
  12652. <Type>R</Type>
  12653. <Comment>64.124.85.[x]xx</Comment>
  12654. <Link1>http://www.become.com</Link1>
  12655. <Link2></Link2>
  12656. </user-agent>
  12657. <user-agent>
  12658. <ID>id_moz_939</ID>
  12659. <String>Mozilla/4.7 [en](Exabot@exava.com)</String>
  12660. <Description>Exabot - exava shopping search (64.124.85.xx(x))</Description>
  12661. <Type>R</Type>
  12662. <Comment></Comment>
  12663. <Link1>http://www.exava.com</Link1>
  12664. <Link2></Link2>
  12665. </user-agent>
  12666. <user-agent>
  12667. <ID>id_moz_940</ID>
  12668. <String>Mozilla/4.7 [en]C-CCK-MCD {Yahoo;YIP052400} (Win95; I)</String>
  12669. <Description>unknown</Description>
  12670. <Type></Type>
  12671. <Comment></Comment>
  12672. <Link1></Link1>
  12673. <Link2></Link2>
  12674. </user-agent>
  12675. <user-agent>
  12676. <ID>id_moz_941</ID>
  12677. <String>Mozilla/4.72 [en] (BACS http://www.ba.be)</String>
  12678. <Description>http://www.ba.be robot</Description>
  12679. <Type>R</Type>
  12680. <Comment></Comment>
  12681. <Link1>http://www.ba.be</Link1>
  12682. <Link2></Link2>
  12683. </user-agent>
  12684. <user-agent>
  12685. <ID>id_moz_942</ID>
  12686. <String>Mozilla/4.72C-CCK-MCD Caldera Systems OpenLinux [en] (X11; U; Linux 2.2.14 i686)</String>
  12687. <Description>Netscape 4.7x Caldera Open Linux Pentium III</Description>
  12688. <Type>B</Type>
  12689. <Comment></Comment>
  12690. <Link1></Link1>
  12691. <Link2></Link2>
  12692. </user-agent>
  12693. <user-agent>
  12694. <ID>id_moz_943</ID>
  12695. <String>Mozilla/4.75C-ja [ja] (X11; U; OSF1 V5.1 alpha)</String>
  12696. <Description>Netscape 4.7x Japan OSF1 alpha</Description>
  12697. <Type>B</Type>
  12698. <Comment></Comment>
  12699. <Link1></Link1>
  12700. <Link2></Link2>
  12701. </user-agent>
  12702. <user-agent>
  12703. <ID>id_moz_944</ID>
  12704. <String>Mozilla/4.76 (Windows 98; U) Opera 5.12 [en]</String>
  12705. <Description>Opera 5.x Win 98</Description>
  12706. <Type>B</Type>
  12707. <Comment></Comment>
  12708. <Link1></Link1>
  12709. <Link2></Link2>
  12710. </user-agent>
  12711. <user-agent>
  12712. <ID>id_moz_945</ID>
  12713. <String>Mozilla/4.76 [en] (X11; U; FreeBSD 4.4-STABLE i386)</String>
  12714. <Description>Netscape 4.7x FreeBSD</Description>
  12715. <Type>B</Type>
  12716. <Comment></Comment>
  12717. <Link1></Link1>
  12718. <Link2></Link2>
  12719. </user-agent>
  12720. <user-agent>
  12721. <ID>id_moz_946</ID>
  12722. <String>Mozilla/4.76 [en] (X11; U; SunOS 5.7 sun4u)</String>
  12723. <Description>Netscape 4.7x SunOS</Description>
  12724. <Type>B</Type>
  12725. <Comment></Comment>
  12726. <Link1></Link1>
  12727. <Link2></Link2>
  12728. </user-agent>
  12729. <user-agent>
  12730. <ID>id_moz_947</ID>
  12731. <String>Mozilla/4.77C-SGI [en] (X11; U; IRIX 6.5 IP32)</String>
  12732. <Description>IRIX 6.5</Description>
  12733. <Type>B</Type>
  12734. <Comment></Comment>
  12735. <Link1></Link1>
  12736. <Link2></Link2>
  12737. </user-agent>
  12738. <user-agent>
  12739. <ID>id_moz_948</ID>
  12740. <String>Mozilla/5.0</String>
  12741. <Description>GigaMedia / NTT DoCoMo robot</Description>
  12742. <Type>R</Type>
  12743. <Comment></Comment>
  12744. <Link1>http://ir.giga.net.tw/products.htm</Link1>
  12745. <Link2></Link2>
  12746. </user-agent>
  12747. <user-agent>
  12748. <ID>id_moz_040707_3</ID>
  12749. <String>Mozilla/5.0 (+http://www.eurekster.com/mammoth) Mammoth/0.1</String>
  12750. <Description>Eurekster Swicki community search using SLI-Systems site search engine Mammoth</Description>
  12751. <Type>R</Type>
  12752. <Comment>64.106.253.1xx</Comment>
  12753. <Link1>http://www.eurekster.com/</Link1>
  12754. <Link2>http://www.sli-systems.com/</Link2>
  12755. </user-agent>
  12756. <user-agent>
  12757. <ID>id_moz_240306_2</ID>
  12758. <String>Mozilla/5.0 (+http://www.sli-systems.com/) Mammoth/0.1</String>
  12759. <Description>SLI Systems mammoth robot</Description>
  12760. <Type>R</Type>
  12761. <Comment>s. also mammoth/1.0 ...</Comment>
  12762. <Link1>http://www.sli-systems.com/</Link1>
  12763. <Link2>http://www.tenspider.com/business-blog/more.php?id=A45_0_1_0_M</Link2>
  12764. </user-agent>
  12765. <user-agent>
  12766. <ID>id_moz_949</ID>
  12767. <String>Mozilla/5.0 (Clustered-Search-Bot/1.0; support@clush.com; http://www.clush.com/)</String>
  12768. <Description>Clush search robot</Description>
  12769. <Type>R</Type>
  12770. <Comment></Comment>
  12771. <Link1>http://www.clush.com</Link1>
  12772. <Link2></Link2>
  12773. </user-agent>
  12774. <user-agent>
  12775. <ID>id_moz_020807_1</ID>
  12776. <String>Mozilla/5.0 (compatible) GM RSS Panel X</String>
  12777. <Description>Greasemonkey RSS panel Firefox plugin</Description>
  12778. <Type>B</Type>
  12779. <Comment></Comment>
  12780. <Link1>http://www.xs4all.nl/~jlpoutre/BoT/Javascript/RSSpanel/</Link1>
  12781. <Link2></Link2>
  12782. </user-agent>
  12783. <user-agent>
  12784. <ID>id_moz_140209_3</ID>
  12785. <String>Mozilla/5.0 (compatible; +http://www.evri.com/evrinid)</String>
  12786. <Description>Evri search robot</Description>
  12787. <Type>R</Type>
  12788. <Comment>216.168.43.1xx</Comment>
  12789. <Link1>http://www.evri.com/</Link1>
  12790. <Link2></Link2>
  12791. </user-agent>
  12792. <user-agent>
  12793. <ID>id_new_250310_1</ID>
  12794. <String>Mozilla/5.0 (compatible; 008/0.83; http://www.80legs.com/spider.html;) Gecko/2008032620</String>
  12795. <Description>008 distributed crawler for 80legs</Description>
  12796. <Type>R</Type>
  12797. <Comment></Comment>
  12798. <Link1>http://www.80legs.com/spider.html</Link1>
  12799. <Link2></Link2>
  12800. </user-agent>
  12801. <user-agent>
  12802. <ID>id_moz_140209_4</ID>
  12803. <String>Mozilla/5.0 (compatible; Abonti/0.8 - http://www.abonti.com)</String>
  12804. <Description>Abonti WebSearch beta robot</Description>
  12805. <Type>R</Type>
  12806. <Comment>77.233.225.11x</Comment>
  12807. <Link1>http://www.abonti.com/</Link1>
  12808. <Link2></Link2>
  12809. </user-agent>
  12810. <user-agent>
  12811. <ID>id_moz_030110_4</ID>
  12812. <String>Mozilla/5.0 (compatible; aiHitBot/1.0; +http://www.aihit.com/)</String>
  12813. <Description>HitCompanies Aihit crawler</Description>
  12814. <Type>R</Type>
  12815. <Comment>195.128.18.xx</Comment>
  12816. <Link1>http://hitcompanies.aihit.com/search.htm</Link1>
  12817. <Link2></Link2>
  12818. </user-agent>
  12819. <user-agent>
  12820. <ID>id_moz_300406_1</ID>
  12821. <String>Mozilla/5.0 (compatible; AnsearchBot/1.x; +http://www.ansearch.com.au/)</String>
  12822. <Description>Ansearch Australian search robot</Description>
  12823. <Type>R</Type>
  12824. <Comment>203.206.162.x</Comment>
  12825. <Link1>http://www.ansearch.com.au/</Link1>
  12826. <Link2></Link2>
  12827. </user-agent>
  12828. <user-agent>
  12829. <ID>id_moz_011107_1</ID>
  12830. <String>Mozilla/5.0 (compatible; archive.org_bot/1.10.0 +http://www.loc.gov/minerva/crawl.html)</String>
  12831. <Description>The Library of Congress Minerva crawler</Description>
  12832. <Type>R</Type>
  12833. <Comment>207.241.232.1xx</Comment>
  12834. <Link1>http://www.loc.gov/minerva/crawl.html</Link1>
  12835. <Link2></Link2>
  12836. </user-agent>
  12837. <user-agent>
  12838. <ID>id_moz_230607_2</ID>
  12839. <String>Mozilla/5.0 (compatible; archive.org_bot/1.13.1x http://crawler.archive.org)</String>
  12840. <Description>Heritrix - The Internet Archive's open-source crawler (207.241.225.2xx)</Description>
  12841. <Type>R</Type>
  12842. <Comment>s.also - InternetArchive/0.8-dev - Mozilla/5.0 (compatible;archive.org_bot/...</Comment>
  12843. <Link1>http://www.archive.org/</Link1>
  12844. <Link2></Link2>
  12845. </user-agent>
  12846. <user-agent>
  12847. <ID>id_moz_141105_1</ID>
  12848. <String>Mozilla/5.0 (compatible; archive.org_bot/1.5.0-200506132127 http://crawler.archive.org) Hurricane Katrina</String>
  12849. <Description>Heritrix - The Internet Archive's open-source crawler</Description>
  12850. <Type>R</Type>
  12851. <Comment>s. also - InternetArchive/0.8-dev... - mozilla/5.0 (compatible; heritrix/...</Comment>
  12852. <Link1>http://www.archive.org/</Link1>
  12853. <Link2></Link2>
  12854. </user-agent>
  12855. <user-agent>
  12856. <ID>id_moz_150207_2</ID>
  12857. <String>Mozilla/5.0 (compatible; Ask Jeeves/Teoma;  http://about.ask.com/en/docs/about/webmasters.shtml)</String>
  12858. <Description>Ask Jeeves /Teoma robot</Description>
  12859. <Type>R</Type>
  12860. <Comment> 65.214.45.[x]xx</Comment>
  12861. <Link1>http://sp.ask.com</Link1>
  12862. <Link2></Link2>
  12863. </user-agent>
  12864. <user-agent>
  12865. <ID>id_moz_291205_2</ID>
  12866. <String>Mozilla/5.0 (compatible; BanBots/2.0b; Fetch; +http://www.banbots.com)</String>
  12867. <Description>Project BanBots Perl script robot</Description>
  12868. <Type>C</Type>
  12869. <Comment>s. also BanBots/1.2...</Comment>
  12870. <Link1>http://www.banbots.com/</Link1>
  12871. <Link2></Link2>
  12872. </user-agent>
  12873. <user-agent>
  12874. <ID>id_moz_950</ID>
  12875. <String>Mozilla/5.0 (compatible; BecomeBot/1.23; http://www.become.com/webmasters.html)</String>
  12876. <Description>BecomeBot - Become.com shopping search (64.124.85.xx(x))</Description>
  12877. <Type>R</Type>
  12878. <Comment>64.124.85.[x]xx</Comment>
  12879. <Link1>http://www.become.com</Link1>
  12880. <Link2></Link2>
  12881. </user-agent>
  12882. <user-agent>
  12883. <ID>id_moz_951</ID>
  12884. <String>Mozilla/5.0 (compatible; BecomeBot/1.xx; MSIE 6.0 compatible; http://www.become.com/webmasters.html)</String>
  12885. <Description>BecomeBot - Become.com shopping search (64.124.85.xx(x))</Description>
  12886. <Type>R</Type>
  12887. <Comment>64.124.85.[x]xx</Comment>
  12888. <Link1>http://www.become.com</Link1>
  12889. <Link2></Link2>
  12890. </user-agent>
  12891. <user-agent>
  12892. <ID>id_moz_952</ID>
  12893. <String>Mozilla/5.0 (compatible; BecomeBot/2.0beta; http://www.become.com/webmasters.html)</String>
  12894. <Description>BecomeBot - Become.com shopping search (64.124.85.xx(x))</Description>
  12895. <Type>R</Type>
  12896. <Comment>64.124.85.[x]xx</Comment>
  12897. <Link1>http://www.become.com</Link1>
  12898. <Link2></Link2>
  12899. </user-agent>
  12900. <user-agent>
  12901. <ID>id_moz_953</ID>
  12902. <String>Mozilla/5.0 (compatible; BecomeBot/2.x; MSIE 6.0 compatible; http://www.become.com/site_owners.html)</String>
  12903. <Description>BecomeBot - Become.com shopping search (64.124.85.xx(x))</Description>
  12904. <Type>R</Type>
  12905. <Comment>64.124.85.[x]xx</Comment>
  12906. <Link1>http://www.become.com</Link1>
  12907. <Link2></Link2>
  12908. </user-agent>
  12909. <user-agent>
  12910. <ID>id_moz_090506_2</ID>
  12911. <String>Mozilla/5.0 (compatible; BecomeJPBot/2.3; MSIE 6.0 compatible; +http://www.become.co.jp/site_owners.html)</String>
  12912. <Description>BecomeBot - Become.com shopping search (64.124.85.xx(x))</Description>
  12913. <Type>R</Type>
  12914. <Comment>64.124.85.[x]xx</Comment>
  12915. <Link1>http://www.become.com</Link1>
  12916. <Link2></Link2>
  12917. </user-agent>
  12918. <user-agent>
  12919. <ID>id_moz_020907_1</ID>
  12920. <String>Mozilla/5.0 (compatible; BlogRefsBot/0.1; http://www.blogrefs.com/about/bloggers)</String>
  12921. <Description>BlogRefsBot.com blog robot</Description>
  12922. <Type>R</Type>
  12923. <Comment>69.90.42.xx</Comment>
  12924. <Link1>http://www.blogrefs.com/</Link1>
  12925. <Link2>http://www.blogrefs.com/about/bloggers</Link2>
  12926. </user-agent>
  12927. <user-agent>
  12928. <ID>id_moz_171107_1</ID>
  12929. <String>Mozilla/5.0 (compatible; Bot; +http://pressemitteilung.ws/spamfilter</String>
  12930. <Description>Pressemitteilungen Webservice RSS / news crawler (Germany)</Description>
  12931. <Type>R</Type>
  12932. <Comment>87.164.242.1xx</Comment>
  12933. <Link1>http://pressemitteilung.ws/</Link1>
  12934. <Link2></Link2>
  12935. </user-agent>
  12936. <user-agent>
  12937. <ID>id_moz_031206_1</ID>
  12938. <String>Mozilla/5.0 (compatible; BuzzRankingBot/1.0; +http://www.buzzrankingbot.com/)</String>
  12939. <Description>BuzzRanking internet content analysis</Description>
  12940. <Type>R</Type>
  12941. <Comment>213.251.187.1xx</Comment>
  12942. <Link1>http://www.buzzrankingbot.com/</Link1>
  12943. <Link2></Link2>
  12944. </user-agent>
  12945. <user-agent>
  12946. <ID>id_moz_310506_1</ID>
  12947. <String>Mozilla/5.0 (compatible; Charlotte/1.0b; charlotte@betaspider.com)</String>
  12948. <Description>Charlotte indexing spider for Searchme / Wikiseek</Description>
  12949. <Type>R</Type>
  12950. <Comment>209.249.86.x</Comment>
  12951. <Link1>http://www.searchme.com/</Link1>
  12952. <Link2>http://www.wikiseek.com/</Link2>
  12953. </user-agent>
  12954. <user-agent>
  12955. <ID>id_moz_080307_1</ID>
  12956. <String>Mozilla/5.0 (compatible; Charlotte/1.0b; http://www.searchme.com/support/)</String>
  12957. <Description>Charlotte indexing spider for Searchme / Wikiseek</Description>
  12958. <Type>R</Type>
  12959. <Comment>209.249.86.x</Comment>
  12960. <Link1>http://www.searchme.com/</Link1>
  12961. <Link2>http://www.wikiseek.com/</Link2>
  12962. </user-agent>
  12963. <user-agent>
  12964. <ID>id_moz_220106_1</ID>
  12965. <String>Mozilla/5.0 (compatible; Crawling jpeg; http://www.yama.info.waseda.ac.jp)</String>
  12966. <Description>Unknown graphics crawler or downloading agent from Yamana Laboratory - Waseda University Japan (133.9.238.xx)</Description>
  12967. <Type>R</Type>
  12968. <Comment>doesn't read robots.txt</Comment>
  12969. <Link1>http://www.yama.info.waseda.ac.jp/eng/index.html</Link1>
  12970. <Link2></Link2>
  12971. </user-agent>
  12972. <user-agent>
  12973. <ID>id_moz_954</ID>
  12974. <String>Mozilla/5.0 (compatible; Custo 3 (Netwu.com); Windows NT 5.1)</String>
  12975. <Description>Custo web site spidering tool (link checking)</Description>
  12976. <Type>C</Type>
  12977. <Comment>s. also - Custo x.x (www.netwu.com)</Comment>
  12978. <Link1>http://www.netwu.com</Link1>
  12979. <Link2></Link2>
  12980. </user-agent>
  12981. <user-agent>
  12982. <ID>id_moz_071207_1</ID>
  12983. <String>Mozilla/5.0 (compatible; de/1.13.2 +http://www.de.com)</String>
  12984. <Description>De.com German travel related search via Amazon Web Services</Description>
  12985. <Type>R</Type>
  12986. <Comment>67.202.29.xx</Comment>
  12987. <Link1>http://www.de.com/start.php?homepage=true</Link1>
  12988. <Link2>http://www.amazon.com/gp/browse.html?node=3435361</Link2>
  12989. </user-agent>
  12990. <user-agent>
  12991. <ID>id_moz_170109_1</ID>
  12992. <String>Mozilla/5.0 (compatible; Diffbot/0.1; +http://www.diffbot.com)</String>
  12993. <Description>Diffbot beta - RSS and news feed crawler</Description>
  12994. <Type>R</Type>
  12995. <Comment>64.71.190.13x</Comment>
  12996. <Link1>http://www.diffbot.com/</Link1>
  12997. <Link2></Link2>
  12998. </user-agent>
  12999. <user-agent>
  13000. <ID>id_moz_030207_1</ID>
  13001. <String>Mozilla/5.0 (compatible; DNS-Digger-Explorer/1.0; +http://www.dnsdigger.com)</String>
  13002. <Description>DNS-Digger - DNS server neighbourhood search</Description>
  13003. <Type>R</Type>
  13004. <Comment>212.214.165.2xx</Comment>
  13005. <Link1>http://www.dnsdigger.com/</Link1>
  13006. <Link2></Link2>
  13007. </user-agent>
  13008. <user-agent>
  13009. <ID>id_moz_100606_2</ID>
  13010. <String>Mozilla/5.0 (compatible; DNS-Digger/1.0; +http://www.dnsdigger.com)</String>
  13011. <Description>DNS-Digger - DNS server neighbourhood search</Description>
  13012. <Type>R</Type>
  13013. <Comment>212.214.165.2xx</Comment>
  13014. <Link1>http://www.dnsdigger.com/</Link1>
  13015. <Link2></Link2>
  13016. </user-agent>
  13017. <user-agent>
  13018. <ID>id_moz_020506_1</ID>
  13019. <String>Mozilla/5.0 (compatible; EARTHCOM.info/2.01; http://www.earthcom.info)</String>
  13020. <Description>Earthcom (Czech Republic) search robot (194.108.39.xx)</Description>
  13021. <Type>R</Type>
  13022. <Comment>s. also EARTHCOM ..</Comment>
  13023. <Link1>http://www.earthcom.info</Link1>
  13024. <Link2></Link2>
  13025. </user-agent>
  13026. <user-agent>
  13027. <ID>id_moz_190807_3</ID>
  13028. <String>Mozilla/5.0 (compatible; EARTHCOM/2.2; +http://enter4u.eu)</String>
  13029. <Description>enter4u / Earthcom.info search (Czech Republic)</Description>
  13030. <Type>R</Type>
  13031. <Comment></Comment>
  13032. <Link1>http://enter4u.eu/</Link1>
  13033. <Link2>http://www.earthcom.info</Link2>
  13034. </user-agent>
  13035. <user-agent>
  13036. <ID>id_moz_050107_1</ID>
  13037. <String>Mozilla/5.0 (compatible; egothor/8.0g; +http://ego.ms.mff.cuni.cz/)</String>
  13038. <Description>Prague Faculty of Mathematics and Physics using Egothor open source crawler</Description>
  13039. <Type>P</Type>
  13040. <Comment>195.113.20.125</Comment>
  13041. <Link1>http://ego.ms.mff.cuni.cz/</Link1>
  13042. <Link2>http://www.egothor.org/</Link2>
  13043. </user-agent>
  13044. <user-agent>
  13045. <ID>id_moz_310507_1</ID>
  13046. <String>Mozilla/5.0 (compatible; Exabot Test/3.0; +http://www.exabot.com/go/robot)</String>
  13047. <Description>Exalead (France) search robot (193.47.80.xx)</Description>
  13048. <Type>R</Type>
  13049. <Comment>s. Harvest-NG/1.0.2 and Exalead NG...</Comment>
  13050. <Link1>http://www.exabot.com/</Link1>
  13051. <Link2></Link2>
  13052. </user-agent>
  13053. <user-agent>
  13054. <ID>id_moz_221207_1</ID>
  13055. <String>Mozilla/5.0 (compatible; FatBot 2.0; http://www.thefind.com/main/CrawlerFAQs.fhtml)</String>
  13056. <Description>TheFind.com - Shopping search robot</Description>
  13057. <Type>R</Type>
  13058. <Comment>64.124.148.xx[x]</Comment>
  13059. <Link1>http://www.thefind.com/</Link1>
  13060. <Link2></Link2>
  13061. </user-agent>
  13062. <user-agent>
  13063. <ID>id_moz_170109_2</ID>
  13064. <String>Mozilla/5.0 (compatible; Galbot/1.0; +http://www.galbot.com/bot.html)</String>
  13065. <Description>Galbot tagging robot (beta) - Denmark</Description>
  13066. <Type>R</Type>
  13067. <Comment></Comment>
  13068. <Link1>http://www.galbot.com/</Link1>
  13069. <Link2></Link2>
  13070. </user-agent>
  13071. <user-agent>
  13072. <ID>id_moz_955</ID>
  13073. <String>mozilla/5.0 (compatible; genevabot http://www.healthdash.com)</String>
  13074. <Description>Geneva Single-Site Search Engine used by Healthdash health search</Description>
  13075. <Type>R</Type>
  13076. <Comment></Comment>
  13077. <Link1>http://www.healthdash.com</Link1>
  13078. <Link2></Link2>
  13079. </user-agent>
  13080. <user-agent>
  13081. <ID>id_moz_170207_4</ID>
  13082. <String>Mozilla/5.0 (compatible; Google Desktop) Paros/3.2.12</String>
  13083. <Description>Paros - a Java based HTTP/HTTPS proxy</Description>
  13084. <Type>P</Type>
  13085. <Comment></Comment>
  13086. <Link1>http://sourceforge.net/projects/paros</Link1>
  13087. <Link2></Link2>
  13088. </user-agent>
  13089. <user-agent>
  13090. <ID>id_moz_956</ID>
  13091. <String>Mozilla/5.0 (compatible; Googlebot/2.1; http://www.google.com/bot.html)</String>
  13092. <Description>Google robot</Description>
  13093. <Type>R</Type>
  13094. <Comment>s. also: - Googlebot - Mozilla/4.0 (MobilePhone SCP ...</Comment>
  13095. <Link1>http://www.google.com</Link1>
  13096. <Link2></Link2>
  13097. </user-agent>
  13098. <user-agent>
  13099. <ID>id_moz_957</ID>
  13100. <String>mozilla/5.0 (compatible; heritrix/1.0.4 http://innovationblog.com)</String>
  13101. <Description>Unknown robot using Heritrix</Description>
  13102. <Type>R</Type>
  13103. <Comment></Comment>
  13104. <Link1>http://innovationblog.com</Link1>
  13105. <Link2>http://crawler.archive.org/</Link2>
  13106. </user-agent>
  13107. <user-agent>
  13108. <ID>id_moz_280207_1</ID>
  13109. <String>Mozilla/5.0 (compatible; heritrix/1.10.2 +http://i.stanford.edu/)</String>
  13110. <Description>The Stanford University InfoLab robot using Heritrix</Description>
  13111. <Type>R</Type>
  13112. <Comment>171.67.73.1x</Comment>
  13113. <Link1>http://i.stanford.edu/</Link1>
  13114. <Link2>http://www.archive.org/</Link2>
  13115. </user-agent>
  13116. <user-agent>
  13117. <ID>id_moz_280108_2</ID>
  13118. <String>Mozilla/5.0 (compatible; heritrix/1.12.1 +http://newstin.com/)</String>
  13119. <Description>Newstin news feed search using Heritrix</Description>
  13120. <Type>R</Type>
  13121. <Comment>195.39.35.1xx</Comment>
  13122. <Link1>http://www.newstin.com/</Link1>
  13123. <Link2></Link2>
  13124. </user-agent>
  13125. <user-agent>
  13126. <ID>id_moz_210807_1</ID>
  13127. <String>Mozilla/5.0 (compatible; heritrix/1.12.1 +http://www.page-store.com)</String>
  13128. <Description>Page-store.com vertical search via Amazon Web Services</Description>
  13129. <Type>R</Type>
  13130. <Comment>72.44.62.1xx</Comment>
  13131. <Link1>http://www.page-store.com/</Link1>
  13132. <Link2>http://www.amazonaws.com/</Link2>
  13133. </user-agent>
  13134. <user-agent>
  13135. <ID>id_moz_230108_1</ID>
  13136. <String>Mozilla/5.0 (compatible; heritrix/1.12.1 +http://www.page-store.com) [email:paul@page-store.com]</String>
  13137. <Description>Page-store.com vertical search via Amazon Web Services</Description>
  13138. <Type>R</Type>
  13139. <Comment>72.44.62.1xx</Comment>
  13140. <Link1>http://www.page-store.com/</Link1>
  13141. <Link2>http://www.amazonaws.com/</Link2>
  13142. </user-agent>
  13143. <user-agent>
  13144. <ID>id_moz_958</ID>
  13145. <String>mozilla/5.0 (compatible; heritrix/1.3.0 http://archive.crawler.org)</String>
  13146. <Description>Heritrix Internet Archive's open-source web project </Description>
  13147. <Type>R</Type>
  13148. <Comment></Comment>
  13149. <Link1>http://archive.crawler.org</Link1>
  13150. <Link2></Link2>
  13151. </user-agent>
  13152. <user-agent>
  13153. <ID>id_moz_270106_2</ID>
  13154. <String>Mozilla/5.0 (compatible; heritrix/1.4.0 +http://www.chepi.net)</String>
  13155. <Description>Chepi Beta search Spain (194.116.240.1xx) using Heritrix</Description>
  13156. <Type>R</Type>
  13157. <Comment></Comment>
  13158. <Link1>http://www.chepi.net/</Link1>
  13159. <Link2>http://lucene.apache.org</Link2>
  13160. </user-agent>
  13161. <user-agent>
  13162. <ID>id_moz_959</ID>
  13163. <String>Mozilla/5.0 (compatible; heritrix/1.4t http://www.truveo.com/)</String>
  13164. <Description>Truveo data mining robot using Heritrix</Description>
  13165. <Type>R</Type>
  13166. <Comment></Comment>
  13167. <Link1>http://www.truveo.com/home/</Link1>
  13168. <Link2>http://crawler.archive.org/</Link2>
  13169. </user-agent>
  13170. <user-agent>
  13171. <ID>id_moz_960</ID>
  13172. <String>Mozilla/5.0 (compatible; heritrix/1.5.0 http://www.l3s.de/~kohlschuetter/projects/crawling/)</String>
  13173. <Description>L3S WebCrawling Project (Germany) using Heritrix</Description>
  13174. <Type>R</Type>
  13175. <Comment></Comment>
  13176. <Link1>http://www.l3s.de/~kohlschuetter/projects/crawling/</Link1>
  13177. <Link2>http://crawler.archive.org/</Link2>
  13178. </user-agent>
  13179. <user-agent>
  13180. <ID>id_moz_961</ID>
  13181. <String>Mozilla/5.0 (compatible; heritrix/1.5.0-200506231921 http://pandora.nla.gov.au/crawl.html)</String>
  13182. <Description>Pandora Internet Archive crawler (Australia) using Heritrix</Description>
  13183. <Type>R</Type>
  13184. <Comment></Comment>
  13185. <Link1>http://pandora.nla.gov.au</Link1>
  13186. <Link2>http://crawler.archive.org/</Link2>
  13187. </user-agent>
  13188. <user-agent>
  13189. <ID>id_moz_250706_3</ID>
  13190. <String>Mozilla/5.0 (compatible; heritrix/1.6.0 http://www.worio.com/)</String>
  13191. <Description>WORIO (beta) search for computer scientists and programmers using Heritrix open-source crawler</Description>
  13192. <Type>R</Type>
  13193. <Comment>137.82.84.xx</Comment>
  13194. <Link1>http://www.worio.com/</Link1>
  13195. <Link2>http://www.archive.org/</Link2>
  13196. </user-agent>
  13197. <user-agent>
  13198. <ID>id_moz_190607_1</ID>
  13199. <String>Mozilla/5.0 (compatible; heritrix/1.7.0 +http://www.greaterera.com/)</String>
  13200. <Description>greaterera.com website collection project using Heritrix</Description>
  13201. <Type>R</Type>
  13202. <Comment>63.209.222.</Comment>
  13203. <Link1>http://www.greaterera.com/</Link1>
  13204. <Link2></Link2>
  13205. </user-agent>
  13206. <user-agent>
  13207. <ID>id_moz_230307_1</ID>
  13208. <String>Mozilla/5.0 (compatible; Heritrix/1.8.0 http://www.hanzoarchives.com)</String>
  13209. <Description>hanzo:web social web archiving service</Description>
  13210. <Type>D</Type>
  13211. <Comment>216.182.238.</Comment>
  13212. <Link1>http://www.hanzoweb.com/</Link1>
  13213. <Link2></Link2>
  13214. </user-agent>
  13215. <user-agent>
  13216. <ID>id_moz_151106_1</ID>
  13217. <String>Mozilla/5.0 (compatible; heritrix/1.x.x +http://www.accelobot.com)</String>
  13218. <Description>Accelobot - Accelovation Market Discovery software robot</Description>
  13219. <Type>R</Type>
  13220. <Comment>72.20.99.xx</Comment>
  13221. <Link1>http://www.accelobot.com/</Link1>
  13222. <Link2>http://www.accelovation.com/solutions.html</Link2>
  13223. </user-agent>
  13224. <user-agent>
  13225. <ID>id_moz_030208_1</ID>
  13226. <String>Mozilla/5.0 (compatible; heritrix/2.0.0-RC1 +http://www.aol.com)</String>
  13227. <Description>Unknown AOL robot using Heritrix</Description>
  13228. <Type>R</Type>
  13229. <Comment>64.236.128.x</Comment>
  13230. <Link1>http://www.aol.com/</Link1>
  13231. <Link2></Link2>
  13232. </user-agent>
  13233. <user-agent>
  13234. <ID>id_moz_051207_2</ID>
  13235. <String>Mozilla/5.0 (compatible; Hermit Search. Com; +http://www.hermitsearch.com)</String>
  13236. <Description>Hermits Search.com - Products and service search robot</Description>
  13237. <Type>R</Type>
  13238. <Comment>72.55.165.11x</Comment>
  13239. <Link1>http://www.hermitsearch.com/</Link1>
  13240. <Link2></Link2>
  13241. </user-agent>
  13242. <user-agent>
  13243. <ID>id_moz_161006_2</ID>
  13244. <String>Mozilla/5.0 (compatible; http://www.IsMySiteUp.Net/bot/ )</String>
  13245. <Description>IsMySiteUp? - Online website monitoring service</Description>
  13246. <Type>C</Type>
  13247. <Comment>142.179.247.xx</Comment>
  13248. <Link1>http://www.ismysiteup.net/</Link1>
  13249. <Link2></Link2>
  13250. </user-agent>
  13251. <user-agent>
  13252. <ID>id_moz_101106_2</ID>
  13253. <String>Mozilla/5.0 (compatible; http://www.UptimeAuditor.com/bot/ )</String>
  13254. <Description>UptimeAuditor - real time web monitoring</Description>
  13255. <Type>C</Type>
  13256. <Comment>142.179.247.xx</Comment>
  13257. <Link1>http://www.uptimeauditor.com/</Link1>
  13258. <Link2></Link2>
  13259. </user-agent>
  13260. <user-agent>
  13261. <ID>id_moz_180508_1</ID>
  13262. <String>Mozilla/5.0 (compatible; HyperixScoop/1.3; +http://www.hyperix.com)</String>
  13263. <Description>Hyperix vertical search crawler</Description>
  13264. <Type>R</Type>
  13265. <Comment>64.40.113.[x]xx</Comment>
  13266. <Link1>http://www.hyperix.com/</Link1>
  13267. <Link2></Link2>
  13268. </user-agent>
  13269. <user-agent>
  13270. <ID>id_moz_070406_1</ID>
  13271. <String>Mozilla/5.0 (compatible; iaskspider/1.0; MSIE 6.0)</String>
  13272. <Description>Unknown robot (reads robots.txt) from chinatelecom (219.142.78.xx)</Description>
  13273. <Type></Type>
  13274. <Comment>Not from iask.com.cn - s. also iaskspider</Comment>
  13275. <Link1></Link1>
  13276. <Link2></Link2>
  13277. </user-agent>
  13278. <user-agent>
  13279. <ID>id_moz_280607_1</ID>
  13280. <String>Mozilla/5.0 (compatible; IDBot/1.0; +http://www.id-search.org/bot.html)</String>
  13281. <Description>ID-Search.org - Russian search project</Description>
  13282. <Type>R</Type>
  13283. <Comment>67.159.44.2xx</Comment>
  13284. <Link1>http://id-search.org/bot.html</Link1>
  13285. <Link2></Link2>
  13286. </user-agent>
  13287. <user-agent>
  13288. <ID>id_moz_962</ID>
  13289. <String>Mozilla/5.0 (compatible; InterseekWeb/3.x)</String>
  13290. <Description>Najdi.si (Slovenia) search using Interseek/Web Interseek/API Search Engine</Description>
  13291. <Type>R</Type>
  13292. <Comment></Comment>
  13293. <Link1>http://www.najdi.si/pomoc/eng/index.jsp</Link1>
  13294. <Link2></Link2>
  13295. </user-agent>
  13296. <user-agent>
  13297. <ID>id_moz_130807_4</ID>
  13298. <String>Mozilla/5.0 (compatible; Jim +http://www.hanzoarchives.com)</String>
  13299. <Description>hanzo:web social web archiving service</Description>
  13300. <Type>D</Type>
  13301. <Comment>216.182.238.</Comment>
  13302. <Link1>http://www.hanzoweb.com/</Link1>
  13303. <Link2></Link2>
  13304. </user-agent>
  13305. <user-agent>
  13306. <ID>id_moz_963</ID>
  13307. <String>Mozilla/5.0 (compatible; Konqueror/2.0.1; X11); Supports MD5-Digest; Supports gzip encoding</String>
  13308. <Description>Konqueror 2.0.x X11</Description>
  13309. <Type>B</Type>
  13310. <Comment></Comment>
  13311. <Link1>http://www.konqueror.org/</Link1>
  13312. <Link2></Link2>
  13313. </user-agent>
  13314. <user-agent>
  13315. <ID>id_moz_964</ID>
  13316. <String>Mozilla/5.0 (compatible; Konqueror/2.1.1; X11)</String>
  13317. <Description>Konqueror 2.1.x X11</Description>
  13318. <Type>B</Type>
  13319. <Comment></Comment>
  13320. <Link1>http://www.konqueror.org/</Link1>
  13321. <Link2></Link2>
  13322. </user-agent>
  13323. <user-agent>
  13324. <ID>id_moz_966</ID>
  13325. <String>Mozilla/5.0 (compatible; Konqueror/2.2.2)</String>
  13326. <Description>Konqueror 2.2.x</Description>
  13327. <Type>B</Type>
  13328. <Comment></Comment>
  13329. <Link1>http://www.konqueror.org/</Link1>
  13330. <Link2></Link2>
  13331. </user-agent>
  13332. <user-agent>
  13333. <ID>id_moz_965</ID>
  13334. <String>Mozilla/5.0 (compatible; Konqueror/2.2.2; Linux 2.4.14-xfs; X11; i686)</String>
  13335. <Description>Konqueror 2.2.x Linux</Description>
  13336. <Type>B</Type>
  13337. <Comment></Comment>
  13338. <Link1>http://www.konqueror.org/</Link1>
  13339. <Link2></Link2>
  13340. </user-agent>
  13341. <user-agent>
  13342. <ID>id_moz_050108_2</ID>
  13343. <String>Mozilla/5.0 (compatible; Konqueror/3.5; Linux) KHTML/3.5.5 (like Gecko) (Exabot-Thumbnails)</String>
  13344. <Description>Exalead (France) search robot (193.47.80.xx)</Description>
  13345. <Type>R</Type>
  13346. <Comment>s. Harvest-NG/1.0.2 and Exalead NG...</Comment>
  13347. <Link1>http://www.exabot.com/</Link1>
  13348. <Link2></Link2>
  13349. </user-agent>
  13350. <user-agent>
  13351. <ID>id_moz_967</ID>
  13352. <String>Mozilla/5.0 (compatible; LemSpider 0.1)</String>
  13353. <Description>Lemur Consulting LemIR spider</Description>
  13354. <Type>R</Type>
  13355. <Comment></Comment>
  13356. <Link1>http://www.lemurconsulting.com</Link1>
  13357. <Link2></Link2>
  13358. </user-agent>
  13359. <user-agent>
  13360. <ID>id_moz_968</ID>
  13361. <String>Mozilla/5.0 (compatible; LinksManager.com_bot http://linksmanager.com/linkchecker.html)</String>
  13362. <Description>Linksmanager.com online link checking service</Description>
  13363. <Type>C</Type>
  13364. <Comment>s.also LinksManager.com</Comment>
  13365. <Link1>http://www.linksmanager.com</Link1>
  13366. <Link2></Link2>
  13367. </user-agent>
  13368. <user-agent>
  13369. <ID>id_moz_140408_2</ID>
  13370. <String>Mozilla/5.0 (compatible; LinkStash Bookmark Manager; http://www.xrayz.co.uk/)</String>
  13371. <Description>LinkStash Bookmark Manager</Description>
  13372. <Type>C</Type>
  13373. <Comment></Comment>
  13374. <Link1>http://www.xrayz.co.uk/</Link1>
  13375. <Link2></Link2>
  13376. </user-agent>
  13377. <user-agent>
  13378. <ID>id_moz_060706_2</ID>
  13379. <String>Mozilla/5.0 (compatible; MojeekBot/2.0; http://www.mojeek.com/bot.html)</String>
  13380. <Description>Mojeek Search Preview robot (217.155.205.xx)</Description>
  13381. <Type>R</Type>
  13382. <Comment>s. also MojeekBot/0.x</Comment>
  13383. <Link1>http://www.mojeek.com</Link1>
  13384. <Link2></Link2>
  13385. </user-agent>
  13386. <user-agent>
  13387. <ID>id_moz_290107_1</ID>
  13388. <String>Mozilla/5.0 (compatible; MOSBookmarks/v2.6-Plus; Link Checker)</String>
  13389. <Description>Joomla!/Mambo component - MosBookmarks (bot) link checking</Description>
  13390. <Type>C</Type>
  13391. <Comment></Comment>
  13392. <Link1>http://www.tegdesign.ch/</Link1>
  13393. <Link2></Link2>
  13394. </user-agent>
  13395. <user-agent>
  13396. <ID>id_moz_091007_1</ID>
  13397. <String>Mozilla/5.0 (compatible; MSIE 6.0; Podtech Network; crawler_admin@podtech.net)</String>
  13398. <Description>PodTech entertainment and video network crawler</Description>
  13399. <Type>R</Type>
  13400. <Comment>71.134.235.xx</Comment>
  13401. <Link1>http://www.podtech.net/home/</Link1>
  13402. <Link2></Link2>
  13403. </user-agent>
  13404. <user-agent>
  13405. <ID>id_moz_969</ID>
  13406. <String>Mozilla/5.0 (compatible; OnetSzukaj/5.0; http://szukaj.onet.pl)</String>
  13407. <Description>onet.pl Szukaj (Search) robot (213.180.128.1xx)</Description>
  13408. <Type>R</Type>
  13409. <Comment>s. also - Onet.pl SA</Comment>
  13410. <Link1>http://szukaj.onet.pl</Link1>
  13411. <Link2></Link2>
  13412. </user-agent>
  13413. <user-agent>
  13414. <ID>id_moz_181207_1</ID>
  13415. <String>Mozilla/5.0 (compatible; PagestackerBot; http://www.pagestacker.com)</String>
  13416. <Description>Pagestacker online bookmark service</Description>
  13417. <Type>C</Type>
  13418. <Comment>70.85.129.12x</Comment>
  13419. <Link1>http://www.pagestacker.com/</Link1>
  13420. <Link2></Link2>
  13421. </user-agent>
  13422. <user-agent>
  13423. <ID>id_moz_020307_1</ID>
  13424. <String>Mozilla/5.0 (compatible; PalmeraBot; http://www.links24h.com/help/palmera) Version 0.001</String>
  13425. <Description>PalmeraBot - Links24h.com search engine robot</Description>
  13426. <Type>R</Type>
  13427. <Comment>80.59.111.2xx</Comment>
  13428. <Link1>http://www.links24h.com/</Link1>
  13429. <Link2>http://www.links24h.com/help/palmera/</Link2>
  13430. </user-agent>
  13431. <user-agent>
  13432. <ID>id_moz_130806_1</ID>
  13433. <String>Mozilla/5.0 (compatible; PEAR HTTP_Request class; http://feed.moo.jp/)</String>
  13434. <Description>FeedMo feed search (Japan) using Pear HTTP</Description>
  13435. <Type>C ?</Type>
  13436. <Comment>210.188.205.2xx</Comment>
  13437. <Link1>http://feed.moo.jp/</Link1>
  13438. <Link2>http://pear.php.net/</Link2>
  13439. </user-agent>
  13440. <user-agent>
  13441. <ID>id_moz_190607_2</ID>
  13442. <String>Mozilla/5.0 (compatible; Phonifier; +http://www.phonifier.com)</String>
  13443. <Description>PHONifier mobile access to web content</Description>
  13444. <Type>D B</Type>
  13445. <Comment></Comment>
  13446. <Link1>http://www.phonifier.com/</Link1>
  13447. <Link2></Link2>
  13448. </user-agent>
  13449. <user-agent>
  13450. <ID>id_moz_240208_2</ID>
  13451. <String>Mozilla/5.0 (compatible; pmoz.info ODP link checker; +http://pmoz.info/doc/botinfo.htm)</String>
  13452. <Description>pmoz.info ODP link checking bot</Description>
  13453. <Type>C</Type>
  13454. <Comment>74.208.25.118 / 216.15.74.85</Comment>
  13455. <Link1>http://pmoz.info/doc/botinfo.htm</Link1>
  13456. <Link2>http://www.dmoz.org/</Link2>
  13457. </user-agent>
  13458. <user-agent>
  13459. <ID>id_moz_970</ID>
  13460. <String>Mozilla/5.0 (compatible; pogodak.ba/3.x)</String>
  13461. <Description>Pogodak search (Slovenia) robot via Interseek</Description>
  13462. <Type>R</Type>
  13463. <Comment>89.143.229.1xx</Comment>
  13464. <Link1>http://www.pogodak.hr</Link1>
  13465. <Link2>http://www.interseek.com/</Link2>
  13466. </user-agent>
  13467. <user-agent>
  13468. <ID>id_moz_100408_2</ID>
  13469. <String>Mozilla/5.0 (compatible; Pogodak.hr/3.1)</String>
  13470. <Description>Pogodak search (Slovenia) robot via Interseek</Description>
  13471. <Type>R</Type>
  13472. <Comment>89.143.229.1xx</Comment>
  13473. <Link1>http://www.pogodak.hr</Link1>
  13474. <Link2>http://www.interseek.com/</Link2>
  13475. </user-agent>
  13476. <user-agent>
  13477. <ID>id_moz_101107_1</ID>
  13478. <String>Mozilla/5.0 (compatible; Proximic crawler; +http://www.proximic.com/en/about-us/contact-us.html)</String>
  13479. <Description>Proximic Publisher Widget - RSS and news content generator</Description>
  13480. <Type>C</Type>
  13481. <Comment></Comment>
  13482. <Link1>http://www.proximic.com/</Link1>
  13483. <Link2></Link2>
  13484. </user-agent>
  13485. <user-agent>
  13486. <ID>id_moz_230907_1</ID>
  13487. <String>Mozilla/5.0 (compatible; PWeBot/3.1; http://www.programacionweb.net/robot.php)</String>
  13488. <Description>ProgramacionWeb.net PWeBot crawler (Argentina)</Description>
  13489. <Type>R</Type>
  13490. <Comment>62.149.236.2xx</Comment>
  13491. <Link1>http://www.programacionweb.net/robot-en.php</Link1>
  13492. <Link2>http://www.programacionweb.net/</Link2>
  13493. </user-agent>
  13494. <user-agent>
  13495. <ID>id_moz_130507_1</ID>
  13496. <String>Mozilla/5.0 (compatible; Quantcastbot/1.0; www.quantcast.com)</String>
  13497. <Description>Quantcast - Open Internet Ratings Service</Description>
  13498. <Type>R</Type>
  13499. <Comment></Comment>
  13500. <Link1>http://www.quantcast.com/</Link1>
  13501. <Link2></Link2>
  13502. </user-agent>
  13503. <user-agent>
  13504. <ID>id_moz_190706_1</ID>
  13505. <String>Mozilla/5.0 (compatible; robtexbot/1.0; http://www.robtex.com/ )</String>
  13506. <Description>robtex - Multi-RBL check and AS-numbercheck</Description>
  13507. <Type>C</Type>
  13508. <Comment></Comment>
  13509. <Link1>http://www.robtex.com/</Link1>
  13510. <Link2></Link2>
  13511. </user-agent>
  13512. <user-agent>
  13513. <ID>id_moz_050408_1</ID>
  13514. <String>Mozilla/5.0 (compatible; ScoutJet; +http://www.scoutjet.com/)</String>
  13515. <Description>ScoutJet (Blekko) search web crawler</Description>
  13516. <Type>R</Type>
  13517. <Comment></Comment>
  13518. <Link1>http://www.scoutjet.com/</Link1>
  13519. <Link2></Link2>
  13520. </user-agent>
  13521. <user-agent>
  13522. <ID>id_moz_300106_3</ID>
  13523. <String>Mozilla/5.0 (compatible; Scrubby/2.2;  http://www.scrubtheweb.com/)</String>
  13524. <Description>Scrub the web robot (66.93.156.xx)</Description>
  13525. <Type>R</Type>
  13526. <Comment>s.also Scrubby/2.x </Comment>
  13527. <Link1>http://www.scrubtheweb.com/</Link1>
  13528. <Link2></Link2>
  13529. </user-agent>
  13530. <user-agent>
  13531. <ID>id_moz_031107_4</ID>
  13532. <String>Mozilla/5.0 (compatible; ShunixBot/1.x.x +http://www.shunix.com/robot.htm)</String>
  13533. <Description>Shunixbot (France) beta / test semantic web indexing robot</Description>
  13534. <Type>R</Type>
  13535. <Comment></Comment>
  13536. <Link1>http://www.shunix.com/</Link1>
  13537. <Link2></Link2>
  13538. </user-agent>
  13539. <user-agent>
  13540. <ID>id_moz_971</ID>
  13541. <String>Mozilla/5.0 (compatible; ShunixBot/1.x; http://www.shunix.com/bot.htm)</String>
  13542. <Description>Shunixbot (France) beta / test semantic web indexing robot</Description>
  13543. <Type>R</Type>
  13544. <Comment></Comment>
  13545. <Link1>http://www.shunix.com/</Link1>
  13546. <Link2></Link2>
  13547. </user-agent>
  13548. <user-agent>
  13549. <ID>id_moz_280607_2</ID>
  13550. <String>Mozilla/5.0 (compatible; SkreemRBot +http://skreemr.com)</String>
  13551. <Description>Skreemr - Audio search engine</Description>
  13552. <Type>R</Type>
  13553. <Comment>64.15.69.x</Comment>
  13554. <Link1>http://skreemr.com/</Link1>
  13555. <Link2></Link2>
  13556. </user-agent>
  13557. <user-agent>
  13558. <ID>id_moz_070207_2</ID>
  13559. <String>Mozilla/5.0 (compatible; SnapPreviewBot; en-US; rv:1.8.0.9) Gecko/20061206 Firefox/1.5.0.9</String>
  13560. <Description>Snap Firefox Search Plugin</Description>
  13561. <Type>B</Type>
  13562. <Comment></Comment>
  13563. <Link1>http://www.snap.com/about/spa1A.php</Link1>
  13564. <Link2></Link2>
  13565. </user-agent>
  13566. <user-agent>
  13567. <ID>id_moz_972</ID>
  13568. <String>Mozilla/5.0 (compatible; SpurlBot/0.2) </String>
  13569. <Description>Spurl.net bookmark service &amp; search engine (84.40.30.xxx)</Description>
  13570. <Type>R C</Type>
  13571. <Comment></Comment>
  13572. <Link1>http://www.spurl.net</Link1>
  13573. <Link2></Link2>
  13574. </user-agent>
  13575. <user-agent>
  13576. <ID>id_moz_190108_1</ID>
  13577. <String>Mozilla/5.0 (compatible; SummizeBot +http://www.summize.com)</String>
  13578. <Description>Summize - Opinion and review search robot</Description>
  13579. <Type>R</Type>
  13580. <Comment>208.79.17.x[x]</Comment>
  13581. <Link1>http://www.summize.com/</Link1>
  13582. <Link2></Link2>
  13583. </user-agent>
  13584. <user-agent>
  13585. <ID>id_moz_973</ID>
  13586. <String>Mozilla/5.0 (compatible; SYCLIKControl/LinkChecker;)</String>
  13587. <Description>Syclik Control web content management system</Description>
  13588. <Type>R C</Type>
  13589. <Comment></Comment>
  13590. <Link1>http://www.syclik.com</Link1>
  13591. <Link2></Link2>
  13592. </user-agent>
  13593. <user-agent>
  13594. <ID>id_moz_070607_1</ID>
  13595. <String>Mozilla/5.0 (compatible; Synoobot/0.9; http://www.synoo.com/search/bot.html)</String>
  13596. <Description>Synoo web directory robot</Description>
  13597. <Type>R</Type>
  13598. <Comment>212.12.114.2xx</Comment>
  13599. <Link1>http://www.synoo.com/search/bot.html</Link1>
  13600. <Link2></Link2>
  13601. </user-agent>
  13602. <user-agent>
  13603. <ID>id_moz_261105_1</ID>
  13604. <String>Mozilla/5.0 (compatible; Theophrastus/x.x; http://users.cs.cf.ac.uk/N.A.Smith/theophrastus.php)</String>
  13605. <Description>Theophrastus Internet Spider for a basic search engine project</Description>
  13606. <Type>R</Type>
  13607. <Comment></Comment>
  13608. <Link1>http://users.cs.cf.ac.uk/N.A.Smith/theophrastus.php</Link1>
  13609. <Link2></Link2>
  13610. </user-agent>
  13611. <user-agent>
  13612. <ID>id_moz_030207_2</ID>
  13613. <String>Mozilla/5.0 (compatible; TridentSpider/3.1)</String>
  13614. <Description>Interseek - Java search engine technology used for Pogodak search</Description>
  13615. <Type>R</Type>
  13616. <Comment>213.253.92.x</Comment>
  13617. <Link1>http://www.interseek.com/</Link1>
  13618. <Link2>http://www.pogodak.com/</Link2>
  13619. </user-agent>
  13620. <user-agent>
  13621. <ID>id_moz_974</ID>
  13622. <String>Mozilla/5.0 (compatible; Vagabondo/2.1; webcrawler at wise-guys dot nl; http://webagent.wise-guys.nl/)</String>
  13623. <Description>WiseGuys robot</Description>
  13624. <Type>R</Type>
  13625. <Comment>s.also - Mozilla/3.0 (Vagabondo... - Vagabondo..</Comment>
  13626. <Link1>http://www.wise-guys.nl/Contact/index.php?botselected=webagents&amp;lang=uk</Link1>
  13627. <Link2></Link2>
  13628. </user-agent>
  13629. <user-agent>
  13630. <ID>id_moz_280209_4</ID>
  13631. <String>Mozilla/5.0 (compatible; Webduniabot/1.0; +http://search.webdunia.com/bot.aspx)</String>
  13632. <Description>Webdunia search (India) robot</Description>
  13633. <Type>R</Type>
  13634. <Comment></Comment>
  13635. <Link1>http://www.webdunia.com/</Link1>
  13636. <Link2></Link2>
  13637. </user-agent>
  13638. <user-agent>
  13639. <ID>id_moz_151205_1</ID>
  13640. <String>Mozilla/5.0 (compatible; Windows NT 5.0; phpwebbrainBot/0.1 - http://www.monsterli.ch/phpwebbrain/)</String>
  13641. <Description>phpwebbrain online bookmark service (Germany)</Description>
  13642. <Type>C</Type>
  13643. <Comment></Comment>
  13644. <Link1>http://www.monsterli.ch/phpwebbrain/</Link1>
  13645. <Link2></Link2>
  13646. </user-agent>
  13647. <user-agent>
  13648. <ID>id_moz_150307_1</ID>
  13649. <String>Mozilla/5.0 (compatible; worio bot heritrix/1.10.0 +http://worio.com)</String>
  13650. <Description>WORIO (beta) search for computer scientists and programmers using Heritrix open-source crawler</Description>
  13651. <Type>R</Type>
  13652. <Comment>137.82.84.xx</Comment>
  13653. <Link1>http://www.worio.com/</Link1>
  13654. <Link2>http://www.archive.org/</Link2>
  13655. </user-agent>
  13656. <user-agent>
  13657. <ID>id_moz_221008_1</ID>
  13658. <String>Mozilla/5.0 (compatible; WoW Lemmings Kathune/2.0;http://www.wowlemmings.com/kathune.html)</String>
  13659. <Description>Kathune spider for World of Warcraft guild data. Used to power WoW Lemmings</Description>
  13660. <Type>R</Type>
  13661. <Comment>76.12.83.24x</Comment>
  13662. <Link1>http://www.wowlemmings.com/kathune.html</Link1>
  13663. <Link2>http://www.wowlemmings.com/</Link2>
  13664. </user-agent>
  13665. <user-agent>
  13666. <ID>id_moz_260407_1</ID>
  13667. <String>Mozilla/5.0 (compatible; XTbot/1.0v; +http://www.externaltest.com)</String>
  13668. <Description>eXternalTest - Server and online services monitoring</Description>
  13669. <Type>C</Type>
  13670. <Comment></Comment>
  13671. <Link1>http://www.externaltest.com/</Link1>
  13672. <Link2></Link2>
  13673. </user-agent>
  13674. <user-agent>
  13675. <ID>id_moz_290606_2</ID>
  13676. <String>Mozilla/5.0 (compatible; Yahoo! DE Slurp; http://help.yahoo.com/help/us/ysearch/slurp)</String>
  13677. <Description>Yahoo / Inktomi search robot</Description>
  13678. <Type>R</Type>
  13679. <Comment>66.196.77.1xx / 72.30.98.2xx</Comment>
  13680. <Link1></Link1>
  13681. <Link2></Link2>
  13682. </user-agent>
  13683. <user-agent>
  13684. <ID>id_moz_181105_1</ID>
  13685. <String>Mozilla/5.0 (compatible; Yahoo! Slurp China; http://misc.yahoo.com.cn/help.html)</String>
  13686. <Description>Inktomi robot (202.160.180.xxx) for Yahoo China</Description>
  13687. <Type>R</Type>
  13688. <Comment></Comment>
  13689. <Link1>http://www.yahoo.com.cn/</Link1>
  13690. <Link2>http://www.inktomi.com/</Link2>
  13691. </user-agent>
  13692. <user-agent>
  13693. <ID>id_moz_975</ID>
  13694. <String>Mozilla/5.0 (compatible; Yahoo! Slurp; http://help.yahoo.com/help/us/ysearch/slurp)</String>
  13695. <Description>Inktomi robot for Yahoo (via 66.196.xx.xxx)</Description>
  13696. <Type>R</Type>
  13697. <Comment></Comment>
  13698. <Link1>http://www.inktomi.com</Link1>
  13699. <Link2></Link2>
  13700. </user-agent>
  13701. <user-agent>
  13702. <ID>id_moz_061208_2</ID>
  13703. <String>Mozilla/5.0 (compatible; YesupBot/1.0; +http://www.yesup.net/bot.html)</String>
  13704. <Description>Yesup Seo - Toronto SEO Service</Description>
  13705. <Type>C</Type>
  13706. <Comment>66.48.78.1xx</Comment>
  13707. <Link1>http://yesupseo.com/</Link1>
  13708. <Link2></Link2>
  13709. </user-agent>
  13710. <user-agent>
  13711. <ID>id_moz_250107_1</ID>
  13712. <String>Mozilla/5.0 (compatible; Yoono; http://www.yoono.com/)</String>
  13713. <Description>Yoono - community based search (193.110.140.xxx / 194.0.179.[x]xx)</Description>
  13714. <Type>R</Type>
  13715. <Comment>s. also yoono/1.0 web-crawler - yoofind/yoofind ..</Comment>
  13716. <Link1>http://www.yoono.com/</Link1>
  13717. <Link2></Link2>
  13718. </user-agent>
  13719. <user-agent>
  13720. <ID>id_moz_061208_3</ID>
  13721. <String>Mozilla/5.0 (compatible; YoudaoBot/1.0; http://www.youdao.com/help/webmaster/spider/; )</String>
  13722. <Description>Youdao search (China) robot</Description>
  13723. <Type>R</Type>
  13724. <Comment>202.108.7.1xx</Comment>
  13725. <Link1>http://www.youdao.com/</Link1>
  13726. <Link2></Link2>
  13727. </user-agent>
  13728. <user-agent>
  13729. <ID>id_moz_050807_1</ID>
  13730. <String>Mozilla/5.0 (compatible; Zenbot/1.3; +http://zen.co.za/webmasters/)</String>
  13731. <Description>Zenbot robot for the Southern African Zen search service</Description>
  13732. <Type>R</Type>
  13733. <Comment>196.46.116.x[x] / 196.23.180.x[x]</Comment>
  13734. <Link1>http://zen.co.za/</Link1>
  13735. <Link2>http://zen.co.za/webmasters/</Link2>
  13736. </user-agent>
  13737. <user-agent>
  13738. <ID>id_moz_110408_1</ID>
  13739. <String>Mozilla/5.0 (compatible; zermelo +http://www.powerset.com) [email:paul@page-store.com&#44;crawl@powerset.com]</String>
  13740. <Description>Powerset Natural Language Search crawler (under development) using Heritrix via Amazon Web Services</Description>
  13741. <Type>R</Type>
  13742. <Comment>67.202.34.xxx</Comment>
  13743. <Link1>http://www.powerset.com/</Link1>
  13744. <Link2>http://www.amazon.com/gp/browse.html?node=3435361</Link2>
  13745. </user-agent>
  13746. <user-agent>
  13747. <ID>id_moz_030606_1</ID>
  13748. <String>Mozilla/5.0 (compatible;archive.org_bot/1.7.1; collectionId=316; Archive-It; +http://www.archive-it.org)</String>
  13749. <Description>Heritrix - The Internet Archive's open-source crawler (207.241.225.2xx)</Description>
  13750. <Type>R</Type>
  13751. <Comment>s.also - InternetArchive/0.8-dev - archive.org_bot</Comment>
  13752. <Link1>http://www.archive.org/</Link1>
  13753. <Link2></Link2>
  13754. </user-agent>
  13755. <user-agent>
  13756. <ID>id_moz_180906_2</ID>
  13757. <String>Mozilla/5.0 (compatible;archive.org_bot/heritrix-1.9.0-200608171144 +http://pandora.nla.gov.au/crawl.html)</String>
  13758. <Description>Wayback Machine Internet Archive crawler</Description>
  13759. <Type>R</Type>
  13760. <Comment>207.241.233.2xx</Comment>
  13761. <Link1>http://www.archive.org/index.php</Link1>
  13762. <Link2></Link2>
  13763. </user-agent>
  13764. <user-agent>
  13765. <ID>id_moz_180107_1</ID>
  13766. <String>Mozilla/5.0 (compatible;FindITAnswersbot/1.0;+http://search.it-influentials.com/bot.htm)</String>
  13767. <Description>FindITAnswers - Search engine for software developers</Description>
  13768. <Type>B</Type>
  13769. <Comment>74.93.15.249</Comment>
  13770. <Link1>http://www.finditanswers.com/</Link1>
  13771. <Link2></Link2>
  13772. </user-agent>
  13773. <user-agent>
  13774. <ID>id_moz_170906_2</ID>
  13775. <String>Mozilla/5.0 (compatible;MAINSEEK_BOT)</String>
  13776. <Description>Mainseek search (Poland) robot</Description>
  13777. <Type>R</Type>
  13778. <Comment>80.190.213.xx</Comment>
  13779. <Link1>http://www.mainseek.com/</Link1>
  13780. <Link2></Link2>
  13781. </user-agent>
  13782. <user-agent>
  13783. <ID>id_moz_290708_1</ID>
  13784. <String>Mozilla/5.0 (Gecko/20070310 Mozshot/0.0.20070628; http://mozshot.nemui.org/)</String>
  13785. <Description>MozShot - Technical demo to take screenshot of any URL</Description>
  13786. <Type>B</Type>
  13787. <Comment></Comment>
  13788. <Link1>http://mozshot.nemui.org/</Link1>
  13789. <Link2></Link2>
  13790. </user-agent>
  13791. <user-agent>
  13792. <ID>id_moz_150408_2</ID>
  13793. <String>Mozilla/5.0 (Macintosh; U; Intel Mac OS X 10.4; en-US; rv:1.9b5) Gecko/2008032619 Firefox/3.0b5</String>
  13794. <Description>Mozilla Firefox 3.0 beta (Gran Paradiso) for MacOS</Description>
  13795. <Type>B</Type>
  13796. <Comment></Comment>
  13797. <Link1>http://developer.mozilla.org/en/docs/Firefox_3_for_developers</Link1>
  13798. <Link2></Link2>
  13799. </user-agent>
  13800. <user-agent>
  13801. <ID>id_moz_976</ID>
  13802. <String>Mozilla/5.0 (Macintosh; U; PPC Mac OS X Mach-O; en-US; rv:1.0.1) Gecko/20021219 Chimera/0.6 </String>
  13803. <Description>Chimera browser (Mozilla/Gecko engine) - now Camino Mac PowerPC</Description>
  13804. <Type>B</Type>
  13805. <Comment></Comment>
  13806. <Link1>http://www.mozilla.org</Link1>
  13807. <Link2></Link2>
  13808. </user-agent>
  13809. <user-agent>
  13810. <ID>id_moz_977</ID>
  13811. <String>Mozilla/5.0 (Macintosh; U; PPC Mac OS X Mach-O; en-US; rv:1.0.1) Gecko/20030306 Camino/0.7</String>
  13812. <Description>Camino browser (Mozilla/Gecko engine) - ex Chimera Mac PowerPC</Description>
  13813. <Type>B</Type>
  13814. <Comment></Comment>
  13815. <Link1>http://www.mozilla.org</Link1>
  13816. <Link2></Link2>
  13817. </user-agent>
  13818. <user-agent>
  13819. <ID>id_moz_978</ID>
  13820. <String>Mozilla/5.0 (Macintosh; U; PPC Mac OS X; en-US) AppleWebKit/xx (KHTML like Gecko) OmniWeb/v5xx.xx</String>
  13821. <Description>OmniWeb 5.x.x Mac OS X browser</Description>
  13822. <Type>B</Type>
  13823. <Comment></Comment>
  13824. <Link1>http://www.omnigroup.com</Link1>
  13825. <Link2></Link2>
  13826. </user-agent>
  13827. <user-agent>
  13828. <ID>id_moz_979</ID>
  13829. <String>Mozilla/5.0 (Macintosh; U; PPC Mac OS X; en-us) AppleWebKit/xxx.x (KHTML like Gecko) Safari/12x.x</String>
  13830. <Description>Safari 1.2x browser (Mozilla/Gecko engine) MAC OS X</Description>
  13831. <Type>B</Type>
  13832. <Comment></Comment>
  13833. <Link1>http://www.apple.com</Link1>
  13834. <Link2></Link2>
  13835. </user-agent>
  13836. <user-agent>
  13837. <ID>id_moz_980</ID>
  13838. <String>Mozilla/5.0 (Macintosh; U; PPC; en-US; rv:0.9.2) Gecko/20010726 Netscape6/6.1</String>
  13839. <Description>Netscape 6.x Mac PowerPC</Description>
  13840. <Type>B</Type>
  13841. <Comment></Comment>
  13842. <Link1></Link1>
  13843. <Link2></Link2>
  13844. </user-agent>
  13845. <user-agent>
  13846. <ID>id_moz_981</ID>
  13847. <String>Mozilla/5.0 (research@mediatrec.com)</String>
  13848. <Description>unknown robot from gw.ocg-corp.com</Description>
  13849. <Type></Type>
  13850. <Comment></Comment>
  13851. <Link1></Link1>
  13852. <Link2></Link2>
  13853. </user-agent>
  13854. <user-agent>
  13855. <ID>id_moz_260806_1</ID>
  13856. <String>Mozilla/5.0 (Sage)</String>
  13857. <Description>Sage - RSS and Atom feed reader extension for Mozilla Firefox</Description>
  13858. <Type>B</Type>
  13859. <Comment></Comment>
  13860. <Link1>http://sage.mozdev.org/</Link1>
  13861. <Link2></Link2>
  13862. </user-agent>
  13863. <user-agent>
  13864. <ID>id_moz_982</ID>
  13865. <String>Mozilla/5.0 (Slurp/cat; slurp@inktomi.com; http://www.inktomi.com/slurp.html)</String>
  13866. <Description>Inktomi (Hotbot-Lycos - NBCi etc.) robot</Description>
  13867. <Type>R</Type>
  13868. <Comment></Comment>
  13869. <Link1>http://www.inktomi.com</Link1>
  13870. <Link2></Link2>
  13871. </user-agent>
  13872. <user-agent>
  13873. <ID>id_moz_983</ID>
  13874. <String>Mozilla/5.0 (Slurp/si; slurp@inktomi.com; http://www.inktomi.com/slurp.html)</String>
  13875. <Description>Inktomi (Hotbot-Lycos - NBCi etc.) robot</Description>
  13876. <Type>R</Type>
  13877. <Comment></Comment>
  13878. <Link1>http://www.inktomi.com</Link1>
  13879. <Link2></Link2>
  13880. </user-agent>
  13881. <user-agent>
  13882. <ID>id_moz_984</ID>
  13883. <String>Mozilla/5.0 (SunOS 5.8 sun4u; U) Opera 5.0 [en]</String>
  13884. <Description>Opera 5.x SunOS</Description>
  13885. <Type>B</Type>
  13886. <Comment></Comment>
  13887. <Link1></Link1>
  13888. <Link2></Link2>
  13889. </user-agent>
  13890. <user-agent>
  13891. <ID>id_moz_020507_1</ID>
  13892. <String>Mozilla/5.0 (Twiceler-0.9 http://www.cuill.com/twiceler/robot.html)</String>
  13893. <Description>Twiceler experimental web crawler</Description>
  13894. <Type>R</Type>
  13895. <Comment>64.62.136.xxx</Comment>
  13896. <Link1>http://www.cuill.com/</Link1>
  13897. <Link2></Link2>
  13898. </user-agent>
  13899. <user-agent>
  13900. <ID>id_moz_070106_2</ID>
  13901. <String>Mozilla/5.0 (Version: xxxx Type:xx)</String>
  13902. <Description>Some spambot from Romania (82.208.139.1xx &amp; 86.123.65.xx) - Maybe email harvesting</Description>
  13903. <Type>S</Type>
  13904. <Comment>UA sometimes have random letters like: vkfjkgo...</Comment>
  13905. <Link1></Link1>
  13906. <Link2></Link2>
  13907. </user-agent>
  13908. <user-agent>
  13909. <ID>id_moz_985</ID>
  13910. <String>Mozilla/5.0 (wgao@genieknows.com)</String>
  13911. <Description>GenieKnows.com search robot (64.5.245.xx / 64.5.220.xxx)</Description>
  13912. <Type>R</Type>
  13913. <Comment></Comment>
  13914. <Link1>http://www.genieknows.com/</Link1>
  13915. <Link2></Link2>
  13916. </user-agent>
  13917. <user-agent>
  13918. <ID>id_moz_986</ID>
  13919. <String>Mozilla/5.0 (Windows; U; Win98; en-US; rv:0.9.2) Gecko/20010726 Netscape6/6.1</String>
  13920. <Description>Netscape 6.x Win98</Description>
  13921. <Type>B</Type>
  13922. <Comment></Comment>
  13923. <Link1></Link1>
  13924. <Link2></Link2>
  13925. </user-agent>
  13926. <user-agent>
  13927. <ID>id_moz_987</ID>
  13928. <String>Mozilla/5.0 (Windows; U; Win98; en-US; rv:x.xx) Gecko/20030423 Firebird Browser/0.6</String>
  13929. <Description>Firebird browser (Mozilla/Gecko engine) - ex Phoenix Win98</Description>
  13930. <Type>B</Type>
  13931. <Comment></Comment>
  13932. <Link1>http://www.mozilla.org</Link1>
  13933. <Link2></Link2>
  13934. </user-agent>
  13935. <user-agent>
  13936. <ID>id_moz_988</ID>
  13937. <String>Mozilla/5.0 (Windows; U; Win9x; en; Stable) Gecko/20020911 Beonex/0.8.1-stable</String>
  13938. <Description>Beonex Communicator browser (Mozilla/Gecko engine)</Description>
  13939. <Type>B</Type>
  13940. <Comment></Comment>
  13941. <Link1>http://www.beonex.com</Link1>
  13942. <Link2></Link2>
  13943. </user-agent>
  13944. <user-agent>
  13945. <ID>id_moz_111205_1</ID>
  13946. <String>Mozilla/5.0 (Windows; U; Windows NT 5.0; en-US; rv:1.7.7) NimbleCrawler 1.11 obeys UserAgent NimbleCrawler For problems contact: crawler_at_dataalchemy.com</String>
  13947. <Description>Healthline health related search robot (72.5.115.xx)</Description>
  13948. <Type>R</Type>
  13949. <Comment></Comment>
  13950. <Link1>http://www.healthline.com/</Link1>
  13951. <Link2></Link2>
  13952. </user-agent>
  13953. <user-agent>
  13954. <ID>id_moz_171008_2</ID>
  13955. <String>Mozilla/5.0 (Windows; U; Windows NT 5.1; en-US) AppleWebKit/525.19 (KHTML&#44; like Gecko) Chrome/0.2.153.1 Safari/525.19</String>
  13956. <Description>Google Chrome browser based on WebKit (Safari)</Description>
  13957. <Type>B</Type>
  13958. <Comment></Comment>
  13959. <Link1>http://www.google.com/chrome</Link1>
  13960. <Link2></Link2>
  13961. </user-agent>
  13962. <user-agent>
  13963. <ID>id_moz_170207_1</ID>
  13964. <String>Mozilla/5.0 (Windows; U; Windows NT 5.1; en-US; rv:1.8.0.5) Gecko/20060731 Firefox/1.5.0.5 Flock/0.7.4.1</String>
  13965. <Description>Flock web browser built on Mozilla technologies</Description>
  13966. <Type>B</Type>
  13967. <Comment></Comment>
  13968. <Link1>http://www.flock.com/</Link1>
  13969. <Link2></Link2>
  13970. </user-agent>
  13971. <user-agent>
  13972. <ID>id_moz_190108_3</ID>
  13973. <String>Mozilla/5.0 (Windows; U; Windows NT 5.1; en-US; rv:1.8.1.11) Gecko/20071127 Firefox/2.0.0.4/Megaupload x.0</String>
  13974. <Description>Megaupload Mega Manager - Download manager plugin for Firefox</Description>
  13975. <Type>D</Type>
  13976. <Comment></Comment>
  13977. <Link1>http://www.megaupload.com/manager/de/</Link1>
  13978. <Link2></Link2>
  13979. </user-agent>
  13980. <user-agent>
  13981. <ID>id_moz_171008_1</ID>
  13982. <String>Mozilla/5.0 (Windows; U; Windows NT 5.1; en-US; rv:1.9.0.1) Gecko/2008092215 Firefox/3.0.1 Orca/1.1 beta 3</String>
  13983. <Description>Orca browser - based on Gecko</Description>
  13984. <Type>B</Type>
  13985. <Comment></Comment>
  13986. <Link1>http://www.orcabrowser.com</Link1>
  13987. <Link2></Link2>
  13988. </user-agent>
  13989. <user-agent>
  13990. <ID>id_moz_989</ID>
  13991. <String>Mozilla/5.0 (Windows; U; Windows NT 5.1; en-US; rv:x.x.x) Gecko/20041107 Firefox/x.x</String>
  13992. <Description>Firefox browser (Mozilla/Gecko engine) - ex Firebird WinXP</Description>
  13993. <Type>B</Type>
  13994. <Comment></Comment>
  13995. <Link1>http://www.mozilla.org</Link1>
  13996. <Link2></Link2>
  13997. </user-agent>
  13998. <user-agent>
  13999. <ID>id_moz_990</ID>
  14000. <String>Mozilla/5.0 (Windows; U; Windows NT 5.1; en-US; rv:x.xx) Gecko/20030504 Mozilla Firebird/0.6</String>
  14001. <Description>Firebird browser (Mozilla/Gecko engine) - ex Phoenix WinXP</Description>
  14002. <Type>B</Type>
  14003. <Comment></Comment>
  14004. <Link1>http://www.mozilla.org</Link1>
  14005. <Link2></Link2>
  14006. </user-agent>
  14007. <user-agent>
  14008. <ID>id_moz_991</ID>
  14009. <String>Mozilla/5.0 (Windows; U; Windows NT 5.1; en-US; rv:x.xxx) Gecko/20041027 Mnenhy/0.6.0.104</String>
  14010. <Description>Mnenhy - enhanced mail &amp; news Mozilla based browser</Description>
  14011. <Type>B</Type>
  14012. <Comment></Comment>
  14013. <Link1>http://mnenhy.mozdev.org/index-de.html</Link1>
  14014. <Link2></Link2>
  14015. </user-agent>
  14016. <user-agent>
  14017. <ID>id_moz_060508_2</ID>
  14018. <String>Mozilla/5.0 (Windows; U; Windows NT 5.1; fr; rv:1.8.1) VoilaBot BETA 1.2 (support.voilabot@orange-ftgroup.com)</String>
  14019. <Description>Voila.fr robot</Description>
  14020. <Type>R</Type>
  14021. <Comment></Comment>
  14022. <Link1>http://www.voila.fr</Link1>
  14023. <Link2></Link2>
  14024. </user-agent>
  14025. <user-agent>
  14026. <ID>id_moz_080608_2</ID>
  14027. <String>Mozilla/5.0 (Windows; U; Windows NT 5.1; fr; rv:1.8.1) VoilaBot BETA 1.2 (support.voilabot@orange-ftgroup.com)</String>
  14028. <Description>Voila.fr robot</Description>
  14029. <Type>R</Type>
  14030. <Comment></Comment>
  14031. <Link1>http://www.voila.fr</Link1>
  14032. <Link2></Link2>
  14033. </user-agent>
  14034. <user-agent>
  14035. <ID>id_moz_150408_3</ID>
  14036. <String>Mozilla/5.0 (Windows; U; Windows NT 6.0; en-US; rv:1.9b5) Gecko/2008032620 Firefox/3.0b5</String>
  14037. <Description>Mozilla Firefox 3.0 beta (Gran Paradiso) for Win</Description>
  14038. <Type>B</Type>
  14039. <Comment></Comment>
  14040. <Link1>http://developer.mozilla.org/en/docs/Firefox_3_for_developers</Link1>
  14041. <Link2></Link2>
  14042. </user-agent>
  14043. <user-agent>
  14044. <ID>id_moz_300407_2</ID>
  14045. <String>Mozilla/5.0 (Windows; U;XMPP Tiscali Communicator v.10.0.1; Windows NT 5.1; it; rv:1.8.1.3) Gecko/20070309 Firefox/2.0.0.3</String>
  14046. <Description>Tiscali Communicator - Online services suite</Description>
  14047. <Type>B</Type>
  14048. <Comment></Comment>
  14049. <Link1>http://im.tiscali.com/index.html</Link1>
  14050. <Link2></Link2>
  14051. </user-agent>
  14052. <user-agent>
  14053. <ID>id_moz_300106_1</ID>
  14054. <String>Mozilla/5.0 (Windows;) NimbleCrawler 1.12 obeys UserAgent NimbleCrawler For problems contact: crawler@health</String>
  14055. <Description>Healthline health related search robot (72.5.115.xx)</Description>
  14056. <Type>R</Type>
  14057. <Comment></Comment>
  14058. <Link1>http://www.healthline.com/</Link1>
  14059. <Link2></Link2>
  14060. </user-agent>
  14061. <user-agent>
  14062. <ID>id_moz_161205_2</ID>
  14063. <String>Mozilla/5.0 (Windows;) NimbleCrawler 1.12 obeys UserAgent NimbleCrawler For problems contact: crawler@healthline.com</String>
  14064. <Description>Healthline health related search robot (72.5.115.xx)</Description>
  14065. <Type>R</Type>
  14066. <Comment></Comment>
  14067. <Link1>http://www.healthline.com/</Link1>
  14068. <Link2></Link2>
  14069. </user-agent>
  14070. <user-agent>
  14071. <ID>id_moz_090807_2</ID>
  14072. <String>Mozilla/5.0 (X11; Linux i686; U;rv: 1.7.13) Gecko/20070322 Kazehakase/0.4.4.1</String>
  14073. <Description>Kazehakase - Gecko based browser (Japan)</Description>
  14074. <Type>B</Type>
  14075. <Comment></Comment>
  14076. <Link1>http://kazehakase.sourceforge.jp/</Link1>
  14077. <Link2></Link2>
  14078. </user-agent>
  14079. <user-agent>
  14080. <ID>id_moz_992</ID>
  14081. <String>Mozilla/5.0 (X11; U; Linux 2.4.2-2 i586; en-US; m18) Gecko/20010131 Netscape6/6.01</String>
  14082. <Description>Netscape 6.x Linux</Description>
  14083. <Type>B</Type>
  14084. <Comment></Comment>
  14085. <Link1></Link1>
  14086. <Link2></Link2>
  14087. </user-agent>
  14088. <user-agent>
  14089. <ID>id_moz_160306_1</ID>
  14090. <String>Mozilla/5.0 (X11; U; Linux i686; de-AT; rv:1.8.0.2) Gecko/20060309 SeaMonkey/1.0</String>
  14091. <Description>SeaMonkey browser suite (ex Mozilla) on Linux</Description>
  14092. <Type>B</Type>
  14093. <Comment></Comment>
  14094. <Link1>http://www.mozilla.org/projects/seamonkey/</Link1>
  14095. <Link2></Link2>
  14096. </user-agent>
  14097. <user-agent>
  14098. <ID>id_moz_993</ID>
  14099. <String>Mozilla/5.0 (X11; U; Linux i686; en-GB; rv:1.7.6) Gecko/20050405 Epiphany/1.6.1 (Ubuntu) (Ubuntu package 1.0.2)</String>
  14100. <Description>Epiphany (Mozilla/Gecko engine) browser Linux</Description>
  14101. <Type>B</Type>
  14102. <Comment></Comment>
  14103. <Link1>http://www.gnome.org/projects/epiphany/</Link1>
  14104. <Link2></Link2>
  14105. </user-agent>
  14106. <user-agent>
  14107. <ID>id_moz_994</ID>
  14108. <String>Mozilla/5.0 (X11; U; Linux i686; en-US; Nautilus/1.0Final) Gecko/20020408</String>
  14109. <Description>Nautilus (developed by Eazel.com) 1.x Browser Linux</Description>
  14110. <Type>B</Type>
  14111. <Comment></Comment>
  14112. <Link1>http://swin05.dyndns.biz/Doc/Docrh7.03us/DocRH7.3us/sunsite.mff.cuni.cz/pub/redhat/linux/7.3/fr/doc/RH-DOCS/rhl-gsg-en-7.3/s1-browsers-nautilus.html</Link1>
  14113. <Link2></Link2>
  14114. </user-agent>
  14115. <user-agent>
  14116. <ID>id_moz_995</ID>
  14117. <String>Mozilla/5.0 (X11; U; Linux i686; en-US; rv:0.9.3) Gecko/20010801</String>
  14118. <Description>Mozilla (Gecko) 0.9x browser Linux</Description>
  14119. <Type>B</Type>
  14120. <Comment></Comment>
  14121. <Link1></Link1>
  14122. <Link2></Link2>
  14123. </user-agent>
  14124. <user-agent>
  14125. <ID>id_moz_030110_5</ID>
  14126. <String>Mozilla/5.0 (X11; U; Linux i686; en-US; rv:1.2.1; aggregator:Spinn3r (Spinn3r 3.1); http://spinn3r.com/robot) Gecko/20021130</String>
  14127. <Description>Spinn3r social network crawler</Description>
  14128. <Type>R</Type>
  14129. <Comment>64.34.195.1xx</Comment>
  14130. <Link1>http://spinn3r.com/</Link1>
  14131. <Link2></Link2>
  14132. </user-agent>
  14133. <user-agent>
  14134. <ID>id_moz_996</ID>
  14135. <String>Mozilla/5.0 (X11; U; Linux i686; en-US; rv:1.2b) Gecko/20021007 Phoenix/0.3</String>
  14136. <Description>Phoenix 0.3 browser (Mozilla/Gecko engine) - now Firebird Linux</Description>
  14137. <Type>B</Type>
  14138. <Comment></Comment>
  14139. <Link1>http://www.firebirdsql.org/</Link1>
  14140. <Link2></Link2>
  14141. </user-agent>
  14142. <user-agent>
  14143. <ID>id_moz_997</ID>
  14144. <String>Mozilla/5.0 (X11; U; Linux i686; en-US; rv:1.6) Gecko/20040413 Epiphany/1.2.1</String>
  14145. <Description>Epiphany (Mozilla/Gecko engine) browser Linux</Description>
  14146. <Type>B</Type>
  14147. <Comment></Comment>
  14148. <Link1>http://www.gnome.org/projects/epiphany/</Link1>
  14149. <Link2></Link2>
  14150. </user-agent>
  14151. <user-agent>
  14152. <ID>id_moz_190107_1</ID>
  14153. <String>Mozilla/5.0 (X11; U; Linux i686; en-US; rv:1.8.0.7) Gecko/20060909 Firefox/1.5.0.7 SnapPreviewBot</String>
  14154. <Description>Snap Firefox Search Plugin</Description>
  14155. <Type>B</Type>
  14156. <Comment></Comment>
  14157. <Link1>http://www.snap.com/about/spa1A.php</Link1>
  14158. <Link2></Link2>
  14159. </user-agent>
  14160. <user-agent>
  14161. <ID>id_moz_240107_2</ID>
  14162. <String>Mozilla/5.0 (X11; U; Linux i686; en-US; rv:1.8.1) Gecko/20061129 BonEcho/2.0</String>
  14163. <Description>Bon Echo Alpha - developer preview of future Firefox browser</Description>
  14164. <Type>B</Type>
  14165. <Comment></Comment>
  14166. <Link1>http://www.mozilla.org/projects/bonecho/releases/2.0a1.html</Link1>
  14167. <Link2></Link2>
  14168. </user-agent>
  14169. <user-agent>
  14170. <ID>id_moz_240207_2</ID>
  14171. <String>Mozilla/5.0 (X11; U; Linux i686; en-US; rv:1.8.1.1) Gecko/20061205 Iceweasel/2.0.0.1 (Debian-2.0.0.1+dfsg-2)</String>
  14172. <Description>IceWeasel - the GNU version of the Firefox browser</Description>
  14173. <Type>B</Type>
  14174. <Comment></Comment>
  14175. <Link1>http://www.gnu.org/software/gnuzilla/</Link1>
  14176. <Link2></Link2>
  14177. </user-agent>
  14178. <user-agent>
  14179. <ID>id_moz_150408_1</ID>
  14180. <String>Mozilla/5.0 (X11; U; Linux x86_64; en-US; rv:1.9a8) Gecko/2007100619 GranParadiso/3.0a8</String>
  14181. <Description>Mozilla Firefox 3.0 beta (Gran Paradiso) for Linux</Description>
  14182. <Type>B</Type>
  14183. <Comment></Comment>
  14184. <Link1>http://developer.mozilla.org/en/docs/Firefox_3_for_developers</Link1>
  14185. <Link2></Link2>
  14186. </user-agent>
  14187. <user-agent>
  14188. <ID>id_moz_999</ID>
  14189. <String>Mozilla/5.0 Galeon/1.0.2 (X11; Linux i686; U;) Gecko/20011224</String>
  14190. <Description>Galeon 1.x Browser Linux</Description>
  14191. <Type>B</Type>
  14192. <Comment></Comment>
  14193. <Link1>http://galeon.sourceforge.net/</Link1>
  14194. <Link2></Link2>
  14195. </user-agent>
  14196. <user-agent>
  14197. <ID>id_moz_1000</ID>
  14198. <String>Mozilla/5.0 gURLChecker/0.x.x (Linux)</String>
  14199. <Description>gURLChecker - GNOME link checking tool</Description>
  14200. <Type>C</Type>
  14201. <Comment></Comment>
  14202. <Link1>http://www.nongnu.org</Link1>
  14203. <Link2></Link2>
  14204. </user-agent>
  14205. <user-agent>
  14206. <ID>id_moz_1001</ID>
  14207. <String>Mozilla/5.0 URL-Spider</String>
  14208. <Description>URL Spider - used by usww.net</Description>
  14209. <Type>R</Type>
  14210. <Comment></Comment>
  14211. <Link1>http://www.url-spider.com/</Link1>
  14212. <Link2></Link2>
  14213. </user-agent>
  14214. <user-agent>
  14215. <ID>id_moz_1002</ID>
  14216. <String>Mozilla/5.0 usww.com-Spider-for-w8.net</String>
  14217. <Description>W8net spider</Description>
  14218. <Type>R</Type>
  14219. <Comment></Comment>
  14220. <Link1>http://www.usww.com</Link1>
  14221. <Link2></Link2>
  14222. </user-agent>
  14223. <user-agent>
  14224. <ID>id_moz_1003</ID>
  14225. <String>Mozilla/5.0 wgao@genieknows.com</String>
  14226. <Description>GenieKnows.com search robot (64.5.245.xx / 64.5.220.xxx)</Description>
  14227. <Type>R</Type>
  14228. <Comment></Comment>
  14229. <Link1>http://www.genieknows.com</Link1>
  14230. <Link2></Link2>
  14231. </user-agent>
  14232. <user-agent>
  14233. <ID>id_moz_111205_7</ID>
  14234. <String>Mozilla/5.0 whoiam [http://www.axxus.de/]</String>
  14235. <Description>axxus.de German business directory</Description>
  14236. <Type>R C</Type>
  14237. <Comment></Comment>
  14238. <Link1>http://www.axxus.de/</Link1>
  14239. <Link2></Link2>
  14240. </user-agent>
  14241. <user-agent>
  14242. <ID>id_moz_998</ID>
  14243. <String>Mozilla/5.0 [en] (compatible; Gulper Web Bot 0.2.4 www.ecsl.cs.sunysb.edu/~maxim/cgi-bin/Link/GulperBot)</String>
  14244. <Description>Yuntis : Collaborative Web Resource Categorization and Ranking Project robot</Description>
  14245. <Type>R</Type>
  14246. <Comment></Comment>
  14247. <Link1>http://www.ecsl.cs.sunysb.edu/yuntis/</Link1>
  14248. <Link2></Link2>
  14249. </user-agent>
  14250. <user-agent>
  14251. <ID>id_g_m_190606_1</ID>
  14252. <String>MQbot metaquerier.cs.uiuc.edu/crawler</String>
  14253. <Description>MetaExplorer project's MetaQuerier robot</Description>
  14254. <Type>R</Type>
  14255. <Comment>192.17.11.xx</Comment>
  14256. <Link1>http://metaquerier.cs.uiuc.edu/</Link1>
  14257. <Link2></Link2>
  14258. </user-agent>
  14259. <user-agent>
  14260. <ID>id_g_m_251006_1</ID>
  14261. <String>MQBOT/Nutch-0.9-dev (MQBOT Nutch Crawler; http://falcon.cs.uiuc.edu; mqbot@cs.uiuc.edu)</String>
  14262. <Description>MetaExplorer project's MetaQuerier robot</Description>
  14263. <Type>R</Type>
  14264. <Comment>192.17.11.xx</Comment>
  14265. <Link1>http://metaquerier.cs.uiuc.edu/</Link1>
  14266. <Link2></Link2>
  14267. </user-agent>
  14268. <user-agent>
  14269. <ID>id_g_m_1004</ID>
  14270. <String>MSFrontPage/4.0</String>
  14271. <Description>MS Frontpage 4.x</Description>
  14272. <Type>B</Type>
  14273. <Comment></Comment>
  14274. <Link1></Link1>
  14275. <Link2></Link2>
  14276. </user-agent>
  14277. <user-agent>
  14278. <ID>id_g_m_1005</ID>
  14279. <String>MSIE 4.0 (Win95)</String>
  14280. <Description>Some faked UA - maybe for a download manager</Description>
  14281. <Type>D</Type>
  14282. <Comment></Comment>
  14283. <Link1></Link1>
  14284. <Link2></Link2>
  14285. </user-agent>
  14286. <user-agent>
  14287. <ID>id_g_m_1006</ID>
  14288. <String>MSIE-5.13 (larbin@unspecified.mail)</String>
  14289. <Description>unknown robot from gw.ocg-corp.com (209.126.176.x)</Description>
  14290. <Type></Type>
  14291. <Comment>see also: - Opera/6.01 (larbin@.....) - WinampMPEG/2.00 larbin@....</Comment>
  14292. <Link1></Link1>
  14293. <Link2></Link2>
  14294. </user-agent>
  14295. <user-agent>
  14296. <ID>id_g_m_190506_1</ID>
  14297. <String>msnbot-media/1.0 (+http://search.msn.com/msnbot.htm)</String>
  14298. <Description>MSN media search robot</Description>
  14299. <Type>R</Type>
  14300. <Comment>65.55.235.1xx</Comment>
  14301. <Link1>http://search.msn.com</Link1>
  14302. <Link2></Link2>
  14303. </user-agent>
  14304. <user-agent>
  14305. <ID>id_g_m_290806_1</ID>
  14306. <String>msnbot-Products/1.0 (+http://search.msn.com/msnbot.htm)</String>
  14307. <Description>Windows Live product search (Beta) robot</Description>
  14308. <Type>R</Type>
  14309. <Comment>207.68.157.xxx</Comment>
  14310. <Link1>http://products.live.com</Link1>
  14311. <Link2>http://productsearch.spaces.live.com/</Link2>
  14312. </user-agent>
  14313. <user-agent>
  14314. <ID>id_g_m_1007</ID>
  14315. <String>MSNBOT/0.xx (http://search.msn.com/msnbot.htm)</String>
  14316. <Description>MSN Search robot - 131.107.xxx.xxx 204.95.96.xxx - 204.95.111.xxx 207.46.xxx.xxx</Description>
  14317. <Type>R</Type>
  14318. <Comment>s. also Mozilla/4.0 (compatible; MSIE 6.0; Windows NT; MS Search...</Comment>
  14319. <Link1>http://search.msn.com</Link1>
  14320. <Link2></Link2>
  14321. </user-agent>
  14322. <user-agent>
  14323. <ID>id_g_m_1008</ID>
  14324. <String>msnbot/x.xx ( http://search.msn.com/msnbot.htm)</String>
  14325. <Description>MSN Search robot - 131.107.xxx.xxx 204.95.96.xxx - 204.95.111.xxx 207.46.xxx.xxx</Description>
  14326. <Type>R</Type>
  14327. <Comment>s. also Mozilla/4.0 (compatible; MSIE 6.0; Windows NT; MS Search...</Comment>
  14328. <Link1>http://search.msn.com</Link1>
  14329. <Link2></Link2>
  14330. </user-agent>
  14331. <user-agent>
  14332. <ID>id_g_m_190108_2</ID>
  14333. <String>MSNBOT_Mobile MSMOBOT Mozilla/2.0 (compatible; MSIE 4.02; Windows CE; Default)</String>
  14334. <Description>Microsoft search for mobiles</Description>
  14335. <Type>R</Type>
  14336. <Comment>65.55.241.2xx</Comment>
  14337. <Link1>http://livesearchmobile.com/?mid=1011</Link1>
  14338. <Link2></Link2>
  14339. </user-agent>
  14340. <user-agent>
  14341. <ID>id_g_m_1009</ID>
  14342. <String>MSNPTC/1.0</String>
  14343. <Description>MSN Search robot - 131.107.xxx.xxx 204.95.96.xxx - 204.95.111.xxx 207.46.xxx.xxx</Description>
  14344. <Type>R</Type>
  14345. <Comment>s. also Mozilla/4.0 (compatible; MSIE 6.0; Windows NT; MS Search...</Comment>
  14346. <Link1>http://search.msn.com</Link1>
  14347. <Link2></Link2>
  14348. </user-agent>
  14349. <user-agent>
  14350. <ID>id_g_m_1010</ID>
  14351. <String>MSProxy/2.0</String>
  14352. <Description>Microsoft proxy server</Description>
  14353. <Type>P</Type>
  14354. <Comment></Comment>
  14355. <Link1>http://www.microsoft.com/isaserver/evaluation/previousversions/default.mspx</Link1>
  14356. <Link2></Link2>
  14357. </user-agent>
  14358. <user-agent>
  14359. <ID>id_g_m_181205_3</ID>
  14360. <String>MSRBOT</String>
  14361. <Description>MacEdition CodeBitch link checking</Description>
  14362. <Type>C</Type>
  14363. <Comment></Comment>
  14364. <Link1>http://www.macedition.com/cb/cb_20030310.php</Link1>
  14365. <Link2></Link2>
  14366. </user-agent>
  14367. <user-agent>
  14368. <ID>id_g_m_270407_1</ID>
  14369. <String>MSRBOT (http://research.microsoft.com/research/sv/msrbot)</String>
  14370. <Description>Microsoft MSRBot</Description>
  14371. <Type>R</Type>
  14372. <Comment></Comment>
  14373. <Link1>http://research.microsoft.com/research/sv/msrbot/</Link1>
  14374. <Link2></Link2>
  14375. </user-agent>
  14376. <user-agent>
  14377. <ID>id_g_m_070406_3</ID>
  14378. <String>Mulder&#44; VCR-1.0</String>
  14379. <Description>StreamBox VCR user agent</Description>
  14380. <Type>D</Type>
  14381. <Comment></Comment>
  14382. <Link1>http://all-streaming-media.com/streaming-media-faq/faq-streambox-vcr-download-problems.htm</Link1>
  14383. <Link2></Link2>
  14384. </user-agent>
  14385. <user-agent>
  14386. <ID>id_g_m_1011</ID>
  14387. <String>multiBlocker browser</String>
  14388. <Description>Multiblocker (Fantomaster) anonymity software user</Description>
  14389. <Type>P</Type>
  14390. <Comment></Comment>
  14391. <Link1>http://multiblocker.com/home.html</Link1>
  14392. <Link2>http://fantomaster.com</Link2>
  14393. </user-agent>
  14394. <user-agent>
  14395. <ID>id_g_m_030807_1</ID>
  14396. <String>multicrawler ( http://sw.deri.org/2006/04/multicrawler/robots.html)</String>
  14397. <Description>MultiCrawler for DERI Galway's Semantic Web Search Engine cluster</Description>
  14398. <Type>R</Type>
  14399. <Comment>140.203.154.1xx</Comment>
  14400. <Link1>http://sw.deri.org/2006/04/multicrawler/robots.html</Link1>
  14401. <Link2>http://sw.deri.ie/</Link2>
  14402. </user-agent>
  14403. <user-agent>
  14404. <ID>id_g_m_1012</ID>
  14405. <String>MultiText/0.1</String>
  14406. <Description>Virginia Tech Digital Library Research Laboratory robot</Description>
  14407. <Type>R</Type>
  14408. <Comment></Comment>
  14409. <Link1>http://www.dlib.vt.edu</Link1>
  14410. <Link2></Link2>
  14411. </user-agent>
  14412. <user-agent>
  14413. <ID>id_g_m_1013</ID>
  14414. <String>MusicWalker2.0 ( http://www.somusical.com)</String>
  14415. <Description>SoMusical! musical directory link checking</Description>
  14416. <Type>R</Type>
  14417. <Comment></Comment>
  14418. <Link1>http://www.somusical.com</Link1>
  14419. <Link2></Link2>
  14420. </user-agent>
  14421. <user-agent>
  14422. <ID>id_g_m_270306_1</ID>
  14423. <String>MVAClient</String>
  14424. <Description>Unknown bad bot from diff. Taiwanese IPs</Description>
  14425. <Type>S</Type>
  14426. <Comment>see this blog:</Comment>
  14427. <Link1>http://www.tenspider.com/business-blog/weblog.php</Link1>
  14428. <Link2></Link2>
  14429. </user-agent>
  14430. <user-agent>
  14431. <ID>id_g_m_241105_1</ID>
  14432. <String>My WinHTTP Connection</String>
  14433. <Description>Windows HTTP Services (WinHTTP)</Description>
  14434. <Type></Type>
  14435. <Comment></Comment>
  14436. <Link1>http://msdn.microsoft.com/library/?url=/library/en-us/winhttp/http/about_winhttp.asp</Link1>
  14437. <Link2></Link2>
  14438. </user-agent>
  14439. <user-agent>
  14440. <ID>id_g_m_1014</ID>
  14441. <String>myDaemon</String>
  14442. <Description>unknown user robot (24.124.34.42)</Description>
  14443. <Type></Type>
  14444. <Comment></Comment>
  14445. <Link1></Link1>
  14446. <Link2></Link2>
  14447. </user-agent>
  14448. <user-agent>
  14449. <ID>id_g_m_1015</ID>
  14450. <String>MyGetRight/1.0.0</String>
  14451. <Description>GetRight download manager</Description>
  14452. <Type>D</Type>
  14453. <Comment></Comment>
  14454. <Link1>http://www.getright.com</Link1>
  14455. <Link2></Link2>
  14456. </user-agent>
  14457. <user-agent>
  14458. <ID>id_g_m_1016</ID>
  14459. <String>MyGetRight/1.0b</String>
  14460. <Description>GetRight download manager</Description>
  14461. <Type>D</Type>
  14462. <Comment></Comment>
  14463. <Link1>http://www.getright.com</Link1>
  14464. <Link2></Link2>
  14465. </user-agent>
  14466. <user-agent>
  14467. <ID>id_g_m_1017</ID>
  14468. <String>Mylinea.com Crawler 2.0</String>
  14469. <Description>Mylinea France web catalogue crawler</Description>
  14470. <Type>R</Type>
  14471. <Comment></Comment>
  14472. <Link1>http://www.mylinea.com</Link1>
  14473. <Link2></Link2>
  14474. </user-agent>
  14475. <user-agent>
  14476. <ID>id_g_m_040906_1</ID>
  14477. <String>mylinkcheck/1.02</String>
  14478. <Description>VDOG - SEO webdirecory (Germany) link checking</Description>
  14479. <Type>C</Type>
  14480. <Comment></Comment>
  14481. <Link1>http://www.vdog.de/</Link1>
  14482. <Link2></Link2>
  14483. </user-agent>
  14484. <user-agent>
  14485. <ID>id_n_s_1018</ID>
  14486. <String>Naamah 1.0.1/Blogbot (http://blogbot.de/)</String>
  14487. <Description>Blogbot (Germany) robot</Description>
  14488. <Type>R</Type>
  14489. <Comment></Comment>
  14490. <Link1>http://blogbot.de/</Link1>
  14491. <Link2></Link2>
  14492. </user-agent>
  14493. <user-agent>
  14494. <ID>id_n_s_1019</ID>
  14495. <String>Naamah 1.0a/Blogbot (http://blogbot.de/)</String>
  14496. <Description>Blogbot (Germany) robot</Description>
  14497. <Type>R</Type>
  14498. <Comment></Comment>
  14499. <Link1>http://blogbot.de/</Link1>
  14500. <Link2></Link2>
  14501. </user-agent>
  14502. <user-agent>
  14503. <ID>id_n_s_1021</ID>
  14504. <String>NABOT/5.0</String>
  14505. <Description>Naver Japan / Korea robot </Description>
  14506. <Type>R</Type>
  14507. <Comment>s.also Python-urllib/1.15 - dloader(NaverRobot)/1.0 &amp; Cowbot</Comment>
  14508. <Link1>http://www.naver.co.jp/</Link1>
  14509. <Link2></Link2>
  14510. </user-agent>
  14511. <user-agent>
  14512. <ID>id_n_s_1020</ID>
  14513. <String>nabot_1.0</String>
  14514. <Description>Naver Japan / Korea robot </Description>
  14515. <Type>R</Type>
  14516. <Comment>s.also Python-urllib/1.15 - dloader(NaverRobot)/1.0 &amp; Cowbot</Comment>
  14517. <Link1>http://www.naver.co.jp/</Link1>
  14518. <Link2></Link2>
  14519. </user-agent>
  14520. <user-agent>
  14521. <ID>id_n_s_180408_4</ID>
  14522. <String>NameOfAgent (CMS Spider)</String>
  14523. <Description>Badbot searching for Wordpress wp-login.php</Description>
  14524. <Type>S</Type>
  14525. <Comment></Comment>
  14526. <Link1></Link1>
  14527. <Link2></Link2>
  14528. </user-agent>
  14529. <user-agent>
  14530. <ID>id_n_s_071205_1</ID>
  14531. <String>naoFavicon4IE/1.xx</String>
  14532. <Description>naoFavicon4IE</Description>
  14533. <Type>D</Type>
  14534. <Comment></Comment>
  14535. <Link1>http://nao4u.com/software/naoFavicon4IE/</Link1>
  14536. <Link2></Link2>
  14537. </user-agent>
  14538. <user-agent>
  14539. <ID>id_n_s_140506_2</ID>
  14540. <String>NASA Search 1.0</String>
  14541. <Description>Unknown spambot / harvester from diff. IPs</Description>
  14542. <Type>S</Type>
  14543. <Comment></Comment>
  14544. <Link1>http://www.projecthoneypot.org/ip_inspector.php?iph=978231e229521680d11cb93f32de0fa1</Link1>
  14545. <Link2></Link2>
  14546. </user-agent>
  14547. <user-agent>
  14548. <ID>id_n_s_1022</ID>
  14549. <String>NationalDirectory-WebSpider/1.3</String>
  14550. <Description>Nationaldirectory spider</Description>
  14551. <Type>R</Type>
  14552. <Comment></Comment>
  14553. <Link1>http://www.nationaldirectory.com/</Link1>
  14554. <Link2></Link2>
  14555. </user-agent>
  14556. <user-agent>
  14557. <ID>id_n_s_1023</ID>
  14558. <String>NationalDirectoryAddURL/1.0</String>
  14559. <Description>Nationaldirectory spider</Description>
  14560. <Type>R</Type>
  14561. <Comment></Comment>
  14562. <Link1>http://www.nationaldirectory.com/</Link1>
  14563. <Link2></Link2>
  14564. </user-agent>
  14565. <user-agent>
  14566. <ID>id_n_s_1025</ID>
  14567. <String>NaverBot-1.0 (NHN Corp. / +82-2-3011-1954 / nhnbot@naver.com)</String>
  14568. <Description>Naver Japan / Korea robot</Description>
  14569. <Type>R</Type>
  14570. <Comment>s. also Python-urllib/1.15- nabot- cowbot &amp; dloader</Comment>
  14571. <Link1>http://www.naver.co.jp/</Link1>
  14572. <Link2></Link2>
  14573. </user-agent>
  14574. <user-agent>
  14575. <ID>id_n_s_1024</ID>
  14576. <String>NaverBot_dloader/1.5</String>
  14577. <Description>Naver Japan / Korea robot</Description>
  14578. <Type>R</Type>
  14579. <Comment>s. also Python-urllib/1.15 - nabot - cowbot &amp; dloader</Comment>
  14580. <Link1>http://www.naver.co.jp/</Link1>
  14581. <Link2></Link2>
  14582. </user-agent>
  14583. <user-agent>
  14584. <ID>id_n_s_181205_1</ID>
  14585. <String>NavissoBot</String>
  14586. <Description>Navisso closed beta robot (69.41.162.1xx)</Description>
  14587. <Type>R</Type>
  14588. <Comment></Comment>
  14589. <Link1>http://navisso.com/</Link1>
  14590. <Link2></Link2>
  14591. </user-agent>
  14592. <user-agent>
  14593. <ID>id_n_s_181205_2</ID>
  14594. <String>NavissoBot/1.7  (+http://navisso.com/)</String>
  14595. <Description>Navisso closed beta robot (69.41.162.1xx)</Description>
  14596. <Type>R</Type>
  14597. <Comment></Comment>
  14598. <Link1>http://navisso.com/</Link1>
  14599. <Link2></Link2>
  14600. </user-agent>
  14601. <user-agent>
  14602. <ID>id_n_s_1026</ID>
  14603. <String>NCSA Beta 1 (http://vias.ncsa.uiuc.edu/viasarchivinginformation.html)</String>
  14604. <Description>Vias Information Archival robot</Description>
  14605. <Type>R</Type>
  14606. <Comment></Comment>
  14607. <Link1>http://vias.ncsa.uiuc.edu/</Link1>
  14608. <Link2></Link2>
  14609. </user-agent>
  14610. <user-agent>
  14611. <ID>id_n_s_250507_1</ID>
  14612. <String>Nebullabot/2.2 (http://bot.nebulla.info)</String>
  14613. <Description>Nebulla.info distributed crawler (Germany)</Description>
  14614. <Type>R</Type>
  14615. <Comment>81.169.180.2xx</Comment>
  14616. <Link1>http://www.nebulla.info/</Link1>
  14617. <Link2>http://bot.nebulla.info/</Link2>
  14618. </user-agent>
  14619. <user-agent>
  14620. <ID>id_n_s_1027</ID>
  14621. <String>NEC Research Agent -- compuman at research.nj.nec.com</String>
  14622. <Description>NEC Researchindex robot - now CiteSeer.IST scientific document index</Description>
  14623. <Type>R</Type>
  14624. <Comment></Comment>
  14625. <Link1>http://citeseer.ist.psu.edu/</Link1>
  14626. <Link2></Link2>
  14627. </user-agent>
  14628. <user-agent>
  14629. <ID>id_n_s_1028</ID>
  14630. <String>NEC-Hayek/1.0</String>
  14631. <Description>rcn.com user agent ? NEC Researchindex robot ?</Description>
  14632. <Type></Type>
  14633. <Comment>s. NEC Research Agent</Comment>
  14634. <Link1></Link1>
  14635. <Link2></Link2>
  14636. </user-agent>
  14637. <user-agent>
  14638. <ID>id_n_s_291108_4</ID>
  14639. <String>Net-Seekr Bot/Net-Seekr Bot V1 (http://www.net-seekr.com)</String>
  14640. <Description>Net Seekr search robot</Description>
  14641. <Type>R</Type>
  14642. <Comment>78.129.201.19x</Comment>
  14643. <Link1>http://www.net-seekr.com/</Link1>
  14644. <Link2></Link2>
  14645. </user-agent>
  14646. <user-agent>
  14647. <ID>id_n_s_1029</ID>
  14648. <String>NetAnts/1.2x</String>
  14649. <Description>NetAnts download manager</Description>
  14650. <Type>D</Type>
  14651. <Comment></Comment>
  14652. <Link1>http://www.netants.com/en/index.html</Link1>
  14653. <Link2></Link2>
  14654. </user-agent>
  14655. <user-agent>
  14656. <ID>id_n_s_1030</ID>
  14657. <String>NETCOMplete/x.xx</String>
  14658. <Description>NetComplete IE browser package</Description>
  14659. <Type>B</Type>
  14660. <Comment></Comment>
  14661. <Link1>http://www.netcom.net.uk/</Link1>
  14662. <Link2></Link2>
  14663. </user-agent>
  14664. <user-agent>
  14665. <ID>id_n_s_010807_2</ID>
  14666. <String>NetinfoBot/1.0 (http://netinfo.bg/netinfobot.html)</String>
  14667. <Description>Netinfo.bg search (Bulgaria) robot</Description>
  14668. <Type>R</Type>
  14669. <Comment>194.153.145.x[xx]</Comment>
  14670. <Link1>http://netinfo.bg/</Link1>
  14671. <Link2></Link2>
  14672. </user-agent>
  14673. <user-agent>
  14674. <ID>id_n_s_1031</ID>
  14675. <String>NetLookout/2.24</String>
  14676. <Description>Netlookout internet notifier</Description>
  14677. <Type>R</Type>
  14678. <Comment>site is offline</Comment>
  14679. <Link1>http://www.frugalsoft.com</Link1>
  14680. <Link2></Link2>
  14681. </user-agent>
  14682. <user-agent>
  14683. <ID>id_n_s_230406_3</ID>
  14684. <String>Netluchs/0.8-dev ( ; http://www.netluchs.de/; ___don't___spam_me_@netluchs.de)</String>
  14685. <Description>Netluchs (Germany) search (193.164.8.xx)</Description>
  14686. <Type>R</Type>
  14687. <Comment>Same IP-range as Metager search - powered by Nutch</Comment>
  14688. <Link1>http://www.netluchs.de/</Link1>
  14689. <Link2></Link2>
  14690. </user-agent>
  14691. <user-agent>
  14692. <ID>id_n_s_1032</ID>
  14693. <String>NetMechanic Vx.0</String>
  14694. <Description>NetMechanic link checker</Description>
  14695. <Type>C</Type>
  14696. <Comment></Comment>
  14697. <Link1>http://www.netmechanic.com/</Link1>
  14698. <Link2></Link2>
  14699. </user-agent>
  14700. <user-agent>
  14701. <ID>id_n_s_030906_1</ID>
  14702. <String>NetNewsWire/2.x (Mac OS X; http://ranchero.com/netnewswire/)</String>
  14703. <Description>NewsGator NetNewsWire - Mac RSS feed reader</Description>
  14704. <Type>B</Type>
  14705. <Comment></Comment>
  14706. <Link1>http://www.newsgator.com/NGOLProduct.aspx?ProdID=NetNewsWire</Link1>
  14707. <Link2></Link2>
  14708. </user-agent>
  14709. <user-agent>
  14710. <ID>id_n_s_1033</ID>
  14711. <String>NetNoseCrawler/v1.0</String>
  14712. <Description>unknown InCom (216.0.107.xx) robot</Description>
  14713. <Type>R</Type>
  14714. <Comment></Comment>
  14715. <Link1>http://www.incom.net/</Link1>
  14716. <Link2></Link2>
  14717. </user-agent>
  14718. <user-agent>
  14719. <ID>id_n_s_1034</ID>
  14720. <String>Netprospector JavaCrawler</String>
  14721. <Description>Netprospector metasearch software</Description>
  14722. <Type>R</Type>
  14723. <Comment></Comment>
  14724. <Link1>http://www.actaddons.com/products/netprospector.asp</Link1>
  14725. <Link2></Link2>
  14726. </user-agent>
  14727. <user-agent>
  14728. <ID>id_n_s_1035</ID>
  14729. <String>NetPumper/x.xx</String>
  14730. <Description>Netpumper download manager</Description>
  14731. <Type>D</Type>
  14732. <Comment></Comment>
  14733. <Link1>http://www.netpumper.com/</Link1>
  14734. <Link2></Link2>
  14735. </user-agent>
  14736. <user-agent>
  14737. <ID>id_n_s_1036</ID>
  14738. <String>NetResearchServer(http://www.look.com)</String>
  14739. <Description>Look.com robot (209.87.232.x)</Description>
  14740. <Type>R</Type>
  14741. <Comment></Comment>
  14742. <Link1>http://www.look.com/</Link1>
  14743. <Link2></Link2>
  14744. </user-agent>
  14745. <user-agent>
  14746. <ID>id_n_s_1037</ID>
  14747. <String>NetResearchServer/x.x(loopimprovements.com/robot.html)</String>
  14748. <Description>IncyWincy search engine using DMOZ database</Description>
  14749. <Type>R</Type>
  14750. <Comment></Comment>
  14751. <Link1>http://www.loopimprovements.com/</Link1>
  14752. <Link2></Link2>
  14753. </user-agent>
  14754. <user-agent>
  14755. <ID>id_n_s_140209_5</ID>
  14756. <String>NetSeer/Nutch-0.9 (NetSeer Crawler; http://www.netseer.com; crawler@netseer.com)</String>
  14757. <Description>NetSeer search (beta) crawler via Amazon Web Services - see also Teemer</Description>
  14758. <Type>R</Type>
  14759. <Comment>67.202.26.1xx</Comment>
  14760. <Link1>http://www.netseer.com/</Link1>
  14761. <Link2>http://www.amazon.com/gp/browse.html?node=3435361</Link2>
  14762. </user-agent>
  14763. <user-agent>
  14764. <ID>id_n_s_150906_2</ID>
  14765. <String>NetSprint -- 2.0</String>
  14766. <Description>Wirtualna Polska / Netsprint search (Poland) robot</Description>
  14767. <Type>R</Type>
  14768. <Comment>212.77.102.1xx</Comment>
  14769. <Link1>http://www.wp.pl/</Link1>
  14770. <Link2>http://www.netsprint.pl/serwis/</Link2>
  14771. </user-agent>
  14772. <user-agent>
  14773. <ID>id_n_s_190306_1</ID>
  14774. <String>NetWhatCrawler/0.06-dev (NetWhatCrawler from NetWhat.com; http://www.netwhat.com; support@netwhat.com)</String>
  14775. <Description>NetWhat Search crawler (69.9.167.1xx)</Description>
  14776. <Type>R</Type>
  14777. <Comment></Comment>
  14778. <Link1>http://www.netwhat.com/</Link1>
  14779. <Link2></Link2>
  14780. </user-agent>
  14781. <user-agent>
  14782. <ID>id_n_s_1038</ID>
  14783. <String>NetZippy</String>
  14784. <Description>Netzippy robot</Description>
  14785. <Type>R</Type>
  14786. <Comment>site is closed</Comment>
  14787. <Link1>http://www.netzippy.com/</Link1>
  14788. <Link2></Link2>
  14789. </user-agent>
  14790. <user-agent>
  14791. <ID>id_n_s_1039</ID>
  14792. <String>NeuralBot/0.2</String>
  14793. <Description>unknown</Description>
  14794. <Type></Type>
  14795. <Comment></Comment>
  14796. <Link1></Link1>
  14797. <Link2></Link2>
  14798. </user-agent>
  14799. <user-agent>
  14800. <ID>id_n_s_1040</ID>
  14801. <String>newsearchengine (ThisUser@unspecified.mail)</String>
  14802. <Description>Unknown (12.238.4.xxx) attbi.com client robot</Description>
  14803. <Type></Type>
  14804. <Comment></Comment>
  14805. <Link1></Link1>
  14806. <Link2></Link2>
  14807. </user-agent>
  14808. <user-agent>
  14809. <ID>id_n_s_250707_3</ID>
  14810. <String>NewsGator FetchLinks extension/0.2.0 (http://graemef.com)</String>
  14811. <Description>FetchLinks plugin for NewsGator RSS reader</Description>
  14812. <Type>B</Type>
  14813. <Comment></Comment>
  14814. <Link1>http://graemef.com/project/fetchlinks</Link1>
  14815. <Link2></Link2>
  14816. </user-agent>
  14817. <user-agent>
  14818. <ID>id_n_s_250707_4</ID>
  14819. <String>NewsGatorOnline/2.0 (http://www.newsgator.com; 1 subscribers)</String>
  14820. <Description>NewsGator online RSS reader</Description>
  14821. <Type>B</Type>
  14822. <Comment>64.78.155.1xx</Comment>
  14823. <Link1>http://www.newsgator.com/</Link1>
  14824. <Link2></Link2>
  14825. </user-agent>
  14826. <user-agent>
  14827. <ID>id_n_s_1041</ID>
  14828. <String>NextGenSearchBot 1 (for information visit http://www.eliyon.com/NextGenSearchBot)</String>
  14829. <Description>Eliyon Crawler for Business People Search</Description>
  14830. <Type>R</Type>
  14831. <Comment></Comment>
  14832. <Link1>http://www.eliyon.com/NextGenSearchBot</Link1>
  14833. <Link2></Link2>
  14834. </user-agent>
  14835. <user-agent>
  14836. <ID>id_n_s_1042</ID>
  14837. <String>NextopiaBOT (+http://www.nextopia.com) distributed crawler client beta v0.x</String>
  14838. <Description>Nextopia crawler</Description>
  14839. <Type>R</Type>
  14840. <Comment></Comment>
  14841. <Link1>http://www.nextopia.com/</Link1>
  14842. <Link2></Link2>
  14843. </user-agent>
  14844. <user-agent>
  14845. <ID>id_n_s_060906_1</ID>
  14846. <String>NG-Search/0.90 (NG-SearchBot; http://www.ng-search.com;  )</String>
  14847. <Description>find your keywords - semantic search (Germany) robot</Description>
  14848. <Type>R</Type>
  14849. <Comment>84.56.87.1xx</Comment>
  14850. <Link1>http://www.ng-search.com/</Link1>
  14851. <Link2></Link2>
  14852. </user-agent>
  14853. <user-agent>
  14854. <ID>id_n_s_1043</ID>
  14855. <String>NG/1.0</String>
  14856. <Description>Exalead (France) search robot (193.47.80.xx)</Description>
  14857. <Type>R</Type>
  14858. <Comment>s. Harvest-NG/1.0.2 and Exalead NG...</Comment>
  14859. <Link1>http://www.exabot.com/</Link1>
  14860. <Link2></Link2>
  14861. </user-agent>
  14862. <user-agent>
  14863. <ID>id_n_s_050406_3</ID>
  14864. <String>NG/4.0.1229</String>
  14865. <Description>Exalead Websearch image crawler (193.47.80.xx)</Description>
  14866. <Type>R</Type>
  14867. <Comment>s. also Exabot-Images/1.0</Comment>
  14868. <Link1>http://www.exalead.com/search</Link1>
  14869. <Link2></Link2>
  14870. </user-agent>
  14871. <user-agent>
  14872. <ID>id_n_s_071106_1</ID>
  14873. <String>nicebot</String>
  14874. <Description>Unknown UA from PlanetLab distributed network</Description>
  14875. <Type></Type>
  14876. <Comment>128.8.126.xx</Comment>
  14877. <Link1>http://planetlab2.cs.umd.edu/</Link1>
  14878. <Link2></Link2>
  14879. </user-agent>
  14880. <user-agent>
  14881. <ID>id_n_s_1044</ID>
  14882. <String>NICO/1.0</String>
  14883. <Description>NicoZone childsafe search robot </Description>
  14884. <Type>R P</Type>
  14885. <Comment>-site is offline-</Comment>
  14886. <Link1>http://www.nicozone.net/</Link1>
  14887. <Link2></Link2>
  14888. </user-agent>
  14889. <user-agent>
  14890. <ID>id_n_s_291007_2</ID>
  14891. <String>Nikita the Spider (http://NikitaTheSpider.com/)</String>
  14892. <Description>Nikita the Spider - Online HTML validation &#44; link checking</Description>
  14893. <Type>C</Type>
  14894. <Comment>69.61.23.11x</Comment>
  14895. <Link1>http://nikitathespider.com/</Link1>
  14896. <Link2></Link2>
  14897. </user-agent>
  14898. <user-agent>
  14899. <ID>id_n_s_1045</ID>
  14900. <String>NITLE Blog Spider/0.01</String>
  14901. <Description>Experimental LSI (?) robot from 140.233.69.xx (Middlebury.edu)</Description>
  14902. <Type>R</Type>
  14903. <Comment></Comment>
  14904. <Link1>http://javelina.cet.middlebury.edu/lsa/out/lsa_intro.htm</Link1>
  14905. <Link2></Link2>
  14906. </user-agent>
  14907. <user-agent>
  14908. <ID>id_n_s_1046</ID>
  14909. <String>Nitro Downloader 1.x (www.klsofttools.com)</String>
  14910. <Description>Download manager</Description>
  14911. <Type>D</Type>
  14912. <Comment></Comment>
  14913. <Link1>http://www.klsofttools.com</Link1>
  14914. <Link2></Link2>
  14915. </user-agent>
  14916. <user-agent>
  14917. <ID>id_n_s_1047</ID>
  14918. <String>Noago Spider</String>
  14919. <Description>Noago spider</Description>
  14920. <Type>R</Type>
  14921. <Comment></Comment>
  14922. <Link1>http://www.noago.com/</Link1>
  14923. <Link2></Link2>
  14924. </user-agent>
  14925. <user-agent>
  14926. <ID>id_n_s_1048</ID>
  14927. <String>Nocilla/1.0</String>
  14928. <Description>telefonica.es user robot</Description>
  14929. <Type></Type>
  14930. <Comment></Comment>
  14931. <Link1></Link1>
  14932. <Link2></Link2>
  14933. </user-agent>
  14934. <user-agent>
  14935. <ID>id_n_s_1049</ID>
  14936. <String>Nokia-WAPToolkit/1.2 googlebot(at)googlebot.com</String>
  14937. <Description>Google WAP robot</Description>
  14938. <Type>R</Type>
  14939. <Comment></Comment>
  14940. <Link1>http://www.google.com/</Link1>
  14941. <Link2></Link2>
  14942. </user-agent>
  14943. <user-agent>
  14944. <ID>id_n_s_290708_3</ID>
  14945. <String>Nokia6300/2.0 (05.50) Profile/MIDP-2.0 Configuration/CLDC-1.1 (botmobi http://find.mobi/bot.html abuse@mtld.mobi)</String>
  14946. <Description>Botmobi crawler for Find.mobi mobile search</Description>
  14947. <Type>C</Type>
  14948. <Comment></Comment>
  14949. <Link1>http://find.mobi/bot.html</Link1>
  14950. <Link2>http://find.mobi/</Link2>
  14951. </user-agent>
  14952. <user-agent>
  14953. <ID>id_n_s_200108_3</ID>
  14954. <String>Nokia6610/1.0 (3.09) Profile/MIDP-1.0 Configuration/CLDC-1.0 (compatible;YahooSeeker/M1A1-R2D2; http://help.yahoo.com/help/us/ysearch/crawling/crawling-01.html)</String>
  14955. <Description>YahooSeeker/M1A1-R2D2 - Yahoo mobile web crawling robot</Description>
  14956. <Type>R</Type>
  14957. <Comment>68.180.2xx.[x]xx</Comment>
  14958. <Link1>http://help.yahoo.com/l/us/yahoo/search/mobilecrawler/mobilecrawler-01.html</Link1>
  14959. <Link2></Link2>
  14960. </user-agent>
  14961. <user-agent>
  14962. <ID>id_n_s_1050</ID>
  14963. <String>Nokia7110/1.0 (05.01) (Google WAP Proxy/1.0)</String>
  14964. <Description>Google WAP proxy</Description>
  14965. <Type>P</Type>
  14966. <Comment></Comment>
  14967. <Link1>http://www.google.com/</Link1>
  14968. <Link2></Link2>
  14969. </user-agent>
  14970. <user-agent>
  14971. <ID>id_n_s_1051</ID>
  14972. <String>NokodoBot/1.x (+http://nokodo.com/bot.htm)</String>
  14973. <Description>Nokodo public beta search robot (67.18.222.xx)</Description>
  14974. <Type>R</Type>
  14975. <Comment></Comment>
  14976. <Link1>http://www.nokodo.com/</Link1>
  14977. <Link2></Link2>
  14978. </user-agent>
  14979. <user-agent>
  14980. <ID>id_n_s_1052</ID>
  14981. <String>Norbert the Spider(Burf.com)</String>
  14982. <Description>Burf.com UK Search Engine robot</Description>
  14983. <Type>R</Type>
  14984. <Comment></Comment>
  14985. <Link1>http://www.burf.com/</Link1>
  14986. <Link2></Link2>
  14987. </user-agent>
  14988. <user-agent>
  14989. <ID>id_n_s_1053</ID>
  14990. <String>noxtrumbot/1.0 (crawler@noxtrum.com)</String>
  14991. <Description>noXtrum search robot (Spain)</Description>
  14992. <Type>R</Type>
  14993. <Comment>194.224.199.xx</Comment>
  14994. <Link1>http://www.noxtrum.com/</Link1>
  14995. <Link2></Link2>
  14996. </user-agent>
  14997. <user-agent>
  14998. <ID>id_n_s_040506_2</ID>
  14999. <String>noyona_0_1</String>
  15000. <Description>Noyona job search (preview)</Description>
  15001. <Type>R</Type>
  15002. <Comment>207.210.106.1xx</Comment>
  15003. <Link1>http://www.noyona.com/index.pl</Link1>
  15004. <Link2></Link2>
  15005. </user-agent>
  15006. <user-agent>
  15007. <ID>id_n_s_1054</ID>
  15008. <String>NP/0.1 (NP; http://www.nameprotect.com; npbot@nameprotect.com)</String>
  15009. <Description>Nameprotect copyright search robot (24.177.134.x)</Description>
  15010. <Type>R</Type>
  15011. <Comment>s. also - aipbot/1.0 (aipbot; http://www.aipbot.com... - NPBot ...</Comment>
  15012. <Link1>http://www.nameprotect.com/</Link1>
  15013. <Link2></Link2>
  15014. </user-agent>
  15015. <user-agent>
  15016. <ID>id_n_s_1553</ID>
  15017. <String>NPBot (http://www.nameprotect.com/botinfo.html)</String>
  15018. <Description>Nameprotect copyright search robot (24.177.134.x)</Description>
  15019. <Type>R</Type>
  15020. <Comment></Comment>
  15021. <Link1>http://www.nameprotect.com/</Link1>
  15022. <Link2></Link2>
  15023. </user-agent>
  15024. <user-agent>
  15025. <ID>id_n_s_1552</ID>
  15026. <String>NPBot-1/2.0</String>
  15027. <Description>Nameprotect copyright search robot (24.177.134.x)</Description>
  15028. <Type>R</Type>
  15029. <Comment></Comment>
  15030. <Link1>http://www.nameprotect.com/</Link1>
  15031. <Link2></Link2>
  15032. </user-agent>
  15033. <user-agent>
  15034. <ID>id_n_s_291205_3</ID>
  15035. <String>Nsauditor/1.x</String>
  15036. <Description>Nsauditor Network Security Auditor</Description>
  15037. <Type>S</Type>
  15038. <Comment></Comment>
  15039. <Link1>http://www.nsauditor.com/</Link1>
  15040. <Link2></Link2>
  15041. </user-agent>
  15042. <user-agent>
  15043. <ID>id_n_s_1055</ID>
  15044. <String>NSPlayer/10.0.0.xxxx WMFSDK/10.0</String>
  15045. <Description>NetShow Media Player = Windows Media Player 10</Description>
  15046. <Type>B</Type>
  15047. <Comment></Comment>
  15048. <Link1></Link1>
  15049. <Link2></Link2>
  15050. </user-agent>
  15051. <user-agent>
  15052. <ID>id_n_s_281207_2</ID>
  15053. <String>nsyght.com/Nutch-1.0-dev (nsyght.com; Nsyght.com)</String>
  15054. <Description>Nsyght social search application</Description>
  15055. <Type>R</Type>
  15056. <Comment></Comment>
  15057. <Link1>http://search.nsyght.com/</Link1>
  15058. <Link2></Link2>
  15059. </user-agent>
  15060. <user-agent>
  15061. <ID>id_n_s_161007_1</ID>
  15062. <String>nsyght.com/Nutch-x.x (nsyght.com; search.nsyght.com)</String>
  15063. <Description>Nsyght social search application</Description>
  15064. <Type>R</Type>
  15065. <Comment></Comment>
  15066. <Link1>http://search.nsyght.com/</Link1>
  15067. <Link2></Link2>
  15068. </user-agent>
  15069. <user-agent>
  15070. <ID>id_n_s_1056</ID>
  15071. <String>nttdirectory_robot/0.9 (super-robot@super.navi.ocn.ne.jp)</String>
  15072. <Description>NTT Directory robot</Description>
  15073. <Type>R</Type>
  15074. <Comment></Comment>
  15075. <Link1>http://navi.ocn.ne.jp/</Link1>
  15076. <Link2></Link2>
  15077. </user-agent>
  15078. <user-agent>
  15079. <ID>id_n_s_180206_1</ID>
  15080. <String>Nucleus SiteList LinkChecker/1.1</String>
  15081. <Description>Nucleus CMS SiteList link managing plugin</Description>
  15082. <Type>C</Type>
  15083. <Comment></Comment>
  15084. <Link1>http://wakka.xiffy.nl/sitelist</Link1>
  15085. <Link2></Link2>
  15086. </user-agent>
  15087. <user-agent>
  15088. <ID>id_n_s_1058</ID>
  15089. <String>nuSearch Spider &lt;a href='http://www.nusearch.com'>www.nusearch.com&lt;/a> (compatible; MSIE 4.01)</String>
  15090. <Description>nuSearch spider (84.9.136.xxx)</Description>
  15091. <Type>R</Type>
  15092. <Comment></Comment>
  15093. <Link1>http://www.nusearch.com/</Link1>
  15094. <Link2></Link2>
  15095. </user-agent>
  15096. <user-agent>
  15097. <ID>id_n_s_1057</ID>
  15098. <String>NuSearch Spider (compatible; MSIE 6.0)</String>
  15099. <Description>nuSearch spider (84.9.136.xxx)</Description>
  15100. <Type>R</Type>
  15101. <Comment></Comment>
  15102. <Link1>http://www.nusearch.com/</Link1>
  15103. <Link2></Link2>
  15104. </user-agent>
  15105. <user-agent>
  15106. <ID>id_n_s_1059</ID>
  15107. <String>NuSearch Spider www.nusearch.com</String>
  15108. <Description>nuSearch spider (84.9.136.xxx)</Description>
  15109. <Type>R</Type>
  15110. <Comment></Comment>
  15111. <Link1>http://www.nusearch.com/</Link1>
  15112. <Link2></Link2>
  15113. </user-agent>
  15114. <user-agent>
  15115. <ID>id_n_s_1060</ID>
  15116. <String>Nutch</String>
  15117. <Description>Nutch open source robot</Description>
  15118. <Type>R</Type>
  15119. <Comment></Comment>
  15120. <Link1>http://www.nutch.org/docs/bot.html</Link1>
  15121. <Link2></Link2>
  15122. </user-agent>
  15123. <user-agent>
  15124. <ID>id_n_s_211107_1</ID>
  15125. <String>Nutch crawler/Nutch-0.9 (picapage.com; admin@picapage.com)</String>
  15126. <Description>Picapage search for handheld devices using Nutch</Description>
  15127. <Type>R</Type>
  15128. <Comment></Comment>
  15129. <Link1>http://picapage.biz/</Link1>
  15130. <Link2></Link2>
  15131. </user-agent>
  15132. <user-agent>
  15133. <ID>id_n_s_230408_1</ID>
  15134. <String>Nutch/Nutch-0.9 (Eurobot; http://www.ayell.eu )</String>
  15135. <Description>Ayell Euronet business directory robot using Nutch</Description>
  15136. <Type>R</Type>
  15137. <Comment></Comment>
  15138. <Link1>http://www.ayell.eu/</Link1>
  15139. <Link2></Link2>
  15140. </user-agent>
  15141. <user-agent>
  15142. <ID>id_n_s_120406_1</ID>
  15143. <String>NutchCVS/0.06-dev (Nutch; http://www.nutch.org/docs/en/bot.html; nutch-agent@lists.sourceforge.net)</String>
  15144. <Description>Netsweeper content filtering engine (66.207.120.2xx) powered by Nutch</Description>
  15145. <Type>P</Type>
  15146. <Comment>uses also: Mozilla/5.0 (X11; U; Linux i686; en-US; rv:1.7.5) Gecko/20041107 Firefox/1.0</Comment>
  15147. <Link1>http://www.netsweeper.com/</Link1>
  15148. <Link2></Link2>
  15149. </user-agent>
  15150. <user-agent>
  15151. <ID>id_n_s_1061</ID>
  15152. <String>NutchCVS/0.0x-dev (Nutch; http://www.nutch.org/docs/bot.html; nutch-agent@lists.sourceforge.net)</String>
  15153. <Description>Nutch open source robot</Description>
  15154. <Type>R</Type>
  15155. <Comment></Comment>
  15156. <Link1>http://www.nutch.org/docs/bot.html</Link1>
  15157. <Link2></Link2>
  15158. </user-agent>
  15159. <user-agent>
  15160. <ID>id_n_s_010406_1</ID>
  15161. <String>NutchCVS/0.7.1 (Nutch running at UW; http://www.nutch.org/docs/en/bot.html; sycrawl@cs.washington.edu)</String>
  15162. <Description>Robot from University of Washington Computer Science &amp; Engineering (128.208.6.2xx)</Description>
  15163. <Type>R</Type>
  15164. <Comment>powered by Nutch</Comment>
  15165. <Link1>http://qbert.cs.washington.edu/</Link1>
  15166. <Link2></Link2>
  15167. </user-agent>
  15168. <user-agent>
  15169. <ID>id_n_s_251006_2</ID>
  15170. <String>NutchEC2Test/Nutch-0.9-dev (Testing Nutch on Amazon EC2.; http://lucene.apache.org/nutch/bot.html; ec2test at lucene.com)</String>
  15171. <Description>Amazon Elastic Compute Cloud (Amazon EC2) robot</Description>
  15172. <Type>R</Type>
  15173. <Comment>216.182.236.xx</Comment>
  15174. <Link1>http://www.amazon.com/b/ref=sc_fe_l_2/104-6713356-1433533?ie=UTF8&amp;node=201590011&amp;no=3435361&amp;me=A36L942TSJ2AJA</Link1>
  15175. <Link2></Link2>
  15176. </user-agent>
  15177. <user-agent>
  15178. <ID>id_n_s_1062</ID>
  15179. <String>NutchOrg/0.0x-dev (Nutch; http://www.nutch.org/docs/bot.html; nutch-agent@lists.sourceforge.net)</String>
  15180. <Description>Nutch open source robot</Description>
  15181. <Type>R</Type>
  15182. <Comment></Comment>
  15183. <Link1>http://www.nutch.org/docs/bot.html</Link1>
  15184. <Link2></Link2>
  15185. </user-agent>
  15186. <user-agent>
  15187. <ID>id_n_s_210108_1</ID>
  15188. <String>nutchsearch/Nutch-0.9 (Nutch Search 1.0; herceg_novi at yahoo dot com)</String>
  15189. <Description>Unknown robot using Nutch (maybe private crawling) via Cox network (70.187.130.25x)</Description>
  15190. <Type>R</Type>
  15191. <Comment>reads robots.txt</Comment>
  15192. <Link1>http://lucene.apache.org/nutch/</Link1>
  15193. <Link2></Link2>
  15194. </user-agent>
  15195. <user-agent>
  15196. <ID>id_n_s_041106_1</ID>
  15197. <String>NutchVinegarCrawl/Nutch-0.8.1 (Vinegar; http://www.cs.washington.edu; eytanadar at gmail dot com)</String>
  15198. <Description>Unknown crawler from University of Washington - Computer science</Description>
  15199. <Type>R</Type>
  15200. <Comment>128.208.3.1xx</Comment>
  15201. <Link1>http://www.cs.washington.edu/</Link1>
  15202. <Link2></Link2>
  15203. </user-agent>
  15204. <user-agent>
  15205. <ID>id_n_s_1063</ID>
  15206. <String>obidos-bot (just looking for books.)</String>
  15207. <Description>Weblog bookwatch robot</Description>
  15208. <Type>R</Type>
  15209. <Comment></Comment>
  15210. <Link1>http://www.onfocus.com/bookwatch/</Link1>
  15211. <Link2></Link2>
  15212. </user-agent>
  15213. <user-agent>
  15214. <ID>id_n_s_1064</ID>
  15215. <String>ObjectsSearch/0.01-dev (ObjectsSearch;http://www.ObjectsSearch.com/bot.html; support@thesoftwareobjects.com)</String>
  15216. <Description>Objects Search robot</Description>
  15217. <Type>R</Type>
  15218. <Comment></Comment>
  15219. <Link1>http://www.objectssearch.com/</Link1>
  15220. <Link2></Link2>
  15221. </user-agent>
  15222. <user-agent>
  15223. <ID>id_n_s_1065</ID>
  15224. <String>ObjectsSearch/0.0x (ObjectsSearch; http://www.ObjectsSearch.com/bot.html; support@thesoftwareobjects.com)</String>
  15225. <Description>Objects Search robot</Description>
  15226. <Type>R</Type>
  15227. <Comment></Comment>
  15228. <Link1>http://www.objectssearch.com/</Link1>
  15229. <Link2></Link2>
  15230. </user-agent>
  15231. <user-agent>
  15232. <ID>id_n_s_1066</ID>
  15233. <String>oBot ((compatible;Win32))</String>
  15234. <Description>Cobion Germany Brand Protection Services robot</Description>
  15235. <Type>R</Type>
  15236. <Comment></Comment>
  15237. <Link1>http://www.cobion.com/</Link1>
  15238. <Link2></Link2>
  15239. </user-agent>
  15240. <user-agent>
  15241. <ID>id_n_s_1067</ID>
  15242. <String>Ocelli/1.x (http://www.globalspec.com/Ocelli)</String>
  15243. <Description>GlobalSpec Engineering Search robot (66.194.55.xxx)</Description>
  15244. <Type>R</Type>
  15245. <Comment></Comment>
  15246. <Link1>http://www.globalspec.com/</Link1>
  15247. <Link2></Link2>
  15248. </user-agent>
  15249. <user-agent>
  15250. <ID>id_n_s_1068</ID>
  15251. <String>Octopus</String>
  15252. <Description>Octopus download manager</Description>
  15253. <Type>D</Type>
  15254. <Comment></Comment>
  15255. <Link1>http://moskalyuk.com/octopus/</Link1>
  15256. <Link2></Link2>
  15257. </user-agent>
  15258. <user-agent>
  15259. <ID>id_n_s_230306_1</ID>
  15260. <String>Octora Beta - www.octora.com</String>
  15261. <Description>Octora blog or RSS information crawler - beta (66.228.114.xx)</Description>
  15262. <Type>R</Type>
  15263. <Comment></Comment>
  15264. <Link1>http://www.octora.com/</Link1>
  15265. <Link2></Link2>
  15266. </user-agent>
  15267. <user-agent>
  15268. <ID>id_n_s_230606_4</ID>
  15269. <String>Octora Beta Bot - www.octora.com</String>
  15270. <Description>Octora RSS feed search</Description>
  15271. <Type>R</Type>
  15272. <Comment>66.228.114.xx</Comment>
  15273. <Link1>http://www.octora.com/</Link1>
  15274. <Link2></Link2>
  15275. </user-agent>
  15276. <user-agent>
  15277. <ID>id_n_s_1069</ID>
  15278. <String>Offline Explorer 1.*</String>
  15279. <Description>Meta Products Offlinebrowser</Description>
  15280. <Type>B D</Type>
  15281. <Comment></Comment>
  15282. <Link1>http://www.metaproducts.com/</Link1>
  15283. <Link2></Link2>
  15284. </user-agent>
  15285. <user-agent>
  15286. <ID>id_n_s_1070</ID>
  15287. <String>OliverPerry</String>
  15288. <Description>Claymont robot / Internetseer Web Site Monitoring</Description>
  15289. <Type>R C</Type>
  15290. <Comment></Comment>
  15291. <Link1>http://www.claymont.com/</Link1>
  15292. <Link2></Link2>
  15293. </user-agent>
  15294. <user-agent>
  15295. <ID>id_n_s_1071</ID>
  15296. <String>OmniExplorer_Bot/1.0x (+http://www.omni-explorer.com) Internet CategorizerOmniExplorer http://www.omni-explorer.com/ car &amp; shopping search (64.62.175.xxx)</String>
  15297. <Description>OmniExplorer car &amp; shopping search (64.62.175.xxx)</Description>
  15298. <Type>R</Type>
  15299. <Comment>based on YottaCars... (see there)</Comment>
  15300. <Link1>http://www.omni-explorer.com</Link1>
  15301. <Link2></Link2>
  15302. </user-agent>
  15303. <user-agent>
  15304. <ID>id_n_s_1072</ID>
  15305. <String>OmniExplorer_Bot/1.0x (+http://www.omni-explorer.com) Job Crawler</String>
  15306. <Description>OmniExplorer car &amp; shopping search (64.62.175.xxx)</Description>
  15307. <Type>R</Type>
  15308. <Comment>based on YottaCars... (see there)</Comment>
  15309. <Link1>http://www.omni-explorer.com</Link1>
  15310. <Link2></Link2>
  15311. </user-agent>
  15312. <user-agent>
  15313. <ID>id_n_s_1073</ID>
  15314. <String>OmniExplorer_Bot/1.1x (+http://www.omni-explorer.com) Torrent Crawler</String>
  15315. <Description>OmniExplorer car &amp; shopping search (64.62.175.xxx)</Description>
  15316. <Type>R</Type>
  15317. <Comment>based on YottaCars... (see there)</Comment>
  15318. <Link1>http://www.omni-explorer.com</Link1>
  15319. <Link2></Link2>
  15320. </user-agent>
  15321. <user-agent>
  15322. <ID>id_n_s_1074</ID>
  15323. <String>OmniExplorer_Bot/x.xx (+http://www.omni-explorer.com) WorldIndexer</String>
  15324. <Description>OmniExplorer car &amp; shopping search (64.62.175.xxx)</Description>
  15325. <Type>R</Type>
  15326. <Comment>based on YottaCars... (see there)</Comment>
  15327. <Link1>http://www.omni-explorer.com</Link1>
  15328. <Link2></Link2>
  15329. </user-agent>
  15330. <user-agent>
  15331. <ID>id_n_s_290106_3</ID>
  15332. <String>onCHECK Linkchecker von www.scientec.de fuer www.onsinn.de</String>
  15333. <Description>onsearch.de German web directory link checking </Description>
  15334. <Type>C</Type>
  15335. <Comment>85.176.108.2xx</Comment>
  15336. <Link1>http://www.onsearch.de/</Link1>
  15337. <Link2></Link2>
  15338. </user-agent>
  15339. <user-agent>
  15340. <ID>id_n_s_290106_2</ID>
  15341. <String>onCHECK-Robot&#44; www.onsearch.de</String>
  15342. <Description>onsearch.de German web directory link checking </Description>
  15343. <Type>C</Type>
  15344. <Comment>85.176.108.2xx</Comment>
  15345. <Link1>http://www.onsearch.de/</Link1>
  15346. <Link2></Link2>
  15347. </user-agent>
  15348. <user-agent>
  15349. <ID>id_n_s_1075</ID>
  15350. <String>Onet.pl SA- http://szukaj.onet.pl</String>
  15351. <Description>onet.pl Szukaj (Search) robot (213.180.128.1xx)</Description>
  15352. <Type>R</Type>
  15353. <Comment>s. also - Mozilla/5.0 (compatible; OnetSzukaj/5.0....</Comment>
  15354. <Link1>http://szukaj.onet.pl/</Link1>
  15355. <Link2></Link2>
  15356. </user-agent>
  15357. <user-agent>
  15358. <ID>id_n_s_1076</ID>
  15359. <String>online link validator (http://www.dead-links.com/)</String>
  15360. <Description>Dead-Links.com link validation spider</Description>
  15361. <Type>C</Type>
  15362. <Comment></Comment>
  15363. <Link1>http://www.dead-links.com/</Link1>
  15364. <Link2></Link2>
  15365. </user-agent>
  15366. <user-agent>
  15367. <ID>id_n_s_040206_3</ID>
  15368. <String>Online24-Bot (Version: 1.0x&#44; powered by www.online24.de)</String>
  15369. <Description>Online24 shopping portal (Germany) link checking</Description>
  15370. <Type>C</Type>
  15371. <Comment></Comment>
  15372. <Link1>http://www.online24.de/</Link1>
  15373. <Link2></Link2>
  15374. </user-agent>
  15375. <user-agent>
  15376. <ID>id_n_s_1077</ID>
  15377. <String>OntoSpider/1.0 libwww-perl/5.65</String>
  15378. <Description>OntoSpider - Dutch robot for a research project. (195.11.244.xx)</Description>
  15379. <Type>R</Type>
  15380. <Comment></Comment>
  15381. <Link1>http://ontospider.i-n.info</Link1>
  15382. <Link2></Link2>
  15383. </user-agent>
  15384. <user-agent>
  15385. <ID>id_n_s_030110_6</ID>
  15386. <String>OOZBOT/0.20 ( http://www.setooz.com/oozbot.html ; agentname at setooz dot_com )</String>
  15387. <Description>SeetooZ search crawler</Description>
  15388. <Type>R</Type>
  15389. <Comment>67.215.230.xx</Comment>
  15390. <Link1>http://www.setooz.com/</Link1>
  15391. <Link2></Link2>
  15392. </user-agent>
  15393. <user-agent>
  15394. <ID>id_g_m_280508_4</ID>
  15395. <String>OpenAcoon v4.0.x (www.openacoon.de)</String>
  15396. <Description>OpenAcoon open source search engine (used by Acoon search)</Description>
  15397. <Type>R</Type>
  15398. <Comment>(80.237.209.xx)</Comment>
  15399. <Link1>http://www.openacoon.de/</Link1>
  15400. <Link2>http://www.acoon.de/</Link2>
  15401. </user-agent>
  15402. <user-agent>
  15403. <ID>id_n_s_1078</ID>
  15404. <String>Openbot/3.0+(robot-response@openfind.com.tw;+http://www.openfind.com.tw/robot.html)</String>
  15405. <Description>Openfind.com.tw robot</Description>
  15406. <Type>R</Type>
  15407. <Comment></Comment>
  15408. <Link1>http://www.openfind.com.tw/</Link1>
  15409. <Link2></Link2>
  15410. </user-agent>
  15411. <user-agent>
  15412. <ID>id_n_s_1079</ID>
  15413. <String>Openfind data gatherer- Openbot/3.0+(robot-response@openfind.com.tw;+http://www.openfind.com.tw/robot.html)</String>
  15414. <Description>Openfind.com.tw robot</Description>
  15415. <Type>R</Type>
  15416. <Comment></Comment>
  15417. <Link1>http://www.openfind.com.tw/</Link1>
  15418. <Link2></Link2>
  15419. </user-agent>
  15420. <user-agent>
  15421. <ID>id_n_s_1080</ID>
  15422. <String>Openfind Robot/1.1A2</String>
  15423. <Description>Openfind.com.tw robot</Description>
  15424. <Type>R</Type>
  15425. <Comment></Comment>
  15426. <Link1>http://www.openfind.com.tw/</Link1>
  15427. <Link2></Link2>
  15428. </user-agent>
  15429. <user-agent>
  15430. <ID>id_n_s_250107_2</ID>
  15431. <String>OpenISearch/1.x (www.openisearch.com)</String>
  15432. <Description>open i search robot  - search engine in development</Description>
  15433. <Type>R</Type>
  15434. <Comment>216.182.236.1xx</Comment>
  15435. <Link1>http://www.openisearch.com/</Link1>
  15436. <Link2></Link2>
  15437. </user-agent>
  15438. <user-agent>
  15439. <ID>id_n_s_291105_4</ID>
  15440. <String>OpenTaggerBot (http://www.opentagger.com/opentaggerbot.htm)</String>
  15441. <Description>Opentagger social bookmarking system</Description>
  15442. <Type>R</Type>
  15443. <Comment></Comment>
  15444. <Link1>http://www.opentagger.com/</Link1>
  15445. <Link2></Link2>
  15446. </user-agent>
  15447. <user-agent>
  15448. <ID>id_n_s_1081</ID>
  15449. <String>OpenTextSiteCrawler/2.9.2</String>
  15450. <Description>OpenText crawler</Description>
  15451. <Type>R</Type>
  15452. <Comment></Comment>
  15453. <Link1>http://www.opentext.net/</Link1>
  15454. <Link2></Link2>
  15455. </user-agent>
  15456. <user-agent>
  15457. <ID>id_n_s_310806_1</ID>
  15458. <String>OpenWebSpider/0.x.x (http://www.openwebspider.org)</String>
  15459. <Description>OpenWebSpider - Open Source web search engine</Description>
  15460. <Type>R</Type>
  15461. <Comment></Comment>
  15462. <Link1>http://www.openwebspider.org/</Link1>
  15463. <Link2></Link2>
  15464. </user-agent>
  15465. <user-agent>
  15466. <ID>id_n_s_1082</ID>
  15467. <String>OpenWebSpider/x</String>
  15468. <Description>OpenWebSpider - Open Source web search engine</Description>
  15469. <Type>R</Type>
  15470. <Comment></Comment>
  15471. <Link1>http://www.openwebspider.org/</Link1>
  15472. <Link2></Link2>
  15473. </user-agent>
  15474. <user-agent>
  15475. <ID>id_n_s_1083</ID>
  15476. <String>Opera/5.0 (Linux 2.0.38 i386; U) [en]</String>
  15477. <Description>Opera 5.0 Linux</Description>
  15478. <Type>B</Type>
  15479. <Comment></Comment>
  15480. <Link1></Link1>
  15481. <Link2></Link2>
  15482. </user-agent>
  15483. <user-agent>
  15484. <ID>id_n_s_1084</ID>
  15485. <String>Opera/5.11 (Windows ME; U) [ru]</String>
  15486. <Description>Opera 5.11 faked WinME referer</Description>
  15487. <Type>B</Type>
  15488. <Comment></Comment>
  15489. <Link1></Link1>
  15490. <Link2></Link2>
  15491. </user-agent>
  15492. <user-agent>
  15493. <ID>id_n_s_1085</ID>
  15494. <String>Opera/5.12 (Windows 98; U) [en]</String>
  15495. <Description>Opera 5.12 Win98</Description>
  15496. <Type>B</Type>
  15497. <Comment></Comment>
  15498. <Link1></Link1>
  15499. <Link2></Link2>
  15500. </user-agent>
  15501. <user-agent>
  15502. <ID>id_n_s_1086</ID>
  15503. <String>Opera/6.01 (larbin@unspecified.mail)</String>
  15504. <Description>unknown robot from gw.ocg-corp.com (209.126.176.x)</Description>
  15505. <Type></Type>
  15506. <Comment>see also: - MSIE-5.13 (larbin@.....) - WinampMPEG/2.00 larbin@....</Comment>
  15507. <Link1></Link1>
  15508. <Link2></Link2>
  15509. </user-agent>
  15510. <user-agent>
  15511. <ID>id_n_s_1087</ID>
  15512. <String>Opera/6.x (Linux 2.4.8-26mdk i686; U) [en]</String>
  15513. <Description>Opera 6.x- Mandrake Linux</Description>
  15514. <Type>B</Type>
  15515. <Comment></Comment>
  15516. <Link1></Link1>
  15517. <Link2></Link2>
  15518. </user-agent>
  15519. <user-agent>
  15520. <ID>id_n_s_1088</ID>
  15521. <String>Opera/6.x (Windows NT 4.0; U) [de]</String>
  15522. <Description>Opera 6.x WinNT</Description>
  15523. <Type>B</Type>
  15524. <Comment></Comment>
  15525. <Link1></Link1>
  15526. <Link2></Link2>
  15527. </user-agent>
  15528. <user-agent>
  15529. <ID>id_n_s_1089</ID>
  15530. <String>Opera/7.x (Windows NT 5.1; U) [en]</String>
  15531. <Description>Opera 7.x WinXP</Description>
  15532. <Type>B</Type>
  15533. <Comment></Comment>
  15534. <Link1></Link1>
  15535. <Link2></Link2>
  15536. </user-agent>
  15537. <user-agent>
  15538. <ID>id_n_s_1090</ID>
  15539. <String>Opera/8.xx (Windows NT 5.1; U; en)</String>
  15540. <Description>Opera 8.x (Beta) WinXP</Description>
  15541. <Type>B</Type>
  15542. <Comment></Comment>
  15543. <Link1></Link1>
  15544. <Link2></Link2>
  15545. </user-agent>
  15546. <user-agent>
  15547. <ID>id_n_s_141105_2</ID>
  15548. <String>Opera/9.0 (Windows NT 5.1; U; en)</String>
  15549. <Description>Opera 9 (Beta) Browser</Description>
  15550. <Type>B</Type>
  15551. <Comment></Comment>
  15552. <Link1>http://snapshot.opera.com/</Link1>
  15553. <Link2></Link2>
  15554. </user-agent>
  15555. <user-agent>
  15556. <ID>id_n_s_250606_1</ID>
  15557. <String>Opera/9.00 (Windows NT 5.1; U; de)</String>
  15558. <Description>Opera 9 (final)</Description>
  15559. <Type>B</Type>
  15560. <Comment></Comment>
  15561. <Link1>http://www.opera.com/</Link1>
  15562. <Link2></Link2>
  15563. </user-agent>
  15564. <user-agent>
  15565. <ID>id_n_s_201008_1</ID>
  15566. <String>Opera/9.60 (Windows NT 5.1; U; de) Presto/2.1.1</String>
  15567. <Description>Opera browser 9.6x on WinXP (Presto = Operas rendering engine)</Description>
  15568. <Type>B</Type>
  15569. <Comment></Comment>
  15570. <Link1>http://my.opera.com/ODIN/blog/a-look-under-the-hood-of-opera-9-6</Link1>
  15571. <Link2></Link2>
  15572. </user-agent>
  15573. <user-agent>
  15574. <ID>id_n_s_1091</ID>
  15575. <String>OpidooBOT (larbin2.6.3@unspecified.mail)</String>
  15576. <Description>Opidoo Search Belgium robot (62.4.83.xxx)</Description>
  15577. <Type>R</Type>
  15578. <Comment></Comment>
  15579. <Link1>http://www.opidoo.com/</Link1>
  15580. <Link2></Link2>
  15581. </user-agent>
  15582. <user-agent>
  15583. <ID>id_n_s_080208_1</ID>
  15584. <String>OPWV-SDK UP.Browser/7.0.2.3.119 (GUI) MMP/2.0 Push/PO</String>
  15585. <Description>Open Wave Phone Simulator SDK</Description>
  15586. <Type>B</Type>
  15587. <Comment></Comment>
  15588. <Link1>http://developer.openwave.com/dvl/tools_and_sdk/phone_simulator/</Link1>
  15589. <Link2></Link2>
  15590. </user-agent>
  15591. <user-agent>
  15592. <ID>id_n_s_190406_2</ID>
  15593. <String>Oracle Application Server Web Cache 10g</String>
  15594. <Description>Oracle Application Server cache</Description>
  15595. <Type>P</Type>
  15596. <Comment></Comment>
  15597. <Link1>http://www.oracle.com/appserver/index.html</Link1>
  15598. <Link2></Link2>
  15599. </user-agent>
  15600. <user-agent>
  15601. <ID>id_n_s_1092</ID>
  15602. <String>Oracle iMTCrawler</String>
  15603. <Description>Oracle interMedia Text - Text and web documents indexing</Description>
  15604. <Type>D</Type>
  15605. <Comment></Comment>
  15606. <Link1>http://www.oracle.com/technology//products/text/index.html</Link1>
  15607. <Link2></Link2>
  15608. </user-agent>
  15609. <user-agent>
  15610. <ID>id_n_s_1093</ID>
  15611. <String>Oracle Ultra Search</String>
  15612. <Description>Oracle Search</Description>
  15613. <Type>R</Type>
  15614. <Comment></Comment>
  15615. <Link1>http://www.oracle.com/</Link1>
  15616. <Link2></Link2>
  15617. </user-agent>
  15618. <user-agent>
  15619. <ID>id_n_s_220306_1</ID>
  15620. <String>OrangeSpider</String>
  15621. <Description>Orangeslicer semantic search (Beta) Germany (193.201.52.1xx)</Description>
  15622. <Type>R</Type>
  15623. <Comment></Comment>
  15624. <Link1>http://www.orangeslicer.com/</Link1>
  15625. <Link2></Link2>
  15626. </user-agent>
  15627. <user-agent>
  15628. <ID>id_n_s_1094</ID>
  15629. <String>Orbiter/T-2.0 (+http://www.dailyorbit.com/bot.htm)</String>
  15630. <Description>Orbiter - DailyOrbit search spider</Description>
  15631. <Type>R</Type>
  15632. <Comment></Comment>
  15633. <Link1>http://www.dailyorbit.com/</Link1>
  15634. <Link2></Link2>
  15635. </user-agent>
  15636. <user-agent>
  15637. <ID>id_n_s_150206_1</ID>
  15638. <String>Orca Browser (http://www.orcabrowser.com)</String>
  15639. <Description>Orca browser - based on Gecko</Description>
  15640. <Type>B</Type>
  15641. <Comment></Comment>
  15642. <Link1>http://www.orcabrowser.com</Link1>
  15643. <Link2></Link2>
  15644. </user-agent>
  15645. <user-agent>
  15646. <ID>id_n_s_251205_1</ID>
  15647. <String>OSSProxy 1.3.305.321 (Build 305.321 Win32 en-us)(Dec 21 2005 16:30:54)</String>
  15648. <Description>Marketscore (was Netsetter) internet accelerator</Description>
  15649. <Type>P</Type>
  15650. <Comment>Spyware proxy service</Comment>
  15651. <Link1>http://www.marketscore.com/Home.aspx</Link1>
  15652. <Link2></Link2>
  15653. </user-agent>
  15654. <user-agent>
  15655. <ID>id_n_s_141105_1</ID>
  15656. <String>OutfoxBot/0.x (For internet experiments; http://; outfox.agent@gmail.com)</String>
  15657. <Description>Unknown robot from Chinanet (220.181.8.xxx)</Description>
  15658. <Type></Type>
  15659. <Comment></Comment>
  15660. <Link1></Link1>
  15661. <Link2></Link2>
  15662. </user-agent>
  15663. <user-agent>
  15664. <ID>id_n_s_221106_1</ID>
  15665. <String>OutfoxMelonBot/0.5 (for internet experiments; http://; outfoxbot@gmail.com)</String>
  15666. <Description>Unknown robot from Chinanet (60.191.80.1)</Description>
  15667. <Type></Type>
  15668. <Comment></Comment>
  15669. <Link1></Link1>
  15670. <Link2></Link2>
  15671. </user-agent>
  15672. <user-agent>
  15673. <ID>id_n_s_1095</ID>
  15674. <String>Overture-WebCrawler/3.8/Fresh (atw-crawler at fast dot no; http://fast.no/support/crawler.asp)</String>
  15675. <Description>Overture/Fast/Alltheweb crawler (66.77.73.xxx)</Description>
  15676. <Type>R</Type>
  15677. <Comment></Comment>
  15678. <Link1>http://www.alltheweb.com/</Link1>
  15679. <Link2></Link2>
  15680. </user-agent>
  15681. <user-agent>
  15682. <ID>id_n_s_1096</ID>
  15683. <String>OWR_Crawler 0.1</String>
  15684. <Description>Unknown robot from 198.169.127.xx (innovationplace.com)</Description>
  15685. <Type></Type>
  15686. <Comment></Comment>
  15687. <Link1></Link1>
  15688. <Link2></Link2>
  15689. </user-agent>
  15690. <user-agent>
  15691. <ID>id_n_s_090906_1</ID>
  15692. <String>ozelot/2.7.3 (Search engine indexer; www.flying-cat.de/ozelot; ozelot@flying-cat.de)</String>
  15693. <Description>Ozelot - Flying Cat's search engine robot (Germany)</Description>
  15694. <Type>R</Type>
  15695. <Comment>87.139.106.xx</Comment>
  15696. <Link1>http://www.flying-cat.de/ozelot/</Link1>
  15697. <Link2></Link2>
  15698. </user-agent>
  15699. <user-agent>
  15700. <ID>id_n_s_290108_2</ID>
  15701. <String>PADLibrary Spider</String>
  15702. <Description>PADLibrary.com - PAD file software robot for FindFiles.com</Description>
  15703. <Type>R</Type>
  15704. <Comment>72.167.37.20x</Comment>
  15705. <Link1>http://padlibrary.com/</Link1>
  15706. <Link2>http://www.findfiles.com/</Link2>
  15707. </user-agent>
  15708. <user-agent>
  15709. <ID>id_n_s_150207_3</ID>
  15710. <String>PageBitesHyperBot/600 (http://www.pagebites.com/)</String>
  15711. <Description>Pagebites job search crawler</Description>
  15712. <Type>R</Type>
  15713. <Comment>208.185.247.xx</Comment>
  15714. <Link1>http://www.pagebites.com/</Link1>
  15715. <Link2></Link2>
  15716. </user-agent>
  15717. <user-agent>
  15718. <ID>id_n_s_111206_1</ID>
  15719. <String>Pagebull http://www.pagebull.com/</String>
  15720. <Description>Pagebull visual search engine</Description>
  15721. <Type>R</Type>
  15722. <Comment>209.9.228.1xx</Comment>
  15723. <Link1>http://www.pagebull.com/</Link1>
  15724. <Link2></Link2>
  15725. </user-agent>
  15726. <user-agent>
  15727. <ID>id_n_s_051207_3</ID>
  15728. <String>Pagestacker Bot</String>
  15729. <Description>Pagestacker online bookmark service</Description>
  15730. <Type>C</Type>
  15731. <Comment>70.85.129.12x</Comment>
  15732. <Link1>http://www.pagestacker.com/</Link1>
  15733. <Link2></Link2>
  15734. </user-agent>
  15735. <user-agent>
  15736. <ID>id_n_s_290506_1</ID>
  15737. <String>page_verifier (http://www.securecomputing.com/goto/pv)</String>
  15738. <Description>Secure Computing SmartFilter Tools - malware crawler</Description>
  15739. <Type>R</Type>
  15740. <Comment>206.169.110.xx</Comment>
  15741. <Link1>http://www.securecomputing.com/PageVerifier.cfm</Link1>
  15742. <Link2></Link2>
  15743. </user-agent>
  15744. <user-agent>
  15745. <ID>id_n_s_1097</ID>
  15746. <String>PagmIEDownload</String>
  15747. <Description>Downloadmanager ?</Description>
  15748. <Type>D</Type>
  15749. <Comment></Comment>
  15750. <Link1></Link1>
  15751. <Link2></Link2>
  15752. </user-agent>
  15753. <user-agent>
  15754. <ID>id_n_s_1098</ID>
  15755. <String>parallelContextFocusCrawler1.1parallelContextFocusCrawler1.1</String>
  15756. <Description>CFC crawler used by Italian academic and research network (GARR)</Description>
  15757. <Type>R</Type>
  15758. <Comment></Comment>
  15759. <Link1>http://www.garr.it/</Link1>
  15760. <Link2></Link2>
  15761. </user-agent>
  15762. <user-agent>
  15763. <ID>id_n_s_1099</ID>
  15764. <String>ParaSite/1.0b (http://www.ianett.com/parasite/)</String>
  15765. <Description>http://www.ianett.com robot</Description>
  15766. <Type>R</Type>
  15767. <Comment></Comment>
  15768. <Link1>http://www.ianett.com/</Link1>
  15769. <Link2></Link2>
  15770. </user-agent>
  15771. <user-agent>
  15772. <ID>id_n_s_1100</ID>
  15773. <String>Patwebbot (http://www.herz-power.de/technik.html)</String>
  15774. <Description>Patsearch (Germany) robot</Description>
  15775. <Type>R</Type>
  15776. <Comment></Comment>
  15777. <Link1>http://www.herz-power.de/</Link1>
  15778. <Link2></Link2>
  15779. </user-agent>
  15780. <user-agent>
  15781. <ID>id_n_s_1101</ID>
  15782. <String>pavuk/0.9pl29b i686-pc-linux-gnu</String>
  15783. <Description>Pavuk web downloading program for Unix</Description>
  15784. <Type>D</Type>
  15785. <Comment></Comment>
  15786. <Link1>http://www.idata.sk/%7Eondrej/pavuk/about.html</Link1>
  15787. <Link2></Link2>
  15788. </user-agent>
  15789. <user-agent>
  15790. <ID>id_n_s_1102</ID>
  15791. <String>PBrowse 1.4b</String>
  15792. <Description>Some site scanning tool via diff. IPs- i.e.: - cox.net (68.4.xxx.xxx)</Description>
  15793. <Type>S</Type>
  15794. <Comment>- UA sometimes DSurf15a</Comment>
  15795. <Link1></Link1>
  15796. <Link2></Link2>
  15797. </user-agent>
  15798. <user-agent>
  15799. <ID>id_n_s_1103</ID>
  15800. <String>pd02_1.0.0 pd02_1.0.0@dzimi@post.sk</String>
  15801. <Description>Post.sk / Eurotel.sk robot</Description>
  15802. <Type>R</Type>
  15803. <Comment></Comment>
  15804. <Link1></Link1>
  15805. <Link2></Link2>
  15806. </user-agent>
  15807. <user-agent>
  15808. <ID>id_n_s_1104</ID>
  15809. <String>PEAR HTTP_Request class ( http://pear.php.net/ )</String>
  15810. <Description>Pear HTTP_Request PHP extension package</Description>
  15811. <Type></Type>
  15812. <Comment></Comment>
  15813. <Link1>http://pear.php.net/</Link1>
  15814. <Link2></Link2>
  15815. </user-agent>
  15816. <user-agent>
  15817. <ID>id_n_s_1105</ID>
  15818. <String>PEERbot www.peerbot.com</String>
  15819. <Description>Peerbot - favicon search robot</Description>
  15820. <Type>R</Type>
  15821. <Comment></Comment>
  15822. <Link1>http://www.peerbot.com/</Link1>
  15823. <Link2></Link2>
  15824. </user-agent>
  15825. <user-agent>
  15826. <ID>id_n_s_1106</ID>
  15827. <String>PeopleChat/Search_Engine</String>
  15828. <Description>Unknown robot from 64.5.48.xxx (Plethoric.net)</Description>
  15829. <Type></Type>
  15830. <Comment></Comment>
  15831. <Link1></Link1>
  15832. <Link2></Link2>
  15833. </user-agent>
  15834. <user-agent>
  15835. <ID>id_n_s_1107</ID>
  15836. <String>PEval 1.4b</String>
  15837. <Description>Some site scanning tool via diff. IPs</Description>
  15838. <Type>S</Type>
  15839. <Comment>s. DBrowse- PSurf etc.</Comment>
  15840. <Link1></Link1>
  15841. <Link2></Link2>
  15842. </user-agent>
  15843. <user-agent>
  15844. <ID>id_n_s_1108</ID>
  15845. <String>PHP/3.x.xx</String>
  15846. <Description>diff. IPs / services</Description>
  15847. <Type></Type>
  15848. <Comment></Comment>
  15849. <Link1></Link1>
  15850. <Link2></Link2>
  15851. </user-agent>
  15852. <user-agent>
  15853. <ID>id_n_s_1109</ID>
  15854. <String>PHP/4.0.4pl1</String>
  15855. <Description>diff. IPs / services</Description>
  15856. <Type></Type>
  15857. <Comment></Comment>
  15858. <Link1></Link1>
  15859. <Link2></Link2>
  15860. </user-agent>
  15861. <user-agent>
  15862. <ID>id_n_s_1110</ID>
  15863. <String>PHP/4.0.6</String>
  15864. <Description>diff. IPs / services- i.e.: -NTT/Verio Inc. link checker</Description>
  15865. <Type>C</Type>
  15866. <Comment>in conjunction w. Weblink's Checker UA</Comment>
  15867. <Link1>http://www.verio.com/</Link1>
  15868. <Link2></Link2>
  15869. </user-agent>
  15870. <user-agent>
  15871. <ID>id_n_s_1111</ID>
  15872. <String>PHP/4.1.1</String>
  15873. <Description>diff. IPs / services- i.e.: - Phenominet.com link checking</Description>
  15874. <Type>C</Type>
  15875. <Comment></Comment>
  15876. <Link1>http://www.phenominet.com</Link1>
  15877. <Link2></Link2>
  15878. </user-agent>
  15879. <user-agent>
  15880. <ID>id_n_s_1112</ID>
  15881. <String>PHP/4.1.2</String>
  15882. <Description>diff. IPs / services- i.e.: - 209.114.200.xx = MyNetCrawler link checking - 216.139.207.xxx = Mixcat crawler</Description>
  15883. <Type></Type>
  15884. <Comment>Mixcat s. also Felix and Morris</Comment>
  15885. <Link1>http://mynetcrawler.com/</Link1>
  15886. <Link2>http://mixcat.com</Link2>
  15887. </user-agent>
  15888. <user-agent>
  15889. <ID>id_n_s_1113</ID>
  15890. <String>PicoSearch/1.0</String>
  15891. <Description>Pico Search robot</Description>
  15892. <Type>R</Type>
  15893. <Comment></Comment>
  15894. <Link1>http://www.picosearch.com/</Link1>
  15895. <Link2></Link2>
  15896. </user-agent>
  15897. <user-agent>
  15898. <ID>id_n_s_010506_3</ID>
  15899. <String>Piffany_Web_Scraper_v0.x</String>
  15900. <Description>Piffany targeted search web spider</Description>
  15901. <Type>R</Type>
  15902. <Comment></Comment>
  15903. <Link1>http://www.piffany.com/</Link1>
  15904. <Link2>http://www.piffany.com/spider.html</Link2>
  15905. </user-agent>
  15906. <user-agent>
  15907. <ID>id_n_s_010506_2</ID>
  15908. <String>Piffany_Web_Spider_v0.x</String>
  15909. <Description>Piffany targeted search web spider</Description>
  15910. <Type>R</Type>
  15911. <Comment></Comment>
  15912. <Link1>http://www.piffany.com/</Link1>
  15913. <Link2>http://www.piffany.com/spider.html</Link2>
  15914. </user-agent>
  15915. <user-agent>
  15916. <ID>id_n_s_1114</ID>
  15917. <String>PigeonBot1.0 BETA</String>
  15918. <Description>Whois Source domain name information robot (66.249.26.xx)- s.also: - SurveyBot</Description>
  15919. <Type>R C</Type>
  15920. <Comment></Comment>
  15921. <Link1>http://www.whois.sc/</Link1>
  15922. <Link2></Link2>
  15923. </user-agent>
  15924. <user-agent>
  15925. <ID>id_n_s_1115</ID>
  15926. <String>PingALink Monitoring Services 1.0</String>
  15927. <Description>PingALink website monitoring</Description>
  15928. <Type>R C</Type>
  15929. <Comment></Comment>
  15930. <Link1>http://www.pingalink.com/</Link1>
  15931. <Link2></Link2>
  15932. </user-agent>
  15933. <user-agent>
  15934. <ID>id_n_s_1116</ID>
  15935. <String>PingALink Monitoring Services 1.0 (http://www.pingalink.com)</String>
  15936. <Description>PingALink website monitoring</Description>
  15937. <Type>R C</Type>
  15938. <Comment></Comment>
  15939. <Link1>http://www.pingalink.com/</Link1>
  15940. <Link2></Link2>
  15941. </user-agent>
  15942. <user-agent>
  15943. <ID>id_n_s_120607_1</ID>
  15944. <String>Pingdom GIGRIB (http://www.pingdom.com)</String>
  15945. <Description>Pingdom web site monitoring</Description>
  15946. <Type>C</Type>
  15947. <Comment>66.98.148.xx</Comment>
  15948. <Link1>http://www.pingdom.com/</Link1>
  15949. <Link2></Link2>
  15950. </user-agent>
  15951. <user-agent>
  15952. <ID>id_n_s_1117</ID>
  15953. <String>pipeLiner/0.3a (PipeLine Spider;http://www.pipeline-search.com/webmaster.html; webmaster'at'pipeline-search.com)</String>
  15954. <Description>pipeline search (DMOZ based) search robot (24.106.39. xxx)</Description>
  15955. <Type>R</Type>
  15956. <Comment></Comment>
  15957. <Link1>http://www.pipeline-search.com/</Link1>
  15958. <Link2></Link2>
  15959. </user-agent>
  15960. <user-agent>
  15961. <ID>id_n_s_1118</ID>
  15962. <String>pipeLiner/0.xx (PipeLine Spider; http://www.pipeline-search.com/webmaster.html)</String>
  15963. <Description>pipeline search (DMOZ based) search robot (24.106.39. xxx)</Description>
  15964. <Type>R</Type>
  15965. <Comment></Comment>
  15966. <Link1>http://www.pipeline-search.com/</Link1>
  15967. <Link2></Link2>
  15968. </user-agent>
  15969. <user-agent>
  15970. <ID>id_n_s_1119</ID>
  15971. <String>Pita</String>
  15972. <Description>Pita crawler</Description>
  15973. <Type>R</Type>
  15974. <Comment>now WebVac s. there</Comment>
  15975. <Link1>http://www-diglib.stanford.edu/~testbed/doc2/WebBase/webbase-pages.html</Link1>
  15976. <Link2></Link2>
  15977. </user-agent>
  15978. <user-agent>
  15979. <ID>id_n_s_1120</ID>
  15980. <String>Pizilla++ ver 2.45</String>
  15981. <Description>Private user-agent via Hurricane Electric Internet Services</Description>
  15982. <Type>B ?</Type>
  15983. <Comment></Comment>
  15984. <Link1>http://www.he.net/</Link1>
  15985. <Link2></Link2>
  15986. </user-agent>
  15987. <user-agent>
  15988. <ID>id_n_s_1121</ID>
  15989. <String>PJspider/3.0 (pjspider@portaljuice.com; http://www.portaljuice.com)</String>
  15990. <Description>Portaljuice spider</Description>
  15991. <Type>R</Type>
  15992. <Comment></Comment>
  15993. <Link1>http://www.portaljuice.com/</Link1>
  15994. <Link2></Link2>
  15995. </user-agent>
  15996. <user-agent>
  15997. <ID>id_n_s_121106_1</ID>
  15998. <String>Plagger/0.x.xx (http://plagger.org/)</String>
  15999. <Description>Plagger - pluggable RSS/Atom feed aggregator written in Perl</Description>
  16000. <Type>B</Type>
  16001. <Comment></Comment>
  16002. <Link1>http://plagger.org/trac</Link1>
  16003. <Link2></Link2>
  16004. </user-agent>
  16005. <user-agent>
  16006. <ID>id_n_s_1122</ID>
  16007. <String>PlagiarBot/1.0</String>
  16008. <Description>unknown ucsd.edu robot</Description>
  16009. <Type>R</Type>
  16010. <Comment></Comment>
  16011. <Link1></Link1>
  16012. <Link2></Link2>
  16013. </user-agent>
  16014. <user-agent>
  16015. <ID>id_n_s_1123</ID>
  16016. <String>PlantyNet_WebRobot_V1.9 dhkang@plantynet.com</String>
  16017. <Description>Plantynet web filtering services - Blacklist DB robot</Description>
  16018. <Type>R P</Type>
  16019. <Comment></Comment>
  16020. <Link1>http://www.plantynet.com/</Link1>
  16021. <Link2></Link2>
  16022. </user-agent>
  16023. <user-agent>
  16024. <ID>id_n_s_120106_1</ID>
  16025. <String>plinki/0.1 (you got plinked! (thats a good thing..); http://www.plinki.com; crawl@plinki.com)</String>
  16026. <Description>Unknown UA from 66.220.23.2xx</Description>
  16027. <Type></Type>
  16028. <Comment>Doesn't read robots.txt - Plinki.com's website has no content</Comment>
  16029. <Link1>http://www.plinki.com/</Link1>
  16030. <Link2></Link2>
  16031. </user-agent>
  16032. <user-agent>
  16033. <ID>id_n_s_061206_2</ID>
  16034. <String>PluckFeedCrawler/2.0 (compatible; Mozilla 4.0; MSIE 5.5; http://www.pluck.com; 1 subscribers)</String>
  16035. <Description>Pluck RSS feed crawler</Description>
  16036. <Type>R</Type>
  16037. <Comment>66.179.81.1xx</Comment>
  16038. <Link1>http://www.pluck.com/</Link1>
  16039. <Link2></Link2>
  16040. </user-agent>
  16041. <user-agent>
  16042. <ID>id_n_s_140807_1</ID>
  16043. <String>Pluggd/Nutch-0.9 (automated crawler http://www.pluggd.com;support at pluggd dot com)</String>
  16044. <Description>Pluggd Podcast search engine</Description>
  16045. <Type>R</Type>
  16046. <Comment>209.85.62.1xx</Comment>
  16047. <Link1>http://www.pluggd.com/</Link1>
  16048. <Link2></Link2>
  16049. </user-agent>
  16050. <user-agent>
  16051. <ID>id_n_s_1124</ID>
  16052. <String>Pockey-GetHTML/4.12.0 (Win32; GUI; ix86)</String>
  16053. <Description>Yutaka Endo's Pockey / GetHTML / GetHTMLW - some downloading tool from Japan</Description>
  16054. <Type>D</Type>
  16055. <Comment></Comment>
  16056. <Link1>http://www.vector.co.jp/soft/win95/net/se077067.html</Link1>
  16057. <Link2></Link2>
  16058. </user-agent>
  16059. <user-agent>
  16060. <ID>id_n_s_1125</ID>
  16061. <String>Pockey-GetHTML/x.xx</String>
  16062. <Description>Yutaka Endo's Pockey / GetHTML / GetHTMLW - some downloading tool from Japan</Description>
  16063. <Type>D</Type>
  16064. <Comment></Comment>
  16065. <Link1>http://www.vector.co.jp/soft/win95/net/se077067.html</Link1>
  16066. <Link2></Link2>
  16067. </user-agent>
  16068. <user-agent>
  16069. <ID>id_n_s_1126</ID>
  16070. <String>Pockey/x.x.x</String>
  16071. <Description>Yutaka Endo's Pockey / GetHTML / GetHTMLW - some downloading tool from Japan</Description>
  16072. <Type>D</Type>
  16073. <Comment></Comment>
  16074. <Link1>http://www.vector.co.jp/soft/win95/net/se077067.html</Link1>
  16075. <Link2></Link2>
  16076. </user-agent>
  16077. <user-agent>
  16078. <ID>id_n_s_1127</ID>
  16079. <String>Pockey7.x.x(WIN32GUI)</String>
  16080. <Description>Yutaka Endo's Pockey / GetHTML / GetHTMLW - some downloading tool from Japan</Description>
  16081. <Type>D</Type>
  16082. <Comment></Comment>
  16083. <Link1>http://www.vector.co.jp/soft/win95/net/se077067.html</Link1>
  16084. <Link2></Link2>
  16085. </user-agent>
  16086. <user-agent>
  16087. <ID>id_n_s_1128</ID>
  16088. <String>POE-Component-Client-HTTP/0.64 (perl; N; POE; en; rv:0.640000)</String>
  16089. <Description>HTTP user-agent for POE (portable networking framework for Perl )</Description>
  16090. <Type></Type>
  16091. <Comment></Comment>
  16092. <Link1>http://search.cpan.org/dist/POE-Component-Client-HTTP/HTTP.pm</Link1>
  16093. <Link2></Link2>
  16094. </user-agent>
  16095. <user-agent>
  16096. <ID>id_n_s_291105_2</ID>
  16097. <String>Poirot</String>
  16098. <Description>ThePlanet/jaja-jak-globusy.com Google Adsense refferer spam bot from 70.85.116.* / 70.84.128.xxx / 70.85.193.xxx</Description>
  16099. <Type>S</Type>
  16100. <Comment>appears also as LWP::Simple/5.803 - Mozilla/4.76 [en] (Win98; U) - Mozilla/4.0 (compatible; MSIE 6.0; Windows NT 5.1)</Comment>
  16101. <Link1>http://spamhuntress.com/wiki/Manila_Industries</Link1>
  16102. <Link2></Link2>
  16103. </user-agent>
  16104. <user-agent>
  16105. <ID>id_n_s_1129</ID>
  16106. <String>polybot 1.0 (http://cis.poly.edu/polybot/)</String>
  16107. <Description>Polybot webcrawler</Description>
  16108. <Type>R</Type>
  16109. <Comment></Comment>
  16110. <Link1>http://cis.poly.edu/polybot/</Link1>
  16111. <Link2></Link2>
  16112. </user-agent>
  16113. <user-agent>
  16114. <ID>id_n_s_1130</ID>
  16115. <String>Pompos/1.x http://dir.com/pompos.html</String>
  16116. <Description>Dir.com / Iliad French recherche robot</Description>
  16117. <Type>R</Type>
  16118. <Comment></Comment>
  16119. <Link1>http://www.iliad.fr/</Link1>
  16120. <Link2></Link2>
  16121. </user-agent>
  16122. <user-agent>
  16123. <ID>id_n_s_1131</ID>
  16124. <String>Pompos/1.x pompos@iliad.fr</String>
  16125. <Description>Iliad / Free French recherche robot</Description>
  16126. <Type>R</Type>
  16127. <Comment></Comment>
  16128. <Link1>http://www.iliad.fr/</Link1>
  16129. <Link2></Link2>
  16130. </user-agent>
  16131. <user-agent>
  16132. <ID>id_n_s_1132</ID>
  16133. <String>Popdexter/1.0</String>
  16134. <Description>Popdex - web site popularity crawler</Description>
  16135. <Type>R</Type>
  16136. <Comment></Comment>
  16137. <Link1>http://www.popdex.com/</Link1>
  16138. <Link2></Link2>
  16139. </user-agent>
  16140. <user-agent>
  16141. <ID>id_n_s_1133</ID>
  16142. <String>Port Huron Labs</String>
  16143. <Description>Unknown spam bot / harvester (63.223.10.***)</Description>
  16144. <Type>S</Type>
  16145. <Comment>s. also - Wells Search II</Comment>
  16146. <Link1></Link1>
  16147. <Link2></Link2>
  16148. </user-agent>
  16149. <user-agent>
  16150. <ID>id_n_s_1134</ID>
  16151. <String>PortalBSpider/2.0 (spider@portalb.com)</String>
  16152. <Description>PortalB (now Alacra search) spider</Description>
  16153. <Type>R</Type>
  16154. <Comment></Comment>
  16155. <Link1>http://www.portalb.com/alacra/index.htm</Link1>
  16156. <Link2></Link2>
  16157. </user-agent>
  16158. <user-agent>
  16159. <ID>id_n_s_080706_2</ID>
  16160. <String>portalmmm/2.0 S500i(c20;TB)</String>
  16161. <Description>portalmmm IMode mobile browser</Description>
  16162. <Type>B</Type>
  16163. <Comment></Comment>
  16164. <Link1></Link1>
  16165. <Link2></Link2>
  16166. </user-agent>
  16167. <user-agent>
  16168. <ID>id_n_s_1135</ID>
  16169. <String>PostFavorites</String>
  16170. <Description>Yahoo (66.94.237.1xx / 216.109.121.xx) favorites tracking robot</Description>
  16171. <Type>C</Type>
  16172. <Comment></Comment>
  16173. <Link1></Link1>
  16174. <Link2></Link2>
  16175. </user-agent>
  16176. <user-agent>
  16177. <ID>id_n_s_1136</ID>
  16178. <String>potbot 1.0</String>
  16179. <Description>Potbot : A simple IRC bot written in Perl</Description>
  16180. <Type>R</Type>
  16181. <Comment></Comment>
  16182. <Link1>http://sourceforge.net/projects/potbot/</Link1>
  16183. <Link2></Link2>
  16184. </user-agent>
  16185. <user-agent>
  16186. <ID>id_n_s_050408_2</ID>
  16187. <String>PRCrawler/Nutch-0.9 (data mining development project; crawler@projectrialto.com)</String>
  16188. <Description>Project Rialto - data mining development project</Description>
  16189. <Type>R</Type>
  16190. <Comment></Comment>
  16191. <Link1>http://projectrialto.com/index.html</Link1>
  16192. <Link2></Link2>
  16193. </user-agent>
  16194. <user-agent>
  16195. <ID>id_n_s_1137</ID>
  16196. <String>PrivacyFinder Cache Bot v1.0</String>
  16197. <Description>CUPS robot for AT&amp;T Privacy Bird Privacy Preferences (P3P) enhancements</Description>
  16198. <Type>R</Type>
  16199. <Comment></Comment>
  16200. <Link1>http://cups.cs.cmu.edu/</Link1>
  16201. <Link2>http://privacybird.com/</Link2>
  16202. </user-agent>
  16203. <user-agent>
  16204. <ID>id_n_s_111205_2</ID>
  16205. <String>PrivacyFinder/1.1</String>
  16206. <Description>CUPS robot for AT&amp;T Privacy Bird Privacy Preferences (P3P) enhancements</Description>
  16207. <Type>R</Type>
  16208. <Comment></Comment>
  16209. <Link1>http://cups.cs.cmu.edu/</Link1>
  16210. <Link2>http://privacybird.com/</Link2>
  16211. </user-agent>
  16212. <user-agent>
  16213. <ID>id_n_s_1138</ID>
  16214. <String>Privoxy/3.0 (Anonymous)</String>
  16215. <Description>Privoxy web proxy</Description>
  16216. <Type>P</Type>
  16217. <Comment>s.also (Privoxy/1.0)</Comment>
  16218. <Link1>http://www.privoxy.org/</Link1>
  16219. <Link2></Link2>
  16220. </user-agent>
  16221. <user-agent>
  16222. <ID>id_n_s_1139</ID>
  16223. <String>Production Bot 0116B</String>
  16224. <Description>Some site scanning tool from diff. IPs- i.e.: - 67.99.33.x (lightningcon.broadwing.net)</Description>
  16225. <Type>S</Type>
  16226. <Comment></Comment>
  16227. <Link1></Link1>
  16228. <Link2></Link2>
  16229. </user-agent>
  16230. <user-agent>
  16231. <ID>id_n_s_1140</ID>
  16232. <String>Production Bot 2016B</String>
  16233. <Description>Some site scanning tool from diff. IPs- i.e.: - 216.232.64.xx (telus.net)</Description>
  16234. <Type>S</Type>
  16235. <Comment></Comment>
  16236. <Link1></Link1>
  16237. <Link2></Link2>
  16238. </user-agent>
  16239. <user-agent>
  16240. <ID>id_n_s_1141</ID>
  16241. <String>Production Bot DOT 3016B</String>
  16242. <Description>Some site scanning tool from diff. IPs- i.e.: - 141.154.181.xxx (east.verizon.net)</Description>
  16243. <Type>S</Type>
  16244. <Comment></Comment>
  16245. <Link1></Link1>
  16246. <Link2></Link2>
  16247. </user-agent>
  16248. <user-agent>
  16249. <ID>id_n_s_1142</ID>
  16250. <String>Program Shareware 1.0.2</String>
  16251. <Description>Some spam bot</Description>
  16252. <Type>S</Type>
  16253. <Comment>- see here: http://www.kloth.net/internet/badbots-2004.php</Comment>
  16254. <Link1>http://www.kloth.net/internet/badbots-2004.php</Link1>
  16255. <Link2></Link2>
  16256. </user-agent>
  16257. <user-agent>
  16258. <ID>id_n_s_1143</ID>
  16259. <String>Progressive Download</String>
  16260. <Description>unknown</Description>
  16261. <Type></Type>
  16262. <Comment></Comment>
  16263. <Link1></Link1>
  16264. <Link2></Link2>
  16265. </user-agent>
  16266. <user-agent>
  16267. <ID>id_n_s_1144</ID>
  16268. <String>Progressive Download HTTP check</String>
  16269. <Description>unknown</Description>
  16270. <Type></Type>
  16271. <Comment></Comment>
  16272. <Link1></Link1>
  16273. <Link2></Link2>
  16274. </user-agent>
  16275. <user-agent>
  16276. <ID>id_n_s_1145</ID>
  16277. <String>Project XP5 [2.03.07-111203]</String>
  16278. <Description>XP5 robot</Description>
  16279. <Type>R</Type>
  16280. <Comment></Comment>
  16281. <Link1>http://marty.anstey.ca/projects/robots/index.html</Link1>
  16282. <Link2></Link2>
  16283. </user-agent>
  16284. <user-agent>
  16285. <ID>id_n_s_1146</ID>
  16286. <String>PROve AnswerBot 4.0</String>
  16287. <Description>Answerchase PROve Answerbot</Description>
  16288. <Type>R</Type>
  16289. <Comment></Comment>
  16290. <Link1>http://www.answerchase.com/</Link1>
  16291. <Link2></Link2>
  16292. </user-agent>
  16293. <user-agent>
  16294. <ID>id_n_s_1147</ID>
  16295. <String>ProWebGuide Link Checker (http://www.prowebguide.com)</String>
  16296. <Description>ProWebguide robot</Description>
  16297. <Type>R</Type>
  16298. <Comment></Comment>
  16299. <Link1>http://www.prowebguide.com/</Link1>
  16300. <Link2></Link2>
  16301. </user-agent>
  16302. <user-agent>
  16303. <ID>id_n_s_1148</ID>
  16304. <String>psbot/0.1 (+http://www.picsearch.com/bot.html)</String>
  16305. <Description>Picsearch robot (62.119.21.13x)</Description>
  16306. <Type>R</Type>
  16307. <Comment></Comment>
  16308. <Link1>http://www.picsearch.com/</Link1>
  16309. <Link2></Link2>
  16310. </user-agent>
  16311. <user-agent>
  16312. <ID>id_n_s_1149</ID>
  16313. <String>PSurf15a 11</String>
  16314. <Description>Some site scanning tool via diff. IPs- i.e.: QWest Net</Description>
  16315. <Type>S</Type>
  16316. <Comment></Comment>
  16317. <Link1></Link1>
  16318. <Link2></Link2>
  16319. </user-agent>
  16320. <user-agent>
  16321. <ID>id_n_s_1150</ID>
  16322. <String>PSurf15a 51</String>
  16323. <Description>Some site scanning tool via diff. IPs- i.e.: Optonline net (24.191.xxx.xxx)</Description>
  16324. <Type>S</Type>
  16325. <Comment></Comment>
  16326. <Link1></Link1>
  16327. <Link2></Link2>
  16328. </user-agent>
  16329. <user-agent>
  16330. <ID>id_n_s_1151</ID>
  16331. <String>PSurf15a VA</String>
  16332. <Description>Some site scanning tool via diff. IPs- i.e.: - choiceone.net (216.153.xxx.xxx) - attbi.com (12.250.xxx.xxx) - optonline.net (24.191.xxx.xxx)</Description>
  16333. <Type>S</Type>
  16334. <Comment>UA sometimes SSurf15a 11 or random letters like RXMYRCJ</Comment>
  16335. <Link1></Link1>
  16336. <Link2></Link2>
  16337. </user-agent>
  16338. <user-agent>
  16339. <ID>id_n_s_160606_1</ID>
  16340. <String>psycheclone</String>
  16341. <Description>Unknown website grabbing / ripping for unknown purposes from 208.66.195.x - Digitalinfinity.org Russia</Description>
  16342. <Type>S</Type>
  16343. <Comment>no active website</Comment>
  16344. <Link1></Link1>
  16345. <Link2></Link2>
  16346. </user-agent>
  16347. <user-agent>
  16348. <ID>id_n_s_1152</ID>
  16349. <String>PubCrawl (pubcrawl.stanford.edu)</String>
  16350. <Description>Some robot from Stanford University (171.64.75.xxx = PubCrawl.Stanford.EDU)</Description>
  16351. <Type>R</Type>
  16352. <Comment></Comment>
  16353. <Link1></Link1>
  16354. <Link2></Link2>
  16355. </user-agent>
  16356. <user-agent>
  16357. <ID>id_n_s_1153</ID>
  16358. <String>puf/0.91beta6a (Linux 2.2.18; i686)</String>
  16359. <Description>Parallel URL Fetcher downloading tool</Description>
  16360. <Type>D</Type>
  16361. <Comment></Comment>
  16362. <Link1>http://puf.sourceforge.net/</Link1>
  16363. <Link2></Link2>
  16364. </user-agent>
  16365. <user-agent>
  16366. <ID>id_n_s_1154</ID>
  16367. <String>puf/0.93.2a (Linux 2.4.18; i686)</String>
  16368. <Description>Parallel URL Fetcher downloading tool</Description>
  16369. <Type>D</Type>
  16370. <Comment></Comment>
  16371. <Link1>http://puf.sourceforge.net/</Link1>
  16372. <Link2></Link2>
  16373. </user-agent>
  16374. <user-agent>
  16375. <ID>id_n_s_130407_1</ID>
  16376. <String>pulseBot (pulse Web Miner)</String>
  16377. <Description>WebarooBot - Webaroo web site search / theme based downloading tool (64.124.122.2xx)</Description>
  16378. <Type>R</Type>
  16379. <Comment>s. also RufusBot</Comment>
  16380. <Link1>http://www.webaroo.com/index</Link1>
  16381. <Link2>http://www.webaroo.com/company/site-owners</Link2>
  16382. </user-agent>
  16383. <user-agent>
  16384. <ID>id_n_s_1155</ID>
  16385. <String>PureSight</String>
  16386. <Description>PureSight Internet content filter</Description>
  16387. <Type>P</Type>
  16388. <Comment></Comment>
  16389. <Link1>http://www.puresight.com/Products/PureSightHomeDescription.shtml</Link1>
  16390. <Link2></Link2>
  16391. </user-agent>
  16392. <user-agent>
  16393. <ID>id_n_s_1156</ID>
  16394. <String>PuxaRapido v1.0</String>
  16395. <Description>Puxa Rapido download manager</Description>
  16396. <Type>D</Type>
  16397. <Comment></Comment>
  16398. <Link1>http://www.puxarapido.com.br/</Link1>
  16399. <Link2></Link2>
  16400. </user-agent>
  16401. <user-agent>
  16402. <ID>id_n_s_230907_2</ID>
  16403. <String>PWeBot/1.2 Inspector (http://www.programacionweb.net/robot.php)</String>
  16404. <Description>ProgramacionWeb.net PWeBot link checking (Argentina)</Description>
  16405. <Type>R</Type>
  16406. <Comment>62.149.236.2xx</Comment>
  16407. <Link1>http://www.programacionweb.net/robot-en.php</Link1>
  16408. <Link2>http://www.programacionweb.net/</Link2>
  16409. </user-agent>
  16410. <user-agent>
  16411. <ID>id_n_s_1157</ID>
  16412. <String>PycURL</String>
  16413. <Description>Fast Search robot (using PycURL Python component- s. below)</Description>
  16414. <Type>R</Type>
  16415. <Comment></Comment>
  16416. <Link1>http://www.fastsearch.net/</Link1>
  16417. <Link2>http://pycurl.sourceforge.net/</Link2>
  16418. </user-agent>
  16419. <user-agent>
  16420. <ID>id_n_s_060107_1</ID>
  16421. <String>PycURL/7.xx.x</String>
  16422. <Description>PycURL - Python interface to libcurl</Description>
  16423. <Type>D</Type>
  16424. <Comment></Comment>
  16425. <Link1>http://pycurl.sourceforge.net/</Link1>
  16426. <Link2></Link2>
  16427. </user-agent>
  16428. <user-agent>
  16429. <ID>id_n_s_1158</ID>
  16430. <String>Python-urllib/1.1x</String>
  16431. <Description>Python URL fetcher - robot used by Naver Japan/Korea</Description>
  16432. <Type>R</Type>
  16433. <Comment>s. also nabot- dloader- NaverBot &amp; Cowbot</Comment>
  16434. <Link1>http://www.indyproject.org/</Link1>
  16435. <Link2>http://www.python.org/</Link2>
  16436. </user-agent>
  16437. <user-agent>
  16438. <ID>id_n_s_1159</ID>
  16439. <String>Python-urllib/2.0a1</String>
  16440. <Description>Python URL fetcher - robot used by Google</Description>
  16441. <Type>R</Type>
  16442. <Comment></Comment>
  16443. <Link1>http://labs.google.com</Link1>
  16444. <Link2>http://www.python.org/</Link2>
  16445. </user-agent>
  16446. <user-agent>
  16447. <ID>id_n_s_1160</ID>
  16448. <String>Qango.com Web Directory (http://www.qango.com/)</String>
  16449. <Description>Qango.com Web Directory robot</Description>
  16450. <Type>R</Type>
  16451. <Comment></Comment>
  16452. <Link1>http://www.qango.com/</Link1>
  16453. <Link2></Link2>
  16454. </user-agent>
  16455. <user-agent>
  16456. <ID>id_n_s_170408_1</ID>
  16457. <String>QEAVis Agent/Nutch-0.9 (Quantitative Evaluation of Academic Websites Visibility; http://nlp.uned.es/qeavis</String>
  16458. <Description>QEAVis: Quantitative Evaluation of Academic Websites Visibility using Nutch</Description>
  16459. <Type>R</Type>
  16460. <Comment>83.33.209.10x</Comment>
  16461. <Link1>http://nlp.uned.es/qeavis/</Link1>
  16462. <Link2></Link2>
  16463. </user-agent>
  16464. <user-agent>
  16465. <ID>id_n_s_1161</ID>
  16466. <String>QPCreep Test Rig ( We are not indexing- just testing )</String>
  16467. <Description>Quepasa!com (Latin American search) robot</Description>
  16468. <Type>R</Type>
  16469. <Comment></Comment>
  16470. <Link1>http://www.quepasa.com/</Link1>
  16471. <Link2></Link2>
  16472. </user-agent>
  16473. <user-agent>
  16474. <ID>id_n_s_1162</ID>
  16475. <String>QuepasaCreep ( crawler@quepasacorp.com )</String>
  16476. <Description>Quepasa!com (Latin American search) robot</Description>
  16477. <Type>R</Type>
  16478. <Comment></Comment>
  16479. <Link1>http://www.quepasa.com/</Link1>
  16480. <Link2></Link2>
  16481. </user-agent>
  16482. <user-agent>
  16483. <ID>id_n_s_1163</ID>
  16484. <String>QuepasaCreep v0.9.1x</String>
  16485. <Description>Quepasa!com (Latin American search) robot</Description>
  16486. <Type>R</Type>
  16487. <Comment></Comment>
  16488. <Link1>http://www.quepasa.com/</Link1>
  16489. <Link2></Link2>
  16490. </user-agent>
  16491. <user-agent>
  16492. <ID>id_n_s_1164</ID>
  16493. <String>QueryN Metasearch</String>
  16494. <Description>QueryN Metasearch robot</Description>
  16495. <Type>R</Type>
  16496. <Comment></Comment>
  16497. <Link1>http://www.queryn.com/queryn/</Link1>
  16498. <Link2></Link2>
  16499. </user-agent>
  16500. <user-agent>
  16501. <ID>id_n_s_230108_2</ID>
  16502. <String>Quicksilver (Blacktree&#44;MacOSX)</String>
  16503. <Description>Blacktree's Quicksilver helper application for Mac</Description>
  16504. <Type>B</Type>
  16505. <Comment></Comment>
  16506. <Link1>http://docs.blacktree.com/quicksilver/what_is_quicksilver</Link1>
  16507. <Link2></Link2>
  16508. </user-agent>
  16509. <user-agent>
  16510. <ID>id_n_s_230606_3</ID>
  16511. <String>QuickTime\xaa.7.0.4 (qtver=7.0.4;cpu=PPC;os=Mac 10.3.9)</String>
  16512. <Description>Quicktime for Macintosh</Description>
  16513. <Type>B</Type>
  16514. <Comment></Comment>
  16515. <Link1></Link1>
  16516. <Link2></Link2>
  16517. </user-agent>
  16518. <user-agent>
  16519. <ID>id_n_s_060107_4</ID>
  16520. <String>QweeryBot/3.01 ( http://qweerybot.qweery.nl)</String>
  16521. <Description>Qweerybot for the Qweery search engine (in development) - Netherlands</Description>
  16522. <Type>R</Type>
  16523. <Comment>85.158.204.2xx</Comment>
  16524. <Link1>http://qweerybot.qweery.nl/</Link1>
  16525. <Link2></Link2>
  16526. </user-agent>
  16527. <user-agent>
  16528. <ID>id_n_s_060107_3</ID>
  16529. <String>Qweery_robot.txt_CheckBot/3.01 (http://qweerybot.qweery.com)</String>
  16530. <Description>Qweerybot for the Qweery search engine (in development) - Netherlands</Description>
  16531. <Type>R</Type>
  16532. <Comment>85.158.204.2xx</Comment>
  16533. <Link1>http://qweerybot.qweery.nl/</Link1>
  16534. <Link2></Link2>
  16535. </user-agent>
  16536. <user-agent>
  16537. <ID>id_n_s_160208_1</ID>
  16538. <String>R6_CommentReader_(www.radian6.com/crawler)</String>
  16539. <Description>Radian6 RSS feed comment crawler</Description>
  16540. <Type>R</Type>
  16541. <Comment></Comment>
  16542. <Link1>http://www.radian6.com/cms/index.php</Link1>
  16543. <Link2>http://www.radian6.com/crawler/</Link2>
  16544. </user-agent>
  16545. <user-agent>
  16546. <ID>id_n_s_160208_2</ID>
  16547. <String>R6_FeedFetcher_(www.radian6.com/crawler)</String>
  16548. <Description>Radian6 RSS feed crawler</Description>
  16549. <Type>R</Type>
  16550. <Comment></Comment>
  16551. <Link1>http://www.radian6.com/cms/index.php</Link1>
  16552. <Link2>http://www.radian6.com/crawler/</Link2>
  16553. </user-agent>
  16554. <user-agent>
  16555. <ID>id_n_s_1165</ID>
  16556. <String>rabaz (rabaz at gigabaz dot com)</String>
  16557. <Description>gigaBaz - the brainbot (Germany) robot</Description>
  16558. <Type>R</Type>
  16559. <Comment></Comment>
  16560. <Link1>http://brainbot.com//site3</Link1>
  16561. <Link2></Link2>
  16562. </user-agent>
  16563. <user-agent>
  16564. <ID>id_n_s_1166</ID>
  16565. <String>RaBot/1.0 Agent-admin/phortse@hanmail.net</String>
  16566. <Description>DAUMOA - Daum search Korea robot (211.115.109.xxx)</Description>
  16567. <Type>R</Type>
  16568. <Comment>s. also Mozilla/4.0 (compatible; MSIE is not me; DAUMOA ...</Comment>
  16569. <Link1>http://www.daum.net/</Link1>
  16570. <Link2></Link2>
  16571. </user-agent>
  16572. <user-agent>
  16573. <ID>id_n_s_1167</ID>
  16574. <String>Rainbot1.1</String>
  16575. <Description>Bot Provider for the All Womans Bot Service?</Description>
  16576. <Type></Type>
  16577. <Comment> - site is dead</Comment>
  16578. <Link1>http://bservice.org/bots/</Link1>
  16579. <Link2></Link2>
  16580. </user-agent>
  16581. <user-agent>
  16582. <ID>id_n_s_1168</ID>
  16583. <String>ramBot xtreme x.x</String>
  16584. <Description>Intersearch.de (was www.intersearch.de) robot (Germany)</Description>
  16585. <Type>R</Type>
  16586. <Comment></Comment>
  16587. <Link1></Link1>
  16588. <Link2></Link2>
  16589. </user-agent>
  16590. <user-agent>
  16591. <ID>id_n_s_160406_2</ID>
  16592. <String>RAMPyBot - www.giveRAMP.com/0.1 (RAMPyBot - www.giveRAMP.com; http://www.giveramp.com/bot.html; support@giveRAMP.com)</String>
  16593. <Description>giveRAMP Search Engine robot (64.69.43.1xx)</Description>
  16594. <Type>R</Type>
  16595. <Comment></Comment>
  16596. <Link1>http://www.giveramp.com/</Link1>
  16597. <Link2></Link2>
  16598. </user-agent>
  16599. <user-agent>
  16600. <ID>id_n_s_260206_1</ID>
  16601. <String>RAMPyBot/0.8-dev (Nutch; http://lucene.apache.org/nutch/bot.html; nutch-agent@lucene.apache.org)</String>
  16602. <Description>giveRAMP Search Engine robot (64.69.43.1xx)</Description>
  16603. <Type>R</Type>
  16604. <Comment>powered by Nutch</Comment>
  16605. <Link1>http://www.giveramp.com/</Link1>
  16606. <Link2>http://lucene.apache.org/nutch/</Link2>
  16607. </user-agent>
  16608. <user-agent>
  16609. <ID>id_n_s_1169</ID>
  16610. <String>Rank Exec (rankexec.com) Reciprocal Link Manager 1.x/bot</String>
  16611. <Description>Rank Exec reciprocal link checking</Description>
  16612. <Type>C</Type>
  16613. <Comment></Comment>
  16614. <Link1>http://www.rankexec.com/</Link1>
  16615. <Link2></Link2>
  16616. </user-agent>
  16617. <user-agent>
  16618. <ID>id_n_s_180408_5</ID>
  16619. <String>Rankivabot/3.2 (www.rankiva.com; 3.2; vzmxikn)</String>
  16620. <Description>Rankiva website popularity robot</Description>
  16621. <Type>R</Type>
  16622. <Comment></Comment>
  16623. <Link1>http://www.rankiva.com/</Link1>
  16624. <Link2></Link2>
  16625. </user-agent>
  16626. <user-agent>
  16627. <ID>id_n_s_1170</ID>
  16628. <String>Rational SiteCheck (Windows NT)</String>
  16629. <Description>Innova/IBM Rational SiteCheck - Rational robot</Description>
  16630. <Type>R</Type>
  16631. <Comment></Comment>
  16632. <Link1>http://www.rational.com.ar/defaultenglish.html</Link1>
  16633. <Link2></Link2>
  16634. </user-agent>
  16635. <user-agent>
  16636. <ID>id_n_s_290708_2</ID>
  16637. <String>RAYSPIDER/Nutch-0.9</String>
  16638. <Description>Unknown spider from Raytheon Company - maybe Raytheon High Speed Guard proxy</Description>
  16639. <Type>P</Type>
  16640. <Comment>199.46.198.xxx</Comment>
  16641. <Link1>http://www.raytheon.com/</Link1>
  16642. <Link2></Link2>
  16643. </user-agent>
  16644. <user-agent>
  16645. <ID>id_n_s_230207_3</ID>
  16646. <String>ReadABlog Spider (compatible; 1.1; feed update; www.readablog.com)</String>
  16647. <Description>Read A Blog - RSS feed and blog search engine</Description>
  16648. <Type>C</Type>
  16649. <Comment>70.85.24.xx</Comment>
  16650. <Link1>http://www.readablog.com/</Link1>
  16651. <Link2></Link2>
  16652. </user-agent>
  16653. <user-agent>
  16654. <ID>id_n_s_1171</ID>
  16655. <String>RealDownload/4.0.0.4x</String>
  16656. <Description>RealDownload download manager</Description>
  16657. <Type>D</Type>
  16658. <Comment></Comment>
  16659. <Link1>http://service.real.com/help/faq/rdown4/rdownfaqa01.html</Link1>
  16660. <Link2></Link2>
  16661. </user-agent>
  16662. <user-agent>
  16663. <ID>id_n_s_100408_3</ID>
  16664. <String>REAP-crawler Nutch/Nutch-1.0-dev (Reap Project; http://reap.cs.cmu.edu/REAP-crawler/; Reap Project)</String>
  16665. <Description>The REAP Web Crawler for the REAP project</Description>
  16666. <Type>C</Type>
  16667. <Comment></Comment>
  16668. <Link1>http://reap.cs.cmu.edu/REAP-crawler/</Link1>
  16669. <Link2>http://reap.cs.cmu.edu/</Link2>
  16670. </user-agent>
  16671. <user-agent>
  16672. <ID>id_n_s_1172</ID>
  16673. <String>Reaper [2.03.10-031204] (http://www.sitesearch.ca/reaper/)</String>
  16674. <Description>Reaper robot for SiteSearch</Description>
  16675. <Type>R</Type>
  16676. <Comment></Comment>
  16677. <Link1>http://marty.anstey.ca/projects/robots/reaper.html</Link1>
  16678. <Link2></Link2>
  16679. </user-agent>
  16680. <user-agent>
  16681. <ID>id_n_s_1173</ID>
  16682. <String>Reaper/2.0x (+http://www.sitesearch.ca/reaper)</String>
  16683. <Description>Reaper robot for SiteSearch</Description>
  16684. <Type>R</Type>
  16685. <Comment></Comment>
  16686. <Link1>http://marty.anstey.ca/projects/robots/reaper.html</Link1>
  16687. <Link2></Link2>
  16688. </user-agent>
  16689. <user-agent>
  16690. <ID>id_n_s_1174</ID>
  16691. <String>REBOL Core 2.x.x.x.x</String>
  16692. <Description>REBOL messaging language for distributed Internet apps</Description>
  16693. <Type></Type>
  16694. <Comment></Comment>
  16695. <Link1>http://www.rebol.com/</Link1>
  16696. <Link2></Link2>
  16697. </user-agent>
  16698. <user-agent>
  16699. <ID>id_n_s_250307_1</ID>
  16700. <String>REBOL View 1.x.x.x.x</String>
  16701. <Description>REBOL/View - machine independent internet client application</Description>
  16702. <Type>B</Type>
  16703. <Comment></Comment>
  16704. <Link1>http://www.rebol.com/prod-view.html</Link1>
  16705. <Link2></Link2>
  16706. </user-agent>
  16707. <user-agent>
  16708. <ID>id_n_s_1175</ID>
  16709. <String>RebusnetBot (+http://www.rebusnet.biz)</String>
  16710. <Description>Rebusnet software site - link / submission checking</Description>
  16711. <Type>R C</Type>
  16712. <Comment></Comment>
  16713. <Link1>http://www.rebusnet.biz</Link1>
  16714. <Link2></Link2>
  16715. </user-agent>
  16716. <user-agent>
  16717. <ID>id_n_s_1176</ID>
  16718. <String>RebusnetPADBot/1.5x (+http://www.rebusnet.biz)</String>
  16719. <Description>Rebusnet software site - link / submission checking</Description>
  16720. <Type>R C</Type>
  16721. <Comment></Comment>
  16722. <Link1>http://www.rebusnet.biz</Link1>
  16723. <Link2></Link2>
  16724. </user-agent>
  16725. <user-agent>
  16726. <ID>id_n_s_171205_1</ID>
  16727. <String>reciprocal links checker (http://www.recip-links.com/)</String>
  16728. <Description>Online reciprocal link checker</Description>
  16729. <Type>C</Type>
  16730. <Comment></Comment>
  16731. <Link1>http://www.recip-links.com/</Link1>
  16732. <Link2></Link2>
  16733. </user-agent>
  16734. <user-agent>
  16735. <ID>id_n_s_110307_2</ID>
  16736. <String>RedBot/redbot-1.0 (Rediff.com Crawler; redbot at rediff dot com)</String>
  16737. <Description>rediff.com search link checking</Description>
  16738. <Type>C</Type>
  16739. <Comment>220.226.198.xx</Comment>
  16740. <Link1>http://www.rediff.com/</Link1>
  16741. <Link2></Link2>
  16742. </user-agent>
  16743. <user-agent>
  16744. <ID>id_n_s_130106_1</ID>
  16745. <String>RedCarpet/1.2 (http://www.redcarpet-inc.com/robots.html)</String>
  16746. <Description>RedCarpet crawler for Pronto price comparison search(66.179.107.1xx)</Description>
  16747. <Type>R</Type>
  16748. <Comment></Comment>
  16749. <Link1>http://www.redcarpet-inc.com/robots.html</Link1>
  16750. <Link2>http://www.pronto.com/</Link2>
  16751. </user-agent>
  16752. <user-agent>
  16753. <ID>id_n_s_171205_2</ID>
  16754. <String>RedCell/0.1 (InfoSec Search Bot (Coming Soon); http://www.telegenetic.net/bot.html; lhall@telegenetic.net)</String>
  16755. <Description>Der Bot for telegenetic.net's security related search (65.220.67.2xx)</Description>
  16756. <Type>R</Type>
  16757. <Comment>Based on Nutch</Comment>
  16758. <Link1>http://www.telegenetic.net/bot.html</Link1>
  16759. <Link2></Link2>
  16760. </user-agent>
  16761. <user-agent>
  16762. <ID>id_n_s_040106_1</ID>
  16763. <String>RedCell/0.1 (RedCell; telegenetic.net/bot.html; lhall_at_telegenetic.net)</String>
  16764. <Description>Der Bot for telegenetic.net's security related search (65.220.67.2xx)</Description>
  16765. <Type>R</Type>
  16766. <Comment>Based on Nutch</Comment>
  16767. <Link1>http://www.telegenetic.net/bot.html</Link1>
  16768. <Link2></Link2>
  16769. </user-agent>
  16770. <user-agent>
  16771. <ID>id_n_s_1177</ID>
  16772. <String>RedKernel WWW-Spider 2/0 (+http://www-spider.redkernel-softwares.com/)</String>
  16773. <Description>RedKernel Softwares robot</Description>
  16774. <Type>R</Type>
  16775. <Comment></Comment>
  16776. <Link1>http://www.redkernel-softwares.com/</Link1>
  16777. <Link2></Link2>
  16778. </user-agent>
  16779. <user-agent>
  16780. <ID>id_n_s_1178</ID>
  16781. <String>REL Link Checker Lite x.x</String>
  16782. <Description>REL Link Checker Lite free version of Web Link Validator</Description>
  16783. <Type>C</Type>
  16784. <Comment></Comment>
  16785. <Link1>http://www.relsoftware.com/rlc/</Link1>
  16786. <Link2></Link2>
  16787. </user-agent>
  16788. <user-agent>
  16789. <ID>id_n_s_1179</ID>
  16790. <String>RepoMonkey Bait &amp; Tackle/v1.01</String>
  16791. <Description>unknown</Description>
  16792. <Type></Type>
  16793. <Comment></Comment>
  16794. <Link1></Link1>
  16795. <Link2></Link2>
  16796. </user-agent>
  16797. <user-agent>
  16798. <ID>id_n_s_1180</ID>
  16799. <String>Rewebber/1.2 libwww-perl/5.41</String>
  16800. <Description>Rewebber proxy service</Description>
  16801. <Type>P</Type>
  16802. <Comment></Comment>
  16803. <Link1>http://www.rewebber.com/</Link1>
  16804. <Link2></Link2>
  16805. </user-agent>
  16806. <user-agent>
  16807. <ID>id_n_s_1181</ID>
  16808. <String>rico/0.1</String>
  16809. <Description>Applied Semantics Auto-Categorizer for QWestDex Direct</Description>
  16810. <Type>R</Type>
  16811. <Comment></Comment>
  16812. <Link1>http://www.dotcomdirectory.com</Link1>
  16813. <Link2></Link2>
  16814. </user-agent>
  16815. <user-agent>
  16816. <ID>id_n_s_241105_2</ID>
  16817. <String>RixBot (http://babelserver.org/rix)</String>
  16818. <Description>RixBot Rebol Indexer for the RIX - Rebol related search (195.204.121.xx)</Description>
  16819. <Type>R</Type>
  16820. <Comment></Comment>
  16821. <Link1>http://babelserver.org/rix</Link1>
  16822. <Link2></Link2>
  16823. </user-agent>
  16824. <user-agent>
  16825. <ID>id_n_s_070406_2</ID>
  16826. <String>RMA/1.0 (compatible; RealMedia)</String>
  16827. <Description>StreamBox VCR user agent</Description>
  16828. <Type>D</Type>
  16829. <Comment></Comment>
  16830. <Link1>http://all-streaming-media.com/streaming-media-faq/faq-streambox-vcr-download-problems.htm</Link1>
  16831. <Link2></Link2>
  16832. </user-agent>
  16833. <user-agent>
  16834. <ID>id_n_s_1182</ID>
  16835. <String>RMA/1.0 (compatible; RealMedia)</String>
  16836. <Description>Real Media server acting as client</Description>
  16837. <Type>B P</Type>
  16838. <Comment></Comment>
  16839. <Link1>http://service.real.com/help/library/whitepapers/wpaper.html</Link1>
  16840. <Link2></Link2>
  16841. </user-agent>
  16842. <user-agent>
  16843. <ID>id_n_s_061206_4</ID>
  16844. <String>RoboCrawl (http://www.canadiancontent.net)</String>
  16845. <Description>Canadian Content search crawler</Description>
  16846. <Type>R</Type>
  16847. <Comment></Comment>
  16848. <Link1>http://www.canadiancontent.net/</Link1>
  16849. <Link2></Link2>
  16850. </user-agent>
  16851. <user-agent>
  16852. <ID>id_n_s_1183</ID>
  16853. <String>RoboCrawl (www.canadiancontent.net)</String>
  16854. <Description>Canadian Content Search (207.44.220.xx) robot</Description>
  16855. <Type>R</Type>
  16856. <Comment></Comment>
  16857. <Link1>http://www.canadiancontent.net/</Link1>
  16858. <Link2></Link2>
  16859. </user-agent>
  16860. <user-agent>
  16861. <ID>id_n_s_1184</ID>
  16862. <String>RoboPal (http://www.findpal.com/)</String>
  16863. <Description>FindPal Australia metasearch robot (61.68.139.xx)</Description>
  16864. <Type>R</Type>
  16865. <Comment></Comment>
  16866. <Link1>http://www.findpal.com/</Link1>
  16867. <Link2></Link2>
  16868. </user-agent>
  16869. <user-agent>
  16870. <ID>id_n_s_1187</ID>
  16871. <String>Robot/www.pj-search.com</String>
  16872. <Description>PopJapanSearch robot</Description>
  16873. <Type>R</Type>
  16874. <Comment></Comment>
  16875. <Link1>http://www.pj-search.com/</Link1>
  16876. <Link2></Link2>
  16877. </user-agent>
  16878. <user-agent>
  16879. <ID>id_n_s_1185</ID>
  16880. <String>Robot: NutchCrawler- Owner: wdavies@acm.org</String>
  16881. <Description>Experimental robot using Wget via attbi.net</Description>
  16882. <Type>R</Type>
  16883. <Comment></Comment>
  16884. <Link1></Link1>
  16885. <Link2></Link2>
  16886. </user-agent>
  16887. <user-agent>
  16888. <ID>id_n_s_1186</ID>
  16889. <String>Robot@SuperSnooper.Com</String>
  16890. <Description>Supersnooper robot</Description>
  16891. <Type>R</Type>
  16892. <Comment></Comment>
  16893. <Link1>http://www.Supersnooper.com/</Link1>
  16894. <Link2></Link2>
  16895. </user-agent>
  16896. <user-agent>
  16897. <ID>id_n_s_1188</ID>
  16898. <String>Robozilla/1.0</String>
  16899. <Description>Netscape Directory / DMOZ Open Directory link crawler</Description>
  16900. <Type>R</Type>
  16901. <Comment></Comment>
  16902. <Link1>http://directory.mozilla.org/</Link1>
  16903. <Link2></Link2>
  16904. </user-agent>
  16905. <user-agent>
  16906. <ID>id_n_s_220208_1</ID>
  16907. <String>Rome Client (http://tinyurl.com/64t5n) Ver: 0.9</String>
  16908. <Description>ROME - Open source Java tools for RSS and Atom feeds</Description>
  16909. <Type>B</Type>
  16910. <Comment></Comment>
  16911. <Link1>https://rome.dev.java.net/</Link1>
  16912. <Link2></Link2>
  16913. </user-agent>
  16914. <user-agent>
  16915. <ID>id_n_s_1189</ID>
  16916. <String>Rotondo/3.1 libwww/5.3.1</String>
  16917. <Description>Qualigo.de robot</Description>
  16918. <Type>R</Type>
  16919. <Comment></Comment>
  16920. <Link1>http://www.qualigo.de/</Link1>
  16921. <Link2></Link2>
  16922. </user-agent>
  16923. <user-agent>
  16924. <ID>id_n_s_1190</ID>
  16925. <String>RPT-HTTPClient/0.3-x</String>
  16926. <Description>different IPs using the HTTPClient library (mostly link checking)</Description>
  16927. <Type>C</Type>
  16928. <Comment>Java1.4.0</Comment>
  16929. <Link1>http://www.innovation.ch/java/HTTPClient/</Link1>
  16930. <Link2></Link2>
  16931. </user-agent>
  16932. <user-agent>
  16933. <ID>id_n_s_1191</ID>
  16934. <String>RRC (crawler_admin@bigfoot.com)</String>
  16935. <Description>Metacarta.com (66.28.xx.xxx) robot</Description>
  16936. <Type>R</Type>
  16937. <Comment>s. Larbin...</Comment>
  16938. <Link1>http://www.metacarta.com</Link1>
  16939. <Link2></Link2>
  16940. </user-agent>
  16941. <user-agent>
  16942. <ID>id_n_s_250707_5</ID>
  16943. <String>RssBandit/1.5.0.10 (.NET CLR 1.1.4322.2407; WinNT 5.1.2600.0; http://www.rssbandit.org) (.NET CLR 1.1.4322.2407; WinNT 5.1.2600.0; )</String>
  16944. <Description>RSS Bandit RSS/Atom reader for .NET framework</Description>
  16945. <Type>B</Type>
  16946. <Comment></Comment>
  16947. <Link1>http://www.rssbandit.org/</Link1>
  16948. <Link2></Link2>
  16949. </user-agent>
  16950. <user-agent>
  16951. <ID>id_n_s_230607_3</ID>
  16952. <String>RSSMicro.com RSS/Atom Feed Robot</String>
  16953. <Description>RSS Micro Search - RSS feed search engine</Description>
  16954. <Type>R</Type>
  16955. <Comment>209.216.63.xx</Comment>
  16956. <Link1>http://www.rssmicro.com/</Link1>
  16957. <Link2></Link2>
  16958. </user-agent>
  16959. <user-agent>
  16960. <ID>id_n_s_080307_2</ID>
  16961. <String>RSSOwl/1.2.3 2006-11-26 (Windows; U; zhtw)</String>
  16962. <Description>RSSOwl embedded RSS feed reader</Description>
  16963. <Type>B</Type>
  16964. <Comment></Comment>
  16965. <Link1>http://www.rssowl.org/</Link1>
  16966. <Link2></Link2>
  16967. </user-agent>
  16968. <user-agent>
  16969. <ID>id_n_s_060108_1</ID>
  16970. <String>RSSOwl/1.2.4 Preview Release 2007-04-15 (Windows; U; zhtw)</String>
  16971. <Description>RSSOwl embedded RSS feed reader</Description>
  16972. <Type>B</Type>
  16973. <Comment></Comment>
  16974. <Link1>http://www.rssowl.org/</Link1>
  16975. <Link2></Link2>
  16976. </user-agent>
  16977. <user-agent>
  16978. <ID>id_n_s_181006_3</ID>
  16979. <String>RssReader/1.0.xx.x (http://www.rssreader.com) Microsoft Windows NT 5.1.2600.0</String>
  16980. <Description>Ykoon RssReader news feed reader</Description>
  16981. <Type>B</Type>
  16982. <Comment></Comment>
  16983. <Link1>http://www.rssreader.com/</Link1>
  16984. <Link2></Link2>
  16985. </user-agent>
  16986. <user-agent>
  16987. <ID>id_n_s_1192</ID>
  16988. <String>RSurf15a 41</String>
  16989. <Description>Some site scanning tool via diff. IPs- i.e.: - dslx.net (208.35.1x.xxx) - Home.com</Description>
  16990. <Type>S</Type>
  16991. <Comment></Comment>
  16992. <Link1></Link1>
  16993. <Link2></Link2>
  16994. </user-agent>
  16995. <user-agent>
  16996. <ID>id_n_s_1193</ID>
  16997. <String>RSurf15a 51</String>
  16998. <Description>Some site scanning tool via diff. IPs- i.e.: - dslx.net (208.35.1x.xxx) - Home.com</Description>
  16999. <Type>S</Type>
  17000. <Comment></Comment>
  17001. <Link1></Link1>
  17002. <Link2></Link2>
  17003. </user-agent>
  17004. <user-agent>
  17005. <ID>id_n_s_1194</ID>
  17006. <String>RSurf15a 81</String>
  17007. <Description>Some site scanning tool via diff. IPs- i.e.: - dslx.net (208.35.1x.xxx) - Home.com</Description>
  17008. <Type>S</Type>
  17009. <Comment></Comment>
  17010. <Link1></Link1>
  17011. <Link2></Link2>
  17012. </user-agent>
  17013. <user-agent>
  17014. <ID>id_n_s_080206_2</ID>
  17015. <String>Rubbot/1.0 (+http://rubhub.com/)</String>
  17016. <Description>rubhub blog spider</Description>
  17017. <Type>C</Type>
  17018. <Comment>based on XFN relationship lookup engine</Comment>
  17019. <Link1>http://rubhub.com/main/</Link1>
  17020. <Link2>http://gmpg.org/xfn/more</Link2>
  17021. </user-agent>
  17022. <user-agent>
  17023. <ID>id_n_s_191105_1</ID>
  17024. <String>RufusBot (Rufus Web Miner; http://64.124.122.252/feedback.html)</String>
  17025. <Description>WebarooBot - Webaroo web site search / theme based downloading tool (64.124.122.2xx)</Description>
  17026. <Type>R</Type>
  17027. <Comment>s. also pulseBot</Comment>
  17028. <Link1>http://www.webaroo.com/index</Link1>
  17029. <Link2>http://www.webaroo.com/company/site-owners</Link2>
  17030. </user-agent>
  17031. <user-agent>
  17032. <ID>id_n_s_020407_1</ID>
  17033. <String>RufusBot (Rufus Web Miner; http://www.webaroo.com/rooSiteOwners.html)</String>
  17034. <Description>WebarooBot - Webaroo web site search / theme based downloading tool (64.124.122.2xx)</Description>
  17035. <Type>R</Type>
  17036. <Comment>s. also pulseBot</Comment>
  17037. <Link1>http://www.webaroo.com/index</Link1>
  17038. <Link2>http://www.webaroo.com/company/site-owners</Link2>
  17039. </user-agent>
  17040. <user-agent>
  17041. <ID>id_n_s_1195</ID>
  17042. <String>Rumours-Agent</String>
  17043. <Description>unknown robot from rumours.jp (202.214.69.xxx)</Description>
  17044. <Type></Type>
  17045. <Comment></Comment>
  17046. <Link1></Link1>
  17047. <Link2></Link2>
  17048. </user-agent>
  17049. <user-agent>
  17050. <ID>id_n_s_1196</ID>
  17051. <String>RX Bar</String>
  17052. <Description>RX (Reflexive Search) Bar for IE</Description>
  17053. <Type>B</Type>
  17054. <Comment></Comment>
  17055. <Link1>http://www.searchenginebar.com/</Link1>
  17056. <Link2></Link2>
  17057. </user-agent>
  17058. <user-agent>
  17059. <ID>id_n_s_160506_1</ID>
  17060. <String>S&amp;L Spider (http://search.hirners.com/)</String>
  17061. <Description>Search &amp; Links directory spider</Description>
  17062. <Type>C</Type>
  17063. <Comment>80.108.7.xx</Comment>
  17064. <Link1>http://search.hirners.com/</Link1>
  17065. <Link2></Link2>
  17066. </user-agent>
  17067. <user-agent>
  17068. <ID>id_n_s_1197</ID>
  17069. <String>S.T.A.L.K.E.R. (http://www.seo-tools.net/en/bot.aspx)</String>
  17070. <Description>SEO-Tools.net link checking ?</Description>
  17071. <Type>C</Type>
  17072. <Comment></Comment>
  17073. <Link1>http://www.seo-tools.net/</Link1>
  17074. <Link2></Link2>
  17075. </user-agent>
  17076. <user-agent>
  17077. <ID>id_n_s_1198</ID>
  17078. <String>SafariBookmarkChecker (+http://www.coriolis.ch/)</String>
  17079. <Description>SafariBookmarkChecker for Mac OS X</Description>
  17080. <Type>C</Type>
  17081. <Comment></Comment>
  17082. <Link1>http://www.coriolis.ch/</Link1>
  17083. <Link2></Link2>
  17084. </user-agent>
  17085. <user-agent>
  17086. <ID>id_n_s_061107_1</ID>
  17087. <String>sait/Nutch-0.9 (SAIT Research; http://www.samsung.com)</String>
  17088. <Description>sait robot - unknown robot from Samsung International Korea</Description>
  17089. <Type>R</Type>
  17090. <Comment>202.20.190.xx</Comment>
  17091. <Link1>http://samsungnetworks.co.kr/eng/index.jsp</Link1>
  17092. <Link2></Link2>
  17093. </user-agent>
  17094. <user-agent>
  17095. <ID>id_n_s_191105_2</ID>
  17096. <String>SandCrawler - Compatibility Testing</String>
  17097. <Description>Sandcrawler robot from Microsoft (131.107.0.xx)</Description>
  17098. <Type>R</Type>
  17099. <Comment></Comment>
  17100. <Link1></Link1>
  17101. <Link2></Link2>
  17102. </user-agent>
  17103. <user-agent>
  17104. <ID>id_n_s_170109_3</ID>
  17105. <String>SapphireWebCrawler/1.0 (Sapphire Web Crawler using Nutch; http://boston.lti.cs.cmu.edu/crawler/; mhoy@cs.cmu.edu)</String>
  17106. <Description>Sapphire Web Crawler from Carnegie Mellon University's Language Technologies Institute</Description>
  17107. <Type>R</Type>
  17108. <Comment></Comment>
  17109. <Link1>http://boston.lti.cs.cmu.edu/crawler/</Link1>
  17110. <Link2></Link2>
  17111. </user-agent>
  17112. <user-agent>
  17113. <ID>id_n_s_170109_4</ID>
  17114. <String>SapphireWebCrawler/Nutch-1.0-dev (Sapphire Web Crawler using Nutch; http://boston.lti.cs.cmu.edu/crawler/; mhoy@cs.cmu.edu)</String>
  17115. <Description>Sapphire Web Crawler from Carnegie Mellon University's Language Technologies Institute</Description>
  17116. <Type>R</Type>
  17117. <Comment></Comment>
  17118. <Link1>http://boston.lti.cs.cmu.edu/crawler/</Link1>
  17119. <Link2></Link2>
  17120. </user-agent>
  17121. <user-agent>
  17122. <ID>id_n_s_021205_4</ID>
  17123. <String>savvybot/0.2</String>
  17124. <Description>WebSavvy Directory robot</Description>
  17125. <Type>R</Type>
  17126. <Comment></Comment>
  17127. <Link1>http://www.websavvy.cc/bot.php</Link1>
  17128. <Link2></Link2>
  17129. </user-agent>
  17130. <user-agent>
  17131. <ID>id_n_s_1199</ID>
  17132. <String>SBIder/0.7 (SBIder; http://www.sitesell.com/sbider.html; http://support.sitesell.com/contact-support.html)</String>
  17133. <Description>SiteSell SBIder Nutch based crawler</Description>
  17134. <Type>R</Type>
  17135. <Comment></Comment>
  17136. <Link1>http://www.sitesell.com/</Link1>
  17137. <Link2></Link2>
  17138. </user-agent>
  17139. <user-agent>
  17140. <ID>id_n_s_030106_2</ID>
  17141. <String>SBIder/0.8-dev (SBIder; http://www.sitesell.com/sbider.html; http://support.sitesell.com/contact-support.html)</String>
  17142. <Description>SiteSell SBIder Nutch based crawler</Description>
  17143. <Type>R</Type>
  17144. <Comment></Comment>
  17145. <Link1>http://www.sitesell.com/</Link1>
  17146. <Link2></Link2>
  17147. </user-agent>
  17148. <user-agent>
  17149. <ID>id_n_s_1200</ID>
  17150. <String>SBL-BOT (http://sbl.net)</String>
  17151. <Description>Softbyte Labs Black Widow web site ripper</Description>
  17152. <Type>D B</Type>
  17153. <Comment></Comment>
  17154. <Link1>http://sbl.net/</Link1>
  17155. <Link2></Link2>
  17156. </user-agent>
  17157. <user-agent>
  17158. <ID>id_n_s_1201</ID>
  17159. <String>ScanWeb</String>
  17160. <Description>ScanWeb - regular expression based web page searching tool</Description>
  17161. <Type>R</Type>
  17162. <Comment></Comment>
  17163. <Link1>http://eserver.host.sk/</Link1>
  17164. <Link2></Link2>
  17165. </user-agent>
  17166. <user-agent>
  17167. <ID>id_n_s_301006_1</ID>
  17168. <String>ScholarUniverse/0.8 (Nutch;+http://scholaruniverse.com/bot.jsp; fetch-agent@scholaruniverse.com)</String>
  17169. <Description>ScholarUniverse - Scholarly experts search robot</Description>
  17170. <Type>R</Type>
  17171. <Comment>209.216.243.xx</Comment>
  17172. <Link1>http://www.scholaruniverse.com/index.jsp</Link1>
  17173. <Link2></Link2>
  17174. </user-agent>
  17175. <user-agent>
  17176. <ID>id_n_s_1202</ID>
  17177. <String>schwarzmann.biz-Spider_for_paddel.org+(http://www.innerprise.net/usp-spider.asp)</String>
  17178. <Description>URL Spider Pro (USP) used by German Schwarzmann GmbH</Description>
  17179. <Type>R</Type>
  17180. <Comment></Comment>
  17181. <Link1>http://www.schwarzmann.biz/</Link1>
  17182. <Link2></Link2>
  17183. </user-agent>
  17184. <user-agent>
  17185. <ID>id_n_s_1203</ID>
  17186. <String>Science Traveller International 1X/1.0</String>
  17187. <Description>1X Web Browser</Description>
  17188. <Type>B</Type>
  17189. <Comment></Comment>
  17190. <Link1>http://www.scitrav.com/</Link1>
  17191. <Link2></Link2>
  17192. </user-agent>
  17193. <user-agent>
  17194. <ID>id_n_s_190407_1</ID>
  17195. <String>ScollSpider/2.0 (+http://www.webwobot.com/ScollSpider.php)</String>
  17196. <Description>WebWobot UK search engine robot (82.43.129.2xx)</Description>
  17197. <Type>R</Type>
  17198. <Comment>s. also Mozilla/3.0 (compatible; ScollSpider ...</Comment>
  17199. <Link1>http://www.webwobot.com/</Link1>
  17200. <Link2></Link2>
  17201. </user-agent>
  17202. <user-agent>
  17203. <ID>id_n_s_1206</ID>
  17204. <String>Scooter-3.0.EU</String>
  17205. <Description>Altavista robot</Description>
  17206. <Type>R</Type>
  17207. <Comment></Comment>
  17208. <Link1>http://www.altavista.com/</Link1>
  17209. <Link2></Link2>
  17210. </user-agent>
  17211. <user-agent>
  17212. <ID>id_n_s_1207</ID>
  17213. <String>Scooter-3.0.FS</String>
  17214. <Description>Altavista robot</Description>
  17215. <Type>R</Type>
  17216. <Comment></Comment>
  17217. <Link1>http://www.altavista.com/</Link1>
  17218. <Link2></Link2>
  17219. </user-agent>
  17220. <user-agent>
  17221. <ID>id_n_s_1208</ID>
  17222. <String>Scooter-3.0.HD</String>
  17223. <Description>Altavista robot</Description>
  17224. <Type>R</Type>
  17225. <Comment></Comment>
  17226. <Link1>http://www.altavista.com/</Link1>
  17227. <Link2></Link2>
  17228. </user-agent>
  17229. <user-agent>
  17230. <ID>id_n_s_1209</ID>
  17231. <String>Scooter-3.0.VNS</String>
  17232. <Description>Altavista robot</Description>
  17233. <Type>R</Type>
  17234. <Comment></Comment>
  17235. <Link1>http://www.altavista.com/</Link1>
  17236. <Link2></Link2>
  17237. </user-agent>
  17238. <user-agent>
  17239. <ID>id_n_s_1210</ID>
  17240. <String>Scooter-3.0QI</String>
  17241. <Description>Altavista robot</Description>
  17242. <Type>R</Type>
  17243. <Comment></Comment>
  17244. <Link1>http://www.altavista.com/</Link1>
  17245. <Link2></Link2>
  17246. </user-agent>
  17247. <user-agent>
  17248. <ID>id_n_s_1211</ID>
  17249. <String>Scooter-3.2</String>
  17250. <Description>Altavista robot</Description>
  17251. <Type>R</Type>
  17252. <Comment></Comment>
  17253. <Link1>http://www.altavista.com/</Link1>
  17254. <Link2></Link2>
  17255. </user-agent>
  17256. <user-agent>
  17257. <ID>id_n_s_1212</ID>
  17258. <String>Scooter-3.2.BT</String>
  17259. <Description>Altavista robot</Description>
  17260. <Type>R</Type>
  17261. <Comment></Comment>
  17262. <Link1>http://www.altavista.com/</Link1>
  17263. <Link2></Link2>
  17264. </user-agent>
  17265. <user-agent>
  17266. <ID>id_n_s_1213</ID>
  17267. <String>Scooter-3.2.DIL</String>
  17268. <Description>Altavista robot</Description>
  17269. <Type>R</Type>
  17270. <Comment></Comment>
  17271. <Link1>http://www.altavista.com/</Link1>
  17272. <Link2></Link2>
  17273. </user-agent>
  17274. <user-agent>
  17275. <ID>id_n_s_1214</ID>
  17276. <String>Scooter-3.2.EX</String>
  17277. <Description>Altavista robot</Description>
  17278. <Type>R</Type>
  17279. <Comment></Comment>
  17280. <Link1>http://www.altavista.com/</Link1>
  17281. <Link2></Link2>
  17282. </user-agent>
  17283. <user-agent>
  17284. <ID>id_n_s_1215</ID>
  17285. <String>Scooter-3.2.JT</String>
  17286. <Description>Altavista robot</Description>
  17287. <Type>R</Type>
  17288. <Comment></Comment>
  17289. <Link1>http://www.altavista.com/</Link1>
  17290. <Link2></Link2>
  17291. </user-agent>
  17292. <user-agent>
  17293. <ID>id_n_s_1216</ID>
  17294. <String>Scooter-3.2.NIV</String>
  17295. <Description>Altavista robot</Description>
  17296. <Type>R</Type>
  17297. <Comment></Comment>
  17298. <Link1>http://www.altavista.com/</Link1>
  17299. <Link2></Link2>
  17300. </user-agent>
  17301. <user-agent>
  17302. <ID>id_n_s_1217</ID>
  17303. <String>Scooter-3.2.SF0</String>
  17304. <Description>Altavista robot</Description>
  17305. <Type>R</Type>
  17306. <Comment></Comment>
  17307. <Link1>http://www.altavista.com/</Link1>
  17308. <Link2></Link2>
  17309. </user-agent>
  17310. <user-agent>
  17311. <ID>id_n_s_1218</ID>
  17312. <String>Scooter-3.2.snippet</String>
  17313. <Description>Altavista robot</Description>
  17314. <Type>R</Type>
  17315. <Comment></Comment>
  17316. <Link1>http://www.altavista.com/</Link1>
  17317. <Link2></Link2>
  17318. </user-agent>
  17319. <user-agent>
  17320. <ID>id_n_s_1219</ID>
  17321. <String>Scooter-3.3dev</String>
  17322. <Description>Altavista robot</Description>
  17323. <Type>R</Type>
  17324. <Comment></Comment>
  17325. <Link1>http://www.altavista.com/</Link1>
  17326. <Link2></Link2>
  17327. </user-agent>
  17328. <user-agent>
  17329. <ID>id_n_s_1220</ID>
  17330. <String>Scooter-ARS-1.1</String>
  17331. <Description>Altavista robot</Description>
  17332. <Type>R</Type>
  17333. <Comment></Comment>
  17334. <Link1>http://www.altavista.com/</Link1>
  17335. <Link2></Link2>
  17336. </user-agent>
  17337. <user-agent>
  17338. <ID>id_n_s_1221</ID>
  17339. <String>Scooter-ARS-1.1-ih</String>
  17340. <Description>Altavista robot</Description>
  17341. <Type>R</Type>
  17342. <Comment></Comment>
  17343. <Link1>http://www.altavista.com/</Link1>
  17344. <Link2></Link2>
  17345. </user-agent>
  17346. <user-agent>
  17347. <ID>id_n_s_1222</ID>
  17348. <String>scooter-venus-3.0.vns</String>
  17349. <Description>Altavista robot</Description>
  17350. <Type>R</Type>
  17351. <Comment></Comment>
  17352. <Link1>http://www.altavista.com/</Link1>
  17353. <Link2></Link2>
  17354. </user-agent>
  17355. <user-agent>
  17356. <ID>id_n_s_1223</ID>
  17357. <String>Scooter-W3-1.0</String>
  17358. <Description>Altavista robot</Description>
  17359. <Type>R</Type>
  17360. <Comment></Comment>
  17361. <Link1>http://www.altavista.com/</Link1>
  17362. <Link2></Link2>
  17363. </user-agent>
  17364. <user-agent>
  17365. <ID>id_n_s_1224</ID>
  17366. <String>Scooter-W3.1.2</String>
  17367. <Description>Altavista robot</Description>
  17368. <Type>R</Type>
  17369. <Comment></Comment>
  17370. <Link1>http://www.altavista.com/</Link1>
  17371. <Link2></Link2>
  17372. </user-agent>
  17373. <user-agent>
  17374. <ID>id_n_s_1225</ID>
  17375. <String>Scooter/1.0</String>
  17376. <Description>Altavista robot</Description>
  17377. <Type>R</Type>
  17378. <Comment></Comment>
  17379. <Link1>http://www.altavista.com/</Link1>
  17380. <Link2></Link2>
  17381. </user-agent>
  17382. <user-agent>
  17383. <ID>id_n_s_1226</ID>
  17384. <String>Scooter/1.0 scooter@pa.dec.com</String>
  17385. <Description>Altavista robot</Description>
  17386. <Type>R</Type>
  17387. <Comment></Comment>
  17388. <Link1>http://www.altavista.com/</Link1>
  17389. <Link2></Link2>
  17390. </user-agent>
  17391. <user-agent>
  17392. <ID>id_n_s_1227</ID>
  17393. <String>Scooter/1.1 (custom)</String>
  17394. <Description>Altavista robot</Description>
  17395. <Type>R</Type>
  17396. <Comment></Comment>
  17397. <Link1>http://www.altavista.com/</Link1>
  17398. <Link2></Link2>
  17399. </user-agent>
  17400. <user-agent>
  17401. <ID>id_n_s_1228</ID>
  17402. <String>Scooter/2.0 G.R.A.B. V1.1.0</String>
  17403. <Description>Altavista robot</Description>
  17404. <Type>R</Type>
  17405. <Comment></Comment>
  17406. <Link1>http://www.altavista.com/</Link1>
  17407. <Link2></Link2>
  17408. </user-agent>
  17409. <user-agent>
  17410. <ID>id_n_s_1229</ID>
  17411. <String>Scooter/2.0 G.R.A.B. X2.0</String>
  17412. <Description>Altavista robot</Description>
  17413. <Type>R</Type>
  17414. <Comment></Comment>
  17415. <Link1>http://www.altavista.com/</Link1>
  17416. <Link2></Link2>
  17417. </user-agent>
  17418. <user-agent>
  17419. <ID>id_n_s_1230</ID>
  17420. <String>Scooter/3.3</String>
  17421. <Description>Altavista robot</Description>
  17422. <Type>R</Type>
  17423. <Comment></Comment>
  17424. <Link1>http://www.altavista.com/</Link1>
  17425. <Link2></Link2>
  17426. </user-agent>
  17427. <user-agent>
  17428. <ID>id_n_s_1232</ID>
  17429. <String>Scooter/3.3.QA.pczukor</String>
  17430. <Description>Altavista robot</Description>
  17431. <Type>R</Type>
  17432. <Comment></Comment>
  17433. <Link1>http://www.altavista.com/</Link1>
  17434. <Link2></Link2>
  17435. </user-agent>
  17436. <user-agent>
  17437. <ID>id_n_s_1233</ID>
  17438. <String>Scooter/3.3.vscooter</String>
  17439. <Description>Altavista robot</Description>
  17440. <Type>R</Type>
  17441. <Comment></Comment>
  17442. <Link1>http://www.altavista.com/</Link1>
  17443. <Link2></Link2>
  17444. </user-agent>
  17445. <user-agent>
  17446. <ID>id_n_s_1231</ID>
  17447. <String>Scooter/3.3_SF</String>
  17448. <Description>Altavista robot</Description>
  17449. <Type>R</Type>
  17450. <Comment></Comment>
  17451. <Link1>http://www.altavista.com/</Link1>
  17452. <Link2></Link2>
  17453. </user-agent>
  17454. <user-agent>
  17455. <ID>id_n_s_1234</ID>
  17456. <String>Scooter2_Mercator_x-x.0</String>
  17457. <Description>Altavista using Mercator robot</Description>
  17458. <Type>R</Type>
  17459. <Comment></Comment>
  17460. <Link1>http://www.altavista.com/</Link1>
  17461. <Link2>http://www.research.compaq.com/SRC/mercator/</Link2>
  17462. </user-agent>
  17463. <user-agent>
  17464. <ID>id_n_s_1204</ID>
  17465. <String>Scooter_bh0-3.0.3</String>
  17466. <Description>Altavista robot</Description>
  17467. <Type>R</Type>
  17468. <Comment></Comment>
  17469. <Link1>http://www.altavista.com/</Link1>
  17470. <Link2></Link2>
  17471. </user-agent>
  17472. <user-agent>
  17473. <ID>id_n_s_1205</ID>
  17474. <String>Scooter_trk3-3.0.3</String>
  17475. <Description>Altavista robot</Description>
  17476. <Type>R</Type>
  17477. <Comment></Comment>
  17478. <Link1>http://www.altavista.com/</Link1>
  17479. <Link2></Link2>
  17480. </user-agent>
  17481. <user-agent>
  17482. <ID>id_n_s_190306_3</ID>
  17483. <String>Scope (Mars+)</String>
  17484. <Description>Scope Navigator mobile browser (Japan)</Description>
  17485. <Type>B</Type>
  17486. <Comment></Comment>
  17487. <Link1>http://www.programmer.co.jp/scope.shtml</Link1>
  17488. <Link2></Link2>
  17489. </user-agent>
  17490. <user-agent>
  17491. <ID>id_n_s_1235</ID>
  17492. <String>ScoutAbout</String>
  17493. <Description>Some nec.com robot using Research Republic ScoutAbout Research Tool</Description>
  17494. <Type>R</Type>
  17495. <Comment></Comment>
  17496. <Link1>http://www.researchrepublic.com/</Link1>
  17497. <Link2></Link2>
  17498. </user-agent>
  17499. <user-agent>
  17500. <ID>id_n_s_051207_4</ID>
  17501. <String>ScoutAnt/0.1; +http://www.ant.com/what_is_ant.com/</String>
  17502. <Description>Ant.com search robot</Description>
  17503. <Type>R</Type>
  17504. <Comment>66.230.171.17x</Comment>
  17505. <Link1>http://www.ant.com/</Link1>
  17506. <Link2></Link2>
  17507. </user-agent>
  17508. <user-agent>
  17509. <ID>id_n_s_271105_3</ID>
  17510. <String>scoutmaster</String>
  17511. <Description>ScoutMaster information retrieval software</Description>
  17512. <Type>R</Type>
  17513. <Comment></Comment>
  17514. <Link1>http://www.scoutmaster.de/</Link1>
  17515. <Link2></Link2>
  17516. </user-agent>
  17517. <user-agent>
  17518. <ID>id_n_s_1236</ID>
  17519. <String>Scrubby/2.x (http://www.scrubtheweb.com/)</String>
  17520. <Description>Scrub the web robot (66.93.156.xx)</Description>
  17521. <Type>R</Type>
  17522. <Comment>s.also Mozilla/5.0 (compatible; Scrubby/2.2 ...</Comment>
  17523. <Link1>http://www.scrubtheweb.com/</Link1>
  17524. <Link2></Link2>
  17525. </user-agent>
  17526. <user-agent>
  17527. <ID>id_n_s_030308_3</ID>
  17528. <String>Scrubby/3.0 (+http://www.scrubtheweb.com/help/technology.html)</String>
  17529. <Description>Scrub the web robot (66.93.156.xx)</Description>
  17530. <Type>R</Type>
  17531. <Comment>s.also Mozilla/5.0 (compatible; Scrubby/2.2 ...</Comment>
  17532. <Link1>http://www.scrubtheweb.com/</Link1>
  17533. <Link2></Link2>
  17534. </user-agent>
  17535. <user-agent>
  17536. <ID>id_n_s_1240</ID>
  17537. <String>Search+</String>
  17538. <Description>URL Search+ search software</Description>
  17539. <Type>R</Type>
  17540. <Comment></Comment>
  17541. <Link1>http://srchplus.chat.ru/index.htm</Link1>
  17542. <Link2></Link2>
  17543. </user-agent>
  17544. <user-agent>
  17545. <ID>id_n_s_110606_3</ID>
  17546. <String>Search-Engine-Studio</String>
  17547. <Description>Xtreem Search Engine Studio - SE software</Description>
  17548. <Type>R</Type>
  17549. <Comment></Comment>
  17550. <Link1>http://www.xtreeme.com/search-engine-studio/</Link1>
  17551. <Link2></Link2>
  17552. </user-agent>
  17553. <user-agent>
  17554. <ID>id_n_s_1237</ID>
  17555. <String>search.ch V1.4</String>
  17556. <Description>Search.ch robot</Description>
  17557. <Type>R</Type>
  17558. <Comment></Comment>
  17559. <Link1>http://www.search.ch/</Link1>
  17560. <Link2></Link2>
  17561. </user-agent>
  17562. <user-agent>
  17563. <ID>id_n_s_1238</ID>
  17564. <String>search.ch V1.4.2 (spiderman@search.ch; http://www.search.ch)</String>
  17565. <Description>Search.ch robot</Description>
  17566. <Type>R</Type>
  17567. <Comment></Comment>
  17568. <Link1>http://www.search.ch/</Link1>
  17569. <Link2></Link2>
  17570. </user-agent>
  17571. <user-agent>
  17572. <ID>id_n_s_1239</ID>
  17573. <String>Search/1.0 (http://www.innerprise.net/es-spider.asp)</String>
  17574. <Description>Enterprise Search web indexing / site searching tool</Description>
  17575. <Type>R</Type>
  17576. <Comment></Comment>
  17577. <Link1>http://www.innerprise.net/es-bi.asp</Link1>
  17578. <Link2></Link2>
  17579. </user-agent>
  17580. <user-agent>
  17581. <ID>id_n_s_1241</ID>
  17582. <String>searchbot admin@google.com</String>
  17583. <Description>Unknown robot  / website grabber from Chinatelecom (219.142.78.xxx)</Description>
  17584. <Type>S</Type>
  17585. <Comment></Comment>
  17586. <Link1></Link1>
  17587. <Link2></Link2>
  17588. </user-agent>
  17589. <user-agent>
  17590. <ID>id_n_s_1242</ID>
  17591. <String>SearchByUsa/2 (SearchByUsa; http://www.SearchByUsa.com/bot.html; info@SearchByUsa.com)</String>
  17592. <Description>SearchByUSA robot (69.150.7.xxx)</Description>
  17593. <Type>R</Type>
  17594. <Comment></Comment>
  17595. <Link1>http://www.searchbyusa.com/</Link1>
  17596. <Link2></Link2>
  17597. </user-agent>
  17598. <user-agent>
  17599. <ID>id_n_s_231006_1</ID>
  17600. <String>SearchdayBot</String>
  17601. <Description>Searchday (Germany) search robot</Description>
  17602. <Type>R</Type>
  17603. <Comment>85.25.131.1xx</Comment>
  17604. <Link1>http://www.searchday.de/</Link1>
  17605. <Link2></Link2>
  17606. </user-agent>
  17607. <user-agent>
  17608. <ID>id_n_s_1243</ID>
  17609. <String>SearchExpress Spider0.99</String>
  17610. <Description>Searchexpress spider</Description>
  17611. <Type>R</Type>
  17612. <Comment></Comment>
  17613. <Link1>http://www.searchexpress.com/</Link1>
  17614. <Link2></Link2>
  17615. </user-agent>
  17616. <user-agent>
  17617. <ID>id_n_s_1245</ID>
  17618. <String>SearchGuild/DMOZ/Experiment (searchguild@gmail.com)</String>
  17619. <Description>Searchguild forum &amp; directory robot (81.3.75.xxx)</Description>
  17620. <Type>R</Type>
  17621. <Comment></Comment>
  17622. <Link1>http://searchguild.com/</Link1>
  17623. <Link2></Link2>
  17624. </user-agent>
  17625. <user-agent>
  17626. <ID>id_n_s_1244</ID>
  17627. <String>SearchGuild_DMOZ_Experiment (chris@searchguild.com)</String>
  17628. <Description>Searchguild forum &amp; directory robot (81.3.75.xxx)</Description>
  17629. <Type>R</Type>
  17630. <Comment></Comment>
  17631. <Link1>http://searchguild.com/</Link1>
  17632. <Link2></Link2>
  17633. </user-agent>
  17634. <user-agent>
  17635. <ID>id_n_s_1246</ID>
  17636. <String>Searchit-Now Robot/2.2 (+http://www.searchit-now.co.uk)</String>
  17637. <Description>Searchit robot (69.93.107.xx)</Description>
  17638. <Type>R</Type>
  17639. <Comment></Comment>
  17640. <Link1>http://www.searchit-now.co.uk</Link1>
  17641. <Link2></Link2>
  17642. </user-agent>
  17643. <user-agent>
  17644. <ID>id_n_s_220906_3</ID>
  17645. <String>Searchmee! Spider v0.98a</String>
  17646. <Description>Searchmee!  Search Engine (prototype) robot by findanisp.com</Description>
  17647. <Type>R</Type>
  17648. <Comment>64.202.100.</Comment>
  17649. <Link1>http://www.searchmee.com/</Link1>
  17650. <Link2></Link2>
  17651. </user-agent>
  17652. <user-agent>
  17653. <ID>id_n_s_100506_1</ID>
  17654. <String>SearchSight/2.0 (http://SearchSight.com/)</String>
  17655. <Description>SearchSight search robot</Description>
  17656. <Type>R</Type>
  17657. <Comment></Comment>
  17658. <Link1>http://searchsight.com/</Link1>
  17659. <Link2></Link2>
  17660. </user-agent>
  17661. <user-agent>
  17662. <ID>id_n_s_1247</ID>
  17663. <String>SearchSpider.com/1.1</String>
  17664. <Description>SearchSpider robot</Description>
  17665. <Type>R</Type>
  17666. <Comment></Comment>
  17667. <Link1>http://www.searchspider.com/</Link1>
  17668. <Link2></Link2>
  17669. </user-agent>
  17670. <user-agent>
  17671. <ID>id_n_s_1248</ID>
  17672. <String>Searchspider/1.2 (SearchSpider; http://www.searchspider.com; webmaster@searchspider.com)</String>
  17673. <Description>SearchSpider robot</Description>
  17674. <Type>R</Type>
  17675. <Comment></Comment>
  17676. <Link1>http://www.searchspider.com/</Link1>
  17677. <Link2></Link2>
  17678. </user-agent>
  17679. <user-agent>
  17680. <ID>id_n_s_1249</ID>
  17681. <String>SearchTone2.0 - IDEARE</String>
  17682. <Description>Janas (Ideare.com / Tiscali.it) robot</Description>
  17683. <Type>R</Type>
  17684. <Comment></Comment>
  17685. <Link1>http://www.ideare.com/</Link1>
  17686. <Link2>http://www.tiscali.it</Link2>
  17687. </user-agent>
  17688. <user-agent>
  17689. <ID>id_n_s_1250</ID>
  17690. <String>Seekbot/1.0 (http://www.seekbot.net/bot.html) HTTPFetcher/0.3</String>
  17691. <Description>seekport. beta search (Germany) robot</Description>
  17692. <Type>R</Type>
  17693. <Comment>195.27.215.xx</Comment>
  17694. <Link1>http://www.seekbot.net/</Link1>
  17695. <Link2></Link2>
  17696. </user-agent>
  17697. <user-agent>
  17698. <ID>id_n_s_1251</ID>
  17699. <String>Seekbot/1.0 (http://www.seekbot.net/bot.html) RobotsTxtFetcher/1.0 (XDF)</String>
  17700. <Description>seekport. beta search (Germany) robot</Description>
  17701. <Type>R</Type>
  17702. <Comment>195.27.215.xx</Comment>
  17703. <Link1>http://www.seekbot.net/</Link1>
  17704. <Link2></Link2>
  17705. </user-agent>
  17706. <user-agent>
  17707. <ID>id_n_s_1252</ID>
  17708. <String>Seekbot/1.0 (http://www.seekbot.net/bot.html) RobotsTxtFetcher/1.2</String>
  17709. <Description>seekport. beta search (Germany) robot</Description>
  17710. <Type>R</Type>
  17711. <Comment>195.27.215.xx</Comment>
  17712. <Link1>http://www.seekbot.net/</Link1>
  17713. <Link2></Link2>
  17714. </user-agent>
  17715. <user-agent>
  17716. <ID>id_n_s_1253</ID>
  17717. <String>Seeker.lookseek.com</String>
  17718. <Description>Lookseek search robot / link checking</Description>
  17719. <Type>R</Type>
  17720. <Comment>12.199.64.xx</Comment>
  17721. <Link1>http://www.lookseek.com/</Link1>
  17722. <Link2></Link2>
  17723. </user-agent>
  17724. <user-agent>
  17725. <ID>id_n_s_011006_3</ID>
  17726. <String>semaforo.net</String>
  17727. <Description>semaforo.net web filtering software</Description>
  17728. <Type>P</Type>
  17729. <Comment></Comment>
  17730. <Link1>http://www.semaforo.net/en/default.htm</Link1>
  17731. <Link2></Link2>
  17732. </user-agent>
  17733. <user-agent>
  17734. <ID>id_n_s_020807_2</ID>
  17735. <String>Semager/1.1 (http://www.semager.de/blog/semager-bots/)</String>
  17736. <Description>Semager.de (was NG-Search) semantic search - Germany</Description>
  17737. <Type>R</Type>
  17738. <Comment>212.114.209.2xx</Comment>
  17739. <Link1>http://www.semager.de/</Link1>
  17740. <Link2>http://www.semager.de/blog/semager-bots/</Link2>
  17741. </user-agent>
  17742. <user-agent>
  17743. <ID>id_n_s_230507_2</ID>
  17744. <String>Semager/1.x (http://www.semager.de)</String>
  17745. <Description>Semager.de (was NG-Search) semantic search - Germany</Description>
  17746. <Type>R</Type>
  17747. <Comment>212.114.209.2xx</Comment>
  17748. <Link1>http://www.semager.de/</Link1>
  17749. <Link2>http://www.semager.de/blog/semager-bots/</Link2>
  17750. </user-agent>
  17751. <user-agent>
  17752. <ID>id_n_s_1254</ID>
  17753. <String>semanticdiscovery/0.x</String>
  17754. <Description>Semantic Discovery domain checking tool</Description>
  17755. <Type>R C</Type>
  17756. <Comment></Comment>
  17757. <Link1>http://www.semanticdiscovery.com/products.html</Link1>
  17758. <Link2></Link2>
  17759. </user-agent>
  17760. <user-agent>
  17761. <ID>id_n_s_1255</ID>
  17762. <String>Sensis Web Crawler (search_comments\at\sensis\dot\com\dot\au)</String>
  17763. <Description>Sensis Australia search robot</Description>
  17764. <Type>R</Type>
  17765. <Comment></Comment>
  17766. <Link1>http://www.sensis.com.au/</Link1>
  17767. <Link2></Link2>
  17768. </user-agent>
  17769. <user-agent>
  17770. <ID>id_n_s_1256</ID>
  17771. <String>Sensis.com.au Web Crawler (search_comments\at\sensis\dot\com\dot\au)</String>
  17772. <Description>Sensis Australia search robot</Description>
  17773. <Type>R</Type>
  17774. <Comment></Comment>
  17775. <Link1>http://www.sensis.com.au/</Link1>
  17776. <Link2></Link2>
  17777. </user-agent>
  17778. <user-agent>
  17779. <ID>id_n_s_1257</ID>
  17780. <String>SeznamBot/1.0</String>
  17781. <Description>Seznam Search (Czech Republic) robot</Description>
  17782. <Type>R</Type>
  17783. <Comment>212.80.76.xx</Comment>
  17784. <Link1>http://www.seznam.cz/</Link1>
  17785. <Link2></Link2>
  17786. </user-agent>
  17787. <user-agent>
  17788. <ID>id_n_s_1258</ID>
  17789. <String>SeznamBot/1.0 (+http://fulltext.seznam.cz/)</String>
  17790. <Description>Seznam Search (Czech Republic) robot</Description>
  17791. <Type>R</Type>
  17792. <Comment>212.80.76.xx</Comment>
  17793. <Link1>http://www.seznam.cz/</Link1>
  17794. <Link2></Link2>
  17795. </user-agent>
  17796. <user-agent>
  17797. <ID>id_n_s_080907_2</ID>
  17798. <String>SeznamBot/2.0-test (+http://fulltext.sblog.cz/)</String>
  17799. <Description>Seznam Search (Czech Republic) robot</Description>
  17800. <Type>R</Type>
  17801. <Comment>212.80.76.xx</Comment>
  17802. <Link1>http://www.seznam.cz/</Link1>
  17803. <Link2></Link2>
  17804. </user-agent>
  17805. <user-agent>
  17806. <ID>id_n_s_280208_2</ID>
  17807. <String>ShablastBot 1.0</String>
  17808. <Description>Unknown robot from Shablast.com - Website has no content - Ignores robots.txt</Description>
  17809. <Type>S</Type>
  17810. <Comment>67.228.100.1xx / 67.228.102.2xx</Comment>
  17811. <Link1>http://shablast.com/</Link1>
  17812. <Link2></Link2>
  17813. </user-agent>
  17814. <user-agent>
  17815. <ID>id_n_s_1259</ID>
  17816. <String>Shareaza v1.x.x.xx</String>
  17817. <Description>Shareaza P2P peer-to-peer download client</Description>
  17818. <Type>D B</Type>
  17819. <Comment></Comment>
  17820. <Link1>http://www.shareaza.com/</Link1>
  17821. <Link2></Link2>
  17822. </user-agent>
  17823. <user-agent>
  17824. <ID>id_n_s_1260</ID>
  17825. <String>SharewarePlazaFileCheckBot/1.0+(+http://www.SharewarePlaza.com)</String>
  17826. <Description>SharewarePlaza File Check Bot - link checking</Description>
  17827. <Type>R C</Type>
  17828. <Comment></Comment>
  17829. <Link1>http://www.sharewareplaza.com/</Link1>
  17830. <Link2></Link2>
  17831. </user-agent>
  17832. <user-agent>
  17833. <ID>id_n_s_1261</ID>
  17834. <String>Shim Crawler</String>
  17835. <Description>Chikayama-Taura Lab Shim-Crawler used for The Kototoi Project (Japan) - (133.11.36.xx)</Description>
  17836. <Type>R</Type>
  17837. <Comment>s. also Shim-Crawler ...</Comment>
  17838. <Link1>http://www.logos.ic.i.u-tokyo.ac.jp/crawler/index.en.html</Link1>
  17839. <Link2>http://www.kototoi.org/index.html</Link2>
  17840. </user-agent>
  17841. <user-agent>
  17842. <ID>id_n_s_240106_2</ID>
  17843. <String>Shim-Crawler(Mozilla-compatible; http://www.logos.ic.i.u-tokyo.ac.jp/crawler/; crawl@logos.ic.i.u-tokyo.ac.jp)</String>
  17844. <Description>Chikayama-Taura Lab Shim-Crawler used for The Kototoi Project (Japan) - (133.11.36.xx)</Description>
  17845. <Type>R</Type>
  17846. <Comment>s. also Shim Crawler</Comment>
  17847. <Link1>http://www.logos.ic.i.u-tokyo.ac.jp/crawler/index.en.html</Link1>
  17848. <Link2>http://www.kototoi.org/index.html</Link2>
  17849. </user-agent>
  17850. <user-agent>
  17851. <ID>id_n_s_131205_1</ID>
  17852. <String>ShopWiki/1.0 ( +http://www.shopwiki.com/)</String>
  17853. <Description>ShopWiki shopping search based on LittleWiki search</Description>
  17854. <Type>R</Type>
  17855. <Comment>4.78.166.1xx</Comment>
  17856. <Link1>http://www.shopwiki.com/</Link1>
  17857. <Link2>http://dev.littlewiki.com/wiki/Home</Link2>
  17858. </user-agent>
  17859. <user-agent>
  17860. <ID>id_n_s_250706_1</ID>
  17861. <String>ShopWiki/1.0 ( +http://www.shopwiki.com/wiki/Help:Bot)</String>
  17862. <Description>ShopWiki shopping search based on LittleWiki search</Description>
  17863. <Type>R</Type>
  17864. <Comment>4.78.166.1xx</Comment>
  17865. <Link1>http://www.shopwiki.com/</Link1>
  17866. <Link2>http://dev.littlewiki.com/wiki/Home</Link2>
  17867. </user-agent>
  17868. <user-agent>
  17869. <ID>id_n_s_1262</ID>
  17870. <String>Shoula.com Crawler 2.0</String>
  17871. <Description>Shoula Search Engine crawler</Description>
  17872. <Type>R</Type>
  17873. <Comment></Comment>
  17874. <Link1>http://www.shoula.com/</Link1>
  17875. <Link2></Link2>
  17876. </user-agent>
  17877. <user-agent>
  17878. <ID>id_n_s_230107_1</ID>
  17879. <String>SietsCrawler/1.1 (+http://www.siets.biz)</String>
  17880. <Description>Siets Crawler - Web based site crawling application</Description>
  17881. <Type>R</Type>
  17882. <Comment></Comment>
  17883. <Link1>http://www.siets.biz/products/crawler/</Link1>
  17884. <Link2></Link2>
  17885. </user-agent>
  17886. <user-agent>
  17887. <ID>id_n_s_070308_1</ID>
  17888. <String>Sigram/Nutch-1.0-dev (Test agent for Nutch development; http://www.sigram.com/bot.html; bot at sigram dot com)</String>
  17889. <Description>Sigram's Nutch robot - crawler testing</Description>
  17890. <Type>R</Type>
  17891. <Comment></Comment>
  17892. <Link1>http://www.sigram.com/bot.html</Link1>
  17893. <Link2></Link2>
  17894. </user-agent>
  17895. <user-agent>
  17896. <ID>id_n_s_050906_1</ID>
  17897. <String>Siigle Orumcex v.001 Turkey (http://www.siigle.com)</String>
  17898. <Description>Siigle search (Turkey) robot</Description>
  17899. <Type>R</Type>
  17900. <Comment>62.68.196.xx</Comment>
  17901. <Link1>http://www.siigle.com/</Link1>
  17902. <Link2></Link2>
  17903. </user-agent>
  17904. <user-agent>
  17905. <ID>id_n_s_171006_1</ID>
  17906. <String>silk/1.0</String>
  17907. <Description>Slider Search directory robot (194.213.194.2xx)</Description>
  17908. <Type>R</Type>
  17909. <Comment>s. also Slider_Search...</Comment>
  17910. <Link1>http://www.slider.com/index.html</Link1>
  17911. <Link2></Link2>
  17912. </user-agent>
  17913. <user-agent>
  17914. <ID>id_n_s_281205_1</ID>
  17915. <String>silk/1.0 (+http://www.slider.com/silk.htm)/3.7</String>
  17916. <Description>Slider Search directory robot (194.213.194.2xx)</Description>
  17917. <Type>R</Type>
  17918. <Comment>s. also Slider_Search...</Comment>
  17919. <Link1>http://www.slider.com/index.html</Link1>
  17920. <Link2></Link2>
  17921. </user-agent>
  17922. <user-agent>
  17923. <ID>id_n_s_131206_2</ID>
  17924. <String>SimpleFavPanel/1.2</String>
  17925. <Description>SimpleFavPanel - IE newsfeed panel plugin</Description>
  17926. <Type>B</Type>
  17927. <Comment></Comment>
  17928. <Link1>http://www.egrath.net/index.php?ExplorerBarPlus%2F%A5%D1%A5%CD%A5%EB%B0%EC%CD%F7%2FSimpleFavPanel</Link1>
  17929. <Link2></Link2>
  17930. </user-agent>
  17931. <user-agent>
  17932. <ID>id_n_s_1263</ID>
  17933. <String>Simpy 1.x; http://www.simpy.com/</String>
  17934. <Description>Simpy bookmarking and personal search engine</Description>
  17935. <Type>R C</Type>
  17936. <Comment>s. also Argus</Comment>
  17937. <Link1>http://www.simpy.com/</Link1>
  17938. <Link2></Link2>
  17939. </user-agent>
  17940. <user-agent>
  17941. <ID>id_n_s_1264</ID>
  17942. <String>Simpy/1.x (Simpy; http://www.simpy.com/?ref=bot; feedback at simpy dot com)</String>
  17943. <Description>Simpy bookmarking and personal search engine</Description>
  17944. <Type>R C</Type>
  17945. <Comment>s. also Argus</Comment>
  17946. <Link1>http://www.simpy.com/</Link1>
  17947. <Link2></Link2>
  17948. </user-agent>
  17949. <user-agent>
  17950. <ID>id_n_s_180707_2</ID>
  17951. <String>Sirketcebot/v.01 (http://www.sirketce.com/bot.html)</String>
  17952. <Description>Sirket&#231;e search - Turkey</Description>
  17953. <Type>R</Type>
  17954. <Comment>88.255.173.xx</Comment>
  17955. <Link1>http://www.sirketce.com/</Link1>
  17956. <Link2></Link2>
  17957. </user-agent>
  17958. <user-agent>
  17959. <ID>id_n_s_070207_3</ID>
  17960. <String>SiteBar/3.x.x (Bookmark Server; http://sitebar.org/)</String>
  17961. <Description>SiteBar online bookmark manager</Description>
  17962. <Type>C</Type>
  17963. <Comment></Comment>
  17964. <Link1>http://sitebar.org/</Link1>
  17965. <Link2></Link2>
  17966. </user-agent>
  17967. <user-agent>
  17968. <ID>id_n_s_1265</ID>
  17969. <String>SiteBar/x.x</String>
  17970. <Description>SiteBar bookmark server</Description>
  17971. <Type>C</Type>
  17972. <Comment></Comment>
  17973. <Link1>http://sitebar.sourceforge.net/</Link1>
  17974. <Link2></Link2>
  17975. </user-agent>
  17976. <user-agent>
  17977. <ID>id_n_s_1266</ID>
  17978. <String>SiteBar/x.x.x (Bookmark Server; http://sitebar.org/)</String>
  17979. <Description>SiteBar bookmark server</Description>
  17980. <Type>C</Type>
  17981. <Comment></Comment>
  17982. <Link1>http://sitebar.sourceforge.net/</Link1>
  17983. <Link2></Link2>
  17984. </user-agent>
  17985. <user-agent>
  17986. <ID>id_n_s_1267</ID>
  17987. <String>sitecheck.internetseer.com</String>
  17988. <Description>Internetseer Web Site Monitoring / Claymont robot</Description>
  17989. <Type>R C</Type>
  17990. <Comment></Comment>
  17991. <Link1>http://www.internetseer.com/</Link1>
  17992. <Link2>http://www.claymont.com/</Link2>
  17993. </user-agent>
  17994. <user-agent>
  17995. <ID>id_n_s_1268</ID>
  17996. <String>sitecheck.internetseer.com (For more info see: http://sitecheck.internetseer.com)</String>
  17997. <Description>Internetseer Web Site Monitoring</Description>
  17998. <Type>R C</Type>
  17999. <Comment></Comment>
  18000. <Link1>http://www.internetseer.com/</Link1>
  18001. <Link2></Link2>
  18002. </user-agent>
  18003. <user-agent>
  18004. <ID>id_n_s_1269</ID>
  18005. <String>SiteRecon+(xx)</String>
  18006. <Description>SiteRecon website monitoring spider at xx minute intervals</Description>
  18007. <Type>R C</Type>
  18008. <Comment></Comment>
  18009. <Link1>http://www.siterecon.com/</Link1>
  18010. <Link2></Link2>
  18011. </user-agent>
  18012. <user-agent>
  18013. <ID>id_n_s_1270</ID>
  18014. <String>SiteSnagger</String>
  18015. <Description>PC Magazine web site download manager</Description>
  18016. <Type>D</Type>
  18017. <Comment></Comment>
  18018. <Link1>http://www.zdnet.com/pcmag/pctech/content/17/04/ut1704.001.html</Link1>
  18019. <Link2></Link2>
  18020. </user-agent>
  18021. <user-agent>
  18022. <ID>id_n_s_1271</ID>
  18023. <String>SiteSpider +(http://www.SiteSpider.com/)</String>
  18024. <Description>Site Spider robot (66.249.17.xx)</Description>
  18025. <Type>R</Type>
  18026. <Comment></Comment>
  18027. <Link1>http://www.SiteSpider.com/</Link1>
  18028. <Link2></Link2>
  18029. </user-agent>
  18030. <user-agent>
  18031. <ID>id_n_s_021205_3</ID>
  18032. <String>SiteSucker/1.x.x</String>
  18033. <Description>SiteSucker Mac website downloading tool</Description>
  18034. <Type>D</Type>
  18035. <Comment></Comment>
  18036. <Link1>http://www.sitesucker.us/</Link1>
  18037. <Link2></Link2>
  18038. </user-agent>
  18039. <user-agent>
  18040. <ID>id_n_s_140306_2</ID>
  18041. <String>SiteTaggerBot (http://www.sitetagger.com/bot.htm)</String>
  18042. <Description>SiteTagger.com bookmark organizer</Description>
  18043. <Type>C</Type>
  18044. <Comment></Comment>
  18045. <Link1>http://www.sitetagger.com/</Link1>
  18046. <Link2></Link2>
  18047. </user-agent>
  18048. <user-agent>
  18049. <ID>id_n_s_030407_1</ID>
  18050. <String>SiteTruth.com site rating system</String>
  18051. <Description>SiteTruth - Automatic site legitimacy rating system</Description>
  18052. <Type>R</Type>
  18053. <Comment>69.64.67.xx</Comment>
  18054. <Link1>http://www.sitetruth.com/</Link1>
  18055. <Link2></Link2>
  18056. </user-agent>
  18057. <user-agent>
  18058. <ID>id_n_s_1272</ID>
  18059. <String>SiteWinder</String>
  18060. <Description>Webwasher.com (217.146.159.xx) internet filter</Description>
  18061. <Type>B P</Type>
  18062. <Comment></Comment>
  18063. <Link1>http://www.webwasher.com/</Link1>
  18064. <Link2></Link2>
  18065. </user-agent>
  18066. <user-agent>
  18067. <ID>id_n_s_1273</ID>
  18068. <String>SiteXpert</String>
  18069. <Description>Xtreeme SiteXpert sitemap &amp; search engine builder</Description>
  18070. <Type>R</Type>
  18071. <Comment></Comment>
  18072. <Link1>http://www.xtreeme.com/sitexpert/index.php</Link1>
  18073. <Link2></Link2>
  18074. </user-agent>
  18075. <user-agent>
  18076. <ID>id_n_s_1274</ID>
  18077. <String>Skampy/0.9.x (http://www.skaffe.com/skampy-info.html)</String>
  18078. <Description>Skaffe.com directory link checker</Description>
  18079. <Type>R</Type>
  18080. <Comment></Comment>
  18081. <Link1>http://www.skaffe.com/</Link1>
  18082. <Link2></Link2>
  18083. </user-agent>
  18084. <user-agent>
  18085. <ID>id_n_s_1275</ID>
  18086. <String>Skimpy/0.x (http://www.skaffe.com/skampy-info.html)</String>
  18087. <Description>Skaffe.com directory link checker</Description>
  18088. <Type>R</Type>
  18089. <Comment></Comment>
  18090. <Link1>http://www.skaffe.com/</Link1>
  18091. <Link2></Link2>
  18092. </user-agent>
  18093. <user-agent>
  18094. <ID>id_n_s_090706_1</ID>
  18095. <String>Skywalker/0.1 (Skywalker; anonymous; anonymous)</String>
  18096. <Description>Visvo distributed website crawler based on Nutch</Description>
  18097. <Type>R</Type>
  18098. <Comment>63.133.162.xx</Comment>
  18099. <Link1>http://www.visvo.com/bot.html</Link1>
  18100. <Link2></Link2>
  18101. </user-agent>
  18102. <user-agent>
  18103. <ID>id_n_s_1276</ID>
  18104. <String>Slarp/0.1</String>
  18105. <Description>Only.com robot</Description>
  18106. <Type>R</Type>
  18107. <Comment></Comment>
  18108. <Link1>http://www.only.com/</Link1>
  18109. <Link2></Link2>
  18110. </user-agent>
  18111. <user-agent>
  18112. <ID>id_n_s_1277</ID>
  18113. <String>Sleipnir</String>
  18114. <Description>Sleipnir - Japanese Explorer based browser &amp; search bar</Description>
  18115. <Type>B</Type>
  18116. <Comment></Comment>
  18117. <Link1>http://www20.pos.to/~sleipnir/software/sleipnir/index.html</Link1>
  18118. <Link2></Link2>
  18119. </user-agent>
  18120. <user-agent>
  18121. <ID>id_n_s_1278</ID>
  18122. <String>Sleipnir Version 1.xx</String>
  18123. <Description>Sleipnir - Japanese Explorer based browser &amp; search bar</Description>
  18124. <Type>B</Type>
  18125. <Comment></Comment>
  18126. <Link1>http://www20.pos.to/~sleipnir/software/sleipnir/index.html</Link1>
  18127. <Link2></Link2>
  18128. </user-agent>
  18129. <user-agent>
  18130. <ID>id_n_s_170207_5</ID>
  18131. <String>Sleipnir Version2.x</String>
  18132. <Description>Sleipnir - Japanese Explorer based browser &amp; search bar</Description>
  18133. <Type>B</Type>
  18134. <Comment></Comment>
  18135. <Link1>http://www20.pos.to/~sleipnir/software/sleipnir/index.html</Link1>
  18136. <Link2></Link2>
  18137. </user-agent>
  18138. <user-agent>
  18139. <ID>id_n_s_260706_1</ID>
  18140. <String>Sleipnir/2.xx</String>
  18141. <Description>Sleipnir - Japanese Explorer based browser &amp; search bar</Description>
  18142. <Type>B</Type>
  18143. <Comment></Comment>
  18144. <Link1>http://www20.pos.to/~sleipnir/software/sleipnir/index.html</Link1>
  18145. <Link2></Link2>
  18146. </user-agent>
  18147. <user-agent>
  18148. <ID>id_n_s_1279</ID>
  18149. <String>Slider_Search_v1-de</String>
  18150. <Description>Slider Search directory robot (194.213.194.2xx)</Description>
  18151. <Type>R</Type>
  18152. <Comment>s. also silk/1.0...</Comment>
  18153. <Link1>http://www.slider.com/index.html</Link1>
  18154. <Link2></Link2>
  18155. </user-agent>
  18156. <user-agent>
  18157. <ID>id_n_s_1280</ID>
  18158. <String>SlimBrowser</String>
  18159. <Description>Slim Browser (IE based browser) - uses this user agent for favicon.ico only</Description>
  18160. <Type>B</Type>
  18161. <Comment></Comment>
  18162. <Link1>http://www.flashpeak.com/sbrowser/</Link1>
  18163. <Link2></Link2>
  18164. </user-agent>
  18165. <user-agent>
  18166. <ID>id_n_s_1281</ID>
  18167. <String>Slurp/2.0 (slurp@inktomi.com; http://www.inktomi.com/slurp.html)</String>
  18168. <Description>Inktomi (Hotbot-Lycos-NBCi) robot</Description>
  18169. <Type>R</Type>
  18170. <Comment></Comment>
  18171. <Link1>http://www.inktomi.com/slurp.html</Link1>
  18172. <Link2></Link2>
  18173. </user-agent>
  18174. <user-agent>
  18175. <ID>id_n_s_1282</ID>
  18176. <String>Slurp/2.0-KiteWeekly (slurp@inktomi.com; http://www.inktomi.com/slurp.html)</String>
  18177. <Description>Inktomi (Hotbot-Lycos-NBCi) robot</Description>
  18178. <Type>R</Type>
  18179. <Comment></Comment>
  18180. <Link1>http://www.inktomi.com/slurp.html</Link1>
  18181. <Link2></Link2>
  18182. </user-agent>
  18183. <user-agent>
  18184. <ID>id_n_s_1283</ID>
  18185. <String>Slurp/si (slurp@inktomi.com; http://www.inktomi.com/slurp.html)</String>
  18186. <Description>Inktomi (Hotbot-Lycos-NBCi) robot</Description>
  18187. <Type>R</Type>
  18188. <Comment></Comment>
  18189. <Link1>http://www.inktomi.com/slurp.html</Link1>
  18190. <Link2></Link2>
  18191. </user-agent>
  18192. <user-agent>
  18193. <ID>id_n_s_240806_1</ID>
  18194. <String>Slurpy Verifier/1.0</String>
  18195. <Description>Inktomi (Hotbot-Lycos-NBCi) robot - 72.30.61.xx(x)</Description>
  18196. <Type>R</Type>
  18197. <Comment>s. also Mozilla/3.0 (Slurp/.....</Comment>
  18198. <Link1>http://www.inktomi.com/</Link1>
  18199. <Link2></Link2>
  18200. </user-agent>
  18201. <user-agent>
  18202. <ID>id_n_s_1284</ID>
  18203. <String>SlySearch (slysearch@slysearch.com)</String>
  18204. <Description>Slysearch robot (now Turnitin robot)</Description>
  18205. <Type>R</Type>
  18206. <Comment></Comment>
  18207. <Link1>http://www.slysearch.com/</Link1>
  18208. <Link2></Link2>
  18209. </user-agent>
  18210. <user-agent>
  18211. <ID>id_n_s_1285</ID>
  18212. <String>SlySearch/1.0 http://www.plagiarism.org/crawler/robotinfo.html</String>
  18213. <Description>Slysearch robot (now Turnitin robot)</Description>
  18214. <Type>R</Type>
  18215. <Comment></Comment>
  18216. <Link1>http://www.slysearch.com/</Link1>
  18217. <Link2></Link2>
  18218. </user-agent>
  18219. <user-agent>
  18220. <ID>id_n_s_1286</ID>
  18221. <String>SlySearch/1.x http://www.slysearch.com</String>
  18222. <Description>Slysearch robot (now Turnitin robot)</Description>
  18223. <Type>R</Type>
  18224. <Comment></Comment>
  18225. <Link1>http://www.slysearch.com/</Link1>
  18226. <Link2></Link2>
  18227. </user-agent>
  18228. <user-agent>
  18229. <ID>id_n_s_1287</ID>
  18230. <String>SmartDownload/1.2.67 (Win32; Jan 12 1999)</String>
  18231. <Description>Netzip/Smartdownload download manager</Description>
  18232. <Type>D</Type>
  18233. <Comment></Comment>
  18234. <Link1>http://www.netzip.com/</Link1>
  18235. <Link2></Link2>
  18236. </user-agent>
  18237. <user-agent>
  18238. <ID>id_n_s_1288</ID>
  18239. <String>SmartDownload/1.2.77 (Win32; Feb 1 2000)</String>
  18240. <Description>Netzip/Smartdownload download manager</Description>
  18241. <Type>D</Type>
  18242. <Comment></Comment>
  18243. <Link1>http://www.netzip.com/</Link1>
  18244. <Link2></Link2>
  18245. </user-agent>
  18246. <user-agent>
  18247. <ID>id_n_s_1289</ID>
  18248. <String>SmartDownload/1.2.77 (Win32; Jun 19 2001)</String>
  18249. <Description>Netzip/Smartdownload download manager</Description>
  18250. <Type>D</Type>
  18251. <Comment></Comment>
  18252. <Link1>http://www.netzip.com/</Link1>
  18253. <Link2></Link2>
  18254. </user-agent>
  18255. <user-agent>
  18256. <ID>id_n_s_1290</ID>
  18257. <String>smartwit.com</String>
  18258. <Description>Loop Improvements NRS Enterprise search (69.44.155.xx[x])</Description>
  18259. <Type>R</Type>
  18260. <Comment></Comment>
  18261. <Link1>http://www.loopimprovements.com/</Link1>
  18262. <Link2>http://demo.loopimprovements.com/demo/</Link2>
  18263. </user-agent>
  18264. <user-agent>
  18265. <ID>id_n_s_020307_2</ID>
  18266. <String>SmiffyDCMetaSpider/1.0</String>
  18267. <Description>SmiffyDCMetaSpider - Robot to check the retro-adding of Dublin Core metadata</Description>
  18268. <Type>R</Type>
  18269. <Comment>64.71.152.xx</Comment>
  18270. <Link1>http://www.smiffysplace.com</Link1>
  18271. <Link2>http://www.smiffysplace.com/smiffydcmetaspider</Link2>
  18272. </user-agent>
  18273. <user-agent>
  18274. <ID>id_n_s_1291</ID>
  18275. <String>sna-0.0.1 (mikemuzio@msn.com)</String>
  18276. <Description>Snoopy PHP-client</Description>
  18277. <Type></Type>
  18278. <Comment>see Snoopy</Comment>
  18279. <Link1>http://sourceforge.net/projects/snoopy/</Link1>
  18280. <Link2></Link2>
  18281. </user-agent>
  18282. <user-agent>
  18283. <ID>id_n_s_1292</ID>
  18284. <String>sna-0.0.1 mikeelliott@hotmail.com</String>
  18285. <Description>Snoopy PHP-client</Description>
  18286. <Type></Type>
  18287. <Comment>see Snoopy</Comment>
  18288. <Link1>http://sourceforge.net/projects/snoopy/</Link1>
  18289. <Link2></Link2>
  18290. </user-agent>
  18291. <user-agent>
  18292. <ID>id_n_s_080106_1</ID>
  18293. <String>snap.com beta crawler v0</String>
  18294. <Description>Unknown bot from bb2.net (66.234.139.xxx) also as Snapbot/1.0</Description>
  18295. <Type>S</Type>
  18296. <Comment>Gets only the robots.txt - Not from Snap.com / Idealab (63.251.211.xxx)</Comment>
  18297. <Link1>http://www.kloth.net/internet/badbots.php</Link1>
  18298. <Link2></Link2>
  18299. </user-agent>
  18300. <user-agent>
  18301. <ID>id_n_s_250506_1</ID>
  18302. <String>Snapbot/1.0</String>
  18303. <Description>Unknown bot from bb2.net (66.234.139.xxx) - also as snap.com</Description>
  18304. <Type>S</Type>
  18305. <Comment>Not from Snap.com / Idealab (63.251.211.xxx)</Comment>
  18306. <Link1>http://www.kloth.net/internet/badbots.php</Link1>
  18307. <Link2></Link2>
  18308. </user-agent>
  18309. <user-agent>
  18310. <ID>id_n_s_250408_1</ID>
  18311. <String>Snapbot/1.0 (Snap Shots&#44; +http://www.snap.com)</String>
  18312. <Description>Unknown bot from Psinet / Cogentco - not from Snap.com</Description>
  18313. <Type>S</Type>
  18314. <Comment>38.98.19.6x</Comment>
  18315. <Link1></Link1>
  18316. <Link2></Link2>
  18317. </user-agent>
  18318. <user-agent>
  18319. <ID>id_n_s_270906_2</ID>
  18320. <String>Snappy/1.1 ( http://www.urltrends.com/ )</String>
  18321. <Description>My UrlTrends online web ranking service</Description>
  18322. <Type>C</Type>
  18323. <Comment>205.138.199.1xx / 209.85.36.x</Comment>
  18324. <Link1>http://www.urltrends.com/</Link1>
  18325. <Link2></Link2>
  18326. </user-agent>
  18327. <user-agent>
  18328. <ID>id_n_s_100707_1</ID>
  18329. <String>Snarfer/0.x.x (http://www.snarfware.com/)</String>
  18330. <Description>Snarfer RSS reader</Description>
  18331. <Type>B</Type>
  18332. <Comment></Comment>
  18333. <Link1>http://www.snarfware.com/</Link1>
  18334. <Link2></Link2>
  18335. </user-agent>
  18336. <user-agent>
  18337. <ID>id_n_s_1293</ID>
  18338. <String>SnoopRob/x.x</String>
  18339. <Description>Unknown robot from 217.229.156.xx (T-Online Germany)</Description>
  18340. <Type></Type>
  18341. <Comment></Comment>
  18342. <Link1></Link1>
  18343. <Link2></Link2>
  18344. </user-agent>
  18345. <user-agent>
  18346. <ID>id_n_s_1294</ID>
  18347. <String>Snoopy v1.xx</String>
  18348. <Description>Snoopy PHP-client</Description>
  18349. <Type></Type>
  18350. <Comment>s. also sna-x.x.x</Comment>
  18351. <Link1>http://sourceforge.net/projects/snoopy/</Link1>
  18352. <Link2></Link2>
  18353. </user-agent>
  18354. <user-agent>
  18355. <ID>id_n_s_1295</ID>
  18356. <String>Snoopy v1.xx- : User-Agent: Mozilla/4.0 (compatible; MSIE 6.0; Windows NT 5.1; MyIE2)</String>
  18357. <Description>Snoopy PHP-client</Description>
  18358. <Type></Type>
  18359. <Comment>s. also sna-x.x.x</Comment>
  18360. <Link1>http://sourceforge.net/projects/snoopy/</Link1>
  18361. <Link2></Link2>
  18362. </user-agent>
  18363. <user-agent>
  18364. <ID>id_n_s_1296</ID>
  18365. <String>Snoopy_v0.xx</String>
  18366. <Description>Snoopy PHP-client</Description>
  18367. <Type></Type>
  18368. <Comment>s. also sna-x.x.x</Comment>
  18369. <Link1>http://sourceforge.net/projects/snoopy/</Link1>
  18370. <Link2></Link2>
  18371. </user-agent>
  18372. <user-agent>
  18373. <ID>id_n_s_1297</ID>
  18374. <String>SnykeBot/0.6 (http://www.snyke.com)</String>
  18375. <Description>Snyke.com France robot</Description>
  18376. <Type>R</Type>
  18377. <Comment></Comment>
  18378. <Link1>http://www.snyke.com/</Link1>
  18379. <Link2></Link2>
  18380. </user-agent>
  18381. <user-agent>
  18382. <ID>id_n_s_250706_2</ID>
  18383. <String>SocSciBot ()</String>
  18384. <Description>Link crawler for the social sciences</Description>
  18385. <Type>R</Type>
  18386. <Comment></Comment>
  18387. <Link1>http://socscibot.wlv.ac.uk/</Link1>
  18388. <Link2></Link2>
  18389. </user-agent>
  18390. <user-agent>
  18391. <ID>id_n_s_170407_1</ID>
  18392. <String>SoftBank/1.0/812SH/SHJ001 Browser/NetFront/3.3 Profile/MIDP-2.0 Configuration/CLDC-1.1</String>
  18393. <Description>NetFront browser on Softbank mobile phone</Description>
  18394. <Type>B</Type>
  18395. <Comment></Comment>
  18396. <Link1>http://www.access-company.com/products/netfrontmobile/browser/index.html</Link1>
  18397. <Link2>http://mb.softbank.jp/mb/en/product/</Link2>
  18398. </user-agent>
  18399. <user-agent>
  18400. <ID>id_n_s_1298</ID>
  18401. <String>SoftHypermarketFileCheckBot/1.0+(+http://www.softhypermaket.com)</String>
  18402. <Description>Soft Hypermarket link checking</Description>
  18403. <Type>R</Type>
  18404. <Comment></Comment>
  18405. <Link1>http://www.softhypermarket.com/</Link1>
  18406. <Link2></Link2>
  18407. </user-agent>
  18408. <user-agent>
  18409. <ID>id_n_s_1299</ID>
  18410. <String>Softizerbot (http://www.softizer.com)</String>
  18411. <Description>Softizer.com software directory link checking</Description>
  18412. <Type>C</Type>
  18413. <Comment>72.9.97.xx</Comment>
  18414. <Link1>http://www.softizer.com/</Link1>
  18415. <Link2></Link2>
  18416. </user-agent>
  18417. <user-agent>
  18418. <ID>id_n_s_090208_1</ID>
  18419. <String>sogou develop spider</String>
  18420. <Description>Unknown UA from Chinanet (220.181.26.1xx) faking Sogou search robot</Description>
  18421. <Type>S</Type>
  18422. <Comment>s. also sohu agent &amp; Sogou web spider</Comment>
  18423. <Link1></Link1>
  18424. <Link2></Link2>
  18425. </user-agent>
  18426. <user-agent>
  18427. <ID>id_n_s_011207_2</ID>
  18428. <String>Sogou Orion spider/3.0(+http://www.sogou.com/docs/help/webmasters.htm#07)</String>
  18429. <Description>Unknown UA from Chinanet (220.181.18.xx) faking Sogou search robot</Description>
  18430. <Type>S</Type>
  18431. <Comment>s. also sohu agent &#44; Sogou web spider &amp; sogou develop spider</Comment>
  18432. <Link1></Link1>
  18433. <Link2></Link2>
  18434. </user-agent>
  18435. <user-agent>
  18436. <ID>id_n_s_150106_1</ID>
  18437. <String>sogou spider</String>
  18438. <Description>Unknown UA from Chinanet (220.181.26.1xx) faking Sogou search robot</Description>
  18439. <Type>S</Type>
  18440. <Comment>s. also sohu agent &#44; Sogou web spider &amp; sogou develop spider</Comment>
  18441. <Link1></Link1>
  18442. <Link2></Link2>
  18443. </user-agent>
  18444. <user-agent>
  18445. <ID>id_n_s_280407_1</ID>
  18446. <String>Sogou web spider/3.0(+http://www.sogou.com/docs/help/webmasters.htm#07)</String>
  18447. <Description>Unknown UA from Chinanet (220.181.26.1xx) faking Sogou search robot</Description>
  18448. <Type>S</Type>
  18449. <Comment>s. also sohu agent &#44; sogou spider &amp; sogou develop spider</Comment>
  18450. <Link1></Link1>
  18451. <Link2></Link2>
  18452. </user-agent>
  18453. <user-agent>
  18454. <ID>id_n_s_291105_1</ID>
  18455. <String>sohu agent</String>
  18456. <Description>Unknown UA from Chinanet (220.181.26.1xx) faking Sogou search robot</Description>
  18457. <Type>S</Type>
  18458. <Comment>s. also sogou spider &#44; Sogou web spider &amp; sogou develop spider</Comment>
  18459. <Link1></Link1>
  18460. <Link2></Link2>
  18461. </user-agent>
  18462. <user-agent>
  18463. <ID>id_n_s_1300</ID>
  18464. <String>sohu-search</String>
  18465. <Description>Sohu (Search Fox) search robot China (61.135.131.xxx)</Description>
  18466. <Type>R</Type>
  18467. <Comment>this UA also comes from 220.181.26.xxx (not Sohu's IP range) as spam bot - s. also sohu agent</Comment>
  18468. <Link1>http://www.sohu.com/</Link1>
  18469. <Link2></Link2>
  18470. </user-agent>
  18471. <user-agent>
  18472. <ID>id_n_s_160308_3</ID>
  18473. <String>Sosospider+(+http://help.soso.com/webspider.htm)</String>
  18474. <Description>SOSO search (China) spider</Description>
  18475. <Type>R</Type>
  18476. <Comment></Comment>
  18477. <Link1>http://www.soso.com/</Link1>
  18478. <Link2>http://help.soso.com/webspider.htm</Link2>
  18479. </user-agent>
  18480. <user-agent>
  18481. <ID>id_n_s_1301</ID>
  18482. <String>Space Bison/0.02 [fu] (Win67; X; SK)</String>
  18483. <Description>Default Proxomitron (discontinued) filtering proxy user agent identifier</Description>
  18484. <Type>P B</Type>
  18485. <Comment></Comment>
  18486. <Link1>http://duke.usask.ca/~macphed/prox/</Link1>
  18487. <Link2></Link2>
  18488. </user-agent>
  18489. <user-agent>
  18490. <ID>id_n_s_1302</ID>
  18491. <String>SpeedDownload/1.x</String>
  18492. <Description>Speed Download (Mac) download manager</Description>
  18493. <Type>D</Type>
  18494. <Comment></Comment>
  18495. <Link1>http://www.yazsoft.com/</Link1>
  18496. <Link2></Link2>
  18497. </user-agent>
  18498. <user-agent>
  18499. <ID>id_n_s_1303</ID>
  18500. <String>speedfind ramBot xtreme 8.1</String>
  18501. <Description>Speedfind.de robot</Description>
  18502. <Type>R</Type>
  18503. <Comment></Comment>
  18504. <Link1>http://www.speedfind.de/</Link1>
  18505. <Link2></Link2>
  18506. </user-agent>
  18507. <user-agent>
  18508. <ID>id_n_s_1304</ID>
  18509. <String>Speedy Spider (Beta/x.x; speedy@entireweb.com)</String>
  18510. <Description>Entireweb search robot</Description>
  18511. <Type>R</Type>
  18512. <Comment>62.13.25.2xx</Comment>
  18513. <Link1>http://www.entireweb.com/</Link1>
  18514. <Link2></Link2>
  18515. </user-agent>
  18516. <user-agent>
  18517. <ID>id_n_s_070906_1</ID>
  18518. <String>Speedy Spider (Entireweb; Beta/1.0; http://www.entireweb.com/about/search_tech/speedyspider/)</String>
  18519. <Description>Entireweb search spider</Description>
  18520. <Type>R</Type>
  18521. <Comment>62.13.25.2xx</Comment>
  18522. <Link1>http://www.entireweb.com/</Link1>
  18523. <Link2></Link2>
  18524. </user-agent>
  18525. <user-agent>
  18526. <ID>id_n_s_1305</ID>
  18527. <String>Speedy_Spider (http://www.entireweb.com)</String>
  18528. <Description>Entireweb search robot</Description>
  18529. <Type>R</Type>
  18530. <Comment>62.13.25.2xx</Comment>
  18531. <Link1>http://www.entireweb.com/</Link1>
  18532. <Link2></Link2>
  18533. </user-agent>
  18534. <user-agent>
  18535. <ID>id_n_s_050208_4</ID>
  18536. <String>Sphere Scout&#38;v4.0 - scout at sphere dot com</String>
  18537. <Description>Sphere blog and news search robot</Description>
  18538. <Type>R</Type>
  18539. <Comment>64.40.11[7-8].[x]xx</Comment>
  18540. <Link1>http://www.sphere.com/</Link1>
  18541. <Link2></Link2>
  18542. </user-agent>
  18543. <user-agent>
  18544. <ID>id_n_s_040106_3</ID>
  18545. <String>Sphider</String>
  18546. <Description>Sphider - a lightweight search engine in PHP</Description>
  18547. <Type>R</Type>
  18548. <Comment></Comment>
  18549. <Link1>http://www.cs.ioc.ee/~ando/sphider/</Link1>
  18550. <Link2></Link2>
  18551. </user-agent>
  18552. <user-agent>
  18553. <ID>id_n_s_1306</ID>
  18554. <String>Spida/0.1</String>
  18555. <Description>Only.com robot</Description>
  18556. <Type>R</Type>
  18557. <Comment>in conjunction with LWP::Simple/5.53</Comment>
  18558. <Link1>http://www.only.com/</Link1>
  18559. <Link2></Link2>
  18560. </user-agent>
  18561. <user-agent>
  18562. <ID>id_n_s_1307</ID>
  18563. <String>Spider-Sleek/2.0 (+http://search-info.com/linktous.html)</String>
  18564. <Description>Search-Info ODP/DMOZ spider</Description>
  18565. <Type>R</Type>
  18566. <Comment></Comment>
  18567. <Link1>http://search-info.com/</Link1>
  18568. <Link2></Link2>
  18569. </user-agent>
  18570. <user-agent>
  18571. <ID>id_n_s_1308</ID>
  18572. <String>spider.batsch.com</String>
  18573. <Description>Batsch robot</Description>
  18574. <Type>R</Type>
  18575. <Comment> - site unreachable</Comment>
  18576. <Link1>http://www.batsch.com</Link1>
  18577. <Link2></Link2>
  18578. </user-agent>
  18579. <user-agent>
  18580. <ID>id_n_s_110206_4</ID>
  18581. <String>Spider.TerraNautic.net - v:1.04</String>
  18582. <Description>TerraNautic spider for Schnellsuchen touristic search (Germany)</Description>
  18583. <Type>C</Type>
  18584. <Comment></Comment>
  18585. <Link1>http://www.terranautic.net/</Link1>
  18586. <Link2>http://www.schnellsuchen.com/</Link2>
  18587. </user-agent>
  18588. <user-agent>
  18589. <ID>id_n_s_1309</ID>
  18590. <String>spider.yellopet.com - www.yellopet.com</String>
  18591. <Description>Yellopet spider</Description>
  18592. <Type>R</Type>
  18593. <Comment></Comment>
  18594. <Link1>http://www.yellopet.com/</Link1>
  18595. <Link2></Link2>
  18596. </user-agent>
  18597. <user-agent>
  18598. <ID>id_n_s_1310</ID>
  18599. <String>Spider/maxbot.com admin@maxbot.com</String>
  18600. <Description>Maxbot .gov .mil .edu indexing robot</Description>
  18601. <Type>R</Type>
  18602. <Comment></Comment>
  18603. <Link1>http://www.maxbot.com/</Link1>
  18604. <Link2></Link2>
  18605. </user-agent>
  18606. <user-agent>
  18607. <ID>id_n_s_1311</ID>
  18608. <String>SpiderKU/0.x</String>
  18609. <Description>Unknown robot from CPE at Kasetsart University (158.108.35.xxx)</Description>
  18610. <Type>R</Type>
  18611. <Comment></Comment>
  18612. <Link1>http://www.cpe.ku.ac.th/</Link1>
  18613. <Link2></Link2>
  18614. </user-agent>
  18615. <user-agent>
  18616. <ID>id_n_s_1312</ID>
  18617. <String>SpiderMan</String>
  18618. <Description>Yahoo Search user agent or spider (202.165.102.xxx)</Description>
  18619. <Type>R</Type>
  18620. <Comment></Comment>
  18621. <Link1>http://search.yahoo.com/</Link1>
  18622. <Link2></Link2>
  18623. </user-agent>
  18624. <user-agent>
  18625. <ID>id_n_s_1313</ID>
  18626. <String>SpiderMonkey/7.0x (SpiderMonkey.ca info at http://spidermonkey.ca/sm.shtml)</String>
  18627. <Description>SpiderMonkey Canada robot</Description>
  18628. <Type>R</Type>
  18629. <Comment></Comment>
  18630. <Link1>http://spidermonkey.ca/</Link1>
  18631. <Link2></Link2>
  18632. </user-agent>
  18633. <user-agent>
  18634. <ID>id_n_s_1314</ID>
  18635. <String>Spinne/2.0</String>
  18636. <Description>Spider.de robot</Description>
  18637. <Type>R</Type>
  18638. <Comment></Comment>
  18639. <Link1>http://www.spider.de/</Link1>
  18640. <Link2></Link2>
  18641. </user-agent>
  18642. <user-agent>
  18643. <ID>id_n_s_1315</ID>
  18644. <String>Spinne/2.0 med</String>
  18645. <Description>Medkatalog (medical catalogue) Austria robot</Description>
  18646. <Type>R</Type>
  18647. <Comment></Comment>
  18648. <Link1>http://www.medkatalog.com/</Link1>
  18649. <Link2></Link2>
  18650. </user-agent>
  18651. <user-agent>
  18652. <ID>id_n_s_1316</ID>
  18653. <String>Spinne/2.0 med_AH</String>
  18654. <Description>Medkatalog (medical catalogue) Austria robot</Description>
  18655. <Type>R</Type>
  18656. <Comment></Comment>
  18657. <Link1>http://www.medkatalog.com/</Link1>
  18658. <Link2></Link2>
  18659. </user-agent>
  18660. <user-agent>
  18661. <ID>id_n_s_180707_3</ID>
  18662. <String>Spock Crawler (http://www.spock.com/crawler)</String>
  18663. <Description>Spock - people search application - via Amazon web services</Description>
  18664. <Type>R</Type>
  18665. <Comment>72.44.62.1xx</Comment>
  18666. <Link1>http://www.spock.com/crawler</Link1>
  18667. <Link2>http://www.amazon.com/gp/browse.html?node=3435361</Link2>
  18668. </user-agent>
  18669. <user-agent>
  18670. <ID>id_n_s_1317</ID>
  18671. <String>sportsuchmaschine.de-Robot (Version: 1.02- powered by www.sportsuchmaschine.de)</String>
  18672. <Description>Sportsuchmaschine (German sports related search) link checking / robot</Description>
  18673. <Type>R</Type>
  18674. <Comment></Comment>
  18675. <Link1>http://www.sportsuchmaschine.de/</Link1>
  18676. <Link2></Link2>
  18677. </user-agent>
  18678. <user-agent>
  18679. <ID>id_n_s_040306_1</ID>
  18680. <String>sproose/0.1-alpha (sproose crawler; http://www.sproose.com/bot.html; crawler@sproose.com)</String>
  18681. <Description>Sproose personalized search (38.100.225.xx)</Description>
  18682. <Type>R</Type>
  18683. <Comment>powered by Nutch</Comment>
  18684. <Link1>http://www.sproose.com/</Link1>
  18685. <Link2>http://lucene.apache.org/nutch/</Link2>
  18686. </user-agent>
  18687. <user-agent>
  18688. <ID>id_n_s_1318</ID>
  18689. <String>SQ Webscanner</String>
  18690. <Description>SQ Webscanner Mac download manager</Description>
  18691. <Type>D</Type>
  18692. <Comment>product is discontinued</Comment>
  18693. <Link1>http://macinsearch.com/users/webscanner/</Link1>
  18694. <Link2></Link2>
  18695. </user-agent>
  18696. <user-agent>
  18697. <ID>id_n_s_1319</ID>
  18698. <String>Squid-Prefetch</String>
  18699. <Description>Simple page-prefetch for Squid web proxy</Description>
  18700. <Type>P</Type>
  18701. <Comment></Comment>
  18702. <Link1>http://packages.debian.org/stable/web/squid-prefetch</Link1>
  18703. <Link2></Link2>
  18704. </user-agent>
  18705. <user-agent>
  18706. <ID>id_n_s_171105_2</ID>
  18707. <String>squidclam</String>
  18708. <Description>Squidclam is a replacement for SquidClamAV-Redirector</Description>
  18709. <Type>P</Type>
  18710. <Comment>s.also SquidClamAV_Redirector 1.x.x</Comment>
  18711. <Link1>http://sourceforge.net/projects/squidclam</Link1>
  18712. <Link2></Link2>
  18713. </user-agent>
  18714. <user-agent>
  18715. <ID>id_n_s_1320</ID>
  18716. <String>SquidClamAV_Redirector 1.x.x</String>
  18717. <Description>SCAVR - Squid helper script for scanning download URLs for viruses</Description>
  18718. <Type>P</Type>
  18719. <Comment>s.also squidclam</Comment>
  18720. <Link1>http://www.jackal-net.at/tiki-read_article.php?articleId=1</Link1>
  18721. <Link2></Link2>
  18722. </user-agent>
  18723. <user-agent>
  18724. <ID>id_n_s_1321</ID>
  18725. <String>Sqworm/2.9.81-BETA (beta_release; 20011102-760; i686-pc-linux-gnu)</String>
  18726. <Description>AOL Search / Pacific Internet Exchange robot</Description>
  18727. <Type>R</Type>
  18728. <Comment></Comment>
  18729. <Link1>http://www.aol.com/</Link1>
  18730. <Link2></Link2>
  18731. </user-agent>
  18732. <user-agent>
  18733. <ID>id_n_s_1322</ID>
  18734. <String>Sqworm/2.9.85-BETA (beta_release; 20011115-775; i686-pc-linux-gnu)</String>
  18735. <Description>diff. IPs / services i.e.: - Inria.fr robot - Websense (Internet filtering) robot</Description>
  18736. <Type>R</Type>
  18737. <Comment></Comment>
  18738. <Link1>http://www.inria.fr/</Link1>
  18739. <Link2>http://www.websense.com/</Link2>
  18740. </user-agent>
  18741. <user-agent>
  18742. <ID>id_n_s_1323</ID>
  18743. <String>Sqworm/2.9.89-BETA (beta_release; 20020130-839; i686-pc-linux-gnu) </String>
  18744. <Description>Time Warner Telecom user robot ?</Description>
  18745. <Type></Type>
  18746. <Comment></Comment>
  18747. <Link1></Link1>
  18748. <Link2></Link2>
  18749. </user-agent>
  18750. <user-agent>
  18751. <ID>id_n_s_1324</ID>
  18752. <String>SSurf15a 11 </String>
  18753. <Description>Some site scanning tool via diff. IPs i.e.: - choiceone.net (216.153.xxx.xxx) - epix.net (216.108.198.xx)</Description>
  18754. <Type>S</Type>
  18755. <Comment>see also - PSurf15a VA or random letters like - AWSCBA - URVUSLNAM</Comment>
  18756. <Link1></Link1>
  18757. <Link2></Link2>
  18758. </user-agent>
  18759. <user-agent>
  18760. <ID>id_n_s_1325</ID>
  18761. <String>StackRambler/x.x </String>
  18762. <Description>Rambler search (Russia) robot (81.19.6x.xx)</Description>
  18763. <Type>R</Type>
  18764. <Comment></Comment>
  18765. <Link1>http://www.rambler.ru</Link1>
  18766. <Link2></Link2>
  18767. </user-agent>
  18768. <user-agent>
  18769. <ID>id_n_s_1326</ID>
  18770. <String>Stamina/1.4</String>
  18771. <Description>Stamina download manager</Description>
  18772. <Type>D</Type>
  18773. <Comment></Comment>
  18774. <Link1>http://www.wildbits.com/stamina/</Link1>
  18775. <Link2></Link2>
  18776. </user-agent>
  18777. <user-agent>
  18778. <ID>id_n_s_1327</ID>
  18779. <String>Star Downloader</String>
  18780. <Description>Star Downloader download manager</Description>
  18781. <Type>D</Type>
  18782. <Comment></Comment>
  18783. <Link1>http://www.stardownloader.com/</Link1>
  18784. <Link2></Link2>
  18785. </user-agent>
  18786. <user-agent>
  18787. <ID>id_n_s_140106_3</ID>
  18788. <String>StarDownloader/1.xx</String>
  18789. <Description>Star Downloader download manager</Description>
  18790. <Type>D</Type>
  18791. <Comment></Comment>
  18792. <Link1>http://www.stardownloader.com/</Link1>
  18793. <Link2></Link2>
  18794. </user-agent>
  18795. <user-agent>
  18796. <ID>id_n_s_1328</ID>
  18797. <String>stat statcrawler@gmail.com</String>
  18798. <Description>Experimental search engine spider from 66.92.186.xxx</Description>
  18799. <Type>R</Type>
  18800. <Comment>66.92.186.xxx</Comment>
  18801. <Link1></Link1>
  18802. <Link2></Link2>
  18803. </user-agent>
  18804. <user-agent>
  18805. <ID>id_n_s_1329</ID>
  18806. <String>Steeler/1.x (http://www.tkl.iis.u-tokyo.ac.jp/~crawler/)</String>
  18807. <Description>Steeler crawler</Description>
  18808. <Type>R</Type>
  18809. <Comment></Comment>
  18810. <Link1>http://www.tkl.iis.u-tokyo.ac.jp/~crawler/</Link1>
  18811. <Link2></Link2>
  18812. </user-agent>
  18813. <user-agent>
  18814. <ID>id_n_s_031107_5</ID>
  18815. <String>Steeler/3.3 (http://www.tkl.iis.u-tokyo.ac.jp/~crawler/)</String>
  18816. <Description>Steeler - University of Tokyo web crawler</Description>
  18817. <Type>R</Type>
  18818. <Comment>157.82.156.xx[x]</Comment>
  18819. <Link1>http://www.tkl.iis.u-tokyo.ac.jp/~crawler/crawler.html.en</Link1>
  18820. <Link2></Link2>
  18821. </user-agent>
  18822. <user-agent>
  18823. <ID>id_n_s_060106_1</ID>
  18824. <String>Strategic Board Bot (+http://www.strategicboard.com)</String>
  18825. <Description>Strategic Board blog &amp; news search robot</Description>
  18826. <Type>R</Type>
  18827. <Comment></Comment>
  18828. <Link1>http://www.strategicboard.com/</Link1>
  18829. <Link2></Link2>
  18830. </user-agent>
  18831. <user-agent>
  18832. <ID>id_n_s_140906_2</ID>
  18833. <String>Strategic Board Bot (+http://www.strategicboard.com)</String>
  18834. <Description>Strategic Board blogs and news aggregator robot</Description>
  18835. <Type>R</Type>
  18836. <Comment>62.0.99.2xx</Comment>
  18837. <Link1>http://www.strategicboard.com/</Link1>
  18838. <Link2></Link2>
  18839. </user-agent>
  18840. <user-agent>
  18841. <ID>id_n_s_1330</ID>
  18842. <String>Submission Spider at surfsafely.com</String>
  18843. <Description>Surfsafely submission verifier</Description>
  18844. <Type>R</Type>
  18845. <Comment></Comment>
  18846. <Link1>http://www.surfsafely.com/</Link1>
  18847. <Link2></Link2>
  18848. </user-agent>
  18849. <user-agent>
  18850. <ID>id_n_s_210106_4</ID>
  18851. <String>suchbaer.de</String>
  18852. <Description>Suchbaer.de (Germany) search robot</Description>
  18853. <Type>R</Type>
  18854. <Comment></Comment>
  18855. <Link1>http://www.suchbaer.de/</Link1>
  18856. <Link2></Link2>
  18857. </user-agent>
  18858. <user-agent>
  18859. <ID>id_n_s_010206_3</ID>
  18860. <String>suchbaer.de (CrawlerAgent v0.103)</String>
  18861. <Description>Suchbaer.de (Germany) search robot</Description>
  18862. <Type>R</Type>
  18863. <Comment></Comment>
  18864. <Link1>http://www.suchbaer.de/</Link1>
  18865. <Link2></Link2>
  18866. </user-agent>
  18867. <user-agent>
  18868. <ID>id_n_s_1331</ID>
  18869. <String>suchbot</String>
  18870. <Description>Suchbot Germany robot</Description>
  18871. <Type>R</Type>
  18872. <Comment></Comment>
  18873. <Link1>http://www.suchbot.de/</Link1>
  18874. <Link2></Link2>
  18875. </user-agent>
  18876. <user-agent>
  18877. <ID>id_n_s_1332</ID>
  18878. <String>Suchknecht.at-Robot</String>
  18879. <Description>Suchknecht Austria robot</Description>
  18880. <Type>R</Type>
  18881. <Comment></Comment>
  18882. <Link1>http://www.suchknecht.at/</Link1>
  18883. <Link2></Link2>
  18884. </user-agent>
  18885. <user-agent>
  18886. <ID>id_n_s_120206_1</ID>
  18887. <String>suchpadbot/1.0 (+http://www.suchpad.de)</String>
  18888. <Description>suchpad search Germany robot (213.239.194.xx)</Description>
  18889. <Type>R</Type>
  18890. <Comment></Comment>
  18891. <Link1>http://www.suchpad.de/</Link1>
  18892. <Link2></Link2>
  18893. </user-agent>
  18894. <user-agent>
  18895. <ID>id_n_s_160107_2</ID>
  18896. <String>Sunrise XP/2.x</String>
  18897. <Description>Sunrise XP handheld news / website reader and converter</Description>
  18898. <Type>B</Type>
  18899. <Comment></Comment>
  18900. <Link1>http://sourceforge.net/projects/sunrisexp</Link1>
  18901. <Link2></Link2>
  18902. </user-agent>
  18903. <user-agent>
  18904. <ID>id_n_s_230406_4</ID>
  18905. <String>Sunrise/0.42g (Windows XP)</String>
  18906. <Description>Sunrise XP web sites and newsfeeds converter and handheld reader</Description>
  18907. <Type>B</Type>
  18908. <Comment></Comment>
  18909. <Link1>http://www.sunrisexp.com/</Link1>
  18910. <Link2></Link2>
  18911. </user-agent>
  18912. <user-agent>
  18913. <ID>id_n_s_1333</ID>
  18914. <String>SuperBot/x.x (Win32)</String>
  18915. <Description>SuperBot website copier</Description>
  18916. <Type>D</Type>
  18917. <Comment></Comment>
  18918. <Link1>http://www.sparkleware.com/superbot/index.html</Link1>
  18919. <Link2></Link2>
  18920. </user-agent>
  18921. <user-agent>
  18922. <ID>id_n_s_260108_2</ID>
  18923. <String>SuperBot/x.x.x.xx (Windows XP)</String>
  18924. <Description>SuperBot website copier</Description>
  18925. <Type>D</Type>
  18926. <Comment></Comment>
  18927. <Link1>http://www.sparkleware.com/superbot/index.html</Link1>
  18928. <Link2></Link2>
  18929. </user-agent>
  18930. <user-agent>
  18931. <ID>id_n_s_1334</ID>
  18932. <String>Superdownloads Spiderman</String>
  18933. <Description>Ubbi Superdownloads (Brazil) link checking</Description>
  18934. <Type>C</Type>
  18935. <Comment></Comment>
  18936. <Link1>http://superdownloads.ubbi.com.br/</Link1>
  18937. <Link2></Link2>
  18938. </user-agent>
  18939. <user-agent>
  18940. <ID>id_n_s_1335</ID>
  18941. <String>SURF </String>
  18942. <Description>SurfControl Web Filtering</Description>
  18943. <Type>P</Type>
  18944. <Comment></Comment>
  18945. <Link1>http://www.surfcontrol.com/</Link1>
  18946. <Link2></Link2>
  18947. </user-agent>
  18948. <user-agent>
  18949. <ID>id_n_s_1336</ID>
  18950. <String>SurferF3 1/0</String>
  18951. <Description>Wanadoo Rechereche robot</Description>
  18952. <Type>R</Type>
  18953. <Comment></Comment>
  18954. <Link1>http://www.wanadoo.fr/qqo/</Link1>
  18955. <Link2></Link2>
  18956. </user-agent>
  18957. <user-agent>
  18958. <ID>id_n_s_1337</ID>
  18959. <String>SurfMaster</String>
  18960. <Description>Maskbit Surfmaster bookmark tool</Description>
  18961. <Type>C</Type>
  18962. <Comment></Comment>
  18963. <Link1>http://www.maskbit.com/surfmaster.htm</Link1>
  18964. <Link2></Link2>
  18965. </user-agent>
  18966. <user-agent>
  18967. <ID>id_n_s_1338</ID>
  18968. <String>SurveyBot/2.2 &lt;a href='http://www.whois.sc'>Whois Source&lt;/a></String>
  18969. <Description>Whois Source domain name information robot (66.249.26.xx)</Description>
  18970. <Type>R C</Type>
  18971. <Comment>s.also: PigeonBot</Comment>
  18972. <Link1>http://www.whois.sc/</Link1>
  18973. <Link2></Link2>
  18974. </user-agent>
  18975. <user-agent>
  18976. <ID>id_n_s_1339</ID>
  18977. <String>SurveyBot/2.3 (Whois Source)</String>
  18978. <Description>Whois Source domain name information robot (66.249.26.xx)</Description>
  18979. <Type>R C</Type>
  18980. <Comment>s.also: PigeonBot</Comment>
  18981. <Link1>http://www.whois.sc/</Link1>
  18982. <Link2></Link2>
  18983. </user-agent>
  18984. <user-agent>
  18985. <ID>id_n_s_1340</ID>
  18986. <String>suzuran</String>
  18987. <Description>Yokogao Search Engine robot (Kanazawa University)</Description>
  18988. <Type>R</Type>
  18989. <Comment></Comment>
  18990. <Link1>http://web.kanazawa-u.ac.jp/esearch.html</Link1>
  18991. <Link2></Link2>
  18992. </user-agent>
  18993. <user-agent>
  18994. <ID>id_n_s_1341</ID>
  18995. <String>SWB/V1.4 (HP)</String>
  18996. <Description>HP Secure Web Browser for OpenVMS</Description>
  18997. <Type>B</Type>
  18998. <Comment></Comment>
  18999. <Link1>http://h71000.www7.hp.com/openvms/products/ips/cswb/cswb.html</Link1>
  19000. <Link2></Link2>
  19001. </user-agent>
  19002. <user-agent>
  19003. <ID>id_n_s_1342</ID>
  19004. <String>swbot/0.9c libwww/5.3.1</String>
  19005. <Description>unknown</Description>
  19006. <Type></Type>
  19007. <Comment></Comment>
  19008. <Link1></Link1>
  19009. <Link2></Link2>
  19010. </user-agent>
  19011. <user-agent>
  19012. <ID>id_n_s_1343</ID>
  19013. <String>Swooglebot/2.0. (+http://swoogle.umbc.edu/swooglebot.htm)</String>
  19014. <Description>Swooglebot Swoogle's semantic web crawler</Description>
  19015. <Type>R</Type>
  19016. <Comment></Comment>
  19017. <Link1>http://swoogle.umbc.edu</Link1>
  19018. <Link2></Link2>
  19019. </user-agent>
  19020. <user-agent>
  19021. <ID>id_n_s_060106_2</ID>
  19022. <String>SWSBot-Images/1.2 http://www.smartwaresoft.com/swsbot12.html</String>
  19023. <Description>SWSBot - SmartWareSoft (85.186.255.xx) software search engine created for Playfuls.com</Description>
  19024. <Type>R</Type>
  19025. <Comment></Comment>
  19026. <Link1>http://www.smartwaresoft.com/swsbot12.html</Link1>
  19027. <Link2>http://www.playfuls.com/</Link2>
  19028. </user-agent>
  19029. <user-agent>
  19030. <ID>id_n_s_300106_2</ID>
  19031. <String>SygolBot http://www.sygol.net</String>
  19032. <Description>Sygol Search (Italy) robot</Description>
  19033. <Type>R</Type>
  19034. <Comment>s.also &lt;http://www.sygol.com/></Comment>
  19035. <Link1>http://www.sygol.com/</Link1>
  19036. <Link2></Link2>
  19037. </user-agent>
  19038. <user-agent>
  19039. <ID>id_n_s_1344</ID>
  19040. <String>Sylera/1.2.x</String>
  19041. <Description>Sylera browser (Japan)</Description>
  19042. <Type>B</Type>
  19043. <Comment></Comment>
  19044. <Link1>http://tabbrowser.ktplan.jp/valinor/sylera.html</Link1>
  19045. <Link2></Link2>
  19046. </user-agent>
  19047. <user-agent>
  19048. <ID>id_n_s_1345</ID>
  19049. <String>SyncBot</String>
  19050. <Description>Mindspring.com user robot</Description>
  19051. <Type></Type>
  19052. <Comment></Comment>
  19053. <Link1>http://www.mindspring.com/</Link1>
  19054. <Link2></Link2>
  19055. </user-agent>
  19056. <user-agent>
  19057. <ID>id_n_s_1346</ID>
  19058. <String>SyncIT/x.x</String>
  19059. <Description>SyncIT link validation</Description>
  19060. <Type>C</Type>
  19061. <Comment></Comment>
  19062. <Link1>http://www.bookmarksync.com/</Link1>
  19063. <Link2></Link2>
  19064. </user-agent>
  19065. <user-agent>
  19066. <ID>id_n_s_140906_1</ID>
  19067. <String>Syndirella/0.91pre</String>
  19068. <Description>Syndirella desktop information aggregator (beta)</Description>
  19069. <Type>B</Type>
  19070. <Comment></Comment>
  19071. <Link1>http://www.yole.ru/projects/syndirella/</Link1>
  19072. <Link2></Link2>
  19073. </user-agent>
  19074. <user-agent>
  19075. <ID>id_n_s_1347</ID>
  19076. <String>SynoBot</String>
  19077. <Description>Synomia (France) robot</Description>
  19078. <Type>R</Type>
  19079. <Comment></Comment>
  19080. <Link1>http://www.synomia.fr/</Link1>
  19081. <Link2></Link2>
  19082. </user-agent>
  19083. <user-agent>
  19084. <ID>id_n_s_150406_1</ID>
  19085. <String>Syntryx ANT Scout Chassis Pheromone; Mozilla/4.0 compatible crawler</String>
  19086. <Description>Syntryx Solution Suite - domain / keyword crawler (216.7.179.xx)</Description>
  19087. <Type>R</Type>
  19088. <Comment></Comment>
  19089. <Link1>http://www.syntryx.com/</Link1>
  19090. <Link2></Link2>
  19091. </user-agent>
  19092. <user-agent>
  19093. <ID>id_n_s_1348</ID>
  19094. <String>Szukacz/1.x</String>
  19095. <Description>Szukacz.pl (Polish search) robot</Description>
  19096. <Type>R</Type>
  19097. <Comment></Comment>
  19098. <Link1>http://www.szukacz.pl/</Link1>
  19099. <Link2></Link2>
  19100. </user-agent>
  19101. <user-agent>
  19102. <ID>id_n_s_1349</ID>
  19103. <String>Szukacz/1.x (robot; www.szukacz.pl/jakdzialarobot.html; szukacz@proszynski.pl)</String>
  19104. <Description>Szukacz.pl (Polish search) robot</Description>
  19105. <Type>R</Type>
  19106. <Comment></Comment>
  19107. <Link1>http://www.szukacz.pl/</Link1>
  19108. <Link2></Link2>
  19109. </user-agent>
  19110. <user-agent>
  19111. <ID>id_t_z_220106_2</ID>
  19112. <String>T-Online Browser</String>
  19113. <Description>German T-Online browser &amp; internet suite </Description>
  19114. <Type>B</Type>
  19115. <Comment></Comment>
  19116. <Link1>http://service.t-online.de/c/06/52/67/652672.html</Link1>
  19117. <Link2></Link2>
  19118. </user-agent>
  19119. <user-agent>
  19120. <ID>id_t_z_070807_1</ID>
  19121. <String>tags2dir.com/0.8 (+http://tags2dir.com/directory/)</String>
  19122. <Description>tags2dir.com directory index</Description>
  19123. <Type>R</Type>
  19124. <Comment>74.115.102.1xx</Comment>
  19125. <Link1>http://tags2dir.com/directory/</Link1>
  19126. <Link2></Link2>
  19127. </user-agent>
  19128. <user-agent>
  19129. <ID>id_t_z_1350</ID>
  19130. <String>Tagword (http://tagword.com/dmoz_survey.php)</String>
  19131. <Description>TAGword DMOZ survey - ODP link checking robot</Description>
  19132. <Type>R</Type>
  19133. <Comment></Comment>
  19134. <Link1>http://tagword.com/dmoz_survey.php</Link1>
  19135. <Link2></Link2>
  19136. </user-agent>
  19137. <user-agent>
  19138. <ID>id_t_z_271105_2</ID>
  19139. <String>Tagyu Agent/1.0</String>
  19140. <Description>Tagyu - del.icio.us bookmark collection online tag generator</Description>
  19141. <Type></Type>
  19142. <Comment></Comment>
  19143. <Link1>http://www.tagyu.com/</Link1>
  19144. <Link2>http://del.icio.us/</Link2>
  19145. </user-agent>
  19146. <user-agent>
  19147. <ID>id_t_z_1351</ID>
  19148. <String>Talkro Web-Shot/1.0 (E-mail: webshot@daumsoft.com- Home: http://222.122.15.190/webshot)</String>
  19149. <Description>Daumsoft Talkro IR robot</Description>
  19150. <Type>R</Type>
  19151. <Comment></Comment>
  19152. <Link1>http://www.daumsoft.com/</Link1>
  19153. <Link2></Link2>
  19154. </user-agent>
  19155. <user-agent>
  19156. <ID>id_t_z_1352</ID>
  19157. <String>TAMU_CS_IRL_CRAWLER/1.0</String>
  19158. <Description>Texas A&amp;M University - Dept. of Computer Science crawler (server or link checking ?)</Description>
  19159. <Type>R C</Type>
  19160. <Comment></Comment>
  19161. <Link1>http://www.cs.tamu.edu/</Link1>
  19162. <Link2></Link2>
  19163. </user-agent>
  19164. <user-agent>
  19165. <ID>id_t_z_1353</ID>
  19166. <String>targetblaster.com/0.9k</String>
  19167. <Description>Targetblaster user link validation ?</Description>
  19168. <Type>R C</Type>
  19169. <Comment></Comment>
  19170. <Link1>http://www.targetblaster.com/</Link1>
  19171. <Link2></Link2>
  19172. </user-agent>
  19173. <user-agent>
  19174. <ID>id_t_z_230706_2</ID>
  19175. <String>TargetYourNews.com bot</String>
  19176. <Description>Target Your News - user submitted links</Description>
  19177. <Type>C</Type>
  19178. <Comment>72.36.160.xxx</Comment>
  19179. <Link1>http://targetyournews.com/</Link1>
  19180. <Link2></Link2>
  19181. </user-agent>
  19182. <user-agent>
  19183. <ID>id_t_z_201006_1</ID>
  19184. <String>TCDBOT/Nutch-0.8 (PhD student research;http://www.tcd.ie; mcgettrs at t c d dot IE)</String>
  19185. <Description>Trinity College Dublin (Ireland) TCDBOT</Description>
  19186. <Type>R</Type>
  19187. <Comment>134.226.1.xx</Comment>
  19188. <Link1>http://www.tcd.ie/</Link1>
  19189. <Link2></Link2>
  19190. </user-agent>
  19191. <user-agent>
  19192. <ID>id_t_z_1354</ID>
  19193. <String>TE</String>
  19194. <Description>HTTP header for transfer encoding used as user agent name ?</Description>
  19195. <Type></Type>
  19196. <Comment></Comment>
  19197. <Link1></Link1>
  19198. <Link2></Link2>
  19199. </user-agent>
  19200. <user-agent>
  19201. <ID>id_t_z_1355</ID>
  19202. <String>TeamSoft WinInet Component</String>
  19203. <Description>WinInet Internet client app.</Description>
  19204. <Type></Type>
  19205. <Comment></Comment>
  19206. <Link1>http://www.winsoft.sk/wininet.htm</Link1>
  19207. <Link2></Link2>
  19208. </user-agent>
  19209. <user-agent>
  19210. <ID>id_t_z_1356</ID>
  19211. <String>TECOMAC-Crawler/0.x</String>
  19212. <Description>Tecomac Gmbh (Germany) crawler software - now Arexera Information Technologies</Description>
  19213. <Type>R</Type>
  19214. <Comment></Comment>
  19215. <Link1>http://www.arexera.de/</Link1>
  19216. <Link2></Link2>
  19217. </user-agent>
  19218. <user-agent>
  19219. <ID>id_t_z_1357</ID>
  19220. <String>Tecomi Bot (http://www.tecomi.com/bot.htm)</String>
  19221. <Description>Tecomi (Germany) beta / test robot (84.201.65.xxx)</Description>
  19222. <Type>R</Type>
  19223. <Comment></Comment>
  19224. <Link1>http://www.tecomi.com/Suchmaschine</Link1>
  19225. <Link2></Link2>
  19226. </user-agent>
  19227. <user-agent>
  19228. <ID>id_t_z_101107_2</ID>
  19229. <String>Teemer (NetSeer&#44; Inc. is a Los Angeles based Internet startup company.; http://www.netseer.com/crawler.html; crawler@netseer.com)</String>
  19230. <Description>Teemer crawler for NetSeer search (beta) via Amazon Web Services - see also NetSeer/Nutch</Description>
  19231. <Type>R</Type>
  19232. <Comment>67.202.26.1xx</Comment>
  19233. <Link1>http://www.netseer.com/</Link1>
  19234. <Link2>http://www.amazon.com/gp/browse.html?node=3435361</Link2>
  19235. </user-agent>
  19236. <user-agent>
  19237. <ID>id_t_z_1358</ID>
  19238. <String>Teleport Pro/1.2x(.1xxx)</String>
  19239. <Description>Teleport (website) downloading tool</Description>
  19240. <Type>D</Type>
  19241. <Comment></Comment>
  19242. <Link1>http://www.tenmax.com/teleport/pro/home.htm</Link1>
  19243. <Link2></Link2>
  19244. </user-agent>
  19245. <user-agent>
  19246. <ID>id_t_z_1359</ID>
  19247. <String>Teoma MP</String>
  19248. <Description>Teoma crawler (65.214.36.xx[x])</Description>
  19249. <Type>R</Type>
  19250. <Comment></Comment>
  19251. <Link1>http://www.teoma.com/</Link1>
  19252. <Link2></Link2>
  19253. </user-agent>
  19254. <user-agent>
  19255. <ID>id_t_z_1361</ID>
  19256. <String>teomaagent crawler-admin@teoma.com</String>
  19257. <Description>Teoma crawler (65.214.36.xx[x])</Description>
  19258. <Type>R</Type>
  19259. <Comment></Comment>
  19260. <Link1>http://www.teoma.com/</Link1>
  19261. <Link2></Link2>
  19262. </user-agent>
  19263. <user-agent>
  19264. <ID>id_t_z_1362</ID>
  19265. <String>teomaagent1 [crawler-admin@teoma.com]</String>
  19266. <Description>Teoma crawler (65.214.36.xx[x])</Description>
  19267. <Type>R</Type>
  19268. <Comment></Comment>
  19269. <Link1>http://www.teoma.com/</Link1>
  19270. <Link2></Link2>
  19271. </user-agent>
  19272. <user-agent>
  19273. <ID>id_t_z_1360</ID>
  19274. <String>teoma_agent1</String>
  19275. <Description>Teoma crawler (65.214.36.xx[x])</Description>
  19276. <Type>R</Type>
  19277. <Comment></Comment>
  19278. <Link1>http://www.teoma.com/</Link1>
  19279. <Link2></Link2>
  19280. </user-agent>
  19281. <user-agent>
  19282. <ID>id_t_z_1363</ID>
  19283. <String>Teradex Mapper; mapper@teradex.com; http://www.teradex.com</String>
  19284. <Description>Teradex Directory robot</Description>
  19285. <Type>R</Type>
  19286. <Comment></Comment>
  19287. <Link1>http://directory.teradex.com/</Link1>
  19288. <Link2></Link2>
  19289. </user-agent>
  19290. <user-agent>
  19291. <ID>id_t_z_010406_4</ID>
  19292. <String>TeragramCrawler</String>
  19293. <Description>Teragram multilingual text &amp; data processing software</Description>
  19294. <Type>D ?</Type>
  19295. <Comment></Comment>
  19296. <Link1>http://www.teragram.com/</Link1>
  19297. <Link2></Link2>
  19298. </user-agent>
  19299. <user-agent>
  19300. <ID>id_t_z_150807_2</ID>
  19301. <String>terraminds-bot/1.0 (support@terraminds.de)</String>
  19302. <Description>Terraminds blog search (Germany)</Description>
  19303. <Type>R</Type>
  19304. <Comment>88.198.44.2xx</Comment>
  19305. <Link1>http://www.terraminds.de/</Link1>
  19306. <Link2></Link2>
  19307. </user-agent>
  19308. <user-agent>
  19309. <ID>id_t_z_220406_1</ID>
  19310. <String>TerrawizBot/1.0 (+http://www.terrawiz.com/bot.html)</String>
  19311. <Description>Terrawiz Indian Search Engine robot</Description>
  19312. <Type>R</Type>
  19313. <Comment>209.128.80.1xx</Comment>
  19314. <Link1>http://www.terrawiz.com/</Link1>
  19315. <Link2></Link2>
  19316. </user-agent>
  19317. <user-agent>
  19318. <ID>id_t_z_1364</ID>
  19319. <String>Test spider</String>
  19320. <Description>Noceans Information Portfolio Manager (66.35.69.x)</Description>
  19321. <Type>R</Type>
  19322. <Comment></Comment>
  19323. <Link1>http://www.noceans.com/</Link1>
  19324. <Link2></Link2>
  19325. </user-agent>
  19326. <user-agent>
  19327. <ID>id_t_z_160507_1</ID>
  19328. <String>TestCrawler/Nutch-0.9 (Testing Crawler for Research ; http://balihoo.com/index.aspx; tgautier at balihoo dot com)</String>
  19329. <Description>Balihoo - Search Engine for Advertising Media</Description>
  19330. <Type>R</Type>
  19331. <Comment>204.228.230.xx</Comment>
  19332. <Link1>http://balihoo.com/</Link1>
  19333. <Link2></Link2>
  19334. </user-agent>
  19335. <user-agent>
  19336. <ID>id_t_z_1365</ID>
  19337. <String>The Expert HTML Source Viewer (http://www.expert-html.com)</String>
  19338. <Description>Expert HTML online source viewer</Description>
  19339. <Type>D B</Type>
  19340. <Comment>in conjunction with lwp-trivial/1.35</Comment>
  19341. <Link1>http://www.expert-html.net - site is offline</Link1>
  19342. <Link2></Link2>
  19343. </user-agent>
  19344. <user-agent>
  19345. <ID>id_t_z_281207_3</ID>
  19346. <String>TheRarestParser/0.2a (http://therarestwords.com/)</String>
  19347. <Description>The Rarest Words - Linguistic experiment crawler via Amazon Web Services</Description>
  19348. <Type>R</Type>
  19349. <Comment>67.202.27.19x</Comment>
  19350. <Link1>http://therarestwords.com/</Link1>
  19351. <Link2>http://www.amazon.com/gp/browse.html?node=3435361</Link2>
  19352. </user-agent>
  19353. <user-agent>
  19354. <ID>id_t_z_1366</ID>
  19355. <String>TheSuBot/0.1 (www.thesubot.de)</String>
  19356. <Description>TheSuBot robot (Germany) for an unknown theme based search engine</Description>
  19357. <Type>R</Type>
  19358. <Comment></Comment>
  19359. <Link1>http://www.thesubot.de/</Link1>
  19360. <Link2></Link2>
  19361. </user-agent>
  19362. <user-agent>
  19363. <ID>id_t_z_171106_1</ID>
  19364. <String>thumbshots-de-Bot (Version: 1.02&#44; powered by www.thumbshots.de)</String>
  19365. <Description>ThumbShots website thumbnail service (Germany) robot</Description>
  19366. <Type>D</Type>
  19367. <Comment>212.112.238.xx</Comment>
  19368. <Link1>http://www.thumbshots.de/</Link1>
  19369. <Link2></Link2>
  19370. </user-agent>
  19371. <user-agent>
  19372. <ID>id_t_z_1367</ID>
  19373. <String>thumbshots-de-Bot (Version: 1.02- powered by www.thumbshots.de)</String>
  19374. <Description>ThumbShots.de (Germany) robot</Description>
  19375. <Type>R</Type>
  19376. <Comment></Comment>
  19377. <Link1>http://www.thumbshots.de/</Link1>
  19378. <Link2></Link2>
  19379. </user-agent>
  19380. <user-agent>
  19381. <ID>id_t_z_250206_1</ID>
  19382. <String>timboBot/0.9 http://www.breakingblogs.com/timbo_bot.html</String>
  19383. <Description>Breaking Blogs timbo bot blog robot</Description>
  19384. <Type>R</Type>
  19385. <Comment></Comment>
  19386. <Link1>http://www.breakingblogs.com/</Link1>
  19387. <Link2></Link2>
  19388. </user-agent>
  19389. <user-agent>
  19390. <ID>id_t_z_140106_4</ID>
  19391. <String>http://www.timelyweb.com/</String>
  19392. <Description>TimelyWeb web page monitoring tool</Description>
  19393. <Type>C</Type>
  19394. <Comment>s. also EldoS ...</Comment>
  19395. <Link1>http://www.eldos.org/timelyweb/timelyweb.html</Link1>
  19396. <Link2></Link2>
  19397. </user-agent>
  19398. <user-agent>
  19399. <ID>id_t_z_180408_6</ID>
  19400. <String>TinEye/1.1 (http://tineye.com/crawler.html)</String>
  19401. <Description>TinEye crawler for an open image search project</Description>
  19402. <Type>R</Type>
  19403. <Comment></Comment>
  19404. <Link1>http://tineye.com/crawler.html</Link1>
  19405. <Link2></Link2>
  19406. </user-agent>
  19407. <user-agent>
  19408. <ID>id_t_z_1368</ID>
  19409. <String>tivraSpider/1.0 (crawler@tivra.com)</String>
  19410. <Description>Tivra spider from AT&amp;T Labs Research</Description>
  19411. <Type>R</Type>
  19412. <Comment>see this document: http://trec.nist.gov/pubs/trec9/papers/att-trec9.ps</Comment>
  19413. <Link1>http://trec.nist.gov/pubs/trec9/papers/att-trec9.ps</Link1>
  19414. <Link2></Link2>
  19415. </user-agent>
  19416. <user-agent>
  19417. <ID>id_t_z_1369</ID>
  19418. <String>TJG/Spider</String>
  19419. <Description>Tjgroup spider</Description>
  19420. <Type>R</Type>
  19421. <Comment></Comment>
  19422. <Link1>http://www.tjgroup.com/</Link1>
  19423. <Link2></Link2>
  19424. </user-agent>
  19425. <user-agent>
  19426. <ID>id_t_z_1370</ID>
  19427. <String>TJvMultiHttpGrabber Component</String>
  19428. <Description>TJvHttpGrabber (JEDI Visual Component Library)</Description>
  19429. <Type></Type>
  19430. <Comment>Possibly used by Bit Torrent Search </Comment>
  19431. <Link1>http://homepages.borland.com/jedi/jedihelp/item.php?Id=22015</Link1>
  19432. <Link2>http://www.btsearch.net/</Link2>
  19433. </user-agent>
  19434. <user-agent>
  19435. <ID>id_t_z_1371</ID>
  19436. <String>Tkensaku/x.x(http://www.tkensaku.com/q.html)</String>
  19437. <Description>Tkensaku Search (Japan) robot from 210.239.46.xxx (www.tken.com)</Description>
  19438. <Type>R</Type>
  19439. <Comment></Comment>
  19440. <Link1>http://www.tkensaku.com/q.html</Link1>
  19441. <Link2></Link2>
  19442. </user-agent>
  19443. <user-agent>
  19444. <ID>id_t_z_1372</ID>
  19445. <String>toCrawl/UrlDispatcher</String>
  19446. <Description>Unknown robot from 195.68.98.xx (coltfrance.com)</Description>
  19447. <Type></Type>
  19448. <Comment></Comment>
  19449. <Link1></Link1>
  19450. <Link2></Link2>
  19451. </user-agent>
  19452. <user-agent>
  19453. <ID>id_t_z_200207_1</ID>
  19454. <String>Topodia/1.2-dev (Topodia - Crawler for HTTP content indexing; http://www.topodia.com/; support@topodia.com)</String>
  19455. <Description>Topodia search engine and personal information assistant (in development)</Description>
  19456. <Type>R</Type>
  19457. <Comment>88.153.148.xx</Comment>
  19458. <Link1>http://www.topodia.com/</Link1>
  19459. <Link2></Link2>
  19460. </user-agent>
  19461. <user-agent>
  19462. <ID>id_t_z_160506_2</ID>
  19463. <String>TOPOS robot/1.1 (http://www.topos.com.ua/)</String>
  19464. <Description>Topos search (Russia) robot</Description>
  19465. <Type>C</Type>
  19466. <Comment>193.17.73.1xx</Comment>
  19467. <Link1>http://www.topos.com.ua/</Link1>
  19468. <Link2></Link2>
  19469. </user-agent>
  19470. <user-agent>
  19471. <ID>id_t_z_1373</ID>
  19472. <String>Toutatis x-xx.x (hoppa.com)</String>
  19473. <Description>Hoppa robot (81.4.78.xxx)</Description>
  19474. <Type>R</Type>
  19475. <Comment></Comment>
  19476. <Link1>http://hoppa.com/</Link1>
  19477. <Link2></Link2>
  19478. </user-agent>
  19479. <user-agent>
  19480. <ID>id_t_z_1374</ID>
  19481. <String>Toutatis x.x (hoppa.com)</String>
  19482. <Description>Hoppa robot (81.4.78.xxx)</Description>
  19483. <Type>R</Type>
  19484. <Comment></Comment>
  19485. <Link1>http://hoppa.com/</Link1>
  19486. <Link2></Link2>
  19487. </user-agent>
  19488. <user-agent>
  19489. <ID>id_t_z_1375</ID>
  19490. <String>Toutatis x.x-x</String>
  19491. <Description>Hoppa robot (81.4.78.xxx)</Description>
  19492. <Type>R</Type>
  19493. <Comment></Comment>
  19494. <Link1>http://hoppa.com/</Link1>
  19495. <Link2></Link2>
  19496. </user-agent>
  19497. <user-agent>
  19498. <ID>id_t_z_050806_2</ID>
  19499. <String>traazibot/testengine (+http://www.traazi.de)</String>
  19500. <Description>Traazi! search (Germany) robot</Description>
  19501. <Type>R</Type>
  19502. <Comment>87.230.5.2xx</Comment>
  19503. <Link1>http://www.traazi.de/</Link1>
  19504. <Link2></Link2>
  19505. </user-agent>
  19506. <user-agent>
  19507. <ID>id_t_z_041007_2</ID>
  19508. <String>Trailfire-bot/0.7.1 (Nutch; http://lucene.apache.org/nutch/bot.html; nutch-agent@lucene.apache.org)</String>
  19509. <Description>Trailfire web collection and annotating system</Description>
  19510. <Type>C</Type>
  19511. <Comment></Comment>
  19512. <Link1>http://www.trailfire.com/</Link1>
  19513. <Link2></Link2>
  19514. </user-agent>
  19515. <user-agent>
  19516. <ID>id_t_z_081207_2</ID>
  19517. <String>Trailfire-bot/0.7.1 (Trailfire page content analyzer; http://trailfire.com; info@trailfire.com)</String>
  19518. <Description>Trailfire web collection and annotating system</Description>
  19519. <Type>C</Type>
  19520. <Comment></Comment>
  19521. <Link1>http://www.trailfire.com/</Link1>
  19522. <Link2></Link2>
  19523. </user-agent>
  19524. <user-agent>
  19525. <ID>id_t_z_260807_2</ID>
  19526. <String>Trailfire/0.7.1 (Nutch; http://lucene.apache.org/nutch/bot.html; nutch-agent@lucene.apache.org)</String>
  19527. <Description>Trailfire web collection and annotating system</Description>
  19528. <Type>C</Type>
  19529. <Comment></Comment>
  19530. <Link1>http://www.trailfire.com/</Link1>
  19531. <Link2></Link2>
  19532. </user-agent>
  19533. <user-agent>
  19534. <ID>id_t_z_1376</ID>
  19535. <String>Trampelpfad-Spider</String>
  19536. <Description>Trampelpfad Webkatalog spider</Description>
  19537. <Type>R</Type>
  19538. <Comment></Comment>
  19539. <Link1>http://www2.trampelpfad.de/</Link1>
  19540. <Link2></Link2>
  19541. </user-agent>
  19542. <user-agent>
  19543. <ID>id_t_z_1377</ID>
  19544. <String>Trampelpfad-Spider-v0.1</String>
  19545. <Description>Trampelpfad Webkatalog spider</Description>
  19546. <Type>R</Type>
  19547. <Comment></Comment>
  19548. <Link1>http://www2.trampelpfad.de/</Link1>
  19549. <Link2></Link2>
  19550. </user-agent>
  19551. <user-agent>
  19552. <ID>id_t_z_1378</ID>
  19553. <String>tricosMetaCheck 1.2216-08-1999 (http://www.tricos.com/metacheck)</String>
  19554. <Description>Tricos meta tag validation</Description>
  19555. <Type>C</Type>
  19556. <Comment></Comment>
  19557. <Link1>http://www.tricos.us/metaone.php</Link1>
  19558. <Link2></Link2>
  19559. </user-agent>
  19560. <user-agent>
  19561. <ID>id_t_z_1379</ID>
  19562. <String>TSurf15a 11</String>
  19563. <Description>some bad user agent</Description>
  19564. <Type>S</Type>
  19565. <Comment>- s. DBrowse- Dsurf etc.</Comment>
  19566. <Link1></Link1>
  19567. <Link2></Link2>
  19568. </user-agent>
  19569. <user-agent>
  19570. <ID>id_t_z_1380</ID>
  19571. <String>TulipChain/5.x (http://ostermiller.org/tulipchain/) Java/1.x.1_0x (http://java.sun.com/) Linux/2.4.17</String>
  19572. <Description>Tulip Chain browser / link checker for Dmoz.org directory</Description>
  19573. <Type>B C R</Type>
  19574. <Comment></Comment>
  19575. <Link1>http://ostermiller.org/tulipchain/</Link1>
  19576. <Link2></Link2>
  19577. </user-agent>
  19578. <user-agent>
  19579. <ID>id_t_z_1381</ID>
  19580. <String>TulipChain/5.xx (http://ostermiller.org/tulipchain/) Java/1.x.1_0x (http://apple.com/) Mac_OS_X/10.2.8</String>
  19581. <Description>Tulip Chain browser / link checker for Dmoz.org directory</Description>
  19582. <Type>B C R</Type>
  19583. <Comment></Comment>
  19584. <Link1>http://ostermiller.org/tulipchain/</Link1>
  19585. <Link2></Link2>
  19586. </user-agent>
  19587. <user-agent>
  19588. <ID>id_t_z_101107_3</ID>
  19589. <String>Tumblr/1.0 RSS syndication (+http://www.tumblr.com/) (support@tumblr.com)</String>
  19590. <Description>Tumblr Tumblelogs RSS and news syndication crawler</Description>
  19591. <Type>R</Type>
  19592. <Comment>72.32.6.15x</Comment>
  19593. <Link1>http://www.tumblr.com/</Link1>
  19594. <Link2></Link2>
  19595. </user-agent>
  19596. <user-agent>
  19597. <ID>id_t_z_1382</ID>
  19598. <String>TurnitinBot/x.x (http://www.turnitin.com/robot/crawlerinfo.html)</String>
  19599. <Description>Turnitin (ex SlySearch) robot for helping educational institutions prevent plagiarism</Description>
  19600. <Type>R</Type>
  19601. <Comment>64.140.49.xx</Comment>
  19602. <Link1>http://www.turnitin.com/robot/crawlerinfo.html</Link1>
  19603. <Link2></Link2>
  19604. </user-agent>
  19605. <user-agent>
  19606. <ID>id_t_z_1383</ID>
  19607. <String>Turnpike Emporium LinkChecker/0.1</String>
  19608. <Description>TurnPike Emporium Directory (207.67.198.x) link checking</Description>
  19609. <Type>R</Type>
  19610. <Comment></Comment>
  19611. <Link1>http://www.turnpike.net/directory.phtml</Link1>
  19612. <Link2></Link2>
  19613. </user-agent>
  19614. <user-agent>
  19615. <ID>id_t_z_1384</ID>
  19616. <String>TutorGig/1.5 (+http://www.tutorgig.com/crawler)</String>
  19617. <Description>TutorGig tutorial search robot</Description>
  19618. <Type>R</Type>
  19619. <Comment></Comment>
  19620. <Link1>http://www.tutorgig.com/crawler/</Link1>
  19621. <Link2></Link2>
  19622. </user-agent>
  19623. <user-agent>
  19624. <ID>id_t_z_1385</ID>
  19625. <String>Tutorial Crawler 1.4 (http://www.tutorgig.com/crawler)</String>
  19626. <Description>TutorGig tutorial search robot</Description>
  19627. <Type>R</Type>
  19628. <Comment></Comment>
  19629. <Link1>http://www.tutorgig.com/crawler/</Link1>
  19630. <Link2></Link2>
  19631. </user-agent>
  19632. <user-agent>
  19633. <ID>id_t_z_1386</ID>
  19634. <String>Twiceler www.cuill.com/robots.html</String>
  19635. <Description>Twiceler experimental web crawler</Description>
  19636. <Type>R</Type>
  19637. <Comment>64.62.136.xxx</Comment>
  19638. <Link1>http://www.cuill.com/</Link1>
  19639. <Link2></Link2>
  19640. </user-agent>
  19641. <user-agent>
  19642. <ID>id_t_z_290407_1</ID>
  19643. <String>Twiceler-0.9 http://www.cuill.com/twiceler/robot.html</String>
  19644. <Description>Twiceler experimental web crawler</Description>
  19645. <Type>R</Type>
  19646. <Comment>64.62.136.xxx</Comment>
  19647. <Link1>http://www.cuill.com/</Link1>
  19648. <Link2></Link2>
  19649. </user-agent>
  19650. <user-agent>
  19651. <ID>id_t_z_291105_5</ID>
  19652. <String>Twisted PageGetter</String>
  19653. <Description>File downloading component from Twisted Python</Description>
  19654. <Type>D</Type>
  19655. <Comment></Comment>
  19656. <Link1>http://twistedmatrix.com/</Link1>
  19657. <Link2></Link2>
  19658. </user-agent>
  19659. <user-agent>
  19660. <ID>id_t_z_140508_5</ID>
  19661. <String>Twitturly / v0.x</String>
  19662. <Description>Twitt(url)y URL tracking service for Twitter via Amazon Web Services</Description>
  19663. <Type>C</Type>
  19664. <Comment>75.101.135.[x]xx</Comment>
  19665. <Link1>http://twitturly.com/</Link1>
  19666. <Link2>http://twitter.com/</Link2>
  19667. </user-agent>
  19668. <user-agent>
  19669. <ID>id_t_z_1387</ID>
  19670. <String>Twotrees Reactive Filter V2.0</String>
  19671. <Description>Twotrees content filter</Description>
  19672. <Type>P</Type>
  19673. <Comment></Comment>
  19674. <Link1>http://www.twotrees.com/</Link1>
  19675. <Link2></Link2>
  19676. </user-agent>
  19677. <user-agent>
  19678. <ID>id_t_z_221207_2</ID>
  19679. <String>Tycoon Agent/Nutch-1.0-dev</String>
  19680. <Description>Tycoon - Hewlett-Packards distributed cluster solution robot</Description>
  19681. <Type>R</Type>
  19682. <Comment>204.123.46.xx[x]</Comment>
  19683. <Link1>http://tycoon.hpl.hp.com/</Link1>
  19684. <Link2></Link2>
  19685. </user-agent>
  19686. <user-agent>
  19687. <ID>id_t_z_1388</ID>
  19688. <String>TygoBot</String>
  19689. <Description>Tygo Search robot</Description>
  19690. <Type>R</Type>
  19691. <Comment></Comment>
  19692. <Link1>http://www.tygo.com/</Link1>
  19693. <Link2></Link2>
  19694. </user-agent>
  19695. <user-agent>
  19696. <ID>id_t_z_1389</ID>
  19697. <String>TygoProwler</String>
  19698. <Description>Tygo Search robot</Description>
  19699. <Type>R</Type>
  19700. <Comment></Comment>
  19701. <Link1>http://www.tygo.com/</Link1>
  19702. <Link2></Link2>
  19703. </user-agent>
  19704. <user-agent>
  19705. <ID>id_t_z_1390</ID>
  19706. <String>UCmore</String>
  19707. <Description>UCMore -  IE navigation and search plugin</Description>
  19708. <Type>B</Type>
  19709. <Comment></Comment>
  19710. <Link1>http://www.ucmore.com/</Link1>
  19711. <Link2></Link2>
  19712. </user-agent>
  19713. <user-agent>
  19714. <ID>id_t_z_1391</ID>
  19715. <String>UCMore Crawler App</String>
  19716. <Description>UCMore -  IE navigation and search plugin</Description>
  19717. <Type>B</Type>
  19718. <Comment></Comment>
  19719. <Link1>http://www.ucmore.com/</Link1>
  19720. <Link2></Link2>
  19721. </user-agent>
  19722. <user-agent>
  19723. <ID>id_t_z_290208_1</ID>
  19724. <String>UCWEB5.1</String>
  19725. <Description>Ucweb mobile browser</Description>
  19726. <Type>B</Type>
  19727. <Comment></Comment>
  19728. <Link1>http://www.ucweb.com/English/product.shtml</Link1>
  19729. <Link2></Link2>
  19730. </user-agent>
  19731. <user-agent>
  19732. <ID>id_t_z_1392</ID>
  19733. <String>UDM</String>
  19734. <Description>user agent - maybe UdmSearch (see UdmSearch) ?</Description>
  19735. <Type></Type>
  19736. <Comment></Comment>
  19737. <Link1></Link1>
  19738. <Link2></Link2>
  19739. </user-agent>
  19740. <user-agent>
  19741. <ID>id_t_z_1393</ID>
  19742. <String>UdmSearch/3.1.x</String>
  19743. <Description>UdmSearch / MySearch (now mnoGoSeach) offline browser/search client</Description>
  19744. <Type>R B</Type>
  19745. <Comment></Comment>
  19746. <Link1>http://mnogosearch.org/</Link1>
  19747. <Link2></Link2>
  19748. </user-agent>
  19749. <user-agent>
  19750. <ID>id_t_z_1394</ID>
  19751. <String>UIowaCrawler/1.0</String>
  19752. <Description>University of Iowa Crawler- possibly MySpiders</Description>
  19753. <Type>R</Type>
  19754. <Comment></Comment>
  19755. <Link1>http://myspiders.biz.uiowa.edu/</Link1>
  19756. <Link2></Link2>
  19757. </user-agent>
  19758. <user-agent>
  19759. <ID>id_t_z_231106_1</ID>
  19760. <String>UKWizz/Nutch-0.8.1 (UKWizz Nutch crawler; http://www.ukwizz.com/)</String>
  19761. <Description>UKWizz search robot</Description>
  19762. <Type>R</Type>
  19763. <Comment>s. also Mackster</Comment>
  19764. <Link1>http://www.ukwizz.com</Link1>
  19765. <Link2></Link2>
  19766. </user-agent>
  19767. <user-agent>
  19768. <ID>id_t_z_1395</ID>
  19769. <String>Ultraseek</String>
  19770. <Description>Infoseek robot</Description>
  19771. <Type>R</Type>
  19772. <Comment></Comment>
  19773. <Link1>http://www.infoseek.com/</Link1>
  19774. <Link2></Link2>
  19775. </user-agent>
  19776. <user-agent>
  19777. <ID>id_t_z_1396</ID>
  19778. <String>Under the Rainbow 2.2</String>
  19779. <Description>Unknown mail harvester/spambot from 80.58.13.xxx (proxycache.rima-tde.net)</Description>
  19780. <Type>S</Type>
  19781. <Comment></Comment>
  19782. <Link1>http://www.honeypot.be/</Link1>
  19783. <Link2></Link2>
  19784. </user-agent>
  19785. <user-agent>
  19786. <ID>id_a_f_140308_1</ID>
  19787. <String>unknownght.com Web Server IIS vs Apache Survey. See Results at www.DNSRight.com</String>
  19788. <Description>DNS Right - Online DNS tools</Description>
  19789. <Type>C</Type>
  19790. <Comment>203.161.71.17x</Comment>
  19791. <Link1>http://www.dnsright.com/</Link1>
  19792. <Link2></Link2>
  19793. </user-agent>
  19794. <user-agent>
  19795. <ID>id_t_z_1397</ID>
  19796. <String>UofTDB_experiment (leehyun@cs.toronto.edu)</String>
  19797. <Description>Unknown robot from University of Toronto (128.100.5.1xx)</Description>
  19798. <Type>R</Type>
  19799. <Comment></Comment>
  19800. <Link1></Link1>
  19801. <Link2></Link2>
  19802. </user-agent>
  19803. <user-agent>
  19804. <ID>id_t_z_1398</ID>
  19805. <String>UP.Browser/3.01-IG01 UP.Link/3.2.3.4</String>
  19806. <Description>Mobile phone browser</Description>
  19807. <Type>B</Type>
  19808. <Comment></Comment>
  19809. <Link1></Link1>
  19810. <Link2></Link2>
  19811. </user-agent>
  19812. <user-agent>
  19813. <ID>id_t_z_050806_1</ID>
  19814. <String>updated/0.1-alpha (updated crawler; http://www.updated.com; crawler@updated.com)</String>
  19815. <Description>Updated! search robot</Description>
  19816. <Type>R</Type>
  19817. <Comment>38.119.96.1xx</Comment>
  19818. <Link1>http://www.updated.com/</Link1>
  19819. <Link2></Link2>
  19820. </user-agent>
  19821. <user-agent>
  19822. <ID>id_t_z_1399</ID>
  19823. <String>updated/0.1beta (updated.com; http://www.updated.com; crawler@updated.om)</String>
  19824. <Description>Updated! search robot</Description>
  19825. <Type>R</Type>
  19826. <Comment>38.119.96.1xx</Comment>
  19827. <Link1>http://www.updated.com/</Link1>
  19828. <Link2></Link2>
  19829. </user-agent>
  19830. <user-agent>
  19831. <ID>id_t_z_1400</ID>
  19832. <String>UPG1 UP/4.0 (compatible; Blazer 1.0)</String>
  19833. <Description>Handspring (PalmOS powered cellphone) Treo Blazer browser</Description>
  19834. <Type>B</Type>
  19835. <Comment></Comment>
  19836. <Link1></Link1>
  19837. <Link2></Link2>
  19838. </user-agent>
  19839. <user-agent>
  19840. <ID>id_t_z_1401</ID>
  19841. <String>Uptimebot</String>
  19842. <Description>UptimeBot.com online link popularity check</Description>
  19843. <Type>R</Type>
  19844. <Comment></Comment>
  19845. <Link1>http://www.uptimebot.com/</Link1>
  19846. <Link2></Link2>
  19847. </user-agent>
  19848. <user-agent>
  19849. <ID>id_t_z_1402</ID>
  19850. <String>UptimeBot(www.uptimebot.com)</String>
  19851. <Description>UptimeBot.com online link popularity check</Description>
  19852. <Type>R</Type>
  19853. <Comment></Comment>
  19854. <Link1>http://www.uptimebot.com/</Link1>
  19855. <Link2></Link2>
  19856. </user-agent>
  19857. <user-agent>
  19858. <ID>id_t_z_160706_2</ID>
  19859. <String>URI::Fetch/0.06</String>
  19860. <Description>URI::Fetch - client for fetching HTTP pages and syndication feeds (RSS Atom)</Description>
  19861. <Type>D</Type>
  19862. <Comment></Comment>
  19863. <Link1>http://search.cpan.org/dist/URI-Fetch/</Link1>
  19864. <Link2></Link2>
  19865. </user-agent>
  19866. <user-agent>
  19867. <ID>id_t_z_1403</ID>
  19868. <String>URL Spider Pro/x.xx (innerprise.net)</String>
  19869. <Description>Innerprise URL Spider Pro (now ES.NET) web indexing / site searching tool</Description>
  19870. <Type>R</Type>
  19871. <Comment></Comment>
  19872. <Link1>http://www.innerprise.net/</Link1>
  19873. <Link2></Link2>
  19874. </user-agent>
  19875. <user-agent>
  19876. <ID>id_t_z_121106_2</ID>
  19877. <String>URLBase/6.x</String>
  19878. <Description>URLBase - Internet shortcut manager</Description>
  19879. <Type>C</Type>
  19880. <Comment>s. also Mozilla/4.0 (Compatible); URLBase 6</Comment>
  19881. <Link1>http://www.terriadev.com/products/urlbase/</Link1>
  19882. <Link2></Link2>
  19883. </user-agent>
  19884. <user-agent>
  19885. <ID>id_t_z_1406</ID>
  19886. <String>URLBlaze</String>
  19887. <Description>URLBlaze file sharing link toolkit</Description>
  19888. <Type>C</Type>
  19889. <Comment></Comment>
  19890. <Link1>http://www.urlblaze.net/</Link1>
  19891. <Link2></Link2>
  19892. </user-agent>
  19893. <user-agent>
  19894. <ID>id_t_z_011108_4</ID>
  19895. <String>urlfan-bot/1.0; +http://www.urlfan.com/site/bot/350.html</String>
  19896. <Description>://URLFAN news crawler</Description>
  19897. <Type>R</Type>
  19898. <Comment>70.165.48.16x</Comment>
  19899. <Link1>http://www.urlfan.com/</Link1>
  19900. <Link2></Link2>
  19901. </user-agent>
  19902. <user-agent>
  19903. <ID>id_t_z_1407</ID>
  19904. <String>URLGetFile</String>
  19905. <Description>URLGetFile downloading tool</Description>
  19906. <Type>D</Type>
  19907. <Comment></Comment>
  19908. <Link1>http://shazron.com/freeware/java-utils/</Link1>
  19909. <Link2></Link2>
  19910. </user-agent>
  19911. <user-agent>
  19912. <ID>id_t_z_1404</ID>
  19913. <String>URL_Spider_Pro/x.x</String>
  19914. <Description>Innerprise URL Spider Pro (now ES.NET) web indexing / site searching tool</Description>
  19915. <Type>R</Type>
  19916. <Comment></Comment>
  19917. <Link1>http://www.innerprise.net/</Link1>
  19918. <Link2></Link2>
  19919. </user-agent>
  19920. <user-agent>
  19921. <ID>id_t_z_1405</ID>
  19922. <String>URL_Spider_Pro/x.x+(http://www.innerprise.net/usp-spider.asp)</String>
  19923. <Description>Innerprise URL Spider Pro (now ES.NET) web indexing / site searching tool</Description>
  19924. <Type>R</Type>
  19925. <Comment></Comment>
  19926. <Link1>http://www.innerprise.net/</Link1>
  19927. <Link2></Link2>
  19928. </user-agent>
  19929. <user-agent>
  19930. <ID>id_t_z_291006_1</ID>
  19931. <String>User-Agent:  BoardReader Favicon Fetcher /1.0 info@boardreader.com</String>
  19932. <Description>BoardReader search favicon fetcher</Description>
  19933. <Type>D</Type>
  19934. <Comment>208.65.71.xx</Comment>
  19935. <Link1>http://www.boardreader.com/</Link1>
  19936. <Link2>http://www.internetadsales.com/modules/news/article.php?storyid=4050</Link2>
  19937. </user-agent>
  19938. <user-agent>
  19939. <ID>id_t_z_081206_1</ID>
  19940. <String>User-Agent:  BoardReader Image Fetcher /1.0 info@boardreader.com</String>
  19941. <Description>BoardReader search image fetcher</Description>
  19942. <Type>D</Type>
  19943. <Comment>208.65.71.xx</Comment>
  19944. <Link1>http://www.boardreader.com/</Link1>
  19945. <Link2>http://www.internetadsales.com/modules/news/article.php?storyid=4050</Link2>
  19946. </user-agent>
  19947. <user-agent>
  19948. <ID>id_t_z_060206_2</ID>
  19949. <String>User-Agent:  LjSEEK Picture-Bot /1.0 contact@ljseek.com</String>
  19950. <Description>ljpic.com - LiveJournal picture feed search</Description>
  19951. <Type>C</Type>
  19952. <Comment></Comment>
  19953. <Link1>http://www.ljpic.com/</Link1>
  19954. <Link2></Link2>
  19955. </user-agent>
  19956. <user-agent>
  19957. <ID>id_t_z_1408</ID>
  19958. <String>User-Agent: FileHeap! file downloader (http://www.fileheap.com)</String>
  19959. <Description>FileHeap download manager</Description>
  19960. <Type>D</Type>
  19961. <Comment></Comment>
  19962. <Link1>http://www.fileheap.com</Link1>
  19963. <Link2></Link2>
  19964. </user-agent>
  19965. <user-agent>
  19966. <ID>id_t_z_270306_2</ID>
  19967. <String>User-Agent: Mozilla/4.0 (compatible; MSIE 6.0; Windows NT 5.1)</String>
  19968. <Description>Malformed UA header from some guestbook/forum spammer</Description>
  19969. <Type>S</Type>
  19970. <Comment></Comment>
  19971. <Link1></Link1>
  19972. <Link2></Link2>
  19973. </user-agent>
  19974. <user-agent>
  19975. <ID>id_t_z_1409</ID>
  19976. <String>User-Agent: Mozilla/4.0 (SKIZZLE! Distributed Internet Spider v1.0 - www.SKIZZLE.com)</String>
  19977. <Description>Skizzle search robot</Description>
  19978. <Type>R</Type>
  19979. <Comment></Comment>
  19980. <Link1>http://www.skizzle.com/</Link1>
  19981. <Link2></Link2>
  19982. </user-agent>
  19983. <user-agent>
  19984. <ID>id_t_z_1410</ID>
  19985. <String>user-agent=Mozilla/3.01Gold</String>
  19986. <Description>unknown robot (reads robots.txt) or sitegrabber. From different IPs- ie.: 62.98.8.xx (wind.it)</Description>
  19987. <Type>R D ?</Type>
  19988. <Comment></Comment>
  19989. <Link1></Link1>
  19990. <Link2></Link2>
  19991. </user-agent>
  19992. <user-agent>
  19993. <ID>id_t_z_1411</ID>
  19994. <String>USyd-NLP-Spider (http://www.it.usyd.edu.au/~vinci/bot.html)</String>
  19995. <Description>University of Sydney NLP Spider for research in Natural Language Processing </Description>
  19996. <Type>R</Type>
  19997. <Comment></Comment>
  19998. <Link1>http://www.it.usyd.edu.au/~vinci/bot.html</Link1>
  19999. <Link2></Link2>
  20000. </user-agent>
  20001. <user-agent>
  20002. <ID>id_t_z_1412</ID>
  20003. <String>UtilMind HTTPGet</String>
  20004. <Description>Web Thief Site Grabber</Description>
  20005. <Type>D</Type>
  20006. <Comment></Comment>
  20007. <Link1>http://www.utilmind.com/scripts/webthief.html</Link1>
  20008. <Link2></Link2>
  20009. </user-agent>
  20010. <user-agent>
  20011. <ID>id_t_z_1413</ID>
  20012. <String>Utopia WebWasher 3.0</String>
  20013. <Description>WebWasher ad filter</Description>
  20014. <Type>P B</Type>
  20015. <Comment></Comment>
  20016. <Link1>http://www.webwasher.com/</Link1>
  20017. <Link2></Link2>
  20018. </user-agent>
  20019. <user-agent>
  20020. <ID>id_t_z_100406_1</ID>
  20021. <String>uTorrent/1500</String>
  20022. <Description>uTorrent BitTorrent client</Description>
  20023. <Type>D</Type>
  20024. <Comment></Comment>
  20025. <Link1>http://www.utorrent.com/</Link1>
  20026. <Link2></Link2>
  20027. </user-agent>
  20028. <user-agent>
  20029. <ID>id_t_z_060108_2</ID>
  20030. <String>VadixBot</String>
  20031. <Description>Unknown bad behaving bot via Road Runner - see link</Description>
  20032. <Type>S</Type>
  20033. <Comment>67.78.34.1[6-7][0-9] - 70.112.211.2x</Comment>
  20034. <Link1>http://mikesblog.americasdebate.com/2007/06/06/vadixbot-look-out/</Link1>
  20035. <Link2></Link2>
  20036. </user-agent>
  20037. <user-agent>
  20038. <ID>id_t_z_050406_4</ID>
  20039. <String>Vagabondo-WAP/2.0 (webcrawler at wise-guys dot nl; http://webagent.wise-guys.nl/)/1.0 Profile</String>
  20040. <Description>WiseGuys WAP pages robot</Description>
  20041. <Type>R</Type>
  20042. <Comment></Comment>
  20043. <Link1>http://www.wise-guys.nl/Contact/index.php?botselected=webagents&amp;lang=uk</Link1>
  20044. <Link2></Link2>
  20045. </user-agent>
  20046. <user-agent>
  20047. <ID>id_t_z_1414</ID>
  20048. <String>Vagabondo/1.x MT (webagent@wise-guys.nl)</String>
  20049. <Description>WiseGuys robot Netherland - 82.94.216.2</Description>
  20050. <Type>R</Type>
  20051. <Comment>s. also Mozilla/3.0 (Vagabondo...</Comment>
  20052. <Link1>http://www.wise-guys.nl/Contact/index.php?botselected=webagents&amp;lang=uk</Link1>
  20053. <Link2></Link2>
  20054. </user-agent>
  20055. <user-agent>
  20056. <ID>id_t_z_1415</ID>
  20057. <String>Vagabondo/2.0 MT</String>
  20058. <Description>WiseGuys robot Netherland - 82.94.216.2</Description>
  20059. <Type>R</Type>
  20060. <Comment>s. also Mozilla/3.0 (Vagabondo...</Comment>
  20061. <Link1>http://www.wise-guys.nl/Contact/index.php?botselected=webagents&amp;lang=uk</Link1>
  20062. <Link2></Link2>
  20063. </user-agent>
  20064. <user-agent>
  20065. <ID>id_t_z_1416</ID>
  20066. <String>Vagabondo/2.0 MT (webagent at wise-guys dot nl)</String>
  20067. <Description>WiseGuys robot Netherland - 82.94.216.2</Description>
  20068. <Type>R</Type>
  20069. <Comment>s. also Mozilla/3.0 (Vagabondo...</Comment>
  20070. <Link1>http://www.wise-guys.nl/Contact/index.php?botselected=webagents&amp;lang=uk</Link1>
  20071. <Link2></Link2>
  20072. </user-agent>
  20073. <user-agent>
  20074. <ID>id_t_z_1417</ID>
  20075. <String>Vagabondo/2.0 MT (webagent@NOSPAMwise-guys.nl)</String>
  20076. <Description>WiseGuys robot Netherland - 82.94.216.2</Description>
  20077. <Type>R</Type>
  20078. <Comment>s. also Mozilla/3.0 (Vagabondo...</Comment>
  20079. <Link1>http://www.wise-guys.nl/Contact/index.php?botselected=webagents&amp;lang=uk</Link1>
  20080. <Link2></Link2>
  20081. </user-agent>
  20082. <user-agent>
  20083. <ID>id_t_z_021205_2</ID>
  20084. <String>Vagabondo/3.0 (webagent at wise-guys dot nl)</String>
  20085. <Description>WiseGuys robot Netherland - 82.94.216.2</Description>
  20086. <Type>R</Type>
  20087. <Comment>s.also - Mozilla/3.0 (Vagabondo...</Comment>
  20088. <Link1>http://www.wise-guys.nl/Contact/index.php?botselected=webagents&amp;lang=uk</Link1>
  20089. <Link2></Link2>
  20090. </user-agent>
  20091. <user-agent>
  20092. <ID>id_t_z_1418</ID>
  20093. <String>Vakes/0.01 (Vakes; http://www.vakes.com/; search@vakes.com)</String>
  20094. <Description>Open Directory link checking from Vakes</Description>
  20095. <Type>R</Type>
  20096. <Comment></Comment>
  20097. <Link1>http://www.vakes.com/</Link1>
  20098. <Link2></Link2>
  20099. </user-agent>
  20100. <user-agent>
  20101. <ID>id_t_z_1420</ID>
  20102. <String>VayalaCreep-v0.0.1 (haploid@haploid.com)</String>
  20103. <Description>unknown level3.net (63.214.172.xxx) robot</Description>
  20104. <Type></Type>
  20105. <Comment></Comment>
  20106. <Link1></Link1>
  20107. <Link2></Link2>
  20108. </user-agent>
  20109. <user-agent>
  20110. <ID>id_t_z_1419</ID>
  20111. <String>Vayala|Creep-v0.0.1 (codepoet@wildties.com)</String>
  20112. <Description>unknown level3.net (63.214.172.xxx) robot</Description>
  20113. <Type></Type>
  20114. <Comment></Comment>
  20115. <Link1></Link1>
  20116. <Link2></Link2>
  20117. </user-agent>
  20118. <user-agent>
  20119. <ID>id_t_z_1421</ID>
  20120. <String>vb wininet</String>
  20121. <Description>iNet Grabber - Internet content grabber</Description>
  20122. <Type>D</Type>
  20123. <Comment></Comment>
  20124. <Link1>http://www.aldostools.com/igrabber.html</Link1>
  20125. <Link2></Link2>
  20126. </user-agent>
  20127. <user-agent>
  20128. <ID>id_t_z_1422</ID>
  20129. <String>versus 0.2 (+http://versus.integis.ch)</String>
  20130. <Description>Versus Project robot - Comparing methods for near-uniform URL sampling</Description>
  20131. <Type>R</Type>
  20132. <Comment></Comment>
  20133. <Link1>http://versus.integis.ch/</Link1>
  20134. <Link2></Link2>
  20135. </user-agent>
  20136. <user-agent>
  20137. <ID>id_t_z_1423</ID>
  20138. <String>versus crawler eda.baykan@epfl.ch</String>
  20139. <Description>Unknown robot from EPFL University Switzerland (128.178.155.xxx)</Description>
  20140. <Type>R</Type>
  20141. <Comment></Comment>
  20142. <Link1>http://www.epfl.ch/Eindex.html</Link1>
  20143. <Link2></Link2>
  20144. </user-agent>
  20145. <user-agent>
  20146. <ID>id_t_z_120408_1</ID>
  20147. <String>Verticrawlbot</String>
  20148. <Description>Verticrawl - Semantic search engine solution (French)</Description>
  20149. <Type>C</Type>
  20150. <Comment></Comment>
  20151. <Link1>http://www.verticrawl.com/fr/homepage.php</Link1>
  20152. <Link2></Link2>
  20153. </user-agent>
  20154. <user-agent>
  20155. <ID>id_t_z_1424</ID>
  20156. <String>VeryGoodSearch.com.DaddyLongLegs</String>
  20157. <Description>VeryGoodSearch.com link submission checking</Description>
  20158. <Type>R</Type>
  20159. <Comment></Comment>
  20160. <Link1>http://www.verygoodsearch.com/</Link1>
  20161. <Link2></Link2>
  20162. </user-agent>
  20163. <user-agent>
  20164. <ID>id_t_z_1425</ID>
  20165. <String>verzamelgids.nl - Networking4all Bot/x.x</String>
  20166. <Description>Verzamelgids NL link checking robot</Description>
  20167. <Type>R</Type>
  20168. <Comment>213.247.50.xx</Comment>
  20169. <Link1>http://www.verzamelgids.nl/</Link1>
  20170. <Link2></Link2>
  20171. </user-agent>
  20172. <user-agent>
  20173. <ID>id_t_z_181006_2</ID>
  20174. <String>Verzamelgids/2.2 (http://www.verzamelgids.nl)</String>
  20175. <Description>Verzamelgids NL link checking robot</Description>
  20176. <Type>R</Type>
  20177. <Comment>213.247.50.xx</Comment>
  20178. <Link1>http://www.verzamelgids.nl/</Link1>
  20179. <Link2></Link2>
  20180. </user-agent>
  20181. <user-agent>
  20182. <ID>id_t_z_030406_1</ID>
  20183. <String>Vespa Crawler</String>
  20184. <Description>Unknown robot from Yahoo Norway</Description>
  20185. <Type>R</Type>
  20186. <Comment>217.144.236.x</Comment>
  20187. <Link1>http://no.yahoo.com/</Link1>
  20188. <Link2></Link2>
  20189. </user-agent>
  20190. <user-agent>
  20191. <ID>id_t_z_190206_1</ID>
  20192. <String>virus_detector (virus_harvester@securecomputing.com)</String>
  20193. <Description>Sidewinder G2 anti-virus and anti-spyware protection</Description>
  20194. <Type>D</Type>
  20195. <Comment></Comment>
  20196. <Link1>http://www.securecomputing.com/sg2_antivirus.cfm?menu=solutions</Link1>
  20197. <Link2></Link2>
  20198. </user-agent>
  20199. <user-agent>
  20200. <ID>id_t_z_140407_1</ID>
  20201. <String>VisBot/2.0 (Visvo.com Crawler; http://www.visvo.com/bot.html; bot@visvo.com)</String>
  20202. <Description>Visbot crawler for a search software under development</Description>
  20203. <Type>R</Type>
  20204. <Comment>63.133.162.xx</Comment>
  20205. <Link1>http://www.visvo.com/bot.html</Link1>
  20206. <Link2></Link2>
  20207. </user-agent>
  20208. <user-agent>
  20209. <ID>id_t_z_1426</ID>
  20210. <String>Visicom Toolbar</String>
  20211. <Description>Some IE toolbar made with Visicom Media Dynamic Toolbar software</Description>
  20212. <Type>B</Type>
  20213. <Comment></Comment>
  20214. <Link1>http://www.dynamictoolbar.com/en/products/toolbar/</Link1>
  20215. <Link2></Link2>
  20216. </user-agent>
  20217. <user-agent>
  20218. <ID>id_t_z_1427</ID>
  20219. <String>Vision Research Lab image spider at vision.ece.ucsb.edu</String>
  20220. <Description>Vision research lab's Cortina - content based image retrieval (128.111.60.xx)</Description>
  20221. <Type>R</Type>
  20222. <Comment></Comment>
  20223. <Link1>http://vision.ece.ucsb.edu/multimedia/cortina.html</Link1>
  20224. <Link2></Link2>
  20225. </user-agent>
  20226. <user-agent>
  20227. <ID>id_t_z_160906_1</ID>
  20228. <String>VLC media player - version 0.8.5 Janus - (c) 1996-2006 the VideoLAN team</String>
  20229. <Description>VLC - Cross-platform media player and streaming server</Description>
  20230. <Type>B</Type>
  20231. <Comment></Comment>
  20232. <Link1>http://www.videolan.org/vlc/</Link1>
  20233. <Link2></Link2>
  20234. </user-agent>
  20235. <user-agent>
  20236. <ID>id_t_z_140806_1</ID>
  20237. <String>VMBot/0.x.x (VMBot; http://www.VerticalMatch.com/; vmbot@tradedot.com)</String>
  20238. <Description>VM - Vertical Search Engine (China)</Description>
  20239. <Type>R</Type>
  20240. <Comment>202.83.221.2xx</Comment>
  20241. <Link1>http://www.verticalmatch.com/</Link1>
  20242. <Link2></Link2>
  20243. </user-agent>
  20244. <user-agent>
  20245. <ID>id_t_z_020106_1</ID>
  20246. <String>Vortex/2.2 (+http://marty.anstey.ca/robots/vortex/)</String>
  20247. <Description>Vortex Web Indexing Robot for a study on  internet link distribution</Description>
  20248. <Type>R</Type>
  20249. <Comment></Comment>
  20250. <Link1>http://marty.anstey.ca/projects/robots/vortex/</Link1>
  20251. <Link2></Link2>
  20252. </user-agent>
  20253. <user-agent>
  20254. <ID>id_t_z_041207_1</ID>
  20255. <String>voyager-hc/1.0</String>
  20256. <Description>Kosmix health&#44; auto and travel search crawler (204.14.48.x / 38.113.234.xxx)</Description>
  20257. <Type>R</Type>
  20258. <Comment>s. also - cfetch/1.x - carleson/1.x</Comment>
  20259. <Link1>http://www.kosmix.com/</Link1>
  20260. <Link2></Link2>
  20261. </user-agent>
  20262. <user-agent>
  20263. <ID>id_t_z_231105_1</ID>
  20264. <String>voyager/1.0</String>
  20265. <Description>Kosmix health&#44; auto and travel search crawler (204.14.48.x / 38.113.234.xxx)</Description>
  20266. <Type>R</Type>
  20267. <Comment>s. also - cfetch/1.x - carleson/1.x</Comment>
  20268. <Link1>http://www.kosmix.com/</Link1>
  20269. <Link2></Link2>
  20270. </user-agent>
  20271. <user-agent>
  20272. <ID>id_t_z_301108_3</ID>
  20273. <String>voyager/2.0 (http://www.kosmix.com/html/crawler.html)</String>
  20274. <Description>Kosmix health&#44; auto and travel search crawler (204.14.48.x / 38.113.234.xxx)</Description>
  20275. <Type>R</Type>
  20276. <Comment>s. also - cfetch/1.x - carleson/1.x</Comment>
  20277. <Link1>http://www.kosmix.com/</Link1>
  20278. <Link2></Link2>
  20279. </user-agent>
  20280. <user-agent>
  20281. <ID>id_t_z_171105_3</ID>
  20282. <String>VSE/1.0 (testcrawler@hotmail.com)</String>
  20283. <Description>Vivisimo search crawler (206.210.89.xxx)</Description>
  20284. <Type>R</Type>
  20285. <Comment></Comment>
  20286. <Link1>http://www.vivisimo.com/</Link1>
  20287. <Link2></Link2>
  20288. </user-agent>
  20289. <user-agent>
  20290. <ID>id_t_z_171105_4</ID>
  20291. <String>VSE/1.0 (testcrawler@vivisimo.com)</String>
  20292. <Description>Vivisimo search crawler (206.210.89.xxx)</Description>
  20293. <Type>R</Type>
  20294. <Comment></Comment>
  20295. <Link1>http://www.vivisimo.com/</Link1>
  20296. <Link2></Link2>
  20297. </user-agent>
  20298. <user-agent>
  20299. <ID>id_t_z_1428</ID>
  20300. <String>vspider</String>
  20301. <Description>Verity vspider indexing software</Description>
  20302. <Type>R</Type>
  20303. <Comment></Comment>
  20304. <Link1>http://www.verity.com/</Link1>
  20305. <Link2></Link2>
  20306. </user-agent>
  20307. <user-agent>
  20308. <ID>id_t_z_1429</ID>
  20309. <String>vspider/3.x</String>
  20310. <Description>Verity vspider indexing software</Description>
  20311. <Type>R</Type>
  20312. <Comment></Comment>
  20313. <Link1>http://www.verity.com/</Link1>
  20314. <Link2></Link2>
  20315. </user-agent>
  20316. <user-agent>
  20317. <ID>id_t_z_130707_1</ID>
  20318. <String>VWBOT/Nutch-0.9-dev (VWBOT Nutch Crawler; http://vwbot.cs.uiuc.edu;+vwbot@cs.uiuc.edu</String>
  20319. <Description>VWBot - MetaQuerier Crawler for the MetaQuerier project at the University of Illinois</Description>
  20320. <Type>R</Type>
  20321. <Comment>192.17.240.xx</Comment>
  20322. <Link1>http://vwbot.cs.uiuc.edu/</Link1>
  20323. <Link2>http://metaquerier.cs.uiuc.edu/</Link2>
  20324. </user-agent>
  20325. <user-agent>
  20326. <ID>id_t_z_1431</ID>
  20327. <String>W3C-checklink/3.x.x.x libwww-perl/5.xx</String>
  20328. <Description>W3C Link Checker</Description>
  20329. <Type>C</Type>
  20330. <Comment></Comment>
  20331. <Link1>http://validator.w3.org/checklink</Link1>
  20332. <Link2></Link2>
  20333. </user-agent>
  20334. <user-agent>
  20335. <ID>id_t_z_1432</ID>
  20336. <String>W3C-checklink/4.x [4.xx] libwww-perl/5.xxx</String>
  20337. <Description>W3C Link Checker</Description>
  20338. <Type>C</Type>
  20339. <Comment></Comment>
  20340. <Link1>http://validator.w3.org/checklink</Link1>
  20341. <Link2></Link2>
  20342. </user-agent>
  20343. <user-agent>
  20344. <ID>id_t_z_080806_1</ID>
  20345. <String>W3C-WebCon/5.x.x libwww/5.x.x</String>
  20346. <Description>WebCon - the Libwww command line tool</Description>
  20347. <Type>D</Type>
  20348. <Comment></Comment>
  20349. <Link1>http://www.w3.org/ComLine/</Link1>
  20350. <Link2></Link2>
  20351. </user-agent>
  20352. <user-agent>
  20353. <ID>id_t_z_1433</ID>
  20354. <String>W3CLineMode/5.4.0 libwww/5.x.x</String>
  20355. <Description>W3C Line Mode (character based Web browser)</Description>
  20356. <Type>B</Type>
  20357. <Comment></Comment>
  20358. <Link1>http://www.w3.org/LineMode/</Link1>
  20359. <Link2></Link2>
  20360. </user-agent>
  20361. <user-agent>
  20362. <ID>id_t_z_1434</ID>
  20363. <String>W3CRobot/5.4.0 libwww/5.4.0</String>
  20364. <Description>Unknown link checking using Libwww via Korea Telecom (221.148.44.xxx)</Description>
  20365. <Type>C</Type>
  20366. <Comment></Comment>
  20367. <Link1>http://www.w3.org/Library/</Link1>
  20368. <Link2></Link2>
  20369. </user-agent>
  20370. <user-agent>
  20371. <ID>id_t_z_1430</ID>
  20372. <String>W3C_Validator/1.xxx libwww-perl/5.xx</String>
  20373. <Description>W3C HTML-Code Validator</Description>
  20374. <Type>C</Type>
  20375. <Comment></Comment>
  20376. <Link1>http://validator.w3.org/</Link1>
  20377. <Link2></Link2>
  20378. </user-agent>
  20379. <user-agent>
  20380. <ID>id_t_z_1435</ID>
  20381. <String>w3m/0.x.xx</String>
  20382. <Description>w3m Linux pager / text-based browser</Description>
  20383. <Type>B</Type>
  20384. <Comment></Comment>
  20385. <Link1>http://w3m.sourceforge.net/</Link1>
  20386. <Link2></Link2>
  20387. </user-agent>
  20388. <user-agent>
  20389. <ID>id_t_z_1436</ID>
  20390. <String>W3SiteSearch Crawler_v1.1 http://www.w3sitesearch.de</String>
  20391. <Description>W3 Site Search (Germany) search engine solution</Description>
  20392. <Type>R</Type>
  20393. <Comment></Comment>
  20394. <Link1>http://www.w3sitesearch.de/</Link1>
  20395. <Link2></Link2>
  20396. </user-agent>
  20397. <user-agent>
  20398. <ID>id_t_z_061206_3</ID>
  20399. <String>wadaino.jp-crawler 0.2 (http://wadaino.jp/)</String>
  20400. <Description>Wadain (Japan) Blog / RSS search crawler</Description>
  20401. <Type>R</Type>
  20402. <Comment>202.51.14.1xx</Comment>
  20403. <Link1>http://wadaino.jp/</Link1>
  20404. <Link2></Link2>
  20405. </user-agent>
  20406. <user-agent>
  20407. <ID>id_t_z_1437</ID>
  20408. <String>WannaBe (Macintosh; PPC)</String>
  20409. <Description>Wanna-Be text mode browser</Description>
  20410. <Type>B</Type>
  20411. <Comment></Comment>
  20412. <Link1>http://mindstory.com/wb2/</Link1>
  20413. <Link2></Link2>
  20414. </user-agent>
  20415. <user-agent>
  20416. <ID>id_t_z_270906_1</ID>
  20417. <String>WapOnWindows 1.0</String>
  20418. <Description>WapOnWindows WAP browser for PCs</Description>
  20419. <Type>B</Type>
  20420. <Comment>Site is dead</Comment>
  20421. <Link1>http://www.waponwindows.com/</Link1>
  20422. <Link2></Link2>
  20423. </user-agent>
  20424. <user-agent>
  20425. <ID>id_t_z_250206_2</ID>
  20426. <String>Watchfire WebXM 1.0</String>
  20427. <Description>Watchfire WebXM intranet solution</Description>
  20428. <Type>P</Type>
  20429. <Comment></Comment>
  20430. <Link1>http://www.watchfire.com/products/webxm/default.aspx</Link1>
  20431. <Link2></Link2>
  20432. </user-agent>
  20433. <user-agent>
  20434. <ID>id_t_z_200706_1</ID>
  20435. <String>WAVcheck 1.0.x (http://www.webbanalys.se/apps/WAVcheck/)</String>
  20436. <Description>WAVcheck - Simple Vendor Discovery Tool for detecting client-side tags from web analytics vendors</Description>
  20437. <Type>C</Type>
  20438. <Comment></Comment>
  20439. <Link1>http://www.webbanalys.se/apps/WAVcheck/</Link1>
  20440. <Link2></Link2>
  20441. </user-agent>
  20442. <user-agent>
  20443. <ID>id_t_z_110106_1</ID>
  20444. <String>Wavefire/0.8-dev (Wavefire; http://www.wavefire.com; info@wavefire.com)</String>
  20445. <Description>Wavefire local search community engine (64.141.15.1xx)</Description>
  20446. <Type>R</Type>
  20447. <Comment></Comment>
  20448. <Link1>http://www.wavefire.com/</Link1>
  20449. <Link2></Link2>
  20450. </user-agent>
  20451. <user-agent>
  20452. <ID>id_t_z_110206_5</ID>
  20453. <String>Waypath development crawler - info at waypath dot com</String>
  20454. <Description>Waypath blog discovery engine robot</Description>
  20455. <Type>R</Type>
  20456. <Comment></Comment>
  20457. <Link1>http://www.waypath.com/</Link1>
  20458. <Link2></Link2>
  20459. </user-agent>
  20460. <user-agent>
  20461. <ID>id_t_z_110206_6</ID>
  20462. <String>Waypath Scout v2.x - info at waypath dot com</String>
  20463. <Description>Waypath blog discovery engine robot</Description>
  20464. <Type>R</Type>
  20465. <Comment></Comment>
  20466. <Link1>http://www.waypath.com/</Link1>
  20467. <Link2></Link2>
  20468. </user-agent>
  20469. <user-agent>
  20470. <ID>id_t_z_1438</ID>
  20471. <String>WDG_Validator/1.1</String>
  20472. <Description>WDG HTML-code validator</Description>
  20473. <Type>C</Type>
  20474. <Comment></Comment>
  20475. <Link1>http://www.htmlhelp.tne.co.uk/tools/validator/</Link1>
  20476. <Link2></Link2>
  20477. </user-agent>
  20478. <user-agent>
  20479. <ID>id_t_z_1439</ID>
  20480. <String>Web Image Collector</String>
  20481. <Description>Datafire.com's Web Image Collector (graphics downloading tool)</Description>
  20482. <Type>D</Type>
  20483. <Comment></Comment>
  20484. <Link1>http://www.datafire.com/</Link1>
  20485. <Link2></Link2>
  20486. </user-agent>
  20487. <user-agent>
  20488. <ID>id_t_z_1440</ID>
  20489. <String>Web Link Validator 1.5</String>
  20490. <Description>Relsoft link checking software</Description>
  20491. <Type>C</Type>
  20492. <Comment></Comment>
  20493. <Link1>http://www.relsoftware.com/</Link1>
  20494. <Link2></Link2>
  20495. </user-agent>
  20496. <user-agent>
  20497. <ID>id_t_z_1441</ID>
  20498. <String>Web Snooper</String>
  20499. <Description>RankMeter ranking software</Description>
  20500. <Type>R</Type>
  20501. <Comment></Comment>
  20502. <Link1>http://www.searchutilities.com/</Link1>
  20503. <Link2></Link2>
  20504. </user-agent>
  20505. <user-agent>
  20506. <ID>id_t_z_010206_2</ID>
  20507. <String>web-bekannt (Version: 1.02&#44; powered by www.internetservice-franken.de)</String>
  20508. <Description>Web-bekannt German web directory link checking</Description>
  20509. <Type>C</Type>
  20510. <Comment></Comment>
  20511. <Link1>http://www.web-bekannt.de/</Link1>
  20512. <Link2></Link2>
  20513. </user-agent>
  20514. <user-agent>
  20515. <ID>id_t_z_010206_1</ID>
  20516. <String>web-bekannt (Version: 1.02&#44; powered by www.web-bekannt.de)</String>
  20517. <Description>Web-bekannt German web directory link checking</Description>
  20518. <Type>C</Type>
  20519. <Comment></Comment>
  20520. <Link1>http://www.web-bekannt.de/</Link1>
  20521. <Link2></Link2>
  20522. </user-agent>
  20523. <user-agent>
  20524. <ID>id_t_z_1442</ID>
  20525. <String>Web-Bot V1.03</String>
  20526. <Description>Unknown link or server checking from W&#252;rzburg University Germany (132.187.10.xx)</Description>
  20527. <Type>R C</Type>
  20528. <Comment></Comment>
  20529. <Link1>http://informatik.uni-wuerzburg.de/</Link1>
  20530. <Link2></Link2>
  20531. </user-agent>
  20532. <user-agent>
  20533. <ID>id_t_z_1443</ID>
  20534. <String>Web-Robot/5.0 (en-US; web-robot.com/policy.html) Web-Robot Crawler/2.0.3</String>
  20535. <Description>Unknown robot from 69.50.233.x (nectartech.com)</Description>
  20536. <Type></Type>
  20537. <Comment>no active website</Comment>
  20538. <Link1></Link1>
  20539. <Link2></Link2>
  20540. </user-agent>
  20541. <user-agent>
  20542. <ID>id_t_z_010107_2</ID>
  20543. <String>web2express.org/Nutch-0.9-dev (leveled playing field; http://web2express.org/; info at web2express.org)</String>
  20544. <Description>Web2Express / Web2x - Open data searching tool</Description>
  20545. <Type>R</Type>
  20546. <Comment></Comment>
  20547. <Link1>http://search.web2express.org/search/search.html</Link1>
  20548. <Link2></Link2>
  20549. </user-agent>
  20550. <user-agent>
  20551. <ID>id_t_z_050206_1</ID>
  20552. <String>WebAlta Crawler/1.2.1 (http://www.webalta.ru/bot.html)</String>
  20553. <Description>WebAlta search Russia crawler (85.21.201.xx)</Description>
  20554. <Type>R</Type>
  20555. <Comment></Comment>
  20556. <Link1>http://www.webalta.ru/</Link1>
  20557. <Link2></Link2>
  20558. </user-agent>
  20559. <user-agent>
  20560. <ID>id_t_z_250806_1</ID>
  20561. <String>WebarooBot (Webaroo Bot; http://64.124.122.252/feedback.html)</String>
  20562. <Description>WebarooBot / RufusBot from webaroo offline search service</Description>
  20563. <Type>R</Type>
  20564. <Comment>64.124.122.2xx</Comment>
  20565. <Link1>http://www.webaroo.com/</Link1>
  20566. <Link2>http://www.webaroo.com/company/site-owners</Link2>
  20567. </user-agent>
  20568. <user-agent>
  20569. <ID>id_t_z_210407_1</ID>
  20570. <String>WebarooBot (Webaroo Bot; http://www.webaroo.com/rooSiteOwners.html)</String>
  20571. <Description>WebarooBot / RufusBot from webaroo offline search service</Description>
  20572. <Type>R</Type>
  20573. <Comment>64.124.122.2xx</Comment>
  20574. <Link1>http://www.webaroo.com/</Link1>
  20575. <Link2>http://www.webaroo.com/company/site-owners</Link2>
  20576. </user-agent>
  20577. <user-agent>
  20578. <ID>id_t_z_1444</ID>
  20579. <String>WebAuto/3.4xxx (WinNT; I)</String>
  20580. <Description>Yanasoft WebAuto website copier / downloading tool</Description>
  20581. <Type>D</Type>
  20582. <Comment></Comment>
  20583. <Link1>http://www.yanasoft.co.jp/webauto.html</Link1>
  20584. <Link2></Link2>
  20585. </user-agent>
  20586. <user-agent>
  20587. <ID>id_t_z_1445</ID>
  20588. <String>webbandit/4.xx.0</String>
  20589. <Description>Web Bandit personal search software</Description>
  20590. <Type>R</Type>
  20591. <Comment></Comment>
  20592. <Link1>http://softwaresolutions.net/webbandit/</Link1>
  20593. <Link2></Link2>
  20594. </user-agent>
  20595. <user-agent>
  20596. <ID>id_t_z_140106_2</ID>
  20597. <String>WebBug/5.x</String>
  20598. <Description>Amansoft WebBug web server protocol test</Description>
  20599. <Type>C</Type>
  20600. <Comment></Comment>
  20601. <Link1>http://www.cyberspyder.com/webbug.html</Link1>
  20602. <Link2></Link2>
  20603. </user-agent>
  20604. <user-agent>
  20605. <ID>id_t_z_1446</ID>
  20606. <String>Webclipping.com</String>
  20607. <Description>WebClipping.com - online news monitoring service</Description>
  20608. <Type>R</Type>
  20609. <Comment></Comment>
  20610. <Link1>http://www.webclipping.com</Link1>
  20611. <Link2></Link2>
  20612. </user-agent>
  20613. <user-agent>
  20614. <ID>id_t_z_1447</ID>
  20615. <String>webcollage/1.xx</String>
  20616. <Description>WebCollage Syndicator graphics crawler/collector</Description>
  20617. <Type>R D</Type>
  20618. <Comment>s. also collage.cgi/1.xx</Comment>
  20619. <Link1>http://www.webcollage.com/</Link1>
  20620. <Link2></Link2>
  20621. </user-agent>
  20622. <user-agent>
  20623. <ID>id_t_z_1448</ID>
  20624. <String>WebCompass 2.0</String>
  20625. <Description>Quarterdecks WebCompass search tool</Description>
  20626. <Type>R</Type>
  20627. <Comment></Comment>
  20628. <Link1></Link1>
  20629. <Link2></Link2>
  20630. </user-agent>
  20631. <user-agent>
  20632. <ID>id_t_z_1449</ID>
  20633. <String>WebCopier vx.x</String>
  20634. <Description>WebCopier offline browser</Description>
  20635. <Type>D B</Type>
  20636. <Comment></Comment>
  20637. <Link1>http://www.maximumsoft.com/</Link1>
  20638. <Link2></Link2>
  20639. </user-agent>
  20640. <user-agent>
  20641. <ID>id_t_z_1450</ID>
  20642. <String>WebCopier vx.xa</String>
  20643. <Description>WebCopier offline browser</Description>
  20644. <Type>D B</Type>
  20645. <Comment></Comment>
  20646. <Link1>http://www.maximumsoft.com/</Link1>
  20647. <Link2></Link2>
  20648. </user-agent>
  20649. <user-agent>
  20650. <ID>id_t_z_210506_1</ID>
  20651. <String>WebCorp/1.0</String>
  20652. <Description>WebCorp linguistic search engine (UK)</Description>
  20653. <Type>R</Type>
  20654. <Comment>193.60.130.xx</Comment>
  20655. <Link1>http://webcorp.uce.ac.uk/</Link1>
  20656. <Link2></Link2>
  20657. </user-agent>
  20658. <user-agent>
  20659. <ID>id_t_z_1451</ID>
  20660. <String>webcrawl.net</String>
  20661. <Description>Webcrawl Search robot (64.40.105.xxx)</Description>
  20662. <Type>R</Type>
  20663. <Comment></Comment>
  20664. <Link1>http://www.webcrawl.net/</Link1>
  20665. <Link2></Link2>
  20666. </user-agent>
  20667. <user-agent>
  20668. <ID>id_t_z_1452</ID>
  20669. <String>WebDownloader for X x.xx</String>
  20670. <Description>Unix/Linux Web Downloader</Description>
  20671. <Type>D</Type>
  20672. <Comment></Comment>
  20673. <Link1>http://www.krasu.ru/soft/chuchelo/</Link1>
  20674. <Link2></Link2>
  20675. </user-agent>
  20676. <user-agent>
  20677. <ID>id_t_z_1453</ID>
  20678. <String>Webdup/0.9</String>
  20679. <Description>Unknown robot from china-netcom.com</Description>
  20680. <Type></Type>
  20681. <Comment></Comment>
  20682. <Link1></Link1>
  20683. <Link2></Link2>
  20684. </user-agent>
  20685. <user-agent>
  20686. <ID>id_t_z_1454</ID>
  20687. <String>WebFetch</String>
  20688. <Description>WingFlyer WebFetch website downloading tool</Description>
  20689. <Type>D B</Type>
  20690. <Comment></Comment>
  20691. <Link1>http://www.wingflyer.com/</Link1>
  20692. <Link2></Link2>
  20693. </user-agent>
  20694. <user-agent>
  20695. <ID>id_t_z_1455</ID>
  20696. <String>webfetch/5.x.x</String>
  20697. <Description>webfetch - command line tool to fetch files via HTTP</Description>
  20698. <Type>D</Type>
  20699. <Comment></Comment>
  20700. <Link1>http://tony.aiu.to/sa/webfetch/</Link1>
  20701. <Link2></Link2>
  20702. </user-agent>
  20703. <user-agent>
  20704. <ID>id_t_z_310806_2</ID>
  20705. <String>WebFilter Robot 1.0</String>
  20706. <Description>Verso NetSpective WebFilter</Description>
  20707. <Type>P</Type>
  20708. <Comment></Comment>
  20709. <Link1>http://www.verso.com/enterprise/netspective/webfilter.asp</Link1>
  20710. <Link2></Link2>
  20711. </user-agent>
  20712. <user-agent>
  20713. <ID>id_t_z_1456</ID>
  20714. <String>WebFilter Robot 1.x</String>
  20715. <Description>Telemate.net NetSpective WebFilter</Description>
  20716. <Type>P</Type>
  20717. <Comment></Comment>
  20718. <Link1>http://www.telemate.net/</Link1>
  20719. <Link2></Link2>
  20720. </user-agent>
  20721. <user-agent>
  20722. <ID>id_t_z_1457</ID>
  20723. <String>WebFindBot(http://www.web-find.com)</String>
  20724. <Description>Webfind search robot</Description>
  20725. <Type>R</Type>
  20726. <Comment></Comment>
  20727. <Link1>http://www.web-find.com/</Link1>
  20728. <Link2></Link2>
  20729. </user-agent>
  20730. <user-agent>
  20731. <ID>id_t_z_1458</ID>
  20732. <String>Webglimpse 2.xx.x (http://webglimpse.net)</String>
  20733. <Description>Webglimpse search engine software</Description>
  20734. <Type>R</Type>
  20735. <Comment></Comment>
  20736. <Link1>http://www.webglimpse.net/</Link1>
  20737. <Link2></Link2>
  20738. </user-agent>
  20739. <user-agent>
  20740. <ID>id_t_z_150306_2</ID>
  20741. <String>webGobbler/1.x.x</String>
  20742. <Description>webGobbler - Online random image generator</Description>
  20743. <Type>R D</Type>
  20744. <Comment></Comment>
  20745. <Link1>http://sebsauvage.net/webgobbler/</Link1>
  20746. <Link2></Link2>
  20747. </user-agent>
  20748. <user-agent>
  20749. <ID>id_t_z_1459</ID>
  20750. <String>webhack</String>
  20751. <Description>fake ?</Description>
  20752. <Type></Type>
  20753. <Comment></Comment>
  20754. <Link1></Link1>
  20755. <Link2></Link2>
  20756. </user-agent>
  20757. <user-agent>
  20758. <ID>id_t_z_290807_2</ID>
  20759. <String>WebImages 0.3 ( http://herbert.groot.jebbink.nl/?app=WebImages )</String>
  20760. <Description>herbert.groot.jebbink.nl Web Images collage generator</Description>
  20761. <Type>D</Type>
  20762. <Comment>212.204.217.1xx</Comment>
  20763. <Link1>http://herbert.groot.jebbink.nl/</Link1>
  20764. <Link2></Link2>
  20765. </user-agent>
  20766. <user-agent>
  20767. <ID>id_t_z_280306_2</ID>
  20768. <String>WebLight/4.x.x (support@illumit.com; http://www.illumit.com/Products/weblight/)</String>
  20769. <Description>WebLight web analyzer &amp; link checker</Description>
  20770. <Type>C</Type>
  20771. <Comment>s. also Mozilla/4.0 (compatible; MSIE 6.0; Windows 98; support@illumit.com...</Comment>
  20772. <Link1>http://www.illumit.com/Products/weblight/</Link1>
  20773. <Link2></Link2>
  20774. </user-agent>
  20775. <user-agent>
  20776. <ID>id_t_z_1460</ID>
  20777. <String>Weblink's checker/</String>
  20778. <Description>WebLink's link management system for HTTP- FTP and Mail hyperlinks</Description>
  20779. <Type>C</Type>
  20780. <Comment>sometimes in conjunction w. PHP/4.0.6</Comment>
  20781. <Link1>http://www.harlequin.ch/technologien/tools/weblinks.php</Link1>
  20782. <Link2></Link2>
  20783. </user-agent>
  20784. <user-agent>
  20785. <ID>id_t_z_140307_1</ID>
  20786. <String>Weblog Attitude Diffusion 1.0</String>
  20787. <Description>Los Alamos National Laboratory weblog research project</Description>
  20788. <Type>R</Type>
  20789. <Comment></Comment>
  20790. <Link1>http://www.user-agents.org/agents/weblogattitude.shtml</Link1>
  20791. <Link2>http://www.lanl.gov/</Link2>
  20792. </user-agent>
  20793. <user-agent>
  20794. <ID>id_t_z_230606_1</ID>
  20795. <String>webmeasurement-bot&#44; http://rvs.informatik.uni-leipzig.de</String>
  20796. <Description>Unknown robot from Leipzig University (Germany) faculty for computer science</Description>
  20797. <Type>R</Type>
  20798. <Comment>139.18.38.1xx</Comment>
  20799. <Link1>http://rvs.informatik.uni-leipzig.de/</Link1>
  20800. <Link2></Link2>
  20801. </user-agent>
  20802. <user-agent>
  20803. <ID>id_t_z_1461</ID>
  20804. <String>WebMiner/x.x [en] (Win98; I)</String>
  20805. <Description>WebMiner bulk file downloader</Description>
  20806. <Type>D</Type>
  20807. <Comment></Comment>
  20808. <Link1>http://tribolic.com/webminer/</Link1>
  20809. <Link2></Link2>
  20810. </user-agent>
  20811. <user-agent>
  20812. <ID>id_t_z_1462</ID>
  20813. <String>WeBoX/0.xx</String>
  20814. <Description>WeBoX (Japan) - Browser and web collector</Description>
  20815. <Type>B D</Type>
  20816. <Comment></Comment>
  20817. <Link1>http://www-nishio.ise.eng.osaka-u.ac.jp/~nakamura/webox/</Link1>
  20818. <Link2></Link2>
  20819. </user-agent>
  20820. <user-agent>
  20821. <ID>id_t_z_1463</ID>
  20822. <String>WebPix 1.0 (www.netwu.com)</String>
  20823. <Description>WebPix - picture downloading tool</Description>
  20824. <Type>D</Type>
  20825. <Comment></Comment>
  20826. <Link1>http://www.netwu.com/webpix/</Link1>
  20827. <Link2></Link2>
  20828. </user-agent>
  20829. <user-agent>
  20830. <ID>id_t_z_1464</ID>
  20831. <String>WebQL</String>
  20832. <Description>Caesius WebQL - Custom robot/agent generator / web extraction software</Description>
  20833. <Type>B D</Type>
  20834. <Comment></Comment>
  20835. <Link1>http://www.caesius.com/</Link1>
  20836. <Link2></Link2>
  20837. </user-agent>
  20838. <user-agent>
  20839. <ID>id_t_z_1465</ID>
  20840. <String>WebRACE/1.1 (University of Cyprus- Distributed Crawler)</String>
  20841. <Description>WebRACE - HTTP retrieval- annotation and caching engine</Description>
  20842. <Type>P</Type>
  20843. <Comment></Comment>
  20844. <Link1>http://www.cs.ucy.ac.cy/Projects/eRACE/webrace.html</Link1>
  20845. <Link2></Link2>
  20846. </user-agent>
  20847. <user-agent>
  20848. <ID>id_t_z_130907_1</ID>
  20849. <String>WebRankSpider/1.37 (+http://ulm191.server4you.de/crawler/)</String>
  20850. <Description>WebRankSpider experimental web crawler</Description>
  20851. <Type>R</Type>
  20852. <Comment>62.75.202.1xx</Comment>
  20853. <Link1>http://ulm191.server4you.de/crawler/</Link1>
  20854. <Link2></Link2>
  20855. </user-agent>
  20856. <user-agent>
  20857. <ID>id_t_z_1468</ID>
  20858. <String>WebReaper vx.x - www.webreaper.net</String>
  20859. <Description>Webreaper download manager</Description>
  20860. <Type>D</Type>
  20861. <Comment></Comment>
  20862. <Link1>http://www.webreaper.net/</Link1>
  20863. <Link2></Link2>
  20864. </user-agent>
  20865. <user-agent>
  20866. <ID>id_t_z_1466</ID>
  20867. <String>WebReaper [info@webreaper.net]</String>
  20868. <Description>Webreaper download manager</Description>
  20869. <Type>D</Type>
  20870. <Comment></Comment>
  20871. <Link1>http://www.webreaper.net/</Link1>
  20872. <Link2></Link2>
  20873. </user-agent>
  20874. <user-agent>
  20875. <ID>id_t_z_1467</ID>
  20876. <String>WebReaper [webreaper@webreaper.net]</String>
  20877. <Description>Webreaper download manager</Description>
  20878. <Type>D</Type>
  20879. <Comment></Comment>
  20880. <Link1>http://www.webreaper.net/</Link1>
  20881. <Link2></Link2>
  20882. </user-agent>
  20883. <user-agent>
  20884. <ID>id_t_z_1469</ID>
  20885. <String>WebSearch.COM.AU/3.0.1 (The Australian Search Engine; http://WebSearch.COM.AU; Search@WebSearch.COM.AU)</String>
  20886. <Description>Websearch Australia robot</Description>
  20887. <Type>R</Type>
  20888. <Comment></Comment>
  20889. <Link1>http://WebSearch.COM.AU/</Link1>
  20890. <Link2></Link2>
  20891. </user-agent>
  20892. <user-agent>
  20893. <ID>id_t_z_1470</ID>
  20894. <String>WebSearchBench WebCrawler v0.1(Experimental)</String>
  20895. <Description>Dortmund University WebSearchBench - Open source search software</Description>
  20896. <Type>R</Type>
  20897. <Comment></Comment>
  20898. <Link1>http://websearchbench.cs.uni-dortmund.de/websearch/about.html.de</Link1>
  20899. <Link2></Link2>
  20900. </user-agent>
  20901. <user-agent>
  20902. <ID>id_t_z_1471</ID>
  20903. <String>WebSearchBench WebCrawler V1.0 (Beta)- Prof. Dr.-Ing. Christoph Lindemann- Universit&#228;t Dortmund- cl@cs.uni-dortmund.de- http://websearchbench.cs.uni-dortmund.de/</String>
  20904. <Description>Dortmund University WebSearchBench - Open source search software</Description>
  20905. <Type>R</Type>
  20906. <Comment></Comment>
  20907. <Link1>http://websearchbench.cs.uni-dortmund.de/websearch/about.html.de</Link1>
  20908. <Link2></Link2>
  20909. </user-agent>
  20910. <user-agent>
  20911. <ID>id_t_z_260806_2</ID>
  20912. <String>Website Explorer/0.9.x.x</String>
  20913. <Description>Web site downloading tool and offline browser (Japan)</Description>
  20914. <Type>D</Type>
  20915. <Comment></Comment>
  20916. <Link1>http://www.umechando.com/webex/</Link1>
  20917. <Link2></Link2>
  20918. </user-agent>
  20919. <user-agent>
  20920. <ID>id_t_z_1472</ID>
  20921. <String>Website eXtractor</String>
  20922. <Description>Website eXtractor web site downloading tool</Description>
  20923. <Type>D</Type>
  20924. <Comment></Comment>
  20925. <Link1>http://www.asona.org/</Link1>
  20926. <Link2>http://www.internet-soft.com/</Link2>
  20927. </user-agent>
  20928. <user-agent>
  20929. <ID>id_t_z_090606_1</ID>
  20930. <String>WebsiteWorth v1.0</String>
  20931. <Description>Sootle web directory Website Worth ranking tool</Description>
  20932. <Type>R</Type>
  20933. <Comment>216.89.111.x</Comment>
  20934. <Link1>http://directory.sootle.com/website-worth/</Link1>
  20935. <Link2></Link2>
  20936. </user-agent>
  20937. <user-agent>
  20938. <ID>id_t_z_1473</ID>
  20939. <String>Webspinne/1.0 webmaster@webspinne.de</String>
  20940. <Description>Webspinne.de robot</Description>
  20941. <Type>R</Type>
  20942. <Comment></Comment>
  20943. <Link1>http://www.webspinne.de/</Link1>
  20944. <Link2></Link2>
  20945. </user-agent>
  20946. <user-agent>
  20947. <ID>id_t_z_1474</ID>
  20948. <String>Websquash.com (Add url robot)</String>
  20949. <Description>Websquash.com Search Engine robot / link checking</Description>
  20950. <Type>R</Type>
  20951. <Comment></Comment>
  20952. <Link1>http://www.websquash.com/</Link1>
  20953. <Link2></Link2>
  20954. </user-agent>
  20955. <user-agent>
  20956. <ID>id_t_z_1475</ID>
  20957. <String>WebStat/1.0 (Unix; beta; 20040314)</String>
  20958. <Description>WebStat - Java statistical computing environment for the web</Description>
  20959. <Type>R</Type>
  20960. <Comment></Comment>
  20961. <Link1>http://www.math.psu.edu/babcock/webstat/version1.0/</Link1>
  20962. <Link2></Link2>
  20963. </user-agent>
  20964. <user-agent>
  20965. <ID>id_t_z_091006_2</ID>
  20966. <String>Webster v0.3 ( http://webster.healeys.net/ )</String>
  20967. <Description>Webster - Rev. Healeys web crawler</Description>
  20968. <Type>R</Type>
  20969. <Comment>24.99.22.xx</Comment>
  20970. <Link1>http://webster.healeys.net/</Link1>
  20971. <Link2>http://webster.healeys.net/search.php</Link2>
  20972. </user-agent>
  20973. <user-agent>
  20974. <ID>id_t_z_1476</ID>
  20975. <String>webster-internet.de pad browser</String>
  20976. <Description>Websters Webmaster Archive (Germany) submission / pad checking</Description>
  20977. <Type>C B</Type>
  20978. <Comment></Comment>
  20979. <Link1>http://webster.de/</Link1>
  20980. <Link2></Link2>
  20981. </user-agent>
  20982. <user-agent>
  20983. <ID>id_t_z_1477</ID>
  20984. <String>WebStripper/2.xx</String>
  20985. <Description>WebStripper download manager</Description>
  20986. <Type>D</Type>
  20987. <Comment></Comment>
  20988. <Link1>http://webstripper.net/index.html</Link1>
  20989. <Link2>http://www.netidea.it</Link2>
  20990. </user-agent>
  20991. <user-agent>
  20992. <ID>id_t_z_1478</ID>
  20993. <String>WebTrafficExpress/x.0</String>
  20994. <Description>WebTrafficExpress IBM server software</Description>
  20995. <Type>P</Type>
  20996. <Comment></Comment>
  20997. <Link1></Link1>
  20998. <Link2></Link2>
  20999. </user-agent>
  21000. <user-agent>
  21001. <ID>id_t_z_1479</ID>
  21002. <String>WebTrends/3.0 (WinNT)</String>
  21003. <Description>Web Trends link analyzer</Description>
  21004. <Type>C</Type>
  21005. <Comment></Comment>
  21006. <Link1>http://www.netiq.com/webtrends/default.asp</Link1>
  21007. <Link2></Link2>
  21008. </user-agent>
  21009. <user-agent>
  21010. <ID>id_t_z_1480</ID>
  21011. <String>WebVac (webmaster@pita.stanford.edu)</String>
  21012. <Description>The Stanford WebBase Project crawler</Description>
  21013. <Type>R</Type>
  21014. <Comment>ex Pita- s. there</Comment>
  21015. <Link1>http://www-diglib.stanford.edu/~testbed/doc2/WebBase/</Link1>
  21016. <Link2></Link2>
  21017. </user-agent>
  21018. <user-agent>
  21019. <ID>id_t_z_1481</ID>
  21020. <String>WebVal/1.0</String>
  21021. <Description>webval - Python link checking tool</Description>
  21022. <Type>C</Type>
  21023. <Comment></Comment>
  21024. <Link1>http://www.alcyone.com/pyos/webval/</Link1>
  21025. <Link2></Link2>
  21026. </user-agent>
  21027. <user-agent>
  21028. <ID>id_t_z_171205_3</ID>
  21029. <String>Webverzeichnis.de - Telefon: 01908 / 26005</String>
  21030. <Description>Webverzeichnis.de (Germany) directory robot</Description>
  21031. <Type>R</Type>
  21032. <Comment></Comment>
  21033. <Link1>http://www.webverzeichnis.de/</Link1>
  21034. <Link2></Link2>
  21035. </user-agent>
  21036. <user-agent>
  21037. <ID>id_t_z_060306_1</ID>
  21038. <String>WebVulnCrawl.unknown/1.0 libwww-perl/5.803</String>
  21039. <Description>Web Vulnerability Crawler</Description>
  21040. <Type>S</Type>
  21041. <Comment>Looking for excluded directories in robots.txt</Comment>
  21042. <Link1>http://webvulncrawl.blogspot.com/2005/12/what-am-i-doing.html</Link1>
  21043. <Link2></Link2>
  21044. </user-agent>
  21045. <user-agent>
  21046. <ID>id_t_z_1482</ID>
  21047. <String>WebWatcherMonitor/2.01</String>
  21048. <Description>Studio Net.Idea's Web Watcher Monitor robot</Description>
  21049. <Type>R C</Type>
  21050. <Comment></Comment>
  21051. <Link1>http://www.web-watcher.com/web-watcher-monitor.html</Link1>
  21052. <Link2></Link2>
  21053. </user-agent>
  21054. <user-agent>
  21055. <ID>id_t_z_1483</ID>
  21056. <String>WebZIP/x.x (http://www.spidersoft.com)</String>
  21057. <Description>WebZip offline browser</Description>
  21058. <Type>B D</Type>
  21059. <Comment></Comment>
  21060. <Link1>http://www.spidersoft.com/</Link1>
  21061. <Link2></Link2>
  21062. </user-agent>
  21063. <user-agent>
  21064. <ID>id_t_z_1484</ID>
  21065. <String>Wells Search II</String>
  21066. <Description>Unknown spam bot / harvester (62.163.**.** / 62.194.**.*)</Description>
  21067. <Type>S</Type>
  21068. <Comment>s.also - Port Huron Labs</Comment>
  21069. <Link1></Link1>
  21070. <Link2></Link2>
  21071. </user-agent>
  21072. <user-agent>
  21073. <ID>id_t_z_1485</ID>
  21074. <String>WEP Search 00</String>
  21075. <Description>Some spam bot- see link</Description>
  21076. <Type>S</Type>
  21077. <Comment></Comment>
  21078. <Link1>http://www.kloth.net/internet/badbots-2004.php</Link1>
  21079. <Link2></Link2>
  21080. </user-agent>
  21081. <user-agent>
  21082. <ID>id_t_z_230606_2</ID>
  21083. <String>West Wind Internet Protocols 4.xx</String>
  21084. <Description>wwIPStuff - Internet client tools for Visual FoxPro</Description>
  21085. <Type>B D</Type>
  21086. <Comment></Comment>
  21087. <Link1>http://www.west-wind.com/wwipstuff.asp</Link1>
  21088. <Link2></Link2>
  21089. </user-agent>
  21090. <user-agent>
  21091. <ID>id_t_z_1486</ID>
  21092. <String>WFARC</String>
  21093. <Description>IBM's Almaden Research robot (Clever search project)</Description>
  21094. <Type>R</Type>
  21095. <Comment>s. also: - http://www.almaden.ibm.com/cs/crawler - FocusedSampler</Comment>
  21096. <Link1>http://www.almaden.ibm.com/cs/k53/clever.html</Link1>
  21097. <Link2></Link2>
  21098. </user-agent>
  21099. <user-agent>
  21100. <ID>id_t_z_1488</ID>
  21101. <String>Wget/1.x(.x)GNU wget http://www.gnu.org/software/wget/wget.html - file downloader</String>
  21102. <Description>GNU wget - file downloader</Description>
  21103. <Type>D</Type>
  21104. <Comment></Comment>
  21105. <Link1>http://www.gnu.org/software/wget/wget.html</Link1>
  21106. <Link2></Link2>
  21107. </user-agent>
  21108. <user-agent>
  21109. <ID>id_t_z_1489</ID>
  21110. <String>Wget/1.x+cvs-stable (Red Hat modified)</String>
  21111. <Description>GNU wget - file downloader</Description>
  21112. <Type>D</Type>
  21113. <Comment></Comment>
  21114. <Link1>http://www.gnu.org/software/wget/wget.html</Link1>
  21115. <Link2></Link2>
  21116. </user-agent>
  21117. <user-agent>
  21118. <ID>id_t_z_1487</ID>
  21119. <String>Wget/1.x.x+cvs</String>
  21120. <Description>GNU wget - file downloader</Description>
  21121. <Type>D</Type>
  21122. <Comment></Comment>
  21123. <Link1>http://www.gnu.org/software/wget/wget.html</Link1>
  21124. <Link2></Link2>
  21125. </user-agent>
  21126. <user-agent>
  21127. <ID>id_t_z_1490</ID>
  21128. <String>Whatsup/x.x</String>
  21129. <Description>Whatsup Gold network monitor</Description>
  21130. <Type>C</Type>
  21131. <Comment></Comment>
  21132. <Link1>http://www.ipswitch.com/products/network-management.html</Link1>
  21133. <Link2></Link2>
  21134. </user-agent>
  21135. <user-agent>
  21136. <ID>id_t_z_1491</ID>
  21137. <String>whatUseek_winona/3.0</String>
  21138. <Description>WhatUSeek / Chubba robot</Description>
  21139. <Type>R</Type>
  21140. <Comment>166.90.205.x</Comment>
  21141. <Link1>http://www.whatuseek.com/</Link1>
  21142. <Link2></Link2>
  21143. </user-agent>
  21144. <user-agent>
  21145. <ID>id_t_z_1492</ID>
  21146. <String>WhizBang! Lab</String>
  21147. <Description>WhizBang! Labs (closed since May 2002) information extraction robot</Description>
  21148. <Type>R</Type>
  21149. <Comment></Comment>
  21150. <Link1></Link1>
  21151. <Link2></Link2>
  21152. </user-agent>
  21153. <user-agent>
  21154. <ID>id_t_z_1493</ID>
  21155. <String>Wildsoft Surfer</String>
  21156. <Description>some download agent</Description>
  21157. <Type>D</Type>
  21158. <Comment>- in conjunction w. dlman</Comment>
  21159. <Link1></Link1>
  21160. <Link2></Link2>
  21161. </user-agent>
  21162. <user-agent>
  21163. <ID>id_t_z_1494</ID>
  21164. <String>Willow Internet Crawler by Twotrees V2.1</String>
  21165. <Description>Twotrees crawler</Description>
  21166. <Type>R</Type>
  21167. <Comment></Comment>
  21168. <Link1>http://www.twotrees.com/</Link1>
  21169. <Link2></Link2>
  21170. </user-agent>
  21171. <user-agent>
  21172. <ID>id_t_z_1495</ID>
  21173. <String>WinampMPEG/2.00 (larbin@unspecified.mail)</String>
  21174. <Description>unknown robot from gw.ocg-corp.com (209.126.176.x)</Description>
  21175. <Type></Type>
  21176. <Comment>see also: - Opera/6.01 (larbin@.....) - MSIE-5.13 larbin@....</Comment>
  21177. <Link1></Link1>
  21178. <Link2></Link2>
  21179. </user-agent>
  21180. <user-agent>
  21181. <ID>id_t_z_1496</ID>
  21182. <String>WincerSong Agent v1.0</String>
  21183. <Description>Super Affiliate Tracker agent by Wincer Song</Description>
  21184. <Type></Type>
  21185. <Comment></Comment>
  21186. <Link1>http://www.superaffiliatetracker.com/index.htm</Link1>
  21187. <Link2></Link2>
  21188. </user-agent>
  21189. <user-agent>
  21190. <ID>id_t_z_191105_3</ID>
  21191. <String>Windows-Media-Player/10.00.00.xxxx</String>
  21192. <Description>Windows Media Player 10</Description>
  21193. <Type>B</Type>
  21194. <Comment></Comment>
  21195. <Link1></Link1>
  21196. <Link2></Link2>
  21197. </user-agent>
  21198. <user-agent>
  21199. <ID>id_t_z_160107_1</ID>
  21200. <String>WinGet 1.1</String>
  21201. <Description>Nicksoft WinGet download manager</Description>
  21202. <Type>D</Type>
  21203. <Comment>Domain is for sale</Comment>
  21204. <Link1></Link1>
  21205. <Link2></Link2>
  21206. </user-agent>
  21207. <user-agent>
  21208. <ID>id_t_z_060406_1</ID>
  21209. <String>WinHTTP Example/1.0</String>
  21210. <Description>Example code for a WinHTTP C++ library crawler</Description>
  21211. <Type>R</Type>
  21212. <Comment></Comment>
  21213. <Link1>http://www.codeguru.com/cpp/i-n/internet/http/article.php/c6237/</Link1>
  21214. <Link2>http://www.microsoft.com/msdownload/platformsdk/sdkupdate/update.htm</Link2>
  21215. </user-agent>
  21216. <user-agent>
  21217. <ID>id_t_z_260506_1</ID>
  21218. <String>WinkBot/0.06 (Wink.com search engine web crawler; http://www.wink.com/Wink:WinkBot; winkbot@wink.com)</String>
  21219. <Description>Wink beta search robot (64.13.136.x)</Description>
  21220. <Type>R</Type>
  21221. <Comment></Comment>
  21222. <Link1>http://www.wink.com/</Link1>
  21223. <Link2></Link2>
  21224. </user-agent>
  21225. <user-agent>
  21226. <ID>id_t_z_010607_1</ID>
  21227. <String>WinPodder (http://winpodder.com)</String>
  21228. <Description>WinPodder - Podcast player and RSS reader</Description>
  21229. <Type>B</Type>
  21230. <Comment></Comment>
  21231. <Link1>http://winpodder.com/</Link1>
  21232. <Link2></Link2>
  21233. </user-agent>
  21234. <user-agent>
  21235. <ID>id_t_z_251105_1</ID>
  21236. <String>WinWAP/3.x (3.x.x.xx; Win32) (Google WAP Proxy/1.0)</String>
  21237. <Description>WinWap - Windows PC WAP browser</Description>
  21238. <Type>B</Type>
  21239. <Comment></Comment>
  21240. <Link1>http://www.winwap.com/products_2_1.php</Link1>
  21241. <Link2></Link2>
  21242. </user-agent>
  21243. <user-agent>
  21244. <ID>id_t_z_111206_2</ID>
  21245. <String>Wir sind die Borg (Version: 1.03&#44; Sie wurden Assimiliert +http://www.yammba.com/suchmaschine/bot.html)</String>
  21246. <Description>Yammba web directory (Germany) link checking</Description>
  21247. <Type>C</Type>
  21248. <Comment></Comment>
  21249. <Link1>http://www.yammba.com/</Link1>
  21250. <Link2></Link2>
  21251. </user-agent>
  21252. <user-agent>
  21253. <ID>id_t_z_130506_2</ID>
  21254. <String>WIRE/0.11 (Linux; i686; Bot&#44;Robot&#44;Spider&#44;Crawler&#44;aromano@cli.di.unipi.it)</String>
  21255. <Description>WIRE crawler used by the University of Pisa - Italy</Description>
  21256. <Type>R</Type>
  21257. <Comment>146.48.82.xx</Comment>
  21258. <Link1>http://www.cwr.cl/projects/WIRE/</Link1>
  21259. <Link2>http://www.unipi.it/english/index.htm</Link2>
  21260. </user-agent>
  21261. <user-agent>
  21262. <ID>id_t_z_1497</ID>
  21263. <String>WIRE/0.x (Linux; i686; Bot&#44;Robot&#44;Spider&#44;Crawler)</String>
  21264. <Description>WIRE - Web information retrieval environment crawler</Description>
  21265. <Type>R</Type>
  21266. <Comment>Used by different IPs for different purposes</Comment>
  21267. <Link1>http://www.cwr.cl/projects/WIRE/</Link1>
  21268. <Link2></Link2>
  21269. </user-agent>
  21270. <user-agent>
  21271. <ID>id_t_z_1498</ID>
  21272. <String>WISEbot/1.0 (WISEbot@koreawisenut.com; http://wisebot.koreawisenut.com)</String>
  21273. <Description>Korea Wisenut robot</Description>
  21274. <Type>R</Type>
  21275. <Comment></Comment>
  21276. <Link1>http://www.koreawisenut.com/</Link1>
  21277. <Link2></Link2>
  21278. </user-agent>
  21279. <user-agent>
  21280. <ID>id_t_z_1499</ID>
  21281. <String>WiseWire-Spider2</String>
  21282. <Description>Wisewire domain checker (Discontinued)</Description>
  21283. <Type>R C</Type>
  21284. <Comment></Comment>
  21285. <Link1>http://www.wisewire.com/</Link1>
  21286. <Link2></Link2>
  21287. </user-agent>
  21288. <user-agent>
  21289. <ID>id_t_z_110107_2</ID>
  21290. <String>wish-project (http://wish.slis.tsukuba.ac.jp/)</String>
  21291. <Description>WISH academic research project for link checking</Description>
  21292. <Type>C</Type>
  21293. <Comment>133.51.22.xx</Comment>
  21294. <Link1>http://wish.slis.tsukuba.ac.jp/</Link1>
  21295. <Link2></Link2>
  21296. </user-agent>
  21297. <user-agent>
  21298. <ID>id_t_z_1500</ID>
  21299. <String>WordChampBot</String>
  21300. <Description>Wordchamp web page vocabulary / translation robot</Description>
  21301. <Type>B D</Type>
  21302. <Comment></Comment>
  21303. <Link1>http://www.wordchamp.com/</Link1>
  21304. <Link2></Link2>
  21305. </user-agent>
  21306. <user-agent>
  21307. <ID>id_t_z_301105_1</ID>
  21308. <String>WordPress/x.x.x.x PHP/4.x.xx</String>
  21309. <Description>WordPress personal Blog publishing platform</Description>
  21310. <Type>B</Type>
  21311. <Comment></Comment>
  21312. <Link1>http://wordpress.org/</Link1>
  21313. <Link2></Link2>
  21314. </user-agent>
  21315. <user-agent>
  21316. <ID>id_t_z_100207_1</ID>
  21317. <String>worio heritrix bot (+http://worio.com/)</String>
  21318. <Description>WORIO (beta) search for computer scientists and programmers using Heritrix open-source crawler</Description>
  21319. <Type>R</Type>
  21320. <Comment>137.82.84.xx</Comment>
  21321. <Link1>http://www.worio.com/</Link1>
  21322. <Link2>http://www.archive.org/</Link2>
  21323. </user-agent>
  21324. <user-agent>
  21325. <ID>id_t_z_291007_1</ID>
  21326. <String>woriobot ( http://www.worio.com/)</String>
  21327. <Description>WORIO (beta) search for computer scientists and programmers via Amazon Web Services</Description>
  21328. <Type>R</Type>
  21329. <Comment>67.202.45.2xx</Comment>
  21330. <Link1>http://www.worio.com/</Link1>
  21331. <Link2>http://www.amazon.com/gp/browse.html?node=3435361</Link2>
  21332. </user-agent>
  21333. <user-agent>
  21334. <ID>id_t_z_1501</ID>
  21335. <String>WorldLight</String>
  21336. <Description>Entireweb Search robot (62.13.25.xxx)</Description>
  21337. <Type>R</Type>
  21338. <Comment>s. also Mozilla/4.0 (compatible; SpeedySpider ....</Comment>
  21339. <Link1>http://www.entireweb.com/</Link1>
  21340. <Link2></Link2>
  21341. </user-agent>
  21342. <user-agent>
  21343. <ID>id_t_z_1502</ID>
  21344. <String>WorQmada/1.0</String>
  21345. <Description>unknown link checking (from 4.18.57.126) ?</Description>
  21346. <Type>C</Type>
  21347. <Comment></Comment>
  21348. <Link1></Link1>
  21349. <Link2></Link2>
  21350. </user-agent>
  21351. <user-agent>
  21352. <ID>id_t_z_1503</ID>
  21353. <String>Wotbox/alpha0.6 (bot@wotbox.com; http://www.wotbox.com)</String>
  21354. <Description>Wotbox spider</Description>
  21355. <Type>R</Type>
  21356. <Comment></Comment>
  21357. <Link1>http://www.wotbox.com/</Link1>
  21358. <Link2></Link2>
  21359. </user-agent>
  21360. <user-agent>
  21361. <ID>id_t_z_1504</ID>
  21362. <String>Wotbox/alpha0.x.x (bot@wotbox.com; http://www.wotbox.com) Java/1.4.1_02</String>
  21363. <Description>Wotbox spider</Description>
  21364. <Type>R</Type>
  21365. <Comment></Comment>
  21366. <Link1>http://www.wotbox.com/</Link1>
  21367. <Link2></Link2>
  21368. </user-agent>
  21369. <user-agent>
  21370. <ID>id_t_z_1505</ID>
  21371. <String>WSB WebCrawler V1.0 (Beta)- cl@cs.uni-dortmund.de</String>
  21372. <Description>WebSearchBench crawler from Dortmund University- Germany</Description>
  21373. <Type>R</Type>
  21374. <Comment></Comment>
  21375. <Link1>http://websearchbench.cs.uni-dortmund.de/</Link1>
  21376. <Link2></Link2>
  21377. </user-agent>
  21378. <user-agent>
  21379. <ID>id_t_z_1506</ID>
  21380. <String>WSB&#44; http://websearchbench.cs.uni-dortmund.de</String>
  21381. <Description>WebSearchBench crawler from Dortmund University- Germany</Description>
  21382. <Type>R</Type>
  21383. <Comment></Comment>
  21384. <Link1>http://websearchbench.cs.uni-dortmund.de/</Link1>
  21385. <Link2></Link2>
  21386. </user-agent>
  21387. <user-agent>
  21388. <ID>id_t_z_1507</ID>
  21389. <String>wume_crawler/1.1 (http://wume.cse.lehigh.edu/~xiq204/crawler/)</String>
  21390. <Description>WUME Lab's web crawler (128.180.121.xxx)</Description>
  21391. <Type>R</Type>
  21392. <Comment></Comment>
  21393. <Link1>http://wume.cse.lehigh.edu/~xiq204/crawler/</Link1>
  21394. <Link2></Link2>
  21395. </user-agent>
  21396. <user-agent>
  21397. <ID>id_t_z_1508</ID>
  21398. <String>Wusage/x.0@boutell.com</String>
  21399. <Description>Wusage log-file analysis</Description>
  21400. <Type>R C</Type>
  21401. <Comment></Comment>
  21402. <Link1>http://www.boutell.com/wusage/</Link1>
  21403. <Link2></Link2>
  21404. </user-agent>
  21405. <user-agent>
  21406. <ID>id_t_z_120106_2</ID>
  21407. <String>Wwlib/Linux</String>
  21408. <Description>WWLib - Wolverhampton University Web Library for classifying web documents</Description>
  21409. <Type>R</Type>
  21410. <Comment></Comment>
  21411. <Link1>http://www.scit.wlv.ac.uk/wwlib/</Link1>
  21412. <Link2></Link2>
  21413. </user-agent>
  21414. <user-agent>
  21415. <ID>id_t_z_1509</ID>
  21416. <String>WWSBOT 1.x [--- http://www.analyzer.nu ---]</String>
  21417. <Description>WWSBOT web server version checker</Description>
  21418. <Type>C</Type>
  21419. <Comment></Comment>
  21420. <Link1>http://www.analyzer.nu/Perl/WWSBOT.html</Link1>
  21421. <Link2></Link2>
  21422. </user-agent>
  21423. <user-agent>
  21424. <ID>id_t_z_170506_2</ID>
  21425. <String>WWW-Mechanize/1.1x</String>
  21426. <Description>Perl web page fetching module</Description>
  21427. <Type>D</Type>
  21428. <Comment></Comment>
  21429. <Link1>http://search.cpan.org/dist/WWW-Mechanize/</Link1>
  21430. <Link2></Link2>
  21431. </user-agent>
  21432. <user-agent>
  21433. <ID>id_t_z_1510</ID>
  21434. <String>www.arianna.it</String>
  21435. <Description>Arianna robot</Description>
  21436. <Type>R</Type>
  21437. <Comment></Comment>
  21438. <Link1>http://arianna.libero.it/</Link1>
  21439. <Link2></Link2>
  21440. </user-agent>
  21441. <user-agent>
  21442. <ID>id_t_z_1511</ID>
  21443. <String>www.business-socket.com registry verify/1.x</String>
  21444. <Description>Business-Socket.com link checking ?</Description>
  21445. <Type>C</Type>
  21446. <Comment></Comment>
  21447. <Link1>http://www.business-socket.com</Link1>
  21448. <Link2></Link2>
  21449. </user-agent>
  21450. <user-agent>
  21451. <ID>id_t_z_221006_2</ID>
  21452. <String>www.doweb.co.uk crawler</String>
  21453. <Description>The DoWeb UK Business directory link checking</Description>
  21454. <Type>C</Type>
  21455. <Comment>85.13.252.x</Comment>
  21456. <Link1>http://www.doweb.co.uk/action_home+page.htm</Link1>
  21457. <Link2></Link2>
  21458. </user-agent>
  21459. <user-agent>
  21460. <ID>id_t_z_1512</ID>
  21461. <String>www4mail/2.x libwww-FM/2.14 (Unix; I)</String>
  21462. <Description>www4mail - web navigation &amp; database search by e-mail</Description>
  21463. <Type></Type>
  21464. <Comment></Comment>
  21465. <Link1>http://www4mail.org/</Link1>
  21466. <Link2></Link2>
  21467. </user-agent>
  21468. <user-agent>
  21469. <ID>id_t_z_1513</ID>
  21470. <String>WWWC/1.0x</String>
  21471. <Description>WWWC Updating check of Web pages. (Japanese only)</Description>
  21472. <Type>C</Type>
  21473. <Comment></Comment>
  21474. <Link1>http://www.nakka.com/soft/index_eng.html</Link1>
  21475. <Link2></Link2>
  21476. </user-agent>
  21477. <user-agent>
  21478. <ID>id_t_z_1514</ID>
  21479. <String>WWWeasel Robot v1.00 (http://wwweasel.de)</String>
  21480. <Description>World Wide Weasel Germany robot</Description>
  21481. <Type>R</Type>
  21482. <Comment></Comment>
  21483. <Link1>http://wwweasel.de/</Link1>
  21484. <Link2></Link2>
  21485. </user-agent>
  21486. <user-agent>
  21487. <ID>id_t_z_1515</ID>
  21488. <String>WWWOFFLE/2.x</String>
  21489. <Description>WWWoffle download manager</Description>
  21490. <Type>D</Type>
  21491. <Comment></Comment>
  21492. <Link1>http://www.gedanken.demon.co.uk/wwwoffle/</Link1>
  21493. <Link2></Link2>
  21494. </user-agent>
  21495. <user-agent>
  21496. <ID>id_t_z_1516</ID>
  21497. <String>wwwster/1.x (Beta- mailto:gue@cis.uni-muenchen.de)</String>
  21498. <Description>Unknown robot from CIS at Munich University</Description>
  21499. <Type>R</Type>
  21500. <Comment>129.187.254.xxx</Comment>
  21501. <Link1>http://www.cis.uni-muenchen.de/</Link1>
  21502. <Link2></Link2>
  21503. </user-agent>
  21504. <user-agent>
  21505. <ID>id_t_z_050208_5</ID>
  21506. <String>wxDownload Fast</String>
  21507. <Description>wxDownload Fast (wxDFast) open source download manager</Description>
  21508. <Type>D</Type>
  21509. <Comment></Comment>
  21510. <Link1>http://dfast.sourceforge.net/index.html</Link1>
  21511. <Link2></Link2>
  21512. </user-agent>
  21513. <user-agent>
  21514. <ID>id_t_z_1517</ID>
  21515. <String>X-Crawler </String>
  21516. <Description>Arexera (Germany) crawler software</Description>
  21517. <Type>R</Type>
  21518. <Comment></Comment>
  21519. <Link1>http://www.arexera.de/de/products/crawler.php</Link1>
  21520. <Link2></Link2>
  21521. </user-agent>
  21522. <user-agent>
  21523. <ID>id_t_z_1518</ID>
  21524. <String>Xaldon WebSpider</String>
  21525. <Description>Xaldon WebSpider offline browser</Description>
  21526. <Type>B D</Type>
  21527. <Comment></Comment>
  21528. <Link1>http://www.xaldon.de/produkte_webspider.html</Link1>
  21529. <Link2></Link2>
  21530. </user-agent>
  21531. <user-agent>
  21532. <ID>id_t_z_1519</ID>
  21533. <String>Xenu Link Sleuth 1.xx</String>
  21534. <Description>Xenu link checker</Description>
  21535. <Type>C</Type>
  21536. <Comment></Comment>
  21537. <Link1>http://home.snafu.de/tilman/xenulink.html</Link1>
  21538. <Link2></Link2>
  21539. </user-agent>
  21540. <user-agent>
  21541. <ID>id_t_z_1520</ID>
  21542. <String>Xenu's Link Sleuth 1.x[a-z]</String>
  21543. <Description>Xenu link checker</Description>
  21544. <Type>C</Type>
  21545. <Comment></Comment>
  21546. <Link1>http://home.snafu.de/tilman/xenulink.html</Link1>
  21547. <Link2></Link2>
  21548. </user-agent>
  21549. <user-agent>
  21550. <ID>id_t_z_270706_2</ID>
  21551. <String>Xerka WebBot v1.0.0 [UPVOpenDir]</String>
  21552. <Description>XerKa text mining and information retrieval software</Description>
  21553. <Type>D</Type>
  21554. <Comment></Comment>
  21555. <Link1>http://www.diana-teknologia.com/www1/english/xerka.htm</Link1>
  21556. <Link2></Link2>
  21557. </user-agent>
  21558. <user-agent>
  21559. <ID>id_t_z_250106_2</ID>
  21560. <String>xine/1.0</String>
  21561. <Description>xine - free Linux / OS/2 multimedia player</Description>
  21562. <Type>B</Type>
  21563. <Comment></Comment>
  21564. <Link1>http://xinehq.de/</Link1>
  21565. <Link2></Link2>
  21566. </user-agent>
  21567. <user-agent>
  21568. <ID>id_t_z_141205_3</ID>
  21569. <String>xirq/0.1-beta (xirq; http://www.xirq.com; xirq@xirq.com)</String>
  21570. <Description>XIRQ search (beta) robot (70.86.206.1xx)</Description>
  21571. <Type>R</Type>
  21572. <Comment></Comment>
  21573. <Link1>http://www.xirq.com/</Link1>
  21574. <Link2></Link2>
  21575. </user-agent>
  21576. <user-agent>
  21577. <ID>id_t_z_160806_1</ID>
  21578. <String>XMLSlurp/0.1 libwww-perl/5.805</String>
  21579. <Description>GPath / XMLSlurp - Expression language for tree structured data</Description>
  21580. <Type></Type>
  21581. <Comment></Comment>
  21582. <Link1>http://groovy.codehaus.org/GPath</Link1>
  21583. <Link2></Link2>
  21584. </user-agent>
  21585. <user-agent>
  21586. <ID>id_t_z_070506_1</ID>
  21587. <String>XRL/2.00b1 (Linux; i686; en-us) (+http://metamark.net/about)</String>
  21588. <Description>Metamark URL Shorten Service</Description>
  21589. <Type>P</Type>
  21590. <Comment></Comment>
  21591. <Link1>http://metamark.net/</Link1>
  21592. <Link2></Link2>
  21593. </user-agent>
  21594. <user-agent>
  21595. <ID>id_t_z_200308_3</ID>
  21596. <String>Xylix</String>
  21597. <Description>Xylix Retrieval System software</Description>
  21598. <Type>C</Type>
  21599. <Comment></Comment>
  21600. <Link1>http://www.xylixsoftware.ch/retrievalsystem.php</Link1>
  21601. <Link2></Link2>
  21602. </user-agent>
  21603. <user-agent>
  21604. <ID>id_t_z_1521</ID>
  21605. <String>xyro_(xcrawler@cosmos.inria.fr)</String>
  21606. <Description>Inria Crawler</Description>
  21607. <Type>R</Type>
  21608. <Comment></Comment>
  21609. <Link1>http://www.inria.fr/</Link1>
  21610. <Link2></Link2>
  21611. </user-agent>
  21612. <user-agent>
  21613. <ID>id_t_z_081205_1</ID>
  21614. <String>Y!J-BSC/1.0 (http://help.yahoo.co.jp/help/jp/search/indexing/indexing-15.html)</String>
  21615. <Description>Yahoo Search Japan robot (211.14.8.2xx)</Description>
  21616. <Type>R</Type>
  21617. <Comment>s. also Mozilla/4.0 (compatible; Y!J...</Comment>
  21618. <Link1>http://www.yahoo.co.jp/</Link1>
  21619. <Link2></Link2>
  21620. </user-agent>
  21621. <user-agent>
  21622. <ID>id_t_z_271006_2</ID>
  21623. <String>Y!J-SRD/1.0</String>
  21624. <Description>Yahoo Search Japan robot (203.216.197.xxx)</Description>
  21625. <Type>R</Type>
  21626. <Comment>s. also DoCoMo/2.0/SO502i (compatible; Y!J-SRD/1.0 ...</Comment>
  21627. <Link1>http://www.yahoo.co.jp/</Link1>
  21628. <Link2></Link2>
  21629. </user-agent>
  21630. <user-agent>
  21631. <ID>id_t_z_240106_3</ID>
  21632. <String>Y!J/1.0 (http://help.yahoo.co.jp/help/jp/search/indexing/indexing-15.html)</String>
  21633. <Description>Yahoo Search Japan robot (211.14.8.2xx)</Description>
  21634. <Type>R</Type>
  21635. <Comment>s. also Mozilla/4.0 (compatible; Y!J...</Comment>
  21636. <Link1>http://www.yahoo.co.jp/</Link1>
  21637. <Link2></Link2>
  21638. </user-agent>
  21639. <user-agent>
  21640. <ID>id_t_z_220206_2</ID>
  21641. <String>Y!OASIS/TEST no-ad Mozilla/4.08 [en] (X11; I; FreeBSD 2.2.8-STABLE i386)</String>
  21642. <Description>Yahoo picture service for mobiles</Description>
  21643. <Type>P</Type>
  21644. <Comment>217.12.4.xx</Comment>
  21645. <Link1></Link1>
  21646. <Link2></Link2>
  21647. </user-agent>
  21648. <user-agent>
  21649. <ID>id_t_z_1522</ID>
  21650. <String>Y!TunnelPro</String>
  21651. <Description>Y!TunnelPro - Yahoo! Messenger companion user agent</Description>
  21652. <Type>B</Type>
  21653. <Comment> s. YTunnelPro</Comment>
  21654. <Link1>http://www.ytunnelpro.com/</Link1>
  21655. <Link2></Link2>
  21656. </user-agent>
  21657. <user-agent>
  21658. <ID>id_t_z_121205_1</ID>
  21659. <String>yacy (www.yacy.net; v20040602; i386 Linux 2.4.26-gentoo-r13; java 1.4.2_06; MET/en)</String>
  21660. <Description>Yacy distributed P2P web search engine robot</Description>
  21661. <Type>R</Type>
  21662. <Comment></Comment>
  21663. <Link1>http://www.yacy.net/</Link1>
  21664. <Link2></Link2>
  21665. </user-agent>
  21666. <user-agent>
  21667. <ID>id_t_z_260306_4</ID>
  21668. <String>yacybot (x86 Windows XP 5.1; java 1.5.0_06; Europe/de) yacy.net</String>
  21669. <Description>Yacy distributed P2P web search engine robot</Description>
  21670. <Type>R</Type>
  21671. <Comment></Comment>
  21672. <Link1>http://www.yacy.net/</Link1>
  21673. <Link2></Link2>
  21674. </user-agent>
  21675. <user-agent>
  21676. <ID>id_t_z_300707_2</ID>
  21677. <String>Yahoo Pipes 1.0</String>
  21678. <Description>(Yahoo) Pipes interactive data aggregator robot</Description>
  21679. <Type>R</Type>
  21680. <Comment></Comment>
  21681. <Link1>http://pipes.yahoo.com/pipes/</Link1>
  21682. <Link2></Link2>
  21683. </user-agent>
  21684. <user-agent>
  21685. <ID>id_t_z_100406_2</ID>
  21686. <String>Yahoo! Mindset</String>
  21687. <Description>Yahoo Mindset: Intent-driven Search (66.228.182.1xx)</Description>
  21688. <Type>R</Type>
  21689. <Comment>s. also Mozilla/4.0</Comment>
  21690. <Link1>http://mindset.research.yahoo.com/</Link1>
  21691. <Link2></Link2>
  21692. </user-agent>
  21693. <user-agent>
  21694. <ID>id_t_z_040106_2</ID>
  21695. <String>Yahoo-Blogs/v3.9 (compatible; Mozilla 4.0; MSIE 5.5; http://help.yahoo.com/help/us/ysearch/crawling/crawling-02.html )</String>
  21696. <Description>Yahoo blog indexing robot (209.191.83.1xx)</Description>
  21697. <Type>R</Type>
  21698. <Comment></Comment>
  21699. <Link1>http://help.yahoo.com/help/us/ysearch/crawling/crawling-02.html</Link1>
  21700. <Link2></Link2>
  21701. </user-agent>
  21702. <user-agent>
  21703. <ID>id_t_z_1523</ID>
  21704. <String>Yahoo-MMAudVid/1.0 (mms dash mmaudvidcrawler dash support at yahoo dash inc dot com)</String>
  21705. <Description>Yahoo multimedia crawler (206.190.43.xx)</Description>
  21706. <Type>R</Type>
  21707. <Comment></Comment>
  21708. <Link1></Link1>
  21709. <Link2></Link2>
  21710. </user-agent>
  21711. <user-agent>
  21712. <ID>id_t_z_080108_2</ID>
  21713. <String>Yahoo-MMAudVid/2.0(mms dash mm aud vid crawler dash support at yahoo dash inc.com ;Mozilla 4.0 compatible; MSIE 7.0;Windows NT 5.0; .NET CLR 2.0)</String>
  21714. <Description>Yahoo multimedia crawler</Description>
  21715. <Type>R</Type>
  21716. <Comment></Comment>
  21717. <Link1></Link1>
  21718. <Link2></Link2>
  21719. </user-agent>
  21720. <user-agent>
  21721. <ID>id_t_z_1524</ID>
  21722. <String>Yahoo-MMCrawler/3.x (mm dash crawler at trd dot overture dot com)</String>
  21723. <Description>Yahoo multimedia crawler via Fastsearch.net (66.77.73.xx)</Description>
  21724. <Type>R</Type>
  21725. <Comment>see also FAST-WebCrawler/3.x Multimedia...</Comment>
  21726. <Link1></Link1>
  21727. <Link2></Link2>
  21728. </user-agent>
  21729. <user-agent>
  21730. <ID>id_t_z_110806_1</ID>
  21731. <String>Yahoo-Test/4.0</String>
  21732. <Description>Yahoo Search robot</Description>
  21733. <Type>R</Type>
  21734. <Comment>216.145.49.xx</Comment>
  21735. <Link1></Link1>
  21736. <Link2></Link2>
  21737. </user-agent>
  21738. <user-agent>
  21739. <ID>id_t_z_1525</ID>
  21740. <String>Yahoo-VerticalCrawler-FormerWebCrawler/3.9 crawler at trd dot overture dot com; http://www.alltheweb.com/help/webmaster/crawler</String>
  21741. <Description>Yahoo crawler via Overture (66.77.73.3x)</Description>
  21742. <Type>R</Type>
  21743. <Comment></Comment>
  21744. <Link1></Link1>
  21745. <Link2></Link2>
  21746. </user-agent>
  21747. <user-agent>
  21748. <ID>id_t_z_010906_2</ID>
  21749. <String>YahooFeedSeeker/2.0 (compatible; Mozilla 4.0; MSIE 5.5; http://publisher.yahoo.com/rssguide)</String>
  21750. <Description>Yahoo Publisher Network RSS crawler</Description>
  21751. <Type>R</Type>
  21752. <Comment></Comment>
  21753. <Link1>http://publisher.yahoo.com/rssguide</Link1>
  21754. <Link2></Link2>
  21755. </user-agent>
  21756. <user-agent>
  21757. <ID>id_t_z_1526</ID>
  21758. <String>YahooSeeker-Testing/v3.9 (compatible; Mozilla 4.0; MSIE 5.5; http://search.yahoo.com/)</String>
  21759. <Description>Yahoo Product Search crawler ( 68.142.195.x)</Description>
  21760. <Type>R</Type>
  21761. <Comment></Comment>
  21762. <Link1></Link1>
  21763. <Link2></Link2>
  21764. </user-agent>
  21765. <user-agent>
  21766. <ID>id_t_z_1527</ID>
  21767. <String>YahooSeeker/1.0 (compatible; Mozilla 4.0; MSIE 5.5; http://help.yahoo.com/help/us/shop/merchant/)</String>
  21768. <Description>Yahoo Product Search crawler ( 66.196.93.x)</Description>
  21769. <Type>R</Type>
  21770. <Comment></Comment>
  21771. <Link1></Link1>
  21772. <Link2></Link2>
  21773. </user-agent>
  21774. <user-agent>
  21775. <ID>id_t_z_1528</ID>
  21776. <String>YahooSeeker/1.0 (compatible; Mozilla 4.0; MSIE 5.5; http://search.yahoo.com/yahooseeker.html)</String>
  21777. <Description>Yahoo Product Search crawler ( 66.196.93.x)</Description>
  21778. <Type>R</Type>
  21779. <Comment></Comment>
  21780. <Link1></Link1>
  21781. <Link2></Link2>
  21782. </user-agent>
  21783. <user-agent>
  21784. <ID>id_t_z_1529</ID>
  21785. <String>YahooSeeker/1.1 (compatible; Mozilla 4.0; MSIE 5.5; http://help.yahoo.com/help/us/shop/merchant/)</String>
  21786. <Description>Yahoo Product Search crawler ( 66.196.93.x)</Description>
  21787. <Type>R</Type>
  21788. <Comment></Comment>
  21789. <Link1></Link1>
  21790. <Link2></Link2>
  21791. </user-agent>
  21792. <user-agent>
  21793. <ID>id_t_z_1530</ID>
  21794. <String>YahooSeeker/bsv3.9 (compatible; Mozilla 4.0; MSIE 5.5; http://help.yahoo.com/help/us/ysearch/crawling/crawling-02.html )</String>
  21795. <Description>Yahoo Product Search crawler ( 68.142.195.x)</Description>
  21796. <Type>R</Type>
  21797. <Comment></Comment>
  21798. <Link1></Link1>
  21799. <Link2></Link2>
  21800. </user-agent>
  21801. <user-agent>
  21802. <ID>id_t_z_1531</ID>
  21803. <String>YahooSeeker/CafeKelsa-dev (compatible; Konqueror/3.2; FreeBSD ;cafekelsa-dev-webmaster@yahoo-inc.com )</String>
  21804. <Description>Yahoo robot</Description>
  21805. <Type>R</Type>
  21806. <Comment>64.157.137.xxx</Comment>
  21807. <Link1></Link1>
  21808. <Link2></Link2>
  21809. </user-agent>
  21810. <user-agent>
  21811. <ID>id_t_z_231106_2</ID>
  21812. <String>Yandex/1.01.001 (compatible; Win16; I)</String>
  21813. <Description>Yandex Search Russia link checking (213.180.206.2xx)</Description>
  21814. <Type>R</Type>
  21815. <Comment>s. also Mozilla/4.0 (compatible; MSIE 5.0; YANDEX)</Comment>
  21816. <Link1>http://www.yandex.ru</Link1>
  21817. <Link2></Link2>
  21818. </user-agent>
  21819. <user-agent>
  21820. <ID>id_t_z_301108_2</ID>
  21821. <String>Yanga WorldSearch Bot v1.1/beta (http://www.yanga.co.uk/)</String>
  21822. <Description>Yanga search robot by Gigabase (Russian Federation)</Description>
  21823. <Type>R</Type>
  21824. <Comment>91.205.124.x</Comment>
  21825. <Link1>http://www.yanga.co.uk/</Link1>
  21826. <Link2></Link2>
  21827. </user-agent>
  21828. <user-agent>
  21829. <ID>id_t_z_1532</ID>
  21830. <String>yarienavoir.net/0.2</String>
  21831. <Description>Yarienavoir search (Belgium) robot</Description>
  21832. <Type>R</Type>
  21833. <Comment>217.71.121.xx</Comment>
  21834. <Link1>http://www.yarienavoir.net/</Link1>
  21835. <Link2></Link2>
  21836. </user-agent>
  21837. <user-agent>
  21838. <ID>id_t_z_300506_1</ID>
  21839. <String>Yeti</String>
  21840. <Description>1noon.com search Korea robot (222.231.21.xxx)</Description>
  21841. <Type>R</Type>
  21842. <Comment>uses also a blank UA field</Comment>
  21843. <Link1>http://www.1noon.com/</Link1>
  21844. <Link2></Link2>
  21845. </user-agent>
  21846. <user-agent>
  21847. <ID>id_t_z_040407_1</ID>
  21848. <String>Yeti/0.01 (nhn/1noon&#44; yetibot@naver.com&#44; check robots.txt daily and follows it)</String>
  21849. <Description>1noon.com search Korea robot (222.231.21.xxx)</Description>
  21850. <Type>R</Type>
  21851. <Comment>uses also a blank UA field</Comment>
  21852. <Link1>http://www.1noon.com/</Link1>
  21853. <Link2></Link2>
  21854. </user-agent>
  21855. <user-agent>
  21856. <ID>id_t_z_301108_1</ID>
  21857. <String>Yeti/1.0 (NHN Corp.; http://help.naver.com/robots/)</String>
  21858. <Description>Naver search (Korea) robot</Description>
  21859. <Type>R</Type>
  21860. <Comment>61.247.222.xx</Comment>
  21861. <Link1>http://www.naver.com/</Link1>
  21862. <Link2></Link2>
  21863. </user-agent>
  21864. <user-agent>
  21865. <ID>id_t_z_290407_2</ID>
  21866. <String>yggdrasil/Nutch-0.9 (yggdrasil biorelated search engine; www dot biotec dot tu minus dresden do de slash schroeder; heiko dot dietze at biotec dot tu minus dresden dot de)</String>
  21867. <Description>yggdrasil spider for GoPubMed biorelated search engine</Description>
  21868. <Type>R</Type>
  21869. <Comment>141.30.193.x[x]</Comment>
  21870. <Link1>http://www.biotec.tu-dresden.de/schroeder</Link1>
  21871. <Link2>http://gopubmed.biotec.tu-dresden.de/</Link2>
  21872. </user-agent>
  21873. <user-agent>
  21874. <ID>id_t_z_211206_3</ID>
  21875. <String>YodaoBot/1.0 (http://www.yodao.com/help/webmaster/spider/; )</String>
  21876. <Description>Yodao search (China)</Description>
  21877. <Type>R</Type>
  21878. <Comment>60.191.80.xx</Comment>
  21879. <Link1>http://www.yodao.com/</Link1>
  21880. <Link2></Link2>
  21881. </user-agent>
  21882. <user-agent>
  21883. <ID>id_t_z_110308_1</ID>
  21884. <String>yoofind/yoofind-0.1-dev (yoono webcrawler; http://www.yoono.com ; MyEmail)</String>
  21885. <Description>Yoono - community based search (193.110.140.xxx / 194.0.179.[x]xx)</Description>
  21886. <Type>R</Type>
  21887. <Comment>s. also Mozilla/5.0 (compatible; Yoono; http://www.yoono.com/) - yoono/1.0 web-crawler ..</Comment>
  21888. <Link1>http://www.yoono.com/</Link1>
  21889. <Link2></Link2>
  21890. </user-agent>
  21891. <user-agent>
  21892. <ID>id_t_z_210106_3</ID>
  21893. <String>yoogliFetchAgent/0.1</String>
  21894. <Description>Yoogli search (under development) agent</Description>
  21895. <Type>R</Type>
  21896. <Comment></Comment>
  21897. <Link1>http://www.yoogli.com/</Link1>
  21898. <Link2></Link2>
  21899. </user-agent>
  21900. <user-agent>
  21901. <ID>id_t_z_120606_1</ID>
  21902. <String>yoono/1.0 web-crawler/1.0</String>
  21903. <Description>Yoono - community based search (193.110.140.xxx / 194.0.179.[x]xx)</Description>
  21904. <Type>R</Type>
  21905. <Comment>s. also Mozilla/5.0 (compatible; Yoono; http://www.yoono.com/) - yoofind/yoofind ..</Comment>
  21906. <Link1>http://www.yoono.com/</Link1>
  21907. <Link2></Link2>
  21908. </user-agent>
  21909. <user-agent>
  21910. <ID>id_t_z_1533</ID>
  21911. <String>YottaCars_Bot/4.12 (+http://www.yottacars.com) Car Search Engine </String>
  21912. <Description>YottaCars bot - YottaCar car search engine ( 64.62.175.xxx)</Description>
  21913. <Type>R</Type>
  21914. <Comment>s. also OmniExplorer_Bot</Comment>
  21915. <Link1>http://www.yottacars.com/</Link1>
  21916. <Link2></Link2>
  21917. </user-agent>
  21918. <user-agent>
  21919. <ID>id_t_z_1534</ID>
  21920. <String>YottaShopping_Bot/4.12 (+http://www.yottashopping.com) Shopping Search Engine</String>
  21921. <Description>YottaShopping bot - YottaShopping search engine ( 64.62.175.xxx) </Description>
  21922. <Type>R</Type>
  21923. <Comment>s. also OmniExplorer_Bot</Comment>
  21924. <Link1>http://www.yottashopping.com/</Link1>
  21925. <Link2></Link2>
  21926. </user-agent>
  21927. <user-agent>
  21928. <ID>id_t_z_1535</ID>
  21929. <String>YTunnelPro</String>
  21930. <Description>Y!TunnelPro - Yahoo! Messenger companion user agent</Description>
  21931. <Type>B</Type>
  21932. <Comment>s. Y!TunnelPro</Comment>
  21933. <Link1>http://www.ytunnelpro.com/</Link1>
  21934. <Link2></Link2>
  21935. </user-agent>
  21936. <user-agent>
  21937. <ID>id_t_z_1536</ID>
  21938. <String>Z-Add Link Checker (http://w3.z-add.co.uk/linkcheck/)</String>
  21939. <Description>Z-Add online link checker</Description>
  21940. <Type>C</Type>
  21941. <Comment></Comment>
  21942. <Link1>http://w3.z-add.co.uk/linkcheck/</Link1>
  21943. <Link2></Link2>
  21944. </user-agent>
  21945. <user-agent>
  21946. <ID>id_t_z_1537</ID>
  21947. <String>Zao-Crawler</String>
  21948. <Description>Zao crawler for Kototoi Project</Description>
  21949. <Type>R</Type>
  21950. <Comment></Comment>
  21951. <Link1>http://www.kototoi.org/zao/</Link1>
  21952. <Link2></Link2>
  21953. </user-agent>
  21954. <user-agent>
  21955. <ID>id_t_z_1538</ID>
  21956. <String>Zao-Crawler 0.2b</String>
  21957. <Description>Zao crawler for Kototoi Project</Description>
  21958. <Type>R</Type>
  21959. <Comment></Comment>
  21960. <Link1>http://www.kototoi.org/zao/</Link1>
  21961. <Link2></Link2>
  21962. </user-agent>
  21963. <user-agent>
  21964. <ID>id_t_z_1539</ID>
  21965. <String>Zao/0.1 (http://www.kototoi.org/zao/)</String>
  21966. <Description>Zao crawler for Kototoi Project</Description>
  21967. <Type>R</Type>
  21968. <Comment></Comment>
  21969. <Link1>http://www.kototoi.org/zao/</Link1>
  21970. <Link2></Link2>
  21971. </user-agent>
  21972. <user-agent>
  21973. <ID>id_t_z_1540</ID>
  21974. <String>ZBot/1.00 (icaulfield@zeus.com)</String>
  21975. <Description>Zeus Internet Marketing Robot based on Webster Pro component</Description>
  21976. <Type>R</Type>
  21977. <Comment></Comment>
  21978. <Link1>http://cyber-robotics.com/</Link1>
  21979. <Link2>http://www.homepagesw.com/</Link2>
  21980. </user-agent>
  21981. <user-agent>
  21982. <ID>id_t_z_111205_5</ID>
  21983. <String>Zearchit</String>
  21984. <Description>Zearchit German search / directory</Description>
  21985. <Type>R</Type>
  21986. <Comment>212.227.109.1xx</Comment>
  21987. <Link1>http://www.zearchit.de/</Link1>
  21988. <Link2></Link2>
  21989. </user-agent>
  21990. <user-agent>
  21991. <ID>id_t_z_130106_2</ID>
  21992. <String>ZeBot_lseek.net (bot@ze.bz)</String>
  21993. <Description>Ze.bz Moteur de Recherche robot</Description>
  21994. <Type>R</Type>
  21995. <Comment>213.251.135.xx</Comment>
  21996. <Link1>http://www.ze.bz/</Link1>
  21997. <Link2></Link2>
  21998. </user-agent>
  21999. <user-agent>
  22000. <ID>id_t_z_1541</ID>
  22001. <String>ZeBot_www.ze.bz (ze.bz@hotmail.com)</String>
  22002. <Description>Ze.bz Moteur de Recherche robot</Description>
  22003. <Type>R</Type>
  22004. <Comment>213.251.135.xx</Comment>
  22005. <Link1>http://www.ze.bz/</Link1>
  22006. <Link2></Link2>
  22007. </user-agent>
  22008. <user-agent>
  22009. <ID>id_t_z_130806_2</ID>
  22010. <String>zedzo.digest/0.1 (http://www.zedzo.com/)</String>
  22011. <Description>ZedZo Search (beta) robot</Description>
  22012. <Type>R</Type>
  22013. <Comment>24.62.50.1xx</Comment>
  22014. <Link1>http://www.zedzo.com/</Link1>
  22015. <Link2></Link2>
  22016. </user-agent>
  22017. <user-agent>
  22018. <ID>id_t_z_210807_2</ID>
  22019. <String>Zend_Http_Client</String>
  22020. <Description>Zend PHP frameworks Zend_Http_Client component</Description>
  22021. <Type>D</Type>
  22022. <Comment></Comment>
  22023. <Link1>http://framework.zend.com/manual/en/zend.http.html</Link1>
  22024. <Link2></Link2>
  22025. </user-agent>
  22026. <user-agent>
  22027. <ID>id_t_z_290208_2</ID>
  22028. <String>zermelo Mozilla/5.0 compatible; heritrix/1.12.1 (+http://www.powerset.com) [email:crawl@powerset.com&#44;email:paul@page-store.com]</String>
  22029. <Description>Powerset Natural Language Search crawler (under development) using Heritrix via Amazon Web Services</Description>
  22030. <Type>R</Type>
  22031. <Comment>67.202.34.xxx</Comment>
  22032. <Link1>http://www.powerset.com/</Link1>
  22033. <Link2>http://www.amazon.com/gp/browse.html?node=3435361</Link2>
  22034. </user-agent>
  22035. <user-agent>
  22036. <ID>id_t_z_1542</ID>
  22037. <String>zerxbot/Version 0.6 libwww-perl/5.79</String>
  22038. <Description>Zerx search robot ?</Description>
  22039. <Type>R</Type>
  22040. <Comment>138.88.147.xxx</Comment>
  22041. <Link1>http://www.zerx.com/</Link1>
  22042. <Link2></Link2>
  22043. </user-agent>
  22044. <user-agent>
  22045. <ID>id_t_z_1543</ID>
  22046. <String>Zeus ThemeSite Viewer Webster Pro V2.9 Win32</String>
  22047. <Description>Zeus Internet Marketing Robot (based on Webster Pro)</Description>
  22048. <Type>R</Type>
  22049. <Comment></Comment>
  22050. <Link1>http://cyber-robotics.com/</Link1>
  22051. <Link2></Link2>
  22052. </user-agent>
  22053. <user-agent>
  22054. <ID>id_t_z_1544</ID>
  22055. <String>Zeus xxxxx Webster Pro V2.9 Win32</String>
  22056. <Description>Zeus Internet Marketing Robot (based on Webster Pro)</Description>
  22057. <Type>R</Type>
  22058. <Comment></Comment>
  22059. <Link1>http://cyber-robotics.com/</Link1>
  22060. <Link2></Link2>
  22061. </user-agent>
  22062. <user-agent>
  22063. <ID>id_t_z_281105_1</ID>
  22064. <String>Zeusbot/0.07 (Ulysseek's web-crawling robot; http://www.zeusbot.com; agent@zeusbot.com)</String>
  22065. <Description>Zeusbot robot for building the Ulysseek.com index</Description>
  22066. <Type>R</Type>
  22067. <Comment>powered by Nutch</Comment>
  22068. <Link1>http://www.zeusbot.com/</Link1>
  22069. <Link2>http://www.ulysseek.com/</Link2>
  22070. </user-agent>
  22071. <user-agent>
  22072. <ID>id_t_z_1545</ID>
  22073. <String>Ziggy -- The Clown From Hell!!</String>
  22074. <Description>Unknown agent (server- or link checking ?) from 198.173.158.xx</Description>
  22075. <Type>C</Type>
  22076. <Comment></Comment>
  22077. <Link1></Link1>
  22078. <Link2></Link2>
  22079. </user-agent>
  22080. <user-agent>
  22081. <ID>id_t_z_1546</ID>
  22082. <String>ZipppBot/0.xx (ZipppBot; http://www.zippp.net; webmaster@zippp.net)</String>
  22083. <Description>Zippp.net web search robot</Description>
  22084. <Type>R</Type>
  22085. <Comment></Comment>
  22086. <Link1>http://www.zippp.net/</Link1>
  22087. <Link2></Link2>
  22088. </user-agent>
  22089. <user-agent>
  22090. <ID>id_t_z_1547</ID>
  22091. <String>ZIPPPCVS/0.xx (ZipppBot/.xx;http://www.zippp.net; webmaster@zippp.net)</String>
  22092. <Description>Zippp.net web search robot</Description>
  22093. <Type>R</Type>
  22094. <Comment></Comment>
  22095. <Link1>http://www.zippp.net/</Link1>
  22096. <Link2></Link2>
  22097. </user-agent>
  22098. <user-agent>
  22099. <ID>id_t_z_1548</ID>
  22100. <String>Zippy v2.0 - Zippyfinder.com</String>
  22101. <Description>Zippyfinder robot</Description>
  22102. <Type>R</Type>
  22103. <Comment></Comment>
  22104. <Link1>http://www.zippyfinder.com/</Link1>
  22105. <Link2></Link2>
  22106. </user-agent>
  22107. <user-agent>
  22108. <ID>id_t_z_1549</ID>
  22109. <String>Zoo Tycoon 2 Client -- http://www.zootycoon.com</String>
  22110. <Description>Microsoft Zoo Tycoon 2 game client</Description>
  22111. <Type>B</Type>
  22112. <Comment></Comment>
  22113. <Link1>http://www.zootycoon.com</Link1>
  22114. <Link2></Link2>
  22115. </user-agent>
  22116. <user-agent>
  22117. <ID>id_t_z_1550</ID>
  22118. <String>ZoomSpider - wrensoft.com</String>
  22119. <Description>Zoom Search Engine software spider</Description>
  22120. <Type>R</Type>
  22121. <Comment></Comment>
  22122. <Link1>http://www.wrensoft.com/</Link1>
  22123. <Link2></Link2>
  22124. </user-agent>
  22125. <user-agent>
  22126. <ID>id_new_160110_1</ID>
  22127. <String>Zscho.de Crawler/Nutch-1.0-Zscho.de-semantic_patch (Zscho.de Crawler&#44; collecting for machine learning; http://zscho.de/ )</String>
  22128. <Description>Zscho search crawler (Germany)</Description>
  22129. <Type>R</Type>
  22130. <Comment>141.65.161.xx</Comment>
  22131. <Link1>http://www.zscho.de/</Link1>
  22132. <Link2></Link2>
  22133. </user-agent>
  22134. <user-agent>
  22135. <ID>id_t_z_280306_1</ID>
  22136. <String>zspider/0.9-dev http://feedback.redkolibri.com/</String>
  22137. <Description>zspider robot for a new search engine</Description>
  22138. <Type>R</Type>
  22139. <Comment></Comment>
  22140. <Link1>http://feedback.redkolibri.com/</Link1>
  22141. <Link2></Link2>
  22142. </user-agent>
  22143. <user-agent>
  22144. <ID>id_t_z_1551</ID>
  22145. <String>ZyBorg/1.0 (ZyBorg@WISEnut.com; http://www.WISEnut.com)</String>
  22146. <Description>Wisenut robot</Description>
  22147. <Type>R</Type>
  22148. <Comment></Comment>
  22149. <Link1>http://www.wisenutbot.com/</Link1>
  22150. <Link2></Link2>
  22151. </user-agent>
  22152. </user-agents>
  22153.