mirror of
https://github.com/ai-robots-txt/ai.robots.txt.git
synced 2025-10-05 23:52:38 +02:00
Update from Dark Visitors
This commit is contained in:
36
robots.json
36
robots.json
@@ -1,4 +1,11 @@
|
||||
{
|
||||
"AddSearchBot": {
|
||||
"operator": "Unclear at this time.",
|
||||
"respect": "Unclear at this time.",
|
||||
"function": "AI Search Crawlers",
|
||||
"frequency": "Unclear at this time.",
|
||||
"description": "AddSearchBot is a web crawler that indexes website content for AddSearch's AI-powered site search solution, collecting data to provide fast and accurate search results. More info can be found at https://darkvisitors.com/agents/agents/addsearchbot"
|
||||
},
|
||||
"AI2Bot": {
|
||||
"operator": "[Ai2](https://allenai.org/crawler)",
|
||||
"respect": "Yes",
|
||||
@@ -69,6 +76,13 @@
|
||||
"frequency": "Unclear at this time.",
|
||||
"description": "Connects to and crawls URLs that have been selected for use in a user's AWS bedrock application."
|
||||
},
|
||||
"bigsur.ai": {
|
||||
"operator": "Big Sur AI that fetches website content to enable AI-powered web agents, sales assistants, and content marketing solutions for businesses",
|
||||
"respect": "Unclear at this time.",
|
||||
"function": "AI Assistants",
|
||||
"frequency": "Unclear at this time.",
|
||||
"description": "bigsur.ai is a web crawler operated by Big Sur AI that fetches website content to enable AI-powered web agents, sales assistants, and content marketing solutions for businesses. More info can be found at https://darkvisitors.com/agents/agents/bigsur-ai"
|
||||
},
|
||||
"Brightbot 1.0": {
|
||||
"operator": "Browsing.ai",
|
||||
"respect": "Unclear at this time.",
|
||||
@@ -132,6 +146,13 @@
|
||||
"frequency": "No information provided.",
|
||||
"description": "Scrapes data to train LLMs and AI products offered by Anthropic."
|
||||
},
|
||||
"CloudVertexBot": {
|
||||
"operator": "Unclear at this time.",
|
||||
"respect": "Unclear at this time.",
|
||||
"function": "AI Data Scrapers",
|
||||
"frequency": "Unclear at this time.",
|
||||
"description": "CloudVertexBot is a Google-operated crawler available to site owners to request targeted crawls of their own sites for AI training purposes on the Vertex AI platform. More info can be found at https://darkvisitors.com/agents/agents/cloudvertexbot"
|
||||
},
|
||||
"cohere-ai": {
|
||||
"operator": "[Cohere](https://cohere.com)",
|
||||
"respect": "Unclear at this time.",
|
||||
@@ -266,11 +287,11 @@
|
||||
"description": "GoogleAgent-Mariner is an AI agent created by Google that can use a web browser. It can intelligently navigate and interact with websites to complete multi-step tasks on behalf of a human user. More info can be found at https://darkvisitors.com/agents/agents/googleagent-mariner"
|
||||
},
|
||||
"GoogleOther": {
|
||||
"description": "\"Used by various product teams for fetching publicly accessible content from sites. For example, it may be used for one-off crawls for internal research and development.\"",
|
||||
"frequency": "No information.",
|
||||
"function": "Scrapes data.",
|
||||
"operator": "Google",
|
||||
"respect": "[Yes](https://developers.google.com/search/docs/crawling-indexing/overview-google-crawlers)"
|
||||
"respect": "[Yes](https://developers.google.com/search/docs/crawling-indexing/overview-google-crawlers)",
|
||||
"function": "Scrapes data.",
|
||||
"frequency": "No information.",
|
||||
"description": "\"Used by various product teams for fetching publicly accessible content from sites. For example, it may be used for one-off crawls for internal research and development.\""
|
||||
},
|
||||
"GoogleOther-Image": {
|
||||
"description": "\"Used by various product teams for fetching publicly accessible content from sites. For example, it may be used for one-off crawls for internal research and development.\"",
|
||||
@@ -335,6 +356,13 @@
|
||||
"frequency": "Unclear at this time.",
|
||||
"description": "Kangaroo Bot is used by the company Kangaroo LLM to download data to train AI models tailored to Australian language and culture. More info can be found at https://darkvisitors.com/agents/agents/kangaroo-bot"
|
||||
},
|
||||
"LinerBot": {
|
||||
"operator": "Unclear at this time.",
|
||||
"respect": "Unclear at this time.",
|
||||
"function": "AI Assistants",
|
||||
"frequency": "Unclear at this time.",
|
||||
"description": "LinerBot is the web crawler used by Liner AI assistant to gather information from academic sources and websites to provide accurate answers with line-by-line source citations for research and scholarly work. More info can be found at https://darkvisitors.com/agents/agents/linerbot"
|
||||
},
|
||||
"meta-externalagent": {
|
||||
"operator": "[Meta](https://developers.facebook.com/docs/sharing/webmasters/web-crawlers)",
|
||||
"respect": "Yes",
|
||||
|
Reference in New Issue
Block a user