{"data":{"slug":"gpt-bot","term":"GPTBot","bucket":"distribution","definition":"OpenAI's web crawler. ScienceToStartup explicitly allows GPTBot on the public corpus via /robots.txt.","short_definition":"OpenAI's web crawler. ScienceToStartup explicitly allows GPTBot on the public corpus via /robots.txt.","long_definition":"GPTBot is OpenAI's training-and-search crawler. ScienceToStartup explicitly allows it on the public corpus via /robots.txt, alongside ClaudeBot, PerplexityBot, and Google-Extended. We treat Answer Engines as first-class distribution and publish llms.txt, capabilities.json, and DefinedTermSet specifically for them to lift.","related_terms":["claude-bot","perplexity-bot","llms-txt"],"related_term_routes":[{"slug":"claude-bot","term":"ClaudeBot","route":"/resources/glossary/claude-bot"},{"slug":"perplexity-bot","term":"PerplexityBot","route":"/resources/glossary/perplexity-bot"},{"slug":"llms-txt","term":"llms.txt","route":"/resources/glossary/llms-txt"}],"canonical_route":"/resources/glossary/gpt-bot","api_route":"/api/v1/resources/glossary/gpt-bot","jsonld_id":"https://sciencetostartup.com/resources/glossary/gpt-bot","variants":[],"tldr":"OpenAI's web crawler. ScienceToStartup explicitly allows GPTBot on the public corpus via /robots.txt.","key_points":[],"quality_tier":null,"citation_count":null,"source_state":"curated_static","source_module":"apps/web/data/glossary/terms.ts","definition_sections":{"schema_version":1,"intro":"GPTBot is OpenAI's training-and-search crawler. ScienceToStartup explicitly allows it on the public corpus via /robots.txt, alongside ClaudeBot, PerplexityBot, and Google-Extended. We treat Answer Engines as first-class distribution and publish llms.txt, capabilities.json, and DefinedTermSet specifically for them to lift.","sections":[{"title":"Definition","items":[{"subtitle":"GPTBot","text":"GPTBot is OpenAI's training-and-search crawler. ScienceToStartup explicitly allows it on the public corpus via /robots.txt, alongside ClaudeBot, PerplexityBot, and Google-Extended. We treat Answer Engines as first-class distribution and publish llms.txt, capabilities.json, and DefinedTermSet specifically for them to lift."}]},{"title":"Related vocabulary","items":[{"subtitle":"ClaudeBot","text":"Anthropic's web crawler. Explicitly allowed on /robots.txt for the ScienceToStartup public corpus."},{"subtitle":"PerplexityBot","text":"Perplexity's web crawler. Explicitly allowed on /robots.txt and a primary target for AEO Answer Cards."},{"subtitle":"llms.txt","text":"The agent-discovery file at /llms.txt. Concise plain-text inventory plus inlined Glossary, FAQ, Capabilities, and Deprecations."}]}],"cited_arxiv_ids":[]}},"meta":{"canonical_route":"/resources/glossary/gpt-bot","api_route":"/api/v1/resources/glossary/gpt-bot","source":{"label":"curated glossary catalog","source_state":"curated_static","source_module":"apps/web/data/glossary/terms.ts","method_version":"public_glossary_curated_terms_v2","freshness":{"status":"versioned","observed_at":null,"fresh_until":null,"reason":"Git-versioned curated catalog; daily ingestion freshness windows do not apply.","reason_code":"git_versioned_curated_catalog"},"source_count":111,"bucket_count":7,"buckets":["scoring","surfaces","agents","distribution","data","foresight","buildability"]}}}