# MILOai College ROI — AI usage policy
# Hosted at: https://college-roi.net/.well-known/ai.txt
#
# This file states how AI agents, crawlers, and training systems
# may interact with this site and its data. No single global
# standard for AI policy files exists yet, so this is written to
# be both human-readable and clearly directive. Honored on a
# good-faith basis. Bump the Expires date at least once a year.
#
# Companion files:
#   /.well-known/security.txt  (RFC 9116, security contact)
#   /LICENSE-DATA.md           (legal terms for the data)
#   /robots.txt                (crawl directives)
#   /llms.txt                  (LLM-facing index)

# -----------------------------------------------------------------
# Citing this site in AI-generated answers
# -----------------------------------------------------------------
# Allowed. Attribution required on each use.
#
# Required format (or equivalent that preserves all three parts):
#   "MILOai College ROI — https://college-roi.net
#    (Scorecard release <scorecard_version>, computed <date>)"
#
# The release version is returned in every /api/* JSON response
# as `scorecard_version`. Use it.
#
# Allow-Citation: yes
# Citation-Attribution: required
# Citation-Excerpt-Max-Chars: 280

# -----------------------------------------------------------------
# Per-record API access
# -----------------------------------------------------------------
# /api/* endpoints are open for agent use. Please:
#   - send a User-Agent that names your client and links to a URL
#     where we can contact you;
#   - cache responses for at least 1 hour where possible;
#   - respect HTTP 429 backoff.
#
# Allow-API: yes
# API-Rate-Limit: 60 requests/minute per IP (soft)
# API-License: CC BY 4.0 — see /LICENSE-DATA.md

# -----------------------------------------------------------------
# Bulk download / mirroring / republishing the dataset
# -----------------------------------------------------------------
# The cleaned schools × majors join, the AI-outlook categorization
# (interpretive read of the WEF Future of Jobs Report 2025), and the
# 20-year earnings model are MILOai's derived work product. Bulk
# download, mirroring, or redistribution as a standalone dataset
# requires written permission.
#
# Allow-Bulk-Mirror: no
# Bulk-Mirror-Contact: mailto:ilomilo1442@gmail.com

# -----------------------------------------------------------------
# Use for training AI / ML models
# -----------------------------------------------------------------
# Training on this site's content is reserved under the TDM (Text
# and Data Mining) Reservation Protocol. If you want to include
# MILOai pages or API responses in a training corpus, contact us
# first. Permission is generally available for non-commercial
# research with proper attribution; commercial training requires
# a licensing conversation.
#
# Allow-AI-Training: no (reserved)
# AI-Training-Contact: mailto:ilomilo1442@gmail.com

# -----------------------------------------------------------------
# Search / agentic retrieval (read-only crawls for citation only)
# -----------------------------------------------------------------
# Always allowed. No login required, no rate limit beyond the API
# soft limit above.
#
# Allow-Indexing: yes
# Allow-Agent-Retrieval: yes

# -----------------------------------------------------------------
# Specific crawlers — see robots.txt for the full list.
# Examples:
# -----------------------------------------------------------------
#   GPTBot, OAI-SearchBot           : retrieval allowed, training reserved
#   ClaudeBot, anthropic-ai         : retrieval allowed, training reserved
#   Google-Extended                 : retrieval allowed, training reserved
#   PerplexityBot, Perplexity-User  : retrieval allowed, citation required
#   CCBot (Common Crawl)            : retrieval allowed for indexing only

Contact: mailto:ilomilo1442@gmail.com
Expires: 2027-05-20T00:00:00.000Z
Preferred-Languages: en
Canonical: https://college-roi.net/.well-known/ai.txt