# llms.txt for sintemar.com (SINTEMAR)
# Last-Updated: 2025-09-22
# Contact: sintemar@sintemar.com
# Website: https://www.sintemar.com/es
# Scope: Applies to all subdomains unless otherwise stated
#
# Overview
#
# This file communicates the site's preferences to AI agents, crawlers, and LLM providers.
# It complements robots.txt but is specifically tailored for AI training and inference usage.
# AI providers should respect these directives for crawling, storage, training, and output controls.

[policy]
version = 1
preferred_crawl_rate = weekly
allowed_user_agents = *

#
# Crawl Directives
#
# Allow essential pages for discovery and indexing while restricting bulk scraping of dynamic listings.
# Each path pattern is written as its own `path` key, one per line.
# NOTE(review): repeated `path` keys only work if the consumer collects duplicates
# (strict INI parsers reject them or keep a single value) - confirm against the reader.

[allow]
# Public informational pages
path = /
path = /es
path = /en
path = /es/*
path = /en/*

[disallow]
# Avoid high-churn and bulk endpoints
path = /api/*
path = /search*
path = /*?*
path = /es/search/node
path = /es/search/node/*
path = /en/search/node
path = /en/search/node/*

#
# Training and Storage
#
# Permit non-commercial indexing/summarization. Require opt-in for commercial training or dataset storage.
[usage]
# Non-commercial research and summarization allowed with attribution link to canonical URL
non_commercial = allow
# Commercial model training, dataset building, and long-term storage require prior written consent.
# They are therefore disallowed by default; request consent via the address in [contact].
commercial_training = disallow
commercial_storage = disallow

#
# Attribution
#

[attribution]
required = true
# NOTE(review): the surrounding double quotes may be kept literally by some INI parsers - confirm against the reader.
format = "Source: SINTEMAR (sintemar.com)"
link_canonical = true

#
# Derivative Content Controls
#

[derivatives]
# Do not create synthetic impersonations, logos, or brand voice mimicking
brand_impersonation = disallow
# Allow factual summaries and quotations within fair-use limits
summaries = allow
quotes = allow

#
# Rate Limits (advisory)
#

[rates]
max_requests_per_minute = 10
max_concurrent_requests = 2

#
# Data Retention (advisory)
#

[retention]
# Cache text for up to 30 days for indexing purposes only
cache_ttl_days = 30

#
# Contact and Appeals
#

[contact]
email = sintemar@sintemar.com
policy_updates = https://www.sintemar.com/es