# MkDocs-style site configuration for the Crawl4AI documentation.

# Site identity and repository links.
site_name: Crawl4AI Documentation
site_description: "🔥🕷️ Crawl4AI, Open-source LLM Friendly Web Crawler & Scraper"
site_url: https://docs.crawl4ai.com
repo_url: https://github.com/unclecode/crawl4ai
repo_name: unclecode/crawl4ai

# Directory holding the Markdown sources; page paths are given relative to it.
docs_dir: docs/md_v3

# Navigation tree. Each top-level entry is either a single page
# (`Title: path`) or a section whose value is a list of `"Title": path` pages.
nav:
  - Home: index.md

  # Step-by-step introductions.
  - Tutorials:
      - "Getting Started": tutorials/getting-started.md
      - "AsyncWebCrawler Basics": tutorials/async-webcrawler-basics.md
      - "Targeted Crawling Techniques": tutorials/targeted-crawling.md
      - "Link & Media Analysis": tutorials/link-media-analysis.md
      - "Advanced Features (Proxy, PDF, Screenshots)": tutorials/advanced-features.md
      - "Hooks & Custom Code": tutorials/hooks-custom.md
      - "Markdown Generation Basics": tutorials/markdown-basics.md
      - "Extracting JSON (No LLM)": tutorials/json-extraction-basic.md
      - "Extracting JSON (LLM)": tutorials/json-extraction-llm.md
      - "Deploying with Docker (Quickstart)": tutorials/docker-quickstart.md

  # Task-oriented guides.
  - How-To Guides:
      - "Advanced Browser Configuration": how-to/advanced-browser-config.md
      - "Managing Browser Contexts & Remote Browsers": how-to/browser-contexts-remote.md
      - "Identity-Based Crawling (Anti-Bot)": how-to/identity-anti-bot.md
      - "Link & Media Analysis": how-to/link-media-analysis.md
      - "Markdown Generation Customization": how-to/markdown-custom.md
      - "Structured Data Extraction (Advanced)": how-to/structured-data-advanced.md
      - "Deployment Options": how-to/deployment-options.md
      - "Performance & Caching": how-to/performance-caching.md

  # Background and architecture write-ups.
  - Explanations:
      - "AsyncWebCrawler & Internal Flow": explanations/async-webcrawler-flow.md
      - "Configuration Objects Explained": explanations/configuration-objects.md
      - "Browser Context & Managed Browser": explanations/browser-management.md
      - "Markdown Generation Architecture": explanations/markdown-architecture.md
      - "Extraction & Chunking Strategies": explanations/extraction-chunking.md
      - "Identity-Based Crawling & Anti-Bot": explanations/identity-anti-bot.md
      - "Deployment Architectures": explanations/deployment-architectures.md

  # Reference pages, one per component area.
  - Reference:
      - "Configuration": reference/configuration.md
      - "Core Crawler": reference/core-crawler.md
      - "Browser Strategies": reference/browser-strategies.md
      - "Markdown Generation": reference/markdown-generation.md
      - "Content Filters": reference/content-filters.md
      - "Extraction Strategies": reference/extraction-strategies.md
      - "Chunking Strategies": reference/chunking-strategies.md
      - "Identity & Utility": reference/identity-utilities.md
      - "Models": reference/models.md

  - Blog:
      - "Blog Overview": blog/index.md

# Theme selection and its colour palette option.
theme:
  name: terminal
  palette: dark

# Build plugins: site search plus mkdocstrings with its Python handler.
plugins:
  - search
  - mkdocstrings:
      handlers:
        python:
          # NOTE(review): the nesting of `analysis` and `rendering` under the
          # python handler is reconstructed from key order; confirm these
          # option groups against the installed mkdocstrings version.
          analysis:
            follow_imports: true
          rendering:
            show_root_full_path: false

# Markdown extensions. Entries with a trailing colon carry per-extension
# options; bare entries are enabled with their defaults.
markdown_extensions:
  # NOTE(review): `codehilite` and `pymdownx.highlight` are both enabled and
  # appear to overlap in purpose — confirm both are required.
  - codehilite
  - toc:
      permalink: true
  - pymdownx.highlight:
      anchor_linenums: true
  - pymdownx.inlinehilite
  - pymdownx.snippets
  - pymdownx.superfences
  - admonition
  - pymdownx.details
  - attr_list
  - tables

# Additional stylesheets, listed in the order given here.
extra_css:
  - assets/styles.css
  - assets/highlight.css
  - assets/dmvendor.css

# Additional scripts; the highlight library is listed before its init script.
extra_javascript:
  - assets/highlight.min.js
  - assets/highlight_init.js