# File size: 3,534 Bytes
# 03c0888
# Site identity and source-repository links.
site_name: Crawl4AI Documentation
# Single-quoted so the leading emoji, the comma and the ampersand are always
# read as one literal string, whatever parser loads this file.
site_description: '🔥🕷️ Crawl4AI, Open-source LLM Friendly Web Crawler & Scraper'
site_url: https://docs.crawl4ai.com
repo_url: https://github.com/unclecode/crawl4ai
repo_name: unclecode/crawl4ai
# Markdown sources are read from this directory.
docs_dir: docs/md_v3


# Navigation tree. Each entry maps a displayed title to a Markdown file;
# top-level entries other than Home are sections grouping related pages.
nav:
  - Home: index.md

  # Step-by-step introductions.
  - Tutorials:
    - 'Getting Started': tutorials/getting-started.md
    - 'AsyncWebCrawler Basics': tutorials/async-webcrawler-basics.md
    - 'Targeted Crawling Techniques': tutorials/targeted-crawling.md
    - 'Link & Media Analysis': tutorials/link-media-analysis.md
    - 'Advanced Features (Proxy, PDF, Screenshots)': tutorials/advanced-features.md
    - 'Hooks & Custom Code': tutorials/hooks-custom.md
    - 'Markdown Generation Basics': tutorials/markdown-basics.md
    - 'Extracting JSON (No LLM)': tutorials/json-extraction-basic.md
    - 'Extracting JSON (LLM)': tutorials/json-extraction-llm.md
    - 'Deploying with Docker (Quickstart)': tutorials/docker-quickstart.md

  # Task-oriented guides.
  - How-To Guides:
    - 'Advanced Browser Configuration': how-to/advanced-browser-config.md
    - 'Managing Browser Contexts & Remote Browsers': how-to/browser-contexts-remote.md
    - 'Identity-Based Crawling (Anti-Bot)': how-to/identity-anti-bot.md
    - 'Link & Media Analysis': how-to/link-media-analysis.md
    - 'Markdown Generation Customization': how-to/markdown-custom.md
    - 'Structured Data Extraction (Advanced)': how-to/structured-data-advanced.md
    - 'Deployment Options': how-to/deployment-options.md
    - 'Performance & Caching': how-to/performance-caching.md

  # Background and design discussions.
  - Explanations:
    - 'AsyncWebCrawler & Internal Flow': explanations/async-webcrawler-flow.md
    - 'Configuration Objects Explained': explanations/configuration-objects.md
    - 'Browser Context & Managed Browser': explanations/browser-management.md
    - 'Markdown Generation Architecture': explanations/markdown-architecture.md
    - 'Extraction & Chunking Strategies': explanations/extraction-chunking.md
    - 'Identity-Based Crawling & Anti-Bot': explanations/identity-anti-bot.md
    - 'Deployment Architectures': explanations/deployment-architectures.md

  # Reference pages.
  - Reference:
    - 'Configuration': reference/configuration.md
    - 'Core Crawler': reference/core-crawler.md
    - 'Browser Strategies': reference/browser-strategies.md
    - 'Markdown Generation': reference/markdown-generation.md
    - 'Content Filters': reference/content-filters.md
    - 'Extraction Strategies': reference/extraction-strategies.md
    - 'Chunking Strategies': reference/chunking-strategies.md
    - 'Identity & Utility': reference/identity-utilities.md
    - 'Models': reference/models.md

  - Blog:
    - 'Blog Overview': blog/index.md
    # Placeholder for future real-world application posts, for example:
    # - 'Cool Real-World E-Commerce Scraping': blog/ecommerce-case-study.md
    # - 'Dealing with Complex Anti-Bot Systems': blog/anti-bot-tricks.md


# Site theme selection.
# NOTE(review): `terminal` is presumably provided by a separately installed
# theme package rather than MkDocs itself — confirm it is listed in the docs
# build dependencies.
theme:
  name: terminal
  # Palette name passed to the theme.
  palette: dark

# MkDocs plugins enabled for this site: search and mkdocstrings.
plugins:
  - search
  - mkdocstrings:
      handlers:
        python:
          # NOTE(review): the `analysis` / `rendering` layout looks like a
          # legacy mkdocstrings schema; newer Python-handler releases appear
          # to expect these settings under a single `options:` key, and
          # `follow_imports` may not be a recognised option. Verify against
          # the installed mkdocstrings version before relying on either.
          analysis:
            follow_imports: true
          rendering:
            show_root_full_path: false

# Python-Markdown extensions applied when rendering pages.
markdown_extensions:
  # NOTE(review): `codehilite` and `pymdownx.highlight` (below) are both
  # enabled and both target code-block highlighting — confirm that both are
  # needed, since they may overlap.
  - codehilite
  - toc:
      # Adds a permalink anchor to each heading.
      permalink: true
  - pymdownx.highlight:
      anchor_linenums: true
  - pymdownx.inlinehilite
  - pymdownx.snippets
  - pymdownx.superfences
  - admonition
  - pymdownx.details
  - attr_list
  # NOTE(review): `tables` is believed to be enabled by MkDocs by default, so
  # this entry is likely redundant but harmless — TODO confirm.
  - tables

# Additional stylesheets included on the site, in the order listed.
# NOTE(review): paths are presumably resolved relative to `docs_dir`
# (docs/md_v3) — confirm the files exist under its assets/ folder.
extra_css:
  - assets/styles.css
  - assets/highlight.css
  - assets/dmvendor.css

# Additional scripts included on the site, in the order listed.
# The highlight library is listed before its init script; presumably the
# init script depends on it, so keep this order.
extra_javascript:
  - assets/highlight.min.js
  - assets/highlight_init.js