<?xml version="1.0" encoding="UTF-8"?>
<!--
  Sitemap for www.contextractor.com in the sitemaps.org 0.9 vocabulary.
  Every <url> entry carries a <loc>; <lastmod> and <priority> are present
  on most entries and simply omitted on the few that do not declare them.
-->
<urlset xmlns="http://www.sitemaps.org/schemas/sitemap/0.9">
  <url>
    <loc>https://www.contextractor.com/</loc>
    <priority>1</priority>
  </url>
  <url>
    <loc>https://www.contextractor.com/press-kit/</loc>
  </url>
  <url>
    <loc>https://www.contextractor.com/about/</loc>
    <lastmod>2025-01-01T00:00:00.000Z</lastmod>
    <priority>0.5</priority>
  </url>
  <url>
    <loc>https://www.contextractor.com/anti-bot-detection/</loc>
    <lastmod>2026-03-23T00:00:00.000Z</lastmod>
    <priority>0.7</priority>
  </url>
  <url>
    <loc>https://www.contextractor.com/apify-actor-pattern/</loc>
    <lastmod>2026-03-24T00:00:00.000Z</lastmod>
    <priority>0.7</priority>
  </url>
  <url>
    <loc>https://www.contextractor.com/content-extraction/</loc>
    <lastmod>2026-03-16T00:00:00.000Z</lastmod>
    <priority>0.8</priority>
  </url>
  <url>
    <loc>https://www.contextractor.com/content-extraction-benchmark/</loc>
    <lastmod>2026-03-25T00:00:00.000Z</lastmod>
    <priority>0.8</priority>
  </url>
  <url>
    <loc>https://www.contextractor.com/content-extraction-for-llms/</loc>
    <lastmod>2026-03-23T00:00:00.000Z</lastmod>
    <priority>0.9</priority>
  </url>
  <url>
    <loc>https://www.contextractor.com/cookie-consent-handling/</loc>
    <lastmod>2026-03-26T00:00:00.000Z</lastmod>
    <priority>0.6</priority>
  </url>
  <url>
    <loc>https://www.contextractor.com/crawlee-contextractor-pipeline/</loc>
    <lastmod>2026-03-24T00:00:00.000Z</lastmod>
    <priority>0.7</priority>
  </url>
  <url>
    <loc>https://www.contextractor.com/extracting-non-article-pages/</loc>
    <lastmod>2026-03-25T00:00:00.000Z</lastmod>
    <priority>0.6</priority>
  </url>
  <url>
    <loc>https://www.contextractor.com/extraction-output-formats/</loc>
    <lastmod>2026-03-26T00:00:00.000Z</lastmod>
    <priority>0.7</priority>
  </url>
  <url>
    <loc>https://www.contextractor.com/extraction-vs-headless-browser/</loc>
    <lastmod>2026-03-23T00:00:00.000Z</lastmod>
    <priority>0.7</priority>
  </url>
  <url>
    <loc>https://www.contextractor.com/firecrawl-vs-contextractor/</loc>
    <lastmod>2026-03-27T00:00:00.000Z</lastmod>
    <priority>0.7</priority>
  </url>
  <url>
    <loc>https://www.contextractor.com/help/</loc>
    <lastmod>2026-03-23T00:00:00.000Z</lastmod>
    <priority>0.5</priority>
  </url>
  <url>
    <loc>https://www.contextractor.com/help/cli/</loc>
    <lastmod>2026-03-26T00:00:00.000Z</lastmod>
    <priority>0.5</priority>
  </url>
  <url>
    <loc>https://www.contextractor.com/help/docker/</loc>
    <lastmod>2026-03-26T00:00:00.000Z</lastmod>
    <priority>0.5</priority>
  </url>
  <url>
    <loc>https://www.contextractor.com/help/web/</loc>
    <lastmod>2026-03-23T00:00:00.000Z</lastmod>
    <priority>0.5</priority>
  </url>
  <url>
    <loc>https://www.contextractor.com/html-to-markdown-for-ai/</loc>
    <lastmod>2026-03-24T00:00:00.000Z</lastmod>
    <priority>0.7</priority>
  </url>
  <url>
    <loc>https://www.contextractor.com/llm-html-preprocessing/</loc>
    <lastmod>2026-03-25T00:00:00.000Z</lastmod>
    <priority>0.8</priority>
  </url>
  <url>
    <loc>https://www.contextractor.com/mcp-web-extraction/</loc>
    <lastmod>2026-03-26T00:00:00.000Z</lastmod>
    <priority>0.7</priority>
  </url>
  <url>
    <loc>https://www.contextractor.com/rag-pipeline-clean-data/</loc>
    <lastmod>2026-03-27T00:00:00.000Z</lastmod>
    <priority>0.8</priority>
  </url>
  <url>
    <loc>https://www.contextractor.com/reduce-llm-token-costs/</loc>
    <lastmod>2026-03-23T00:00:00.000Z</lastmod>
    <priority>0.8</priority>
  </url>
  <url>
    <loc>https://www.contextractor.com/structured-data-extraction/</loc>
    <lastmod>2026-03-24T00:00:00.000Z</lastmod>
    <priority>0.7</priority>
  </url>
  <url>
    <loc>https://www.contextractor.com/trafilatura/</loc>
    <lastmod>2026-03-16T00:00:00.000Z</lastmod>
    <priority>1</priority>
  </url>
  <url>
    <loc>https://www.contextractor.com/trafilatura-vs-jina-readerlm/</loc>
    <lastmod>2026-03-25T00:00:00.000Z</lastmod>
    <priority>0.7</priority>
  </url>
  <url>
    <loc>https://www.contextractor.com/trafilatura-vs-readability-vs-newspaper/</loc>
    <lastmod>2026-03-26T00:00:00.000Z</lastmod>
    <priority>0.7</priority>
  </url>
  <url>
    <loc>https://www.contextractor.com/web-scraping-law/</loc>
    <lastmod>2026-03-27T00:00:00.000Z</lastmod>
    <priority>0.7</priority>
  </url>
  <url>
    <loc>https://www.contextractor.com/web-scraping-stack/</loc>
    <lastmod>2026-03-27T00:00:00.000Z</lastmod>
    <priority>0.8</priority>
  </url>
  <url>
    <loc>https://www.contextractor.com/upload/</loc>
  </url>
</urlset>
