<!DOCTYPE html>
<html lang="en" class="h-100">

<head>
    <!-- Encoding and viewport are declared first so the parser knows them before any other head content -->
    <meta charset="UTF-8">
    <meta name="viewport" content="width=device-width, initial-scale=1.0">
    <!-- Google tag (gtag.js): a single loader script serves both config calls below -->
    <script async src="https://www.googletagmanager.com/gtag/js?id=AW-17827106252"></script>
    <script>
      window.dataLayer = window.dataLayer || [];
      function gtag(){dataLayer.push(arguments);}
      gtag('js', new Date());
      gtag('config', 'G-VLXKC92TDR'); // Google Analytics
      gtag('config', 'AW-17827106252'); // Google Ads
    </script>
    <!-- End Google tag (gtag.js) -->
    <meta name="author" content="Web Data Source">
    <meta name="robots" content="index, follow">
    <title>WDS | Home</title>
    <meta name="description" content="Boost your databases and AI agents with a pluggable web crawler. Web Data Source seamlessly integrates real-time insights from Intranet/Internet into your queries and agentic AI workflows">
    <!-- Each keyword is listed once; the previous list repeated every entry twice -->
    <meta name="keywords" content="Web Data Source, WebDataSource, WDS, Pluggable Web Crawler, Databases, AI agents, Agentic AI, Web Crawler, Data Extraction, Intranet Crawler, Internet Data Gathering, Air-Gapped">

<!-- Open Graph metadata: og:type, og:title, og:image and og:url are the four required properties -->
<meta property="og:type" content="website">
<meta property="og:title" content="Web Data Source: Pluggable Web Crawler for Databases and AI Agents">
<meta property="og:description" content="Boost your databases and AI agents with a pluggable web crawler. Web Data Source seamlessly integrates real-time insights from Intranet/Internet into your queries and agentic AI workflows">
<!-- NOTE(review): og:image is an SVG served from the non-www host while og:url uses www; confirm that preview consumers accept both -->
<meta property="og:image" content="https://webdatasource.com/assets/img/logo.svg">
<meta property="og:url" content="https://www.webdatasource.com/">

<!-- Structured data: schema.org Organization record for this site -->
<script type="application/ld+json">
{
  "@context": "https://schema.org",
  "@type": "Organization",
  "name": "Web Data Source",
  "url": "https://www.webdatasource.com/",
  "logo": "https://webdatasource.com/assets/img/logo.svg",
  "sameAs": [
    "https://github.com/webdatasource",
    "https://www.linkedin.com/company/webdatasource"
  ]
}
</script>

<!-- Canonical URL and favicon -->
<link rel="canonical" href="https://www.webdatasource.com/">
<link rel="icon" href="/assets/img/favicon.svg?fp=rPx-AJ5dorzx622O" type="image/svg+xml" sizes="any">
<!-- Stylesheets, in cascade order: Bootstrap, Bootstrap Icons, highlight.js theme, then site overrides -->
<link rel="stylesheet" href="/assets/css/bootstrap/bootstrap.min.css?fp=djO3wMl9GeaC_u6K">
<link rel="stylesheet" href="/assets/css/bootstrap/bootstrap-icons.min.css?fp=9kPW_n5nn53j4WMR">
<link rel="stylesheet" href="/assets/css/highlight/vs2015.min.css?fp=Pi771--jBrwgeHVY">
<link rel="stylesheet" href="/assets/css/main.css?fp=Ojv6u5K1BUDpq-to">
</head>

<body class="d-flex flex-column h-100 overflow-auto">
    <!-- Navbar: brand link plus a collapsible list of site links (toggled by the button below the lg breakpoint) -->
    <nav class="navbar navbar-expand-lg navbar-dark shadow" style="background-color: var(--bs-secondary);">
        <div class="container">
            <!-- The logo is decorative here because the adjacent text already names the brand, hence the empty alt -->
            <a class="navbar-brand p-0" href="/"><img src="/assets/img/logo.svg?fp=PBADpze7bwWIwSFK" class="me-2" height="35" alt="">Web Data Source</a>
            <button class="navbar-toggler" type="button" data-bs-toggle="collapse" data-bs-target="#navbarNav" aria-controls="navbarNav" aria-expanded="false" aria-label="Toggle navigation">
                <span class="navbar-toggler-icon"></span>
            </button>
            <div class="collapse navbar-collapse justify-content-end" id="navbarNav">
                <ul class="navbar-nav fw-semibold">
                    <li class="nav-item d-flex justify-content-end">
                        <a class="nav-link text-light" href="/releases/index.html">Releases</a>
                    </li>
                    <li class="nav-item d-flex justify-content-end">
                        <a class="nav-link text-light" href="/posts/index.html">Posts</a>
                    </li>
                    <li class="nav-item d-flex justify-content-end">
                        <a class="nav-link text-light" href="/pricing.html">Pricing</a>
                    </li>
                    <li class="nav-item d-flex justify-content-end">
                        <a class="nav-link text-light" href="/contact.html">Contact</a>
                    </li>
                    <li class="nav-item d-flex justify-content-end">
                        <!-- Opens in a new tab; rel="noopener" keeps the new page from reaching window.opener -->
                        <a class="nav-link text-light" href="https://github.com/webdatasource?tab=repositories" target="_blank" rel="noopener">GitHub</a>
                    </li>
                </ul>
            </div>
        </div>
    </nav>

    <main>
        <div class="container">
            <!-- Hero Section -->
<section class="hero-section d-flex align-items-center justify-content-center py-5">
    <div class="container">
        <h1 class="hero-title display-4">Web Crawler for Databases and AI Agents</h1>
        <!-- Each sentence is a block-level span: a <div> inside <p> would implicitly close the paragraph
             and leave the hero-subtitle/lead classes on an empty element -->
        <p class="hero-subtitle lead">
            <span class="d-block">Empower your database with a pluggable web crawler to enhance your queries with data from the Intranet/Internet</span>
            <span class="d-block">Supercharge your AI agents with an MCP-ready web crawler that delivers real-time insights from the web and your private knowledge bases</span>
        </p>
        <a href="/releases/latest/server/api/quickstart.html" class="btn btn-primary btn-lg me-2">Get started in 5 minutes, it's absolutely free</a>
    </div>
</section>

<!-- Features Section -->
<section id="features" class="py-5">
    <div class="container">
        <h2 class="text-center mb-4">Why Choose Web Data Source?</h2>
        <p class="lead text-center mb-5">A pluggable solution designed for data enthusiasts that turns Internet and Intranet resources into yet another data source</p>
        <!-- Card titles are h3 so the outline does not skip from h2 to h5; the .h5 class keeps the h5 sizing.
             Icons are decorative (each card has a text title) and are hidden from assistive technology. -->
        <div class="row g-4">
            <div class="col-md-4">
                <div class="feature-box text-center p-4 h-100">
                    <div class="feature-icon mb-3">
                        <i class="bi bi-lightning-charge-fill" aria-hidden="true"></i>
                    </div>
                    <h3 class="h5 mb-3">High Performance</h3>
                    <p>Automatically scales resources to match user demand, ensuring optimal performance</p>
                </div>
            </div>
            <div class="col-md-4">
                <div class="feature-box text-center p-4 h-100">
                    <div class="feature-icon mb-3">
                        <i class="bi bi-lock-fill" aria-hidden="true"></i>
                    </div>
                    <h3 class="h5 mb-3">Secure</h3>
                    <p>Embedded solution provides the best security and anonymization to make the gathering process safe and hidden from competitors</p>
                </div>
            </div>
            <div class="col-md-4">
                <div class="feature-box text-center p-4 h-100">
                    <div class="feature-icon mb-3">
                        <i class="bi bi-gear-fill" aria-hidden="true"></i>
                    </div>
                    <h3 class="h5 mb-3">Customizable</h3>
                    <p>Provides toolsets for popular databases and AI agents, enabling seamless web data extraction</p>
                </div>
            </div>
        </div>
    </div>
</section>

<!-- Advanced Features Section -->
<section id="advanced-features" class="py-5">
    <div class="container">
        <h2 class="text-center mb-4">Advanced Features</h2>
        <p class="lead text-center mb-5">Explore key features that make Web Data Source a powerful solution for your needs</p>
        <!-- Card titles are h3 so the outline does not skip from h2 to h5; the .h5 class keeps the h5 sizing.
             Icons are decorative (each card has a text title) and are hidden from assistive technology. -->
        <div class="row g-4">
            <div class="col-md-4">
                <div class="feature-box text-center p-4 h-100">
                    <div class="feature-icon mb-3">
                        <i class="bi bi-cloud-arrow-up-fill" aria-hidden="true"></i>
                    </div>
                    <h3 class="h5 mb-3">Cloud Integration</h3>
                    <p>This cloud-native solution can be deployed in any Kubernetes-compatible environment</p>
                </div>
            </div>
            <div class="col-md-4">
                <div class="feature-box text-center p-4 h-100">
                    <div class="feature-icon mb-3">
                        <i class="bi bi-shield-shaded" aria-hidden="true"></i>
                    </div>
                    <h3 class="h5 mb-3">Durability</h3>
                    <p>The solution is designed with a minimal component base to work on minimal hardware and restore itself after environmental outages.<br>It just works!</p>
                </div>
            </div>
            <div class="col-md-4">
                <div class="feature-box text-center p-4 h-100">
                    <div class="feature-icon mb-3">
                        <i class="bi bi-arrow-left-right" aria-hidden="true"></i>
                    </div>
                    <h3 class="h5 mb-3">Backward Compatibility</h3>
                    <p>Losing backward compatibility in work tools is painful! This solution is designed with Backward Compatibility as one of the main Architecturally Significant Requirements</p>
                </div>
            </div>
        </div>
    </div>
</section>

<!-- SQL Examples Section -->
<section class="examples py-5">
    <div class="container">
        <h2 class="text-center mb-4">Usage Examples</h2>
        <p class="lead text-center mb-5">Explore how to interact with web data sources in SQL queries</p>
        <!-- Cards have a fixed 600px inline width and wrap onto new rows inside this flex container.
             Whitespace inside each <pre> is rendered verbatim, so the SQL lines are deliberately
             left unindented relative to the surrounding markup; do not reformat them. -->
        <div class="sql-card-container d-flex flex-wrap justify-content-center gap-4">
            <!-- SQL Card 1: list the URLs matched by a CSS selector on the start page -->
            <div class="sql-card p-4" style="width: 600px;">
                <div class="sql-card-header">Getting URLs from a page</div>
                <pre><code class="sql overflow-hidden">
SELECT 
    nav.Task.Url URL
FROM wds.Start(@jobConfig) root
    OUTER APPLY wds.Crawl(root.Task, 'css: ul.nav a', null) nav
                    </code></pre>
            </div>
            <!-- SQL Card 2: crawl linked pages and scrape a name and a price from each -->
            <div class="sql-card p-4" style="width: 600px;">
                <div class="sql-card-header">Getting data from pages</div>
                <pre><code class="sql overflow-hidden">
SELECT  
    p.Task.Url URL,
    wds.ScrapeFirst(p.Task, 'css: h1', null) Name,
    wds.ScrapeFirst(p.Task, 'css: .price span', null) Price
FROM wds.Start(@jobConfig) r
    OUTER APPLY wds.Crawl(r.Task, 'css: table a', null) p
                </code></pre>
            </div>
            <!-- Additional SQL Cards as needed -->
        </div>
    </div>
    <!-- Syntax highlighting of the code blocks above is triggered by the hljs.highlightAll() call at the end of the body;
         presumably the "sql" class on each code element selects the grammar (confirm against the highlight.js docs) -->
</section>

<!-- CTA Section -->
<section class="cta-section py-5" id="cta">
  <!-- Closing call to action: heading, one-line pitch, and a link to the latest documentation -->
  <div class="container">
    <h2 class="mb-4">Ready to Dive In?</h2>
    <p class="mb-4">Start your journey with Web Data Source today</p>
    <a class="btn btn-light btn-lg me-2" href="/releases/latest/index.html">Browse Documentation</a>
  </div>
</section>
        </div>
    </main>
    
    <!-- Footer -->
    <footer class="footer py-3 d-flex flex-wrap justify-content-between align-items-center">
    <!-- Left column (currently empty) -->
    <div class="col-md-2 d-flex text-muted ps-2"></div>
    <!-- Centre column: copyright notice and social links.
         Each link opens in a new tab, so rel="noopener" keeps the new page from reaching window.opener.
         The icon glyphs are hidden from assistive technology because aria-label already names each link. -->
    <div class="col-md-8 d-flex justify-content-center">
        <span class="ms-3">© 2026 Web Data Source</span>
        <a href="https://www.linkedin.com/company/webdatasource" class="ms-3" target="_blank" rel="noopener" aria-label="LinkedIn"><i class="bi bi-linkedin" aria-hidden="true"></i></a>
        <a href="https://www.youtube.com/@webdatasource" class="ms-3" target="_blank" rel="noopener" aria-label="YouTube"><i class="bi bi-youtube" aria-hidden="true"></i></a>
        <a href="https://www.instagram.com/webdatasource" class="ms-3" target="_blank" rel="noopener" aria-label="Instagram"><i class="bi bi-instagram" aria-hidden="true"></i></a>
    </div>
    <!-- Right column (currently empty) -->
    <div class="col-md-2 d-flex justify-content-end text-muted pe-2"></div>
</footer>

    <!-- Scripts load in order: Bootstrap bundle, highlight.js core, its SQL language file, then the highlight call -->
    <script src="/assets/js/bootstrap/bootstrap.bundle.min.js?fp=fh8VA992XMpeCZiR"></script>
    <script src="/assets/js/highlight/highlight.min.js?fp=obQjGqK_O1s_PDSM"></script>
    <script src="/assets/js/highlight/languages/sql.min.js?fp=VsxG9yjdimnfEyyZ"></script>
    <script>
        hljs.highlightAll();
    </script>
</body>

</html>
