InternScience · us · Jun 14, 2026 · Jun 15, 2026 · gemini-code-assist · Jun 14, 2026
diff --git a/internagent/mas/agents/dr_agents/camel/loaders/__init__.py b/internagent/mas/agents/dr_agents/camel/loaders/__init__.py
@@ -16,6 +16,7 @@
 from .base_io import File, create_file, create_file_from_raw_bytes
 from .chunkr_reader import ChunkrReader
 from .crawl4ai_reader import Crawl4AI
+from .crw_reader import Crw
 from .firecrawl_reader import Firecrawl
 from .jina_url_reader import JinaURLReader
 from .mineru_extractor import MinerU
@@ -29,6 +30,7 @@
     'UnstructuredIO',
     'JinaURLReader',
     'Firecrawl',
+    'Crw',
     'Apify',
     'ChunkrReader',
     'PandasReader',

diff --git a/internagent/mas/agents/dr_agents/camel/loaders/crw_reader.py b/internagent/mas/agents/dr_agents/camel/loaders/crw_reader.py
@@ -0,0 +1,183 @@
+# ========= Copyright 2023-2024 @ CAMEL-AI.org. All Rights Reserved. =========
+# Licensed under the Apache License, Version 2.0 (the "License");
+# you may not use this file except in compliance with the License.
+# You may obtain a copy of the License at
+#
+#     http://www.apache.org/licenses/LICENSE-2.0
+#
+# Unless required by applicable law or agreed to in writing, software
+# distributed under the License is distributed on an "AS IS" BASIS,
+# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
+# See the License for the specific language governing permissions and
+# limitations under the License.
+# ========= Copyright 2023-2024 @ CAMEL-AI.org. All Rights Reserved. =========
+
+import os
+from typing import Any, Dict, Optional
+
+from pydantic import BaseModel
+
+
+class Crw:
+    r"""fastCRW allows you to turn entire websites into LLM-ready markdown.
+
+    fastCRW is a Firecrawl-compatible web scraper shipped as a single binary;
+    self-host (free, open core) or use the managed cloud.
+
+    Args:
+        api_key (Optional[str]): API key for authenticating with the fastCRW
+            API.
+        api_url (Optional[str]): Base URL for the fastCRW API. Defaults to the
+            managed cloud at ``https://fastcrw.com/api``; override for
+            self-hosted deployments.
+
+    References:
+        https://fastcrw.com/docs/rest-api
+    """
+
+    def __init__(
+        self,
+        api_key: Optional[str] = None,
+        api_url: Optional[str] = None,
+    ) -> None:
+        from crw import CrwClient
+
+        self._api_key = api_key or os.environ.get("CRW_API_KEY")
+        self._api_url = (
+            api_url
+            or os.environ.get("CRW_API_URL")
+            or "https://fastcrw.com/api"
+        )
+
+        self.app = CrwClient(api_key=self._api_key, api_url=self._api_url)
+
+    def crawl(
+        self,
+        url: str,
+        params: Optional[Dict[str, Any]] = None,
+        **kwargs: Any,
+    ) -> Any:
+        r"""Crawl a URL and all accessible subpages. Customize the crawl by
+        setting different parameters, and receive the full response or a job
+        ID based on the specified options.
+
+        Args:
+            url (str): The URL to crawl.
+            params (Optional[Dict[str, Any]]): Additional parameters for the
+                crawl request. Defaults to `None`.
+            **kwargs (Any): Additional keyword arguments, such as
+                `poll_interval`, `idempotency_key`.
+
+        Returns:
+            Any: The crawl job ID or the crawl results if waiting until
+                completion.
+
+        Raises:
+            RuntimeError: If the crawling process fails.
+        """
+
+        try:
+            # CrwClient.crawl() takes url + keyword args directly (no params
+            # dict) and handles polling internally, returning list[dict].
+            crawl_response = self.app.crawl(
+                url=url,
+                **(params or {}),
+                **kwargs,
+            )
-            crawl_response = self.app.crawl(
-                url=url,
-                **({} if params is None else params),
-                **kwargs,
-            )
+            crawl_response = self.app.crawl(
+                url=url,
+                **(params or {}),
+                **kwargs,
+            )
-            crawl_response = self.app.crawl(
-                url=url,
-                **({} if params is None else params),
-                **kwargs,
-            )
+            crawl_response = self.app.crawl(
+                url=url,
+                **(params or {}),
+                **kwargs,
+            )
+            return crawl_response
+        except Exception as e:
+            raise RuntimeError(f"Failed to crawl the URL: {e}")
+
+    def check_crawl_job(self, job_id: str) -> Dict:
+        r"""Check the status of a crawl job.
+
+        Not supported: CrwClient encapsulates crawl status polling inside
+        :meth:`crawl`, which blocks until completion and returns the results
+        directly. There is no public status-check method to call with a job ID.
+
+        Args:
+            job_id (str): The ID of the crawl job.
+
+        Raises:
+            NotImplementedError: Always — CrwClient handles polling internally.
+        """
+
+        raise NotImplementedError(
+            "CrwClient handles crawl status polling internally; crawl() blocks "
+            "until completion and returns results directly. There is no "
+            "separate check_crawl_status endpoint to query by job ID."
+        )
+
+    def scrape(
+        self,
+        url: str,
+        params: Optional[Dict[str, Any]] = None,
+    ) -> Dict:
+        r"""To scrape a single URL. This function supports advanced scraping
+        by setting different parameters and returns the full scraped data as a
+        dictionary.
+
+        Reference: https://fastcrw.com/docs/rest-api
+
+        Args:
+            url (str): The URL to read.
+            params (Optional[Dict[str, Any]]): Additional parameters for the
+                scrape request.
+
+        Returns:
+            Dict: The scraped data.
+
+        Raises:
+            RuntimeError: If the scrape process fails.
+        """
+        try:
+            return self.app.scrape(url, **(params or {}))
+        except Exception as e:
+            raise RuntimeError(f"Failed to scrape the URL: {e}")
+
+    def structured_scrape(self, url: str, response_format: BaseModel) -> Dict:
+        r"""Use LLM to extract structured data from given URL.
+
+        Args:
+            url (str): The URL to read.
+            response_format (BaseModel): A pydantic model
+                that includes value types and field descriptions used to
+                generate a structured response by LLM. This schema helps
+                in defining the expected output format.
+
+        Returns:
+            Dict: The content of the URL.
+
+        Raises:
+            RuntimeError: If the scrape process fails.
+        """
+        try:
+            data = self.app.scrape(
+                url,
+                formats=['json'],
+                jsonSchema=response_format.model_json_schema(),
+            )
+            return data.get('json', {}) if isinstance(data, dict) else {}
+        except Exception as e:
+            raise RuntimeError(f"Failed to perform structured scrape: {e}")
+
+    def map_site(
+        self, url: str, params: Optional[Dict[str, Any]] = None
+    ) -> list:
+        r"""Map a website to retrieve all accessible URLs.
+
+        Args:
+            url (str): The URL of the site to map.
+            params (Optional[Dict[str, Any]]): Additional parameters for the
+                map request. Defaults to `None`.
+
+        Returns:
+            list: A list containing the URLs found on the site.
+
+        Raises:
+            RuntimeError: If the mapping process fails.
+        """
+        try:
+            return self.app.map(url, **(params or {}))
+        except Exception as e:
+            raise RuntimeError(f"Failed to map the site: {e}")