Commit 2e04e5a

feat: searchscraper
1 parent 9149ce8 commit 2e04e5a

12 files changed: +603 / -30 lines changed
Lines changed: 46 additions & 0 deletions
@@ -0,0 +1,46 @@

"""
Example of using the async searchscraper functionality to search for information concurrently.
"""

import asyncio

from scrapegraph_py import AsyncClient
from scrapegraph_py.logger import sgai_logger

sgai_logger.set_logging(level="INFO")


async def main():
    # Initialize async client
    sgai_client = AsyncClient(api_key="your-api-key-here")

    # List of search queries
    queries = [
        "What is the latest version of Python and what are its main features?",
        "What are the key differences between Python 2 and Python 3?",
        "What is Python's GIL and how does it work?",
    ]

    # Create tasks for concurrent execution
    tasks = [sgai_client.searchscraper(user_prompt=query) for query in queries]

    # Execute requests concurrently; return_exceptions=True collects failures
    # instead of cancelling the whole batch
    responses = await asyncio.gather(*tasks, return_exceptions=True)

    # Process results
    for i, response in enumerate(responses):
        if isinstance(response, Exception):
            print(f"\nError for query {i+1}: {response}")
        else:
            print(f"\nSearch {i+1}:")
            print(f"Query: {queries[i]}")
            print(f"Result: {response['result']}")
            print("Reference URLs:")
            for url in response["reference_urls"]:
                print(f"- {url}")

    await sgai_client.close()


if __name__ == "__main__":
    asyncio.run(main())
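
With asyncio.gather every request starts at once. For longer query lists it can help to cap the number of in-flight requests; a minimal sketch using asyncio.Semaphore (the limit of 5 and the helper names are illustrative assumptions, not SDK defaults):

import asyncio

from scrapegraph_py import AsyncClient


async def bounded_search(client: AsyncClient, sem: asyncio.Semaphore, query: str):
    # Hold one semaphore slot per in-flight request
    async with sem:
        return await client.searchscraper(user_prompt=query)


async def run_bounded(queries: list[str], limit: int = 5):
    sem = asyncio.Semaphore(limit)  # illustrative concurrency cap
    client = AsyncClient(api_key="your-api-key-here")
    try:
        tasks = [bounded_search(client, sem, q) for q in queries]
        return await asyncio.gather(*tasks, return_exceptions=True)
    finally:
        await client.close()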
Lines changed: 119 additions & 0 deletions
@@ -0,0 +1,119 @@

"""
Example of using the async searchscraper functionality with output schemas for extraction.
"""

import asyncio
from typing import List

from pydantic import BaseModel

from scrapegraph_py import AsyncClient
from scrapegraph_py.logger import sgai_logger

sgai_logger.set_logging(level="INFO")


# Define schemas for extracting structured data
class PythonVersionInfo(BaseModel):
    version: str
    release_date: str
    major_features: List[str]


class PythonComparison(BaseModel):
    key_differences: List[str]
    backward_compatible: bool
    migration_difficulty: str


class GILInfo(BaseModel):
    definition: str
    purpose: str
    limitations: List[str]
    workarounds: List[str]


async def main():
    # Initialize async client
    sgai_client = AsyncClient(api_key="your-api-key-here")

    # Define search queries with their corresponding schemas
    searches = [
        {
            "prompt": "What is the latest version of Python? Include the release date and main features.",
            "schema": PythonVersionInfo,
        },
        {
            "prompt": "Compare Python 2 and Python 3, including backward compatibility and migration difficulty.",
            "schema": PythonComparison,
        },
        {
            "prompt": "Explain Python's GIL, its purpose, limitations, and possible workarounds.",
            "schema": GILInfo,
        },
    ]

    # Create tasks for concurrent execution
    tasks = [
        sgai_client.searchscraper(
            user_prompt=search["prompt"],
            output_schema=search["schema"],
        )
        for search in searches
    ]

    # Execute requests concurrently
    responses = await asyncio.gather(*tasks, return_exceptions=True)

    # Process results
    for i, response in enumerate(responses):
        if isinstance(response, Exception):
            print(f"\nError for search {i+1}: {response}")
        else:
            print(f"\nSearch {i+1}:")
            print(f"Query: {searches[i]['prompt']}")
            # print(f"Raw Result: {response['result']}")

            try:
                # Try to extract structured data using the schema
                result = searches[i]["schema"].model_validate(response["result"])

                # Print extracted structured data
                if isinstance(result, PythonVersionInfo):
                    print("\nExtracted Data:")
                    print(f"Python Version: {result.version}")
                    print(f"Release Date: {result.release_date}")
                    print("Major Features:")
                    for feature in result.major_features:
                        print(f"- {feature}")

                elif isinstance(result, PythonComparison):
                    print("\nExtracted Data:")
                    print("Key Differences:")
                    for diff in result.key_differences:
                        print(f"- {diff}")
                    print(f"Backward Compatible: {result.backward_compatible}")
                    print(f"Migration Difficulty: {result.migration_difficulty}")

                elif isinstance(result, GILInfo):
                    print("\nExtracted Data:")
                    print(f"Definition: {result.definition}")
                    print(f"Purpose: {result.purpose}")
                    print("Limitations:")
                    for limit in result.limitations:
                        print(f"- {limit}")
                    print("Workarounds:")
                    for workaround in result.workarounds:
                        print(f"- {workaround}")
            except Exception as e:
                print(f"\nCould not extract structured data: {e}")

            print("\nReference URLs:")
            for url in response["reference_urls"]:
                print(f"- {url}")

    await sgai_client.close()


if __name__ == "__main__":
    asyncio.run(main())
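
The isinstance chain above grows with every new schema. A small, hedged alternative is a generic helper that validates any result against its schema and pretty-prints it; model_validate and model_dump_json are standard pydantic v2 calls, while the helper itself is illustrative and not part of the SDK:

from pydantic import BaseModel, ValidationError


def print_structured(result: dict, schema: type[BaseModel]) -> None:
    # Validate the raw result dict against the schema, then dump it as JSON
    try:
        model = schema.model_validate(result)
        print(model.model_dump_json(indent=2))
    except ValidationError as e:
        print(f"Could not extract structured data: {e}")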
Lines changed: 26 additions & 0 deletions
@@ -0,0 +1,26 @@

"""
Example of using the searchscraper functionality to search for information.
"""

from scrapegraph_py import Client
from scrapegraph_py.logger import sgai_logger

sgai_logger.set_logging(level="INFO")

# Initialize the client
client = Client(api_key="your-api-key-here")

# Send a searchscraper request
response = client.searchscraper(
    user_prompt="What is the latest version of Python and what are its main features?"
)

# Print the results
print("\nResults:")
print(f"Answer: {response['result']}")
print("\nReference URLs:")
for url in response["reference_urls"]:
    print(f"- {url}")

# Close the client
client.close()
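
searchscraper responses also carry a request_id (the schema example below prints one). A minimal sketch of fetching a result again later by ID, assuming the sync Client exposes a get_searchscraper that mirrors the async method added further down in this commit:

from scrapegraph_py import Client

client = Client(api_key="your-api-key-here")

response = client.searchscraper(user_prompt="What is the latest version of Python?")
request_id = response["request_id"]

# Retrieve the same result later by ID (assumed sync counterpart of
# AsyncClient.get_searchscraper shown later in this diff)
previous = client.get_searchscraper(request_id=request_id)
print(previous["result"])

client.close()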
Lines changed: 41 additions & 0 deletions
@@ -0,0 +1,41 @@

"""
Example of using the searchscraper functionality with a custom output schema.
"""

from typing import List

from pydantic import BaseModel

from scrapegraph_py import Client
from scrapegraph_py.logger import sgai_logger

sgai_logger.set_logging(level="INFO")


# Define a custom schema for the output
class PythonVersionInfo(BaseModel):
    version: str
    release_date: str
    major_features: List[str]
    is_latest: bool


# Initialize the client
client = Client(api_key="your-api-key-here")

# Send a searchscraper request with schema
response = client.searchscraper(
    user_prompt="What is the latest version of Python? Include the release date and main features.",
    output_schema=PythonVersionInfo,
)

# The result will be structured according to our schema
print(f"Request ID: {response['request_id']}")
print(f"Result: {response['result']}")

print("\nReference URLs:")
for url in response["reference_urls"]:
    print(f"- {url}")

# Close the client
client.close()
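
Since the request passed output_schema, response["result"] should conform to PythonVersionInfo; to work with typed attributes rather than a raw dict, the same model_validate pattern from the async schema example applies. A short continuation of the example above:

from pydantic import ValidationError

try:
    info = PythonVersionInfo.model_validate(response["result"])
    print(f"Version: {info.version} (latest: {info.is_latest})")
    for feature in info.major_features:
        print(f"- {feature}")
except ValidationError as e:
    print(f"Result did not match the schema: {e}")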
@@ -1,28 +1,28 @@ (both sides of this hunk are textually identical; likely a whitespace or line-ending rewrite)

from scrapegraph_py import Client
from scrapegraph_py.logger import sgai_logger

sgai_logger.set_logging(level="INFO")

# Initialize the client
sgai_client = Client(api_key="your-api-key-here")

# Example request_id (replace with an actual request_id from a previous request)
request_id = "your-request-id-here"

# Check remaining credits
credits = sgai_client.get_credits()
print(f"Credits Info: {credits}")

# Submit feedback for a previous request
feedback_response = sgai_client.submit_feedback(
    request_id=request_id,
    rating=5,  # Rating from 1-5
    feedback_text="The extraction was accurate and exactly what I needed!",
)
print(f"\nFeedback Response: {feedback_response}")

# Get previous results using get_smartscraper
previous_result = sgai_client.get_smartscraper(request_id=request_id)
print(f"\nRetrieved Previous Result: {previous_result}")

sgai_client.close()

scrapegraph-py/pyproject.toml

Lines changed: 2 additions & 2 deletions
@@ -83,7 +83,7 @@ line-length = 88

 [tool.ruff.lint]
 select = ["F", "E", "W", "C"]
-ignore = ["E203", "E501"]  # Ignore conflicts with Black
+ignore = ["E203", "E501", "C901"]  # Ignore conflicts with Black and function complexity

 [tool.mypy]
 python_version = "3.10"

@@ -97,4 +97,4 @@ build-backend = "hatchling.build"

 [tool.poe.tasks]
 pylint-local = "pylint scrapegraph_py/**/*.py"
-pylint-ci = "pylint --disable=C0114,C0115,C0116 --exit-zero scrapegraph_py/**/*.py"
+pylint-ci = "pylint --disable=C0114,C0115,C0116,C901 --exit-zero scrapegraph_py/**/*.py"

scrapegraph-py/scrapegraph_py/async_client.py

Lines changed: 43 additions & 0 deletions
@@ -10,6 +10,10 @@
 from scrapegraph_py.logger import sgai_logger as logger
 from scrapegraph_py.models.feedback import FeedbackRequest
 from scrapegraph_py.models.markdownify import GetMarkdownifyRequest, MarkdownifyRequest
+from scrapegraph_py.models.searchscraper import (
+    GetSearchScraperRequest,
+    SearchScraperRequest,
+)
 from scrapegraph_py.models.smartscraper import (
     GetSmartScraperRequest,
     SmartScraperRequest,

@@ -241,6 +245,45 @@ async def get_credits(self):
         )
         return result

+    async def searchscraper(
+        self,
+        user_prompt: str,
+        headers: Optional[dict[str, str]] = None,
+        output_schema: Optional[BaseModel] = None,
+    ):
+        """Send a searchscraper request"""
+        logger.info("🔍 Starting searchscraper request")
+        logger.debug(f"📝 Prompt: {user_prompt}")
+        if headers:
+            logger.debug("🔧 Using custom headers")
+
+        request = SearchScraperRequest(
+            user_prompt=user_prompt,
+            headers=headers,
+            output_schema=output_schema,
+        )
+        logger.debug("✅ Request validation passed")
+
+        result = await self._make_request(
+            "POST", f"{API_BASE_URL}/searchscraper", json=request.model_dump()
+        )
+        logger.info("✨ Searchscraper request completed successfully")
+        return result
+
+    async def get_searchscraper(self, request_id: str):
+        """Get the result of a previous searchscraper request"""
+        logger.info(f"🔍 Fetching searchscraper result for request {request_id}")
+
+        # Validate input using Pydantic model
+        GetSearchScraperRequest(request_id=request_id)
+        logger.debug("✅ Request ID validation passed")
+
+        result = await self._make_request(
+            "GET", f"{API_BASE_URL}/searchscraper/{request_id}"
+        )
+        logger.info(f"✨ Successfully retrieved result for request {request_id}")
+        return result
+
     async def close(self):
         """Close the session to free up resources"""
         logger.info("🔒 Closing AsyncClient session")