Commit de1c03f

refactor!: Introduce new storage client system (#1194)
## Description

- I consolidated all commits from #1107 into this new PR.
- The previous storage-clients implementation was completely replaced with a redesigned set of clients, including:
  - a new storage-client interface,
  - an in-memory storage client,
  - a file-system storage client,
  - an Apify storage client (implemented in the SDK; see apify/apify-sdk-python#470),
  - and various adjustments elsewhere in the codebase.
- The old "memory plus persist" client has been split into separate memory and file-system implementations.
- The `Configuration.persist_storage` and `Configuration.persist_metadata` options were removed.
- All old collection clients have been removed; they are no longer needed.
- Each storage client now prints warnings if you pass method arguments it does not support.
- The creation management modules in the storage clients and storages were removed.
- Storage client parameters (e.g. `purge_on_start`, or `token` and `base_api_url` for the Apify client) are configured via the `Configuration`.
- Every storage, and its corresponding client, now provides both a `purge` method (which clears all items but preserves the storage and metadata) and a `drop` method (which removes the entire storage, metadata included); see the sketch after this list.
- All unused types, models, and helper utilities have been removed.
- The detailed, per-storage/client changes are listed below.
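A minimal sketch of the `purge` vs `drop` distinction described above, using the in-memory client and the default dataset; only methods listed in this PR are used:

```python
import asyncio

from crawlee.storage_clients import MemoryStorageClient
from crawlee.storages import Dataset


async def main() -> None:
    dataset = await Dataset.open(storage_client=MemoryStorageClient())
    await dataset.push_data([{'a': 1}, {'a': 2}])

    # purge() clears all items but keeps the storage and its metadata,
    # so the same dataset can be reused immediately.
    await dataset.purge()

    # drop() removes the entire storage, metadata included; opening the
    # same dataset afterwards creates a fresh one.
    await dataset.drop()


if __name__ == '__main__':
    asyncio.run(main())
```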
### Dataset

- Properties:
  - `id`
  - `name`
  - `metadata`
- Methods:
  - `open`
  - `purge` (new method)
  - `drop`
  - `push_data`
  - `get_data`
  - `iterate_items`
  - `list_items` (new method)
  - `export_to`
- Breaking changes:
  - `from_storage_object` method has been removed - use the `open` method with `name` or `id` instead.
  - `get_info` -> `metadata` property
  - `storage_object` -> `metadata` property
  - `set_metadata` method has been removed (it wasn't propagated to clients) - do we want to support it (e.g. for renaming)?
  - `write_to_json` method has been removed - use `export_to` instead (see the sketch after the example below).
  - `write_to_csv` method has been removed - use `export_to` instead.

```python
import asyncio

from crawlee.storage_clients import FileSystemStorageClient
from crawlee.storages import Dataset


async def main() -> None:
    dataset = await Dataset.open(storage_client=FileSystemStorageClient())
    print(f'default dataset - ID: {dataset.id}, name: {dataset.name}')

    await dataset.push_data({'name': 'John'})
    await dataset.push_data({'name': 'John', 'age': 20})
    await dataset.push_data({})

    dataset_with_name = await Dataset.open(
        name='my_dataset',
        storage_client=FileSystemStorageClient(),
    )
    print(f'named dataset - ID: {dataset_with_name.id}, name: {dataset_with_name.name}')

    await dataset_with_name.push_data([{'age': 30}, {'age': 25}])

    print('Default dataset items:')
    async for item in dataset.iterate_items(skip_empty=True):
        print(item)

    print('Named dataset items:')
    async for item in dataset_with_name.iterate_items():
        print(item)

    items = await dataset.get_data()
    print(items)

    dataset_by_id = await Dataset.open(id=dataset_with_name.id)
    print(f'dataset by ID - ID: {dataset_by_id.id}, name: {dataset_by_id.name}')


if __name__ == '__main__':
    asyncio.run(main())
```
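Since `write_to_json` and `write_to_csv` are gone, migrations go through `export_to`. A hedged sketch of that replacement; the `key` and `content_type` parameter names are assumptions for illustration and are not taken from this commit:

```python
import asyncio

from crawlee.storages import Dataset


async def main() -> None:
    dataset = await Dataset.open()
    await dataset.push_data([{'name': 'John'}, {'name': 'Jane'}])

    # Previously: await dataset.write_to_csv(...) / await dataset.write_to_json(...)
    # Now a single method covers both formats; the parameter names below
    # (key, content_type) are assumed for illustration.
    await dataset.export_to(key='results.csv', content_type='csv')
    await dataset.export_to(key='results.json', content_type='json')


if __name__ == '__main__':
    asyncio.run(main())
```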
### Key-value store

- Properties:
  - `id`
  - `name`
  - `metadata`
- Methods:
  - `open`
  - `purge` (new method)
  - `drop`
  - `get_value`
  - `set_value`
  - `delete_value` (new method; the Apify platform's `set_value` supports setting an empty value for a key, so a separate method for deleting is useful)
  - `iterate_keys`
  - `list_keys` (new method)
  - `get_public_url`
  - `get_auto_saved_value`
  - `persist_autosaved_values` (see the sketch after the example below)
- Breaking changes:
  - `from_storage_object` method has been removed - use the `open` method with `name` or `id` instead.
  - `get_info` -> `metadata` property
  - `storage_object` -> `metadata` property
  - `set_metadata` method has been removed (it wasn't propagated to clients) - do we want to support it (e.g. for renaming)?

```python
import asyncio

import requests

from crawlee.storage_clients import FileSystemStorageClient
from crawlee.storages import KeyValueStore


async def main() -> None:
    print('Opening key-value store "my_kvs"...')
    storage_client = FileSystemStorageClient()
    kvs = await KeyValueStore.open(name='my_kvs', storage_client=storage_client)

    print('Setting value to "file.json"...')
    await kvs.set_value('file.json', {'key': 'value'})

    print('Setting value to "file.jpg"...')
    response = requests.get('https://avatars.githubusercontent.com/u/25082181')
    await kvs.set_value('file.jpg', response.content)

    print('Iterating over keys:')
    async for key in kvs.iterate_keys():
        print(f'Key: {key}')

    print('Listing keys:')
    keys = [key.key for key in await kvs.list_keys()]
    print(f'Keys: {keys}')

    for key in keys:
        print(f'Getting value of {key}...')
        value = await kvs.get_value(key)
        print(f'Value: {str(value)[:100]}')

    print('Deleting value of "file.json"...')
    await kvs.delete_value('file.json')

    kvs_default = await KeyValueStore.open(storage_client=storage_client)

    special_key = 'key with spaces/and/slashes!@#$%^&*()'
    test_value = 'Special key value'
    await kvs_default.set_value(key=special_key, value=test_value)

    record = await kvs_default.get_value(key=special_key)
    assert record is not None
    assert record == test_value

    result = await kvs_default.list_keys()
    print(f'kvs_default list keys = {result}')

    kvs_2 = await KeyValueStore.open()
    result = await kvs_2.list_keys()
    print(f'kvs_2 list keys = {result}')


if __name__ == '__main__':
    asyncio.run(main())
```
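The `get_auto_saved_value` / `persist_autosaved_values` pair listed above targets state that should survive restarts. A minimal sketch, assuming `get_auto_saved_value(key, default_value)` returns a mutable dict that the store persists on its own schedule:

```python
import asyncio

from crawlee.storages import KeyValueStore


async def main() -> None:
    kvs = await KeyValueStore.open()

    # The returned dict is cached and persisted back to the store automatically;
    # the (key, default_value) signature is assumed here for illustration.
    state = await kvs.get_auto_saved_value('crawl_state', {'processed': 0})
    state['processed'] += 1

    # Force a write of all auto-saved values instead of waiting for the
    # periodic persistence.
    await kvs.persist_autosaved_values()


if __name__ == '__main__':
    asyncio.run(main())
```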
### Request queue

- Properties:
  - `id`
  - `name`
  - `metadata`
- Methods:
  - `open`
  - `purge` (new method)
  - `drop`
  - `add_request`
  - `add_requests_batched` -> `add_requests`
  - `fetch_next_request`
  - `get_request`
  - `mark_request_as_handled`
  - `reclaim_request`
  - `is_empty`
  - `is_finished`
- Breaking changes:
  - `from_storage_object` method has been removed - use the `open` method with `name` or `id` instead.
  - `get_info` -> `metadata` property
  - `storage_object` -> `metadata` property
  - `set_metadata` method has been removed (it wasn't propagated to clients) - do we want to support it (e.g. for renaming)?
  - `get_handled_count` method has been removed - use `metadata.handled_request_count` instead.
  - `get_total_count` method has been removed - use `metadata.total_request_count` instead.
  - `resource_directory` was removed from `RequestQueueMetadata` - use the `path_to...` property instead.
  - `RequestQueueHead` model has been removed - use `RequestQueueHeadWithLocks` instead.
- Notes:
  - The new RQ `add_requests` accepts a `forefront` arg (the Apify API supports it).

```python
import asyncio

from crawlee import Request
from crawlee.configuration import Configuration
from crawlee.storage_clients import FileSystemStorageClient
from crawlee.storages import RequestQueue


async def main() -> None:
    rq = await RequestQueue.open(
        name='my-queue',
        storage_client=FileSystemStorageClient(),
        configuration=Configuration(purge_on_start=True),
    )

    print(f'RequestQueue: {rq}')
    print(f'RequestQueue client: {rq._client}')

    await rq.add_requests(
        requests=[
            Request.from_url('https://example.com', use_extended_unique_key=True),
            Request.from_url('https://crawlee.dev', use_extended_unique_key=True),
            Request.from_url('https://apify.com', use_extended_unique_key=True),
        ],
    )
    print('Requests were added to the queue')

    is_empty = await rq.is_empty()
    is_finished = await rq.is_finished()
    print(f'Is empty: {is_empty}')
    print(f'Is finished: {is_finished}')

    request = await rq.fetch_next_request()
    print(f'Fetched request: {request}')

    await rq.add_request('https://facebook.com', forefront=True)
    request = await rq.fetch_next_request()
    print(f'Fetched request: {request}')

    rq_default = await RequestQueue.open(
        storage_client=FileSystemStorageClient(),
        configuration=Configuration(purge_on_start=True),
    )

    await rq_default.add_request('https://example.com/1')
    await rq_default.add_requests(
        [
            'https://example.com/priority-1',
            'https://example.com/priority-2',
            'https://example.com/priority-3',
        ]
    )
    await rq_default.add_request('https://example.com/2')


if __name__ == '__main__':
    asyncio.run(main())
```

### BaseDatasetClient

- Properties:
  - `metadata`
- Methods:
  - `open`
  - `purge`
  - `drop`
  - `push_data`
  - `get_data`
  - `iterate_items`

### BaseKeyValueStoreClient

- Properties:
  - `metadata`
- Methods:
  - `open`
  - `purge`
  - `drop`
  - `get_value`
  - `set_value`
  - `delete_value`
  - `iterate_keys`
  - `get_public_url`

### BaseRequestQueueClient

- Properties:
  - `metadata`
- Methods:
  - `open`
  - `purge`
  - `drop`
  - `add_requests_batch` -> `add_batch_of_requests` (one backend method for two frontend methods)
  - `get_request`
  - `fetch_next_request`
  - `mark_request_as_handled`
  - `reclaim_request`
  - `is_empty`
- Models:
  - `RequestQueueHeadWithLocks` -> `RequestQueueHead`
  - `BatchRequestsOperationResponse` -> `AddRequestsResponse`
- Notes:
  - The old file-system (memory) version didn't persist in-progress requests.
  - The old file-system (memory) version didn't persist forefront values (there is now an FS-specific `_sequence` field in the FS Request).
  - The methods for manipulating locks and listing heads are now internal to the Apify RQ client only.

## Issues

- Closes: #92
- Closes: #147
- Closes: #783
- Closes: #1247
- Relates: #1175
- Relates: #1191

## Testing

- The original tests were mostly removed and replaced with new ones.
- Each storage-client implementation now has its own dedicated tests at the client level (more targeted/edge-case coverage).
- On top of that, there are storage-level tests that use a parametrized fixture for each storage client (`file-system` and `memory`), ensuring every storage test runs against every client implementation (a sketch of such a fixture follows the checklist).

## Checklist

- [x] CI passed
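A rough sketch of the parametrized-fixture pattern mentioned in the Testing section; the fixture and test names are illustrative, not taken from the actual test suite, and an async-capable test runner such as pytest-asyncio or anyio is assumed:

```python
import pytest

from crawlee.storage_clients import FileSystemStorageClient, MemoryStorageClient, StorageClient
from crawlee.storages import Dataset


@pytest.fixture(params=['memory', 'file_system'])
def storage_client(request: pytest.FixtureRequest) -> StorageClient:
    """Provide every storage client implementation to each storage-level test."""
    if request.param == 'memory':
        return MemoryStorageClient()
    return FileSystemStorageClient()


async def test_push_and_get_data(storage_client: StorageClient) -> None:
    # The same test body runs once per storage client implementation.
    dataset = await Dataset.open(storage_client=storage_client)
    await dataset.push_data({'key': 'value'})

    # get_data() is assumed to return a list page with an `items` attribute.
    items = await dataset.get_data()
    assert items.items == [{'key': 'value'}]
```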
1 parent f855a90 commit de1c03f

File tree: 105 files changed, +6831 -6967 lines

Note: large commits have some content hidden by default, so some file paths below are not shown.

docs/deployment/code_examples/google/cloud_run_example.py

Lines changed: 7 additions & 8 deletions

```diff
@@ -5,24 +5,23 @@
 import uvicorn
 from litestar import Litestar, get
 
-from crawlee import service_locator
 from crawlee.crawlers import PlaywrightCrawler, PlaywrightCrawlingContext
-
-# highlight-start
-# Disable writing storage data to the file system
-configuration = service_locator.get_configuration()
-configuration.persist_storage = False
-configuration.write_metadata = False
-# highlight-end
+from crawlee.storage_clients import MemoryStorageClient
 
 
 @get('/')
 async def main() -> str:
     """The crawler entry point that will be called when the HTTP endpoint is accessed."""
+    # highlight-start
+    # Disable writing storage data to the file system
+    storage_client = MemoryStorageClient()
+    # highlight-end
+
     crawler = PlaywrightCrawler(
         headless=True,
         max_requests_per_crawl=10,
         browser_type='firefox',
+        storage_client=storage_client,
     )
 
     @crawler.router.default_handler
```

docs/deployment/code_examples/google/google_example.py

Lines changed: 7 additions & 8 deletions

```diff
@@ -6,22 +6,21 @@
 import functions_framework
 from flask import Request, Response
 
-from crawlee import service_locator
 from crawlee.crawlers import (
     BeautifulSoupCrawler,
     BeautifulSoupCrawlingContext,
 )
-
-# highlight-start
-# Disable writing storage data to the file system
-configuration = service_locator.get_configuration()
-configuration.persist_storage = False
-configuration.write_metadata = False
-# highlight-end
+from crawlee.storage_clients import MemoryStorageClient
 
 
 async def main() -> str:
+    # highlight-start
+    # Disable writing storage data to the file system
+    storage_client = MemoryStorageClient()
+    # highlight-end
+
     crawler = BeautifulSoupCrawler(
+        storage_client=storage_client,
         max_request_retries=1,
         request_handler_timeout=timedelta(seconds=30),
         max_requests_per_crawl=10,
```

docs/examples/code_examples/export_entire_dataset_to_file_csv.py

Lines changed: 1 addition & 1 deletion

```diff
@@ -30,7 +30,7 @@ async def request_handler(context: BeautifulSoupCrawlingContext) -> None:
     await crawler.run(['https://crawlee.dev'])
 
     # Export the entire dataset to a CSV file.
-    await crawler.export_data_csv(path='results.csv')
+    await crawler.export_data(path='results.csv')
 
 
 if __name__ == '__main__':
```

docs/examples/code_examples/export_entire_dataset_to_file_json.py

Lines changed: 1 addition & 1 deletion

```diff
@@ -30,7 +30,7 @@ async def request_handler(context: BeautifulSoupCrawlingContext) -> None:
     await crawler.run(['https://crawlee.dev'])
 
     # Export the entire dataset to a JSON file.
-    await crawler.export_data_json(path='results.json')
+    await crawler.export_data(path='results.json')
 
 
 if __name__ == '__main__':
```

docs/examples/code_examples/parsel_crawler.py

Lines changed: 1 addition & 1 deletion

```diff
@@ -40,7 +40,7 @@ async def some_hook(context: BasicCrawlingContext) -> None:
     await crawler.run(['https://github.com'])
 
     # Export the entire dataset to a JSON file.
-    await crawler.export_data_json(path='results.json')
+    await crawler.export_data(path='results.json')
 
 
 if __name__ == '__main__':
```
Lines changed: 65 additions & 0 deletions (new file; path hidden)

```python
from __future__ import annotations

from typing import TYPE_CHECKING

from crawlee.storage_clients import StorageClient
from crawlee.storage_clients._base import (
    DatasetClient,
    KeyValueStoreClient,
    RequestQueueClient,
)

if TYPE_CHECKING:
    from crawlee.configuration import Configuration

# Implement the storage type clients with your backend logic.


class CustomDatasetClient(DatasetClient):
    # Implement methods like push_data, get_data, iterate_items, etc.
    pass


class CustomKeyValueStoreClient(KeyValueStoreClient):
    # Implement methods like get_value, set_value, delete, etc.
    pass


class CustomRequestQueueClient(RequestQueueClient):
    # Implement methods like add_request, fetch_next_request, etc.
    pass


# Implement the storage client factory.


class CustomStorageClient(StorageClient):
    async def create_dataset_client(
        self,
        *,
        id: str | None = None,
        name: str | None = None,
        configuration: Configuration | None = None,
    ) -> CustomDatasetClient:
        # Create and return your custom dataset client.
        pass

    async def create_kvs_client(
        self,
        *,
        id: str | None = None,
        name: str | None = None,
        configuration: Configuration | None = None,
    ) -> CustomKeyValueStoreClient:
        # Create and return your custom key-value store client.
        pass

    async def create_rq_client(
        self,
        *,
        id: str | None = None,
        name: str | None = None,
        configuration: Configuration | None = None,
    ) -> CustomRequestQueueClient:
        # Create and return your custom request queue client.
        pass
```
Lines changed: 8 additions & 0 deletions (new file; path hidden)

```python
from crawlee.crawlers import ParselCrawler
from crawlee.storage_clients import FileSystemStorageClient

# Create a new instance of storage client.
storage_client = FileSystemStorageClient()

# And pass it to the crawler.
crawler = ParselCrawler(storage_client=storage_client)
```
Lines changed: 18 additions & 0 deletions (new file; path hidden)

```python
from crawlee.configuration import Configuration
from crawlee.crawlers import ParselCrawler
from crawlee.storage_clients import FileSystemStorageClient

# Create a new instance of storage client.
storage_client = FileSystemStorageClient()

# Create a configuration with custom settings.
configuration = Configuration(
    storage_dir='./my_storage',
    purge_on_start=False,
)

# And pass them to the crawler.
crawler = ParselCrawler(
    storage_client=storage_client,
    configuration=configuration,
)
```
Lines changed: 8 additions & 0 deletions (new file; path hidden)

```python
from crawlee.crawlers import ParselCrawler
from crawlee.storage_clients import MemoryStorageClient

# Create a new instance of storage client.
storage_client = MemoryStorageClient()

# And pass it to the crawler.
crawler = ParselCrawler(storage_client=storage_client)
```
Lines changed: 29 additions & 0 deletions (new file; path hidden)

```python
import asyncio

from crawlee import service_locator
from crawlee.crawlers import ParselCrawler
from crawlee.storage_clients import MemoryStorageClient
from crawlee.storages import Dataset


async def main() -> None:
    # Create custom storage client, MemoryStorageClient for example.
    storage_client = MemoryStorageClient()

    # Register it globally via the service locator.
    service_locator.set_storage_client(storage_client)

    # Or pass it directly to the crawler, it will be registered globally
    # to the service locator under the hood.
    crawler = ParselCrawler(storage_client=storage_client)

    # Or just provide it when opening a storage (e.g. dataset), it will be used
    # for this storage only, not globally.
    dataset = await Dataset.open(
        name='my_dataset',
        storage_client=storage_client,
    )


if __name__ == '__main__':
    asyncio.run(main())
```
