dlt-hub · rudolfix · Oct 2, 2024 · Oct 2, 2024 · Oct 2, 2024
diff --git a/sources/pg_replication/schema_types.py b/sources/pg_replication/schema_types.py
@@ -79,7 +79,11 @@ def _get_scale(type_id: int, atttypmod: int) -> Optional[int]:
 @lru_cache(maxsize=None)
 def _type_mapper() -> Any:
     from dlt.destinations import postgres
-    from dlt.destinations.impl.postgres.postgres import PostgresTypeMapper
+
+    try:
+        from dlt.destinations.impl.postgres.postgres import PostgresTypeMapper
+    except ImportError:
+        from dlt.destinations.impl.postgres.factory import PostgresTypeMapper  # type: ignore
 
     return PostgresTypeMapper(postgres().capabilities())
 

diff --git a/sources/scraping/__init__.py b/sources/scraping/__init__.py
@@ -8,7 +8,6 @@
 import dlt
 
 from dlt.sources import DltResource
-from dlt.common.source import _SOURCES, SourceInfo
 
 from scrapy import Spider  # type: ignore
 
@@ -65,10 +64,8 @@ def run_pipeline(  # type: ignore[valid-type]
     scraping_host.run(*args, **kwargs)
 
 
-# This way we allow dlt init to detect scraping source it is indeed hacky
-# and the core team is working to provide a better alternative.
-_SOURCES[run_pipeline.__qualname__] = SourceInfo(
-    ScrapingConfig,
-    run_pipeline,
-    inspect.getmodule(run_pipeline),
-)
+@dlt.source(spec=ScrapingConfig)
+def _register() -> DltResource:
+    raise NotImplementedError(
+        "Due to internal architecture of Scrapy, we could not represent it as a generator. Please use `run_pipeline` function instead"
+    )
diff --git a/sources/scraping/runner.py b/sources/scraping/runner.py
@@ -191,5 +191,5 @@ def run(
         logger.info("Starting scrapy crawler")
         self.scrapy_runner.run()
 
-        # Wait to for pipeline finish it's job
+        # Wait for the pipeline to finish its job
         pipeline_worker.join()