Adding EAMLIS and FUDS data to legacy pollution in score (#1832)

Update to add EAMLIS and FUDS data to score
2025-10-01 08:53:18 -07:00 · 2022-08-18 13:32:29 -04:00 · 2022-08-18 13:32:29 -04:00 · cb4866b93f
commit cb4866b93f
parent 6e41e0d9f0
14 changed files with 93 additions and 24 deletions
--- a/data/data-pipeline/data_pipeline/etl/runner.py
+++ b/data/data-pipeline/data_pipeline/etl/runner.py
@@ -93,21 +93,23 @@ def etl_runner(dataset_to_run: str = None) -> None:
        dataset for dataset in dataset_list if dataset["is_memory_intensive"]
    ]

-    logger.info("Running concurrent jobs")
-    with concurrent.futures.ThreadPoolExecutor() as executor:
-        futures = {
-            executor.submit(_run_one_dataset, dataset=dataset)
-            for dataset in concurrent_datasets
-        }
+    if concurrent_datasets:
+        logger.info("Running concurrent jobs")
+        with concurrent.futures.ThreadPoolExecutor() as executor:
+            futures = {
+                executor.submit(_run_one_dataset, dataset=dataset)
+                for dataset in concurrent_datasets
+            }

-        for fut in concurrent.futures.as_completed(futures):
-            # Calling result will raise an exception if one occurred.
-            # Otherwise, the exceptions are silently ignored.
-            fut.result()
+            for fut in concurrent.futures.as_completed(futures):
+                # Calling result will raise an exception if one occurred.
+                # Otherwise, the exceptions are silently ignored.
+                fut.result()

-    logger.info("Running high-memory jobs")
-    for dataset in high_memory_datasets:
-        _run_one_dataset(dataset=dataset)
+    if high_memory_datasets:
+        logger.info("Running high-memory jobs")
+        for dataset in high_memory_datasets:
+            _run_one_dataset(dataset=dataset)


 def score_generate() -> None: