mirror of
https://github.com/DOI-DO/j40-cejst-2.git
synced 2025-07-27 22:31:16 -07:00
Add pre-cleaning to a couple of zip files during geo-score (#2151)
Two zip files were not being cleared before geo-score ran. As a result, they grew with every run until the application ground to a halt. This fix clears those two zip files before geo-score and before the full run.
This commit is contained in:
parent
d831a808d2
commit
9ba4e790a7
2 changed files with 21 additions and 0 deletions
|
@ -22,6 +22,7 @@ from data_pipeline.utils import downloadable_cleanup
|
|||
from data_pipeline.utils import get_module_logger
|
||||
from data_pipeline.utils import score_folder_cleanup
|
||||
from data_pipeline.utils import temp_folder_cleanup
|
||||
from data_pipeline.utils import geo_score_folder_cleanup
|
||||
|
||||
logger = get_module_logger(__name__)
|
||||
|
||||
|
@ -58,6 +59,7 @@ def data_cleanup():
|
|||
tribal_reset(data_path)
|
||||
score_folder_cleanup()
|
||||
temp_folder_cleanup()
|
||||
geo_score_folder_cleanup()
|
||||
|
||||
logger.info("Cleaned up all data folders")
|
||||
sys.exit()
|
||||
|
@ -179,6 +181,7 @@ def geo_score(data_source: str):
|
|||
None
|
||||
"""
|
||||
|
||||
geo_score_folder_cleanup()
|
||||
score_geo(data_source=data_source)
|
||||
sys.exit()
|
||||
|
||||
|
|
|
@ -17,6 +17,7 @@ from data_pipeline.config import settings
|
|||
from data_pipeline.content.schemas.download_schemas import CodebookConfig
|
||||
from data_pipeline.content.schemas.download_schemas import CSVConfig
|
||||
from data_pipeline.content.schemas.download_schemas import ExcelConfig
|
||||
from data_pipeline.etl.score.constants import SCORE_VERSIONING_SHAPEFILE_CODEBOOK_FILE_PATH
|
||||
from marshmallow import ValidationError
|
||||
from marshmallow_dataclass import class_schema
|
||||
|
||||
|
@ -218,9 +219,26 @@ def score_folder_cleanup() -> None:
|
|||
remove_all_from_dir(data_path / "score" / "csv")
|
||||
remove_all_from_dir(data_path / "score" / "geojson")
|
||||
remove_all_from_dir(data_path / "score" / "tiles")
|
||||
remove_all_from_dir(data_path / "score" / "shapefile")
|
||||
downloadable_cleanup()
|
||||
|
||||
|
||||
def geo_score_folder_cleanup() -> None:
    """Delete the zip archives that must be gone before geo-score runs.

    Only zip files are targeted: if they are left in place, python's zip
    utils keep adding to them instead of overwriting their contents.
    """
    shapefile_dir = settings.APP_ROOT / "data" / "score" / "shapefile"

    logger.info("Removing zip files")
    remove_files_from_dir(shapefile_dir, ".zip")

    # The combined shapefile + codebook archive is addressed by its own
    # constant, so it is removed separately, and only when it is a file.
    versioned_archive = SCORE_VERSIONING_SHAPEFILE_CODEBOOK_FILE_PATH
    if not os.path.isfile(versioned_archive):
        return
    os.remove(versioned_archive)
|
||||
|
||||
|
||||
def downloadable_cleanup() -> None:
|
||||
"""Remove all files from downloadable directory in the local data/score path"""
|
||||
|
||||
|
|
Loading…
Add table
Add a link
Reference in a new issue