multithreading

This commit is contained in:
2025-11-18 22:09:20 +00:00
parent 69c1b86bf1
commit aa1879582a
5 changed files with 150 additions and 178 deletions
+60 -32
View File
@@ -2,50 +2,78 @@ from modules.nimrod import Nimrod
import os
from pathlib import Path
import logging
import concurrent.futures
class BatchNimrod:
    """Convert a folder of Nimrod DAT files to ASC files using a thread pool.

    The ``config`` object is expected to expose the attributes read by the
    methods below: ``DAT_TOP_FOLDER`` (input directory), ``ASC_TOP_FOLDER``
    (output directory) and ``delete_dat_after_processing`` (truthy to remove
    each input file once it has been converted).
    """

    def __init__(self, config) -> None:
        """Keep a reference to the configuration used by the processing methods."""
        self.config = config

    def _process_single_file(self, in_file):
        """Process a single Nimrod DAT file.

        The file is parsed with ``Nimrod``, written out as
        ``<validity time>.asc`` inside ``config.ASC_TOP_FOLDER`` and, when
        ``config.delete_dat_after_processing`` is set, removed afterwards.
        Every failure is logged and reported through the return value, so
        this method is safe to run as a thread-pool task.

        Args:
            in_file (str): Filename of the DAT file, relative to
                ``config.DAT_TOP_FOLDER``.

        Returns:
            bool: True if successful, False otherwise.
        """
        in_file_full = Path(self.config.DAT_TOP_FOLDER, in_file)
        try:
            # The file is opened here, inside the worker thread, and kept open
            # until the export has finished so the conversion never touches a
            # closed handle, whatever Nimrod's reading strategy is.
            with open(in_file_full, "rb") as dat_file:
                image = Nimrod(dat_file)

                # NOTE(review): two inputs sharing a validity time would target
                # the same output path - confirm inputs are unique per time.
                out_file_name = f"{image.get_validity_time()}.asc"
                out_file_path = Path(self.config.ASC_TOP_FOLDER, out_file_name)

                with open(out_file_path, "w") as outfile:
                    image.extract_asc(outfile)

            # Delete only after the input handle is closed; removing an open
            # file fails on some platforms.
            if self.config.delete_dat_after_processing:
                os.remove(in_file_full)

            logging.debug(f"Successfully processed: {in_file_full}")
            return True

        except Nimrod.HeaderReadError as e:
            logging.error(f"Failed to read file {in_file_full}, is it corrupt?")
            logging.error(e)
            return False
        except Nimrod.PayloadReadError as e:
            logging.error(f"Failed to load the raster data in {in_file_full}")
            logging.error(e)
            return False
        except Exception as e:
            # Worker boundary: one bad file must not abort the whole batch.
            logging.error(f"Unexpected error processing {in_file_full}: {e}")
            return False

    def process_nimrod_files(self) -> None:
        """Process all Nimrod files in the input directory concurrently.

        Every regular, non-hidden file in ``config.DAT_TOP_FOLDER`` is handed
        to ``_process_single_file`` on a thread pool. Progress is logged every
        ten completed files and a success/failure summary is logged at the end.
        """
        dat_folder = Path(self.config.DAT_TOP_FOLDER)

        # Skip dot-files and anything that is not a regular file
        # (sub-directories cannot be parsed as DAT files).
        files_to_process = [
            name
            for name in os.listdir(dat_folder)
            if not name.startswith(".") and (dat_folder / name).is_file()
        ]
        total_files = len(files_to_process)
        logging.info(f"Processing {total_files} files concurrently...")

        succeeded = 0
        failed = 0
        with concurrent.futures.ThreadPoolExecutor() as executor:
            # Submit all tasks, remembering which file each future belongs to.
            future_to_file = {
                executor.submit(self._process_single_file, in_file): in_file
                for in_file in files_to_process
            }

            completed_count = 0
            for future in concurrent.futures.as_completed(future_to_file):
                completed_count += 1
                try:
                    # Collect the worker's verdict instead of discarding it.
                    was_successful = future.result()
                except Exception as e:
                    # Only reached if the worker itself raised unexpectedly.
                    logging.error(
                        f"Worker crashed while processing {future_to_file[future]}: {e}"
                    )
                    was_successful = False

                if was_successful:
                    succeeded += 1
                else:
                    failed += 1

                if completed_count % 10 == 0:
                    logging.info(f'processed {completed_count} out of {total_files} files')

        logging.info(
            f"Finished processing {total_files} files: "
            f"{succeeded} succeeded, {failed} failed"
        )