Split shared cache in backend and frontend #443

Merged
merged 2 commits on Oct 27, 2024
executorlib/backend/cache_parallel.py (1 addition & 1 deletion)

@@ -3,7 +3,7 @@

 import cloudpickle

-from executorlib.shared.cache import backend_load_file, backend_write_file
+from executorlib.cache.backend import backend_load_file, backend_write_file

💡 Codebase verification

Migration to executorlib.cache.backend is incomplete

The architectural split is not fully implemented:

  • backend.py still imports from executorlib.shared.cache
  • executor.py still uses old imports from executorlib.shared.cache
  • Only the backend execution modules (cache_parallel.py and cache_serial.py) have adopted the new import path

This suggests the migration is only partially done and needs to be completed for architectural consistency.

🔗 Analysis chain

LGTM! Verify architectural consistency.

The import path change aligns with the PR objective of splitting shared cache between backend and frontend.

Let's verify the architectural consistency:

🏁 Scripts executed

The following scripts were executed for the analysis:

Script:

#!/bin/bash
# Description: Verify that other backend modules follow the same import pattern
# and that frontend modules don't import from backend cache

# Check if other backend modules use the new import path
echo "Checking backend modules for consistent import patterns:"
rg -l "from executorlib.cache.backend import" "executorlib/backend/"

# Verify frontend doesn't import from backend cache
echo "Checking frontend modules don't import from backend cache:"
rg -l "from executorlib.cache.backend import" "executorlib/frontend/"

# Check for any remaining references to the old path
echo "Checking for remaining references to old path:"
rg -l "from executorlib.shared.cache import" "executorlib/"

Length of output: 749


Script:

#!/bin/bash
# Let's check the content of these files to understand the import structure better

# Check the implementation in backend.py to see if it's properly split
echo "Content of executorlib/cache/backend.py:"
cat executorlib/cache/backend.py

# Check executor.py to understand why it still uses the old import
echo -e "\nContent of executorlib/cache/executor.py:"
cat executorlib/cache/executor.py

# Check cache_serial.py to verify consistent usage pattern
echo -e "\nContent of executorlib/backend/cache_serial.py:"
cat executorlib/backend/cache_serial.py

Length of output: 3643



 def main() -> None:
executorlib/backend/cache_serial.py (2 additions & 2 deletions)

@@ -1,6 +1,6 @@
 import sys

-from executorlib.shared.cache import execute_task_in_file
+from executorlib.cache.backend import backend_execute_task_in_file

 if __name__ == "__main__":
-    execute_task_in_file(file_name=sys.argv[1])
+    backend_execute_task_in_file(file_name=sys.argv[1])
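For orientation, the frontend runs this script in a subprocess with the task file as its only argument (_get_execute_command builds the command list and execute_in_subprocess launches it, per executorlib/shared/cache.py below). A minimal by-hand sketch; the task file path and its .h5in extension are assumptions:

# Hypothetical manual invocation of the serial backend.
import subprocess
import sys

subprocess.run(
    [sys.executable, "executorlib/backend/cache_serial.py", "/tmp/task.h5in"],
    check=True,
)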
executorlib/cache/backend.py (new file, 64 additions)

@@ -0,0 +1,64 @@
import os
from typing import Any

from executorlib.shared.cache import FutureItem
from executorlib.shared.hdf import dump, load


def backend_load_file(file_name: str) -> dict:
    """
    Load the data from an HDF5 file and convert FutureItem objects to their results.

    Args:
        file_name (str): The name of the HDF5 file.

    Returns:
        dict: The loaded data from the file.

    """
    apply_dict = load(file_name=file_name)
    apply_dict["args"] = [
        arg if not isinstance(arg, FutureItem) else arg.result()
        for arg in apply_dict["args"]
    ]
    apply_dict["kwargs"] = {
        key: arg if not isinstance(arg, FutureItem) else arg.result()
        for key, arg in apply_dict["kwargs"].items()
    }
    return apply_dict
Comment on lines +8 to +28

⚠️ Potential issue

Add error handling for file operations and Future resolution

While the implementation is correct, it lacks error handling for potential failure scenarios:

  • File I/O operations might fail
  • FutureItem.result() could raise exceptions

Consider adding try-except blocks:

 def backend_load_file(file_name: str) -> dict:
-    apply_dict = load(file_name=file_name)
-    apply_dict["args"] = [
-        arg if not isinstance(arg, FutureItem) else arg.result()
-        for arg in apply_dict["args"]
-    ]
-    apply_dict["kwargs"] = {
-        key: arg if not isinstance(arg, FutureItem) else arg.result()
-        for key, arg in apply_dict["kwargs"].items()
-    }
-    return apply_dict
+    try:
+        apply_dict = load(file_name=file_name)
+        try:
+            apply_dict["args"] = [
+                arg if not isinstance(arg, FutureItem) else arg.result()
+                for arg in apply_dict["args"]
+            ]
+            apply_dict["kwargs"] = {
+                key: arg if not isinstance(arg, FutureItem) else arg.result()
+                for key, arg in apply_dict["kwargs"].items()
+            }
+            return apply_dict
+        except Exception as e:
+            raise RuntimeError(f"Failed to resolve FutureItems: {str(e)}") from e
+    except Exception as e:
+        raise RuntimeError(f"Failed to load file {file_name}: {str(e)}") from e
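To make the FutureItem handling concrete, here is a hedged sketch of the resolution step backend_load_file performs; it assumes FutureItem is constructed from the upstream task's output file name (matching the _file_name attribute visible in shared/cache.py below) and that result() returns the value stored in that file:

# Illustration only: a FutureItem placeholder standing in for an upstream
# task's result is swapped for its concrete value before the task runs.
from executorlib.shared.cache import FutureItem

apply_dict = {"args": [1, FutureItem(file_name="/tmp/upstream.h5out")], "kwargs": {}}
resolved_args = [
    arg if not isinstance(arg, FutureItem) else arg.result()
    for arg in apply_dict["args"]
]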


def backend_write_file(file_name: str, output: Any) -> None:
    """
    Write the output to an HDF5 file.

    Args:
        file_name (str): The name of the HDF5 file.
        output (Any): The output to be written.

    Returns:
        None

    """
    file_name_out = os.path.splitext(file_name)[0]
    os.rename(file_name, file_name_out + ".h5ready")
    dump(file_name=file_name_out + ".h5ready", data_dict={"output": output})
    os.rename(file_name_out + ".h5ready", file_name_out + ".h5out")
Comment on lines +31 to +46

⚠️ Potential issue

Improve robustness of file operations

The current implementation could be more robust in handling edge cases and failures:

  1. Temporary files might be left behind if the operation fails
  2. Existing .h5ready files could cause conflicts
  3. Write permissions aren't verified upfront

Consider this improved implementation:

 def backend_write_file(file_name: str, output: Any) -> None:
-    file_name_out = os.path.splitext(file_name)[0]
-    os.rename(file_name, file_name_out + ".h5ready")
-    dump(file_name=file_name_out + ".h5ready", data_dict={"output": output})
-    os.rename(file_name_out + ".h5ready", file_name_out + ".h5out")
+    file_name_out = os.path.splitext(file_name)[0]
+    temp_file = file_name_out + ".h5ready"
+    output_file = file_name_out + ".h5out"
+    
+    # Check permissions early
+    if not os.access(os.path.dirname(file_name_out), os.W_OK):
+        raise PermissionError(f"No write permission in directory: {os.path.dirname(file_name_out)}")
+    
+    # Clean up any existing temporary files
+    if os.path.exists(temp_file):
+        os.remove(temp_file)
+    
+    try:
+        os.rename(file_name, temp_file)
+        try:
+            dump(file_name=temp_file, data_dict={"output": output})
+            os.rename(temp_file, output_file)
+        except Exception as e:
+            # Restore original file if dump fails
+            os.rename(temp_file, file_name)
+            raise RuntimeError(f"Failed to write output: {str(e)}") from e
+    except Exception as e:
+        raise RuntimeError(f"Failed to process file {file_name}: {str(e)}") from e
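Beyond error handling, it may help to spell out the three-state file handoff that backend_write_file implements. The state semantics below are inferred from the renames, the .h5in extension is assumed, and the polling helper is a hypothetical illustration rather than part of the PR:

# Inferred handoff states:
#   task.h5in    -> submitted, waiting for a worker
#   task.h5ready -> claimed; the output is being written into the file
#   task.h5out   -> complete; the frontend can read the "output" entry
import os

def is_task_done(file_name: str) -> bool:
    # Hypothetical frontend-side check for the completed-output marker.
    return os.path.exists(os.path.splitext(file_name)[0] + ".h5out")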



def backend_execute_task_in_file(file_name: str) -> None:
    """
    Execute the task stored in a given HDF5 file.

    Args:
        file_name (str): The file name of the HDF5 file as an absolute path.

    Returns:
        None
    """
    apply_dict = backend_load_file(file_name=file_name)
    result = apply_dict["fn"].__call__(*apply_dict["args"], **apply_dict["kwargs"])
    backend_write_file(
        file_name=file_name,
        output=result,
    )
Comment on lines +49 to +64

⚠️ Potential issue

Improve function validation and documentation

The implementation needs better validation and error handling:

  1. No validation that 'fn' exists and is callable
  2. No error handling for the function execution
  3. Docstring should document the expected file format

Consider these improvements:

 def backend_execute_task_in_file(file_name: str) -> None:
     """
     Execute the task stored in a given HDF5 file.
 
     Args:
         file_name (str): The file name of the HDF5 file as an absolute path.
 
+    Expected file format:
+        The HDF5 file should contain a dictionary with:
+        - 'fn': A callable object
+        - 'args': List of positional arguments
+        - 'kwargs': Dictionary of keyword arguments
+
     Returns:
         None
+
+    Raises:
+        RuntimeError: If the file format is invalid or execution fails
     """
     apply_dict = backend_load_file(file_name=file_name)
-    result = apply_dict["fn"].__call__(*apply_dict["args"], **apply_dict["kwargs"])
-    backend_write_file(
-        file_name=file_name,
-        output=result,
-    )
+    
+    # Validate function
+    if "fn" not in apply_dict:
+        raise RuntimeError("Missing 'fn' in task file")
+    if not callable(apply_dict["fn"]):
+        raise RuntimeError("The 'fn' object is not callable")
+    
+    try:
+        result = apply_dict["fn"].__call__(*apply_dict["args"], **apply_dict["kwargs"])
+        backend_write_file(
+            file_name=file_name,
+            output=result,
+        )
+    except Exception as e:
+        raise RuntimeError(f"Task execution failed: {str(e)}") from e
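As a complement to the validation suggestions, a hedged end-to-end sketch of what a task file contains and how the backend consumes it. It assumes dump from executorlib.shared.hdf can serialize the callable (plausible given the cloudpickle-based serialization discussed below); the file path and .h5in extension are illustrative:

# Hypothetical round trip: write a task file, then execute it.
from executorlib.shared.hdf import dump
from executorlib.cache.backend import backend_execute_task_in_file

dump(
    file_name="/tmp/task.h5in",
    data_dict={"fn": sum, "args": [[1, 2, 3]], "kwargs": {}},
)
backend_execute_task_in_file(file_name="/tmp/task.h5in")
# backend_write_file renames the file to /tmp/task.h5ready, stores
# {"output": 6}, then renames it to /tmp/task.h5out.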

Comment on lines +1 to +64

💡 Codebase verification

Security Advisory: Critical - Unsafe Deserialization of Arbitrary Functions

The verification confirms and elevates the security concern. The codebase uses cloudpickle to serialize and deserialize arbitrary Python functions from HDF5 files without any validation:

  1. In executorlib/shared/hdf.py, load() deserializes arbitrary functions using cloudpickle.loads() without any security checks
  2. Multiple components execute these functions directly:
    • executorlib/cache/backend.py
    • executorlib/interactive/backend.py
    • executorlib/backend/cache_parallel.py

Critical security risks:

  • Remote Code Execution (RCE) through malicious pickled data
  • No function whitelist or validation
  • No sandboxing of execution
  • Used in parallel execution contexts (MPI)

Immediate recommendations:

  1. Implement function validation before deserialization (a minimal sketch follows this list)
  2. Use a secure serialization format or implement signing
  3. Run untrusted code in a restricted environment
  4. Add input validation for HDF5 files
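
A minimal guard along the lines of recommendation 1, purely illustrative and not part of this PR; the registry contents and function name are hypothetical, and note that a name check applied after cloudpickle.loads() does not remove the deserialization risk itself, so it only complements recommendation 2:

# Hypothetical pre-execution guard: refuse callables that are not registered.
ALLOWED_FUNCTIONS = {"mypackage.steps.run_simulation"}  # illustrative entry

def validate_callable(fn) -> None:
    qualified = f"{fn.__module__}.{fn.__qualname__}"
    if qualified not in ALLOWED_FUNCTIONS:
        raise PermissionError(f"Refusing non-allowlisted function: {qualified}")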
🔗 Analysis chain

Security Advisory: Validate input sources

The code executes arbitrary functions loaded from HDF5 files, which could be a security risk if the files come from untrusted sources. Consider:

  1. Implementing a whitelist of allowed functions
  2. Adding validation of input file sources
  3. Running in a sandboxed environment

Let's check for other instances where HDF5 files are loaded and executed:


Let me search for HDF file operations and function execution patterns using different approaches, since the previous command had issues with file-type recognition.


Let me examine the test files and implementation details to understand if there are any existing security measures or validation patterns.

🏁 Scripts executed

The following scripts were executed for the analysis:

Script:

#!/bin/bash
# Search for HDF5 file operations and function execution
rg -l "load.*\.h5|dump.*\.h5|__call__.*args" --type python

Length of output: 91


Script:

#!/bin/bash
# Search for HDF5 file operations and function execution with ripgrep
rg -l "\.h5|__call__.*args|dump\(|load\("

# Search for imports of HDF functions
rg "from.*hdf.*import"

# Look for function execution patterns
ast-grep --pattern 'fn.__call__($$$)'

Length of output: 733


Script:

#!/bin/bash
# Check how the HDF files are used in the test files to understand validation
rg -A 5 "\.h5" tests/

# Look at the implementation of dump and load functions
cat executorlib/shared/hdf.py

# Check how functions are validated before execution in other files
rg -A 5 "__call__" executorlib/

Length of output: 7293
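To ground the advisory, the core risk is that unpickling attacker-controlled bytes executes code during deserialization, before the task function is ever called. A condensed sketch of the round trip that load() performs internally, using a benign payload:

import cloudpickle

# Benign stand-in for the serialized function stored in the HDF5 file.
payload = cloudpickle.dumps(lambda x: x + 1)
# loads() runs pickle reduce logic; a crafted payload can execute arbitrary
# code at this point, independent of whether fn is later invoked.
fn = cloudpickle.loads(payload)
print(fn(1))  # 2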

executorlib/shared/cache.py (2 additions & 61 deletions)

@@ -4,10 +4,10 @@
 import subprocess
 import sys
 from concurrent.futures import Future
-from typing import Any, Tuple
+from typing import Tuple

 from executorlib.shared.command import get_command_path
-from executorlib.shared.hdf import dump, get_output, load
+from executorlib.shared.hdf import dump, get_output
 from executorlib.shared.serialize import serialize_funct_h5

@@ -47,47 +47,6 @@ def done(self) -> bool:
         return get_output(file_name=self._file_name)[0]


-def backend_load_file(file_name: str) -> dict:
-    """
-    Load the data from an HDF5 file and convert FutureItem objects to their results.
-
-    Args:
-        file_name (str): The name of the HDF5 file.
-
-    Returns:
-        dict: The loaded data from the file.
-
-    """
-    apply_dict = load(file_name=file_name)
-    apply_dict["args"] = [
-        arg if not isinstance(arg, FutureItem) else arg.result()
-        for arg in apply_dict["args"]
-    ]
-    apply_dict["kwargs"] = {
-        key: arg if not isinstance(arg, FutureItem) else arg.result()
-        for key, arg in apply_dict["kwargs"].items()
-    }
-    return apply_dict
-
-
-def backend_write_file(file_name: str, output: Any) -> None:
-    """
-    Write the output to an HDF5 file.
-
-    Args:
-        file_name (str): The name of the HDF5 file.
-        output (Any): The output to be written.
-
-    Returns:
-        None
-
-    """
-    file_name_out = os.path.splitext(file_name)[0]
-    os.rename(file_name, file_name_out + ".h5ready")
-    dump(file_name=file_name_out + ".h5ready", data_dict={"output": output})
-    os.rename(file_name_out + ".h5ready", file_name_out + ".h5out")
-
-
 def execute_in_subprocess(
     command: list, task_dependent_lst: list = []
 ) -> subprocess.Popen:

@@ -180,24 +139,6 @@ def execute_tasks_h5(
     }


-def execute_task_in_file(file_name: str) -> None:
-    """
-    Execute the task stored in a given HDF5 file.
-
-    Args:
-        file_name (str): The file name of the HDF5 file as an absolute path.
-
-    Returns:
-        None
-    """
-    apply_dict = backend_load_file(file_name=file_name)
-    result = apply_dict["fn"].__call__(*apply_dict["args"], **apply_dict["kwargs"])
-    backend_write_file(
-        file_name=file_name,
-        output=result,
-    )
-
-
 def _get_execute_command(file_name: str, cores: int = 1) -> list:
     """
     Get command to call backend as a list of two strings
tests/test_cache_shared.py (1 addition & 1 deletion)

@@ -6,10 +6,10 @@
 try:
     from executorlib.shared.cache import (
-        FutureItem,
         execute_task_in_file,
         _check_task_output,
     )
+    from executorlib.cache.backend import FutureItem
     from executorlib.shared.hdf import dump
Comment on lines 7 to 13

💡 Codebase verification

Update imports to use backend functions

The verification reveals that:

  • execute_task_in_file has been moved to backend as backend_execute_task_in_file
  • _check_task_output is still in shared.cache and is used internally by the shared cache implementation
  • The test file is the only place still using the old execute_task_in_file import

You should:

  • Update the test to import backend_execute_task_in_file from executorlib.cache.backend instead of execute_task_in_file from shared (a sketch follows this list)
  • Keep the _check_task_output import as is since it's correctly located in shared.cache
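
A hedged sketch of what the updated test imports could look like after both bullets are applied; the skip flag and the exact grouping are guesses at the test file's conventions:

try:
    from executorlib.cache.backend import (
        FutureItem,
        backend_execute_task_in_file,
    )
    from executorlib.shared.cache import _check_task_output
    from executorlib.shared.hdf import dump

    skip_h5py_test = False
except ImportError:
    skip_h5py_test = True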
🔗 Analysis chain

Consider migrating remaining shared.cache imports.

The import change for FutureItem aligns with the cache splitting objective. However, other functions like execute_task_in_file and _check_task_output are still imported from shared.cache. Consider if these should also be moved to the backend module for consistency.

Let's verify the current location of these functions:


Let me gather more information about the function locations and their implementations:


Let me check one more thing to understand the complete picture:

🏁 Scripts executed

The following scripts were executed for the analysis:

Script:

#!/bin/bash
# Description: Check if execute_task_in_file and _check_task_output are used elsewhere
# and if they should be moved to backend

# Search for usage of these functions
echo "Searching for execute_task_in_file usage:"
rg "execute_task_in_file"

echo -e "\nSearching for _check_task_output usage:"
rg "_check_task_output"

# Check if these functions are defined in both shared and backend
echo -e "\nChecking function definitions:"
ast-grep --pattern 'def execute_task_in_file'
ast-grep --pattern 'def _check_task_output'

Length of output: 1319


Script:

#!/bin/bash
# Check the implementation of execute_task_in_file in shared.cache
echo "Checking execute_task_in_file in shared.cache:"
rg -A 10 "def execute_task_in_file" executorlib/shared/cache.py

# Check the implementation in backend
echo -e "\nChecking backend_execute_task_in_file in backend:"
rg -A 10 "def backend_execute_task_in_file" executorlib/cache/backend.py

# Check if there are any other references to these functions in imports
echo -e "\nChecking imports:"
rg "from executorlib.shared.cache import.*execute_task_in_file"
rg "from executorlib.cache.backend import.*execute_task_in_file"

Length of output: 940


Script:

#!/bin/bash
# Check the content of shared.cache to understand the relationship between functions
echo "Checking shared.cache content:"
cat executorlib/shared/cache.py

# Also check if there are any direct references to these functions
echo -e "\nChecking direct references to execute_task_in_file:"
rg "\bexecute_task_in_file\b" --type py

Length of output: 8330

     from executorlib.shared.serialize import serialize_funct_h5