hydraflow.core.io

[docs] module hydraflow.core.io
"""Provide utility functions for HydraFlow."""from __future__ importannotationsimport fnmatchimport urllib.parseimport urllib.requestfrom functools importcachefrom pathlib importPathfrom typing importTYPE_CHECKINGfrom omegaconf importOmegaConfifTYPE_CHECKING:from collections.abc importCallable,Iteratorfrom mlflow.entities importRundef file_uri_to_path(uri:str)->Path:[docs]
    """Convert a file URI to a local path."""ifnoturi.startswith("file:"):returnPath(uri)path=urllib.parse.urlparse(uri).pathreturnPath(urllib.request.url2pathname(path))# for Windowsdef get_artifact_dir(run:Run)->Path:[docs]
    """Retrieve the artifact directory for the given run.    This function uses MLflow to get the artifact directory for the given run.    Args:        run (Run | None): The run instance. Defaults to None.    Returns:        The local path to the directory where the artifacts are downloaded.    """uri=run.info.artifact_uriifnotisinstance(uri,str):raiseNotImplementedErrorreturnfile_uri_to_path(uri)def log_text(run:Run,from_dir:Path,pattern:str="*.log")->None:[docs]
    """Log text files in the given directory as artifacts.    Append the text files to the existing text file in the artifact directory.    Args:        run (Run): The run instance.        from_dir (Path): The directory to find the logs in.        pattern (str): The pattern to match the logs.    """import mlflowartifact_dir=get_artifact_dir(run)forfileinfrom_dir.glob(pattern):ifnotfile.is_file():continuefile_artifact=artifact_dir/file.nameiffile_artifact.exists():text=file_artifact.read_text()ifnottext.endswith("\n"):text+="\n"else:text=""text+=file.read_text()mlflow.log_text(text,file.name)@cachedef get_experiment_name(experiment_dir:Path)->str:[docs]
    """Get the job name from an experiment directory.    Extracts the job name from the meta.yaml file. Returns an empty string    if the file does not exist or if the job name cannot be found.    Args:        experiment_dir: Path to the experiment directory containing the meta.yaml file    Returns:        The job name as a string, or an empty string if the file does not exist    """path=experiment_dir/"meta.yaml"ifnotpath.exists():return""meta=OmegaConf.load(experiment_dir/"meta.yaml")returnOmegaConf.select(meta,"name",default="")def predicate_experiment_dir([docs]
experiment_dir:Path,experiment_names:list[str]|Callable[[str],bool]|None=None,)->bool:    """Predicate an experiment directory based on the path and experiment names."""ifnotexperiment_dir.is_dir()orexperiment_dir.namein[".trash","0"]:returnFalsename=get_experiment_name(experiment_dir)ifnotname:returnFalseifexperiment_namesisNone:returnTrueifisinstance(experiment_names,list):returnany(fnmatch.fnmatch(name,e)foreinexperiment_names)returnexperiment_names(name)def get_experiment_names(tracking_dir:str|Path)->list[str]:[docs]
    """Get the experiment names from the tracking directory.    Returns:        list[str]: A list of experiment names sorted by the name.    """names=[get_experiment_name(path)forpathinPath(tracking_dir).iterdir()]returnsorted(namefornameinnamesifnameandname!="Default")def iter_experiment_dirs([docs]
tracking_dir:str|Path,experiment_names:str|list[str]|Callable[[str],bool]|None=None,)->Iterator[Path]:    """Iterate over the experiment directories in the tracking directory."""ifisinstance(experiment_names,str):experiment_names=[experiment_names]forpathinPath(tracking_dir).iterdir():ifpredicate_experiment_dir(path,experiment_names):yieldpathdef iter_run_dirs([docs]
tracking_dir:str|Path,experiment_names:str|list[str]|Callable[[str],bool]|None=None,)->Iterator[Path]:    """Iterate over the run directories in the tracking directory."""forexperiment_diriniter_experiment_dirs(tracking_dir,experiment_names):forpathinexperiment_dir.iterdir():ifpath.is_dir()and(path/"artifacts").exists():yieldpathdef iter_artifacts_dirs([docs]
tracking_dir:str|Path,experiment_names:str|list[str]|Callable[[str],bool]|None=None,)->Iterator[Path]:    """Iterate over the artifacts directories in the tracking directory."""forpathiniter_run_dirs(tracking_dir,experiment_names):yieldpath/"artifacts"def iter_artifact_paths([docs]
tracking_dir:str|Path,artifact_path:str|Path,experiment_names:str|list[str]|Callable[[str],bool]|None=None,)->Iterator[Path]:    """Iterate over the artifact paths in the tracking directory."""forpathiniter_artifacts_dirs(tracking_dir,experiment_names):yieldpath/artifact_path