Add frozen_runs_analysis/src/frozen_runs_analysis/cli.py
This commit is contained in:
parent
c67cc23016
commit
0bb836f087
1 changed files with 76 additions and 0 deletions
76
frozen_runs_analysis/src/frozen_runs_analysis/cli.py
Normal file
76
frozen_runs_analysis/src/frozen_runs_analysis/cli.py
Normal file
|
|
@ -0,0 +1,76 @@
|
||||||
|
import argparse
|
||||||
|
import json
|
||||||
|
import logging
|
||||||
|
from pathlib import Path
|
||||||
|
from typing import Any, List
|
||||||
|
|
||||||
|
import pandas as pd
|
||||||
|
|
||||||
|
from frozen_runs_analysis import core
|
||||||
|
|
||||||
|
def _setup_logging() -> None:
|
||||||
|
"""Initializes logging with INFO level for CLI execution."""
|
||||||
|
logging.basicConfig(
|
||||||
|
level=logging.INFO,
|
||||||
|
format='[%(asctime)s] %(levelname)s - %(message)s',
|
||||||
|
)
|
||||||
|
|
||||||
|
|
||||||
|
def _load_json_data(file_path: Path) -> List[dict]:
|
||||||
|
"""Loads and validates JSON data file expected to contain a list of RunData objects."""
|
||||||
|
if not file_path.exists() or not file_path.is_file():
|
||||||
|
raise FileNotFoundError(f"Input file not found: {file_path}")
|
||||||
|
|
||||||
|
with file_path.open('r', encoding='utf-8') as f:
|
||||||
|
data = json.load(f)
|
||||||
|
|
||||||
|
if not isinstance(data, list):
|
||||||
|
raise ValueError("Expected top-level JSON array for frozen run data.")
|
||||||
|
|
||||||
|
for idx, item in enumerate(data):
|
||||||
|
if not isinstance(item, dict):
|
||||||
|
raise ValueError(f"Item #{idx} in data is not a JSON object.")
|
||||||
|
for field in ('run_id', 'status', 'sanity_checks', 'config_hash'):
|
||||||
|
if field not in item:
|
||||||
|
raise ValueError(f"Missing required field '{field}' in item #{idx}: {item}")
|
||||||
|
|
||||||
|
return data
|
||||||
|
|
||||||
|
|
||||||
|
def _write_json_output(data: dict, output_path: Path) -> None:
|
||||||
|
"""Writes output JSON report to the given file path."""
|
||||||
|
output_path.parent.mkdir(parents=True, exist_ok=True)
|
||||||
|
with output_path.open('w', encoding='utf-8') as f:
|
||||||
|
json.dump(data, f, indent=2, ensure_ascii=False)
|
||||||
|
logging.info(f"Analysis report written to {output_path}")
|
||||||
|
|
||||||
|
|
||||||
|
def main() -> None:
|
||||||
|
"""CLI entrypoint for frozen runs analysis."""
|
||||||
|
parser = argparse.ArgumentParser(description='Analyse frozen run datasets from Gate v0.')
|
||||||
|
parser.add_argument('--input', required=True, help='Path to the input JSON data file containing frozen runs.')
|
||||||
|
parser.add_argument('--output', required=False, help='Path to output JSON file where results will be saved.')
|
||||||
|
|
||||||
|
args = parser.parse_args()
|
||||||
|
|
||||||
|
_setup_logging()
|
||||||
|
|
||||||
|
input_path = Path(args.input).expanduser().resolve()
|
||||||
|
output_path = Path(args.output).expanduser().resolve() if args.output else Path('output/frozen_runs_analysis.json').resolve()
|
||||||
|
|
||||||
|
logging.info(f"Loading data from {input_path}")
|
||||||
|
data = _load_json_data(input_path)
|
||||||
|
|
||||||
|
logging.info("Running analysis on frozen runs data ...")
|
||||||
|
try:
|
||||||
|
result: dict[str, Any] = core.analyse_frozen_runs(data)
|
||||||
|
except Exception as e:
|
||||||
|
logging.exception("Error running analysis: %s", e)
|
||||||
|
raise
|
||||||
|
|
||||||
|
logging.info("Analysis complete. Saving results ...")
|
||||||
|
_write_json_output(result, output_path)
|
||||||
|
|
||||||
|
|
||||||
|
if __name__ == '__main__':
|
||||||
|
main()
|
||||||
Loading…
Reference in a new issue