From 7e9983a0f0e46bc146a945cae6af87c323ccde47 Mon Sep 17 00:00:00 2001 From: Orion Eiger Date: Mon, 4 Dec 2023 11:30:28 -0800 Subject: [PATCH 1/2] Print table of produced and missing datasets to the command-line --- python/lsst/ctrl/mpexec/cli/cmd/commands.py | 6 ++--- python/lsst/ctrl/mpexec/cli/script/report.py | 23 ++++++++++++++++++-- 2 files changed, 23 insertions(+), 6 deletions(-) diff --git a/python/lsst/ctrl/mpexec/cli/cmd/commands.py b/python/lsst/ctrl/mpexec/cli/cmd/commands.py index 279352f1..75547294 100644 --- a/python/lsst/ctrl/mpexec/cli/cmd/commands.py +++ b/python/lsst/ctrl/mpexec/cli/cmd/commands.py @@ -329,16 +329,14 @@ def update_graph_run( @click.command(cls=PipetaskCommand) @repo_argument() @ctrlMpExecOpts.qgraph_argument() -@click.argument("output_yaml", type=click.Path(exists=False)) +@click.option("--output-yaml", default='', help="Summarize report in a yaml file (pass its name here).") @click.option("--logs/--no-logs", default=True, help="Get butler log datasets for extra information.") -def report(repo: str, qgraph: str, output_yaml: str, logs: bool = True) -> None: +def report(repo: str, qgraph: str, output_yaml: str='', logs: bool = True) -> None: """Write a yaml file summarizing the produced and missing expected datasets in a quantum graph. REPO is the location of the butler/registry config file. QGRAPH is the URL to a serialized Quantum Graph file. - - OUTPUT_YAML is the URL to store the summary report. 
""" script.report(repo, qgraph, output_yaml, logs) diff --git a/python/lsst/ctrl/mpexec/cli/script/report.py b/python/lsst/ctrl/mpexec/cli/script/report.py index c8528c66..b8f9f962 100644 --- a/python/lsst/ctrl/mpexec/cli/script/report.py +++ b/python/lsst/ctrl/mpexec/cli/script/report.py @@ -28,9 +28,10 @@ from lsst.daf.butler import Butler from lsst.pipe.base import QuantumGraph from lsst.pipe.base.execution_reports import QuantumGraphExecutionReport +from astropy.table import Table -def report(butler_config: str, qgraph_uri: str, output_yaml: str, logs: bool = True) -> None: +def report(butler_config: str, qgraph_uri: str, output_yaml: str | None, logs: bool = True) -> None: """Write a yaml file summarizing the produced and missing expected datasets in a quantum graph. @@ -54,4 +55,22 @@ def report(butler_config: str, qgraph_uri: str, output_yaml: str, logs: bool = T butler = Butler.from_config(butler_config, writeable=False) qgraph = QuantumGraph.loadUri(qgraph_uri) report = QuantumGraphExecutionReport.make_reports(butler, qgraph) - report.write_summary_yaml(butler, output_yaml, do_store_logs=logs) + if not output_yaml: + # this is the option to print to the command-line + summary_dict = report.to_summary_dict(butler, logs, human_readable=True) + quanta = Table() + datasets = Table() + dataset_table_rows = [] + data_products = [] + for task in summary_dict.keys(): + for data_product in summary_dict[task]["outputs"]: + print(summary_dict[task]["outputs"][data_product]) + dataset_table_rows.append(summary_dict[task]["outputs"][data_product]) + data_products.append(data_product) + datasets = Table(dataset_table_rows) + datasets.add_column(data_products, index=0, name="DatasetType") + print(datasets) + # something about failed quanta outside the smaller loop + #print(Table(summary_dict[task]["outputs"])) + else: + report.write_summary_yaml(butler, output_yaml, do_store_logs=logs) From 39d2baaf7980ffb7b1ca145e75d7ab2ea8f8297e Mon Sep 17 00:00:00 2001 From: Orion 
Eiger Date: Mon, 4 Dec 2023 11:46:10 -0800 Subject: [PATCH 2/2] Print table of failed and blocked quanta per task to the command-line --- doc/changes/DM-41606.feature.md | 7 ++ python/lsst/ctrl/mpexec/cli/cmd/commands.py | 9 ++- python/lsst/ctrl/mpexec/cli/script/report.py | 85 ++++++++++++++------ tests/test_cliCmdReport.py | 22 ++++- types.txt | 1 + 5 files changed, 92 insertions(+), 32 deletions(-) create mode 100644 doc/changes/DM-41606.feature.md create mode 100644 types.txt diff --git a/doc/changes/DM-41606.feature.md b/doc/changes/DM-41606.feature.md new file mode 100644 index 00000000..d1b1b9f8 --- /dev/null +++ b/doc/changes/DM-41606.feature.md @@ -0,0 +1,7 @@ +Add an option to print `pipetask report` information to the command-line using +astropy tables, and make it the default. +Unpack a more human-readable dictionary from +`lsst.pipe.base.QuantumGraphExecutionReport.to_summary_dict` and print summary +tables of quanta and datasets to the command-line. Save error messages and +associated data ids to a yaml file in the working directory, or optionally print +them to the screen instead. 
diff --git a/python/lsst/ctrl/mpexec/cli/cmd/commands.py b/python/lsst/ctrl/mpexec/cli/cmd/commands.py index 75547294..ac85511b 100644 --- a/python/lsst/ctrl/mpexec/cli/cmd/commands.py +++ b/python/lsst/ctrl/mpexec/cli/cmd/commands.py @@ -329,9 +329,12 @@ def update_graph_run( @click.command(cls=PipetaskCommand) @repo_argument() @ctrlMpExecOpts.qgraph_argument() -@click.option("--output-yaml", default='', help="Summarize report in a yaml file (pass its name here).") +@click.option("--full-output-filename", default="", help="Summarize report in a yaml file") @click.option("--logs/--no-logs", default=True, help="Get butler log datasets for extra information.") -def report(repo: str, qgraph: str, output_yaml: str='', logs: bool = True) -> None: +@click.option("--show-errors", default=False, help="Pretty-print a dict of errors from failed quanta.") +def report( + repo: str, qgraph: str, full_output_filename: str = "", logs: bool = True, show_errors: bool = False +) -> None: """Write a yaml file summarizing the produced and missing expected datasets in a quantum graph. @@ -339,4 +342,4 @@ def report(repo: str, qgraph: str, output_yaml: str='', logs: bool = True) -> No QGRAPH is the URL to a serialized Quantum Graph file. """ - script.report(repo, qgraph, output_yaml, logs) + script.report(repo, qgraph, full_output_filename, logs) diff --git a/python/lsst/ctrl/mpexec/cli/script/report.py b/python/lsst/ctrl/mpexec/cli/script/report.py index b8f9f962..913c52f8 100644 --- a/python/lsst/ctrl/mpexec/cli/script/report.py +++ b/python/lsst/ctrl/mpexec/cli/script/report.py @@ -24,53 +24,86 @@ # # You should have received a copy of the GNU General Public License # along with this program. If not, see . 
+import pprint +import yaml +from astropy.table import Table from lsst.daf.butler import Butler from lsst.pipe.base import QuantumGraph from lsst.pipe.base.execution_reports import QuantumGraphExecutionReport -from astropy.table import Table -def report(butler_config: str, qgraph_uri: str, output_yaml: str | None, logs: bool = True) -> None: - """Write a yaml file summarizing the produced and missing expected datasets - in a quantum graph. +def report( + butler_config: str, + qgraph_uri: str, + full_output_filename: str | None, + logs: bool = True, + show_errors: bool = False, +) -> None: + """Summarize the produced and missing expected dataset in a quantum graph. Parameters ---------- - butler_config : `str` - The Butler used for this report. This should match the Butler used - for the run associated with the executed quantum graph. - qgraph_uri : `str` - The uri of the location of said quantum graph. - output_yaml : `str` - The name to be used for the summary yaml file. - logs : `bool` - Get butler log datasets for extra information. - - See Also - -------- - lsst.pipe.base.QuantumGraphExecutionReport.make_reports : Making reports. - lsst.pipe.base.QuantumGraphExecutionReport.write_summary_yaml : Summaries. + butler_config : `str` + The Butler used for this report. This should match the Butler used + for the run associated with the executed quantum graph. + qgraph_uri : `str` + The uri of the location of said quantum graph. + full_output_filename : `str` + Output the full summary report to a yaml file (named herein). + Each data id and error message is keyed to a quantum graph node id. + A convenient output format for error-matching and cataloguing tools + such as the ones in the Campaign Management database. If this is + not included, quanta and dataset information will be printed to the + command-line instead. + logs : `bool` + Get butler log datasets for extra information (error messages). 
+ show_errors : `bool` + If no output yaml is provided, print error messages to the + command-line along with the report. By default, these messages and + their associated data ids are stored in a yaml file with format + `{run timestamp}_err.yaml` in the working directory instead. """ butler = Butler.from_config(butler_config, writeable=False) qgraph = QuantumGraph.loadUri(qgraph_uri) report = QuantumGraphExecutionReport.make_reports(butler, qgraph) - if not output_yaml: + if not full_output_filename: # this is the option to print to the command-line summary_dict = report.to_summary_dict(butler, logs, human_readable=True) - quanta = Table() - datasets = Table() dataset_table_rows = [] data_products = [] + quanta_summary = [] + error_summary = [] for task in summary_dict.keys(): for data_product in summary_dict[task]["outputs"]: - print(summary_dict[task]["outputs"][data_product]) dataset_table_rows.append(summary_dict[task]["outputs"][data_product]) data_products.append(data_product) + + quanta_summary.append( + { + "Task": task, + "Failed Quanta": summary_dict[task]["failed_quanta"], + "Blocked Quanta": summary_dict[task]["n_quanta_blocked"], + } + ) + + if "errors" in summary_dict[task].keys(): + error_summary.append({task: summary_dict[task]["errors"]}) + quanta = Table(quanta_summary) datasets = Table(dataset_table_rows) datasets.add_column(data_products, index=0, name="DatasetType") - print(datasets) - # something about failed quanta outside the smaller loop - #print(Table(summary_dict[task]["outputs"])) + quanta.pprint_all() + print("\n") + if show_errors: + pprint.pprint(error_summary) + print("\n") + else: + assert qgraph.metadata is not None, "Saved QGs always have metadata." 
+ collection = qgraph.metadata["output_run"] + collection = str(collection) + run_name = collection.split("/")[-1] + with open(f"{run_name}_err.yaml", "w") as stream: + yaml.safe_dump(error_summary, stream) + datasets.pprint_all() else: - report.write_summary_yaml(butler, output_yaml, do_store_logs=logs) + report.write_summary_yaml(butler, full_output_filename, do_store_logs=logs) diff --git a/tests/test_cliCmdReport.py b/tests/test_cliCmdReport.py index ab26dd21..be59426e 100644 --- a/tests/test_cliCmdReport.py +++ b/tests/test_cliCmdReport.py @@ -53,7 +53,7 @@ def tearDown(self) -> None: def test_report(self): """Test for making a report on the produced and missing expected - datasets in a quantum graph. in a graph. + datasets in a quantum graph. """ metadata = {"output_run": "run"} butler, qgraph = makeSimpleQGraph( @@ -71,10 +71,9 @@ def test_report(self): result = self.runner.invoke( pipetask_cli, - ["report", self.root, graph_uri, test_filename, "--no-logs"], + ["report", self.root, graph_uri, "--full-output-filename", test_filename, "--no-logs"], input="no", ) - # Check that we can read from the command line self.assertEqual(result.exit_code, 0, clickResultMsg(result)) @@ -84,6 +83,23 @@ def test_report(self): self.assertIsNotNone(report_output_dict["task0"]) self.assertIsNotNone(report_output_dict["task0"]["failed_quanta"]) + result_hr = self.runner.invoke( + pipetask_cli, + ["report", self.root, graph_uri, "--no-logs"], + input="no", + ) + + # Check that we can read from the command line + self.assertEqual(result_hr.exit_code, 0, clickResultMsg(result_hr)) + + # Check that we get string output + self.assertIsInstance(result_hr.stdout, str) + + # Check that task0 and the failed quanta for task0 exist in the string + self.assertIn("task0", result_hr.stdout) + self.assertIn("Failed Quanta", result_hr.stdout) + self.assertIn("{'data_id': {'instrument': 'INSTR', 'detector': 0}}", result_hr.stdout) + if __name__ == "__main__": unittest.main() diff --git 
a/types.txt b/types.txt new file mode 100644 index 00000000..1bb6d20b --- /dev/null +++ b/types.txt @@ -0,0 +1 @@ +types-PyYAML