Skip to content

Commit

Permalink
Coalesce data ID query explanation into a single log.
Browse files Browse the repository at this point in the history
Logging a single statement as multiple logs causes problems with Loki,
because each line may be rearranged or independently filtered. Logging
a single multiline message fixes this problem, without changing
behavior for console users.

Constructing the multiline message makes it impossible to defer string
evaluation, but for an error-level log this is unlikely to come up
in practice.
  • Loading branch information
kfindeisen committed Aug 27, 2024
1 parent 1935541 commit 5c974ed
Show file tree
Hide file tree
Showing 2 changed files with 31 additions and 21 deletions.
1 change: 1 addition & 0 deletions doc/changes/DM-45722.bugfix.md
Original file line number Diff line number Diff line change
@@ -0,0 +1 @@
Explanatory logs for "initial data ID query returned no rows" now appear as a single entry in Loki/JSON instead of being split on line breaks. There is no change to console behavior.
51 changes: 30 additions & 21 deletions python/lsst/pipe/base/all_dimensions_quantum_graph_builder.py
Original file line number Diff line number Diff line change
Expand Up @@ -36,6 +36,7 @@
import dataclasses
from collections.abc import Iterator, Mapping
from contextlib import contextmanager
from io import StringIO
from typing import TYPE_CHECKING, Any, final

from lsst.daf.butler.registry import MissingDatasetTypeError
Expand Down Expand Up @@ -507,31 +508,39 @@ def from_builder(
yield result

def log_failure(self, log: "LsstLogAdapter") -> None:
    """Emit an ERROR-level log message that attempts to explain
    why the initial data ID query returned no rows.

    Parameters
    ----------
    log : `logging.Logger`
        The logger to use to emit log messages.

    Notes
    -----
    The explanation is emitted as one multiline message rather than as a
    series of separate log records, so that log aggregators cannot
    reorder or independently filter the individual lines. Building the
    message eagerly gives up deferred string formatting.

    If an exception is raised while the explanation is being assembled,
    whatever was collected up to that point is still logged before the
    exception propagates.
    """
    # A single multiline log plays better with log aggregators like Loki.
    lines = ["Initial data ID query returned no rows, so QuantumGraph will be empty."]
    try:
        # Append one message at a time so that a failure part-way through
        # the explanation still leaves the earlier messages in ``lines``.
        for message in self.common_data_ids.explain_no_results():
            lines.append(message)
        lines.append(
            "To reproduce this query for debugging purposes, run "
            "Registry.queryDataIds with these arguments:"
        )
        # We could just repr() the queryArgs dict to get something
        # the user could make sense of, but it's friendlier to
        # put these args in an easier-to-reconstruct equivalent form
        # so they can read it more easily and copy and paste into
        # a Python terminal.
        lines.append(f" dimensions={list(self.query_args['dimensions'].names)},")
        lines.append(f" dataId={dict(self.query_args['dataId'].required)},")
        if self.query_args["where"]:
            lines.append(f" where={self.query_args['where']!r},")
        if "datasets" in self.query_args:
            lines.append(f" datasets={list(self.query_args['datasets'])},")
        if "collections" in self.query_args:
            lines.append(f" collections={list(self.query_args['collections'])},")
    finally:
        # If an exception was raised, write a partial.
        # Joining (rather than terminating each line) keeps every argument
        # on its own line without leaving a dangling trailing newline.
        log.error("\n".join(lines))

0 comments on commit 5c974ed

Please sign in to comment.