Skip to content

Commit

Permalink
Optimize JSON decoding for sessions
Browse files Browse the repository at this point in the history
  • Loading branch information
vkarak committed Dec 11, 2024
1 parent ada1dfc commit cf2a106
Showing 1 changed file with 25 additions and 12 deletions.
37 changes: 25 additions & 12 deletions reframe/frontend/reporting/storage.py
Original file line number Diff line number Diff line change
Expand Up @@ -233,26 +233,39 @@ def _decode_sessions(self, results, sess_filter):
Return a map of session uuids to decoded session data
'''
# Locate the start of the ``session_info`` value only. The extent of the
# value is determined by the JSON parser below and not by the regex: a
# non-greedy ``\{.*?\}`` stops at the first ``}`` and would truncate any
# session info holding a nested object or a ``}`` inside a string value.
# ``\s*`` also accepts compactly serialized JSON (no space after the colon).
sess_info_patt = re.compile(r'\"session_info\":\s*')
sess_info_decoder = json.JSONDecoder()

def _extract_sess_info(s):
    '''Return the raw JSON text of the ``session_info`` value found in ``s``.

    :arg s: A serialized JSON report as a string.
    :returns: The substring of ``s`` that holds the value of the first
        ``"session_info"`` key, left undecoded so that it can be joined
        with other objects and decoded in bulk.
    :raises ValueError: If ``s`` contains no ``"session_info"`` key or if
        the text following the key is not a valid JSON value.
    '''
    match = sess_info_patt.search(s)
    if match is None:
        raise ValueError('no session_info found in report')

    start = match.end()

    # raw_decode() parses exactly one JSON value starting at `start` and
    # reports the index right after it; only the boundaries are needed here
    _, end = sess_info_decoder.raw_decode(s, start)
    return s[start:end]

@time_function
def _mass_json_decode(json_objs):
    '''Decode several serialized JSON objects with a single parser call.

    :arg json_objs: An iterable of strings, each one a serialized JSON
        value.
    :returns: A list with the decoded values, in iteration order.
    '''
    # Wrap the comma-separated objects in brackets to form one JSON array
    data = '[%s]' % ','.join(json_objs)
    getlogger().debug(f'decoding {len(data)} bytes')
    return json.loads(data)

session_infos = {}
sessions = {}
for uuid, json_blob in results:
sessions.setdefault(uuid, json_blob)
session_infos.setdefault(uuid, _extract_sess_info(json_blob))

# Join all sessions and decode them at once
reports_blob = '[' + ','.join(sessions.values()) + ']'
getprofiler().enter_region('json decode')
reports = json.loads(reports_blob)
getprofiler().exit_region()

# Reindex and filter sessions based on their decoded data
sessions.clear()
for rpt in reports:
# Find the UUIDs to decode fully by inspecting only the session info
uuids = []
for info in _mass_json_decode(session_infos.values()):
try:
if self._db_filter_json(sess_filter, rpt['session_info']):
sessions[rpt['session_info']['uuid']] = rpt
if self._db_filter_json(sess_filter, info):
uuids.append(info['uuid'])
except Exception:
continue

return sessions
# Decode selected sessions
reports = _mass_json_decode(sessions[uuid] for uuid in uuids)

# Return only the selected sessions
return {rpt['session_info']['uuid']: rpt for rpt in reports}

@time_function
def _fetch_testcases_raw(self, condition):
Expand Down

0 comments on commit cf2a106

Please sign in to comment.