Skip to content

Commit

Permalink
parquet cli
Browse files (browse the repository at this point in the history)
  • Loading branch information
lchen-2101 committed Nov 13, 2024
1 parent 74fdb2b commit d98333f
Showing 1 changed file with 1 addition and 2 deletions.
3 changes: 1 addition & 2 deletions src/regtech_data_validator/cli.py
Original file line number | Diff line number | Diff line change
Expand Up @@ -98,8 +98,7 @@ def validate(
final_phase = validation_results.phase
all_findings.append(validation_results)
elif filetype == FileType.PARQUET:
lf = pl.scan_parquet(path, allow_missing_columns=True)
# lf = pl.scan_csv(path, infer_schema=False, missing_utf8_is_empty_string=True)
lf = pl.scan_parquet(path)
for validation_results in validate_lazy_frame(lf, context_dict, batch_size=50000, batch_count=1):
total_findings += validation_results.error_counts.total_count + validation_results.warning_counts.total_count
final_phase = validation_results.phase
Expand Down

0 comments on commit d98333f

Please sign in to comment.