Skip to content

Commit

Permalink
#5592: Update 2k prefill threshold
Browse files Browse the repository at this point in the history
  • Loading branch information
s-jovic committed May 17, 2024
1 parent fa3f319 commit c613ad6
Showing 1 changed file with 2 additions and 2 deletions.
4 changes: 2 additions & 2 deletions models/demos/falcon7b/tests/test_perf_falcon.py
Original file line number Diff line number Diff line change
Expand Up @@ -511,7 +511,7 @@ def run_perf_wh_bare_metal(
(
("prefill", 32, 1, 128, 0, "BFLOAT16-DRAM", 0.97, 0.99, 0.96, 0.1),
("prefill", 32, 1, 1024, 0, "BFLOAT16-DRAM", 0.98, 0.99, 0.96, 1),
- ("prefill", 32, 1, 2048, 0, "BFLOAT16-DRAM", 0.98, 0.99, 0.96, 1),
+ ("prefill", 32, 1, 2048, 0, "BFLOAT16-DRAM", 0.98, 0.99, 0.96, 2),
("decode", 32, 32, 1, 128, "BFLOAT16-DRAM", 0.91, 0.92, 0.93, 0.15),
("decode", 32, 32, 1, 128, "BFLOAT16-L1", 0.91, 0.92, 0.93, 0.15),
("decode", 32, 32, 1, 128, "BFLOAT16-L1_SHARDED", 0.92, 0.95, 0.95, 0.1),
Expand Down Expand Up @@ -558,7 +558,7 @@ def test_perf_wh_bare_metal(
async_mode,
):
if async_mode:
- if llm_mode == "prefill" and seq_len != 128:
+ if llm_mode == "prefill" and seq_len != 1024:
pytest.skip(
f"Skipping {llm_mode} with {seq_len} in async mode. Config is supported but provides redundant testing."
)
Expand Down

0 comments on commit c613ad6

Please sign in to comment.