Skip to content

Commit

Permalink
#12330: Removed the deprecated flash decode gqa op as its functionality is covered in the generic flash decode op
Browse files Browse the repository at this point in the history
  • Loading branch information
caixunshiren committed Oct 22, 2024
1 parent 044a345 commit a7ba1ad
Show file tree
Hide file tree
Showing 10 changed files with 1 addition and 821 deletions.
4 changes: 1 addition & 3 deletions models/demos/llama3/tt/llama_attention.py
Original file line number Diff line number Diff line change
Expand Up @@ -279,19 +279,17 @@ def forward_decode(
values,
cur_pos_tensor=current_pos,
page_table_tensor=page_table,
transpose_q=False,
scale=self.scale,
program_config=self.model_config["SDPA_DECODE_PROGCFG"],
compute_kernel_config=self.model_config["SDPA_DECODE_COMPUTE_PROGCFG"],
memory_config=ttnn.DRAM_MEMORY_CONFIG,
)
else:
attn_output_1G4D = ttnn.transformer.scaled_dot_product_attention_decode_gqa(
attn_output_1G4D = ttnn.transformer.scaled_dot_product_attention_decode(
q_heads_1BQD,
keys,
values,
cur_pos_tensor=current_pos,
transpose_q=False,
scale=self.scale,
program_config=self.model_config["SDPA_DECODE_PROGCFG"],
compute_kernel_config=self.model_config["SDPA_DECODE_COMPUTE_PROGCFG"],
Expand Down

This file was deleted.

3 changes: 0 additions & 3 deletions ttnn/CMakeLists.txt
Original file line number Diff line number Diff line change
Expand Up @@ -348,9 +348,6 @@ set(ALL_TTNN_SRCS
${CMAKE_CURRENT_SOURCE_DIR}/cpp/ttnn/operations/transformer/sdpa_decode/sdpa_decode_pybind.cpp
${CMAKE_CURRENT_SOURCE_DIR}/cpp/ttnn/operations/transformer/sdpa_decode/device/sdpa_decode_op.cpp
${CMAKE_CURRENT_SOURCE_DIR}/cpp/ttnn/operations/transformer/sdpa_decode/device/sdpa_decode_program_factory.cpp
${CMAKE_CURRENT_SOURCE_DIR}/cpp/ttnn/operations/transformer/sdpa_decode_gqa/sdpa_decode_gqa.cpp
${CMAKE_CURRENT_SOURCE_DIR}/cpp/ttnn/operations/transformer/sdpa_decode_gqa/sdpa_decode_gqa_pybind.cpp
${CMAKE_CURRENT_SOURCE_DIR}/cpp/ttnn/operations/transformer/sdpa_decode_gqa/device/sdpa_decode_gqa_op.cpp
${CMAKE_CURRENT_SOURCE_DIR}/cpp/ttnn/operations/data_movement/sharded/interleaved_to_sharded/interleaved_to_sharded.cpp
${CMAKE_CURRENT_SOURCE_DIR}/cpp/ttnn/operations/data_movement/sharded/interleaved_to_sharded/interleaved_to_sharded_pybind.cpp
${CMAKE_CURRENT_SOURCE_DIR}/cpp/ttnn/operations/data_movement/sharded/interleaved_to_sharded/device/interleaved_to_sharded_op.cpp
Expand Down
Loading

0 comments on commit a7ba1ad

Please sign in to comment.