Skip to content

Commit

Permalink
#4984: Fix addressing issues on eth cores
Browse files Browse the repository at this point in the history
  • Loading branch information
mo-tenstorrent authored and pgkeller committed Sep 16, 2024
1 parent 3038e37 commit 38278f9
Show file tree
Hide file tree
Showing 4 changed files with 16 additions and 15 deletions.
2 changes: 1 addition & 1 deletion tt_metal/hw/inc/blackhole/eth_l1_address_map.h
Original file line number Diff line number Diff line change
Expand Up @@ -60,7 +60,7 @@ struct address_map {
// erisc early exit functionality re-uses mailboxes_t::ncrisc_halt_msg_t::stack_save memory
static constexpr std::int32_t ERISC_MEM_MAILBOX_STACK_SAVE = ERISC_MEM_MAILBOX_BASE + 4;

static constexpr std::uint32_t ERISC_MEM_MAILBOX_END = ERISC_MEM_MAILBOX_BASE + 288 + 256 + 16 + 32 * 4 + 512;
static constexpr std::uint32_t ERISC_MEM_MAILBOX_END = ERISC_MEM_MAILBOX_BASE + 288 + 256 + 16 + (32 + 512) * 4;

static constexpr std::int32_t ERISC_L1_KERNEL_CONFIG_BASE = ERISC_MEM_MAILBOX_END;
static constexpr std::int32_t ERISC_L1_UNRESERVED_BASE = ERISC_L1_KERNEL_CONFIG_BASE + ERISC_L1_KERNEL_CONFIG_SIZE;
Expand Down
2 changes: 1 addition & 1 deletion tt_metal/hw/inc/wormhole/eth_l1_address_map.h
Original file line number Diff line number Diff line change
Expand Up @@ -60,7 +60,7 @@ struct address_map {
// erisc early exit functionality re-uses mailboxes_t::ncrisc_halt_msg_t::stack_save memory
static constexpr std::int32_t ERISC_MEM_MAILBOX_STACK_SAVE = ERISC_MEM_MAILBOX_BASE + 4;

static constexpr std::uint32_t ERISC_MEM_MAILBOX_END = ERISC_MEM_MAILBOX_BASE + 288 + 256 + 16 + 512 + 32 * 4;
static constexpr std::uint32_t ERISC_MEM_MAILBOX_END = ERISC_MEM_MAILBOX_BASE + 288 + 256 + 16 + (512 + 32) * 4;

static constexpr std::int32_t ERISC_L1_KERNEL_CONFIG_BASE = ERISC_MEM_MAILBOX_END;
static constexpr std::int32_t ERISC_L1_UNRESERVED_BASE = ERISC_L1_KERNEL_CONFIG_BASE + ERISC_L1_KERNEL_CONFIG_SIZE;
Expand Down
10 changes: 5 additions & 5 deletions tt_metal/tools/profiler/kernel_profiler.hpp
Original file line number Diff line number Diff line change
Expand Up @@ -192,7 +192,7 @@ namespace kernel_profiler{
return;
}
uint32_t pageSize =
PROFILER_FULL_HOST_BUFFER_SIZE_PER_RISC * PROFILER_RISC_COUNT * profiler_core_count_per_dram;
PROFILER_FULL_HOST_BUFFER_SIZE_PER_RISC * MAX_RISCV_PER_CORE * profiler_core_count_per_dram;

while (!profiler_control_buffer[DRAM_PROFILER_ADDRESS]);
uint32_t dram_profiler_address = profiler_control_buffer[DRAM_PROFILER_ADDRESS];
Expand All @@ -213,7 +213,7 @@ namespace kernel_profiler{
if (currEndIndex <= PROFILER_FULL_HOST_VECTOR_SIZE_PER_RISC)
{
dram_offset =
(core_flat_id % profiler_core_count_per_dram) * PROFILER_RISC_COUNT * PROFILER_FULL_HOST_BUFFER_SIZE_PER_RISC +
(core_flat_id % profiler_core_count_per_dram) * MAX_RISCV_PER_CORE * PROFILER_FULL_HOST_BUFFER_SIZE_PER_RISC +
hostIndex * PROFILER_FULL_HOST_BUFFER_SIZE_PER_RISC +
profiler_control_buffer[hostIndex] * sizeof(uint32_t);

Expand All @@ -226,7 +226,7 @@ namespace kernel_profiler{
{
dram_offset =
(core_flat_id % profiler_core_count_per_dram) *
PROFILER_RISC_COUNT * PROFILER_FULL_HOST_BUFFER_SIZE_PER_RISC +
MAX_RISCV_PER_CORE * PROFILER_FULL_HOST_BUFFER_SIZE_PER_RISC +
hostIndex * PROFILER_FULL_HOST_BUFFER_SIZE_PER_RISC;

send_size = CUSTOM_MARKERS * sizeof(uint32_t);
Expand Down Expand Up @@ -270,14 +270,14 @@ namespace kernel_profiler{
core_flat_id = noc_xy_to_profiler_flat_id[my_x[0]][my_y[0]];

uint32_t dram_offset =
(core_flat_id % profiler_core_count_per_dram) * PROFILER_RISC_COUNT * PROFILER_FULL_HOST_BUFFER_SIZE_PER_RISC +
(core_flat_id % profiler_core_count_per_dram) * MAX_RISCV_PER_CORE * PROFILER_FULL_HOST_BUFFER_SIZE_PER_RISC +
(HOST_BUFFER_END_INDEX_BR_ER + myRiscID) * PROFILER_FULL_HOST_BUFFER_SIZE_PER_RISC +
profiler_control_buffer[HOST_BUFFER_END_INDEX_BR_ER + myRiscID] * sizeof(uint32_t);

while (!profiler_control_buffer[DRAM_PROFILER_ADDRESS]);
const InterleavedAddrGen<true> s = {
.bank_base_address = profiler_control_buffer[DRAM_PROFILER_ADDRESS],
.page_size = PROFILER_FULL_HOST_BUFFER_SIZE_PER_RISC * PROFILER_RISC_COUNT * profiler_core_count_per_dram
.page_size = PROFILER_FULL_HOST_BUFFER_SIZE_PER_RISC * MAX_RISCV_PER_CORE * profiler_core_count_per_dram
};

uint64_t dram_bank_dst_noc_addr = s.get_noc_addr(core_flat_id / profiler_core_count_per_dram, dram_offset);
Expand Down
17 changes: 9 additions & 8 deletions tt_metal/tools/profiler/profiler.cpp
Original file line number Diff line number Diff line change
Expand Up @@ -30,27 +30,28 @@ void DeviceProfiler::readRiscProfilerResults(

ZoneScoped;

std::pair<uint32_t, CoreCoord> deviceCore = {device_id,worker_core};
HalProgrammableCoreType CoreType;
int riscCount;
profiler_msg_t *profiler_msg;

const metal_SocDescriptor& soc_d = tt::Cluster::instance().get_soc_desc(device_id);
uint32_t coreFlatID = soc_d.physical_routing_to_profiler_flat_id.at(worker_core);
uint32_t startIndex = coreFlatID * PROFILER_RISC_COUNT * PROFILER_FULL_HOST_VECTOR_SIZE_PER_RISC;

auto ethCores = soc_d.get_physical_ethernet_cores() ;

HalProgrammableCoreType CoreType;
profiler_msg_t *profiler_msg;
if (std::find(ethCores.begin(), ethCores.end(), worker_core) == ethCores.end())
{
profiler_msg = hal.get_dev_addr<profiler_msg_t *>(HalProgrammableCoreType::TENSIX, HalMemAddrType::PROFILER);
CoreType = HalProgrammableCoreType::TENSIX;
riscCount = 5;
}
else
{
profiler_msg = hal.get_dev_addr<profiler_msg_t *>(HalProgrammableCoreType::ACTIVE_ETH, HalMemAddrType::PROFILER);
CoreType = HalProgrammableCoreType::ACTIVE_ETH;
riscCount = 1;
}

uint32_t coreFlatID = soc_d.physical_routing_to_profiler_flat_id.at(worker_core);
uint32_t startIndex = coreFlatID * MAX_RISCV_PER_CORE * PROFILER_FULL_HOST_VECTOR_SIZE_PER_RISC;

vector<std::uint32_t> control_buffer = tt::llrt::read_hex_vec_from_core(
device_id,
worker_core,
Expand All @@ -64,7 +65,7 @@ void DeviceProfiler::readRiscProfilerResults(
}

int riscNum = 0;
for (int riscEndIndex = 0; riscEndIndex < PROFILER_RISC_COUNT; riscEndIndex ++ ) {
for (int riscEndIndex = 0; riscEndIndex < riscCount; riscEndIndex ++ ) {
uint32_t bufferEndIndex = control_buffer[riscEndIndex];
uint32_t riscType;
if(CoreType == HalProgrammableCoreType::TENSIX)
Expand Down

0 comments on commit 38278f9

Please sign in to comment.