Skip to content

Commit

Permalink
sw: Test addressability and user-defined offload to PULP Cluster
Browse files Browse the repository at this point in the history
  • Loading branch information
sermazz committed Jan 30, 2025
1 parent d3e57b4 commit 8a32b44
Show file tree
Hide file tree
Showing 2 changed files with 136 additions and 0 deletions.
35 changes: 35 additions & 0 deletions sw/tests/testClusterAddr_pulp.c
Original file line number Diff line number Diff line change
@@ -0,0 +1,35 @@
// Copyright 2024 ETH Zurich and University of Bologna.
// Licensed under the Apache License, Version 2.0, see LICENSE for details.
// SPDX-License-Identifier: Apache-2.0
//
// Sergio Mazzola <[email protected]>

// Simple addressability test which writes and subsequently reads a value
// in the first address mapped to the PULP Cluster 0 (i.e., the first
// TCDM address)

#include "offload.h"
#include "soc_addr_map.h"
#include <regs/soc_ctrl.h>
#include <stdint.h>

#define TESTVAL_CLUSTER 0xdeadbeef

int main() {
uint8_t *base_addr_tcdm_cluster_0 = CLUSTER_0_BASE;

*((uint32_t*)base_addr_tcdm_cluster_0) = TESTVAL_CLUSTER;

asm volatile ("nop");
asm volatile ("nop");
asm volatile ("nop");
asm volatile ("nop");
asm volatile ("nop");

uint32_t result = *((uint32_t*)base_addr_tcdm_cluster_0);
if (result == TESTVAL_CLUSTER) {
return 0;
} else {
return 1;
}
}
101 changes: 101 additions & 0 deletions sw/tests/testClusterOffload_pulp.c
Original file line number Diff line number Diff line change
@@ -0,0 +1,101 @@
// Copyright 2024 ETH Zurich and University of Bologna.
// Licensed under the Apache License, Version 2.0, see LICENSE for details.
// SPDX-License-Identifier: Apache-2.0
//
// Sergio Mazzola <[email protected]>

// Simple offload test to PULP Cluster 0. First set the boot address of all 8
// cluster cores to the desired one (the simple test function), then enables the
// fetch enable for all cores at the same time. All this is done through writes
// to the cluster's peripheral interconnect. Does not currently take care of the
// cluster return value.

#include "offload.h"
#include "soc_addr_map.h"
#include <regs/soc_ctrl.h>
#include <stdint.h>

#define TESTVAL_CLUSTER 0xdeadbeef

#define PERIPH_OFFSET 0x00200000

#define FETCH_EN_OFFSET (PERIPH_OFFSET + 0x008)

#define BOOT_ADDR_CORE_0_OFFSET (PERIPH_OFFSET + 0x040)
#define BOOT_ADDR_CORE_1_OFFSET (PERIPH_OFFSET + 0x044)
#define BOOT_ADDR_CORE_2_OFFSET (PERIPH_OFFSET + 0x048)
#define BOOT_ADDR_CORE_3_OFFSET (PERIPH_OFFSET + 0x04C)
#define BOOT_ADDR_CORE_4_OFFSET (PERIPH_OFFSET + 0x050)
#define BOOT_ADDR_CORE_5_OFFSET (PERIPH_OFFSET + 0x054)
#define BOOT_ADDR_CORE_6_OFFSET (PERIPH_OFFSET + 0x058)
#define BOOT_ADDR_CORE_7_OFFSET (PERIPH_OFFSET + 0x05C)
#define BOOT_ADDR_CORE_8_OFFSET (PERIPH_OFFSET + 0x060)
#define BOOT_ADDR_CORE_9_OFFSET (PERIPH_OFFSET + 0x064)
#define BOOT_ADDR_CORE_10_OFFSET (PERIPH_OFFSET + 0x068)
#define BOOT_ADDR_CORE_11_OFFSET (PERIPH_OFFSET + 0x06C)
#define BOOT_ADDR_CORE_12_OFFSET (PERIPH_OFFSET + 0x070)
#define BOOT_ADDR_CORE_13_OFFSET (PERIPH_OFFSET + 0x074)
#define BOOT_ADDR_CORE_14_OFFSET (PERIPH_OFFSET + 0x078)
#define BOOT_ADDR_CORE_15_OFFSET (PERIPH_OFFSET + 0x07C)

int32_t test_cluster() {
int32_t result;
int32_t hart_id;

asm volatile ("csrr %0, mhartid" : "=r"(hart_id)::);

asm volatile (
"li t0, %1\n" // Load immediate value into t0
"mv a0, t0\n" // Move t0 into a0 (x10)
"mv %0, a0\n" // Move a0 into the output variable
: "=r"(result) // Output operand
: "i"(TESTVAL_CLUSTER) // Input operand: immediate value
: "t0", "a0" // Clobbered registers
);

result = result + hart_id;

return result;
}

int main() {
int32_t hart_id;
asm volatile ("csrr %0, mhartid" : "=r"(hart_id)::);

// set boot address of all cores in cluster 0
uint8_t *boot_addr_core_0_cluster_0 = CLUSTER_0_BASE + BOOT_ADDR_CORE_0_OFFSET;
uint8_t *boot_addr_core_1_cluster_0 = CLUSTER_0_BASE + BOOT_ADDR_CORE_1_OFFSET;
uint8_t *boot_addr_core_2_cluster_0 = CLUSTER_0_BASE + BOOT_ADDR_CORE_2_OFFSET;
uint8_t *boot_addr_core_3_cluster_0 = CLUSTER_0_BASE + BOOT_ADDR_CORE_3_OFFSET;
uint8_t *boot_addr_core_4_cluster_0 = CLUSTER_0_BASE + BOOT_ADDR_CORE_4_OFFSET;
uint8_t *boot_addr_core_5_cluster_0 = CLUSTER_0_BASE + BOOT_ADDR_CORE_5_OFFSET;
uint8_t *boot_addr_core_6_cluster_0 = CLUSTER_0_BASE + BOOT_ADDR_CORE_6_OFFSET;
uint8_t *boot_addr_core_7_cluster_0 = CLUSTER_0_BASE + BOOT_ADDR_CORE_7_OFFSET;

*((uint32_t*)boot_addr_core_0_cluster_0) = test_cluster;
*((uint32_t*)boot_addr_core_1_cluster_0) = test_cluster;
*((uint32_t*)boot_addr_core_2_cluster_0) = test_cluster;
*((uint32_t*)boot_addr_core_3_cluster_0) = test_cluster;
*((uint32_t*)boot_addr_core_4_cluster_0) = test_cluster;
*((uint32_t*)boot_addr_core_5_cluster_0) = test_cluster;
*((uint32_t*)boot_addr_core_6_cluster_0) = test_cluster;
*((uint32_t*)boot_addr_core_7_cluster_0) = test_cluster;

// enable fetch for all cores in cluster 0
uint8_t *fetch_en_cluster_0 = CLUSTER_0_BASE + FETCH_EN_OFFSET;

*((uint32_t*)fetch_en_cluster_0) = 0x00FF;

// only the host hart executes this
volatile int count = 10000;
if (hart_id == 0) {
// delay loop
asm volatile (
"1: nop\n"
"addi %0, %0, -1\n"
"bnez %0, 1b\n"
: "+r"(count) // Input and output operand
);
}
return count;
}

0 comments on commit 8a32b44

Please sign in to comment.