Compare commits

25 Commits

Author SHA1 Message Date
Hansung Kim
b97e94b8ed [tests] vecadd|sgemm|saxpy: save input buffers to file 2023-09-25 13:45:03 -07:00
Hansung Kim
576e7aab78 [tests] Remove -LLCFLAGS from Makefile 2023-09-25 13:28:05 -07:00
Hansung Kim
905b1877fb Add simple tid kernel that has zero arguments 2023-09-20 17:31:14 -07:00
Hansung Kim
3846d2ae59 Add annotated assembly dump for vecadd 2023-09-20 14:43:01 -07:00
Hansung Kim
c90fe56588 More doc comments 2023-09-20 14:42:56 -07:00
Hansung Kim
9efdd2ebb7 Change path to prebuilt toolchain 2023-09-10 14:43:54 -07:00
Hansung Kim
0caf3ad471 Add more comments to vx_spawn.c 2023-09-04 19:04:22 -07:00
Hansung Kim
2fa94b9c21 Hardcode paths into env script instead of args 2023-08-31 14:24:58 -07:00
Hansung Kim
62ebe0312f [tests] Add comment on in-order command queue dispatch 2023-08-28 11:19:11 -07:00
Hansung Kim
19734fc5b6 Accept build dir and avoid dup run in env script 2023-08-24 13:53:44 -07:00
Hansung Kim
fdc0fdc958 [rtl] Add doc comments 2023-07-08 09:54:51 -07:00
Hansung Kim
3e290f6321 Add Verdi signal file 2023-07-08 00:23:31 -07:00
Hansung Kim
c24916b5e0 [tests] Add compute-bound variant of vecadd
This loops 1000 times over `sum += A[i] + B[i]`, making every memory op
hit at L1 cache.
2023-07-05 21:24:53 -07:00
Hansung Kim
0c40864522 Update PS1 in env script for clarity 2023-07-02 21:54:13 -07:00
Hansung Kim
f2f1249b93 Make base build directory a variable in script 2023-07-02 13:48:39 -07:00
Hansung Kim
f46383f350 Add #include <array> to fix compile error
gcc complains std::array being undeclared when trying to build a fresh
clone.
2023-07-02 13:47:41 -07:00
Hansung Kim
8caf476b1a Merge remote-tracking branch 'upstream/master' 2023-07-02 13:27:08 -07:00
Hansung Kim
9cf5a29917 simx: add cycle and core id to load/store memory debug trace 2023-02-17 18:31:29 -08:00
Hansung Kim
d81e4085e2 simx: add thread ID and vlen to load/store memory debug trace 2023-02-17 17:59:56 -08:00
Hansung Kim
b9d1684582 Add sourceme scripts for env variables 2023-02-17 16:04:34 -08:00
Hansung Kim
f8fc305cbd Add sourceme.sh
Needed to set env variables for a custom setup where the prebuilt
binaries are located outside of /opt.
2023-01-23 18:01:18 -08:00
Hansung Kim
70e1e2089d Add .gitignore 2023-01-20 15:20:01 -08:00
Hansung Kim
547216d43f [tests] reduce0, DotProduct: include LLVM_PREFIX in LD_LIBRARY_PATH
Without this, poclcc fails with
`error while loading shared libraries: libclangCodeGen.so.10: cannot
open shared object file: No such file or directory`.
Also fix wrong kernel file name.
2023-01-17 19:04:09 -08:00
Hansung Kim
bb4f38d000 [tests] opencl/convolution: fix linking of libsimx.so
Fixes linker error by following suggestion of
`/usr/bin/ld: warning: libsimx.so, needed by /scratch/hansung/src/vortex/driver/simx/libvortex.so, not found (try using -rpath or -rpath-link)`.
2023-01-17 19:04:09 -08:00
Hansung Kim
7c39cc2b5b Makefile: respect RISCV_TOOLCHAIN_PATH if already set in env 2023-01-17 19:04:03 -08:00
37 changed files with 2754 additions and 35 deletions

10
.gitignore vendored Normal file
View File

@@ -0,0 +1,10 @@
*.dump
*.o
*.bin
*.elf
.depend
*.a
*.so
*.log
*.vcd
blackbox.*.cache

View File

@@ -29,6 +29,10 @@ public:
}
}
// NOTE(hansung): This is code running on the CPU, but CPU is still the one
// that keeps track of allocation of the GPU memory. GPU kernel simply runs
// assuming that CPU has done the right thing and returned a safe and valid
// chunk of memory.
int allocate(uint64_t size, uint64_t* addr) {
if (size == 0 || addr == nullptr)
return -1;
@@ -403,4 +407,4 @@ private:
page_t* pages_;
};
} // namespace vortex
} // namespace vortex

7
env.my-pocl-riscv32.sh Normal file
View File

@@ -0,0 +1,7 @@
export VORTEX_ENV="my-pocl-riscv32"
export LLVM_PREFIX=/scratch/hansung/build/llvm-riscv32-unknown-linux-gnu-10.0.1
export POCL_CC_PATH=/scratch/hansung/build/pocl-riscv32/compiler
export POCL_RT_PATH=/scratch/hansung/build/pocl-riscv32/runtime
export VERILATOR_ROOT=/scratch/hansung/build/vortex-toolchain-prebuilt/verilator
export RISCV_TOOLCHAIN_PATH=/scratch/hansung/build/vortex-toolchain-prebuilt
export PATH="/scratch/hansung/build/vortex-toolchain-prebuilt/verilator/bin:$PATH"

7
env.my-pocl.sh Normal file
View File

@@ -0,0 +1,7 @@
export VORTEX_ENV="my-pocl"
export LLVM_PREFIX=/scratch/hansung/build/vortex-toolchain-prebuilt/llvm-riscv/
export POCL_CC_PATH=/scratch/hansung/build/pocl-vortex/compiler
export POCL_RT_PATH=/scratch/hansung/build/pocl-vortex/runtime
export VERILATOR_ROOT=/scratch/hansung/build/vortex-toolchain-prebuilt/verilator
export RISCV_TOOLCHAIN_PATH=/scratch/hansung/build/vortex-toolchain-prebuilt
export PATH="/scratch/hansung/build/vortex-toolchain-prebuilt/verilator/bin:$PATH"

17
env.vortex-prebuilt.sh Normal file
View File

@@ -0,0 +1,17 @@
if [ -n "$VORTEX_ENV" ]
then
echo "VORTEX_ENV already set. Exiting."
return
fi
# PREBUILT_DIR=/scratch/hansung/build/vortex-toolchain-prebuilt-d2ba5df-230831
PREBUILT_DIR=/scratch/hansung/build/vortex-toolchain-prebuilt-230831
export VORTEX_ENV="vortex-prebuilt"
export LLVM_PREFIX=$PREBUILT_DIR/llvm-riscv/
export POCL_CC_PATH=$PREBUILT_DIR/pocl/compiler
export POCL_RT_PATH=$PREBUILT_DIR/pocl/runtime
export VERILATOR_ROOT=$PREBUILT_DIR/verilator
export RISCV_TOOLCHAIN_PATH=$PREBUILT_DIR/
export PATH="$BUILDDIR/vortex-toolchain-prebuilt-d2ba5df-230831/verilator/bin:$PATH"
export PS1="($VORTEX_ENV) $PS1"

7
env.vortex-prebuilt2.sh Normal file
View File

@@ -0,0 +1,7 @@
export VORTEX_ENV="vortex-prebuilt2"
export LLVM_PREFIX=/scratch/hansung/build/vortex-toolchain-prebuilt/llvm-riscv2
export POCL_CC_PATH=/scratch/hansung/build/vortex-toolchain-prebuilt/pocl2/compiler
export POCL_RT_PATH=/scratch/hansung/build/vortex-toolchain-prebuilt/pocl2/runtime
export VERILATOR_ROOT=/scratch/hansung/build/vortex-toolchain-prebuilt/verilator
export RISCV_TOOLCHAIN_PATH=/scratch/hansung/build/vortex-toolchain-prebuilt
export PATH="/scratch/hansung/build/vortex-toolchain-prebuilt/verilator/bin:$PATH"

View File

@@ -9,6 +9,7 @@ module VX_execute #(
input wire reset,
// Dcache interface
// NOTE(hansung): this comes out of VX_lsu_unit
VX_dcache_req_if.master dcache_req_if,
VX_dcache_rsp_if.slave dcache_rsp_if,
@@ -234,4 +235,4 @@ module VX_execute #(
&& (`INST_BR_BITS'(alu_req_if.op_type) == `INST_BR_EBREAK
|| `INST_BR_BITS'(alu_req_if.op_type) == `INST_BR_ECALL);
endmodule
endmodule

View File

@@ -34,7 +34,7 @@ module VX_lsu_unit #(
wire [`INST_LSU_BITS-1:0] req_type;
wire [`NUM_THREADS-1:0][31:0] req_data;
wire [`NR_BITS-1:0] req_rd;
wire req_wb;
wire req_wb; // NOTE(hansung): 0:load, 1:store
wire [`NW_BITS-1:0] req_wid;
wire [31:0] req_pc;
wire req_is_dup;
@@ -369,4 +369,4 @@ module VX_lsu_unit #(
end
`endif
endmodule
endmodule

View File

@@ -250,6 +250,8 @@ module VX_cache #(
wire [MEM_TAG_IN_WIDTH-1:0] mem_rsp_tag_c;
wire mem_rsp_ready_c;
// NOTE(hansung): non-cacheable addresses. Although is this applied for
// all address range?
if (NC_ENABLE) begin
VX_nc_bypass #(
.NUM_PORTS (NUM_PORTS),

View File

@@ -55,6 +55,7 @@
///////////////////////////////////////////////////////////////////////////////
// NOTE(hansung): what does CORE_TAG_ID_BITS == 0 mean?
`define CORE_RSP_TAGS ((CORE_TAG_ID_BITS != 0) ? 1 : NUM_REQS)
`define LINE_TO_MEM_ADDR(x, i) {x, `BANK_SELECT_BITS'(i)}

View File

@@ -53,6 +53,7 @@ module VX_core_req_bank_sel #(
wire [NUM_REQS-1:0][`LINE_ADDR_WIDTH-1:0] core_req_line_addr;
wire [NUM_REQS-1:0][`UP(`WORD_SELECT_BITS)-1:0] core_req_wsel;
// NOTE(hansung): "bank id"
wire [NUM_REQS-1:0][`UP(`BANK_SELECT_BITS)-1:0] core_req_bid;
for (genvar i = 0; i < NUM_REQS; i++) begin
@@ -123,6 +124,9 @@ module VX_core_req_bank_sel #(
per_bank_core_req_tid_r = 'x;
req_select_table_r = 'x;
// NOTE(hansung): if we're simply overwriting assignment in
// a loop with decrementing index, wouldn't this be unfair
// for reqs with higher index?
for (integer i = NUM_REQS-1; i >= 0; --i) begin
if (core_req_valid[i]) begin
per_bank_core_req_valid_r[core_req_bid[i]] = 1;
@@ -184,6 +188,8 @@ module VX_core_req_bank_sel #(
end
end else begin
// NOTE(hansung): this is what the default config elaborates, i.e.
// NUM_REQS > 1, NUM_PORTS == 1
always @(*) begin
per_bank_core_req_valid_r = 0;
@@ -204,6 +210,8 @@ module VX_core_req_bank_sel #(
per_bank_core_req_byteen_r[core_req_bid[i]]= core_req_byteen[i];
per_bank_core_req_data_r[core_req_bid[i]] = core_req_data[i];
per_bank_core_req_tag_r[core_req_bid[i]] = core_req_tag[i];
// NOTE(hansung): this marks which req 'won' mapping
// to this bank eventually
per_bank_core_req_tid_r[core_req_bid[i]] = `REQS_BITS'(i);
end
end
@@ -216,6 +224,7 @@ module VX_core_req_bank_sel #(
core_req_ready_r = 0;
for (integer i = 0; i < NUM_BANKS; ++i) begin
if (per_bank_core_req_valid_r[i]) begin
// NOTE(hansung): this flows back to upstream
core_req_ready_r[per_bank_core_req_tid_r[i]] = per_bank_core_req_ready[i];
end
end
@@ -311,4 +320,4 @@ module VX_core_req_bank_sel #(
assign bank_stalls = bank_stalls_r;
`endif
endmodule
endmodule

View File

@@ -1,9 +1,9 @@
XLEN ?= 32
ifeq ($(XLEN),32)
RISCV_TOOLCHAIN_PATH = /opt/riscv-gnu-toolchain
RISCV_TOOLCHAIN_PATH ?= /opt/riscv-gnu-toolchain
else
RISCV_TOOLCHAIN_PATH = /opt/riscv64-gnu-toolchain
RISCV_TOOLCHAIN_PATH ?= /opt/riscv64-gnu-toolchain
endif
RISCV_PREFIX ?= riscv$(XLEN)-unknown-elf-

View File

@@ -97,6 +97,8 @@ static void spawn_tasks_rem_cb(int thread_mask) {
vx_tmc(1);
}
// NOTE(hansung): where is this used? The main section in the POCL binary calls
// `vx_spawn_kernel` but not this one
void vx_spawn_tasks(int num_tasks, vx_spawn_tasks_cb callback , void * arg) {
// device specs
int NC = vx_num_cores();
@@ -281,9 +283,12 @@ void vx_spawn_kernel(context_t * ctx, vx_spawn_kernel_cb callback, void * arg) {
char log2X = fast_log2(X);
//--
wspawn_kernel_args_t wspawn_args = {
ctx, callback, arg, core_id * wgs_per_core, fW, rW, 0, isXYpow2, isXpow2, log2XY, log2X
};
wspawn_kernel_args_t wspawn_args = {
ctx, callback, arg, core_id * wgs_per_core /*offset*/,
fW /*N*/, rW /*R*/, 0 /*NW*/, isXYpow2,
isXpow2, log2XY, log2X};
// NOTE(hansung): core_id is capped at NUM_CORES_MAX = 32
g_wspawn_args[core_id] = &wspawn_args;
//--
@@ -304,4 +309,4 @@ void vx_spawn_kernel(context_t * ctx, vx_spawn_kernel_cb callback, void * arg) {
#ifdef __cplusplus
}
#endif
#endif

View File

@@ -683,4 +683,4 @@ bool Core::check_exit() const {
bool Core::running() const {
bool is_running = (committed_instrs_ != issued_instrs_);
return is_running;
}
}

View File

@@ -690,8 +690,13 @@ void Warp::execute(const Instr &instr, pipeline_trace_t *trace) {
uint64_t mem_addr = rsdata[t][0].i + immsrc;
uint64_t mem_data = 0;
core_->dcache_read(&mem_data, mem_addr, mem_bytes);
trace->mem_addrs.at(t).push_back({mem_addr, mem_bytes});
DP(4, "LOAD MEM: ADDRESS=0x" << std::hex << mem_addr << ", DATA=0x" << mem_data);
trace->mem_addrs.at(t).push_back({mem_addr, mem_bytes});
DP(1, "LOAD MEM: CYCLE=" << SimPlatform::instance().cycles()
<< ", CORE=" << core_->id()
<< ", THREAD=" << t
<< ", ADDRESS=0x" << std::hex << mem_addr
<< ", DATA=0x" << mem_data << std::dec
<< ", BYTES=" << mem_bytes);
switch (func3) {
case 0:
// RV32I: LB
@@ -731,7 +736,13 @@ void Warp::execute(const Instr &instr, pipeline_trace_t *trace) {
core_->dcache_read(&mem_data, mem_addr, 4);
Word *result_ptr = (Word *)(vd.data() + i);
*result_ptr = mem_data;
DP(4, "LOAD MEM: ADDRESS=0x" << std::hex << mem_addr << ", DATA=0x" << mem_data);
DP(1, "LOAD MEM: CYCLE=" << SimPlatform::instance().cycles()
<< ", CORE=" << core_->id()
<< ", VLEN=" << vl_
<< ", VID=" << i
<< ", ADDRESS=0x" << std::hex << mem_addr
<< ", DATA=0x" << mem_data << std::dec
<< ", BYTES=" << 4);
}
break;
}
@@ -762,7 +773,12 @@ void Warp::execute(const Instr &instr, pipeline_trace_t *trace) {
mem_data &= mask;
}
trace->mem_addrs.at(t).push_back({mem_addr, mem_bytes});
DP(4, "STORE MEM: ADDRESS=0x" << std::hex << mem_addr << ", DATA=0x" << mem_data);
DP(1, "STORE MEM: CYCLE=" << SimPlatform::instance().cycles()
<< ", CORE=" << core_->id()
<< ", THREAD=" << t
<< ", ADDRESS=0x" << std::hex << mem_addr
<< ", DATA=0x" << mem_data << std::dec
<< ", BYTES=" << mem_bytes);
switch (func3) {
case 0:
case 1:
@@ -782,7 +798,13 @@ void Warp::execute(const Instr &instr, pipeline_trace_t *trace) {
// store word and unit strided (not checking for unit stride)
uint32_t mem_data = *(uint32_t *)(vreg_file_.at(instr.getVs3()).data() + i);
core_->dcache_write(&mem_data, mem_addr, 4);
DP(4, "STORE MEM: ADDRESS=0x" << std::hex << mem_addr << ", DATA=0x" << mem_data);
DP(1, "STORE MEM: CYCLE=" << SimPlatform::instance().cycles()
<< ", CORE=" << core_->id()
<< ", VLEN=" << vl_
<< ", VID=" << i
<< ", ADDRESS=0x" << std::hex << mem_addr
<< ", DATA=0x" << mem_data << std::dec
<< ", BYTES=" << 4);
break;
}
default:
@@ -1304,6 +1326,9 @@ void Warp::execute(const Instr &instr, pipeline_trace_t *trace) {
} else {
tmask_.reset();
for (uint32_t t = 0; t < num_threads; ++t) {
// NOTE(hansung): `ts` is the left-most lane currently enabled.
// Doing this only respects the operand of that lane, even though
// every lane might have different operand for the tmask.
tmask_.set(t, rsdata.at(ts)[0].i & (1 << t));
}
}
@@ -2349,4 +2374,4 @@ void Warp::execute(const Instr &instr, pipeline_trace_t *trace) {
DP(3, "*** Next PC: " << std::hex << nextPC << std::dec);
PC_ = nextPC;
}
}
}

View File

@@ -175,4 +175,4 @@ void Processor::attach_ram(RAM* mem) {
int Processor::run() {
return impl_->run();
}
}

View File

@@ -1,5 +1,6 @@
#pragma once
#include <array>
#include "types.h"
namespace vortex {
@@ -25,4 +26,4 @@ private:
Core* core_;
};
}
}

View File

@@ -37,7 +37,7 @@ PROJECT=DotProduct
all: $(PROJECT).dump $(PROJECT).hex
lib$(PROJECT).a: DotProduct.cl
POCL_DEBUG=all POCL_DEBUG_LLVM_PASSES=1 LD_LIBRARY_PATH=$(RISCV_TOOLCHAIN_PATH)/lib:$(POCL_CC_PATH)/lib $(POCL_CC_PATH)/bin/poclcc -o lib$(PROJECT).a kernel.cl
POCL_DEBUG=all POCL_DEBUG_LLVM_PASSES=1 LD_LIBRARY_PATH=$(RISCV_TOOLCHAIN_PATH)/lib:$(POCL_CC_PATH)/lib:$(LLVM_PREFIX)/lib $(POCL_CC_PATH)/bin/poclcc -o lib$(PROJECT).a DotProduct.cl
$(PROJECT).elf: main.cc lib$(PROJECT).a
$(CXX) $(CXXFLAGS) $(VX_CFLAGS) $(VX_SRCS) main.cc $(VX_LIBS) -o $(PROJECT).elf

View File

@@ -0,0 +1,6 @@
main.o: main.cpp \
/scratch/hansung/build/vortex-toolchain-prebuilt/pocl/runtime/include/CL/cl.h \
/scratch/hansung/build/vortex-toolchain-prebuilt/pocl/runtime/include/CL/cl_version.h \
/scratch/hansung/build/vortex-toolchain-prebuilt/pocl/runtime/include/CL/cl_platform.h \
utils.h
utils.o: utils.cpp utils.h

View File

@@ -17,7 +17,7 @@ CXXFLAGS += -std=c++11 -Wall -Wextra -pedantic -Wfatal-errors
CXXFLAGS += -I$(POCL_RT_PATH)/include
LDFLAGS += -L$(POCL_RT_PATH)/lib -L$(VORTEX_DRV_PATH)/simx -lOpenCL -lvortex
LDFLAGS += -L$(POCL_RT_PATH)/lib -L$(VORTEX_DRV_PATH)/simx -Wl,-rpath $(VORTEX_DRV_PATH)/simx -lOpenCL -lvortex
# Debugigng
ifdef DEBUG

View File

@@ -37,7 +37,7 @@ PROJECT=reduce0
all: $(PROJECT).dump $(PROJECT).hex
lib$(PROJECT).a: oclReduction_kernel.cl
POCL_DEBUG=all POCL_DEBUG_LLVM_PASSES=1 LD_LIBRARY_PATH=$(RISCV_TOOLCHAIN_PATH)/lib:$(POCL_CC_PATH)/lib $(POCL_CC_PATH)/bin/poclcc -o lib$(PROJECT).a kernel.cl
POCL_DEBUG=all POCL_DEBUG_LLVM_PASSES=1 LD_LIBRARY_PATH=$(RISCV_TOOLCHAIN_PATH)/lib:$(POCL_CC_PATH)/lib:$(LLVM_PREFIX)/lib $(POCL_CC_PATH)/bin/poclcc -o lib$(PROJECT).a oclReduction_kernel.cl
$(PROJECT).elf: main.cc lib$(PROJECT).a
$(CXX) $(CXXFLAGS) $(VX_CFLAGS) $(VX_SRCS) main.cc $(VX_LIBS) -o $(PROJECT).elf

View File

@@ -37,7 +37,7 @@ SRCS = main.cc
all: $(PROJECT) kernel.pocl
kernel.pocl: kernel.cl
LLVM_PREFIX=$(LLVM_PREFIX) POCL_DEBUG=all LD_LIBRARY_PATH=$(LLVM_PREFIX)/lib:$(POCL_CC_PATH)/lib $(POCL_CC_PATH)/bin/poclcc -LLCFLAGS $(K_LLCFLAGS) -CFLAGS $(K_CFLAGS) -LDFLAGS $(K_LDFLAGS) -o kernel.pocl kernel.cl
LLVM_PREFIX=$(LLVM_PREFIX) POCL_DEBUG=all LD_LIBRARY_PATH=$(LLVM_PREFIX)/lib:$(POCL_CC_PATH)/lib $(POCL_CC_PATH)/bin/poclcc -CFLAGS $(K_CFLAGS) -LDFLAGS $(K_LDFLAGS) -o kernel.pocl kernel.cl
$(PROJECT): $(SRCS)
$(CXX) $(CXXFLAGS) $^ $(LDFLAGS) -o $@

View File

@@ -78,6 +78,25 @@ static int read_kernel_file(const char* filename, uint8_t** data, size_t* size)
return 0;
}
static int write_operand_file(const char* filename, void* data, size_t size) {
if (nullptr == filename || nullptr == data || 0 == size)
return -1;
FILE* fp = fopen(filename, "wb");
if (NULL == fp) {
fprintf(stderr, "Failed to write operand data.\n");
return -1;
}
size_t wsize = fwrite(data, size, 1, fp);
if (wsize != 1) {
fprintf(stderr, "Failed to write operand data.\n");
return -1;
}
return 0;
}
uint8_t *kernel_bin = NULL;
///
@@ -209,6 +228,11 @@ int main(int argc, char **argv) {
for (int i = 0; i < size; i++) {
h_src[i] = ((float)rand() / (float)(RAND_MAX)) * 100.0;
}
// NOTE(hansung): Dump operand buffer to a file
if (write_operand_file("saxpy.input.src.bin", h_src, nbytes) != 0)
return EXIT_FAILURE;
CL_CHECK(clEnqueueWriteBuffer(queue, input_buffer, CL_TRUE, 0, nbytes, h_src, 0, NULL, NULL));
free(h_src);

View File

@@ -37,7 +37,7 @@ SRCS = main.cc
all: $(PROJECT) kernel.pocl
kernel.pocl: kernel.cl
LLVM_PREFIX=$(LLVM_PREFIX) POCL_DEBUG=all LD_LIBRARY_PATH=$(LLVM_PREFIX)/lib:$(POCL_CC_PATH)/lib $(POCL_CC_PATH)/bin/poclcc -LLCFLAGS $(K_LLCFLAGS) -CFLAGS $(K_CFLAGS) -LDFLAGS $(K_LDFLAGS) -o kernel.pocl kernel.cl
LLVM_PREFIX=$(LLVM_PREFIX) POCL_DEBUG=all LD_LIBRARY_PATH=$(LLVM_PREFIX)/lib:$(POCL_CC_PATH)/lib $(POCL_CC_PATH)/bin/poclcc -CFLAGS $(K_CFLAGS) -LDFLAGS $(K_LDFLAGS) -o kernel.pocl kernel.cl
$(PROJECT): $(SRCS)
$(CXX) $(CXXFLAGS) $^ $(LDFLAGS) -o $@

View File

@@ -52,6 +52,25 @@ static int read_kernel_file(const char* filename, uint8_t** data, size_t* size)
return 0;
}
static int write_operand_file(const char* filename, void* data, size_t size) {
if (nullptr == filename || nullptr == data || 0 == size)
return -1;
FILE* fp = fopen(filename, "wb");
if (NULL == fp) {
fprintf(stderr, "Failed to write operand data.\n");
return -1;
}
size_t wsize = fwrite(data, size, 1, fp);
if (wsize != 1) {
fprintf(stderr, "Failed to write operand data.\n");
return -1;
}
return 0;
}
static void matmul(float *C, const float* A, const float *B, int M, int N, int K) {
for (int m = 0; m < M; ++m) {
for (int n = 0; n < N; ++n) {
@@ -194,6 +213,12 @@ int main (int argc, char **argv) {
//printf("*** [%d]: h_a=%f, h_b=%f\n", i, h_a[i], h_b[i]);
}
// NOTE(hansung): Dump operand buffer to a file
if (write_operand_file("sgemm.input.a.bin", h_a, nbytes) != 0)
return EXIT_FAILURE;
if (write_operand_file("sgemm.input.b.bin", h_b, nbytes) != 0)
return EXIT_FAILURE;
// Creating command queue
commandQueue = CL_CHECK2(clCreateCommandQueue(context, device_id, 0, &_err));

1
tests/opencl/tid/.gitignore vendored Normal file
View File

@@ -0,0 +1 @@
tid

71
tests/opencl/tid/Makefile Normal file
View File

@@ -0,0 +1,71 @@
XLEN ?= 32
LLVM_PREFIX ?= /opt/llvm-riscv
RISCV_TOOLCHAIN_PATH ?= /opt/riscv-gnu-toolchain
SYSROOT ?= $(RISCV_TOOLCHAIN_PATH)/riscv32-unknown-elf
POCL_CC_PATH ?= /opt/pocl/compiler
POCL_RT_PATH ?= /opt/pocl/runtime
OPTS ?= -n64
VORTEX_DRV_PATH ?= $(realpath ../../../driver)
VORTEX_RT_PATH ?= $(realpath ../../../runtime)
K_LLCFLAGS += "-O3 -march=riscv32 -target-abi=ilp32f -mcpu=generic-rv32 -mattr=+m,+f -mattr=+vortex -float-abi=hard -code-model=small"
K_CFLAGS += "-v -O3 --sysroot=$(SYSROOT) --gcc-toolchain=$(RISCV_TOOLCHAIN_PATH) -march=rv32imf -mabi=ilp32f -Xclang -target-feature -Xclang +vortex -I$(VORTEX_RT_PATH)/include -fno-rtti -fno-exceptions -ffreestanding -nostartfiles -fdata-sections -ffunction-sections"
K_LDFLAGS += "-Wl,-Bstatic,-T$(VORTEX_RT_PATH)/linker/vx_link$(XLEN).ld -Wl,--gc-sections $(VORTEX_RT_PATH)/libvortexrt.a -lm"
CXXFLAGS += -std=c++11 -Wall -Wextra -Wfatal-errors
CXXFLAGS += -Wno-deprecated-declarations -Wno-unused-parameter -Wno-narrowing
CXXFLAGS += -I$(POCL_RT_PATH)/include
LDFLAGS += -L$(POCL_RT_PATH)/lib -L$(VORTEX_DRV_PATH)/stub -lOpenCL -lvortex
# Debugigng
ifdef DEBUG
CXXFLAGS += -g -O0
else
CXXFLAGS += -O2 -DNDEBUG
endif
PROJECT = tid
SRCS = main.cc
all: $(PROJECT) kernel.pocl
kernel.pocl: kernel.cl
LLVM_PREFIX=$(LLVM_PREFIX) POCL_DEBUG=all LD_LIBRARY_PATH=$(LLVM_PREFIX)/lib:$(POCL_CC_PATH)/lib $(POCL_CC_PATH)/bin/poclcc -CFLAGS $(K_CFLAGS) -LDFLAGS $(K_LDFLAGS) -o kernel.pocl kernel.cl
$(PROJECT): $(SRCS)
$(CXX) $(CXXFLAGS) $^ $(LDFLAGS) -o $@
run-fpga: $(PROJECT) kernel.pocl
LD_LIBRARY_PATH=$(POCL_RT_PATH)/lib:$(VORTEX_DRV_PATH)/fpga:$(LD_LIBRARY_PATH) ./$(PROJECT) $(OPTS)
run-asesim: $(PROJECT) kernel.pocl
LD_LIBRARY_PATH=$(POCL_RT_PATH)/lib:$(VORTEX_DRV_PATH)/asesim:$(LD_LIBRARY_PATH) ./$(PROJECT) $(OPTS)
run-vlsim: $(PROJECT) kernel.pocl
LD_LIBRARY_PATH=$(POCL_RT_PATH)/lib:$(VORTEX_DRV_PATH)/vlsim:$(LD_LIBRARY_PATH) ./$(PROJECT) $(OPTS)
run-simx: $(PROJECT) kernel.pocl
LD_LIBRARY_PATH=$(POCL_RT_PATH)/lib:$(VORTEX_DRV_PATH)/simx:$(LD_LIBRARY_PATH) ./$(PROJECT) $(OPTS)
run-rtlsim: $(PROJECT) kernel.pocl
LD_LIBRARY_PATH=$(POCL_RT_PATH)/lib:$(VORTEX_DRV_PATH)/rtlsim:$(LD_LIBRARY_PATH) ./$(PROJECT) $(OPTS)
.depend: $(SRCS)
$(CXX) $(CXXFLAGS) -MM $^ > .depend;
clean:
rm -rf $(PROJECT) *.o .depend
clean-all: clean
rm -rf *.pocl *.dump
ifneq ($(MAKECMDGOALS),clean)
-include .depend
endif

View File

@@ -0,0 +1,6 @@
__kernel void tid()
{
__global int *out = (__global int *)0xc0000000;
int gid = get_global_id(0);
out[gid] = gid;
}

221
tests/opencl/tid/main.cc Normal file
View File

@@ -0,0 +1,221 @@
#include <stdio.h>
#include <stdlib.h>
#include <assert.h>
#include <math.h>
#include <CL/opencl.h>
#include <unistd.h>
#include <string.h>
#include <chrono>
#define KERNEL_NAME "tid"
#define CL_CHECK(_expr) \
do { \
cl_int _err = _expr; \
if (_err == CL_SUCCESS) \
break; \
printf("OpenCL Error: '%s' returned %d!\n", #_expr, (int)_err); \
cleanup(); \
exit(-1); \
} while (0)
#define CL_CHECK2(_expr) \
({ \
cl_int _err = CL_INVALID_VALUE; \
decltype(_expr) _ret = _expr; \
if (_err != CL_SUCCESS) { \
printf("OpenCL Error: '%s' returned %d!\n", #_expr, (int)_err); \
cleanup(); \
exit(-1); \
} \
_ret; \
})
static int read_kernel_file(const char* filename, uint8_t** data, size_t* size) {
if (nullptr == filename || nullptr == data || 0 == size)
return -1;
FILE* fp = fopen(filename, "r");
if (NULL == fp) {
fprintf(stderr, "Failed to load kernel.");
return -1;
}
fseek(fp , 0 , SEEK_END);
long fsize = ftell(fp);
rewind(fp);
*data = (uint8_t*)malloc(fsize);
*size = fread(*data, 1, fsize, fp);
fclose(fp);
return 0;
}
static int write_operand_file(const char* filename, void* data, size_t size) {
if (nullptr == filename || nullptr == data || 0 == size)
return -1;
FILE* fp = fopen(filename, "wb");
if (NULL == fp) {
fprintf(stderr, "Failed to write operand data.\n");
return -1;
}
size_t wsize = fwrite(data, size, 1, fp);
if (wsize != 1) {
fprintf(stderr, "Failed to write operand data.\n");
return -1;
}
return 0;
}
cl_device_id device_id = NULL;
cl_context context = NULL;
cl_command_queue commandQueue = NULL;
cl_program program = NULL;
cl_kernel kernel = NULL;
cl_mem a_memobj = NULL;
cl_mem b_memobj = NULL;
cl_mem c_memobj = NULL;
float *h_a = NULL;
float *h_b = NULL;
float *h_c = NULL;
uint8_t *kernel_bin = NULL;
static void cleanup() {
if (commandQueue) clReleaseCommandQueue(commandQueue);
if (kernel) clReleaseKernel(kernel);
if (program) clReleaseProgram(program);
if (a_memobj) clReleaseMemObject(a_memobj);
if (b_memobj) clReleaseMemObject(b_memobj);
if (c_memobj) clReleaseMemObject(c_memobj);
if (context) clReleaseContext(context);
if (device_id) clReleaseDevice(device_id);
if (kernel_bin) free(kernel_bin);
if (h_a) free(h_a);
if (h_b) free(h_b);
if (h_c) free(h_c);
}
int size = 64;
static void show_usage() {
printf("Usage: [-n size] [-h: help]\n");
}
static void parse_args(int argc, char **argv) {
int c;
while ((c = getopt(argc, argv, "n:h?")) != -1) {
switch (c) {
case 'n':
size = atoi(optarg);
break;
case 'h':
case '?': {
show_usage();
exit(0);
} break;
default:
show_usage();
exit(-1);
}
}
printf("Workload size=%d\n", size);
}
int main (int argc, char **argv) {
// parse command arguments
parse_args(argc, argv);
cl_platform_id platform_id;
size_t kernel_size;
cl_int binary_status;
// read kernel binary from file
if (0 != read_kernel_file("kernel.pocl", &kernel_bin, &kernel_size))
return -1;
// Getting platform and device information
CL_CHECK(clGetPlatformIDs(1, &platform_id, NULL));
CL_CHECK(clGetDeviceIDs(platform_id, CL_DEVICE_TYPE_DEFAULT, 1, &device_id, NULL));
printf("Create context\n");
context = CL_CHECK2(clCreateContext(NULL, 1, &device_id, NULL, NULL, &_err));
printf("Allocate device buffers\n");
size_t nbytes = size * sizeof(float);
// a_memobj = CL_CHECK2(clCreateBuffer(context, CL_MEM_READ_ONLY, nbytes, NULL, &_err));
// b_memobj = CL_CHECK2(clCreateBuffer(context, CL_MEM_READ_ONLY, nbytes, NULL, &_err));
// c_memobj = CL_CHECK2(clCreateBuffer(context, CL_MEM_WRITE_ONLY, nbytes, NULL, &_err));
printf("Create program from kernel source\n");
program = CL_CHECK2(clCreateProgramWithBinary(
context, 1, &device_id, &kernel_size, (const uint8_t**)&kernel_bin, &binary_status, &_err));
if (program == NULL) {
cleanup();
return -1;
}
// Build program
CL_CHECK(clBuildProgram(program, 1, &device_id, NULL, NULL, NULL));
// Create kernel
kernel = CL_CHECK2(clCreateKernel(program, KERNEL_NAME, &_err));
// Set kernel arguments
// CL_CHECK(clSetKernelArg(kernel, 0, sizeof(cl_mem), (void *)&a_memobj));
// CL_CHECK(clSetKernelArg(kernel, 1, sizeof(cl_mem), (void *)&b_memobj));
// CL_CHECK(clSetKernelArg(kernel, 2, sizeof(cl_mem), (void *)&c_memobj));
// Allocate memories for input arrays and output arrays.
h_a = (float*)malloc(nbytes);
h_b = (float*)malloc(nbytes);
h_c = (float*)malloc(nbytes);
// Creating command queue
commandQueue = CL_CHECK2(clCreateCommandQueue(
context, device_id, 0 /* command-queue properties */, &_err));
// printf("Upload source buffers\n");
// CL_CHECK(clEnqueueWriteBuffer(commandQueue, a_memobj, CL_TRUE, 0, nbytes, h_a, 0, NULL, NULL));
// CL_CHECK(clEnqueueWriteBuffer(commandQueue, b_memobj, CL_TRUE, 0, nbytes, h_b, 0, NULL, NULL));
printf("Execute the kernel\n");
size_t global_work_size[1] = {size};
size_t local_work_size[1] = {1};
auto time_start = std::chrono::high_resolution_clock::now();
CL_CHECK(clEnqueueNDRangeKernel(commandQueue, kernel, 1, NULL, global_work_size, local_work_size, 0, NULL, NULL));
CL_CHECK(clFinish(commandQueue));
auto time_end = std::chrono::high_resolution_clock::now();
double elapsed = std::chrono::duration_cast<std::chrono::milliseconds>(time_end - time_start).count();
printf("Elapsed time: %lg ms\n", elapsed);
// printf("Download destination buffer\n");
// CL_CHECK(clEnqueueReadBuffer(commandQueue, c_memobj, CL_TRUE, 0, nbytes, h_c, 0, NULL, NULL));
// printf("Verify result\n");
// int errors = 0;
// for (int i = 0; i < size; ++i) {
// float ref = h_a[i] + h_b[i];
// if (!almost_equal(h_c[i], ref)) {
// if (errors < 100)
// printf("*** error: [%d] expected=%f, actual=%f, a=%f, b=%f\n", i, ref, h_c[i], h_a[i], h_b[i]);
// ++errors;
// }
// }
// if (0 == errors) {
// printf("PASSED!\n");
// } else {
// printf("FAILED! - %d errors\n", errors);
// }
// Clean up
cleanup();
// return errors;
return 0;
}

View File

@@ -37,7 +37,7 @@ SRCS = main.cc
all: $(PROJECT) kernel.pocl
kernel.pocl: kernel.cl
LLVM_PREFIX=$(LLVM_PREFIX) POCL_DEBUG=all LD_LIBRARY_PATH=$(LLVM_PREFIX)/lib:$(POCL_CC_PATH)/lib $(POCL_CC_PATH)/bin/poclcc -LLCFLAGS $(K_LLCFLAGS) -CFLAGS $(K_CFLAGS) -LDFLAGS $(K_LDFLAGS) -o kernel.pocl kernel.cl
LLVM_PREFIX=$(LLVM_PREFIX) POCL_DEBUG=all LD_LIBRARY_PATH=$(LLVM_PREFIX)/lib:$(POCL_CC_PATH)/lib $(POCL_CC_PATH)/bin/poclcc -CFLAGS $(K_CFLAGS) -LDFLAGS $(K_LDFLAGS) -o kernel.pocl kernel.cl
$(PROJECT): $(SRCS)
$(CXX) $(CXXFLAGS) $^ $(LDFLAGS) -o $@

View File

@@ -0,0 +1,12 @@
__kernel void vecadd (__global const float *A,
__global const float *B,
__global float *C)
{
int gid = get_global_id(0);
float sum = 0.;
for (int i = 0; i < 1000; i++) {
int addr = gid + (i % 2);
sum += A[addr] + B[addr];
}
C[gid] = sum;
}

View File

@@ -52,6 +52,25 @@ static int read_kernel_file(const char* filename, uint8_t** data, size_t* size)
return 0;
}
static int write_operand_file(const char* filename, void* data, size_t size) {
if (nullptr == filename || nullptr == data || 0 == size)
return -1;
FILE* fp = fopen(filename, "wb");
if (NULL == fp) {
fprintf(stderr, "Failed to write operand data.\n");
return -1;
}
size_t wsize = fwrite(data, size, 1, fp);
if (wsize != 1) {
fprintf(stderr, "Failed to write operand data.\n");
return -1;
}
return 0;
}
static bool almost_equal(float a, float b, int ulp = 4) {
union fi_t { int i; float f; };
fi_t fa, fb;
@@ -156,6 +175,8 @@ int main (int argc, char **argv) {
kernel = CL_CHECK2(clCreateKernel(program, KERNEL_NAME, &_err));
// Set kernel arguments
// NOTE(hansung): clSetKernelArg doesn't seem to incur any device-specific
// operation
CL_CHECK(clSetKernelArg(kernel, 0, sizeof(cl_mem), (void *)&a_memobj));
CL_CHECK(clSetKernelArg(kernel, 1, sizeof(cl_mem), (void *)&b_memobj));
CL_CHECK(clSetKernelArg(kernel, 2, sizeof(cl_mem), (void *)&c_memobj));
@@ -173,10 +194,21 @@ int main (int argc, char **argv) {
//printf("*** [%d]: h_a=%f, h_b=%f\n", i, h_a[i], h_b[i]);
}
// Creating command queue
commandQueue = CL_CHECK2(clCreateCommandQueue(context, device_id, 0, &_err));
// NOTE(hansung): Dump operand buffer to a file
if (write_operand_file("vecadd.input.a.bin", h_a, nbytes) != 0)
return EXIT_FAILURE;
if (write_operand_file("vecadd.input.b.bin", h_b, nbytes) != 0)
return EXIT_FAILURE;
printf("Upload source buffers\n");
// Creating command queue
// NOTE(hansung): The 3rd properties arg is a bit-field, where fields like
// CL_QUEUE_OUT_OF_ORDER_EXEC_MODE_ENABLE can be set. With value of 0,
// nothing is set and the commands in the queue will be completed in-order.
// See OpenCL 1.2 spec, section 5.1
commandQueue = CL_CHECK2(clCreateCommandQueue(
context, device_id, 0 /* command-queue properties */, &_err));
printf("Upload source buffers\n");
CL_CHECK(clEnqueueWriteBuffer(commandQueue, a_memobj, CL_TRUE, 0, nbytes, h_a, 0, NULL, NULL));
CL_CHECK(clEnqueueWriteBuffer(commandQueue, b_memobj, CL_TRUE, 0, nbytes, h_b, 0, NULL, NULL));
@@ -185,6 +217,8 @@ int main (int argc, char **argv) {
size_t local_work_size[1] = {1};
auto time_start = std::chrono::high_resolution_clock::now();
CL_CHECK(clEnqueueNDRangeKernel(commandQueue, kernel, 1, NULL, global_work_size, local_work_size, 0, NULL, NULL));
// NOTE(hansung): clFinish blocks until all kernels in the command queue are
// finished. This seems to be what actually kicks off kernel execution.
CL_CHECK(clFinish(commandQueue));
auto time_end = std::chrono::high_resolution_clock::now();
double elapsed = std::chrono::duration_cast<std::chrono::milliseconds>(time_end - time_start).count();

File diff suppressed because it is too large Load Diff

View File

@@ -1,9 +1,9 @@
XLEN ?= 32
ifeq ($(XLEN),32)
RISCV_TOOLCHAIN_PATH = /opt/riscv-gnu-toolchain
RISCV_TOOLCHAIN_PATH ?= /opt/riscv-gnu-toolchain
else
RISCV_TOOLCHAIN_PATH = /opt/riscv64-gnu-toolchain
RISCV_TOOLCHAIN_PATH ?= /opt/riscv64-gnu-toolchain
endif
RISCV_PREFIX ?= riscv$(XLEN)-unknown-elf-

View File

@@ -1,9 +1,9 @@
XLEN ?= 32
ifeq ($(XLEN),32)
RISCV_TOOLCHAIN_PATH = /opt/riscv-gnu-toolchain
RISCV_TOOLCHAIN_PATH ?= /opt/riscv-gnu-toolchain
else
RISCV_TOOLCHAIN_PATH = /opt/riscv64-gnu-toolchain
RISCV_TOOLCHAIN_PATH ?= /opt/riscv64-gnu-toolchain
endif
RISCV_PREFIX ?= riscv$(XLEN)-unknown-elf-

View File

@@ -1,9 +1,9 @@
XLEN ?= 32
ifeq ($(XLEN),32)
RISCV_TOOLCHAIN_PATH = /opt/riscv-gnu-toolchain
RISCV_TOOLCHAIN_PATH ?= /opt/riscv-gnu-toolchain
else
RISCV_TOOLCHAIN_PATH = /opt/riscv64-gnu-toolchain
RISCV_TOOLCHAIN_PATH ?= /opt/riscv64-gnu-toolchain
endif
RISCV_PREFIX ?= riscv$(XLEN)-unknown-elf-

219
vortex-rtlsim.rc Normal file
View File

@@ -0,0 +1,219 @@
Magic 271485
Revision Verdi_S-2021.09-SP1-1
; Window Layout <x> <y> <width> <height> <signalwidth> <valuewidth>
viewPort 0 33 3840 1560 374 148
; File list:
; openDirFile [-d delimiter] [-s time_offset] [-rf auto_bus_rule_file] path_name file_name
openDirFile -d / "" "/scratch/hansung/src/vortex/trace.vcd.fsdb"
; file time scale:
; fileTimeScale ### s|ms|us|ns|ps
; signal spacing:
signalSpacing 5
; windowTimeUnit is used for zoom, cursor & marker
; waveform viewport range
zoom 75133.753950 75225.192159
cursor 75155.000000
marker 0.000000
; user define markers
; userMarker time_pos marker_name color linestyle
; visible top row signal index
top 42
; marker line index
markerPos 78
; event list
; addEvent event_name event_expression
; curEvent event_name
COMPLEX_EVENT_BEGIN
COMPLEX_EVENT_END
; toolbar current search type
; curSTATUS search_type
curSTATUS ByValue
addGroup "G1"
activeDirFile "" "/scratch/hansung/src/vortex/trace.vcd.fsdb"
addSignal -h 30 /TOP/clk
addSignal -h 30 -holdScope reset
addSignal -h 30 /TOP/Vortex/\genblk2[0] /cluster/\genblk2[0] /core/pipeline/dcache_req_valid[3:0]
addSignal -h 30 -holdScope dcache_rsp_ready
addSubGroup "Issue"
addSubGroup "Ibuffer"
addSignal -h 30 /TOP/Vortex/\genblk2[0] /cluster/\genblk2[0] /core/pipeline/issue/ibuffer/ibuffer_if/PC[31:0]
addSignal -h 30 -holdScope rs1[5:0]
addSignal -h 30 -holdScope wid[1:0]
endSubGroup "Ibuffer"
addSubGroup "gpr_rsp_if"
addSignal -h 30 -UNSIGNED -HEX /TOP/Vortex/\genblk2[0] /cluster/\genblk2[0] /core/pipeline/issue/dispatch/gpr_rsp_if/\rs1_data[0] [31:0]
addSignal -h 30 -holdScope \rs1_data[1] [31:0]
addSignal -h 30 -holdScope \rs1_data[2] [31:0]
addSignal -h 30 -holdScope \rs1_data[3] [31:0]
endSubGroup "gpr_rsp_if"
addSubGroup "Dispatch"
endSubGroup "Dispatch"
endSubGroup "Issue"
addSubGroup "Execute"
addSubGroup "LSU"
addSubGroup "lsu_req_if" -e FALSE
addSignal -h 30 /TOP/Vortex/\genblk2[0] /cluster/\genblk2[0] /core/pipeline/execute/lsu_req_if/ready
addSignal -h 30 -holdScope valid
addSignal -h 30 -UNSIGNED -HEX -holdScope PC[31:0]
addSignal -h 30 /TOP/Vortex/\genblk2[0] /cluster/\genblk2[0] /core/pipeline/execute/lsu_unit/lsu_req_if/\base_addr[0] [31:0]
addSignal -h 30 -holdScope \base_addr[1] [31:0]
addSignal -h 30 -holdScope \base_addr[2] [31:0]
addSignal -h 30 -holdScope \base_addr[3] [31:0]
addSignal -h 30 -holdScope offset[31:0]
addSignal -h 30 /TOP/Vortex/\genblk2[0] /cluster/\genblk2[0] /core/pipeline/execute/lsu_req_if/tmask[3:0]
addSignal -h 30 -holdScope op_type[3:0]
endSubGroup "lsu_req_if"
addSignal -h 30 /TOP/Vortex/\genblk2[0] /cluster/\genblk2[0] /core/pipeline/execute/lsu_unit/req_valid
addSignal -h 30 -holdScope req_pc[31:0]
addSignal -h 30 -holdScope dcache_req_ready
addSignal -h 30 -holdScope req_sent_mask[3:0]
endSubGroup "LSU"
addSubGroup "dcache_req_if"
addSignal -h 30 -UNSIGNED -HEX /TOP/Vortex/\genblk2[0] /cluster/\genblk2[0] /core/pipeline/execute/dcache_req_if/ready[3:0]
addSignal -h 30 -holdScope valid[3:0]
addSignal -h 30 /TOP/Vortex/\genblk2[0] /cluster/\genblk2[0] /core/pipeline/execute/lsu_unit/dcache_req_if/\addr[0] [29:0]
addSignal -h 30 -holdScope \addr[1] [29:0]
addSignal -h 30 -holdScope \addr[2] [29:0]
addSignal -h 30 -holdScope \addr[3] [29:0]
addSignal -h 30 /TOP/Vortex/\genblk2[0] /cluster/\genblk2[0] /core/mem_unit/dcache/\per_bank_core_req_addr[0] [25:0]
addSignal -h 30 -holdScope \per_bank_core_req_addr[1] [25:0]
addSignal -h 30 -holdScope \per_bank_core_req_addr[2] [25:0]
addSignal -h 30 -holdScope \per_bank_core_req_addr[3] [25:0]
endSubGroup "dcache_req_if"
addSubGroup "dcache_rsp_if"
addSignal -h 30 /TOP/Vortex/\genblk2[0] /cluster/\genblk2[0] /core/dcache_rsp_if/ready
addSignal -h 30 -holdScope valid
addSignal -h 30 /TOP/Vortex/\genblk2[0] /cluster/\genblk2[0] /core/pipeline/execute/lsu_unit/dcache_rsp_if/tag[48:0]
addSignal -h 30 /TOP/Vortex/\genblk2[0] /cluster/\genblk2[0] /core/dcache_rsp_if/tmask[3:0]
endSubGroup "dcache_rsp_if"
addSubGroup "alu_req_if" -e FALSE
addSignal -h 30 /TOP/Vortex/\genblk2[0] /cluster/\genblk2[0] /core/pipeline/execute/alu_req_if/PC[31:0]
addSignal -h 30 -holdScope tmask[3:0]
addSignal -h 30 -holdScope ready
addSignal -h 30 -holdScope valid
endSubGroup "alu_req_if"
endSubGroup "Execute"
addSubGroup "Decode" -e FALSE
addSignal -h 30 -UNSIGNED -HEX /TOP/Vortex/\genblk2[0] /cluster/\genblk2[0] /core/pipeline/decode/decode_if/tmask[3:0]
endSubGroup "Decode"
addGroup "L1 Dcache"
addSignal -h 30 /TOP/Vortex/\genblk2[0] /cluster/\genblk2[0] /core/mem_unit/dcache/core_req_ready[3:0]
addSignal -h 30 -UNSIGNED -HEX -holdScope core_req_valid[3:0]
addSignal -h 30 -holdScope core_req_rw[3:0]
addSignal -h 30 -holdScope \core_req_addr[0] [29:0]
addSignal -h 30 -holdScope \core_req_addr[1] [29:0]
addSignal -h 30 -holdScope \core_req_addr[2] [29:0]
addSignal -h 30 -holdScope \core_req_addr[3] [29:0]
addSubGroup "BankSel"
addSignal -h 30 -UNSIGNED -HEX /TOP/Vortex/\genblk2[0] /cluster/\genblk2[0] /core/mem_unit/dcache/core_req_bank_sel/\core_req_bid[0] [1:0]
addSignal -h 30 -holdScope \core_req_bid[1] [1:0]
addSignal -h 30 -holdScope \core_req_bid[2] [1:0]
addSignal -h 30 -holdScope \core_req_bid[3] [1:0]
addSignal -h 30 -holdScope \core_req_line_addr[0] [25:0]
addSignal -h 30 -holdScope \core_req_line_addr[1] [25:0]
addSignal -h 30 -holdScope \core_req_line_addr[2] [25:0]
addSignal -h 30 -holdScope \core_req_line_addr[3] [25:0]
addSignal -h 30 -holdScope \per_bank_core_req_tid_r[0][0] [1:0]
addSignal -h 30 -holdScope \per_bank_core_req_tid_r[1][0] [1:0]
addSignal -h 30 -holdScope \per_bank_core_req_tid_r[2][0] [1:0]
addSignal -h 30 -holdScope \per_bank_core_req_tid_r[3][0] [1:0]
addSignal -h 30 -UNSIGNED -BIN -holdScope per_bank_core_req_valid[3:0]
addSignal -h 30 -holdScope core_req_ready[3:0]
endSubGroup "BankSel"
addSignal -h 30 /TOP/Vortex/\genblk2[0] /cluster/\genblk2[0] /core/mem_unit/dcache/core_rsp_valid[0:0]
addSignal -h 30 -holdScope mem_req_valid
addSignal -h 30 -holdScope mem_req_rw
addSignal -h 30 -holdScope mem_rsp_valid
addGroup "L2"
addSignal -h 30 -UNSIGNED -HEX /TOP/Vortex/\genblk2[0] /cluster/genblk3/l2cache/core_req_ready[1:0]
addSignal -h 30 -holdScope core_req_valid[1:0]
addSignal -h 30 -holdScope mem_req_valid
addGroup "DRAM"
addSignal -h 30 /TOP/Vortex/\genblk2[0] /cluster/genblk3/l2cache/mem_req_valid
addSignal -h 30 -holdScope mem_rsp_valid
addGroup "G3"
; getSignalForm Scope Hierarchy Status
; active file of getSignalForm
activeDirFile "" "/scratch/hansung/src/vortex/trace.vcd.fsdb"
GETSIGNALFORM_SCOPE_HIERARCHY_BEGIN
getSignalForm close
"/TOP"
"/TOP/Vortex"
"/TOP/Vortex/\genblk2[0] "
"/TOP/Vortex/\genblk2[0] /cluster"
"/TOP/Vortex/\genblk2[0] /cluster/\genblk2[0] "
"/TOP/Vortex/\genblk2[0] /cluster/\genblk2[0] /core"
"/TOP/Vortex/\genblk2[0] /cluster/\genblk2[0] /core/dcache_rsp_if"
"/TOP/Vortex/\genblk2[0] /cluster/\genblk2[0] /core/mem_unit"
"/TOP/Vortex/\genblk2[0] /cluster/\genblk2[0] /core/mem_unit/dcache"
"/TOP/Vortex/\genblk2[0] /cluster/\genblk2[0] /core/mem_unit/dcache/\genblk7[0] "
"/TOP/Vortex/\genblk2[0] /cluster/\genblk2[0] /core/mem_unit/dcache/core_req_bank_sel"
"/TOP/Vortex/\genblk2[0] /cluster/\genblk2[0] /core/mem_unit/dcache/mem_req_arb"
"/TOP/Vortex/genblk3"
SCOPE_LIST_BEGIN
"/TOP"
"/TOP/Vortex"
"/TOP/Vortex/genblk3"
"/TOP/Vortex/\genblk2[0]"
"/TOP/Vortex/\genblk2[0] "
"/TOP/Vortex/\genblk2[0] /cluster/\genblk2[0] /core/dcache_rsp_if"
"/TOP/Vortex/\genblk2[0] /cluster/\genblk2[0] /core/dcache_req_if"
"/TOP/Vortex/\genblk2[0] /cluster"
"/TOP/Vortex/\genblk2[0] /cluster/\genblk2[0] "
"/TOP/Vortex/\genblk2[0] /cluster/\genblk2[0] /core"
"/TOP/Vortex/\genblk2[0] /cluster/\genblk2[0] /core/pipeline/execute/lsu_unit"
"/TOP/Vortex/\genblk2[0] /cluster/\genblk2[0] /core/pipeline"
"/TOP/Vortex/\genblk2[0] /cluster/\genblk2[0] /core/pipeline/execute"
"/TOP/Vortex/\genblk2[0] /cluster/\genblk2[0] /core/pipeline/execute/lsu_unit/dcache_rsp_if"
"/TOP/Vortex/\genblk2[0] /cluster/\genblk2[0] /core/pipeline/execute/lsu_unit/dcache_req_if"
"/TOP/Vortex/\genblk2[0] /cluster/\genblk2[0] /core/mem_unit"
"/TOP/Vortex/\genblk2[0] /cluster/\genblk2[0] /core/mem_unit/dcache"
"/TOP/Vortex/\genblk2[0] /cluster/\genblk2[0] /core/mem_unit/dcache_mem_req_if"
"/TOP/Vortex/\genblk2[0] /cluster/\genblk2[0] /core/mem_unit/dcache/mem_req_arb"
"/TOP/Vortex/\genblk2[0] /cluster/\genblk2[0] /core/mem_unit/dcache/\genblk7[0] "
"/TOP/Vortex/\genblk2[0] /cluster/\genblk2[0] /core/mem_unit/dcache/mem_req_arb/genblk1"
"/TOP/Vortex/\genblk2[0] /cluster/\genblk2[0] /core/pipeline/lsu_req_if"
"/TOP/Vortex/\genblk2[0] /cluster/\genblk2[0] /core/pipeline/issue"
"/TOP/Vortex/\genblk2[0] /cluster/\genblk2[0] /core/pipeline/execute/lsu_req_if"
"/TOP/Vortex/\genblk2[0] /cluster/\genblk2[0] /core/pipeline/execute/lsu_unit/lsu_req_if"
"/TOP/Vortex/\genblk2[0] /cluster/\genblk2[0] /core/pipeline/issue/dispatch"
"/TOP/Vortex/\genblk2[0] /cluster/\genblk2[0] /core/pipeline/issue/dispatch/ibuffer_if"
"/TOP/Vortex/\genblk2[0] /cluster/\genblk2[0] /core/pipeline/issue/dispatch/gpr_rsp_if"
"/TOP/Vortex/\genblk2[0] /cluster/\genblk2[0] /core/pipeline/issue/ibuffer"
"/TOP/Vortex/\genblk2[0] /cluster/\genblk2[0] /core/pipeline/issue/ibuffer_if"
"/TOP/Vortex/\genblk2[0] /cluster/\genblk2[0] /core/pipeline/issue/ibuffer/ibuffer_if"
"/TOP/Vortex/\genblk2[0] /cluster/\genblk2[0] /core/pipeline/issue/ibuffer/decode_if"
"/TOP/Vortex/\genblk2[0] /cluster/\genblk2[0] /core/pipeline/issue/gpr_rsp_if"
"/TOP/Vortex/\genblk2[0] /cluster/\genblk2[0] /core/pipeline/issue/gpr_req_if"
"/TOP/Vortex/\genblk2[0] /cluster/\genblk2[0] /core/mem_unit/dcache/core_req_bank_sel"
"/TOP/Vortex/\genblk2[0] /cluster/\genblk2[0] /core/mem_unit/dcache/core_req_bank_sel/genblk5"
"/TOP/Vortex/\genblk2[0] /cluster/\genblk2[0] /core/mem_unit/dcache/core_rsp_merge"
"/TOP/Vortex/\genblk2[0] /cluster/\genblk2[0] /core/mem_unit/dcache/core_req_bank_sel/genblk5/genblk1"
"/TOP/Vortex/\genblk2[0] /cluster/\genblk2[0] /core/mem_unit/dcache/core_req_bank_sel/genblk5/genblk1/genblk1"
"/TOP/Vortex/\genblk2[0] /cluster/\genblk2[0] /core/mem_unit/dcache/core_req_bank_sel/genblk5/genblk1/genblk1/unnamedblk7"
SCOPE_LIST_END
GETSIGNALFORM_SCOPE_HIERARCHY_END