Skip to content

Commit ffc62b6

Browse files
ericxu233pcolberg
authored andcommitted
Add direct write for new start bit register
Enabled backwards compatibility with the new CSR change
1 parent 9a313e7 commit ffc62b6

File tree

2 files changed

+53
-22
lines changed

2 files changed

+53
-22
lines changed

include/acl_kernel_if.h

Lines changed: 3 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -60,6 +60,9 @@ typedef struct {
6060

6161
// Track debug printf activity
6262
time_ns last_printf_dump = 0;
63+
64+
// CRA address offset for backwards compatibility
65+
unsigned int cra_address_offset = 8;
6366
} acl_kernel_if;
6467

6568
// *********************** Public functions **************************

src/acl_kernel_if.cpp

Lines changed: 50 additions & 22 deletions
Original file line numberDiff line numberDiff line change
@@ -45,7 +45,8 @@ acl_process_autorun_profiler_scan_chain(unsigned int physical_device_id,
4545
// address map.
4646
#define CSR_VERSION_ID_18_1 (3)
4747
#define CSR_VERSION_ID_19_1 (4)
48-
#define CSR_VERSION_ID CSR_VERSION_ID_19_1
48+
#define CSR_VERSION_ID_23_1 (5)
49+
#define CSR_VERSION_ID CSR_VERSION_ID_23_1
4950

5051
// Address map
5152
// For unit tests to work, these defines must match those in the unit test
@@ -66,6 +67,8 @@ acl_process_autorun_profiler_scan_chain(unsigned int physical_device_id,
6667
#define KERNEL_ROM_SIZE_BYTES 8
6768

6869
// Byte offsets into the CRA:
70+
// For CSR version >= 5, every byte offset below except the CSR itself is
71+
// pushed back by kern->cra_address_offset later on, at runtime
6972
#define KERNEL_OFFSET_CSR 0
7073
#define KERNEL_OFFSET_PRINTF_BUFFER_SIZE 0x4
7174
#define KERNEL_OFFSET_CSR_PROFILE_CTRL 0xC
@@ -75,11 +78,14 @@ acl_process_autorun_profiler_scan_chain(unsigned int physical_device_id,
7578
#define KERNEL_OFFSET_FINISH_COUNTER 0x28
7679
#define KERNEL_OFFSET_INVOCATION_IMAGE 0x30
7780

81+
// CSR version >= 5 byte offsets
82+
#define KERNEL_OFFSET_START_REG 0x8
83+
7884
// Backwards compatibility with CSR_VERSION_ID 3
7985
#define KERNEL_OFFSET_INVOCATION_IMAGE_181 0x28
8086

8187
// Bit positions
82-
#define KERNEL_CSR_GO 0
88+
#define KERNEL_CSR_START 0
8389
#define KERNEL_CSR_DONE 1
8490
#define KERNEL_CSR_STALLED 3
8591
#define KERNEL_CSR_UNSTALL 4
@@ -593,8 +599,9 @@ static int acl_kernel_if_issue_profile_hw_command(acl_kernel_if *kern,
593599
int status;
594600
acl_assert_locked_or_sig();
595601
assert(acl_kernel_if_is_valid(kern));
596-
status = acl_kernel_cra_read(kern, accel_id, KERNEL_OFFSET_CSR_PROFILE_CTRL,
597-
&profile_ctrl_val);
602+
status = acl_kernel_cra_read(
603+
kern, accel_id, KERNEL_OFFSET_CSR_PROFILE_CTRL + kern->cra_address_offset,
604+
&profile_ctrl_val);
598605
if (status)
599606
return status;
600607
ACL_KERNEL_IF_DEBUG_MSG(
@@ -609,8 +616,9 @@ static int acl_kernel_if_issue_profile_hw_command(acl_kernel_if *kern,
609616
ACL_KERNEL_IF_DEBUG_MSG(
610617
kern, ":: Issue profile HW command:: Accelerator %d new csr is %x.\n",
611618
accel_id, profile_ctrl_val);
612-
status = acl_kernel_cra_write(kern, accel_id, KERNEL_OFFSET_CSR_PROFILE_CTRL,
613-
profile_ctrl_val);
619+
status = acl_kernel_cra_write(
620+
kern, accel_id, KERNEL_OFFSET_CSR_PROFILE_CTRL + kern->cra_address_offset,
621+
profile_ctrl_val);
614622
if (status)
615623
return status;
616624
return 0;
@@ -1040,6 +1048,11 @@ int acl_kernel_if_post_pll_config_init(acl_kernel_if *kern) {
10401048
ACL_KERNEL_IF_DEBUG_MSG(kern,
10411049
"Read CSR version from kernel 0: Version = %u\n",
10421050
kern->csr_version);
1051+
if (kern->csr_version < 5) {
1052+
// Register addresses are pushed back since previous versions
1053+
// don't have the start register
1054+
kern->cra_address_offset = 0;
1055+
}
10431056
} else {
10441057
kern->csr_version = 0;
10451058
}
@@ -1220,7 +1233,8 @@ void acl_kernel_if_launch_kernel_on_custom_sof(
12201233
}
12211234

12221235
} else {
1223-
offset = (unsigned int)KERNEL_OFFSET_INVOCATION_IMAGE;
1236+
offset = (unsigned int)(KERNEL_OFFSET_INVOCATION_IMAGE +
1237+
kern->cra_address_offset);
12241238
image_p = (uintptr_t) & (image->work_dim);
12251239
image_size_static =
12261240
(size_t)((uintptr_t) & (image->arg_value) - (uintptr_t) &
@@ -1279,11 +1293,15 @@ void acl_kernel_if_launch_kernel_on_custom_sof(
12791293
return;
12801294
}
12811295

1282-
unsigned int new_csr = 0;
1283-
acl_kernel_cra_read(kern, accel_id, KERNEL_OFFSET_CSR, &new_csr);
1284-
ACL_KERNEL_SET_BIT(new_csr, KERNEL_CSR_GO);
1285-
acl_kernel_cra_write(kern, accel_id, KERNEL_OFFSET_CSR, new_csr);
1286-
1296+
// Backwards compatibility for CSR versions prior to 2023.1
1297+
if (kern->csr_version < CSR_VERSION_ID) {
1298+
unsigned int new_csr = 0;
1299+
acl_kernel_cra_read(kern, accel_id, KERNEL_OFFSET_CSR, &new_csr);
1300+
ACL_KERNEL_SET_BIT(new_csr, KERNEL_CSR_START);
1301+
acl_kernel_cra_write(kern, accel_id, KERNEL_OFFSET_CSR, new_csr);
1302+
} else {
1303+
acl_kernel_cra_write(kern, accel_id, KERNEL_OFFSET_START_REG, 1);
1304+
}
12871305
// IRQ handler takes care of the completion event through
12881306
// acl_kernel_if_update_status()
12891307
}
@@ -1362,7 +1380,9 @@ static void acl_kernel_if_update_status_query(acl_kernel_if *kern,
13621380
// kernel arguments
13631381
printf_size = 0;
13641382
if (kern->accel_num_printfs[accel_id] > 0) {
1365-
acl_kernel_cra_read(kern, accel_id, KERNEL_OFFSET_PRINTF_BUFFER_SIZE,
1383+
acl_kernel_cra_read(kern, accel_id,
1384+
KERNEL_OFFSET_PRINTF_BUFFER_SIZE +
1385+
kern->cra_address_offset,
13661386
&printf_size);
13671387
assert(printf_size <= ACL_PRINTF_BUFFER_TOTAL_SIZE);
13681388
ACL_KERNEL_IF_DEBUG_MSG(kern,
@@ -1427,7 +1447,8 @@ static void acl_kernel_if_update_status_query(acl_kernel_if *kern,
14271447
// Only expect single completion for older csr version
14281448
finish_counter = 1;
14291449
} else {
1430-
acl_kernel_cra_read(kern, accel_id, KERNEL_OFFSET_FINISH_COUNTER,
1450+
acl_kernel_cra_read(kern, accel_id,
1451+
KERNEL_OFFSET_FINISH_COUNTER + kern->cra_address_offset,
14311452
&finish_counter);
14321453
ACL_KERNEL_IF_DEBUG_MSG(kern, ":: Accelerator %d has %d finishes.\n",
14331454
accel_id, finish_counter);
@@ -1586,8 +1607,9 @@ void acl_kernel_if_debug_dump_printf(acl_kernel_if *kern, unsigned k) {
15861607
next_queue_back = kern->accel_queue_back[k] + 1;
15871608

15881609
if (kern->accel_num_printfs[k] > 0) {
1589-
acl_kernel_cra_read(kern, k, KERNEL_OFFSET_PRINTF_BUFFER_SIZE,
1590-
&printf_size);
1610+
acl_kernel_cra_read(
1611+
kern, k, KERNEL_OFFSET_PRINTF_BUFFER_SIZE + kern->cra_address_offset,
1612+
&printf_size);
15911613
assert(printf_size <= ACL_PRINTF_BUFFER_TOTAL_SIZE);
15921614
ACL_KERNEL_IF_DEBUG_MSG(
15931615
kern, ":: Accelerator %d printf buffer size is %d.\n", k, printf_size);
@@ -1785,16 +1807,19 @@ static uint64_t acl_kernel_if_get_profile_data_word(acl_kernel_if *kern,
17851807
#ifdef _WIN32
17861808
// Use 32-bit reads on Windows.
17871809
unsigned int low_word, high_word;
1788-
status = acl_kernel_cra_read(kern, accel_id, KERNEL_OFFSET_CSR_PROFILE_DATA,
1789-
&low_word);
1810+
status = acl_kernel_cra_read(
1811+
kern, accel_id, KERNEL_OFFSET_CSR_PROFILE_DATA + kern->cra_address_offset,
1812+
&low_word);
17901813
if (status)
17911814
return (uint64_t)status;
17921815
ACL_KERNEL_IF_DEBUG_MSG(kern,
17931816
":: Read profile hardware:: Accelerator %d "
17941817
"profile_data low_word is %x.\n",
17951818
accel_id, low_word);
17961819
status = acl_kernel_cra_read(kern, accel_id,
1797-
KERNEL_OFFSET_CSR_PROFILE_DATA + 4, &high_word);
1820+
KERNEL_OFFSET_CSR_PROFILE_DATA + 4 +
1821+
kern->cra_address_offset,
1822+
&high_word);
17981823
if (status)
17991824
return (uint64_t)status;
18001825
ACL_KERNEL_IF_DEBUG_MSG(kern,
@@ -1805,7 +1830,8 @@ static uint64_t acl_kernel_if_get_profile_data_word(acl_kernel_if *kern,
18051830
((((uint64_t)high_word) & 0xFFFFFFFF) << 32) | (low_word & 0xFFFFFFFF);
18061831
#else
18071832
status = acl_kernel_cra_read_64b(
1808-
kern, accel_id, KERNEL_OFFSET_CSR_PROFILE_DATA, &read_result);
1833+
kern, accel_id, KERNEL_OFFSET_CSR_PROFILE_DATA + kern->cra_address_offset,
1834+
&read_result);
18091835
if (status)
18101836
return (uint64_t)status;
18111837
ACL_KERNEL_IF_DEBUG_MSG(kern,
@@ -1905,7 +1931,8 @@ int acl_kernel_if_set_profile_start_cycle(acl_kernel_if *kern, cl_uint accel_id,
19051931
assert(acl_kernel_if_is_valid(kern));
19061932
assert(accel_id < kern->num_accel);
19071933
status = acl_kernel_cra_write_64b(
1908-
kern, accel_id, KERNEL_OFFSET_CSR_PROFILE_START_CYCLE, value);
1934+
kern, accel_id,
1935+
KERNEL_OFFSET_CSR_PROFILE_START_CYCLE + kern->cra_address_offset, value);
19091936

19101937
return status;
19111938
}
@@ -1919,6 +1946,7 @@ int acl_kernel_if_set_profile_stop_cycle(acl_kernel_if *kern, cl_uint accel_id,
19191946
assert(acl_kernel_if_is_valid(kern));
19201947
assert(accel_id < kern->num_accel);
19211948
status = acl_kernel_cra_write_64b(
1922-
kern, accel_id, KERNEL_OFFSET_CSR_PROFILE_STOP_CYCLE, value);
1949+
kern, accel_id,
1950+
KERNEL_OFFSET_CSR_PROFILE_STOP_CYCLE + kern->cra_address_offset, value);
19231951
return status;
19241952
}

0 commit comments

Comments
 (0)