@@ -769,15 +769,27 @@ static void l_dump_printf_buffer(cl_event event, cl_kernel kernel,
769
769
hal_dma_fn = acl_get_hal ()->copy_globalmem_to_hostmem ;
770
770
}
771
771
772
- void * b = (void *)((char *)kernel->printf_device_buffer ->block_allocation ->range .begin + kernel->processed_buffer_size );
773
- // hal_dma_fn(NULL, b, buffer, size - 64);
774
- hal_dma_fn ( NULL , b, buffer, size - kernel-> processed_buffer_size );
772
+ // void* b = (void*)((char*)kernel->printf_device_buffer->block_allocation->range.begin + kernel->processed_buffer_size);
773
+ // // hal_dma_fn(NULL, b, buffer, size - 64);
774
+
775
775
// hal_dma_fn(NULL, b, buffer, size - 64);
776
776
// The test segfaults if I use size - 64, because the test doesn't have that much data.
777
777
// What if I don't subtract 64?
778
+ printf (" total size is %d \n " , size);
779
+ printf (" kernel prcessed buffer size is %d \n " , kernel->processed_buffer_size );
780
+
781
+ void * unprocessed_begin = (void *)((char *)kernel->printf_device_buffer ->block_allocation ->range .begin + kernel->processed_buffer_size );
782
+ printf (" Hang may begin here?? \n " );
783
+ if (size > (unsigned int ) kernel->processed_buffer_size ){
784
+ printf (" ZIBAI has something to print! \n " );
785
+ hal_dma_fn (NULL , unprocessed_begin, buffer, size - kernel->processed_buffer_size );
786
+ } else {
787
+ printf (" Zibai Added, nothing to print \n " );
788
+ return ;
789
+ }
790
+
778
791
779
- // hal_dma_fn(NULL, kernel->printf_device_buffer->block_allocation->range.begin,
780
- // buffer, size);
792
+ // hal_dma_fn(NULL, kernel->printf_device_buffer->block_allocation->range.begin, buffer, size);
781
793
782
794
#ifdef DEBUG
783
795
if (debug_mode > 0 ) {
@@ -1025,7 +1037,7 @@ void acl_process_printf_buffer(void *user_data, acl_device_op_t *op) {
1025
1037
// buffer again.
1026
1038
// Zibai Testing
1027
1039
if (op->info .debug_dump == 1 ){
1028
- kernel->processed_buffer_size += num_bytes;
1040
+ kernel->processed_buffer_size += num_bytes; // TODO, Fix this, should be += processed bytes
1029
1041
} else {
1030
1042
// Full dump, clear this global var
1031
1043
kernel->processed_buffer_size = 0 ;
0 commit comments