|
22 | 22 | #include "shared/source/memory_manager/graphics_allocation.h" |
23 | 23 | #include "shared/source/memory_manager/memory_manager.h" |
24 | 24 |
|
25 | | -#include "opencl/source/helpers/hardware_commands_helper.h" |
26 | | - |
27 | 25 | #include "level_zero/core/source/cmdlist/cmdlist_hw.h" |
28 | 26 | #include "level_zero/core/source/device/device_imp.h" |
29 | 27 | #include "level_zero/core/source/event/event.h" |
@@ -882,13 +880,13 @@ ze_result_t CommandListCoreFamily<gfxCoreFamily>::appendMemoryCopyRegion(void *d |
882 | 880 | size_t srcSize = 0; |
883 | 881 |
|
884 | 882 | if (srcRegion->depth > 1) { |
885 | | - uint hostPtrDstOffset = dstRegion->originX + ((dstRegion->originY) * dstPitch) + ((dstRegion->originZ) * dstSlicePitch); |
886 | | - uint hostPtrSrcOffset = srcRegion->originX + ((srcRegion->originY) * srcPitch) + ((srcRegion->originZ) * srcSlicePitch); |
| 883 | + uint32_t hostPtrDstOffset = dstRegion->originX + ((dstRegion->originY) * dstPitch) + ((dstRegion->originZ) * dstSlicePitch); |
| 884 | + uint32_t hostPtrSrcOffset = srcRegion->originX + ((srcRegion->originY) * srcPitch) + ((srcRegion->originZ) * srcSlicePitch); |
887 | 885 | dstSize = (dstRegion->width * dstRegion->height * dstRegion->depth) + hostPtrDstOffset; |
888 | 886 | srcSize = (srcRegion->width * srcRegion->height * srcRegion->depth) + hostPtrSrcOffset; |
889 | 887 | } else { |
890 | | - uint hostPtrDstOffset = dstRegion->originX + ((dstRegion->originY) * dstPitch); |
891 | | - uint hostPtrSrcOffset = srcRegion->originX + ((srcRegion->originY) * srcPitch); |
| 888 | + uint32_t hostPtrDstOffset = dstRegion->originX + ((dstRegion->originY) * dstPitch); |
| 889 | + uint32_t hostPtrSrcOffset = srcRegion->originX + ((srcRegion->originY) * srcPitch); |
892 | 890 | dstSize = (dstRegion->width * dstRegion->height) + hostPtrDstOffset; |
893 | 891 | srcSize = (srcRegion->width * srcRegion->height) + hostPtrSrcOffset; |
894 | 892 | } |
@@ -976,10 +974,10 @@ ze_result_t CommandListCoreFamily<gfxCoreFamily>::appendMemoryCopyKernel3d(NEO:: |
976 | 974 | ze_group_count_t dispatchFuncArgs{srcRegion->width / groupSizeX, srcRegion->height / groupSizeY, |
977 | 975 | srcRegion->depth / groupSizeZ}; |
978 | 976 |
|
979 | | - uint srcOrigin[3] = {(srcRegion->originX + static_cast<uint32_t>(srcOffset)), (srcRegion->originY), (srcRegion->originZ)}; |
980 | | - uint dstOrigin[3] = {(dstRegion->originX + static_cast<uint32_t>(dstOffset)), (dstRegion->originY), (dstRegion->originZ)}; |
981 | | - uint srcPitches[2] = {(srcPitch), (srcSlicePitch)}; |
982 | | - uint dstPitches[2] = {(dstPitch), (dstSlicePitch)}; |
| 977 | + uint32_t srcOrigin[3] = {(srcRegion->originX + static_cast<uint32_t>(srcOffset)), (srcRegion->originY), (srcRegion->originZ)}; |
| 978 | + uint32_t dstOrigin[3] = {(dstRegion->originX + static_cast<uint32_t>(dstOffset)), (dstRegion->originY), (dstRegion->originZ)}; |
| 979 | + uint32_t srcPitches[2] = {(srcPitch), (srcSlicePitch)}; |
| 980 | + uint32_t dstPitches[2] = {(dstPitch), (dstSlicePitch)}; |
983 | 981 |
|
984 | 982 | auto dstValPtr = static_cast<uintptr_t>(dstGA->getGpuAddress()); |
985 | 983 | auto srcValPtr = static_cast<uintptr_t>(srcGA->getGpuAddress()); |
@@ -1035,8 +1033,8 @@ ze_result_t CommandListCoreFamily<gfxCoreFamily>::appendMemoryCopyKernel2d(NEO:: |
1035 | 1033 |
|
1036 | 1034 | ze_group_count_t dispatchFuncArgs{srcRegion->width / groupSizeX, srcRegion->height / groupSizeY, 1u}; |
1037 | 1035 |
|
1038 | | - uint srcOrigin[2] = {(srcRegion->originX + static_cast<uint32_t>(srcOffset)), (srcRegion->originY)}; |
1039 | | - uint dstOrigin[2] = {(dstRegion->originX + static_cast<uint32_t>(dstOffset)), (dstRegion->originY)}; |
| 1036 | + uint32_t srcOrigin[2] = {(srcRegion->originX + static_cast<uint32_t>(srcOffset)), (srcRegion->originY)}; |
| 1037 | + uint32_t dstOrigin[2] = {(dstRegion->originX + static_cast<uint32_t>(dstOffset)), (dstRegion->originY)}; |
1040 | 1038 |
|
1041 | 1039 | auto dstValPtr = static_cast<uintptr_t>(dstGA->getGpuAddress()); |
1042 | 1040 | auto srcValPtr = static_cast<uintptr_t>(srcGA->getGpuAddress()); |
@@ -1374,11 +1372,10 @@ ze_result_t CommandListCoreFamily<gfxCoreFamily>::appendWaitOnEvents(uint32_t nu |
1374 | 1372 | if (event->isTimestampEvent) { |
1375 | 1373 | gpuAddr += offsetof(KernelTimestampEvent, contextEnd); |
1376 | 1374 | } |
1377 | | - |
1378 | | - NEO::HardwareCommandsHelper<GfxFamily>::programMiSemaphoreWait(*(commandContainer.getCommandStream()), |
1379 | | - gpuAddr, |
1380 | | - eventStateClear, |
1381 | | - COMPARE_OPERATION::COMPARE_OPERATION_SAD_NOT_EQUAL_SDD); |
| 1375 | + NEO::EncodeSempahore<GfxFamily>::addMiSemaphoreWaitCommand(*commandContainer.getCommandStream(), |
| 1376 | + gpuAddr, |
| 1377 | + eventStateClear, |
| 1378 | + COMPARE_OPERATION::COMPARE_OPERATION_SAD_NOT_EQUAL_SDD); |
1382 | 1379 |
|
1383 | 1380 | bool dcFlushEnable = (!event->waitScope) ? false : true; |
1384 | 1381 | if (dcFlushEnable) { |
|
0 commit comments