summaryrefslogtreecommitdiff
diff options
context:
space:
mode:
authorLi Peng <peng.li@linux.intel.com>2014-05-26 19:25:59 +0800
committerZhigang Gong <zhigang.gong@intel.com>2014-05-30 14:53:28 +0800
commit0db692659e4bc6ce25c19cb56ae07f2c46425d6e (patch)
tree92fac8f676d67cc1576f8d3a5c8540c987abfa63
parentf9074f9ff4e24da2ee92fc84a8dcff0604346d28 (diff)
downloadbeignet-0db692659e4bc6ce25c19cb56ae07f2c46425d6e.tar.gz
Fix timestamp on HASWELL
The GPU timestamp should be lower 36 bit on HASWELL Signed-off-by: Li Peng <peng.li@intel.com> Reviewed-by: He Junyan <junyan.he@inbox.com>
-rw-r--r--src/cl_driver.h2
-rw-r--r--src/cl_event.c4
-rw-r--r--src/intel/intel_gpgpu.c26
3 files changed, 20 insertions, 12 deletions
diff --git a/src/cl_driver.h b/src/cl_driver.h
index 9dc23305..3e01c927 100644
--- a/src/cl_driver.h
+++ b/src/cl_driver.h
@@ -193,7 +193,7 @@ typedef void (cl_gpgpu_event_delete_cb)(cl_gpgpu_event);
extern cl_gpgpu_event_delete_cb *cl_gpgpu_event_delete;
/* Get a event time stamp */
-typedef void (cl_gpgpu_event_get_exec_timestamp_cb)(cl_gpgpu_event, int, uint64_t*);
+typedef void (cl_gpgpu_event_get_exec_timestamp_cb)(cl_gpgpu, cl_gpgpu_event, int, uint64_t*);
extern cl_gpgpu_event_get_exec_timestamp_cb *cl_gpgpu_event_get_exec_timestamp;
/* Get current GPU time stamp */
diff --git a/src/cl_event.c b/src/cl_event.c
index 101e735f..bcd4a6fb 100644
--- a/src/cl_event.c
+++ b/src/cl_event.c
@@ -498,11 +498,11 @@ cl_int cl_event_get_timestamp(cl_event event, cl_profiling_info param_name)
event->timestamp[param_name - CL_PROFILING_COMMAND_QUEUED] = ret_val;
return CL_SUCCESS;
} else if(param_name == CL_PROFILING_COMMAND_START) {
- cl_gpgpu_event_get_exec_timestamp(event->gpgpu_event, 0, &ret_val);
+ cl_gpgpu_event_get_exec_timestamp(gpgpu, event->gpgpu_event, 0, &ret_val);
event->timestamp[param_name - CL_PROFILING_COMMAND_QUEUED] = ret_val;
return CL_SUCCESS;
} else if (param_name == CL_PROFILING_COMMAND_END) {
- cl_gpgpu_event_get_exec_timestamp(event->gpgpu_event, 1, &ret_val);
+ cl_gpgpu_event_get_exec_timestamp(gpgpu, event->gpgpu_event, 1, &ret_val);
event->timestamp[param_name - CL_PROFILING_COMMAND_QUEUED] = ret_val;
return CL_SUCCESS;
}
diff --git a/src/intel/intel_gpgpu.c b/src/intel/intel_gpgpu.c
index fba480c8..bde9bd59 100644
--- a/src/intel/intel_gpgpu.c
+++ b/src/intel/intel_gpgpu.c
@@ -1135,8 +1135,12 @@ intel_gpgpu_event_get_gpu_cur_timestamp(intel_gpgpu_t* gpgpu, uint64_t* ret_ts)
drm_intel_bufmgr *bufmgr = gpgpu->drv->bufmgr;
drm_intel_reg_read(bufmgr, TIMESTAMP_ADDR, &result);
- result = result & 0xFFFFFFFFF0000000;
- result = result >> 28;
+ if (IS_HASWELL(gpgpu->drv->device_id)) {
+ result = result & 0x0000000FFFFFFFFF;
+ } else {
+ result = result & 0xFFFFFFFFF0000000;
+ result = result >> 28;
+ }
result *= 80;
*ret_ts = result;
@@ -1145,8 +1149,8 @@ intel_gpgpu_event_get_gpu_cur_timestamp(intel_gpgpu_t* gpgpu, uint64_t* ret_ts)
/* Get the GPU execute time. */
static void
-intel_gpgpu_event_get_exec_timestamp(intel_event_t *event,
- int index, uint64_t* ret_ts)
+intel_gpgpu_event_get_exec_timestamp(intel_gpgpu_t* gpgpu, intel_event_t *event,
+ int index, uint64_t* ret_ts)
{
uint64_t result = 0;
@@ -1156,11 +1160,15 @@ intel_gpgpu_event_get_exec_timestamp(intel_event_t *event,
uint64_t* ptr = event->ts_buf->virtual;
result = ptr[index];
- /* According to BSpec, the timestamp counter should be 36 bits,
- but comparing to the timestamp counter from IO control reading,
- we find the first 4 bits seems to be fake. In order to keep the
- timestamp counter conformable, we just skip the first 4 bits. */
- result = ((result & 0x0FFFFFFFF) << 4) * 80; //convert to nanoseconds
+ if (IS_HASWELL(gpgpu->drv->device_id))
+ result = (result & 0xFFFFFFFFF) * 80; //convert to nanoseconds
+ else
+ /* According to BSpec, the timestamp counter should be 36 bits,
+ but comparing to the timestamp counter from IO control reading,
+ we find the first 4 bits seems to be fake. In order to keep the
+ timestamp counter conformable, we just skip the first 4 bits.
+ */
+ result = ((result & 0x0FFFFFFFF) << 4) * 80; //convert to nanoseconds
*ret_ts = result;
drm_intel_gem_bo_unmap_gtt(event->ts_buf);