intel/perf: expose some utility functions

The Vulkan performance query extension is a bit lower level than the
GL one. Expose some of the functions to do the result accumulation
directly in the Anv driver.

Signed-off-by: Lionel Landwerlin <lionel.g.landwerlin@intel.com>
Reviewed-by: Rafael Antognolli <rafael.antognolli@intel.com>
This commit is contained in:
Lionel Landwerlin
2019-08-28 15:45:00 +03:00
parent a0e0e75db1
commit a338b7d739
2 changed files with 55 additions and 31 deletions

View File

@@ -583,14 +583,15 @@ kernel_has_dynamic_config_support(struct gen_perf_config *perf, int fd)
&invalid_config_id) < 0 && errno == ENOENT;
}
static bool
load_metric_id(struct gen_perf_config *perf, const char *guid,
bool
gen_perf_load_metric_id(struct gen_perf_config *perf_cfg,
const char *guid,
uint64_t *metric_id)
{
char config_path[280];
snprintf(config_path, sizeof(config_path), "%s/metrics/%s/id",
perf->sysfs_dev_dir, guid);
perf_cfg->sysfs_dev_dir, guid);
/* Don't recreate already loaded configs. */
return read_file_uint64(config_path, metric_id);
@@ -605,7 +606,7 @@ init_oa_configs(struct gen_perf_config *perf, int fd)
uint64_t config_id;
int ret;
if (load_metric_id(perf, query->guid, &config_id)) {
if (gen_perf_load_metric_id(perf, query->guid, &config_id)) {
DBG("metric set: %s (already loaded)\n", query->guid);
register_oa_config(perf, query, config_id);
continue;
@@ -964,8 +965,8 @@ gen8_read_report_clock_ratios(const uint32_t *report,
*unslice_freq_hz = unslice_freq * 16666667ULL;
}
static void
query_result_read_frequencies(struct gen_perf_query_result *result,
void
gen_perf_query_result_read_frequencies(struct gen_perf_query_result *result,
const struct gen_device_info *devinfo,
const uint32_t *start,
const uint32_t *end)
@@ -989,8 +990,8 @@ query_result_read_frequencies(struct gen_perf_query_result *result,
&result->unslice_frequency[1]);
}
static void
query_result_accumulate(struct gen_perf_query_result *result,
void
gen_perf_query_result_accumulate(struct gen_perf_query_result *result,
const struct gen_perf_query_info *query,
const uint32_t *start,
const uint32_t *end)
@@ -1031,8 +1032,8 @@ query_result_accumulate(struct gen_perf_query_result *result,
}
static void
query_result_clear(struct gen_perf_query_result *result)
void
gen_perf_query_result_clear(struct gen_perf_query_result *result)
{
memset(result, 0, sizeof(*result));
result->hw_id = 0xffffffff; /* invalid */
@@ -1292,7 +1293,7 @@ get_metric_id(struct gen_perf_config *perf,
}
struct gen_perf_query_info *raw_query = (struct gen_perf_query_info *)query;
if (!load_metric_id(perf, query->guid,
if (!gen_perf_load_metric_id(perf, query->guid,
&raw_query->oa_metrics_set_id)) {
DBG("Unable to read query guid=%s ID, falling back to test config\n", query->guid);
raw_query->oa_metrics_set_id = 1ULL;
@@ -1735,7 +1736,7 @@ gen_perf_begin_query(struct gen_perf_context *perf_ctx,
*/
buf->refcount++;
query_result_clear(&query->oa.result);
gen_perf_query_result_clear(&query->oa.result);
query->oa.results_accumulated = false;
add_to_unaccumulated_query_list(perf_ctx, query);
@@ -2203,7 +2204,8 @@ accumulate_oa_reports(struct gen_perf_context *perf_ctx,
}
if (add) {
query_result_accumulate(&query->oa.result, query->queryinfo,
gen_perf_query_result_accumulate(&query->oa.result,
query->queryinfo,
last, report);
}
@@ -2224,7 +2226,7 @@ accumulate_oa_reports(struct gen_perf_context *perf_ctx,
end:
query_result_accumulate(&query->oa.result, query->queryinfo,
gen_perf_query_result_accumulate(&query->oa.result, query->queryinfo,
last, end);
query->oa.results_accumulated = true;
@@ -2412,7 +2414,7 @@ gen_perf_get_query_data(struct gen_perf_context *perf_ctx,
read_gt_frequency(perf_ctx, query);
uint32_t *begin_report = query->oa.map;
uint32_t *end_report = query->oa.map + MI_RPC_BO_END_OFFSET_BYTES;
query_result_read_frequencies(&query->oa.result,
gen_perf_query_result_read_frequencies(&query->oa.result,
perf_ctx->devinfo,
begin_report,
end_report);

View File

@@ -255,12 +255,34 @@ struct gen_perf_config {
struct gen_perf_query_object;
const struct gen_perf_query_info* gen_perf_query_info(const struct gen_perf_query_object *);
struct gen_perf_context;
struct gen_perf_context *gen_perf_new_context(void *parent);
void gen_perf_init_metrics(struct gen_perf_config *perf_cfg,
const struct gen_device_info *devinfo,
int drm_fd);
/** Query i915 for a metric id using guid.
*/
bool gen_perf_load_metric_id(struct gen_perf_config *perf_cfg,
const char *guid,
uint64_t *metric_id);
/** Read the slice/unslice frequency from 2 OA reports and store then into
* result.
*/
void gen_perf_query_result_read_frequencies(struct gen_perf_query_result *result,
const struct gen_device_info *devinfo,
const uint32_t *start,
const uint32_t *end);
/** Accumulate the delta between 2 OA reports into result for a given query.
*/
void gen_perf_query_result_accumulate(struct gen_perf_query_result *result,
const struct gen_perf_query_info *query,
const uint32_t *start,
const uint32_t *end);
void gen_perf_query_result_clear(struct gen_perf_query_result *result);
struct gen_perf_context;
struct gen_perf_context *gen_perf_new_context(void *parent);
void gen_perf_init_context(struct gen_perf_context *perf_ctx,
struct gen_perf_config *perf_cfg,
void * ctx, /* driver context (eg, brw_context) */