Spaces:

geonmin-kim
/

NetsPresso_QA

Runtime error

App Files Files Community

NetsPresso_QA / tools /eval /trec_eval.9.0.4 /m_gm_bpref.c

geonmin-kim

Upload folder using huggingface_hub

d6585f5 almost 2 years ago

raw

history blame contribute delete

3.27 kB

	/*
	Copyright (c) 2008 - Chris Buckley.

	Permission is granted for use and modification of this file for
	research, non-commercial purposes.
	*/

	#include "common.h"
	#include "sysfunc.h"
	#include "trec_eval.h"
	#include "functions.h"
	#include "trec_format.h"

	/* Forward declaration: te_calc_gm_bpref is referenced by the
	   te_meas_gm_bpref initializer before its definition further down
	   in this file. */
	static int
	te_calc_gm_bpref (const EPI epi, const REL_INFO rel_info,
	const RESULTS results, const TREC_MEAS tm, TREC_EVAL *eval);

	/* See trec_eval.h for definition of TREC_MEAS.
	   Positional initializer for the "gm_bpref" measure: the measure name,
	   its explanation text, six identifiers, then NULL and -1.
	   The meaning of each slot is fixed by the TREC_MEAS declaration in
	   trec_eval.h (not visible from this file), so the entries must stay in
	   this order. Of the identifiers listed, te_calc_gm_bpref is the function
	   defined in this file; the others are declared elsewhere.
	   NOTE(review): "goemetric" in the explanation text looks like a typo for
	   "geometric"; it is part of a runtime string, so it is left untouched
	   here. */
	TREC_MEAS te_meas_gm_bpref =
	{"gm_bpref",
	" Binary preference (bpref), but using goemetric mean over topics\n\
	See the explanation for 'bpref' for the base measure for a single topic.\n\
	Gm_bpref uses the geometric mean to combine the single topic scores.\n\
	This rewards methods that are more consistent across topics as opposed to\n\
	high scores for some topics and low scores for others.\n\
	Gm_bpref is printed only as a summary measure across topics, not for the\n\
	individual topics.\n",
	te_init_meas_s_float,
	te_calc_gm_bpref,
	te_acc_meas_s,
	te_calc_avg_meas_s_gm,
	te_print_single_meas_empty,
	te_print_final_meas_s_float,
	NULL, -1};

	/*
	 * Per-topic calculation for gm_bpref.
	 *
	 * Forms the ranked relevance information for the topic via
	 * te_form_res_rels, accumulates bpref over the retrieved documents, and
	 * stores log (MAX (bpref, MIN_GEO_MEAN)) in
	 * eval->values[tm->eval_index].value.
	 *
	 * Returns UNDEF if te_form_res_rels returns UNDEF, otherwise 1.
	 */
	static int
	te_calc_gm_bpref (const EPI epi, const REL_INFO rel_info,
	                  const RESULTS results, const TREC_MEAS tm, TREC_EVAL *eval)
	{
	    RES_RELS res_rels;
	    long j;
	    long nonrel_so_far = 0;
	    long num_nonrel = 0;
	    double bpref = 0.0;
	    double nonrel_bound;

	    if (UNDEF == te_form_res_rels (epi, rel_info, results, &res_rels)) {
	        return (UNDEF);
	    }

	    /* Sum the rel_levels entries below epi->relevance_level; presumably
	       these are the per-level counts of judged docs, i.e. the number of
	       judged nonrel docs for the topic -- TODO confirm against RES_RELS */
	    for (j = 0; j < epi->relevance_level; j++) {
	        num_nonrel += res_rels.rel_levels[j];
	    }

	    /* Loop-invariant denominator of the preference fraction.  It is only
	       divided by once a nonrel doc has been seen (nonrel_so_far > 0). */
	    nonrel_bound = (double) MIN (num_nonrel, res_rels.num_rel);

	    /* Calculate judgement based measures (dependent on only
	       judged docs; no assumption of non-relevance if not judged) */
	    /* Binary Preference measures; here expressed as all docs with a higher
	       value of rel are to be preferred.  Optimize by keeping track of
	       nonrel seen so far */
	    for (j = 0; j < res_rels.num_ret; j++) {
	        if (res_rels.results_rel_list[j] == RELVALUE_NONPOOL) {
	            /* document not in pool. Skip */
	            continue;
	        }
	        if (res_rels.results_rel_list[j] == RELVALUE_UNJUDGED) {
	            /* document in pool but unjudged. Skip */
	            continue;
	        }

	        if (res_rels.results_rel_list[j] >= 0 &&
	            res_rels.results_rel_list[j] < epi->relevance_level) {
	            /* Judged nonrel doc */
	            nonrel_so_far++;
	            continue;
	        }

	        /* Judged Rel doc: add fraction of correct preferences. */
	        /* Special case nonrel_so_far == 0 to avoid division by 0 */
	        if (nonrel_so_far > 0) {
	            bpref += 1.0 -
	                (((double) MIN (nonrel_so_far, res_rels.num_rel)) /
	                 nonrel_bound);
	        }
	        else {
	            bpref += 1.0;
	        }
	    }
	    if (res_rels.num_rel) {
	        bpref /= res_rels.num_rel;
	    }

	    /* Original measure value is constrained to be greater than
	       MIN_GEO_MEAN (for time being .00001, since trec_eval prints to
	       four significant digits) */
	    eval->values[tm->eval_index].value =
	        (double) log ((double)(MAX (bpref, MIN_GEO_MEAN)));

	    /* Terminate the debug record with a newline so that the records of
	       successive topics do not run together on one line. */
	    if (epi->debug_level > 1) {
	        printf ("gm_bpref: bpref %6.4f, gm_bpref %6.4f\n",
	                bpref, eval->values[tm->eval_index].value);
	    }

	    return (1);
	}