Skip to content

Commit

Permalink
Fix typo
Browse files Browse the repository at this point in the history
  • Loading branch information
lolipopshock committed May 4, 2024
1 parent 9ee3ef0 commit d83ab8c
Show file tree
Hide file tree
Showing 2 changed files with 7 additions and 8 deletions.
15 changes: 7 additions & 8 deletions collm/eval.py
Original file line number Diff line number Diff line change
Expand Up @@ -725,7 +725,7 @@ def eval_tydiqa(pred_data, orig_data):
pred_data = pred_data["train"]

metric = evaluate.load("squad")
- data_languages = set(orig_data["lang"])
+ data_languages = sorted(list(set(orig_data["lang"])))
target = [ele.strip().split("\n\n")[0] if ele else "" for ele in pred_data["generated_text"]]

eval_scores = {}
Expand All @@ -743,18 +743,17 @@ def eval_tydiqa(pred_data, orig_data):
eval_scores["average"] = {
metric: np.mean([scores[metric] for scores in eval_scores.values()]) for metric in ["exact_match", "f1"]
}
-
- def_rate = np.array([(np.array(ele["deferral_prob"]) > ele["def_threshold"]).mean() for ele in pred_data]).mean()
- th = pred_data["def_threshold"][0]
-
- return {
- "threshold": th,
- "def_rate": def_rate,
+ result = {
"exact_match": eval_scores["average"]["exact_match"],
"f1": eval_scores["average"]["f1"],
"performance": eval_scores,
}
+
+ if "deferral_prob" in pred_data.column_names:
+ _add_deferral_probs(pred_data, result)
+
+ return result


def eval_math(
pred_data,
Expand Down
File renamed without changes.

0 comments on commit d83ab8c

Please sign in to comment.