Evaluation.summarize:v0
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
import weave
from weave.flow.scorer import transpose
from weave.flow.scorer import get_scorer_attributes
from weave.flow.scorer import auto_summarize
class EvaluationResults(weave.Object):
    """Weave object wrapping a table of rows.

    Passed to `summarize` as `eval_table`, which reads the rows through
    `list(eval_table.rows)`.
    """

    # Table of result rows. NOTE(review): presumably one row per evaluated
    # example, with a "scores" entry alongside other columns - confirm
    # against the code that builds this object.
    rows: weave.Table
@weave.op()
async def summarize(self, eval_table: EvaluationResults) -> dict:
    """Build a summary dict from an evaluation results table.

    The rows of ``eval_table`` are materialized and passed through
    ``transpose`` to obtain a mapping of column name to column values.
    Each column is then summarized:

    * The ``"scores"`` column is transposed again and, for every scorer in
      ``self.scorers``, the entry stored under that scorer's name is handed
      to the scorer's own summarize function (both obtained from
      ``get_scorer_attributes``). The result is stored under the scorer's
      name.
    * Every other column is passed to ``auto_summarize``; the result is
      stored under the column name only when it is truthy.

    Args:
        eval_table: Object whose ``rows`` attribute is iterable.
            NOTE(review): rows are presumably dict-like records that
            ``transpose`` can pivot into columns - confirm against
            ``weave.flow.scorer.transpose``.

    Returns:
        The summary dict, keyed by scorer name (for scores) or by column
        name (for everything else).

    Raises:
        KeyError: If the transposed ``"scores"`` column has no entry for a
            scorer's name (the lookup is a plain subscript).
    """
    eval_table_rows = list(eval_table.rows)
    cols = transpose(eval_table_rows)
    summary = {}
    for name, vals in cols.items():
        if name == "scores":
            # `self.scorers` may be None; treat that the same as "no scorers".
            scorers = self.scorers or []
            if not scorers:
                continue
            # The per-scorer view of the scores does not depend on which
            # scorer is being processed, so compute it once per column
            # instead of once per scorer.
            scorer_stats = transpose(vals)
            for scorer in scorers:
                scorer_name, _, summarize_fn = get_scorer_attributes(scorer)
                score_table = scorer_stats[scorer_name]
                summary[scorer_name] = summarize_fn(score_table)
        else:
            model_output_summary = auto_summarize(vals)
            # Skip columns for which auto_summarize yields nothing useful
            # (None / empty), so they do not clutter the summary.
            if model_output_summary:
                summary[name] = model_output_summary
    # Without this the op implicitly returned None despite the `-> dict`
    # annotation, discarding everything computed above.
    return summary