diff --git a/src/wandbot/evaluation/weave_eval/main.py b/src/wandbot/evaluation/weave_eval/main.py index 867705b..1dc33e0 100644 --- a/src/wandbot/evaluation/weave_eval/main.py +++ b/src/wandbot/evaluation/weave_eval/main.py @@ -65,7 +65,6 @@ async def get_eval_record( return { "system_prompt": response["system_prompt"], "generated_answer": response["answer"], - "retrieved_contexts": response["source_documents"], "retrieved_contexts_individual": parse_text_to_json(response["source_documents"]), "model": response["model"], "total_tokens": response["total_tokens"], @@ -103,7 +102,6 @@ async def get_answer_correctness( "answer_correctness": result.dict()["passing"] } - dataset_ref = weave.ref(config.eval_dataset).get() question_rows = dataset_ref.rows question_rows = [