diff --git a/tests/llmobs/llmobs_cassettes/tests.llmobs.test_llmobs_ragas_context_precision_evaluator.emits_traces_and_evaluations_on_exit.yaml b/tests/llmobs/llmobs_cassettes/tests.llmobs.test_llmobs_ragas_context_precision_evaluator.emits_traces_and_evaluations_on_exit.yaml deleted file mode 100644 index 1fbb302c10..0000000000 --- a/tests/llmobs/llmobs_cassettes/tests.llmobs.test_llmobs_ragas_context_precision_evaluator.emits_traces_and_evaluations_on_exit.yaml +++ /dev/null @@ -1,197 +0,0 @@ -interactions: -- request: - body: '{"messages": [{"content": "Given question, answer and context verify if - the context was useful in arriving at the given answer. Give verdict as \"1\" - if useful and \"0\" if not with json output.\n\nThe output should be a well-formatted - JSON instance that conforms to the JSON schema below.\n\nAs an example, for - the schema {\"properties\": {\"foo\": {\"title\": \"Foo\", \"description\": - \"a list of strings\", \"type\": \"array\", \"items\": {\"type\": \"string\"}}}, - \"required\": [\"foo\"]}\nthe object {\"foo\": [\"bar\", \"baz\"]} is a well-formatted - instance of the schema. The object {\"properties\": {\"foo\": [\"bar\", \"baz\"]}} - is not well-formatted.\n\nHere is the output JSON schema:\n```\n{\"description\": - \"Answer for the verification task wether the context was useful.\", \"type\": - \"object\", \"properties\": {\"reason\": {\"title\": \"Reason\", \"description\": - \"Reason for verification\", \"type\": \"string\"}, \"verdict\": {\"title\": - \"Verdict\", \"description\": \"Binary (0/1) verdict of verification\", \"type\": - \"integer\"}}, \"required\": [\"reason\", \"verdict\"]}\n```\n\nDo not return - any preamble or explanations, return only a pure JSON string surrounded by triple - backticks (```).\n\nExamples:\n\nquestion: \"What can you tell me about albert - Albert Einstein?\"\ncontext: \"Albert Einstein (14 March 1879 \u2013 18 April - 1955) was a German-born theoretical physicist, widely held to be one of the - greatest and most influential scientists of all time. Best known for developing - the theory of relativity, he also made important contributions to quantum mechanics, - and was thus a central figure in the revolutionary reshaping of the scientific - understanding of nature that modern physics accomplished in the first decades - of the twentieth century. His mass\u2013energy equivalence formula E = mc2, - which arises from relativity theory, has been called \\\"the world''s most famous - equation\\\". He received the 1921 Nobel Prize in Physics \\\"for his services - to theoretical physics, and especially for his discovery of the law of the photoelectric - effect\\\", a pivotal step in the development of quantum theory. His work is - also known for its influence on the philosophy of science. In a 1999 poll of - 130 leading physicists worldwide by the British journal Physics World, Einstein - was ranked the greatest physicist of all time. His intellectual achievements - and originality have made Einstein synonymous with genius.\"\nanswer: \"Albert - Einstein born in 14 March 1879 was German-born theoretical physicist, widely - held to be one of the greatest and most influential scientists of all time. - He received the 1921 Nobel Prize in Physics for his services to theoretical - physics. He published 4 papers in 1905. Einstein moved to Switzerland in 1895\"\nverification: - ```{\"reason\": \"The provided context was indeed useful in arriving at the - given answer. The context includes key information about Albert Einstein''s - life and contributions, which are reflected in the answer.\", \"verdict\": 1}```\n\nquestion: - \"who won 2020 icc world cup?\"\ncontext: \"The 2022 ICC Men''s T20 World Cup, - held from October 16 to November 13, 2022, in Australia, was the eighth edition - of the tournament. Originally scheduled for 2020, it was postponed due to the - COVID-19 pandemic. England emerged victorious, defeating Pakistan by five wickets - in the final to clinch their second ICC Men''s T20 World Cup title.\"\nanswer: - \"England\"\nverification: ```{\"reason\": \"the context was useful in clarifying - the situation regarding the 2020 ICC World Cup and indicating that England was - the winner of the tournament that was intended to be held in 2020 but actually - took place in 2022.\", \"verdict\": 1}```\n\nquestion: \"What is the tallest - mountain in the world?\"\ncontext: \"The Andes is the longest continental mountain - range in the world, located in South America. It stretches across seven countries - and features many of the highest peaks in the Western Hemisphere. The range - is known for its diverse ecosystems, including the high-altitude Andean Plateau - and the Amazon rainforest.\"\nanswer: \"Mount Everest.\"\nverification: ```{\"reason\": - \"the provided context discusses the Andes mountain range, which, while impressive, - does not include Mount Everest or directly relate to the question about the - world''s tallest mountain.\", \"verdict\": 0}```\n\nYour actual task:\n\nquestion: - \"What is the capital of France?\"\ncontext: \"The capital of France is Paris.\"\nanswer: - \"The capital of France is Paris\"\nverification: \n", "role": "user"}], "model": - "gpt-4o-mini", "n": 1, "stream": false, "temperature": 1e-08}' - headers: - accept: - - application/json - accept-encoding: - - gzip, deflate - connection: - - keep-alive - content-length: - - '4637' - content-type: - - application/json - host: - - api.openai.com - user-agent: - - OpenAI/Python 1.52.0 - x-stainless-arch: - - arm64 - x-stainless-async: - - 'false' - x-stainless-lang: - - python - x-stainless-os: - - MacOS - x-stainless-package-version: - - 1.52.0 - x-stainless-retry-count: - - '0' - x-stainless-runtime: - - CPython - x-stainless-runtime-version: - - 3.10.13 - method: POST - uri: https://api.openai.com/v1/chat/completions - response: - body: - string: !!binary | - H4sIAAAAAAAAAwAAAP//jFJNj9owFLznVzz5TFawrAjk1qLurdVKW7Vqmyox9gsxdWzLfnysEP+9 - cggE1D30EiVv3ozmzeSYADAlWQ5MNJxE63T6Qb5+W9ZfZPNz8/HF2/mrMPzH8vPy0/fn3Z6NIsOu - NijownoQtnUaSVlzhoVHThhVJ9l0uphl2WTeAa2VqCNt7Sh9smmrjEofx49P6ThLJ/Oe3VglMLAc - fiUAAMfuGX0aiQeWw3h0mbQYAl8jy69LAMxbHSeMh6ACcUNsNIDCGkLTWa+qahOsKcyxYB55fGU5 - FOxrg+C83SmJErr9A4FUHgXpNwjECQNQwwmoQRDcKeIabA3PnhuBoAK8cK/CCPaNEk38xgPvyB5r - jYJQgjIdm5uwR/9QsBEUbIdeKkHRxeRUmKqqbp17rLeBx/TMVut+frpGoe3aebsKPX6d18qo0JTn - A+PZgaxjHXpKAH53kW/vUmTO29ZRSfYPmii4mPWRs6HpAZ3OepAscX3DWlyAO71SInGlw01pTHDR - oByoQ8N8K5W9AZKbq/918572+XJl1v8jPwBCoCOUpfMYS7m7eFjzuOn6fH/tmnJnmIW3QNiWtTJr - 9M6r829Yu3K14lMxx2y8Yskp+QsAAP//AwD3kxRElAMAAA== - headers: - CF-Cache-Status: - - DYNAMIC - CF-RAY: - - 8f0a03dada4a1a07-EWR - Connection: - - keep-alive - Content-Encoding: - - gzip - Content-Type: - - application/json - Date: - - Thu, 12 Dec 2024 01:41:59 GMT - Server: - - cloudflare - Set-Cookie: - - __cf_bm=4cLkRN3PY0ywDy6QMgqCvUo.CNS0TwsQcaD5jxK7_gY-1733967719-1.0.1.1-2.RXD8FxUii4MNFP7.rwVGA.kO1IWKZO2S1Tk_qg6JQnbvS1CdSa5Zs9iY2u.LeDL7LSdOj_wu_vSeownk1aaA; - path=/; expires=Thu, 12-Dec-24 02:11:59 GMT; domain=.api.openai.com; HttpOnly; - Secure; SameSite=None - - _cfuvid=vyJTsjtFxMQ60N5X2hl.15Ts.0C6n9TY2Udt2zwtF1k-1733967719343-0.0.1.1-604800000; - path=/; domain=.api.openai.com; HttpOnly; Secure; SameSite=None - Transfer-Encoding: - - chunked - X-Content-Type-Options: - - nosniff - access-control-expose-headers: - - X-Request-ID - alt-svc: - - h3=":443"; ma=86400 - openai-organization: - - datadog-staging - openai-processing-ms: - - '1298' - openai-version: - - '2020-10-01' - strict-transport-security: - - max-age=31536000; includeSubDomains; preload - x-ratelimit-limit-requests: - - '30000' - x-ratelimit-limit-tokens: - - '150000000' - x-ratelimit-remaining-requests: - - '29999' - x-ratelimit-remaining-tokens: - - '149998897' - x-ratelimit-reset-requests: - - 2ms - x-ratelimit-reset-tokens: - - 0s - x-request-id: - - req_43f2a90eb7cbf539dca15be67231801c - status: - code: 200 - message: OK -- request: - body: '{"data": {"type": "evaluation_metric", "attributes": {"metrics": [{"span_id": - "171867700624094790", "trace_id": "675a3f650000000010166e6542ea0ba8", "label": - "ragas_context_precision", "metric_type": "score", "timestamp_ms": 1733967719288, - "score_value": 1.0, "ml_app": "unnamed-ml-app", "tags": ["ddtrace.version:2.15.0.dev406+ge04c8acf7.d20241210", - "ml_app:unnamed-ml-app"], "metadata": {"_dd.evaluation_kind": "context_precision", - "_dd.evaluation_span": {"span_id": "8227163496056680773", "trace_id": "675a3f6500000000e42b67cfbbbba3b1"}}}]}}}' - headers: - Content-Type: - - application/json - DD-API-KEY: - - XXXXXX - method: POST - uri: https://api.datad0g.com/api/intake/llm-obs/v1/eval-metric - response: - body: - string: '{"data":{"id":"92ff21e8-7018-4a29-b8c7-21c24b9fa74d","type":"evaluation_metric","attributes":{"metrics":[{"id":"giRg5dS154","join_on":{"span":{"trace_id":"675a3f650000000010166e6542ea0ba8","span_id":"171867700624094790"}},"trace_id":"675a3f650000000010166e6542ea0ba8","span_id":"171867700624094790","timestamp_ms":1733967719288,"ml_app":"unnamed-ml-app","metric_type":"score","label":"ragas_context_precision","score_value":1,"tags":["ddtrace.version:2.15.0.dev406+ge04c8acf7.d20241210","ml_app:unnamed-ml-app"]}]}}}' - headers: - content-length: - - '516' - content-security-policy: - - frame-ancestors 'self'; report-uri https://logs.browser-intake-datadoghq.com/api/v2/logs?dd-api-key=pub293163a918901030b79492fe1ab424cf&dd-evp-origin=content-security-policy&ddsource=csp-report&ddtags=site%3Adatad0g.com - content-type: - - application/vnd.api+json - date: - - Thu, 12 Dec 2024 01:42:00 GMT - strict-transport-security: - - max-age=31536000; includeSubDomains; preload - vary: - - Accept-Encoding - x-content-type-options: - - nosniff - x-frame-options: - - SAMEORIGIN - status: - code: 202 - message: Accepted -version: 1