diff --git a/evals/registry/data/04_mechanism_QA/mechanism_QA.jsonl b/evals/registry/data/04_mechanism_QA/mechanism_QA.jsonl new file mode 100644 index 0000000000..09097299ca --- /dev/null +++ b/evals/registry/data/04_mechanism_QA/mechanism_QA.jsonl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:da36b7d682d814e3102a67df609cd8bb26d08acec983265e28fa7e7154745852 +size 15794 diff --git a/evals/registry/data/04_sol_QA/sol_QA.jsonl b/evals/registry/data/04_sol_QA/sol_QA.jsonl index cf97f5f676..b373b28c3d 100644 --- a/evals/registry/data/04_sol_QA/sol_QA.jsonl +++ b/evals/registry/data/04_sol_QA/sol_QA.jsonl @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:aa86d3995689464a8555fbd4d1122eb1454e0bfa4d157446306c905547bc5443 -size 27054 +oid sha256:afc34f4b912fd05d16db14f0050dc6a71f74bc84bc6549265543253ce6a70728 +size 29931 diff --git a/evals/registry/eval_sets/chemistry_electrolytes.yaml b/evals/registry/eval_sets/chemistry_electrolytes.yaml index 1db7666311..78f94055eb 100644 --- a/evals/registry/eval_sets/chemistry_electrolytes.yaml +++ b/evals/registry/eval_sets/chemistry_electrolytes.yaml @@ -1,5 +1,5 @@ chemistry_electrolytes: evals: - solubility_large - - sol_reaction - - sol_QA \ No newline at end of file + - solQA + - mechanismQA \ No newline at end of file diff --git a/evals/registry/evals/04_mechanism_QA.yaml b/evals/registry/evals/04_mechanism_QA.yaml new file mode 100644 index 0000000000..204c2c6e5d --- /dev/null +++ b/evals/registry/evals/04_mechanism_QA.yaml @@ -0,0 +1,9 @@ + +mechanismQA: + id: mechanismQA.dev.v0 + metrics: [accuracy] + +mechanismQA.dev.v0: + class: evals.elsuite.rag_match_fuzzy:RAGMatch + args: + samples_jsonl: 04_mechanism_QA/mechanism_QA.jsonl \ No newline at end of file