diff --git a/evals/registry/data/logiqa-logical-reasoning-plus/logiqa-logical-reasoning-plus.jsonl b/evals/registry/data/logiqa-logical-reasoning-plus/logiqa-logical-reasoning-plus.jsonl
new file mode 100644
index 0000000000..8fe696c68c
--- /dev/null
+++ b/evals/registry/data/logiqa-logical-reasoning-plus/logiqa-logical-reasoning-plus.jsonl
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:c9b355240cd6255ffdaa97e05cef7e157ab63d52e2cbaa286cdec95101022f3e
+size 1013200
diff --git a/evals/registry/data/logiqa-logical-reasoning-plus/logiqav2-logical-reasoning-plus.jsonl b/evals/registry/data/logiqa-logical-reasoning-plus/logiqav2-logical-reasoning-plus.jsonl
new file mode 100644
index 0000000000..1b8baa25fc
--- /dev/null
+++ b/evals/registry/data/logiqa-logical-reasoning-plus/logiqav2-logical-reasoning-plus.jsonl
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:419874b2a62f5bac77cc1a6280f7557a0b2075456453bf6909fece3a8a001fba
+size 2582087
diff --git a/evals/registry/data/logiqa-logical-reasoning-plus/reclor-logical-reasoning-plus.jsonl b/evals/registry/data/logiqa-logical-reasoning-plus/reclor-logical-reasoning-plus.jsonl
new file mode 100644
index 0000000000..55faf8e20f
--- /dev/null
+++ b/evals/registry/data/logiqa-logical-reasoning-plus/reclor-logical-reasoning-plus.jsonl
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:cedfb531340aa051619041602e381efee6a4c3485014501c2885b6d61f56501d
+size 843548
diff --git a/evals/registry/eval_sets/logiqa-logical-reasoning-plus.yaml b/evals/registry/eval_sets/logiqa-logical-reasoning-plus.yaml
new file mode 100644
index 0000000000..6bf8971b1f
--- /dev/null
+++ b/evals/registry/eval_sets/logiqa-logical-reasoning-plus.yaml
@@ -0,0 +1,6 @@
+# Eval set grouping the three logical-reasoning-plus evals listed below.
+logiqa-logical-reasoning-plus:
+  evals:
+    - logiqa-logical-reasoning-plus
+    - logiqav2-logical-reasoning-plus
+    - reclor-logical-reasoning-plus
diff --git a/evals/registry/evals/logiqa-logical-reasoning-plus.yaml b/evals/registry/evals/logiqa-logical-reasoning-plus.yaml
new file mode 100644
index 0000000000..0ec4f4aacd
--- /dev/null
+++ b/evals/registry/evals/logiqa-logical-reasoning-plus.yaml
@@ -0,0 +1,29 @@
+# Registry entries for the logical-reasoning-plus evals. Each entry uses the
+# evals.elsuite.basic.match:Match class and lists accuracy as its metric.
+# All three samples files sit under the logiqa-logical-reasoning-plus data dir.
+logiqa-logical-reasoning-plus:
+  id: logiqa-logical-reasoning-plus.dev.v0
+  description: logical reasoning instruction for the logiqa plus dataset
+  metrics: [accuracy]
+logiqa-logical-reasoning-plus.dev.v0:
+  class: evals.elsuite.basic.match:Match
+  args:
+    samples_jsonl: logiqa-logical-reasoning-plus/logiqa-logical-reasoning-plus.jsonl
+
+logiqav2-logical-reasoning-plus:
+  id: logiqav2-logical-reasoning-plus.dev.v0
+  description: logical reasoning instruction for the logiqav2 plus dataset
+  metrics: [accuracy]
+logiqav2-logical-reasoning-plus.dev.v0:
+  class: evals.elsuite.basic.match:Match
+  args:
+    samples_jsonl: logiqa-logical-reasoning-plus/logiqav2-logical-reasoning-plus.jsonl
+
+reclor-logical-reasoning-plus:
+  id: reclor-logical-reasoning-plus.dev.v0
+  description: logical reasoning instruction for the reclor plus dataset
+  metrics: [accuracy]
+reclor-logical-reasoning-plus.dev.v0:
+  class: evals.elsuite.basic.match:Match
+  args:
+    samples_jsonl: logiqa-logical-reasoning-plus/reclor-logical-reasoning-plus.jsonl