From 4ac11b6f0588d23b10c1988253dd1bc114dfb765 Mon Sep 17 00:00:00 2001 From: Adam Owada Date: Mon, 8 May 2023 01:52:43 -0700 Subject: [PATCH] Add Grid Position Tracking eval --- evals/registry/data/grid-position-tracking/samples.jsonl | 3 +++ evals/registry/evals/grid-position-tracking.yaml | 8 ++++++++ 2 files changed, 11 insertions(+) create mode 100644 evals/registry/data/grid-position-tracking/samples.jsonl create mode 100644 evals/registry/evals/grid-position-tracking.yaml diff --git a/evals/registry/data/grid-position-tracking/samples.jsonl b/evals/registry/data/grid-position-tracking/samples.jsonl new file mode 100644 index 0000000000..6a6e6d6794 --- /dev/null +++ b/evals/registry/data/grid-position-tracking/samples.jsonl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5cbb8df154dd2ff6a900f7fe36cbcbd9bd9345ab06b830d8f98e6f1c34d3a37e +size 81667 diff --git a/evals/registry/evals/grid-position-tracking.yaml b/evals/registry/evals/grid-position-tracking.yaml new file mode 100644 index 0000000000..5ebf8674b7 --- /dev/null +++ b/evals/registry/evals/grid-position-tracking.yaml @@ -0,0 +1,8 @@ +grid-position-tracking: + id: grid-position-tracking.dev.v0 + metrics: [accuracy] + +grid-position-tracking.dev.v0: + class: evals.elsuite.basic.match:Match + args: + samples_jsonl: grid-position-tracking/samples.jsonl \ No newline at end of file