From 726978277bf7365caf72b652dd54f983af8315ff Mon Sep 17 00:00:00 2001 From: Natanael Wildner Fraga Date: Thu, 28 Mar 2024 09:54:56 -0300 Subject: [PATCH 1/2] eval pattern-concat-logic --- evals/registry/data/pattern_concat_logic/samples.jsonl | 3 +++ evals/registry/evals/pattern-concat-logic.yaml | 7 +++++++ 2 files changed, 10 insertions(+) create mode 100644 evals/registry/data/pattern_concat_logic/samples.jsonl create mode 100644 evals/registry/evals/pattern-concat-logic.yaml diff --git a/evals/registry/data/pattern_concat_logic/samples.jsonl b/evals/registry/data/pattern_concat_logic/samples.jsonl new file mode 100644 index 0000000000..4c0b5e7a89 --- /dev/null +++ b/evals/registry/data/pattern_concat_logic/samples.jsonl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:64bf508962840fc78bb55b491f59073cbd5959d1af443bb14517d40242b6e434 +size 4684 diff --git a/evals/registry/evals/pattern-concat-logic.yaml b/evals/registry/evals/pattern-concat-logic.yaml new file mode 100644 index 0000000000..c1075a838a --- /dev/null +++ b/evals/registry/evals/pattern-concat-logic.yaml @@ -0,0 +1,7 @@ +pattern-concat-logic: + id: pattern-concat-logic.dev.v0 + metrics: [accuracy] +pattern-concat-logic.dev.v0: + class: evals.elsuite.basic.includes:Includes + args: + samples_jsonl: pattern_concat_logic/samples.jsonl \ No newline at end of file From 2b692c0df584be320e827af8c1e55c32b695e51c Mon Sep 17 00:00:00 2001 From: Natanael Wildner Fraga Date: Thu, 9 May 2024 10:17:36 -0300 Subject: [PATCH 2/2] Correction in some samples.jsonl data --- evals/registry/data/pattern_concat_logic/samples.jsonl | 4 ++-- 1 file changed, 2 insertions(+), 2 deletions(-) diff --git a/evals/registry/data/pattern_concat_logic/samples.jsonl b/evals/registry/data/pattern_concat_logic/samples.jsonl index 4c0b5e7a89..ad11927dde 100644 --- a/evals/registry/data/pattern_concat_logic/samples.jsonl +++ b/evals/registry/data/pattern_concat_logic/samples.jsonl @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:64bf508962840fc78bb55b491f59073cbd5959d1af443bb14517d40242b6e434 -size 4684 +oid sha256:b48e966f22809e0eee26550223080706d36542f0ed869ae996501fa68414e386 +size 5757