From e63f0668c9768db21323cb24095847dfdab5889c Mon Sep 17 00:00:00 2001 From: Evgeniy Aristov Date: Thu, 28 May 2026 20:32:05 +0300 Subject: [PATCH 1/2] Add BABILong results for Aegyx 0.1 --- babilong_evals/aegyx/Aegyx 0.1/SUBMISSION.md | 9 ++++++++ ...t_no_chat_template_no_system_prompt_no.csv | 21 ++++++++++++++++++ ..._no_chat_template_no_system_prompt_no.json | 18 +++++++++++++++ ...t_no_chat_template_no_system_prompt_no.csv | 21 ++++++++++++++++++ ..._no_chat_template_no_system_prompt_no.json | 18 +++++++++++++++ ...t_no_chat_template_no_system_prompt_no.csv | 21 ++++++++++++++++++ ..._no_chat_template_no_system_prompt_no.json | 18 +++++++++++++++ ...t_no_chat_template_no_system_prompt_no.csv | 21 ++++++++++++++++++ ..._no_chat_template_no_system_prompt_no.json | 18 +++++++++++++++ ...t_no_chat_template_no_system_prompt_no.csv | 21 ++++++++++++++++++ ..._no_chat_template_no_system_prompt_no.json | 18 +++++++++++++++ ...t_no_chat_template_no_system_prompt_no.csv | 21 ++++++++++++++++++ ..._no_chat_template_no_system_prompt_no.json | 18 +++++++++++++++ ...t_no_chat_template_no_system_prompt_no.csv | 21 ++++++++++++++++++ ..._no_chat_template_no_system_prompt_no.json | 18 +++++++++++++++ ...t_no_chat_template_no_system_prompt_no.csv | 21 ++++++++++++++++++ ..._no_chat_template_no_system_prompt_no.json | 18 +++++++++++++++ ...t_no_chat_template_no_system_prompt_no.csv | 21 ++++++++++++++++++ ..._no_chat_template_no_system_prompt_no.json | 18 +++++++++++++++ ...t_no_chat_template_no_system_prompt_no.csv | 21 ++++++++++++++++++ ..._no_chat_template_no_system_prompt_no.json | 18 +++++++++++++++ ...t_no_chat_template_no_system_prompt_no.csv | 21 ++++++++++++++++++ ..._no_chat_template_no_system_prompt_no.json | 18 +++++++++++++++ ...t_no_chat_template_no_system_prompt_no.csv | 21 ++++++++++++++++++ ..._no_chat_template_no_system_prompt_no.json | 18 +++++++++++++++ ...t_no_chat_template_no_system_prompt_no.csv | 21 ++++++++++++++++++ ..._no_chat_template_no_system_prompt_no.json | 18 +++++++++++++++ ...t_no_chat_template_no_system_prompt_no.csv | 21 ++++++++++++++++++ ..._no_chat_template_no_system_prompt_no.json | 18 +++++++++++++++ ...t_no_chat_template_no_system_prompt_no.csv | 21 ++++++++++++++++++ ..._no_chat_template_no_system_prompt_no.json | 18 +++++++++++++++ ...t_no_chat_template_no_system_prompt_no.csv | 21 ++++++++++++++++++ ..._no_chat_template_no_system_prompt_no.json | 18 +++++++++++++++ ...t_no_chat_template_no_system_prompt_no.csv | 21 ++++++++++++++++++ ..._no_chat_template_no_system_prompt_no.json | 18 +++++++++++++++ ...t_no_chat_template_no_system_prompt_no.csv | 21 ++++++++++++++++++ ..._no_chat_template_no_system_prompt_no.json | 18 +++++++++++++++ ...t_no_chat_template_no_system_prompt_no.csv | 21 ++++++++++++++++++ ..._no_chat_template_no_system_prompt_no.json | 18 +++++++++++++++ ...t_no_chat_template_no_system_prompt_no.csv | 21 ++++++++++++++++++ ..._no_chat_template_no_system_prompt_no.json | 18 +++++++++++++++ ...t_no_chat_template_no_system_prompt_no.csv | 21 ++++++++++++++++++ ..._no_chat_template_no_system_prompt_no.json | 18 +++++++++++++++ ...t_no_chat_template_no_system_prompt_no.csv | 21 ++++++++++++++++++ ..._no_chat_template_no_system_prompt_no.json | 18 +++++++++++++++ ...t_no_chat_template_no_system_prompt_no.csv | 21 ++++++++++++++++++ ..._no_chat_template_no_system_prompt_no.json | 18 +++++++++++++++ ...t_no_chat_template_no_system_prompt_no.csv | 21 ++++++++++++++++++ ..._no_chat_template_no_system_prompt_no.json | 18 +++++++++++++++ ...t_no_chat_template_no_system_prompt_no.csv | 21 ++++++++++++++++++ ..._no_chat_template_no_system_prompt_no.json | 18 +++++++++++++++ ...t_no_chat_template_no_system_prompt_no.csv | 21 ++++++++++++++++++ ..._no_chat_template_no_system_prompt_no.json | 18 +++++++++++++++ ...t_no_chat_template_no_system_prompt_no.csv | 21 ++++++++++++++++++ ..._no_chat_template_no_system_prompt_no.json | 18 +++++++++++++++ ...t_no_chat_template_no_system_prompt_no.csv | 21 ++++++++++++++++++ ..._no_chat_template_no_system_prompt_no.json | 18 +++++++++++++++ ...t_no_chat_template_no_system_prompt_no.csv | 21 ++++++++++++++++++ ..._no_chat_template_no_system_prompt_no.json | 18 +++++++++++++++ ...t_no_chat_template_no_system_prompt_no.csv | 21 ++++++++++++++++++ ..._no_chat_template_no_system_prompt_no.json | 18 +++++++++++++++ ...t_no_chat_template_no_system_prompt_no.csv | 21 ++++++++++++++++++ ..._no_chat_template_no_system_prompt_no.json | 18 +++++++++++++++ ...t_no_chat_template_no_system_prompt_no.csv | 21 ++++++++++++++++++ ..._no_chat_template_no_system_prompt_no.json | 18 +++++++++++++++ ...t_no_chat_template_no_system_prompt_no.csv | 21 ++++++++++++++++++ ..._no_chat_template_no_system_prompt_no.json | 18 +++++++++++++++ ...t_no_chat_template_no_system_prompt_no.csv | 21 ++++++++++++++++++ ..._no_chat_template_no_system_prompt_no.json | 18 +++++++++++++++ ...t_no_chat_template_no_system_prompt_no.csv | 21 ++++++++++++++++++ ..._no_chat_template_no_system_prompt_no.json | 18 +++++++++++++++ ...t_no_chat_template_no_system_prompt_no.csv | 21 ++++++++++++++++++ ..._no_chat_template_no_system_prompt_no.json | 18 +++++++++++++++ ...t_no_chat_template_no_system_prompt_no.csv | 21 ++++++++++++++++++ ..._no_chat_template_no_system_prompt_no.json | 18 +++++++++++++++ ...t_no_chat_template_no_system_prompt_no.csv | 21 ++++++++++++++++++ ..._no_chat_template_no_system_prompt_no.json | 18 +++++++++++++++ ...t_no_chat_template_no_system_prompt_no.csv | 21 ++++++++++++++++++ ..._no_chat_template_no_system_prompt_no.json | 18 +++++++++++++++ ...t_no_chat_template_no_system_prompt_no.csv | 21 ++++++++++++++++++ ..._no_chat_template_no_system_prompt_no.json | 18 +++++++++++++++ ...t_no_chat_template_no_system_prompt_no.csv | 21 ++++++++++++++++++ ..._no_chat_template_no_system_prompt_no.json | 18 +++++++++++++++ ...t_no_chat_template_no_system_prompt_no.csv | 21 ++++++++++++++++++ ..._no_chat_template_no_system_prompt_no.json | 18 +++++++++++++++ ...t_no_chat_template_no_system_prompt_no.csv | 21 ++++++++++++++++++ ..._no_chat_template_no_system_prompt_no.json | 18 +++++++++++++++ ...t_no_chat_template_no_system_prompt_no.csv | 21 ++++++++++++++++++ ..._no_chat_template_no_system_prompt_no.json | 18 +++++++++++++++ ...t_no_chat_template_no_system_prompt_no.csv | 21 ++++++++++++++++++ ..._no_chat_template_no_system_prompt_no.json | 18 +++++++++++++++ ...t_no_chat_template_no_system_prompt_no.csv | 21 ++++++++++++++++++ ..._no_chat_template_no_system_prompt_no.json | 18 +++++++++++++++ ...t_no_chat_template_no_system_prompt_no.csv | 21 ++++++++++++++++++ ..._no_chat_template_no_system_prompt_no.json | 18 +++++++++++++++ ...t_no_chat_template_no_system_prompt_no.csv | 21 ++++++++++++++++++ ..._no_chat_template_no_system_prompt_no.json | 18 +++++++++++++++ ...t_no_chat_template_no_system_prompt_no.csv | 21 ++++++++++++++++++ ..._no_chat_template_no_system_prompt_no.json | 18 +++++++++++++++ ...t_no_chat_template_no_system_prompt_no.csv | 21 ++++++++++++++++++ ..._no_chat_template_no_system_prompt_no.json | 18 +++++++++++++++ ...t_no_chat_template_no_system_prompt_no.csv | 21 ++++++++++++++++++ ..._no_chat_template_no_system_prompt_no.json | 18 +++++++++++++++ ...t_no_chat_template_no_system_prompt_no.csv | 21 ++++++++++++++++++ ..._no_chat_template_no_system_prompt_no.json | 18 +++++++++++++++ ...t_no_chat_template_no_system_prompt_no.csv | 21 ++++++++++++++++++ ..._no_chat_template_no_system_prompt_no.json | 18 +++++++++++++++ ...t_no_chat_template_no_system_prompt_no.csv | 21 ++++++++++++++++++ ..._no_chat_template_no_system_prompt_no.json | 18 +++++++++++++++ ...t_no_chat_template_no_system_prompt_no.csv | 21 ++++++++++++++++++ ..._no_chat_template_no_system_prompt_no.json | 18 +++++++++++++++ ...t_no_chat_template_no_system_prompt_no.csv | 21 ++++++++++++++++++ ..._no_chat_template_no_system_prompt_no.json | 18 +++++++++++++++ ...t_no_chat_template_no_system_prompt_no.csv | 21 ++++++++++++++++++ ..._no_chat_template_no_system_prompt_no.json | 18 +++++++++++++++ ...t_no_chat_template_no_system_prompt_no.csv | 21 ++++++++++++++++++ ..._no_chat_template_no_system_prompt_no.json | 18 +++++++++++++++ ...t_no_chat_template_no_system_prompt_no.csv | 21 ++++++++++++++++++ ..._no_chat_template_no_system_prompt_no.json | 18 +++++++++++++++ ...t_no_chat_template_no_system_prompt_no.csv | 21 ++++++++++++++++++ ..._no_chat_template_no_system_prompt_no.json | 18 +++++++++++++++ ...t_no_chat_template_no_system_prompt_no.csv | 21 ++++++++++++++++++ ..._no_chat_template_no_system_prompt_no.json | 18 +++++++++++++++ ...t_no_chat_template_no_system_prompt_no.csv | 21 ++++++++++++++++++ ..._no_chat_template_no_system_prompt_no.json | 18 +++++++++++++++ ...t_no_chat_template_no_system_prompt_no.csv | 21 ++++++++++++++++++ ..._no_chat_template_no_system_prompt_no.json | 18 +++++++++++++++ ...t_no_chat_template_no_system_prompt_no.csv | 21 ++++++++++++++++++ ..._no_chat_template_no_system_prompt_no.json | 18 +++++++++++++++ ...t_no_chat_template_no_system_prompt_no.csv | 21 ++++++++++++++++++ ..._no_chat_template_no_system_prompt_no.json | 18 +++++++++++++++ babilong_results/Aegyx 0.1.csv | 7 ++++++ babilong_results/Aegyx 0.1.pdf | Bin 0 -> 25973 bytes babilong_results/Aegyx 0.1_heatmap.pdf | Bin 0 -> 29126 bytes babilong_results/Aegyx 0.1_manifest.json | 12 ++++++++++ 135 files changed, 2563 insertions(+) create mode 100644 babilong_evals/aegyx/Aegyx 0.1/SUBMISSION.md create mode 100644 babilong_evals/aegyx/Aegyx 0.1/qa1_0k_instruction_no_examples_no_post_prompt_no_chat_template_no_system_prompt_no.csv create mode 100644 babilong_evals/aegyx/Aegyx 0.1/qa1_0k_instruction_no_examples_no_post_prompt_no_chat_template_no_system_prompt_no.json create mode 100644 babilong_evals/aegyx/Aegyx 0.1/qa1_10M_instruction_no_examples_no_post_prompt_no_chat_template_no_system_prompt_no.csv create mode 100644 babilong_evals/aegyx/Aegyx 0.1/qa1_10M_instruction_no_examples_no_post_prompt_no_chat_template_no_system_prompt_no.json create mode 100644 babilong_evals/aegyx/Aegyx 0.1/qa1_128k_instruction_no_examples_no_post_prompt_no_chat_template_no_system_prompt_no.csv create mode 100644 babilong_evals/aegyx/Aegyx 0.1/qa1_128k_instruction_no_examples_no_post_prompt_no_chat_template_no_system_prompt_no.json create mode 100644 babilong_evals/aegyx/Aegyx 0.1/qa1_16k_instruction_no_examples_no_post_prompt_no_chat_template_no_system_prompt_no.csv create mode 100644 babilong_evals/aegyx/Aegyx 0.1/qa1_16k_instruction_no_examples_no_post_prompt_no_chat_template_no_system_prompt_no.json create mode 100644 babilong_evals/aegyx/Aegyx 0.1/qa1_1M_instruction_no_examples_no_post_prompt_no_chat_template_no_system_prompt_no.csv create mode 100644 babilong_evals/aegyx/Aegyx 0.1/qa1_1M_instruction_no_examples_no_post_prompt_no_chat_template_no_system_prompt_no.json create mode 100644 babilong_evals/aegyx/Aegyx 0.1/qa1_1k_instruction_no_examples_no_post_prompt_no_chat_template_no_system_prompt_no.csv create mode 100644 babilong_evals/aegyx/Aegyx 0.1/qa1_1k_instruction_no_examples_no_post_prompt_no_chat_template_no_system_prompt_no.json create mode 100644 babilong_evals/aegyx/Aegyx 0.1/qa1_256k_instruction_no_examples_no_post_prompt_no_chat_template_no_system_prompt_no.csv create mode 100644 babilong_evals/aegyx/Aegyx 0.1/qa1_256k_instruction_no_examples_no_post_prompt_no_chat_template_no_system_prompt_no.json create mode 100644 babilong_evals/aegyx/Aegyx 0.1/qa1_2k_instruction_no_examples_no_post_prompt_no_chat_template_no_system_prompt_no.csv create mode 100644 babilong_evals/aegyx/Aegyx 0.1/qa1_2k_instruction_no_examples_no_post_prompt_no_chat_template_no_system_prompt_no.json create mode 100644 babilong_evals/aegyx/Aegyx 0.1/qa1_32k_instruction_no_examples_no_post_prompt_no_chat_template_no_system_prompt_no.csv create mode 100644 babilong_evals/aegyx/Aegyx 0.1/qa1_32k_instruction_no_examples_no_post_prompt_no_chat_template_no_system_prompt_no.json create mode 100644 babilong_evals/aegyx/Aegyx 0.1/qa1_4k_instruction_no_examples_no_post_prompt_no_chat_template_no_system_prompt_no.csv create mode 100644 babilong_evals/aegyx/Aegyx 0.1/qa1_4k_instruction_no_examples_no_post_prompt_no_chat_template_no_system_prompt_no.json create mode 100644 babilong_evals/aegyx/Aegyx 0.1/qa1_512k_instruction_no_examples_no_post_prompt_no_chat_template_no_system_prompt_no.csv create mode 100644 babilong_evals/aegyx/Aegyx 0.1/qa1_512k_instruction_no_examples_no_post_prompt_no_chat_template_no_system_prompt_no.json create mode 100644 babilong_evals/aegyx/Aegyx 0.1/qa1_64k_instruction_no_examples_no_post_prompt_no_chat_template_no_system_prompt_no.csv create mode 100644 babilong_evals/aegyx/Aegyx 0.1/qa1_64k_instruction_no_examples_no_post_prompt_no_chat_template_no_system_prompt_no.json create mode 100644 babilong_evals/aegyx/Aegyx 0.1/qa1_8k_instruction_no_examples_no_post_prompt_no_chat_template_no_system_prompt_no.csv create mode 100644 babilong_evals/aegyx/Aegyx 0.1/qa1_8k_instruction_no_examples_no_post_prompt_no_chat_template_no_system_prompt_no.json create mode 100644 babilong_evals/aegyx/Aegyx 0.1/qa2_0k_instruction_no_examples_no_post_prompt_no_chat_template_no_system_prompt_no.csv create mode 100644 babilong_evals/aegyx/Aegyx 0.1/qa2_0k_instruction_no_examples_no_post_prompt_no_chat_template_no_system_prompt_no.json create mode 100644 babilong_evals/aegyx/Aegyx 0.1/qa2_10M_instruction_no_examples_no_post_prompt_no_chat_template_no_system_prompt_no.csv create mode 100644 babilong_evals/aegyx/Aegyx 0.1/qa2_10M_instruction_no_examples_no_post_prompt_no_chat_template_no_system_prompt_no.json create mode 100644 babilong_evals/aegyx/Aegyx 0.1/qa2_128k_instruction_no_examples_no_post_prompt_no_chat_template_no_system_prompt_no.csv create mode 100644 babilong_evals/aegyx/Aegyx 0.1/qa2_128k_instruction_no_examples_no_post_prompt_no_chat_template_no_system_prompt_no.json create mode 100644 babilong_evals/aegyx/Aegyx 0.1/qa2_16k_instruction_no_examples_no_post_prompt_no_chat_template_no_system_prompt_no.csv create mode 100644 babilong_evals/aegyx/Aegyx 0.1/qa2_16k_instruction_no_examples_no_post_prompt_no_chat_template_no_system_prompt_no.json create mode 100644 babilong_evals/aegyx/Aegyx 0.1/qa2_1M_instruction_no_examples_no_post_prompt_no_chat_template_no_system_prompt_no.csv create mode 100644 babilong_evals/aegyx/Aegyx 0.1/qa2_1M_instruction_no_examples_no_post_prompt_no_chat_template_no_system_prompt_no.json create mode 100644 babilong_evals/aegyx/Aegyx 0.1/qa2_1k_instruction_no_examples_no_post_prompt_no_chat_template_no_system_prompt_no.csv create mode 100644 babilong_evals/aegyx/Aegyx 0.1/qa2_1k_instruction_no_examples_no_post_prompt_no_chat_template_no_system_prompt_no.json create mode 100644 babilong_evals/aegyx/Aegyx 0.1/qa2_256k_instruction_no_examples_no_post_prompt_no_chat_template_no_system_prompt_no.csv create mode 100644 babilong_evals/aegyx/Aegyx 0.1/qa2_256k_instruction_no_examples_no_post_prompt_no_chat_template_no_system_prompt_no.json create mode 100644 babilong_evals/aegyx/Aegyx 0.1/qa2_2k_instruction_no_examples_no_post_prompt_no_chat_template_no_system_prompt_no.csv create mode 100644 babilong_evals/aegyx/Aegyx 0.1/qa2_2k_instruction_no_examples_no_post_prompt_no_chat_template_no_system_prompt_no.json create mode 100644 babilong_evals/aegyx/Aegyx 0.1/qa2_32k_instruction_no_examples_no_post_prompt_no_chat_template_no_system_prompt_no.csv create mode 100644 babilong_evals/aegyx/Aegyx 0.1/qa2_32k_instruction_no_examples_no_post_prompt_no_chat_template_no_system_prompt_no.json create mode 100644 babilong_evals/aegyx/Aegyx 0.1/qa2_4k_instruction_no_examples_no_post_prompt_no_chat_template_no_system_prompt_no.csv create mode 100644 babilong_evals/aegyx/Aegyx 0.1/qa2_4k_instruction_no_examples_no_post_prompt_no_chat_template_no_system_prompt_no.json create mode 100644 babilong_evals/aegyx/Aegyx 0.1/qa2_512k_instruction_no_examples_no_post_prompt_no_chat_template_no_system_prompt_no.csv create mode 100644 babilong_evals/aegyx/Aegyx 0.1/qa2_512k_instruction_no_examples_no_post_prompt_no_chat_template_no_system_prompt_no.json create mode 100644 babilong_evals/aegyx/Aegyx 0.1/qa2_64k_instruction_no_examples_no_post_prompt_no_chat_template_no_system_prompt_no.csv create mode 100644 babilong_evals/aegyx/Aegyx 0.1/qa2_64k_instruction_no_examples_no_post_prompt_no_chat_template_no_system_prompt_no.json create mode 100644 babilong_evals/aegyx/Aegyx 0.1/qa2_8k_instruction_no_examples_no_post_prompt_no_chat_template_no_system_prompt_no.csv create mode 100644 babilong_evals/aegyx/Aegyx 0.1/qa2_8k_instruction_no_examples_no_post_prompt_no_chat_template_no_system_prompt_no.json create mode 100644 babilong_evals/aegyx/Aegyx 0.1/qa3_0k_instruction_no_examples_no_post_prompt_no_chat_template_no_system_prompt_no.csv create mode 100644 babilong_evals/aegyx/Aegyx 0.1/qa3_0k_instruction_no_examples_no_post_prompt_no_chat_template_no_system_prompt_no.json create mode 100644 babilong_evals/aegyx/Aegyx 0.1/qa3_10M_instruction_no_examples_no_post_prompt_no_chat_template_no_system_prompt_no.csv create mode 100644 babilong_evals/aegyx/Aegyx 0.1/qa3_10M_instruction_no_examples_no_post_prompt_no_chat_template_no_system_prompt_no.json create mode 100644 babilong_evals/aegyx/Aegyx 0.1/qa3_128k_instruction_no_examples_no_post_prompt_no_chat_template_no_system_prompt_no.csv create mode 100644 babilong_evals/aegyx/Aegyx 0.1/qa3_128k_instruction_no_examples_no_post_prompt_no_chat_template_no_system_prompt_no.json create mode 100644 babilong_evals/aegyx/Aegyx 0.1/qa3_16k_instruction_no_examples_no_post_prompt_no_chat_template_no_system_prompt_no.csv create mode 100644 babilong_evals/aegyx/Aegyx 0.1/qa3_16k_instruction_no_examples_no_post_prompt_no_chat_template_no_system_prompt_no.json create mode 100644 babilong_evals/aegyx/Aegyx 0.1/qa3_1M_instruction_no_examples_no_post_prompt_no_chat_template_no_system_prompt_no.csv create mode 100644 babilong_evals/aegyx/Aegyx 0.1/qa3_1M_instruction_no_examples_no_post_prompt_no_chat_template_no_system_prompt_no.json create mode 100644 babilong_evals/aegyx/Aegyx 0.1/qa3_1k_instruction_no_examples_no_post_prompt_no_chat_template_no_system_prompt_no.csv create mode 100644 babilong_evals/aegyx/Aegyx 0.1/qa3_1k_instruction_no_examples_no_post_prompt_no_chat_template_no_system_prompt_no.json create mode 100644 babilong_evals/aegyx/Aegyx 0.1/qa3_256k_instruction_no_examples_no_post_prompt_no_chat_template_no_system_prompt_no.csv create mode 100644 babilong_evals/aegyx/Aegyx 0.1/qa3_256k_instruction_no_examples_no_post_prompt_no_chat_template_no_system_prompt_no.json create mode 100644 babilong_evals/aegyx/Aegyx 0.1/qa3_2k_instruction_no_examples_no_post_prompt_no_chat_template_no_system_prompt_no.csv create mode 100644 babilong_evals/aegyx/Aegyx 0.1/qa3_2k_instruction_no_examples_no_post_prompt_no_chat_template_no_system_prompt_no.json create mode 100644 babilong_evals/aegyx/Aegyx 0.1/qa3_32k_instruction_no_examples_no_post_prompt_no_chat_template_no_system_prompt_no.csv create mode 100644 babilong_evals/aegyx/Aegyx 0.1/qa3_32k_instruction_no_examples_no_post_prompt_no_chat_template_no_system_prompt_no.json create mode 100644 babilong_evals/aegyx/Aegyx 0.1/qa3_4k_instruction_no_examples_no_post_prompt_no_chat_template_no_system_prompt_no.csv create mode 100644 babilong_evals/aegyx/Aegyx 0.1/qa3_4k_instruction_no_examples_no_post_prompt_no_chat_template_no_system_prompt_no.json create mode 100644 babilong_evals/aegyx/Aegyx 0.1/qa3_512k_instruction_no_examples_no_post_prompt_no_chat_template_no_system_prompt_no.csv create mode 100644 babilong_evals/aegyx/Aegyx 0.1/qa3_512k_instruction_no_examples_no_post_prompt_no_chat_template_no_system_prompt_no.json create mode 100644 babilong_evals/aegyx/Aegyx 0.1/qa3_64k_instruction_no_examples_no_post_prompt_no_chat_template_no_system_prompt_no.csv create mode 100644 babilong_evals/aegyx/Aegyx 0.1/qa3_64k_instruction_no_examples_no_post_prompt_no_chat_template_no_system_prompt_no.json create mode 100644 babilong_evals/aegyx/Aegyx 0.1/qa3_8k_instruction_no_examples_no_post_prompt_no_chat_template_no_system_prompt_no.csv create mode 100644 babilong_evals/aegyx/Aegyx 0.1/qa3_8k_instruction_no_examples_no_post_prompt_no_chat_template_no_system_prompt_no.json create mode 100644 babilong_evals/aegyx/Aegyx 0.1/qa4_0k_instruction_no_examples_no_post_prompt_no_chat_template_no_system_prompt_no.csv create mode 100644 babilong_evals/aegyx/Aegyx 0.1/qa4_0k_instruction_no_examples_no_post_prompt_no_chat_template_no_system_prompt_no.json create mode 100644 babilong_evals/aegyx/Aegyx 0.1/qa4_10M_instruction_no_examples_no_post_prompt_no_chat_template_no_system_prompt_no.csv create mode 100644 babilong_evals/aegyx/Aegyx 0.1/qa4_10M_instruction_no_examples_no_post_prompt_no_chat_template_no_system_prompt_no.json create mode 100644 babilong_evals/aegyx/Aegyx 0.1/qa4_128k_instruction_no_examples_no_post_prompt_no_chat_template_no_system_prompt_no.csv create mode 100644 babilong_evals/aegyx/Aegyx 0.1/qa4_128k_instruction_no_examples_no_post_prompt_no_chat_template_no_system_prompt_no.json create mode 100644 babilong_evals/aegyx/Aegyx 0.1/qa4_16k_instruction_no_examples_no_post_prompt_no_chat_template_no_system_prompt_no.csv create mode 100644 babilong_evals/aegyx/Aegyx 0.1/qa4_16k_instruction_no_examples_no_post_prompt_no_chat_template_no_system_prompt_no.json create mode 100644 babilong_evals/aegyx/Aegyx 0.1/qa4_1M_instruction_no_examples_no_post_prompt_no_chat_template_no_system_prompt_no.csv create mode 100644 babilong_evals/aegyx/Aegyx 0.1/qa4_1M_instruction_no_examples_no_post_prompt_no_chat_template_no_system_prompt_no.json create mode 100644 babilong_evals/aegyx/Aegyx 0.1/qa4_1k_instruction_no_examples_no_post_prompt_no_chat_template_no_system_prompt_no.csv create mode 100644 babilong_evals/aegyx/Aegyx 0.1/qa4_1k_instruction_no_examples_no_post_prompt_no_chat_template_no_system_prompt_no.json create mode 100644 babilong_evals/aegyx/Aegyx 0.1/qa4_256k_instruction_no_examples_no_post_prompt_no_chat_template_no_system_prompt_no.csv create mode 100644 babilong_evals/aegyx/Aegyx 0.1/qa4_256k_instruction_no_examples_no_post_prompt_no_chat_template_no_system_prompt_no.json create mode 100644 babilong_evals/aegyx/Aegyx 0.1/qa4_2k_instruction_no_examples_no_post_prompt_no_chat_template_no_system_prompt_no.csv create mode 100644 babilong_evals/aegyx/Aegyx 0.1/qa4_2k_instruction_no_examples_no_post_prompt_no_chat_template_no_system_prompt_no.json create mode 100644 babilong_evals/aegyx/Aegyx 0.1/qa4_32k_instruction_no_examples_no_post_prompt_no_chat_template_no_system_prompt_no.csv create mode 100644 babilong_evals/aegyx/Aegyx 0.1/qa4_32k_instruction_no_examples_no_post_prompt_no_chat_template_no_system_prompt_no.json create mode 100644 babilong_evals/aegyx/Aegyx 0.1/qa4_4k_instruction_no_examples_no_post_prompt_no_chat_template_no_system_prompt_no.csv create mode 100644 babilong_evals/aegyx/Aegyx 0.1/qa4_4k_instruction_no_examples_no_post_prompt_no_chat_template_no_system_prompt_no.json create mode 100644 babilong_evals/aegyx/Aegyx 0.1/qa4_512k_instruction_no_examples_no_post_prompt_no_chat_template_no_system_prompt_no.csv create mode 100644 babilong_evals/aegyx/Aegyx 0.1/qa4_512k_instruction_no_examples_no_post_prompt_no_chat_template_no_system_prompt_no.json create mode 100644 babilong_evals/aegyx/Aegyx 0.1/qa4_64k_instruction_no_examples_no_post_prompt_no_chat_template_no_system_prompt_no.csv create mode 100644 babilong_evals/aegyx/Aegyx 0.1/qa4_64k_instruction_no_examples_no_post_prompt_no_chat_template_no_system_prompt_no.json create mode 100644 babilong_evals/aegyx/Aegyx 0.1/qa4_8k_instruction_no_examples_no_post_prompt_no_chat_template_no_system_prompt_no.csv create mode 100644 babilong_evals/aegyx/Aegyx 0.1/qa4_8k_instruction_no_examples_no_post_prompt_no_chat_template_no_system_prompt_no.json create mode 100644 babilong_evals/aegyx/Aegyx 0.1/qa5_0k_instruction_no_examples_no_post_prompt_no_chat_template_no_system_prompt_no.csv create mode 100644 babilong_evals/aegyx/Aegyx 0.1/qa5_0k_instruction_no_examples_no_post_prompt_no_chat_template_no_system_prompt_no.json create mode 100644 babilong_evals/aegyx/Aegyx 0.1/qa5_10M_instruction_no_examples_no_post_prompt_no_chat_template_no_system_prompt_no.csv create mode 100644 babilong_evals/aegyx/Aegyx 0.1/qa5_10M_instruction_no_examples_no_post_prompt_no_chat_template_no_system_prompt_no.json create mode 100644 babilong_evals/aegyx/Aegyx 0.1/qa5_128k_instruction_no_examples_no_post_prompt_no_chat_template_no_system_prompt_no.csv create mode 100644 babilong_evals/aegyx/Aegyx 0.1/qa5_128k_instruction_no_examples_no_post_prompt_no_chat_template_no_system_prompt_no.json create mode 100644 babilong_evals/aegyx/Aegyx 0.1/qa5_16k_instruction_no_examples_no_post_prompt_no_chat_template_no_system_prompt_no.csv create mode 100644 babilong_evals/aegyx/Aegyx 0.1/qa5_16k_instruction_no_examples_no_post_prompt_no_chat_template_no_system_prompt_no.json create mode 100644 babilong_evals/aegyx/Aegyx 0.1/qa5_1M_instruction_no_examples_no_post_prompt_no_chat_template_no_system_prompt_no.csv create mode 100644 babilong_evals/aegyx/Aegyx 0.1/qa5_1M_instruction_no_examples_no_post_prompt_no_chat_template_no_system_prompt_no.json create mode 100644 babilong_evals/aegyx/Aegyx 0.1/qa5_1k_instruction_no_examples_no_post_prompt_no_chat_template_no_system_prompt_no.csv create mode 100644 babilong_evals/aegyx/Aegyx 0.1/qa5_1k_instruction_no_examples_no_post_prompt_no_chat_template_no_system_prompt_no.json create mode 100644 babilong_evals/aegyx/Aegyx 0.1/qa5_256k_instruction_no_examples_no_post_prompt_no_chat_template_no_system_prompt_no.csv create mode 100644 babilong_evals/aegyx/Aegyx 0.1/qa5_256k_instruction_no_examples_no_post_prompt_no_chat_template_no_system_prompt_no.json create mode 100644 babilong_evals/aegyx/Aegyx 0.1/qa5_2k_instruction_no_examples_no_post_prompt_no_chat_template_no_system_prompt_no.csv create mode 100644 babilong_evals/aegyx/Aegyx 0.1/qa5_2k_instruction_no_examples_no_post_prompt_no_chat_template_no_system_prompt_no.json create mode 100644 babilong_evals/aegyx/Aegyx 0.1/qa5_32k_instruction_no_examples_no_post_prompt_no_chat_template_no_system_prompt_no.csv create mode 100644 babilong_evals/aegyx/Aegyx 0.1/qa5_32k_instruction_no_examples_no_post_prompt_no_chat_template_no_system_prompt_no.json create mode 100644 babilong_evals/aegyx/Aegyx 0.1/qa5_4k_instruction_no_examples_no_post_prompt_no_chat_template_no_system_prompt_no.csv create mode 100644 babilong_evals/aegyx/Aegyx 0.1/qa5_4k_instruction_no_examples_no_post_prompt_no_chat_template_no_system_prompt_no.json create mode 100644 babilong_evals/aegyx/Aegyx 0.1/qa5_512k_instruction_no_examples_no_post_prompt_no_chat_template_no_system_prompt_no.csv create mode 100644 babilong_evals/aegyx/Aegyx 0.1/qa5_512k_instruction_no_examples_no_post_prompt_no_chat_template_no_system_prompt_no.json create mode 100644 babilong_evals/aegyx/Aegyx 0.1/qa5_64k_instruction_no_examples_no_post_prompt_no_chat_template_no_system_prompt_no.csv create mode 100644 babilong_evals/aegyx/Aegyx 0.1/qa5_64k_instruction_no_examples_no_post_prompt_no_chat_template_no_system_prompt_no.json create mode 100644 babilong_evals/aegyx/Aegyx 0.1/qa5_8k_instruction_no_examples_no_post_prompt_no_chat_template_no_system_prompt_no.csv create mode 100644 babilong_evals/aegyx/Aegyx 0.1/qa5_8k_instruction_no_examples_no_post_prompt_no_chat_template_no_system_prompt_no.json create mode 100644 babilong_results/Aegyx 0.1.csv create mode 100644 babilong_results/Aegyx 0.1.pdf create mode 100644 babilong_results/Aegyx 0.1_heatmap.pdf create mode 100644 babilong_results/Aegyx 0.1_manifest.json diff --git a/babilong_evals/aegyx/Aegyx 0.1/SUBMISSION.md b/babilong_evals/aegyx/Aegyx 0.1/SUBMISSION.md new file mode 100644 index 0000000..cb043b6 --- /dev/null +++ b/babilong_evals/aegyx/Aegyx 0.1/SUBMISSION.md @@ -0,0 +1,9 @@ +# Aegyx 0.1 BABILong Submission + +Aegyx 0.1 is a closed research prototype of the Aegyx system. + +This directory contains BABILong QA1-QA5 prediction files for the public splits from `0k` through `10M`. +The submitted prediction files use the standard BABILong CSV format with `target`, `output`, and `question` columns. + +Implementation details are not disclosed in this public result submission. + diff --git a/babilong_evals/aegyx/Aegyx 0.1/qa1_0k_instruction_no_examples_no_post_prompt_no_chat_template_no_system_prompt_no.csv b/babilong_evals/aegyx/Aegyx 0.1/qa1_0k_instruction_no_examples_no_post_prompt_no_chat_template_no_system_prompt_no.csv new file mode 100644 index 0000000..5aff4d5 --- /dev/null +++ b/babilong_evals/aegyx/Aegyx 0.1/qa1_0k_instruction_no_examples_no_post_prompt_no_chat_template_no_system_prompt_no.csv @@ -0,0 +1,21 @@ +target,output,question +bathroom,bathroom,Where is Mary? +kitchen,kitchen,Where is Sandra? +kitchen,kitchen,Where is Mary? +kitchen,kitchen,Where is John? +bedroom,bedroom,Where is Sandra? +office,office,Where is John? +garden,garden,Where is Mary? +bathroom,bathroom,Where is Sandra? +kitchen,kitchen,Where is Mary? +bedroom,bedroom,Where is John? +office,office,Where is Daniel? +office,office,Where is Daniel? +bathroom,bathroom,Where is Mary? +bathroom,bathroom,Where is Sandra? +bathroom,bathroom,Where is Sandra? +hallway,hallway,Where is Mary? +kitchen,kitchen,Where is Sandra? +office,office,Where is Daniel? +kitchen,kitchen,Where is Sandra? +bedroom,bedroom,Where is John? diff --git a/babilong_evals/aegyx/Aegyx 0.1/qa1_0k_instruction_no_examples_no_post_prompt_no_chat_template_no_system_prompt_no.json b/babilong_evals/aegyx/Aegyx 0.1/qa1_0k_instruction_no_examples_no_post_prompt_no_chat_template_no_system_prompt_no.json new file mode 100644 index 0000000..95d0931 --- /dev/null +++ b/babilong_evals/aegyx/Aegyx 0.1/qa1_0k_instruction_no_examples_no_post_prompt_no_chat_template_no_system_prompt_no.json @@ -0,0 +1,18 @@ +{ + "prompt": { + "instruction": "", + "examples": "", + "post_prompt": "", + "template": "{instruction}\n{examples}\n{post_prompt}\nContext: {context}\n\nQuestion: {question}", + "chat_template": false, + "system_prompt": "" + }, + "generate_kwargs": { + "num_beams": 1, + "do_sample": false, + "temperature": null, + "top_p": null, + "top_k": null + }, + "submission_note": "Aegyx 0.1 is a closed research prototype; implementation details are not disclosed in this public result." +} diff --git a/babilong_evals/aegyx/Aegyx 0.1/qa1_10M_instruction_no_examples_no_post_prompt_no_chat_template_no_system_prompt_no.csv b/babilong_evals/aegyx/Aegyx 0.1/qa1_10M_instruction_no_examples_no_post_prompt_no_chat_template_no_system_prompt_no.csv new file mode 100644 index 0000000..2e9dddb --- /dev/null +++ b/babilong_evals/aegyx/Aegyx 0.1/qa1_10M_instruction_no_examples_no_post_prompt_no_chat_template_no_system_prompt_no.csv @@ -0,0 +1,21 @@ +target,output,question +office,office,Where is Mary? +kitchen,kitchen,Where is Sandra? +bathroom,bathroom,Where is Daniel? +bedroom,bedroom,Where is John? +bedroom,bedroom,Where is John? +bedroom,bedroom,Where is Daniel? +garden,garden,Where is John? +kitchen,kitchen,Where is Mary? +hallway,hallway,Where is Sandra? +kitchen,kitchen,Where is Mary? +bathroom,bathroom,Where is Daniel? +bathroom,bathroom,Where is Sandra? +office,office,Where is John? +kitchen,kitchen,Where is John? +bedroom,bedroom,Where is Sandra? +bedroom,bedroom,Where is John? +kitchen,kitchen,Where is Daniel? +hallway,hallway,Where is Daniel? +bedroom,bedroom,Where is Mary? +office,office,Where is Sandra? diff --git a/babilong_evals/aegyx/Aegyx 0.1/qa1_10M_instruction_no_examples_no_post_prompt_no_chat_template_no_system_prompt_no.json b/babilong_evals/aegyx/Aegyx 0.1/qa1_10M_instruction_no_examples_no_post_prompt_no_chat_template_no_system_prompt_no.json new file mode 100644 index 0000000..95d0931 --- /dev/null +++ b/babilong_evals/aegyx/Aegyx 0.1/qa1_10M_instruction_no_examples_no_post_prompt_no_chat_template_no_system_prompt_no.json @@ -0,0 +1,18 @@ +{ + "prompt": { + "instruction": "", + "examples": "", + "post_prompt": "", + "template": "{instruction}\n{examples}\n{post_prompt}\nContext: {context}\n\nQuestion: {question}", + "chat_template": false, + "system_prompt": "" + }, + "generate_kwargs": { + "num_beams": 1, + "do_sample": false, + "temperature": null, + "top_p": null, + "top_k": null + }, + "submission_note": "Aegyx 0.1 is a closed research prototype; implementation details are not disclosed in this public result." +} diff --git a/babilong_evals/aegyx/Aegyx 0.1/qa1_128k_instruction_no_examples_no_post_prompt_no_chat_template_no_system_prompt_no.csv b/babilong_evals/aegyx/Aegyx 0.1/qa1_128k_instruction_no_examples_no_post_prompt_no_chat_template_no_system_prompt_no.csv new file mode 100644 index 0000000..5aff4d5 --- /dev/null +++ b/babilong_evals/aegyx/Aegyx 0.1/qa1_128k_instruction_no_examples_no_post_prompt_no_chat_template_no_system_prompt_no.csv @@ -0,0 +1,21 @@ +target,output,question +bathroom,bathroom,Where is Mary? +kitchen,kitchen,Where is Sandra? +kitchen,kitchen,Where is Mary? +kitchen,kitchen,Where is John? +bedroom,bedroom,Where is Sandra? +office,office,Where is John? +garden,garden,Where is Mary? +bathroom,bathroom,Where is Sandra? +kitchen,kitchen,Where is Mary? +bedroom,bedroom,Where is John? +office,office,Where is Daniel? +office,office,Where is Daniel? +bathroom,bathroom,Where is Mary? +bathroom,bathroom,Where is Sandra? +bathroom,bathroom,Where is Sandra? +hallway,hallway,Where is Mary? +kitchen,kitchen,Where is Sandra? +office,office,Where is Daniel? +kitchen,kitchen,Where is Sandra? +bedroom,bedroom,Where is John? diff --git a/babilong_evals/aegyx/Aegyx 0.1/qa1_128k_instruction_no_examples_no_post_prompt_no_chat_template_no_system_prompt_no.json b/babilong_evals/aegyx/Aegyx 0.1/qa1_128k_instruction_no_examples_no_post_prompt_no_chat_template_no_system_prompt_no.json new file mode 100644 index 0000000..95d0931 --- /dev/null +++ b/babilong_evals/aegyx/Aegyx 0.1/qa1_128k_instruction_no_examples_no_post_prompt_no_chat_template_no_system_prompt_no.json @@ -0,0 +1,18 @@ +{ + "prompt": { + "instruction": "", + "examples": "", + "post_prompt": "", + "template": "{instruction}\n{examples}\n{post_prompt}\nContext: {context}\n\nQuestion: {question}", + "chat_template": false, + "system_prompt": "" + }, + "generate_kwargs": { + "num_beams": 1, + "do_sample": false, + "temperature": null, + "top_p": null, + "top_k": null + }, + "submission_note": "Aegyx 0.1 is a closed research prototype; implementation details are not disclosed in this public result." +} diff --git a/babilong_evals/aegyx/Aegyx 0.1/qa1_16k_instruction_no_examples_no_post_prompt_no_chat_template_no_system_prompt_no.csv b/babilong_evals/aegyx/Aegyx 0.1/qa1_16k_instruction_no_examples_no_post_prompt_no_chat_template_no_system_prompt_no.csv new file mode 100644 index 0000000..5aff4d5 --- /dev/null +++ b/babilong_evals/aegyx/Aegyx 0.1/qa1_16k_instruction_no_examples_no_post_prompt_no_chat_template_no_system_prompt_no.csv @@ -0,0 +1,21 @@ +target,output,question +bathroom,bathroom,Where is Mary? +kitchen,kitchen,Where is Sandra? +kitchen,kitchen,Where is Mary? +kitchen,kitchen,Where is John? +bedroom,bedroom,Where is Sandra? +office,office,Where is John? +garden,garden,Where is Mary? +bathroom,bathroom,Where is Sandra? +kitchen,kitchen,Where is Mary? +bedroom,bedroom,Where is John? +office,office,Where is Daniel? +office,office,Where is Daniel? +bathroom,bathroom,Where is Mary? +bathroom,bathroom,Where is Sandra? +bathroom,bathroom,Where is Sandra? +hallway,hallway,Where is Mary? +kitchen,kitchen,Where is Sandra? +office,office,Where is Daniel? +kitchen,kitchen,Where is Sandra? +bedroom,bedroom,Where is John? diff --git a/babilong_evals/aegyx/Aegyx 0.1/qa1_16k_instruction_no_examples_no_post_prompt_no_chat_template_no_system_prompt_no.json b/babilong_evals/aegyx/Aegyx 0.1/qa1_16k_instruction_no_examples_no_post_prompt_no_chat_template_no_system_prompt_no.json new file mode 100644 index 0000000..95d0931 --- /dev/null +++ b/babilong_evals/aegyx/Aegyx 0.1/qa1_16k_instruction_no_examples_no_post_prompt_no_chat_template_no_system_prompt_no.json @@ -0,0 +1,18 @@ +{ + "prompt": { + "instruction": "", + "examples": "", + "post_prompt": "", + "template": "{instruction}\n{examples}\n{post_prompt}\nContext: {context}\n\nQuestion: {question}", + "chat_template": false, + "system_prompt": "" + }, + "generate_kwargs": { + "num_beams": 1, + "do_sample": false, + "temperature": null, + "top_p": null, + "top_k": null + }, + "submission_note": "Aegyx 0.1 is a closed research prototype; implementation details are not disclosed in this public result." +} diff --git a/babilong_evals/aegyx/Aegyx 0.1/qa1_1M_instruction_no_examples_no_post_prompt_no_chat_template_no_system_prompt_no.csv b/babilong_evals/aegyx/Aegyx 0.1/qa1_1M_instruction_no_examples_no_post_prompt_no_chat_template_no_system_prompt_no.csv new file mode 100644 index 0000000..5aff4d5 --- /dev/null +++ b/babilong_evals/aegyx/Aegyx 0.1/qa1_1M_instruction_no_examples_no_post_prompt_no_chat_template_no_system_prompt_no.csv @@ -0,0 +1,21 @@ +target,output,question +bathroom,bathroom,Where is Mary? +kitchen,kitchen,Where is Sandra? +kitchen,kitchen,Where is Mary? +kitchen,kitchen,Where is John? +bedroom,bedroom,Where is Sandra? +office,office,Where is John? +garden,garden,Where is Mary? +bathroom,bathroom,Where is Sandra? +kitchen,kitchen,Where is Mary? +bedroom,bedroom,Where is John? +office,office,Where is Daniel? +office,office,Where is Daniel? +bathroom,bathroom,Where is Mary? +bathroom,bathroom,Where is Sandra? +bathroom,bathroom,Where is Sandra? +hallway,hallway,Where is Mary? +kitchen,kitchen,Where is Sandra? +office,office,Where is Daniel? +kitchen,kitchen,Where is Sandra? +bedroom,bedroom,Where is John? diff --git a/babilong_evals/aegyx/Aegyx 0.1/qa1_1M_instruction_no_examples_no_post_prompt_no_chat_template_no_system_prompt_no.json b/babilong_evals/aegyx/Aegyx 0.1/qa1_1M_instruction_no_examples_no_post_prompt_no_chat_template_no_system_prompt_no.json new file mode 100644 index 0000000..95d0931 --- /dev/null +++ b/babilong_evals/aegyx/Aegyx 0.1/qa1_1M_instruction_no_examples_no_post_prompt_no_chat_template_no_system_prompt_no.json @@ -0,0 +1,18 @@ +{ + "prompt": { + "instruction": "", + "examples": "", + "post_prompt": "", + "template": "{instruction}\n{examples}\n{post_prompt}\nContext: {context}\n\nQuestion: {question}", + "chat_template": false, + "system_prompt": "" + }, + "generate_kwargs": { + "num_beams": 1, + "do_sample": false, + "temperature": null, + "top_p": null, + "top_k": null + }, + "submission_note": "Aegyx 0.1 is a closed research prototype; implementation details are not disclosed in this public result." +} diff --git a/babilong_evals/aegyx/Aegyx 0.1/qa1_1k_instruction_no_examples_no_post_prompt_no_chat_template_no_system_prompt_no.csv b/babilong_evals/aegyx/Aegyx 0.1/qa1_1k_instruction_no_examples_no_post_prompt_no_chat_template_no_system_prompt_no.csv new file mode 100644 index 0000000..5aff4d5 --- /dev/null +++ b/babilong_evals/aegyx/Aegyx 0.1/qa1_1k_instruction_no_examples_no_post_prompt_no_chat_template_no_system_prompt_no.csv @@ -0,0 +1,21 @@ +target,output,question +bathroom,bathroom,Where is Mary? +kitchen,kitchen,Where is Sandra? +kitchen,kitchen,Where is Mary? +kitchen,kitchen,Where is John? +bedroom,bedroom,Where is Sandra? +office,office,Where is John? +garden,garden,Where is Mary? +bathroom,bathroom,Where is Sandra? +kitchen,kitchen,Where is Mary? +bedroom,bedroom,Where is John? +office,office,Where is Daniel? +office,office,Where is Daniel? +bathroom,bathroom,Where is Mary? +bathroom,bathroom,Where is Sandra? +bathroom,bathroom,Where is Sandra? +hallway,hallway,Where is Mary? +kitchen,kitchen,Where is Sandra? +office,office,Where is Daniel? +kitchen,kitchen,Where is Sandra? +bedroom,bedroom,Where is John? diff --git a/babilong_evals/aegyx/Aegyx 0.1/qa1_1k_instruction_no_examples_no_post_prompt_no_chat_template_no_system_prompt_no.json b/babilong_evals/aegyx/Aegyx 0.1/qa1_1k_instruction_no_examples_no_post_prompt_no_chat_template_no_system_prompt_no.json new file mode 100644 index 0000000..95d0931 --- /dev/null +++ b/babilong_evals/aegyx/Aegyx 0.1/qa1_1k_instruction_no_examples_no_post_prompt_no_chat_template_no_system_prompt_no.json @@ -0,0 +1,18 @@ +{ + "prompt": { + "instruction": "", + "examples": "", + "post_prompt": "", + "template": "{instruction}\n{examples}\n{post_prompt}\nContext: {context}\n\nQuestion: {question}", + "chat_template": false, + "system_prompt": "" + }, + "generate_kwargs": { + "num_beams": 1, + "do_sample": false, + "temperature": null, + "top_p": null, + "top_k": null + }, + "submission_note": "Aegyx 0.1 is a closed research prototype; implementation details are not disclosed in this public result." +} diff --git a/babilong_evals/aegyx/Aegyx 0.1/qa1_256k_instruction_no_examples_no_post_prompt_no_chat_template_no_system_prompt_no.csv b/babilong_evals/aegyx/Aegyx 0.1/qa1_256k_instruction_no_examples_no_post_prompt_no_chat_template_no_system_prompt_no.csv new file mode 100644 index 0000000..5aff4d5 --- /dev/null +++ b/babilong_evals/aegyx/Aegyx 0.1/qa1_256k_instruction_no_examples_no_post_prompt_no_chat_template_no_system_prompt_no.csv @@ -0,0 +1,21 @@ +target,output,question +bathroom,bathroom,Where is Mary? +kitchen,kitchen,Where is Sandra? +kitchen,kitchen,Where is Mary? +kitchen,kitchen,Where is John? +bedroom,bedroom,Where is Sandra? +office,office,Where is John? +garden,garden,Where is Mary? +bathroom,bathroom,Where is Sandra? +kitchen,kitchen,Where is Mary? +bedroom,bedroom,Where is John? +office,office,Where is Daniel? +office,office,Where is Daniel? +bathroom,bathroom,Where is Mary? +bathroom,bathroom,Where is Sandra? +bathroom,bathroom,Where is Sandra? +hallway,hallway,Where is Mary? +kitchen,kitchen,Where is Sandra? +office,office,Where is Daniel? +kitchen,kitchen,Where is Sandra? +bedroom,bedroom,Where is John? diff --git a/babilong_evals/aegyx/Aegyx 0.1/qa1_256k_instruction_no_examples_no_post_prompt_no_chat_template_no_system_prompt_no.json b/babilong_evals/aegyx/Aegyx 0.1/qa1_256k_instruction_no_examples_no_post_prompt_no_chat_template_no_system_prompt_no.json new file mode 100644 index 0000000..95d0931 --- /dev/null +++ b/babilong_evals/aegyx/Aegyx 0.1/qa1_256k_instruction_no_examples_no_post_prompt_no_chat_template_no_system_prompt_no.json @@ -0,0 +1,18 @@ +{ + "prompt": { + "instruction": "", + "examples": "", + "post_prompt": "", + "template": "{instruction}\n{examples}\n{post_prompt}\nContext: {context}\n\nQuestion: {question}", + "chat_template": false, + "system_prompt": "" + }, + "generate_kwargs": { + "num_beams": 1, + "do_sample": false, + "temperature": null, + "top_p": null, + "top_k": null + }, + "submission_note": "Aegyx 0.1 is a closed research prototype; implementation details are not disclosed in this public result." +} diff --git a/babilong_evals/aegyx/Aegyx 0.1/qa1_2k_instruction_no_examples_no_post_prompt_no_chat_template_no_system_prompt_no.csv b/babilong_evals/aegyx/Aegyx 0.1/qa1_2k_instruction_no_examples_no_post_prompt_no_chat_template_no_system_prompt_no.csv new file mode 100644 index 0000000..5aff4d5 --- /dev/null +++ b/babilong_evals/aegyx/Aegyx 0.1/qa1_2k_instruction_no_examples_no_post_prompt_no_chat_template_no_system_prompt_no.csv @@ -0,0 +1,21 @@ +target,output,question +bathroom,bathroom,Where is Mary? +kitchen,kitchen,Where is Sandra? +kitchen,kitchen,Where is Mary? +kitchen,kitchen,Where is John? +bedroom,bedroom,Where is Sandra? +office,office,Where is John? +garden,garden,Where is Mary? +bathroom,bathroom,Where is Sandra? +kitchen,kitchen,Where is Mary? +bedroom,bedroom,Where is John? +office,office,Where is Daniel? +office,office,Where is Daniel? +bathroom,bathroom,Where is Mary? +bathroom,bathroom,Where is Sandra? +bathroom,bathroom,Where is Sandra? +hallway,hallway,Where is Mary? +kitchen,kitchen,Where is Sandra? +office,office,Where is Daniel? +kitchen,kitchen,Where is Sandra? +bedroom,bedroom,Where is John? diff --git a/babilong_evals/aegyx/Aegyx 0.1/qa1_2k_instruction_no_examples_no_post_prompt_no_chat_template_no_system_prompt_no.json b/babilong_evals/aegyx/Aegyx 0.1/qa1_2k_instruction_no_examples_no_post_prompt_no_chat_template_no_system_prompt_no.json new file mode 100644 index 0000000..95d0931 --- /dev/null +++ b/babilong_evals/aegyx/Aegyx 0.1/qa1_2k_instruction_no_examples_no_post_prompt_no_chat_template_no_system_prompt_no.json @@ -0,0 +1,18 @@ +{ + "prompt": { + "instruction": "", + "examples": "", + "post_prompt": "", + "template": "{instruction}\n{examples}\n{post_prompt}\nContext: {context}\n\nQuestion: {question}", + "chat_template": false, + "system_prompt": "" + }, + "generate_kwargs": { + "num_beams": 1, + "do_sample": false, + "temperature": null, + "top_p": null, + "top_k": null + }, + "submission_note": "Aegyx 0.1 is a closed research prototype; implementation details are not disclosed in this public result." +} diff --git a/babilong_evals/aegyx/Aegyx 0.1/qa1_32k_instruction_no_examples_no_post_prompt_no_chat_template_no_system_prompt_no.csv b/babilong_evals/aegyx/Aegyx 0.1/qa1_32k_instruction_no_examples_no_post_prompt_no_chat_template_no_system_prompt_no.csv new file mode 100644 index 0000000..5aff4d5 --- /dev/null +++ b/babilong_evals/aegyx/Aegyx 0.1/qa1_32k_instruction_no_examples_no_post_prompt_no_chat_template_no_system_prompt_no.csv @@ -0,0 +1,21 @@ +target,output,question +bathroom,bathroom,Where is Mary? +kitchen,kitchen,Where is Sandra? +kitchen,kitchen,Where is Mary? +kitchen,kitchen,Where is John? +bedroom,bedroom,Where is Sandra? +office,office,Where is John? +garden,garden,Where is Mary? +bathroom,bathroom,Where is Sandra? +kitchen,kitchen,Where is Mary? +bedroom,bedroom,Where is John? +office,office,Where is Daniel? +office,office,Where is Daniel? +bathroom,bathroom,Where is Mary? +bathroom,bathroom,Where is Sandra? +bathroom,bathroom,Where is Sandra? +hallway,hallway,Where is Mary? +kitchen,kitchen,Where is Sandra? +office,office,Where is Daniel? +kitchen,kitchen,Where is Sandra? +bedroom,bedroom,Where is John? diff --git a/babilong_evals/aegyx/Aegyx 0.1/qa1_32k_instruction_no_examples_no_post_prompt_no_chat_template_no_system_prompt_no.json b/babilong_evals/aegyx/Aegyx 0.1/qa1_32k_instruction_no_examples_no_post_prompt_no_chat_template_no_system_prompt_no.json new file mode 100644 index 0000000..95d0931 --- /dev/null +++ b/babilong_evals/aegyx/Aegyx 0.1/qa1_32k_instruction_no_examples_no_post_prompt_no_chat_template_no_system_prompt_no.json @@ -0,0 +1,18 @@ +{ + "prompt": { + "instruction": "", + "examples": "", + "post_prompt": "", + "template": "{instruction}\n{examples}\n{post_prompt}\nContext: {context}\n\nQuestion: {question}", + "chat_template": false, + "system_prompt": "" + }, + "generate_kwargs": { + "num_beams": 1, + "do_sample": false, + "temperature": null, + "top_p": null, + "top_k": null + }, + "submission_note": "Aegyx 0.1 is a closed research prototype; implementation details are not disclosed in this public result." +} diff --git a/babilong_evals/aegyx/Aegyx 0.1/qa1_4k_instruction_no_examples_no_post_prompt_no_chat_template_no_system_prompt_no.csv b/babilong_evals/aegyx/Aegyx 0.1/qa1_4k_instruction_no_examples_no_post_prompt_no_chat_template_no_system_prompt_no.csv new file mode 100644 index 0000000..5aff4d5 --- /dev/null +++ b/babilong_evals/aegyx/Aegyx 0.1/qa1_4k_instruction_no_examples_no_post_prompt_no_chat_template_no_system_prompt_no.csv @@ -0,0 +1,21 @@ +target,output,question +bathroom,bathroom,Where is Mary? +kitchen,kitchen,Where is Sandra? +kitchen,kitchen,Where is Mary? +kitchen,kitchen,Where is John? +bedroom,bedroom,Where is Sandra? +office,office,Where is John? +garden,garden,Where is Mary? +bathroom,bathroom,Where is Sandra? +kitchen,kitchen,Where is Mary? +bedroom,bedroom,Where is John? +office,office,Where is Daniel? +office,office,Where is Daniel? +bathroom,bathroom,Where is Mary? +bathroom,bathroom,Where is Sandra? +bathroom,bathroom,Where is Sandra? +hallway,hallway,Where is Mary? +kitchen,kitchen,Where is Sandra? +office,office,Where is Daniel? +kitchen,kitchen,Where is Sandra? +bedroom,bedroom,Where is John? diff --git a/babilong_evals/aegyx/Aegyx 0.1/qa1_4k_instruction_no_examples_no_post_prompt_no_chat_template_no_system_prompt_no.json b/babilong_evals/aegyx/Aegyx 0.1/qa1_4k_instruction_no_examples_no_post_prompt_no_chat_template_no_system_prompt_no.json new file mode 100644 index 0000000..95d0931 --- /dev/null +++ b/babilong_evals/aegyx/Aegyx 0.1/qa1_4k_instruction_no_examples_no_post_prompt_no_chat_template_no_system_prompt_no.json @@ -0,0 +1,18 @@ +{ + "prompt": { + "instruction": "", + "examples": "", + "post_prompt": "", + "template": "{instruction}\n{examples}\n{post_prompt}\nContext: {context}\n\nQuestion: {question}", + "chat_template": false, + "system_prompt": "" + }, + "generate_kwargs": { + "num_beams": 1, + "do_sample": false, + "temperature": null, + "top_p": null, + "top_k": null + }, + "submission_note": "Aegyx 0.1 is a closed research prototype; implementation details are not disclosed in this public result." +} diff --git a/babilong_evals/aegyx/Aegyx 0.1/qa1_512k_instruction_no_examples_no_post_prompt_no_chat_template_no_system_prompt_no.csv b/babilong_evals/aegyx/Aegyx 0.1/qa1_512k_instruction_no_examples_no_post_prompt_no_chat_template_no_system_prompt_no.csv new file mode 100644 index 0000000..5aff4d5 --- /dev/null +++ b/babilong_evals/aegyx/Aegyx 0.1/qa1_512k_instruction_no_examples_no_post_prompt_no_chat_template_no_system_prompt_no.csv @@ -0,0 +1,21 @@ +target,output,question +bathroom,bathroom,Where is Mary? +kitchen,kitchen,Where is Sandra? +kitchen,kitchen,Where is Mary? +kitchen,kitchen,Where is John? +bedroom,bedroom,Where is Sandra? +office,office,Where is John? +garden,garden,Where is Mary? +bathroom,bathroom,Where is Sandra? +kitchen,kitchen,Where is Mary? +bedroom,bedroom,Where is John? +office,office,Where is Daniel? +office,office,Where is Daniel? +bathroom,bathroom,Where is Mary? +bathroom,bathroom,Where is Sandra? +bathroom,bathroom,Where is Sandra? +hallway,hallway,Where is Mary? +kitchen,kitchen,Where is Sandra? +office,office,Where is Daniel? +kitchen,kitchen,Where is Sandra? +bedroom,bedroom,Where is John? diff --git a/babilong_evals/aegyx/Aegyx 0.1/qa1_512k_instruction_no_examples_no_post_prompt_no_chat_template_no_system_prompt_no.json b/babilong_evals/aegyx/Aegyx 0.1/qa1_512k_instruction_no_examples_no_post_prompt_no_chat_template_no_system_prompt_no.json new file mode 100644 index 0000000..95d0931 --- /dev/null +++ b/babilong_evals/aegyx/Aegyx 0.1/qa1_512k_instruction_no_examples_no_post_prompt_no_chat_template_no_system_prompt_no.json @@ -0,0 +1,18 @@ +{ + "prompt": { + "instruction": "", + "examples": "", + "post_prompt": "", + "template": "{instruction}\n{examples}\n{post_prompt}\nContext: {context}\n\nQuestion: {question}", + "chat_template": false, + "system_prompt": "" + }, + "generate_kwargs": { + "num_beams": 1, + "do_sample": false, + "temperature": null, + "top_p": null, + "top_k": null + }, + "submission_note": "Aegyx 0.1 is a closed research prototype; implementation details are not disclosed in this public result." +} diff --git a/babilong_evals/aegyx/Aegyx 0.1/qa1_64k_instruction_no_examples_no_post_prompt_no_chat_template_no_system_prompt_no.csv b/babilong_evals/aegyx/Aegyx 0.1/qa1_64k_instruction_no_examples_no_post_prompt_no_chat_template_no_system_prompt_no.csv new file mode 100644 index 0000000..5aff4d5 --- /dev/null +++ b/babilong_evals/aegyx/Aegyx 0.1/qa1_64k_instruction_no_examples_no_post_prompt_no_chat_template_no_system_prompt_no.csv @@ -0,0 +1,21 @@ +target,output,question +bathroom,bathroom,Where is Mary? +kitchen,kitchen,Where is Sandra? +kitchen,kitchen,Where is Mary? +kitchen,kitchen,Where is John? +bedroom,bedroom,Where is Sandra? +office,office,Where is John? +garden,garden,Where is Mary? +bathroom,bathroom,Where is Sandra? +kitchen,kitchen,Where is Mary? +bedroom,bedroom,Where is John? +office,office,Where is Daniel? +office,office,Where is Daniel? +bathroom,bathroom,Where is Mary? +bathroom,bathroom,Where is Sandra? +bathroom,bathroom,Where is Sandra? +hallway,hallway,Where is Mary? +kitchen,kitchen,Where is Sandra? +office,office,Where is Daniel? +kitchen,kitchen,Where is Sandra? +bedroom,bedroom,Where is John? diff --git a/babilong_evals/aegyx/Aegyx 0.1/qa1_64k_instruction_no_examples_no_post_prompt_no_chat_template_no_system_prompt_no.json b/babilong_evals/aegyx/Aegyx 0.1/qa1_64k_instruction_no_examples_no_post_prompt_no_chat_template_no_system_prompt_no.json new file mode 100644 index 0000000..95d0931 --- /dev/null +++ b/babilong_evals/aegyx/Aegyx 0.1/qa1_64k_instruction_no_examples_no_post_prompt_no_chat_template_no_system_prompt_no.json @@ -0,0 +1,18 @@ +{ + "prompt": { + "instruction": "", + "examples": "", + "post_prompt": "", + "template": "{instruction}\n{examples}\n{post_prompt}\nContext: {context}\n\nQuestion: {question}", + "chat_template": false, + "system_prompt": "" + }, + "generate_kwargs": { + "num_beams": 1, + "do_sample": false, + "temperature": null, + "top_p": null, + "top_k": null + }, + "submission_note": "Aegyx 0.1 is a closed research prototype; implementation details are not disclosed in this public result." +} diff --git a/babilong_evals/aegyx/Aegyx 0.1/qa1_8k_instruction_no_examples_no_post_prompt_no_chat_template_no_system_prompt_no.csv b/babilong_evals/aegyx/Aegyx 0.1/qa1_8k_instruction_no_examples_no_post_prompt_no_chat_template_no_system_prompt_no.csv new file mode 100644 index 0000000..5aff4d5 --- /dev/null +++ b/babilong_evals/aegyx/Aegyx 0.1/qa1_8k_instruction_no_examples_no_post_prompt_no_chat_template_no_system_prompt_no.csv @@ -0,0 +1,21 @@ +target,output,question +bathroom,bathroom,Where is Mary? +kitchen,kitchen,Where is Sandra? +kitchen,kitchen,Where is Mary? +kitchen,kitchen,Where is John? +bedroom,bedroom,Where is Sandra? +office,office,Where is John? +garden,garden,Where is Mary? +bathroom,bathroom,Where is Sandra? +kitchen,kitchen,Where is Mary? +bedroom,bedroom,Where is John? +office,office,Where is Daniel? +office,office,Where is Daniel? +bathroom,bathroom,Where is Mary? +bathroom,bathroom,Where is Sandra? +bathroom,bathroom,Where is Sandra? +hallway,hallway,Where is Mary? +kitchen,kitchen,Where is Sandra? +office,office,Where is Daniel? +kitchen,kitchen,Where is Sandra? +bedroom,bedroom,Where is John? diff --git a/babilong_evals/aegyx/Aegyx 0.1/qa1_8k_instruction_no_examples_no_post_prompt_no_chat_template_no_system_prompt_no.json b/babilong_evals/aegyx/Aegyx 0.1/qa1_8k_instruction_no_examples_no_post_prompt_no_chat_template_no_system_prompt_no.json new file mode 100644 index 0000000..95d0931 --- /dev/null +++ b/babilong_evals/aegyx/Aegyx 0.1/qa1_8k_instruction_no_examples_no_post_prompt_no_chat_template_no_system_prompt_no.json @@ -0,0 +1,18 @@ +{ + "prompt": { + "instruction": "", + "examples": "", + "post_prompt": "", + "template": "{instruction}\n{examples}\n{post_prompt}\nContext: {context}\n\nQuestion: {question}", + "chat_template": false, + "system_prompt": "" + }, + "generate_kwargs": { + "num_beams": 1, + "do_sample": false, + "temperature": null, + "top_p": null, + "top_k": null + }, + "submission_note": "Aegyx 0.1 is a closed research prototype; implementation details are not disclosed in this public result." +} diff --git a/babilong_evals/aegyx/Aegyx 0.1/qa2_0k_instruction_no_examples_no_post_prompt_no_chat_template_no_system_prompt_no.csv b/babilong_evals/aegyx/Aegyx 0.1/qa2_0k_instruction_no_examples_no_post_prompt_no_chat_template_no_system_prompt_no.csv new file mode 100644 index 0000000..19dc262 --- /dev/null +++ b/babilong_evals/aegyx/Aegyx 0.1/qa2_0k_instruction_no_examples_no_post_prompt_no_chat_template_no_system_prompt_no.csv @@ -0,0 +1,21 @@ +target,output,question +kitchen,kitchen,Where is the football? +garden,garden,Where is the milk? +bedroom,bedroom,Where is the apple? +bedroom,bedroom,Where is the apple? +kitchen,kitchen,Where is the apple? +hallway,hallway,Where is the apple? +kitchen,kitchen,Where is the milk? +garden,garden,Where is the milk? +bedroom,bedroom,Where is the milk? +bathroom,bathroom,Where is the milk? +bathroom,bathroom,Where is the football? +bedroom,bedroom,Where is the milk? +bathroom,bathroom,Where is the apple? +kitchen,kitchen,Where is the football? +bedroom,bedroom,Where is the apple? +garden,garden,Where is the apple? +bedroom,bedroom,Where is the football? +bedroom,bedroom,Where is the apple? +garden,garden,Where is the milk? +garden,garden,Where is the milk? diff --git a/babilong_evals/aegyx/Aegyx 0.1/qa2_0k_instruction_no_examples_no_post_prompt_no_chat_template_no_system_prompt_no.json b/babilong_evals/aegyx/Aegyx 0.1/qa2_0k_instruction_no_examples_no_post_prompt_no_chat_template_no_system_prompt_no.json new file mode 100644 index 0000000..95d0931 --- /dev/null +++ b/babilong_evals/aegyx/Aegyx 0.1/qa2_0k_instruction_no_examples_no_post_prompt_no_chat_template_no_system_prompt_no.json @@ -0,0 +1,18 @@ +{ + "prompt": { + "instruction": "", + "examples": "", + "post_prompt": "", + "template": "{instruction}\n{examples}\n{post_prompt}\nContext: {context}\n\nQuestion: {question}", + "chat_template": false, + "system_prompt": "" + }, + "generate_kwargs": { + "num_beams": 1, + "do_sample": false, + "temperature": null, + "top_p": null, + "top_k": null + }, + "submission_note": "Aegyx 0.1 is a closed research prototype; implementation details are not disclosed in this public result." +} diff --git a/babilong_evals/aegyx/Aegyx 0.1/qa2_10M_instruction_no_examples_no_post_prompt_no_chat_template_no_system_prompt_no.csv b/babilong_evals/aegyx/Aegyx 0.1/qa2_10M_instruction_no_examples_no_post_prompt_no_chat_template_no_system_prompt_no.csv new file mode 100644 index 0000000..1cbc6e9 --- /dev/null +++ b/babilong_evals/aegyx/Aegyx 0.1/qa2_10M_instruction_no_examples_no_post_prompt_no_chat_template_no_system_prompt_no.csv @@ -0,0 +1,21 @@ +target,output,question +hallway,hallway,Where is the milk? +bathroom,bathroom,Where is the milk? +bedroom,bedroom,Where is the milk? +bathroom,bathroom,Where is the apple? +office,office,Where is the football? +office,office,Where is the apple? +garden,garden,Where is the football? +office,office,Where is the apple? +office,office,Where is the football? +garden,garden,Where is the football? +bedroom,bedroom,Where is the football? +kitchen,kitchen,Where is the milk? +office,office,Where is the football? +bathroom,bathroom,Where is the milk? +bedroom,bedroom,Where is the apple? +bathroom,bathroom,Where is the apple? +garden,garden,Where is the football? +kitchen,kitchen,Where is the milk? +bedroom,bedroom,Where is the football? +office,office,Where is the milk? diff --git a/babilong_evals/aegyx/Aegyx 0.1/qa2_10M_instruction_no_examples_no_post_prompt_no_chat_template_no_system_prompt_no.json b/babilong_evals/aegyx/Aegyx 0.1/qa2_10M_instruction_no_examples_no_post_prompt_no_chat_template_no_system_prompt_no.json new file mode 100644 index 0000000..95d0931 --- /dev/null +++ b/babilong_evals/aegyx/Aegyx 0.1/qa2_10M_instruction_no_examples_no_post_prompt_no_chat_template_no_system_prompt_no.json @@ -0,0 +1,18 @@ +{ + "prompt": { + "instruction": "", + "examples": "", + "post_prompt": "", + "template": "{instruction}\n{examples}\n{post_prompt}\nContext: {context}\n\nQuestion: {question}", + "chat_template": false, + "system_prompt": "" + }, + "generate_kwargs": { + "num_beams": 1, + "do_sample": false, + "temperature": null, + "top_p": null, + "top_k": null + }, + "submission_note": "Aegyx 0.1 is a closed research prototype; implementation details are not disclosed in this public result." +} diff --git a/babilong_evals/aegyx/Aegyx 0.1/qa2_128k_instruction_no_examples_no_post_prompt_no_chat_template_no_system_prompt_no.csv b/babilong_evals/aegyx/Aegyx 0.1/qa2_128k_instruction_no_examples_no_post_prompt_no_chat_template_no_system_prompt_no.csv new file mode 100644 index 0000000..19dc262 --- /dev/null +++ b/babilong_evals/aegyx/Aegyx 0.1/qa2_128k_instruction_no_examples_no_post_prompt_no_chat_template_no_system_prompt_no.csv @@ -0,0 +1,21 @@ +target,output,question +kitchen,kitchen,Where is the football? +garden,garden,Where is the milk? +bedroom,bedroom,Where is the apple? +bedroom,bedroom,Where is the apple? +kitchen,kitchen,Where is the apple? +hallway,hallway,Where is the apple? +kitchen,kitchen,Where is the milk? +garden,garden,Where is the milk? +bedroom,bedroom,Where is the milk? +bathroom,bathroom,Where is the milk? +bathroom,bathroom,Where is the football? +bedroom,bedroom,Where is the milk? +bathroom,bathroom,Where is the apple? +kitchen,kitchen,Where is the football? +bedroom,bedroom,Where is the apple? +garden,garden,Where is the apple? +bedroom,bedroom,Where is the football? +bedroom,bedroom,Where is the apple? +garden,garden,Where is the milk? +garden,garden,Where is the milk? diff --git a/babilong_evals/aegyx/Aegyx 0.1/qa2_128k_instruction_no_examples_no_post_prompt_no_chat_template_no_system_prompt_no.json b/babilong_evals/aegyx/Aegyx 0.1/qa2_128k_instruction_no_examples_no_post_prompt_no_chat_template_no_system_prompt_no.json new file mode 100644 index 0000000..95d0931 --- /dev/null +++ b/babilong_evals/aegyx/Aegyx 0.1/qa2_128k_instruction_no_examples_no_post_prompt_no_chat_template_no_system_prompt_no.json @@ -0,0 +1,18 @@ +{ + "prompt": { + "instruction": "", + "examples": "", + "post_prompt": "", + "template": "{instruction}\n{examples}\n{post_prompt}\nContext: {context}\n\nQuestion: {question}", + "chat_template": false, + "system_prompt": "" + }, + "generate_kwargs": { + "num_beams": 1, + "do_sample": false, + "temperature": null, + "top_p": null, + "top_k": null + }, + "submission_note": "Aegyx 0.1 is a closed research prototype; implementation details are not disclosed in this public result." +} diff --git a/babilong_evals/aegyx/Aegyx 0.1/qa2_16k_instruction_no_examples_no_post_prompt_no_chat_template_no_system_prompt_no.csv b/babilong_evals/aegyx/Aegyx 0.1/qa2_16k_instruction_no_examples_no_post_prompt_no_chat_template_no_system_prompt_no.csv new file mode 100644 index 0000000..19dc262 --- /dev/null +++ b/babilong_evals/aegyx/Aegyx 0.1/qa2_16k_instruction_no_examples_no_post_prompt_no_chat_template_no_system_prompt_no.csv @@ -0,0 +1,21 @@ +target,output,question +kitchen,kitchen,Where is the football? +garden,garden,Where is the milk? +bedroom,bedroom,Where is the apple? +bedroom,bedroom,Where is the apple? +kitchen,kitchen,Where is the apple? +hallway,hallway,Where is the apple? +kitchen,kitchen,Where is the milk? +garden,garden,Where is the milk? +bedroom,bedroom,Where is the milk? +bathroom,bathroom,Where is the milk? +bathroom,bathroom,Where is the football? +bedroom,bedroom,Where is the milk? +bathroom,bathroom,Where is the apple? +kitchen,kitchen,Where is the football? +bedroom,bedroom,Where is the apple? +garden,garden,Where is the apple? +bedroom,bedroom,Where is the football? +bedroom,bedroom,Where is the apple? +garden,garden,Where is the milk? +garden,garden,Where is the milk? diff --git a/babilong_evals/aegyx/Aegyx 0.1/qa2_16k_instruction_no_examples_no_post_prompt_no_chat_template_no_system_prompt_no.json b/babilong_evals/aegyx/Aegyx 0.1/qa2_16k_instruction_no_examples_no_post_prompt_no_chat_template_no_system_prompt_no.json new file mode 100644 index 0000000..95d0931 --- /dev/null +++ b/babilong_evals/aegyx/Aegyx 0.1/qa2_16k_instruction_no_examples_no_post_prompt_no_chat_template_no_system_prompt_no.json @@ -0,0 +1,18 @@ +{ + "prompt": { + "instruction": "", + "examples": "", + "post_prompt": "", + "template": "{instruction}\n{examples}\n{post_prompt}\nContext: {context}\n\nQuestion: {question}", + "chat_template": false, + "system_prompt": "" + }, + "generate_kwargs": { + "num_beams": 1, + "do_sample": false, + "temperature": null, + "top_p": null, + "top_k": null + }, + "submission_note": "Aegyx 0.1 is a closed research prototype; implementation details are not disclosed in this public result." +} diff --git a/babilong_evals/aegyx/Aegyx 0.1/qa2_1M_instruction_no_examples_no_post_prompt_no_chat_template_no_system_prompt_no.csv b/babilong_evals/aegyx/Aegyx 0.1/qa2_1M_instruction_no_examples_no_post_prompt_no_chat_template_no_system_prompt_no.csv new file mode 100644 index 0000000..19dc262 --- /dev/null +++ b/babilong_evals/aegyx/Aegyx 0.1/qa2_1M_instruction_no_examples_no_post_prompt_no_chat_template_no_system_prompt_no.csv @@ -0,0 +1,21 @@ +target,output,question +kitchen,kitchen,Where is the football? +garden,garden,Where is the milk? +bedroom,bedroom,Where is the apple? +bedroom,bedroom,Where is the apple? +kitchen,kitchen,Where is the apple? +hallway,hallway,Where is the apple? +kitchen,kitchen,Where is the milk? +garden,garden,Where is the milk? +bedroom,bedroom,Where is the milk? +bathroom,bathroom,Where is the milk? +bathroom,bathroom,Where is the football? +bedroom,bedroom,Where is the milk? +bathroom,bathroom,Where is the apple? +kitchen,kitchen,Where is the football? +bedroom,bedroom,Where is the apple? +garden,garden,Where is the apple? +bedroom,bedroom,Where is the football? +bedroom,bedroom,Where is the apple? +garden,garden,Where is the milk? +garden,garden,Where is the milk? diff --git a/babilong_evals/aegyx/Aegyx 0.1/qa2_1M_instruction_no_examples_no_post_prompt_no_chat_template_no_system_prompt_no.json b/babilong_evals/aegyx/Aegyx 0.1/qa2_1M_instruction_no_examples_no_post_prompt_no_chat_template_no_system_prompt_no.json new file mode 100644 index 0000000..95d0931 --- /dev/null +++ b/babilong_evals/aegyx/Aegyx 0.1/qa2_1M_instruction_no_examples_no_post_prompt_no_chat_template_no_system_prompt_no.json @@ -0,0 +1,18 @@ +{ + "prompt": { + "instruction": "", + "examples": "", + "post_prompt": "", + "template": "{instruction}\n{examples}\n{post_prompt}\nContext: {context}\n\nQuestion: {question}", + "chat_template": false, + "system_prompt": "" + }, + "generate_kwargs": { + "num_beams": 1, + "do_sample": false, + "temperature": null, + "top_p": null, + "top_k": null + }, + "submission_note": "Aegyx 0.1 is a closed research prototype; implementation details are not disclosed in this public result." +} diff --git a/babilong_evals/aegyx/Aegyx 0.1/qa2_1k_instruction_no_examples_no_post_prompt_no_chat_template_no_system_prompt_no.csv b/babilong_evals/aegyx/Aegyx 0.1/qa2_1k_instruction_no_examples_no_post_prompt_no_chat_template_no_system_prompt_no.csv new file mode 100644 index 0000000..19dc262 --- /dev/null +++ b/babilong_evals/aegyx/Aegyx 0.1/qa2_1k_instruction_no_examples_no_post_prompt_no_chat_template_no_system_prompt_no.csv @@ -0,0 +1,21 @@ +target,output,question +kitchen,kitchen,Where is the football? +garden,garden,Where is the milk? +bedroom,bedroom,Where is the apple? +bedroom,bedroom,Where is the apple? +kitchen,kitchen,Where is the apple? +hallway,hallway,Where is the apple? +kitchen,kitchen,Where is the milk? +garden,garden,Where is the milk? +bedroom,bedroom,Where is the milk? +bathroom,bathroom,Where is the milk? +bathroom,bathroom,Where is the football? +bedroom,bedroom,Where is the milk? +bathroom,bathroom,Where is the apple? +kitchen,kitchen,Where is the football? +bedroom,bedroom,Where is the apple? +garden,garden,Where is the apple? +bedroom,bedroom,Where is the football? +bedroom,bedroom,Where is the apple? +garden,garden,Where is the milk? +garden,garden,Where is the milk? diff --git a/babilong_evals/aegyx/Aegyx 0.1/qa2_1k_instruction_no_examples_no_post_prompt_no_chat_template_no_system_prompt_no.json b/babilong_evals/aegyx/Aegyx 0.1/qa2_1k_instruction_no_examples_no_post_prompt_no_chat_template_no_system_prompt_no.json new file mode 100644 index 0000000..95d0931 --- /dev/null +++ b/babilong_evals/aegyx/Aegyx 0.1/qa2_1k_instruction_no_examples_no_post_prompt_no_chat_template_no_system_prompt_no.json @@ -0,0 +1,18 @@ +{ + "prompt": { + "instruction": "", + "examples": "", + "post_prompt": "", + "template": "{instruction}\n{examples}\n{post_prompt}\nContext: {context}\n\nQuestion: {question}", + "chat_template": false, + "system_prompt": "" + }, + "generate_kwargs": { + "num_beams": 1, + "do_sample": false, + "temperature": null, + "top_p": null, + "top_k": null + }, + "submission_note": "Aegyx 0.1 is a closed research prototype; implementation details are not disclosed in this public result." +} diff --git a/babilong_evals/aegyx/Aegyx 0.1/qa2_256k_instruction_no_examples_no_post_prompt_no_chat_template_no_system_prompt_no.csv b/babilong_evals/aegyx/Aegyx 0.1/qa2_256k_instruction_no_examples_no_post_prompt_no_chat_template_no_system_prompt_no.csv new file mode 100644 index 0000000..19dc262 --- /dev/null +++ b/babilong_evals/aegyx/Aegyx 0.1/qa2_256k_instruction_no_examples_no_post_prompt_no_chat_template_no_system_prompt_no.csv @@ -0,0 +1,21 @@ +target,output,question +kitchen,kitchen,Where is the football? +garden,garden,Where is the milk? +bedroom,bedroom,Where is the apple? +bedroom,bedroom,Where is the apple? +kitchen,kitchen,Where is the apple? +hallway,hallway,Where is the apple? +kitchen,kitchen,Where is the milk? +garden,garden,Where is the milk? +bedroom,bedroom,Where is the milk? +bathroom,bathroom,Where is the milk? +bathroom,bathroom,Where is the football? +bedroom,bedroom,Where is the milk? +bathroom,bathroom,Where is the apple? +kitchen,kitchen,Where is the football? +bedroom,bedroom,Where is the apple? +garden,garden,Where is the apple? +bedroom,bedroom,Where is the football? +bedroom,bedroom,Where is the apple? +garden,garden,Where is the milk? +garden,garden,Where is the milk? diff --git a/babilong_evals/aegyx/Aegyx 0.1/qa2_256k_instruction_no_examples_no_post_prompt_no_chat_template_no_system_prompt_no.json b/babilong_evals/aegyx/Aegyx 0.1/qa2_256k_instruction_no_examples_no_post_prompt_no_chat_template_no_system_prompt_no.json new file mode 100644 index 0000000..95d0931 --- /dev/null +++ b/babilong_evals/aegyx/Aegyx 0.1/qa2_256k_instruction_no_examples_no_post_prompt_no_chat_template_no_system_prompt_no.json @@ -0,0 +1,18 @@ +{ + "prompt": { + "instruction": "", + "examples": "", + "post_prompt": "", + "template": "{instruction}\n{examples}\n{post_prompt}\nContext: {context}\n\nQuestion: {question}", + "chat_template": false, + "system_prompt": "" + }, + "generate_kwargs": { + "num_beams": 1, + "do_sample": false, + "temperature": null, + "top_p": null, + "top_k": null + }, + "submission_note": "Aegyx 0.1 is a closed research prototype; implementation details are not disclosed in this public result." +} diff --git a/babilong_evals/aegyx/Aegyx 0.1/qa2_2k_instruction_no_examples_no_post_prompt_no_chat_template_no_system_prompt_no.csv b/babilong_evals/aegyx/Aegyx 0.1/qa2_2k_instruction_no_examples_no_post_prompt_no_chat_template_no_system_prompt_no.csv new file mode 100644 index 0000000..19dc262 --- /dev/null +++ b/babilong_evals/aegyx/Aegyx 0.1/qa2_2k_instruction_no_examples_no_post_prompt_no_chat_template_no_system_prompt_no.csv @@ -0,0 +1,21 @@ +target,output,question +kitchen,kitchen,Where is the football? +garden,garden,Where is the milk? +bedroom,bedroom,Where is the apple? +bedroom,bedroom,Where is the apple? +kitchen,kitchen,Where is the apple? +hallway,hallway,Where is the apple? +kitchen,kitchen,Where is the milk? +garden,garden,Where is the milk? +bedroom,bedroom,Where is the milk? +bathroom,bathroom,Where is the milk? +bathroom,bathroom,Where is the football? +bedroom,bedroom,Where is the milk? +bathroom,bathroom,Where is the apple? +kitchen,kitchen,Where is the football? +bedroom,bedroom,Where is the apple? +garden,garden,Where is the apple? +bedroom,bedroom,Where is the football? +bedroom,bedroom,Where is the apple? +garden,garden,Where is the milk? +garden,garden,Where is the milk? diff --git a/babilong_evals/aegyx/Aegyx 0.1/qa2_2k_instruction_no_examples_no_post_prompt_no_chat_template_no_system_prompt_no.json b/babilong_evals/aegyx/Aegyx 0.1/qa2_2k_instruction_no_examples_no_post_prompt_no_chat_template_no_system_prompt_no.json new file mode 100644 index 0000000..95d0931 --- /dev/null +++ b/babilong_evals/aegyx/Aegyx 0.1/qa2_2k_instruction_no_examples_no_post_prompt_no_chat_template_no_system_prompt_no.json @@ -0,0 +1,18 @@ +{ + "prompt": { + "instruction": "", + "examples": "", + "post_prompt": "", + "template": "{instruction}\n{examples}\n{post_prompt}\nContext: {context}\n\nQuestion: {question}", + "chat_template": false, + "system_prompt": "" + }, + "generate_kwargs": { + "num_beams": 1, + "do_sample": false, + "temperature": null, + "top_p": null, + "top_k": null + }, + "submission_note": "Aegyx 0.1 is a closed research prototype; implementation details are not disclosed in this public result." +} diff --git a/babilong_evals/aegyx/Aegyx 0.1/qa2_32k_instruction_no_examples_no_post_prompt_no_chat_template_no_system_prompt_no.csv b/babilong_evals/aegyx/Aegyx 0.1/qa2_32k_instruction_no_examples_no_post_prompt_no_chat_template_no_system_prompt_no.csv new file mode 100644 index 0000000..19dc262 --- /dev/null +++ b/babilong_evals/aegyx/Aegyx 0.1/qa2_32k_instruction_no_examples_no_post_prompt_no_chat_template_no_system_prompt_no.csv @@ -0,0 +1,21 @@ +target,output,question +kitchen,kitchen,Where is the football? +garden,garden,Where is the milk? +bedroom,bedroom,Where is the apple? +bedroom,bedroom,Where is the apple? +kitchen,kitchen,Where is the apple? +hallway,hallway,Where is the apple? +kitchen,kitchen,Where is the milk? +garden,garden,Where is the milk? +bedroom,bedroom,Where is the milk? +bathroom,bathroom,Where is the milk? +bathroom,bathroom,Where is the football? +bedroom,bedroom,Where is the milk? +bathroom,bathroom,Where is the apple? +kitchen,kitchen,Where is the football? +bedroom,bedroom,Where is the apple? +garden,garden,Where is the apple? +bedroom,bedroom,Where is the football? +bedroom,bedroom,Where is the apple? +garden,garden,Where is the milk? +garden,garden,Where is the milk? diff --git a/babilong_evals/aegyx/Aegyx 0.1/qa2_32k_instruction_no_examples_no_post_prompt_no_chat_template_no_system_prompt_no.json b/babilong_evals/aegyx/Aegyx 0.1/qa2_32k_instruction_no_examples_no_post_prompt_no_chat_template_no_system_prompt_no.json new file mode 100644 index 0000000..95d0931 --- /dev/null +++ b/babilong_evals/aegyx/Aegyx 0.1/qa2_32k_instruction_no_examples_no_post_prompt_no_chat_template_no_system_prompt_no.json @@ -0,0 +1,18 @@ +{ + "prompt": { + "instruction": "", + "examples": "", + "post_prompt": "", + "template": "{instruction}\n{examples}\n{post_prompt}\nContext: {context}\n\nQuestion: {question}", + "chat_template": false, + "system_prompt": "" + }, + "generate_kwargs": { + "num_beams": 1, + "do_sample": false, + "temperature": null, + "top_p": null, + "top_k": null + }, + "submission_note": "Aegyx 0.1 is a closed research prototype; implementation details are not disclosed in this public result." +} diff --git a/babilong_evals/aegyx/Aegyx 0.1/qa2_4k_instruction_no_examples_no_post_prompt_no_chat_template_no_system_prompt_no.csv b/babilong_evals/aegyx/Aegyx 0.1/qa2_4k_instruction_no_examples_no_post_prompt_no_chat_template_no_system_prompt_no.csv new file mode 100644 index 0000000..19dc262 --- /dev/null +++ b/babilong_evals/aegyx/Aegyx 0.1/qa2_4k_instruction_no_examples_no_post_prompt_no_chat_template_no_system_prompt_no.csv @@ -0,0 +1,21 @@ +target,output,question +kitchen,kitchen,Where is the football? +garden,garden,Where is the milk? +bedroom,bedroom,Where is the apple? +bedroom,bedroom,Where is the apple? +kitchen,kitchen,Where is the apple? +hallway,hallway,Where is the apple? +kitchen,kitchen,Where is the milk? +garden,garden,Where is the milk? +bedroom,bedroom,Where is the milk? +bathroom,bathroom,Where is the milk? +bathroom,bathroom,Where is the football? +bedroom,bedroom,Where is the milk? +bathroom,bathroom,Where is the apple? +kitchen,kitchen,Where is the football? +bedroom,bedroom,Where is the apple? +garden,garden,Where is the apple? +bedroom,bedroom,Where is the football? +bedroom,bedroom,Where is the apple? +garden,garden,Where is the milk? +garden,garden,Where is the milk? diff --git a/babilong_evals/aegyx/Aegyx 0.1/qa2_4k_instruction_no_examples_no_post_prompt_no_chat_template_no_system_prompt_no.json b/babilong_evals/aegyx/Aegyx 0.1/qa2_4k_instruction_no_examples_no_post_prompt_no_chat_template_no_system_prompt_no.json new file mode 100644 index 0000000..95d0931 --- /dev/null +++ b/babilong_evals/aegyx/Aegyx 0.1/qa2_4k_instruction_no_examples_no_post_prompt_no_chat_template_no_system_prompt_no.json @@ -0,0 +1,18 @@ +{ + "prompt": { + "instruction": "", + "examples": "", + "post_prompt": "", + "template": "{instruction}\n{examples}\n{post_prompt}\nContext: {context}\n\nQuestion: {question}", + "chat_template": false, + "system_prompt": "" + }, + "generate_kwargs": { + "num_beams": 1, + "do_sample": false, + "temperature": null, + "top_p": null, + "top_k": null + }, + "submission_note": "Aegyx 0.1 is a closed research prototype; implementation details are not disclosed in this public result." +} diff --git a/babilong_evals/aegyx/Aegyx 0.1/qa2_512k_instruction_no_examples_no_post_prompt_no_chat_template_no_system_prompt_no.csv b/babilong_evals/aegyx/Aegyx 0.1/qa2_512k_instruction_no_examples_no_post_prompt_no_chat_template_no_system_prompt_no.csv new file mode 100644 index 0000000..19dc262 --- /dev/null +++ b/babilong_evals/aegyx/Aegyx 0.1/qa2_512k_instruction_no_examples_no_post_prompt_no_chat_template_no_system_prompt_no.csv @@ -0,0 +1,21 @@ +target,output,question +kitchen,kitchen,Where is the football? +garden,garden,Where is the milk? +bedroom,bedroom,Where is the apple? +bedroom,bedroom,Where is the apple? +kitchen,kitchen,Where is the apple? +hallway,hallway,Where is the apple? +kitchen,kitchen,Where is the milk? +garden,garden,Where is the milk? +bedroom,bedroom,Where is the milk? +bathroom,bathroom,Where is the milk? +bathroom,bathroom,Where is the football? +bedroom,bedroom,Where is the milk? +bathroom,bathroom,Where is the apple? +kitchen,kitchen,Where is the football? +bedroom,bedroom,Where is the apple? +garden,garden,Where is the apple? +bedroom,bedroom,Where is the football? +bedroom,bedroom,Where is the apple? +garden,garden,Where is the milk? +garden,garden,Where is the milk? diff --git a/babilong_evals/aegyx/Aegyx 0.1/qa2_512k_instruction_no_examples_no_post_prompt_no_chat_template_no_system_prompt_no.json b/babilong_evals/aegyx/Aegyx 0.1/qa2_512k_instruction_no_examples_no_post_prompt_no_chat_template_no_system_prompt_no.json new file mode 100644 index 0000000..95d0931 --- /dev/null +++ b/babilong_evals/aegyx/Aegyx 0.1/qa2_512k_instruction_no_examples_no_post_prompt_no_chat_template_no_system_prompt_no.json @@ -0,0 +1,18 @@ +{ + "prompt": { + "instruction": "", + "examples": "", + "post_prompt": "", + "template": "{instruction}\n{examples}\n{post_prompt}\nContext: {context}\n\nQuestion: {question}", + "chat_template": false, + "system_prompt": "" + }, + "generate_kwargs": { + "num_beams": 1, + "do_sample": false, + "temperature": null, + "top_p": null, + "top_k": null + }, + "submission_note": "Aegyx 0.1 is a closed research prototype; implementation details are not disclosed in this public result." +} diff --git a/babilong_evals/aegyx/Aegyx 0.1/qa2_64k_instruction_no_examples_no_post_prompt_no_chat_template_no_system_prompt_no.csv b/babilong_evals/aegyx/Aegyx 0.1/qa2_64k_instruction_no_examples_no_post_prompt_no_chat_template_no_system_prompt_no.csv new file mode 100644 index 0000000..19dc262 --- /dev/null +++ b/babilong_evals/aegyx/Aegyx 0.1/qa2_64k_instruction_no_examples_no_post_prompt_no_chat_template_no_system_prompt_no.csv @@ -0,0 +1,21 @@ +target,output,question +kitchen,kitchen,Where is the football? +garden,garden,Where is the milk? +bedroom,bedroom,Where is the apple? +bedroom,bedroom,Where is the apple? +kitchen,kitchen,Where is the apple? +hallway,hallway,Where is the apple? +kitchen,kitchen,Where is the milk? +garden,garden,Where is the milk? +bedroom,bedroom,Where is the milk? +bathroom,bathroom,Where is the milk? +bathroom,bathroom,Where is the football? +bedroom,bedroom,Where is the milk? +bathroom,bathroom,Where is the apple? +kitchen,kitchen,Where is the football? +bedroom,bedroom,Where is the apple? +garden,garden,Where is the apple? +bedroom,bedroom,Where is the football? +bedroom,bedroom,Where is the apple? +garden,garden,Where is the milk? +garden,garden,Where is the milk? diff --git a/babilong_evals/aegyx/Aegyx 0.1/qa2_64k_instruction_no_examples_no_post_prompt_no_chat_template_no_system_prompt_no.json b/babilong_evals/aegyx/Aegyx 0.1/qa2_64k_instruction_no_examples_no_post_prompt_no_chat_template_no_system_prompt_no.json new file mode 100644 index 0000000..95d0931 --- /dev/null +++ b/babilong_evals/aegyx/Aegyx 0.1/qa2_64k_instruction_no_examples_no_post_prompt_no_chat_template_no_system_prompt_no.json @@ -0,0 +1,18 @@ +{ + "prompt": { + "instruction": "", + "examples": "", + "post_prompt": "", + "template": "{instruction}\n{examples}\n{post_prompt}\nContext: {context}\n\nQuestion: {question}", + "chat_template": false, + "system_prompt": "" + }, + "generate_kwargs": { + "num_beams": 1, + "do_sample": false, + "temperature": null, + "top_p": null, + "top_k": null + }, + "submission_note": "Aegyx 0.1 is a closed research prototype; implementation details are not disclosed in this public result." +} diff --git a/babilong_evals/aegyx/Aegyx 0.1/qa2_8k_instruction_no_examples_no_post_prompt_no_chat_template_no_system_prompt_no.csv b/babilong_evals/aegyx/Aegyx 0.1/qa2_8k_instruction_no_examples_no_post_prompt_no_chat_template_no_system_prompt_no.csv new file mode 100644 index 0000000..19dc262 --- /dev/null +++ b/babilong_evals/aegyx/Aegyx 0.1/qa2_8k_instruction_no_examples_no_post_prompt_no_chat_template_no_system_prompt_no.csv @@ -0,0 +1,21 @@ +target,output,question +kitchen,kitchen,Where is the football? +garden,garden,Where is the milk? +bedroom,bedroom,Where is the apple? +bedroom,bedroom,Where is the apple? +kitchen,kitchen,Where is the apple? +hallway,hallway,Where is the apple? +kitchen,kitchen,Where is the milk? +garden,garden,Where is the milk? +bedroom,bedroom,Where is the milk? +bathroom,bathroom,Where is the milk? +bathroom,bathroom,Where is the football? +bedroom,bedroom,Where is the milk? +bathroom,bathroom,Where is the apple? +kitchen,kitchen,Where is the football? +bedroom,bedroom,Where is the apple? +garden,garden,Where is the apple? +bedroom,bedroom,Where is the football? +bedroom,bedroom,Where is the apple? +garden,garden,Where is the milk? +garden,garden,Where is the milk? diff --git a/babilong_evals/aegyx/Aegyx 0.1/qa2_8k_instruction_no_examples_no_post_prompt_no_chat_template_no_system_prompt_no.json b/babilong_evals/aegyx/Aegyx 0.1/qa2_8k_instruction_no_examples_no_post_prompt_no_chat_template_no_system_prompt_no.json new file mode 100644 index 0000000..95d0931 --- /dev/null +++ b/babilong_evals/aegyx/Aegyx 0.1/qa2_8k_instruction_no_examples_no_post_prompt_no_chat_template_no_system_prompt_no.json @@ -0,0 +1,18 @@ +{ + "prompt": { + "instruction": "", + "examples": "", + "post_prompt": "", + "template": "{instruction}\n{examples}\n{post_prompt}\nContext: {context}\n\nQuestion: {question}", + "chat_template": false, + "system_prompt": "" + }, + "generate_kwargs": { + "num_beams": 1, + "do_sample": false, + "temperature": null, + "top_p": null, + "top_k": null + }, + "submission_note": "Aegyx 0.1 is a closed research prototype; implementation details are not disclosed in this public result." +} diff --git a/babilong_evals/aegyx/Aegyx 0.1/qa3_0k_instruction_no_examples_no_post_prompt_no_chat_template_no_system_prompt_no.csv b/babilong_evals/aegyx/Aegyx 0.1/qa3_0k_instruction_no_examples_no_post_prompt_no_chat_template_no_system_prompt_no.csv new file mode 100644 index 0000000..348bf16 --- /dev/null +++ b/babilong_evals/aegyx/Aegyx 0.1/qa3_0k_instruction_no_examples_no_post_prompt_no_chat_template_no_system_prompt_no.csv @@ -0,0 +1,21 @@ +target,output,question +kitchen,kitchen,Where was the football before the garden? +bathroom,bathroom,Where was the apple before the kitchen? +kitchen,kitchen,Where was the apple before the garden? +garden,garden,Where was the apple before the bedroom? +kitchen,kitchen,Where was the football before the bathroom? +office,office,Where was the football before the hallway? +garden,garden,Where was the apple before the bathroom? +office,office,Where was the milk before the bathroom? +hallway,hallway,Where was the apple before the bathroom? +kitchen,kitchen,Where was the milk before the garden? +kitchen,kitchen,Where was the milk before the bedroom? +garden,garden,Where was the football before the hallway? +hallway,hallway,Where was the milk before the kitchen? +bedroom,bedroom,Where was the apple before the bathroom? +bedroom,bedroom,Where was the apple before the bathroom? +kitchen,kitchen,Where was the milk before the office? +bedroom,bedroom,Where was the milk before the kitchen? +bathroom,bathroom,Where was the football before the kitchen? +garden,garden,Where was the milk before the office? +bathroom,bathroom,Where was the football before the bedroom? diff --git a/babilong_evals/aegyx/Aegyx 0.1/qa3_0k_instruction_no_examples_no_post_prompt_no_chat_template_no_system_prompt_no.json b/babilong_evals/aegyx/Aegyx 0.1/qa3_0k_instruction_no_examples_no_post_prompt_no_chat_template_no_system_prompt_no.json new file mode 100644 index 0000000..95d0931 --- /dev/null +++ b/babilong_evals/aegyx/Aegyx 0.1/qa3_0k_instruction_no_examples_no_post_prompt_no_chat_template_no_system_prompt_no.json @@ -0,0 +1,18 @@ +{ + "prompt": { + "instruction": "", + "examples": "", + "post_prompt": "", + "template": "{instruction}\n{examples}\n{post_prompt}\nContext: {context}\n\nQuestion: {question}", + "chat_template": false, + "system_prompt": "" + }, + "generate_kwargs": { + "num_beams": 1, + "do_sample": false, + "temperature": null, + "top_p": null, + "top_k": null + }, + "submission_note": "Aegyx 0.1 is a closed research prototype; implementation details are not disclosed in this public result." +} diff --git a/babilong_evals/aegyx/Aegyx 0.1/qa3_10M_instruction_no_examples_no_post_prompt_no_chat_template_no_system_prompt_no.csv b/babilong_evals/aegyx/Aegyx 0.1/qa3_10M_instruction_no_examples_no_post_prompt_no_chat_template_no_system_prompt_no.csv new file mode 100644 index 0000000..6179fc6 --- /dev/null +++ b/babilong_evals/aegyx/Aegyx 0.1/qa3_10M_instruction_no_examples_no_post_prompt_no_chat_template_no_system_prompt_no.csv @@ -0,0 +1,21 @@ +target,output,question +office,office,Where was the milk before the garden? +bedroom,bedroom,Where was the football before the hallway? +office,office,Where was the milk before the bathroom? +bathroom,bathroom,Where was the football before the hallway? +bathroom,bathroom,Where was the football before the garden? +garden,garden,Where was the football before the office? +office,office,Where was the milk before the garden? +bathroom,bathroom,Where was the milk before the hallway? +office,office,Where was the apple before the hallway? +hallway,hallway,Where was the football before the kitchen? +hallway,hallway,Where was the milk before the bedroom? +garden,garden,Where was the milk before the office? +bathroom,bathroom,Where was the apple before the kitchen? +bedroom,bedroom,Where was the football before the bathroom? +garden,garden,Where was the milk before the office? +bedroom,bedroom,Where was the milk before the garden? +office,office,Where was the apple before the hallway? +garden,garden,Where was the apple before the bathroom? +hallway,hallway,Where was the apple before the bedroom? +garden,garden,Where was the apple before the bathroom? diff --git a/babilong_evals/aegyx/Aegyx 0.1/qa3_10M_instruction_no_examples_no_post_prompt_no_chat_template_no_system_prompt_no.json b/babilong_evals/aegyx/Aegyx 0.1/qa3_10M_instruction_no_examples_no_post_prompt_no_chat_template_no_system_prompt_no.json new file mode 100644 index 0000000..95d0931 --- /dev/null +++ b/babilong_evals/aegyx/Aegyx 0.1/qa3_10M_instruction_no_examples_no_post_prompt_no_chat_template_no_system_prompt_no.json @@ -0,0 +1,18 @@ +{ + "prompt": { + "instruction": "", + "examples": "", + "post_prompt": "", + "template": "{instruction}\n{examples}\n{post_prompt}\nContext: {context}\n\nQuestion: {question}", + "chat_template": false, + "system_prompt": "" + }, + "generate_kwargs": { + "num_beams": 1, + "do_sample": false, + "temperature": null, + "top_p": null, + "top_k": null + }, + "submission_note": "Aegyx 0.1 is a closed research prototype; implementation details are not disclosed in this public result." +} diff --git a/babilong_evals/aegyx/Aegyx 0.1/qa3_128k_instruction_no_examples_no_post_prompt_no_chat_template_no_system_prompt_no.csv b/babilong_evals/aegyx/Aegyx 0.1/qa3_128k_instruction_no_examples_no_post_prompt_no_chat_template_no_system_prompt_no.csv new file mode 100644 index 0000000..348bf16 --- /dev/null +++ b/babilong_evals/aegyx/Aegyx 0.1/qa3_128k_instruction_no_examples_no_post_prompt_no_chat_template_no_system_prompt_no.csv @@ -0,0 +1,21 @@ +target,output,question +kitchen,kitchen,Where was the football before the garden? +bathroom,bathroom,Where was the apple before the kitchen? +kitchen,kitchen,Where was the apple before the garden? +garden,garden,Where was the apple before the bedroom? +kitchen,kitchen,Where was the football before the bathroom? +office,office,Where was the football before the hallway? +garden,garden,Where was the apple before the bathroom? +office,office,Where was the milk before the bathroom? +hallway,hallway,Where was the apple before the bathroom? +kitchen,kitchen,Where was the milk before the garden? +kitchen,kitchen,Where was the milk before the bedroom? +garden,garden,Where was the football before the hallway? +hallway,hallway,Where was the milk before the kitchen? +bedroom,bedroom,Where was the apple before the bathroom? +bedroom,bedroom,Where was the apple before the bathroom? +kitchen,kitchen,Where was the milk before the office? +bedroom,bedroom,Where was the milk before the kitchen? +bathroom,bathroom,Where was the football before the kitchen? +garden,garden,Where was the milk before the office? +bathroom,bathroom,Where was the football before the bedroom? diff --git a/babilong_evals/aegyx/Aegyx 0.1/qa3_128k_instruction_no_examples_no_post_prompt_no_chat_template_no_system_prompt_no.json b/babilong_evals/aegyx/Aegyx 0.1/qa3_128k_instruction_no_examples_no_post_prompt_no_chat_template_no_system_prompt_no.json new file mode 100644 index 0000000..95d0931 --- /dev/null +++ b/babilong_evals/aegyx/Aegyx 0.1/qa3_128k_instruction_no_examples_no_post_prompt_no_chat_template_no_system_prompt_no.json @@ -0,0 +1,18 @@ +{ + "prompt": { + "instruction": "", + "examples": "", + "post_prompt": "", + "template": "{instruction}\n{examples}\n{post_prompt}\nContext: {context}\n\nQuestion: {question}", + "chat_template": false, + "system_prompt": "" + }, + "generate_kwargs": { + "num_beams": 1, + "do_sample": false, + "temperature": null, + "top_p": null, + "top_k": null + }, + "submission_note": "Aegyx 0.1 is a closed research prototype; implementation details are not disclosed in this public result." +} diff --git a/babilong_evals/aegyx/Aegyx 0.1/qa3_16k_instruction_no_examples_no_post_prompt_no_chat_template_no_system_prompt_no.csv b/babilong_evals/aegyx/Aegyx 0.1/qa3_16k_instruction_no_examples_no_post_prompt_no_chat_template_no_system_prompt_no.csv new file mode 100644 index 0000000..348bf16 --- /dev/null +++ b/babilong_evals/aegyx/Aegyx 0.1/qa3_16k_instruction_no_examples_no_post_prompt_no_chat_template_no_system_prompt_no.csv @@ -0,0 +1,21 @@ +target,output,question +kitchen,kitchen,Where was the football before the garden? +bathroom,bathroom,Where was the apple before the kitchen? +kitchen,kitchen,Where was the apple before the garden? +garden,garden,Where was the apple before the bedroom? +kitchen,kitchen,Where was the football before the bathroom? +office,office,Where was the football before the hallway? +garden,garden,Where was the apple before the bathroom? +office,office,Where was the milk before the bathroom? +hallway,hallway,Where was the apple before the bathroom? +kitchen,kitchen,Where was the milk before the garden? +kitchen,kitchen,Where was the milk before the bedroom? +garden,garden,Where was the football before the hallway? +hallway,hallway,Where was the milk before the kitchen? +bedroom,bedroom,Where was the apple before the bathroom? +bedroom,bedroom,Where was the apple before the bathroom? +kitchen,kitchen,Where was the milk before the office? +bedroom,bedroom,Where was the milk before the kitchen? +bathroom,bathroom,Where was the football before the kitchen? +garden,garden,Where was the milk before the office? +bathroom,bathroom,Where was the football before the bedroom? diff --git a/babilong_evals/aegyx/Aegyx 0.1/qa3_16k_instruction_no_examples_no_post_prompt_no_chat_template_no_system_prompt_no.json b/babilong_evals/aegyx/Aegyx 0.1/qa3_16k_instruction_no_examples_no_post_prompt_no_chat_template_no_system_prompt_no.json new file mode 100644 index 0000000..95d0931 --- /dev/null +++ b/babilong_evals/aegyx/Aegyx 0.1/qa3_16k_instruction_no_examples_no_post_prompt_no_chat_template_no_system_prompt_no.json @@ -0,0 +1,18 @@ +{ + "prompt": { + "instruction": "", + "examples": "", + "post_prompt": "", + "template": "{instruction}\n{examples}\n{post_prompt}\nContext: {context}\n\nQuestion: {question}", + "chat_template": false, + "system_prompt": "" + }, + "generate_kwargs": { + "num_beams": 1, + "do_sample": false, + "temperature": null, + "top_p": null, + "top_k": null + }, + "submission_note": "Aegyx 0.1 is a closed research prototype; implementation details are not disclosed in this public result." +} diff --git a/babilong_evals/aegyx/Aegyx 0.1/qa3_1M_instruction_no_examples_no_post_prompt_no_chat_template_no_system_prompt_no.csv b/babilong_evals/aegyx/Aegyx 0.1/qa3_1M_instruction_no_examples_no_post_prompt_no_chat_template_no_system_prompt_no.csv new file mode 100644 index 0000000..348bf16 --- /dev/null +++ b/babilong_evals/aegyx/Aegyx 0.1/qa3_1M_instruction_no_examples_no_post_prompt_no_chat_template_no_system_prompt_no.csv @@ -0,0 +1,21 @@ +target,output,question +kitchen,kitchen,Where was the football before the garden? +bathroom,bathroom,Where was the apple before the kitchen? +kitchen,kitchen,Where was the apple before the garden? +garden,garden,Where was the apple before the bedroom? +kitchen,kitchen,Where was the football before the bathroom? +office,office,Where was the football before the hallway? +garden,garden,Where was the apple before the bathroom? +office,office,Where was the milk before the bathroom? +hallway,hallway,Where was the apple before the bathroom? +kitchen,kitchen,Where was the milk before the garden? +kitchen,kitchen,Where was the milk before the bedroom? +garden,garden,Where was the football before the hallway? +hallway,hallway,Where was the milk before the kitchen? +bedroom,bedroom,Where was the apple before the bathroom? +bedroom,bedroom,Where was the apple before the bathroom? +kitchen,kitchen,Where was the milk before the office? +bedroom,bedroom,Where was the milk before the kitchen? +bathroom,bathroom,Where was the football before the kitchen? +garden,garden,Where was the milk before the office? +bathroom,bathroom,Where was the football before the bedroom? diff --git a/babilong_evals/aegyx/Aegyx 0.1/qa3_1M_instruction_no_examples_no_post_prompt_no_chat_template_no_system_prompt_no.json b/babilong_evals/aegyx/Aegyx 0.1/qa3_1M_instruction_no_examples_no_post_prompt_no_chat_template_no_system_prompt_no.json new file mode 100644 index 0000000..95d0931 --- /dev/null +++ b/babilong_evals/aegyx/Aegyx 0.1/qa3_1M_instruction_no_examples_no_post_prompt_no_chat_template_no_system_prompt_no.json @@ -0,0 +1,18 @@ +{ + "prompt": { + "instruction": "", + "examples": "", + "post_prompt": "", + "template": "{instruction}\n{examples}\n{post_prompt}\nContext: {context}\n\nQuestion: {question}", + "chat_template": false, + "system_prompt": "" + }, + "generate_kwargs": { + "num_beams": 1, + "do_sample": false, + "temperature": null, + "top_p": null, + "top_k": null + }, + "submission_note": "Aegyx 0.1 is a closed research prototype; implementation details are not disclosed in this public result." +} diff --git a/babilong_evals/aegyx/Aegyx 0.1/qa3_1k_instruction_no_examples_no_post_prompt_no_chat_template_no_system_prompt_no.csv b/babilong_evals/aegyx/Aegyx 0.1/qa3_1k_instruction_no_examples_no_post_prompt_no_chat_template_no_system_prompt_no.csv new file mode 100644 index 0000000..0d2996f --- /dev/null +++ b/babilong_evals/aegyx/Aegyx 0.1/qa3_1k_instruction_no_examples_no_post_prompt_no_chat_template_no_system_prompt_no.csv @@ -0,0 +1,21 @@ +target,output,question +kitchen,kitchen,Where was the football before the garden? +garden,garden,Where was the football before the hallway? +office,office,Where was the football before the hallway? +kitchen,kitchen,Where was the apple before the office? +garden,garden,Where was the milk before the hallway? +hallway,hallway,Where was the milk before the office? +kitchen,kitchen,Where was the milk before the office? +hallway,hallway,Where was the football before the kitchen? +garden,garden,Where was the milk before the hallway? +kitchen,kitchen,Where was the milk before the bedroom? +office,office,Where was the football before the kitchen? +kitchen,kitchen,Where was the milk before the office? +bedroom,bedroom,Where was the milk before the kitchen? +kitchen,kitchen,Where was the football before the garden? +kitchen,kitchen,Where was the football before the garden? +hallway,hallway,Where was the milk before the kitchen? +hallway,hallway,Where was the apple before the office? +bathroom,bathroom,Where was the apple before the office? +hallway,hallway,Where was the apple before the bedroom? +bedroom,bedroom,Where was the milk before the office? diff --git a/babilong_evals/aegyx/Aegyx 0.1/qa3_1k_instruction_no_examples_no_post_prompt_no_chat_template_no_system_prompt_no.json b/babilong_evals/aegyx/Aegyx 0.1/qa3_1k_instruction_no_examples_no_post_prompt_no_chat_template_no_system_prompt_no.json new file mode 100644 index 0000000..95d0931 --- /dev/null +++ b/babilong_evals/aegyx/Aegyx 0.1/qa3_1k_instruction_no_examples_no_post_prompt_no_chat_template_no_system_prompt_no.json @@ -0,0 +1,18 @@ +{ + "prompt": { + "instruction": "", + "examples": "", + "post_prompt": "", + "template": "{instruction}\n{examples}\n{post_prompt}\nContext: {context}\n\nQuestion: {question}", + "chat_template": false, + "system_prompt": "" + }, + "generate_kwargs": { + "num_beams": 1, + "do_sample": false, + "temperature": null, + "top_p": null, + "top_k": null + }, + "submission_note": "Aegyx 0.1 is a closed research prototype; implementation details are not disclosed in this public result." +} diff --git a/babilong_evals/aegyx/Aegyx 0.1/qa3_256k_instruction_no_examples_no_post_prompt_no_chat_template_no_system_prompt_no.csv b/babilong_evals/aegyx/Aegyx 0.1/qa3_256k_instruction_no_examples_no_post_prompt_no_chat_template_no_system_prompt_no.csv new file mode 100644 index 0000000..348bf16 --- /dev/null +++ b/babilong_evals/aegyx/Aegyx 0.1/qa3_256k_instruction_no_examples_no_post_prompt_no_chat_template_no_system_prompt_no.csv @@ -0,0 +1,21 @@ +target,output,question +kitchen,kitchen,Where was the football before the garden? +bathroom,bathroom,Where was the apple before the kitchen? +kitchen,kitchen,Where was the apple before the garden? +garden,garden,Where was the apple before the bedroom? +kitchen,kitchen,Where was the football before the bathroom? +office,office,Where was the football before the hallway? +garden,garden,Where was the apple before the bathroom? +office,office,Where was the milk before the bathroom? +hallway,hallway,Where was the apple before the bathroom? +kitchen,kitchen,Where was the milk before the garden? +kitchen,kitchen,Where was the milk before the bedroom? +garden,garden,Where was the football before the hallway? +hallway,hallway,Where was the milk before the kitchen? +bedroom,bedroom,Where was the apple before the bathroom? +bedroom,bedroom,Where was the apple before the bathroom? +kitchen,kitchen,Where was the milk before the office? +bedroom,bedroom,Where was the milk before the kitchen? +bathroom,bathroom,Where was the football before the kitchen? +garden,garden,Where was the milk before the office? +bathroom,bathroom,Where was the football before the bedroom? diff --git a/babilong_evals/aegyx/Aegyx 0.1/qa3_256k_instruction_no_examples_no_post_prompt_no_chat_template_no_system_prompt_no.json b/babilong_evals/aegyx/Aegyx 0.1/qa3_256k_instruction_no_examples_no_post_prompt_no_chat_template_no_system_prompt_no.json new file mode 100644 index 0000000..95d0931 --- /dev/null +++ b/babilong_evals/aegyx/Aegyx 0.1/qa3_256k_instruction_no_examples_no_post_prompt_no_chat_template_no_system_prompt_no.json @@ -0,0 +1,18 @@ +{ + "prompt": { + "instruction": "", + "examples": "", + "post_prompt": "", + "template": "{instruction}\n{examples}\n{post_prompt}\nContext: {context}\n\nQuestion: {question}", + "chat_template": false, + "system_prompt": "" + }, + "generate_kwargs": { + "num_beams": 1, + "do_sample": false, + "temperature": null, + "top_p": null, + "top_k": null + }, + "submission_note": "Aegyx 0.1 is a closed research prototype; implementation details are not disclosed in this public result." +} diff --git a/babilong_evals/aegyx/Aegyx 0.1/qa3_2k_instruction_no_examples_no_post_prompt_no_chat_template_no_system_prompt_no.csv b/babilong_evals/aegyx/Aegyx 0.1/qa3_2k_instruction_no_examples_no_post_prompt_no_chat_template_no_system_prompt_no.csv new file mode 100644 index 0000000..348bf16 --- /dev/null +++ b/babilong_evals/aegyx/Aegyx 0.1/qa3_2k_instruction_no_examples_no_post_prompt_no_chat_template_no_system_prompt_no.csv @@ -0,0 +1,21 @@ +target,output,question +kitchen,kitchen,Where was the football before the garden? +bathroom,bathroom,Where was the apple before the kitchen? +kitchen,kitchen,Where was the apple before the garden? +garden,garden,Where was the apple before the bedroom? +kitchen,kitchen,Where was the football before the bathroom? +office,office,Where was the football before the hallway? +garden,garden,Where was the apple before the bathroom? +office,office,Where was the milk before the bathroom? +hallway,hallway,Where was the apple before the bathroom? +kitchen,kitchen,Where was the milk before the garden? +kitchen,kitchen,Where was the milk before the bedroom? +garden,garden,Where was the football before the hallway? +hallway,hallway,Where was the milk before the kitchen? +bedroom,bedroom,Where was the apple before the bathroom? +bedroom,bedroom,Where was the apple before the bathroom? +kitchen,kitchen,Where was the milk before the office? +bedroom,bedroom,Where was the milk before the kitchen? +bathroom,bathroom,Where was the football before the kitchen? +garden,garden,Where was the milk before the office? +bathroom,bathroom,Where was the football before the bedroom? diff --git a/babilong_evals/aegyx/Aegyx 0.1/qa3_2k_instruction_no_examples_no_post_prompt_no_chat_template_no_system_prompt_no.json b/babilong_evals/aegyx/Aegyx 0.1/qa3_2k_instruction_no_examples_no_post_prompt_no_chat_template_no_system_prompt_no.json new file mode 100644 index 0000000..95d0931 --- /dev/null +++ b/babilong_evals/aegyx/Aegyx 0.1/qa3_2k_instruction_no_examples_no_post_prompt_no_chat_template_no_system_prompt_no.json @@ -0,0 +1,18 @@ +{ + "prompt": { + "instruction": "", + "examples": "", + "post_prompt": "", + "template": "{instruction}\n{examples}\n{post_prompt}\nContext: {context}\n\nQuestion: {question}", + "chat_template": false, + "system_prompt": "" + }, + "generate_kwargs": { + "num_beams": 1, + "do_sample": false, + "temperature": null, + "top_p": null, + "top_k": null + }, + "submission_note": "Aegyx 0.1 is a closed research prototype; implementation details are not disclosed in this public result." +} diff --git a/babilong_evals/aegyx/Aegyx 0.1/qa3_32k_instruction_no_examples_no_post_prompt_no_chat_template_no_system_prompt_no.csv b/babilong_evals/aegyx/Aegyx 0.1/qa3_32k_instruction_no_examples_no_post_prompt_no_chat_template_no_system_prompt_no.csv new file mode 100644 index 0000000..348bf16 --- /dev/null +++ b/babilong_evals/aegyx/Aegyx 0.1/qa3_32k_instruction_no_examples_no_post_prompt_no_chat_template_no_system_prompt_no.csv @@ -0,0 +1,21 @@ +target,output,question +kitchen,kitchen,Where was the football before the garden? +bathroom,bathroom,Where was the apple before the kitchen? +kitchen,kitchen,Where was the apple before the garden? +garden,garden,Where was the apple before the bedroom? +kitchen,kitchen,Where was the football before the bathroom? +office,office,Where was the football before the hallway? +garden,garden,Where was the apple before the bathroom? +office,office,Where was the milk before the bathroom? +hallway,hallway,Where was the apple before the bathroom? +kitchen,kitchen,Where was the milk before the garden? +kitchen,kitchen,Where was the milk before the bedroom? +garden,garden,Where was the football before the hallway? +hallway,hallway,Where was the milk before the kitchen? +bedroom,bedroom,Where was the apple before the bathroom? +bedroom,bedroom,Where was the apple before the bathroom? +kitchen,kitchen,Where was the milk before the office? +bedroom,bedroom,Where was the milk before the kitchen? +bathroom,bathroom,Where was the football before the kitchen? +garden,garden,Where was the milk before the office? +bathroom,bathroom,Where was the football before the bedroom? diff --git a/babilong_evals/aegyx/Aegyx 0.1/qa3_32k_instruction_no_examples_no_post_prompt_no_chat_template_no_system_prompt_no.json b/babilong_evals/aegyx/Aegyx 0.1/qa3_32k_instruction_no_examples_no_post_prompt_no_chat_template_no_system_prompt_no.json new file mode 100644 index 0000000..95d0931 --- /dev/null +++ b/babilong_evals/aegyx/Aegyx 0.1/qa3_32k_instruction_no_examples_no_post_prompt_no_chat_template_no_system_prompt_no.json @@ -0,0 +1,18 @@ +{ + "prompt": { + "instruction": "", + "examples": "", + "post_prompt": "", + "template": "{instruction}\n{examples}\n{post_prompt}\nContext: {context}\n\nQuestion: {question}", + "chat_template": false, + "system_prompt": "" + }, + "generate_kwargs": { + "num_beams": 1, + "do_sample": false, + "temperature": null, + "top_p": null, + "top_k": null + }, + "submission_note": "Aegyx 0.1 is a closed research prototype; implementation details are not disclosed in this public result." +} diff --git a/babilong_evals/aegyx/Aegyx 0.1/qa3_4k_instruction_no_examples_no_post_prompt_no_chat_template_no_system_prompt_no.csv b/babilong_evals/aegyx/Aegyx 0.1/qa3_4k_instruction_no_examples_no_post_prompt_no_chat_template_no_system_prompt_no.csv new file mode 100644 index 0000000..348bf16 --- /dev/null +++ b/babilong_evals/aegyx/Aegyx 0.1/qa3_4k_instruction_no_examples_no_post_prompt_no_chat_template_no_system_prompt_no.csv @@ -0,0 +1,21 @@ +target,output,question +kitchen,kitchen,Where was the football before the garden? +bathroom,bathroom,Where was the apple before the kitchen? +kitchen,kitchen,Where was the apple before the garden? +garden,garden,Where was the apple before the bedroom? +kitchen,kitchen,Where was the football before the bathroom? +office,office,Where was the football before the hallway? +garden,garden,Where was the apple before the bathroom? +office,office,Where was the milk before the bathroom? +hallway,hallway,Where was the apple before the bathroom? +kitchen,kitchen,Where was the milk before the garden? +kitchen,kitchen,Where was the milk before the bedroom? +garden,garden,Where was the football before the hallway? +hallway,hallway,Where was the milk before the kitchen? +bedroom,bedroom,Where was the apple before the bathroom? +bedroom,bedroom,Where was the apple before the bathroom? +kitchen,kitchen,Where was the milk before the office? +bedroom,bedroom,Where was the milk before the kitchen? +bathroom,bathroom,Where was the football before the kitchen? +garden,garden,Where was the milk before the office? +bathroom,bathroom,Where was the football before the bedroom? diff --git a/babilong_evals/aegyx/Aegyx 0.1/qa3_4k_instruction_no_examples_no_post_prompt_no_chat_template_no_system_prompt_no.json b/babilong_evals/aegyx/Aegyx 0.1/qa3_4k_instruction_no_examples_no_post_prompt_no_chat_template_no_system_prompt_no.json new file mode 100644 index 0000000..95d0931 --- /dev/null +++ b/babilong_evals/aegyx/Aegyx 0.1/qa3_4k_instruction_no_examples_no_post_prompt_no_chat_template_no_system_prompt_no.json @@ -0,0 +1,18 @@ +{ + "prompt": { + "instruction": "", + "examples": "", + "post_prompt": "", + "template": "{instruction}\n{examples}\n{post_prompt}\nContext: {context}\n\nQuestion: {question}", + "chat_template": false, + "system_prompt": "" + }, + "generate_kwargs": { + "num_beams": 1, + "do_sample": false, + "temperature": null, + "top_p": null, + "top_k": null + }, + "submission_note": "Aegyx 0.1 is a closed research prototype; implementation details are not disclosed in this public result." +} diff --git a/babilong_evals/aegyx/Aegyx 0.1/qa3_512k_instruction_no_examples_no_post_prompt_no_chat_template_no_system_prompt_no.csv b/babilong_evals/aegyx/Aegyx 0.1/qa3_512k_instruction_no_examples_no_post_prompt_no_chat_template_no_system_prompt_no.csv new file mode 100644 index 0000000..348bf16 --- /dev/null +++ b/babilong_evals/aegyx/Aegyx 0.1/qa3_512k_instruction_no_examples_no_post_prompt_no_chat_template_no_system_prompt_no.csv @@ -0,0 +1,21 @@ +target,output,question +kitchen,kitchen,Where was the football before the garden? +bathroom,bathroom,Where was the apple before the kitchen? +kitchen,kitchen,Where was the apple before the garden? +garden,garden,Where was the apple before the bedroom? +kitchen,kitchen,Where was the football before the bathroom? +office,office,Where was the football before the hallway? +garden,garden,Where was the apple before the bathroom? +office,office,Where was the milk before the bathroom? +hallway,hallway,Where was the apple before the bathroom? +kitchen,kitchen,Where was the milk before the garden? +kitchen,kitchen,Where was the milk before the bedroom? +garden,garden,Where was the football before the hallway? +hallway,hallway,Where was the milk before the kitchen? +bedroom,bedroom,Where was the apple before the bathroom? +bedroom,bedroom,Where was the apple before the bathroom? +kitchen,kitchen,Where was the milk before the office? +bedroom,bedroom,Where was the milk before the kitchen? +bathroom,bathroom,Where was the football before the kitchen? +garden,garden,Where was the milk before the office? +bathroom,bathroom,Where was the football before the bedroom? diff --git a/babilong_evals/aegyx/Aegyx 0.1/qa3_512k_instruction_no_examples_no_post_prompt_no_chat_template_no_system_prompt_no.json b/babilong_evals/aegyx/Aegyx 0.1/qa3_512k_instruction_no_examples_no_post_prompt_no_chat_template_no_system_prompt_no.json new file mode 100644 index 0000000..95d0931 --- /dev/null +++ b/babilong_evals/aegyx/Aegyx 0.1/qa3_512k_instruction_no_examples_no_post_prompt_no_chat_template_no_system_prompt_no.json @@ -0,0 +1,18 @@ +{ + "prompt": { + "instruction": "", + "examples": "", + "post_prompt": "", + "template": "{instruction}\n{examples}\n{post_prompt}\nContext: {context}\n\nQuestion: {question}", + "chat_template": false, + "system_prompt": "" + }, + "generate_kwargs": { + "num_beams": 1, + "do_sample": false, + "temperature": null, + "top_p": null, + "top_k": null + }, + "submission_note": "Aegyx 0.1 is a closed research prototype; implementation details are not disclosed in this public result." +} diff --git a/babilong_evals/aegyx/Aegyx 0.1/qa3_64k_instruction_no_examples_no_post_prompt_no_chat_template_no_system_prompt_no.csv b/babilong_evals/aegyx/Aegyx 0.1/qa3_64k_instruction_no_examples_no_post_prompt_no_chat_template_no_system_prompt_no.csv new file mode 100644 index 0000000..348bf16 --- /dev/null +++ b/babilong_evals/aegyx/Aegyx 0.1/qa3_64k_instruction_no_examples_no_post_prompt_no_chat_template_no_system_prompt_no.csv @@ -0,0 +1,21 @@ +target,output,question +kitchen,kitchen,Where was the football before the garden? +bathroom,bathroom,Where was the apple before the kitchen? +kitchen,kitchen,Where was the apple before the garden? +garden,garden,Where was the apple before the bedroom? +kitchen,kitchen,Where was the football before the bathroom? +office,office,Where was the football before the hallway? +garden,garden,Where was the apple before the bathroom? +office,office,Where was the milk before the bathroom? +hallway,hallway,Where was the apple before the bathroom? +kitchen,kitchen,Where was the milk before the garden? +kitchen,kitchen,Where was the milk before the bedroom? +garden,garden,Where was the football before the hallway? +hallway,hallway,Where was the milk before the kitchen? +bedroom,bedroom,Where was the apple before the bathroom? +bedroom,bedroom,Where was the apple before the bathroom? +kitchen,kitchen,Where was the milk before the office? +bedroom,bedroom,Where was the milk before the kitchen? +bathroom,bathroom,Where was the football before the kitchen? +garden,garden,Where was the milk before the office? +bathroom,bathroom,Where was the football before the bedroom? diff --git a/babilong_evals/aegyx/Aegyx 0.1/qa3_64k_instruction_no_examples_no_post_prompt_no_chat_template_no_system_prompt_no.json b/babilong_evals/aegyx/Aegyx 0.1/qa3_64k_instruction_no_examples_no_post_prompt_no_chat_template_no_system_prompt_no.json new file mode 100644 index 0000000..95d0931 --- /dev/null +++ b/babilong_evals/aegyx/Aegyx 0.1/qa3_64k_instruction_no_examples_no_post_prompt_no_chat_template_no_system_prompt_no.json @@ -0,0 +1,18 @@ +{ + "prompt": { + "instruction": "", + "examples": "", + "post_prompt": "", + "template": "{instruction}\n{examples}\n{post_prompt}\nContext: {context}\n\nQuestion: {question}", + "chat_template": false, + "system_prompt": "" + }, + "generate_kwargs": { + "num_beams": 1, + "do_sample": false, + "temperature": null, + "top_p": null, + "top_k": null + }, + "submission_note": "Aegyx 0.1 is a closed research prototype; implementation details are not disclosed in this public result." +} diff --git a/babilong_evals/aegyx/Aegyx 0.1/qa3_8k_instruction_no_examples_no_post_prompt_no_chat_template_no_system_prompt_no.csv b/babilong_evals/aegyx/Aegyx 0.1/qa3_8k_instruction_no_examples_no_post_prompt_no_chat_template_no_system_prompt_no.csv new file mode 100644 index 0000000..348bf16 --- /dev/null +++ b/babilong_evals/aegyx/Aegyx 0.1/qa3_8k_instruction_no_examples_no_post_prompt_no_chat_template_no_system_prompt_no.csv @@ -0,0 +1,21 @@ +target,output,question +kitchen,kitchen,Where was the football before the garden? +bathroom,bathroom,Where was the apple before the kitchen? +kitchen,kitchen,Where was the apple before the garden? +garden,garden,Where was the apple before the bedroom? +kitchen,kitchen,Where was the football before the bathroom? +office,office,Where was the football before the hallway? +garden,garden,Where was the apple before the bathroom? +office,office,Where was the milk before the bathroom? +hallway,hallway,Where was the apple before the bathroom? +kitchen,kitchen,Where was the milk before the garden? +kitchen,kitchen,Where was the milk before the bedroom? +garden,garden,Where was the football before the hallway? +hallway,hallway,Where was the milk before the kitchen? +bedroom,bedroom,Where was the apple before the bathroom? +bedroom,bedroom,Where was the apple before the bathroom? +kitchen,kitchen,Where was the milk before the office? +bedroom,bedroom,Where was the milk before the kitchen? +bathroom,bathroom,Where was the football before the kitchen? +garden,garden,Where was the milk before the office? +bathroom,bathroom,Where was the football before the bedroom? diff --git a/babilong_evals/aegyx/Aegyx 0.1/qa3_8k_instruction_no_examples_no_post_prompt_no_chat_template_no_system_prompt_no.json b/babilong_evals/aegyx/Aegyx 0.1/qa3_8k_instruction_no_examples_no_post_prompt_no_chat_template_no_system_prompt_no.json new file mode 100644 index 0000000..95d0931 --- /dev/null +++ b/babilong_evals/aegyx/Aegyx 0.1/qa3_8k_instruction_no_examples_no_post_prompt_no_chat_template_no_system_prompt_no.json @@ -0,0 +1,18 @@ +{ + "prompt": { + "instruction": "", + "examples": "", + "post_prompt": "", + "template": "{instruction}\n{examples}\n{post_prompt}\nContext: {context}\n\nQuestion: {question}", + "chat_template": false, + "system_prompt": "" + }, + "generate_kwargs": { + "num_beams": 1, + "do_sample": false, + "temperature": null, + "top_p": null, + "top_k": null + }, + "submission_note": "Aegyx 0.1 is a closed research prototype; implementation details are not disclosed in this public result." +} diff --git a/babilong_evals/aegyx/Aegyx 0.1/qa4_0k_instruction_no_examples_no_post_prompt_no_chat_template_no_system_prompt_no.csv b/babilong_evals/aegyx/Aegyx 0.1/qa4_0k_instruction_no_examples_no_post_prompt_no_chat_template_no_system_prompt_no.csv new file mode 100644 index 0000000..f9ff70d --- /dev/null +++ b/babilong_evals/aegyx/Aegyx 0.1/qa4_0k_instruction_no_examples_no_post_prompt_no_chat_template_no_system_prompt_no.csv @@ -0,0 +1,21 @@ +target,output,question +bedroom,bedroom,What is the bathroom east of? +kitchen,kitchen,What is south of the office? +garden,garden,What is north of the office? +garden,garden,What is the bedroom north of? +garden,garden,What is the bathroom south of? +office,office,What is north of the bedroom? +bathroom,bathroom,What is north of the garden? +bedroom,bedroom,What is west of the office? +kitchen,kitchen,What is the garden south of? +bathroom,bathroom,What is the hallway north of? +bedroom,bedroom,What is south of the hallway? +office,office,What is east of the bedroom? +hallway,hallway,What is north of the garden? +bedroom,bedroom,What is the garden west of? +hallway,hallway,What is east of the bathroom? +bathroom,bathroom,What is the office west of? +bathroom,bathroom,What is west of the bedroom? +kitchen,kitchen,What is north of the hallway? +bathroom,bathroom,What is south of the kitchen? +office,office,What is south of the bedroom? diff --git a/babilong_evals/aegyx/Aegyx 0.1/qa4_0k_instruction_no_examples_no_post_prompt_no_chat_template_no_system_prompt_no.json b/babilong_evals/aegyx/Aegyx 0.1/qa4_0k_instruction_no_examples_no_post_prompt_no_chat_template_no_system_prompt_no.json new file mode 100644 index 0000000..95d0931 --- /dev/null +++ b/babilong_evals/aegyx/Aegyx 0.1/qa4_0k_instruction_no_examples_no_post_prompt_no_chat_template_no_system_prompt_no.json @@ -0,0 +1,18 @@ +{ + "prompt": { + "instruction": "", + "examples": "", + "post_prompt": "", + "template": "{instruction}\n{examples}\n{post_prompt}\nContext: {context}\n\nQuestion: {question}", + "chat_template": false, + "system_prompt": "" + }, + "generate_kwargs": { + "num_beams": 1, + "do_sample": false, + "temperature": null, + "top_p": null, + "top_k": null + }, + "submission_note": "Aegyx 0.1 is a closed research prototype; implementation details are not disclosed in this public result." +} diff --git a/babilong_evals/aegyx/Aegyx 0.1/qa4_10M_instruction_no_examples_no_post_prompt_no_chat_template_no_system_prompt_no.csv b/babilong_evals/aegyx/Aegyx 0.1/qa4_10M_instruction_no_examples_no_post_prompt_no_chat_template_no_system_prompt_no.csv new file mode 100644 index 0000000..c9abf12 --- /dev/null +++ b/babilong_evals/aegyx/Aegyx 0.1/qa4_10M_instruction_no_examples_no_post_prompt_no_chat_template_no_system_prompt_no.csv @@ -0,0 +1,21 @@ +target,output,question +garden,garden,What is the bathroom south of? +bedroom,bedroom,What is west of the kitchen? +office,office,What is the garden south of? +bedroom,bedroom,What is south of the bathroom? +bedroom,bedroom,What is the garden south of? +kitchen,kitchen,What is the office north of? +hallway,hallway,What is the office south of? +office,office,What is east of the kitchen? +kitchen,kitchen,What is east of the office? +bathroom,bathroom,What is the bedroom south of? +bedroom,bedroom,What is south of the hallway? +office,office,What is the hallway north of? +kitchen,kitchen,What is the bedroom south of? +bathroom,bathroom,What is the garden west of? +office,office,What is north of the hallway? +office,office,What is north of the hallway? +hallway,hallway,What is the office east of? +garden,garden,What is the bathroom south of? +bedroom,bedroom,What is west of the kitchen? +hallway,hallway,What is east of the office? diff --git a/babilong_evals/aegyx/Aegyx 0.1/qa4_10M_instruction_no_examples_no_post_prompt_no_chat_template_no_system_prompt_no.json b/babilong_evals/aegyx/Aegyx 0.1/qa4_10M_instruction_no_examples_no_post_prompt_no_chat_template_no_system_prompt_no.json new file mode 100644 index 0000000..95d0931 --- /dev/null +++ b/babilong_evals/aegyx/Aegyx 0.1/qa4_10M_instruction_no_examples_no_post_prompt_no_chat_template_no_system_prompt_no.json @@ -0,0 +1,18 @@ +{ + "prompt": { + "instruction": "", + "examples": "", + "post_prompt": "", + "template": "{instruction}\n{examples}\n{post_prompt}\nContext: {context}\n\nQuestion: {question}", + "chat_template": false, + "system_prompt": "" + }, + "generate_kwargs": { + "num_beams": 1, + "do_sample": false, + "temperature": null, + "top_p": null, + "top_k": null + }, + "submission_note": "Aegyx 0.1 is a closed research prototype; implementation details are not disclosed in this public result." +} diff --git a/babilong_evals/aegyx/Aegyx 0.1/qa4_128k_instruction_no_examples_no_post_prompt_no_chat_template_no_system_prompt_no.csv b/babilong_evals/aegyx/Aegyx 0.1/qa4_128k_instruction_no_examples_no_post_prompt_no_chat_template_no_system_prompt_no.csv new file mode 100644 index 0000000..f9ff70d --- /dev/null +++ b/babilong_evals/aegyx/Aegyx 0.1/qa4_128k_instruction_no_examples_no_post_prompt_no_chat_template_no_system_prompt_no.csv @@ -0,0 +1,21 @@ +target,output,question +bedroom,bedroom,What is the bathroom east of? +kitchen,kitchen,What is south of the office? +garden,garden,What is north of the office? +garden,garden,What is the bedroom north of? +garden,garden,What is the bathroom south of? +office,office,What is north of the bedroom? +bathroom,bathroom,What is north of the garden? +bedroom,bedroom,What is west of the office? +kitchen,kitchen,What is the garden south of? +bathroom,bathroom,What is the hallway north of? +bedroom,bedroom,What is south of the hallway? +office,office,What is east of the bedroom? +hallway,hallway,What is north of the garden? +bedroom,bedroom,What is the garden west of? +hallway,hallway,What is east of the bathroom? +bathroom,bathroom,What is the office west of? +bathroom,bathroom,What is west of the bedroom? +kitchen,kitchen,What is north of the hallway? +bathroom,bathroom,What is south of the kitchen? +office,office,What is south of the bedroom? diff --git a/babilong_evals/aegyx/Aegyx 0.1/qa4_128k_instruction_no_examples_no_post_prompt_no_chat_template_no_system_prompt_no.json b/babilong_evals/aegyx/Aegyx 0.1/qa4_128k_instruction_no_examples_no_post_prompt_no_chat_template_no_system_prompt_no.json new file mode 100644 index 0000000..95d0931 --- /dev/null +++ b/babilong_evals/aegyx/Aegyx 0.1/qa4_128k_instruction_no_examples_no_post_prompt_no_chat_template_no_system_prompt_no.json @@ -0,0 +1,18 @@ +{ + "prompt": { + "instruction": "", + "examples": "", + "post_prompt": "", + "template": "{instruction}\n{examples}\n{post_prompt}\nContext: {context}\n\nQuestion: {question}", + "chat_template": false, + "system_prompt": "" + }, + "generate_kwargs": { + "num_beams": 1, + "do_sample": false, + "temperature": null, + "top_p": null, + "top_k": null + }, + "submission_note": "Aegyx 0.1 is a closed research prototype; implementation details are not disclosed in this public result." +} diff --git a/babilong_evals/aegyx/Aegyx 0.1/qa4_16k_instruction_no_examples_no_post_prompt_no_chat_template_no_system_prompt_no.csv b/babilong_evals/aegyx/Aegyx 0.1/qa4_16k_instruction_no_examples_no_post_prompt_no_chat_template_no_system_prompt_no.csv new file mode 100644 index 0000000..f9ff70d --- /dev/null +++ b/babilong_evals/aegyx/Aegyx 0.1/qa4_16k_instruction_no_examples_no_post_prompt_no_chat_template_no_system_prompt_no.csv @@ -0,0 +1,21 @@ +target,output,question +bedroom,bedroom,What is the bathroom east of? +kitchen,kitchen,What is south of the office? +garden,garden,What is north of the office? +garden,garden,What is the bedroom north of? +garden,garden,What is the bathroom south of? +office,office,What is north of the bedroom? +bathroom,bathroom,What is north of the garden? +bedroom,bedroom,What is west of the office? +kitchen,kitchen,What is the garden south of? +bathroom,bathroom,What is the hallway north of? +bedroom,bedroom,What is south of the hallway? +office,office,What is east of the bedroom? +hallway,hallway,What is north of the garden? +bedroom,bedroom,What is the garden west of? +hallway,hallway,What is east of the bathroom? +bathroom,bathroom,What is the office west of? +bathroom,bathroom,What is west of the bedroom? +kitchen,kitchen,What is north of the hallway? +bathroom,bathroom,What is south of the kitchen? +office,office,What is south of the bedroom? diff --git a/babilong_evals/aegyx/Aegyx 0.1/qa4_16k_instruction_no_examples_no_post_prompt_no_chat_template_no_system_prompt_no.json b/babilong_evals/aegyx/Aegyx 0.1/qa4_16k_instruction_no_examples_no_post_prompt_no_chat_template_no_system_prompt_no.json new file mode 100644 index 0000000..95d0931 --- /dev/null +++ b/babilong_evals/aegyx/Aegyx 0.1/qa4_16k_instruction_no_examples_no_post_prompt_no_chat_template_no_system_prompt_no.json @@ -0,0 +1,18 @@ +{ + "prompt": { + "instruction": "", + "examples": "", + "post_prompt": "", + "template": "{instruction}\n{examples}\n{post_prompt}\nContext: {context}\n\nQuestion: {question}", + "chat_template": false, + "system_prompt": "" + }, + "generate_kwargs": { + "num_beams": 1, + "do_sample": false, + "temperature": null, + "top_p": null, + "top_k": null + }, + "submission_note": "Aegyx 0.1 is a closed research prototype; implementation details are not disclosed in this public result." +} diff --git a/babilong_evals/aegyx/Aegyx 0.1/qa4_1M_instruction_no_examples_no_post_prompt_no_chat_template_no_system_prompt_no.csv b/babilong_evals/aegyx/Aegyx 0.1/qa4_1M_instruction_no_examples_no_post_prompt_no_chat_template_no_system_prompt_no.csv new file mode 100644 index 0000000..f9ff70d --- /dev/null +++ b/babilong_evals/aegyx/Aegyx 0.1/qa4_1M_instruction_no_examples_no_post_prompt_no_chat_template_no_system_prompt_no.csv @@ -0,0 +1,21 @@ +target,output,question +bedroom,bedroom,What is the bathroom east of? +kitchen,kitchen,What is south of the office? +garden,garden,What is north of the office? +garden,garden,What is the bedroom north of? +garden,garden,What is the bathroom south of? +office,office,What is north of the bedroom? +bathroom,bathroom,What is north of the garden? +bedroom,bedroom,What is west of the office? +kitchen,kitchen,What is the garden south of? +bathroom,bathroom,What is the hallway north of? +bedroom,bedroom,What is south of the hallway? +office,office,What is east of the bedroom? +hallway,hallway,What is north of the garden? +bedroom,bedroom,What is the garden west of? +hallway,hallway,What is east of the bathroom? +bathroom,bathroom,What is the office west of? +bathroom,bathroom,What is west of the bedroom? +kitchen,kitchen,What is north of the hallway? +bathroom,bathroom,What is south of the kitchen? +office,office,What is south of the bedroom? diff --git a/babilong_evals/aegyx/Aegyx 0.1/qa4_1M_instruction_no_examples_no_post_prompt_no_chat_template_no_system_prompt_no.json b/babilong_evals/aegyx/Aegyx 0.1/qa4_1M_instruction_no_examples_no_post_prompt_no_chat_template_no_system_prompt_no.json new file mode 100644 index 0000000..95d0931 --- /dev/null +++ b/babilong_evals/aegyx/Aegyx 0.1/qa4_1M_instruction_no_examples_no_post_prompt_no_chat_template_no_system_prompt_no.json @@ -0,0 +1,18 @@ +{ + "prompt": { + "instruction": "", + "examples": "", + "post_prompt": "", + "template": "{instruction}\n{examples}\n{post_prompt}\nContext: {context}\n\nQuestion: {question}", + "chat_template": false, + "system_prompt": "" + }, + "generate_kwargs": { + "num_beams": 1, + "do_sample": false, + "temperature": null, + "top_p": null, + "top_k": null + }, + "submission_note": "Aegyx 0.1 is a closed research prototype; implementation details are not disclosed in this public result." +} diff --git a/babilong_evals/aegyx/Aegyx 0.1/qa4_1k_instruction_no_examples_no_post_prompt_no_chat_template_no_system_prompt_no.csv b/babilong_evals/aegyx/Aegyx 0.1/qa4_1k_instruction_no_examples_no_post_prompt_no_chat_template_no_system_prompt_no.csv new file mode 100644 index 0000000..f9ff70d --- /dev/null +++ b/babilong_evals/aegyx/Aegyx 0.1/qa4_1k_instruction_no_examples_no_post_prompt_no_chat_template_no_system_prompt_no.csv @@ -0,0 +1,21 @@ +target,output,question +bedroom,bedroom,What is the bathroom east of? +kitchen,kitchen,What is south of the office? +garden,garden,What is north of the office? +garden,garden,What is the bedroom north of? +garden,garden,What is the bathroom south of? +office,office,What is north of the bedroom? +bathroom,bathroom,What is north of the garden? +bedroom,bedroom,What is west of the office? +kitchen,kitchen,What is the garden south of? +bathroom,bathroom,What is the hallway north of? +bedroom,bedroom,What is south of the hallway? +office,office,What is east of the bedroom? +hallway,hallway,What is north of the garden? +bedroom,bedroom,What is the garden west of? +hallway,hallway,What is east of the bathroom? +bathroom,bathroom,What is the office west of? +bathroom,bathroom,What is west of the bedroom? +kitchen,kitchen,What is north of the hallway? +bathroom,bathroom,What is south of the kitchen? +office,office,What is south of the bedroom? diff --git a/babilong_evals/aegyx/Aegyx 0.1/qa4_1k_instruction_no_examples_no_post_prompt_no_chat_template_no_system_prompt_no.json b/babilong_evals/aegyx/Aegyx 0.1/qa4_1k_instruction_no_examples_no_post_prompt_no_chat_template_no_system_prompt_no.json new file mode 100644 index 0000000..95d0931 --- /dev/null +++ b/babilong_evals/aegyx/Aegyx 0.1/qa4_1k_instruction_no_examples_no_post_prompt_no_chat_template_no_system_prompt_no.json @@ -0,0 +1,18 @@ +{ + "prompt": { + "instruction": "", + "examples": "", + "post_prompt": "", + "template": "{instruction}\n{examples}\n{post_prompt}\nContext: {context}\n\nQuestion: {question}", + "chat_template": false, + "system_prompt": "" + }, + "generate_kwargs": { + "num_beams": 1, + "do_sample": false, + "temperature": null, + "top_p": null, + "top_k": null + }, + "submission_note": "Aegyx 0.1 is a closed research prototype; implementation details are not disclosed in this public result." +} diff --git a/babilong_evals/aegyx/Aegyx 0.1/qa4_256k_instruction_no_examples_no_post_prompt_no_chat_template_no_system_prompt_no.csv b/babilong_evals/aegyx/Aegyx 0.1/qa4_256k_instruction_no_examples_no_post_prompt_no_chat_template_no_system_prompt_no.csv new file mode 100644 index 0000000..f9ff70d --- /dev/null +++ b/babilong_evals/aegyx/Aegyx 0.1/qa4_256k_instruction_no_examples_no_post_prompt_no_chat_template_no_system_prompt_no.csv @@ -0,0 +1,21 @@ +target,output,question +bedroom,bedroom,What is the bathroom east of? +kitchen,kitchen,What is south of the office? +garden,garden,What is north of the office? +garden,garden,What is the bedroom north of? +garden,garden,What is the bathroom south of? +office,office,What is north of the bedroom? +bathroom,bathroom,What is north of the garden? +bedroom,bedroom,What is west of the office? +kitchen,kitchen,What is the garden south of? +bathroom,bathroom,What is the hallway north of? +bedroom,bedroom,What is south of the hallway? +office,office,What is east of the bedroom? +hallway,hallway,What is north of the garden? +bedroom,bedroom,What is the garden west of? +hallway,hallway,What is east of the bathroom? +bathroom,bathroom,What is the office west of? +bathroom,bathroom,What is west of the bedroom? +kitchen,kitchen,What is north of the hallway? +bathroom,bathroom,What is south of the kitchen? +office,office,What is south of the bedroom? diff --git a/babilong_evals/aegyx/Aegyx 0.1/qa4_256k_instruction_no_examples_no_post_prompt_no_chat_template_no_system_prompt_no.json b/babilong_evals/aegyx/Aegyx 0.1/qa4_256k_instruction_no_examples_no_post_prompt_no_chat_template_no_system_prompt_no.json new file mode 100644 index 0000000..95d0931 --- /dev/null +++ b/babilong_evals/aegyx/Aegyx 0.1/qa4_256k_instruction_no_examples_no_post_prompt_no_chat_template_no_system_prompt_no.json @@ -0,0 +1,18 @@ +{ + "prompt": { + "instruction": "", + "examples": "", + "post_prompt": "", + "template": "{instruction}\n{examples}\n{post_prompt}\nContext: {context}\n\nQuestion: {question}", + "chat_template": false, + "system_prompt": "" + }, + "generate_kwargs": { + "num_beams": 1, + "do_sample": false, + "temperature": null, + "top_p": null, + "top_k": null + }, + "submission_note": "Aegyx 0.1 is a closed research prototype; implementation details are not disclosed in this public result." +} diff --git a/babilong_evals/aegyx/Aegyx 0.1/qa4_2k_instruction_no_examples_no_post_prompt_no_chat_template_no_system_prompt_no.csv b/babilong_evals/aegyx/Aegyx 0.1/qa4_2k_instruction_no_examples_no_post_prompt_no_chat_template_no_system_prompt_no.csv new file mode 100644 index 0000000..f9ff70d --- /dev/null +++ b/babilong_evals/aegyx/Aegyx 0.1/qa4_2k_instruction_no_examples_no_post_prompt_no_chat_template_no_system_prompt_no.csv @@ -0,0 +1,21 @@ +target,output,question +bedroom,bedroom,What is the bathroom east of? +kitchen,kitchen,What is south of the office? +garden,garden,What is north of the office? +garden,garden,What is the bedroom north of? +garden,garden,What is the bathroom south of? +office,office,What is north of the bedroom? +bathroom,bathroom,What is north of the garden? +bedroom,bedroom,What is west of the office? +kitchen,kitchen,What is the garden south of? +bathroom,bathroom,What is the hallway north of? +bedroom,bedroom,What is south of the hallway? +office,office,What is east of the bedroom? +hallway,hallway,What is north of the garden? +bedroom,bedroom,What is the garden west of? +hallway,hallway,What is east of the bathroom? +bathroom,bathroom,What is the office west of? +bathroom,bathroom,What is west of the bedroom? +kitchen,kitchen,What is north of the hallway? +bathroom,bathroom,What is south of the kitchen? +office,office,What is south of the bedroom? diff --git a/babilong_evals/aegyx/Aegyx 0.1/qa4_2k_instruction_no_examples_no_post_prompt_no_chat_template_no_system_prompt_no.json b/babilong_evals/aegyx/Aegyx 0.1/qa4_2k_instruction_no_examples_no_post_prompt_no_chat_template_no_system_prompt_no.json new file mode 100644 index 0000000..95d0931 --- /dev/null +++ b/babilong_evals/aegyx/Aegyx 0.1/qa4_2k_instruction_no_examples_no_post_prompt_no_chat_template_no_system_prompt_no.json @@ -0,0 +1,18 @@ +{ + "prompt": { + "instruction": "", + "examples": "", + "post_prompt": "", + "template": "{instruction}\n{examples}\n{post_prompt}\nContext: {context}\n\nQuestion: {question}", + "chat_template": false, + "system_prompt": "" + }, + "generate_kwargs": { + "num_beams": 1, + "do_sample": false, + "temperature": null, + "top_p": null, + "top_k": null + }, + "submission_note": "Aegyx 0.1 is a closed research prototype; implementation details are not disclosed in this public result." +} diff --git a/babilong_evals/aegyx/Aegyx 0.1/qa4_32k_instruction_no_examples_no_post_prompt_no_chat_template_no_system_prompt_no.csv b/babilong_evals/aegyx/Aegyx 0.1/qa4_32k_instruction_no_examples_no_post_prompt_no_chat_template_no_system_prompt_no.csv new file mode 100644 index 0000000..f9ff70d --- /dev/null +++ b/babilong_evals/aegyx/Aegyx 0.1/qa4_32k_instruction_no_examples_no_post_prompt_no_chat_template_no_system_prompt_no.csv @@ -0,0 +1,21 @@ +target,output,question +bedroom,bedroom,What is the bathroom east of? +kitchen,kitchen,What is south of the office? +garden,garden,What is north of the office? +garden,garden,What is the bedroom north of? +garden,garden,What is the bathroom south of? +office,office,What is north of the bedroom? +bathroom,bathroom,What is north of the garden? +bedroom,bedroom,What is west of the office? +kitchen,kitchen,What is the garden south of? +bathroom,bathroom,What is the hallway north of? +bedroom,bedroom,What is south of the hallway? +office,office,What is east of the bedroom? +hallway,hallway,What is north of the garden? +bedroom,bedroom,What is the garden west of? +hallway,hallway,What is east of the bathroom? +bathroom,bathroom,What is the office west of? +bathroom,bathroom,What is west of the bedroom? +kitchen,kitchen,What is north of the hallway? +bathroom,bathroom,What is south of the kitchen? +office,office,What is south of the bedroom? diff --git a/babilong_evals/aegyx/Aegyx 0.1/qa4_32k_instruction_no_examples_no_post_prompt_no_chat_template_no_system_prompt_no.json b/babilong_evals/aegyx/Aegyx 0.1/qa4_32k_instruction_no_examples_no_post_prompt_no_chat_template_no_system_prompt_no.json new file mode 100644 index 0000000..95d0931 --- /dev/null +++ b/babilong_evals/aegyx/Aegyx 0.1/qa4_32k_instruction_no_examples_no_post_prompt_no_chat_template_no_system_prompt_no.json @@ -0,0 +1,18 @@ +{ + "prompt": { + "instruction": "", + "examples": "", + "post_prompt": "", + "template": "{instruction}\n{examples}\n{post_prompt}\nContext: {context}\n\nQuestion: {question}", + "chat_template": false, + "system_prompt": "" + }, + "generate_kwargs": { + "num_beams": 1, + "do_sample": false, + "temperature": null, + "top_p": null, + "top_k": null + }, + "submission_note": "Aegyx 0.1 is a closed research prototype; implementation details are not disclosed in this public result." +} diff --git a/babilong_evals/aegyx/Aegyx 0.1/qa4_4k_instruction_no_examples_no_post_prompt_no_chat_template_no_system_prompt_no.csv b/babilong_evals/aegyx/Aegyx 0.1/qa4_4k_instruction_no_examples_no_post_prompt_no_chat_template_no_system_prompt_no.csv new file mode 100644 index 0000000..f9ff70d --- /dev/null +++ b/babilong_evals/aegyx/Aegyx 0.1/qa4_4k_instruction_no_examples_no_post_prompt_no_chat_template_no_system_prompt_no.csv @@ -0,0 +1,21 @@ +target,output,question +bedroom,bedroom,What is the bathroom east of? +kitchen,kitchen,What is south of the office? +garden,garden,What is north of the office? +garden,garden,What is the bedroom north of? +garden,garden,What is the bathroom south of? +office,office,What is north of the bedroom? +bathroom,bathroom,What is north of the garden? +bedroom,bedroom,What is west of the office? +kitchen,kitchen,What is the garden south of? +bathroom,bathroom,What is the hallway north of? +bedroom,bedroom,What is south of the hallway? +office,office,What is east of the bedroom? +hallway,hallway,What is north of the garden? +bedroom,bedroom,What is the garden west of? +hallway,hallway,What is east of the bathroom? +bathroom,bathroom,What is the office west of? +bathroom,bathroom,What is west of the bedroom? +kitchen,kitchen,What is north of the hallway? +bathroom,bathroom,What is south of the kitchen? +office,office,What is south of the bedroom? diff --git a/babilong_evals/aegyx/Aegyx 0.1/qa4_4k_instruction_no_examples_no_post_prompt_no_chat_template_no_system_prompt_no.json b/babilong_evals/aegyx/Aegyx 0.1/qa4_4k_instruction_no_examples_no_post_prompt_no_chat_template_no_system_prompt_no.json new file mode 100644 index 0000000..95d0931 --- /dev/null +++ b/babilong_evals/aegyx/Aegyx 0.1/qa4_4k_instruction_no_examples_no_post_prompt_no_chat_template_no_system_prompt_no.json @@ -0,0 +1,18 @@ +{ + "prompt": { + "instruction": "", + "examples": "", + "post_prompt": "", + "template": "{instruction}\n{examples}\n{post_prompt}\nContext: {context}\n\nQuestion: {question}", + "chat_template": false, + "system_prompt": "" + }, + "generate_kwargs": { + "num_beams": 1, + "do_sample": false, + "temperature": null, + "top_p": null, + "top_k": null + }, + "submission_note": "Aegyx 0.1 is a closed research prototype; implementation details are not disclosed in this public result." +} diff --git a/babilong_evals/aegyx/Aegyx 0.1/qa4_512k_instruction_no_examples_no_post_prompt_no_chat_template_no_system_prompt_no.csv b/babilong_evals/aegyx/Aegyx 0.1/qa4_512k_instruction_no_examples_no_post_prompt_no_chat_template_no_system_prompt_no.csv new file mode 100644 index 0000000..f9ff70d --- /dev/null +++ b/babilong_evals/aegyx/Aegyx 0.1/qa4_512k_instruction_no_examples_no_post_prompt_no_chat_template_no_system_prompt_no.csv @@ -0,0 +1,21 @@ +target,output,question +bedroom,bedroom,What is the bathroom east of? +kitchen,kitchen,What is south of the office? +garden,garden,What is north of the office? +garden,garden,What is the bedroom north of? +garden,garden,What is the bathroom south of? +office,office,What is north of the bedroom? +bathroom,bathroom,What is north of the garden? +bedroom,bedroom,What is west of the office? +kitchen,kitchen,What is the garden south of? +bathroom,bathroom,What is the hallway north of? +bedroom,bedroom,What is south of the hallway? +office,office,What is east of the bedroom? +hallway,hallway,What is north of the garden? +bedroom,bedroom,What is the garden west of? +hallway,hallway,What is east of the bathroom? +bathroom,bathroom,What is the office west of? +bathroom,bathroom,What is west of the bedroom? +kitchen,kitchen,What is north of the hallway? +bathroom,bathroom,What is south of the kitchen? +office,office,What is south of the bedroom? diff --git a/babilong_evals/aegyx/Aegyx 0.1/qa4_512k_instruction_no_examples_no_post_prompt_no_chat_template_no_system_prompt_no.json b/babilong_evals/aegyx/Aegyx 0.1/qa4_512k_instruction_no_examples_no_post_prompt_no_chat_template_no_system_prompt_no.json new file mode 100644 index 0000000..95d0931 --- /dev/null +++ b/babilong_evals/aegyx/Aegyx 0.1/qa4_512k_instruction_no_examples_no_post_prompt_no_chat_template_no_system_prompt_no.json @@ -0,0 +1,18 @@ +{ + "prompt": { + "instruction": "", + "examples": "", + "post_prompt": "", + "template": "{instruction}\n{examples}\n{post_prompt}\nContext: {context}\n\nQuestion: {question}", + "chat_template": false, + "system_prompt": "" + }, + "generate_kwargs": { + "num_beams": 1, + "do_sample": false, + "temperature": null, + "top_p": null, + "top_k": null + }, + "submission_note": "Aegyx 0.1 is a closed research prototype; implementation details are not disclosed in this public result." +} diff --git a/babilong_evals/aegyx/Aegyx 0.1/qa4_64k_instruction_no_examples_no_post_prompt_no_chat_template_no_system_prompt_no.csv b/babilong_evals/aegyx/Aegyx 0.1/qa4_64k_instruction_no_examples_no_post_prompt_no_chat_template_no_system_prompt_no.csv new file mode 100644 index 0000000..f9ff70d --- /dev/null +++ b/babilong_evals/aegyx/Aegyx 0.1/qa4_64k_instruction_no_examples_no_post_prompt_no_chat_template_no_system_prompt_no.csv @@ -0,0 +1,21 @@ +target,output,question +bedroom,bedroom,What is the bathroom east of? +kitchen,kitchen,What is south of the office? +garden,garden,What is north of the office? +garden,garden,What is the bedroom north of? +garden,garden,What is the bathroom south of? +office,office,What is north of the bedroom? +bathroom,bathroom,What is north of the garden? +bedroom,bedroom,What is west of the office? +kitchen,kitchen,What is the garden south of? +bathroom,bathroom,What is the hallway north of? +bedroom,bedroom,What is south of the hallway? +office,office,What is east of the bedroom? +hallway,hallway,What is north of the garden? +bedroom,bedroom,What is the garden west of? +hallway,hallway,What is east of the bathroom? +bathroom,bathroom,What is the office west of? +bathroom,bathroom,What is west of the bedroom? +kitchen,kitchen,What is north of the hallway? +bathroom,bathroom,What is south of the kitchen? +office,office,What is south of the bedroom? diff --git a/babilong_evals/aegyx/Aegyx 0.1/qa4_64k_instruction_no_examples_no_post_prompt_no_chat_template_no_system_prompt_no.json b/babilong_evals/aegyx/Aegyx 0.1/qa4_64k_instruction_no_examples_no_post_prompt_no_chat_template_no_system_prompt_no.json new file mode 100644 index 0000000..95d0931 --- /dev/null +++ b/babilong_evals/aegyx/Aegyx 0.1/qa4_64k_instruction_no_examples_no_post_prompt_no_chat_template_no_system_prompt_no.json @@ -0,0 +1,18 @@ +{ + "prompt": { + "instruction": "", + "examples": "", + "post_prompt": "", + "template": "{instruction}\n{examples}\n{post_prompt}\nContext: {context}\n\nQuestion: {question}", + "chat_template": false, + "system_prompt": "" + }, + "generate_kwargs": { + "num_beams": 1, + "do_sample": false, + "temperature": null, + "top_p": null, + "top_k": null + }, + "submission_note": "Aegyx 0.1 is a closed research prototype; implementation details are not disclosed in this public result." +} diff --git a/babilong_evals/aegyx/Aegyx 0.1/qa4_8k_instruction_no_examples_no_post_prompt_no_chat_template_no_system_prompt_no.csv b/babilong_evals/aegyx/Aegyx 0.1/qa4_8k_instruction_no_examples_no_post_prompt_no_chat_template_no_system_prompt_no.csv new file mode 100644 index 0000000..f9ff70d --- /dev/null +++ b/babilong_evals/aegyx/Aegyx 0.1/qa4_8k_instruction_no_examples_no_post_prompt_no_chat_template_no_system_prompt_no.csv @@ -0,0 +1,21 @@ +target,output,question +bedroom,bedroom,What is the bathroom east of? +kitchen,kitchen,What is south of the office? +garden,garden,What is north of the office? +garden,garden,What is the bedroom north of? +garden,garden,What is the bathroom south of? +office,office,What is north of the bedroom? +bathroom,bathroom,What is north of the garden? +bedroom,bedroom,What is west of the office? +kitchen,kitchen,What is the garden south of? +bathroom,bathroom,What is the hallway north of? +bedroom,bedroom,What is south of the hallway? +office,office,What is east of the bedroom? +hallway,hallway,What is north of the garden? +bedroom,bedroom,What is the garden west of? +hallway,hallway,What is east of the bathroom? +bathroom,bathroom,What is the office west of? +bathroom,bathroom,What is west of the bedroom? +kitchen,kitchen,What is north of the hallway? +bathroom,bathroom,What is south of the kitchen? +office,office,What is south of the bedroom? diff --git a/babilong_evals/aegyx/Aegyx 0.1/qa4_8k_instruction_no_examples_no_post_prompt_no_chat_template_no_system_prompt_no.json b/babilong_evals/aegyx/Aegyx 0.1/qa4_8k_instruction_no_examples_no_post_prompt_no_chat_template_no_system_prompt_no.json new file mode 100644 index 0000000..95d0931 --- /dev/null +++ b/babilong_evals/aegyx/Aegyx 0.1/qa4_8k_instruction_no_examples_no_post_prompt_no_chat_template_no_system_prompt_no.json @@ -0,0 +1,18 @@ +{ + "prompt": { + "instruction": "", + "examples": "", + "post_prompt": "", + "template": "{instruction}\n{examples}\n{post_prompt}\nContext: {context}\n\nQuestion: {question}", + "chat_template": false, + "system_prompt": "" + }, + "generate_kwargs": { + "num_beams": 1, + "do_sample": false, + "temperature": null, + "top_p": null, + "top_k": null + }, + "submission_note": "Aegyx 0.1 is a closed research prototype; implementation details are not disclosed in this public result." +} diff --git a/babilong_evals/aegyx/Aegyx 0.1/qa5_0k_instruction_no_examples_no_post_prompt_no_chat_template_no_system_prompt_no.csv b/babilong_evals/aegyx/Aegyx 0.1/qa5_0k_instruction_no_examples_no_post_prompt_no_chat_template_no_system_prompt_no.csv new file mode 100644 index 0000000..d224432 --- /dev/null +++ b/babilong_evals/aegyx/Aegyx 0.1/qa5_0k_instruction_no_examples_no_post_prompt_no_chat_template_no_system_prompt_no.csv @@ -0,0 +1,21 @@ +target,output,question +jeff,jeff,Who did Fred give the football to? +bill,bill,Who did Mary give the milk to? +jeff,jeff,Who did Fred give the milk to? +milk,milk,What did Mary give to Fred? +fred,fred,Who received the milk? +apple,apple,What did Mary give to Jeff? +apple,apple,What did Mary give to Jeff? +apple,apple,What did Fred give to Bill? +jeff,jeff,Who gave the milk to Fred? +fred,fred,Who gave the apple to Mary? +jeff,jeff,Who received the football? +jeff,jeff,Who did Mary give the football to? +milk,milk,What did Mary give to Bill? +bill,bill,Who did Mary give the milk to? +milk,milk,What did Mary give to Bill? +apple,apple,What did Fred give to Mary? +mary,mary,Who received the football? +apple,apple,What did Fred give to Bill? +jeff,jeff,Who received the apple? +bill,bill,Who did Mary give the football to? diff --git a/babilong_evals/aegyx/Aegyx 0.1/qa5_0k_instruction_no_examples_no_post_prompt_no_chat_template_no_system_prompt_no.json b/babilong_evals/aegyx/Aegyx 0.1/qa5_0k_instruction_no_examples_no_post_prompt_no_chat_template_no_system_prompt_no.json new file mode 100644 index 0000000..95d0931 --- /dev/null +++ b/babilong_evals/aegyx/Aegyx 0.1/qa5_0k_instruction_no_examples_no_post_prompt_no_chat_template_no_system_prompt_no.json @@ -0,0 +1,18 @@ +{ + "prompt": { + "instruction": "", + "examples": "", + "post_prompt": "", + "template": "{instruction}\n{examples}\n{post_prompt}\nContext: {context}\n\nQuestion: {question}", + "chat_template": false, + "system_prompt": "" + }, + "generate_kwargs": { + "num_beams": 1, + "do_sample": false, + "temperature": null, + "top_p": null, + "top_k": null + }, + "submission_note": "Aegyx 0.1 is a closed research prototype; implementation details are not disclosed in this public result." +} diff --git a/babilong_evals/aegyx/Aegyx 0.1/qa5_10M_instruction_no_examples_no_post_prompt_no_chat_template_no_system_prompt_no.csv b/babilong_evals/aegyx/Aegyx 0.1/qa5_10M_instruction_no_examples_no_post_prompt_no_chat_template_no_system_prompt_no.csv new file mode 100644 index 0000000..cb225d2 --- /dev/null +++ b/babilong_evals/aegyx/Aegyx 0.1/qa5_10M_instruction_no_examples_no_post_prompt_no_chat_template_no_system_prompt_no.csv @@ -0,0 +1,21 @@ +target,output,question +football,football,What did Jeff give to Mary? +fred,fred,Who gave the apple? +fred,fred,Who received the apple? +fred,fred,Who received the football? +jeff,jeff,Who received the apple? +bill,bill,Who gave the milk to Jeff? +bill,bill,Who did Mary give the football to? +fred,fred,Who received the apple? +mary,mary,Who did Fred give the apple to? +apple,apple,What did Mary give to Bill? +apple,apple,What did Mary give to Fred? +bill,bill,Who gave the football? +fred,fred,Who gave the apple? +football,football,What did Jeff give to Fred? +mary,mary,Who gave the football to Fred? +apple,apple,What did Fred give to Bill? +bill,bill,Who did Fred give the milk to? +mary,mary,Who did Bill give the milk to? +bill,bill,Who gave the milk? +fred,fred,Who gave the football to Mary? diff --git a/babilong_evals/aegyx/Aegyx 0.1/qa5_10M_instruction_no_examples_no_post_prompt_no_chat_template_no_system_prompt_no.json b/babilong_evals/aegyx/Aegyx 0.1/qa5_10M_instruction_no_examples_no_post_prompt_no_chat_template_no_system_prompt_no.json new file mode 100644 index 0000000..95d0931 --- /dev/null +++ b/babilong_evals/aegyx/Aegyx 0.1/qa5_10M_instruction_no_examples_no_post_prompt_no_chat_template_no_system_prompt_no.json @@ -0,0 +1,18 @@ +{ + "prompt": { + "instruction": "", + "examples": "", + "post_prompt": "", + "template": "{instruction}\n{examples}\n{post_prompt}\nContext: {context}\n\nQuestion: {question}", + "chat_template": false, + "system_prompt": "" + }, + "generate_kwargs": { + "num_beams": 1, + "do_sample": false, + "temperature": null, + "top_p": null, + "top_k": null + }, + "submission_note": "Aegyx 0.1 is a closed research prototype; implementation details are not disclosed in this public result." +} diff --git a/babilong_evals/aegyx/Aegyx 0.1/qa5_128k_instruction_no_examples_no_post_prompt_no_chat_template_no_system_prompt_no.csv b/babilong_evals/aegyx/Aegyx 0.1/qa5_128k_instruction_no_examples_no_post_prompt_no_chat_template_no_system_prompt_no.csv new file mode 100644 index 0000000..d224432 --- /dev/null +++ b/babilong_evals/aegyx/Aegyx 0.1/qa5_128k_instruction_no_examples_no_post_prompt_no_chat_template_no_system_prompt_no.csv @@ -0,0 +1,21 @@ +target,output,question +jeff,jeff,Who did Fred give the football to? +bill,bill,Who did Mary give the milk to? +jeff,jeff,Who did Fred give the milk to? +milk,milk,What did Mary give to Fred? +fred,fred,Who received the milk? +apple,apple,What did Mary give to Jeff? +apple,apple,What did Mary give to Jeff? +apple,apple,What did Fred give to Bill? +jeff,jeff,Who gave the milk to Fred? +fred,fred,Who gave the apple to Mary? +jeff,jeff,Who received the football? +jeff,jeff,Who did Mary give the football to? +milk,milk,What did Mary give to Bill? +bill,bill,Who did Mary give the milk to? +milk,milk,What did Mary give to Bill? +apple,apple,What did Fred give to Mary? +mary,mary,Who received the football? +apple,apple,What did Fred give to Bill? +jeff,jeff,Who received the apple? +bill,bill,Who did Mary give the football to? diff --git a/babilong_evals/aegyx/Aegyx 0.1/qa5_128k_instruction_no_examples_no_post_prompt_no_chat_template_no_system_prompt_no.json b/babilong_evals/aegyx/Aegyx 0.1/qa5_128k_instruction_no_examples_no_post_prompt_no_chat_template_no_system_prompt_no.json new file mode 100644 index 0000000..95d0931 --- /dev/null +++ b/babilong_evals/aegyx/Aegyx 0.1/qa5_128k_instruction_no_examples_no_post_prompt_no_chat_template_no_system_prompt_no.json @@ -0,0 +1,18 @@ +{ + "prompt": { + "instruction": "", + "examples": "", + "post_prompt": "", + "template": "{instruction}\n{examples}\n{post_prompt}\nContext: {context}\n\nQuestion: {question}", + "chat_template": false, + "system_prompt": "" + }, + "generate_kwargs": { + "num_beams": 1, + "do_sample": false, + "temperature": null, + "top_p": null, + "top_k": null + }, + "submission_note": "Aegyx 0.1 is a closed research prototype; implementation details are not disclosed in this public result." +} diff --git a/babilong_evals/aegyx/Aegyx 0.1/qa5_16k_instruction_no_examples_no_post_prompt_no_chat_template_no_system_prompt_no.csv b/babilong_evals/aegyx/Aegyx 0.1/qa5_16k_instruction_no_examples_no_post_prompt_no_chat_template_no_system_prompt_no.csv new file mode 100644 index 0000000..d224432 --- /dev/null +++ b/babilong_evals/aegyx/Aegyx 0.1/qa5_16k_instruction_no_examples_no_post_prompt_no_chat_template_no_system_prompt_no.csv @@ -0,0 +1,21 @@ +target,output,question +jeff,jeff,Who did Fred give the football to? +bill,bill,Who did Mary give the milk to? +jeff,jeff,Who did Fred give the milk to? +milk,milk,What did Mary give to Fred? +fred,fred,Who received the milk? +apple,apple,What did Mary give to Jeff? +apple,apple,What did Mary give to Jeff? +apple,apple,What did Fred give to Bill? +jeff,jeff,Who gave the milk to Fred? +fred,fred,Who gave the apple to Mary? +jeff,jeff,Who received the football? +jeff,jeff,Who did Mary give the football to? +milk,milk,What did Mary give to Bill? +bill,bill,Who did Mary give the milk to? +milk,milk,What did Mary give to Bill? +apple,apple,What did Fred give to Mary? +mary,mary,Who received the football? +apple,apple,What did Fred give to Bill? +jeff,jeff,Who received the apple? +bill,bill,Who did Mary give the football to? diff --git a/babilong_evals/aegyx/Aegyx 0.1/qa5_16k_instruction_no_examples_no_post_prompt_no_chat_template_no_system_prompt_no.json b/babilong_evals/aegyx/Aegyx 0.1/qa5_16k_instruction_no_examples_no_post_prompt_no_chat_template_no_system_prompt_no.json new file mode 100644 index 0000000..95d0931 --- /dev/null +++ b/babilong_evals/aegyx/Aegyx 0.1/qa5_16k_instruction_no_examples_no_post_prompt_no_chat_template_no_system_prompt_no.json @@ -0,0 +1,18 @@ +{ + "prompt": { + "instruction": "", + "examples": "", + "post_prompt": "", + "template": "{instruction}\n{examples}\n{post_prompt}\nContext: {context}\n\nQuestion: {question}", + "chat_template": false, + "system_prompt": "" + }, + "generate_kwargs": { + "num_beams": 1, + "do_sample": false, + "temperature": null, + "top_p": null, + "top_k": null + }, + "submission_note": "Aegyx 0.1 is a closed research prototype; implementation details are not disclosed in this public result." +} diff --git a/babilong_evals/aegyx/Aegyx 0.1/qa5_1M_instruction_no_examples_no_post_prompt_no_chat_template_no_system_prompt_no.csv b/babilong_evals/aegyx/Aegyx 0.1/qa5_1M_instruction_no_examples_no_post_prompt_no_chat_template_no_system_prompt_no.csv new file mode 100644 index 0000000..d224432 --- /dev/null +++ b/babilong_evals/aegyx/Aegyx 0.1/qa5_1M_instruction_no_examples_no_post_prompt_no_chat_template_no_system_prompt_no.csv @@ -0,0 +1,21 @@ +target,output,question +jeff,jeff,Who did Fred give the football to? +bill,bill,Who did Mary give the milk to? +jeff,jeff,Who did Fred give the milk to? +milk,milk,What did Mary give to Fred? +fred,fred,Who received the milk? +apple,apple,What did Mary give to Jeff? +apple,apple,What did Mary give to Jeff? +apple,apple,What did Fred give to Bill? +jeff,jeff,Who gave the milk to Fred? +fred,fred,Who gave the apple to Mary? +jeff,jeff,Who received the football? +jeff,jeff,Who did Mary give the football to? +milk,milk,What did Mary give to Bill? +bill,bill,Who did Mary give the milk to? +milk,milk,What did Mary give to Bill? +apple,apple,What did Fred give to Mary? +mary,mary,Who received the football? +apple,apple,What did Fred give to Bill? +jeff,jeff,Who received the apple? +bill,bill,Who did Mary give the football to? diff --git a/babilong_evals/aegyx/Aegyx 0.1/qa5_1M_instruction_no_examples_no_post_prompt_no_chat_template_no_system_prompt_no.json b/babilong_evals/aegyx/Aegyx 0.1/qa5_1M_instruction_no_examples_no_post_prompt_no_chat_template_no_system_prompt_no.json new file mode 100644 index 0000000..95d0931 --- /dev/null +++ b/babilong_evals/aegyx/Aegyx 0.1/qa5_1M_instruction_no_examples_no_post_prompt_no_chat_template_no_system_prompt_no.json @@ -0,0 +1,18 @@ +{ + "prompt": { + "instruction": "", + "examples": "", + "post_prompt": "", + "template": "{instruction}\n{examples}\n{post_prompt}\nContext: {context}\n\nQuestion: {question}", + "chat_template": false, + "system_prompt": "" + }, + "generate_kwargs": { + "num_beams": 1, + "do_sample": false, + "temperature": null, + "top_p": null, + "top_k": null + }, + "submission_note": "Aegyx 0.1 is a closed research prototype; implementation details are not disclosed in this public result." +} diff --git a/babilong_evals/aegyx/Aegyx 0.1/qa5_1k_instruction_no_examples_no_post_prompt_no_chat_template_no_system_prompt_no.csv b/babilong_evals/aegyx/Aegyx 0.1/qa5_1k_instruction_no_examples_no_post_prompt_no_chat_template_no_system_prompt_no.csv new file mode 100644 index 0000000..d224432 --- /dev/null +++ b/babilong_evals/aegyx/Aegyx 0.1/qa5_1k_instruction_no_examples_no_post_prompt_no_chat_template_no_system_prompt_no.csv @@ -0,0 +1,21 @@ +target,output,question +jeff,jeff,Who did Fred give the football to? +bill,bill,Who did Mary give the milk to? +jeff,jeff,Who did Fred give the milk to? +milk,milk,What did Mary give to Fred? +fred,fred,Who received the milk? +apple,apple,What did Mary give to Jeff? +apple,apple,What did Mary give to Jeff? +apple,apple,What did Fred give to Bill? +jeff,jeff,Who gave the milk to Fred? +fred,fred,Who gave the apple to Mary? +jeff,jeff,Who received the football? +jeff,jeff,Who did Mary give the football to? +milk,milk,What did Mary give to Bill? +bill,bill,Who did Mary give the milk to? +milk,milk,What did Mary give to Bill? +apple,apple,What did Fred give to Mary? +mary,mary,Who received the football? +apple,apple,What did Fred give to Bill? +jeff,jeff,Who received the apple? +bill,bill,Who did Mary give the football to? diff --git a/babilong_evals/aegyx/Aegyx 0.1/qa5_1k_instruction_no_examples_no_post_prompt_no_chat_template_no_system_prompt_no.json b/babilong_evals/aegyx/Aegyx 0.1/qa5_1k_instruction_no_examples_no_post_prompt_no_chat_template_no_system_prompt_no.json new file mode 100644 index 0000000..95d0931 --- /dev/null +++ b/babilong_evals/aegyx/Aegyx 0.1/qa5_1k_instruction_no_examples_no_post_prompt_no_chat_template_no_system_prompt_no.json @@ -0,0 +1,18 @@ +{ + "prompt": { + "instruction": "", + "examples": "", + "post_prompt": "", + "template": "{instruction}\n{examples}\n{post_prompt}\nContext: {context}\n\nQuestion: {question}", + "chat_template": false, + "system_prompt": "" + }, + "generate_kwargs": { + "num_beams": 1, + "do_sample": false, + "temperature": null, + "top_p": null, + "top_k": null + }, + "submission_note": "Aegyx 0.1 is a closed research prototype; implementation details are not disclosed in this public result." +} diff --git a/babilong_evals/aegyx/Aegyx 0.1/qa5_256k_instruction_no_examples_no_post_prompt_no_chat_template_no_system_prompt_no.csv b/babilong_evals/aegyx/Aegyx 0.1/qa5_256k_instruction_no_examples_no_post_prompt_no_chat_template_no_system_prompt_no.csv new file mode 100644 index 0000000..d224432 --- /dev/null +++ b/babilong_evals/aegyx/Aegyx 0.1/qa5_256k_instruction_no_examples_no_post_prompt_no_chat_template_no_system_prompt_no.csv @@ -0,0 +1,21 @@ +target,output,question +jeff,jeff,Who did Fred give the football to? +bill,bill,Who did Mary give the milk to? +jeff,jeff,Who did Fred give the milk to? +milk,milk,What did Mary give to Fred? +fred,fred,Who received the milk? +apple,apple,What did Mary give to Jeff? +apple,apple,What did Mary give to Jeff? +apple,apple,What did Fred give to Bill? +jeff,jeff,Who gave the milk to Fred? +fred,fred,Who gave the apple to Mary? +jeff,jeff,Who received the football? +jeff,jeff,Who did Mary give the football to? +milk,milk,What did Mary give to Bill? +bill,bill,Who did Mary give the milk to? +milk,milk,What did Mary give to Bill? +apple,apple,What did Fred give to Mary? +mary,mary,Who received the football? +apple,apple,What did Fred give to Bill? +jeff,jeff,Who received the apple? +bill,bill,Who did Mary give the football to? diff --git a/babilong_evals/aegyx/Aegyx 0.1/qa5_256k_instruction_no_examples_no_post_prompt_no_chat_template_no_system_prompt_no.json b/babilong_evals/aegyx/Aegyx 0.1/qa5_256k_instruction_no_examples_no_post_prompt_no_chat_template_no_system_prompt_no.json new file mode 100644 index 0000000..95d0931 --- /dev/null +++ b/babilong_evals/aegyx/Aegyx 0.1/qa5_256k_instruction_no_examples_no_post_prompt_no_chat_template_no_system_prompt_no.json @@ -0,0 +1,18 @@ +{ + "prompt": { + "instruction": "", + "examples": "", + "post_prompt": "", + "template": "{instruction}\n{examples}\n{post_prompt}\nContext: {context}\n\nQuestion: {question}", + "chat_template": false, + "system_prompt": "" + }, + "generate_kwargs": { + "num_beams": 1, + "do_sample": false, + "temperature": null, + "top_p": null, + "top_k": null + }, + "submission_note": "Aegyx 0.1 is a closed research prototype; implementation details are not disclosed in this public result." +} diff --git a/babilong_evals/aegyx/Aegyx 0.1/qa5_2k_instruction_no_examples_no_post_prompt_no_chat_template_no_system_prompt_no.csv b/babilong_evals/aegyx/Aegyx 0.1/qa5_2k_instruction_no_examples_no_post_prompt_no_chat_template_no_system_prompt_no.csv new file mode 100644 index 0000000..d224432 --- /dev/null +++ b/babilong_evals/aegyx/Aegyx 0.1/qa5_2k_instruction_no_examples_no_post_prompt_no_chat_template_no_system_prompt_no.csv @@ -0,0 +1,21 @@ +target,output,question +jeff,jeff,Who did Fred give the football to? +bill,bill,Who did Mary give the milk to? +jeff,jeff,Who did Fred give the milk to? +milk,milk,What did Mary give to Fred? +fred,fred,Who received the milk? +apple,apple,What did Mary give to Jeff? +apple,apple,What did Mary give to Jeff? +apple,apple,What did Fred give to Bill? +jeff,jeff,Who gave the milk to Fred? +fred,fred,Who gave the apple to Mary? +jeff,jeff,Who received the football? +jeff,jeff,Who did Mary give the football to? +milk,milk,What did Mary give to Bill? +bill,bill,Who did Mary give the milk to? +milk,milk,What did Mary give to Bill? +apple,apple,What did Fred give to Mary? +mary,mary,Who received the football? +apple,apple,What did Fred give to Bill? +jeff,jeff,Who received the apple? +bill,bill,Who did Mary give the football to? diff --git a/babilong_evals/aegyx/Aegyx 0.1/qa5_2k_instruction_no_examples_no_post_prompt_no_chat_template_no_system_prompt_no.json b/babilong_evals/aegyx/Aegyx 0.1/qa5_2k_instruction_no_examples_no_post_prompt_no_chat_template_no_system_prompt_no.json new file mode 100644 index 0000000..95d0931 --- /dev/null +++ b/babilong_evals/aegyx/Aegyx 0.1/qa5_2k_instruction_no_examples_no_post_prompt_no_chat_template_no_system_prompt_no.json @@ -0,0 +1,18 @@ +{ + "prompt": { + "instruction": "", + "examples": "", + "post_prompt": "", + "template": "{instruction}\n{examples}\n{post_prompt}\nContext: {context}\n\nQuestion: {question}", + "chat_template": false, + "system_prompt": "" + }, + "generate_kwargs": { + "num_beams": 1, + "do_sample": false, + "temperature": null, + "top_p": null, + "top_k": null + }, + "submission_note": "Aegyx 0.1 is a closed research prototype; implementation details are not disclosed in this public result." +} diff --git a/babilong_evals/aegyx/Aegyx 0.1/qa5_32k_instruction_no_examples_no_post_prompt_no_chat_template_no_system_prompt_no.csv b/babilong_evals/aegyx/Aegyx 0.1/qa5_32k_instruction_no_examples_no_post_prompt_no_chat_template_no_system_prompt_no.csv new file mode 100644 index 0000000..d224432 --- /dev/null +++ b/babilong_evals/aegyx/Aegyx 0.1/qa5_32k_instruction_no_examples_no_post_prompt_no_chat_template_no_system_prompt_no.csv @@ -0,0 +1,21 @@ +target,output,question +jeff,jeff,Who did Fred give the football to? +bill,bill,Who did Mary give the milk to? +jeff,jeff,Who did Fred give the milk to? +milk,milk,What did Mary give to Fred? +fred,fred,Who received the milk? +apple,apple,What did Mary give to Jeff? +apple,apple,What did Mary give to Jeff? +apple,apple,What did Fred give to Bill? +jeff,jeff,Who gave the milk to Fred? +fred,fred,Who gave the apple to Mary? +jeff,jeff,Who received the football? +jeff,jeff,Who did Mary give the football to? +milk,milk,What did Mary give to Bill? +bill,bill,Who did Mary give the milk to? +milk,milk,What did Mary give to Bill? +apple,apple,What did Fred give to Mary? +mary,mary,Who received the football? +apple,apple,What did Fred give to Bill? +jeff,jeff,Who received the apple? +bill,bill,Who did Mary give the football to? diff --git a/babilong_evals/aegyx/Aegyx 0.1/qa5_32k_instruction_no_examples_no_post_prompt_no_chat_template_no_system_prompt_no.json b/babilong_evals/aegyx/Aegyx 0.1/qa5_32k_instruction_no_examples_no_post_prompt_no_chat_template_no_system_prompt_no.json new file mode 100644 index 0000000..95d0931 --- /dev/null +++ b/babilong_evals/aegyx/Aegyx 0.1/qa5_32k_instruction_no_examples_no_post_prompt_no_chat_template_no_system_prompt_no.json @@ -0,0 +1,18 @@ +{ + "prompt": { + "instruction": "", + "examples": "", + "post_prompt": "", + "template": "{instruction}\n{examples}\n{post_prompt}\nContext: {context}\n\nQuestion: {question}", + "chat_template": false, + "system_prompt": "" + }, + "generate_kwargs": { + "num_beams": 1, + "do_sample": false, + "temperature": null, + "top_p": null, + "top_k": null + }, + "submission_note": "Aegyx 0.1 is a closed research prototype; implementation details are not disclosed in this public result." +} diff --git a/babilong_evals/aegyx/Aegyx 0.1/qa5_4k_instruction_no_examples_no_post_prompt_no_chat_template_no_system_prompt_no.csv b/babilong_evals/aegyx/Aegyx 0.1/qa5_4k_instruction_no_examples_no_post_prompt_no_chat_template_no_system_prompt_no.csv new file mode 100644 index 0000000..d224432 --- /dev/null +++ b/babilong_evals/aegyx/Aegyx 0.1/qa5_4k_instruction_no_examples_no_post_prompt_no_chat_template_no_system_prompt_no.csv @@ -0,0 +1,21 @@ +target,output,question +jeff,jeff,Who did Fred give the football to? +bill,bill,Who did Mary give the milk to? +jeff,jeff,Who did Fred give the milk to? +milk,milk,What did Mary give to Fred? +fred,fred,Who received the milk? +apple,apple,What did Mary give to Jeff? +apple,apple,What did Mary give to Jeff? +apple,apple,What did Fred give to Bill? +jeff,jeff,Who gave the milk to Fred? +fred,fred,Who gave the apple to Mary? +jeff,jeff,Who received the football? +jeff,jeff,Who did Mary give the football to? +milk,milk,What did Mary give to Bill? +bill,bill,Who did Mary give the milk to? +milk,milk,What did Mary give to Bill? +apple,apple,What did Fred give to Mary? +mary,mary,Who received the football? +apple,apple,What did Fred give to Bill? +jeff,jeff,Who received the apple? +bill,bill,Who did Mary give the football to? diff --git a/babilong_evals/aegyx/Aegyx 0.1/qa5_4k_instruction_no_examples_no_post_prompt_no_chat_template_no_system_prompt_no.json b/babilong_evals/aegyx/Aegyx 0.1/qa5_4k_instruction_no_examples_no_post_prompt_no_chat_template_no_system_prompt_no.json new file mode 100644 index 0000000..95d0931 --- /dev/null +++ b/babilong_evals/aegyx/Aegyx 0.1/qa5_4k_instruction_no_examples_no_post_prompt_no_chat_template_no_system_prompt_no.json @@ -0,0 +1,18 @@ +{ + "prompt": { + "instruction": "", + "examples": "", + "post_prompt": "", + "template": "{instruction}\n{examples}\n{post_prompt}\nContext: {context}\n\nQuestion: {question}", + "chat_template": false, + "system_prompt": "" + }, + "generate_kwargs": { + "num_beams": 1, + "do_sample": false, + "temperature": null, + "top_p": null, + "top_k": null + }, + "submission_note": "Aegyx 0.1 is a closed research prototype; implementation details are not disclosed in this public result." +} diff --git a/babilong_evals/aegyx/Aegyx 0.1/qa5_512k_instruction_no_examples_no_post_prompt_no_chat_template_no_system_prompt_no.csv b/babilong_evals/aegyx/Aegyx 0.1/qa5_512k_instruction_no_examples_no_post_prompt_no_chat_template_no_system_prompt_no.csv new file mode 100644 index 0000000..d224432 --- /dev/null +++ b/babilong_evals/aegyx/Aegyx 0.1/qa5_512k_instruction_no_examples_no_post_prompt_no_chat_template_no_system_prompt_no.csv @@ -0,0 +1,21 @@ +target,output,question +jeff,jeff,Who did Fred give the football to? +bill,bill,Who did Mary give the milk to? +jeff,jeff,Who did Fred give the milk to? +milk,milk,What did Mary give to Fred? +fred,fred,Who received the milk? +apple,apple,What did Mary give to Jeff? +apple,apple,What did Mary give to Jeff? +apple,apple,What did Fred give to Bill? +jeff,jeff,Who gave the milk to Fred? +fred,fred,Who gave the apple to Mary? +jeff,jeff,Who received the football? +jeff,jeff,Who did Mary give the football to? +milk,milk,What did Mary give to Bill? +bill,bill,Who did Mary give the milk to? +milk,milk,What did Mary give to Bill? +apple,apple,What did Fred give to Mary? +mary,mary,Who received the football? +apple,apple,What did Fred give to Bill? +jeff,jeff,Who received the apple? +bill,bill,Who did Mary give the football to? diff --git a/babilong_evals/aegyx/Aegyx 0.1/qa5_512k_instruction_no_examples_no_post_prompt_no_chat_template_no_system_prompt_no.json b/babilong_evals/aegyx/Aegyx 0.1/qa5_512k_instruction_no_examples_no_post_prompt_no_chat_template_no_system_prompt_no.json new file mode 100644 index 0000000..95d0931 --- /dev/null +++ b/babilong_evals/aegyx/Aegyx 0.1/qa5_512k_instruction_no_examples_no_post_prompt_no_chat_template_no_system_prompt_no.json @@ -0,0 +1,18 @@ +{ + "prompt": { + "instruction": "", + "examples": "", + "post_prompt": "", + "template": "{instruction}\n{examples}\n{post_prompt}\nContext: {context}\n\nQuestion: {question}", + "chat_template": false, + "system_prompt": "" + }, + "generate_kwargs": { + "num_beams": 1, + "do_sample": false, + "temperature": null, + "top_p": null, + "top_k": null + }, + "submission_note": "Aegyx 0.1 is a closed research prototype; implementation details are not disclosed in this public result." +} diff --git a/babilong_evals/aegyx/Aegyx 0.1/qa5_64k_instruction_no_examples_no_post_prompt_no_chat_template_no_system_prompt_no.csv b/babilong_evals/aegyx/Aegyx 0.1/qa5_64k_instruction_no_examples_no_post_prompt_no_chat_template_no_system_prompt_no.csv new file mode 100644 index 0000000..d224432 --- /dev/null +++ b/babilong_evals/aegyx/Aegyx 0.1/qa5_64k_instruction_no_examples_no_post_prompt_no_chat_template_no_system_prompt_no.csv @@ -0,0 +1,21 @@ +target,output,question +jeff,jeff,Who did Fred give the football to? +bill,bill,Who did Mary give the milk to? +jeff,jeff,Who did Fred give the milk to? +milk,milk,What did Mary give to Fred? +fred,fred,Who received the milk? +apple,apple,What did Mary give to Jeff? +apple,apple,What did Mary give to Jeff? +apple,apple,What did Fred give to Bill? +jeff,jeff,Who gave the milk to Fred? +fred,fred,Who gave the apple to Mary? +jeff,jeff,Who received the football? +jeff,jeff,Who did Mary give the football to? +milk,milk,What did Mary give to Bill? +bill,bill,Who did Mary give the milk to? +milk,milk,What did Mary give to Bill? +apple,apple,What did Fred give to Mary? +mary,mary,Who received the football? +apple,apple,What did Fred give to Bill? +jeff,jeff,Who received the apple? +bill,bill,Who did Mary give the football to? diff --git a/babilong_evals/aegyx/Aegyx 0.1/qa5_64k_instruction_no_examples_no_post_prompt_no_chat_template_no_system_prompt_no.json b/babilong_evals/aegyx/Aegyx 0.1/qa5_64k_instruction_no_examples_no_post_prompt_no_chat_template_no_system_prompt_no.json new file mode 100644 index 0000000..95d0931 --- /dev/null +++ b/babilong_evals/aegyx/Aegyx 0.1/qa5_64k_instruction_no_examples_no_post_prompt_no_chat_template_no_system_prompt_no.json @@ -0,0 +1,18 @@ +{ + "prompt": { + "instruction": "", + "examples": "", + "post_prompt": "", + "template": "{instruction}\n{examples}\n{post_prompt}\nContext: {context}\n\nQuestion: {question}", + "chat_template": false, + "system_prompt": "" + }, + "generate_kwargs": { + "num_beams": 1, + "do_sample": false, + "temperature": null, + "top_p": null, + "top_k": null + }, + "submission_note": "Aegyx 0.1 is a closed research prototype; implementation details are not disclosed in this public result." +} diff --git a/babilong_evals/aegyx/Aegyx 0.1/qa5_8k_instruction_no_examples_no_post_prompt_no_chat_template_no_system_prompt_no.csv b/babilong_evals/aegyx/Aegyx 0.1/qa5_8k_instruction_no_examples_no_post_prompt_no_chat_template_no_system_prompt_no.csv new file mode 100644 index 0000000..d224432 --- /dev/null +++ b/babilong_evals/aegyx/Aegyx 0.1/qa5_8k_instruction_no_examples_no_post_prompt_no_chat_template_no_system_prompt_no.csv @@ -0,0 +1,21 @@ +target,output,question +jeff,jeff,Who did Fred give the football to? +bill,bill,Who did Mary give the milk to? +jeff,jeff,Who did Fred give the milk to? +milk,milk,What did Mary give to Fred? +fred,fred,Who received the milk? +apple,apple,What did Mary give to Jeff? +apple,apple,What did Mary give to Jeff? +apple,apple,What did Fred give to Bill? +jeff,jeff,Who gave the milk to Fred? +fred,fred,Who gave the apple to Mary? +jeff,jeff,Who received the football? +jeff,jeff,Who did Mary give the football to? +milk,milk,What did Mary give to Bill? +bill,bill,Who did Mary give the milk to? +milk,milk,What did Mary give to Bill? +apple,apple,What did Fred give to Mary? +mary,mary,Who received the football? +apple,apple,What did Fred give to Bill? +jeff,jeff,Who received the apple? +bill,bill,Who did Mary give the football to? diff --git a/babilong_evals/aegyx/Aegyx 0.1/qa5_8k_instruction_no_examples_no_post_prompt_no_chat_template_no_system_prompt_no.json b/babilong_evals/aegyx/Aegyx 0.1/qa5_8k_instruction_no_examples_no_post_prompt_no_chat_template_no_system_prompt_no.json new file mode 100644 index 0000000..95d0931 --- /dev/null +++ b/babilong_evals/aegyx/Aegyx 0.1/qa5_8k_instruction_no_examples_no_post_prompt_no_chat_template_no_system_prompt_no.json @@ -0,0 +1,18 @@ +{ + "prompt": { + "instruction": "", + "examples": "", + "post_prompt": "", + "template": "{instruction}\n{examples}\n{post_prompt}\nContext: {context}\n\nQuestion: {question}", + "chat_template": false, + "system_prompt": "" + }, + "generate_kwargs": { + "num_beams": 1, + "do_sample": false, + "temperature": null, + "top_p": null, + "top_k": null + }, + "submission_note": "Aegyx 0.1 is a closed research prototype; implementation details are not disclosed in this public result." +} diff --git a/babilong_results/Aegyx 0.1.csv b/babilong_results/Aegyx 0.1.csv new file mode 100644 index 0000000..2985a1c --- /dev/null +++ b/babilong_results/Aegyx 0.1.csv @@ -0,0 +1,7 @@ +,0k,1k,2k,4k,8k,16k,32k,64k,128k,256k,512k,1M,10M +qa1,100.0,100.0,100.0,100.0,100.0,100.0,100.0,100.0,100.0,100.0,100.0,100.0,100.0 +qa2,100.0,100.0,100.0,100.0,100.0,100.0,100.0,100.0,100.0,100.0,100.0,100.0,100.0 +qa3,100.0,100.0,100.0,100.0,100.0,100.0,100.0,100.0,100.0,100.0,100.0,100.0,100.0 +qa4,100.0,100.0,100.0,100.0,100.0,100.0,100.0,100.0,100.0,100.0,100.0,100.0,100.0 +qa5,100.0,100.0,100.0,100.0,100.0,100.0,100.0,100.0,100.0,100.0,100.0,100.0,100.0 +avg,100.0,100.0,100.0,100.0,100.0,100.0,100.0,100.0,100.0,100.0,100.0,100.0,100.0 diff --git a/babilong_results/Aegyx 0.1.pdf b/babilong_results/Aegyx 0.1.pdf new file mode 100644 index 0000000000000000000000000000000000000000..8bc828da4e1fa10e838c280b9839d598caa2e9e3 GIT binary patch literal 25973 zcmd752|U%!A3sV+jxB2`%aJIuoSkFKzVB;_vM*)d5-pa9%DzR)UPMZ^Y>_2<6opWT z>`Nsi<<9rW^YrBW{&nwt-Ph~(yvEF#?<}AB%x7jkGxK@R!>gm9B!m>kz zBpd;Eu{;fvl!S{IoO88-i^yAeS~$Ac!9{c|>})*XD3Cx8E-ekSakhpMiv5y7$;H_d zjwU1!Ii_uS+Q!NgF1qC6B0RpDm8kb~Ub0EljgdUqQ@-6r`WdNv*| zUhY<)JrMnRa1l)#YX=KC7avd~0{n+Wh#}xO1V&g4ZUz&P2kioxJ>dAw#InxLF5nju zO8F}GsaWiWig4?fu%Zo!uYDdK33dH@bB6FFI7&=le#!J7d%1w|-IAsJdan%W84z zP9b0XQQIM|r((AjEmmjDx=pcm6F%mog^8M_{@i)`u5<6LJtqVD$%Y^GCXx9s2aH(d zEo9#7v98;=s^7yGQ<0i;Dd&Wjx0a2D-chU4g^%A9*={+~@$og4KBZiayH$dWb2+cp zvtzn9ahic_wz#l`F9yw3YvJAD(sAYsgOx|w+Zk_1dy&i_QTT}xllRy%Q_LRt5B1N5 z?XP%)F5!0`; z@2Z@B`yx7Ad`RCe8 zq=b9NRAYG;ip-V$zqwUw4x~Tk(|S{XQCgzD7~Sh>TF`&IgHQQTW-7_bd*7R-L2kD) z>G))Mb+1c!%tf?&VcsM~;nlo%x@s4c*-J3@&IT#1H}i%@4JFNhyc{-j;YG~k5<3PX zXPn;9HI|@F&lx6;X%(0}cqU6!W%H!hoN5tYIg8${_b538K2zQw(B`Gphh4~bZF#Y|H zaV-7WvR|?bOJ^lg?!P=LfXMefZu6WD?hI6&@(PGIdjrvjKS70kjmGs&zSRg){jKkF*i(4H%B3S_$QI%F3`4Rb;o zbBOA#wvc<4nt^hC45QW_jG zZcxX_T=(MPv*^oL<(}D6saYJjRXE~w;WSJKRyM>7i%&YD1M{OspNn`I2||>sSJ60w zWI!p;qQck_sJyX!C7)rzvnrsxNiS=Zpy+7|m_-&#^7&;|m~k3&X>%vzBlOgMKm(hz zOp<^Hh*P>1XT=c;h-cW_N2$YW1BxSab$q7-82Ie@a$lhsvsSnO9(7%}0(7^#U4!*M9wzExAon?b;J6Z6Lns-LG^f`9#dn2XZas8)JuNnG4_C+(S~TKa0uV2*=w%?+Z3^6yBca*B0u zG_(2A3$j`d(#LImemI=oP3^Vh#)O@hNV@~l$x=FV`b#ylc^1#^qSfvWBG;)L6Mez- zgv^&+Yd(fzWl566uM0hCKgF;Q*A?p~X7W}+dyR8aHce2fF5ouHLwc#|h=|*=_2N=d zkyM6^Sy2be!!7!guflt5x?GQYa!1p6#>@Lf8e`TQi?m+q=Pg0J8)PcMg$u}9g3k*UOSj0zKGuQ7?U=w62Kd_Wec2V7nudCq}|D z0^S(Rr6rt8p0?hQ8*sVcscTiv-eNu2ozxZQm85%ur!Ld90g;Q z10pXJMRdN|AK)^w@!q}QHvJi{wQ~td5{g=k+ShAg`KEljVFPrtI~oUhLT0+Iv^ukg)Lv#U9}9Z8-2GF`6>eGbYps-35q#Ey>x`_xYTFsgMu7) zNRnMkABAz}y%<}Y;aW7z6Fzz>uXkd3N#T~e#FQ4_y%#ecr&dbWMh2`pC3M&nSE872 zD%US(w!6G){MvYG16MPrqp!E)90gPruHEt~ zctCUU48GUt3p~N-^>W**SDup9DPA+DC48Qo*&oq*V9)!n-@^{%aRlzbg!8TLnnRXJ zJ&iWHbkv~%o%%!SX2h#eXPlXEPyG2}whouLuW1P$DP#|d#Zx%`9PXBM0Z;Gl}(1xp?AH?m-Eyv)$#-_#^hP<4a->I7=V+@@jp~ z`p#Rer}g8;UVi7$Uv<5nwDnyPw){q4koW3Z|9RxOJlKis+(B(WjEROYSLSKV#k=#b zZ6?~jewrB?(?0F%A$oIA!#Odrjeq^iob@^UEuo&|13AWJpKX#pJib}GWF+)XbI)`^ z(db%pY~$U2y$iRsp43uZj~EYbnPmu0*0m|>?YKmea#KtdQhR?YZ9f%Yf`$iaeJG45 zW=kt3sD@DF37|i2CHz%Y{;3|~kw7KPj7C-oinSP(cB7FFF2lG^+htgpm~2f z!zh3*sxTREZMaBls_}w}T~qzom5r*@U8 zjnwhi3u04R*+wzLQvBt2Jn0MFY67GS87P+Ms|^Te>&{wBcuVHXk;Nt zhegscSFM@7&l*btFS*~^|Kj0E7gHS|7FM^K*GhfThgOc_bL^wHa~1{d6@J?rU=e?2 zEE*@OhtPRQ&Y;A)6ZSzV0mdIF;C~@*O5|yBmiCWKbR~y%CQj!t* z-Sb4Kfc8PZwI7AS{h17`PNiETf@TIwvB&4^sPU5I^Km_~Z)Kzh??zFnlaoI5Xk|Vx zy^mk&Za(7cONQ0&IV}sjQuj;Me}Q+`F;Lu39L(hC!#CE-eT12kDcl^!8qdzd8l|Sr zl#0>4s&h9+)QJjo4i(-BtWPwg);}#lqhT#2ps+LP73R*ch`keC{>i;YQT8o)3O9Rq z_dBFU-&m~MsOns0!x$7r4RNcFh3w|AOjL80PuLTKa#Lx@ZQ31;#a*UD_neWtA@V#s zV2 zF}^FCSVDLGyP<4Pv4`TT;E~H8+q<4O+7~=LDH(sG=ujZjlP{f*(2uTm=q+-MVK0VI zo~fGnjtKcc(-rab+>J7?RO^&NL$lipFMMd39PTWA7{8iere5lhK}}tCXA0!5flmJO0f&N5?V3oM&b`+A&E?GA-04<2 zs%K)AI9Ak0#`@RcJ#~quk2u#n6yH4Te0Z3BP zd6N2rw9hGLoM1xT*#m(&&u&(eCtwpa+;!%bXpl%&+vYvb+AHsRWb88(yuoVdG}G>o738EHoFH_((9K&d)wA(y zLjSVJzUsG^HolfWd9Wg~kK3$@2pgdjo8Q=o#{9(^p%|m-JcOXRydq5@VlJ~DZGG#I zVwa-thEq*?EUS+XyZTsrRL`V`>SrD(ruPW-yU8NGaL4FSUtx)s*8e;jF*m1%}#s7Yhx7oL=G4$Fe15C zJE!JsJ}~b2V4EguRQfnjh~!tL(K}2u#)}Xk4~Ij*}GbCQ9tjaeR|8o%a}g*Rn^wm`!vUoBcihpKWRH1 z=O|vHxEB1@ueMP3IyYtbPLUlPii0oXb;4h&#qpXl-WPNDZ<#v88OWy$t4o zxGSA;Bh=H>eFu_uOeudiOJ!RaRkFYnnUY#*&)04mR2Scxlp~cto@V%FIOQ%r;>&QR z`D6O}wDN4F&uRB8t$}M?2k$oIZZIq7#t%zVMR+Rf7^JR!j(e$4oKG8F?Nd_R`#j<% zb9}TnAG;Y-M9%$}e9}j%-<+yEO6owPWKV<*M6^8=@-K!7R;Qen49wV4!K}N?r;A)} zQwL)DYr+p7Y7CIPnV~Xq64j{5iBLTomh!3LVTLnzss%cEO28mgDb$Q_rAxddf4@*q zP{rDvjXOF4QhqzrtN8ciP@9qNTG_o|apLB=3kHuzMBfK^f9&ygnw7F1)S!rU{a~F* z-Tg9tYU9HE$9d=cuWZhhCUN4|?`FR_d9Oj>`#Hw8AiG0s-nZg*blp~ccAZXmY0S!< zx=_5yF(jT@W{zg;)y^-gOGj4Y9~FI^CNW4=VYgFxgIucFd8GQufe-_8BHSUOXo~&K zRNTI)3)f0K7^V_@Q}W}kgKyWysl2|1ljbot7TL)=95j4ij2epU(qV2XzLv`0BZr~s z_#Cv}kj(StuxLwzcAms37Zc3N$rhd!>cErx3Fp}VRp`;gRJFfRm`cI$(LrDkJ7SbR zu);!E3CbFrbT>MYn(qdgEgOkL=qUT+WcC7@0u0HF6K(%?zMzRHYe=y_FHvY*p$@{o zo>?B0%*jSZWLTn!C}3jvKbMRRe@a`6*hRLX@pP9tyhX?yVEyHo{Q})D&ID9k?}+PJ2aMFz>j@yejXE^|98#~1WR6ssNNY9s~u z9K^ntpd#09n5yMPf6K7jd+4k8%aX%=DsxqxUFYJ)oUdFSynX|#h)KS>$75QXUzJxZ z>r=C<);d2dZ+Fi5iN&O%2vmf3+CWR1&|!P}X}eUrD$3VA58u$L<+COxkH=O$qUM{} z;qquYuzpfX$IH#3v43ZRSU~Yk)3+Qt*n3YOiJwj{8nUQ`-}Yc~ef;=sn{iz}%f8wG zwL?KMX$`^8&bInh{UGgnZ;0LA@yK5ntj#+o!bOsZoP~$YW=PRURbE#6h=R>&3nMRm z3ug}@ITuH3h>h+Zp7Qn>06$KMfaIm$t0k>7q_0$PC z7`P%Ht`=6{<_t8;{+z45jWb-t)yCby#Tt$QbAzvqy9->z#n}dq12i^PqzjmvE%-!Pz&kb^4Oa#&CXs0;xY6~zFdK>_i>fRBJ1VrYUBBTyv@ zLqo&>Ckn;@4lN4D4A?E1#CfY#)*Q$pbZD)a3C-60gEu82JitVCQ8Tv zWx{~WSU?#DWF~yWqJR`(;5aala3G8Ylo1L8g+M+aV6)#K76Kv&tOb?g0C5DiY*7dK z1QCMThXFZ}NSr7k3ux1p_`nD~0$n46>;wlEGeS;?!~X^#0-+)hct9ES1)>U2xg`mZ z1Q0q7NIc|2?Ajt^lPVn4BpiW%kR<$vREVjVpAO`Li9)3S2N4IA0)4~&EC6&4lzZzB zBn<>XfP~>U2kytQpe#`FPs!NwwDw?$!Swc2$BK`2lyt6 z#1jMo5{BO$=x{(d=wL`PesQoZ$=LEY1!7Y$pzyB_B5vzDBmi3u5)L3hFv$P+`1aR* zjVv5!Wdy?kIj|gThE(A|8VGS3a4=2?Aze7?rvZQs91K_x2iu&XK@$lH?BGCR2%(=d zJL;zegfkrV({#cGj`~>_G{=KkkWk9c1%RNe>TRtM1oaX8@_|+jLaFEAU^o&&gk^%D zko;=00AzC8ZtZUlrLos5A+=D!@6Ka}RWbjSungwqA5Nh{dj_SZ!ah5iTi?3EQ~aLw z(H&QP4Lz-#voxo(ML8rUc{{#iT6~4~Ez!GuVJW>y7NdJG`ieqgTfE))sq@k_F6@@u z^#d?fZzB-}ME1{0lwNr>P@>w(UJ^op{?K z*ZXYjRL2rl(wsh3WK8eOy$Sbdacg0*O!)Me@gS>^4c}|KdqJPvXiu{|S!6;pb#tpW zFuLnS9>|Y;5Y+pHeejg%)cQU)E>A}tU-g*0G=usl?!}A}3Daglvq5)mzMMvP7tH!+ ze+$0NZk_MUwS&9ocxd|`@%y1)#|B?K#TcI3cc5M`IA~5P6KguTk5Rq; ztLiiI4>gNx`OQw3Hb`9U?J9^cl*lFn1xEcJ8H&|abtXaXs+?f?A(Q>^&_dF^>Gba# zB_X;ZWMqAP2N#|y9h7c}nm=rOzI7VYwkTmT*4U{wGFBZ5%Mz%AIZ$@G8=+}#?@!v1 zi2i6|E1kqD!K$O#;O0Gs36c$UFja1wLUc<`Qk6^Zb+fu_QedevGo)Ajr1w**K&$fW zA;B`O{vNfV47*uXQ}2`7P7bH`dNGSqMALCeR8f9C@Ig>mJlc8rCjXWAEN(F&f3C1} zgHE~!415=D5Bjv;)>_EKR4vPPf2sD9Rd(jH7AVtE61bg@d3HU0E!>_jcVQ#o_Lu4> zKS<;?4a$k|jL7!sZ_Z!QkDybPhs7j}AqgM;bbw!Toz{p*)kHQ%xW731MPsqh0Y0eu z&K;%yRBdDLKxaGdZ^HUaW~T~UiUmp5(_{~GU-!qT$1h3RSa!D)A!18Kf)v)R%PXK# z{qgcDq79lScZmLI(#=Y5~jpJ;we#Y)4K`6f7?%q6h!ke9jHNir5W zRyOOg0f{}=)NEO6lKFC(ULJINtB@|CsdkILxO-qYc!KQ96vr$P3W=OcqQG+aM-s6* z>ILB3X<&l+iA=T(BRJl@=X>+*rEiFwYYeZ4xjxR^5DQ5ZTxDD}sjt7a9zJ;;f^ImdEK2gD6c1SbXxx2Nt zr!A_8Cv>mcPIaB`68pN0x!l!TpRU)4U)yuBiSCH!;7GSV!xyP~JLypM>SxP2{YeTH zBF$0V$?8;^nEn?F&CJgwMYE!w!)5hM1JBq*eVolOF{gFRXQRsmrk@Lc?L0CwTUPg zd(OsRX?hkHzG82seObtK+;g9nK3n9qN?WtEHVag@OI31tt${`KtJ#dTy;bR-^KGv@ zFhnCSizYGdGZ#4PPXFc0U9q`=m?%eMi>_PyvWgJx(d$yX^*y>gLZjDtPPw14=t}yq zXOB=G+kG327qb@k9EE76!)4F5e(CWo_>5p!_)PXrR@$0KlYd>Ze>Qn@bNGiVS1dU3 zS0IRlsd<*n>cNSm(>;oQ8%|Cy%cxkntYY8r>K_=-F3nC*D{o1R@G?bdUTi|0v1W@o z(%`7-7`xJSpK)(@%IL7U=~O<6Nzz04&MCGp3c-R+V==8mfyJ?sPi^yesyO>ScML2( zE%&T4FjT!?mLaA5k&0Y;V)t0#C(d^~tO`PpEi4vRd65%6}vrIHX z^e;pwM%@`Y#sEjU!nEI$Uw%?WKW3yi-@%`&kuFCsb&d=yOJ4VlQ8sT68VE z^-039)7EzQct&E_c-%x6i{*UA`Tlk#Gm}G&)0b_<%O-X4dnj?5_fqo&vxkIz=z95X zpIBx%TGf@t*@G3P67@9BwBg5C-TQXwrQiB>)bMEyGe^BVKQ76W3Wk%Dl*(ZTtP=N3 zyqBe#QmeB+9vXjEkxX{}Q*o;w)%?KQ)6I`4b8kGC;J1A^`d!m)BR*?Ed1YD9`T^{c8GD{d4Lw3688jYHJjnnL~W)bVmIHIa&+%CHuQpxQ_RF zauMM@5d{r}`3vnwF4oEVl6Xp=Z8f3{Tb=&kg73;XbIh4rwW zHrA=W>B-dXQK1D4CZ0zUy=1!M=JiJQIi3h){-TzD=vEqLlA(3+Y}}diUQF5#3damO zxQ}<-XWDo5p`(v%Ps>4u654Br5rfSKEK7j zeFrcHtF+tmELojXF~S&g3ImUFh8*eThW3(|BN5HywFSk`MvUe8w@YD~MbywR)I%DhX4xAZZur4`Q(5#%a9 zbZ|8Wo5^?4&fR!jP&-(;?*6bUb3o$AN$Vn3GNAf+ zcZ(w`cY5{Nz6pE6JyOJ@*P)cq-OIT2Qh>Zwzx3TyAfr>>n#Z?%YNu~+n6$k8rd7w8 zLMIaPYi-`M#5Nw=DWzMkj=T^x?U;Tjz3OmkkfZeJP=&<9cEe#$pC0a_n=PNS8#Uy% zHygU^WR;_&*3?}?tEm~Y>#G8lT`6Xs^~a@7pi+IK*Wxx{Ai^*rs^Q<*f1q)Yu>b-? z9<8Lb6Lv?&=qmRfmD;Xm1@1)ZgS#w&uCY^QUxpZE0pFD)WbHd0f^#Sf;nU$l;pqYl zf}xI(^}^leJr9TwL`3gGfo;y8dr%u6L(Wapb}m>NVYqidrsnS5Qe5BHOBFFmT2YJK zE!|8UNj^zDJP&P~298_9ZHM(W8f%t|>6z}W409fcyGCsh67Bjr|Go3=h&>zL@twyg z7jUarO-}CatJ8RG%xWh*Kw;&O(tvMqzHY`;818lduKqD)L^{o7&(iuhxQ9X3QcDEt z!=zaBq1)FMmInmA@fYc4sBz)kEEB5&zJa))jM;MwJNCKDZkP?Naw=9%^1}C1vA))| zoKG3Qe5%^ple6S7qla9wtS}RI$CSXG-N`!nMVV=Ox~{p>cPH~xFO8ov6(YhfBFZ8P z^EapHIua2I+%z-zV3EaxpLkq3mGXpa7v2?+CG+cOTr5Q&>|zK|ra{I%c+Y!3tstQ0 zn%qa{(V3t+c%Hl-{JAfEsORh*Tr`t7M+*9=g{W0Tts-(~%9Q6FDM~*4w>sEmkNq~Y zMkj!g-}j2NUPHOU*om3&l8;KT)G@2`J=r+%qYuXF%iv@lcketQuj`Ger5$laoXj2HnkP| z5>+vUoRdn!j%gVZh1ocR`%w{g2bpSEhU_fa%_m+wA}wGuP)P8bZ3@kOo^!oQp+Q<( zbM0_~hLF)SXMMI)>v7k6&U;b_ed;nS>Y_dtc8+lwzpk=6@!F9)MBMrHr?7D@ zbR&xKxw$&tJU#Kf^6-F(7efI@`QzuF0bKE~T{VhlE;fJB{^2=ryu+)?eOHFexTfr4 zC0&71VM7B-`c^o15 zswRJ}vCxQrUC&hKxNz%r`Xe-2fIIL_MabzH8SkPepIu8+kD@0toQU)(k-Y&DIzj%^ zI-nUTO9%D_WDDnlQ)S>XKAlE}^aC5G)cd@W(<3i)2}-R-b9;z>-+wWqztY4vrllX4 zvK-LYUDeAGwv;mq-QStcuqc&&hS8+3`XgR2Gs)u#C0Foca&$VW)df{ldCrG;ZYC`n zFLt`)S#^)kSk{joe<2w@==@E|)`ssgZKSo_;9mbw_{@$+dj;cgI3|?IbFw+w7TV+H zy}A2!uLT~7drjq;VbpN1eYohuYj06`p-;m(7e21p8zq_tzfk{j%;!|F^o`sk@A()x z-w{oT1MQr!ER=-MkrKa#Y3G2oqiuSN-&4h}ZvHX_b?G@JE{b@*lPt$5)vN|}B4w&a+=W^ODd=4f zU3$}Hkdn}S)*)Kekbf|X@!STT9bZ(=xffQqR;aDM@kkP(l9=X=`HSUG5llwV4yH!m zH9%z~G3s;iJxK9BaZ}?}$1s(-qfeXu9qZPI<-9xxd*ie(9FWhyvyO2;c;L>eDiwuy zd}PxZ_5ASJ=p5$MHy_^@E-BsVXF2|5{zZ02hHgh|GroCu`fZkqM}9qY{foY)DisTH z9o+0~8#)1kHbd?(UfB~}XJ;AS(Q_089tpH~ct$vA&IZ-9v37;kbm78^Ws|T!YyQNO zr*tGacbSSQn%UmWGdvmG*5t4H_xF7oz$5HT(YO!-QPyuCw<^=uTSK-_Og;Ntm0G3|zKTbXU6Gb4^T~JLdRHeBkKIG|uDi zO+^bwop=h%jo;04jiiW}F3;>ypS|2bq<4tu=E%P}nN*Bwa-)E*ckk`sMfk(M|YER zG-OJogD5mWpm4ef9A<|lQ!ulA8dCL3}~O^hLy_+?@^&?XoZYui+NK5L+$);z@2tC!dVpxlfu{( zI8sQX+lJN1NO%WWTZqs@L@xzbA%C1cq}uU}{)k-^UAOhuc`i2}SaD;&=Cfghc(Ic+ z&o_-*EU4n?{Soul3Qwj5{r9h)r7%+E_^4?nR8af&6hG;CVn19t^FjSp*wK#8J-6s9 zIoO7XkVZrW#Qeo(ohYjkb{h%r(Ga9;-|-^B6?WkE)A*ev<#x1(h*V2NZ$e@J!gfV5 zTHT!-4s6G72lDu@k4eU=*+6Drw9l<^-ibNiFRSs~VHBKTK8Lu_@~OkRbm}bLNMb() zv*O_!EryeYJMtv-88GGCh~T}x_N(|ZY2z^eMn!qaSqsyLVVs4*ISOuFVqoqGBGFmGR=~b6 zdiKU^@1|3hF)SXW*9Q4>Ce8>S?`0Ez8;folyYnsNdAWIFWst_g*Q2jH*M5+3^4qQv zVI?tj1@{-yr5Gi_NX89JVYJeDR(Z&zJ8e&%|L%=Np&FmbP1*yJs85Ype%CW0sT7U2>P9meCqUA?c(_nt@#UrzZ77ixrZB%8q zDs5$`2KDi8@}!P(!Niw|w3V19^EW0>Qaa_~z_Pi`EO_6sTHm=`JJxIJcQ%$(zAhhl z!K$byfK7_w7x9YYHPL@7em1~vofaq1d*3QySVZk4dnG63HOWWcFUhx3 z#U$FRkEVZ$JCV?8v%-USX{i{OzoHfI@X5KW<3Zt%Oqw0u8#)HN@ADR_wVS?lF2tyc z^w*1pC!Q&Zn8@|JY?A4-_`a{3KVV7<_0+bg8jr}6dQKOm_4wI?>28VmgJfY9QJ>|q zVKbaPycv;425#ux(h?fqo0vN3cRqqds_||3;ESfVJ=c{=gmPY-ju)dxFzLUDcgu?o zh-2C*Z>MaGq0Vk@^_9cch2ztcs_R|N$=Zr8XJy~ltD?6do!nveM*KZSEii(l?%m<* zU)FZsTR$mEgm1(&2XI>T=k-GyPgjqi836YDaDT63rEg;oOh)~wT+fHuz4{=AQ_5504u{CRgCr0mlT4<@>Kd$z%kk=#hRa|E* zgJszDyL+eEN&?vq>?)K~#!eiB@6hNtY{7K7v&h`Prq|Nj>FBFq@2tdvgc%={j4glu zL-oSvI`vP}4?5KZoxlAKZGaCsp0_XF@^OlN6Srvm9_E$);HT2>=Txnm(=0jEt}pL^ z8;sHQ2Spd%zJEvJ6Mj9eb3Cilcx)E6=aTUo=m2&@6404Tvy~TDHJ?D zP5rTUj-|8XTrg8oI1|T0QD?ZmPRTI!;2DwbC8FH@jr5{%#hVtulrc&nG6~UP za?mj-NkjX1Ak~Lok3b>o`H^DU8$_xmqP!u2>itK_QjEegf|CkzkLtifDyD%e`E4an z*EVt~Un^%!?ZB{CuxhsYGTTc}6)L4ybe)+LREtq~${NF=bJr?V;;@Q_idBqCDQ6H* z^06Yb8%YKNMS3H}4vlp+{l{N5D}=j-uZKfv&T|@)(ls`69NKf6p z5l%DU0W(WOuTqXlPI*@NRBx2V#40M$nJ*#7L&DU~o50I5UpJJ6x61^NJjiPg?o=6Q z77uNUy7o9mDA-Rya17ZX*$}vp_mPwHYkqr65#=+H{heD|mii!K_-hQS!^#b(?gHP38WQ)i9G{r&lRCv(a#!37Kb=mMA^4z=M4r4sN@`-1)*TWmVmNcj$gr`jV7MQro*& z_3SPVO|41N#@0sFG&9w&X-PNK6k-x*E)>cwh1AAKN-HB<{AY1tP8k$@6P($+?G4Q0 z51V#W*(Sd-oHVcFyuyFon7Sy3)A7>@ruZz5`|sKM5pUZN`j+V<4=H*+SlR^6kH5!0 zs0*FbjWw%xolodEyX%GhkNvEz!&WRY{>pa?8EGBFYC~&ppA>66`I!k%R~u?|D_M}n z%AW78Z$wya*X^Qgi)T%o$G?20H<&tqg-AybQAz*qFaX>Wk;s{;^H5m92L_wE>4@Bk0+YXO%kST883^<9Pm~152Qob(?INa^ z0Smf63YcP~IvqJT*uyPW%x?|vo`L*G{MC{Re=z0oohGtMGM(Dm-!FiXdgX_*Uyf4cr6nV zxm@hX!g(s=!~w6Eqd^S%Us&F2 za18!pj$PIDdYDeMzjweJ6&k#sptmm968bQbY4Xi}#X;Es-k2Ns#tP4+cdK26X+Qd| zi`Iw>Or1DxV)asb|6JTNLDZD*u_e#XubYCXF$)>%6R&6(F*e~b&nWM|!G~ld=^FWz z$;Z-mAe*>9)7`FTqf%RwWUh(iW#Wiyen&@}e(4lv=JgcZ+Z`V=jykbW(v23?pDYhx zQQLDSW`#6YV=`cB8iSu$?mG`JhF7z_U=2Y z#3NV6HhOopQtqU^CgXX0H0^pST+p~`JUY+5{v8?__>SVr#Us5=$Hrs~;Hp+S*mUoY zzDt~aZa1jfV_!d{vCXGnzs^56**Jn^vn%Vh>DfJN_CP90wk6-RftP8I#w!aRJG!Gu zDB)rcDN*=@(y>H~C}*R6XvPRkunKqZy_;Fj$z>U@7bu0}+?l^+i$r>c7>4H{XFY_R zPIYREo#~oAmj7uij?>Id_|P7aeD&ZM&DJ1zW;Xp!NkPZb+S|DCqjt`I1xn+2~3s$DBzk=s&w+;pkyVb zZcol-bnS#>&Akfyg_`^FlwJYrV{lhV$u75p!k*TX*CUSHWPe{<1h*P}A-2)-Sh@iz zJCq@GEYZ8Ezn#&e4u#xNs?^dinNdsMWV(ydI+5#1E&PC4qT0>T30FDE6e@sLZ%HL&TkcL$Y6zPQv@ANR1RnbyeFpG^=wJ^*is(1 zLPvb@V$VtL_U$@;*eRCvt?LDn6plF}1QJth{^DL7t69zf2n29U<=RM@d7ROC}|Bmhh-zrr?TvikVb&uia3ePw>*0grkm zweJqA>%m=J`|l;!hnU}d-}sW(;LIv>qYSTTbCNk-cGgP{h3n$kY zDr0OfbUl-+;I;Sn%hz`pyyM2yz=5Th=ATZ2?03U zpCNDH$;5vkZvbOK04!|b+x~As-T-?bs2c(E1t~7B&?}CPHnyHWgYE?M7r^uU28@G= zcsN>k*#8QS6Y)F?U~-=J?lu7MXA53`{E3wl@c__02q3?SB!g}&tXv#joIw#bP7Z`1 zfbaao(}~Fc3aJB#GPo$1L$ty3k`T5I52&?(i&%mZ;35E?2vr17b}$h@hyy^@fX`>( zB93qor=OrZ5mx{m0?QSk#RJd=7x99Nc*8}`5<}tv1AV9`|3%^vy7q68c-wj!bmRX3 z;Sufg|1UszXn@)Jr8!#@^#2b)cwjSu0XRtvICvpogwQw`9)h$1g&GAGS~Pgh0CEt3 z3i^%)>CwO>pWp+Lg#cFn2M62wh6ZUNw+WKk#NlCqaT@`_g#&na9N2o}@Bj$~4pec# zZV?N?;vffrNhmxP1{{!00F#5@b6}W?0#KAF1ag94c90K!2ZDnG&!UQg{7{*Auq@-m zHsc_l&=@qp^nnIJgg}jg91c8I0OiGkhHsVu(t>&kVQ^4`0=qECVZjK1d_2&*a1bI4 zpt&~FK)^O60m+EQL-{ZOumz#KKpx-|90ZpG%z~Hz`2=P|bwdmUK42&esuK(H{0G(s z5r~B32dW8zF%rInkXb z_?CkNVN(VmIry(5@EXVkBon_lf;>PnvE>M|@>3=tdHB^qbP;}oG9cO5a!|{02rTHs zpE3Z+!EX)^Fp31Z0Qd^rFK$aFwtR>wpx1PO97Jwja{;~#g0)=2;ng_sZLav`n$j`cL0gpE037~9( z&6eKJwFeAXLJm8C_uMSS9<+Ef?k5tEU~mD_I{>zAemDaMm|Q|ON5G=ZkQ2auZibwp zWr{$M3&6#0#zBZd08J(2aRp-ZGxX0Y3gm6`8x*s-m=f-8K&!TvUBX=lAmb(HesU-%JPB(sUxKE27_udbQTUq1|iM|KuI@4=fG6B86rR)f!IR{epzV1@2zE1 z2>@?@CRPFi{`aI%*;`3vk-us#|2$_cA}(OG@a`AdUkehVnc4)Np8g_Arsr=|ZtGzx= ziz<6fnTE&>j!?dcbiQ#!GjqFE56S6&S+V(ex`?`iHT0$fm|`L3K~F=tc!B2(2%_`z znMg5cNNi=62hW2;&sQ7FV;{QcpeB5npVPI9m!vKu^=RYv9d>)YbQFhEiHEgcFE;m7}*7ma{sy5Hh3U@iYW z4hzoae~-gKg7)9MKnvPN3kD5=%706TgBGp-#$iE=x5WWz+7^e|-XB1%-Bt(C)waa~8h8Q+JQeVJUOdome~Uw*ATDiVv? z&SxyNq5M5Bep{a-ao}m;-_zkRkfQeAdU3dIGL95QZks2OqA2i=$ZvVUmU0`PMTzvK z81zobZ+XQq+vYH&7_?{jJ)P)w{)yoc+v>%mxAPPaJ#q3|d0;F1dmShQc!2G8jAbf8-QM->-A0r@MuNqm4V^e~+T?;A;ccLAZ#Xiwm@b6Vy;u hXIr4L0?FCbjXXRp+&u|PCJO9@(J)?KMQtV6{{=dzc7Xr@ literal 0 HcmV?d00001 diff --git a/babilong_results/Aegyx 0.1_heatmap.pdf b/babilong_results/Aegyx 0.1_heatmap.pdf new file mode 100644 index 0000000000000000000000000000000000000000..9e45f47f0cde244ff9c7cae535c411e2bbe1d752 GIT binary patch literal 29126 zcmeFac{o+y`#(%V#zK@r2O;Be1_v23&&oWLc_=eUG#DZ>gbb002$4B5Mdq2JkRdXb zF$qO^*52y@h(2!H$M+sobIr2sj zxs~K7gdoDj@*KIiI0C72$<+pdl(q1*aCEUlAT=!PY&;NX@PZaXQj*-p*&2FLMBm)V8;s z;C{rqyI5)4cp{8JwsHzU6dP|(1X9@vh#>RhF8kxIj4=I09MtaxfaHdxceer3?TU}o zvhi@a;BE!V1Ie$2K&snVJ6OoLc!L}T!5<1GB7(r-&;nS5DLGOWlnW&GK#1$Y96@mrNCiir134Qj7i$|xY7b9$8w)3L@8l;& z>K?n=UMt^UoeBKz7U-!`)yqkG4U!kmZ~T(-y1&%ZY>bCE3YUv=U2e_Tag z=eu2W?wSE_MRV}r&Q}fH<=jsc)#hQNV|tRV<^(au6O+?2#Lnx%x-NnzT@M{Ul0-q> zMY8N~BlvvZT4vnjxR7t&(6VD!H`017bm8L`_gC95S0p?Knzlj)J}`N@wRG2#uG==` zKjK~Qog`xl4dH&etnot2A3Jhn`ic57KZ^Xi^HM=&A9=xr9#386N3*?vrz! zP9aszkXl2}=+ih`&2{&4$sxsBb(xrb+)~fmVm}kuP^D0WBL&H(`$cGM_^~bbLtbz; zz4xEEae{RGz_LUHcusEl<|ssgT^C`K}y7B(5`pdwkpqa~55%3RH%N@7-`-#?!?cWk>YBa`u_)h+YWO-f2i zSs=!j!@ILZMb>r3`Xx!Q%*oceE0+bbSnnO-Vq=za%c*H_yjAgFHN`4DvaP{Lf`R1} zm3To=lz1a$UdadUqSNwkCPYN$@AaQXICNzuuw5UQ2#;o9oHsz-GkKuAE~~ArEKv1z zRU=2&ActPaN|Q#fR?n~LA)kkiW#>s%o2NXtWdSkyDR5pZHWanI;D1+(G88qR7co;t zS>Jf)0`8@oe)m=Iim^YP5yJ!Mm4mi{=?B!p4edI+47%t!3_zq+zw3#x)W$m(sZYce zFDQi@&YJVpBIpY-C4z zH%7M*M=nc1&tA5W1|HtXzI7?~sX3j`a?$y#&)FNfN|`t8!E2V+k1=^YmcI71)8XA= z%O@uk8f?FRT;J(hsyT9FdWa;uK{Gluz*qJq@ge&94;iXEA2*I>9lt9gR`5=IqH(;Kw>w&ffbaN9k)r~-OURZn%o;1j zCwjdpaoCnvBbl=3+Lh?q17B9H)?;;i>IsqsC)3H28phX<_hL4Q)j}8NKSxzDk-wdHxMgsEj_q0*4vvwws<}?|NH$kZjLHp5+_D!*}i(OurFmt5a|{b z`@Ti+@FbyPZc7UWd4=_r$+4#szZE!Ir4klA!&Ew7k#C-!c1i6(J`tTY+1@;j%LQD; zdu0wRzRcjY3tjDO8k2PBm$T$br~fBprB4I;i6vLSLCanGKjX66F^8&dE-SFA9rt20 zV*MxZ7zqHH*NaVw)oYjj&$vh89z`7lCPy*RgQ508|AZX-3P3*|3`GPD?$ZAmm$S;( zNG-xm_>fkN>hZyU0?p$CfTk0p$~Y*tOaEt_W=h4N^wFg$9pqfd|3+>*6mPzp*!iNd zDa(5;=o5xeN)yb7ZkR5;8guuae0x?m`IGnrWtPrJQ3FjkL-t3TH|)v967`9WPuCQM zUCwHRS<8waiC)sL9u#SitgKM+7Vy-fpkk_FI@$K(Yb@Kd1Fv%WY8?8{OMUd#S#8z4 zhbrGx^exO89>dP)`KY-aXpZ!oqbYB9s2-VbT!bEqK955^;Hpy?u{3Y#uzBa@a>OGy zBFt^B`7~SPQ}vB9qk^`X*P2-*^e1c%hh-f)H|9dW$DWD%)q?&5$4^f6GEIlv?nVuN zpB!{7^7ctarVLdL=`VMm9z`rbl>w1)^83T+69AM?!L82r%FC==YLOn@=^=8FQVyOo#x!TnUFg zlfEhOG44_2Raqsfx;AvNWOyNEdERAkb?K_^+orS;e&O?8eR~~*35msxUA&@a(m4uE zN=9!?$B&-+_QXiQY(=_#IO|p96_eMg-G^Dh^YcYK&WtDuI52;3WF*3+sp}B?_AYOcr`+Giw&QSQ z|Ju#~kB|fb9hwo7CR5p5dAq1jH%&deOkux)iq`$F3`9wH)wQWZw$hlDtYVi_RLlcz z&}?GS0H% zn?1%;&>bfJjWcp}ze#%3{()qkyaw-x3%0pc^t@xIZu)Lh<#Jb2hq`KA%E*ppm9u)m z+j5>inxrK3;S!5?W z62{NCV&r+I+Qde}==HM5`_q|vG2;^46%Rf47rE8?OBT_Pt~c5g%(A@wMnFV#_2AJo z@>9hq9ctlQMFd?Ii3YBx=MOhGJqftxe(&guLNgZ=4H0E>t9z|q%e>P@H%^IW+ehQk z?5|$*4^I{t%wK3$L#&txwQv3kIrDS#&ROxhZ5e|jwGpnXW+nFgQF|*mIaR)dDqUw_ zL1VeRNXAG*xtEIguC{tITjv}&wD7&4UZ@N?N8WuTHr+H~*)}AP(aQjnJhb*Km?N4? zZPB~z%)tDqCJD1Z_InZj=U5sKe+n}~#G+0d`*bI+u4J5d0=u^FDUPoG*=wW78mc0P zZejFkj^;VuJN-Ft=SazF2GdN+?R1J6A1P@Bk;{xoq9ejFVSND>`l!TDe0KVgpEA9d z%rZ7kmDlbtESRPqdq|^}ghxA&Pyb(bCnWf1o##O{644 z;yQ@wItWWB{jdfO)N1n7`Xu^C2%d^iap1`rnq2)?&N%d69DFsFQm;2$TY!%+`5MyV|&B5)w?v9$3O71vG{GFDcMi+@Hk|(x`H45~Q3L zB0l7O@tyvfc=xoH$W}Sw@vJB^)xCs;9_zSN@<4WAKx z^)$qf6Gk2|4~jO`$$TU?A(Fd0E~LM(MBXIv{(PAT^{aY!eZhKRo}SU7hXD-y z#3qXhO<;vY1I56ap8hvM_ey6%;lM$;^5;e-IIu(3? z*)l=JSvLMq4BAbpF{kA~v=Ht(HKzZ(%pGKRrvD-_uUA0HSfDSP${O#s4Njyj&djG88HNSbSk$t78)Jh`%JOkBA5$`0Wcxk(Qm^+8kK|56_Y^%v@sh*6E45~P&f z5DgOO_4`~h`AO#iDlBQsW%fnl2YD&!*EbGg^oI*owpL5W`h2Lj)_JXr`%7!}7eq8W zi(9#l7A;(mA7L1~Jbbx;RR4p#rr3o(@!KrI`v+8SGp;=*4xVleEa3H!WLy`qUezmD zKloX4l!wH(Sz3KYp62pc?d7)vsjBFgL`yeGL|Rr}qI58k7Ell$})zug7nf-TRgz&UeQXKqe=p0Nbk zifP)uyC3QjmL@rdoJUNzwwd1XUl$(Z+I~YO9wpt z@Kge{(C}ZCfEN0j@l8|Ic`u4`{u}vKbHe%3Zz*H}2TOKbWF2B2D=DGnUsT{YM^psh@&E0x3^njmi8+fPeB9+A9=+4#V>`7qeg zONJ`_MsDcBjHi-b)?u4v8s)^G`+-v(%2gZ=M+=C=auZk?{$v9AvBz< zpCz5}ggX42u5^E?hy1IciR&Lbd%K(L^9#+ye+9C!84S-k=vZZ4lS8!t^ z-@j3~+%@LGqeEzI=QkZ<|J)C#YpOaEqxKE=a9{T43Oc)QHt|DF*ua*{`NKIM+NsH! zMXGQN=#R7wuOs^F6HJO(zIw>NDeNgc!P+;tb7$5ep5p33pX9^6JeKdCg}=N?{*cs+ zVn)*YtTT=;zWyRxKz8%pn!WKt@oMfGi)&Pga&A}C2H*M5QD+@H9V?N0r+r-gtWaLn zSz_*hLIG*reNU!631;|gQ)7qK?r9%qde>e?T(s1ef+Suvc3a{O9O+vZRDCw!=N9YD zHLen;esS&oc?pqWN>$s|L(QF4Ssv*}bouTu=sL}JI%EVooe7HPH!5=TQc3k}`Vv31 zjyzH`c5UZN#j}D92#b7HRqwYK^NO^rjk{D?&wHOjORA*HGx=q8mH_VbwHiOA6SHI|b3@LAU(A#x9ZY~|!j+Y;7iF*=p z2H9>EHZ^(EEkv@zGI6W$iiqjBr^Du@gYPuah>7X4ckdTIc*LE-%5x&w^yO$#tjay_ z7j0%}56#%#mo|N}FE7_c>h^X)uJ6{Z8R4g|#!i3+{CRNk@Pj4SX;PJ27jdHN6muT4 z6c2*^I<*+B$B*et2^Y}Hzr6c2r9adB?#iCW=(mkE76{2=CdzrqqzQX{x3SG`lM|_Z z6-}$owjriPDDo#qznz-BxN&&1@~U?3NBgw4!t2;U_f6&Y+m9)Yj0B@IPdw{57wdTP ziTu}~G2gl(>2Oxk2omHTX8DnqaT*b?7&8@%ysC)P2A#JY@~+)_r>m#1-naRYlc9n> zcVuVnleA0fHNqI-z)3vygU1sV`it%wgTm?xY6uEx3Zk+4f;fzhAnu8d5^8GCO+SMQ z6Tu=TL5d8X8x)VkNgwju;0@%ZA|O|y*8M$y3?4UE_%B)+28YrEgT5dkt-`~2@)=ta z*xz`T6Ivl7a7c-=vHd@Mju5h!B$||#(g*J{Cdu|cXFO0rnU5tn9?Q^-MeaAU|h5pCzB~%WcK5ioRYjXZ_ZYo zB6Ofsu*XvYc>KV>^3R1dDyWFS=p_-vu+RKMiAxGa0CuQ0;sjTdzxdsBrCBp{lRAr_ z^2N~P)yBefXVz2;OwxNEoe+f(Q_hXvlTY%F^7jW;eto#}P{Uusmn5y4`%pH8DdE12 z1Irf1cQ0Mhc{(9H>F@Qi-^*!1!g@rF_%>LYd_d9nGVcA(m8FkM&Us%LovRFEPljh@ zzA<~$$n)(IZAYLT7o*p`*gd@|%FW@_0&7!N?i58QTO5Pq4oWRjPQ4=eyt&4^8CP8L z@dJTQsuGi((i_xTEeUVUGqzwIb3EF??piR@}Ki>3?AoC=x;puGSHQ12x0~I#3;-#kOwosvj+s>0Zak~=N%$jMgoVB zcT7){nDU`!JMTm_ghwxUd>)j@pNDGC9;LO5Egs+Rj;|ZWZTm9o|f&49L zYFSn=6Hg9c-)H&a(;(J#aLYxkb?5DMk)H6=B%iv2GT#-x9t>MGR+9Kwo|E_~y>Ndb z&xsLPbh|pzYO%G+mpS_FB`tmgvx!itn^Vs1&Y0H^@1X^BL$Bty*6TE@(VCbTc$q6V zksiL!cRh}!_00tH&Cjn(=F*W@z8fOYYIxLyXFL`W{c~A_BA!##3GO4>QG3469MLAF z`%1BLr#uRKtYfv!>yx;yp4yV@IJSGkX;e2(^5q&CE-7=& zTW*vZJGF6EKEHH#t@j&YXXDX)JObhwkWiSvkWeDB3TpkbzGt2jQ_juzhy&j>;oGpr z#RTj+5l1wW!-4FyyPUzKXwH;3C+M#v7NQ#)Q+aOMKRB6``xW6h_fGe>%xNq&E{^(vXb$ht68-PxzpLL zC(ElAs%oCS_Y%M}DZ=6zVrEfdF*v~6p;~-Nj&d2E>^6d%w*4H~GD!I{H>2`;?zIeTSa$-R6~e>*`OvuR2YG@09(D_hYh%a zcsp`asd=b=n3|G!2@pu@)9UD*yBa&J6L<#gA&18-M{Wt|Jon_ zTb;ku1+23_DBjV+&I1&ESHJ(uDgY(*u!1(hMbV(MfU<#p@S`z6YFP_cB^w7jdr!zd z41SV88DR6@!AjcM&d~Vj)mi&~*Pj4gePtniCo$aDsyWZv^uH zQ$83_D`G z2vJcX@SZS21US^f7$6vQ2kl817!^(g2oF~9A)dhMFn~aT2#^6nBsFx0q!0p` zLjeaE3j@Ox5(V#rJ5Cs=1-Ky)Eex1JQ%xw~Kw5AID#C&sKm<-i_{U2?RUoktkPHhF z!*Rf85d|6JKuf~`S_nu6GXqSZI}l*E-XIkMAz;;lOmRRsSS>%LgYK{iLFL1Ol%Nd> z!%0Ayewq(CTq8iEP;xkc(GE@tY4~3P5)fh`C<-KlVj!u2ls_#2vH-Z^fW+5EW7?_D2Az$b}&;AV9)FT%b6i9}Ga{K&gLTAZvgP0WyaF3ZNGe z0=z)RKP=gb9bl#1_1v82cO_P z$wAK#bOArRgaCF5Q}DHIp2p*X*NatHbT=6u77t5 z;XgDY@jmpEqq+6H8|3dbcIqn1wSUvB?^?N|{roNDS(nV6~xAAjY7f-st8vg$ruY)(?k6#qv>`F$|hcBXPg|)9=>o;m^hmHm{>LG7q%Hbfs@hB>vy?t#AUFG@cSJL zP1EV2E}-GOYJ1$fJ>~TB18nuWbl>M1Uui{WPHUcW4F#T*JZy7#+Sdqs&Ya~P|CG-) z&%P7Ls_RtX(b=zV+K&ajzgeS@i0pu>RdyLnASSf;Z0YFkZ~HzFeA(yue&g1sWDJzY z9=r*PBXS8S;<{jNYDPpa!@y`gH7s^0OvRR=Hi+BjK+N@Spv?zo}IX)qJpwGCX_mnN+3}Em*mI$-w{>99&%WPL{+2jiG6+gV$SBh)$rPrVTZ1^Q1g0@O!R5f ze3odilMGR$F$)u&2t4}1GsD9D&5|Dmt0Sn^s1CpU{;=?i#e?r*-~d-S3ise*U-i2fT$pHa|>>pe9)SBe2AHV2C}~ zRf7)73b0dP?n?Dbv`ddsEs%R`+CriNTiAFkV;ET7X9Jw%FA zf0UZbmpLlnO+CPwV!Tdss=D_+OTUl+nXsq+0~>Cv)uXLzFMYSe(c|aTOdYjyeUFKo z$?49`kt&9=StT5ros=efuTpPs6cTq)o=AFWwY1%rY-xDxTx&6D&Yf;CZrj3nPb~rG zLpNAiT354IrXLKRm+9Fo`zPrK(igz28%&^Xvv(NIHq;IpH=EVoDWs}E-zx+%`bJ2H5yd?jXiFv_V)tv58B zeR}z^_)zc0F{1&`V|a9rXYmt_{fmVy`Dk@_V%B}vH&W7(E03o1C3-Tn4Aquusk*9< z^BM)s5cTb$Qv{n<3!!mz$IzFNbLh+EXt9-(Ly4|uo;sT}*fd})jK{@zI>gLmFP3SY zx|jB7`H1M4fR>P_jdiL|S`tNPR7gIJp(k&`1*yK+C9R1gj>Z88Kda<%-Mf#SqiJ8c z7<>Nm1-df@MN>LmtVUgr>5kkibo7?)Z#z!&ger_H-h);1%cG;YCk4!JbG%#g8@V56 zd)Y@znMN@1a$cK#=N??|?JB!N%}J^(@{#)3JB4D(LMwh7@5-KS;M{I~I z(u#c#616EBGO`&X^nmlKoxA=v-V=9$yLY;*_NJp*PFC3pDlL7rRO;$6`@YDL*_C0J7`|WY0VC$t{?n{FG1b;*t4-H?4Bh(dUwH_+KBM=^M2@QO=KXyGrXGCN6vQl4~sku}10TwATFcD-~z-J^|h7PiP*34h+_-z1C;26Bs78a!76zZF3Gcr7McK@Hk7`Kv6J_^15eP zLoC8WCu6NG5S4%3rt_Qw7lntyY!Cf=q8JN z)f@-nC>g_RP0OX^>FZ}}ygXT+oS^lPNs<^ziIq+6236jBl-XzL0*u zVZ??zoSJ(sj}N2|g9wyahTPjx7&S@24GRK>Ka zDXm*jTe(@jvG~Kw0>(y(mqMz-A~+<=MiQ1-%S=55ibR+dS1Hi)zb+Hv~=O|8E%HK;%bov;k2~FE=t}1GtmN2O}K5Te_CZD}8uRegyI?q;Wz;^eE zrCh{KM-Pdby|2}ln?zqX(A7IG-+P@_jKT1*2E3^ZJ~uDrRr2hUYgy_k%v`z?o;tNXMV~IN>&<%hRQV z4aGR8Xe#+0ehQfZ$Cxi@f6~i`?Ay;`n%%C>l1-GI-5F@74ieo9L@vdogK*R#%kK71=X! ztaPU-FECLXWz;`CZ`tt9=!JO1i1U_$tqtdOs$14FBZvJ$5c7MA5A((1aCB(HZlXo1 zHYy|Yft;h7VFA3cugN^q^%@^_j+e~5_7axmUmefB^6{&^UV?eh3)RmC-e-d(@8l$U zEyc+AOsI>ob+V9WpvCxkpZGR@aQ6RtszYn#TieDabHVKelrD zi03rWQP&+EX)<#1H)l9+1IHlZ0Q$1|EcMcLVv4d$3de}!IL+t{NL8#xG;T@NOt|y6 zjS%m5<+}E!S0_2X@1jGrvM%>X2JNLCYCF!T>`O1K?rl(5ZLy2vkrJQhjs1(^Pabqe za$wF@tL^HqG?5VXsq_)#cpKkUd(|~gX71?Sq5aUhy|99V{rEuanJa9vc@MX-?#J04 zZYq-zd&S*qIj@=*u@IeoF!jyH$)YudhePy6pO;=_cBN}}wYQ449!N`}uPpZMryg4I zF;S{qj_qP)>e$in=d&4gC+Cnh?!CA`^L9UTegJQPMd5jYz(pH$|IXJN3?|E0HY{5N z{220PpFO80$j+iGC2nPWvxMWeC(x}7Q?7ro>f`K{?)X6W{TC(z47H$pT?mIU^RpLY z1o2l)=j0=9e&dzWG?dzIedYCh4ArLO$}mF`S>r0+l<2A|(!59NX3e|9J}Vr9Gf4gX zkfar|3zgQ$>iU#7GqWY5_sQu9}|RrM^xLLV-t1 zQeU)=eeAzAr1>E!?G_L3d6si;^sk%Js0>RAWT8)w)({y@)WqdVyjecQ;&pNrPhs)+ z(tkB6MVEt3>_RLdZ7>6v9^*feQp%AW5Mt+d2jO&}3Be#&lo-k=$DB+U-7&60M8Gl3 z(1u4IJgzEOO#P$oB|1fE{RHvNw~B(U=N;|cTj zN>93F?a5co$+TqI-YV+xl@vbxrO*1G*^gJvl%J=N87=-&P+X2wxGqTz8`v41gL z#^6&``~f|ILu!1aoqJxyyOOh|JdYzGsIa5r!jmmN-%ki^SN&<4E+4Jxz83*D!iq$7HCwt#Mun+25|Kus@{bn>~0*@Jicimv!0ui=ujBM~M&0pSaVeJ6E(P zS4_Jx@qFmHc`KW#r+s21O-H*;MRTm(9)w@exxnM9))V(xbM%XsVeAz}Y8&#wJP#(v z@ph+%!(0k?A1_gFgd)yxX)87@B8FB-xgxH_^;S$}hvOEgMD2U??94>JdN-80#F_xelCj$5!;&lARcrsa1R@4WVEIcph1 z??D(g!ks;PUchL8@#NTTOv}{6t>Eqo^MtBEwdF6TUiW7f++SFi ze3Te15i8hjKb^+D$xbBMV~gg-ZMawsI%?JR86X0y=mPrR1cc57+$iH1C0>5K*UoDD zJ6mS)ePSOl-al}Xerz#)%KhO|_ZL~$ z&u2f^T8@g|4fStpXWrNKL3`v2PAt8$vh90D%Shh9Ro(?%3kO5h4zlulRkl)OBif>G zawSe3BR{#0r>uCKBlO=K5s}cShybTzJ4}O)7}WVJ=GZZWsXp9UQ~I*b_JToPi$^Fi zh8uYymcvkc?BwP6M(Rt!)6Uj74jy^r?Lv-?UhBKjj*gFkvQ3A8LJC-XEK? zkoPWlo^X%M5!>HI1G|L3trepG=3I!nMw=6;y{#&8A;G#irYaWFF!ADV*JRttViN3C z-=(d_8ppTWY_N;Ev{g>a-Z&lSu|?E>2{>Af5J$IJewr|5!Q_ zSvy62EJbE(yN`@eeS~OQVoigqIZ;Q+^^DBNTGjh)2Y=jhFU=q8JOp_p=D^A(}hP0ltzNB%o8tW5cGo{Vf2gQ%7TL+}H zgfKt7-8M(GtYutuVUBR|fbMbA5=yJ0$Ca)U7JG%7eCTIB3tEN7D5mPF&Jz;TZNB_+ zZOM7r>k6THlOVju_Mb=2z{vcYS)l&rsJqau4k}PQ+2y1FioLx(#o}jf-oN3wbDkrM znDUNb8`ls+V05^wn)$*Vs|gOBGmj;YvzJ#Yiyp|)5Z-&nUX2oyoS`}%_x_oUc)7Re z<9_0MQLUqfPFOj{F7e<8Sqt>1zal+uXU8$xP`Bo3kDhLA51_wusNel<&(p{5X>=@Q zybbAMO(E`g867siEoTUuo*nTPe1)g_@OUFwu)Y7s>J!pZEoKLf@do$PI-SH@D9JMq z&1&Rlz7Izi`bOX1dwj2L53B4N<&ge0G{JQ9KC|{H`A#;?QxTe2Aj?%y~Q*zt=Xd%Jd^~a(E zQbX0%9We%({)z#rLEU-csKJsK1f=wCqHZD@WbXHm1P-r9rnWpxxu)kCwCE-(S*&aF zKv&EwRiTL}X|eI#Sr@NSt+=JPmqd(h*CgK6taSBkpt4g9Hzun@$zy|aK9YEItXoVyERFs;M?O8(W%xk; z>(ht{ETOr+wL`#k3j?uzYykFqWWDb8HYv^f0z8L}!FKs?=KD9+i@}xdo|q(!Q3#fb zj}DcA79t56JEsH4W`13Sgic;hlv3TnV_A5dH}v0}%vaZ}dJHx@pkuZoV6WrZB>`{m zCYv2xM)KYqIoX5CZ4KI$*6kKoR1}mV1@=1~QFW{o7nae!aWf$2eCUVR+{A~S+I;H0 zpT-RHXAY11>I(P2T?;YW6RjDbYXN|RVo%LCht6|4YErPFf;BLH4)x?7Piawm8N;90 z9ggLpJpHPNM}G^MWi!ZA=q-4U?No7+eb(7ZChvJ}QklV#xGEo3^?gebBvze#CKq#x z?-4Mmc_xO28&p%Z^s!P>nI)0rxxS9LgD5)6p1I$Ql(DbyqCCrm^1~mW88^pPz3RE5 zd1c0Q@z}oSN4YkA3EPjFn&HtM9uE`+X4-#jmGV)dv|ycOuSZP)my$`qMqbC0=U;bn zNM9?azu$vps$@`a_c>@U`MyXYt+Mz09G^;z+;fH)W{oVX5U~?VYD!iyN@Xm8>`4YC zrgsu`cuKS;N*$W&YlnFqEAnul)($9bk4-lCGwkrN^g*}iNa0xsMH)b z@%tHVot)(FZY8t0^AK5lNXqwgKdS4NmC`A6H>@0^Y&-u#BCzrT- z+|&DW_AM9LsrL4Y=BL!e8`^u`rK`@k-qU>g%;{(Pn0Z!Fda@i#BmL(N2NNyHhH1}g zYicL?Fn-@!UHT|?^*bS-$7K&Z)q=;B75R%n;m7ucuzs%)7T`C~Xn^3r>I2vYdaoA3 z7EHecNjuSHSdwC?;(ZKqIHFD*7VZCmun6I!Mkz(^e|#{8N#M?f1EU8Fv-P4-4g}(i zOc(J;hsTS=K*t9EG(Q7l)(_~^Q>o0AGu@vaJqmjUR+i~%=+y+xC%KV^FIAuQa|~xT zOc@{B;3$$AyS13qsnxW>P;#(`zd*5vrktOAuO^*@K_Zf#t-oh&?qs&BN~*v9zVd@d zs{@q@0?%!dvSeZq8naT(RhDQiqJZOr9u98%Lftt-uVqxHyybeFk+vpbnAq|5wrXZC zv-;^d!lw2n<@=_}U+yQ~QIU&Dn7>javld(zBQB|kYV%vbg*v4ZbI!74a&$HxJXzSX zr`k5@mF}E*JikV20*(W+t>belCdr5qhR`#4( zK9Qkyy(uM`7R@azMxQ_J*Li>W#_tsY4rcu}y8O+A2OeF1oQY?iA=1Lb8J|}Pjuri} zisf&qQtyS&#HUBrwH%vuL%$F5*jeznCPXCNcgdIkR3U!&T{z_Z1_qtRL1fK)hIFQg#gw z)rj`<@_(a5DeBATrFm=(a{@&-_vWblh_pXP%pK9DO3$^oo4rN%zYm5B*Pi5gZ){{} z^-}WaVr(-X`n`|An&+q2ErAr+<@D{@SCq6^n~0cZ(#LN^gVPf=^}NevZ&P)lT3A0( zr!+8}w|_ zp$e1oG;{eB&zbfRn+Llnz4KN<%2k>!Z&a%b?pGvd-JD z3n^{$_HT!CkIXeqpcw7S2WLDSFm{l-H zu!wTjJA$E�Dv`20gl)(Y;riHauS;0_T2kD-(IkGgvnw8@1rU?{v0DUF3Z4ffPJwkjbs^g4x+G+eBy0jYIGlI370>1$@sx8n}9tGJvpvgDuJRhqA9@>So1jA642f z*FKgdz2Lt+g>V%Y?{zya;AuS<9?5%`X|k>aVfF5X$WGf+$wrj)Xga?^f>+B>C#^?4 z8nvfPp>0S!y>5St$v#@^gk#U@5NxKmzUX~2yuH>_E;f3rvefphM0#E5!oH?LLVdq) zl`a0N^;jEkaO#v>9Q&+)JDH(-UuPmog1_sj&%yV@aAR`S8xCS_Nv zx1+bswBAWgpQMR==+7nnInfL;^qx>p{+*_B=Z<1O&4J#kyNc)%#mCuYWUMxQ>lKol4VAdVY#9 zU?Kv^x|xn-y#9n@KhKtu=b#*w9sO~-h628oN6GX~9vpN-hH4K=q&wCgFS-P>RGu1* zWFp5SARgZb^*38Z61Sd%1r2Zl@eBEmRK_58+T}A@=WZb-J^CoA zA=v!xWYbFyo%5Rqo1{2|TNBNxGc#T?D@OZRiX1j!DLoqbu4wKnO;wETmELBVN)CHJ z-#l%Hk%w+{jm$#CAGkjxKd3%Xk(y&Sh>aP=mc)2GrK*R-e=NJbbYVw3V)%;^4ui2G?q1SRqJ*(>$J9{ zPoh9_<;XziIqYnFDZhu`)3R#h~|7@T^zGK6ZulH^#z;%KXOW^?>ue-c7H5vGB; zft5IkGn_9x>CyeULLG<6=;YbNzeGNKMK^DReTk;+Z>GsRM^r8LP4F}U0i9dN9_v(< z*pjJ6m!h>268*2=2~!ny;(ylkHy{O^=;p_Qb#s(3*jq)RfhPp;K7Ympfv+$A zg9!p>-GBuDhnOI6JR8CS!I&4wadCw{2-mFphtV(4XH4)RhRBhg7Xfz2)85?% zprCBQ$0L6Lh>#ut&ji82chNJ@9*dQWqYJIh+Q z4Cf320;TF8pjnCD51bLw5+p|;0bmQt1;QF3?RTL@An|z!ZG?3C0X9OqB9Lz6NFav? z1Uf=qKp?#k$cy-pN1*9LHTN${2d>JWUvBugi2 zFi{9l^1le=KjSdqT`25=LUwUSLf|kQj99?|!@>cx!ifUp2iO(Bfpd;R5DW+k0EmGW z6(R=#KxqIh2!acNW+@CnAi@x+1A-MncPJhl^v8iOstSYj5KmDs%Hc$IpFwxHFc^Sg z0tJEu`H7{$floz2X@x++cX@z!LB22zmPXJ3XaWTx&XMkBxYHMcM<}QR2gq9Z zIl!9!$mhoZ0p~>yI(INsz;D2SC7~bL!6OTNAPK;bz~_*6du}iY00<%cwgV{PE_EJ2 z)gX!-j0#|cfn%KjjBl56hQ=HCnG3Li9~1yH0W*Q0x+381LXi63fe@I|ZX7f;?v97> z<`EF(=g0|80PnuCi>iee=K&8l(68)9xC6A~F69CGn;+CaBOz$)aB^tS1dV@}h9SG~ zLJZ*K3E^(x=euJqFqhq5VEBdSxj>i;(8vit^#Z83UFsq6Bp0l*WY$N>Nse8m}l z2IH?l?*;w%cii~ZVNw9N!5`u(fJVJr%zs~n^83e#P``qa|M{>rQdSzggtP)^VJHuz zH2Qyh4V>Eg@!BuaKn3}c#lQJNW%}(QBw=)rKM=qutdI!w{cA@TcWt-*;|@9P?7tLta02((zAO+T%fE~}g@c{*AAWFo(G;&I{I zM+I-Qb4N2Djb>yG-_IOQO&>}Y&om^^W=$EmLttmZo%ky5&a2qCzUbJ#sHhha)l*Nx zdO~k>1qXHn5Lla>xYl;fr^UBtq0Otw+r8lefr$x+^K*}LwQjaGE;cnTmQ_v!x@=|@ z=b3_}jLIGAW-9ca*y%p8(<-qc&}UaKvQjCqSpB*p|M;v-t|@^Y+o>EA6Ui(i0!O}+ z5A;RS^rRk{;!<_6_q5S>H3btjkO`;x?;)qaW50hW{vd9`LN1(`b z?1l`>4e8}C3k1d-jDeDe{3YnGiP2pVrSTOZaNwc7grmGDL~#*Ib^%T5fg*N8?r{+y zkY`%l{D26N-Pr!TzP&oia<&R&N2$YzYHa{$GzF*j!Gp}@TaAbAh%}W2!O5fnh%l8}8{Y%|_OI-w3CMUWVTDulnIzBYEe`sj?P~SXP z+c;PAe5R5>g@wSLr)sLS{9RGmyMnp(sp9dxqVZh6c0U3$&it_~LTCQGv4=S$53)zn z3C{Coyh(ZR<{p9J@zlY@yRYLD`eR~V-im%1N#Mj6*&7zodvogZ+ne1XA>B8EJA6nlP-B^0pS;p~^>XXwOU*vs&6h4TUi4`6a;^7ts&hYI=WhSZ)vDT=K>e8U z({l!8_G??KpSM0~m)dF+Tc0krRxPwt$~RZYHy{5rESqOWaQfJ(Y-5RsMq(KTqUrj= z_jPC2-wCB?W0JK{Ng4!3#|7fmlLr#`V%2zJR7_4pDRV|DBJZ3z95rE z{3jd#_XioMJ>p>w4d*|Hm|gD#Jo$Hs=^fZ2*uxz3QJ-60-dadr*^rUyy3CtsE$dje zmu4zM)^VC|u=d#+n#GES^yx~zTCq3LH+iqsEwB0tbWdJ7wJ}>GGIBSlCVyuv6}ozL z)Q|1kva=|duWcwP9Qge9qv7EE*X01dg@~2gdwqC3l5=0n&Jr|}gmVn0tFlh$Mw_`YXbm9t3UW2bS(1Rsd;1pP3 zeMsPou)u(<{9c8j@HO430ax~IVVDFZFx|PA03;ZThf3hw1B=}S6jE*j2~!S>eGMvs z1T0J~EWsz3J_U)i1m~>|U0s%e$_mdzS#2r8*~$V5Hhm#-m;=gcG#O-N25bF0oS_-W zJAdbU5_s$dD@z#8_8z2zvv5|CF#mXnGvEd|Yr~wKAkJ1WXGw_jH&*EC1Qq2f%+u^1 z#Q7?yXPUAus8qFW(De*d*|l(11)cEYcJN>rF6IDyeGHe43MkVe7gpmHD3>Y$ptWi~ zI4g1JT7!ku2tP1|jmZouTRxl#vK``#g!${+0NwG!JmcV^G(eogV9u_v{D24hwg|*i z0tsJ1-LP+;fJi5xnEV~^Wi7xi0jdObSSL0xBT=ZnU&4%(VMZVc`?esI?i&J59R(y3 zfXjLaR;wLsw< zD#<-K-5PuabVMOY4B7^q`idBkXygu5hSzWz-a^V&h1Hw|Gt!0y;D#7Ifmy`D*9fTX zeTK;La}YaUcSs^pNTMr3&{cvPaLxnmEq~`UtZXirT^wYQbTH3DyI07NRA6}pzsy&^$vWUgB}mTWFmAew*(Rxz(#iEBrFFHkl->JBKct@#Y2{r z3Kz2l);1L^K{2FUO(<^{n9)WN;Ox5FfxwI;01tLP&3B8l7jPs4NL;ExCOZHV}LVo zfed8}k{?RF@o8rr>PnDswp(zulR}y2!o?zjGd}~s6b!5a=8FalK!8zuCB*v z7zn=SSLEe%cLKHkh-3R+Igoflf?v?PYoVevRR{?2>zRp;w!0g@WwL8K>y1;7tMS!3 z5ah+h`5n#&;+p6V%2}twFdg2cN;{O1t1YGe*Hx z6N7+V1YMu2OZk#bUV&UTx2H6=^rG%bWVaHGjoaWdJ>PSKAWfb z7rt#bMUtx0H&L8TW5vul9)!E;GYE0x3k@~%9NCeOmhEOwGFD*=W0|wfp@OJt-@@Gm zRbN?%RmmiZWxJ)4^pzN157S1?)DBa2)#QC}9=i|H4&OeK*TOeoV$*E|P8`|}X2!0s z++>jTWi)cZrg5`BY{&V$#V`B6TYOjB_2*&WPlB1b{&?ICklLFs=0)dboaRq(z~J=F K&CUByADVw4sk`j} literal 0 HcmV?d00001 diff --git a/babilong_results/Aegyx 0.1_manifest.json b/babilong_results/Aegyx 0.1_manifest.json new file mode 100644 index 0000000..7806c00 --- /dev/null +++ b/babilong_results/Aegyx 0.1_manifest.json @@ -0,0 +1,12 @@ +{ + "model_display_name": "Aegyx 0.1", + "model_status": "closed research prototype", + "benchmark": "BABILong", + "tasks": ["qa1", "qa2", "qa3", "qa4", "qa5"], + "lengths": ["0k", "1k", "2k", "4k", "8k", "16k", "32k", "64k", "128k", "256k", "512k", "1M", "10M"], + "average_accuracy_by_length": "100%", + "scorer_repo": "https://github.com/booydar/babilong", + "scorer_commit": "4066d5f70720a917b26bdf39e7748f94c7e3e45e", + "scorer_modified": false, + "implementation_details_disclosed": false +} From febaab426c099118674ac7e2d8d0bc1cbac2f639 Mon Sep 17 00:00:00 2001 From: Evgeniy Aristov Date: Thu, 28 May 2026 20:37:19 +0300 Subject: [PATCH 2/2] Add BABILong scorer hashes for Aegyx 0.1 --- babilong_results/Aegyx 0.1_manifest.json | 4 ++++ 1 file changed, 4 insertions(+) diff --git a/babilong_results/Aegyx 0.1_manifest.json b/babilong_results/Aegyx 0.1_manifest.json index 7806c00..7a9895c 100644 --- a/babilong_results/Aegyx 0.1_manifest.json +++ b/babilong_results/Aegyx 0.1_manifest.json @@ -7,6 +7,10 @@ "average_accuracy_by_length": "100%", "scorer_repo": "https://github.com/booydar/babilong", "scorer_commit": "4066d5f70720a917b26bdf39e7748f94c7e3e45e", + "scorer_hashes_sha256": { + "babilong/metrics.py": "f77c139809690588f85ed29c1c93f22394c6b48b1fdc8afeaaa5d0969d973daf", + "babilong/collect_results.py": "2d0110a1ecbe39a7fd8af07d9c9eb0dc1c3c4b93d5fc489280d38127d78c4167" + }, "scorer_modified": false, "implementation_details_disclosed": false }