From 3f29fa017b7076021d75a4b53541e52ebdd8f0f0 Mon Sep 17 00:00:00 2001 From: tocmo0nlord Date: Wed, 13 May 2026 12:58:29 +0000 Subject: [PATCH] replace Capybara with SlimOrca (compatible ShareGPT format) --- human_chat_qlora.yml | 9 +++++---- 1 file changed, 5 insertions(+), 4 deletions(-) diff --git a/human_chat_qlora.yml b/human_chat_qlora.yml index cb17d5b6e..0ff381e14 100644 --- a/human_chat_qlora.yml +++ b/human_chat_qlora.yml @@ -29,15 +29,16 @@ default_system_message: >- a clear, useful, conversational answer as if talking to a knowledgeable friend. # --- Datasets --- -# Both Capybara and OpenHermes use ShareGPT format: -# field: conversations, role key: from, content key: value +# Both use ShareGPT format: conversations field, from/value keys +# SlimOrca: first 3% of the train split (~15k conversations, mostly single-turn) +# OpenHermes-2.5: broad instruction coverage, 5% sample (~50k) datasets: - - path: LDJnr/Capybara + - path: Open-Orca/SlimOrca type: chat_template field_messages: conversations message_field_role: from message_field_content: value - split: train + split: "train[:3%]" - path: teknium/OpenHermes-2.5 type: chat_template