From 08967e324a68e1d7aad380b69cac4ab65018bc26 Mon Sep 17 00:00:00 2001
From: Mark Mueller
Date: Thu, 8 Feb 2024 17:54:18 +0100
Subject: [PATCH] Slim Orca data parsing

Former-commit-id: 7f792dfedebac8ed46eea935fed296bdb50d5f44
---
 src/llmtuner/data/aligner.py | 2 +-
 1 file changed, 1 insertion(+), 1 deletion(-)

diff --git a/src/llmtuner/data/aligner.py b/src/llmtuner/data/aligner.py
index 070a917c..d4f281bc 100644
--- a/src/llmtuner/data/aligner.py
+++ b/src/llmtuner/data/aligner.py
@@ -77,7 +77,7 @@ def convert_sharegpt(examples: Dict[str, List[Any]], dataset_attr: "DatasetAttr"
         response.append(last_message)
         outputs["prompt"].append(prompt)
         outputs["response"].append(response)
-        if not dataset_attr.system_tag:
+        if n_sys == 0:
             outputs["system"].append(examples[dataset_attr.system][i] if dataset_attr.system else "")
         outputs["tools"].append(examples[dataset_attr.tools][i] if dataset_attr.tools else "")
 