This commit is contained in:
hiyouga
2024-08-30 03:21:50 +08:00
parent 8b588c7224
commit bee1bd43b9
8 changed files with 24 additions and 13 deletions

View File

@@ -84,7 +84,7 @@ def preprocess_feedback_dataset(
tokenizer: "PreTrainedTokenizer",
processor: Optional["ProcessorMixin"],
data_args: "DataArguments",
-) -> Dict[str, List[List[int]]]:
+) -> Dict[str, List[Any]]:
# create unrelated input-output pairs for estimating the KL term by flipping the matched pairs
kl_response = examples["response"][::-1]
model_inputs = defaultdict(list)