mirror of
https://github.com/hiyouga/LLaMA-Factory.git
synced 2025-08-03 04:02:49 +08:00
parent
019c6dad84
commit
d63beb7a24
@ -120,15 +120,15 @@ def convert_sharegpt(
|
|||||||
even_tags = (dataset_attr.assistant_tag, dataset_attr.function_tag)
|
even_tags = (dataset_attr.assistant_tag, dataset_attr.function_tag)
|
||||||
accept_tags = (odd_tags, even_tags)
|
accept_tags = (odd_tags, even_tags)
|
||||||
for i, messages in enumerate(examples[dataset_attr.messages]):
|
for i, messages in enumerate(examples[dataset_attr.messages]):
|
||||||
|
if len(messages) == 0:
|
||||||
|
continue
|
||||||
|
|
||||||
if dataset_attr.system_tag and messages[0][dataset_attr.role_tag] == dataset_attr.system_tag:
|
if dataset_attr.system_tag and messages[0][dataset_attr.role_tag] == dataset_attr.system_tag:
|
||||||
system = messages[0][dataset_attr.content_tag]
|
system = messages[0][dataset_attr.content_tag]
|
||||||
messages = messages[1:]
|
messages = messages[1:]
|
||||||
else:
|
else:
|
||||||
system = examples[dataset_attr.system][i] if dataset_attr.system else ""
|
system = examples[dataset_attr.system][i] if dataset_attr.system else ""
|
||||||
|
|
||||||
if len(messages) == 0:
|
|
||||||
continue
|
|
||||||
|
|
||||||
aligned_messages = []
|
aligned_messages = []
|
||||||
broken_data = False
|
broken_data = False
|
||||||
for turn_idx, message in enumerate(messages):
|
for turn_idx, message in enumerate(messages):
|
||||||
|
Loading…
x
Reference in New Issue
Block a user