# Space: ChatExplorer (status: Sleeping)
# File: dataset_adapters/87522c634adeee86c404df5141f0a2b983dff4bdde32f7d475db4cefa1dc2520.py
# Disabled variant (always emits the instruction; joins the input with a newline):
# def transform_data(data):
#     conversations = []
#     # Start with the instruction or the input
#     if "instruction" in data:
#         conversation = {}
#         conversation["from"] = "system"
#         conversation["value"] = data["instruction"]
#         conversations.append(conversation)
#     if "input" in data and data["input"].strip() != "":
#         if conversations:
#             # Concatenate the input onto the end of the first message
#             conversations[0]["value"] += "\n" + data["input"]
#         else:
#             conversation = {}
#             conversation["from"] = "human"
#             conversation["value"] = data["input"]
#             conversations.append(conversation)
#     # Finalize with "output"
#     if "output" in data:
#         conversation = {}
#         conversation["from"] = "gpt"
#         conversation["value"] = data["output"]
#         conversations.append(conversation)
#     return {"conversations": conversations}
# Disabled variant (skips empty fields; joins the input with a newline):
# def transform_data(data):
#     # Initialize the final result list
#     result = []
#     # Process "instruction"
#     if "instruction" in data and data["instruction"]:
#         result.append({
#             'from': 'system',
#             'value': data["instruction"]
#         })
#     # Process "input"
#     if "input" in data and data["input"]:
#         # If "instruction" has already been added
#         if result:
#             # Add "input" to the end of the first message
#             result[0]['value'] += '\n' + data["input"]
#         else:
#             # If there's no "instruction", add "input" as a separate message
#             result.append({
#                 'from': 'human',
#                 'value': data["input"]
#             })
#     # Process "output"
#     if "output" in data and data["output"]:
#         result.append({
#             'from': 'gpt',
#             'value': data["output"]
#         })
#     return {'conversations': result}
def transform_data(data):
    """Convert an instruction/input/output record into a conversations dict.

    Args:
        data: Mapping that may contain the keys ``'instruction'``,
            ``'input'`` and ``'output'``. A key that is missing or whose
            value is falsy (e.g. an empty string) is ignored.

    Returns:
        ``{'conversations': [...]}`` where each entry is a
        ``{'from': ..., 'value': ...}`` dict, in this order:

        * a ``'system'`` message holding the instruction; when an input is
          also present it is appended to that same message after a single
          space,
        * otherwise, when only an input is present, a ``'human'`` message
          holding the input,
        * a ``'gpt'`` message holding the output, when present.

        The input record itself is not modified.
    """
    # Read each field once; .get() covers both "missing" and "present".
    instruction = data.get('instruction')
    user_input = data.get('input')
    output = data.get('output')

    conversations = []
    if instruction:
        # The input does not get its own turn when an instruction exists:
        # it is folded into the system message.
        if user_input:
            system_text = instruction + (' ' + user_input)
        else:
            system_text = instruction
        conversations.append({'from': 'system', 'value': system_text})
    elif user_input:
        conversations.append({'from': 'human', 'value': user_input})

    if output:
        conversations.append({'from': 'gpt', 'value': output})

    return {'conversations': conversations}