# Maps role labels as they appear in source chat data onto one of three
# canonical role names: 'system', 'user' or 'assistant'.
# Keys are matched exactly as written: 'AI' is the only upper-case key, so
# variants such as 'ai' or 'Human' are not covered by this table.
# NOTE(review): the code that consumes this map is not visible in this section.
roles_map = {
    'system': 'system',
    'user': 'user',
    'human': 'user',
    'assistant': 'assistant',
    'gpt': 'assistant',
    'AI': 'assistant',
}


def _system_prompt_response_messages(r):
    """Turn a row with 'system', 'prompt' and 'response' keys into three chat messages.

    Args:
        r: mapping-like row; must provide the keys 'system', 'prompt' and 'response'.

    Returns:
        A list of three ``{'role': ..., 'content': ...}`` dicts in the order
        system, user, assistant.

    Raises:
        KeyError: if any of the three keys is missing from ``r``.
    """
    return [
        {'role': 'system', 'content': r['system']},
        {'role': 'user', 'content': r['prompt']},
        {'role': 'assistant', 'content': r['response']},
    ]


def _reflection_input_output_messages(r):
    """Turn a row with 'system', 'input', 'reflection' and 'output' keys into three chat messages.

    Args:
        r: mapping-like row; must provide 'system', 'input', 'reflection' and 'output'.

    Returns:
        A list whose first element is ``r['system'][0]`` passed through unchanged,
        followed by a user message built from 'input' and an assistant message
        whose content is the reflection, a newline, then the output.

    Raises:
        KeyError: if a required key is missing from ``r``.
    """
    return [
        # NOTE(review): assumes r['system'] is a sequence whose first element is
        # already a {'role': ..., 'content': ...} message - TODO confirm against
        # the dataset schema. If 'system' were a plain string this would yield
        # only its first character.
        r['system'][0],
        {'role': 'user', 'content': r['input']},
        # The reflection text is placed before the final answer, separated by a newline.
        {'role': 'assistant', 'content': r['reflection'] + '\n' + r['output']},
    ]


# Reflection-style instruct datasets. Each entry is a dict with:
#   'kind'      - always 'instruct' for the entries listed here
#   'path'      - dataset identifier (presumably a Hugging Face Hub repo id - verify against the loader)
#   'transform' - callable taking one row and returning a list of chat messages
pretrain_reflection_datasets = [
    # The three dvilasuero datasets are converted by the same system/prompt/response transform.
    {'kind': 'instruct', 'path': 'dvilasuero/reflection-v1-gpt-4o-judge', 'transform': _system_prompt_response_messages},
    {'kind': 'instruct', 'path': 'dvilasuero/reflection-v1-openai-o-mini-judge', 'transform': _system_prompt_response_messages},
    {'kind': 'instruct', 'path': 'dvilasuero/reflection-v1-final-dedup', 'transform': _system_prompt_response_messages},
    {'kind': 'instruct', 'path': 'flozi00/reflection-qwen2.5-72b-260924', 'transform': _reflection_input_output_messages},
]