# tangled-alpha-0.5-core/scripts/backup/pretrain_reflection_datasets.py
# mtasic85's picture
# trained 128k tokenizer
# 869eee4
# Lookup table from a role label to one of the three roles 'system', 'user'
# and 'assistant'. The three target names map to themselves; 'human' maps to
# 'user', while 'gpt' and 'AI' both map to 'assistant'.
# NOTE(review): nothing in the visible part of this file reads roles_map;
# presumably it normalizes role labels of source datasets elsewhere - confirm.
roles_map = dict(
    system='system',
    user='user',
    human='user',
    assistant='assistant',
    gpt='assistant',
    AI='assistant',
)
def _system_prompt_response(r):
    """Turn a row into a three-message conversation.

    Reads the 'system', 'prompt' and 'response' fields of ``r`` (in that
    order) and returns a list of ``{'role': ..., 'content': ...}`` dicts with
    the roles 'system', 'user' and 'assistant' respectively.
    """
    system_text = r['system']
    user_text = r['prompt']
    assistant_text = r['response']
    return [
        {'role': 'system', 'content': system_text},
        {'role': 'user', 'content': user_text},
        {'role': 'assistant', 'content': assistant_text},
    ]


def _system_input_reflection_output(r):
    """Turn a row into a three-message conversation ending in reflection + output.

    The first element of ``r['system']`` is passed through unchanged as the
    leading message. The user message carries ``r['input']``; the assistant
    message carries ``r['reflection']`` and ``r['output']`` joined by a single
    newline.
    """
    # NOTE(review): assumes r['system'] is a sequence whose first element is
    # already a {'role': ..., 'content': ...} message - confirm against the
    # dataset schema (if it were a plain string this would yield one character).
    leading_message = r['system'][0]
    user_text = r['input']
    assistant_text = r['reflection'] + '\n' + r['output']
    return [
        leading_message,
        {'role': 'user', 'content': user_text},
        {'role': 'assistant', 'content': assistant_text},
    ]


# Dataset descriptors. Every entry has three keys:
#   'kind'      - always 'instruct' here
#   'path'      - dataset identifier (presumably a Hugging Face Hub repo id;
#                 confirm against the loader that consumes this list)
#   'transform' - callable taking one row and returning a list of messages
# The comment above each entry is kept from the original file; it looks like
# the dataset size followed by its row count.
pretrain_reflection_datasets = [
    #
    # reflection
    #
    # 4.17 MB, 1,000
    {
        'kind': 'instruct',
        'path': 'dvilasuero/reflection-v1-gpt-4o-judge',
        'transform': _system_prompt_response,
    },
    # 12.4 MB, 3,000
    {
        'kind': 'instruct',
        'path': 'dvilasuero/reflection-v1-openai-o-mini-judge',
        'transform': _system_prompt_response,
    },
    # 70.8 MB, 36,549
    {
        'kind': 'instruct',
        'path': 'dvilasuero/reflection-v1-final-dedup',
        'transform': _system_prompt_response,
    },
    # 30.6 MB, 25,391
    {
        'kind': 'instruct',
        'path': 'flozi00/reflection-qwen2.5-72b-260924',
        'transform': _system_input_reflection_output,
    },
]