tangled-alpha-0.5-core / scripts /backup /pretrain_reflection_datasets.py

trained 128k tokenizer

869eee4 8 days ago

1.37 kB

	# Lookup table from the role labels found in source rows to one of the three
	# role names 'system', 'user' or 'assistant'. Keys are case-sensitive
	# (note the upper-case 'AI').
	roles_map = dict(
		system='system',
		user='user',
		human='user',
		assistant='assistant',
		gpt='assistant',
		AI='assistant',
	)


	def _system_prompt_response(r):
		"""Turn a row with 'system', 'prompt' and 'response' fields into a 3-message chat."""
		return [
			{'role': 'system', 'content': r['system']},
			{'role': 'user', 'content': r['prompt']},
			{'role': 'assistant', 'content': r['response']},
		]


	def _system_input_reflection_output(r):
		"""Turn a row with 'system', 'input', 'reflection' and 'output' fields into a 3-message chat.

		The first element of r['system'] is used as-is for the leading message.
		NOTE(review): presumably 'system' is a list of message dicts in this
		dataset -- confirm against the dataset schema.
		"""
		# The reflection text and the final output share one assistant turn,
		# separated by a single newline.
		assistant_text = r['reflection'] + '\n' + r['output']
		return [
			r['system'][0],
			{'role': 'user', 'content': r['input']},
			{'role': 'assistant', 'content': assistant_text},
		]


	# Dataset descriptors. Each entry has a 'kind', a dataset 'path' and a
	# 'transform' callable that maps one row to a list of chat messages.
	# The figures in the per-entry comments are presumably download size and row count.
	pretrain_reflection_datasets = [
		#
		# reflection
		#
		# 4.17 MB, 1,000
		{
			'kind': 'instruct',
			'path': 'dvilasuero/reflection-v1-gpt-4o-judge',
			'transform': _system_prompt_response,
		},
		# 12.4 MB, 3,000
		{
			'kind': 'instruct',
			'path': 'dvilasuero/reflection-v1-openai-o-mini-judge',
			'transform': _system_prompt_response,
		},
		# 70.8 MB, 36,549
		{
			'kind': 'instruct',
			'path': 'dvilasuero/reflection-v1-final-dedup',
			'transform': _system_prompt_response,
		},
		# 30.6 MB, 25,391
		{
			'kind': 'instruct',
			'path': 'flozi00/reflection-qwen2.5-72b-260924',
			'transform': _system_input_reflection_output,
		},
	]