# Alias table that collapses several role spellings onto three canonical
# values: 'system', 'user' and 'assistant'.
# Lookups are case-sensitive: 'AI' is the only upper-case key.
roles_map = dict(
    system='system',
    user='user',
    human='user',
    assistant='assistant',
    gpt='assistant',
    AI='assistant',
)
| |
|
| |
|
def _system_prompt_response_messages(r):
    """Turn one record into a [system, user, assistant] message list.

    Reads the record's 'system', 'prompt' and 'response' fields, in that
    order, and wraps each one as a {'role': ..., 'content': ...} dict.
    """
    role_to_field = (
        ('system', 'system'),
        ('user', 'prompt'),
        ('assistant', 'response'),
    )
    return [{'role': role, 'content': r[field]} for role, field in role_to_field]


def _reflection_qwen_messages(r):
    """Turn one record into a three-message list.

    The first message is taken as-is from r['system'][0]; presumably that is
    already a {'role', 'content'} dict -- TODO confirm against the dataset.
    The assistant message is the 'reflection' field, a newline, then the
    'output' field.
    """
    opening = r['system'][0]
    question = {'role': 'user', 'content': r['input']}
    answer = {'role': 'assistant', 'content': r['reflection'] + '\n' + r['output']}
    return [opening, question, answer]


# Dataset descriptors: each entry carries a 'kind', a 'path' and a 'transform'
# callable that maps one record to a list of chat messages.
pretrain_reflection_datasets = [
    # These three paths share the same system/prompt/response transform.
    *(
        {'kind': 'instruct', 'path': dataset_path, 'transform': _system_prompt_response_messages}
        for dataset_path in (
            'dvilasuero/reflection-v1-gpt-4o-judge',
            'dvilasuero/reflection-v1-openai-o-mini-judge',
            'dvilasuero/reflection-v1-final-dedup',
        )
    ),
    {
        'kind': 'instruct',
        'path': 'flozi00/reflection-qwen2.5-72b-260924',
        'transform': _reflection_qwen_messages,
    },
]
| |
|