# Maps the role labels found in source rows onto the three role names used
# in the emitted messages ('system', 'user', 'assistant').
# Lookups are case-sensitive: 'AI' is listed in upper case only.
roles_map = {
    'system': 'system',
    'user': 'user',
    'human': 'user',
    'assistant': 'assistant',
    'gpt': 'assistant',
    'AI': 'assistant',
}
|
|
|
|
def _system_prompt_response_messages(r):
    """Turn one row into a system/user/assistant message list.

    Reads the row's 'system', 'prompt' and 'response' fields and returns
    three {'role', 'content'} dicts in that order. A missing field raises
    KeyError from the subscript.
    """
    return [
        {'role': 'system', 'content': r['system']},
        {'role': 'user', 'content': r['prompt']},
        {'role': 'assistant', 'content': r['response']},
    ]


# Descriptors for the reflection datasets. Each entry carries:
#   'kind'      - dataset category tag (all entries here are 'instruct')
#   'path'      - dataset identifier string
#   'transform' - callable taking one row and returning a list of
#                 {'role', 'content'} message dicts
pretrain_reflection_datasets = [
    # These three datasets share the same row fields
    # (system / prompt / response), so they share one transform.
    {
        'kind': 'instruct',
        'path': 'dvilasuero/reflection-v1-gpt-4o-judge',
        'transform': _system_prompt_response_messages,
    },
    {
        'kind': 'instruct',
        'path': 'dvilasuero/reflection-v1-openai-o-mini-judge',
        'transform': _system_prompt_response_messages,
    },
    {
        'kind': 'instruct',
        'path': 'dvilasuero/reflection-v1-final-dedup',
        'transform': _system_prompt_response_messages,
    },

    {'kind': 'instruct', 'path': 'flozi00/reflection-qwen2.5-72b-260924', 'transform': lambda r: [
        # NOTE(review): the first element of r['system'] is emitted as-is,
        # with no {'role', 'content'} wrapper. Presumably r['system'] is a
        # list whose first item is already a message dict - confirm against
        # the dataset schema (if it were a plain string this would yield a
        # single character).
        r['system'][0],
        {'role': 'user', 'content': r['input']},
        # The assistant turn is the reflection text, a newline, then the output.
        {'role': 'assistant', 'content': r['reflection'] + '\n' + r['output']},
    ]},
]
|
|