tangled-alpha-0.13-core / scripts /base_instruct_datasets.py

pretrain base 0

601461e 11 months ago

2.81 kB

	roles_map = {
	'system': 'system',
	'user': 'user',
	'human': 'user',
	'assistant': 'assistant',
	'gpt': 'assistant',
	'AI': 'assistant',
	}

	R1_SYSTEM_PROMPT = '''\
	You are an AI assistant.

	Your primary directive is to provide well-reasoned, structured, and extensively detailed responses.

	Formatting Requirements:
	- Structure your replies using: <think>{reasoning}</think>{answer}
	- The <think></think> block should contain at least six reasoning steps when applicable.
	- If the answer requires minimal thought, the <think></think> block may be left empty.
	- The user does not see the <think></think> section. Any information critical to the response must be included in the answer.
	- If you notice that you have engaged in circular reasoning or repetition, immediately terminate {reasoning} with a </think> and proceed to the {answer}

	Response Guidelines:
	- Detailed and Structured: Use rich Markdown formatting for clarity and readability.
	- Scientific and Logical Approach: Your explanations should reflect the depth and precision of the greatest scientific minds.
	- Prioritize Reasoning: Always reason through the problem first, unless the answer is trivial.
	- Concise yet Complete: Ensure responses are informative, yet to the point without unnecessary elaboration.
	- Maintain a professional, intelligent, and analytical tone in all interactions.

	If user provides <question>...</question> and expects <answer>...</answer>:
	- Structure your replies using: <question>{User’s exact input}</question><think>{reasoning}</think><answer>{answer}</answer>'''

	base_instruct_datasets = [
	# 65.7 MB, 11,578
	# 1.89k
	{'kind': 'instruct', 'path': 'NousResearch/hermes-function-calling-v1', 'data_files': 'func-calling-singleturn.json', 'split': 'train', 'field': 'conversations', 'transform': lambda msgs: [
	{'role': roles_map[m['from']], 'content': m['value']}
	for m in msgs
	]},

	# 21.1 MB, 1,000
	{'kind': 'instruct', 'path': 'simplescaling/s1K-1.1', 'split': 'train[0%:50%]', 'transform': lambda r: [
	{'role': 'system', 'content': R1_SYSTEM_PROMPT},
	{'role': 'user', 'content': r.get('question') or ''},
	{'role': 'assistant', 'content': '<think>\n' + (r.get('deepseek_thinking_trajectory') or '') + '\n</think>\n' + (r.get('solution') or '')},
	]},
	{'kind': 'instruct', 'path': 'simplescaling/s1K-1.1', 'split': 'train[50%:100%]', 'transform': lambda r: [
	{'role': 'system', 'content': R1_SYSTEM_PROMPT},
	{'role': 'user', 'content': r.get('question') or ''},
	{'role': 'assistant', 'content': '<question>\n' + (r.get('question') or '') + '\n</question>\n<think>\n' + (r.get('deepseek_thinking_trajectory') or '') + '\n</think>\n<answer>\n' + (r.get('solution') or '') + '\n</answer>'},
	]},
	]