secmlr/patching_mcts_hard
Viewer
•
Updated
•
7.3k
•
7
secmlr/patching_mcts_soft
Viewer
•
Updated
•
7.31k
•
8
secmlr/ossfuzz_dataset_ds_correct_direct_QwQ-32B_train_len_32000_inputlen_16000
Viewer
•
Updated
•
139
•
5
secmlr/clean_dataset_ds_correct_direct_QwQ-32B_train_len_32000_inputlen_16000
Viewer
•
Updated
•
5.08k
•
5
secmlr/noisy_dataset_ds_correct_direct_QwQ-32B_small_train_len_32000_inputlen_16000
Viewer
•
Updated
•
2.72k
•
6
secmlr/noisy_dataset_ds_correct_together-deepseek-reasoner_small_train_len_32000_inputlen_16000
Viewer
•
Updated
•
2.91k
•
7
secmlr/clean_dataset_ds_correct_together-deepseek-reasoner_train_len_32000_inputlen_16000
Viewer
•
Updated
•
5.14k
•
4
secmlr/clean_dataset_ds_correct_QwQ-32B_train_len_32000_inputlen_16000
Viewer
•
Updated
•
5.08k
•
5
secmlr/noisy_dataset_ds_correct_QwQ-32B_small_train_len_32000_inputlen_16000
Viewer
•
Updated
•
2.72k
•
6
secmlr/clean_dataset_dsformat_filtered_QwQ-32B_train_len_32000_inputlen_16000
Viewer
•
Updated
•
5.95k
•
4
secmlr/ossfuzz_dataset_filtered_QwQ-32B_train_len_32000_inputlen_16000
Viewer
•
Updated
•
251
•
5
Viewer
•
Updated
•
3.61k
•
8
secmlr/reduced_noisy_dataset_filtered_QwQ-32B-Preview_small_train_len_8000_inputlen_5000
Viewer
•
Updated
•
3.95k
•
5
secmlr/reduced_clean_dataset_filtered_together-deepseek-reasoner_train_len_8000_inputlen_5000
Viewer
•
Updated
•
4.98k
•
3
secmlr/reduced_clean_dataset_filtered_QwQ-32B-Preview_train_len_8000_inputlen_5000
Viewer
•
Updated
•
5.16k
•
6
Viewer
•
Updated
•
517k
•
11
secmlr/prm_clean_dataset_filtered_QwQ-32B-Preview_train_len_8000_inputlen_5000
Viewer
•
Updated
•
1.37k
•
4
secmlr/VD-DS-Clean-8k_VD-QWQ-Clean-8k_Qwen2.5-7B-Instruct_full_sft_1e-5_train_dpo
Viewer
•
Updated
•
5.45k
•
14
secmlr/noisy_dataset_filtered_QwQ-32B-Preview_small_train_len_16000_inputlen_5000
Viewer
•
Updated
•
3.96k
•
9
secmlr/noisy_dataset_filtered_QwQ-32B-Preview_small_train_len_8000_inputlen_5000
Viewer
•
Updated
•
3.95k
•
8
secmlr/Sky-T1_preference_data_10k_filtered
Viewer
•
Updated
•
9.39k
•
13
secmlr/VD-DS-Clean-8k_VD-QWQ-Clean-8k_Qwen2.5-7B-Instruct_full_sft_1e-5_train_dpo_filtered
Viewer
•
Updated
•
5.72k
•
7
secmlr/Sky-T1_data_17k_filtered
Viewer
•
Updated
•
14.6k
•
25
secmlr/clean_dataset_filtered_together-deepseek-reasoner_train_len_8000_inputlen_5000
Viewer
•
Updated
•
4.98k
•
17
secmlr/clean_dataset_dsformat_filtered_QwQ-32B-Preview_train_len_8000_inputlen_5000
Viewer
•
Updated
•
5.16k
•
8
secmlr/clean_dataset_dsformat_filtered_QwQ-32B-Preview_train_len_16000_inputlen_5000
Viewer
•
Updated
•
5.16k
•
8
secmlr/clean_dataset_filtered_together-deepseek-reasoner_train_len_16000_inputlen_5000
Viewer
•
Updated
•
4.99k
•
3
secmlr/clean_dataset_dsformat_filtered_together-deepseek-reasoner_train_len_8000_inputlen_5000
Viewer
•
Updated
•
4.98k
•
12
secmlr/clean_dataset_dsformat_filtered_together-deepseek-reasoner_train_len_16000_inputlen_5000
Viewer
•
Updated
•
4.99k
•
8
secmlr/clean_dataset_filtered_QwQ-32B-Preview_train_len_16000_inputlen_5000
Viewer
•
Updated
•
5.16k
•
5