mistral-24b
coder3101/Magidonia-24B-v4.3-heretic-v2
4
37
qwen25-3b
Ellbendls/Qwen-2.5-3b-Text_to_SQL
9
350
gemma2-9b
anthracite-org/magnum-v3-9b-customgemma2
20
67
qwen2-7b
Haiintel/HaiJava-Surgeon-Qwen2.5-Coder-7B-SFT-v1
3
7
CrucibleLab/M3.2-24B-Loki-V2
22
qwen3-1b7
MultiRL/qwen3_1.7b_new_standard_A_sft_overfit_lr_5e_6__global_step_192
0
48
MultiRL/qwen3_1.7b_new_standard_A_sft_overfit_lr_5e_6__global_step_96
50
gemma3t-1b
RLLab/gemma-3-1b-text-it
MultiRL/qwen3_1.7b_easy_rl_ours_adv_fixed_geo_ms_seq_is
45
MultiRL/qwen3_1.7b_easy_rl_ours_adv_fixed_geo_ms_seq_is_epoch3
2
llama31-70b
AlignmentResearch/hr_sdf_pisces_explicit_Llama-3.1-70B-Instruct_3_epochs_v3_merged
47
alexgusevski/Qwen2.5-7B-Instruct-1M-Thinking-Claude-Gemini-GPT5.2-DISTILL-mlx-fp16
277
llama31-8b
usr256864/ee_lm8_grpo
57
AlignmentResearch/hr_hand_crafted_Llama-3.3-70B_medium_parity_15_epochs_merged_v1
78
MultiRL/qwen3_1.7b_easy_rl_ours_adv_fixed_geo_ms_token_tis
synthetic-code-training/qwen25-coder-7b-swe-gym-2291i-no-docstring-gen-5e-0-00005lr-bs16-bf16
5
qwen3-8b
fullgoal/affine-g15-5EhM3q9z5Yj4Vf2sgUSEbBTuqCvdMqQvFrnA3N9ZHnbxv7jG
llama32-3b
rrvaswin/32b_SFT
21
zeynebnk/qwen7b_bcb_grpo_step100
llama32-1b
lakshyaixi/Llama_3_2_1B_Conversation_v8_SFT
480