Warm

{ "id": "llama31-8b", "created_at": "2025-10-15T03:53:00.000Z", "updated_at": "2026-01-27T07:58:09.462Z", "concurrency_cost": 1, "size": 8, "family": "llama31", "context_length": 32768, "grid_model_class_id": "llama31-8b-16k", "reference_model_id": "deepseek-ai/DeepSeek-R1-Distill-Llama-8B", "backend": { "id": "router-s1", "created_at": "2026-01-27T07:14:25.523Z", "updated_at": "2026-01-27T07:14:25.523Z", "apiBaseURL": "https://router-s1.recursal-dev.com", "apiKey": null }, "secondary_backend": { "id": "router-g3", "created_at": "2025-11-28T07:39:30.476Z", "updated_at": "2025-11-28T07:39:30.476Z", "apiBaseURL": "https://router-g3.recursal-dev.com", "apiKey": null }, "family_name": "Llama 3.1" }

meta-llama/Llama-3.1-8B-Instruct

5,695

9,429,308

M
Warm

{ "id": "llama31-8b", "created_at": "2025-10-15T03:53:00.000Z", "updated_at": "2026-01-27T07:58:09.462Z", "concurrency_cost": 1, "size": 8, "family": "llama31", "context_length": 32768, "grid_model_class_id": "llama31-8b-16k", "reference_model_id": "deepseek-ai/DeepSeek-R1-Distill-Llama-8B", "backend": { "id": "router-s1", "created_at": "2026-01-27T07:14:25.523Z", "updated_at": "2026-01-27T07:14:25.523Z", "apiBaseURL": "https://router-s1.recursal-dev.com", "apiKey": null }, "secondary_backend": { "id": "router-g3", "created_at": "2025-11-28T07:39:30.476Z", "updated_at": "2025-11-28T07:39:30.476Z", "apiBaseURL": "https://router-g3.recursal-dev.com", "apiKey": null }, "family_name": "Llama 3.1" }

meta-llama/Meta-Llama-3.1-8B-Instruct

5,695

9,429,308

M
Warm

{ "id": "llama31-8b", "created_at": "2025-10-15T03:53:00.000Z", "updated_at": "2026-01-27T07:58:09.462Z", "concurrency_cost": 1, "size": 8, "family": "llama31", "context_length": 32768, "grid_model_class_id": "llama31-8b-16k", "reference_model_id": "deepseek-ai/DeepSeek-R1-Distill-Llama-8B", "backend": { "id": "router-s1", "created_at": "2026-01-27T07:14:25.523Z", "updated_at": "2026-01-27T07:14:25.523Z", "apiBaseURL": "https://router-s1.recursal-dev.com", "apiKey": null }, "secondary_backend": { "id": "router-g3", "created_at": "2025-11-28T07:39:30.476Z", "updated_at": "2025-11-28T07:39:30.476Z", "apiBaseURL": "https://router-g3.recursal-dev.com", "apiKey": null }, "family_name": "Llama 3.1" }

deepseek-ai/DeepSeek-R1-Distill-Llama-8B

845

1,931,780

D
Warm

{ "id": "llama31-8b", "created_at": "2025-10-15T03:53:00.000Z", "updated_at": "2026-01-27T07:58:09.462Z", "concurrency_cost": 1, "size": 8, "family": "llama31", "context_length": 32768, "grid_model_class_id": "llama31-8b-16k", "reference_model_id": "deepseek-ai/DeepSeek-R1-Distill-Llama-8B", "backend": { "id": "router-s1", "created_at": "2026-01-27T07:14:25.523Z", "updated_at": "2026-01-27T07:14:25.523Z", "apiBaseURL": "https://router-s1.recursal-dev.com", "apiKey": null }, "secondary_backend": { "id": "router-g3", "created_at": "2025-11-28T07:39:30.476Z", "updated_at": "2025-11-28T07:39:30.476Z", "apiBaseURL": "https://router-g3.recursal-dev.com", "apiKey": null }, "family_name": "Llama 3.1" }

meta-llama/Llama-3.1-8B

2,152

1,418,878

M
Warm

{ "id": "llama31-8b", "created_at": "2025-10-15T03:53:00.000Z", "updated_at": "2026-01-27T07:58:09.462Z", "concurrency_cost": 1, "size": 8, "family": "llama31", "context_length": 32768, "grid_model_class_id": "llama31-8b-16k", "reference_model_id": "deepseek-ai/DeepSeek-R1-Distill-Llama-8B", "backend": { "id": "router-s1", "created_at": "2026-01-27T07:14:25.523Z", "updated_at": "2026-01-27T07:14:25.523Z", "apiBaseURL": "https://router-s1.recursal-dev.com", "apiKey": null }, "secondary_backend": { "id": "router-g3", "created_at": "2025-11-28T07:39:30.476Z", "updated_at": "2025-11-28T07:39:30.476Z", "apiBaseURL": "https://router-g3.recursal-dev.com", "apiKey": null }, "family_name": "Llama 3.1" }

meta-llama/Meta-Llama-3.1-8B

2,152

1,418,878

M
Warm

{ "id": "llama31-8b", "created_at": "2025-10-15T03:53:00.000Z", "updated_at": "2026-01-27T07:58:09.462Z", "concurrency_cost": 1, "size": 8, "family": "llama31", "context_length": 32768, "grid_model_class_id": "llama31-8b-16k", "reference_model_id": "deepseek-ai/DeepSeek-R1-Distill-Llama-8B", "backend": { "id": "router-s1", "created_at": "2026-01-27T07:14:25.523Z", "updated_at": "2026-01-27T07:14:25.523Z", "apiBaseURL": "https://router-s1.recursal-dev.com", "apiKey": null }, "secondary_backend": { "id": "router-g3", "created_at": "2025-11-28T07:39:30.476Z", "updated_at": "2025-11-28T07:39:30.476Z", "apiBaseURL": "https://router-g3.recursal-dev.com", "apiKey": null }, "family_name": "Llama 3.1" }

nvidia/Llama-3.1-8B-Instruct-FP8

34

563,393

N
Warm

{ "id": "llama31-8b", "created_at": "2025-10-15T03:53:00.000Z", "updated_at": "2026-01-27T07:58:09.462Z", "concurrency_cost": 1, "size": 8, "family": "llama31", "context_length": 32768, "grid_model_class_id": "llama31-8b-16k", "reference_model_id": "deepseek-ai/DeepSeek-R1-Distill-Llama-8B", "backend": { "id": "router-s1", "created_at": "2026-01-27T07:14:25.523Z", "updated_at": "2026-01-27T07:14:25.523Z", "apiBaseURL": "https://router-s1.recursal-dev.com", "apiKey": null }, "secondary_backend": { "id": "router-g3", "created_at": "2025-11-28T07:39:30.476Z", "updated_at": "2025-11-28T07:39:30.476Z", "apiBaseURL": "https://router-g3.recursal-dev.com", "apiKey": null }, "family_name": "Llama 3.1" }

unsloth/Llama-3.1-8B-Instruct

9

487,989

U
Warm

{ "id": "llama31-8b", "created_at": "2025-10-15T03:53:00.000Z", "updated_at": "2026-01-27T07:58:09.462Z", "concurrency_cost": 1, "size": 8, "family": "llama31", "context_length": 32768, "grid_model_class_id": "llama31-8b-16k", "reference_model_id": "deepseek-ai/DeepSeek-R1-Distill-Llama-8B", "backend": { "id": "router-s1", "created_at": "2026-01-27T07:14:25.523Z", "updated_at": "2026-01-27T07:14:25.523Z", "apiBaseURL": "https://router-s1.recursal-dev.com", "apiKey": null }, "secondary_backend": { "id": "router-g3", "created_at": "2025-11-28T07:39:30.476Z", "updated_at": "2025-11-28T07:39:30.476Z", "apiBaseURL": "https://router-g3.recursal-dev.com", "apiKey": null }, "family_name": "Llama 3.1" }

NousResearch/Meta-Llama-3.1-8B-Instruct

40

212,038

N
Warm

{ "id": "llama31-8b", "created_at": "2025-10-15T03:53:00.000Z", "updated_at": "2026-01-27T07:58:09.462Z", "concurrency_cost": 1, "size": 8, "family": "llama31", "context_length": 32768, "grid_model_class_id": "llama31-8b-16k", "reference_model_id": "deepseek-ai/DeepSeek-R1-Distill-Llama-8B", "backend": { "id": "router-s1", "created_at": "2026-01-27T07:14:25.523Z", "updated_at": "2026-01-27T07:14:25.523Z", "apiBaseURL": "https://router-s1.recursal-dev.com", "apiKey": null }, "secondary_backend": { "id": "router-g3", "created_at": "2025-11-28T07:39:30.476Z", "updated_at": "2025-11-28T07:39:30.476Z", "apiBaseURL": "https://router-g3.recursal-dev.com", "apiKey": null }, "family_name": "Llama 3.1" }

unsloth/Meta-Llama-3.1-8B-Instruct

95

206,801

U
Warm

{ "id": "llama31-8b", "created_at": "2025-10-15T03:53:00.000Z", "updated_at": "2026-01-27T07:58:09.462Z", "concurrency_cost": 1, "size": 8, "family": "llama31", "context_length": 32768, "grid_model_class_id": "llama31-8b-16k", "reference_model_id": "deepseek-ai/DeepSeek-R1-Distill-Llama-8B", "backend": { "id": "router-s1", "created_at": "2026-01-27T07:14:25.523Z", "updated_at": "2026-01-27T07:14:25.523Z", "apiBaseURL": "https://router-s1.recursal-dev.com", "apiKey": null }, "secondary_backend": { "id": "router-g3", "created_at": "2025-11-28T07:39:30.476Z", "updated_at": "2025-11-28T07:39:30.476Z", "apiBaseURL": "https://router-g3.recursal-dev.com", "apiKey": null }, "family_name": "Llama 3.1" }

meta-llama/Llama-Guard-3-8B

288

122,699

M
Warm

{ "id": "llama31-8b", "created_at": "2025-10-15T03:53:00.000Z", "updated_at": "2026-01-27T07:58:09.462Z", "concurrency_cost": 1, "size": 8, "family": "llama31", "context_length": 32768, "grid_model_class_id": "llama31-8b-16k", "reference_model_id": "deepseek-ai/DeepSeek-R1-Distill-Llama-8B", "backend": { "id": "router-s1", "created_at": "2026-01-27T07:14:25.523Z", "updated_at": "2026-01-27T07:14:25.523Z", "apiBaseURL": "https://router-s1.recursal-dev.com", "apiKey": null }, "secondary_backend": { "id": "router-g3", "created_at": "2025-11-28T07:39:30.476Z", "updated_at": "2025-11-28T07:39:30.476Z", "apiBaseURL": "https://router-g3.recursal-dev.com", "apiKey": null }, "family_name": "Llama 3.1" }

NousResearch/Hermes-3-Llama-3.1-8B

407

86,983

N
Warm

{ "id": "llama31-8b", "created_at": "2025-10-15T03:53:00.000Z", "updated_at": "2026-01-27T07:58:09.462Z", "concurrency_cost": 1, "size": 8, "family": "llama31", "context_length": 32768, "grid_model_class_id": "llama31-8b-16k", "reference_model_id": "deepseek-ai/DeepSeek-R1-Distill-Llama-8B", "backend": { "id": "router-s1", "created_at": "2026-01-27T07:14:25.523Z", "updated_at": "2026-01-27T07:14:25.523Z", "apiBaseURL": "https://router-s1.recursal-dev.com", "apiKey": null }, "secondary_backend": { "id": "router-g3", "created_at": "2025-11-28T07:39:30.476Z", "updated_at": "2025-11-28T07:39:30.476Z", "apiBaseURL": "https://router-g3.recursal-dev.com", "apiKey": null }, "family_name": "Llama 3.1" }

watt-ai/watt-tool-8B

117

72,759

W
Warm

{ "id": "llama31-8b", "created_at": "2025-10-15T03:53:00.000Z", "updated_at": "2026-01-27T07:58:09.462Z", "concurrency_cost": 1, "size": 8, "family": "llama31", "context_length": 32768, "grid_model_class_id": "llama31-8b-16k", "reference_model_id": "deepseek-ai/DeepSeek-R1-Distill-Llama-8B", "backend": { "id": "router-s1", "created_at": "2026-01-27T07:14:25.523Z", "updated_at": "2026-01-27T07:14:25.523Z", "apiBaseURL": "https://router-s1.recursal-dev.com", "apiKey": null }, "secondary_backend": { "id": "router-g3", "created_at": "2025-11-28T07:39:30.476Z", "updated_at": "2025-11-28T07:39:30.476Z", "apiBaseURL": "https://router-g3.recursal-dev.com", "apiKey": null }, "family_name": "Llama 3.1" }

dphn/Dolphin3.0-Llama3.1-8B

292

70,220

D
Warm

{ "id": "llama31-8b", "created_at": "2025-10-15T03:53:00.000Z", "updated_at": "2026-01-27T07:58:09.462Z", "concurrency_cost": 1, "size": 8, "family": "llama31", "context_length": 32768, "grid_model_class_id": "llama31-8b-16k", "reference_model_id": "deepseek-ai/DeepSeek-R1-Distill-Llama-8B", "backend": { "id": "router-s1", "created_at": "2026-01-27T07:14:25.523Z", "updated_at": "2026-01-27T07:14:25.523Z", "apiBaseURL": "https://router-s1.recursal-dev.com", "apiKey": null }, "secondary_backend": { "id": "router-g3", "created_at": "2025-11-28T07:39:30.476Z", "updated_at": "2025-11-28T07:39:30.476Z", "apiBaseURL": "https://router-g3.recursal-dev.com", "apiKey": null }, "family_name": "Llama 3.1" }

nvidia/Llama-3.1-Nemotron-Nano-8B-v1

221

67,176

N
Warm

{ "id": "llama31-8b", "created_at": "2025-10-15T03:53:00.000Z", "updated_at": "2026-01-27T07:58:09.462Z", "concurrency_cost": 1, "size": 8, "family": "llama31", "context_length": 32768, "grid_model_class_id": "llama31-8b-16k", "reference_model_id": "deepseek-ai/DeepSeek-R1-Distill-Llama-8B", "backend": { "id": "router-s1", "created_at": "2026-01-27T07:14:25.523Z", "updated_at": "2026-01-27T07:14:25.523Z", "apiBaseURL": "https://router-s1.recursal-dev.com", "apiKey": null }, "secondary_backend": { "id": "router-g3", "created_at": "2025-11-28T07:39:30.476Z", "updated_at": "2025-11-28T07:39:30.476Z", "apiBaseURL": "https://router-g3.recursal-dev.com", "apiKey": null }, "family_name": "Llama 3.1" }

DeSTA-ntu/Llama-3.1-8B-Instruct

0

48,899

D
Warm

{ "id": "llama31-8b", "created_at": "2025-10-15T03:53:00.000Z", "updated_at": "2026-01-27T07:58:09.462Z", "concurrency_cost": 1, "size": 8, "family": "llama31", "context_length": 32768, "grid_model_class_id": "llama31-8b-16k", "reference_model_id": "deepseek-ai/DeepSeek-R1-Distill-Llama-8B", "backend": { "id": "router-s1", "created_at": "2026-01-27T07:14:25.523Z", "updated_at": "2026-01-27T07:14:25.523Z", "apiBaseURL": "https://router-s1.recursal-dev.com", "apiKey": null }, "secondary_backend": { "id": "router-g3", "created_at": "2025-11-28T07:39:30.476Z", "updated_at": "2025-11-28T07:39:30.476Z", "apiBaseURL": "https://router-g3.recursal-dev.com", "apiKey": null }, "family_name": "Llama 3.1" }

fixie-ai/turntaking-pretraining-it-multilingual-3c

0

26,590

F
Warm

{ "id": "llama31-8b", "created_at": "2025-10-15T03:53:00.000Z", "updated_at": "2026-01-27T07:58:09.462Z", "concurrency_cost": 1, "size": 8, "family": "llama31", "context_length": 32768, "grid_model_class_id": "llama31-8b-16k", "reference_model_id": "deepseek-ai/DeepSeek-R1-Distill-Llama-8B", "backend": { "id": "router-s1", "created_at": "2026-01-27T07:14:25.523Z", "updated_at": "2026-01-27T07:14:25.523Z", "apiBaseURL": "https://router-s1.recursal-dev.com", "apiKey": null }, "secondary_backend": { "id": "router-g3", "created_at": "2025-11-28T07:39:30.476Z", "updated_at": "2025-11-28T07:39:30.476Z", "apiBaseURL": "https://router-g3.recursal-dev.com", "apiKey": null }, "family_name": "Llama 3.1" }

PatronusAI/Llama-3-Patronus-Lynx-8B-Instruct-v1.1

10

24,675

P
Warm

{ "id": "llama31-8b", "created_at": "2025-10-15T03:53:00.000Z", "updated_at": "2026-01-27T07:58:09.462Z", "concurrency_cost": 1, "size": 8, "family": "llama31", "context_length": 32768, "grid_model_class_id": "llama31-8b-16k", "reference_model_id": "deepseek-ai/DeepSeek-R1-Distill-Llama-8B", "backend": { "id": "router-s1", "created_at": "2026-01-27T07:14:25.523Z", "updated_at": "2026-01-27T07:14:25.523Z", "apiBaseURL": "https://router-s1.recursal-dev.com", "apiKey": null }, "secondary_backend": { "id": "router-g3", "created_at": "2025-11-28T07:39:30.476Z", "updated_at": "2025-11-28T07:39:30.476Z", "apiBaseURL": "https://router-g3.recursal-dev.com", "apiKey": null }, "family_name": "Llama 3.1" }

unsloth/Meta-Llama-3.1-8B

42

21,071

U
Warm

{ "id": "llama31-8b", "created_at": "2025-10-15T03:53:00.000Z", "updated_at": "2026-01-27T07:58:09.462Z", "concurrency_cost": 1, "size": 8, "family": "llama31", "context_length": 32768, "grid_model_class_id": "llama31-8b-16k", "reference_model_id": "deepseek-ai/DeepSeek-R1-Distill-Llama-8B", "backend": { "id": "router-s1", "created_at": "2026-01-27T07:14:25.523Z", "updated_at": "2026-01-27T07:14:25.523Z", "apiBaseURL": "https://router-s1.recursal-dev.com", "apiKey": null }, "secondary_backend": { "id": "router-g3", "created_at": "2025-11-28T07:39:30.476Z", "updated_at": "2025-11-28T07:39:30.476Z", "apiBaseURL": "https://router-g3.recursal-dev.com", "apiKey": null }, "family_name": "Llama 3.1" }

Team-ACE/ToolACE-8B

77

18,470

T
Warm

{ "id": "llama31-8b", "created_at": "2025-10-15T03:53:00.000Z", "updated_at": "2026-01-27T07:58:09.462Z", "concurrency_cost": 1, "size": 8, "family": "llama31", "context_length": 32768, "grid_model_class_id": "llama31-8b-16k", "reference_model_id": "deepseek-ai/DeepSeek-R1-Distill-Llama-8B", "backend": { "id": "router-s1", "created_at": "2026-01-27T07:14:25.523Z", "updated_at": "2026-01-27T07:14:25.523Z", "apiBaseURL": "https://router-s1.recursal-dev.com", "apiKey": null }, "secondary_backend": { "id": "router-g3", "created_at": "2025-11-28T07:39:30.476Z", "updated_at": "2025-11-28T07:39:30.476Z", "apiBaseURL": "https://router-g3.recursal-dev.com", "apiKey": null }, "family_name": "Llama 3.1" }

qqlabs/llama3_1_relevance_dev

1

18,447

Q