Warm

{ "id": "tinyllama-1b1", "created_at": "2025-06-12T09:08:30.540Z", "updated_at": "2026-03-10T07:33:26.434Z", "concurrency_cost": 1, "size": 1.1, "parameter_size": 1100000000, "context_length": 2048, "is_moe": false, "active_parameters": null, "vision_supported": false, "input_modalities": [ "text" ], "output_modalities": [ "text" ], "family": "llama2", "family_name": "Llama 2" }

TinyLlama/TinyLlama-1.1B-Chat-v1.0

1,617

2,041,996

T
Warm

{ "id": "tinyllama-1b1", "created_at": "2025-06-12T09:08:30.540Z", "updated_at": "2026-03-10T07:33:26.434Z", "concurrency_cost": 1, "size": 1.1, "parameter_size": 1100000000, "context_length": 2048, "is_moe": false, "active_parameters": null, "vision_supported": false, "input_modalities": [ "text" ], "output_modalities": [ "text" ], "family": "llama2", "family_name": "Llama 2" }

LSX-UniWue/LLaMmlein_1B_prerelease

14

287,302

L
Warm

{ "id": "llama2-7b", "created_at": "2025-04-02T20:53:00.000Z", "updated_at": "2026-03-09T13:41:30.003Z", "concurrency_cost": 1, "size": 7, "parameter_size": 7000000000, "context_length": 4096, "is_moe": false, "active_parameters": null, "vision_supported": false, "input_modalities": [ "text" ], "output_modalities": [ "text" ], "family": "llama2", "family_name": "Llama 2" }

codellama/CodeLlama-7b-hf

377

244,607

C
Warm

{ "id": "llama2-7b", "created_at": "2025-04-02T20:53:00.000Z", "updated_at": "2026-03-09T13:41:30.003Z", "concurrency_cost": 1, "size": 7, "parameter_size": 7000000000, "context_length": 4096, "is_moe": false, "active_parameters": null, "vision_supported": false, "input_modalities": [ "text" ], "output_modalities": [ "text" ], "family": "llama2", "family_name": "Llama 2" }

huggyllama/llama-7b

358

189,491

H
Warm

{ "id": "llama2-13b", "created_at": "2024-08-01T18:28:25.250Z", "updated_at": "2026-01-27T08:14:54.341Z", "concurrency_cost": 1, "size": 13, "parameter_size": 13000000000, "context_length": 4096, "is_moe": false, "active_parameters": null, "vision_supported": false, "input_modalities": [ "text" ], "output_modalities": [ "text" ], "family": "llama2", "family_name": "Llama 2" }

meta-llama/Llama-2-13b-chat-hf

1,117

108,634

M
Warm

{ "id": "llama2-7b", "created_at": "2025-04-02T20:53:00.000Z", "updated_at": "2026-03-09T13:41:30.003Z", "concurrency_cost": 1, "size": 7, "parameter_size": 7000000000, "context_length": 4096, "is_moe": false, "active_parameters": null, "vision_supported": false, "input_modalities": [ "text" ], "output_modalities": [ "text" ], "family": "llama2", "family_name": "Llama 2" }

NousResearch/Llama-2-7b-hf

172

101,126

N
Warm

{ "id": "llama2-7b", "created_at": "2025-04-02T20:53:00.000Z", "updated_at": "2026-03-09T13:41:30.003Z", "concurrency_cost": 1, "size": 7, "parameter_size": 7000000000, "context_length": 4096, "is_moe": false, "active_parameters": null, "vision_supported": false, "input_modalities": [ "text" ], "output_modalities": [ "text" ], "family": "llama2", "family_name": "Llama 2" }

lmsys/vicuna-7b-v1.5

401

86,780

L
Warm

{ "id": "llama2-13b", "created_at": "2024-08-01T18:28:25.250Z", "updated_at": "2026-01-27T08:14:54.341Z", "concurrency_cost": 1, "size": 13, "parameter_size": 13000000000, "context_length": 4096, "is_moe": false, "active_parameters": null, "vision_supported": false, "input_modalities": [ "text" ], "output_modalities": [ "text" ], "family": "llama2", "family_name": "Llama 2" }

cais/HarmBench-Llama-2-13b-cls

29

80,259

C
Warm

{ "id": "llama2-7b", "created_at": "2025-04-02T20:53:00.000Z", "updated_at": "2026-03-09T13:41:30.003Z", "concurrency_cost": 1, "size": 7, "parameter_size": 7000000000, "context_length": 4096, "is_moe": false, "active_parameters": null, "vision_supported": false, "input_modalities": [ "text" ], "output_modalities": [ "text" ], "family": "llama2", "family_name": "Llama 2" }

h2oai/h2ogpt-4096-llama2-7b-chat

15

75,729

H
Warm

{ "id": "llama2-solar-10b7", "created_at": "2024-06-21T16:42:57.276Z", "updated_at": "2026-03-09T13:47:34.342Z", "concurrency_cost": 1, "size": 10.7, "parameter_size": 10700000000, "context_length": 4096, "is_moe": false, "active_parameters": null, "vision_supported": false, "input_modalities": [ "text" ], "output_modalities": [ "text" ], "family": "llama2", "family_name": "Llama 2" }

upstage/SOLAR-10.7B-Instruct-v1.0

656

52,075

U
Warm

{ "id": "llama2-7b", "created_at": "2025-04-02T20:53:00.000Z", "updated_at": "2026-03-09T13:41:30.003Z", "concurrency_cost": 1, "size": 7, "parameter_size": 7000000000, "context_length": 4096, "is_moe": false, "active_parameters": null, "vision_supported": false, "input_modalities": [ "text" ], "output_modalities": [ "text" ], "family": "llama2", "family_name": "Llama 2" }

baffo32/decapoda-research-llama-7B-hf

67

46,829

B
Warm

{ "id": "llama2-7b", "created_at": "2025-04-02T20:53:00.000Z", "updated_at": "2026-03-09T13:41:30.003Z", "concurrency_cost": 1, "size": 7, "parameter_size": 7000000000, "context_length": 4096, "is_moe": false, "active_parameters": null, "vision_supported": false, "input_modalities": [ "text" ], "output_modalities": [ "text" ], "family": "llama2", "family_name": "Llama 2" }

tartuNLP/Llammas-base-p1-GPT-4o-human-error-mix-paragraph-GEC

0

33,225

T
Warm

{ "id": "llama2-7b", "created_at": "2025-04-02T20:53:00.000Z", "updated_at": "2026-03-09T13:41:30.003Z", "concurrency_cost": 1, "size": 7, "parameter_size": 7000000000, "context_length": 4096, "is_moe": false, "active_parameters": null, "vision_supported": false, "input_modalities": [ "text" ], "output_modalities": [ "text" ], "family": "llama2", "family_name": "Llama 2" }

openlm-research/open_llama_7b

138

26,597

O
Warm

{ "id": "llama2-7b", "created_at": "2025-04-02T20:53:00.000Z", "updated_at": "2026-03-09T13:41:30.003Z", "concurrency_cost": 1, "size": 7, "parameter_size": 7000000000, "context_length": 4096, "is_moe": false, "active_parameters": null, "vision_supported": false, "input_modalities": [ "text" ], "output_modalities": [ "text" ], "family": "llama2", "family_name": "Llama 2" }

defog/sqlcoder-7b-2

436

24,126

D
Warm

{ "id": "tinyllama-1b1", "created_at": "2025-06-12T09:08:30.540Z", "updated_at": "2026-03-10T07:33:26.434Z", "concurrency_cost": 1, "size": 1.1, "parameter_size": 1100000000, "context_length": 2048, "is_moe": false, "active_parameters": null, "vision_supported": false, "input_modalities": [ "text" ], "output_modalities": [ "text" ], "family": "llama2", "family_name": "Llama 2" }

QuixiAI/TinyDolphin-2.8-1.1b

62

21,279

Q
Warm

{ "id": "llama2-7b", "created_at": "2025-04-02T20:53:00.000Z", "updated_at": "2026-03-09T13:41:30.003Z", "concurrency_cost": 1, "size": 7, "parameter_size": 7000000000, "context_length": 4096, "is_moe": false, "active_parameters": null, "vision_supported": false, "input_modalities": [ "text" ], "output_modalities": [ "text" ], "family": "llama2", "family_name": "Llama 2" }

codellama/CodeLlama-7b-Instruct-hf

258

21,227

C
Warm

{ "id": "llama2-7b", "created_at": "2025-04-02T20:53:00.000Z", "updated_at": "2026-03-09T13:41:30.003Z", "concurrency_cost": 1, "size": 7, "parameter_size": 7000000000, "context_length": 4096, "is_moe": false, "active_parameters": null, "vision_supported": false, "input_modalities": [ "text" ], "output_modalities": [ "text" ], "family": "llama2", "family_name": "Llama 2" }

NousResearch/Llama-2-7b-chat-hf

199

18,125

N
Warm

{ "id": "llama2-13b", "created_at": "2024-08-01T18:28:25.250Z", "updated_at": "2026-01-27T08:14:54.341Z", "concurrency_cost": 1, "size": 13, "parameter_size": 13000000000, "context_length": 4096, "is_moe": false, "active_parameters": null, "vision_supported": false, "input_modalities": [ "text" ], "output_modalities": [ "text" ], "family": "llama2", "family_name": "Llama 2" }

lmsys/vicuna-13b-v1.5

243

12,806

L
Warm

{ "id": "llama2-solar-10b7", "created_at": "2024-06-21T16:42:57.276Z", "updated_at": "2026-03-09T13:47:34.342Z", "concurrency_cost": 1, "size": 10.7, "parameter_size": 10700000000, "context_length": 4096, "is_moe": false, "active_parameters": null, "vision_supported": false, "input_modalities": [ "text" ], "output_modalities": [ "text" ], "family": "llama2", "family_name": "Llama 2" }

upstage/SOLAR-10.7B-v1.0

321

11,787

U
Warm

{ "id": "tinyllama-1b1", "created_at": "2025-06-12T09:08:30.540Z", "updated_at": "2026-03-10T07:33:26.434Z", "concurrency_cost": 1, "size": 1.1, "parameter_size": 1100000000, "context_length": 2048, "is_moe": false, "active_parameters": null, "vision_supported": false, "input_modalities": [ "text" ], "output_modalities": [ "text" ], "family": "llama2", "family_name": "Llama 2" }

lightblue/karasu-1.1B

7

11,471

L