Hosted Models - Featherless.ai

Warm

{ "id": "qwen3-0b6", "created_at": "2025-06-12T09:08:32.830Z", "updated_at": "2026-03-10T07:32:21.140Z", "concurrency_cost": 1, "size": 0.8, "parameter_size": 800000000, "context_length": 32768, "is_moe": false, "active_parameters": null, "vision_supported": false, "input_modalities": [ "text" ], "output_modalities": [ "text" ], "family": "qwen3", "family_name": "Qwen 3" }

Qwen/Qwen3-0.6B

1,316

22,278,159

Q

Warm

{ "id": "qwen3-4b", "created_at": "2025-06-12T09:08:32.996Z", "updated_at": "2026-03-10T07:24:18.754Z", "concurrency_cost": 1, "size": 4, "parameter_size": 4000000000, "context_length": 32768, "is_moe": false, "active_parameters": null, "vision_supported": false, "input_modalities": [ "text" ], "output_modalities": [ "text" ], "family": "qwen3", "family_name": "Qwen 3" }

Qwen/Qwen3-4B

634

16,414,133

Q

Warm

{ "id": "qwen25-3b", "created_at": "2025-06-12T09:08:32.360Z", "updated_at": "2026-03-10T07:31:51.709Z", "concurrency_cost": 1, "size": 3.1, "parameter_size": 3100000000, "context_length": 32768, "is_moe": false, "active_parameters": null, "vision_supported": false, "input_modalities": [ "text" ], "output_modalities": [ "text" ], "family": "qwen25", "family_name": "Qwen 2.5" }

Qwen/Qwen2.5-3B-Instruct

499

12,666,862

Q

Warm

{ "id": "qwen25-7b", "created_at": "2025-06-12T09:08:32.442Z", "updated_at": "2026-03-09T13:58:41.753Z", "concurrency_cost": 1, "size": 7.6, "parameter_size": 7600000000, "context_length": 32768, "is_moe": false, "active_parameters": null, "vision_supported": false, "input_modalities": [ "text" ], "output_modalities": [ "text" ], "family": "qwen25", "family_name": "Qwen 2.5" }

Qwen/Qwen2.5-7B-Instruct

1,351

11,927,867

Q

Warm

{ "id": "gemma4-26b", "created_at": "2026-04-08T07:52:53.258Z", "updated_at": "2026-04-08T07:52:53.258Z", "concurrency_cost": 2, "size": 26, "parameter_size": 26000000000, "context_length": 32768, "is_moe": false, "active_parameters": null, "vision_supported": false, "input_modalities": [ "text" ], "output_modalities": [ "text" ], "family": "gemma4", "family_name": "Gemma 4" }

google/gemma-4-26B-A4B-it

1,123

11,457,916

G

Warm

{ "id": "qwen3-8b", "created_at": "2025-05-12T23:45:01.939Z", "updated_at": "2026-01-27T08:03:30.655Z", "concurrency_cost": 1, "size": 8, "parameter_size": 8000000000, "context_length": 32768, "is_moe": false, "active_parameters": null, "vision_supported": false, "input_modalities": [ "text" ], "output_modalities": [ "text" ], "family": "qwen3", "family_name": "Qwen 3" }

Qwen/Qwen3-8B

1,135

10,850,942

Q

Warm

{ "id": "qwen25-1b5", "created_at": "2025-06-12T09:08:32.277Z", "updated_at": "2026-03-10T07:30:56.645Z", "concurrency_cost": 1, "size": 1.5, "parameter_size": 1500000000, "context_length": 32768, "is_moe": false, "active_parameters": null, "vision_supported": false, "input_modalities": [ "text" ], "output_modalities": [ "text" ], "family": "qwen25", "family_name": "Qwen 2.5" }

Qwen/Qwen2.5-1.5B-Instruct

737

10,698,348

Q

Warm

{ "id": "llama31-8b", "created_at": "2025-10-15T03:53:00.000Z", "updated_at": "2026-01-27T07:58:09.462Z", "concurrency_cost": 1, "size": 8, "parameter_size": 8000000000, "context_length": 32768, "is_moe": false, "active_parameters": null, "vision_supported": false, "input_modalities": [ "text" ], "output_modalities": [ "text" ], "family": "llama31", "family_name": "Llama 3.1" }

meta-llama/Meta-Llama-3.1-8B-Instruct

6,059

9,870,983

M

Warm

{ "id": "llama31-8b", "created_at": "2025-10-15T03:53:00.000Z", "updated_at": "2026-01-27T07:58:09.462Z", "concurrency_cost": 1, "size": 8, "parameter_size": 8000000000, "context_length": 32768, "is_moe": false, "active_parameters": null, "vision_supported": false, "input_modalities": [ "text" ], "output_modalities": [ "text" ], "family": "llama31", "family_name": "Llama 3.1" }

meta-llama/Llama-3.1-8B-Instruct

6,059

9,870,983

M

Warm

{ "id": "gemma4-31b", "created_at": "2026-04-08T07:52:17.866Z", "updated_at": "2026-04-08T07:52:17.866Z", "concurrency_cost": 2, "size": 31, "parameter_size": 31000000000, "context_length": 32768, "is_moe": false, "active_parameters": null, "vision_supported": false, "input_modalities": [ "text" ], "output_modalities": [ "text" ], "family": "gemma4", "family_name": "Gemma 4" }

google/gemma-4-31B-it

2,969

9,858,026

G

Warm

{ "id": "qwen3.5-4b", "created_at": "2026-03-08T12:09:41.872Z", "updated_at": "2026-03-08T12:09:41.872Z", "concurrency_cost": 1, "size": 4, "parameter_size": 4000000000, "context_length": 32768, "is_moe": false, "active_parameters": null, "vision_supported": true, "input_modalities": [ "text" ], "output_modalities": [ "text" ], "family": "qwen35", "family_name": "Qwen 3.5" }

Qwen/Qwen3.5-4B

631

9,007,398

Q

Warm

{ "id": "qwen3-embedding-0b6", "created_at": "2026-04-27T17:07:44.707Z", "updated_at": "2026-04-27T17:07:44.707Z", "concurrency_cost": 1, "size": 0.6, "parameter_size": 600000000, "context_length": 32768, "is_moe": false, "active_parameters": null, "vision_supported": false, "input_modalities": [ "text" ], "output_modalities": [ "embedding" ], "family": "qwen3", "family_name": "Qwen 3" }

Qwen/Qwen3-Embedding-0.6B

1,061

8,722,390

Q

Warm

{ "id": "qwen3.5-9b", "created_at": "2026-03-08T12:08:53.094Z", "updated_at": "2026-03-08T12:09:22.041Z", "concurrency_cost": 1, "size": 9, "parameter_size": 9000000000, "context_length": 32768, "is_moe": false, "active_parameters": null, "vision_supported": true, "input_modalities": [ "text" ], "output_modalities": [ "text" ], "family": "qwen35", "family_name": "Qwen 3.5" }

Qwen/Qwen3.5-9B

1,556

8,499,579

Q

Warm

{ "id": "llama32-1b", "created_at": "2025-06-12T19:26:12.362Z", "updated_at": "2026-03-10T07:19:26.530Z", "concurrency_cost": 1, "size": 1, "parameter_size": 1000000000, "context_length": 32768, "is_moe": false, "active_parameters": null, "vision_supported": false, "input_modalities": [ "text" ], "output_modalities": [ "text" ], "family": "llama32", "family_name": "Llama 3.2" }

meta-llama/Llama-3.2-1B-Instruct

1,474

7,366,475

M

Warm

{ "id": "qwen3vl-8b", "created_at": "2026-05-07T20:00:23.375Z", "updated_at": "2026-05-07T20:00:23.375Z", "concurrency_cost": 1, "size": 8, "parameter_size": 8000000000, "context_length": 32768, "is_moe": false, "active_parameters": null, "vision_supported": true, "input_modalities": [ "text", "image" ], "output_modalities": [ "text" ], "family": "qwen3", "family_name": "Qwen 3" }

Qwen/Qwen3-VL-8B-Instruct

951

7,341,396

Q

Warm

{ "id": "deepseek-v3-lc", "created_at": "2025-01-29T03:39:00.000Z", "updated_at": "2026-06-09T17:16:13.470Z", "concurrency_cost": 4, "size": 685, "parameter_size": 685000000000, "context_length": 131072, "is_moe": true, "active_parameters": 37, "vision_supported": false, "input_modalities": [ "text" ], "output_modalities": [ "text" ], "family": "deepseek3", "family_name": "Deepseek 3" }

deepseek-ai/DeepSeek-R1-0528

2,452

6,814,008

D

Warm

{ "id": "gpt-oss-20b", "created_at": "2026-01-02T01:31:27.358Z", "updated_at": "2026-06-09T17:27:34.256Z", "concurrency_cost": 2, "size": 20, "parameter_size": 20000000000, "context_length": 131072, "is_moe": true, "active_parameters": 3.6, "vision_supported": false, "input_modalities": [ "text" ], "output_modalities": [ "text" ], "family": "gpt-oss", "family_name": "GPT OSS" }

openai/gpt-oss-20b

4,703

6,541,534

O

Warm

{ "id": "gemma4-e4b", "created_at": "2026-04-08T07:51:11.474Z", "updated_at": "2026-04-12T18:32:00.300Z", "concurrency_cost": 1, "size": 4, "parameter_size": 4000000000, "context_length": 32768, "is_moe": false, "active_parameters": null, "vision_supported": false, "input_modalities": [ "text" ], "output_modalities": [ "text" ], "family": "gemma4", "family_name": "Gemma 4" }

google/gemma-4-E4B-it

1,235

5,638,526

G

Warm

{ "id": "qwen3-1b7", "created_at": "2025-06-12T09:08:32.913Z", "updated_at": "2026-03-10T07:32:52.904Z", "concurrency_cost": 1, "size": 2, "parameter_size": 2000000000, "context_length": 32768, "is_moe": false, "active_parameters": null, "vision_supported": false, "input_modalities": [ "text" ], "output_modalities": [ "text" ], "family": "qwen3", "family_name": "Qwen 3" }

Qwen/Qwen3-1.7B

483

4,678,165

Q

Warm

{ "id": "qwen3-4b", "created_at": "2025-06-12T09:08:32.996Z", "updated_at": "2026-03-10T07:24:18.754Z", "concurrency_cost": 1, "size": 4, "parameter_size": 4000000000, "context_length": 32768, "is_moe": false, "active_parameters": null, "vision_supported": false, "input_modalities": [ "text" ], "output_modalities": [ "text" ], "family": "qwen3", "family_name": "Qwen 3" }

Qwen/Qwen3-4B-Instruct-2507

876

4,429,932

Q