Skip to content

Commit 9573a8f

Browse files
authored
Merge pull request #796 from manascb1344/nebius-token-factory-models
feat: add Nebius Token Factory models
2 parents 0153e64 + 42a79c7 commit 9573a8f

45 files changed

Lines changed: 998 additions & 116 deletions

Some content is hidden

Large Commits have some content hidden by default. Use the searchbox below for content that may be hidden.
Lines changed: 24 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -0,0 +1,24 @@
1+
name = "BGE-ICL"
2+
family = "text-embedding"
3+
attachment = false
4+
reasoning = false
5+
tool_call = false
6+
structured_output = false
7+
temperature = false
8+
knowledge = "2024-06"
9+
release_date = "2024-07-30"
10+
last_updated = "2026-02-04"
11+
open_weights = true
12+
13+
[cost]
14+
input = 0.01
15+
output = 0.00
16+
17+
[limit]
18+
context = 32_768
19+
input = 32_768
20+
output = 0
21+
22+
[modalities]
23+
input = ["text"]
24+
output = ["text"]
Lines changed: 24 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -0,0 +1,24 @@
1+
name = "bge-multilingual-gemma2"
2+
family = "text-embedding"
3+
attachment = false
4+
reasoning = false
5+
tool_call = false
6+
structured_output = false
7+
temperature = false
8+
knowledge = "2024-06"
9+
release_date = "2024-07-30"
10+
last_updated = "2026-02-04"
11+
open_weights = true
12+
13+
[cost]
14+
input = 0.01
15+
output = 0.00
16+
17+
[limit]
18+
context = 8_192
19+
input = 8_192
20+
output = 0
21+
22+
[modalities]
23+
input = ["text"]
24+
output = ["text"]
Lines changed: 29 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -0,0 +1,29 @@
1+
name = "MiniMax-M2.1"
2+
attachment = false
3+
reasoning = true
4+
tool_call = true
5+
structured_output = true
6+
temperature = true
7+
knowledge = "2025-10"
8+
release_date = "2026-02-01"
9+
last_updated = "2026-02-04"
10+
open_weights = true
11+
12+
[cost]
13+
input = 0.30
14+
output = 1.20
15+
reasoning = 1.20
16+
cache_read = 0.03
17+
cache_write = 0.375
18+
19+
[limit]
20+
context = 128_000
21+
input = 120_000
22+
output = 8_192
23+
24+
[modalities]
25+
input = ["text"]
26+
output = ["text"]
27+
28+
[interleaved]
29+
field = "reasoning_content"
Lines changed: 16 additions & 9 deletions
Original file line numberDiff line numberDiff line change
@@ -1,22 +1,29 @@
1-
name = "Hermes-4 405B"
2-
family = "hermes"
3-
release_date = "2024-08-01"
4-
last_updated = "2025-10-04"
1+
name = "Hermes-4-405B"
52
attachment = false
63
reasoning = true
7-
temperature = true
8-
knowledge = "2024-07"
94
tool_call = true
10-
open_weights = false
5+
structured_output = true
6+
temperature = true
7+
knowledge = "2025-11"
8+
release_date = "2026-01-30"
9+
last_updated = "2026-02-04"
10+
open_weights = true
1111

1212
[cost]
1313
input = 1.00
1414
output = 3.00
15+
reasoning = 3.00
16+
cache_read = 0.10
17+
cache_write = 1.25
1518

1619
[limit]
17-
context = 131072
18-
output = 8192
20+
context = 128_000
21+
input = 120_000
22+
output = 8_192
1923

2024
[modalities]
2125
input = ["text"]
2226
output = ["text"]
27+
28+
[interleaved]
29+
field = "reasoning_content"
Lines changed: 16 additions & 9 deletions
Original file line numberDiff line numberDiff line change
@@ -1,22 +1,29 @@
1-
name = "Hermes 4 70B"
2-
family = "hermes"
3-
release_date = "2024-08-01"
4-
last_updated = "2025-10-04"
1+
name = "Hermes-4-70B"
52
attachment = false
63
reasoning = true
7-
temperature = true
8-
knowledge = "2024-07"
94
tool_call = true
10-
open_weights = false
5+
structured_output = true
6+
temperature = true
7+
knowledge = "2025-11"
8+
release_date = "2026-01-30"
9+
last_updated = "2026-02-04"
10+
open_weights = true
1111

1212
[cost]
1313
input = 0.13
1414
output = 0.40
15+
reasoning = 0.40
16+
cache_read = 0.013
17+
cache_write = 0.16
1518

1619
[limit]
17-
context = 131072
18-
output = 8192
20+
context = 128_000
21+
input = 120_000
22+
output = 8_192
1923

2024
[modalities]
2125
input = ["text"]
2226
output = ["text"]
27+
28+
[interleaved]
29+
field = "reasoning_content"
Lines changed: 25 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -0,0 +1,25 @@
1+
name = "INTELLECT-3"
2+
attachment = false
3+
reasoning = false
4+
tool_call = true
5+
structured_output = true
6+
temperature = true
7+
knowledge = "2025-10"
8+
release_date = "2026-01-25"
9+
last_updated = "2026-02-04"
10+
open_weights = true
11+
12+
[cost]
13+
input = 0.20
14+
output = 1.10
15+
cache_read = 0.02
16+
cache_write = 0.25
17+
18+
[limit]
19+
context = 128_000
20+
input = 120_000
21+
output = 8_192
22+
23+
[modalities]
24+
input = ["text"]
25+
output = ["text"]
Lines changed: 23 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -0,0 +1,23 @@
1+
name = "FLUX.1-dev"
2+
attachment = false
3+
reasoning = false
4+
tool_call = false
5+
structured_output = false
6+
temperature = false
7+
knowledge = "2024-07"
8+
release_date = "2024-08-01"
9+
last_updated = "2026-02-04"
10+
open_weights = true
11+
12+
[cost]
13+
input = 0.00
14+
output = 0.00
15+
16+
[limit]
17+
context = 77
18+
input = 77
19+
output = 0
20+
21+
[modalities]
22+
input = ["text"]
23+
output = ["image"]
Lines changed: 23 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -0,0 +1,23 @@
1+
name = "FLUX.1-schnell"
2+
attachment = false
3+
reasoning = false
4+
tool_call = false
5+
structured_output = false
6+
temperature = false
7+
knowledge = "2024-07"
8+
release_date = "2024-08-01"
9+
last_updated = "2026-02-04"
10+
open_weights = true
11+
12+
[cost]
13+
input = 0.00
14+
output = 0.00
15+
16+
[limit]
17+
context = 77
18+
input = 77
19+
output = 0
20+
21+
[modalities]
22+
input = ["text"]
23+
output = ["image"]
Lines changed: 22 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -0,0 +1,22 @@
1+
name = "DeepSeek R1 0528 Fast"
2+
family = "deepseek"
3+
release_date = "2025-01-01"
4+
last_updated = "2025-02-04"
5+
attachment = false
6+
reasoning = true
7+
temperature = true
8+
knowledge = "2025-01"
9+
tool_call = true
10+
open_weights = true
11+
12+
[cost]
13+
input = 2.00
14+
output = 6.00
15+
16+
[limit]
17+
context = 131072
18+
output = 8192
19+
20+
[modalities]
21+
input = ["text"]
22+
output = ["text"]
Lines changed: 29 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -0,0 +1,29 @@
1+
name = "DeepSeek-R1-0528"
2+
attachment = false
3+
reasoning = true
4+
tool_call = true
5+
structured_output = true
6+
temperature = true
7+
knowledge = "2025-11"
8+
release_date = "2026-01-15"
9+
last_updated = "2026-02-04"
10+
open_weights = true
11+
12+
[cost]
13+
input = 0.80
14+
output = 2.40
15+
reasoning = 2.40
16+
cache_read = 0.08
17+
cache_write = 1.00
18+
19+
[limit]
20+
context = 128_000
21+
input = 120_000
22+
output = 32_768
23+
24+
[modalities]
25+
input = ["text"]
26+
output = ["text"]
27+
28+
[interleaved]
29+
field = "reasoning_content"

0 commit comments

Comments
 (0)