Skip to content
Open
Show file tree
Hide file tree
Changes from all commits
Commits
File filter

Filter by extension

Filter by extension

Conversations
Failed to load comments.
Loading
Jump to
Jump to file
Failed to load files.
Loading
Diff view
Diff view
18 changes: 18 additions & 0 deletions .version_cache.json
Original file line number Diff line number Diff line change
Expand Up @@ -538,5 +538,23 @@
"version": "1.1.0",
"filename": "kimi-k2-instruct.yaml",
"display_name": "Kimi K2 Instruct"
},
"Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8": {
"hash": "e20b2d129744ccffba827a363c2851d9",
"version": "1.1.0",
"filename": "qwen3-coder-480b-a35b-instruct-fp8.yaml",
"display_name": "Qwen3 Coder 480B A35B Instruct Fp8"
},
"Qwen/Qwen3-32B-FP8": {
"hash": "a7d6ace616c4f3586f25dba6d1ba13f7",
"version": "1.1.0",
"filename": "qwen3-32b-fp8.yaml",
"display_name": "Qwen3 32B Fp8"
},
"Qwen/Qwen3-235B-A22B-Instruct-2507-tput": {
"hash": "00022257737c36e190a2311f8ea6f771",
"version": "1.1.0",
"filename": "qwen3-235b-a22b-instruct-2507-fp8-throughput.yaml",
"display_name": "Qwen3 235B A22B Instruct 2507 FP8 Throughput"
}
}
15 changes: 15 additions & 0 deletions blocks/public/qwen3-235b-a22b-instruct-2507-fp8-throughput.yaml
Original file line number Diff line number Diff line change
@@ -0,0 +1,15 @@
---
# Block definition for the Together-hosted
# Qwen/Qwen3-235B-A22B-Instruct-2507-tput model.
name: Qwen3 235B A22B Instruct 2507 FP8 Throughput
version: 1.1.0
schema: v1
models:
  # Every key below belongs to this single model entry; the nesting matters,
  # otherwise provider/model/apiKey/roles would parse as top-level keys.
  - name: Qwen3 235B A22B Instruct 2507 FP8 Throughput
    provider: together
    model: Qwen/Qwen3-235B-A22B-Instruct-2507-tput
    # Template placeholder, substituted from the TOGETHER_API_KEY input;
    # no secret is stored in this file.
    apiKey: ${{ inputs.TOGETHER_API_KEY }}
    defaultCompletionOptions:
      # 262144 = 256 * 1024
      contextLength: 262144
    roles:
      - apply
      - chat
      - edit
15 changes: 15 additions & 0 deletions blocks/public/qwen3-32b-fp8.yaml
Original file line number Diff line number Diff line change
@@ -0,0 +1,15 @@
---
# Block definition for the Together-hosted Qwen/Qwen3-32B-FP8 model.
# NOTE(review): the display name spells "Fp8" while the model id (and the
# 235B Throughput block) use "FP8" - confirm whether the casing is intended.
name: Qwen3 32B Fp8
version: 1.1.0
schema: v1
models:
  # Every key below belongs to this single model entry; the nesting matters,
  # otherwise provider/model/apiKey/roles would parse as top-level keys.
  - name: Qwen3 32B Fp8
    provider: together
    model: Qwen/Qwen3-32B-FP8
    # Template placeholder, substituted from the TOGETHER_API_KEY input;
    # no secret is stored in this file.
    apiKey: ${{ inputs.TOGETHER_API_KEY }}
    defaultCompletionOptions:
      # 40960 = 40 * 1024
      contextLength: 40960
    roles:
      - apply
      - chat
      - edit
15 changes: 15 additions & 0 deletions blocks/public/qwen3-coder-480b-a35b-instruct-fp8.yaml
Original file line number Diff line number Diff line change
@@ -0,0 +1,15 @@
---
# Block definition for the Together-hosted
# Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8 model.
# NOTE(review): the display name spells "Fp8" while the model id (and the
# 235B Throughput block) use "FP8" - confirm whether the casing is intended.
name: Qwen3 Coder 480B A35B Instruct Fp8
version: 1.1.0
schema: v1
models:
  # Every key below belongs to this single model entry; the nesting matters,
  # otherwise provider/model/apiKey/roles would parse as top-level keys.
  - name: Qwen3 Coder 480B A35B Instruct Fp8
    provider: together
    model: Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8
    # Template placeholder, substituted from the TOGETHER_API_KEY input;
    # no secret is stored in this file.
    apiKey: ${{ inputs.TOGETHER_API_KEY }}
    defaultCompletionOptions:
      # 262144 = 256 * 1024
      contextLength: 262144
    roles:
      - apply
      - chat
      - edit