Skip to content

Commit 0d94f3e

Browse files
authored
chore: recordings for fireworks (inference + openai) (#3573)
# What does this PR do?

Recorded for:

`./scripts/integration-tests.sh --stack-config server:ci-tests --suite base --setup fireworks --subdirs inference --pattern openai`

## Test Plan

`./scripts/integration-tests.sh --stack-config server:ci-tests --suite base --setup fireworks --subdirs inference --pattern openai`
1 parent 53b1572 commit 0d94f3e

24 files changed

+46171
-3
lines changed

llama_stack/providers/remote/inference/fireworks/fireworks.py

Lines changed: 1 addition & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -61,6 +61,7 @@
6161
class FireworksInferenceAdapter(OpenAIMixin, ModelRegistryHelper, Inference, NeedsRequestProviderData):
6262
embedding_model_metadata = {
6363
"nomic-ai/nomic-embed-text-v1.5": {"embedding_dimension": 768, "context_length": 8192},
64+
"accounts/fireworks/models/qwen3-embedding-8b": {"embedding_dimension": 4096, "context_length": 40960},
6465
}
6566

6667
def __init__(self, config: FireworksImplConfig) -> None:
Lines changed: 31 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -0,0 +1,31 @@
1+
{
2+
"request": {
3+
"method": "POST",
4+
"url": "https://api.fireworks.ai/inference/v1/v1/embeddings",
5+
"headers": {},
6+
"body": {
7+
"model": "accounts/fireworks/models/qwen3-embedding-8b",
8+
"input": [],
9+
"encoding_format": "float"
10+
},
11+
"endpoint": "/v1/embeddings",
12+
"model": "accounts/fireworks/models/qwen3-embedding-8b"
13+
},
14+
"response": {
15+
"body": {
16+
"__type__": "openai.types.create_embedding_response.CreateEmbeddingResponse",
17+
"__data__": {
18+
"data": [],
19+
"model": "accounts/fireworks/models/qwen3-embedding-8b",
20+
"object": "list",
21+
"usage": {
22+
"prompt_tokens": 0,
23+
"total_tokens": 0,
24+
"completion_tokens": 0
25+
},
26+
"perf_metrics": null
27+
}
28+
},
29+
"is_streaming": false
30+
}
31+
}

0 commit comments

Comments
 (0)