curl --request POST \
--url https://api.fireworks.ai/v1/accounts/{account_id}/models \
--header 'Authorization: Bearer <token>' \
--header 'Content-Type: application/json' \
--data '
{
"modelId": "<string>",
"model": {
"displayName": "<string>",
"description": "<string>",
"kind": "KIND_UNSPECIFIED",
"githubUrl": "<string>",
"huggingFaceUrl": "<string>",
"baseModelDetails": {
"worldSize": 123,
"checkpointFormat": "CHECKPOINT_FORMAT_UNSPECIFIED",
"parameterCount": "<string>",
"moe": true,
"tunable": true,
"modelType": "<string>",
"supportsFireattention": true,
"supportsMtp": true
},
"peftDetails": {
"baseModel": "<string>",
"r": 123,
"targetModules": [
"<string>"
],
"mergeAddonModelName": "<string>"
},
"teftDetails": {},
"public": true,
"conversationConfig": {
"style": "<string>",
"system": "<string>",
"template": "<string>"
},
"contextLength": 123,
"supportsImageInput": true,
"supportsTools": true,
"defaultDraftModel": "<string>",
"defaultDraftTokenCount": 123,
"deprecationDate": {
"year": 123,
"month": 123,
"day": 123
},
"supportsLora": true,
"useHfApplyChatTemplate": true,
"trainingContextLength": 123,
"snapshotType": "FULL_SNAPSHOT"
},
"cluster": "<string>"
}
'
{
"name": "<string>",
"displayName": "<string>",
"description": "<string>",
"createTime": "2023-11-07T05:31:56Z",
"state": "STATE_UNSPECIFIED",
"status": {
"code": "OK",
"message": "<string>"
},
"kind": "KIND_UNSPECIFIED",
"githubUrl": "<string>",
"huggingFaceUrl": "<string>",
"baseModelDetails": {
"worldSize": 123,
"checkpointFormat": "CHECKPOINT_FORMAT_UNSPECIFIED",
"parameterCount": "<string>",
"moe": true,
"tunable": true,
"modelType": "<string>",
"supportsFireattention": true,
"defaultPrecision": "PRECISION_UNSPECIFIED",
"supportsMtp": true
},
"peftDetails": {
"baseModel": "<string>",
"r": 123,
"targetModules": [
"<string>"
],
"baseModelType": "<string>",
"mergeAddonModelName": "<string>"
},
"teftDetails": {},
"public": true,
"conversationConfig": {
"style": "<string>",
"system": "<string>",
"template": "<string>"
},
"contextLength": 123,
"supportsImageInput": true,
"supportsTools": true,
"importedFrom": "<string>",
"fineTuningJob": "<string>",
"defaultDraftModel": "<string>",
"defaultDraftTokenCount": 123,
"deployedModelRefs": [
{
"name": "<string>",
"deployment": "<string>",
"state": "STATE_UNSPECIFIED",
"default": true,
"public": true
}
],
"cluster": "<string>",
"deprecationDate": {
"year": 123,
"month": 123,
"day": 123
},
"calibrated": true,
"tunable": true,
"supportsLora": true,
"useHfApplyChatTemplate": true,
"updateTime": "2023-11-07T05:31:56Z",
"defaultSamplingParams": {},
"rlTunable": true,
"supportedPrecisions": [
"PRECISION_UNSPECIFIED"
],
"supportedPrecisionsWithCalibration": [
"PRECISION_UNSPECIFIED"
],
"trainingContextLength": 123,
"snapshotType": "FULL_SNAPSHOT"
}
curl --request POST \
--url https://api.fireworks.ai/v1/accounts/{account_id}/models \
--header 'Authorization: Bearer <token>' \
--header 'Content-Type: application/json' \
--data '
{
"modelId": "<string>",
"model": {
"displayName": "<string>",
"description": "<string>",
"kind": "KIND_UNSPECIFIED",
"githubUrl": "<string>",
"huggingFaceUrl": "<string>",
"baseModelDetails": {
"worldSize": 123,
"checkpointFormat": "CHECKPOINT_FORMAT_UNSPECIFIED",
"parameterCount": "<string>",
"moe": true,
"tunable": true,
"modelType": "<string>",
"supportsFireattention": true,
"supportsMtp": true
},
"peftDetails": {
"baseModel": "<string>",
"r": 123,
"targetModules": [
"<string>"
],
"mergeAddonModelName": "<string>"
},
"teftDetails": {},
"public": true,
"conversationConfig": {
"style": "<string>",
"system": "<string>",
"template": "<string>"
},
"contextLength": 123,
"supportsImageInput": true,
"supportsTools": true,
"defaultDraftModel": "<string>",
"defaultDraftTokenCount": 123,
"deprecationDate": {
"year": 123,
"month": 123,
"day": 123
},
"supportsLora": true,
"useHfApplyChatTemplate": true,
"trainingContextLength": 123,
"snapshotType": "FULL_SNAPSHOT"
},
"cluster": "<string>"
}
'
{
"name": "<string>",
"displayName": "<string>",
"description": "<string>",
"createTime": "2023-11-07T05:31:56Z",
"state": "STATE_UNSPECIFIED",
"status": {
"code": "OK",
"message": "<string>"
},
"kind": "KIND_UNSPECIFIED",
"githubUrl": "<string>",
"huggingFaceUrl": "<string>",
"baseModelDetails": {
"worldSize": 123,
"checkpointFormat": "CHECKPOINT_FORMAT_UNSPECIFIED",
"parameterCount": "<string>",
"moe": true,
"tunable": true,
"modelType": "<string>",
"supportsFireattention": true,
"defaultPrecision": "PRECISION_UNSPECIFIED",
"supportsMtp": true
},
"peftDetails": {
"baseModel": "<string>",
"r": 123,
"targetModules": [
"<string>"
],
"baseModelType": "<string>",
"mergeAddonModelName": "<string>"
},
"teftDetails": {},
"public": true,
"conversationConfig": {
"style": "<string>",
"system": "<string>",
"template": "<string>"
},
"contextLength": 123,
"supportsImageInput": true,
"supportsTools": true,
"importedFrom": "<string>",
"fineTuningJob": "<string>",
"defaultDraftModel": "<string>",
"defaultDraftTokenCount": 123,
"deployedModelRefs": [
{
"name": "<string>",
"deployment": "<string>",
"state": "STATE_UNSPECIFIED",
"default": true,
"public": true
}
],
"cluster": "<string>",
"deprecationDate": {
"year": 123,
"month": 123,
"day": 123
},
"calibrated": true,
"tunable": true,
"supportsLora": true,
"useHfApplyChatTemplate": true,
"updateTime": "2023-11-07T05:31:56Z",
"defaultSamplingParams": {},
"rlTunable": true,
"supportedPrecisions": [
"PRECISION_UNSPECIFIED"
],
"supportedPrecisionsWithCalibration": [
"PRECISION_UNSPECIFIED"
],
"trainingContextLength": 123,
"snapshotType": "FULL_SNAPSHOT"
}
Bearer authentication using your Fireworks API key. Format: Bearer <API_KEY>
The Account Id
A successful response.
Human-readable display name of the model. e.g. "My Model" Must be fewer than 64 characters long.
The description of the model. Must be fewer than 1000 characters long.
The creation time of the model.
The state of the model.
STATE_UNSPECIFIED, UPLOADING, READY
Contains detailed message when the last model operation fails.
Show child attributes
The kind of model. If not specified, the default is HF_PEFT_ADDON.
KIND_UNSPECIFIED, HF_BASE_MODEL, HF_PEFT_ADDON, HF_TEFT_ADDON, FLUMINA_BASE_MODEL, FLUMINA_ADDON, DRAFT_ADDON, FIRE_AGENT, LIVE_MERGE, CUSTOM_MODEL, EMBEDDING_MODEL, SNAPSHOT_MODEL
The URL to the GitHub repository of the model.
The URL to the Hugging Face model.
Base model details. Required if kind is HF_BASE_MODEL. Must not be set otherwise.
Show child attributes
PEFT addon details. Required if kind is HF_PEFT_ADDON or HF_TEFT_ADDON.
Show child attributes
TEFT addon details. Required if kind is HF_TEFT_ADDON. Must not be set otherwise.
If true, the model will be publicly readable.
If set, the Chat Completions API will be enabled for this model.
Show child attributes
The maximum context length supported by the model.
If set, images can be provided as input to the model.
If set, tools (i.e. functions) can be provided as input to the model, and the model may respond with one or more tool calls.
The name of the model from which this was imported. This field is empty if the model was not imported.
If the model was created from a fine-tuning job, this is the fine-tuning job name.
The default draft model to use when creating a deployment. If empty, speculative decoding is disabled by default.
The default draft token count to use when creating a deployment. Must be specified if default_draft_model is specified.
Populated from GetModel API call only.
Show child attributes
The resource name of the BYOC cluster to which this model belongs. e.g. accounts/my-account/clusters/my-cluster. Empty if it belongs to a Fireworks cluster.
If specified, this is the date when the serverless deployment of the model will be taken down.
Show child attributes
If true, the model is calibrated and can be deployed to non-FP16 precisions.
If true, the model can be fine-tuned. The value will be true if the tunable field is true, and the model is validated against the model_type field.
Whether this model supports LoRA.
If true, the model will use the Hugging Face apply_chat_template API to apply the chat template.
The update time for the model.
A json object that contains the default sampling parameters for the model.
Show child attributes
If true, the model is RL tunable.
PRECISION_UNSPECIFIED, FP16, FP8, FP8_MM, FP8_AR, FP8_MM_KV_ATTN, FP8_KV, FP8_MM_V2, FP8_V2, FP8_MM_KV_ATTN_V2, NF4, FP4, BF16, FP4_BLOCKSCALED_MM, FP4_MX_MOE
PRECISION_UNSPECIFIED, FP16, FP8, FP8_MM, FP8_AR, FP8_MM_KV_ATTN, FP8_KV, FP8_MM_V2, FP8_V2, FP8_MM_KV_ATTN_V2, NF4, FP4, BF16, FP4_BLOCKSCALED_MM, FP4_MX_MOE
The maximum context length supported by the model.
FULL_SNAPSHOT, INCREMENTAL_SNAPSHOT
Was this page helpful?