Skip to content

Commit d0adb57

Browse files
Merge pull request #183 from togethercomputer/nikita/vlm_support
Support VLM finetuning
2 parents d38cbd6 + 5a74295 commit d0adb57

File tree

1 file changed

+13
-0
lines changed

1 file changed

+13
-0
lines changed

openapi.yaml

Lines changed: 13 additions & 0 deletions
Original file line number | Diff line number | Diff line change
@@ -1684,6 +1684,8 @@ paths:
16841684
oneOf:
16851685
- $ref: '#/components/schemas/FullTrainingType'
16861686
- $ref: '#/components/schemas/LoRATrainingType'
1687+
multimodal_params:
1688+
$ref: '#/components/schemas/MultimodalParams'
16871689
from_checkpoint:
16881690
type: string
16891691
description: The checkpoint identifier to continue training from a previous fine-tuning job. Format is `{$JOB_ID}` or `{$OUTPUT_MODEL_NAME}` or `{$JOB_ID}:{$STEP}` or `{$OUTPUT_MODEL_NAME}:{$STEP}`. The step value is optional; without it, the final checkpoint will be used.
@@ -1823,6 +1825,8 @@ paths:
18231825
oneOf:
18241826
- $ref: '#/components/schemas/FullTrainingType'
18251827
- $ref: '#/components/schemas/LoRATrainingType'
1828+
multimodal_params:
1829+
$ref: '#/components/schemas/MultimodalParams'
18261830
from_checkpoint:
18271831
type: string
18281832
description: The checkpoint identifier to continue training from a previous fine-tuning job. Format is `{$JOB_ID}` or `{$OUTPUT_MODEL_NAME}` or `{$JOB_ID}:{$STEP}` or `{$OUTPUT_MODEL_NAME}:{$STEP}`. The step value is optional; without it, the final checkpoint will be used.
@@ -7436,6 +7440,8 @@ components:
74367440
oneOf:
74377441
- $ref: '#/components/schemas/FullTrainingType'
74387442
- $ref: '#/components/schemas/LoRATrainingType'
7443+
multimodal_params:
7444+
$ref: '#/components/schemas/MultimodalParams'
74397445
status:
74407446
$ref: '#/components/schemas/FinetuneJobStatus'
74417447
job_id:
@@ -7832,6 +7838,13 @@ components:
78327838
required:
78337839
- method
78347840

7841+
MultimodalParams:
7842+
type: object
7843+
properties:
7844+
train_vision:
7845+
type: boolean
7846+
description: Whether to train the vision encoder of the model. Only available for multimodal models.
7847+
78357848
LRScheduler:
78367849
type: object
78377850
properties:

0 commit comments

Comments
 (0)