diff --git a/presets/models/mistral/model.go b/presets/models/mistral/model.go index 3f1d79d15..15561bc39 100644 --- a/presets/models/mistral/model.go +++ b/presets/models/mistral/model.go @@ -23,12 +23,12 @@ func init() { } var ( - PresetMistral7BModel = "mistral-7b" - PresetMistral7BInstructModel = PresetMistral7BModel + "-instruct" + PresetMistral7BModel = "mistral-7b" + PresetMistral7BInstructModel = PresetMistral7BModel + "-instruct" PresetMistralTagMap = map[string]string{ - "Mistral7B": "0.0.2", - "Mistral7BInstruct": "0.0.2", + "Mistral7B": "0.0.2", + "Mistral7BInstruct": "0.0.2", } baseCommandPresetMistral = "accelerate launch" @@ -46,7 +46,7 @@ func (*mistral7b) GetInferenceParameters() *model.PresetInferenceParam { return &model.PresetInferenceParam{ ModelFamilyName: "Mistral", ImageAccessMode: string(kaitov1alpha1.ModelImageAccessModePublic), - DiskStorageRequirement: "50Gi", + DiskStorageRequirement: "100Gi", GPUCountRequirement: "1", TotalGPUMemoryRequirement: "14Gi", PerGPUMemoryRequirement: "0Gi", // We run Mistral using native vertical model parallel, no per GPU memory requirement. diff --git a/presets/models/phi/model.go b/presets/models/phi/model.go index e819256b6..deae78df5 100644 --- a/presets/models/phi/model.go +++ b/presets/models/phi/model.go @@ -19,10 +19,10 @@ func init() { } var ( - PresetPhi2Model = "phi-2" + PresetPhi2Model = "phi-2" PresetPhiTagMap = map[string]string{ - "Phi2": "0.0.1", + "Phi2": "0.0.1", } baseCommandPresetPhi = "accelerate launch" @@ -40,7 +40,7 @@ func (*phi2) GetInferenceParameters() *model.PresetInferenceParam { return &model.PresetInferenceParam{ ModelFamilyName: "Phi", ImageAccessMode: string(kaitov1alpha1.ModelImageAccessModePublic), - DiskStorageRequirement: "30Gi", + DiskStorageRequirement: "50Gi", GPUCountRequirement: "1", TotalGPUMemoryRequirement: "12Gi", PerGPUMemoryRequirement: "0Gi", // We run Phi using native vertical model parallel, no per GPU memory requirement.