diff --git a/OAI/types/model.py b/OAI/types/model.py index a8afa678..5dcf1713 100644 --- a/OAI/types/model.py +++ b/OAI/types/model.py @@ -46,7 +46,9 @@ class DraftModelLoadRequest(BaseModel): draft_model_name: str draft_rope_scale: Optional[float] = 1.0 draft_rope_alpha: Optional[float] = Field( - description="Automatically calculated if not present", default=None + description="Automatically calculated if not present", + default=None, + examples=[1.0], ) @@ -60,15 +62,20 @@ class ModelLoadRequest(BaseModel): max_seq_len: Optional[int] = Field( description="Leave this blank to use the model's base sequence length", default=None, + examples=[4096] ) override_base_seq_len: Optional[int] = Field( description=( "Overrides the model's base sequence length. " "Leave blank if unsure" ), default=None, + examples=[4096] ) gpu_split_auto: Optional[bool] = True - gpu_split: Optional[List[float]] = Field(default_factory=list) + gpu_split: Optional[List[float]] = Field( + default_factory=list, + examples=[[24.0, 20.0]] + ) rope_scale: Optional[float] = Field( description="Automatically pulled from the model's config if not present", default=None,