-
Notifications
You must be signed in to change notification settings - Fork 1
Commit
This commit does not belong to any branch on this repository, and may belong to a fork outside of the repository.
* add swagger examples * remove duplicate examples * remove useless import * Upgrade vllm version to 0.4.0.post1 and update prometheus client (#19) * Upgrade vllm version and update prometheus client * Update tests following prometheus client update * update libraries version for mypy * update libraries version for mypy * update libraries version for mypy * update image version for build and test workflows * update image version for build and test workflows * update image version for build and test workflows * update image version for build and test workflows * update image version for build and test workflows * update image version for build and test workflows * update image version for build and test workflows * Remove torch dependencies and update workflow name * Update workflow image * Test by putting the latest release of vllm --------- Co-authored-by: Maxime Fournioux <[email protected]> Co-authored-by: Gautier Solard <[email protected]> * remove useless import * remove duplicate examples * order imports * Add Body to functional * reorder examples and update sampling params * fix mypy errors * fix mypy errors * update MANIFEST.in --------- Co-authored-by: Maxime Fournioux <[email protected]> Co-authored-by: Gautier Solard <[email protected]> Co-authored-by: Marc de Ponnat <[email protected]>
- Loading branch information
1 parent
60dbd81
commit fc12f65
Showing
7 changed files
with
373 additions
and
23 deletions.
There are no files selected for viewing
This file contains bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters
Original file line number | Diff line number | Diff line change |
---|---|---|
@@ -1 +1,3 @@ | ||
include version.txt | ||
include version.txt | ||
include src/happy_vllm/routers/schemas/examples/request.json | ||
include src/happy_vllm/routers/schemas/examples/response.json |
This file contains bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters
This file contains bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters
Original file line number | Diff line number | Diff line change |
---|---|---|
@@ -0,0 +1,123 @@ | ||
{ | ||
"generate": { | ||
"case1": { | ||
"summary": "Case 1", | ||
"description": "This is case 1 description", | ||
"value": { | ||
"prompt": "This is a prompt example", | ||
"sampling_param": "This is a sampling param example" | ||
} | ||
}, | ||
"case2": { | ||
"summary": "Case 2", | ||
"description": "This is case 2 description", | ||
"value": { | ||
"prompt": "This is a second prompt example", | ||
"sampling_param": "This is a second sampling param example" | ||
} | ||
} | ||
}, | ||
"generate_stream": { | ||
"case1": { | ||
"summary": "Case 1", | ||
"description": "This is case 1 description", | ||
"value": { | ||
"prompt": "This is a prompt example", | ||
"sampling_param": "This is a sampling param example" | ||
} | ||
}, | ||
"case2": { | ||
"summary": "Case 2", | ||
"description": "This is case 2 description", | ||
"value": { | ||
"prompt": "This is a second prompt example", | ||
"sampling_param": "This is a second sampling param example" | ||
} | ||
} | ||
}, | ||
"tokenizer": { | ||
"case1": { | ||
"summary": "Case 1", | ||
"description": "This is case 1 description", | ||
"value": { | ||
"text": "This is a text example", | ||
"with_token_str": true, | ||
"vanilla": true | ||
} | ||
}, | ||
"case2": { | ||
"summary": "Case 2", | ||
"description": "This is case 2 description", | ||
"value": { | ||
"text": "This is a second text example", | ||
"with_token_str": false, | ||
"vanilla": false | ||
} | ||
} | ||
}, | ||
"decode": { | ||
"case1": { | ||
"summary": "Case 1", | ||
"description": "This is case 1 description", | ||
"value": { | ||
"token_ids": "This is a token_ids example", | ||
"with_token_str": true, | ||
"vanilla": false | ||
} | ||
}, | ||
"case2": { | ||
"summary": "Case 2", | ||
"description": "This is case 2 description", | ||
"value": { | ||
"token_ids": "This is a second token_ids example", | ||
"with_token_str": false, | ||
"vanilla": true | ||
} | ||
} | ||
}, | ||
"split_text": { | ||
"case1": { | ||
"summary": "Case 1", | ||
"description": "This is case 1 description", | ||
"value": { | ||
"text": "This is a text example", | ||
"num_tokens_in_chunk": 42, | ||
"separators": [ | ||
"," | ||
] | ||
} | ||
}, | ||
"case2": { | ||
"summary": "Case 2", | ||
"description": "This is case 2 description", | ||
"value": { | ||
"text": "This is a second text example", | ||
"num_tokens_in_chunk": 420, | ||
"separators": [ | ||
".", | ||
"!" | ||
] | ||
} | ||
} | ||
}, | ||
"metadata_text": { | ||
"case1": { | ||
"summary": "Case 1", | ||
"description": "This is case 1 description", | ||
"value": { | ||
"text": "This is a text example", | ||
"truncation_side": "This is a truncation_side example", | ||
"max_length": 42 | ||
} | ||
}, | ||
"case2": { | ||
"summary": "Case 2", | ||
"description": "This is case 2 description", | ||
"value": { | ||
"text": "This is a second text example", | ||
"truncation_side": "This is a second truncation_side example", | ||
"max_length": 420 | ||
} | ||
} | ||
} | ||
} |
This file contains bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters
Original file line number | Diff line number | Diff line change |
---|---|---|
@@ -0,0 +1,48 @@ | ||
{ | ||
"generate": { | ||
"responses": ["response example"], | ||
"finish_reasons": ["finish_reason example"], | ||
"prompt": "prompt example" | ||
}, | ||
"generate_stream": { | ||
"responses": ["response example"], | ||
"finish_reasons": ["finish_reason example"], | ||
"prompt": "prompt example" | ||
}, | ||
"tokenizer": { | ||
"tokens_ids": [1,45021,3], | ||
"tokens_nb": 3, | ||
"tokens_str": "tokens_str example" | ||
}, | ||
"decode": { | ||
"decoded_string": "decoded_string example", | ||
"tokens_str": ["decoded", "_string", " example"] | ||
}, | ||
"split_text": { | ||
"split_text": ["split_text example"] | ||
}, | ||
"metadata_text": { | ||
"tokens_nb": 42, | ||
"truncated_text": "truncated_text example" | ||
}, | ||
"liveness": { | ||
"alive": "alive example" | ||
}, | ||
"readiness": { | ||
"ready": "ready example" | ||
}, | ||
"information": { | ||
"application": "application example", | ||
"version": "version example", | ||
"model_name": "model_name example", | ||
"truncation_side": "truncation_side example", | ||
"max_length": 100 | ||
}, | ||
"live_metrics": { | ||
"requests_running": 5, | ||
"requests_swapped": 3, | ||
"requests_pending": 2, | ||
"gpu_cache_usage": 0.24, | ||
"cpu_cache_usage": 0.36 | ||
} | ||
} |
Oops, something went wrong.