-
Notifications
You must be signed in to change notification settings - Fork 6
Commit
This commit does not belong to any branch on this repository, and may belong to a fork outside of the repository.
Speed up huggingface integrations&update benchmarks with newest kbnf
- Loading branch information
1 parent
ed43077
commit 3d48a0e
Showing
10 changed files
with
149 additions
and
76 deletions.
There are no files selected for viewing
This file contains bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters
This file contains bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters
Original file line number | Diff line number | Diff line change |
---|---|---|
@@ -1,6 +1,12 @@ | ||
address_json_exllamav2 generated 1937 tokens with 82.8928200006119 tps (with warm up) | ||
address_json_exllamav2 unconstrained generated 2000 tokens with 84.3793451234579 tps | ||
linkedlist_json_exllamav2 generated 558 tokens with 80.73082629409335 tps (with warm up) | ||
linkedlist_json_exllamav2 unconstrained generated 640 tokens with 88.08959849567171 tps | ||
orders_json_exllamav2 generated 2976 tokens with 84.07997233781526 tps (with warm up) | ||
orders_json_exllamav2 unconstrained generated 3200 tokens with 91.83025447237793 tps | ||
llama3_8b_6pw_exl2_address_json_exllamav2 generated 1937 tokens with 81.76457267212113 tps (with warm up) | ||
llama3_8b_6pw_exl2_address_json_exllamav2 unconstrained generated 2000 tokens with 91.93855585432294 tps | ||
llama3_8b_6pw_exl2_linkedlist_json_exllamav2 generated 567 tokens with 73.72004132348941 tps (with warm up) | ||
llama3_8b_6pw_exl2_linkedlist_json_exllamav2 unconstrained generated 640 tokens with 92.92655429712437 tps | ||
llama3_8b_6pw_exl2_orders_json_exllamav2 generated 2976 tokens with 79.10910035605352 tps (with warm up) | ||
llama3_8b_6pw_exl2_orders_json_exllamav2 unconstrained generated 3200 tokens with 93.46945772542723 tps | ||
llama2_7b_4pw_exl2_address_json_exllamav2 generated 2400 tokens with 123.7077165970634 tps (with warm up) | ||
llama2_7b_4pw_exl2_address_json_exllamav2 unconstrained generated 2400 tokens with 133.37570270534903 tps | ||
llama2_7b_4pw_exl2_linkedlist_json_exllamav2 generated 250 tokens with 80.04987619935734 tps (with warm up) | ||
llama2_7b_4pw_exl2_linkedlist_json_exllamav2 unconstrained generated 300 tokens with 132.19982863147897 tps | ||
llama2_7b_4pw_exl2_orders_json_exllamav2 generated 3136 tokens with 117.27953013576354 tps (with warm up) | ||
llama2_7b_4pw_exl2_orders_json_exllamav2 unconstrained generated 3200 tokens with 129.65265959777014 tps |
This file contains bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters
This file contains bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters
This file contains bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters
Original file line number | Diff line number | Diff line change |
---|---|---|
@@ -1,6 +1,12 @@ | ||
address_json generated 803 tokens with 27.73133365441571 tps (with warm up) | ||
address_json unconstrained generated 1000 tokens with 32.06941835850326 tps | ||
linkedlist_json generated 1051 tokens with 26.10733210624505 tps (with warm up) | ||
linkedlist_json unconstrained generated 1225 tokens with 32.128672426385975 tps | ||
order_json generated 3466 tokens with 26.364491518684723 tps (with warm up) | ||
order_json unconstrained generated 3969 tokens with 31.66292436079728 tps | ||
llama3_8b_address_json generated 786 tokens with 37.36371589602811 tps (with warm up) | ||
llama3_8b_address_json unconstrained generated 1000 tokens with 38.69880490679053 tps | ||
llama3_8b_linkedlist_json generated 887 tokens with 37.120954838498776 tps (with warm up) | ||
llama3_8b_linkedlist_json unconstrained generated 1236 tokens with 38.697844784161475 tps | ||
llama3_8b_order_json generated 3505 tokens with 36.78628437278762 tps (with warm up) | ||
llama3_8b_order_json unconstrained generated 3969 tokens with 38.14263146423028 tps | ||
llama2_7b_address_json generated 984 tokens with 41.33470448687917 tps (with warm up) | ||
llama2_7b_address_json unconstrained generated 1000 tokens with 42.21328193562087 tps | ||
llama2_7b_linkedlist_json generated 3068 tokens with 41.05214473703741 tps (with warm up) | ||
llama2_7b_linkedlist_json unconstrained generated 4000 tokens with 42.01075161949615 tps | ||
llama2_7b_order_json generated 3987 tokens with 39.76025691683701 tps (with warm up) | ||
llama2_7b_order_json unconstrained generated 4000 tokens with 40.5808187425456 tps |
This file contains bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters
Original file line number | Diff line number | Diff line change |
---|---|---|
|
@@ -3,7 +3,7 @@ requires = ["setuptools>=61.0"] | |
build-backend = "setuptools.build_meta" | ||
[project] | ||
name = "formatron" | ||
version = "0.1.3" | ||
version = "0.2.0" | ||
authors = [ | ||
{name = "Xintong Sun", email = "[email protected]"}, | ||
] | ||
|
This file contains bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters
This file contains bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters
Oops, something went wrong.