Skip to content

Commit

Permalink
server: bench: init
Browse files: browse the repository at this point in the history
  • Loading branch information
phymbert committed Mar 25, 2024
1 parent 117ad4f commit 4b3dfc8
Show file tree
Hide file tree
Showing 2 changed files with 2 additions and 14 deletions.
1 change: 0 additions & 1 deletion .github/workflows/bench.yml
Original file line number Diff line number Diff line change
Expand Up @@ -30,7 +30,6 @@ concurrency:
group: ${{ github.workflow }}-${{ github.ref }}
cancel-in-progress: true


jobs:
bench-server-baseline:
runs-on: Standard_NC4as_T4_v3
Expand Down
15 changes: 2 additions & 13 deletions examples/server/bench/bench.py
Original file line number Diff line number Diff line change
Expand Up @@ -160,34 +160,23 @@ def main(args_in: list[str] | None = None) -> None:
# </detail>
# """

# 140 chars max for commit status description
bench_results = {
"req": {
"p90": data['metrics']["http_req_duration"]["p(90)"],
"p95": data['metrics']["http_req_duration"]["p(95)"],
"avg": data['metrics']["http_req_duration"]["avg"],
"min": data['metrics']["http_req_duration"]["min"],
"med": data['metrics']["http_req_duration"]["med"],
"max": data['metrics']["http_req_duration"]["max"]
},
"pp": {
"p90": data['metrics']["llamacpp_prompt_tokens"]["p(90)"],
"p95": data['metrics']["llamacpp_prompt_tokens"]["p(95)"],
"avg": data['metrics']["llamacpp_prompt_tokens"]["avg"],
"min": data['metrics']["llamacpp_prompt_tokens"]["min"],
"med": data['metrics']["llamacpp_prompt_tokens"]["med"],
"max": data['metrics']["llamacpp_prompt_tokens"]["max"]
},
"tg": {
"p90": data['metrics']["llamacpp_tokens_second"]["p(90)"],
"p95": data['metrics']["llamacpp_tokens_second"]["p(95)"],
"avg": data['metrics']["llamacpp_tokens_second"]["avg"],
"min": data['metrics']["llamacpp_tokens_second"]["min"],
"med": data['metrics']["llamacpp_tokens_second"]["med"],
"max": data['metrics']["llamacpp_tokens_second"]["max"]
},
}
with open("results.github.env", 'a') as github_env:
github_env.write(f"BENCH_RESULTS='{json.dumps(bench_results, indent=None, separators=(',', ':') )}'")
github_env.write(f"BENCH_RESULTS={json.dumps(bench_results, indent=None, separators=(',', ':') )}")


def start_benchmark(args):
Expand Down

0 comments on commit 4b3dfc8

Please sign in to comment.