Skip to content

Commit

Permalink
Invoke benchmarking in the deploy_and_benchmark process
Browse files: browse the repository at this point in the history.
Signed-off-by: Cathy Zhang <[email protected]>
  • Loading branch information
bjzhjing authored and Cathy Zhang committed Jan 24, 2025
1 parent 216918b commit 2cc560f
Showing 1 changed file with 10 additions and 1 deletion.
11 changes: 10 additions & 1 deletion deploy_and_benchmark.py
Original file line number Diff line number Diff line change
Expand Up @@ -7,6 +7,8 @@
import shutil
import re

from benchmark import run_benchmark

def read_yaml(file_path):
try:
with open(file_path, 'r') as file:
Expand Down Expand Up @@ -220,7 +222,14 @@ def main(yaml_file, target_node=None):
except subprocess.CalledProcessError as e:
print(f"Depoyments status failed with returncode: {e.returncode}")

# TODO: Here is to call benchmark
# Run benchmark
run_benchmark(
benchmark_config=benchmark_config,
chart_name=chart_name,
namespace=namespace,
llm_model=deploy_config.get('services', {}).get('llm', {}).get('model_id', "")
)


except Exception as e:
print(f"Error during {'deployment' if i == 0 else 'update'} for {node} nodes with max_batch_size {max_batch_size}: {str(e)}")
Expand Down

0 comments on commit 2cc560f

Please sign in to comment.