You signed in with another tab or window. Reload to refresh your session.You signed out in another tab or window. Reload to refresh your session.You switched accounts on another tab or window. Reload to refresh your session.Dismiss alert
Copy file name to clipboardExpand all lines: ChatQnA/benchmark/performance/kubernetes/intel/gaudi/benchmark.yaml
+3-5Lines changed: 3 additions & 5 deletions
Original file line number
Diff line number
Diff line change
@@ -17,14 +17,12 @@ test_suite_config: # Overall configuration settings for the test suite
17
17
llm_model: "Intel/neural-chat-7b-v3-3" # The LLM model used for the test
18
18
test_output_dir: "${TEST_OUTPUT_DIR}" # The directory to store the test output
19
19
load_shape: # Tenant concurrency pattern
20
-
name: constant # poisson or constant(locust default load shape)
20
+
name: ${LOAD_SHAPE} # poisson or constant(locust default load shape)
21
21
params: # Loadshape-specific parameters
22
22
constant: # Constant load shape specific parameters, activate only if load_shape.name is constant
23
-
concurrent_level: 5 # If user_queries is specified, concurrent_level is target number of requests per user. If not, it is the number of simulated users
24
-
# arrival_rate: 1.0 # Request arrival rate. If set, concurrent_level will be overridden, constant load will be generated based on arrival-rate
23
+
concurrent_level: ${CONCURRENT_LEVEL} # If user_queries is specified, concurrent_level is target number of requests per user. If not, it is the number of simulated users
25
24
poisson: # Poisson load shape specific parameters, activate only if load_shape.name is poisson
0 commit comments