forked from openshift-psap/llm-load-test
-
Notifications
You must be signed in to change notification settings - Fork 0
/
Copy pathload_test.py
executable file
·152 lines (118 loc) · 4.73 KB
/
load_test.py
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
129
130
131
132
133
134
135
136
137
138
139
140
141
142
143
144
145
146
147
148
149
150
151
152
"""Main llm-load-test CLI entrypoint."""
import logging
import logging.handlers
import multiprocessing as mp
import queue
import sys
import time

from user import User
from dataset import Dataset
import logging_utils
import utils
def run_main_process(concurrency, duration, dataset, dataset_q, stop_q):
    """Keep the dataset queue supplied for ``duration`` seconds, then stop.

    The queue is pre-filled, topped up while the timer runs, and finally
    drained after the stop signal has been posted.

    Args:
        concurrency: Sizes the initial fill (``2 * concurrency``), the refill
            threshold and each refill batch.
        duration: Number of seconds to keep refilling the dataset queue.
        dataset: Object exposing ``get_next_n_queries(n)``, whose result is
            iterated and enqueued item by item.
        dataset_q: Queue that receives the queries.
        stop_q: Queue that receives a single ``None`` when the timer ends.
    """
    logging.info("Test from main process")

    # Initialize the dataset queue with 2*concurrency requests
    for query in dataset.get_next_n_queries(2 * concurrency):
        dataset_q.put(query)

    start_time = time.time()
    current_time = start_time
    while (current_time - start_time) < duration:
        # Keep the dataset queue full for duration
        if dataset_q.qsize() < int(0.5 * concurrency + 1):
            logging.info("Adding %d entries to dataset queue", concurrency)
            for query in dataset.get_next_n_queries(concurrency):
                dataset_q.put(query)
        time.sleep(0.1)
        current_time = time.time()

    logging.info("Timer ended, stopping processes")

    # Signal users to stop sending requests
    stop_q.put(None)

    # Empty the dataset queue. A non-blocking get is used on purpose: an
    # empty() check followed by a blocking get() would hang forever if a
    # consumer took the last element between the two calls.
    while True:
        try:
            dataset_q.get_nowait()
        except queue.Empty:
            break
        logging.debug("Removing element from dataset_q")
def gather_results(results_pipes):
    """Collect the results sent over every pipe into one flat list.

    Each pipe in ``results_pipes`` is read exactly once with ``recv()``, in
    the order given, and the items of every received batch are concatenated.

    Args:
        results_pipes: Iterable of objects exposing ``recv()``; each call is
            expected to return an iterable of results.

    Returns:
        A list holding the items of all received batches, in pipe order.
    """
    logging.debug("Receiving results from user processes")
    # recv() blocks until the corresponding sender has delivered its batch
    return [
        result
        for pipe in results_pipes
        for result in pipe.recv()
    ]
def exit_gracefully(procs, dataset_q, stop_q, logger_q, log_reader_thread, code):
    """Stop the users, drain the dataset queue, join everything and exit.

    Args:
        procs: Iterable of objects exposing ``join()``; each one is joined.
        dataset_q: Queue to drain before joining, or ``None`` to skip that.
        stop_q: Queue that gets a ``None`` stop signal if it is empty.
        logger_q: Queue that receives ``None`` before the log reader thread
            is joined.
        log_reader_thread: Object exposing ``join()``, joined last.
        code: Exit status handed to ``sys.exit``.

    Raises:
        SystemExit: Always, carrying ``code``.
    """
    # Signal users to stop sending requests
    if stop_q.empty():
        try:
            # Non-blocking on purpose: empty() is only a snapshot, and a
            # blocking put() on a bounded queue that filled up in the
            # meantime would hang the shutdown.
            stop_q.put_nowait(None)
        except queue.Full:
            # A stop signal is already queued; nothing left to do.
            pass

    if dataset_q is not None and not dataset_q.empty():
        logging.warning("Removing more elements from dataset_q after gathering results!")
        # Drain without blocking: another consumer may take the last element
        # between an empty() check and a blocking get().
        while True:
            try:
                dataset_q.get_nowait()
            except queue.Empty:
                break

    logging.debug("Calling join() on all user processes")
    for proc in procs:
        proc.join()
    logging.info("User processes terminated succesfully")

    # Shutdown logger thread
    logger_q.put(None)
    log_reader_thread.join()

    sys.exit(code)
def main(args):
    """Load test CLI entrypoint.

    Parses the command line and the YAML config, creates one ``User`` and one
    spawned process per unit of concurrency, runs the timed main loop,
    gathers the results and writes the output. Every path ends in
    ``exit_gracefully``, which exits the interpreter.

    Args:
        args: Command-line arguments, without the program name.

    Raises:
        SystemExit: Always, via ``exit_gracefully``. The code is 0 on
            success, 1 on invalid input or an unexpected error, and 130 on
            a keyboard interrupt.
    """
    args = utils.parse_args(args)

    mp_ctx = mp.get_context("spawn")
    logger_q = mp_ctx.Queue()
    log_reader_thread = logging_utils.init_logging(args.log_level, logger_q)

    # Create processes and their Users
    stop_q = mp_ctx.Queue(1)
    dataset_q = mp_ctx.Queue()
    procs = []
    results_pipes = []

    # Parse config
    logging.debug("Parsing YAML config file %s", args.config)
    concurrency, duration, plugin = 0, 0, None
    try:
        config = utils.yaml_load(args.config)
        concurrency, duration, plugin = utils.parse_config(config)
    except Exception as e:
        logging.error("Exiting due to invalid input: %s", repr(e))
        exit_gracefully(procs, dataset_q, stop_q, logger_q, log_reader_thread, 1)

    try:
        logging.debug("Creating dataset with configuration %s", config["dataset"])
        # Get model_name if set for prompt formatting
        model_name = config.get("plugin_options", {}).get("model_name", "")
        dataset = Dataset(model_name=model_name, **config["dataset"])

        logging.debug("Creating %s Users and corresponding processes", concurrency)
        for idx in range(concurrency):
            send_results, recv_results = mp_ctx.Pipe()
            user = User(
                idx,
                dataset_q=dataset_q,
                stop_q=stop_q,
                results_pipe=send_results,
                plugin=plugin,
                logger_q=logger_q,
                log_level=args.log_level,
                run_duration=duration,
            )
            proc = mp_ctx.Process(target=user.run_user_process)
            logging.info("Starting %s", proc)
            proc.start()
            # Register the process only once it has started: if start()
            # raises, the cleanup path must not join() a process that was
            # never started, which would fail and mask the original error.
            procs.append(proc)
            results_pipes.append(recv_results)

        logging.debug("Running main process")
        run_main_process(concurrency, duration, dataset, dataset_q, stop_q)

        results_list = gather_results(results_pipes)

        utils.write_output(config, results_list)

    # Terminate queues immediately on ^C
    except KeyboardInterrupt:
        stop_q.cancel_join_thread()
        dataset_q.cancel_join_thread()
        exit_gracefully(procs, dataset_q, stop_q, logger_q, log_reader_thread, 130)
    except Exception:
        logging.exception("Unexpected exception in main process")
        exit_gracefully(procs, dataset_q, stop_q, logger_q, log_reader_thread, 1)

    exit_gracefully(procs, dataset_q, stop_q, logger_q, log_reader_thread, 0)
# Script entry point: hand everything after the program name to main().
if __name__ == "__main__":
    cli_args = sys.argv[1:]
    main(cli_args)