Skip to content
Open
Changes from all commits
Commits
File filter

Filter by extension

Filter by extension

Conversations
Failed to load comments.
Loading
Jump to
Jump to file
Failed to load files.
Loading
Diff view
Diff view
11 changes: 11 additions & 0 deletions llm_bench/load_test.py
Original file line number Diff line number Diff line change
Expand Up @@ -9,6 +9,7 @@
import traceback
from typing import Optional
from locust import HttpUser, task, events, constant_pacing
from urllib3 import PoolManager
import copy
import json
import time
Expand Down Expand Up @@ -519,6 +520,7 @@ def _load_curl_like_data(text):

class LLMUser(HttpUser):
# no wait time, so every user creates a continuous load, sending requests as quickly as possible
pool_manager = PoolManager(maxsize=50, block=True)

def on_start(self):
try:
Expand Down Expand Up @@ -986,6 +988,15 @@ def init_parser(parser):
type=int,
help="How many sequences to generate (makes sense to use with non-zero temperature).",
)
# DEBUG (begin): temporary verbose logging, apparently added to inspect HTTP
# connection activity while testing the connection-pool change.
# NOTE(review): this raises the root logger to DEBUG for the whole process,
# which will be very noisy under load — presumably to be removed before merge; confirm.
import logging
# NOTE(review): HTTPConnection is not referenced in the lines visible here.
# Snippets like this usually also set HTTPConnection.debuglevel — confirm
# whether that was intended or whether this import can be dropped.
from http.client import HTTPConnection
# Install a default handler on the root logger (no-op if one is already configured).
logging.basicConfig()
# Allow DEBUG records through the root logger.
logging.getLogger().setLevel(logging.DEBUG)
# NOTE(review): "requests.packages.urllib3" is the logger name used when urllib3
# is reached through the requests vendoring alias; standalone urllib3 logs under
# "urllib3". Verify this name matches the library actually emitting the logs.
requests_log = logging.getLogger("requests.packages.urllib3")
requests_log.setLevel(logging.DEBUG)
# Forward records to ancestor loggers' handlers (True is already the default).
requests_log.propagate = True
# DEBUG (end)

@events.quitting.add_listener
def _(environment, **kw):
Expand Down