Skip to content
Closed
Show file tree
Hide file tree
Changes from 6 commits
Commits
File filter

Filter by extension

Filter by extension

Conversations
Failed to load comments.
Loading
Jump to
Jump to file
Failed to load files.
Loading
Diff view
Diff view
4 changes: 2 additions & 2 deletions src/guidellm/__init__.py
Original file line number Diff line number Diff line change
Expand Up @@ -20,7 +20,8 @@
hf_logging.set_verbosity_error()
logging.getLogger("transformers").setLevel(logging.ERROR)

from .config import (
from .logger import configure_logger, logger
from .settings import (
DatasetSettings,
Environment,
LoggingSettings,
Expand All @@ -30,7 +31,6 @@
reload_settings,
settings,
)
from .logger import configure_logger, logger

__all__ = [
"DatasetSettings",
Expand Down
2 changes: 1 addition & 1 deletion src/guidellm/__main__.py
Original file line number Diff line number Diff line change
Expand Up @@ -13,9 +13,9 @@
)
from guidellm.benchmark.entrypoints import benchmark_with_scenario
from guidellm.benchmark.scenario import GenerativeTextScenario, get_builtin_scenarios
from guidellm.config import print_config
from guidellm.preprocess.dataset import ShortPromptStrategy, process_dataset
from guidellm.scheduler import StrategyType
from guidellm.settings import print_config
from guidellm.utils import DefaultGroupHandler
from guidellm.utils import cli as cli_tools

Expand Down
2 changes: 1 addition & 1 deletion src/guidellm/backend/backend.py
Original file line number Diff line number Diff line change
Expand Up @@ -7,7 +7,7 @@
from PIL import Image

from guidellm.backend.response import ResponseSummary, StreamingTextResponse
from guidellm.config import settings
from guidellm.settings import settings

__all__ = [
"Backend",
Expand Down
2 changes: 1 addition & 1 deletion src/guidellm/backend/openai.py
Original file line number Diff line number Diff line change
Expand Up @@ -16,7 +16,7 @@
ResponseSummary,
StreamingTextResponse,
)
from guidellm.config import settings
from guidellm.settings import settings

__all__ = [
"CHAT_COMPLETIONS",
Expand Down
2 changes: 1 addition & 1 deletion src/guidellm/backend/response.py
Original file line number Diff line number Diff line change
Expand Up @@ -2,7 +2,7 @@

from pydantic import computed_field

from guidellm.config import settings
from guidellm.settings import settings
from guidellm.utils import StandardBaseModel

__all__ = [
Expand Down
2 changes: 1 addition & 1 deletion src/guidellm/benchmark/aggregator.py
Original file line number Diff line number Diff line change
Expand Up @@ -21,7 +21,6 @@
GenerativeTextErrorStats,
GenerativeTextResponseStats,
)
from guidellm.config import settings
from guidellm.request import (
GenerationRequest,
GenerativeRequestLoaderDescription,
Expand All @@ -34,6 +33,7 @@
SchedulerRequestResult,
WorkerDescription,
)
from guidellm.settings import settings
from guidellm.utils import (
RunningStats,
StandardBaseModel,
Expand Down
2 changes: 1 addition & 1 deletion src/guidellm/benchmark/output.py
Original file line number Diff line number Diff line change
Expand Up @@ -20,10 +20,10 @@
SweepProfile,
ThroughputProfile,
)
from guidellm.config import settings
from guidellm.presentation import UIDataBuilder
from guidellm.presentation.injector import create_report
from guidellm.scheduler import strategy_display_str
from guidellm.settings import settings
from guidellm.utils import (
Colors,
DistributionSummary,
Expand Down
2 changes: 1 addition & 1 deletion src/guidellm/benchmark/profile.py
Original file line number Diff line number Diff line change
Expand Up @@ -4,7 +4,6 @@
import numpy as np
from pydantic import Field, computed_field

from guidellm.config import settings
from guidellm.scheduler import (
AsyncConstantStrategy,
AsyncPoissonStrategy,
Expand All @@ -14,6 +13,7 @@
SynchronousStrategy,
ThroughputStrategy,
)
from guidellm.settings import settings
from guidellm.utils import StandardBaseModel

__all__ = [
Expand Down
2 changes: 1 addition & 1 deletion src/guidellm/logger.py
Original file line number Diff line number Diff line change
Expand Up @@ -41,7 +41,7 @@

from loguru import logger

from guidellm.config import LoggingSettings, settings
from guidellm.settings import LoggingSettings, settings

__all__ = ["configure_logger", "logger"]

Expand Down
2 changes: 1 addition & 1 deletion src/guidellm/presentation/injector.py
Original file line number Diff line number Diff line change
Expand Up @@ -4,7 +4,7 @@

from loguru import logger

from guidellm.config import settings
from guidellm.settings import settings
from guidellm.utils.text import load_text


Expand Down
2 changes: 1 addition & 1 deletion src/guidellm/request/loader.py
Original file line number Diff line number Diff line change
Expand Up @@ -11,9 +11,9 @@
from datasets import Dataset, DatasetDict, IterableDataset, IterableDatasetDict
from transformers import PreTrainedTokenizerBase # type: ignore[import]

from guidellm.config import settings
from guidellm.dataset import ColumnInputTypes, load_dataset
from guidellm.request.request import GenerationRequest
from guidellm.settings import settings
from guidellm.utils import StandardBaseModel

__all__ = [
Expand Down
71 changes: 59 additions & 12 deletions src/guidellm/scheduler/__init__.py
Original file line number Diff line number Diff line change
@@ -1,21 +1,46 @@
from .result import (
SchedulerRequestInfo,
SchedulerRequestResult,
SchedulerResult,
SchedulerRunInfo,
from .constraints import (
Constraint,
ConstraintInitializer,
ConstraintsInitializerFactory,
MaxDurationConstraint,
MaxErrorRateConstraint,
MaxErrorsConstraint,
MaxGlobalErrorRateConstraint,
MaxNumberConstraint,
PydanticConstraintInitializer,
SerializableConstraintInitializer,
UnserializableConstraintInitializer,
)
from .objects import (
BackendInterface,
BackendT,
MeasuredRequestTimings,
MeasuredRequestTimingsT,
MultiTurnRequestT,
RequestSchedulerTimings,
RequestT,
ResponseT,
ScheduledRequestInfo,
SchedulerState,
SchedulerUpdateAction,
SchedulerUpdateActionProgress,
)
from .scheduler import Scheduler
from .strategy import (
AsyncConstantStrategy,
AsyncPoissonStrategy,
ConcurrentStrategy,
ConstantRateRequestTimings,
LastCompletionRequestTimings,
NoDelayRequestTimings,
PoissonRateRequestTimings,
ScheduledRequestTimings,
SchedulingStrategy,
StrategyT,
StrategyType,
SynchronousStrategy,
ThroughputStrategy,
strategy_display_str,
)
from .types import RequestT, ResponseT
from .worker import (
GenerativeRequestsWorker,
GenerativeRequestsWorkerDescription,
Expand All @@ -29,24 +54,46 @@
__all__ = [
"AsyncConstantStrategy",
"AsyncPoissonStrategy",
"BackendInterface",
"BackendT",
"ConcurrentStrategy",
"ConstantRateRequestTimings",
"Constraint",
"ConstraintInitializer",
"ConstraintsInitializerFactory",
"GenerativeRequestsWorker",
"GenerativeRequestsWorkerDescription",
"LastCompletionRequestTimings",
"MaxDurationConstraint",
"MaxErrorRateConstraint",
"MaxErrorsConstraint",
"MaxGlobalErrorRateConstraint",
"MaxNumberConstraint",
"MeasuredRequestTimings",
"MeasuredRequestTimingsT",
"MultiTurnRequestT",
"NoDelayRequestTimings",
"PoissonRateRequestTimings",
"PydanticConstraintInitializer",
"RequestSchedulerTimings",
"RequestT",
"RequestsWorker",
"ResolveStatus",
"ResponseT",
"ScheduledRequestInfo",
"ScheduledRequestTimings",
"Scheduler",
"SchedulerRequestInfo",
"SchedulerRequestResult",
"SchedulerResult",
"SchedulerRunInfo",
"SchedulerState",
"SchedulerUpdateAction",
"SchedulerUpdateActionProgress",
"SchedulingStrategy",
"SerializableConstraintInitializer",
"StrategyT",
"StrategyType",
"SynchronousStrategy",
"ThroughputStrategy",
"UnserializableConstraintInitializer",
"WorkerDescription",
"WorkerProcessRequest",
"WorkerProcessResult",
"strategy_display_str",
]
Loading
Loading