Skip to content

Commit

Permalink
feat: introduce MQAphroditeEngine (#1056)
Browse files Browse the repository at this point in the history
* feat: introduce MQAphroditeEngine

* add `dead_error` property to engine client

* fix model unload endpoint

* add a simple model load endpoint

* take more args in model load field

* take yaml config in model load endpoint

* inline model switching
  • Loading branch information
AlpinDale authored Dec 31, 2024
1 parent 0b5588d commit 9a7d551
Show file tree
Hide file tree
Showing 20 changed files with 1,296 additions and 1,124 deletions.
6 changes: 3 additions & 3 deletions aphrodite/common/envs.py
Original file line number Diff line number Diff line change
Expand Up @@ -54,7 +54,7 @@
APHRODITE_DYNAMIC_ROPE_SCALING: bool = False
APHRODITE_TEST_FORCE_FP8_MARLIN: bool = False
APHRODITE_PLUGINS: Optional[List[str]] = None
APHRODITE_RPC_GET_DATA_TIMEOUT_MS: int = 5000
APHRODITE_RPC_TIMEOUT: int = 5000
APHRODITE_FORCE_SINGLE_USER_PREFIX_CACHE: bool = False
APHRODITE_TEST_DYNAMO_GRAPH_CAPTURE: int = 0
APHRODITE_TEST_DYNAMO_FULLGRAPH_CAPTURE: int = 0
Expand Down Expand Up @@ -383,8 +383,8 @@ def get_default_config_root():

# Timeout in milliseconds (default 5000) for the zmq client to wait for a
# response from the backend server for simple data operations
"APHRODITE_RPC_GET_DATA_TIMEOUT_MS":
lambda: int(os.getenv("APHRODITE_RPC_GET_DATA_TIMEOUT_MS", "5000")),
"APHRODITE_RPC_TIMEOUT":
lambda: int(os.getenv("APHRODITE_RPC_TIMEOUT", "5000")),

# A comma-separated list of plugin names to load.
# If this is not set, all plugins will be loaded.
Expand Down
Loading

0 comments on commit 9a7d551

Please sign in to comment.