Skip to content

Commit 96112a8

Browse files
committed
add code doc
1 parent 1548729 commit 96112a8

File tree

1 file changed

+11
-0
lines changed

1 file changed

+11
-0
lines changed

src/twinkle/server/twinkle/model.py

Lines changed: 11 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -189,6 +189,17 @@ def __init__(self, nproc_per_node: int, device_group: Dict[str, Any], device_mes
189189

190190
@serve.multiplexed(max_num_models_per_replica=kwargs.get('max_loras', 5))
191191
async def get_multiplexed_adapter(self, request_id: str):
192+
"""
193+
Reference docs:
194+
1. https://docs.ray.io/en/latest/serve/model-multiplexing.html
195+
2. https://docs.ray.io/en/latest/serve/llm/architecture/routing-policies.html
196+
3. https://github.com/ray-project/ray/pull/56855/changes
197+
Args:
198+
request_id: Value supplied by the caller; this method returns it unchanged.
199+
200+
Returns:
201+
The ``request_id`` argument, unchanged.
202+
"""
192203
return request_id
193204

194205
def _on_adapter_expired(self, adapter_name: str) -> None:

0 commit comments

Comments
 (0)