Skip to content
Merged
Show file tree
Hide file tree
Changes from all commits
Commits
File filter

Filter by extension

Filter by extension


Conversations
Failed to load comments.
Loading
Jump to
Jump to file
Failed to load files.
Loading
Diff view
Diff view
112 changes: 112 additions & 0 deletions examples/daytona_repl_example.py
Original file line number Diff line number Diff line change
@@ -0,0 +1,112 @@
"""
Example usage of Daytona REPL with code execution and LLM queries.

Run with: python -m examples.daytona_repl_example
"""

from rlm.clients.base_lm import BaseLM
from rlm.core.lm_handler import LMHandler
from rlm.core.types import ModelUsageSummary, UsageSummary
from rlm.environments.daytona_repl import DaytonaREPL


class MockLM(BaseLM):
    """Simple mock LM that echoes prompts.

    Implements the BaseLM interface with canned responses and fixed usage
    numbers so the example can run without a real provider or API key.
    """

    def __init__(self):
        super().__init__(model_name="mock-model")

    def completion(self, prompt):
        """Return a canned response echoing the first 50 chars of the prompt."""
        return f"Mock response to: {prompt[:50]}"

    async def acompletion(self, prompt):
        """Async variant; delegates to the synchronous implementation."""
        return self.completion(prompt)

    def get_usage_summary(self):
        """Return a fixed aggregate usage summary keyed by model name."""
        return UsageSummary(
            model_usage_summaries={
                "mock-model": ModelUsageSummary(
                    total_calls=1, total_input_tokens=10, total_output_tokens=10
                )
            }
        )

    def get_last_usage(self):
        """Return usage for the most recent call as a ModelUsageSummary.

        BaseLM.get_last_usage is declared to return ModelUsageSummary (not
        UsageSummary), and LMHandler wraps this value in a UsageSummary
        itself — returning ``self.get_usage_summary()`` here (as before)
        would nest the types incorrectly when routed through the handler.
        """
        return ModelUsageSummary(
            total_calls=1, total_input_tokens=10, total_output_tokens=10
        )


def main():
    """Walk through DaytonaREPL usage: plain execution, then LLM-backed queries."""
    banner = "=" * 60
    rule = "-" * 40

    print(banner)
    print("Daytona REPL Example")
    print(banner)

    # Note: Requires DAYTONA_API_KEY environment variable to be set
    # or passed explicitly to DaytonaREPL(api_key="...")

    # Example 1: Basic code execution
    print("\n[1] Basic code execution (no LLM handler)")
    print(rule)

    try:
        with DaytonaREPL(name="rlm-example") as sandbox:
            print(f"Daytona sandbox started with ID: {sandbox.sandbox.id}")

            outcome = sandbox.execute_code("x = 1 + 2")
            print("Executed: x = 1 + 2")
            print(f"Locals: {outcome.locals}")

            outcome = sandbox.execute_code("print(x * 2)")
            print("Executed: print(x * 2)")
            print(f"Stdout: {outcome.stdout.strip()}")

            # Variables persist across execute_code calls within one sandbox.
            sandbox.execute_code("answer = 42")
            outcome = sandbox.execute_code('print(FINAL_VAR("answer"))')
            print(f"FINAL_VAR('answer'): {outcome.stdout.strip()}")

        # Example 2: With LLM handler
        print("\n[2] Code execution with LLM handler")
        print(rule)

        client = MockLM()

        with LMHandler(client=client) as handler:
            print(f"LM Handler started at {handler.address}")

            with DaytonaREPL(
                name="rlm-example-handler",
                lm_handler_address=handler.address,
            ) as sandbox:
                print(f"Daytona sandbox started with ID: {sandbox.sandbox.id}")
                print(f"Broker URL: {sandbox.broker_url}")

                # Single LLM query routed through the handler
                outcome = sandbox.execute_code(
                    'response = llm_query("What is 2+2?")'
                )
                print("Executed: response = llm_query('What is 2+2?')")
                if outcome.stderr:
                    print(f"Stderr: {outcome.stderr}")

                outcome = sandbox.execute_code("print(response)")
                print(f"Response: {outcome.stdout.strip()}")

                # Batched LLM query
                outcome = sandbox.execute_code(
                    'responses = llm_query_batched(["Question 1", "Question 2", "Question 3"])'
                )
                print("\nExecuted: responses = llm_query_batched([...])")

                outcome = sandbox.execute_code(
                    "print(f'Got {len(responses)} responses')"
                )
                print(f"Result: {outcome.stdout.strip()}")

                outcome = sandbox.execute_code("print(responses[0])")
                print(f"First response: {outcome.stdout.strip()}")

    except Exception as e:
        # Expected when Daytona is not configured; print guidance, don't crash.
        print(f"Error: {e}")
        print("\nMake sure Daytona is configured correctly and DAYTONA_API_KEY is set.")

    print("\n" + banner)
    print("Done!")
    print(banner)


# Allow running the example directly as a script.
if __name__ == "__main__":
    main()
4 changes: 2 additions & 2 deletions examples/quickstart.py
Original file line number Diff line number Diff line change
Expand Up @@ -13,13 +13,13 @@
backend_kwargs={
"model_name": "gpt-5-nano",
},
environment="local",
environment="docker",
environment_kwargs={},
max_depth=1,
logger=logger,
verbose=True, # For printing to console with rich, disabled by default.
)

result = rlm.completion("Print me the first 100 powers of two, each on a newline.")
result = rlm.completion("Print me the first 5 powers of two, each on a newline.")

print(result)
1 change: 1 addition & 0 deletions pyproject.toml
Original file line number Diff line number Diff line change
Expand Up @@ -21,6 +21,7 @@ dependencies = [

[project.optional-dependencies]
modal = ["modal>=0.73.0", "dill>=0.3.7"]
daytona = ["daytona>=0.128.1", "dill>=0.3.7"]
prime = ["prime-sandboxes>=0.2.0", "dill>=0.3.7"]

[build-system]
Expand Down
4 changes: 2 additions & 2 deletions rlm/clients/base_lm.py
Original file line number Diff line number Diff line change
@@ -1,7 +1,7 @@
from abc import ABC, abstractmethod
from typing import Any

from rlm.core.types import UsageSummary
from rlm.core.types import ModelUsageSummary, UsageSummary


class BaseLM(ABC):
Expand All @@ -28,7 +28,7 @@ def get_usage_summary(self) -> UsageSummary:
raise NotImplementedError

@abstractmethod
def get_last_usage(self) -> UsageSummary:
def get_last_usage(self) -> ModelUsageSummary:
"""Get the last cost summary of the model."""
raise NotImplementedError

Expand Down
12 changes: 8 additions & 4 deletions rlm/core/lm_handler.py
Original file line number Diff line number Diff line change
Expand Up @@ -58,10 +58,12 @@ def _handle_single(self, request: LMRequest, handler: "LMHandler") -> LMResponse
content = client.completion(request.prompt)
end_time = time.perf_counter()

usage_summary = client.get_last_usage()
model_usage = client.get_last_usage()
root_model = request.model or client.model_name
usage_summary = UsageSummary(model_usage_summaries={root_model: model_usage})
return LMResponse.success_response(
chat_completion=RLMChatCompletion(
root_model=request.model or client.model_name,
root_model=root_model,
prompt=request.prompt,
response=content,
usage_summary=usage_summary,
Expand All @@ -83,11 +85,13 @@ async def run_all():
end_time = time.perf_counter()

total_time = end_time - start_time
usage_summary = client.get_last_usage()
model_usage = client.get_last_usage()
root_model = request.model or client.model_name
usage_summary = UsageSummary(model_usage_summaries={root_model: model_usage})

chat_completions = [
RLMChatCompletion(
root_model=request.model or client.model_name,
root_model=root_model,
prompt=prompt,
response=content,
usage_summary=usage_summary,
Expand Down
2 changes: 1 addition & 1 deletion rlm/core/types.py
Original file line number Diff line number Diff line change
Expand Up @@ -16,7 +16,7 @@
"gemini",
"huggingface",
]
EnvironmentType = Literal["local", "subprocess", "docker", "modal", "prime"]
EnvironmentType = Literal["local", "subprocess", "docker", "modal", "prime", "daytona"]


def _serialize_value(value: Any) -> Any:
Expand Down
4 changes: 2 additions & 2 deletions rlm/environments/__init__.py
Original file line number Diff line number Diff line change
Expand Up @@ -23,14 +23,14 @@


def get_environment(
environment: Literal["local", "subprocess", "modal", "docker", "prime"],
environment: Literal["local", "subprocess", "modal", "docker", "prime", "daytona"],
environment_kwargs: dict[str, Any],
) -> BaseEnv:
"""
Routes a specific environment and the args (as a dict) to the appropriate environment if supported.

Args:
environment: The environment type (e.g., "local", "docker", "modal", "prime")
environment: The environment type (e.g., "local", "docker", "modal", "prime", "daytona")
environment_kwargs: Keyword arguments to pass to the environment constructor

Returns:
Expand Down
Loading
Loading