-
Notifications
You must be signed in to change notification settings - Fork 10
Expand file tree
/
Copy pathCargo.toml
More file actions
27 lines (24 loc) · 769 Bytes
/
Cargo.toml
File metadata and controls
27 lines (24 loc) · 769 Bytes
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
# bashkit-eval: LLM evaluation harness for bashkit tool usage
# Measures how well models use a sandboxed bash tool in agentic workloads
# See specs/eval.md for design decisions
[package]
# version, authors, edition and license are inherited from the workspace manifest.
name = "bashkit-eval"
version.workspace = true
authors.workspace = true
edition.workspace = true
license.workspace = true
description = "LLM evaluation harness for bashkit tool usage"
# Binary target: builds the `bashkit-eval` executable from src/main.rs.
[[bin]]
name = "bashkit-eval"
path = "src/main.rs"
[dependencies]
# Kept in alphabetical order. Entries using `workspace = true` are resolved
# from the workspace manifest's shared dependency table.
anyhow.workspace = true
async-trait.workspace = true
# Sibling crate referenced by relative path, with the features listed here enabled.
bashkit = { path = "../bashkit", features = ["scripted_tool", "jq"] }
chrono.workspace = true
clap.workspace = true
regex.workspace = true
reqwest.workspace = true
serde.workspace = true
serde_json.workspace = true
# Requests the multi-threaded runtime feature on top of the workspace-level spec.
tokio = { workspace = true, features = ["rt-multi-thread"] }