Skip to content
Open
Show file tree
Hide file tree
Changes from all commits
Commits
Show all changes
42 commits
Select commit Hold shift + click to select a range
74c3d93
Initial clone and added VS Code.
nv-twhitehouse Feb 28, 2025
7be40f5
Add model identifier constants and refactor model selection logic
nv-twhitehouse Mar 1, 2025
d5214f7
Finished getting env variable for changing api endpoint prefix implem…
nv-twhitehouse Mar 1, 2025
ae655b6
Refactor model endpoints and internal API handling
nv-twhitehouse Mar 1, 2025
20ca7d6
Ran queries to demonstrate the changes worked.
nv-twhitehouse Mar 1, 2025
0fea6d3
Simplified README
nv-twhitehouse Mar 1, 2025
42f0321
Deleted image from readme
nv-twhitehouse Mar 1, 2025
eeba25c
Continued refactoring of README
nv-twhitehouse Mar 3, 2025
988357f
Eliminated the hierarchy of links at top of README
nv-twhitehouse Mar 3, 2025
bacd69f
Minor changes to README
nv-twhitehouse Mar 3, 2025
183596e
Modified README.md
nv-twhitehouse Mar 3, 2025
aace9cb
Modified README.md
nv-twhitehouse Mar 3, 2025
dd751d0
Modified README.md
nv-twhitehouse Mar 3, 2025
bae8f2e
Modified urls in README to open in in new tab.
nv-twhitehouse Mar 3, 2025
6898dd7
Trying links again.
nv-twhitehouse Mar 3, 2025
5ee7422
Modified README.md
nv-twhitehouse Mar 3, 2025
711a4b4
Modified README.md
nv-twhitehouse Mar 3, 2025
cad55a1
Update README.md
jtcasablanca Mar 6, 2025
d08deb7
Fixed embedding string issues in database and added data to gitignore.
nv-twhitehouse Mar 8, 2025
48a9554
Revised README to fit with downloadable nim readme.
jtcasablanca Mar 8, 2025
2f33c6f
Modified README.md
nv-twhitehouse Mar 8, 2025
d460a70
minor revisions to read me.
nv-twhitehouse Mar 8, 2025
33cf715
Modified README.md
nv-twhitehouse Mar 8, 2025
d012ace
Update README.md
jtcasablanca Mar 9, 2025
fe4748b
Update README.md
jtcasablanca Mar 9, 2025
8894b5e
Update README.md
jtcasablanca Mar 9, 2025
115d5e9
Update README.md
jtcasablanca Mar 9, 2025
4d35ca9
Update README.md
jtcasablanca Mar 9, 2025
82e3a62
Minor changes to readme
nv-twhitehouse Mar 9, 2025
61d7350
Merge branch 'main' of https://github.com/jtcasablanca/workbench-exam…
nv-twhitehouse Mar 9, 2025
9227b3f
Minor changes.
nv-twhitehouse Mar 9, 2025
9bb32fd
Added nim support and disk size files to drive gpu selection UI
nv-twhitehouse Mar 9, 2025
7d55975
feat: Add GPU configuration support for NIM endpoints
nv-twhitehouse Mar 9, 2025
cc4a0fd
Added info on endpoint prefix for nvidians. Note. feature not impleme…
nv-twhitehouse Mar 9, 2025
d39688a
changed wording around internal endpoints and made specific to nvidians.
nv-twhitehouse Mar 9, 2025
eee7b4a
docs: improve self-hosted endpoint documentation
nv-twhitehouse Mar 9, 2025
57015fd
Changed readme links
nv-twhitehouse Mar 9, 2025
41d28ca
Modified README.md
nv-twhitehouse Mar 9, 2025
d14a9b9
Modified README.md
nv-twhitehouse Mar 9, 2025
9f7ddd2
docs: added instructions tab to UI; modified documents tab (blurb and…
nv-twhitehouse Apr 15, 2025
65e6ba8
docs: changed clear history button
nv-twhitehouse Apr 15, 2025
f8ca62c
docs: modified model tab
nv-twhitehouse Apr 16, 2025
File filter

Filter by extension

Filter by extension

Conversations
Failed to load comments.
Loading
Jump to
Jump to file
Failed to load files.
Loading
Diff view
Diff view
6 changes: 5 additions & 1 deletion .gitignore
Original file line number Diff line number Diff line change
Expand Up @@ -54,4 +54,8 @@ cover/

# Workbench Project Layout
data/scratch/*
!data/scratch/.gitkeep
!data/scratch/.gitkeep
data/chroma.sqlite3

data/*
!data/.gitkeep
2 changes: 2 additions & 0 deletions .project/configpacks
Original file line number Diff line number Diff line change
Expand Up @@ -3,10 +3,12 @@
*cuda.CUDA
*defaults.EnvVars
*defaults.Readme
*defaults.CA
*defaults.Entrypoint
*apt.PackageManager
*bash.PreLanguage
*python.PipPackageManager
*bash.PostBuild
*jupyterlab.JupyterLab
*vs_code.VSCode
*tensorboard.Tensorboard
264 changes: 133 additions & 131 deletions .project/spec.yaml
Original file line number Diff line number Diff line change
@@ -1,137 +1,139 @@
specVersion: v2
specMinorVersion: 2
meta:
name: agentic-rag
image: project-agentic-rag
description: An example project for advanced RAG using agents
labels: []
createdOn: "2024-07-15T21:09:46Z"
defaultBranch: main
name: agentic-rag
image: project-agentic-rag
description: An example project for advanced RAG using agents
labels: []
createdOn: "2024-07-15T21:09:46Z"
defaultBranch: main
layout:
- path: code/
type: code
storage: git
- path: models/
type: models
storage: gitlfs
- path: data/
type: data
storage: gitlfs
- path: data/scratch/
type: data
storage: gitignore
- path: code/
type: code
storage: git
- path: models/
type: models
storage: gitlfs
- path: data/
type: data
storage: gitignore
environment:
base:
registry: nvcr.io
image: nvidia/ai-workbench/pytorch:1.0.2
build_timestamp: "20231102150513"
name: PyTorch
supported_architectures: []
cuda_version: "12.2"
description: A Pytorch 2.1 Base with CUDA 12.2
entrypoint_script: ""
labels:
- cuda12.2
- pytorch2.1
apps:
- name: chat
type: custom
class: webapp
start_command: cd /project/code/ && PROXY_PREFIX=$PROXY_PREFIX python3 -m chatui
health_check_command: curl -f "http://localhost:8080/"
stop_command: pkill -f "^python3 -m chatui"
user_msg: ""
logfile_path: ""
timeout_seconds: 60
icon_url: ""
webapp_options:
autolaunch: true
port: "8080"
proxy:
trim_prefix: true
url: http://localhost:8080/
- name: jupyterlab
type: jupyterlab
class: webapp
start_command: jupyter lab --allow-root --port 8888 --ip 0.0.0.0 --no-browser
--NotebookApp.base_url=\$PROXY_PREFIX --NotebookApp.default_url=/lab --NotebookApp.allow_origin='*'
health_check_command: '[ \$(echo url=\$(jupyter lab list | head -n 2 | tail
-n 1 | cut -f1 -d'' '' | grep -v ''Currently'' | sed "s@/?@/lab?@g") | curl
-o /dev/null -s -w ''%{http_code}'' --config -) == ''200'' ]'
stop_command: jupyter lab stop 8888
user_msg: ""
logfile_path: ""
timeout_seconds: 60
icon_url: ""
webapp_options:
autolaunch: true
port: "8888"
proxy:
trim_prefix: false
url_command: jupyter lab list | head -n 2 | tail -n 1 | cut -f1 -d' ' | grep
-v 'Currently'
- name: tensorboard
type: tensorboard
class: webapp
start_command: tensorboard --logdir \$TENSORBOARD_LOGS_DIRECTORY --path_prefix=\$PROXY_PREFIX
--bind_all
health_check_command: '[ \$(curl -o /dev/null -s -w ''%{http_code}'' http://localhost:\$TENSORBOARD_PORT\$PROXY_PREFIX/)
== ''200'' ]'
stop_command: pkill tensorboard
user_msg: ""
logfile_path: ""
timeout_seconds: 60
icon_url: ""
webapp_options:
autolaunch: true
port: "6006"
proxy:
trim_prefix: false
url: http://localhost:6006
programming_languages:
- python3
icon_url: ""
image_version: 1.0.2
os: linux
os_distro: ubuntu
os_distro_release: "22.04"
schema_version: v2
user_info:
uid: ""
gid: ""
username: ""
package_managers:
- name: apt
binary_path: /usr/bin/apt
installed_packages:
- curl
- git
- git-lfs
- vim
- name: pip
binary_path: /usr/local/bin/pip
installed_packages:
- jupyterlab==4.0.7
package_manager_environment:
name: ""
target: ""
base:
registry: nvcr.io
image: nvidia/ai-workbench/pytorch:1.0.2
build_timestamp: "20231102150513"
name: PyTorch
supported_architectures: []
cuda_version: "12.2"
description: A Pytorch 2.1 Base with CUDA 12.2
entrypoint_script: ""
labels:
- cuda12.2
- pytorch2.1
apps:
- name: chat
type: custom
class: webapp
start_command: cd /project/code/ && PROXY_PREFIX=$PROXY_PREFIX python3 -m chatui
health_check_command: curl -f "http://localhost:8080/"
stop_command: pkill -f "^python3 -m chatui"
user_msg: ""
logfile_path: ""
timeout_seconds: 60
icon_url: ""
webapp_options:
autolaunch: true
port: "8080"
proxy:
trim_prefix: true
url: http://localhost:8080/
- name: jupyterlab
type: jupyterlab
class: webapp
start_command: jupyter lab --allow-root --port 8888 --ip 0.0.0.0 --no-browser --NotebookApp.base_url=\$PROXY_PREFIX --NotebookApp.default_url=/lab --NotebookApp.allow_origin='*'
health_check_command: '[ \$(echo url=\$(jupyter lab list | head -n 2 | tail -n 1 | cut -f1 -d'' '' | grep -v ''Currently'' | sed "s@/?@/lab?@g") | curl -o /dev/null -s -w ''%{http_code}'' --config -) == ''200'' ]'
stop_command: jupyter lab stop 8888
user_msg: ""
logfile_path: ""
timeout_seconds: 60
icon_url: ""
webapp_options:
autolaunch: true
port: "8888"
proxy:
trim_prefix: false
url_command: jupyter lab list | head -n 2 | tail -n 1 | cut -f1 -d' ' | grep -v 'Currently'
- name: tensorboard
type: tensorboard
class: webapp
start_command: tensorboard --logdir \$TENSORBOARD_LOGS_DIRECTORY --path_prefix=\$PROXY_PREFIX --bind_all
health_check_command: '[ \$(curl -o /dev/null -s -w ''%{http_code}'' http://localhost:\$TENSORBOARD_PORT\$PROXY_PREFIX/) == ''200'' ]'
stop_command: pkill tensorboard
user_msg: ""
logfile_path: ""
timeout_seconds: 60
icon_url: ""
webapp_options:
autolaunch: true
port: "6006"
proxy:
trim_prefix: false
url: http://localhost:6006
programming_languages:
- python3
icon_url: ""
image_version: 1.0.2
os: linux
os_distro: ubuntu
os_distro_release: "22.04"
schema_version: v2
user_info:
uid: ""
gid: ""
username: ""
package_managers:
- name: apt
binary_path: /usr/bin/apt
installed_packages:
- curl
- git
- git-lfs
- vim
- name: pip
binary_path: /usr/local/bin/pip
installed_packages:
- jupyterlab==4.0.7
package_manager_environment:
name: ""
target: ""
compose_file_path: ""
execution:
apps: []
resources:
gpu:
requested: 1
sharedMemoryMB: 1024
secrets:
- variable: NVIDIA_API_KEY
description: NVIDIA API Key for accessing the API catalog
- variable: TAVILY_API_KEY
description: Tavily Search API Key
mounts:
- type: project
target: /project/
description: Project directory
options: rw
- type: volume
target: /data/tensorboard/logs/
description: Tensorboard Log Files
options: volumeName=tensorboard-logs-volume
apps:
- name: Visual Studio Code
type: vs-code
class: native
start_command: ""
health_check_command: '[ \$(ps aux | grep ".vscode-server" | grep -v grep | wc -l ) -gt 4 ] && [ \$(ps aux | grep "/.vscode-server/bin/.*/node .* net.createConnection" | grep -v grep | wc -l) -gt 0 ]'
stop_command: ""
user_msg: ""
logfile_path: ""
timeout_seconds: 120
icon_url: ""
resources:
gpu:
requested: 0
sharedMemoryMB: 1024
secrets:
- variable: NVIDIA_API_KEY
description: NVIDIA API Key for accessing the API catalog
- variable: TAVILY_API_KEY
description: Tavily Search API Key
mounts:
- type: project
target: /project/
description: Project directory
options: rw
- type: volume
target: /data/tensorboard/logs/
description: Tensorboard Log Files
options: volumeName=tensorboard-logs-volume
Loading