Skip to content

Commit 1c20c5e

Browse files
committed
fix trust_remote_code
1 parent b2d1466 commit 1c20c5e

File tree

5 files changed

+11
-6
lines changed

5 files changed

+11
-6
lines changed

Dockerfile

Lines changed: 0 additions & 3 deletions
Original file line numberDiff line numberDiff line change
@@ -21,6 +21,3 @@ RUN sh INSTALL_MEGATRON.sh
2121
RUN pip install --no-cache-dir tinker==0.14.0 "ray[serve]" transformers peft accelerate -U
2222

2323
RUN pip install -e . --no-build-isolation
24-
25-
ENV TWINKLE_WORKDIR=/data
26-
CMD ["bash", "-c", "mkdir -p $TWINKLE_WORKDIR && cd $TWINKLE_WORKDIR && bash /twinkle/cookbook/client/server/megatron/run.sh 2>&1 | tee $TWINKLE_WORKDIR/run.log"]

cookbook/client/server/megatron/run.sh

Lines changed: 1 addition & 1 deletion
Original file line numberDiff line numberDiff line change
@@ -3,4 +3,4 @@ export RAY_ROTATION_BACKUP_COUNT=1
33
CUDA_VISIBLE_DEVICES=0,1,2,3 ray start --head --port=6379 --num-gpus=4 --disable-usage-stats --include-dashboard=false
44
CUDA_VISIBLE_DEVICES=4,5,6,7 ray start --address=127.0.0.1:6379 --num-gpus=4
55
CUDA_VISIBLE_DEVICES="" ray start --address=127.0.0.1:6379 --num-gpus=0
6-
python server.py
6+
python "$(dirname "$0")/server.py"

cookbook/client/server/megatron/server.py

Lines changed: 1 addition & 1 deletion
Original file line numberDiff line numberDiff line change
@@ -9,7 +9,7 @@
99
import os
1010

1111
# Control whether datasets may run remote code: TWINKLE_TRUST_REMOTE_CODE is read when datasets are loaded ('1' allows it, '0' is meant to turn it off)
12-
os.environ['TWINKLE_TRUST_REMOTE_CODE'] = '1'
12+
os.environ['TWINKLE_TRUST_REMOTE_CODE'] = '0'
1313

1414
from twinkle.server import launch_server
1515

src/twinkle/dataset/base.py

Lines changed: 6 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -51,6 +51,9 @@ class Dataset(TorchDataset):
5151
"""
5252

5353
def __init__(self, dataset_meta: DatasetMeta, **kwargs):
54+
# Parse the flag text explicitly: bool('0') is True, so a plain bool() cast could never turn this off.
trust_remote_code = os.environ.get('TWINKLE_TRUST_REMOTE_CODE', '1').strip().lower() not in ('', '0', 'false', 'no', 'off')
55+
if not trust_remote_code:
56+
kwargs['trust_remote_code'] = False
5457
dataset = self._load_dataset(dataset_meta, **kwargs)
5558
self.datasets = {dataset_meta.get_id(): dataset}
5659
self.dataset = dataset
@@ -247,6 +250,9 @@ def add_dataset(self, dataset_meta: DatasetMeta, **kwargs):
247250
Args:
248251
dataset_meta: The dataset_meta information of the loaded dataset.
249252
"""
253+
# Parse the flag text explicitly: bool('0') is True, so a plain bool() cast could never turn this off.
trust_remote_code = os.environ.get('TWINKLE_TRUST_REMOTE_CODE', '1').strip().lower() not in ('', '0', 'false', 'no', 'off')
254+
if not trust_remote_code:
255+
kwargs['trust_remote_code'] = False
250256
dataset = self._load_dataset(dataset_meta, **kwargs)
251257
self.datasets[dataset_meta.get_id()] = dataset
252258

src/twinkle/hub/hub.py

Lines changed: 3 additions & 1 deletion
Original file line numberDiff line numberDiff line change
@@ -401,7 +401,7 @@ def load_dataset(cls,
401401
cls.try_login(token)
402402
if revision is None or revision == 'main':
403403
revision = 'master'
404-
load_kwargs = {'trust_remote_code': True}
404+
load_kwargs = {'trust_remote_code': kwargs.get('trust_remote_code', True)}
405405
return MsDataset.load(
406406
dataset_id,
407407
subset_name=subset_name,
@@ -595,13 +595,15 @@ def load_dataset(cls,
595595
from datasets import load_dataset
596596
if revision is None or revision == 'master':
597597
revision = 'main'
598+
trust_remote_code = kwargs.get('trust_remote_code', True)
598599
return load_dataset(
599600
dataset_id,
600601
name=subset_name,
601602
split=split,
602603
streaming=streaming,
603604
revision=revision,
604605
download_mode=download_mode,
606+
trust_remote_code=trust_remote_code,
605607
num_proc=num_proc)
606608

607609
@classmethod

0 commit comments

Comments
 (0)