-
Notifications
You must be signed in to change notification settings - Fork 8
t5-small backbone model not found #7
Description
The error:
During handling of the above exception, another exception occurred:
Traceback (most recent call last):
File "/root/miniconda3/envs/P5/lib/python3.9/site-packages/huggingface_hub/file_download.py", line 1533, in _get_metadata_or_catch_error
metadata = get_hf_file_metadata(
File "/root/miniconda3/envs/P5/lib/python3.9/site-packages/huggingface_hub/utils/_validators.py", line 114, in _inner_fn
return fn(*args, **kwargs)
File "/root/miniconda3/envs/P5/lib/python3.9/site-packages/huggingface_hub/file_download.py", line 1450, in get_hf_file_metadata
r = _request_wrapper(
File "/root/miniconda3/envs/P5/lib/python3.9/site-packages/huggingface_hub/file_download.py", line 286, in _request_wrapper
response = _request_wrapper(
File "/root/miniconda3/envs/P5/lib/python3.9/site-packages/huggingface_hub/file_download.py", line 309, in _request_wrapper
response = http_backoff(method=method, url=url, **params, retry_on_exceptions=(), retry_on_status_codes=(429,))
File "/root/miniconda3/envs/P5/lib/python3.9/site-packages/huggingface_hub/utils/_http.py", line 310, in http_backoff
response = session.request(method=method, url=url, **kwargs)
File "/root/miniconda3/envs/P5/lib/python3.9/site-packages/requests/sessions.py", line 589, in request
resp = self.send(prep, **send_kwargs)
File "/root/miniconda3/envs/P5/lib/python3.9/site-packages/requests/sessions.py", line 703, in send
r = adapter.send(request, **kwargs)
File "/root/miniconda3/envs/P5/lib/python3.9/site-packages/huggingface_hub/utils/_http.py", line 96, in send
return super().send(request, *args, **kwargs)
File "/root/miniconda3/envs/P5/lib/python3.9/site-packages/requests/adapters.py", line 688, in send
raise ConnectTimeout(e, request=request)
requests.exceptions.ConnectTimeout: (MaxRetryError("HTTPSConnectionPool(host='huggingface.co', port=443): Max retries exceeded with url: /t5-small/resolve/main/config.json (Caused by ConnectTimeoutError(<urllib3.connection.HTTPSConnection object at 0x7feeef1662b0>, 'Connection to huggingface.co timed out. (connect timeout=10)'))"), '(Request ID: 3966454d-04a1-467f-8184-8569e47d6445)')
The above exception was the direct cause of the following exception:
Traceback (most recent call last):
File "/root/miniconda3/envs/P5/lib/python3.9/site-packages/transformers/utils/hub.py", line 409, in cached_file
resolved_file = hf_hub_download(
File "/root/miniconda3/envs/P5/lib/python3.9/site-packages/huggingface_hub/utils/_validators.py", line 114, in _inner_fn
return fn(*args, **kwargs)
File "/root/miniconda3/envs/P5/lib/python3.9/site-packages/huggingface_hub/file_download.py", line 1008, in hf_hub_download
return _hf_hub_download_to_cache_dir(
File "/root/miniconda3/envs/P5/lib/python3.9/site-packages/huggingface_hub/file_download.py", line 1115, in _hf_hub_download_to_cache_dir
_raise_on_head_call_error(head_call_error, force_download, local_files_only)
File "/root/miniconda3/envs/P5/lib/python3.9/site-packages/huggingface_hub/file_download.py", line 1648, in _raise_on_head_call_error
raise LocalEntryNotFoundError(
huggingface_hub.errors.LocalEntryNotFoundError: An error happened while trying to locate the file on the Hub and we cannot find the requested files in the local cache. Please check your connection and try again or make sure your Internet connection is on.
During handling of the above exception, another exception occurred:
Traceback (most recent call last):
File "/root/miniconda3/envs/P5/lib/python3.9/site-packages/torch/multiprocessing/spawn.py", line 59, in _wrap
fn(i, *args)
File "/root/autodl-tmp/LLM-RecSys-ID/main.py", line 462, in main_worker
tokenizer = AutoTokenizer.from_pretrained(args.model_type)
File "/root/miniconda3/envs/P5/lib/python3.9/site-packages/transformers/models/auto/tokenization_auto.py", line 613, in from_pretrained
config = AutoConfig.from_pretrained(
File "/root/miniconda3/envs/P5/lib/python3.9/site-packages/transformers/models/auto/configuration_auto.py", line 852, in from_pretrained
config_dict, unused_kwargs = PretrainedConfig.get_config_dict(pretrained_model_name_or_path, **kwargs)
File "/root/miniconda3/envs/P5/lib/python3.9/site-packages/transformers/configuration_utils.py", line 565, in get_config_dict
config_dict, kwargs = cls._get_config_dict(pretrained_model_name_or_path, **kwargs)
File "/root/miniconda3/envs/P5/lib/python3.9/site-packages/transformers/configuration_utils.py", line 620, in _get_config_dict
resolved_config_file = cached_file(
File "/root/miniconda3/envs/P5/lib/python3.9/site-packages/transformers/utils/hub.py", line 443, in cached_file
raise EnvironmentError(
OSError: We couldn't connect to 'https://huggingface.co' to load this file, couldn't find it in the cached files and it looks like t5-small is not the path to a directory containing a file named config.json.
Checkout your internet connection or see how to run the library in offline mode at 'https://huggingface.co/docs/transformers/installation#offline-mode'.
Killing subprocess 3750
Traceback (most recent call last):
File "/root/miniconda3/envs/P5/lib/python3.9/runpy.py", line 197, in _run_module_as_main
return _run_code(code, main_globals, None,
File "/root/miniconda3/envs/P5/lib/python3.9/runpy.py", line 87, in _run_code
exec(code, run_globals)
File "/root/miniconda3/envs/P5/lib/python3.9/site-packages/torch/distributed/launch.py", line 340, in <module>
main()
File "/root/miniconda3/envs/P5/lib/python3.9/site-packages/torch/distributed/launch.py", line 326, in main
sigkill_handler(signal.SIGTERM, None) # not coming back
File "/root/miniconda3/envs/P5/lib/python3.9/site-packages/torch/distributed/launch.py", line 301, in sigkill_handler
raise subprocess.CalledProcessError(returncode=last_return_code, cmd=cmd)
subprocess.CalledProcessError: Command '['/root/miniconda3/envs/P5/bin/python', '-u', 'main.py', '--local_rank=0', '--distributed', '--multiGPU', '--task', 'beauty', '--seed', '2022', '--warmup_prop', '0.05', '--lr', '1e-3', '--clip', '1.0', '--model_type', 't5-small', '--epochs', '20', '--gpu', '0', '--logging_step', '1000', '--logging_dir', 'log/pretrain_t5_small_beauty_CF.log', '--model_dir', 'model/pretrain_t5_small_beauty_CF.pt', '--train_sequential_item_batch', '64', '--whole_word_embedding', 'shijie', '--item_representation', 'CF', '--data_order', 'remapped_sequential', '--remapped_data_order', 'original', '--cluster_size', '500', '--cluster_number', '20']' returned non-zero exit status 1.
It seems that t5-small cannot be retrieved from huggingface.co. May I ask how to solve this problem?
Thank you!