Skip to content

Run Error #1

@Don-Joey

Description

@Don-Joey

I have updated the dependencies to torchtext==0.4 and ray[tune]==0.8.7.
I then ran "./run_batch_tune.sh base",
but it failed with the following error:
"Traceback (most recent call last):
File "/root/anaconda3/envs/ept/lib/python3.7/site-packages/ray/tune/trial_runner.py", line 471, in _process_trial
result = self.trial_executor.fetch_result(trial)
File "/root/anaconda3/envs/ept/lib/python3.7/site-packages/ray/tune/ray_trial_executor.py", line 430, in fetch_result
result = ray.get(trial_future[0], DEFAULT_GET_TIMEOUT)
File "/root/anaconda3/envs/ept/lib/python3.7/site-packages/ray/worker.py", line 1538, in get
raise value.as_instanceof_cause()
ray.exceptions.RayTaskError(KeyError): ray::RayTrainer.train() (pid=21573, ip=172.17.0.15)
File "python/ray/_raylet.pyx", line 439, in ray._raylet.execute_task
File "python/ray/_raylet.pyx", line 474, in ray._raylet.execute_task
File "python/ray/_raylet.pyx", line 478, in ray._raylet.execute_task
File "python/ray/_raylet.pyx", line 479, in ray._raylet.execute_task
File "python/ray/_raylet.pyx", line 432, in ray._raylet.execute_task.function_executor
File "/root/anaconda3/envs/ept/lib/python3.7/site-packages/ray/tune/trainable.py", line 245, in __init__
self.setup(copy.deepcopy(self.config))
File "/root/anaconda3/envs/ept/lib/python3.7/site-packages/ray/tune/trainable.py", line 769, in setup
self._setup(config)
File "tune_hyperopt.py", line 78, in _setup
disable_dataparallel=not data_parallel)
File "/home/leiwang/EPT/page/torch/trainer.py", line 176, in __init__
self.trainset, self.devset, self.evalset = self._config.read_datasets(train=train, dev=dev, test=test)
File "/home/leiwang/EPT/page/config.py", line 670, in read_datasets
self.batch, testing_purpose=False)
File "/home/leiwang/EPT/page/torch/dataset.py", line 155, in __init__
self.reset()
File "/home/leiwang/EPT/page/torch/dataset.py", line 254, in reset
self._batches = list(self._generate_batches())
File "/home/leiwang/EPT/page/torch/dataset.py", line 304, in _generate_batches
yield self._concatenate_batch(items[:-1])
File "/home/leiwang/EPT/page/torch/dataset.py", line 341, in _concatenate_batch
kwargs['text'] = self.problem_field.process(kwargs['text'])
KeyError: 'text'
2021-07-30 16:48:43,973 ERROR syncer.py:46 -- Log sync requires rsync to be installed."
image

Then I pressed Ctrl+C, and the following traceback was printed:

Traceback (most recent call last):
File "batch_trainer.py", line 118, in <module>
base_config = TrainerConfig.from_pretrained(config_path)
File "/home/leiwang/EPT/page/config.py", line 611, in from_pretrained
with path.open('r+t', encoding='UTF-8') as fp:
File "/root/anaconda3/envs/ept/lib/python3.7/pathlib.py", line 1208, in open
opener=self._opener)
File "/root/anaconda3/envs/ept/lib/python3.7/pathlib.py", line 1063, in _opener
return self._accessor.open(self, flags, mode)
FileNotFoundError: [Errno 2] No such file or directory: 'config/alg514/base.json/TrainConfig.json'

Metadata

Metadata

Assignees

No one assigned

    Labels

    No labels
    No labels

    Type

    No type

    Projects

    No projects

    Milestone

    No milestone

    Relationships

    None yet

    Development

    No branches or pull requests

    Issue actions