I am not able to create the binary file. I have placed 18 HR images in the 'rcan-it/ptsr/datasets/SR/BIX2X3X4/DF2K/DF2K_train_HR/' folder and their corresponding LR images in the 'rcan-it/ptsr/datasets/SR/BIX2X3X4/DF2K/DF2K_train_LR_bicubic/X2' folder, but I get the error shown below:
`Total number of parameters: 15444667
Using Dataset(s): DF2K for training
/content/drive/MyDrive/rcan-it/ptsr/datasets/SR/BIX2X3X4/DF2K/bin/train_bin_HR.pt does not exist. Now making binary...
Bin pt file with name and image
Traceback (most recent call last):
File "main.py", line 135, in
main()
File "main.py", line 98, in main
loader = Data(cfg)
File "/content/drive/MyDrive/rcan-it/ptsr/data/init.py", line 35, in init
datasets.append(getattr(m, module_name)(cfg, name=d))
File "/content/drive/MyDrive/rcan-it/ptsr/data/df2k.py", line 17, in init
cfg, name=name, train=train, benchmark=benchmark
File "/content/drive/MyDrive/rcan-it/ptsr/data/srdata.py", line 39, in init
cfg.DATASET.DATA_EXT, list_hr, self._name_hrbin()
File "/content/drive/MyDrive/rcan-it/ptsr/data/srdata.py", line 148, in _check_and_load
} for _l in l]
File "/content/drive/MyDrive/rcan-it/ptsr/data/srdata.py", line 148, in
} for _l in l]
File "/usr/local/lib/python3.7/dist-packages/imageio/core/functions.py", line 221, in imread
reader = read(uri, format, "i", kwargs)
File "/usr/local/lib/python3.7/dist-packages/imageio/core/functions.py", line 130, in get_reader
request = Request(uri, "r" + mode, kwargs)
File "/usr/local/lib/python3.7/dist-packages/imageio/core/request.py", line 125, in init
self._parse_uri(uri)
File "/usr/local/lib/python3.7/dist-packages/imageio/core/request.py", line 273, in _parse_uri
raise FileNotFoundError("No such file: '%s'" % fn)
FileNotFoundError: No such file: '/content/drive/MyDrive/rcan-it/ptsr/datasets/SR/BIX2X3X4/DF2K/DF2K_train_HR/0019.png'
ERROR:torch.distributed.elastic.multiprocessing.api:failed (exitcode: 1) local_rank: 0 (pid: 1678) of binary: /usr/bin/python3
Traceback (most recent call last):
File "/usr/lib/python3.7/runpy.py", line 193, in _run_module_as_main
"main", mod_spec)
File "/usr/lib/python3.7/runpy.py", line 85, in _run_code
exec(code, run_globals)
File "/usr/local/lib/python3.7/dist-packages/torch/distributed/run.py", line 723, in
main()
File "/usr/local/lib/python3.7/dist-packages/torch/distributed/elastic/multiprocessing/errors/init.py", line 345, in wrapper
return f(*args, *kwargs)
File "/usr/local/lib/python3.7/dist-packages/torch/distributed/run.py", line 719, in main
run(args)
File "/usr/local/lib/python3.7/dist-packages/torch/distributed/run.py", line 713, in run
)(cmd_args)
File "/usr/local/lib/python3.7/dist-packages/torch/distributed/launcher/api.py", line 131, in call
return launch_agent(self._config, self._entrypoint, list(args))
File "/usr/local/lib/python3.7/dist-packages/torch/distributed/launcher/api.py", line 261, in launch_agent
failures=result.failures,
torch.distributed.elastic.multiprocessing.errors.ChildFailedError:`
I am not able to create the binary file. I have placed 18 HR images in the 'rcan-it/ptsr/datasets/SR/BIX2X3X4/DF2K/DF2K_train_HR/' folder and their corresponding LR images in the 'rcan-it/ptsr/datasets/SR/BIX2X3X4/DF2K/DF2K_train_LR_bicubic/X2' folder, but I get the error shown below: `Total number of parameters: 15444667 Using Dataset(s): DF2K for training
/content/drive/MyDrive/rcan-it/ptsr/datasets/SR/BIX2X3X4/DF2K/bin/train_bin_HR.pt does not exist. Now making binary... Bin pt file with name and image Traceback (most recent call last): File "main.py", line 135, in
main()
File "main.py", line 98, in main
loader = Data(cfg)
File "/content/drive/MyDrive/rcan-it/ptsr/data/init.py", line 35, in init
datasets.append(getattr(m, module_name)(cfg, name=d))
File "/content/drive/MyDrive/rcan-it/ptsr/data/df2k.py", line 17, in init
cfg, name=name, train=train, benchmark=benchmark
File "/content/drive/MyDrive/rcan-it/ptsr/data/srdata.py", line 39, in init
cfg.DATASET.DATA_EXT, list_hr, self._name_hrbin()
File "/content/drive/MyDrive/rcan-it/ptsr/data/srdata.py", line 148, in _check_and_load
} for _l in l]
File "/content/drive/MyDrive/rcan-it/ptsr/data/srdata.py", line 148, in
} for _l in l]
File "/usr/local/lib/python3.7/dist-packages/imageio/core/functions.py", line 221, in imread
reader = read(uri, format, "i", kwargs)
File "/usr/local/lib/python3.7/dist-packages/imageio/core/functions.py", line 130, in get_reader
request = Request(uri, "r" + mode, kwargs)
File "/usr/local/lib/python3.7/dist-packages/imageio/core/request.py", line 125, in init
self._parse_uri(uri)
File "/usr/local/lib/python3.7/dist-packages/imageio/core/request.py", line 273, in _parse_uri
raise FileNotFoundError("No such file: '%s'" % fn)
FileNotFoundError: No such file: '/content/drive/MyDrive/rcan-it/ptsr/datasets/SR/BIX2X3X4/DF2K/DF2K_train_HR/0019.png'
ERROR:torch.distributed.elastic.multiprocessing.api:failed (exitcode: 1) local_rank: 0 (pid: 1678) of binary: /usr/bin/python3
Traceback (most recent call last):
File "/usr/lib/python3.7/runpy.py", line 193, in _run_module_as_main
"main", mod_spec)
File "/usr/lib/python3.7/runpy.py", line 85, in _run_code
exec(code, run_globals)
File "/usr/local/lib/python3.7/dist-packages/torch/distributed/run.py", line 723, in
main()
File "/usr/local/lib/python3.7/dist-packages/torch/distributed/elastic/multiprocessing/errors/init.py", line 345, in wrapper
return f(*args, *kwargs)
File "/usr/local/lib/python3.7/dist-packages/torch/distributed/run.py", line 719, in main
run(args)
File "/usr/local/lib/python3.7/dist-packages/torch/distributed/run.py", line 713, in run
)(cmd_args)
File "/usr/local/lib/python3.7/dist-packages/torch/distributed/launcher/api.py", line 131, in call
return launch_agent(self._config, self._entrypoint, list(args))
File "/usr/local/lib/python3.7/dist-packages/torch/distributed/launcher/api.py", line 261, in launch_agent
failures=result.failures,
torch.distributed.elastic.multiprocessing.errors.ChildFailedError:`
Please help me solve this issue, @zudi-lin.
Originally posted by @TriB90 in https://github.com/zudi-lin/rcan-it/issues/3#issuecomment-1086562126