Hi @garrett,
I can’t figure out why I sometimes get a timeout error when I run experiments. Here is the command I am running:
guild run train tb_volatility_lookback=range[30:300:10]
It hangs after some time, and when I press Ctrl+C to abort it, the error below shows up:
Traceback (most recent call last):
File “C:\ProgramData\Anaconda3\lib\runpy.py”, line 193, in _run_module_as_main
INFO: [numexpr.utils] NumExpr defaulting to 8 threads.
"__main__", mod_spec)
File “C:\ProgramData\Anaconda3\lib\runpy.py”, line 85, in _run_code
exec(code, run_globals)
File “C:\ProgramData\Anaconda3\lib\site-packages\guild\batch_main.py”, line 38, in <module>
main()
File “C:\ProgramData\Anaconda3\lib\site-packages\guild\batch_main.py”, line 26, in main
batch_util.handle_trials(batch_run, trials)
File “C:\ProgramData\Anaconda3\lib\site-packages\guild\batch_util.py”, line 54, in handle_trials
_run_trials(batch_run, trials)
File “C:\ProgramData\Anaconda3\lib\site-packages\guild\batch_util.py”, line 79, in _run_trials
_start_trial_run(run, stage)
File “C:\ProgramData\Anaconda3\lib\site-packages\guild\batch_util.py”, line 117, in _start_trial_run
run_impl.run(restart=run.id, stage=stage)
File “C:\ProgramData\Anaconda3\lib\site-packages\guild\commands\run_impl.py”, line 1940, in run
main(args)
File “C:\ProgramData\Anaconda3\lib\site-packages\guild\commands\run_impl.py”, line 1017, in main
_dispatch_op(S)
File “C:\ProgramData\Anaconda3\lib\site-packages\guild\commands\run_impl.py”, line 1101, in _dispatch_op
_dispatch_op_cmd(S)
File “C:\ProgramData\Anaconda3\lib\site-packages\guild\commands\run_impl.py”, line 1286, in _dispatch_op_cmd
_confirm_and_run(S)
File “C:\ProgramData\Anaconda3\lib\site-packages\guild\commands\run_impl.py”, line 1354, in _confirm_and_run
_run(S)
File “C:\ProgramData\Anaconda3\lib\site-packages\guild\commands\run_impl.py”, line 1544, in _run
_run_local(S)
File “C:\ProgramData\Anaconda3\lib\site-packages\guild\commands\run_impl.py”, line 1575, in _run_local
_run_op(op, S.args)
File “C:\ProgramData\Anaconda3\lib\site-packages\guild\commands\run_impl.py”, line 1683, in _run_op
extra_env=extra_env,
File “C:\ProgramData\Anaconda3\lib\site-packages\guild\op.py”, line 160, in run
exit_status = _run(run, op, quiet, stop_after, extra_env)
File “C:\ProgramData\Anaconda3\lib\site-packages\guild\op.py”, line 195, in _run
exit_status = _op_wait_for_proc(op, proc, run, quiet, stop_after)
File “C:\ProgramData\Anaconda3\lib\site-packages\guild\op.py”, line 230, in _op_wait_for_proc
return _op_watch_proc(op, proc, run, quiet, stop_after)
File “C:\ProgramData\Anaconda3\lib\site-packages\guild\op.py”, line 238, in _op_watch_proc
return _proc_wait(proc, stop_after)
File “C:\ProgramData\Anaconda3\lib\site-packages\guild\op.py”, line 259, in __exit__
self._output.wait_and_close()
File “C:\ProgramData\Anaconda3\lib\site-packages\guild\op_util_legacy.py”, line 254, in wait_and_close
self.close()
File “C:\ProgramData\Anaconda3\lib\site-packages\guild\op_util_legacy.py”, line 219, in close
lock = self._acquire_output_lock()
File “C:\ProgramData\Anaconda3\lib\site-packages\guild\op_util_legacy.py”, line 232, in _acquire_output_lock
raise RuntimeError(“timeout”)
RuntimeError: timeout