Skip to content

Commit

Permalink
bring all workers online
Browse files (browse the repository at this point in the history)
  • Loading branch information
phueb committed May 13, 2021
1 parent c0243ce commit 8228482
Show file tree
Hide file tree
Showing 2 changed files with 3 additions and 4 deletions.
3 changes: 2 additions & 1 deletion ludwig/__main__.py
Original file line number Diff line number Diff line change
Expand Up @@ -55,7 +55,8 @@ def status():
status_, output = subprocess.getstatusoutput(command)

if status_ != 0:
return 'Something went wrong. Check your access to the shared drive. Try using --mnt flag.'
print(output)
return 'Something went wrong. Check your access to the shared drive. Try using -mnt PATH_TO_DRIVE.'

lines = str(output).split('\n')
lines_with_ludwig_status = [line for line in lines if 'Ludwig' in line]
Expand Down
4 changes: 1 addition & 3 deletions ludwig/configs.py
Original file line number Diff line number Diff line change
Expand Up @@ -12,9 +12,7 @@ class WorkerDirs:
class Remote:
watched_pattern = 'run*.py' # this is required for watcher to know which file to run
path_to_ssh_config = Path.home() / '.ssh' / 'ludwig_config'
online_worker_names = ['norman', 'hebb', 'hinton', 'pitts', 'hawkins', 'lecun']
# TODO bengio is down - march 24 2020
# todo hoff - no NVIDIA driver found by torch.
online_worker_names = ['norman', 'hebb', 'hinton', 'pitts', 'hawkins', 'lecun', 'hoff', 'bengio']
all_worker_names = ['hoff', 'norman', 'hebb', 'hinton', 'pitts', 'hawkins', 'bengio', 'lecun']
group2workers = {'half1': ['hoff', 'norman', 'hebb', 'hinton'],
'half2': ['pitts', 'hawkins', 'bengio', 'lecun']}
Expand Down

0 comments on commit 8228482

Please sign in to comment.