forked from lukeconibear/distributed_deep_learning
-
Notifications
You must be signed in to change notification settings - Fork 0
/
distributed.yaml
116 lines (116 loc) · 4.48 KB
/
distributed.yaml
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
# distributed:
# # version: 2
# # # logging:
# # # distributed: info
# # # distributed.client: warning
# # # bokeh: critical
# # # # http://stackoverflow.com/questions/21234772/python-tornado-disable-logging-to-stderr
# # # tornado: critical
# # # tornado.application: error
#
# # scheduler:
# # allowed-failures: 3 # number of retries before a task is considered bad
# # bandwidth: 100000000 # 100 MB/s estimated worker-worker bandwidth
# # blocked-handlers: []
# # default-data-size: 1000
# # # Number of seconds to wait until workers or clients are removed from the events log
# # # after they have been removed from the scheduler
# # events-cleanup-delay: 1h
# # idle-timeout: null # Shut down after this duration, like "1h" or "30 minutes"
# # transition-log-length: 100000
# # work-stealing: True # workers should steal tasks from each other
# # worker-ttl: null # like '60s'. Time to live for workers. They must heartbeat faster than this
# # pickle: True # Is the scheduler allowed to deserialize arbitrary bytestrings?
# # preload: []
# # preload-argv: []
# # dashboard:
# # status:
# # task-stream-length: 1000
# # tasks:
# # task-stream-length: 100000
# # tls:
# # ca-file: null
# # key: null
# # cert: null
#
# # worker:
# # blocked-handlers: []
# # multiprocessing-method: forkserver
# # use-file-locking: True
# # connections: # Maximum concurrent connections for data
# # outgoing: 50 # This helps to control network saturation
# # incoming: 10
# # preload: []
# # preload-argv: []
# # daemon: True
# # lifetime:
# # duration: null # Time after which to gracefully shut down the worker
# # stagger: 0 seconds # Random amount by which to stagger lifetimes
# # restart: False # Do we resurrect the worker after the lifetime deadline?
#
# # profile:
# # interval: 10ms # Time between statistical profiling queries
# # cycle: 1000ms # Time between starting new profiles
# # low-level: False # Whether or not to include low-level functions
# # # Requires https://github.com/numba/stacktrace
#
# # # Fractions of worker memory at which we take action to avoid memory blowup
# # # Set any of the lower three values to False to turn off the behavior entirely
# # memory:
# # target: 0.60 # target fraction to stay below
# # spill: 0.70 # fraction at which we spill to disk
# # pause: 0.80 # fraction at which we pause worker threads
# # terminate: 0.95 # fraction at which we terminate the worker
#
# # client:
# # heartbeat: 5s # time between client heartbeats
#
# # comm:
# # compression: auto
# # default-scheme: tcp
# # socket-backlog: 2048
# # recent-messages-log-length: 0 # number of messages to keep for debugging
#
# # timeouts:
# # connect: 10s # time before connecting fails
# # tcp: 30s # time before calling an unresponsive connection dead
#
# # require-encryption: False # Whether to require encryption on non-local comms
#
# # tls:
# # ciphers: null # Allowed ciphers, specified as an OpenSSL cipher string.
# # ca-file: null # Path to a CA file, in pem format, optional
# # scheduler:
# # cert: null # Path to certificate file for scheduler.
# # key: null # Path to key file for scheduler. Alternatively, the key
# # # can be appended to the cert file above, and this field
# # # left blank.
# # worker:
# # key: null
# # cert: null
# # client:
# # key: null
# # cert: null
#
#
# # ###################
# # # Bokeh dashboard #
# # ###################
#
# # dashboard:
# # link: "{scheme}://{host}:{port}/status"
# # export-tool: False
# link: "/proxy/{port}/status"
#
# # ##################
# # # Administrative #
# # ##################
#
# # admin:
# # tick:
# # interval: 20ms # time between event loop health checks
# # limit: 3s # time allowed before triggering a warning
#
# # log-length: 10000 # default length of logs to keep in memory
# # log-format: '%(name)s - %(levelname)s - %(message)s'
# # pdb-on-err: False # enter debug mode on scheduling error