/usr/lib/python2.7/dist-packages/scoop/utils.py is in python-scoop 0.7.1.1-2.
This file is owned by root:root, with mode 0o644.
The actual contents of the file can be viewed below.
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24 25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 46 47 48 49 50 51 52 53 54 55 56 57 58 59 60 61 62 63 64 65 66 67 68 69 70 71 72 73 74 75 76 77 78 79 80 81 82 83 84 85 86 87 88 89 90 91 92 93 94 95 96 97 98 99 100 101 102 103 104 105 106 107 108 109 110 111 112 113 114 115 116 117 118 119 120 121 122 123 124 125 126 127 128 129 130 131 132 133 134 135 136 137 138 139 140 141 142 143 144 145 146 147 148 149 150 151 152 153 154 155 156 157 158 159 160 161 162 163 164 165 166 167 168 169 170 171 172 173 174 175 176 177 178 179 180 181 182 183 184 185 186 187 188 189 190 191 192 193 194 195 196 197 198 199 200 201 202 203 204 205 206 207 208 209 210 211 212 213 214 215 216 217 218 219 220 221 222 223 224 225 226 227 228 229 230 231 232 233 234 235 236 237 238 239 240 241 242 243 244 245 246 247 248 249 250 251 252 253 254 255 256 257 258 259 260 261 262 263 264 265 266 267 268 269 270 | #!/usr/bin/env python
#
# This file is part of Scalable COncurrent Operations in Python (SCOOP).
#
# SCOOP is free software: you can redistribute it and/or modify
# it under the terms of the GNU Lesser General Public License as
# published by the Free Software Foundation, either version 3 of
# the License, or (at your option) any later version.
#
# SCOOP is distributed in the hope that it will be useful,
# but WITHOUT ANY WARRANTY; without even the implied warranty of
# MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
# GNU Lesser General Public License for more details.
#
# You should have received a copy of the GNU Lesser General Public
# License along with SCOOP. If not, see <http://www.gnu.org/licenses/>.
#
from multiprocessing import cpu_count
from itertools import groupby
import os
import re
import sys
import socket
import logging
if sys.version_info < (2, 7):
from scoop.backports.dictconfig import dictConfig
else:
from logging.config import dictConfig
# Names and addresses that always designate the local machine.
loopbackReferences = [
    "127.0.0.1",
    "localhost",
    "::1",
]

# Identifiers under which this host may appear in a host list: the loopback
# references plus the short (domain-less) name of this machine.
localHostnames = loopbackReferences + [
    socket.getfqdn().split('.')[0],
]

# Also register the first non-loopback address the resolver reports for
# this host, if there is one.
try:
    localHostnames.extend([
        ip for ip in socket.gethostbyname_ex(socket.gethostname())[2]
        if not ip.startswith("127.")][:1]
    )
except socket.error:
    # The local host name is not always resolvable (no DNS or hosts entry).
    # This extra address is only a convenience, so importing the module
    # must not fail because of it.
    pass
# Logger configurations accumulated across initLogging() calls, keyed by
# logger name. Every call hands the whole mapping back to dictConfig().
loggingConfig = {}


def initLogging(verbosity=0, name="SCOOP"):
    """Create, configure and return a logger writing to standard output.

    :param verbosity: Integer from -2 (CRITICAL) to 3 (NOTSET) selecting
        the level of the logger; 0 (the default) is WARNING.
    :param name: Prefix used to build the logger name ("<name>Logger") and
        the formatter name ("<name>Formatter").
    :returns: The configured ``logging.Logger`` named "<name>Logger".
    :raises KeyError: If *verbosity* is outside the -2..3 range.
    """
    global loggingConfig
    verbose_levels = {
        -2: "CRITICAL",
        -1: "ERROR",
        0: "WARNING",
        1: "INFO",
        2: "DEBUG",
        # "NOTSET" is the level name known to the logging module; the
        # former "NOSET" spelling made dictConfig() reject the
        # configuration. A NOTSET logger defers to its ancestors' level.
        3: "NOTSET",
    }
    logger_name = "{name}Logger".format(name=name)
    formatter_name = "{name}Formatter".format(name=name)
    log_handlers = {
        "console":
        {
            "class": "logging.StreamHandler",
            "formatter": formatter_name,
            "stream": "ext://sys.stdout",
        },
    }
    # Remember this logger alongside the ones configured by earlier calls.
    loggingConfig.update({
        logger_name:
        {
            "handlers": ["console"],
            "level": verbose_levels[verbosity],
        },
    })
    dict_log_config = {
        "version": 1,
        "handlers": log_handlers,
        "loggers": loggingConfig,
        "formatters":
        {
            formatter_name:
            {
                "format": "[%(asctime)-15s] %(module)-9s "
                          "%(levelname)-7s %(message)s",
            },
        },
    }
    dictConfig(dict_log_config)
    return logging.getLogger(logger_name)
def externalHostname(hosts):
    """Return the name under which the first host can be reached.

    The first item of the first entry of *hosts* is used as-is unless it
    designates the local machine while other hosts are present. In that
    case the short name of this machine is returned instead, after
    checking that it can be resolved.

    :raises Exception: If the substituted name cannot be resolved.
    """
    first_host = hosts[0][0]
    is_local = first_host in localHostnames
    if not (is_local and len(hosts) > 1):
        return first_host

    # Remote hosts cannot use a loopback-style reference to reach this
    # machine, so hand out its short host name.
    short_name = socket.getfqdn().split(".")[0]
    try:
        socket.getaddrinfo(short_name, None)
    except socket.gaierror:
        raise Exception("\nThe first host (containing a broker) is not"
                        " routable.\nMake sure the address is correct.")
    return short_name
def groupTogether(in_list):
    """Return the items of *in_list* with equal items made adjacent.

    Groups appear in order of first occurrence, and every member of a
    group is the first item seen for that group.

    :param in_list: Iterable of items to regroup.
    :returns: A new list holding the regrouped items.
    """
    items = list(in_list)
    counts = {}
    first_seen = []
    try:
        # Single pass: count each item and remember first-occurrence order.
        for element in items:
            if element in counts:
                counts[element] += 1
            else:
                counts[element] = 1
                first_seen.append(element)
    except TypeError:
        # Unhashable items cannot be dictionary keys; fall back to the
        # equality-based scan so that such inputs keep working.
        grouped = []
        handled = []
        for index, element in enumerate(items):
            if element not in handled:
                grouped += [element] * items[index:].count(element)
                handled.append(element)
        return grouped

    grouped = []
    for element in first_seen:
        grouped.extend([element] * counts[element])
    return grouped
def getCPUcount():
    """Return the CPU count of this host, or 1 when it cannot be found."""
    try:
        detected = cpu_count()
    except NotImplementedError:
        detected = 1
    return detected
def getEnv():
    """Return the name of the environment the program was launched from.

    The result is "SLURM", "PBS" or "SGE" when the matching environment
    variable is set (checked in that order), and "other" otherwise.
    """
    markers = (
        ("SLURM_NODELIST", "SLURM"),
        ("PBS_ENVIRONMENT", "PBS"),
        ("PE_HOSTFILE", "SGE"),
    )
    for variable, scheduler in markers:
        if variable in os.environ:
            return scheduler
    return "other"
def getHosts(filename=None, hostlist=None):
    """Return the list of hosts to use.

    Sources are tried in this order: the host file *filename*, the
    explicit *hostlist*, then the SLURM, PBS and SGE environments. When
    none applies, the default local host is returned.
    """
    # Explicit arguments take precedence over the environment.
    if filename:
        return getHostsFromFile(filename)
    if hostlist:
        return getHostsFromList(hostlist)

    # Otherwise rely on the variables set by the job scheduler, if any.
    if "SLURM_NODELIST" in os.environ:
        return getHostsFromSLURM()
    if "PBS_ENVIRONMENT" in os.environ:
        return getHostsFromPBS()
    if "PE_HOSTFILE" in os.environ:
        return getHostsFromSGE()

    return getDefaultHosts()
def getHostsFromFile(filename):
    """Parse a host file and return a list of (hostname, workers) tuples.

    Each line is either a SLURM-style grouping (recognized by the presence
    of square brackets and expanded with parseSLURM) or a host name
    optionally followed by a number of workers, which defaults to 1.
    Lines on which no host name is found are skipped.

    :param filename: Path of the host file to read.
    :returns: List of (hostname, number of workers) tuples in file order.
    """
    hostname_re = re.compile(r"^[^ /\t=\n]+")
    worker_re = re.compile(r"\d+")
    slurm_re = re.compile(r"[\[\]]")
    hosts = []
    with open(filename) as f:
        for raw_line in f:
            line = raw_line.strip()
            # check to see if it is a SLURM grouping instead of a
            # regular list of hosts
            if slurm_re.search(line):
                hosts.extend(parseSLURM(line))
                continue
            host = hostname_re.search(line)
            if not host:
                continue
            # Look for the worker count in the same stripped string the
            # host name was matched in, so that host.end() is a valid
            # offset even when the line starts with whitespace.
            workers = worker_re.search(line[host.end():])
            count = int(workers.group()) if workers else 1
            hosts.append((host.group(), count))
    return hosts
def getHostsFromList(hostlist):
    """Return the hosts given on the command line.

    :param hostlist: Sequence of host names, where a name repeated N times
        stands for N workers, or SLURM-style groupings such as
        "node[001-004]".
    :returns: List of (hostname, number of workers) tuples.
    """
    # check to see if it is a SLURM grouping instead of a
    # regular list of hosts
    if any(re.search(r'[\[\]]', x) for x in hostlist):
        # Hand parseSLURM the entries themselves rather than the repr of
        # the list: the repr's quote characters would otherwise end up in
        # the generated host names.
        if isStr(hostlist):
            slurm_spec = hostlist
        else:
            slurm_spec = ",".join(hostlist)
        # NOTE(review): entries without brackets mixed with groupings are
        # not matched by parseSLURM and are therefore ignored here.
        return parseSLURM(slurm_spec)
    # Counter would be more efficient but:
    # 1. Won't be Python 2.6 compatible
    # 2. Won't be ordered
    hostlist = groupTogether(hostlist)
    return [(key, len(list(group))) for key, group in groupby(hostlist)]
def parseSLURM(string):
    """Return a host list from a SLURM string.

    Every "prefix[...]" group found in *string* is expanded. The brackets
    hold comma-separated entries, each being either a "first-last" range
    or a single index (ex. borgb[001-002,004]). Generated indices are
    zero-padded to the width of the widest bound of their entry.

    :param string: Text containing SLURM-style host groupings.
    :returns: List of (hostname, 1) tuples in order of appearance.
    :raises ValueError: If a bound is not an integer.
    """
    bunchedlist = re.findall(r'([^ /\t=\n\[,]+)(?=\[)(.*?)(?<=\])', string)
    hosts = []
    # parse out the name followed by ranges (ex. borgb[001-002,004-006])
    for prefix, bracketed in bunchedlist:
        for rng in re.findall(r'([^\[\],]+)', bracketed):
            first, dash, last = rng.partition('-')
            if not dash:
                # A lone index stands for a range of a single host.
                last = first
            fill_width = max(len(first), len(last))
            for i in range(int(first), int(last) + 1):
                hostname = str(prefix) + str(i).zfill(fill_width)
                hosts.append((hostname, 1))
    return hosts
def getHostsFromSLURM():
    """Build the host list from the SLURM_NODELIST environment variable."""
    nodelist = os.environ["SLURM_NODELIST"]
    return parseSLURM(nodelist)
def getHostsFromPBS():
    """Build the host list from the file named by PBS_NODEFILE.

    The file is read as whitespace-separated host names; the number of
    times a name appears becomes its number of workers.
    """
    with open(os.environ["PBS_NODEFILE"], 'r') as nodefile:
        node_names = nodefile.read().split()
    # Counter is avoided for the reasons given in getHostsFromList.
    regrouped = groupTogether(node_names)
    return [(name, len(list(run))) for name, run in groupby(regrouped)]
def getHostsFromSGE():
    """Return a host list in a SGE environment.

    Reads the file named by the PE_HOSTFILE environment variable. The
    first whitespace-separated field of each line is the host name and
    the second its number of workers; blank lines are skipped.

    :returns: List of (hostname, number of workers) tuples in file order.
    """
    hosts = []
    with open(os.environ["PE_HOSTFILE"], 'r') as hostfile:
        for line in hostfile:
            fields = line.split()
            if not fields:
                # An empty line carries no host and must not abort parsing.
                continue
            hosts.append((fields[0], int(fields[1])))
    return hosts
def getWorkerQte(hosts):
    """Return the number of workers to launch.

    The first of the SLURM_NTASKS, PBS_NP and NSLOTS environment variables
    that is set gives the answer; otherwise the worker counts found in
    *hosts* (second item of each entry) are added up.
    """
    for variable in ("SLURM_NTASKS", "PBS_NP", "NSLOTS"):
        if variable in os.environ:
            return int(os.environ[variable])
    return sum(entry[1] for entry in hosts)
def KeyboardInterruptHandler(signum, frame):
    """Interruption handler: always raises KeyboardInterrupt.

    Both arguments are accepted and ignored.
    """
    interruption = KeyboardInterrupt("Shutting down!")
    raise interruption
def getDefaultHosts():
    """Return the host list of a plain local launch.

    It holds a single entry: the loopback address paired with the number
    of CPUs reported by getCPUcount().
    """
    local_workers = getCPUcount()
    return [('127.0.0.1', local_workers)]
try:
    # Python 2.X: basestring is the common base of str and unicode.
    _string_types = basestring
except NameError:
    # basestring is not defined: str is the type to test against.
    _string_types = str


def isStr(string):
    """Tell whether *string* is a character string."""
    return isinstance(string, _string_types)
|