Util.py revision df944f1f83420b44e3a41d379c361b797c827b42
1import os, sys
2
def detectCPUs():
    """
    Detects the number of CPUs on a system. Cribbed from pp.

    The following probes are tried in order, and the first one that yields a
    positive integer wins:

      1. os.sysconf("SC_NPROCESSORS_ONLN"), when that name is known.
      2. The output of "sysctl -n hw.ncpu", when os.sysconf exists but does
         not know SC_NPROCESSORS_ONLN (the OS X case).
      3. The NUMBER_OF_PROCESSORS environment variable (Windows).

    Returns 1 when no probe produces a usable value.
    """
    # Imported locally, like the other helpers in this file do.
    import subprocess

    # Linux, Unix and MacOS:
    if hasattr(os, "sysconf"):
        if "SC_NPROCESSORS_ONLN" in os.sysconf_names:
            # Linux & Unix:
            ncpus = os.sysconf("SC_NPROCESSORS_ONLN")
            if isinstance(ncpus, int) and ncpus > 0:
                return ncpus
        else: # OSX:
            try:
                p = subprocess.Popen(["sysctl", "-n", "hw.ncpu"],
                                     stdout=subprocess.PIPE,
                                     stderr=subprocess.PIPE)
                # communicate() drains and closes both pipes.
                out, _ = p.communicate()
                ncpus = int(out.strip())
                if ncpus > 0:
                    return ncpus
            except (OSError, ValueError):
                # Best effort only: sysctl is missing or printed something
                # that is not a number. Fall through to the next probe.
                pass

    # Windows:
    if "NUMBER_OF_PROCESSORS" in os.environ:
        try:
            ncpus = int(os.environ["NUMBER_OF_PROCESSORS"])
        except ValueError:
            # A malformed value is treated the same as an absent one.
            ncpus = 0
        if ncpus > 0:
            return ncpus

    return 1 # Default
22
def mkdir_p(path):
    """mkdir_p(path) - Make the "path" directory, if it does not exist; this
    will also make directories for any missing parent directories.

    An empty path, or a path that already exists, is a no-op. An OSError
    raised by os.mkdir is propagated unless its errno is EEXIST."""
    import errno

    if not path or os.path.exists(path):
        return

    # Create the ancestors first. os.path.dirname() returns its argument
    # unchanged once the root is reached, which ends the recursion.
    parent = os.path.dirname(path)
    if parent != path:
        mkdir_p(parent)

    try:
        os.mkdir(path)
    except OSError as e:
        # Ignore EEXIST, which may occur during a race condition.
        if e.errno != errno.EEXIST:
            raise
41
def capture(args, env=None):
    """capture(args, [env]) - Run the given command (a program name or an
    argv list) and return its standard output.

    The command is started directly through subprocess.Popen; no shell is
    involved. "env", when given, is passed to Popen as the child's
    environment. Standard error is captured and discarded, and the exit
    status is not checked. The output is returned exactly as
    Popen.communicate() produces it (a byte string)."""
    import subprocess

    p = subprocess.Popen(args, stdout=subprocess.PIPE, stderr=subprocess.PIPE,
                         env=env)
    # communicate() reads both pipes to EOF, so a chatty stderr cannot
    # block the child.
    out,_ = p.communicate()
    return out
50
def which(command, paths = None):
    """which(command, [paths]) - Look up the given command in the paths string
    (or the PATH environment variable, if unspecified).

    If "command" already names an existing non-directory path (absolute or
    relative to the current directory) it is returned unchanged. Otherwise
    each entry of "paths" (split on os.pathsep) is searched, trying every
    suffix listed in the PATHEXT environment variable; when PATHEXT is unset
    the bare name is tried. Directories are never returned, since a
    directory that shares the command's name is not the command.

    Returns the first matching path, or None when nothing matches."""

    if paths is None:
        paths = os.environ.get('PATH','')

    # Check for a direct match first.
    if os.path.exists(command) and not os.path.isdir(command):
        return command

    # Would be nice if Python had a lib function for this.
    if not paths:
        paths = os.defpath

    # Get suffixes to search. An unset PATHEXT yields [''], i.e. the bare
    # command name.
    pathext = os.environ.get('PATHEXT', '').split(os.pathsep)

    # Search the paths...
    for path in paths.split(os.pathsep):
        for ext in pathext:
            p = os.path.join(path, command + ext)
            if os.path.exists(p) and not os.path.isdir(p):
                return p

    return None
77
def checkToolsPath(dir, tools):
    """checkToolsPath(dir, tools) - Return True if every name in "tools"
    exists inside the "dir" directory, and False as soon as one is missing.
    An empty "tools" sequence yields True."""
    return all(os.path.exists(os.path.join(dir, name)) for name in tools)
83
def whichTools(tools, paths):
    """whichTools(tools, paths) - Return the first entry of the "paths"
    string (split on os.pathsep) for which checkToolsPath() reports that all
    of "tools" are present, or None if no entry qualifies."""
    matching = (entry for entry in paths.split(os.pathsep)
                if checkToolsPath(entry, tools))
    return next(matching, None)
89
def printHistogram(items, title = 'Items'):
    """printHistogram(items, [title]) - Print a timing report for "items" to
    standard output.

    "items" is a list of (name, value) pairs, where value is a time in
    seconds. The list is sorted in place by ascending value. The report has
    two parts: the (up to) 20 slowest entries, followed by a histogram whose
    rows are half-open ranges [i*barH, (i+1)*barH) with a bar showing the
    fraction of items in that range.

    Nothing is printed for an empty list. When the largest value is not
    positive only the "slowest" part is printed, since no bar height can be
    derived from it."""
    import itertools
    import math

    if not items:
        return

    items.sort(key = lambda item: item[1])

    barW = 40
    hr = '-' * (barW + 34)
    print('\nSlowest %s:' % title)
    print(hr)
    for name,value in items[-20:]:
        print('%.2fs: %s' % (value, name))

    maxValue = max(v for _,v in items)
    if maxValue <= 0:
        # math.log() below is undefined here.
        return

    # Select first "nice" bar height that produces more than 10 bars. The
    # candidates walk down through 5, 2, 2.5 and 1 times a power of ten,
    # dropping to the next lower power after each full cycle.
    power = int(math.ceil(math.log(maxValue, 10)))
    for inc in itertools.cycle((5, 2, 2.5, 1)):
        barH = inc * 10**power
        # float() keeps the ceil meaningful when both operands are ints.
        N = int(math.ceil(float(maxValue) / barH))
        if N > 10:
            break
        elif inc == 1:
            power -= 1

    # Bin by bar height so each item lands in the row whose printed range
    # contains it; the maximum itself is clamped into the last row.
    counts = [0] * N
    for _,v in items:
        index = max(0, min(int(v / barH), N-1))
        counts[index] += 1

    print('\n%s Times:' % title)
    print(hr)
    # Field widths: pDigits is the width of a range bound, pfDigits the
    # number of decimals shown, cDigits the width of a count.
    pDigits = int(math.ceil(math.log(maxValue, 10)))
    pfDigits = max(0, 3-pDigits)
    if pfDigits:
        pDigits += pfDigits + 1
    cDigits = len(str(len(items)))
    print("[%s] :: [%s] :: [%s]" % ('Range'.center((pDigits+1)*2 + 3),
                                    'Percentage'.center(barW),
                                    'Count'.center(cDigits*2 + 1)))
    print(hr)
    for i,count in enumerate(counts):
        pct = float(count) / len(items)
        w = int(barW * pct)
        print("[%*.*fs,%*.*fs) :: [%s%s] :: [%*d/%*d]" % (
            pDigits, pfDigits, i*barH,
            pDigits, pfDigits, (i+1)*barH,
            '*'*w, ' '*(barW-w),
            cDigits, count,
            cDigits, len(items)))
137
138