update
This commit is contained in:
parent
36bb07ef1a
commit
3ebbf8833f
661
data/ps_mem.py
Normal file
661
data/ps_mem.py
Normal file
@ -0,0 +1,661 @@
|
||||
#!/usr/bin/env python
|
||||
|
||||
# Try to determine how much RAM is currently being used per program.
|
||||
# Note per _program_, not per process. So for example this script
|
||||
# will report RAM used by all httpd process together. In detail it reports:
|
||||
# sum(private RAM for program processes) + sum(Shared RAM for program processes)
|
||||
# The shared RAM is problematic to calculate, and this script automatically
|
||||
# selects the most accurate method available for your kernel.
|
||||
|
||||
# Licence: LGPLv2
|
||||
# Author: P@draigBrady.com
|
||||
# Source: http://www.pixelbeat.org/scripts/ps_mem.py
|
||||
|
||||
# V1.0 06 Jul 2005 Initial release
|
||||
# V1.1 11 Aug 2006 root permission required for accuracy
|
||||
# V1.2 08 Nov 2006 Add total to output
|
||||
# Use KiB,MiB,... for units rather than K,M,...
|
||||
# V1.3 22 Nov 2006 Ignore shared col from /proc/$pid/statm for
|
||||
# 2.6 kernels up to and including 2.6.9.
|
||||
# There it represented the total file backed extent
|
||||
# V1.4 23 Nov 2006 Remove total from output as it's meaningless
|
||||
# (the shared values overlap with other programs).
|
||||
# Display the shared column. This extra info is
|
||||
# useful, especially as it overlaps between programs.
|
||||
# V1.5 26 Mar 2007 Remove redundant recursion from human()
|
||||
# V1.6 05 Jun 2007 Also report number of processes with a given name.
|
||||
# Patch from riccardo.murri@gmail.com
|
||||
# V1.7 20 Sep 2007 Use PSS from /proc/$pid/smaps if available, which
|
||||
# fixes some over-estimation and allows totalling.
|
||||
# Enumerate the PIDs directly rather than using ps,
|
||||
# which fixes the possible race between reading
|
||||
# RSS with ps, and shared memory with this program.
|
||||
# Also we can show non truncated command names.
|
||||
# V1.8 28 Sep 2007 More accurate matching for stats in /proc/$pid/smaps
|
||||
# as otherwise could match libraries causing a crash.
|
||||
# Patch from patrice.bouchand.fedora@gmail.com
|
||||
# V1.9 20 Feb 2008 Fix invalid values reported when PSS is available.
|
||||
# Reported by Andrey Borzenkov <arvidjaar@mail.ru>
|
||||
# V3.13 17 Sep 2018
|
||||
# http://github.com/pixelb/scripts/commits/master/scripts/ps_mem.py
|
||||
|
||||
# Notes:
|
||||
#
|
||||
# All interpreted programs where the interpreter is started
|
||||
# by the shell or with env, will be merged to the interpreter
|
||||
# (as that's what's given to exec). For e.g. all python programs
|
||||
# starting with "#!/usr/bin/env python" will be grouped under python.
|
||||
# You can change this by using the full command line but that will
|
||||
# have the undesirable effect of splitting up programs started with
|
||||
# differing parameters (for e.g. mingetty tty[1-6]).
|
||||
#
|
||||
# For 2.6 kernels up to and including 2.6.13 and later 2.4 redhat kernels
|
||||
# (rmap vm without smaps) it can not be accurately determined how many pages
|
||||
# are shared between processes in general or within a program in our case:
|
||||
# http://lkml.org/lkml/2005/7/6/250
|
||||
# A warning is printed if overestimation is possible.
|
||||
# In addition for 2.6 kernels up to 2.6.9 inclusive, the shared
|
||||
# value in /proc/$pid/statm is the total file-backed extent of a process.
|
||||
# We ignore that, introducing more overestimation, again printing a warning.
|
||||
# Since kernel 2.6.23-rc8-mm1 PSS is available in smaps, which allows
|
||||
# us to calculate a more accurate value for the total RAM used by programs.
|
||||
#
|
||||
# Programs that use CLONE_VM without CLONE_THREAD are discounted by assuming
|
||||
# they're the only programs that have the same /proc/$PID/smaps file for
|
||||
# each instance. This will fail if there are multiple real instances of a
|
||||
# program that then use CLONE_VM without CLONE_THREAD, or if a clone changes
|
||||
# its memory map while we're checksumming each /proc/$PID/smaps.
|
||||
#
|
||||
# I don't take account of memory allocated for a program
|
||||
# by other programs. For e.g. memory used in the X server for
|
||||
# a program could be determined, but is not.
|
||||
#
|
||||
# FreeBSD is supported if linprocfs is mounted at /compat/linux/proc/
|
||||
# FreeBSD 8.0 supports up to a level of Linux 2.6.16
|
||||
|
||||
import getopt
|
||||
import time
|
||||
import errno
|
||||
import os
|
||||
import sys
|
||||
|
||||
# The following exits cleanly on Ctrl-C or EPIPE
|
||||
# while treating other exceptions as before.
|
||||
def std_exceptions(etype, value, tb):
    """Excepthook that stays silent on Ctrl-C or a broken pipe.

    The default hook is restored first, so this handler only ever deals
    with one exception.  KeyboardInterrupt and IOError with errno EPIPE
    are swallowed; everything else is passed to sys.__excepthook__.
    """
    sys.excepthook = sys.__excepthook__
    interrupted = issubclass(etype, KeyboardInterrupt)
    # "not interrupted" comes first so value.errno is only read when the
    # exception was not already recognised as a Ctrl-C.
    broken_pipe = (not interrupted
                   and issubclass(etype, IOError)
                   and value.errno == errno.EPIPE)
    if not (interrupted or broken_pipe):
        sys.__excepthook__(etype, value, tb)

sys.excepthook = std_exceptions
|
||||
|
||||
#
|
||||
# Define some global variables
|
||||
#
|
||||
|
||||
# Size of one memory page in KiB; multiplies the page counts read from
# /proc/$pid/statm.
PAGESIZE = os.sysconf("SC_PAGE_SIZE") / 1024
# PID of this script, used to filter ourselves out of the report.
our_pid = os.getpid()

# Flags switched to 1 by getMemStats() once a Pss / SwapPss line is seen.
have_swap_pss = 0
have_pss = 0
|
||||
|
||||
class Unbuffered(object):
    """Wrap a stream so that every write is flushed immediately.

    Attributes that are not defined here (isatty, fileno, encoding, ...)
    are looked up on the wrapped stream, so the wrapper can replace
    sys.stdout / sys.stderr without breaking code that uses them.
    """

    def __init__(self, stream):
        self.stream = stream

    def write(self, data):
        self.stream.write(data)
        self.stream.flush()

    def writelines(self, lines):
        # Defined explicitly so that it flushes too, instead of being
        # delegated to the wrapped stream by __getattr__.
        self.stream.writelines(lines)
        self.stream.flush()

    def close(self):
        self.stream.close()

    def flush(self):
        self.stream.flush()

    def __getattr__(self, attr):
        # Only reached for names missing on the wrapper.  Guard 'stream'
        # itself so a half-initialised instance cannot recurse forever.
        if attr == 'stream':
            raise AttributeError(attr)
        return getattr(self.stream, attr)
|
||||
|
||||
class Proc:
    """Build paths below the proc filesystem root and open files there."""

    def __init__(self):
        # FreeBSD exposes the Linux-style procfs under /compat/linux/proc.
        on_freebsd = os.uname()[0] == "FreeBSD"
        self.proc = ('/proc', '/compat/linux/proc')[on_freebsd]

    def path(self, *args):
        """Return the proc root joined with str() of every argument."""
        parts = [str(a) for a in args]
        return os.path.join(self.proc, *parts)

    def open(self, *args):
        """Open the file at path(*args) for reading.

        Raises LookupError when the open fails with ENOENT, EPERM or
        EACCES; any other IOError/OSError propagates unchanged.
        """
        try:
            target = self.path(*args)
            if sys.version_info >= (3,):
                # Python 3: drop undecodable bytes instead of raising.
                return open(target, errors='ignore')
            return open(target)
        except (IOError, OSError):
            err = sys.exc_info()[1]
            # ENOENT: kernel thread or process gone
            if err.errno in (errno.ENOENT, errno.EPERM, errno.EACCES):
                raise LookupError
            raise


proc = Proc()
|
||||
|
||||
|
||||
#
|
||||
# Functions
|
||||
#
|
||||
|
||||
def parse_options():
    """Parse sys.argv[1:] and return the selected settings.

    Returns the tuple
    (split_args, pids_to_show, watch, only_total, discriminate_by_pid,
    show_swap).  pids_to_show is a list of ints or None; watch is an int
    number of seconds or None; the rest are booleans.

    Exits with status 3 after writing to stderr when an option is
    unknown, a positional argument is given, or the value of -p / -w is
    not an integer.  Exits with status 0 after printing the help text or
    the version.
    """
    long_options = [
        'split-args',
        'help',
        'version',
        'total',
        'discriminate-by-pid',
        'swap'
    ]
    try:
        opts, args = getopt.getopt(sys.argv[1:], "shtdSp:w:", long_options)
    except getopt.GetoptError:
        sys.stderr.write(help())
        sys.exit(3)

    if args:
        sys.stderr.write("Extraneous arguments: %s\n" % args)
        sys.exit(3)

    # ps_mem.py options
    split_args = False
    pids_to_show = None
    discriminate_by_pid = False
    show_swap = False
    watch = None
    only_total = False

    for o, a in opts:
        if o in ('-s', '--split-args'):
            split_args = True
        elif o in ('-t', '--total'):
            only_total = True
        elif o in ('-d', '--discriminate-by-pid'):
            discriminate_by_pid = True
        elif o in ('-S', '--swap'):
            show_swap = True
        elif o in ('-h', '--help'):
            sys.stdout.write(help())
            sys.exit(0)
        elif o in ('--version',):
            # One-element tuple: a bare string here would turn the "in"
            # test into a substring match.
            sys.stdout.write('3.13'+'\n')
            sys.exit(0)
        elif o in ('-p',):
            try:
                pids_to_show = [int(x) for x in a.split(',')]
            except ValueError:
                sys.stderr.write(help())
                sys.exit(3)
        elif o in ('-w',):
            try:
                watch = int(a)
            except ValueError:
                sys.stderr.write(help())
                sys.exit(3)

    return (
        split_args,
        pids_to_show,
        watch,
        only_total,
        discriminate_by_pid,
        show_swap
    )
|
||||
|
||||
|
||||
def help():
    """Return the usage text as a single string (nothing is printed)."""
    # The long form of -h is --help: that is what parse_options() accepts.
    help_msg = (
        'Usage: ps_mem [OPTION]...\n'
        'Show program core memory usage\n'
        '\n'
        ' -h, --help Show this help\n'
        ' -p <pid>[,pid2,...pidN] Only show memory usage PIDs in the '
        'specified list\n'
        ' -s, --split-args Show and separate by, all command line'
        ' arguments\n'
        ' -t, --total Show only the total value\n'
        ' -d, --discriminate-by-pid Show by process rather than by program\n'
        ' -S, --swap Show swap information\n'
        ' -w <N> Measure and show process memory every'
        ' N seconds\n'
    )

    return help_msg
|
||||
|
||||
|
||||
# (major,minor,release)
|
||||
def kernel_ver():
    """Return the kernel version as a (major, minor, release) tuple of ints.

    The version is read from sys/kernel/osrelease under the proc root.
    Anything after a "-" or "_" in the minor and release fields is
    dropped, and a field that is still not numeric becomes 0.  Missing
    fields are treated as 0.  A non-numeric major field raises
    ValueError; errors from proc.open() propagate.
    """
    osrelease = proc.open('sys/kernel/osrelease')
    try:
        release = osrelease.readline()
    finally:
        osrelease.close()

    kv = release.split(".")[:3]
    # Pad short version strings ("5.10", or a bare "5") to three fields.
    while len(kv) < 3:
        kv.append('0')

    for idx in (1, 2):
        field = kv[idx]
        for char in "-_":
            field = field.split(char)[0]
        try:
            kv[idx] = int(field)
        except ValueError:
            kv[idx] = 0
    return (int(kv[0]), kv[1], kv[2])
|
||||
|
||||
|
||||
#return Private,Shared,Swap(Pss),unique_id
|
||||
#Note shared is always a subset of rss (trs is not always)
|
||||
def getMemStats(pid):
    """Return (Private, Shared, Swap, mem_id) for one process, sizes in KiB.

    When /proc/$pid/smaps exists the values are summed from it (or from
    smaps_rollup when present), and mem_id is a hash of the file text so
    that processes sharing one memory map get the same id.  Otherwise
    the values come from /proc/$pid/statm and mem_id is the pid.

    Sets the module flags have_pss / have_swap_pss when the matching
    lines are seen.  Errors from proc.open() (LookupError for a vanished
    or unreadable process) propagate to the caller.

    Note shared is always a subset of rss (trs is not always).
    """
    global have_pss
    global have_swap_pss

    def read_lines(name):
        # Read one /proc/$pid file completely and close it right away.
        f = proc.open(pid, name)
        try:
            return f.readlines()
        finally:
            f.close()

    mem_id = pid #unique
    # statm is read once; column 1 is the resident page count and
    # column 2 the shared page count used by the last fallback below.
    statm = read_lines('statm')[0].split()
    Rss = int(statm[1]) * PAGESIZE
    Swap = 0

    if os.path.exists(proc.path(pid, 'smaps')): # stat
        smaps = 'smaps'
        if os.path.exists(proc.path(pid, 'smaps_rollup')):
            smaps = 'smaps_rollup' # faster to process
        lines = read_lines(smaps) # open
        # Note we checksum smaps as maps is usually but
        # not always different for separate processes.
        mem_id = hash(''.join(lines))

        pss_adjust = 0.5 # add 0.5KiB as this avg error due to truncation
        Shared = 0
        Private = 0
        Pss = 0.0
        swap_total = 0
        swap_pss = 0
        for line in lines:
            if line.startswith("Shared"):
                Shared += int(line.split()[1])
            elif line.startswith("Private"):
                Private += int(line.split()[1])
            elif line.startswith("Pss:"):
                # Match the exact field: smaps_rollup on newer kernels
                # also has Pss_Anon/Pss_File/Pss_Shmem breakdown lines,
                # which a plain "Pss" prefix would add on top of Pss.
                have_pss = 1
                Pss += float(line.split()[1]) + pss_adjust
            elif line.startswith("Swap:"):
                swap_total += int(line.split()[1])
            elif line.startswith("SwapPss:"):
                have_swap_pss = 1
                swap_pss += int(line.split()[1])
        #Note Shared + Private = Rss above
        #The Rss in smaps includes video card mem etc.
        if have_pss:
            Shared = Pss - Private
        if have_swap_pss:
            # The kernel supports SwapPss, that shows proportional swap share.
            # Note that Swap - SwapPss is not Private Swap.
            Swap = swap_pss
        else:
            # Note that Swap = Private swap + Shared swap.
            Swap = swap_total
    elif (2,6,1) <= kernel_ver() <= (2,6,9):
        Shared = 0 #lots of overestimation, but what can we do?
        Private = Rss
    else:
        Shared = int(statm[2]) * PAGESIZE
        Private = Rss - Shared
    return (Private, Shared, Swap, mem_id)
|
||||
|
||||
|
||||
def getCmdName(pid, split_args, discriminate_by_pid, exe_only=False):
    """Return the name under which process *pid* is reported.

    split_args          -- return the full command line instead of a name
    discriminate_by_pid -- append " [pid]" to the name
    exe_only            -- return only the basename of the exe link

    Raises LookupError when the process is gone, is a kernel thread, or
    may not be inspected (ENOENT, EPERM or EACCES on its proc files).
    A failure to inspect the *parent* is not an error: the process then
    keeps the name from its own status file.
    """
    cmdline_file = proc.open(pid, 'cmdline')
    try:
        cmdline = cmdline_file.read().split("\0")
    finally:
        cmdline_file.close()
    if cmdline[-1] == '' and len(cmdline) > 1:
        cmdline = cmdline[:-1]

    path = proc.path(pid, 'exe')
    try:
        path = os.readlink(path)
        # Some symlink targets were seen to contain NULs on RHEL 5 at least
        # https://github.com/pixelb/scripts/pull/10, so take string up to NUL
        path = path.split('\0')[0]
    except OSError:
        val = sys.exc_info()[1]
        # ENOENT: either kernel thread or process gone
        if val.errno in (errno.ENOENT, errno.EPERM, errno.EACCES):
            raise LookupError
        raise

    if split_args:
        return ' '.join(cmdline).replace('\n', ' ')
    if path.endswith(" (deleted)"):
        path = path[:-10]
        if os.path.exists(path):
            path += " [updated]"
        else:
            #The path could have prelink stuff so try cmdline
            #which might have the full path present. This helped for:
            #/usr/libexec/notification-area-applet.#prelink#.fX7LCT (deleted)
            if os.path.exists(cmdline[0]):
                path = cmdline[0] + " [updated]"
            else:
                path += " [deleted]"
    exe = os.path.basename(path)
    if exe_only:
        return exe

    status_file = proc.open(pid, 'status')
    try:
        proc_status = status_file.readlines()
    finally:
        status_file.close()
    # First status line is "Name:\t<comm>\n"; strip the label and newline.
    cmd = proc_status[0][6:-1]
    if exe.startswith(cmd):
        cmd = exe #show non truncated version
        #Note because we show the non truncated name
        #one can have separated programs as follows:
        #584.0 KiB + 1.0 MiB = 1.6 MiB mozilla-thunder (exe -> bash)
        # 56.0 MiB + 22.2 MiB = 78.2 MiB mozilla-thunderbird-bin
    else:
        #Lookup the parent's exe and use that if matching
        #which will merge "Web Content" with "firefox" for example
        ppid = 0
        # Slicing (rather than indexing 0..9) copes with a short file.
        for ps_line in proc_status[:10]:
            if ps_line.startswith('PPid:'):
                ppid = int(ps_line[6:-1])
                break
        if ppid:
            try:
                p_exe = getCmdName(ppid, False, False, exe_only=True)
            except LookupError:
                # Parent gone or not inspectable (e.g. owned by another
                # user); do not drop the child from the report for that.
                p_exe = None
            if exe == p_exe:
                cmd = exe
    if sys.version_info >= (3,):
        cmd = cmd.encode(errors='replace').decode()
    if discriminate_by_pid:
        cmd = '%s [%d]' % (cmd, pid)
    return cmd
|
||||
|
||||
|
||||
#The following matches "du -h" output
|
||||
#see also human.py
|
||||
def human(num, power="Ki", units=None):
    """Format a size for display.

    num   -- the size, expressed in the unit named by *power* (KiB by
             default)
    power -- binary prefix of *num*: "Ki", "Mi", "Gi", ...
    units -- when given, skip the prefix scaling and return
             num * 1024 / units as a rounded integer string

    With units=None the value is divided by 1024 until it is below 1000
    (at most 3 integer digits) and returned as e.g. "1.5 GiB".  Scaling
    stops at the largest known prefix instead of failing.
    """
    if units is None:
        powers = ["Ki", "Mi", "Gi", "Ti", "Pi", "Ei", "Zi", "Yi"]
        while num >= 1000: #4 digits
            idx = powers.index(power)
            if idx == len(powers) - 1:
                # No larger prefix left; show the big number as it is.
                break
            num /= 1024.0
            power = powers[idx + 1]
        return "%.1f %sB" % (num, power)
    else:
        return "%.f" % ((num * 1024) / units)
|
||||
|
||||
|
||||
def cmd_with_count(cmd, count):
    """Return cmd, followed by " (count)" when count is greater than one."""
    if count <= 1:
        return cmd
    return "%s (%u)" % (cmd, count)
|
||||
|
||||
#Warn of possible inaccuracies
|
||||
#RAM:
|
||||
#2 = accurate & can total
|
||||
#1 = accurate only considering each process in isolation
|
||||
#0 = some shared mem not reported
|
||||
#-1= all shared mem not reported
|
||||
#SWAP:
|
||||
#2 = accurate & can total
|
||||
#1 = accurate only considering each process in isolation
|
||||
#-1= not available
|
||||
def val_accuracy(show_swap):
    """http://wiki.apache.org/spamassassin/TopSharedMemoryBug

    Return (ram_accuracy, swap_accuracy) for the running kernel.
    RAM levels are 2, 1, 0 or -1 and swap levels are 2, 1 or -1, with
    the meanings listed in the comment above this function.  The check
    looks at this script's own smaps file and, on 2.4 kernels, at
    meminfo.
    """
    kv = kernel_ver()
    pid = os.getpid()
    major_minor = kv[:2]

    if major_minor == (2,4):
        if "Inact_" not in proc.open('meminfo').read():
            return 1, -1
        return 0, -1

    if major_minor == (2,6):
        if os.path.exists(proc.path(pid, 'smaps')):
            if "Pss:" in proc.open(pid, 'smaps').read():
                return 2, 1
            return 1, 1
        if (2,6,1) <= kv <= (2,6,9):
            return -1, -1
        return 0, -1

    if kv[0] > 2 and os.path.exists(proc.path(pid, 'smaps')):
        swap_accuracy = 1
        # smaps is only read when swap figures were asked for.
        if show_swap and "SwapPss:" in proc.open(pid, 'smaps').read():
            swap_accuracy = 2
        return 2, swap_accuracy

    return 1, -1
|
||||
|
||||
def show_val_accuracy( ram_inacc, swap_inacc, only_total, show_swap ):
    """Write accuracy warnings to stderr, then close stderr.

    ram_inacc / swap_inacc are the levels returned by val_accuracy().
    Messages are labelled "Error" when only_total is set and "Warning"
    otherwise.  With only_total set, the process exits with status 1
    when the level of the requested total (swap if show_swap, else RAM)
    is not 2.
    """
    level = ("Warning","Error")[only_total]

    # Only show significant warnings
    if not show_swap:
        swap_inacc = 2
    elif only_total:
        ram_inacc = 2

    # Each entry is the sequence of chunks written for that level.
    ram_warnings = {
        -1: (
            "%s: Shared memory is not reported by this system.\n" % level,
            "Values reported will be too large, and totals are not reported\n",
        ),
        0: (
            "%s: Shared memory is not reported accurately by this system.\n" % level,
            "Values reported could be too large, and totals are not reported\n",
        ),
        1: (
            "%s: Shared memory is slightly over-estimated by this system\n"
            "for each program, so totals are not reported.\n" % level,
        ),
    }
    swap_warnings = {
        -1: (
            "%s: Swap is not reported by this system.\n" % level,
        ),
        1: (
            "%s: Swap is over-estimated by this system for each program,\n"
            "so totals are not reported.\n" % level,
        ),
    }
    for chunk in ram_warnings.get(ram_inacc, ()):
        sys.stderr.write(chunk)
    for chunk in swap_warnings.get(swap_inacc, ()):
        sys.stderr.write(chunk)

    sys.stderr.close()

    if not only_total:
        return
    if show_swap:
        accuracy = swap_inacc
    else:
        accuracy = ram_inacc
    if accuracy != 2:
        sys.exit(1)
|
||||
|
||||
|
||||
def get_memory_usage(pids_to_show, split_args, discriminate_by_pid,
                     include_self=False, only_self=False):
    """Scan the proc root and total memory use per program name.

    pids_to_show        -- collection of pids to restrict to, or None
    split_args          -- passed to getCmdName()
    discriminate_by_pid -- passed to getCmdName()
    include_self        -- also count this script's own process
    only_self           -- skip every process except this script

    Returns (sorted_cmds, shareds, count, total, swaps, total_swap):
    sorted_cmds is a list of (name, ram) pairs in ascending ram order
    with zero entries removed; shareds, count and swaps are dicts keyed
    by name; total and total_swap are the sums over all names.

    Processes that disappear or cannot be inspected during the scan are
    skipped.
    """
    cmds = {}
    shareds = {}
    mem_ids = {}
    count = {}
    swaps = {}
    for pid in os.listdir(proc.path('')):
        if not pid.isdigit():
            continue
        pid = int(pid)

        # Some filters
        if only_self and pid != our_pid:
            continue
        if pid == our_pid and not include_self:
            continue
        if pids_to_show is not None and pid not in pids_to_show:
            continue

        try:
            cmd = getCmdName(pid, split_args, discriminate_by_pid)
        except LookupError:
            #operation not permitted
            #kernel threads don't have exe links or
            #process gone
            continue

        try:
            private, shared, swap, mem_id = getMemStats(pid)
        except (RuntimeError, LookupError):
            # proc.open() raises LookupError when the process went away
            # between the name lookup above and this read.
            continue #process gone

        if shareds.get(cmd):
            if have_pss: #add shared portion of PSS together
                shareds[cmd] += shared
            elif shareds[cmd] < shared: #just take largest shared val
                shareds[cmd] = shared
        else:
            shareds[cmd] = shared
        cmds[cmd] = cmds.get(cmd, 0) + private
        count[cmd] = count.get(cmd, 0) + 1
        # Dict used as a set of the distinct memory maps of this program.
        mem_ids.setdefault(cmd, {})[mem_id] = None

        # Swap (overcounting for now...)
        swaps[cmd] = swaps.get(cmd, 0) + swap

    # Total swapped mem for each program
    total_swap = 0

    # Add shared mem for each program
    total = 0

    for cmd in cmds:
        cmd_count = count[cmd]
        if len(mem_ids[cmd]) == 1 and cmd_count > 1:
            # Assume this program is using CLONE_VM without CLONE_THREAD
            # so only account for one of the processes
            cmds[cmd] /= cmd_count
            if have_pss:
                shareds[cmd] /= cmd_count
        cmds[cmd] = cmds[cmd] + shareds[cmd]
        total += cmds[cmd] # valid if PSS available
        total_swap += swaps[cmd]

    sorted_cmds = sorted(cmds.items(), key=lambda x:x[1])
    sorted_cmds = [x for x in sorted_cmds if x[1]]

    return sorted_cmds, shareds, count, total, swaps, total_swap
|
||||
|
||||
def print_header(show_swap, discriminate_by_pid):
    """Write the column heading line, followed by a blank line, to stdout."""
    pieces = [" Private + Shared = RAM used"]
    if show_swap:
        pieces.append(" Swap used")
    pieces.append("\tProgram")
    if discriminate_by_pid:
        pieces.append("[pid]")
    pieces.append("\n\n")
    sys.stdout.write("".join(pieces))
|
||||
|
||||
|
||||
def print_memory_usage(sorted_cmds, shareds, count, total, swaps, total_swap,
                       show_swap):
    """Write one line per program to stdout, then the totals if valid.

    sorted_cmds is a sequence of (name, ram) pairs; shareds, count and
    swaps are dicts keyed by name.  The totals footer is written only
    when PSS data was seen (have_pss), and includes the swap total only
    when show_swap is set and SwapPss data was seen (have_swap_pss).
    """
    for name, ram in sorted_cmds:
        shared = shareds[name]
        row_format = "%9s + %9s = %9s"
        fields = [human(ram - shared), human(shared), human(ram)]
        if show_swap:
            row_format += " %9s"
            fields.append(human(swaps[name]))
        row_format += "\t%s\n"
        fields.append(cmd_with_count(name, count[name]))

        sys.stdout.write(row_format % tuple(fields))

    # Only show totals if appropriate
    if have_swap_pss and show_swap: # kernel will have_pss
        footer = "%s\n%s%9s%s%9s\n%s\n" % (
            "-" * 45, " " * 24, human(total), " " * 3,
            human(total_swap), "=" * 45)
        sys.stdout.write(footer)
    elif have_pss:
        footer = "%s\n%s%9s\n%s\n" % (
            "-" * 33, " " * 24, human(total), "=" * 33)
        sys.stdout.write(footer)
|
||||
|
||||
|
||||
def verify_environment(pids_to_show):
    """Exit early when the script cannot produce a meaningful report.

    Exits with status 1 when not running as root and no pids were given
    with -p.  Exits with status 2 when the kernel version cannot be read
    because the proc filesystem is missing or unreadable.  Any other
    error from kernel_ver() propagates.
    """
    if os.geteuid() != 0 and not pids_to_show:
        sys.stderr.write("Sorry, root permission required, or specify pids with -p\n")
        sys.stderr.close()
        sys.exit(1)

    try:
        kernel_ver()
    except (IOError, OSError, LookupError):
        val = sys.exc_info()[1]
        # proc.open() turns ENOENT/EPERM/EACCES into a plain LookupError,
        # so that is the form a missing proc filesystem arrives in.  The
        # exact type check keeps IndexError/KeyError (LookupError
        # subclasses, i.e. parsing problems) out of this branch.
        unreadable = (type(val) is LookupError or
                      getattr(val, 'errno', None) == errno.ENOENT)
        if unreadable:
            sys.stderr.write(
                "Couldn't access " + proc.path('') + "\n"
                "Only GNU/Linux and FreeBSD (with linprocfs) are supported\n")
            sys.exit(2)
        else:
            raise
|
||||
|
||||
def main():
    """Entry point: parse options, print the report, then any warnings.

    With -w the measurement repeats every *watch* seconds until no
    process is left to report or the user interrupts with Ctrl-C.
    """
    # Force the stdout and stderr streams to be unbuffered
    sys.stdout = Unbuffered(sys.stdout)
    sys.stderr = Unbuffered(sys.stderr)

    (split_args, pids_to_show, watch, only_total, discriminate_by_pid,
     show_swap) = parse_options()

    verify_environment(pids_to_show)

    if not only_total:
        print_header(show_swap, discriminate_by_pid)

    def report():
        # One measurement pass.  Returns the per-program list so the
        # watch loop can tell when nothing is left to show.
        sorted_cmds, shareds, count, total, swaps, total_swap = \
            get_memory_usage(pids_to_show, split_args,
                             discriminate_by_pid)
        if only_total:
            # A bare total is printed only when the kernel data makes
            # it valid; otherwise nothing is written.
            if show_swap:
                if have_swap_pss:
                    sys.stdout.write(human(total_swap, units=1)+'\n')
            elif have_pss:
                sys.stdout.write(human(total, units=1)+'\n')
        else:
            print_memory_usage(sorted_cmds, shareds, count, total,
                               swaps, total_swap, show_swap)
        return sorted_cmds

    if watch is None:
        # This is the default behavior
        report()
    else:
        try:
            while True:
                remaining = report()
                sys.stdout.flush()
                time.sleep(watch)
                if not remaining:
                    break
            sys.stdout.write('Process does not exist anymore.\n')
        except KeyboardInterrupt:
            pass

    # We must close explicitly, so that any EPIPE exception
    # is handled by our excepthook, rather than the default
    # one which is reenabled after this script finishes.
    sys.stdout.close()

    ram_accuracy, swap_accuracy = val_accuracy( show_swap )
    show_val_accuracy( ram_accuracy, swap_accuracy, only_total, show_swap )
|
||||
|
||||
if __name__ == '__main__':
|
||||
main()
|
23
data/show-queue.sh
Normal file
23
data/show-queue.sh
Normal file
@ -0,0 +1,23 @@
|
||||
#!/bin/bash
# Print the job queue of each cluster, high-priority clusters first.

# Run `showjob -p` for every queue name given, sleeping 0.3s after each.
show_queues() {
  local queue
  for queue in "$@"; do
    showjob -p "${queue}"
    sleep 0.3s
  done
}

# Show High-priority
echo '-------------------------------'
echo 'Queue in high-priority clusters'
echo '-------------------------------'
show_queues yq01-v100-box-1-8 yq01-v100-box-idl-2-8

echo '-------------------------------'
echo 'Queue in low-priority clusters'
echo '-------------------------------'

#queues="yq01-p40-3-8 yq01-p40-2-8 yq01-p40-box-1-8 yq01-v100-box-2-8"
show_queues yq01-p40-3-8 yq01-p40-box-1-8 yq01-v100-box-2-8 yq01-v100-box-idl-8
|
@ -10,4 +10,5 @@ bash scripts-cluster/submit.sh yq01-v100-box-idl-2-8 PTB-GDAS 1 "bash ./scripts-
|
||||
```
|
||||
bash scripts-cluster/submit.sh yq01-v100-box-idl-2-8 CIFAR10-CUT-GDAS-F1 1 "bash ./scripts-cnn/train-cifar.sh GDAS_F1 cifar10 cut"
|
||||
bash scripts-cluster/submit.sh yq01-v100-box-idl-2-8 IMAGENET-GDAS-F1 1 "bash ./scripts-cnn/train-imagenet.sh GDAS_F1 52 14"
|
||||
bash scripts-cluster/submit.sh yq01-v100-box-idl-2-8 IMAGENET-GDAS-V1 1 "bash ./scripts-cnn/train-imagenet.sh GDAS_V1 50 14"
|
||||
```
|
||||
|
Loading…
Reference in New Issue
Block a user