Merge pull request #95 from mokaddem/module_handling

Module handling
This commit is contained in:
Alexandre Dulaunoy 2016-12-22 22:18:31 +01:00 committed by GitHub
commit ddfe3cf66a

View file

@ -25,9 +25,9 @@ import json
from terminaltables import AsciiTable from terminaltables import AsciiTable
import textwrap import textwrap
from colorama import Fore, Back, Style, init from colorama import Fore, Back, Style, init
import curses
# CONFIG VARIABLES # CONFIG VARIABLES
threshold_stucked_module = 60*10*1 # 600 seconds, i.e. 10 minutes
kill_retry_threshold = 60 #1m kill_retry_threshold = 60 #1m
log_filename = "../logs/moduleInfo.log" log_filename = "../logs/moduleInfo.log"
command_search_pid = "ps a -o pid,cmd | grep {}" command_search_pid = "ps a -o pid,cmd | grep {}"
@ -39,6 +39,15 @@ printarrayGlob = [None]*14
printarrayGlob.insert(0, ["Time", "Module", "PID", "Action"]) printarrayGlob.insert(0, ["Time", "Module", "PID", "Action"])
lastTimeKillCommand = {} lastTimeKillCommand = {}
#Curses init
#stdscr = curses.initscr()
#curses.cbreak()
#stdscr.keypad(1)
# GLOBAL
last_refresh = 0
def getPid(module): def getPid(module):
p = Popen([command_search_pid.format(module+".py")], stdin=PIPE, stdout=PIPE, bufsize=1, shell=True) p = Popen([command_search_pid.format(module+".py")], stdin=PIPE, stdout=PIPE, bufsize=1, shell=True)
for line in p.stdout: for line in p.stdout:
@ -145,23 +154,33 @@ def get_color(time, idle):
temp = time.split(':') temp = time.split(':')
time = int(temp[0])*3600 + int(temp[1])*60 + int(temp[2]) time = int(temp[0])*3600 + int(temp[1])*60 + int(temp[2])
if time >= threshold_stucked_module: if time >= args.treshold:
if not idle: if not idle:
return Back.RED + Style.BRIGHT return Back.RED + Style.BRIGHT
else: else:
return Back.MAGENTA + Style.BRIGHT return Back.MAGENTA + Style.BRIGHT
elif time > threshold_stucked_module/2: elif time > args.treshold/2:
return Back.YELLOW + Style.BRIGHT return Back.YELLOW + Style.BRIGHT
else: else:
return Back.GREEN + Style.BRIGHT return Back.GREEN + Style.BRIGHT
else: else:
return Style.RESET_ALL return Style.RESET_ALL
def waiting_refresh():
    """Report whether a new refresh cycle is due.

    Compares the current time against the module-level ``last_refresh``
    timestamp. While fewer than ``args.refresh`` seconds have elapsed the
    function returns False and leaves ``last_refresh`` untouched; otherwise
    it stores the current time in ``last_refresh`` and returns True.
    """
    global last_refresh
    elapsed = time.time() - last_refresh
    if elapsed >= args.refresh:
        # Enough time has passed: remember when this refresh started.
        last_refresh = time.time()
        return True
    return False
if __name__ == "__main__": if __name__ == "__main__":
parser = argparse.ArgumentParser(description='Show info concerning running modules and log suspected stucked modules. May be use to automatically kill and restart stucked one.') parser = argparse.ArgumentParser(description='Show info concerning running modules and log suspected stucked modules. May be use to automatically kill and restart stucked one.')
parser.add_argument('-r', '--refresh', type=int, required=False, default=1, help='Refresh rate') parser.add_argument('-r', '--refresh', type=int, required=False, default=1, help='Refresh rate')
# Stuck-module threshold, in seconds; the default 60*10*1 is 600 s (10 minutes).
parser.add_argument('-t', '--treshold', type=int, required=False, default=60*10*1, help='Time in seconds after which a module is considered stuck (default: 600)')
parser.add_argument('-k', '--autokill', type=int, required=False, default=0, help='Enable auto kill option (1 for TRUE, anything else for FALSE)') parser.add_argument('-k', '--autokill', type=int, required=False, default=0, help='Enable auto kill option (1 for TRUE, anything else for FALSE)')
parser.add_argument('-c', '--clear', type=int, required=False, default=0, help='Clear the current module information (Used to clear data from old launched modules)') parser.add_argument('-c', '--clear', type=int, required=False, default=0, help='Clear the current module information (Used to clear data from old launched modules)')
@ -176,8 +195,6 @@ if __name__ == "__main__":
cfg = ConfigParser.ConfigParser() cfg = ConfigParser.ConfigParser()
cfg.read(configfile) cfg.read(configfile)
threshold_stucked_module = cfg.getint("Module_ModuleInformation", "threshold_stucked_module")
# REDIS # # REDIS #
server = redis.StrictRedis( server = redis.StrictRedis(
host=cfg.get("Redis_Queues", "host"), host=cfg.get("Redis_Queues", "host"),
@ -199,123 +216,138 @@ if __name__ == "__main__":
cleanRedis() cleanRedis()
while True: while True:
if waiting_refresh():
all_queue = set() #key = ''
printarray1 = [] #while key != 'q':
printarray2 = [] # key = stdsrc.getch()
printarray3 = [] # stdscr.refresh()
for queue, card in server.hgetall("queues").iteritems():
all_queue.add(queue)
key = "MODULE_" + queue + "_"
keySet = "MODULE_TYPE_" + queue
array_module_type = []
for moduleNum in server.smembers(keySet): all_queue = set()
value = server.get(key + str(moduleNum)) printarray1 = []
if value is not None: printarray2 = []
timestamp, path = value.split(", ") printarray3 = []
if timestamp is not None and path is not None: for queue, card in server.hgetall("queues").iteritems():
startTime_readable = datetime.datetime.fromtimestamp(int(timestamp)) all_queue.add(queue)
processed_time_readable = str((datetime.datetime.now() - startTime_readable)).split('.')[0] key = "MODULE_" + queue + "_"
keySet = "MODULE_TYPE_" + queue
array_module_type = []
if int(card) > 0: for moduleNum in server.smembers(keySet):
if int((datetime.datetime.now() - startTime_readable).total_seconds()) > threshold_stucked_module: value = server.get(key + str(moduleNum))
log = open(log_filename, 'a') if value is not None:
log.write(json.dumps([queue, card, str(startTime_readable), str(processed_time_readable), path]) + "\n") timestamp, path = value.split(", ")
try: if timestamp is not None and path is not None:
last_kill_try = time.time() - lastTimeKillCommand[moduleNum] startTime_readable = datetime.datetime.fromtimestamp(int(timestamp))
except KeyError: processed_time_readable = str((datetime.datetime.now() - startTime_readable)).split('.')[0]
last_kill_try = kill_retry_threshold+1
if args.autokill == 1 and last_kill_try > kill_retry_threshold :
kill_module(queue, int(moduleNum))
array_module_type.append([get_color(processed_time_readable, False) + str(queue), str(moduleNum), str(card), str(startTime_readable), str(processed_time_readable), str(path) + get_color(None, False)]) if int(card) > 0:
if int((datetime.datetime.now() - startTime_readable).total_seconds()) > args.treshold:
log = open(log_filename, 'a')
log.write(json.dumps([queue, card, str(startTime_readable), str(processed_time_readable), path]) + "\n")
try:
last_kill_try = time.time() - lastTimeKillCommand[moduleNum]
except KeyError:
last_kill_try = kill_retry_threshold+1
if args.autokill == 1 and last_kill_try > kill_retry_threshold :
kill_module(queue, int(moduleNum))
else: array_module_type.append([get_color(processed_time_readable, False) + str(queue), str(moduleNum), str(card), str(startTime_readable), str(processed_time_readable), str(path) + get_color(None, False)])
printarray2.append([get_color(processed_time_readable, True) + str(queue), str(moduleNum), str(card), str(startTime_readable), str(processed_time_readable), str(path) + get_color(None, True)])
array_module_type.sort(lambda x,y: cmp(x[4], y[4]), reverse=True)
for e in array_module_type:
printarray1.append(e)
for curr_queue in module_file_array: else:
if curr_queue not in all_queue: printarray2.append([get_color(processed_time_readable, True) + str(queue), str(moduleNum), str(card), str(startTime_readable), str(processed_time_readable), str(path) + get_color(None, True)])
printarray3.append([curr_queue, "Not running"]) array_module_type.sort(lambda x,y: cmp(x[4], y[4]), reverse=True)
else: for e in array_module_type:
if len(list(server.smembers('MODULE_TYPE_'+curr_queue))) == 0: printarray1.append(e)
if curr_queue not in no_info_modules:
no_info_modules[curr_queue] = int(time.time()) for curr_queue in module_file_array:
printarray3.append([curr_queue, "No data"]) if curr_queue not in all_queue:
else: printarray3.append([curr_queue, "Not running"])
#If no info since long time, try to kill else:
if args.autokill == 1 and int(time.time()) - no_info_modules[curr_queue] > threshold_stucked_module: if len(list(server.smembers('MODULE_TYPE_'+curr_queue))) == 0:
kill_module(curr_queue, None) if curr_queue not in no_info_modules:
no_info_modules[curr_queue] = int(time.time()) no_info_modules[curr_queue] = int(time.time())
printarray3.append([curr_queue, "Stuck or idle, restarting in " + str(threshold_stucked_module - (int(time.time()) - no_info_modules[curr_queue])) + "s"]) printarray3.append([curr_queue, "No data"])
else:
#If no info since long time, try to kill
if args.autokill == 1:
if int(time.time()) - no_info_modules[curr_queue] > args.treshold:
kill_module(curr_queue, None)
no_info_modules[curr_queue] = int(time.time())
printarray3.append([curr_queue, "Stuck or idle, restarting in " + str(abs(args.treshold - (int(time.time()) - no_info_modules[curr_queue]))) + "s"])
else:
printarray3.append([curr_queue, "Stuck or idle, restarting disabled"])
## FIXME To add:
## Button KILL Process using Curses
#printarray1.sort(lambda x,y: cmp(x[0], y[0]), reverse=False) printarray1.sort(key=lambda x: x[0][9:], reverse=False)
printarray1.sort(key=lambda x: x[0][9:], reverse=False) printarray2.sort(key=lambda x: x[0][9:], reverse=False)
#printarray2.sort(lambda x,y: cmp(x[0], y[0]), reverse=False) printarray1.insert(0,["Queue", "PID", "Amount", "Paste start time", "Processing time for current paste (H:M:S)", "Paste hash"])
printarray2.sort(key=lambda x: x[0][9:], reverse=False) printarray2.insert(0,["Queue", "PID","Amount", "Paste start time", "Time since idle (H:M:S)", "Last paste hash"])
printarray1.insert(0,["Queue", "PID", "Amount", "Paste start time", "Processing time for current paste (H:M:S)", "Paste hash"]) printarray3.insert(0,["Queue", "State"])
printarray2.insert(0,["Queue", "PID","Amount", "Paste start time", "Time since idle (H:M:S)", "Last paste hash"])
printarray3.insert(0,["Queue", "State"])
os.system('clear') os.system('clear')
t1 = AsciiTable(printarray1, title="Working queues") t1 = AsciiTable(printarray1, title="Working queues")
t1.column_max_width(1) t1.column_max_width(1)
if not t1.ok: if not t1.ok:
longest_col = t1.column_widths.index(max(t1.column_widths)) longest_col = t1.column_widths.index(max(t1.column_widths))
max_length_col = t1.column_max_width(longest_col) max_length_col = t1.column_max_width(longest_col)
if max_length_col > 0: if max_length_col > 0:
for i, content in enumerate(t1.table_data): for i, content in enumerate(t1.table_data):
if len(content[longest_col]) > max_length_col: if len(content[longest_col]) > max_length_col:
temp = '' temp = ''
for l in content[longest_col].splitlines(): for l in content[longest_col].splitlines():
if len(l) > max_length_col: if len(l) > max_length_col:
temp += '\n'.join(textwrap.wrap(l, max_length_col)) + '\n' temp += '\n'.join(textwrap.wrap(l, max_length_col)) + '\n'
else: else:
temp += l + '\n' temp += l + '\n'
content[longest_col] = temp.strip() content[longest_col] = temp.strip()
t1.table_data[i] = content t1.table_data[i] = content
t2 = AsciiTable(printarray2, title="Idling queues") t2 = AsciiTable(printarray2, title="Idling queues")
t2.column_max_width(1) t2.column_max_width(1)
if not t2.ok: if not t2.ok:
longest_col = t2.column_widths.index(max(t2.column_widths)) longest_col = t2.column_widths.index(max(t2.column_widths))
max_length_col = t2.column_max_width(longest_col) max_length_col = t2.column_max_width(longest_col)
if max_length_col > 0: if max_length_col > 0:
for i, content in enumerate(t2.table_data): for i, content in enumerate(t2.table_data):
if len(content[longest_col]) > max_length_col: if len(content[longest_col]) > max_length_col:
temp = '' temp = ''
for l in content[longest_col].splitlines(): for l in content[longest_col].splitlines():
if len(l) > max_length_col: if len(l) > max_length_col:
temp += '\n'.join(textwrap.wrap(l, max_length_col)) + '\n' temp += '\n'.join(textwrap.wrap(l, max_length_col)) + '\n'
else: else:
temp += l + '\n' temp += l + '\n'
content[longest_col] = temp.strip() content[longest_col] = temp.strip()
t2.table_data[i] = content t2.table_data[i] = content
t3 = AsciiTable(printarray3, title="Not running queues") t3 = AsciiTable(printarray3, title="Not running queues")
t3.column_max_width(1) t3.column_max_width(1)
printarray4 = [] printarray4 = []
for elem in printarrayGlob: for elem in printarrayGlob:
if elem is not None: if elem is not None:
printarray4.append(elem) printarray4.append(elem)
t4 = AsciiTable(printarray4, title="Last actions") t4 = AsciiTable(printarray4, title="Last actions")
t4.column_max_width(1) t4.column_max_width(1)
print t1.table legend_array = [["Color", "Meaning"], [Back.RED+Style.BRIGHT+" "*10+Style.RESET_ALL, "Time >=" +str(args.treshold)+Style.RESET_ALL], [Back.MAGENTA+Style.BRIGHT+" "*10+Style.RESET_ALL, "Time >=" +str(args.treshold)+" while idle"+Style.RESET_ALL], [Back.YELLOW+Style.BRIGHT+" "*10+Style.RESET_ALL, "Time >=" +str(args.treshold/2)+Style.RESET_ALL], [Back.GREEN+Style.BRIGHT+" "*10+Style.RESET_ALL, "Time <" +str(args.treshold)]]
print '\n' legend = AsciiTable(legend_array, title="Legend")
print t2.table legend.column_max_width(1)
print '\n'
print t3.table
print '\n'
print t4.table
if (datetime.datetime.now() - lastTime).total_seconds() > args.refresh*5: print legend.table
lastTime = datetime.datetime.now() print '\n'
cleanRedis() print t1.table
time.sleep(args.refresh) print '\n'
print t2.table
print '\n'
print t3.table
print '\n'
print t4.table
if (datetime.datetime.now() - lastTime).total_seconds() > args.refresh*5:
lastTime = datetime.datetime.now()
cleanRedis()
#time.sleep(args.refresh)