Commit eec12ab7 authored by Xavier Thompson's avatar Xavier Thompson

WIP

parent 3e813ce2
...@@ -13,68 +13,60 @@ from slapos.grid.promise import interface ...@@ -13,68 +13,60 @@ from slapos.grid.promise import interface
class RunPromise(JSONRunPromise): class RunPromise(JSONRunPromise):
def __init__(self, config): def __init__(self, config):
super(RunPromise, self).__init__(config) super(RunPromise, self).__init__(config)
self.setPeriodicity(minute=2) self.setPeriodicity(minute=2)
self.last_avg_computation_file = self.getConfig( self.avg_flag_file = self.getConfig('last-avg-computation-file', 'last_avg')
'last-avg-computation-file', 'last_avg') self.max_spot_temp = float(self.getConfig('max-spot-temp', 90))
self.max_avg_temp = float(self.getConfig('max-avg-temp', 80))
def sense(self):
promise_success = True
max_spot_temp = float(self.getConfig('max-spot-temp', 90))
max_avg_temp = float(self.getConfig('max-avg-temp', 80))
avg_temp_duration_sec = int(self.getConfig('avg-temp-duration-sec', 0)) avg_temp_duration_sec = int(self.getConfig('avg-temp-duration-sec', 0))
if avg_temp_duration_sec: if avg_temp_duration_sec:
avg_temp_duration = avg_temp_duration_sec self.avg_temp_duration = avg_temp_duration_sec
else: else:
avg_temp_duration = 60 * int(self.getConfig('avg-temp-duration', 5)) self.avg_temp_duration = 60 * int(self.getConfig('avg-temp-duration', 5))
testing = self.getConfig('testing') == "True"
# For theia JHGD def sense(self):
#testing = True # JHGD success = True
# Get current temperature # Get current temperature
if testing: try:
from random import randint cpu_temp = psutil.sensors_temperatures()['coretemp'][0][1]
cpu_temp = randint(40, 75) except (KeyError, IndexError) as e:
else: self.logger.error("Could not retrieve core temperature:\n%r", e, exc_info=True)
data = psutil.sensors_temperatures() return
cpu_temp = data['coretemp'][0][1] if cpu_temp > iself.max_spot_temp:
if cpu_temp > max_spot_temp: success = False
self.logger.error("Temperature reached critical threshold: %s degrees "\ self.logger.error(
"celsius (threshold is %s degrees celsius)" % (cpu_temp, max_spot_temp)) "Temperature reached critical threshold: %s °C (threshold is %s °C)",
promise_success = False cpu_temp, max_spot_temp)
# Log temperature # Log temperature
data = json.dumps({'cpu_temperature': cpu_temp}) data = json.dumps({'cpu_temperature': cpu_temp})
self.json_logger.info("Temperature data", extra={'data': data}) self.json_logger.info("Temperature data", extra={'data': data})
# TODO: promise should computer average only with logs between interval # TODO: promise should compute average only with logs between interval
# Computer average temperature # Computer average temperature
avg_computation_period = avg_temp_duration / 4 avg_computation_period = self.avg_temp_duration / 4
try: try:
t = os.path.getmtime(self.last_avg_computation_file) t = os.path.getmtime(self.avg_flag_file)
except OSError: except OSError:
t = 0 t = 0
if (time.time() - t) > avg_computation_period: if (time.time() - t) > avg_computation_period:
open(self.last_avg_computation_file, 'w').close() open(self.avg_flag_file, 'w').close()
temp_list = get_data_interval_json_log(self.log_file, avg_temp_duration) temp_list = get_data_interval_json_log(self.log_file, self.avg_temp_duration)
if temp_list: if temp_list:
avg_temp = sum(map(lambda x: x['cpu_temperature'], temp_list)) / len(temp_list) avg_temp = sum(map(lambda x: x['cpu_temperature'], temp_list)) / len(temp_list)
if avg_temp > max_avg_temp: if avg_temp > self.max_avg_temp:
self.logger.error("Average temperature over the last %s seconds "\ success = False
"reached threshold: %s degrees celsius (threshold is %s degrees "\ self.logger.error(
"celsius)" % (avg_temp_duration, avg_temp, max_avg_temp)) "Average temperature over the last %d s reached threshold: %s °C"
promise_success = False " (threshold is %s °C)",
avg_temp_duration, avg_temp, max_avg_temp)
else: else:
success = False
self.logger.error("Couldn't read temperature from log") self.logger.error("Couldn't read temperature from log")
promise_success = False
if promise_success: if success:
self.logger.info("Temperature OK") self.logger.info("Temperature OK (%s °C)", cpu_temp)
def test(self): def test(self):
""" """
......
Markdown is supported
0%
or
You are about to add 0 people to the discussion. Proceed with caution.
Finish editing this message first!
Please register or to comment