Skip to content
Projects
Groups
Snippets
Help
Loading...
Help
Support
Keyboard shortcuts
?
Submit feedback
Contribute to GitLab
Sign in / Register
Toggle navigation
S
slapos.toolbox
Project overview
Project overview
Details
Activity
Releases
Repository
Repository
Files
Commits
Branches
Tags
Contributors
Graph
Compare
Issues
0
Issues
0
List
Boards
Labels
Milestones
Merge Requests
0
Merge Requests
0
CI / CD
CI / CD
Pipelines
Jobs
Schedules
Analytics
Analytics
CI / CD
Repository
Value Stream
Wiki
Wiki
Snippets
Snippets
Members
Members
Collapse sidebar
Close sidebar
Activity
Graph
Create a new issue
Jobs
Commits
Issue Boards
Open sidebar
Guillaume Hervier
slapos.toolbox
Commits
238b167d
Commit
238b167d
authored
Sep 29, 2016
by
Alain Takoudjou
Browse files
Options
Browse Files
Download
Email Patches
Plain Diff
monitor: run all promises in a single cron task with timeout of 12 seconds per promises
parent
54399dda
Changes
2
Show whitespace changes
Inline
Side-by-side
Showing
2 changed files
with
290 additions
and
188 deletions
+290
-188
slapos/monitor/monitor.py
slapos/monitor/monitor.py
+21
-53
slapos/monitor/runpromise.py
slapos/monitor/runpromise.py
+269
-135
No files found.
slapos/monitor/monitor.py
View file @
238b167d
...
@@ -75,7 +75,7 @@ class Monitoring(object):
...
@@ -75,7 +75,7 @@ class Monitoring(object):
self
.
crond_folder
=
config
.
get
(
"monitor"
,
"crond-folder"
)
self
.
crond_folder
=
config
.
get
(
"monitor"
,
"crond-folder"
)
self
.
logrotate_d
=
config
.
get
(
"monitor"
,
"logrotate-folder"
)
self
.
logrotate_d
=
config
.
get
(
"monitor"
,
"logrotate-folder"
)
self
.
promise_runner
=
config
.
get
(
"monitor"
,
"promise-runner"
)
self
.
promise_runner
=
config
.
get
(
"monitor"
,
"promise-runner"
)
self
.
promise_folder
_list
=
config
.
get
(
"monitor"
,
"promise-folder-list"
).
split
(
)
self
.
promise_folder
=
config
.
get
(
"monitor"
,
"promise-folder"
)
self
.
public_folder
=
config
.
get
(
"monitor"
,
"public-folder"
)
self
.
public_folder
=
config
.
get
(
"monitor"
,
"public-folder"
)
self
.
private_folder
=
config
.
get
(
"monitor"
,
"private-folder"
)
self
.
private_folder
=
config
.
get
(
"monitor"
,
"private-folder"
)
self
.
collector_db
=
config
.
get
(
"monitor"
,
"collector-db"
)
self
.
collector_db
=
config
.
get
(
"monitor"
,
"collector-db"
)
...
@@ -98,10 +98,6 @@ class Monitoring(object):
...
@@ -98,10 +98,6 @@ class Monitoring(object):
self
.
promise_output_file
=
config
.
get
(
"monitor"
,
"promise-output-file"
)
self
.
promise_output_file
=
config
.
get
(
"monitor"
,
"promise-output-file"
)
self
.
bootstrap_is_ok
=
True
self
.
bootstrap_is_ok
=
True
self
.
promise_dict
=
{}
for
promise_folder
in
self
.
promise_folder_list
:
self
.
setupPromiseDictFromFolder
(
promise_folder
)
def
loadConfig
(
self
,
pathes
,
config
=
None
):
def
loadConfig
(
self
,
pathes
,
config
=
None
):
if
config
is
None
:
if
config
is
None
:
config
=
ConfigParser
.
ConfigParser
()
config
=
ConfigParser
.
ConfigParser
()
...
@@ -182,13 +178,6 @@ class Monitoring(object):
...
@@ -182,13 +178,6 @@ class Monitoring(object):
pass
pass
return
configuration_list
return
configuration_list
def
setupPromiseDictFromFolder
(
self
,
folder
):
for
filename
in
os
.
listdir
(
folder
):
path
=
os
.
path
.
join
(
folder
,
filename
)
if
os
.
path
.
isfile
(
path
)
and
os
.
access
(
path
,
os
.
X_OK
):
self
.
promise_dict
[
filename
]
=
{
"path"
:
path
,
"configuration"
:
ConfigParser
.
ConfigParser
()}
def
createSymlinksFromConfig
(
self
,
destination_folder
,
source_path_list
,
name
=
""
):
def
createSymlinksFromConfig
(
self
,
destination_folder
,
source_path_list
,
name
=
""
):
if
destination_folder
:
if
destination_folder
:
if
source_path_list
:
if
source_path_list
:
...
@@ -406,37 +395,30 @@ class Monitoring(object):
...
@@ -406,37 +395,30 @@ class Monitoring(object):
def
generateServiceCronEntries
(
self
):
def
generateServiceCronEntries
(
self
):
# XXX only if at least one configuration file is modified, then write in the cron
# XXX only if at least one configuration file is modified, then write in the cron
#cron_line_list = ['PATH=%s\n' % os.environ['PATH']]
cron_line_list
=
[]
service_name_list
=
[
name
.
replace
(
'.status.json'
,
''
)
service_name_list
=
[
name
.
replace
(
'.status.json'
,
''
)
for
name
in
os
.
listdir
(
self
.
public_folder
)
if
name
.
endswith
(
'.status.json'
)]
for
name
in
os
.
listdir
(
self
.
public_folder
)
if
name
.
endswith
(
'.status.json'
)]
for
service_name
,
promise
in
self
.
promise_items
:
service_config
=
promise
[
"configuration"
]
service_status_path
=
"%s/%s.status.json"
%
(
self
.
public_folder
,
service_name
)
mkdirAll
(
os
.
path
.
dirname
(
service_status_path
))
promise_cmd_line
=
[
promise_cmd_line
=
[
softConfigGet
(
service_config
,
"service"
,
"frequency"
)
or
"* * * * *"
,
"* * * * *"
,
"sleep $((1 + RANDOM % 30)) &&"
,
# Sleep between 1 to 30 seconds
self
.
promise_runner
,
self
.
promise_runner
,
'--pid_path "%s"'
%
os
.
path
.
join
(
self
.
service_pid_folder
,
'--pid_path "%s"'
%
os
.
path
.
join
(
self
.
service_pid_folder
,
"%s.pid"
%
service_name
),
"monitor-promises.pid"
),
'--output "%s"'
%
service_status_path
,
'--output "%s"'
%
self
.
public_folder
,
'--promise_script "%s"'
%
promise
[
"path"
],
'--promise_folder "%s"'
%
self
.
promise_folder
,
'--promise_name "%s"'
%
service_name
,
'--monitor_url "%s/jio_private/"'
%
self
.
webdav_url
,
# XXX hardcoded,
'--monitor_url "%s/jio_private/"'
%
self
.
webdav_url
,
# XXX hardcoded,
'--history_folder "%s"'
%
self
.
public_folder
,
'--history_folder "%s"'
%
self
.
public_folder
,
'--instance_name "%s"'
%
self
.
title
,
'--instance_name "%s"'
%
self
.
title
,
'--hosting_name "%s"'
%
self
.
root_title
]
'--hosting_name "%s"'
%
self
.
root_title
]
cron_line_list
.
append
(
' '
.
join
(
promise_cmd_line
)
)
registered_promise_list
=
os
.
listdir
(
self
.
promise_folder
)
for
service_name
in
service_name_list
:
if
service_name
in
service_nam
e_list
:
if
service_name
in
registered_promis
e_list
:
service_name_list
.
pop
(
service_name_list
.
index
(
service_name
))
service_name_list
.
pop
(
service_name_list
.
index
(
service_name
))
if
service_name_list
!=
[]:
if
service_name_list
!=
[]:
# XXX Some service was removed, delete his status file so monitor will not consider
his
status anymore
# XXX Some service was removed, delete his status file so monitor will not consider
the
status anymore
for
service_name
in
service_name_list
:
for
service_name
in
service_name_list
:
status_path
=
os
.
path
.
join
(
self
.
public_folder
,
'%s.status.json'
%
service_name
)
status_path
=
os
.
path
.
join
(
self
.
public_folder
,
'%s.status.json'
%
service_name
)
if
os
.
path
.
exists
(
status_path
):
if
os
.
path
.
exists
(
status_path
):
...
@@ -447,7 +429,7 @@ class Monitoring(object):
...
@@ -447,7 +429,7 @@ class Monitoring(object):
pass
pass
with
open
(
self
.
crond_folder
+
"/monitor-promises"
,
"w"
)
as
fp
:
with
open
(
self
.
crond_folder
+
"/monitor-promises"
,
"w"
)
as
fp
:
fp
.
write
(
"
\
n
"
.
join
(
cron_line_list
))
fp
.
write
(
' '
.
join
(
promise_cmd_line
))
def
addCronEntry
(
self
,
name
,
frequency
,
command
):
def
addCronEntry
(
self
,
name
,
frequency
,
command
):
entry_line
=
'%s %s'
%
(
frequency
,
command
)
entry_line
=
'%s %s'
%
(
frequency
,
command
)
...
@@ -466,21 +448,6 @@ class Monitoring(object):
...
@@ -466,21 +448,6 @@ class Monitoring(object):
self
.
configureFolders
()
self
.
configureFolders
()
# create symlinks from service configurations
self
.
promise_items
=
self
.
promise_dict
.
items
()
for
service_name
,
promise
in
self
.
promise_items
:
service_config
=
promise
[
"configuration"
]
public_path_list
=
softConfigGet
(
service_config
,
"service"
,
"public-path-list"
)
private_path_list
=
softConfigGet
(
service_config
,
"service"
,
"private-path-list"
)
if
public_path_list
:
self
.
createSymlinksFromConfig
(
self
.
public_folder
,
public_path_list
.
split
(),
service_name
)
if
private_path_list
:
self
.
createSymlinksFromConfig
(
self
.
private_folder
,
private_path_list
.
split
(),
service_name
)
# Generate OPML file
# Generate OPML file
self
.
generateOpmlFile
(
self
.
monitor_url_list
,
self
.
generateOpmlFile
(
self
.
monitor_url_list
,
os
.
path
.
join
(
self
.
public_folder
,
'feeds'
))
os
.
path
.
join
(
self
.
public_folder
,
'feeds'
))
...
@@ -514,7 +481,8 @@ class Monitoring(object):
...
@@ -514,7 +481,8 @@ class Monitoring(object):
self
.
generateLogrotateEntry
(
'monitor.service.status'
,
file_list
,
option_list
)
self
.
generateLogrotateEntry
(
'monitor.service.status'
,
file_list
,
option_list
)
# Add cron entry for SlapOS Collect
# Add cron entry for SlapOS Collect
command
=
"%s %s --output_folder %s --collector_db %s"
%
(
self
.
python
,
command
=
"sleep $((1 + RANDOM % 60)) && "
# Random sleep between 1 to 60 seconds
command
+=
"%s %s --output_folder %s --collector_db %s"
%
(
self
.
python
,
self
.
collect_script
,
self
.
data_folder
,
self
.
collector_db
)
self
.
collect_script
,
self
.
data_folder
,
self
.
collector_db
)
self
.
addCronEntry
(
'monitor_collect'
,
'* * * * *'
,
command
)
self
.
addCronEntry
(
'monitor_collect'
,
'* * * * *'
,
command
)
...
...
slapos/monitor/runpromise.py
View file @
238b167d
...
@@ -12,6 +12,9 @@ import glob
...
@@ -12,6 +12,9 @@ import glob
import
argparse
import
argparse
import
traceback
import
traceback
# Promise timeout after 12 seconds
promise_timeout
=
12
def
parseArguments
():
def
parseArguments
():
"""
"""
Parse arguments for monitor collector instance.
Parse arguments for monitor collector instance.
...
@@ -23,6 +26,8 @@ def parseArguments():
...
@@ -23,6 +26,8 @@ def parseArguments():
help
=
'The Path of file where Json result of this promise will be saved.'
)
help
=
'The Path of file where Json result of this promise will be saved.'
)
parser
.
add_argument
(
'--promise_script'
,
parser
.
add_argument
(
'--promise_script'
,
help
=
'Promise script to execute.'
)
help
=
'Promise script to execute.'
)
parser
.
add_argument
(
'--promise_folder'
,
help
=
'Folder where to find promises to execute. Hide --promise_script and --promise_name'
)
parser
.
add_argument
(
'--promise_name'
,
parser
.
add_argument
(
'--promise_name'
,
help
=
'Title to give to this promise.'
)
help
=
'Title to give to this promise.'
)
parser
.
add_argument
(
'--promise_type'
,
parser
.
add_argument
(
'--promise_type'
,
...
@@ -41,10 +46,19 @@ def parseArguments():
...
@@ -41,10 +46,19 @@ def parseArguments():
return
parser
return
parser
def
runpromise
(
parser
):
class
RunPromise
(
object
):
def
__init__
(
self
,
config_parser
):
self
.
config
=
config_parser
def
runpromise
(
self
):
if
os
.
path
.
exists
(
parser
.
pid_path
):
if
self
.
config
.
promise_folder
:
with
open
(
parser
.
pid_path
,
"r"
)
as
pidfile
:
# run all promises from the given folder
return
self
.
runpromise_synchronous
()
if
os
.
path
.
exists
(
self
.
config
.
pid_path
):
with
open
(
self
.
config
.
pid_path
,
"r"
)
as
pidfile
:
try
:
try
:
pid
=
int
(
pidfile
.
read
(
6
))
pid
=
int
(
pidfile
.
read
(
6
))
except
ValueError
:
except
ValueError
:
...
@@ -53,24 +67,24 @@ def runpromise(parser):
...
@@ -53,24 +67,24 @@ def runpromise(parser):
print
(
"A process is already running with pid "
+
str
(
pid
))
print
(
"A process is already running with pid "
+
str
(
pid
))
return
1
return
1
start_date
=
""
start_date
=
""
with
open
(
parser
.
pid_path
,
"w"
)
as
pidfile
:
with
open
(
self
.
config
.
pid_path
,
"w"
)
as
pidfile
:
process
=
executeCommand
(
parser
.
promise_script
)
process
=
self
.
executeCommand
(
self
.
config
.
promise_script
)
ps_process
=
psutil
.
Process
(
process
.
pid
)
ps_process
=
psutil
.
Process
(
process
.
pid
)
start_date
=
time
.
strftime
(
"%Y-%m-%d %H:%M:%S"
,
time
.
localtime
(
ps_process
.
create_time
()))
start_date
=
time
.
strftime
(
"%Y-%m-%d %H:%M:%S"
,
time
.
localtime
(
ps_process
.
create_time
()))
pidfile
.
write
(
str
(
process
.
pid
))
pidfile
.
write
(
str
(
process
.
pid
))
status_json
=
generateStatusJsonFromProcess
(
process
,
start_date
=
start_date
)
status_json
=
self
.
generateStatusJsonFromProcess
(
process
,
start_date
=
start_date
)
status_json
[
'_links'
]
=
{
"monitor"
:
{
"href"
:
parser
.
monitor_url
}}
status_json
[
'_links'
]
=
{
"monitor"
:
{
"href"
:
self
.
config
.
monitor_url
}}
status_json
[
'title'
]
=
parser
.
promise_name
status_json
[
'title'
]
=
self
.
config
.
promise_name
status_json
[
'instance'
]
=
parser
.
instance_name
status_json
[
'instance'
]
=
self
.
config
.
instance_name
status_json
[
'hosting_subscription'
]
=
parser
.
hosting_name
status_json
[
'hosting_subscription'
]
=
self
.
config
.
hosting_name
status_json
[
'type'
]
=
parser
.
promise_type
status_json
[
'type'
]
=
self
.
config
.
promise_type
# Save the lastest status change date (needed for rss)
# Save the lastest status change date (needed for rss)
status_json
[
'change-time'
]
=
ps_process
.
create_time
()
status_json
[
'change-time'
]
=
ps_process
.
create_time
()
if
os
.
path
.
exists
(
parser
.
output
):
if
os
.
path
.
exists
(
self
.
config
.
output
):
with
open
(
parser
.
output
)
as
f
:
with
open
(
self
.
config
.
output
)
as
f
:
try
:
try
:
last_result
=
json
.
loads
(
f
.
read
())
last_result
=
json
.
loads
(
f
.
read
())
if
status_json
[
'status'
]
==
last_result
[
'status'
]
and
last_result
.
has_key
(
'change-time'
):
if
status_json
[
'status'
]
==
last_result
[
'status'
]
and
last_result
.
has_key
(
'change-time'
):
...
@@ -78,17 +92,75 @@ def runpromise(parser):
...
@@ -78,17 +92,75 @@ def runpromise(parser):
except
ValueError
:
except
ValueError
:
pass
pass
updateStatusHistoryFolder
(
self
.
updateStatusHistoryFolder
(
parser
.
promise_name
,
self
.
config
.
promise_name
,
parser
.
output
,
self
.
config
.
output
,
parser
.
history_folder
,
self
.
config
.
history_folder
,
parser
.
promise_type
self
.
config
.
promise_type
)
)
with
open
(
parser
.
output
,
"w"
)
as
outputfile
:
with
open
(
self
.
config
.
output
,
"w"
)
as
outputfile
:
json
.
dump
(
status_json
,
outputfile
)
json
.
dump
(
status_json
,
outputfile
)
os
.
remove
(
parser
.
pid_path
)
os
.
remove
(
self
.
config
.
pid_path
)
def
runpromise_synchronous
(
self
):
if
os
.
path
.
exists
(
self
.
config
.
pid_path
):
# Check if another run promise is running
with
open
(
self
.
config
.
pid_path
)
as
fpid
:
try
:
pid
=
int
(
fpid
.
read
(
6
))
except
ValueError
:
pid
=
None
if
pid
and
os
.
path
.
exists
(
"/proc/"
+
str
(
pid
)):
print
(
"A process is already running with pid "
+
str
(
pid
))
return
[]
with
open
(
self
.
config
.
pid_path
,
'w'
)
as
fpid
:
fpid
.
write
(
str
(
os
.
getpid
()))
status_list
=
self
.
checkPromises
(
self
.
config
.
promise_folder
)
promises_status_file
=
os
.
path
.
join
(
self
.
config
.
output
,
'_promise_status'
)
previous_state_dict
=
{}
new_state_dict
=
{}
base_dict
=
{
'_links'
:
{
"monitor"
:
{
"href"
:
self
.
config
.
monitor_url
}},
'instance'
:
self
.
config
.
instance_name
,
'hosting_subscription'
:
self
.
config
.
hosting_name
,
}
if
os
.
path
.
exists
(
promises_status_file
):
with
open
(
promises_status_file
)
as
f
:
try
:
previous_state_dict
=
json
.
loads
(
f
.
read
())
except
ValueError
:
pass
def
updateStatusHistoryFolder
(
name
,
status_file
,
history_folder
,
promise_type
):
for
status_dict
in
status_list
:
status_dict
.
update
(
base_dict
)
if
previous_state_dict
.
has_key
(
status_dict
[
'title'
]):
status
,
time
=
previous_state_dict
[
status_dict
[
'title'
]].
split
(
'#'
)
if
status_dict
[
'status'
]
==
status
:
status_dict
[
'change-time'
]
=
float
(
time
)
promise_result_file
=
os
.
path
.
join
(
self
.
config
.
output
,
"%s.status.json"
%
status_dict
[
'title'
])
with
open
(
promise_result_file
,
"w"
)
as
outputfile
:
json
.
dump
(
status_dict
,
outputfile
)
new_state_dict
[
status_dict
[
'title'
]]
=
'%s#%s'
%
(
status_dict
[
'status'
],
status_dict
[
'change-time'
])
self
.
updateStatusHistoryFolder
(
status_dict
[
'title'
],
promise_result_file
,
self
.
config
.
history_folder
,
'status'
)
with
open
(
promises_status_file
,
"w"
)
as
outputfile
:
json
.
dump
(
new_state_dict
,
outputfile
)
os
.
remove
(
self
.
config
.
pid_path
)
def
updateStatusHistoryFolder
(
self
,
name
,
status_file
,
history_folder
,
promise_type
):
history_path
=
os
.
path
.
join
(
history_folder
)
history_path
=
os
.
path
.
join
(
history_folder
)
if
not
os
.
path
.
exists
(
status_file
):
if
not
os
.
path
.
exists
(
status_file
):
return
return
...
@@ -154,7 +226,7 @@ def updateStatusHistoryFolder(name, status_file, history_folder, promise_type):
...
@@ -154,7 +226,7 @@ def updateStatusHistoryFolder(name, status_file, history_folder, promise_type):
except OSError:
except OSError:
raise"""
raise"""
def
generateStatusJsonFromProcess
(
process
,
start_date
=
None
,
title
=
None
):
def
generateStatusJsonFromProcess
(
self
,
process
,
start_date
=
None
,
title
=
None
):
stdout
,
stderr
=
process
.
communicate
()
stdout
,
stderr
=
process
.
communicate
()
status_json
=
{}
status_json
=
{}
if
process
.
returncode
!=
0
:
if
process
.
returncode
!=
0
:
...
@@ -172,7 +244,7 @@ def generateStatusJsonFromProcess(process, start_date=None, title=None):
...
@@ -172,7 +244,7 @@ def generateStatusJsonFromProcess(process, start_date=None, title=None):
return
status_json
return
status_json
def
executeCommand
(
args
):
def
executeCommand
(
self
,
args
):
return
subprocess
.
Popen
(
return
subprocess
.
Popen
(
args
,
args
,
#cwd=instance_path,
#cwd=instance_path,
...
@@ -182,6 +254,68 @@ def executeCommand(args):
...
@@ -182,6 +254,68 @@ def executeCommand(args):
stderr
=
subprocess
.
PIPE
stderr
=
subprocess
.
PIPE
)
)
def
checkPromises
(
self
,
promise_dir
):
"""
Run all promises found into specified folder
"""
if
not
os
.
path
.
exists
(
promise_dir
)
or
not
os
.
path
.
isdir
(
promise_dir
):
return
[]
promise_result_list
=
[]
# Check whether every promise is kept
for
promise
in
os
.
listdir
(
promise_dir
):
promise_script
=
os
.
path
.
join
(
promise_dir
,
promise
)
if
not
os
.
path
.
isfile
(
promise_script
)
or
not
os
.
access
(
promise_script
,
os
.
X_OK
):
# Not executable file
continue
command
=
[
promise_script
]
promise_name
=
os
.
path
.
basename
(
command
[
0
])
result_dict
=
{
"status"
:
"ERROR"
,
"type"
:
"status"
,
"title"
:
promise_name
,
"start-date"
:
time
.
strftime
(
"%Y-%m-%d %H:%M:%S"
,
time
.
localtime
(
time
.
time
())),
"change-time"
:
time
.
time
()
}
process_handler
=
subprocess
.
Popen
(
command
,
stdout
=
subprocess
.
PIPE
,
stderr
=
subprocess
.
PIPE
,
stdin
=
subprocess
.
PIPE
)
process_handler
.
stdin
.
flush
()
process_handler
.
stdin
.
close
()
process_handler
.
stdin
=
None
sleep_time
=
0.1
increment_limit
=
int
(
promise_timeout
/
sleep_time
)
for
current_increment
in
range
(
0
,
increment_limit
):
if
process_handler
.
poll
()
is
None
:
time
.
sleep
(
sleep_time
)
continue
if
process_handler
.
poll
()
==
0
:
# Success!
result_dict
[
"message"
]
=
process_handler
.
communicate
()[
0
]
result_dict
[
"status"
]
=
"OK"
else
:
result_dict
[
"message"
]
=
process_handler
.
communicate
()[
1
]
break
else
:
process_handler
.
terminate
()
message
=
process_handler
.
stderr
.
read
()
if
message
is
None
:
message
=
process_handler
.
stdout
.
read
()
or
""
message
+=
'
\
n
PROMISE TIME OUT AFTER %s SECONDS'
%
promise_timeout
result_dict
[
"message"
]
=
message
promise_result_list
.
append
(
result_dict
)
return
promise_result_list
def
main
():
def
main
():
arg_parser
=
parseArguments
()
arg_parser
=
parseArguments
()
sys
.
exit
(
runpromise
(
arg_parser
.
parse_args
()))
promise_runner
=
RunPromise
(
arg_parser
.
parse_args
())
sys
.
exit
(
promise_runner
.
runpromise
())
Write
Preview
Markdown
is supported
0%
Try again
or
attach a new file
Attach a file
Cancel
You are about to add
0
people
to the discussion. Proceed with caution.
Finish editing this message first!
Cancel
Please
register
or
sign in
to comment