"""
Custom datasources provide functionality beyond ``simple_file`` and ``simple_command``
type datasources. If the custom datasource is short and concise it may be added to
this module. Other datasources should be added as a separate module.
Normally custom datasources are necessary for core-collection. In order for a custom
datasource to execute, all of its dependencies must be explicitly loaded by the client.
The client uses the YAML template :py:data:`insights.collect.default_manifest` and each
parser/combiner/component required by a custom datasource must be included in the YAML
template to ensure it is loaded.
"""
import os
import time
DEFAULT_SHELL_TIMEOUT = 10
""" int: Default timeout in seconds for ctx.shell_out() commands, must be provided as an arg """
[docs]
def get_running_commands(ps, ctx, commands):
"""
Search for a list of commands in Ps combiner output and returns the full path
to the command
Arguments:
ps: Ps combiner object
ctx: Context of the current collection
commands(list): List of commands to search for in ps output
Returns:
list: List of the full command paths of the all ``command``.
Raises:
TypeError: Raised when ``commands`` args is not a list
"""
if not commands or not isinstance(commands, list):
raise TypeError('Commands argument must be a list object and contain at least one item')
ps_list = [ps.search(COMMAND_NAME__contains=c) for c in commands]
if ps_list and isinstance(ps_list[0], list):
ps_cmds = [i for sub_l in ps_list for i in sub_l]
else:
ps_cmds = ps_list
ret = set()
for cmd in set(p['COMMAND'] for p in ps_cmds):
try:
cmd_prefix = cmd.split(None, 1)[0]
which = ctx.shell_out(
"/usr/bin/which {0}".format(cmd_prefix), timeout=DEFAULT_SHELL_TIMEOUT
)
except Exception:
continue
ret.add(which[0]) if which else None
return sorted(ret)
[docs]
def get_recent_files(target_path, last_modify_hours=24, latest_count=0):
"""
Get the recent updated or created files, limited to lastest_count files
Arguments:
target_path (string): target path to search
last_modify_hours (int): specify the recent hours
latest_count (int): specify the lastest files count with a positive integer
Returns:
list: files that updated or creates just in last_modify_hours hours
"""
latest_files = {}
if os.path.exists(target_path):
current_time = time.time()
for parent_path, _, report_files in os.walk(target_path):
for one_file in report_files:
t_full_file = os.path.join(parent_path, one_file)
file_time = os.path.getmtime(t_full_file)
if (current_time - file_time) // 3600 < last_modify_hours:
latest_files[t_full_file] = file_time
result_files = sorted(latest_files, key=lambda x: latest_files[x], reverse=True)
return result_files[:latest_count] if latest_count > 0 else result_files