azurelinuxagent/common/utils/shellutil.py (209 lines of code) (raw):
# Microsoft Azure Linux Agent
#
# Copyright 2018 Microsoft Corporation
#
# Licensed under the Apache License, Version 2.0 (the "License");
# you may not use this file except in compliance with the License.
# You may obtain a copy of the License at
#
# http://www.apache.org/licenses/LICENSE-2.0
#
# Unless required by applicable law or agreed to in writing, software
# distributed under the License is distributed on an "AS IS" BASIS,
# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
# See the License for the specific language governing permissions and
# limitations under the License.
#
# Requires Python 2.6+ and OpenSSL 1.0+
#
import os
import subprocess
import sys
import tempfile
import threading
if sys.version_info[0] != 2:
    # The real exception type is available; expose it under this module's namespace
    from subprocess import TimeoutExpired
else:
    class TimeoutExpired(Exception):
        """
        Stand-in for subprocess.TimeoutExpired, which was introduced on Python 3. Defining it on Python 2
        lets the rest of the module reference the name unconditionally.
        """
import azurelinuxagent.common.logger as logger
from azurelinuxagent.common.future import ustr
if not hasattr(subprocess, 'check_output'):
    # The subprocess module of this interpreter has no check_output(); install a backport of it (and of the
    # CalledProcessError variant that carries the command output) on the subprocess module itself.

    # Exception classes used by this module.
    class CalledProcessError(Exception):
        """
        Raised by the backported check_output() when the command exits with a non-zero status; keeps the
        return code, the command and the captured output.
        """
        def __init__(self, returncode, cmd, output=None):  # pylint: disable=W0231
            self.returncode = returncode
            self.cmd = cmd
            self.output = output

        def __str__(self):
            return "Command '{0}' returned non-zero exit status {1}".format(self.cmd, self.returncode)

    def check_output(*popenargs, **kwargs):
        r"""
        Backport from subprocess module from python 2.7

        Runs the command described by the Popen arguments and returns its stdout. Raises ValueError if the
        caller passes 'stdout' and subprocess.CalledProcessError if the command exits with a non-zero status.
        """
        if 'stdout' in kwargs:
            raise ValueError('stdout argument not allowed, it will be overridden.')

        process = subprocess.Popen(stdout=subprocess.PIPE, *popenargs, **kwargs)
        output = process.communicate()[0]
        retcode = process.poll()
        if not retcode:
            return output

        # Report the command the same way Popen received it: the 'args' keyword or the first positional argument
        cmd = kwargs.get("args")
        if cmd is None:
            cmd = popenargs[0]
        raise subprocess.CalledProcessError(retcode, cmd, output=output)

    subprocess.check_output = check_output
    subprocess.CalledProcessError = CalledProcessError
# pylint: disable=W0105
"""
Shell command util functions
"""
# pylint: enable=W0105
def has_command(cmd):
    """
    Return True if executing the given command succeeds.

    The command is executed through run() with error logging suppressed; the result is True when the
    return code is 0 and False otherwise.
    """
    return_code = run(cmd, chk_err=False)
    return not return_code
def run(cmd, chk_err=True, expected_errors=None):
    """
    Note: Deprecating in favour of `azurelinuxagent.common.utils.shellutil.run_command` function.

    Executes 'cmd' by delegating to run_get_output and returns only the return code; the output is discarded.
    When chk_err is True, errors are reported in the log; when it is False they are not logged.
    'expected_errors' is forwarded to run_get_output (an empty list is used when it is None).
    """
    errors = [] if expected_errors is None else expected_errors
    return run_get_output(cmd, chk_err=chk_err, expected_errors=errors)[0]
def run_get_output(cmd, chk_err=True, log_cmd=True, expected_errors=None):
    """
    Executes 'cmd' through the shell, with stderr merged into stdout, and returns a tuple
    (return code, output). Exceptions are trapped: in that case the result is (-1, <text of the exception>).

    If chk_err is True, failures are written to the log: non-zero return codes listed in 'expected_errors'
    are logged as info, any other non-zero return code or exception is logged as an error.
    If log_cmd is True the command is written to the verbose log before it is executed.

    For new callers, consider using run_command instead as it separates stdout from stderr,
    returns only stdout on success, logs both outputs and return code on error and raises an exception.
    """
    tolerated_codes = expected_errors if expected_errors is not None else []

    if log_cmd:
        logger.verbose(u"Command: [{0}]", cmd)

    try:
        process = _popen(cmd, stdout=subprocess.PIPE, stderr=subprocess.STDOUT, shell=True)
        raw_output = process.communicate()[0]
        _on_command_completed(process.pid)

        output = __encode_command_output(raw_output)
        return_code = process.returncode

        if return_code == 0:
            return 0, output

        if chk_err:
            msg = u"Command: [{0}], return code: [{1}], result: [{2}]".format(cmd, return_code, output)
            # Failures the caller anticipated are informational; anything else is an error
            report = logger.info if return_code in tolerated_codes else logger.error
            report(msg)
        return return_code, output
    except Exception as exception:
        error_text = ustr(exception)
        if chk_err:
            logger.error(u"Command [{0}] raised unexpected exception: [{1}]".format(cmd, error_text))
        return -1, error_text
def __format_command(command):
    """
    Produces a printable version of the command taken by run_command/run_pipe.

    A list of strings is joined with spaces, a list of lists (a pipe) is rendered as its commands
    separated by ' | ', and anything that is not a list is returned unchanged.

    Examples:
        > __format_command("sort")
        'sort'
        > __format_command(["sort", "-u"])
        'sort -u'
        > __format_command([["sort"], ["unique", "-n"]])
        'sort | unique -n'
    """
    if not isinstance(command, list):
        return command

    # A pipe is recognized by its first element being a list itself
    is_pipe = len(command) > 0 and isinstance(command[0], list)
    if is_pipe:
        return " | ".join(" ".join(stage) for stage in command)
    return " ".join(command)
def __encode_command_output(output):
    """
    Converts the stdout/stderr returned by subprocess.communicate() to a string.

    None is treated as empty output; the data is interpreted as UTF-8 and bytes that cannot be decoded
    are handled with the "backslashreplace" error handler.
    """
    raw = b'' if output is None else output
    return ustr(raw, encoding='utf-8', errors="backslashreplace")
class CommandError(Exception):
    """
    Exception raised by run_command/run_pipe when the command returns an error

    Attributes:
        command:    the command that failed, as given to the constructor
        returncode: the return code reported for the command
        stdout:     the stdout of the command, as given to the constructor
        stderr:     the stderr of the command, as given to the constructor (may be None)
    """
    @staticmethod
    def _get_message(command, return_code, stderr):
        """
        Builds the exception message: "'<command>' failed: <return code> (<stderr>)".

        When 'command' is a non-empty list only its first item is used as the command name. Trailing
        whitespace is stripped from 'stderr'; a stderr of None is rendered as an empty string.
        """
        command_name = command[0] if isinstance(command, list) and len(command) > 0 else command
        # stderr is None when the caller had no captured output; don't let that break the creation of the exception
        stderr_text = "" if stderr is None else stderr.rstrip()
        return "'{0}' failed: {1} ({2})".format(command_name, return_code, stderr_text)

    def __init__(self, command, return_code, stdout, stderr):
        # Name this class (not its base) in super() so that initialization follows the regular MRO
        super(CommandError, self).__init__(CommandError._get_message(command, return_code, stderr))
        self.command = command
        self.returncode = return_code
        self.stdout = stdout
        self.stderr = stderr
def __run_command(command_action, command, log_error, encode_output):
    """
    Invokes command_action and returns the stdout it produced. The command_action is a function that executes
    a command/pipe and returns a tuple with its exit code, stdout, and stderr.

    A non-zero exit code is reported by raising a CommandError; any other exception raised while executing
    the command is propagated to the caller. If 'log_error' is True, details about the failure are also logged.

    If encode_output is True the output is converted to a string, otherwise it is returned as produced by
    command_action (a bytes object).

    The 'command' argument is used only to describe the command in log messages and in the CommandError.
    """
    try:
        return_code, stdout, stderr = command_action()

        if encode_output:
            stdout = __encode_command_output(stdout)
            stderr = __encode_command_output(stderr)

        if return_code == 0:
            return stdout

        command_text = __format_command(command)
        if log_error:
            logger.error(
                "Command: [{0}], return code: [{1}], stdout: [{2}] stderr: [{3}]",
                command_text,
                return_code,
                stdout,
                stderr)
        raise CommandError(command=command_text, return_code=return_code, stdout=stdout, stderr=stderr)

    except CommandError:
        # Already reported above (or by command_action); just let it through
        raise
    except Exception as exception:
        if log_error:
            logger.error(u"Command [{0}] raised unexpected exception: [{1}]", __format_command(command), ustr(exception))
        raise
# W0622: Redefining built-in 'input' -- disabled: the parameter name mimics subprocess.communicate()
def run_command(command, input=None, stdin=None, stdout=subprocess.PIPE, stderr=subprocess.PIPE, log_error=False, encode_input=True, encode_output=True, track_process=True, timeout=None):  # pylint:disable=W0622
    """
    Executes the given command and returns its stdout.

    If there are any errors executing the command it raises a CommandError (non-zero exit code or timeout) or
    propagates the exception raised while starting/communicating with the process; if 'log_error'
    is True, it also logs details about the error.

    If encode_output is True the stdout is returned as a string, otherwise it is returned as a bytes object.

    If track_process is False the command is not added to list of running commands

    This function is a thin wrapper around Popen/communicate in the subprocess module:
       * The 'input' parameter corresponds to the same parameter in communicate
       * The 'stdin' parameter corresponds to the same parameters in Popen
       * Only one of 'input' and 'stdin' can be specified (ValueError is raised otherwise)
       * If encode_input is True and 'input' is a str, it is encoded to bytes before it is sent to the command
       * The 'stdout' and 'stderr' parameters correspond to the same parameters in Popen, except that they
         default to subprocess.PIPE instead of None
       * If the output of the command is redirected using the 'stdout' or 'stderr' parameters (i.e. if the
         value for these parameters is anything other than the default (subprocess.PIPE)), then the corresponding
         values returned by this function or the CommandError exception will be empty strings.

    If the command does not complete within 'timeout' seconds it is killed and a CommandError with return code -1
    is raised; its stderr is "command timeout" followed by whatever stderr could be collected from the command.

    NOTE: The 'timeout' parameter is ignored on Python 2

    NOTE: This is the preferred method to execute shell commands over `azurelinuxagent.common.utils.shellutil.run` function.
    """
    if input is not None and stdin is not None:
        raise ValueError("The input and stdin arguments are mutually exclusive")

    def command_action():
        popen_stdin = communicate_input = None
        if input is not None:
            popen_stdin = subprocess.PIPE
            communicate_input = input.encode() if encode_input and isinstance(input, str) else input  # communicate() needs an array of bytes
        if stdin is not None:
            popen_stdin = stdin
            communicate_input = None

        if track_process:
            process = _popen(command, stdin=popen_stdin, stdout=stdout, stderr=stderr, shell=False)
        else:
            process = subprocess.Popen(command, stdin=popen_stdin, stdout=stdout, stderr=stderr, shell=False)

        try:
            if sys.version_info[0] == 2:  # communicate() doesn't support timeout on Python 2
                command_stdout, command_stderr = process.communicate(input=communicate_input)
            else:
                command_stdout, command_stderr = process.communicate(input=communicate_input, timeout=timeout)
        except TimeoutExpired:
            if log_error:
                logger.error(u"Command [{0}] timed out", __format_command(command))

            captured = None  # (stdout, stderr) collected after killing the process, if any

            try:
                process.kill()
            except Exception as exception:
                if log_error:
                    logger.error(u"Can't terminate timed out process: {0}", ustr(exception))
            else:
                # The process was killed, so it must not linger in the list of running commands
                if track_process:
                    _on_command_completed(process.pid)
                # try to get any output from the command, but ignore any errors if we can't
                try:
                    captured = process.communicate()
                # W0702: No exception type(s) specified (bare-except)
                except:  # pylint: disable=W0702
                    pass

            if captured is None:
                timeout_stdout, timeout_stderr = '', ''
            else:
                timeout_stdout, timeout_stderr = captured
                # communicate() returns raw bytes (or None for redirected streams); convert them before using
                # them in the error, otherwise the message would contain the repr of a bytes object
                timeout_stderr = __encode_command_output(timeout_stderr)
                if encode_output:
                    timeout_stdout = __encode_command_output(timeout_stdout)

            raise CommandError(command=__format_command(command), return_code=-1, stdout=timeout_stdout, stderr="command timeout\n{0}".format(timeout_stderr))

        if track_process:
            _on_command_completed(process.pid)

        return process.returncode, command_stdout, command_stderr

    return __run_command(command_action=command_action, command=command, log_error=log_error, encode_output=encode_output)
def run_pipe(pipe, stdin=None, stdout=subprocess.PIPE, stderr=subprocess.PIPE, log_error=False, encode_output=True):
    """
    Executes the given commands as a pipe and returns its stdout.

    The pipe is a list of commands, which in turn are a list of strings, e.g.

        [["sort"], ["uniq", "-n"]] represents 'sort | uniq -n'

    A ValueError is raised if the pipe has fewer than 2 commands. If the last command of the pipe returns a
    non-zero exit code a CommandError is raised; if 'log_error' is True, details about the error are also logged.

    If encode_output is True the stdout is returned as a string, otherwise it is returned as a bytes object.

    This function is a thin wrapper around Popen/communicate in the subprocess module:
       * The 'stdin' parameter is used as input for the first command in the pipe
       * The 'stdout', and 'stderr' can be used to redirect the output of the pipe
       * If the output of the pipe is redirected using the 'stdout' or 'stderr' parameters (i.e. if the
         value for these parameters is anything other than the default (subprocess.PIPE)), then the corresponding
         values returned by this function or the CommandError exception will be empty strings.
    """
    if len(pipe) < 2:
        raise ValueError("The pipe must consist of at least 2 commands")

    def command_action():
        stderr_file = None
        try:
            # If stderr is subprocess.PIPE each call to Popen would create a new pipe. We want to collect the stderr of all the
            # commands in the pipe so we replace stderr with a temporary file that we read once the pipe completes.
            if stderr == subprocess.PIPE:
                stderr_file = tempfile.TemporaryFile()
                popen_stderr = stderr_file
            else:
                popen_stderr = stderr

            # Start every command but the last one, feeding the stdout of each command to the next one
            processes = []
            next_stdin = stdin
            for stage in pipe[:-1]:
                started = _popen(stage, stdin=next_stdin, stdout=subprocess.PIPE, stderr=popen_stderr)
                processes.append(started)
                next_stdin = started.stdout

            # The last command writes to the stdout requested by the caller
            last = _popen(pipe[-1], stdin=next_stdin, stdout=stdout, stderr=popen_stderr)
            processes.append(last)

            for upstream in processes[:-1]:
                upstream.stdout.close()  # see https://docs.python.org/2/library/subprocess.html#replacing-shell-pipeline

            pipe_stdout, pipe_stderr = last.communicate()

            for proc in processes:
                _on_command_completed(proc.pid)

            if stderr_file is not None:
                stderr_file.seek(0)
                pipe_stderr = stderr_file.read()

            return last.returncode, pipe_stdout, pipe_stderr
        finally:
            if stderr_file is not None:
                stderr_file.close()

    return __run_command(command_action=command_action, command=pipe, log_error=log_error, encode_output=encode_output)
def quote(word_list):
    """
    Quote a list or tuple of strings for Unix Shell as words, using the
    byte-literal single quote. A value that is neither a list nor a tuple is
    treated as a single word.

    Each word is wrapped in single quotes, with every embedded single quote
    rewritten as '\\'' (close the quote, escaped quote, reopen the quote); the
    quoted words are joined with one space.

    The resulting string is safe for use with ``shell=True`` in ``subprocess``,
    and in ``os.system``. ``assert shlex.split(quote(word_list)) == word_list``.

    See POSIX.1:2013 Vol 3, Chap 2, Sec 2.2.2:
    http://pubs.opengroup.org/onlinepubs/9699919799/utilities/V3_chap02.html#tag_18_02_02
    """
    if not isinstance(word_list, (tuple, list)):
        word_list = (word_list,)

    quoted_words = ["'{0}'".format(word.replace("'", "'\\''")) for word in word_list]
    return " ".join(quoted_words)
#
# The run_command/run_pipe/run/run_get_output functions maintain a list of the commands that they are currently executing.
# The list holds the PIDs of those commands: _popen() appends the PID of each process it starts and
# _on_command_completed() removes it.
#
_running_commands = []
# Held by _popen(), _on_command_completed() and get_running_commands() while they access _running_commands
_running_commands_lock = threading.RLock()

# Name of the environment variable that _popen() adds to the environment of every process it starts...
PARENT_PROCESS_NAME = "AZURE_GUEST_AGENT_PARENT_PROCESS_NAME"
# ... and the value it assigns to that variable
AZURE_GUEST_AGENT = "AZURE_GUEST_AGENT"
def _popen(*args, **kwargs):
    """
    Starts a process with subprocess.Popen, passing along the given arguments, and adds its PID to the list of
    running commands. Returns the Popen object.

    The process is started with a copy of the environment given in the 'env' keyword argument (or of os.environ if
    'env' is missing or None) to which the PARENT_PROCESS_NAME variable is added; the caller's mapping is not modified.
    """
    with _running_commands_lock:
        # Add the environment variables. Popen accepts env=None to mean "inherit the current environment", so
        # an explicit None is handled in the same way as a missing argument.
        requested_env = kwargs.get('env')
        env = {}
        env.update(os.environ if requested_env is None else requested_env)

        # Set the marker before process start
        env[PARENT_PROCESS_NAME] = AZURE_GUEST_AGENT
        kwargs['env'] = env

        process = subprocess.Popen(*args, **kwargs)
        _running_commands.append(process.pid)
        return process
def _on_command_completed(pid):
    """
    Removes the given PID from the list of running commands, holding the lock that guards the list.
    list.remove() raises ValueError if the PID is not in the list.
    """
    with _running_commands_lock:
        _running_commands.remove(pid)
def get_running_commands():
    """
    Returns a snapshot of the list of commands started by run/run_get_output/run_command/run_pipe that are
    currently being tracked as running.

    NOTE: This function is not synchronized with process completion, so the returned array may include processes that have
          already completed. Also, keep in mind that by the time this function returns additional processes may have
          started or completed.
    """
    with _running_commands_lock:
        # hand out a copy, since the call may originate on another thread
        return list(_running_commands)