# -*- coding: utf-8 -*-
 
# Part of the LLVM Project, under the Apache License v2.0 with LLVM Exceptions.
 
# See https://llvm.org/LICENSE.txt for license information.
 
# SPDX-License-Identifier: Apache-2.0 WITH LLVM-exception
 
""" This module implements basic shell escaping/unescaping methods. """
 
 
 
import re
 
import shlex
 
 
 
# Names exported by 'from <module> import *'.
__all__ = ['encode', 'decode']
 
 
 
 
 
def encode(command):
    """ Takes a command as list and returns a string.

    Backslashes and double quotes of every argument are escaped with a
    backslash. An argument is additionally wrapped in double quotes when
    it is empty, when it contains an unprotected shell meta character or
    whitespace, or when it ends inside an unfinished quote or escape.
    The encoded arguments are joined with a single space.

    :param command: iterable of argument strings.
    :return:        the command as a single string. """

    # Characters with a special meaning for the shell when unprotected.
    reserved = {' ', '$', '%', '&', '(', ')', '[', ']', '{', '}', '*', '|',
                '<', '>', '@', '?', '!'}
    # Characters which complete a backslash escape. Built once here instead
    # of on every iteration of the scanning loop.
    escapable = reserved | {'\\'}
    # Whitespace other than the plain space. shlex.split (used by decode)
    # separates words on these too, so they need the same protection.
    whitespace = {'\t', '\n', '\r'}

    def needs_quote(word):
        """ Returns true if the argument needs to be protected by quotes.

        An earlier implementation relied on shlex.split, which was not
        suitable for this job. The word is scanned with a small state
        machine instead:

          0 - plain text,
          1 - right after a backslash,
          2 - inside double quotes,
          3 - inside single quotes. """

        if not word:
            # An empty argument would silently vanish from the joined
            # command line unless it is written as "".
            return True

        state = 0
        for current in word:
            if state == 0 and (current in reserved or current in whitespace):
                return True
            elif state == 0 and current == '\\':
                state = 1
            elif state == 1 and current in escapable:
                state = 0
            elif state == 0 and current == '"':
                state = 2
            elif state == 2 and current == '"':
                state = 0
            elif state == 0 and current == "'":
                state = 3
            elif state == 3 and current == "'":
                state = 0
        # Ending anywhere but in plain text means a dangling escape or an
        # unterminated quote, which has to be protected as well.
        return state != 0

    def escape(word):
        """ Escapes the argument and wraps it in quotes if needed. """

        table = {'\\': '\\\\', '"': '\\"'}
        escaped = ''.join(table.get(c, c) for c in word)

        return '"' + escaped + '"' if needs_quote(word) else escaped

    return " ".join(escape(arg) for arg in command)
 
 
 
 
 
def decode(string):
    """ Takes a command string and returns as a list.

    The string is split into words by shlex.split, then every word is
    passed through a second unescaping step.

    :param string:  the command as a single string.
    :return:        list of the decoded arguments. """

    # Backslash escapes recognised inside a word that is still enclosed
    # in double quotes.
    quoted_pattern = r'\\(["\\])'
    # Backslash escapes recognised in any other word.
    plain_pattern = r'\\([\\ $%&\(\)\[\]\{\}\*|<>@?!])'

    def strip_escapes(token):
        """ Removes the enclosing quotes and the escaping backslashes. """

        enclosed = (len(token) >= 2
                    and token[0] == '"'
                    and token[-1] == '"')
        if not enclosed:
            return re.sub(plain_pattern, r'\1', token)
        return re.sub(quoted_pattern, r'\1', token[1:-1])

    tokens = shlex.split(string)
    return [strip_escapes(token) for token in tokens]