Skip to content
New issue

Have a question about this project? Sign up for a free GitHub account to open an issue and contact its maintainers and the community.

By clicking “Sign up for GitHub”, you agree to our terms of service and privacy statement. We’ll occasionally send you account related emails.

Already on GitHub? Sign in to your account

Feature/additional secrets improvements #80

Open
wants to merge 14 commits into
base: dev
Choose a base branch
from
Open
2 changes: 1 addition & 1 deletion pyproject.toml
Original file line number Diff line number Diff line change
Expand Up @@ -4,7 +4,7 @@

[tool.poetry]
name="pyracf"
version="1.0b5"
version="1.0b6"
description="Python interface to RACF using IRRSMO00 RACF Callable Service."
license = "Apache-2.0"
authors = [
Expand Down
30 changes: 29 additions & 1 deletion pyracf/common/security_admin.py
Original file line number Diff line number Diff line change
Expand Up @@ -54,6 +54,8 @@ class SecurityAdmin:

_valid_segment_traits = {}
_extracted_key_value_pair_segment_traits_map = {}
# Use this structure to map traits to their RACF keywords and Message keywords for redaction
_racf_trait_and_message_key_map = {"trait_map": {}, "message_map": {}}
_case_sensitive_extracted_values = []
__running_userid = None
_logger = Logger()
Expand Down Expand Up @@ -170,24 +172,49 @@ def __raw_dump(self) -> None:
if self.__debug:
# Note, since the hex dump is logged to the console,
# secrets will be redacted.
self._logger.log_hex_dump(raw_result_xml, self.__secret_traits)
self._logger.log_hex_dump(
raw_result_xml,
self.__secret_traits,
self._racf_trait_and_message_key_map,
)

# ============================================================================
# Secrets Redaction
# ============================================================================
def __add_additional_secret_traits(self, additional_secret_traits: list) -> None:
"""Add additional fields to be redacted in logger output."""
unsupported_profile_types = ["permission", "groupConnection", "systemSettings"]
error_message = (
f"Cannot add specified additional secrets to '{self._profile_type}' object."
Copy link
Member

Choose a reason for hiding this comment

The reason will be displayed to describe this comment to others. Learn more.

You should be able to use inspect.stack() here to get the name of the "admin" class (i.e., UserAdmin):

admin_class = "".join(class_tokens)

Also change the word object to type and change Cannot to Unable.

You should get an exception message like this when you are done:

Unable to add specified additional secrets to 'UserAdmin' type.

Make similar corresponding changes to the unsupported profile type exception message.

)
if self._profile_type in unsupported_profile_types:
error_message = error_message + (
f"\n'{self._profile_type}' object does not support additional secrets redaction."
)
raise ValueError(error_message)
bad_secret_traits = []
for secret in additional_secret_traits:
if secret in self.__secret_traits:
continue
if ":" not in secret:
bad_secret_traits.append(
f"\nCould not map {secret} to a valid segment trait."
Copy link
Member

Choose a reason for hiding this comment

The reason will be displayed to describe this comment to others. Learn more.

I think it is sufficient to say "\n'{secret}' is not a valid trait."

)
continue
segment = secret.split(":")[0]
if segment not in self._valid_segment_traits:
bad_secret_traits.append(
f"\nCould not map {secret} to a valid segment trait."
)
continue
if secret not in self._valid_segment_traits[segment]:
bad_secret_traits.append(
f"\nCould not map {secret} to a valid segment trait."
)
continue
self.__secret_traits[secret] = self._valid_segment_traits[segment][secret]
if bad_secret_traits:
raise ValueError(error_message + "".join(bad_secret_traits))

# ============================================================================
# Request Execution
Expand Down Expand Up @@ -242,6 +269,7 @@ def _make_request(
self.__running_userid,
),
self.__secret_traits,
self._racf_trait_and_message_key_map,
)
self.__clear_state(security_request)
if isinstance(raw_result, list):
Expand Down
161 changes: 136 additions & 25 deletions pyracf/common/utilities/logger.py
Original file line number Diff line number Diff line change
Expand Up @@ -149,49 +149,122 @@ def __redact_request_dictionary(
def __redact_string(
self,
input_string: Union[str, bytes],
start_ind: int,
end_pattern: Union[str, bytes],
):
"""
Redacts characters in a string between a starting index and ending pattern.
trait_key: str,
) -> Union[str, bytes]:
r"""
Redacts characters in a string between a starting index and ending tag.
Replaces the identified characters with '********' regardless of the original length.

This function employs the following regular expressions explained below

Regex 1 ("quoted") - {trait_key.upper()}( +){{0,}}\(\'.*?(?<!\')\'\)
This is designed to match the pattern TRAIT('value') by matching the TRAIT name, a
variable (potentially zero) amount of spaces, then the ('value') portion which must
start and end with (' and '), but can conceivably contain any characters, but a negative
lookbehind is used to look for any unescaped single quotes that would indicate the matching
of ') is otherwise a coincidence.

Regex 2 ("nested") - {trait_key.upper()}( +){{0,}}\([^)]*\(.*\)( +){{0,}}\)
This is designed to match the pattern TRAIT( subtrait1(value) subtrait2(value)) by
matching the TRAIT name, a variable (potentially zero) amount of spaces, then the
( subtrait1(value) subtrait2(value)) portion which must start and end with ( and ),
but must also contain a'(' before the ')'. This indicates that there is a "nested"
structure rather than a sequential one. In the example, this portion of the pattern
matches '( subtrait1(', but would not match '(value) subtrait2(' because of the ')'
character between the two '(' characters. The pattern looks for these nested open
parenthesis as a sequence would have a ')' character between them. Then the expression
allows any non-newline characters to handle all possible trait values and subtrait names
followed by the "end pattern" of ')' and ')' separated by a variable (potentially zero)
whitespace.

If neither of these two patterns is found for a supplied trait_key, then it is assumed
this trait is set with the default pattern below.

Regex 3 ("default") - {trait_key.upper()}( +){{0,}}\(.*?(?<!\\)\)
This is designed to match the pattern TRAIT(value) by matching the TRAIT name, a variable
(potentially zero) amount of spaces, then the (value) portion which must start and end
with '(' and ')', but can conceivably contain any characters, but a negative lookbehind
is used to look for any escape character '\' that would indicate the matching of the
'(' and ')' is otherwise a coincidence.

In all replacement expressions, the variable amounts of whitespace are captured so that
they can be preserved by this redaction operations.

"""
asterisks = "********"
is_bytes = False
quoted_regex = rf"{trait_key.upper()}( +){{0,}}\(\'.*?(?<!\')\'\)"
nested_regex = rf"{trait_key.upper()}( +){{0,}}\([^)]*\(.*\)( +){{0,}}\)"
default_regex = rf"{trait_key.upper()}( +){{0,}}\(.*?(?<!\\)\)"
redacted_regex = rf"{trait_key.upper()}\1({asterisks})"
redacted_w_quotes_regex = rf"{trait_key.upper()}\1('{asterisks}')"
if isinstance(input_string, bytes):
asterisks = asterisks.encode("cp1047")
pre_keyword = input_string[:start_ind]
post_keyword = end_pattern.join(input_string[start_ind:].split(end_pattern)[1:])
return pre_keyword + asterisks + end_pattern + post_keyword
input_string = input_string.decode("cp1047")
is_bytes = True
quoted = re.search(quoted_regex, input_string)
nested = re.search(nested_regex, input_string)
if quoted is not None:
input_string = re.sub(
quoted_regex,
redacted_w_quotes_regex,
input_string,
)
else:
if nested is not None:
input_string = re.sub(
nested_regex,
redacted_regex,
input_string,
)
else:
input_string = re.sub(
default_regex,
redacted_regex,
input_string,
)
if is_bytes:
return input_string.encode("cp1047")
return input_string

def redact_request_xml(
self,
xml_string: Union[str, bytes],
secret_traits: dict,
) -> Union[str, bytes]:
"""
r"""
lcarcaramo marked this conversation as resolved.
Show resolved Hide resolved
Redact a list of specific secret traits in a request xml string or bytes object.
Based the following xml pattern:
'<xmltag attribute="any">xml value</xmltag>'
This function also accounts for any number of arbitrary xml attributes.

This function employs the following regular expression:
{xml_key}(.*)>.*<\/{xml_key} - Designed to match the above pattern by starting and ending
with the xmltag string as shown, but the starting tag allows for any characters between
"xmltag" and the > character to allow for the attribute specification shown above. This
results in the starting of the xml as {xml_key}(.*)> and the ending as <\/{xml_key}.
The characters between the xml tags are "captured" as a variable and preserved by the
substitution operation through the use of the \1 supplied in the replacement string.
Between these tags, any non-newline characters are allowed using the .* expression.
"""
is_bytes = False
if isinstance(xml_string, bytes):
is_bytes = True
xml_string = xml_string.decode("utf-8")
for xml_key in secret_traits.values():
match = re.search(rf"\<{xml_key}+[^>]*\>", xml_string)
if not match:
continue
start_tag_end_tag_regex = rf"{xml_key}(.*)>.*<\/{xml_key}"
redacted_regex = rf"{xml_key}\1>********</{xml_key}"
# Delete operation has no end tag and and redaction should not be attempted.
#
# Redact this:
# <tag operation="set">secret</tag>
#
# Don't try to redact this:
# <tag operation="del" />
if f"</{xml_key}>" not in xml_string:
continue
xml_string = self.__redact_string(xml_string, match.end(), f"</{xml_key}")
xml_string = re.sub(
lcarcaramo marked this conversation as resolved.
Show resolved Hide resolved
start_tag_end_tag_regex,
redacted_regex,
xml_string,
)
lcarcaramo marked this conversation as resolved.
Show resolved Hide resolved
lcarcaramo marked this conversation as resolved.
Show resolved Hide resolved
if is_bytes:
xml_string = xml_string.encode("utf-8")
return xml_string
Expand All @@ -200,30 +273,62 @@ def redact_result_xml(
self,
security_result: Union[str, bytes, List[int]],
secret_traits: dict,
racf_trait_and_message_key_map: dict = {},
) -> str:
"""
r"""
Redacts a list of specific secret traits in a result xml string.
Based on the following RACF command pattern:
Based on the following RACF command patterns:
'TRAIT (value)'
'TRAIT (subtrait1(value) subtrait2(value))
"TRAIT ('value')"
This function also accounts for varied amounts of whitespace in the pattern.

This function employs the following regular expression:
<message>([A-Z]*[0-9]*[A-Z]) [^<>]*{racf_key.upper()}[^<>]*<\/message>" -
Designed to match the above pattern by starting and ending with the message xml tag
string as shown, the value of the message is targeted based on the racf_key. This
should capture only messages that contain information about a redacted key.
The message identifier is "captured" as a variable and preserved by the substitution
operation through the use of the \1 supplied in the replacement string.
"""
if isinstance(security_result, list):
return security_result
for xml_key in secret_traits.values():
racf_key = xml_key.split(":")[1] if ":" in xml_key else xml_key
end_pattern = ")"
if racf_key in racf_trait_and_message_key_map.get("trait_map", {}):
racf_key = racf_trait_and_message_key_map["trait_map"][racf_key]
racf_command_argument_regex = rf"{racf_key.upper()}( +){{0,}}\("
if isinstance(security_result, bytes):
match = re.search(
rf"{racf_key.upper()} +\(", security_result.decode("cp1047")
racf_command_argument_regex, security_result.decode("cp1047")
)
end_pattern = end_pattern.encode("cp1047")
else:
match = re.search(rf"{racf_key.upper()} +\(", security_result)
match = re.search(rf"{racf_key.upper()}( +){{0,}}\(", security_result)
Copy link
Member

Choose a reason for hiding this comment

The reason will be displayed to describe this comment to others. Learn more.

match = re.search(racf_command_argument_regex, security_result)

if not match:
continue
security_result = self.__redact_string(
security_result, match.end(), end_pattern
security_result = self.__redact_string(security_result, racf_key)
if racf_key in racf_trait_and_message_key_map.get("message_map", {}):
Copy link
Member

@lcarcaramo lcarcaramo Mar 6, 2024

Choose a reason for hiding this comment

The reason will be displayed to describe this comment to others. Learn more.

Comments to indicate which stage of processing we are at? Looks like there are two steps. Redact the "RACF command" and redact any corresponding "RACF messages"

racf_key = racf_trait_and_message_key_map["message_map"][racf_key]
racf_message_regex = (
r"<message>([A-Z]*[0-9]*[A-Z]) [^<>]*"
+ rf"{racf_key.upper()}[^<>]*<\/message>"
)
redacted_racf_message_regex = (
rf"<message>REDACTED MESSAGE CONCERNING {racf_key.upper()}, "
+ r"REVIEW DOCUMENTATION OF \1 FOR MORE INFORMATION</message>"
)
if isinstance(security_result, bytes):
security_result = re.sub(
racf_message_regex,
redacted_racf_message_regex,
security_result.decode("cp1047"),
).encode("cp1047")
else:
security_result = re.sub(
racf_message_regex,
redacted_racf_message_regex,
security_result,
)
Copy link
Member

Choose a reason for hiding this comment

The reason will be displayed to describe this comment to others. Learn more.

Also explain how these regexes work.

Copy link
Collaborator Author

Choose a reason for hiding this comment

The reason will be displayed to describe this comment to others. Learn more.

Added the following:

    This function employs the following regular expression:
    <message>([A-Z]*[0-9]*[A-Z]) [^<>]*{racf_key.upper()}[^<>]*<\/message>" - 
    Designed to match the above pattern by starting and ending with the message xml tag 
    string as shown, the value of the message is targeted based on the racf_key. This
    should capture only messages that contain information about a redacted key.
    The message identifier is "captured" as a variable and preserved by the substitution
    operation through the use of the \1 supplied in the replacement string.

Copy link
Member

Choose a reason for hiding this comment

The reason will be displayed to describe this comment to others. Learn more.

Just a slight working change suggestion:

Designed to match any message xml element that contains the provided racf_key.

Instead of

Designed to match the above pattern by starting and ending with the message xml tag string as shown, the value of the message is targeted based on the racf_key.

return security_result

def __colorize_json(self, json_text: str) -> str:
Expand Down Expand Up @@ -355,7 +460,12 @@ def __indent_xml(self, minified_xml: str) -> str:
indented_xml += f"{' ' * indent_level}{current_line}\n"
return indented_xml[:-2]

def log_hex_dump(self, raw_result_xml: bytes, secret_traits: dict) -> None:
def log_hex_dump(
self,
raw_result_xml: bytes,
secret_traits: dict,
racf_trait_and_message_key_map: dict,
) -> None:
"""
Log the raw result XML returned by IRRSMO00 as a hex dump.
"""
Expand All @@ -368,6 +478,7 @@ def log_hex_dump(self, raw_result_xml: bytes, secret_traits: dict) -> None:
raw_result_xml = self.redact_result_xml(
raw_result_xml,
secret_traits,
racf_trait_and_message_key_map,
)
for byte in raw_result_xml:
color_function = self.__green
Expand Down
10 changes: 10 additions & 0 deletions pyracf/data_set/data_set_admin.py
Original file line number Diff line number Diff line change
Expand Up @@ -63,6 +63,16 @@ def __init__(
"dfp": {"dfp:owner": "racf:resowner", "dfp:ckds_data_key": "racf:datakey"},
"tme": {"tme:roles": "racf:roles"},
}
self._racf_trait_and_message_key_map["trait_map"] = {
"audaltr": "audit",
"audcntl": "audit",
"audnone": "audit",
"audread": "audit",
"audupdt": "audit",
}
self._racf_trait_and_message_key_map["message_map"] = {
"uacc": "universal access"
}
self._valid_segment_traits["base"].update(
self._common_base_traits_data_set_generic
)
Expand Down
10 changes: 10 additions & 0 deletions pyracf/resource/resource_admin.py
Original file line number Diff line number Diff line change
Expand Up @@ -238,6 +238,16 @@ def __init__(
"sigrequired": "signatureRequired",
},
}
self._racf_trait_and_message_key_map["trait_map"] = {
"audaltr": "audit",
"audcntl": "audit",
"audnone": "audit",
"audread": "audit",
"audupdt": "audit",
}
self._racf_trait_and_message_key_map["message_map"] = {
"uacc": "universal access"
}
super().__init__(
"resource",
irrsmo00_result_buffer_size=irrsmo00_result_buffer_size,
Expand Down
Loading
Loading