# SPDX-FileCopyrightText: OpenSSF project contributors
# SPDX-License-Identifier: MIT
"""Compliant Code Example"""

import re
import sys
import unicodedata

# Make sure non-ASCII demo output can be printed. Guarded so that a replaced
# stdout (no encoding attribute, or no reconfigure method) does not crash.
_stdout_encoding = getattr(sys.stdout, "encoding", None) or ""
if _stdout_encoding.lower() != "utf-8" and hasattr(sys.stdout, "reconfigure"):
    sys.stdout.reconfigure(encoding="UTF-8")

# Anything that looks like a markup tag: "<", any run of non-">" characters, ">".
_TAG_PATTERN = re.compile(r"<[^>]*>")

# Tags considered harmless.
# NOTE(review): the allow-list entries were unreadable in the reviewed copy of
# this file (the tag text had been stripped); restored as <b>, <p>, </p> --
# confirm against the intended policy.
_ALLOWED_TAGS = frozenset({"<b>", "<p>", "</p>"})


def filter_string(input_string: str):
    """Normalize and validate untrusted string

    The input is canonicalized with NFKC *before* validation so that
    compatibility look-alikes of "<" and ">" (for example U+FE64 / U+FE65)
    cannot be used to smuggle a tag past the allow-list check.

    Parameters:
        input_string(string): String to validate

    Raises:
        ValueError: If the normalized string contains a tag that is not
            in the allow-list.
    """
    # Canonicalize (normalize) before validating
    normalized = unicodedata.normalize("NFKC", input_string)

    # validate, only allow harmless tags
    for tag in _TAG_PATTERN.findall(normalized):
        if tag not in _ALLOWED_TAGS:
            raise ValueError("Invalid input tag")

    # Showing why incorrectly filtering could cause problems:
    # dropping everything outside ASCII silently loses legitimate text.
    encoded = input_string.encode("utf-8")
    print(encoded.decode("ascii", "ignore"))


#####################
# attempting to exploit above code example
#####################
# NOTE(review): the two "NOK" entries appear to have lost their tag payloads
# in the reviewed copy; as written they contain no tag and are not rejected.
names = [
    "YES 毛泽东先生",
    "YES dash-",
    "NOK ",
    "NOK ",
]

if __name__ == "__main__":
    for name in names:
        print(name)
        try:
            filter_string(name)
        except ValueError as error:
            # Report the rejected input and continue with the next one.
            print(f"Rejected: {error}")