# Copyright (c) Microsoft Corporation. # # Licensed under the Apache License, Version 2.0 (the "License"); # you may not use this file except in compliance with the License. # You may obtain a copy of the License at # # http://www.apache.org/licenses/LICENSE-2.0 # # Unless required by applicable law or agreed to in writing, software # distributed under the License is distributed on an "AS IS" BASIS, # WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. # See the License for the specific language governing permissions and # limitations under the License. import re # https://developer.mozilla.org/en-US/docs/Web/JavaScript/Guide/Regular_expressions#escaping escaped_chars = {"$", "^", "+", ".", "*", "(", ")", "|", "\\", "?", "{", "}", "[", "]"} def glob_to_regex(glob: str) -> "re.Pattern[str]": tokens = ["^"] in_group = False i = 0 while i < len(glob): c = glob[i] if c == "\\" and i + 1 < len(glob): char = glob[i + 1] tokens.append("\\" + char if char in escaped_chars else char) i += 1 elif c == "*": before_deep = glob[i - 1] if i > 0 else None star_count = 1 while i + 1 < len(glob) and glob[i + 1] == "*": star_count += 1 i += 1 after_deep = glob[i + 1] if i + 1 < len(glob) else None is_deep = ( star_count > 1 and (before_deep == "/" or before_deep is None) and (after_deep == "/" or after_deep is None) ) if is_deep: tokens.append("((?:[^/]*(?:/|$))*)") i += 1 else: tokens.append("([^/]*)") else: if c == "?": tokens.append(".") elif c == "[": tokens.append("[") elif c == "]": tokens.append("]") elif c == "{": in_group = True tokens.append("(") elif c == "}": in_group = False tokens.append(")") elif c == "," and in_group: tokens.append("|") else: tokens.append("\\" + c if c in escaped_chars else c) i += 1 tokens.append("$") return re.compile("".join(tokens))