| 12345678910111213141516171819202122232425262728293031323334353637383940414243444546474849505152535455565758596061626364656667686970717273747576 |
- # Copyright (c) Microsoft Corporation.
- #
- # Licensed under the Apache License, Version 2.0 (the "License");
- # you may not use this file except in compliance with the License.
- # You may obtain a copy of the License at
- #
- # http://www.apache.org/licenses/LICENSE-2.0
- #
- # Unless required by applicable law or agreed to in writing, software
- # distributed under the License is distributed on an "AS IS" BASIS,
- # WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
- # See the License for the specific language governing permissions and
- # limitations under the License.
- import json
- import re
- from typing import Pattern, Union
def escape_regex_flags(pattern: Pattern) -> str:
    """Return the single-letter flag suffix for a compiled pattern.

    The result contains ``i`` for ``re.IGNORECASE``, ``s`` for ``re.DOTALL``
    and ``m`` for ``re.MULTILINE``, in that order, and is empty when none of
    them is set. ``re.UNICODE`` is tolerated but contributes no letter.

    Raises:
        AssertionError: if the pattern carries any other flag.
    """
    # Order matters: the letters are emitted in the order listed here.
    letter_by_bit = (
        (int(re.IGNORECASE), "i"),
        (int(re.DOTALL), "s"),
        (int(re.MULTILINE), "m"),
    )
    active = pattern.flags
    suffix = "".join(letter for bit, letter in letter_by_bit if (active & bit) != 0)

    permitted = (
        int(re.MULTILINE) | int(re.IGNORECASE) | int(re.DOTALL) | int(re.UNICODE)
    )
    assert (
        active & ~permitted == 0
    ), "Unexpected re.Pattern flag, only MULTILINE, IGNORECASE and DOTALL are supported."
    return suffix
def escape_for_regex(text: str) -> str:
    r"""Backslash-escape the regex metacharacters found in *text*.

    Each of the characters ``. * + ? ^ > $ { } ( ) | [ ] \`` is prefixed with
    a backslash; every other character is copied through unchanged.
    """
    # "\g<0>" is Python's whole-match reference. The previous replacement used
    # JavaScript's "$&", which re.sub() writes out literally, so every special
    # character was replaced by the text "\$&" instead of being escaped.
    return re.sub(r"[.*+?^>${}()|[\]\\]", r"\\\g<0>", text)
def escape_regex_for_selector(text: Pattern) -> str:
    r"""Render a compiled pattern as a ``/source/flags`` selector literal.

    Quote characters (``"``, ``'`` and backtick) in the pattern source that
    are not already escaped get a backslash in front of them, and every
    ``>>`` becomes ``\>\>``. The trailing flag letters come from
    ``escape_regex_flags``.
    """
    # Even number of backslashes followed by the quote -> insert a backslash.
    # The lookbehind anchors the match at the start of the backslash run
    # without consuming the character in front of it. Consuming that character
    # (as "(^|[^\\])" does) makes the scan skip any quote that directly follows
    # a previous match, e.g. the second quote in "" was left unescaped.
    source = re.sub(r'(?<!\\)((?:\\\\)*)(["\'`])', r"\1\\\2", text.pattern)
    source = source.replace(">>", "\\>\\>")
    return "/" + source + "/" + escape_regex_flags(text)
def escape_for_text_selector(
    text: Union[str, Pattern[str]], exact: bool = None, case_sensitive: bool = None
) -> str:
    """Encode *text* for use in a text selector.

    Compiled patterns are handed to ``escape_regex_for_selector``. Anything
    else is serialized with ``json.dumps`` and suffixed with ``s`` when
    *exact* is truthy, otherwise with ``i``. *case_sensitive* is accepted
    but not consulted by this function.
    """
    if not isinstance(text, Pattern):
        suffix = "s" if exact else "i"
        return f"{json.dumps(text)}{suffix}"
    return escape_regex_for_selector(text)
def escape_for_attribute_selector(
    value: Union[str, Pattern], exact: bool = None
) -> str:
    """Encode *value* for use inside an attribute selector.

    Compiled patterns are handed to ``escape_regex_for_selector``. Strings
    are wrapped in double quotes with backslashes and double quotes
    backslash-escaped, then suffixed with ``s`` when *exact* is truthy,
    otherwise with ``i``.
    """
    if isinstance(value, Pattern):
        return escape_regex_for_selector(value)
    # TODO: this should actually be
    #   cssEscape(value).replace(/\\ /g, ' ')
    # However, our attribute selectors do not conform to CSS parsing spec,
    # so we escape them differently.
    # One pass over the string: each backslash is doubled and each double
    # quote gets a backslash in front of it.
    escapes = {ord("\\"): "\\\\", ord('"'): '\\"'}
    quoted = '"' + value.translate(escapes) + '"'
    mode = "s" if exact else "i"
    return quoted + mode
|