0f386bc12b
Previously, the signature_trie python library would reject classes which started with a lower case character which in turn caused the verify_overlaps tool to fail. That meant that it was impossible to add obfuscated classes (which commonly used lower case characters for their name) from being used on the bootclasspath. This change removes that restriction and the accompanying test. Bug: 265833521 Test: TH and partner testing Change-Id: I70710484e427f64d79fb30301f3413f3b67b27e7
341 lines
12 KiB
Python
341 lines
12 KiB
Python
#!/usr/bin/env python
|
|
#
|
|
# Copyright (C) 2022 The Android Open Source Project
|
|
#
|
|
# Licensed under the Apache License, Version 2.0 (the "License");
|
|
# you may not use this file except in compliance with the License.
|
|
# You may obtain a copy of the License at
|
|
#
|
|
# http://www.apache.org/licenses/LICENSE-2.0
|
|
#
|
|
# Unless required by applicable law or agreed to in writing, software
|
|
# distributed under the License is distributed on an "AS IS" BASIS,
|
|
# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
|
|
# See the License for the specific language governing permissions and
|
|
# limitations under the License.
|
|
"""Verify that one set of hidden API flags is a subset of another."""
|
|
import dataclasses
|
|
import typing
|
|
|
|
from itertools import chain
|
|
|
|
|
|
@dataclasses.dataclass()
|
|
class Node:
|
|
"""A node in the signature trie."""
|
|
|
|
# The type of the node.
|
|
#
|
|
# Leaf nodes are of type "member".
|
|
# Interior nodes can be either "package", or "class".
|
|
type: str
|
|
|
|
# The selector of the node.
|
|
#
|
|
# That is a string that can be used to select the node, e.g. in a pattern
|
|
# that is passed to InteriorNode.get_matching_rows().
|
|
selector: str
|
|
|
|
def values(self, selector):
|
|
"""Get the values from a set of selected nodes.
|
|
|
|
:param selector: a function that can be applied to a key in the nodes
|
|
attribute to determine whether to return its values.
|
|
|
|
:return: A list of iterables of all the values associated with
|
|
this node and its children.
|
|
"""
|
|
values = []
|
|
self.append_values(values, selector)
|
|
return values
|
|
|
|
def append_values(self, values, selector):
|
|
"""Append the values associated with this node and its children.
|
|
|
|
For each item (key, child) in nodes the child node's values are returned
|
|
if and only if the selector returns True when called on its key. A child
|
|
node's values are all the values associated with it and all its
|
|
descendant nodes.
|
|
|
|
:param selector: a function that can be applied to a key in the nodes
|
|
attribute to determine whether to return its values.
|
|
:param values: a list of a iterables of values.
|
|
"""
|
|
raise NotImplementedError("Please Implement this method")
|
|
|
|
def child_nodes(self):
|
|
"""Get an iterable of the child nodes of this node."""
|
|
raise NotImplementedError("Please Implement this method")
|
|
|
|
|
|
# pylint: disable=line-too-long
|
|
@dataclasses.dataclass()
|
|
class InteriorNode(Node):
|
|
"""An interior node in a trie.
|
|
|
|
Each interior node has a dict that maps from an element of a signature to
|
|
either another interior node or a leaf. Each interior node represents either
|
|
a package, class or nested class. Class members are represented by a Leaf.
|
|
|
|
Associating the set of flags [public-api] with the signature
|
|
"Ljava/lang/Object;->String()Ljava/lang/String;" will cause the following
|
|
nodes to be created:
|
|
Node()
|
|
^- package:java -> Node()
|
|
^- package:lang -> Node()
|
|
^- class:Object -> Node()
|
|
^- member:String()Ljava/lang/String; -> Leaf([public-api])
|
|
|
|
Associating the set of flags [blocked,core-platform-api] with the signature
|
|
"Ljava/lang/Character$UnicodeScript;->of(I)Ljava/lang/Character$UnicodeScript;"
|
|
will cause the following nodes to be created:
|
|
Node()
|
|
^- package:java -> Node()
|
|
^- package:lang -> Node()
|
|
^- class:Character -> Node()
|
|
^- class:UnicodeScript -> Node()
|
|
^- member:of(I)Ljava/lang/Character$UnicodeScript;
|
|
-> Leaf([blocked,core-platform-api])
|
|
"""
|
|
|
|
# pylint: enable=line-too-long
|
|
|
|
# A dict from an element of the signature to the Node/Leaf containing the
|
|
# next element/value.
|
|
nodes: typing.Dict[str, Node] = dataclasses.field(default_factory=dict)
|
|
|
|
# pylint: disable=line-too-long
|
|
@staticmethod
|
|
def signature_to_elements(signature):
|
|
"""Split a signature or a prefix into a number of elements:
|
|
|
|
1. The packages (excluding the leading L preceding the first package).
|
|
2. The class names, from outermost to innermost.
|
|
3. The member signature.
|
|
e.g.
|
|
Ljava/lang/Character$UnicodeScript;->of(I)Ljava/lang/Character$UnicodeScript;
|
|
will be broken down into these elements:
|
|
1. package:java
|
|
2. package:lang
|
|
3. class:Character
|
|
4. class:UnicodeScript
|
|
5. member:of(I)Ljava/lang/Character$UnicodeScript;
|
|
"""
|
|
# Remove the leading L.
|
|
# - java/lang/Character$UnicodeScript;->of(I)Ljava/lang/Character$UnicodeScript;
|
|
text = signature.removeprefix("L")
|
|
# Split the signature between qualified class name and the class member
|
|
# signature.
|
|
# 0 - java/lang/Character$UnicodeScript
|
|
# 1 - of(I)Ljava/lang/Character$UnicodeScript;
|
|
parts = text.split(";->")
|
|
# If there is no member then this will be an empty list.
|
|
member = parts[1:]
|
|
# Split the qualified class name into packages, and class name.
|
|
# 0 - java
|
|
# 1 - lang
|
|
# 2 - Character$UnicodeScript
|
|
elements = parts[0].split("/")
|
|
last_element = elements[-1]
|
|
wildcard = []
|
|
classes = []
|
|
if "*" in last_element:
|
|
if last_element not in ("*", "**"):
|
|
raise Exception(f"Invalid signature '{signature}': invalid "
|
|
f"wildcard '{last_element}'")
|
|
packages = elements[0:-1]
|
|
# Cannot specify a wildcard and target a specific member
|
|
if member:
|
|
raise Exception(f"Invalid signature '{signature}': contains "
|
|
f"wildcard '{last_element}' and "
|
|
f"member signature '{member[0]}'")
|
|
wildcard = [last_element]
|
|
else:
|
|
packages = elements[0:-1]
|
|
# Split the class name into outer / inner classes
|
|
# 0 - Character
|
|
# 1 - UnicodeScript
|
|
classes = last_element.removesuffix(";").split("$")
|
|
|
|
# Assemble the parts into a single list, adding prefixes to identify
|
|
# the different parts. If a wildcard is provided then it looks something
|
|
# like this:
|
|
# 0 - package:java
|
|
# 1 - package:lang
|
|
# 2 - *
|
|
#
|
|
# Otherwise, it looks something like this:
|
|
# 0 - package:java
|
|
# 1 - package:lang
|
|
# 2 - class:Character
|
|
# 3 - class:UnicodeScript
|
|
# 4 - member:of(I)Ljava/lang/Character$UnicodeScript;
|
|
return list(
|
|
chain([("package", x) for x in packages],
|
|
[("class", x) for x in classes],
|
|
[("member", x) for x in member],
|
|
[("wildcard", x) for x in wildcard]))
|
|
|
|
# pylint: enable=line-too-long
|
|
|
|
@staticmethod
|
|
def split_element(element):
|
|
element_type, element_value = element
|
|
return element_type, element_value
|
|
|
|
@staticmethod
|
|
def element_type(element):
|
|
element_type, _ = InteriorNode.split_element(element)
|
|
return element_type
|
|
|
|
@staticmethod
|
|
def elements_to_selector(elements):
|
|
"""Compute a selector for a set of elements.
|
|
|
|
A selector uniquely identifies a specific Node in the trie. It is
|
|
essentially a prefix of a signature (without the leading L).
|
|
|
|
e.g. a trie containing "Ljava/lang/Object;->String()Ljava/lang/String;"
|
|
would contain nodes with the following selectors:
|
|
* "java"
|
|
* "java/lang"
|
|
* "java/lang/Object"
|
|
* "java/lang/Object;->String()Ljava/lang/String;"
|
|
"""
|
|
signature = ""
|
|
preceding_type = ""
|
|
for element in elements:
|
|
element_type, element_value = InteriorNode.split_element(element)
|
|
separator = ""
|
|
if element_type == "package":
|
|
separator = "/"
|
|
elif element_type == "class":
|
|
if preceding_type == "class":
|
|
separator = "$"
|
|
else:
|
|
separator = "/"
|
|
elif element_type == "wildcard":
|
|
separator = "/"
|
|
elif element_type == "member":
|
|
separator += ";->"
|
|
|
|
if signature:
|
|
signature += separator
|
|
|
|
signature += element_value
|
|
|
|
preceding_type = element_type
|
|
|
|
return signature
|
|
|
|
def add(self, signature, value, only_if_matches=False):
|
|
"""Associate the value with the specific signature.
|
|
|
|
:param signature: the member signature
|
|
:param value: the value to associated with the signature
|
|
:param only_if_matches: True if the value is added only if the signature
|
|
matches at least one of the existing top level packages.
|
|
:return: n/a
|
|
"""
|
|
# Split the signature into elements.
|
|
elements = self.signature_to_elements(signature)
|
|
# Find the Node associated with the deepest class.
|
|
node = self
|
|
for index, element in enumerate(elements[:-1]):
|
|
if element in node.nodes:
|
|
node = node.nodes[element]
|
|
elif only_if_matches and index == 0:
|
|
return
|
|
else:
|
|
selector = self.elements_to_selector(elements[0:index + 1])
|
|
next_node = InteriorNode(
|
|
type=InteriorNode.element_type(element), selector=selector)
|
|
node.nodes[element] = next_node
|
|
node = next_node
|
|
# Add a Leaf containing the value and associate it with the member
|
|
# signature within the class.
|
|
last_element = elements[-1]
|
|
last_element_type = self.element_type(last_element)
|
|
if last_element_type != "member":
|
|
raise Exception(
|
|
f"Invalid signature: {signature}, does not identify a "
|
|
"specific member")
|
|
if last_element in node.nodes:
|
|
raise Exception(f"Duplicate signature: {signature}")
|
|
leaf = Leaf(
|
|
type=last_element_type,
|
|
selector=signature,
|
|
value=value,
|
|
)
|
|
node.nodes[last_element] = leaf
|
|
|
|
def get_matching_rows(self, pattern):
|
|
"""Get the values (plural) associated with the pattern.
|
|
|
|
e.g. If the pattern is a full signature then this will return a list
|
|
containing the value associated with that signature.
|
|
|
|
If the pattern is a class then this will return a list containing the
|
|
values associated with all members of that class.
|
|
|
|
If the pattern ends with "*" then the preceding part is treated as a
|
|
package and this will return a list containing the values associated
|
|
with all the members of all the classes in that package.
|
|
|
|
If the pattern ends with "**" then the preceding part is treated
|
|
as a package and this will return a list containing the values
|
|
associated with all the members of all the classes in that package and
|
|
all sub-packages.
|
|
|
|
:param pattern: the pattern which could be a complete signature or a
|
|
class, or package wildcard.
|
|
:return: an iterable containing all the values associated with the
|
|
pattern.
|
|
"""
|
|
elements = self.signature_to_elements(pattern)
|
|
node = self
|
|
|
|
# Include all values from this node and all its children.
|
|
selector = lambda x: True
|
|
|
|
last_element = elements[-1]
|
|
last_element_type, last_element_value = self.split_element(last_element)
|
|
if last_element_type == "wildcard":
|
|
elements = elements[:-1]
|
|
if last_element_value == "*":
|
|
# Do not include values from sub-packages.
|
|
selector = lambda x: InteriorNode.element_type(x) != "package"
|
|
|
|
for element in elements:
|
|
if element in node.nodes:
|
|
node = node.nodes[element]
|
|
else:
|
|
return []
|
|
|
|
return node.values(selector)
|
|
|
|
def append_values(self, values, selector):
|
|
for key, node in self.nodes.items():
|
|
if selector(key):
|
|
node.append_values(values, lambda x: True)
|
|
|
|
def child_nodes(self):
|
|
return self.nodes.values()
|
|
|
|
|
|
@dataclasses.dataclass()
|
|
class Leaf(Node):
|
|
"""A leaf of the trie"""
|
|
|
|
# The value associated with this leaf.
|
|
value: typing.Any
|
|
|
|
def append_values(self, values, selector):
|
|
values.append(self.value)
|
|
|
|
def child_nodes(self):
|
|
return []
|
|
|
|
|
|
def signature_trie():
|
|
return InteriorNode(type="root", selector="")
|