Get NDK python script tests running.
Imports weren't working in tests because the package had been created.
The Python "binaries" built by Soong don't seem to take their own
pkg_path into account, so I split the separate pieces of code here out
into their own packages.
Note that the ndk_api_coverage_parser tests do not actually pass
before or after this change (seems like it might be a
non-deterministic ordering issue in the attributes of the generated
output?), but they can at least be run now.
Test: pytest ndkstubgen
Test: pytest symbolfile
Test: pytest ndk_api_coverage_parser
Test: out/host/linux-x86/nativetest64/test_ndkstubgen/test_ndkstubgen
Test: out/host/linux-x86/nativetest64/test_symbolfile/test_symbolfile
Test: out/host/linux-x86/nativetest64/test_ndk_api_coverage_parser/test_ndk_api_coverage_parser
Bug: None
Change-Id: I2ac22f7ced7566e4808070f2f72fd04355846e0b
diff --git a/cc/symbolfile/__init__.py b/cc/symbolfile/__init__.py
new file mode 100644
index 0000000..faa3823
--- /dev/null
+++ b/cc/symbolfile/__init__.py
@@ -0,0 +1,384 @@
+#
+# Copyright (C) 2016 The Android Open Source Project
+#
+# Licensed under the Apache License, Version 2.0 (the "License");
+# you may not use this file except in compliance with the License.
+# You may obtain a copy of the License at
+#
+# http://www.apache.org/licenses/LICENSE-2.0
+#
+# Unless required by applicable law or agreed to in writing, software
+# distributed under the License is distributed on an "AS IS" BASIS,
+# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
+# See the License for the specific language governing permissions and
+# limitations under the License.
+#
+"""Parser for Android's version script information."""
+import logging
+import re
+
+
+# Architecture names that may appear as tags in a symbol file.
+# symbol_in_arch() treats any tag found in this tuple as restricting the
+# tagged symbol or version to the named architectures.
+ALL_ARCHITECTURES = (
+    'arm',
+    'arm64',
+    'x86',
+    'x86_64',
+)
+
+
+# Arbitrary magic number. We use the same one in api-level.h for this purpose.
+# decode_api_level() maps the "current" API level to this value, and
+# symbol_in_api() only exposes symbols tagged "future" at this level.
+FUTURE_API_LEVEL = 10000
+
+
+def logger():
+    """Return the logger that this module reports through."""
+    module_logger = logging.getLogger(__name__)
+    return module_logger
+
+
+def get_tags(line):
+    """Returns a list of all tags on this line.
+
+    Tags are the whitespace-separated words following the first '#' on the
+    line. A line without a '#' yields an empty list.
+    """
+    comment = line.strip().partition('#')[2]
+    # str.split() with no arguments splits on runs of whitespace and never
+    # yields empty strings, so no additional filtering is required.
+    return comment.split()
+
+
+def is_api_level_tag(tag):
+    """Returns true if this tag has an API level that may need decoding.
+
+    Such tags begin with "introduced=", "introduced-" (the per-architecture
+    form) or "versioned=".
+    """
+    api_level_prefixes = ('introduced=', 'introduced-', 'versioned=')
+    return tag.startswith(api_level_prefixes)
+
+
+def decode_api_level(api, api_map):
+    """Decodes the API level argument into the API level number.
+
+    Numeric strings are simply converted to integers. The name "current" maps
+    to FUTURE_API_LEVEL, and any other name (an API codename such as "O") is
+    looked up in api_map.
+
+    Raises:
+        KeyError: The name is not numeric, not "current", and not in api_map.
+    """
+    try:
+        return int(api)
+    except ValueError:
+        # Not a plain number; fall through and treat it as a name.
+        pass
+
+    return FUTURE_API_LEVEL if api == "current" else api_map[api]
+
+
+def decode_api_level_tags(tags, api_map):
+    """Decodes API level code names in a list of tags.
+
+    Every API level tag has its value replaced by the decoded API level
+    number. The list is modified in place and also returned.
+
+    Raises:
+        ParseError: An unknown version name was found in a tag.
+    """
+    for position, tag in enumerate(tags):
+        if is_api_level_tag(tag):
+            key, raw_level = split_tag(tag)
+            try:
+                level = decode_api_level(raw_level, api_map)
+            except KeyError:
+                raise ParseError('Unknown version name in tag: {}'.format(tag))
+            tags[position] = key + '=' + str(level)
+    return tags
+
+
+def split_tag(tag):
+    """Returns a key/value tuple of the tag.
+
+    The tag is split at its first '='; any later '=' stays in the value.
+
+    Raises:
+        ValueError: Tag is not a key/value type tag.
+
+    Returns: Tuple of (key, value) of the tag. Both components are strings.
+    """
+    key, separator, value = tag.partition('=')
+    if not separator:
+        # partition() reports an empty separator when no '=' was found.
+        raise ValueError('Not a key/value tag: ' + tag)
+    return key, value
+
+
+def get_tag_value(tag):
+    """Returns the value of a key/value tag.
+
+    Raises:
+        ValueError: Tag is not a key/value type tag.
+
+    Returns: Value part of tag as a string.
+    """
+    _key, value = split_tag(tag)
+    return value
+
+
+def version_is_private(version):
+    """Returns True if the version name should be treated as private.
+
+    Private versions are those whose name ends in _PRIVATE or _PLATFORM.
+    """
+    private_suffixes = ('_PRIVATE', '_PLATFORM')
+    return version.endswith(private_suffixes)
+
+
+def should_omit_version(version, arch, api, llndk, apex):
+    """Returns True if the version section should be omitted.
+
+    We want to omit any sections that do not have any symbols we'll have in the
+    stub library: private and platform-only sections, sections tagged llndk or
+    apex when neither matching mode is requested, sections that contain
+    entirely future symbols, and sections only for other architectures.
+    """
+    if version_is_private(version.name):
+        return True
+
+    tags = version.tags
+    if 'platform-only' in tags:
+        return True
+
+    # A section tagged llndk and/or apex is only kept when at least one of
+    # the tagged modes was requested; untagged sections are always eligible.
+    tagged_llndk = 'llndk' in tags
+    tagged_apex = 'apex' in tags
+    if tagged_llndk or tagged_apex:
+        wanted = (tagged_llndk and llndk) or (tagged_apex and apex)
+        if not wanted:
+            return True
+
+    return not (symbol_in_arch(tags, arch)
+                and symbol_in_api(tags, arch, api))
+
+
+def should_omit_symbol(symbol, arch, api, llndk, apex):
+    """Returns True if the symbol should be omitted.
+
+    A symbol is omitted when it is tagged llndk and/or apex but none of the
+    tagged modes was requested, or when its tags exclude the given
+    architecture or API level.
+    """
+    tags = symbol.tags
+    tagged_llndk = 'llndk' in tags
+    tagged_apex = 'apex' in tags
+    if tagged_llndk or tagged_apex:
+        wanted = (tagged_llndk and llndk) or (tagged_apex and apex)
+        if not wanted:
+            return True
+
+    return not (symbol_in_arch(tags, arch)
+                and symbol_in_api(tags, arch, api))
+
+
+def symbol_in_arch(tags, arch):
+    """Returns true if the symbol is present for the given architecture."""
+    if arch in tags:
+        return True
+
+    # If there were no arch tags, the symbol is available for all
+    # architectures. If there were any arch tags, the symbol is only available
+    # for the tagged architectures, and ours was not among them.
+    return not any(tag in ALL_ARCHITECTURES for tag in tags)
+
+
+def symbol_in_api(tags, arch, api):
+    """Returns true if the symbol is present for the given API level.
+
+    A "future" tag restricts the symbol to FUTURE_API_LEVEL. Otherwise the
+    symbol is present once `api` reaches its "introduced" level, where an
+    "introduced-<arch>=" tag for `arch` overrides a plain "introduced=" tag.
+    """
+    common_tag = None
+    arch_tag = None
+    for tag in tags:
+        if tag.startswith('introduced='):
+            common_tag = tag
+        elif tag.startswith('introduced-' + arch + '='):
+            arch_tag = tag
+        elif tag == 'future':
+            return api == FUTURE_API_LEVEL
+
+    # If there is an arch-specific tag, it overrides the common one no matter
+    # where either appears in the list.
+    introduced_tag = common_tag if arch_tag is None else arch_tag
+    if introduced_tag is None:
+        # We found no "introduced" tags, so the symbol has always been
+        # available.
+        return True
+
+    return api >= int(get_tag_value(introduced_tag))
+
+
+def symbol_versioned_in_api(tags, api):
+    """Returns true if the symbol should be versioned for the given API.
+
+    This models the `versioned=API` tag. This should be a very uncommonly
+    needed tag, and is really only needed to fix versioning mistakes that are
+    already out in the wild.
+
+    For example, some of libc's __aeabi_* functions were originally placed in
+    the private version, but that was incorrect. They are now in LIBC_N, but
+    when building against any version prior to N we need the symbol to be
+    unversioned (otherwise it won't resolve on M where it is private).
+    """
+    # Only the first "versioned" tag is considered.
+    versioned_tag = next(
+        (tag for tag in tags if tag.startswith('versioned=')), None)
+    if versioned_tag is None:
+        # If there is no "versioned" tag, the symbol has been versioned for
+        # as long as it was introduced.
+        return True
+    return api >= int(get_tag_value(versioned_tag))
+
+
+class ParseError(RuntimeError):
+    """An error that occurred while parsing a symbol file.
+
+    Raised by SymbolFileParser for malformed input and by
+    decode_api_level_tags() when a tag names an unknown API version.
+    """
+
+
+class MultiplyDefinedSymbolError(RuntimeError):
+    """A symbol name was multiply defined.
+
+    Attributes:
+        multiply_defined_symbols: The names that were defined more than once,
+            exactly as passed to the constructor.
+    """
+    def __init__(self, multiply_defined_symbols):
+        names = ', '.join(multiply_defined_symbols)
+        message = (
+            'Version script contains multiple definitions for: {}'.format(
+                names))
+        super(MultiplyDefinedSymbolError, self).__init__(message)
+        self.multiply_defined_symbols = multiply_defined_symbols
+
+
+class Version:
+    """A version block of a symbol file.
+
+    Attributes:
+        name: Name of the version block.
+        base: Name of the version this block is based on, or None.
+        tags: List of tag strings attached to the block.
+        symbols: List of the symbols defined in the block.
+    """
+    def __init__(self, name, base, tags, symbols):
+        self.name = name
+        self.base = base
+        self.tags = tags
+        self.symbols = symbols
+
+    def __eq__(self, other):
+        # Comparing against an unrelated object (e.g. None) must not raise
+        # AttributeError; let Python fall back to its default handling.
+        if not isinstance(other, Version):
+            return NotImplemented
+        return (self.name == other.name
+                and self.base == other.base
+                and self.tags == other.tags
+                and self.symbols == other.symbols)
+
+    def __repr__(self):
+        return 'Version(name={!r}, base={!r}, tags={!r}, symbols={!r})'.format(
+            self.name, self.base, self.tags, self.symbols)
+
+
+class Symbol:
+    """A symbol definition from a symbol file.
+
+    Attributes:
+        name: Name of the symbol.
+        tags: List of tag strings attached to the symbol.
+    """
+    def __init__(self, name, tags):
+        self.name = name
+        self.tags = tags
+
+    def __eq__(self, other):
+        # Comparing against an unrelated object (e.g. None) must not raise
+        # AttributeError; let Python fall back to its default handling.
+        if not isinstance(other, Symbol):
+            return NotImplemented
+        # Tags compare as sets: their order and repetition are not significant.
+        return self.name == other.name and set(self.tags) == set(other.tags)
+
+    def __repr__(self):
+        return 'Symbol(name={!r}, tags={!r})'.format(self.name, self.tags)
+
+
+class SymbolFileParser:
+    """Parses NDK symbol files.
+
+    Attributes:
+        input_file: File-like object the symbol file is read from, one line
+            at a time via readline().
+        api_map: Mapping from API codename to API level number, used to decode
+            API level tags.
+        arch: Architecture used when deciding which symbols are present.
+        api: API level used when deciding which symbols are present.
+        llndk: Whether symbols tagged "llndk" should be kept.
+        apex: Whether symbols tagged "apex" should be kept.
+        current_line: The line most recently returned by next_line(), or None
+            before the first read.
+    """
+    def __init__(self, input_file, api_map, arch, api, llndk, apex):
+        self.input_file = input_file
+        self.api_map = api_map
+        self.arch = arch
+        self.api = api
+        self.llndk = llndk
+        self.apex = apex
+        self.current_line = None
+
+    def parse(self):
+        """Parses the symbol file and returns a list of Version objects.
+
+        Raises:
+            ParseError: The file is malformed.
+            MultiplyDefinedSymbolError: A symbol that would be emitted is
+                defined in more than one place.
+        """
+        versions = []
+        while self.next_line() != '':
+            if '{' in self.current_line:
+                versions.append(self.parse_version())
+            else:
+                raise ParseError(
+                    'Unexpected contents at top level: ' + self.current_line)
+
+        self.check_no_duplicate_symbols(versions)
+        return versions
+
+    def check_no_duplicate_symbols(self, versions):
+        """Raises errors for multiply defined symbols.
+
+        This situation is the normal case when symbol versioning is actually
+        used, but this script doesn't currently handle that. The error message
+        will be a not necessarily obvious "error: redefinition of 'foo'" from
+        stub.c, so it's better for us to catch this situation and raise a
+        better error.
+
+        Only versions and symbols that are not omitted for the configured
+        arch/api/llndk/apex are considered.
+
+        Raises:
+            MultiplyDefinedSymbolError: At least one symbol name is repeated.
+        """
+        symbol_names = set()
+        multiply_defined_symbols = set()
+        for version in versions:
+            if should_omit_version(version, self.arch, self.api, self.llndk,
+                                   self.apex):
+                continue
+
+            for symbol in version.symbols:
+                if should_omit_symbol(symbol, self.arch, self.api, self.llndk,
+                                      self.apex):
+                    continue
+
+                if symbol.name in symbol_names:
+                    multiply_defined_symbols.add(symbol.name)
+                symbol_names.add(symbol.name)
+        if multiply_defined_symbols:
+            # Sorted so that the error message is deterministic.
+            raise MultiplyDefinedSymbolError(sorted(multiply_defined_symbols))
+
+    def parse_version(self):
+        """Parses a single version section and returns a Version object.
+
+        Expects current_line to be the line that opens the section (the one
+        containing '{'). Only symbols in global scope outside of any
+        'extern "C++"' block are recorded.
+
+        Raises:
+            ParseError: The section is malformed or the file ends before the
+                section is closed.
+        """
+        name = self.current_line.split('{')[0].strip()
+        tags = get_tags(self.current_line)
+        tags = decode_api_level_tags(tags, self.api_map)
+        symbols = []
+        global_scope = True
+        cpp_symbols = False
+        while self.next_line() != '':
+            if '}' in self.current_line:
+                # Line is something like '} BASE; # tags'. Both base and tags
+                # are optional here.
+                base = self.current_line.partition('}')[2]
+                base = base.partition('#')[0].strip()
+                if not base.endswith(';'):
+                    raise ParseError(
+                        'Unterminated version/export "C++" block (expected ;).')
+                if cpp_symbols:
+                    # This '}' closes the 'extern "C++"' block, not the
+                    # version section itself.
+                    cpp_symbols = False
+                else:
+                    base = base.rstrip(';').rstrip()
+                    if base == '':
+                        base = None
+                    return Version(name, base, tags, symbols)
+            elif 'extern "C++" {' in self.current_line:
+                cpp_symbols = True
+            elif not cpp_symbols and ':' in self.current_line:
+                visibility = self.current_line.split(':')[0].strip()
+                if visibility == 'local':
+                    global_scope = False
+                elif visibility == 'global':
+                    global_scope = True
+                else:
+                    raise ParseError('Unknown visibility label: ' + visibility)
+            elif global_scope and not cpp_symbols:
+                symbols.append(self.parse_symbol())
+            else:
+                # We're in a hidden scope or in 'extern "C++"' block. Ignore
+                # everything.
+                pass
+        raise ParseError('Unexpected EOF in version block.')
+
+    def parse_symbol(self):
+        """Parses a single symbol line and returns a Symbol object.
+
+        Raises:
+            ParseError: The line has no ';' terminator or contains a wildcard.
+        """
+        if ';' not in self.current_line:
+            raise ParseError(
+                'Expected ; to terminate symbol: ' + self.current_line)
+        if '*' in self.current_line:
+            raise ParseError(
+                'Wildcard global symbols are not permitted.')
+        # Line is now in the format "<symbol-name>; # tags". Strip on both
+        # sides so whitespace before the ';' does not end up in the name.
+        name = self.current_line.partition(';')[0].strip()
+        tags = get_tags(self.current_line)
+        tags = decode_api_level_tags(tags, self.api_map)
+        return Symbol(name, tags)
+
+    def next_line(self):
+        """Returns the next non-empty non-comment line.
+
+        The returned line is also stored in current_line.
+
+        A return value of '' indicates EOF.
+        """
+        while True:
+            line = self.input_file.readline()
+            # We want to skip empty lines, but '' indicates EOF.
+            if line == '':
+                break
+            stripped = line.strip()
+            if stripped and not stripped.startswith('#'):
+                break
+        self.current_line = line
+        return self.current_line