blob: e883c6bed755b979349a97969a7bb8a29dc7531c [file] [log] [blame]
#!/usr/bin/env python
#
# Copyright (C) 2018 The Android Open Source Project
#
# Licensed under the Apache License, Version 2.0 (the "License");
# you may not use this file except in compliance with the License.
# You may obtain a copy of the License at
#
#      http://www.apache.org/licenses/LICENSE-2.0
#
# Unless required by applicable law or agreed to in writing, software
# distributed under the License is distributed on an "AS IS" BASIS,
# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
# See the License for the specific language governing permissions and
# limitations under the License.
"""
Generate API lists for non-SDK API enforcement.
"""
19import argparse
David Brazdil17d16e82018-12-13 17:00:09 +000020from collections import defaultdict
David Brazdil8503b902018-08-30 13:35:03 +010021import os
22import sys
23import re
Andrei Oneaa6e09b42019-03-29 15:27:55 +000024import functools
David Brazdil8503b902018-08-30 13:35:03 +010025
# Flag names understood by the `hiddenapi` tool.
FLAG_WHITELIST = "whitelist"
FLAG_GREYLIST = "greylist"
FLAG_BLACKLIST = "blacklist"
FLAG_GREYLIST_MAX_O = "greylist-max-o"
FLAG_GREYLIST_MAX_P = "greylist-max-p"
FLAG_GREYLIST_MAX_Q = "greylist-max-q"
FLAG_CORE_PLATFORM_API = "core-platform-api"
FLAG_PUBLIC_API = "public-api"
FLAG_SYSTEM_API = "system-api"
FLAG_TEST_API = "test-api"

# Flags which name an API list.
FLAGS_API_LIST = [
    FLAG_WHITELIST,
    FLAG_GREYLIST,
    FLAG_BLACKLIST,
    FLAG_GREYLIST_MAX_O,
    FLAG_GREYLIST_MAX_P,
    FLAG_GREYLIST_MAX_Q,
]

# Every known flag: the API list flags followed by the remaining flags.
ALL_FLAGS = list(FLAGS_API_LIST)
ALL_FLAGS.extend([
    FLAG_CORE_PLATFORM_API,
    FLAG_PUBLIC_API,
    FLAG_SYSTEM_API,
    FLAG_TEST_API,
])

# Set views of the two lists above, used for membership/subset checks.
FLAGS_API_LIST_SET = set(FLAGS_API_LIST)
ALL_FLAGS_SET = set(ALL_FLAGS)
David Brazdil89bf0f22018-10-30 18:21:24 +000056
# Command line suffix meaning that the given flag should be assigned only to
# entries which are known and have not been assigned a flag yet.
# For example, the P dark greylist is checked in as it was in P, but
# signatures have changed since then. With this suffix the script skips
# any entries which no longer exist.
FLAG_IGNORE_CONFLICTS_SUFFIX = "-ignore-conflicts"

# Command line suffix meaning that all APIs within a given set of packages
# should be assigned the given flag.
FLAG_PACKAGES_SUFFIX = "-packages"
67
# Regular expressions for the fields/methods used in serialization. These
# members are considered public API despite being hidden.
SERIALIZATION_PATTERNS = [
    r'readObject\(Ljava/io/ObjectInputStream;\)V',
    r'readObjectNoData\(\)V',
    r'readResolve\(\)Ljava/lang/Object;',
    r'serialVersionUID:J',
    r'serialPersistentFields:\[Ljava/io/ObjectStreamField;',
    r'writeObject\(Ljava/io/ObjectOutputStream;\)V',
    r'writeReplace\(\)Ljava/lang/Object;',
]

# One compiled expression which accepts a signature when the text after its
# "->" is exactly one of SERIALIZATION_PATTERNS.
SERIALIZATION_REGEX = re.compile(
    r'.*->({})$'.format('|'.join(SERIALIZATION_PATTERNS)))


# Predicates to be used with filter_apis. Each takes (api, flags).
def HAS_NO_API_LIST_ASSIGNED(api, flags):
    """Returns True if `flags` contains none of the FLAGS_API_LIST flags."""
    return not FLAGS_API_LIST_SET.intersection(flags)


def IS_SERIALIZATION(api, flags):
    """Returns a match object if `api` is a serialization member, else None."""
    return SERIALIZATION_REGEX.match(api)
87
def get_args():
    """Builds the argument parser and parses the command line.

    Besides `--output` (required) and `--csv`, three options are registered
    for every flag in ALL_FLAGS: `--<flag>`, `--<flag>-ignore-conflicts` and
    `--<flag>-packages`. Each of them accepts zero or more file paths and
    defaults to an empty list.

    Returns:
        Namespace: the parsed arguments.
    """
    parser = argparse.ArgumentParser()
    parser.add_argument('--output', required=True)
    parser.add_argument('--csv', nargs='*', default=[], metavar='CSV_FILE',
                        help='CSV files to be merged into output')

    for flag in ALL_FLAGS:
        # (option name, help text) for each per-flag option, in the order
        # in which they are registered.
        per_flag_options = [
            (flag,
             'lists of entries with flag "{}"'.format(flag)),
            (flag + FLAG_IGNORE_CONFLICTS_SUFFIX,
             'lists of entries with flag "{}". '
             'skip entry if missing or flag conflict.'.format(flag)),
            (flag + FLAG_PACKAGES_SUFFIX,
             'lists of packages to be added to {} list'.format(flag)),
        ]
        for option, help_text in per_flag_options:
            parser.add_argument('--' + option, dest=option, nargs='*',
                                default=[], metavar='TXT_FILE',
                                help=help_text)

    return parser.parse_args()
113
def read_lines(filename):
    """Reads a file and returns its distinct lines.

    Lines which begin with a hash are ignored. Surrounding whitespace
    (including the line terminator) is stripped from every remaining line.

    Args:
        filename (string): Path to the file to read from.

    Returns:
        Set of the stripped lines of the file.
    """
    with open(filename, 'r') as source_file:
        # The '#' test is applied to the raw line, before stripping.
        return {
            raw_line.strip()
            for raw_line in source_file
            if not raw_line.startswith('#')
        }
David Brazdil8503b902018-08-30 13:35:03 +0100130
def write_lines(filename, lines):
    """Writes lines into a file, overwriting the file if it exists.

    A newline character is appended to every line.

    Args:
        filename (string): Path to the file to be written into.
        lines (list): List of strings to write into the file.
    """
    with open(filename, 'w') as target_file:
        target_file.writelines(text + '\n' for text in lines)
141
def extract_package(signature):
    """Extracts the package from a signature.

    Args:
        signature (string): JNI signature of a method or field, e.g.
            `Landroid/app/Activity;->onCreate(Landroid/os/Bundle;)V`.

    Returns:
        The dot-separated package name of the class containing the
        field/method. An empty string is returned when the class name
        contains no '/', i.e. the class is not inside any package.
    """
    full_class_name = signature.split(";->")[0]
    # Drop the first character (the 'L' of a JNI class descriptor) and keep
    # everything before the last '/'. rpartition() yields '' when there is no
    # '/', whereas rindex() would raise ValueError for such classes.
    package_path = full_class_name[1:].rpartition("/")[0]
    return package_path.replace('/', '.')
154
class FlagsDict:
    """Maps API signatures to the set of flags assigned to them.

    `_dict_keyset` holds every known API signature and `_dict` maps a
    signature to its set of flags. Signatures become known through
    parse_and_merge_csv(); assign_flag() rejects signatures which are
    not known.
    """

    def __init__(self):
        self._dict_keyset = set()
        self._dict = defaultdict(set)

    def _check_entries_set(self, keys_subset, source):
        """Verifies that all given keys are known API signatures.

        Args:
            keys_subset (set): API signatures to check.
            source (string): Origin of the keys. Printed in the error message.

        Throws:
            AssertionError if `keys_subset` is not a set or contains a
            signature which is not in the dictionary.
        """
        # Raised explicitly rather than via `assert` so that the validation
        # is not stripped when Python runs with -O.
        if not isinstance(keys_subset, set):
            raise AssertionError(
                "Expected a set of entries, got {}".format(
                    type(keys_subset).__name__))
        unknown = keys_subset - self._dict_keyset
        if unknown:
            raise AssertionError((
                "Error processing: {}\n"
                "The following entries were unexpected:\n"
                "{}"
                "Please visit go/hiddenapi for more information.").format(
                    source,
                    # One entry per line, each terminated by a newline so the
                    # closing sentence starts on a line of its own.
                    "".join("  " + str(x) + "\n" for x in sorted(unknown))))

    def _check_flags_set(self, flags_subset, source):
        """Verifies that all given flags are members of ALL_FLAGS.

        Args:
            flags_subset (set): Flags to check.
            source (string): Origin of the flags. Printed in the error message.

        Throws:
            AssertionError if `flags_subset` is not a set or contains a flag
            which is not recognized.
        """
        if not isinstance(flags_subset, set):
            raise AssertionError(
                "Expected a set of flags, got {}".format(
                    type(flags_subset).__name__))
        unknown = flags_subset - ALL_FLAGS_SET
        if unknown:
            raise AssertionError((
                "Error processing: {}\n"
                "The following flags were not recognized: \n"
                "{}\n"
                "Please visit go/hiddenapi for more information.").format(
                    source, "\n".join(sorted(unknown))))

    def filter_apis(self, filter_fn):
        """Returns APIs which match a given predicate.

        This is a helper function which allows to filter on both signatures
        (keys) and flags (values). The built-in filter() invokes the lambda
        only with dict's keys.

        Args:
            filter_fn : Function which takes two arguments (signature/flags)
                and returns a value interpreted as a boolean.

        Returns:
            A set of APIs which match the predicate.
        """
        return {
            api for api in self._dict_keyset
            if filter_fn(api, self._dict[api])
        }

    def get_valid_subset_of_unassigned_apis(self, api_subset):
        """Sanitizes a key set input to only include keys which exist in the
        dictionary and have not been assigned any API list flags.

        Args:
            api_subset (set): Key set to be sanitized.

        Returns:
            Sanitized key set.

        Throws:
            AssertionError if `api_subset` is not a set.
        """
        if not isinstance(api_subset, set):
            raise AssertionError(
                "Expected a set of APIs, got {}".format(
                    type(api_subset).__name__))
        return api_subset.intersection(
            self.filter_apis(HAS_NO_API_LIST_ASSIGNED))

    def generate_csv(self):
        """Constructs CSV entries from a dictionary.

        Returns:
            Sorted list of lines comprising a CSV file. The flags within each
            line are sorted as well. See "parse_and_merge_csv" for format
            description.
        """
        return sorted(
            ",".join([api] + sorted(self._dict[api])) for api in self._dict)

    def parse_and_merge_csv(self, csv_lines, source="<unknown>"):
        """Parses CSV entries and merges them into a given dictionary.

        The expected CSV format is:
            <api signature>,<flag1>,<flag2>,...,<flagN>

        Entries flagged public-api or system-api additionally receive the
        whitelist flag; otherwise entries flagged test-api additionally
        receive the greylist flag.

        Args:
            csv_lines (iterable of strings): Lines read from a CSV file.
            source (string): Origin of `csv_lines`. Will be printed in error
                messages.

        Throws:
            AssertionError if parsed flags are invalid.
        """
        # Split CSV lines into arrays of values.
        rows = [line.split(',') for line in csv_lines]

        # Update the full set of API signatures.
        self._dict_keyset.update(row[0] for row in rows)

        # Check that all flags are known. Collected in a single pass instead
        # of rebuilding a set for every row.
        csv_flags = {flag for row in rows for flag in row[1:]}
        self._check_flags_set(csv_flags, source)

        # Iterate over all CSV rows, find entry in dict and add flags to it.
        for row in rows:
            flags = row[1:]
            if FLAG_PUBLIC_API in flags or FLAG_SYSTEM_API in flags:
                flags.append(FLAG_WHITELIST)
            elif FLAG_TEST_API in flags:
                flags.append(FLAG_GREYLIST)
            self._dict[row[0]].update(flags)

    def assign_flag(self, flag, apis, source="<unknown>"):
        """Assigns a flag to given subset of entries.

        Args:
            flag (string): One of ALL_FLAGS.
            apis (set): Subset of APIs to receive the flag.
            source (string): Origin of `apis`. Will be printed in error
                messages.

        Throws:
            AssertionError if the API signatures or the flag are invalid.
        """
        # Check that all APIs exist in the dict.
        self._check_entries_set(apis, source)

        # Check that the flag is known.
        self._check_flags_set(set([flag]), source)

        # Iterate over the API subset, find each entry in dict and assign
        # the flag to it.
        for api in apis:
            self._dict[api].add(flag)
David Brazdil4a55eeb2018-09-11 11:09:01 +0100268
def main(argv):
    """Merges all inputs into one flags dictionary and writes it out as CSV.

    The command line is parsed by get_args(); `argv` is accepted but not
    read by this function.

    Args:
        argv (list): Command line arguments (unused).
    """
    # Parse arguments.
    args = vars(get_args())

    # Initialize API->flags dictionary.
    flags = FlagsDict()

    # CSV files go first: CSV files produced by parsing API stubs contain the
    # full set of APIs, so the text files merged afterwards can be checked
    # for invalid entries and/or used to filter all as-yet unassigned
    # entries.
    for csv_path in args["csv"]:
        flags.parse_and_merge_csv(read_lines(csv_path), csv_path)

    # The next two steps do not require any particular order.
    # (1) Serialization API goes to the whitelist.
    serialization_apis = flags.filter_apis(IS_SERIALIZATION)
    flags.assign_flag(FLAG_WHITELIST, serialization_apis)

    # (2) Text files with a known flag are merged into the dictionary.
    for flag in ALL_FLAGS:
        for txt_path in args[flag]:
            flags.assign_flag(flag, read_lines(txt_path), txt_path)

    # Text files where conflicts should be ignored. The flag is assigned
    # only if:
    #   (a) the entry exists, and
    #   (b) it has not been assigned any other flag.
    # Because of (b), this must run after all strict assignments.
    for flag in ALL_FLAGS:
        for txt_path in args[flag + FLAG_IGNORE_CONFLICTS_SUFFIX]:
            unassigned = flags.get_valid_subset_of_unassigned_apis(
                read_lines(txt_path))
            flags.assign_flag(flag, unassigned, txt_path)

    # Members of the listed packages which have no flags yet receive the
    # flag the package list was given for.
    for flag in ALL_FLAGS:
        for txt_path in args[flag + FLAG_PACKAGES_SUFFIX]:
            listed_packages = set(read_lines(txt_path))

            def in_listed_package_without_flags(signature, assigned):
                return (extract_package(signature) in listed_packages
                        and not assigned)

            package_members = flags.filter_apis(
                in_listed_package_without_flags)
            flags.assign_flag(flag, package_members)

    # Everything still without an API list flag goes to the blacklist.
    remaining = flags.filter_apis(HAS_NO_API_LIST_ASSIGNED)
    flags.assign_flag(FLAG_BLACKLIST, remaining)

    # Write output.
    write_lines(args["output"], flags.generate_csv())


if __name__ == "__main__":
    main(sys.argv)