blob: 31cc2e1429c01d860fef760231e7485de471e9d4 [file] [log] [blame]
Patrick Rohr92d74122022-10-21 15:50:52 -07001# Copyright (C) 2022 The Android Open Source Project
2#
3# Licensed under the Apache License, Version 2.0 (the "License");
4# you may not use this file except in compliance with the License.
5# You may obtain a copy of the License at
6#
7# http://www.apache.org/licenses/LICENSE-2.0
8#
9# Unless required by applicable law or agreed to in writing, software
10# distributed under the License is distributed on an "AS IS" BASIS,
11# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
12# See the License for the specific language governing permissions and
13# limitations under the License.
14
15# A collection of utilities for extracting build rule information from GN
16# projects.
17
18from __future__ import print_function
19import collections
20import errno
21import filecmp
22import json
Patrick Rohraf92fa62022-11-04 14:27:04 -070023import logging as log
Patrick Rohr92d74122022-10-21 15:50:52 -070024import os
25import re
26import shutil
27import subprocess
28import sys
Patrick Rohr92d74122022-10-21 15:50:52 -070029
# Well-known GN labels referenced by the generators.
BUILDFLAGS_TARGET = '//gn:gen_buildflags'
GEN_VERSION_TARGET = '//src/base:version_gen_h'

# GN target types that are treated as linker units.
LINKER_UNIT_TYPES = ('executable', 'shared_library', 'static_library')

# TODO(primiano): investigate these, they require further componentization.
ODR_VIOLATION_IGNORE_TARGETS = {
    '//test/cts:perfetto_cts_deps',
    '//:perfetto_integrationtests',
}
39
40
def repo_root():
    """Return an absolute path to the repository root.

    The root is expressed as the parent directory (``os.path.pardir``) of the
    symlink-resolved directory that contains this file. The trailing ``..``
    component is left in the returned path; it is not normalized away.
    """
    script_dir = os.path.dirname(__file__)
    return os.path.join(os.path.realpath(script_dir), os.path.pardir)
45
46
def label_to_path(label):
    """Turn a GN output label (e.g., //some_dir/file.cc) into a path.

    The leading '//' is dropped. The bare root label '//' has nothing left
    after stripping and is mapped to "./".
    """
    assert label.startswith('//')
    relative = label[2:]
    if not relative:
        return "./"
    return relative
Patrick Rohr92d74122022-10-21 15:50:52 -070051
52
def label_without_toolchain(label):
    """Strip the toolchain from a GN label.

    Everything from the first '(' onwards is dropped, e.g.
    //buildtools:protobuf(//gn/standalone/toolchain:gcc_like_host) becomes
    //buildtools:protobuf. A label without a parenthesised toolchain part is
    returned unchanged.
    """
    bare_label, _, _ = label.partition('(')
    return bare_label
60
61
def label_to_target_name_with_path(label):
    """Turn a GN label into a target name involving the full path.

    e.g., //src/perfetto:tests -> src_perfetto_tests

    The leading '//' (or '//:' for root targets) is removed, then every
    character that is not an ASCII letter, digit or underscore is replaced
    with an underscore.
    """
    without_prefix = re.sub(r'^//:?', '', label)
    return re.sub(r'[^a-zA-Z0-9_]', '_', without_prefix)
70
71
Patrick Rohr92d74122022-10-21 15:50:52 -070072class GnParser(object):
73 """A parser with some cleverness for GN json desc files
74
75 The main goals of this parser are:
76 1) Deal with the fact that other build systems don't have an equivalent
77 notion to GN's source_set. Conversely to Bazel's and Soong's filegroups,
78 GN source_sets expect that dependencies, cflags and other source_set
79 properties propagate up to the linker unit (static_library, executable or
80 shared_library). This parser simulates the same behavior: when a
81 source_set is encountered, some of its variables (cflags and such) are
82 copied up to the dependent targets. This is to allow gen_xxx to create
83 one filegroup for each source_set and then squash all the other flags
84 onto the linker unit.
85 2) Detect and special-case protobuf targets, figuring out the protoc-plugin
86 being used.
87 """
88
class Target(object):
    """Represents a GN target.

    The properties marked as such in __init__ are propagated up the
    dependency chain when a source_set dependency is encountered.
    """

    class Arch(object):
        """Architecture-dependent properties of a target."""

        def __init__(self):
            self.sources = set()

    def __init__(self, name, type):
        """Create an empty target.

        Args:
          name: the GN label of the target, e.g. //src/ipc:ipc.
          type: the GN target type; must be one of VALID_TYPES below.

        Raises:
          AssertionError: if |type| is not a known target type.
        """
        self.name = name  # e.g. //src/ipc:ipc

        VALID_TYPES = ('static_library', 'shared_library', 'executable',
                       'group', 'action', 'source_set', 'proto_library',
                       'copy', 'action_foreach')
        assert (type in VALID_TYPES)
        self.type = type
        self.testonly = False
        self.toolchain = None

        # These are valid only for type == proto_library.
        # This is typically: 'proto', 'protozero', 'ipc'.
        self.proto_plugin = None
        self.proto_paths = set()
        self.proto_exports = set()
        self.proto_in_dir = ""

        self.sources = set()
        # TODO(primiano): consider whether the public section should be part
        # of bubbled-up sources.
        self.public_headers = set()  # 'public'

        # These are valid only for type == 'action'
        self.inputs = set()
        self.outputs = set()
        self.script = None
        self.args = []
        self.response_file_contents = None

        # These variables are propagated up when encountering a dependency
        # on a source_set target.
        self.cflags = set()
        self.defines = set()
        self.deps = set()
        self.libs = set()
        self.include_dirs = set()
        self.ldflags = set()
        self.source_set_deps = set()  # Transitive set of source_set deps.
        self.proto_deps = set()
        self.transitive_proto_deps = set()
        self.transitive_static_libs_deps = set()

        # Deps on //gn:xxx have this flag set to True. These dependencies
        # are special because they pull third_party code from buildtools/.
        # We don't want to keep recursing into //buildtools in generators,
        # this flag is used to stop the recursion and create an empty
        # placeholder target once we hit //gn:protoc or similar.
        self.is_third_party_dep_ = False

        # TODO: come up with a better way to only run this once.
        # is_finalized tracks whether finalize() was called on this target.
        self.is_finalized = False
        # Maps an architecture name (e.g. 'host', 'android_arm64') to the
        # Arch object holding the properties specific to that architecture.
        self.arch = dict()

    def host_supported(self):
        """Return True if the target has a 'host' architecture entry."""
        return 'host' in self.arch

    def device_supported(self):
        """Return True if any architecture name starts with 'android'."""
        return any(name.startswith('android') for name in self.arch)

    def __lt__(self, other):
        """Order targets by name; comparing with other types is an error."""
        if isinstance(other, self.__class__):
            return self.name < other.name
        raise TypeError(
            '\'<\' not supported between instances of \'%s\' and \'%s\'' %
            (type(self).__name__, type(other).__name__))

    @staticmethod
    def _json_default(value):
        """json.dumps() fallback for values it cannot serialize natively.

        Sets are emitted as sorted lists so that the output is stable; any
        other object (e.g. an Arch) is emitted as its attribute dictionary.
        vars() raises TypeError for objects without a __dict__, which is the
        error json.dumps() expects from a default hook.
        """
        if isinstance(value, (set, frozenset)):
            return sorted(value)
        return vars(value)

    def __repr__(self):
        """Return the target's attributes as pretty-printed, key-sorted JSON.

        The default hook is applied recursively by json.dumps(), so the sets
        nested inside the per-architecture Arch objects are serialized too.
        """
        return json.dumps(
            self.__dict__,
            default=self._json_default,
            indent=4,
            sort_keys=True)

    def update(self, other):
        """Merge the propagated set-valued properties of |other| into self.

        Keys that |other| does not have are skipped.
        """
        for key in ('cflags', 'defines', 'deps', 'include_dirs', 'ldflags',
                    'source_set_deps', 'proto_deps', 'transitive_proto_deps',
                    'libs', 'proto_paths'):
            self.__dict__[key].update(other.__dict__.get(key, []))

    def finalize(self):
        """Move common properties out of arch-dependent subobjects to Target.

        After the call, self.sources holds the sources shared by every
        architecture and each Arch only keeps the sources specific to it.
        Only the first call has an effect.

        NOTE(review): because of the is_finalized guard, an architecture that
        is added to self.arch after the first call is never merged.

        TODO: find a better name for this function.
        """
        if self.is_finalized:
            return
        self.is_finalized = True

        per_arch_sources = [arch.sources for arch in self.arch.values()]
        if not per_arch_sources:
            # set.intersection() needs at least one argument; with no
            # architectures there is nothing to hoist, so keep self.sources.
            return

        # Target contains the intersection of arch-dependent properties.
        # set.intersection() returns a new set, so the subtraction below
        # never aliases the set it is iterating against.
        self.sources = set.intersection(*per_arch_sources)

        # Deduplicate arch-dependent properties.
        for arch in self.arch.values():
            arch.sources -= self.sources
198
199
Patrick Rohr564d6be2022-11-15 12:57:57 -0800200 def __init__(self):
Patrick Rohr92d74122022-10-21 15:50:52 -0700201 self.all_targets = {}
202 self.linker_units = {} # Executables, shared or static libraries.
203 self.source_sets = {}
204 self.actions = {}
205 self.proto_libs = {}
Patrick Rohrb27587e2022-11-04 14:57:24 -0700206 self.java_sources = set()
Patrick Rohr92d74122022-10-21 15:50:52 -0700207
Patrick Rohr09716f52022-10-27 13:02:36 -0700208 def _get_response_file_contents(self, action_desc):
Patrick Rohrc20887d2022-10-28 12:59:20 -0700209 # response_file_contents are formatted as:
210 # ['--flags', '--flag=true && false'] and need to be formatted as:
211 # '--flags --flag=\"true && false\"'
212 flags = action_desc.get('response_file_contents', [])
213 formatted_flags = []
214 for flag in flags:
215 if '=' in flag:
216 key, val = flag.split('=')
217 formatted_flags.append('%s=\\"%s\\"' % (key, val))
218 else:
219 formatted_flags.append(flag)
220
221 return ' '.join(formatted_flags)
Patrick Rohr09716f52022-10-27 13:02:36 -0700222
Patrick Rohraf92fa62022-11-04 14:27:04 -0700223 def _is_java_target(self, target):
224 # Per https://chromium.googlesource.com/chromium/src/build/+/HEAD/android/docs/java_toolchain.md
225 # java target names must end in "_java".
226 # TODO: There are some other possible variations we might need to support.
Patrick Rohr67f53122022-11-09 10:57:40 -0800227 return target.type == 'group' and re.match('.*_java$', target.name)
Patrick Rohraf92fa62022-11-04 14:27:04 -0700228
Patrick Rohr81a4ac32022-11-15 14:38:21 -0800229 def _get_arch(self, toolchain):
Patrick Rohrd938d532022-11-15 22:17:08 -0800230 if toolchain == '//build/toolchain/android:android_clang_x86':
Patrick Rohr4eff2102022-11-15 22:21:52 -0800231 return 'android_x86'
Patrick Rohr81a4ac32022-11-15 14:38:21 -0800232 elif toolchain == '//build/toolchain/android:android_clang_x64':
Patrick Rohr4eff2102022-11-15 22:21:52 -0800233 return 'android_x86_64'
Patrick Rohr81a4ac32022-11-15 14:38:21 -0800234 elif toolchain == '//build/toolchain/android:android_clang_arm':
Patrick Rohr4eff2102022-11-15 22:21:52 -0800235 return 'android_arm'
Patrick Rohr81a4ac32022-11-15 14:38:21 -0800236 elif toolchain == '//build/toolchain/android:android_clang_arm64':
Patrick Rohr4eff2102022-11-15 22:21:52 -0800237 return 'android_arm64'
Patrick Rohr81a4ac32022-11-15 14:38:21 -0800238 else:
239 return 'host'
240
def get_target(self, gn_target_name):
    """Returns a Target object from the fully qualified GN target name.

    get_target() requires that parse_gn_desc() has already been called.
    Targets are registered without their toolchain, so any toolchain suffix
    on |gn_target_name| is ignored for the lookup.

    Raises:
      KeyError: if no target with that name has been parsed.
    """
    # Run this every time as parse_gn_desc can be called at any time.
    for known_target in self.all_targets.values():
        known_target.finalize()

    lookup_name = label_without_toolchain(gn_target_name)
    return self.all_targets[lookup_name]
Patrick Rohrd0077b72022-11-15 12:43:26 -0800251
def parse_gn_desc(self, gn_desc, gn_target_name):
    """Parses a gn desc tree and resolves all target dependencies.

    It bubbles up variables from source_set dependencies as described in the
    class-level comments.

    Args:
      gn_desc: dictionary mapping fully qualified GN labels (toolchain
        included) to their json desc.
      gn_target_name: the fully qualified label of the target to parse.

    Returns:
      The Target for |gn_target_name|. A target is shared between all the
      toolchains it is built for; if it was already parsed for this
      toolchain's architecture it is returned as is.

    Raises:
      KeyError: if |gn_target_name| is not in |gn_desc|.
    """
    # Use name without toolchain for targets to support targets built for
    # multiple archs.
    stripped_name = label_without_toolchain(gn_target_name)
    target = self.all_targets.get(stripped_name)
    desc = gn_desc[gn_target_name]
    arch = self._get_arch(desc['toolchain'])
    if target is None:
        target = GnParser.Target(stripped_name, desc['type'])
        self.all_targets[stripped_name] = target

    if arch in target.arch:
        return target  # Target already processed.
    target.arch[arch] = GnParser.Target.Arch()
    # Alias of the per-arch set; it is only ever mutated in place below.
    arch_sources = target.arch[arch].sources

    target.testonly = desc.get('testonly', False)

    proto_kind, proto_desc = self.get_proto_target_type(gn_desc,
                                                        gn_target_name)
    if proto_kind is not None:
        self.proto_libs[target.name] = target
        target.type = 'proto_library'
        target.proto_plugin = proto_kind
        target.proto_paths.update(self.get_proto_paths(proto_desc))
        target.proto_exports.update(self.get_proto_exports(proto_desc))
        target.proto_in_dir = self.get_proto_in_dir(proto_desc)
        target.deps.update(proto_desc.get('deps', []))
        arch_sources.update(proto_desc.get('sources', []))
        assert (all(src.endswith('.proto') for src in arch_sources))
    elif target.type == 'source_set':
        self.source_sets[gn_target_name] = target
        arch_sources.update(desc.get('sources', []))
    elif target.type in LINKER_UNIT_TYPES:
        self.linker_units[gn_target_name] = target
        arch_sources.update(desc.get('sources', []))
    elif target.type in ('action', 'action_foreach'):
        self.actions[gn_target_name] = target
        target.inputs.update(desc.get('inputs', []))
        arch_sources.update(desc.get('sources', []))
        # Strip the '//out/<dir>/gen/' prefix from the declared outputs.
        target.outputs.update(
            re.sub('^//out/.+?/gen/', '', out) for out in desc['outputs'])
        target.script = desc['script']
        target.args = desc['args']
        target.response_file_contents = self._get_response_file_contents(
            desc)
    elif target.type == 'copy':
        # TODO: copy rules are not currently implemented.
        self.actions[gn_target_name] = target
    elif self._is_java_target(target):
        # java_group identifies the group target generated by the
        # android_library or java_library template. A java_group must not be
        # added as a dependency, but sources are collected.
        log.debug('Found java target %s', target.name)
        target.type = 'java_group'

    # Default for 'public' is //* - all headers in 'sources' are public.
    # TODO(primiano): if a 'public' section is specified (even if empty), then
    # the rest of 'sources' is considered inaccessible by gn. Consider
    # emulating that, so that generated build files don't end up with overly
    # accessible headers.
    target.public_headers.update(
        header for header in desc.get('public', []) if header != '*')

    target.cflags.update(desc.get('cflags', []) + desc.get('cflags_cc', []))
    target.libs.update(desc.get('libs', []))
    target.ldflags.update(desc.get('ldflags', []))
    target.defines.update(desc.get('defines', []))
    target.include_dirs.update(desc.get('include_dirs', []))

    # Recurse in dependencies.
    for gn_dep_name in desc.get('deps', []):
        dep = self.parse_gn_desc(gn_desc, gn_dep_name)
        dep_name = label_without_toolchain(gn_dep_name)
        if dep.is_third_party_dep_:
            target.deps.add(dep_name)
        elif dep.type == 'proto_library':
            target.proto_deps.add(dep_name)
            target.transitive_proto_deps.add(dep_name)
            target.proto_paths.update(dep.proto_paths)
            target.transitive_proto_deps.update(dep.transitive_proto_deps)
        elif dep.type == 'source_set':
            target.source_set_deps.add(dep_name)
            target.update(dep)  # Bubble up source set's cflags/ldflags etc.
        elif dep.type == 'group':
            target.update(dep)  # Bubble up groups's cflags/ldflags etc.
        elif dep.type in ('action', 'action_foreach', 'copy'):
            # Proto targets do not record a dependency on these.
            if proto_kind is None:
                target.deps.add(dep_name)
        elif dep.type in LINKER_UNIT_TYPES:
            target.deps.add(dep_name)
        elif dep.type == 'java_group':
            # Explicitly break dependency chain when a java_group is added.
            # Java sources are collected and eventually compiled as one large
            # java_library.
            pass

        if dep.type == 'static_library':
            # Bubble up static_libs. Necessary, since soong does not
            # propagate static_libs up the build tree.
            target.transitive_static_libs_deps.add(dep_name)

        target.transitive_static_libs_deps.update(
            dep.transitive_static_libs_deps)
        target.deps.update(target.transitive_static_libs_deps)

        # Collect java sources. Java sources are kept inside the
        # __compile_java target. This target can be used for both host and
        # target compilation; only add the sources if they are destined for
        # the target (i.e. they are a dependency of the __dex target)
        # Note: this skips prebuilt java dependencies. These will have to be
        # added manually when building the jar.
        if (re.match('.*__dex$', target.name)
                and re.match('.*__compile_java$', dep.name)):
            log.debug('Adding java sources for %s', dep.name)
            self.java_sources.update(
                src for src in dep.inputs
                if os.path.splitext(src)[1] == '.java')

    return target
372
def get_proto_exports(self, proto_desc):
    """Return the 'exports' entry of the desc's metadata, or [] if absent."""
    # exports in metadata will be available for source_set targets.
    return proto_desc.get('metadata', {}).get('exports', [])
377
def get_proto_paths(self, proto_desc):
    """Return the 'import_dirs' entry of the desc's metadata, or [] if absent."""
    # import_dirs in metadata will be available for source_set targets.
    return proto_desc.get('metadata', {}).get('import_dirs', [])
382
Motomu Utsumid7e0e422022-11-08 17:49:52 +0900383
def get_proto_in_dir(self, proto_desc):
    """Return the value of the --proto-in-dir argument of a proto desc.

    A leading '../../' is stripped from the value.

    Args:
      proto_desc: the GN json desc carrying the protoc arguments.

    Returns:
      The directory passed after '--proto-in-dir', or an empty string (the
      same value Target.proto_in_dir starts with) when the desc has no args,
      does not pass the flag, or passes it as the last argument.
    """
    args = proto_desc.get('args') or []
    try:
        in_dir = args[args.index('--proto-in-dir') + 1]
    except (ValueError, IndexError):
        # ValueError: flag not present; IndexError: flag has no value.
        return ''
    return re.sub(r'^\.\./\.\./', '', in_dir)
387
def get_proto_target_type(self, gn_desc, gn_target_name):
    """Checks if the target is a proto library and returns the plugin.

    Args:
      gn_desc: dictionary mapping fully qualified GN labels to their json
        desc.
      gn_target_name: the label of the target to inspect, optionally followed
        by a parenthesised toolchain.

    Returns:
      (None, None): if the target is not a proto library, or is not present
        in |gn_desc|.
      (plugin, proto_desc) where |plugin| is 'proto' in the default (lite)
        case or 'protozero' or 'ipc' or 'descriptor' or 'source_set';
        |proto_desc| is the GN json desc of the target with the .proto
        sources (_gen target for non-descriptor types or the target itself
        for descriptor and source_set types).
    """
    name, paren, toolchain_rest = gn_target_name.partition('(')
    toolchain = paren + toolchain_rest  # '' when there is no toolchain.

    desc = gn_desc.get(gn_target_name)
    if desc is None:
        return None, None

    # Descriptor targets don't have a _gen target; instead we look for the
    # characteristic flag in the args of the target itself.
    if '--descriptor_set_out' in desc.get('args', []):
        return 'descriptor', desc

    # Source set proto targets have a proto_library_sources entry in the
    # metadata of the description.
    if 'proto_library_sources' in desc.get('metadata', {}):
        return 'source_set', desc

    # In all other cases, we want to look at the _gen target as that has the
    # important information.
    gen_desc = gn_desc.get('%s_gen%s' % (name, toolchain))
    if gen_desc is None or gen_desc.get('type') != 'action':
        return None, None
    if gen_desc.get('script') != '//tools/protoc_wrapper/protoc_wrapper.py':
        return None, None

    plugin = 'proto'
    for arg in gen_desc.get('args', []):
        if not arg.startswith('--plugin='):
            continue
        # |arg| at this point looks like:
        #  --plugin=protoc-gen-plugin=gcc_like_host/protozero_plugin
        # or
        #  --plugin=protoc-gen-plugin=protozero_plugin
        # If several --plugin arguments are given, the last one wins.
        plugin = arg.split('=')[-1].split('/')[-1].replace('_plugin', '')
    return plugin, gen_desc