-
Notifications
You must be signed in to change notification settings - Fork 3.3k
/
Copy pathsystem_libs.py
2029 lines (1653 loc) · 64.5 KB
/
system_libs.py
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
129
130
131
132
133
134
135
136
137
138
139
140
141
142
143
144
145
146
147
148
149
150
151
152
153
154
155
156
157
158
159
160
161
162
163
164
165
166
167
168
169
170
171
172
173
174
175
176
177
178
179
180
181
182
183
184
185
186
187
188
189
190
191
192
193
194
195
196
197
198
199
200
201
202
203
204
205
206
207
208
209
210
211
212
213
214
215
216
217
218
219
220
221
222
223
224
225
226
227
228
229
230
231
232
233
234
235
236
237
238
239
240
241
242
243
244
245
246
247
248
249
250
251
252
253
254
255
256
257
258
259
260
261
262
263
264
265
266
267
268
269
270
271
272
273
274
275
276
277
278
279
280
281
282
283
284
285
286
287
288
289
290
291
292
293
294
295
296
297
298
299
300
301
302
303
304
305
306
307
308
309
310
311
312
313
314
315
316
317
318
319
320
321
322
323
324
325
326
327
328
329
330
331
332
333
334
335
336
337
338
339
340
341
342
343
344
345
346
347
348
349
350
351
352
353
354
355
356
357
358
359
360
361
362
363
364
365
366
367
368
369
370
371
372
373
374
375
376
377
378
379
380
381
382
383
384
385
386
387
388
389
390
391
392
393
394
395
396
397
398
399
400
401
402
403
404
405
406
407
408
409
410
411
412
413
414
415
416
417
418
419
420
421
422
423
424
425
426
427
428
429
430
431
432
433
434
435
436
437
438
439
440
441
442
443
444
445
446
447
448
449
450
451
452
453
454
455
456
457
458
459
460
461
462
463
464
465
466
467
468
469
470
471
472
473
474
475
476
477
478
479
480
481
482
483
484
485
486
487
488
489
490
491
492
493
494
495
496
497
498
499
500
501
502
503
504
505
506
507
508
509
510
511
512
513
514
515
516
517
518
519
520
521
522
523
524
525
526
527
528
529
530
531
532
533
534
535
536
537
538
539
540
541
542
543
544
545
546
547
548
549
550
551
552
553
554
555
556
557
558
559
560
561
562
563
564
565
566
567
568
569
570
571
572
573
574
575
576
577
578
579
580
581
582
583
584
585
586
587
588
589
590
591
592
593
594
595
596
597
598
599
600
601
602
603
604
605
606
607
608
609
610
611
612
613
614
615
616
617
618
619
620
621
622
623
624
625
626
627
628
629
630
631
632
633
634
635
636
637
638
639
640
641
642
643
644
645
646
647
648
649
650
651
652
653
654
655
656
657
658
659
660
661
662
663
664
665
666
667
668
669
670
671
672
673
674
675
676
677
678
679
680
681
682
683
684
685
686
687
688
689
690
691
692
693
694
695
696
697
698
699
700
701
702
703
704
705
706
707
708
709
710
711
712
713
714
715
716
717
718
719
720
721
722
723
724
725
726
727
728
729
730
731
732
733
734
735
736
737
738
739
740
741
742
743
744
745
746
747
748
749
750
751
752
753
754
755
756
757
758
759
760
761
762
763
764
765
766
767
768
769
770
771
772
773
774
775
776
777
778
779
780
781
782
783
784
785
786
787
788
789
790
791
792
793
794
795
796
797
798
799
800
801
802
803
804
805
806
807
808
809
810
811
812
813
814
815
816
817
818
819
820
821
822
823
824
825
826
827
828
829
830
831
832
833
834
835
836
837
838
839
840
841
842
843
844
845
846
847
848
849
850
851
852
853
854
855
856
857
858
859
860
861
862
863
864
865
866
867
868
869
870
871
872
873
874
875
876
877
878
879
880
881
882
883
884
885
886
887
888
889
890
891
892
893
894
895
896
897
898
899
900
901
902
903
904
905
906
907
908
909
910
911
912
913
914
915
916
917
918
919
920
921
922
923
924
925
926
927
928
929
930
931
932
933
934
935
936
937
938
939
940
941
942
943
944
945
946
947
948
949
950
951
952
953
954
955
956
957
958
959
960
961
962
963
964
965
966
967
968
969
970
971
972
973
974
975
976
977
978
979
980
981
982
983
984
985
986
987
988
989
990
991
992
993
994
995
996
997
998
999
1000
# Copyright 2014 The Emscripten Authors. All rights reserved.
# Emscripten is available under two separate licenses, the MIT license and the
# University of Illinois/NCSA Open Source License. Both these licenses can be
# found in the LICENSE file.
from .toolchain_profiler import ToolchainProfiler
import itertools
import logging
import os
import shutil
import textwrap
from enum import IntEnum, auto
from glob import iglob
from . import shared, building, utils
from . import deps_info, tempfiles
from . import diagnostics
from tools.shared import demangle_c_symbol_name
from tools.settings import settings
logger = logging.getLogger('system_libs')
# Files that are part of libsockets.a and so should be excluded from libc.a
LIBC_SOCKETS = ['socket.c', 'socketpair.c', 'shutdown.c', 'bind.c', 'connect.c',
'listen.c', 'accept.c', 'getsockname.c', 'getpeername.c', 'send.c',
'recv.c', 'sendto.c', 'recvfrom.c', 'sendmsg.c', 'recvmsg.c',
'getsockopt.c', 'setsockopt.c', 'freeaddrinfo.c',
'in6addr_any.c', 'in6addr_loopback.c', 'accept4.c']
def files_in_path(path, filenames):
srcdir = utils.path_from_root(path)
return [os.path.join(srcdir, f) for f in filenames]
def glob_in_path(path, glob_pattern, excludes=()):
srcdir = utils.path_from_root(path)
files = iglob(os.path.join(srcdir, glob_pattern), recursive=True)
return sorted(f for f in files if os.path.basename(f) not in excludes)
def get_base_cflags(force_object_files=False):
# Always build system libraries with debug information. Non-debug builds
# will ignore this at link time because we link with `-strip-debug`.
flags = ['-g']
if settings.LTO and not force_object_files:
flags += ['-flto=' + settings.LTO]
if settings.RELOCATABLE:
flags += ['-sRELOCATABLE']
if settings.MEMORY64:
flags += ['-sMEMORY64=' + str(settings.MEMORY64)]
return flags
def clean_env():
# building system libraries and ports should be hermetic in that it is not
# affected by things like EMCC_CFLAGS which the user may have set.
# At least one port also uses autoconf (harfbuzz) so we also need to clear
# CFLAGS/LDFLAGS which we don't want to effect the inner call to configure.
safe_env = os.environ.copy()
for opt in ['CFLAGS', 'CXXFLAGS', 'LDFLAGS',
'EMCC_CFLAGS',
'EMCC_FORCE_STDLIBS',
'EMCC_ONLY_FORCED_STDLIBS',
'EMMAKEN_JUST_CONFIGURE']:
if opt in safe_env:
del safe_env[opt]
return safe_env
def run_build_commands(commands):
# Before running a set of build commands make sure the common sysroot
# headers are installed. This prevents each sub-process from attempting
# to setup the sysroot itself.
ensure_sysroot()
shared.run_multiple_processes(commands, env=clean_env())
def create_lib(libname, inputs):
"""Create a library from a set of input objects."""
suffix = shared.suffix(libname)
inputs = sorted(inputs, key=lambda x: os.path.basename(x))
if suffix in ('.bc', '.o'):
if len(inputs) == 1:
if inputs[0] != libname:
shutil.copyfile(inputs[0], libname)
else:
building.link_to_object(inputs, libname)
else:
assert suffix == '.a'
building.emar('cr', libname, inputs)
def is_case_insensitive(path):
"""Returns True if the filesystem at `path` is case insensitive."""
utils.write_file(os.path.join(path, 'test_file'), '')
case_insensitive = os.path.exists(os.path.join(path, 'TEST_FILE'))
os.remove(os.path.join(path, 'test_file'))
return case_insensitive
class Library:
"""
`Library` is the base class of all system libraries.
There are two types of libraries: abstract and concrete.
* An abstract library, e.g. MTLibrary, is a subclass of `Library` that
implements certain behaviour common to multiple libraries. The features
of multiple abstract libraries can be used through multiple inheritance.
* A concrete library, e.g. libc, is a subclass of `Library` that describes
how to build a particular library, and its properties, such as name and
dependencies.
This library system is meant to handle having many versions of the same library,
which we call *variations*. For example, some libraries (those that inherit
from MTLibrary), have both single-threaded and multi-threaded versions.
An instance of a `Library` subclass represents a specific variation of the
library. Instance methods perform operations relating to this variation.
For example, `get_cflags()` would return the emcc flags needed to build this
variation, and `build()` would generate the library file for this variation.
The constructor takes keyword arguments that defines the variation.
Class methods perform tasks relating to all variations. For example,
`variations()` returns a list of all variations that exists for this library,
and `get_default_variation()` returns the variation suitable for the current
environment.
Other class methods act upon a group of libraries. For example,
`Library.get_all_variations()` returns a mapping of all variations of
existing libraries.
To add a new type of variation, you must add an parameter to `__init__` that
selects the variant. Then, override one of `vary_on` or `variations`, as well
as `get_default_variation`.
If the parameter is boolean, overriding `vary_on` to add the parameter name
to the returned list is sufficient:
@classmethod
def vary_on(cls):
return super().vary_on() + ['my_parameter']
Otherwise, you must override `variations`:
@classmethod
def variations(cls):
return [{'my_parameter': value, **other} for value, other in
itertools.product([1, 2, 3], super().variations())]
Overriding either `vary_on` or `variations` allows `embuilder.py` to know all
possible variations so it can build all of them.
You then need to modify `get_default_variation` to detect the correct value
for your new parameter based on the settings:
@classmethod
def get_default_variation(cls, **kwargs):
return super().get_default_variation(my_parameter=settings.MY_PARAMETER, **kwargs)
This allows the correct variation of the library to be selected when building
code with Emscripten.
"""
# The simple name of the library. When linking, this is the name to use to
# automatically get the correct version of the library.
# This should only be overridden in a concrete library class, e.g. libc,
# and left as None in an abstract library class, e.g. MTLibrary.
name = None
# Set to true to prevent EMCC_FORCE_STDLIBS from linking this library.
never_force = False
# A list of flags to pass to emcc.
# The flags for the parent class is automatically inherited.
# TODO: Investigate whether perf gains from loop unrolling would be worth the
# extra code size. The -fno-unroll-loops flags was added here when loop
# unrolling landed upstream in LLVM to avoid changing behavior but was not
# specifically evaluated.
cflags = ['-O2', '-Werror', '-fno-unroll-loops']
# A list of directories to put in the include path when building.
# This is a list of tuples of path components.
# For example, to put system/lib/a and system/lib/b under the emscripten
# directory into the include path, you would write:
# includes = [('system', 'lib', 'a'), ('system', 'lib', 'b')]
# The include path of the parent class is automatically inherited.
includes = []
# By default, `get_files` look for source files for this library under `src_dir`.
# It will either use the files listed in `src_files`, or use the glob pattern in
# `src_glob`. You may not specify both `src_files` and `src_glob`.
# When using `src_glob`, you can specify a list of files in `src_glob_exclude`
# to be excluded from the library.
# Alternatively, you can override `get_files` to use your own logic.
src_dir = None
src_files = None
src_glob = None
src_glob_exclude = None
# Whether to always generate WASM object files, even when LTO is set
force_object_files = False
def __init__(self):
"""
Creates a variation of this library.
A variation is a specific combination of settings a library can have.
For example, libc++-mt-noexcept is a variation of libc++.
There might be only one variation of a library.
The constructor keyword arguments will define what variation to use.
Use the `variations` classmethod to get the list of all possible constructor
arguments for this library.
Use the `get_default_variation` classmethod to construct the variation
suitable for the current invocation of emscripten.
"""
if not self.name:
raise NotImplementedError('Cannot instantiate an abstract library')
def can_use(self):
"""
Whether this library can be used in the current environment.
For example, libmalloc would override this and return False
if the user requested no malloc.
"""
return True
def can_build(self):
"""
Whether this library can be built in the current environment.
Override this if, for example, the library can only be built on WASM backend.
"""
return True
def erase(self):
shared.Cache.erase_file(shared.Cache.get_lib_name(self.get_filename()))
def get_path(self):
"""
Gets the cached path of this library.
This will trigger a build if this library is not in the cache.
"""
return shared.Cache.get_lib(self.get_filename(), self.build)
def get_link_flag(self):
"""
Gets the link flags needed to use the library.
This will trigger a build if this library is not in the cache.
"""
fullpath = self.get_path()
# For non-libaries (e.g. crt1.o) we pass the entire path to the linker
if self.get_ext() != '.a':
return fullpath
# For libraries (.a) files, we pass the abbreviated `-l` form.
base = shared.unsuffixed_basename(fullpath)
return '-l' + shared.strip_prefix(base, 'lib')
def get_files(self):
"""
Gets a list of source files for this library.
Typically, you will use `src_dir`, `src_files`, `src_glob` and `src_glob_exclude`.
If those are insufficient to describe the files needed, you can override this method.
"""
if self.src_dir:
if self.src_files and self.src_glob:
raise Exception('Cannot use src_files and src_glob together')
if self.src_files:
return files_in_path(self.src_dir, self.src_files)
elif self.src_glob:
return glob_in_path(self.src_dir, self.src_glob, self.src_glob_exclude or ())
raise NotImplementedError()
def build_objects(self, build_dir):
"""
Returns a list of compiled object files for this library.
By default, this builds all the source files returned by `self.get_files()`,
with the `cflags` returned by `self.get_cflags()`.
"""
commands = []
objects = []
cflags = self.get_cflags()
case_insensitive = is_case_insensitive(build_dir)
for src in self.get_files():
object_basename = shared.unsuffixed_basename(src)
# Resolve duplicates by appending unique.
# This is needed on case insensitve filesystem to handle,
# for example, _exit.o and _Exit.o.
if case_insensitive:
object_basename = object_basename.lower()
o = os.path.join(build_dir, object_basename + '.o')
object_uuid = 0
# Find a unique basename
while o in objects:
object_uuid += 1
o = os.path.join(build_dir, f'{object_basename}__{object_uuid}.o')
ext = shared.suffix(src)
if ext in ('.s', '.S', '.c'):
cmd = [shared.EMCC]
else:
cmd = [shared.EMXX]
cmd += cflags
if ext in ('.s', '.S'):
# TODO(sbc) There is an llvm bug that causes a crash when `-g` is used with
# assembly files that define wasm globals.
cmd = [arg for arg in cmd if arg != '-g']
cmd = self.customize_build_cmd(cmd, src)
commands.append(cmd + ['-c', src, '-o', o])
objects.append(o)
run_build_commands(commands)
return objects
def customize_build_cmd(self, cmd, filename): # noqa
"""Allows libraries to customize the build command used on per-file basis.
For example, libc uses this to replace -Oz with -O2 for some subset of files."""
return cmd
def build(self, out_filename):
"""Builds the library and returns the path to the file."""
build_dir = shared.Cache.get_path(os.path.join('build', self.get_base_name()))
utils.safe_ensure_dirs(build_dir)
create_lib(out_filename, self.build_objects(build_dir))
if not shared.DEBUG:
tempfiles.try_delete(build_dir)
@classmethod
def _inherit_list(cls, attr):
# Some properties, like cflags and includes, makes more sense to inherit
# via concatenation than replacement.
result = []
for item in cls.__mro__[::-1]:
# Using __dict__ to avoid inheritance
result += item.__dict__.get(attr, [])
return result
def get_cflags(self):
"""
Returns the list of flags to pass to emcc when building this variation
of the library.
Override and add any flags as needed to handle new variations.
"""
cflags = self._inherit_list('cflags')
cflags += get_base_cflags(force_object_files=self.force_object_files)
if self.includes:
cflags += ['-I' + utils.path_from_root(i) for i in self._inherit_list('includes')]
return cflags
def get_base_name_prefix(self):
"""
Returns the base name of the library without any suffixes.
"""
return self.name
def get_base_name(self):
"""
Returns the base name of the library file.
This will include suffixes such as -mt, but will not include a file extension.
"""
return self.get_base_name_prefix()
def get_ext(self):
"""
Return the appropriate file extension for this library.
"""
return '.a'
def get_filename(self):
"""
Return the full name of the library file, including the file extension.
"""
return self.get_base_name() + self.get_ext()
@classmethod
def vary_on(cls):
"""
Returns a list of strings that are the names of boolean constructor
arguments that defines the variations of this library.
This is used by the default implementation of `cls.variations()` to generate
every possible combination of boolean values to pass to these arguments.
"""
return []
@classmethod
def variations(cls):
"""
Returns a list of keyword arguments to pass to the constructor to create
every possible variation of this library.
By default, this is every possible combination of boolean values to pass
to the list of arguments returned by `vary_on`, but you can override
the behaviour.
"""
vary_on = cls.vary_on()
return [dict(zip(vary_on, toggles)) for toggles in
itertools.product([False, True], repeat=len(vary_on))]
@classmethod
def get_default_variation(cls, **kwargs):
"""
Construct the variation suitable for the current invocation of emscripten.
Subclasses should pass the keyword arguments they introduce to the
superclass version, and propagate **kwargs. The base class collects
all the keyword arguments and creates the instance.
"""
return cls(**kwargs)
@classmethod
def get_inheritance_tree(cls):
"""Returns all the classes in the inheritance tree of the current class."""
yield cls
for subclass in cls.__subclasses__():
for subclass in subclass.get_inheritance_tree():
yield subclass
@classmethod
def get_all_variations(cls):
"""
Gets all the variations of libraries in the inheritance tree of the current
library.
Calling Library.get_all_variations() returns the variations of ALL libraries
that can be built as a dictionary of variation names to Library objects.
"""
result = {}
for library in cls.get_inheritance_tree():
if library.name:
for flags in library.variations():
variation = library(**flags)
if variation.can_build():
result[variation.get_base_name()] = variation
return result
@classmethod
def get_usable_variations(cls):
"""
Gets all libraries suitable for the current invocation of emscripten.
This returns a dictionary of simple names to Library objects.
"""
if not hasattr(cls, 'useable_variations'):
cls.useable_variations = {}
for subclass in cls.get_inheritance_tree():
if subclass.name:
library = subclass.get_default_variation()
if library.can_build() and library.can_use():
cls.useable_variations[subclass.name] = library
return cls.useable_variations
class MTLibrary(Library):
def __init__(self, **kwargs):
self.is_mt = kwargs.pop('is_mt')
self.is_ww = kwargs.pop('is_ww') and not self.is_mt
super().__init__(**kwargs)
def get_cflags(self):
cflags = super().get_cflags()
if self.is_mt:
cflags += ['-sUSE_PTHREADS', '-sWASM_WORKERS']
if self.is_ww:
cflags += ['-sWASM_WORKERS']
return cflags
def get_base_name(self):
name = super().get_base_name()
if self.is_mt:
name += '-mt'
if self.is_ww:
name += '-ww'
return name
@classmethod
def vary_on(cls):
return super().vary_on() + ['is_mt', 'is_ww']
@classmethod
def get_default_variation(cls, **kwargs):
return super().get_default_variation(is_mt=settings.USE_PTHREADS, is_ww=settings.WASM_WORKERS and not settings.USE_PTHREADS, **kwargs)
@classmethod
def variations(cls):
combos = super(MTLibrary, cls).variations()
# To save on # of variations, pthreads and Wasm workers when used together, just use pthreads variation.
return [combo for combo in combos if not combo['is_mt'] or not combo['is_ww']]
class DebugLibrary(Library):
def __init__(self, **kwargs):
self.is_debug = kwargs.pop('is_debug')
super().__init__(**kwargs)
def get_cflags(self):
cflags = super().get_cflags()
if not self.is_debug:
cflags += ['-DNDEBUG']
return cflags
def get_base_name(self):
name = super().get_base_name()
if self.is_debug:
name += '-debug'
return name
@classmethod
def vary_on(cls):
return super().vary_on() + ['is_debug']
@classmethod
def get_default_variation(cls, **kwargs):
return super().get_default_variation(is_debug=settings.ASSERTIONS, **kwargs)
class Exceptions(IntEnum):
"""
This represents exception handling mode of Emscripten. Currently there are
three modes of exception handling:
- None: Does not handle exceptions. This includes -fno-exceptions, which
prevents both throwing and catching, and -fignore-exceptions, which only
allows throwing, but library-wise they use the same version.
- Emscripten: Emscripten provides exception handling capability using JS
emulation. This causes code size increase and performance degradation.
- Wasm: Wasm native exception handling support uses Wasm EH instructions and
is meant to be fast. You need to use a VM that has the EH support to use
this. This is not fully working yet and still experimental.
"""
NONE = auto()
EMSCRIPTEN = auto()
WASM = auto()
class NoExceptLibrary(Library):
def __init__(self, **kwargs):
self.eh_mode = kwargs.pop('eh_mode')
super().__init__(**kwargs)
def get_cflags(self):
cflags = super().get_cflags()
if self.eh_mode == Exceptions.NONE:
cflags += ['-fno-exceptions']
elif self.eh_mode == Exceptions.EMSCRIPTEN:
cflags += ['-sDISABLE_EXCEPTION_CATCHING=0']
elif self.eh_mode == Exceptions.WASM:
cflags += ['-fwasm-exceptions']
return cflags
def get_base_name(self):
name = super().get_base_name()
# TODO Currently emscripten-based exception is the default mode, thus no
# suffixes. Change the default to wasm exception later.
if self.eh_mode == Exceptions.NONE:
name += '-noexcept'
elif self.eh_mode == Exceptions.WASM:
name += '-except'
return name
@classmethod
def variations(cls, **kwargs): # noqa
combos = super().variations()
return ([dict(eh_mode=Exceptions.NONE, **combo) for combo in combos] +
[dict(eh_mode=Exceptions.EMSCRIPTEN, **combo) for combo in combos] +
[dict(eh_mode=Exceptions.WASM, **combo) for combo in combos])
@classmethod
def get_default_variation(cls, **kwargs):
if settings.WASM_EXCEPTIONS:
eh_mode = Exceptions.WASM
elif settings.DISABLE_EXCEPTION_CATCHING == 1:
eh_mode = Exceptions.NONE
else:
eh_mode = Exceptions.EMSCRIPTEN
return super().get_default_variation(eh_mode=eh_mode, **kwargs)
class SjLjLibrary(Library):
def __init__(self, **kwargs):
# Whether we use Wasm EH instructions for SjLj support
self.is_wasm = kwargs.pop('is_wasm')
super().__init__(**kwargs)
def get_cflags(self):
cflags = super().get_cflags()
if self.is_wasm:
# DISABLE_EXCEPTION_THROWING=0 is the default, which is for Emscripten
# EH/SjLj, so we should reverse it.
cflags += ['-sSUPPORT_LONGJMP=wasm',
'-sDISABLE_EXCEPTION_THROWING=1',
'-D__USING_WASM_SJLJ__']
return cflags
def get_base_name(self):
name = super().get_base_name()
# TODO Currently emscripten-based SjLj is the default mode, thus no
# suffixes. Change the default to wasm exception later.
if self.is_wasm:
name += '-wasm-sjlj'
return name
@classmethod
def vary_on(cls):
return super().vary_on() + ['is_wasm']
@classmethod
def get_default_variation(cls, **kwargs):
is_wasm = settings.SUPPORT_LONGJMP == 'wasm'
return super().get_default_variation(is_wasm=is_wasm, **kwargs)
def can_build(self):
# wasm-sjlj is not yet supported with MEMORY64
return not (settings.MEMORY64 and self.is_wasm)
class MuslInternalLibrary(Library):
includes = [
'system/lib/libc/musl/src/internal',
'system/lib/libc/musl/src/include',
'system/lib/pthread',
]
cflags = [
'-std=c99',
'-D_XOPEN_SOURCE=700',
'-Wno-unused-result', # system call results are often ignored in musl, and in wasi that warns
]
class AsanInstrumentedLibrary(Library):
def __init__(self, **kwargs):
self.is_asan = kwargs.pop('is_asan', False)
super().__init__(**kwargs)
def get_cflags(self):
cflags = super().get_cflags()
if self.is_asan:
cflags += ['-fsanitize=address']
return cflags
def get_base_name(self):
name = super().get_base_name()
if self.is_asan:
name += '-asan'
return name
@classmethod
def vary_on(cls):
return super().vary_on() + ['is_asan']
@classmethod
def get_default_variation(cls, **kwargs):
return super().get_default_variation(is_asan=settings.USE_ASAN, **kwargs)
# Subclass of SjLjLibrary because emscripten_setjmp.c uses SjLj support
class libcompiler_rt(MTLibrary, SjLjLibrary):
name = 'libcompiler_rt'
# compiler_rt files can't currently be part of LTO although we are hoping to remove this
# restriction soon: https://reviews.llvm.org/D71738
force_object_files = True
cflags = ['-fno-builtin']
src_dir = 'system/lib/compiler-rt/lib/builtins'
# gcc_personality_v0.c depends on libunwind, which don't include by default.
src_files = glob_in_path(src_dir, '*.c', excludes=['gcc_personality_v0.c'])
src_files += files_in_path(
path='system/lib/compiler-rt',
filenames=[
'stack_ops.S',
'stack_limits.S',
'emscripten_setjmp.c',
'emscripten_exception_builtins.c',
'__trap.c',
])
class libnoexit(Library):
name = 'libnoexit'
# __cxa_atexit calls can be generated during LTO the implemenation cannot
# itself be LTO. See `get_libcall_files` below for more details.
force_object_files = True
src_dir = 'system/lib/libc'
src_files = ['atexit_dummy.c']
class libc(MuslInternalLibrary,
DebugLibrary,
AsanInstrumentedLibrary,
MTLibrary):
name = 'libc'
# Without -fno-builtin, LLVM can optimize away or convert calls to library
# functions to something else based on assumptions that they behave exactly
# like the standard library. This can cause unexpected bugs when we use our
# custom standard library. The same for other libc/libm builds.
cflags = ['-Os', '-fno-builtin']
# Disable certain warnings for code patterns that are contained in upstream musl
cflags += ['-Wno-ignored-attributes',
# tre.h defines NDEBUG internally itself
'-Wno-macro-redefined',
'-Wno-shift-op-parentheses',
'-Wno-string-plus-int',
'-Wno-pointer-sign']
def __init__(self, **kwargs):
self.non_lto_files = self.get_libcall_files()
super().__init__(**kwargs)
def get_libcall_files(self):
# Combining static linking with LTO is tricky under LLVM. The codegen that
# happens during LTO can generate references to new symbols that didn't exist
# in the linker inputs themselves.
# These symbols are called libcalls in LLVM and are the result of intrinsics
# and builtins at the LLVM level. These libcalls cannot themselves be part
# of LTO because once the linker is running the LTO phase new bitcode objects
# cannot be added to link. Another way of putting it: by the time LTO happens
# the decision about which bitcode symbols to compile has already been made.
# See: https://bugs.llvm.org/show_bug.cgi?id=44353.
# To solve this we force certain parts of libc to never be compiled as LTO/bitcode.
# Note that this also includes things that may be depended on by those
# functions - fmin uses signbit, for example, so signbit must be here (so if
# fmin is added by codegen, it will have all it needs).
math_files = [
'fmin.c', 'fminf.c', 'fminl.c',
'fmax.c', 'fmaxf.c', 'fmaxl.c',
'fmod.c', 'fmodf.c', 'fmodl.c',
'logf.c', 'logf_data.c',
'log2f.c', 'log2f_data.c',
'log10.c', 'log10f.c',
'exp.c', 'exp_data.c',
'exp2.c',
'exp2f.c', 'exp2f_data.c',
'exp10.c', 'exp10f.c',
'ldexp.c', 'ldexpf.c', 'ldexpl.c',
'scalbn.c', '__fpclassifyl.c',
'__signbitl.c', '__signbitf.c', '__signbit.c',
'__math_divzero.c', '__math_divzerof.c',
'__math_oflow.c', '__math_oflowf.c',
'__math_uflow.c', '__math_uflowf.c',
'__math_invalid.c', '__math_invalidf.c', '__math_invalidl.c',
'pow.c', 'pow_data.c', 'log.c', 'log_data.c', 'log2.c', 'log2_data.c'
]
math_files = files_in_path(path='system/lib/libc/musl/src/math', filenames=math_files)
exit_files = files_in_path(
path='system/lib/libc/musl/src/exit',
filenames=['atexit.c'])
other_files = files_in_path(
path='system/lib/libc',
filenames=['emscripten_memcpy.c', 'emscripten_memset.c',
'emscripten_scan_stack.c',
'emscripten_memmove.c'])
# Calls to iprintf can be generated during codegen. Ideally we wouldn't
# compile these with -O2 like we do the rest of compiler-rt since its
# probably not performance sensitive. However we don't currently have
# a way to set per-file compiler flags. And hopefully we should be able
# move all this stuff back into libc once we it LTO compatible.
iprintf_files = files_in_path(
path='system/lib/libc/musl/src/stdio',
filenames=['__towrite.c', '__overflow.c', 'fwrite.c', 'fputs.c',
'getc.c',
'fputc.c',
'fgets.c',
'putc.c', 'putc_unlocked.c',
'putchar.c', 'putchar_unlocked.c',
'printf.c', 'puts.c', '__lockfile.c'])
iprintf_files += files_in_path(
path='system/lib/libc/musl/src/string',
filenames=['strlen.c'])
return math_files + exit_files + other_files + iprintf_files
def get_files(self):
libc_files = []
musl_srcdir = utils.path_from_root('system/lib/libc/musl/src')
# musl modules
ignore = [
'ipc', 'passwd', 'signal', 'sched', 'time', 'linux',
'aio', 'exit', 'legacy', 'mq', 'setjmp', 'env',
'ldso', 'malloc'
]
# individual files
ignore += [
'memcpy.c', 'memset.c', 'memmove.c', 'getaddrinfo.c', 'getnameinfo.c',
'res_query.c', 'res_querydomain.c',
'proto.c', 'gethostbyaddr.c', 'gethostbyaddr_r.c', 'gethostbyname.c',
'gethostbyname2_r.c', 'gethostbyname_r.c', 'gethostbyname2.c',
'alarm.c', 'syscall.c', 'popen.c', 'pclose.c',
'getgrouplist.c', 'initgroups.c', 'wordexp.c', 'timer_create.c',
'getentropy.c',
# 'process' exclusion
'fork.c', 'vfork.c', 'posix_spawn.c', 'posix_spawnp.c', 'execve.c', 'waitid.c', 'system.c',
'_Fork.c',
]
ignore += LIBC_SOCKETS
if self.is_mt:
ignore += [
'clone.c',
'pthread_create.c',
'pthread_kill.c', 'pthread_sigmask.c',
'__set_thread_area.c', 'synccall.c',
'__syscall_cp.c', '__tls_get_addr.c',
'__unmapself.c',
# Empty files, simply ignore them.
'syscall_cp.c', 'tls.c',
# TODO: Support this. See #12216.
'pthread_setname_np.c',
]
libc_files += files_in_path(
path='system/lib/pthread',
filenames=[
'library_pthread.c',
'proxying.c',
'pthread_create.c',
'pthread_kill.c',
'emscripten_proxy_main.c',
'emscripten_thread_init.c',
'emscripten_thread_state.S',
'emscripten_futex_wait.c',
'emscripten_futex_wake.c',
'emscripten_yield.c',
])
else:
ignore += ['thread']
libc_files += files_in_path(
path='system/lib/libc/musl/src/thread',
filenames=[
'pthread_self.c',
'pthread_cleanup_push.c',
'pthread_attr_get.c',
# C11 thread library functions
'call_once.c',
'tss_create.c',
'tss_delete.c',
'tss_set.c',
'cnd_broadcast.c',
'cnd_destroy.c',
'cnd_init.c',
'cnd_signal.c',
'cnd_timedwait.c',
'cnd_wait.c',
'mtx_destroy.c',
'mtx_init.c',
'mtx_lock.c',
'mtx_timedlock.c',
'mtx_trylock.c',
'mtx_unlock.c',
'thrd_create.c',
'thrd_exit.c',
'thrd_join.c',
'thrd_sleep.c',
'thrd_yield.c',
])
libc_files += files_in_path(
path='system/lib/pthread',
filenames=[
'library_pthread_stub.c',
'pthread_self_stub.c',
'proxying_stub.c',
])
# These files are in libc directories, but only built in libc_optz.
ignore += [
'pow_small.c', 'log_small.c', 'log2_small.c'
]
ignore = set(ignore)
for dirpath, dirnames, filenames in os.walk(musl_srcdir):
# Don't recurse into ingored directories
remove = [d for d in dirnames if d in ignore]
for r in remove:
dirnames.remove(r)
for f in filenames:
if f.endswith('.c') and f not in ignore:
libc_files.append(os.path.join(musl_srcdir, dirpath, f))
# Allowed files from ignored modules
libc_files += files_in_path(
path='system/lib/libc/musl/src/time',
filenames=[
'clock_settime.c',
'asctime_r.c',
'asctime.c',
'ctime.c',
'difftime.c',
'ftime.c',
'gmtime.c',
'localtime.c',
'nanosleep.c',
'clock_nanosleep.c',
'ctime_r.c',
'timespec_get.c',
'utime.c',
'__map_file.c',
])
libc_files += files_in_path(
path='system/lib/libc/musl/src/legacy',
filenames=['getpagesize.c', 'err.c'])
libc_files += files_in_path(
path='system/lib/libc/musl/src/linux',
filenames=['getdents.c', 'gettid.c', 'utimes.c'])
libc_files += files_in_path(
path='system/lib/libc/musl/src/env',
filenames=['__environ.c', 'getenv.c', 'putenv.c', 'setenv.c', 'unsetenv.c'])
libc_files += files_in_path(
path='system/lib/libc/musl/src/sched',
filenames=['sched_yield.c'])
libc_files += files_in_path(
path='system/lib/libc/musl/src/exit',
filenames=['_Exit.c', 'atexit.c'])
libc_files += files_in_path(
path='system/lib/libc/musl/src/ldso',
filenames=['dlerror.c', 'dlsym.c', 'dlclose.c'])
libc_files += files_in_path(
path='system/lib/libc/musl/src/signal',
filenames=[
'block.c',
'getitimer.c',
'killpg.c',
'setitimer.c',
'sigorset.c',
'sigandset.c',
'sigaddset.c',
'sigdelset.c',
'sigemptyset.c',
'sigfillset.c',
'sigismember.c',
'siginterrupt.c',
'signal.c',
'sigprocmask.c',
'sigrtmax.c',
'sigrtmin.c',
'sigwait.c',
'sigwaitinfo.c',
])
libc_files += files_in_path(
path='system/lib/libc',
filenames=[
'dynlink.c',
'wasi-helpers.c',
'emscripten_get_heap_size.c',
'raise.c',
'kill.c',
'sigaction.c',
'sigtimedwait.c',
'pthread_sigmask.c',
'emscripten_console.c',
'emscripten_time.c',
])
libc_files += files_in_path(
path='system/lib/pthread',
filenames=['emscripten_atomic.c', 'thread_profiler.c'])
libc_files += files_in_path(
path='system/lib/libc',
filenames=['emscripten_memcpy.c',
'emscripten_memset.c',
'emscripten_scan_stack.c',
'emscripten_memmove.c',
'emscripten_mmap.c'
])
libc_files += glob_in_path('system/lib/libc/compat', '*.c')
# Check for missing file in non_lto_files list. Do this here
# rather than in the constructor so it only happens when the
# library is actually built (not when its instantiated).
for f in self.non_lto_files:
assert os.path.exists(f), f
return libc_files