1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
129
130
131
132
133
134
135
136
137
138
139
140
141
142
143
144
145
146
147
148
149
150
151
152
153
154
155
156
157
158
159
160
161
162
163
164
165
166
167
168
169
170
171
172
173
174
175
176
177
178
179
180
181
182
183
184
185
186
187
188
189
190
191
192
193
194
195
196
197
198
199
200
201
202
203
204
205
206
207
208
209
210
211
212
213
214
215
216
217
218
219
220
221
222
223
224
225
226
227
228
229
230
231
232
233
234
235
236
237
238
239
240
241
242
243
244
245
246
247
248
249
250
251
252
253
254
255
256
257
258
259
260
261
262
263
264
265
266
267
268
269
270
271
272
273
274
275
276
277
278
279
280
281
282
283
284
285
286
287
288
289
290
291
292
293
294
295
296
297
298
299
300
301
302
303
304
305
306
307
308
309
310
311
312
313
314
315
316
317
318
319
320
321
322
323
324
325
326
327
328
329
330
331
332
333
334
335
336
337
338
339
340
341
342
343
344
345
346
347
348
349
350
351
352
353
354
355
356
357
358
359
360
361
362
363
364
365
366
367
368
369
370
371
372
373
374
375
376
377
378
379
380
381
382
383
384
385
386
387
388
389
390
391
392
393
394
395
396
397
398
399
400
|
/*
* Copyright 2017 WebAssembly Community Group participants
*
* Licensed under the Apache License, Version 2.0 (the "License");
* you may not use this file except in compliance with the License.
* You may obtain a copy of the License at
*
* http://www.apache.org/licenses/LICENSE-2.0
*
* Unless required by applicable law or agreed to in writing, software
* distributed under the License is distributed on an "AS IS" BASIS,
* WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
* See the License for the specific language governing permissions and
* limitations under the License.
*/
//
// wasm-emscripten-finalize console tool
// Performs Emscripten-specific transforms on .wasm files
//
#include <exception>
#include "abi/js.h"
#include "ir/trapping.h"
#include "support/colors.h"
#include "support/debug.h"
#include "support/file.h"
#include "tool-options.h"
#include "wasm-binary.h"
#include "wasm-emscripten.h"
#include "wasm-io.h"
#include "wasm-printing.h"
#include "wasm-validator.h"
#define DEBUG_TYPE "emscripten"
using namespace cashew;
using namespace wasm;
int main(int argc, const char* argv[]) {
const uint64_t INVALID_BASE = -1;
std::string infile;
std::string outfile;
std::string inputSourceMapFilename;
std::string outputSourceMapFilename;
std::string outputSourceMapUrl;
std::string dataSegmentFile;
bool emitBinary = true;
bool debugInfo = false;
bool DWARF = false;
bool sideModule = false;
bool legacyPIC = true;
bool legalizeJavaScriptFFI = true;
bool bigInt = false;
bool checkStackOverflow = false;
uint64_t globalBase = INVALID_BASE;
bool standaloneWasm = false;
// TODO: remove after https://github.com/WebAssembly/binaryen/issues/3043
bool minimizeWasmChanges = false;
bool noDynCalls = false;
bool onlyI64DynCalls = false;
ToolOptions options("wasm-emscripten-finalize",
"Performs Emscripten-specific transforms on .wasm files");
options
.add("--output",
"-o",
"Output file",
Options::Arguments::One,
[&outfile](Options*, const std::string& argument) {
outfile = argument;
Colors::setEnabled(false);
})
.add("--debuginfo",
"-g",
"Emit names section in wasm binary (or full debuginfo in wast)",
Options::Arguments::Zero,
[&debugInfo](Options*, const std::string&) { debugInfo = true; })
.add("--dwarf",
"",
"Update DWARF debug info",
Options::Arguments::Zero,
[&DWARF](Options*, const std::string&) { DWARF = true; })
.add("--emit-text",
"-S",
"Emit text instead of binary for the output file. "
"In this mode if no output file is specified, we write to stdout.",
Options::Arguments::Zero,
[&emitBinary](Options*, const std::string&) { emitBinary = false; })
.add("--global-base",
"",
"The address at which static globals were placed",
Options::Arguments::One,
[&globalBase](Options*, const std::string& argument) {
globalBase = std::stoull(argument);
})
// TODO(sbc): Remove this one this argument is no longer passed by
// emscripten. See https://github.com/emscripten-core/emscripten/issues/8905
.add("--initial-stack-pointer",
"",
"ignored - will be removed in a future release",
Options::Arguments::One,
[](Options*, const std::string& argument) {})
.add("--side-module",
"",
"Input is an emscripten side module",
Options::Arguments::Zero,
[&sideModule](Options* o, const std::string& argument) {
sideModule = true;
})
.add("--new-pic-abi",
"",
"Use new/llvm PIC abi",
Options::Arguments::Zero,
[&legacyPIC](Options* o, const std::string& argument) {
legacyPIC = false;
})
.add("--input-source-map",
"-ism",
"Consume source map from the specified file",
Options::Arguments::One,
[&inputSourceMapFilename](Options* o, const std::string& argument) {
inputSourceMapFilename = argument;
})
.add("--no-legalize-javascript-ffi",
"-nj",
"Do not fully legalize (i64->i32, "
"f32->f64) the imports and exports for interfacing with JS",
Options::Arguments::Zero,
[&legalizeJavaScriptFFI](Options* o, const std::string&) {
legalizeJavaScriptFFI = false;
})
.add("--bigint",
"-bi",
"Assume JS will use wasm/JS BigInt integration, so wasm i64s will "
"turn into JS BigInts, and there is no need for any legalization at "
"all (not even minimal legalization of dynCalls)",
Options::Arguments::Zero,
[&bigInt](Options* o, const std::string&) { bigInt = true; })
.add("--output-source-map",
"-osm",
"Emit source map to the specified file",
Options::Arguments::One,
[&outputSourceMapFilename](Options* o, const std::string& argument) {
outputSourceMapFilename = argument;
})
.add("--output-source-map-url",
"-osu",
"Emit specified string as source map URL",
Options::Arguments::One,
[&outputSourceMapUrl](Options* o, const std::string& argument) {
outputSourceMapUrl = argument;
})
.add("--separate-data-segments",
"",
"Separate data segments to a file",
Options::Arguments::One,
[&dataSegmentFile](Options* o, const std::string& argument) {
dataSegmentFile = argument;
})
.add("--check-stack-overflow",
"",
"Check for stack overflows every time the stack is extended",
Options::Arguments::Zero,
[&checkStackOverflow](Options* o, const std::string&) {
checkStackOverflow = true;
})
.add("--standalone-wasm",
"",
"Emit a wasm file that does not depend on JS, as much as possible,"
" using wasi and other standard conventions etc. where possible",
Options::Arguments::Zero,
[&standaloneWasm](Options* o, const std::string&) {
standaloneWasm = true;
})
.add("--minimize-wasm-changes",
"",
"Modify the wasm as little as possible. This is useful during "
"development as we reduce the number of changes to the wasm, as it "
"lets emscripten control how much modifications to do.",
Options::Arguments::Zero,
[&minimizeWasmChanges](Options* o, const std::string&) {
minimizeWasmChanges = true;
})
.add("--no-dyncalls",
"",
"",
Options::Arguments::Zero,
[&noDynCalls](Options* o, const std::string&) { noDynCalls = true; })
.add("--dyncalls-i64",
"",
"",
Options::Arguments::Zero,
[&onlyI64DynCalls](Options* o, const std::string&) {
onlyI64DynCalls = true;
})
.add_positional("INFILE",
Options::Arguments::One,
[&infile](Options* o, const std::string& argument) {
infile = argument;
});
options.parse(argc, argv);
if (infile == "") {
Fatal() << "Need to specify an infile\n";
}
Module wasm;
ModuleReader reader;
reader.setDWARF(DWARF);
try {
reader.read(infile, wasm, inputSourceMapFilename);
} catch (ParseException& p) {
p.dump(std::cerr);
std::cerr << '\n';
Fatal() << "error in parsing input";
} catch (MapParseException& p) {
p.dump(std::cerr);
std::cerr << '\n';
Fatal() << "error in parsing wasm source map";
}
options.applyFeatures(wasm);
BYN_TRACE_WITH_TYPE("emscripten-dump", "Module before:\n");
BYN_DEBUG_WITH_TYPE("emscripten-dump",
WasmPrinter::printModule(&wasm, std::cerr));
uint32_t dataSize = 0;
if (!sideModule) {
if (globalBase == INVALID_BASE) {
Fatal() << "globalBase must be set";
}
Export* dataEndExport = wasm.getExport("__data_end");
if (dataEndExport == nullptr) {
Fatal() << "__data_end export not found";
}
Global* dataEnd = wasm.getGlobal(dataEndExport->value);
if (dataEnd == nullptr) {
Fatal() << "__data_end global not found";
}
if (dataEnd->type != Type::i32) {
Fatal() << "__data_end global has wrong type";
}
if (dataEnd->imported()) {
Fatal() << "__data_end must not be an imported global";
}
Const* dataEndConst = dataEnd->init->cast<Const>();
dataSize = dataEndConst->value.geti32() - globalBase;
}
EmscriptenGlueGenerator generator(wasm);
generator.standalone = standaloneWasm;
generator.sideModule = sideModule;
generator.minimizeWasmChanges = minimizeWasmChanges;
generator.onlyI64DynCalls = onlyI64DynCalls;
generator.noDynCalls = noDynCalls;
generator.fixInvokeFunctionNames();
std::vector<Name> initializerFunctions;
// The wasm backend emits "__indirect_function_table" as the import name for
// the table, while older emscripten expects "table"
if (wasm.table.imported() && !minimizeWasmChanges) {
wasm.table.base = Name("table");
}
wasm.updateMaps();
if (!standaloneWasm) {
// This is also not needed in standalone mode since standalone mode uses
// crt1.c to invoke the main and is aware of __main_argc_argv mangling.
generator.renameMainArgcArgv();
}
PassRunner passRunner(&wasm, options.passOptions);
passRunner.setDebug(options.debug);
passRunner.setDebugInfo(debugInfo);
if (checkStackOverflow && !sideModule) {
if (!standaloneWasm) {
// In standalone mode we don't set a handler at all.. which means
// just trap on overflow.
passRunner.options.arguments["stack-check-handler"] =
"__handle_stack_overflow";
}
passRunner.add("stack-check");
}
if (sideModule) {
passRunner.add("replace-stack-pointer");
}
if (legacyPIC) {
if (sideModule) {
passRunner.add("emscripten-pic");
} else {
passRunner.add("emscripten-pic-main-module");
}
}
if (!noDynCalls && !standaloneWasm) {
// If not standalone wasm then JS is relevant and we need dynCalls.
if (onlyI64DynCalls) {
passRunner.add("generate-i64-dyncalls");
} else {
passRunner.add("generate-dyncalls");
}
}
// Legalize the wasm, if BigInts don't make that moot.
if (!bigInt) {
passRunner.add(ABI::getLegalizationPass(
legalizeJavaScriptFFI ? ABI::LegalizationLevel::Full
: ABI::LegalizationLevel::Minimal));
}
// Strip target features section (its information is in the metadata)
passRunner.add("strip-target-features");
// If DWARF is unused, strip it out. This avoids us keeping it alive
// until wasm-opt strips it later.
if (!DWARF) {
passRunner.add("strip-dwarf");
}
passRunner.run();
if (sideModule) {
BYN_TRACE("finalizing as side module\n");
generator.generatePostInstantiateFunction();
} else {
BYN_TRACE("finalizing as regular module\n");
generator.internalizeStackPointerGlobal();
// For side modules these gets called via __post_instantiate
if (Function* F = wasm.getFunctionOrNull(ASSIGN_GOT_ENTRIES)) {
auto* ex = new Export();
ex->value = F->name;
ex->name = F->name;
ex->kind = ExternalKind::Function;
wasm.addExport(ex);
initializerFunctions.push_back(F->name);
}
// Costructors get called from crt1 in wasm standalone mode.
// Unless there is no entry point.
if (!standaloneWasm || !wasm.getExportOrNull("_start")) {
if (auto* e = wasm.getExportOrNull(WASM_CALL_CTORS)) {
initializerFunctions.push_back(e->name);
}
}
}
BYN_TRACE("generated metadata\n");
// Substantial changes to the wasm are done, enough to create the metadata.
std::string metadata =
generator.generateEmscriptenMetadata(dataSize, initializerFunctions);
// Finally, separate out data segments if relevant (they may have been needed
// for metadata).
if (!dataSegmentFile.empty()) {
Output memInitFile(dataSegmentFile, Flags::Binary);
if (globalBase == INVALID_BASE) {
Fatal() << "globalBase must be set";
}
generator.separateDataSegments(&memInitFile, globalBase);
}
BYN_TRACE_WITH_TYPE("emscripten-dump", "Module after:\n");
BYN_DEBUG_WITH_TYPE("emscripten-dump",
WasmPrinter::printModule(&wasm, std::cerr));
// Write the modified wasm if the user asked us to, either by specifying an
// output file, or requesting text output (which goes to stdout by default).
if (outfile.size() > 0 || !emitBinary) {
Output output(outfile, emitBinary ? Flags::Binary : Flags::Text);
ModuleWriter writer;
writer.setDebugInfo(debugInfo);
// writer.setSymbolMap(symbolMap);
writer.setBinary(emitBinary);
if (outputSourceMapFilename.size()) {
writer.setSourceMapFilename(outputSourceMapFilename);
writer.setSourceMapUrl(outputSourceMapUrl);
}
writer.write(wasm, output);
if (!emitBinary) {
output << "(;\n";
output << "--BEGIN METADATA --\n" << metadata << "-- END METADATA --\n";
output << ";)\n";
}
}
// If we emit text then we emitted the metadata together with that text
// earlier. Otherwise emit it to stdout.
if (emitBinary) {
std::cout << metadata;
}
return 0;
}
|