RemoveUnusedBrs.cpp
/*
* Copyright 2015 WebAssembly Community Group participants
*
* Licensed under the Apache License, Version 2.0 (the "License");
* you may not use this file except in compliance with the License.
* You may obtain a copy of the License at
*
* http://www.apache.org/licenses/LICENSE-2.0
*
* Unless required by applicable law or agreed to in writing, software
* distributed under the License is distributed on an "AS IS" BASIS,
* WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
* See the License for the specific language governing permissions and
* limitations under the License.
*/
//
// Removes branches for which we go to where they go anyhow.
//
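// (A usage sketch, not taken from this file: this is a function-parallel pass,
// and it can be run standalone with something like
//   wasm-opt --remove-unused-brs in.wasm -o out.wasm
// where the pass name "remove-unused-brs" is assumed from the file name; it is
// also typically run as part of the default -O pipelines.)
//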
#include "ir/branch-hints.h"
#include "ir/branch-utils.h"
#include "ir/cost.h"
#include "ir/drop.h"
#include "ir/effects.h"
#include "ir/gc-type-utils.h"
#include "ir/literal-utils.h"
#include "ir/localize.h"
#include "ir/properties.h"
#include "ir/utils.h"
#include "parsing.h"
#include "pass.h"
#include "support/small_set.h"
#include "wasm-builder.h"
#include "wasm-type.h"
#include "wasm.h"
namespace wasm {
// Grab a slice out of a block, replacing it with nops, and returning
// either another block with the contents (if more than 1) or a single
// expression.
// This does not finalize the input block; it leaves that for the caller.
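// For example (a sketch, with letters standing for arbitrary expressions):
// stealing [2, 4) from (block A B C D E) returns (block C D) and leaves
// (block A B nop nop E); stealing [3, 5) instead returns (block D E) and
// truncates the input to (block A B C).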
static Expression*
stealSlice(Builder& builder, Block* input, Index from, Index to) {
Expression* ret;
if (to == from + 1) {
// just one
ret = input->list[from];
} else {
auto* block = builder.makeBlock();
for (Index i = from; i < to; i++) {
block->list.push_back(input->list[i]);
}
block->finalize();
ret = block;
}
if (to == input->list.size()) {
input->list.resize(from);
} else {
for (Index i = from; i < to; i++) {
input->list[i] = builder.makeNop();
}
}
return ret;
}
// to turn an if into a br-if, we must be able to reorder the
// condition and possible value, and the possible value must
// not have side effects (as they would run unconditionally)
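// For example (a sketch of the transform this check guards, see visitIf below):
//   (if (condition) (br $target (value)))
//     =>
//   (br_if $target (value) (condition))
// In the br_if form the value is evaluated before the condition, and it is
// evaluated even when the branch is not taken, hence the checks below.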
static bool canTurnIfIntoBrIf(Expression* ifCondition,
Expression* brValue,
PassOptions& options,
Module& wasm) {
// if the if isn't even reached, this is all dead code anyhow
if (ifCondition->type == Type::unreachable) {
return false;
}
if (!brValue) {
return true;
}
EffectAnalyzer value(options, wasm, brValue);
if (value.hasSideEffects()) {
return false;
}
return !EffectAnalyzer(options, wasm, ifCondition).invalidates(value);
}
// This leads to similar choices as LLVM does in some cases, by balancing the
// extra work of code that is run unconditionally with the speedup from not
// branching to decide whether to run it or not.
// See:
// * https://github.com/WebAssembly/binaryen/pull/4228
// * https://github.com/WebAssembly/binaryen/issues/5983
const Index TooCostlyToRunUnconditionally = 8;
// Some costs are known to be too high to move from conditional to unconditional
// execution.
static_assert(CostAnalyzer::AtomicCost >= TooCostlyToRunUnconditionally,
"We never run atomics unconditionally");
static_assert(CostAnalyzer::ThrowCost >= TooCostlyToRunUnconditionally,
"We never run throws unconditionally");
static_assert(CostAnalyzer::CastCost > TooCostlyToRunUnconditionally / 2,
"We only run casts unconditionally when optimizing for size");
static bool tooCostlyToRunUnconditionally(const PassOptions& passOptions,
Index cost) {
if (passOptions.shrinkLevel == 0) {
// We are focused on speed. Any extra cost is risky, but allow a small
// amount.
return cost > TooCostlyToRunUnconditionally / 2;
} else if (passOptions.shrinkLevel == 1) {
// We are optimizing for size in a balanced manner. Allow some extra
// overhead here.
return cost >= TooCostlyToRunUnconditionally;
} else {
// We should have already decided what to do if shrink_level=2 and not
// gotten here, and other values are invalid.
WASM_UNREACHABLE("bad shrink level");
}
}
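// For illustration, with the constant of 8 above: at shrinkLevel 0 any cost
// above 4 is rejected, and at shrinkLevel 1 any cost of 8 or more is rejected.
// (shrinkLevel >= 2 never reaches here; the callers below early-exit and
// accept any cost in that case.)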
// As above, but a single expression that we are considering moving to a place
// where it executes unconditionally.
static bool tooCostlyToRunUnconditionally(const PassOptions& passOptions,
Expression* curr) {
// If we care entirely about code size, just do it for that reason (early
// exit to avoid work).
if (passOptions.shrinkLevel >= 2) {
return false;
}
auto cost = CostAnalyzer(curr).cost;
return tooCostlyToRunUnconditionally(passOptions, cost);
}
// Check if it is not worth it to run code unconditionally. This
// assumes we are trying to run two expressions where previously
// only one of the two might have executed. We assume here that
// executing both is good for code size.
static bool tooCostlyToRunUnconditionally(const PassOptions& passOptions,
Expression* one,
Expression* two) {
// If we care entirely about code size, just do it for that reason (early
// exit to avoid work).
if (passOptions.shrinkLevel >= 2) {
return false;
}
// Consider the cost of executing all the code unconditionally, which adds
// either the cost of running one or two, so the maximum is the worst case.
auto max = std::max(CostAnalyzer(one).cost, CostAnalyzer(two).cost);
return tooCostlyToRunUnconditionally(passOptions, max);
}
struct RemoveUnusedBrs : public WalkerPass<PostWalker<RemoveUnusedBrs>> {
bool isFunctionParallel() override { return true; }
std::unique_ptr<Pass> create() override {
return std::make_unique<RemoveUnusedBrs>();
}
bool anotherCycle;
// Whether we are allowed to unconditionalize code, that is, make code run
// that previously might not have. Unconditionalizing code is a problem for
// fuzzing branch hints: a branch hint that never ran might be wrong, and if
// we start to run it, the fuzzer would report a finding.
bool neverUnconditionalize;
using Flows = std::vector<Expression**>;
// list of breaks that are currently flowing. if they reach their target
// without interference, they can be removed (or their value forwarded TODO)
Flows flows;
// a stack for if-else contents, we merge their outputs
std::vector<Flows> ifStack;
// list of all loops, so we can optimize them
std::vector<Loop*> loops;
static void visitAny(RemoveUnusedBrs* self, Expression** currp) {
auto* curr = *currp;
auto& flows = self->flows;
if (curr->is<Break>()) {
flows.clear();
auto* br = curr->cast<Break>();
if (!br->condition) { // TODO: optimize?
// a break, let's see where it flows to
flows.push_back(currp);
} else {
self->stopValueFlow();
}
} else if (curr->is<Return>()) {
flows.clear();
flows.push_back(currp);
} else if (curr->is<If>()) {
auto* iff = curr->cast<If>();
if (iff->condition->type == Type::unreachable) {
// avoid trying to optimize this, we never reach it anyhow
self->stopFlow();
return;
}
if (iff->ifFalse) {
assert(self->ifStack.size() > 0);
auto ifTrueFlows = std::move(self->ifStack.back());
self->ifStack.pop_back();
// we can flow values out in most cases, except if one arm
// has the none type - we will update the types later, but
// there is no way to emit a proper type for one arm being
// none and the other flowing a value; and there is no way
// to flow a value from a none.
if (iff->ifTrue->type == Type::none ||
iff->ifFalse->type == Type::none) {
self->removeValueFlow(ifTrueFlows);
self->stopValueFlow();
}
for (auto* flow : ifTrueFlows) {
flows.push_back(flow);
}
} else {
// if without else stops the flow of values
self->stopValueFlow();
}
} else if (auto* block = curr->dynCast<Block>()) {
// any breaks flowing to here are unnecessary, as we get here anyhow
auto name = block->name;
auto& list = block->list;
if (name.is()) {
Index size = flows.size();
Index skip = 0;
for (Index i = 0; i < size; i++) {
auto* flow = (*flows[i])->dynCast<Break>();
if (flow && flow->name == name) {
if (!flow->value) {
// br => nop
ExpressionManipulator::nop<Break>(flow);
} else {
// br with value => value
*flows[i] = flow->value;
}
skip++;
self->anotherCycle = true;
} else if (skip > 0) {
flows[i - skip] = flows[i];
}
}
if (skip > 0) {
flows.resize(size - skip);
}
}
// Drop a nop at the end of a block, which prevents a value flowing. Note
// that this is worth doing regardless of whether we have a name on this
// block or not (which the if right above us checks) - such a nop is
// always unneeded and can limit later optimizations.
while (list.size() > 0 && list.back()->is<Nop>()) {
list.resize(list.size() - 1);
self->anotherCycle = true;
}
// A value flowing is only valid if it is a value that the block actually
// flows out. If it is never reached, it does not flow out, and may be
// invalid to represent as such.
auto size = list.size();
for (Index i = 0; i < size; i++) {
if (i != size - 1 && list[i]->type == Type::unreachable) {
// No value flows out of this block.
self->stopValueFlow();
break;
}
}
} else if (curr->is<Nop>()) {
// Ignore (could be result of a previous cycle).
self->stopValueFlow();
} else if (curr->is<Loop>() || curr->is<TryTable>()) {
// Do nothing - it's ok for values to flow out.
// TODO: Legacy Try as well?
} else if (auto* sw = curr->dynCast<Switch>()) {
self->stopFlow();
self->optimizeSwitch(sw);
} else {
// Anything else stops the flow.
self->stopFlow();
}
}
void stopFlow() { flows.clear(); }
void removeValueFlow(Flows& currFlows) {
currFlows.erase(std::remove_if(currFlows.begin(),
currFlows.end(),
[&](Expression** currp) {
auto* curr = *currp;
if (auto* ret = curr->dynCast<Return>()) {
return ret->value;
}
return curr->cast<Break>()->value;
}),
currFlows.end());
}
void stopValueFlow() { removeValueFlow(flows); }
static void clear(RemoveUnusedBrs* self, Expression** currp) {
self->flows.clear();
}
static void saveIfTrue(RemoveUnusedBrs* self, Expression** currp) {
self->ifStack.push_back(std::move(self->flows));
}
void visitLoop(Loop* curr) { loops.push_back(curr); }
void optimizeSwitch(Switch* curr) {
// if the final element is the default, we don't need it
while (!curr->targets.empty() && curr->targets.back() == curr->default_) {
curr->targets.pop_back();
}
// if the first element is the default, we can remove it by shifting
// everything (which does add a subtraction of a constant, but often that is
// worth it as the constant can be folded away and/or we remove multiple
// elements here)
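// For example (sketch): with default $d,
//   (br_table $d $d $a $b $d (x))
//     =>
//   (br_table $a $b $d (i32.sub (x) (i32.const 2)))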
Index removable = 0;
while (removable < curr->targets.size() &&
curr->targets[removable] == curr->default_) {
removable++;
}
if (removable > 0) {
for (Index i = removable; i < curr->targets.size(); i++) {
curr->targets[i - removable] = curr->targets[i];
}
curr->targets.resize(curr->targets.size() - removable);
Builder builder(*getModule());
curr->condition = builder.makeBinary(
SubInt32, curr->condition, builder.makeConst(int32_t(removable)));
}
// when there isn't a value, we can do some trivial optimizations without
// worrying about the value being executed before the condition
if (curr->value) {
return;
}
if (curr->targets.size() == 0) {
// a switch with just a default always goes there
Builder builder(*getModule());
replaceCurrent(builder.makeSequence(builder.makeDrop(curr->condition),
builder.makeBreak(curr->default_)));
} else if (curr->targets.size() == 1) {
// a switch with two options is basically an if
Builder builder(*getModule());
replaceCurrent(builder.makeIf(curr->condition,
builder.makeBreak(curr->default_),
builder.makeBreak(curr->targets.front())));
} else {
// there are also some other cases where we want to convert a switch into
// ifs, especially if the switch is large and we are focusing on size. an
// especially egregious case is a switch like this: [a b b [..] b b c]
// with default b (which may be arrived at after we trim away excess
// default values on both sides). in this case, we really have 3 values in
// a simple form, so it is the next logical case after handling 1 and 2
// values right above here. to optimize this, we must add a local + a
// bunch of nodes (if*2, tee, eq, get, const, break*3), so the table must
// be big enough for it to make sense
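// as a sketch, with default $b and N targets, the table
//   (br_table $a $b $b [..] $b $b $c $b (x))
// becomes roughly
//   (if (local.tee $t (x))
//     (if (i32.eq (local.get $t) (i32.const N-1))
//       (br $c)
//       (br $b))
//     (br $a))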
// How many targets we need when shrinking. This is literally the size at
// which the transformation begins to be smaller.
const uint32_t MIN_SHRINK = 13;
// How many targets we need when not shrinking, in which case, 2 ifs may
// be slower, so we do this when the table is ridiculously large for one
// with just 3 values in it.
const uint32_t MIN_GENERAL = 128;
auto shrink = getPassRunner()->options.shrinkLevel > 0;
if ((curr->targets.size() >= MIN_SHRINK && shrink) ||
(curr->targets.size() >= MIN_GENERAL && !shrink)) {
for (Index i = 1; i < curr->targets.size() - 1; i++) {
if (curr->targets[i] != curr->default_) {
return;
}
}
// great, we are in that case, optimize
Builder builder(*getModule());
auto temp = builder.addVar(getFunction(), Type::i32);
Expression* z;
replaceCurrent(z = builder.makeIf(
builder.makeLocalTee(temp, curr->condition, Type::i32),
builder.makeIf(builder.makeBinary(
EqInt32,
builder.makeLocalGet(temp, Type::i32),
builder.makeConst(
int32_t(curr->targets.size() - 1))),
builder.makeBreak(curr->targets.back()),
builder.makeBreak(curr->default_)),
builder.makeBreak(curr->targets.front())));
}
}
}
void visitIf(If* curr) {
if (!curr->ifFalse) {
// if without an else. try to reduce
// if (condition) br => br_if (condition)
if (Break* br = curr->ifTrue->dynCast<Break>()) {
if (canTurnIfIntoBrIf(
curr->condition, br->value, getPassOptions(), *getModule())) {
if (!br->condition) {
br->condition = curr->condition;
BranchHints::copyTo(curr, br, getFunction());
} else {
// In this case we can replace
// if (condition1) br_if (condition2)
// =>
// br_if select (condition1) (condition2) (i32.const 0)
// In other words, we replace an if (3 bytes) with a select and a
// zero (also 3 bytes). The size is unchanged, but the select may
// be further optimizable, and if select does not branch we also
// avoid one branch.
if (neverUnconditionalize) {
// Creating a select, below, would unconditionally run the
// select's condition.
return;
}
// Multivalue selects are not supported.
if (br->value && br->value->type.isTuple()) {
return;
}
// If running the br's condition unconditionally is too expensive,
// give up.
auto* zero = LiteralUtils::makeZero(Type::i32, *getModule());
if (tooCostlyToRunUnconditionally(
getPassOptions(), br->condition, zero)) {
return;
}
// Of course we can't do this if the br's condition has side
// effects, as we would then execute those unconditionally.
if (EffectAnalyzer(getPassOptions(), *getModule(), br->condition)
.hasSideEffects()) {
return;
}
Builder builder(*getModule());
// Note that we use the br's condition as the select condition.
// That keeps the order of the two conditions as it was originally.
br->condition =
builder.makeSelect(br->condition, curr->condition, zero);
BranchHints::applyAndTo(curr, br, br, getFunction());
}
br->finalize();
replaceCurrent(Builder(*getModule()).dropIfConcretelyTyped(br));
anotherCycle = true;
}
}
// if (condition-A) { if (condition-B) .. }
// =>
// if (condition-A ? condition-B : 0) { .. }
//
// This replaces an if, which is 3 bytes, with a select plus a zero, which
// is also 3 bytes. The benefit is that the select may be faster, and also
// further optimizations may be possible on the select.
if (auto* child = curr->ifTrue->dynCast<If>()) {
if (child->ifFalse) {
return;
}
if (neverUnconditionalize) {
// Creating a select, below, would unconditionally run the inner if's
// condition (condition-B, in the comment above).
return;
}
// If running the child's condition unconditionally is too expensive,
// give up.
if (tooCostlyToRunUnconditionally(getPassOptions(), child->condition)) {
return;
}
// Of course we can't do this if the inner if's condition has side
// effects, as we would then execute those unconditionally.
if (EffectAnalyzer(getPassOptions(), *getModule(), child->condition)
.hasSideEffects()) {
return;
}
Builder builder(*getModule());
curr->condition = builder.makeSelect(
child->condition, curr->condition, builder.makeConst(int32_t(0)));
BranchHints::applyAndTo(curr, child, curr, getFunction());
curr->ifTrue = child->ifTrue;
}
}
// TODO: if-else can be turned into a br_if as well, if one of the sides is
// a dead end.
// We handle the case of a returned value to a local.set later down; see
// visitLocalSet.
}
// A stack of catching expressions that are parents of the current expression,
// that is, Try and TryTable.
std::vector<Expression*> catchers;
static void popCatcher(RemoveUnusedBrs* self, Expression** currp) {
assert(!self->catchers.empty() && self->catchers.back() == *currp);
self->catchers.pop_back();
}
void visitThrow(Throw* curr) {
// If a throw will definitely be caught, and it is not a catch with a
// reference, then it is just a branch (i.e. the code is using exceptions as
// control flow). Turn it into a branch here so that the rest of the pass
// can optimize it with all other branches.
//
// To do so, look at the closest try and see if it will catch us, and
// proceed outwards if not.
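// For example (a sketch in wat):
//   (try_table (catch $e $dest)
//     ...
//     (throw $e (value))
//     ...)
// Here the throw can become (br $dest (value)): $dest receives the tag's
// values, and no exnref is involved.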
auto thrownTag = curr->tag;
for (int i = catchers.size() - 1; i >= 0; i--) {
auto* tryy = catchers[i]->dynCast<TryTable>();
if (!tryy) {
// We do not handle mixtures of Try and TryTable.
return;
}
for (Index j = 0; j < tryy->catchTags.size(); j++) {
auto tag = tryy->catchTags[j];
// The tag must match, or be a catch_all.
if (tag == thrownTag || tag.isNull()) {
// This must not be a catch with exnref.
if (!tryy->catchRefs[j]) {
// Success! Create a break to replace the throw.
auto dest = tryy->catchDests[j];
auto& wasm = *getModule();
Builder builder(wasm);
if (!tag.isNull()) {
// We are catching a specific tag, so values might be sent.
Expression* value = nullptr;
if (curr->operands.size() == 1) {
value = curr->operands[0];
} else if (curr->operands.size() > 1) {
value = builder.makeTupleMake(curr->operands);
}
auto* br = builder.makeBreak(dest, value);
replaceCurrent(br);
return;
}
// catch_all: no values are sent. Drop the throw's children (while
// ignoring parent effects: the parent is a throw, but we have
// proven we can remove that effect).
auto* br = builder.makeBreak(dest);
auto* rep = getDroppedChildrenAndAppend(
curr, wasm, getPassOptions(), br, DropMode::IgnoreParentEffects);
replaceCurrent(rep);
// We modified the code here and may have added a drop, etc., so
// stop the flow (rather than re-scan it somehow). We leave
// optimizing anything that flows out for later iterations.
stopFlow();
}
// Return even if we did not optimize: we found our tag was caught.
return;
}
}
}
}
// override scan to add a pre and a post check task to all nodes
static void scan(RemoveUnusedBrs* self, Expression** currp) {
self->pushTask(visitAny, currp);
if (auto* iff = (*currp)->dynCast<If>()) {
if (iff->condition->type == Type::unreachable) {
// avoid trying to optimize this, we never reach it anyhow
return;
}
self->pushTask(doVisitIf, currp);
if (iff->ifFalse) {
// we need to join up if-else control flow, and clear after the
// condition
self->pushTask(scan, &iff->ifFalse);
// save the ifTrue flow, we'll join it later
self->pushTask(saveIfTrue, currp);
}
self->pushTask(scan, &iff->ifTrue);
self->pushTask(clear, currp); // clear all flow after the condition
self->pushTask(scan, &iff->condition);
return;
}
if ((*currp)->is<TryTable>() || (*currp)->is<Try>()) {
// Push the try we are reaching, and add a task to pop it, after all the
// tasks that Super::scan will push for its children.
self->catchers.push_back(*currp);
self->pushTask(popCatcher, currp);
}
Super::scan(self, currp);
}
// optimizes a loop. returns true if we made changes
bool optimizeLoop(Loop* loop) {
// if a loop ends in
// (loop $in
// (block $out
// if (..) br $in; else br $out;
// )
// )
// then our normal opts can remove the break out since it flows directly out
// (and later passes make the if one-armed). however, the simple analysis
// fails on patterns like
// if (..) br $out;
// br $in;
// which is a common way to do a while (1) loop (end it with a jump to the
// top), so we handle that here. Specifically we want to conditionalize
// breaks to the loop top, i.e., put them behind a condition, so that other
// code can flow directly out and thus brs out can be removed. (even if
// the change is to let a break somewhere else flow out, that can still be
// helpful, as it shortens the logical loop. it is also good to generate
// an if-else instead of an if, as it might allow an eqz to be removed
// by flipping arms)
if (!loop->name.is()) {
return false;
}
auto* block = loop->body->dynCast<Block>();
if (!block) {
return false;
}
// does the last element break to the top of the loop?
auto& list = block->list;
if (list.size() <= 1) {
return false;
}
auto* last = list.back()->dynCast<Break>();
if (!last || !ExpressionAnalyzer::isSimple(last) ||
last->name != loop->name) {
return false;
}
// last is a simple break to the top of the loop. if we can conditionalize
// it, it won't block things from flowing out and not needing breaks to do
// so.
Index i = list.size() - 2;
Builder builder(*getModule());
while (1) {
auto* curr = list[i];
if (auto* iff = curr->dynCast<If>()) {
// let's try to move the code going to the top of the loop into the
// if-else
if (!iff->ifFalse) {
// we need the ifTrue to break, so it cannot reach the code we want to
// move
if (iff->ifTrue->type == Type::unreachable) {
iff->ifFalse = stealSlice(builder, block, i + 1, list.size());
iff->finalize();
block->finalize();
return true;
}
} else if (iff->condition->type != Type::unreachable) {
// This is already an if-else. If one side is a dead end, we can
// append to the other, if there is no returned value to concern us.
// Note that we skip ifs with unreachable conditions, as they are dead
// code that DCE can remove, and modifying them can lead to errors
// (one of the arms may still be concrete, in which case appending to
// it would be invalid).
// can't be, since in the middle of a block
assert(!iff->type.isConcrete());
// ensures the first node is a block, if it isn't already, and merges
// in the second, either as a single element or, if a block, by
// appending to the first block. this keeps the order of operations in
// place, that is, the appended element will be executed after the
// first node's elements
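// for example (sketch): blockifyMerge(X, (block Y Z)) yields (block X Y Z),
// reusing X as the container when X is already an unnamed block.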
auto blockifyMerge = [&](Expression* any,
Expression* append) -> Block* {
Block* block = nullptr;
if (any) {
block = any->dynCast<Block>();
}
// if the first isn't a block, or it's a block with a name (so we
// might branch to the end, and so can't append to it, we might skip
// that code!) then make a new block
if (!block || block->name.is()) {
block = builder.makeBlock(any);
} else {
assert(!block->type.isConcrete());
}
auto* other = append->dynCast<Block>();
if (!other) {
block->list.push_back(append);
} else {
for (auto* item : other->list) {
block->list.push_back(item);
}
}
block->finalize();
return block;
};
if (iff->ifTrue->type == Type::unreachable) {
iff->ifFalse = blockifyMerge(
iff->ifFalse, stealSlice(builder, block, i + 1, list.size()));
iff->finalize();
block->finalize();
return true;
} else if (iff->ifFalse->type == Type::unreachable) {
iff->ifTrue = blockifyMerge(
iff->ifTrue, stealSlice(builder, block, i + 1, list.size()));
iff->finalize();
block->finalize();
return true;
}
}
return false;
} else if (auto* brIf = curr->dynCast<Break>()) {
// br_if is similar to if.
if (brIf->condition && !brIf->value && brIf->name != loop->name) {
if (i == list.size() - 2) {
// there is the br_if, and then the br to the top, so just flip them
// and the condition
brIf->condition = builder.makeUnary(EqZInt32, brIf->condition);
last->name = brIf->name;
brIf->name = loop->name;
BranchHints::flip(brIf, getFunction());
return true;
} else {
// there are elements in the middle,
// br_if $somewhere (condition)
// (..more..)
// br $in
// we can convert the br_if to an if. this has a cost, though,
// so only do it if it looks useful, which it definitely is if
// (a) $somewhere is straight out (so the br out vanishes), and
// (b) this br_if is the only branch to that block (so the block
// will vanish)
if (brIf->name == block->name &&
BranchUtils::BranchSeeker::count(block, block->name) == 1) {
// note that we could drop the last element here, it is a br we
// know for sure is removable, but telling stealSlice to steal all
// to the end is more efficient, it can just truncate.
list[i] =
builder.makeIf(brIf->condition,
builder.makeBreak(brIf->name),
stealSlice(builder, block, i + 1, list.size()));
BranchHints::copyTo(brIf, list[i], getFunction());
block->finalize();
return true;
}
}
}
return false;
}
// if there is control flow, we must stop looking
if (EffectAnalyzer(getPassOptions(), *getModule(), curr)
.transfersControlFlow()) {
return false;
}
if (i == 0) {
return false;
}
i--;
}
}
bool sinkBlocks(Function* func) {
struct Sinker : public PostWalker<Sinker> {
bool worked = false;
void visitBlock(Block* curr) {
// If the block has a single child which is a loop, and the block is
// named, then it is the exit for the loop. It's better to move it into
// the loop, where it can be better optimized by other passes. Similar
// logic for ifs: if the block is an exit for the if, we can move the
// block in, consider for example:
// (block $label
// (if (..condition1..)
// (block
// (br_if $label (..condition2..))
// (..code..)
// )
// )
// )
// After also merging the blocks, we have
// (if (..condition1..)
// (block $label
// (br_if $label (..condition2..))
// (..code..)
// )
// )
// which can be further optimized later.
if (curr->name.is() && curr->list.size() == 1) {
if (auto* loop = curr->list[0]->dynCast<Loop>()) {
curr->list[0] = loop->body;
loop->body = curr;
curr->finalize(curr->type);
loop->finalize();
replaceCurrent(loop);
worked = true;
} else if (auto* iff = curr->list[0]->dynCast<If>()) {
if (iff->condition->type == Type::unreachable) {
// The block result type may not be compatible with the arm result
// types since the unreachable If can satisfy any type of block.
// Just leave this for DCE.
return;
}
// The label can't be used in the condition.
if (BranchUtils::BranchSeeker::count(iff->condition, curr->name) ==
0) {
// We can move the block into either arm, if there are no uses in
// the other.
Expression** target = nullptr;
if (!iff->ifFalse || BranchUtils::BranchSeeker::count(
iff->ifFalse, curr->name) == 0) {
target = &iff->ifTrue;
} else if (BranchUtils::BranchSeeker::count(iff->ifTrue,
curr->name) == 0) {
target = &iff->ifFalse;
}
if (target) {
curr->list[0] = *target;
*target = curr;
// The block used to contain the if, and may have changed type
// from unreachable to none, for example, if the if has an
// unreachable condition but the arm is not unreachable.
curr->finalize();
iff->finalize();
replaceCurrent(iff);
worked = true;
// Note that the type might change, e.g. if the if condition is
// unreachable but the block that was on the outside had a
// break.
}
}
}
}
}
} sinker;
sinker.doWalkFunction(func);
if (sinker.worked) {
ReFinalize().walkFunctionInModule(func, getModule());
return true;
}
return false;
}
// GC-specific optimizations. These are split out from the main code to keep
// things as simple as possible.
bool optimizeGC(Function* func) {
if (!getModule()->features.hasGC()) {
return false;
}
struct Optimizer : public PostWalker<Optimizer> {
PassOptions& passOptions;
bool worked = false;
Optimizer(PassOptions& passOptions) : passOptions(passOptions) {}
void visitBrOn(BrOn* curr) {
// Ignore unreachable BrOns which we cannot improve anyhow. Note that
// we must check the ref field manually, as we may be changing types as
// we go here. (Another option would be to use a TypeUpdater here
// instead of calling ReFinalize at the very end, but that would be more
// complex and slower.)
if (curr->type == Type::unreachable ||
curr->ref->type == Type::unreachable) {
return;
}
Builder builder(*getModule());
Type refType =
Properties::getFallthroughType(curr->ref, passOptions, *getModule());
if (refType == Type::unreachable) {
// Leave this to DCE.
return;
}
assert(refType.isRef());
// When we optimize based on all the fallthrough type information
// available, we may need to insert a cast to maintain validity. For
// example, in this case we know the cast will succeed, but it would be
// invalid to send curr->ref directly:
//
// (br_on_cast $l anyref i31ref
// (block (result anyref)
// (ref.i31 ...)))
//
// We could just always do the cast and leave removing the casts to
// OptimizeInstructions, but it's simple enough to avoid unnecessary
// casting here.
auto maybeCast = [&](Expression* expr, Type type) -> Expression* {
assert(expr->type.isRef() && type.isRef());
if (Type::isSubType(expr->type, type)) {
return expr;
}
if (type.isNonNullable() && expr->type.isNullable() &&
Type::isSubType(expr->type.with(NonNullable), type)) {
return builder.makeRefAs(RefAsNonNull, expr);
}
return builder.makeRefCast(expr, type);
};
// When we optimize out a cast, we still need the ref value to either
// send on the optimized branch or return from the current expression.
// When we have a descriptor cast, the ref value needs to be moved
// across the descriptor value, which might have side effects. If so, we
// need to use a scratch local.
auto getRefValue = [&]() -> Expression* {
if (curr->desc) {
// Preserve the trap on a null descriptor.
if (curr->desc->type.isNullable()) {
curr->desc = builder.makeRefAs(RefAsNonNull, curr->desc);
}
Block* ref =
ChildLocalizer(curr, getFunction(), *getModule(), passOptions)
.getChildrenReplacement();
ref->list.push_back(curr->ref);
ref->type = curr->ref->type;
return ref;
}
return curr->ref;
};
switch (curr->op) {
case BrOnNull:
if (refType.isNull()) {
// The branch will definitely be taken.
replaceCurrent(builder.makeSequence(
builder.makeDrop(curr->ref), builder.makeBreak(curr->name)));
worked = true;
return;
}
if (refType.isNonNullable()) {
// The branch will definitely not be taken.
replaceCurrent(maybeCast(curr->ref, curr->type));
worked = true;
return;
}
return;
case BrOnNonNull:
if (refType.isNull()) {
// Definitely not taken.
replaceCurrent(builder.makeDrop(curr->ref));
worked = true;
return;
}
if (refType.isNonNullable()) {
// Definitely taken.
replaceCurrent(builder.makeBreak(
curr->name, maybeCast(curr->ref, curr->getSentType())));
worked = true;
return;
}
return;
case BrOnCast:
case BrOnCastFail:
case BrOnCastDescEq:
case BrOnCastDescEqFail: {
bool onFail =
curr->op == BrOnCastFail || curr->op == BrOnCastDescEqFail;
bool isDesc =
curr->op == BrOnCastDescEq || curr->op == BrOnCastDescEqFail;
// Improve the cast target type as much as possible given what we
// know about the input. Unlike in BrOn::finalize(), we consider
// type information from all the fallthrough values here. We can
// continue to further optimizations after this, and those
// optimizations might even benefit from this improvement.
auto improvedType = curr->castType;
if (!isDesc) {
improvedType = Type::getGreatestLowerBound(improvedType, refType);
} else {
// For descriptor casts, the target heap type is controlled by the
// descriptor operand, but we can still improve nullability.
if (improvedType.isNullable() && refType.isNonNullable()) {
improvedType = improvedType.with(NonNullable);
}
}
if (!curr->castType.isExact()) {
// When custom descriptors is not enabled, nontrivial exact casts
// are not allowed.
improvedType =
improvedType.withInexactIfNoCustomDescs(getModule()->features);
}
if (onFail) {
// BrOnCastFail sends the input type, with adjusted nullability.
// The input heap type makes sense for the branch target, and we
// will not change it anyhow, but we need to be careful with
// nullability: if the cast type was nullable, then we were
// sending a non-nullable value to the branch, and if we refined
// the cast type to non-nullable, we would no longer be doing
// that. In other words, we must not refine the nullability, as
// that would *un*refine the send type.
// TODO: Consider allowing this change if the branch target
// expects a nullable type anyway.
if (curr->castType.isNullable() && improvedType.isNonNullable()) {
improvedType = improvedType.with(Nullable);
}
}
if (improvedType != Type::unreachable &&
improvedType != curr->castType) {
curr->castType = improvedType;
auto oldType = curr->type;
curr->finalize();
worked = true;
// We refined the castType, which may *un*-refine the BrOn itself.
// Imagine the castType was nullable before, then nulls would go
// on the branch, and so the BrOn could only flow out a