# Copyright 2015 Google Inc. All Rights Reserved.
#
# Licensed under the Apache License, Version 2.0 (the "License");
# you may not use this file except in compliance with the License.
# You may obtain a copy of the License at
#
# http://www.apache.org/licenses/LICENSE-2.0
#
# Unless required by applicable law or agreed to in writing, software
# distributed under the License is distributed on an "AS IS" BASIS,
# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
# See the License for the specific language governing permissions and
# limitations under the License.
# ==============================================================================
"""## Control Flow Operations
TensorFlow provides several operations and classes that you can use to control
the execution of operations and add conditional dependencies to your graph.
@@identity
@@tuple
@@group
@@no_op
@@count_up_to
@@cond
## Logical Operators
TensorFlow provides several operations that you can use to add logical operators
to your graph.
@@logical_and
@@logical_not
@@logical_or
@@logical_xor
## Comparison Operators
TensorFlow provides several operations that you can use to add comparison
operators to your graph.
@@equal
@@not_equal
@@less
@@less_equal
@@greater
@@greater_equal
@@select
@@where
## Debugging Operations
TensorFlow provides several operations that you can use to validate values and
debug your graph.
@@is_finite
@@is_inf
@@is_nan
@@verify_tensor_all_finite
@@check_numerics
@@add_check_numerics_ops
@@Assert
@@Print
"""
# pylint: disable=g-bad-name
from __future__ import absolute_import
from __future__ import division
from __future__ import print_function
import six
from six.moves import xrange # pylint: disable=redefined-builtin
from tensorflow.python.framework import dtypes
from tensorflow.python.framework import ops
from tensorflow.python.framework import tensor_shape
from tensorflow.python.ops import array_ops
from tensorflow.python.ops import common_shapes
from tensorflow.python.ops import constant_op
from tensorflow.python.ops import gen_array_ops
from tensorflow.python.ops import gen_control_flow_ops
from tensorflow.python.ops import gen_data_flow_ops
from tensorflow.python.ops import math_ops
# pylint: disable=wildcard-import,undefined-variable
from tensorflow.python.ops.gen_control_flow_ops import *
from tensorflow.python.platform import logging
# We override the 'tuple' for a control flow op, so we keep python's
# existing 'tuple' for later use in this module.
_basetuple = tuple
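# Illustrative usage sketch (not part of the original file; the helper name
# `_example_cond` is hypothetical, and the `cond(pred, fn1, fn2)` signature
# defined later in this file is assumed): build a conditional subgraph in
# which only the taken branch's ops execute at run time.
def _example_cond():
  x = ops.convert_to_tensor(2.0)
  y = ops.convert_to_tensor(5.0)
  pred = math_ops.less(x, y)
  # fn1 runs when pred is true, fn2 otherwise.
  return cond(pred,
              lambda: math_ops.mul(x, 17.0),
              lambda: math_ops.add(y, 23.0))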
# pylint: disable=protected-access
def _Identity(data, name=None):
"""Return a tensor with the same shape and contents as the input tensor.
Args:
data: A Tensor.
name: A name for this operation (optional).
Returns:
A Tensor with the same type and value as the input Tensor.
"""
if not data.dtype.is_ref_dtype:
return array_ops.identity(data, name=name)
else:
return gen_array_ops._ref_identity(data, name=name)
def _NextIteration(data, name=None):
if not data.dtype.is_ref_dtype:
return next_iteration(data, name=name)
else:
return ref_next_iteration(data, name=name)
def _Merge(values, name=None):
if all([v.dtype.is_ref_dtype for v in values]):
return gen_control_flow_ops._ref_merge(values, name)
else:
return gen_control_flow_ops._merge(values, name)
def _Enter(data, frame_name, is_constant=False, parallel_iterations=10,
use_ref=True, name=None):
"""Creates or finds a child frame, and makes `data` available to it.
The unique `frame_name` is used by the `Executor` to identify frames. If
`is_constant` is true, `output` is a constant in the child frame; otherwise
it may be changed in the child frame. At most `parallel_iterations` iterations
are run in parallel in the child frame.
Args:
data: The tensor to be made available to the child frame.
frame_name: The name of the child frame.
is_constant: If true, the output is constant within the child frame.
parallel_iterations: The number of iterations allowed to run in parallel.
use_ref: If true, use ref_enter if data is of ref type.
name: A name for this operation (optional).
Returns:
The same tensor as `data`.
"""
if data.dtype.is_ref_dtype and use_ref:
return ref_enter(data, frame_name, is_constant, parallel_iterations,
name=name)
else:
return enter(data, frame_name, is_constant, parallel_iterations,
name=name)
def exit(data, name=None):
"""Exits the current frame to its parent frame.
Exit makes its input `data` available to the parent frame.
Args:
data: The tensor to be made available to the parent frame.
name: A name for this operation (optional).
Returns:
The same tensor as `data`.
"""
if data.dtype.is_ref_dtype:
return gen_control_flow_ops._ref_exit(data, name)
else:
return gen_control_flow_ops._exit(data, name)
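# How these low-level ops fit together: a rough sketch (comments only; the
# real wiring is performed by WhileContext later in this file, and Merge's
# second input is rewired only after the NextIteration node exists) of the
# dataflow structure of a while loop:
#
#   x_enter = _Enter(x, frame_name)            # bring x into the loop frame
#   x_merge, _ = _Merge([x_enter, x_enter])    # 2nd input later rewired to
#                                              # the NextIteration value
#   p = pred_fn(x_merge)                       # loop condition
#   x_exit_val, x_body_val = switch(x_merge, p)
#   x_next = _NextIteration(body_fn(x_body_val))  # feeds Merge's 2nd input
#   result = exit(x_exit_val)                  # leave the frame when p is
#                                              # false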
def switch(data, pred, dtype=None, name=None):
"""Forwards `data` to an output determined by `pred`.
  If `pred` is true, the `data` input is forwarded to `output_true`.
  Otherwise, the data goes to `output_false`.
This op handles `Tensor`s and `IndexedSlices`.
Args:
data: The tensor to be forwarded to the appropriate output.
pred: A scalar that specifies which output port will receive data.
    dtype: Optional element type for the returned tensor. If missing,
      the type is inferred from the type of `data`.
name: A name for this operation (optional).
Returns:
`(output_false, output_true)`: If `pred` is true, data will be forwarded to
`output_true`, otherwise it goes to `output_false`.
"""
with ops.op_scope([data, pred], name, "Switch") as name:
data = ops.convert_to_tensor_or_indexed_slices(data, dtype=dtype,
name="data")
pred = ops.convert_to_tensor(pred, name="pred")
if isinstance(data, ops.Tensor):
return gen_control_flow_ops._switch(data, pred, name=name)
else:
val, ind, dense_shape = data.values, data.indices, data.dense_shape
val_f, val_t = gen_control_flow_ops._switch(val, pred, name=name)
ind_f, ind_t = gen_control_flow_ops._switch(ind, pred, name="indices")
if dense_shape:
dense_shape_f, dense_shape_t = gen_control_flow_ops._switch(
dense_shape, pred, name="dense_shape")
else:
dense_shape_f, dense_shape_t = None, None
return (ops.IndexedSlices(val_f, ind_f, dense_shape_f),
ops.IndexedSlices(val_t, ind_t, dense_shape_t))
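# Illustrative sketch (hypothetical helper, not part of the original file):
# `switch` makes only one of its two outputs "alive" at run time, depending
# on the value of `pred`.
def _example_switch():
  x = ops.convert_to_tensor(3.0, name="x")
  pred = ops.convert_to_tensor(True, name="pred")
  # Output 0 carries x when pred is false; output 1 carries x when pred is
  # true. The untaken output is a dead tensor.
  x_false, x_true = switch(x, pred)
  return x_false, x_true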
def merge(inputs, name=None):
"""Returns the value of an available element of `inputs`.
This op tests each of the tensors in `inputs` in turn to determine if any of
them is available. If it finds an available tensor, it returns it and its
index in `inputs`.
It is an error if more than one tensor in `inputs` is available. If no tensor
in `inputs` is available, the returned tensor and index are not set.
  This op handles both `Tensor`s and `IndexedSlices`. If `inputs` has a mix
  of `Tensor`s and `IndexedSlices`, all inputs are converted to
  `IndexedSlices` before merging.
Args:
inputs: The input tensors, at most one of which is available.
name: A name for this operation (optional).
Returns:
A tuple containing the chosen input tensor and its index in `inputs`.
Raises:
ValueError: If inputs are IndexedSlices and some but not all have a
dense_shape property.
"""
with ops.op_scope(inputs, name, "Merge") as name:
inputs = [ops.convert_to_tensor_or_indexed_slices(inp)
for inp in inputs]
if all([isinstance(inp, ops.Tensor) for inp in inputs]):
return _Merge(inputs, name=name)
else:
inputs = math_ops._as_indexed_slices_list(inputs)
values, _ = _Merge([inp.values for inp in inputs], name=name)
indices, chosen_index = _Merge(
[inp.indices for inp in inputs], name="indices")
if any(inp.dense_shape for inp in inputs):
if not all(inp.dense_shape for inp in inputs):
raise ValueError("Either all merged IndexedSlices must have a "
"dense_shape, or none must have a dense_shape.")
dense_shape, _ = _Merge(
[inp.dense_shape for inp in inputs], name="dense_shape")
else:
dense_shape = None
return ops.IndexedSlices(values, indices, dense_shape), chosen_index
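# Illustrative sketch (hypothetical helper, not part of the original file):
# `switch` and `merge` are duals, and together they form the skeleton of a
# conditional, roughly what the `cond` op defined later in this file builds
# internally.
def _example_switch_merge():
  x = ops.convert_to_tensor(1.0, name="x")
  pred = math_ops.less(x, ops.convert_to_tensor(10.0))
  x_false, x_true = switch(x, pred)
  true_branch = math_ops.mul(x_true, 2.0)      # alive only if pred is true
  false_branch = math_ops.add(x_false, 100.0)  # alive only if pred is false
  # merge returns the value of whichever branch ran, plus its index.
  result, branch_index = merge([false_branch, true_branch])
  return result, branch_index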
def _SwitchRefOrTensor(data, pred, name="Switch"):
"""Forwards `data` to an output determined by `pred`.
  If `pred` is true, the `data` input is forwarded to `output_true`.
  Otherwise, the data goes to `output_false`.
This op handles `Tensor`s and `IndexedSlices`.
Args:
data: The tensor to be forwarded to the appropriate output.
pred: A scalar that specifies which output port will receive data.
name: A name for this operation (optional).
Returns:
    `(output_false, output_true)`: If `pred` is true, data will be forwarded
      to `output_true`, otherwise it goes to `output_false`.
Raises:
TypeError: if data is not a Tensor or IndexedSlices
"""
data = ops.convert_to_tensor_or_indexed_slices(data, name="data")
with ops.device(data.device):
if isinstance(data, ops.Tensor):
if not data.dtype.is_ref_dtype:
return switch(data, pred, name=name)
else:
return ref_switch(data, pred, name=name)
else:
return switch(data, pred, name=name)
class ControlFlowOpWrapper(object):
"""A wrapper class for Operation.
A wrapped op allows us to capture the uses of its inputs and outputs. In
gradients(), right before calling the gradient function of an op, we wrap
  the op by calling MakeWrapper. So during the execution of the gradient
  function of an op, whenever one of its inputs/outputs is used, we
  generate code to remember its values for all iterations.
"""
class _ControlFlowOpInputs(object):
"""An indirection to capture the input tensors needed in backprop."""
def __init__(self, op, grad_state):
self._op = op
self._grad_state = grad_state
self._inputs = None
def __len__(self):
return len(self._op._inputs)
def __getitem__(self, index):
if self._inputs is None:
self._inputs = [None for _ in self._op.inputs]
if isinstance(index, int):
val = self._inputs[index]
if val is None:
f_val = self._op.inputs[index]
val = self._grad_state.GetRealValue(f_val)
self._inputs[index] = val
return val
elif isinstance(index, slice):
start, stop, step = index.indices(len(self))
vals = [self[i] for i in xrange(start, stop, step)]
return vals
else:
raise TypeError("index must be an integer or slice")
class _ControlFlowOpOutputs(object):
"""An indirection to capture the output tensors needed in backprop."""
def __init__(self, op, grad_state):
self._op = op
self._grad_state = grad_state
self._outputs = None
def __len__(self):
return len(self._op._outputs)
def __getitem__(self, index):
if self._outputs is None:
self._outputs = [None for _ in self._op.outputs]
if isinstance(index, int):
val = self._outputs[index]
if val is None:
f_val = self._op.outputs[index]
val = self._grad_state.GetRealValue(f_val)
self._outputs[index] = val
return val
elif isinstance(index, slice):
start, stop, step = index.indices(len(self))
vals = [self[i] for i in xrange(start, stop, step)]
return vals
else:
raise TypeError("index must be an integer or slice")
def __init__(self, op, grad_state):
self._grad_state = grad_state # The GradLoopState this op belongs to.
self._op = op
self._inputs = None
self._outputs = None
@property
def grad_state(self):
return self._grad_state
@property
def inputs(self):
if self._inputs is None:
self._inputs = self._ControlFlowOpInputs(self._op, self._grad_state)
return self._inputs
@property
def outputs(self):
if self._outputs is None:
self._outputs = self._ControlFlowOpOutputs(self._op, self._grad_state)
return self._outputs
@property
def op(self):
return self._op
@property
def name(self):
"""Returns the name of this instance of op."""
return self._op.name
@property
def _id(self):
"""Returns the unique id of this operation."""
return self._op._id
@property
def device(self):
"""Returns the device of this operation.
Returns:
a string or None if the device was not set.
"""
return self._op.device
@property
def type(self):
"""Returns the type of the op."""
return self._op.type
@property
def graph(self):
"""The `Graph` that contains this operation."""
return self._op.graph
def get_attr(self, name):
"""Returns the value of the attr of this op with the given `name`."""
return self._op.get_attr(name)
def _get_control_flow_context(self):
"""Returns the control flow context of this op."""
return self._op._get_control_flow_context()
def _IsLoopConstantEnter(op):
"""Returns true iff op is a loop invariant."""
is_enter = (op.type == "Enter" or op.type == "RefEnter")
return is_enter and op.get_attr("is_constant")
def _IsLoopExit(op):
return op.type == "Exit" or op.type == "RefExit"
class GradLoopState(object):
"""The state used for constructing the gradient graph for a while loop.
We create a GradLoopState for each while loop in forward and its
corresponding while loop in backprop. This gives us access to both
the forward and the backprop WhileContexts.
  During the construction of the gradient graph, whenever we detect a
  forward value that is needed for backprop, we create a history
  accumulator and add it to `history_map`. Whenever we backprop a loop
  switch op (in _SwitchGrad), we add the grad merge op to `switch_map`.
"""
def __init__(self, forward_ctxt, outer_grad_state):
# The grad loop state for the outer while loop.
self._outer_grad_state = None
# The while loop context for forward.
self._forward_context = None
# The loop counter added by AddForwardCounter. It is the value
# of the loop counter for the next iteration.
self._forward_index = None
# A sync op for forward.
self._forward_sync = None
# The while loop context for backprop.
self._grad_context = None
# The loop counter added by AddBackPropCounter. It is the value
# of the loop counter for the current iteration.
self._grad_index = None
# A sync op for backprop.
self._grad_sync = None
# Information needed by backprop.
self._history_map = {}
self._switch_map = {}
self._outer_grad_state = outer_grad_state
if outer_grad_state:
outer_forward_ctxt = outer_grad_state.forward_context
else:
outer_forward_ctxt = forward_ctxt.outer_context
# Add the forward loop counter.
if outer_forward_ctxt: outer_forward_ctxt.Enter()
cnt, forward_index = forward_ctxt.AddForwardCounter()
if outer_forward_ctxt: outer_forward_ctxt.Exit()
self._forward_context = forward_ctxt
self._forward_index = forward_index
# Add the backprop WhileContext, and the backprop loop counter.
if outer_grad_state:
# This is a nested loop. Remember the iteration counts for each
# execution of this inner loop.
outer_forward_ctxt.AddName(cnt.name)
history_cnt = outer_grad_state.AddForwardAccumulator(cnt)
outer_grad_ctxt = outer_grad_state.grad_context
outer_grad_ctxt.Enter()
self._grad_context = WhileContext(forward_ctxt.parallel_iterations,
forward_ctxt.back_prop,
forward_ctxt.name)
real_cnt = outer_grad_state.AddBackPropAccumulatedValue(history_cnt, cnt)
self._grad_index = self._grad_context.AddBackPropCounter(real_cnt)
outer_grad_ctxt.Exit()
else:
if outer_forward_ctxt: outer_forward_ctxt.Enter()
self._grad_context = WhileContext(forward_ctxt.parallel_iterations,
forward_ctxt.back_prop,
forward_ctxt.name)
self._grad_index = self._grad_context.AddBackPropCounter(cnt)
if outer_forward_ctxt: outer_forward_ctxt.Exit()
@property
def outer_grad_state(self):
"""The grad loop state for outer loop."""
return self._outer_grad_state
@property
def forward_context(self):
"""The while loop context for forward."""
return self._forward_context
@property
def forward_index(self):
"""The loop index of forward loop."""
return self._forward_index
@property
def forward_sync(self):
"""A control trigger node for synchronization in the forward loop.
    One main use is to ensure that the push ops of a stack are executed
    in iteration order.
"""
if self._forward_sync is None:
with ops.control_dependencies(None):
self._forward_sync = control_trigger(name="f_sync")
self._forward_sync._set_control_flow_context(self._forward_context)
self._forward_index.op._add_control_input(self._forward_sync)
return self._forward_sync
@property
def grad_context(self):
"""The corresponding WhileContext for gradient."""
return self._grad_context
@property
def grad_index(self):
"""The loop index of backprop loop."""
return self._grad_index
@property
def grad_sync(self):
"""A control trigger node for synchronization in the grad loop.
    One main use is to ensure that the pop ops of a stack are executed
    in iteration order.
"""
if self._grad_sync is None:
with ops.control_dependencies(None):
self._grad_sync = control_trigger(name="b_sync")
self._grad_sync._set_control_flow_context(self._grad_context)
self._grad_index.op._add_control_input(self._grad_sync)
return self._grad_sync
@property
def history_map(self):
"""The map that records all the tensors needed for backprop."""
return self._history_map
@property
def switch_map(self):
"""The map that records all the Switch ops for the While loop."""
return self._switch_map
def AddForwardAccumulator(self, value, dead_branch=False):
"""Add an accumulator for each forward tensor that is needed in backprop.
    This is added to the forward loop the first time a tensor in the
    forward loop is used by the backprop gradient computation loop.
    We create an accumulator that accumulates the value of the tensor at
    each iteration. Called in the control flow context where gradients()
    is called.
The pseudocode is:
```
acc = stack();
while (_pivot) {
acc = stack_push(acc, value);
}
```
    We make sure that the stack push op in one iteration is executed before
    the next iteration. This is achieved by adding a control edge from
`forward_index.op.inputs[0].op` to the push op, and another control
edge from the push op to either `forward_index.op` or `forward_sync`.
Args:
value: The tensor that is to be accumulated.
dead_branch: True iff the tensor is on a dead branch of a cond.
Returns:
The stack that contains the accumulated history of the tensor.
"""
# TODO(yuanbyu): Make sure the colocation of stack ops and value.
# pylint: disable=protected-access
acc = gen_data_flow_ops._stack(value.dtype.base_dtype, name="f_acc")
# pylint: enable=protected-access
# Make acc available in the forward context.
enter_acc = self.forward_context.AddValue(acc)
# Add the stack_push op in the context of value.op.
value_ctxt = value.op._get_control_flow_context()
if _IsLoopExit(value.op):
value_ctxt = value_ctxt.outer_context
if value_ctxt == self.forward_context:
      # value is in the forward context directly, not in a nested cond.
self.forward_context.Enter()
push = gen_data_flow_ops._stack_push(enter_acc, value)
# Protect stack push and order it before forward_index.
self.forward_index.op._add_control_input(push.op)
self.forward_context.Exit()
else:
# value is in a cond context within the forward context.
assert isinstance(value_ctxt, CondContext)
if dead_branch:
# The special case for creating a zero tensor for a dead
# branch of a switch. See ControlFlowState.ZerosLike().
value_ctxt.outer_context.Enter()
push = gen_data_flow_ops._stack_push(enter_acc, value)
value_ctxt.outer_context.Exit()
# Guard with a switch but take the other branch.
pred = self.history_map.get(value_ctxt.pred.name)
branch = value_ctxt.branch
value_ctxt.AddName(push.name)
value_ctxt.Enter()
push = _SwitchRefOrTensor(push, pred)[1 - branch]
value_ctxt.Exit()
else:
value_ctxt.Enter()
push = gen_data_flow_ops._stack_push(enter_acc, value)
value_ctxt.Exit()
# Protect stack push and order it before forward_sync.
self.forward_sync._add_control_input(push.op)
# Order stack push after the successor of forward_index
add_op = self.forward_index.op.inputs[0].op
push.op._add_control_input(add_op)
return acc
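  # A pure-Python analogy (comments only, no TensorFlow semantics) of the
  # accumulation scheme above: the forward loop pushes the tensor's value
  # once per iteration, and backprop pops the values in reverse iteration
  # order, which is exactly the order in which gradients are computed:
  #
  #   acc = []                   # the stack created by _stack() above
  #   for v in forward_values:   # forward loop: one push per iteration
  #     acc.append(v)
  #   grads = []
  #   while acc:                 # backprop loop: pops run in reverse order
  #     grads.append(grad_fn(acc.pop()))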
def AddBackPropAccumulatedValue(self, history_value, value,
dead_branch=False):
"""Add the getter for an accumulated value in the grad context.
    This is added to the backprop loop. Called in the grad context to
    retrieve the value accumulated in the forward loop. The stack pop op
    must be guarded by the pred of the controlling cond.
Args:
history_value: The history (a stack) of a value.
value: The value that is pushed onto the stack.
dead_branch: True iff the tensor is on a dead branch of a cond.
Returns:
The current value (the top of the stack).
"""
history_ctxt = history_value.op._get_control_flow_context()
# Find the cond context that controls history_value.
cond_ctxt = None
value_ctxt = value.op._get_control_flow_context()
while value_ctxt and value_ctxt != history_ctxt:
if isinstance(value_ctxt, CondContext):
cond_ctxt = value_ctxt
break
value_ctxt = value_ctxt.outer_context
if cond_ctxt:
# Guard stack pop with a switch if it is controlled by a cond
grad_state = self
pred = None
while not pred and grad_state:
pred = grad_state.history_map.get(cond_ctxt.pred.name)
grad_state = grad_state.outer_grad_state
branch = (1 - cond_ctxt.branch) if dead_branch else cond_ctxt.branch
history_value = _SwitchRefOrTensor(history_value, pred)[branch]
pop = gen_data_flow_ops._stack_pop(history_value, value.dtype.base_dtype)
if self.grad_context.parallel_iterations > 1:
# All pops are ordered after pivot_for_body and before grad_sync.
self.grad_sync._add_control_input(pop.op)
return pop
def GetRealValue(self, value):
"""Get the real value.
If backprop "uses" a value produced by forward inference, an
accumulator is added in the forward loop to accumulate its values.
We use the accumulated value.
Args:
value: A tensor to be captured.
Returns:
The same tensor value from the saved history.
"""
assert value.op.type != "Variable"
real_value = self._history_map.get(value.name)
if real_value is None:
if _IsLoopConstantEnter(value.op):
# Special case for loop invariant.
if self._outer_grad_state:
# This is a nested loop so we record the history of this
# value in outer_forward_ctxt.
self._grad_context.Exit()
outer_value = value.op.inputs[0]
history_value = self._outer_grad_state.AddForwardAccumulator(
outer_value)
self._grad_context.Enter()
else:
# Just use the input value of this Enter node.
real_value = GetRealOp(value.op).inputs[0]
else:
# Record the history of this value in forward_ctxt.
# NOTE(yuanbyu): Don't record for constants.
self._grad_context.Exit()
history_value = self.AddForwardAccumulator(value)
self._grad_context.Enter()
if real_value is None:
# Add the stack pop op in the grad context.
real_value = self.AddBackPropAccumulatedValue(history_value, value)
self._history_map[value.name] = real_value
return real_value
def _GetWhileContext(op):
"""Get the WhileContext to which this op belongs."""
ctxt = op._get_control_flow_context()
if ctxt:
ctxt = ctxt.GetWhileContext()
return ctxt
class ControlFlowState(object):
"""Maintain the mapping from the loops to their grad states."""
def __init__(self):
self._map = {} # maps forward loop context to GradLoopState
def _GetGradState(self, op):
forward_ctxt = _GetWhileContext(op)
if forward_ctxt is None:
return None
return self._map.get(forward_ctxt)
def MakeWrapper(self, op):
"""Make a wrapper for op if it is in a WhileContext."""
grad_state = self._GetGradState(op)
if grad_state:
return ControlFlowOpWrapper(op, grad_state)
return op
def GetAllLoopExits(self):
"""Return a list containing the exits of all the loops."""
loop_exits = []
for forward_ctxt in self._map:
for loop_exit in forward_ctxt.loop_exits:
loop_exits.append(loop_exit)
return loop_exits
def EnterGradWhileContext(self, op):
"""Enter the WhileContext for gradient computation."""
grad_state = self._GetGradState(op)
if grad_state:
grad_state.grad_context.Enter()
def ExitGradWhileContext(self, op):
"""Exit the WhileContext for gradient computation."""
grad_state = self._GetGradState(op)
if grad_state:
grad_state.grad_context.Exit()
def AddWhileContext(self, op, between_op_list, between_ops):
"""Add the grad state for the while loop that op belongs to.
Note that op is an Exit, and this method must be called in
the control flow context where gradients() is called.
Note that this method modifies `between_op_list` and `between_ops`.
"""
forward_ctxt = _GetWhileContext(op)
grad_state = self._map.get(forward_ctxt)
if grad_state is None:
# This is a new while loop so create a grad state for it.
outer_forward_ctxt = forward_ctxt.outer_context
if outer_forward_ctxt:
outer_forward_ctxt = outer_forward_ctxt.GetWhileContext()
outer_grad_state = None
if outer_forward_ctxt:
outer_grad_state = self._map.get(outer_forward_ctxt)
grad_state = GradLoopState(forward_ctxt, outer_grad_state)
self._map[forward_ctxt] = grad_state
# We need to include all exits of a loop for backprop.
for loop_exit in forward_ctxt.loop_exits:
if not between_ops[loop_exit.op._id]:
between_ops[loop_exit.op._id] = True
between_op_list.append(loop_exit.op)
def ZerosLikeForExit(self, val):
"""Create zeros_like gradient for a loop exit.
If the result of a loop variable is not used but is involved in
computing the result of some needed loop variable, we create a
zero-valued tensor that is fed as gradient for the Exit node of that
loop variable. Note that val.op is an Exit, and this method must be
called in the control flow context where gradients() is called.
Args:
val: The output tensor of an Exit op.
Returns:
      A zero tensor with the same shape as `val`.
"""
val_shape = val.get_shape()
forward_ctxt = val.op._get_control_flow_context()
outer_forward_ctxt = forward_ctxt.outer_context
if outer_forward_ctxt:
outer_forward_ctxt = outer_forward_ctxt.GetWhileContext()
outer_grad_state = None
if outer_forward_ctxt:
outer_grad_state = self._map.get(outer_forward_ctxt)
if outer_grad_state:
# This is a nested loop.
if val_shape.is_fully_defined():
# If the shape is known statically, just create a zero tensor
# with the right shape in the right context.
outer_grad_state.grad_context.Enter()
result = array_ops.zeros(val_shape.dims, val.dtype)
outer_grad_state.grad_context.Exit()
else:
history_val = outer_grad_state.AddForwardAccumulator(val)
outer_grad_ctxt = outer_grad_state.grad_context
outer_grad_ctxt.Enter()
real_val = outer_grad_state.AddBackPropAccumulatedValue(
history_val, val)
result = array_ops.zeros_like(real_val)
outer_grad_ctxt.Exit()
else:
# This is not a nested loop.
if val_shape.is_fully_defined():
# If the shape is known statically, just create a zero tensor
# with the right shape.
result = array_ops.zeros(val_shape.dims, val.dtype)
else:
result = array_ops.zeros_like(val)
return result
def ZerosLike(self, op, index):
"""Create zeros_like for the specified output of an op.
This method must be called in the grad loop context.
Args:
op: A tensorflow operation.
index: the index for a specific output of the op.
Returns:
      A zero tensor with the same shape as `op.outputs[index]`.
"""
if IsLoopSwitch(op): return None
dead_branch = op.type in {"Switch", "RefSwitch"}
forward_ctxt = _GetWhileContext(op)
if forward_ctxt is None:
return array_ops.zeros_like(op.outputs[index])
op_ctxt = op._get_control_flow_context()
grad_state = self._map.get(forward_ctxt)
val = ops.convert_to_tensor(op.outputs[index], name="tensor")
shape = val.get_shape()
if shape.is_fully_defined():
# If the shape is known statically, just create a zero tensor with
# the right shape in the grad loop context.
result = constant_op.constant(0, shape=shape.dims, dtype=val.dtype)
if dead_branch:
# op is a cond switch. Guard the zero tensor with a switch.
pred = grad_state.history_map.get(op_ctxt.pred.name)
branch = op_ctxt.branch
result = _SwitchRefOrTensor(result, pred)[1 - branch]
else:
# Unknown shape so keep a history of the shape at runtime.
op_ctxt.Enter()
      zeros_shape = array_ops.shape(val)
op_ctxt.Exit()
# Add forward accumulator for shape.
grad_state.grad_context.Exit()
history_shape = grad_state.AddForwardAccumulator(zeros_shape, dead_branch)
grad_state.grad_context.Enter()
# Create a zero tensor with the right shape.
      zeros_shape = grad_state.AddBackPropAccumulatedValue(
          history_shape, zeros_shape, dead_branch)
      result = array_ops.zeros(zeros_shape, val.dtype)
return result
def GetRealOp(op):
"""Get the real op by removing the wrapper."""
while isinstance(op, ControlFlowOpWrapper):
op = op.op
return op
def MaybeCreateControlFlowState(between_op_list, between_ops):
"""Create the state for all the while loops involved in one gradients().
We create a ControlFlowState when there are while loops involved in
gradients(). In gradients(), control flow logic is only invoked when
the ControlFlowState is not None.
Note that this method modifies `between_op_list` and `between_ops`.
"""
loop_state = None
for op in between_op_list:
if _IsLoopExit(op):
if loop_state is None:
loop_state = ControlFlowState()
loop_state.AddWhileContext(op, between_op_list, between_ops)
return loop_state
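# Sketch of the call pattern expected from gradients() (comments only; the
# exact call sites live in gradients.py and are an assumption here):
#
#   loop_state = MaybeCreateControlFlowState(between_op_list, between_ops)
#   for op in ops_in_reverse_topological_order:
#     if loop_state: loop_state.EnterGradWhileContext(op)
#     wrapped_op = loop_state.MakeWrapper(op) if loop_state else op
#     # The grad function sees wrapped_op, so any forward input/output it
#     # touches is replayed from the history accumulators via GetRealValue.
#     in_grads = grad_fn(wrapped_op, *out_grads)
#     if loop_state: loop_state.ExitGradWhileContext(op)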
def IsLoopSwitch(op):
"""Return true if `op` is the Switch for a While loop."""
if op.type == "Switch" or op.type == "RefSwitch":
ctxt = op._get_control_flow_context()
return ctxt and isinstance(ctxt, WhileContext)
return False
class ControlFlowContext(object):
"""The base class for control flow context.
The usage pattern is a sequence of (Enter, Exit) followed by a final
ExitResult.
We maintain the following state for control flow contexts during graph
construction:
1. graph has _control_flow_context: the current context used to
construct new nodes. Changed by ctxt.Enter() and ctxt.Exit()
2. op has _control_flow_context: the context to which the op belongs.
Set at the time the op is created. Immutable.
3. A ControlFlowContext has _outer_context: the context in which this
context is created. Set at the time a context is created. Immutable.
4. A ControlFlowContext has _context_stack.
Pushed and popped by ctxt.Enter() and ctxt.Exit()
"""
def __init__(self):
self._outer_context = ops.get_default_graph()._get_control_flow_context()
self._context_stack = []
# Values that have been already seen in this context.
self._values = set()
# Values referenced by but external to this context.
self._external_values = {}
@property
def outer_context(self):
"""Return the context containing this context."""
return self._outer_context
def AddName(self, name):
self._values.add(name)
# pylint: disable=protected-access
def Enter(self):
"""Enter this control flow context."""
graph = ops.get_default_graph()
self._context_stack.append(graph._get_control_flow_context())
graph._set_control_flow_context(self)
def Exit(self):
"""Exit this control flow context."""
graph = ops.get_default_graph()
last_context = self._context_stack.pop()
graph._set_control_flow_context(last_context)
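  # Illustrative sketch (comments only; assumes the positional
  # WhileContext(parallel_iterations, back_prop, name) constructor used
  # elsewhere in this file). Enter/Exit maintain a stack, so contexts nest
  # and each Exit restores the previously current context:
  #
  #   outer = WhileContext(10, True, "outer_loop")
  #   outer.Enter()   # the default graph's current context is now outer
  #   inner = WhileContext(10, True, "inner_loop")
  #   inner.Enter()   # nested: inner; its _outer_context is outer
  #   inner.Exit()    # restores outer
  #   outer.Exit()    # restores whatever context was current before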
def ExitResult(self, result):
"""Make a list of tensors available in the outer context."""
if self._outer_context:
for x in result:
self._outer_context.AddName(x.name)
def GetWhileContext(self):
"""Return the while context containing this context."""
if self._outer_context:
return self._outer_context.GetWhileContext()
return None
def MaybeAddToWhileContext(self, op):
"""Add a control dependency to the containing WhileContext.
The added control dependency ensures that the outputs of this op
belong to the WhileContext. Do nothing if the op is not contained
in a WhileContext.
Args:
op: An operation.
"""
while_ctxt = self.GetWhileContext()
if while_ctxt is not None:
# pylint: disable=protected-access
op._add_control_input(while_ctxt.GetControlPivot().op)
# pylint: enable=protected-access