# Intelegentny_Pszczelarz/.venv/Lib/site-packages/tensorflow/python/ops/gen_cudnn_rnn_ops.py

"""Python wrappers around TensorFlow ops.
This file is MACHINE GENERATED! Do not edit.
"""
import collections
from tensorflow.python import pywrap_tfe as pywrap_tfe
from tensorflow.python.eager import context as _context
from tensorflow.python.eager import core as _core
from tensorflow.python.eager import execute as _execute
from tensorflow.python.framework import dtypes as _dtypes
from tensorflow.python.framework import op_def_registry as _op_def_registry
from tensorflow.python.framework import ops as _ops
from tensorflow.python.framework import op_def_library as _op_def_library
from tensorflow.python.util.deprecation import deprecated_endpoints
from tensorflow.python.util import dispatch as _dispatch
from tensorflow.python.util.tf_export import tf_export
from typing import TypeVar
_CudnnRNNOutput = collections.namedtuple(
"CudnnRNN",
["output", "output_h", "output_c", "reserve_space"])
def cudnn_rnn(input, input_h, input_c, params, rnn_mode="lstm", input_mode="linear_input", direction="unidirectional", dropout=0, seed=0, seed2=0, is_training=True, name=None):
r"""A RNN backed by cuDNN.
Computes the RNN from the input and initial states, with respect to the params
buffer.
rnn_mode: Indicates the type of the RNN model.
input_mode: Indicates whether there is a linear projection between the input and
the actual computation before the first layer. 'skip_input' is only allowed
when input_size == num_units; 'auto_select' implies 'skip_input' when
input_size == num_units; otherwise, it implies 'linear_input'.
direction: Indicates whether a bidirectional model will be used. Should be
"unidirectional" or "bidirectional".
dropout: Dropout probability. When set to 0., dropout is disabled.
seed: The 1st part of a seed to initialize dropout.
seed2: The 2nd part of a seed to initialize dropout.
input: A 3-D tensor with the shape of [seq_length, batch_size, input_size].
input_h: A 3-D tensor with the shape of [num_layer * dir, batch_size,
num_units].
input_c: For LSTM, a 3-D tensor with the shape of
[num_layer * dir, batch, num_units]. For other models, it is ignored.
params: A 1-D tensor that contains the weights and biases in an opaque layout.
The size must be created through CudnnRNNParamsSize, and initialized
separately. Note that they might not be compatible across different
generations. So it is a good idea to save and restore them in the canonical form.
output: A 3-D tensor with the shape of [seq_length, batch_size,
dir * num_units].
output_h: The same shape as input_h.
output_c: The same shape as input_c for LSTM. An empty tensor for other models.
is_training: Indicates whether this operation is used for inference or
training.
reserve_space: An opaque tensor that can be used in backprop calculation. It
is only produced if is_training is true.
Args:
input: A `Tensor`. Must be one of the following types: `half`, `float32`, `float64`.
input_h: A `Tensor`. Must have the same type as `input`.
input_c: A `Tensor`. Must have the same type as `input`.
params: A `Tensor`. Must have the same type as `input`.
rnn_mode: An optional `string` from: `"rnn_relu", "rnn_tanh", "lstm", "gru"`. Defaults to `"lstm"`.
input_mode: An optional `string` from: `"linear_input", "skip_input", "auto_select"`. Defaults to `"linear_input"`.
direction: An optional `string` from: `"unidirectional", "bidirectional"`. Defaults to `"unidirectional"`.
dropout: An optional `float`. Defaults to `0`.
seed: An optional `int`. Defaults to `0`.
seed2: An optional `int`. Defaults to `0`.
is_training: An optional `bool`. Defaults to `True`.
name: A name for the operation (optional).
Returns:
A tuple of `Tensor` objects (output, output_h, output_c, reserve_space).
output: A `Tensor`. Has the same type as `input`.
output_h: A `Tensor`. Has the same type as `input`.
output_c: A `Tensor`. Has the same type as `input`.
reserve_space: A `Tensor`. Has the same type as `input`.
"""
_ctx = _context._context or _context.context()
tld = _ctx._thread_local_data
if tld.is_eager:
try:
_result = pywrap_tfe.TFE_Py_FastPathExecute(
_ctx, "CudnnRNN", name, input, input_h, input_c, params, "rnn_mode",
rnn_mode, "input_mode", input_mode, "direction", direction, "dropout",
dropout, "seed", seed, "seed2", seed2, "is_training", is_training)
_result = _CudnnRNNOutput._make(_result)
return _result
except _core._NotOkStatusException as e:
_ops.raise_from_not_ok_status(e, name)
except _core._FallbackException:
pass
try:
return cudnn_rnn_eager_fallback(
input, input_h, input_c, params, rnn_mode=rnn_mode,
input_mode=input_mode, direction=direction, dropout=dropout,
seed=seed, seed2=seed2, is_training=is_training, name=name,
ctx=_ctx)
except _core._SymbolicException:
pass # Add nodes to the TensorFlow graph.
# Add nodes to the TensorFlow graph.
if rnn_mode is None:
rnn_mode = "lstm"
rnn_mode = _execute.make_str(rnn_mode, "rnn_mode")
if input_mode is None:
input_mode = "linear_input"
input_mode = _execute.make_str(input_mode, "input_mode")
if direction is None:
direction = "unidirectional"
direction = _execute.make_str(direction, "direction")
if dropout is None:
dropout = 0
dropout = _execute.make_float(dropout, "dropout")
if seed is None:
seed = 0
seed = _execute.make_int(seed, "seed")
if seed2 is None:
seed2 = 0
seed2 = _execute.make_int(seed2, "seed2")
if is_training is None:
is_training = True
is_training = _execute.make_bool(is_training, "is_training")
_, _, _op, _outputs = _op_def_library._apply_op_helper(
"CudnnRNN", input=input, input_h=input_h, input_c=input_c,
params=params, rnn_mode=rnn_mode, input_mode=input_mode,
direction=direction, dropout=dropout, seed=seed,
seed2=seed2, is_training=is_training, name=name)
_result = _outputs[:]
if _execute.must_record_gradient():
_attrs = ("T", _op._get_attr_type("T"), "rnn_mode",
_op.get_attr("rnn_mode"), "input_mode",
_op.get_attr("input_mode"), "direction",
_op.get_attr("direction"), "dropout", _op.get_attr("dropout"),
"seed", _op._get_attr_int("seed"), "seed2",
_op._get_attr_int("seed2"), "is_training",
_op._get_attr_bool("is_training"))
_inputs_flat = _op.inputs
_execute.record_gradient(
"CudnnRNN", _inputs_flat, _attrs, _result)
_result = _CudnnRNNOutput._make(_result)
return _result
CudnnRNN = tf_export("raw_ops.CudnnRNN")(_ops.to_raw_op(cudnn_rnn))
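# Editor's usage sketch (not part of the generated file): forward LSTM via the
# public raw-op endpoint. Assumes eager mode on a CUDA GPU; `params` is a
# hypothetical opaque buffer sized with CudnnRNNParamsSize and packed with
# CudnnRNNCanonicalToParams (both defined later in this file).
#
#   import tensorflow as tf
#   seq_len, batch, input_size, num_units = 8, 4, 16, 32
#   x = tf.random.normal([seq_len, batch, input_size])  # [seq, batch, in]
#   h0 = tf.zeros([1, batch, num_units])                # [layers*dir, batch, units]
#   c0 = tf.zeros([1, batch, num_units])                # LSTM cell state
#   y, h_n, c_n, reserve = tf.raw_ops.CudnnRNN(
#       input=x, input_h=h0, input_c=c0, params=params,
#       rnn_mode="lstm", is_training=True)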
def cudnn_rnn_eager_fallback(input, input_h, input_c, params, rnn_mode, input_mode, direction, dropout, seed, seed2, is_training, name, ctx):
if rnn_mode is None:
rnn_mode = "lstm"
rnn_mode = _execute.make_str(rnn_mode, "rnn_mode")
if input_mode is None:
input_mode = "linear_input"
input_mode = _execute.make_str(input_mode, "input_mode")
if direction is None:
direction = "unidirectional"
direction = _execute.make_str(direction, "direction")
if dropout is None:
dropout = 0
dropout = _execute.make_float(dropout, "dropout")
if seed is None:
seed = 0
seed = _execute.make_int(seed, "seed")
if seed2 is None:
seed2 = 0
seed2 = _execute.make_int(seed2, "seed2")
if is_training is None:
is_training = True
is_training = _execute.make_bool(is_training, "is_training")
_attr_T, _inputs_T = _execute.args_to_matching_eager([input, input_h, input_c, params], ctx, [_dtypes.half, _dtypes.float32, _dtypes.float64, ])
(input, input_h, input_c, params) = _inputs_T
_inputs_flat = [input, input_h, input_c, params]
_attrs = ("T", _attr_T, "rnn_mode", rnn_mode, "input_mode", input_mode,
"direction", direction, "dropout", dropout, "seed", seed, "seed2", seed2,
"is_training", is_training)
_result = _execute.execute(b"CudnnRNN", 4, inputs=_inputs_flat,
attrs=_attrs, ctx=ctx, name=name)
if _execute.must_record_gradient():
_execute.record_gradient(
"CudnnRNN", _inputs_flat, _attrs, _result)
_result = _CudnnRNNOutput._make(_result)
return _result
_CudnnRNNBackpropOutput = collections.namedtuple(
"CudnnRNNBackprop",
["input_backprop", "input_h_backprop", "input_c_backprop", "params_backprop"])
def cudnn_rnn_backprop(input, input_h, input_c, params, output, output_h, output_c, output_backprop, output_h_backprop, output_c_backprop, reserve_space, rnn_mode="lstm", input_mode="linear_input", direction="unidirectional", dropout=0, seed=0, seed2=0, name=None):
r"""Backprop step of CudnnRNN.
Computes the backprop of both data and weights in an RNN.
rnn_mode: Indicates the type of the RNN model.
input_mode: Indicates whether there is a linear projection between the input and
the actual computation before the first layer. 'skip_input' is only allowed
when input_size == num_units; 'auto_select' implies 'skip_input' when
input_size == num_units; otherwise, it implies 'linear_input'.
direction: Indicates whether a bidirectional model will be used. Should be
"unidirectional" or "bidirectional".
dropout: Dropout probability. When set to 0., dropout is disabled.
seed: The 1st part of a seed to initialize dropout.
seed2: The 2nd part of a seed to initialize dropout.
input: A 3-D tensor with the shape of [seq_length, batch_size, input_size].
input_h: A 3-D tensor with the shape of [num_layer * dir, batch_size,
num_units].
input_c: For LSTM, a 3-D tensor with the shape of
[num_layer * dir, batch, num_units]. For other models, it is ignored.
params: A 1-D tensor that contains the weights and biases in an opaque layout.
The size must be created through CudnnRNNParamsSize, and initialized
separately. Note that they might not be compatible across different
generations. So it is a good idea to save and restore them in the canonical form.
output: A 3-D tensor with the shape of [seq_length, batch_size,
dir * num_units].
output_h: The same shape as input_h.
output_c: The same shape as input_c for LSTM. An empty tensor for other models.
output_backprop: A 3-D tensor with the same shape as output in the forward pass.
output_h_backprop: A 3-D tensor with the same shape as output_h in the forward
pass.
output_c_backprop: A 3-D tensor with the same shape as output_c in the forward
pass.
reserve_space: The same reserve_space produced in the forward operation.
input_backprop: The backprop to input in the forward pass. Has the same shape
as input.
input_h_backprop: The backprop to input_h in the forward pass. Has the same
shape as input_h.
input_c_backprop: The backprop to input_c in the forward pass. Has the same
shape as input_c.
params_backprop: The backprop to the params buffer in the forward pass. Has the
same shape as params.
Args:
input: A `Tensor`. Must be one of the following types: `half`, `float32`, `float64`.
input_h: A `Tensor`. Must have the same type as `input`.
input_c: A `Tensor`. Must have the same type as `input`.
params: A `Tensor`. Must have the same type as `input`.
output: A `Tensor`. Must have the same type as `input`.
output_h: A `Tensor`. Must have the same type as `input`.
output_c: A `Tensor`. Must have the same type as `input`.
output_backprop: A `Tensor`. Must have the same type as `input`.
output_h_backprop: A `Tensor`. Must have the same type as `input`.
output_c_backprop: A `Tensor`. Must have the same type as `input`.
reserve_space: A `Tensor`. Must have the same type as `input`.
rnn_mode: An optional `string` from: `"rnn_relu", "rnn_tanh", "lstm", "gru"`. Defaults to `"lstm"`.
input_mode: An optional `string` from: `"linear_input", "skip_input", "auto_select"`. Defaults to `"linear_input"`.
direction: An optional `string` from: `"unidirectional", "bidirectional"`. Defaults to `"unidirectional"`.
dropout: An optional `float`. Defaults to `0`.
seed: An optional `int`. Defaults to `0`.
seed2: An optional `int`. Defaults to `0`.
name: A name for the operation (optional).
Returns:
A tuple of `Tensor` objects (input_backprop, input_h_backprop, input_c_backprop, params_backprop).
input_backprop: A `Tensor`. Has the same type as `input`.
input_h_backprop: A `Tensor`. Has the same type as `input`.
input_c_backprop: A `Tensor`. Has the same type as `input`.
params_backprop: A `Tensor`. Has the same type as `input`.
"""
_ctx = _context._context or _context.context()
tld = _ctx._thread_local_data
if tld.is_eager:
try:
_result = pywrap_tfe.TFE_Py_FastPathExecute(
_ctx, "CudnnRNNBackprop", name, input, input_h, input_c, params,
output, output_h, output_c, output_backprop, output_h_backprop,
output_c_backprop, reserve_space, "rnn_mode", rnn_mode, "input_mode",
input_mode, "direction", direction, "dropout", dropout, "seed", seed,
"seed2", seed2)
_result = _CudnnRNNBackpropOutput._make(_result)
return _result
except _core._NotOkStatusException as e:
_ops.raise_from_not_ok_status(e, name)
except _core._FallbackException:
pass
try:
return cudnn_rnn_backprop_eager_fallback(
input, input_h, input_c, params, output, output_h, output_c,
output_backprop, output_h_backprop, output_c_backprop,
reserve_space, rnn_mode=rnn_mode, input_mode=input_mode,
direction=direction, dropout=dropout, seed=seed, seed2=seed2,
name=name, ctx=_ctx)
except _core._SymbolicException:
pass # Add nodes to the TensorFlow graph.
# Add nodes to the TensorFlow graph.
if rnn_mode is None:
rnn_mode = "lstm"
rnn_mode = _execute.make_str(rnn_mode, "rnn_mode")
if input_mode is None:
input_mode = "linear_input"
input_mode = _execute.make_str(input_mode, "input_mode")
if direction is None:
direction = "unidirectional"
direction = _execute.make_str(direction, "direction")
if dropout is None:
dropout = 0
dropout = _execute.make_float(dropout, "dropout")
if seed is None:
seed = 0
seed = _execute.make_int(seed, "seed")
if seed2 is None:
seed2 = 0
seed2 = _execute.make_int(seed2, "seed2")
_, _, _op, _outputs = _op_def_library._apply_op_helper(
"CudnnRNNBackprop", input=input, input_h=input_h, input_c=input_c,
params=params, output=output, output_h=output_h,
output_c=output_c,
output_backprop=output_backprop,
output_h_backprop=output_h_backprop,
output_c_backprop=output_c_backprop,
reserve_space=reserve_space, rnn_mode=rnn_mode,
input_mode=input_mode, direction=direction,
dropout=dropout, seed=seed, seed2=seed2,
name=name)
_result = _outputs[:]
if _execute.must_record_gradient():
_attrs = ("T", _op._get_attr_type("T"), "rnn_mode",
_op.get_attr("rnn_mode"), "input_mode",
_op.get_attr("input_mode"), "direction",
_op.get_attr("direction"), "dropout", _op.get_attr("dropout"),
"seed", _op._get_attr_int("seed"), "seed2",
_op._get_attr_int("seed2"))
_inputs_flat = _op.inputs
_execute.record_gradient(
"CudnnRNNBackprop", _inputs_flat, _attrs, _result)
_result = _CudnnRNNBackpropOutput._make(_result)
return _result
CudnnRNNBackprop = tf_export("raw_ops.CudnnRNNBackprop")(_ops.to_raw_op(cudnn_rnn_backprop))
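# Editor's usage sketch (not part of the generated file): wiring the forward
# outputs into the manual backprop op. tf.GradientTape normally records this
# automatically; the call assumes the forward sketch above ran with
# is_training=True and that dy, dh, dc are hypothetical cotangents shaped
# like y, h_n and c_n.
#
#   dx, dh0, dc0, dparams = tf.raw_ops.CudnnRNNBackprop(
#       input=x, input_h=h0, input_c=c0, params=params,
#       output=y, output_h=h_n, output_c=c_n,
#       output_backprop=dy, output_h_backprop=dh, output_c_backprop=dc,
#       reserve_space=reserve, rnn_mode="lstm")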
def cudnn_rnn_backprop_eager_fallback(input, input_h, input_c, params, output, output_h, output_c, output_backprop, output_h_backprop, output_c_backprop, reserve_space, rnn_mode, input_mode, direction, dropout, seed, seed2, name, ctx):
if rnn_mode is None:
rnn_mode = "lstm"
rnn_mode = _execute.make_str(rnn_mode, "rnn_mode")
if input_mode is None:
input_mode = "linear_input"
input_mode = _execute.make_str(input_mode, "input_mode")
if direction is None:
direction = "unidirectional"
direction = _execute.make_str(direction, "direction")
if dropout is None:
dropout = 0
dropout = _execute.make_float(dropout, "dropout")
if seed is None:
seed = 0
seed = _execute.make_int(seed, "seed")
if seed2 is None:
seed2 = 0
seed2 = _execute.make_int(seed2, "seed2")
_attr_T, _inputs_T = _execute.args_to_matching_eager([input, input_h, input_c, params, output, output_h, output_c, output_backprop, output_h_backprop, output_c_backprop, reserve_space], ctx, [_dtypes.half, _dtypes.float32, _dtypes.float64, ])
(input, input_h, input_c, params, output, output_h, output_c, output_backprop, output_h_backprop, output_c_backprop, reserve_space) = _inputs_T
_inputs_flat = [input, input_h, input_c, params, output, output_h, output_c, output_backprop, output_h_backprop, output_c_backprop, reserve_space]
_attrs = ("T", _attr_T, "rnn_mode", rnn_mode, "input_mode", input_mode,
"direction", direction, "dropout", dropout, "seed", seed, "seed2", seed2)
_result = _execute.execute(b"CudnnRNNBackprop", 4, inputs=_inputs_flat,
attrs=_attrs, ctx=ctx, name=name)
if _execute.must_record_gradient():
_execute.record_gradient(
"CudnnRNNBackprop", _inputs_flat, _attrs, _result)
_result = _CudnnRNNBackpropOutput._make(_result)
return _result
_CudnnRNNBackpropV2Output = collections.namedtuple(
"CudnnRNNBackpropV2",
["input_backprop", "input_h_backprop", "input_c_backprop", "params_backprop"])
def cudnn_rnn_backprop_v2(input, input_h, input_c, params, output, output_h, output_c, output_backprop, output_h_backprop, output_c_backprop, reserve_space, host_reserved, rnn_mode="lstm", input_mode="linear_input", direction="unidirectional", dropout=0, seed=0, seed2=0, name=None):
r"""Backprop step of CudnnRNN.
Computes the backprop of both data and weights in an RNN. Takes an extra
"host_reserved" input compared to CudnnRNNBackprop, which is used to determine
the RNN cudnnRNNAlgo_t and cudnnMathType_t.
rnn_mode: Indicates the type of the RNN model.
input_mode: Indicates whether there is a linear projection between the input and
the actual computation before the first layer. 'skip_input' is only allowed
when input_size == num_units; 'auto_select' implies 'skip_input' when
input_size == num_units; otherwise, it implies 'linear_input'.
direction: Indicates whether a bidirectional model will be used. Should be
"unidirectional" or "bidirectional".
dropout: Dropout probability. When set to 0., dropout is disabled.
seed: The 1st part of a seed to initialize dropout.
seed2: The 2nd part of a seed to initialize dropout.
input: A 3-D tensor with the shape of [seq_length, batch_size, input_size].
input_h: A 3-D tensor with the shape of [num_layer * dir, batch_size,
num_units].
input_c: For LSTM, a 3-D tensor with the shape of
[num_layer * dir, batch, num_units]. For other models, it is ignored.
params: A 1-D tensor that contains the weights and biases in an opaque layout.
The size must be created through CudnnRNNParamsSize, and initialized
separately. Note that they might not be compatible across different
generations. So it is a good idea to save and restore them in the canonical form.
output: A 3-D tensor with the shape of [seq_length, batch_size,
dir * num_units].
output_h: The same shape as input_h.
output_c: The same shape as input_c for LSTM. An empty tensor for other models.
output_backprop: A 3-D tensor with the same shape as output in the forward pass.
output_h_backprop: A 3-D tensor with the same shape as output_h in the forward
pass.
output_c_backprop: A 3-D tensor with the same shape as output_c in the forward
pass.
reserve_space: The same reserve_space produced in the forward operation.
host_reserved: The same host_reserved produced in the forward operation.
input_backprop: The backprop to input in the forward pass. Has the same shape
as input.
input_h_backprop: The backprop to input_h in the forward pass. Has the same
shape as input_h.
input_c_backprop: The backprop to input_c in the forward pass. Has the same
shape as input_c.
params_backprop: The backprop to the params buffer in the forward pass. Has the
same shape as params.
Args:
input: A `Tensor`. Must be one of the following types: `half`, `float32`, `float64`.
input_h: A `Tensor`. Must have the same type as `input`.
input_c: A `Tensor`. Must have the same type as `input`.
params: A `Tensor`. Must have the same type as `input`.
output: A `Tensor`. Must have the same type as `input`.
output_h: A `Tensor`. Must have the same type as `input`.
output_c: A `Tensor`. Must have the same type as `input`.
output_backprop: A `Tensor`. Must have the same type as `input`.
output_h_backprop: A `Tensor`. Must have the same type as `input`.
output_c_backprop: A `Tensor`. Must have the same type as `input`.
reserve_space: A `Tensor`. Must have the same type as `input`.
host_reserved: A `Tensor` of type `int8`.
rnn_mode: An optional `string` from: `"rnn_relu", "rnn_tanh", "lstm", "gru"`. Defaults to `"lstm"`.
input_mode: An optional `string` from: `"linear_input", "skip_input", "auto_select"`. Defaults to `"linear_input"`.
direction: An optional `string` from: `"unidirectional", "bidirectional"`. Defaults to `"unidirectional"`.
dropout: An optional `float`. Defaults to `0`.
seed: An optional `int`. Defaults to `0`.
seed2: An optional `int`. Defaults to `0`.
name: A name for the operation (optional).
Returns:
A tuple of `Tensor` objects (input_backprop, input_h_backprop, input_c_backprop, params_backprop).
input_backprop: A `Tensor`. Has the same type as `input`.
input_h_backprop: A `Tensor`. Has the same type as `input`.
input_c_backprop: A `Tensor`. Has the same type as `input`.
params_backprop: A `Tensor`. Has the same type as `input`.
"""
_ctx = _context._context or _context.context()
tld = _ctx._thread_local_data
if tld.is_eager:
try:
_result = pywrap_tfe.TFE_Py_FastPathExecute(
_ctx, "CudnnRNNBackpropV2", name, input, input_h, input_c, params,
output, output_h, output_c, output_backprop, output_h_backprop,
output_c_backprop, reserve_space, host_reserved, "rnn_mode", rnn_mode,
"input_mode", input_mode, "direction", direction, "dropout", dropout,
"seed", seed, "seed2", seed2)
_result = _CudnnRNNBackpropV2Output._make(_result)
return _result
except _core._NotOkStatusException as e:
_ops.raise_from_not_ok_status(e, name)
except _core._FallbackException:
pass
try:
return cudnn_rnn_backprop_v2_eager_fallback(
input, input_h, input_c, params, output, output_h, output_c,
output_backprop, output_h_backprop, output_c_backprop,
reserve_space, host_reserved, rnn_mode=rnn_mode,
input_mode=input_mode, direction=direction, dropout=dropout,
seed=seed, seed2=seed2, name=name, ctx=_ctx)
except _core._SymbolicException:
pass # Add nodes to the TensorFlow graph.
# Add nodes to the TensorFlow graph.
if rnn_mode is None:
rnn_mode = "lstm"
rnn_mode = _execute.make_str(rnn_mode, "rnn_mode")
if input_mode is None:
input_mode = "linear_input"
input_mode = _execute.make_str(input_mode, "input_mode")
if direction is None:
direction = "unidirectional"
direction = _execute.make_str(direction, "direction")
if dropout is None:
dropout = 0
dropout = _execute.make_float(dropout, "dropout")
if seed is None:
seed = 0
seed = _execute.make_int(seed, "seed")
if seed2 is None:
seed2 = 0
seed2 = _execute.make_int(seed2, "seed2")
_, _, _op, _outputs = _op_def_library._apply_op_helper(
"CudnnRNNBackpropV2", input=input, input_h=input_h, input_c=input_c,
params=params, output=output, output_h=output_h,
output_c=output_c,
output_backprop=output_backprop,
output_h_backprop=output_h_backprop,
output_c_backprop=output_c_backprop,
reserve_space=reserve_space,
host_reserved=host_reserved, rnn_mode=rnn_mode,
input_mode=input_mode, direction=direction,
dropout=dropout, seed=seed, seed2=seed2,
name=name)
_result = _outputs[:]
if _execute.must_record_gradient():
_attrs = ("T", _op._get_attr_type("T"), "rnn_mode",
_op.get_attr("rnn_mode"), "input_mode",
_op.get_attr("input_mode"), "direction",
_op.get_attr("direction"), "dropout", _op.get_attr("dropout"),
"seed", _op._get_attr_int("seed"), "seed2",
_op._get_attr_int("seed2"))
_inputs_flat = _op.inputs
_execute.record_gradient(
"CudnnRNNBackpropV2", _inputs_flat, _attrs, _result)
_result = _CudnnRNNBackpropV2Output._make(_result)
return _result
CudnnRNNBackpropV2 = tf_export("raw_ops.CudnnRNNBackpropV2")(_ops.to_raw_op(cudnn_rnn_backprop_v2))
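# Editor's usage sketch (not part of the generated file): V2 takes the same
# tensors as CudnnRNNBackprop plus the int8 `host_reserved` buffer that the
# matching CudnnRNNV2 forward op emits, so the call only grows by one input:
#
#   dx, dh0, dc0, dparams = tf.raw_ops.CudnnRNNBackpropV2(
#       input=x, input_h=h0, input_c=c0, params=params,
#       output=y, output_h=h_n, output_c=c_n,
#       output_backprop=dy, output_h_backprop=dh, output_c_backprop=dc,
#       reserve_space=reserve, host_reserved=host_reserved,
#       rnn_mode="lstm")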
def cudnn_rnn_backprop_v2_eager_fallback(input, input_h, input_c, params, output, output_h, output_c, output_backprop, output_h_backprop, output_c_backprop, reserve_space, host_reserved, rnn_mode, input_mode, direction, dropout, seed, seed2, name, ctx):
if rnn_mode is None:
rnn_mode = "lstm"
rnn_mode = _execute.make_str(rnn_mode, "rnn_mode")
if input_mode is None:
input_mode = "linear_input"
input_mode = _execute.make_str(input_mode, "input_mode")
if direction is None:
direction = "unidirectional"
direction = _execute.make_str(direction, "direction")
if dropout is None:
dropout = 0
dropout = _execute.make_float(dropout, "dropout")
if seed is None:
seed = 0
seed = _execute.make_int(seed, "seed")
if seed2 is None:
seed2 = 0
seed2 = _execute.make_int(seed2, "seed2")
_attr_T, _inputs_T = _execute.args_to_matching_eager([input, input_h, input_c, params, output, output_h, output_c, output_backprop, output_h_backprop, output_c_backprop, reserve_space], ctx, [_dtypes.half, _dtypes.float32, _dtypes.float64, ])
(input, input_h, input_c, params, output, output_h, output_c, output_backprop, output_h_backprop, output_c_backprop, reserve_space) = _inputs_T
host_reserved = _ops.convert_to_tensor(host_reserved, _dtypes.int8)
_inputs_flat = [input, input_h, input_c, params, output, output_h, output_c, output_backprop, output_h_backprop, output_c_backprop, reserve_space, host_reserved]
_attrs = ("T", _attr_T, "rnn_mode", rnn_mode, "input_mode", input_mode,
"direction", direction, "dropout", dropout, "seed", seed, "seed2", seed2)
_result = _execute.execute(b"CudnnRNNBackpropV2", 4, inputs=_inputs_flat,
attrs=_attrs, ctx=ctx, name=name)
if _execute.must_record_gradient():
_execute.record_gradient(
"CudnnRNNBackpropV2", _inputs_flat, _attrs, _result)
_result = _CudnnRNNBackpropV2Output._make(_result)
return _result
_CudnnRNNBackpropV3Output = collections.namedtuple(
"CudnnRNNBackpropV3",
["input_backprop", "input_h_backprop", "input_c_backprop", "params_backprop"])
def cudnn_rnn_backprop_v3(input, input_h, input_c, params, sequence_lengths, output, output_h, output_c, output_backprop, output_h_backprop, output_c_backprop, reserve_space, host_reserved, rnn_mode="lstm", input_mode="linear_input", direction="unidirectional", dropout=0, seed=0, seed2=0, num_proj=0, time_major=True, name=None):
r"""Backprop step of CudnnRNNV3.
Computes the backprop of both data and weights in an RNN. Takes an extra
"sequence_lengths" input compared to CudnnRNNBackprop.
rnn_mode: Indicates the type of the RNN model.
input_mode: Indicates whether there is a linear projection between the input and
the actual computation before the first layer. 'skip_input' is only allowed
when input_size == num_units; 'auto_select' implies 'skip_input' when
input_size == num_units; otherwise, it implies 'linear_input'.
direction: Indicates whether a bidirectional model will be used. Should be
"unidirectional" or "bidirectional".
dropout: Dropout probability. When set to 0., dropout is disabled.
seed: The 1st part of a seed to initialize dropout.
seed2: The 2nd part of a seed to initialize dropout.
input: If time_major is true, this is a 3-D tensor with the shape of
[seq_length, batch_size, input_size]. If time_major is false, the shape is
[batch_size, seq_length, input_size].
input_h: If time_major is true, this is a 3-D tensor with the shape of
[num_layer * dir, batch_size, num_units]. If time_major is false, the shape
is [batch_size, num_layer * dir, num_units].
input_c: For LSTM, a 3-D tensor with the shape of
[num_layer * dir, batch, num_units]. For other models, it is ignored.
params: A 1-D tensor that contains the weights and biases in an opaque layout.
The size must be created through CudnnRNNParamsSize, and initialized
separately. Note that they might not be compatible across different
generations. So it is a good idea to save and restore them in the canonical form.
sequence_lengths: A vector of lengths of each input sequence.
output: If time_major is true, this is a 3-D tensor with the shape of
[seq_length, batch_size, dir * num_units]. If time_major is false, the
shape is [batch_size, seq_length, dir * num_units].
output_h: The same shape as input_h.
output_c: The same shape as input_c for LSTM. An empty tensor for other models.
output_backprop: A 3-D tensor with the same shape as output in the forward pass.
output_h_backprop: A 3-D tensor with the same shape as output_h in the forward
pass.
output_c_backprop: A 3-D tensor with the same shape as output_c in the forward
pass.
time_major: Indicates whether the input/output format is time major or batch
major.
reserve_space: The same reserve_space produced in the forward operation.
input_backprop: The backprop to input in the forward pass. Has the same shape
as input.
input_h_backprop: The backprop to input_h in the forward pass. Has the same
shape as input_h.
input_c_backprop: The backprop to input_c in the forward pass. Has the same
shape as input_c.
params_backprop: The backprop to the params buffer in the forward pass. Has the
same shape as params.
Args:
input: A `Tensor`. Must be one of the following types: `half`, `float32`, `float64`.
input_h: A `Tensor`. Must have the same type as `input`.
input_c: A `Tensor`. Must have the same type as `input`.
params: A `Tensor`. Must have the same type as `input`.
sequence_lengths: A `Tensor` of type `int32`.
output: A `Tensor`. Must have the same type as `input`.
output_h: A `Tensor`. Must have the same type as `input`.
output_c: A `Tensor`. Must have the same type as `input`.
output_backprop: A `Tensor`. Must have the same type as `input`.
output_h_backprop: A `Tensor`. Must have the same type as `input`.
output_c_backprop: A `Tensor`. Must have the same type as `input`.
reserve_space: A `Tensor`. Must have the same type as `input`.
host_reserved: A `Tensor` of type `int8`.
rnn_mode: An optional `string` from: `"rnn_relu", "rnn_tanh", "lstm", "gru"`. Defaults to `"lstm"`.
input_mode: An optional `string` from: `"linear_input", "skip_input", "auto_select"`. Defaults to `"linear_input"`.
direction: An optional `string` from: `"unidirectional", "bidirectional"`. Defaults to `"unidirectional"`.
dropout: An optional `float`. Defaults to `0`.
seed: An optional `int`. Defaults to `0`.
seed2: An optional `int`. Defaults to `0`.
num_proj: An optional `int`. Defaults to `0`.
time_major: An optional `bool`. Defaults to `True`.
name: A name for the operation (optional).
Returns:
A tuple of `Tensor` objects (input_backprop, input_h_backprop, input_c_backprop, params_backprop).
input_backprop: A `Tensor`. Has the same type as `input`.
input_h_backprop: A `Tensor`. Has the same type as `input`.
input_c_backprop: A `Tensor`. Has the same type as `input`.
params_backprop: A `Tensor`. Has the same type as `input`.
"""
_ctx = _context._context or _context.context()
tld = _ctx._thread_local_data
if tld.is_eager:
try:
_result = pywrap_tfe.TFE_Py_FastPathExecute(
_ctx, "CudnnRNNBackpropV3", name, input, input_h, input_c, params,
sequence_lengths, output, output_h, output_c, output_backprop,
output_h_backprop, output_c_backprop, reserve_space, host_reserved,
"rnn_mode", rnn_mode, "input_mode", input_mode, "direction",
direction, "dropout", dropout, "seed", seed, "seed2", seed2,
"num_proj", num_proj, "time_major", time_major)
_result = _CudnnRNNBackpropV3Output._make(_result)
return _result
except _core._NotOkStatusException as e:
_ops.raise_from_not_ok_status(e, name)
except _core._FallbackException:
pass
try:
return cudnn_rnn_backprop_v3_eager_fallback(
input, input_h, input_c, params, sequence_lengths, output, output_h,
output_c, output_backprop, output_h_backprop, output_c_backprop,
reserve_space, host_reserved, rnn_mode=rnn_mode,
input_mode=input_mode, direction=direction, dropout=dropout,
seed=seed, seed2=seed2, num_proj=num_proj, time_major=time_major,
name=name, ctx=_ctx)
except _core._SymbolicException:
pass # Add nodes to the TensorFlow graph.
# Add nodes to the TensorFlow graph.
if rnn_mode is None:
rnn_mode = "lstm"
rnn_mode = _execute.make_str(rnn_mode, "rnn_mode")
if input_mode is None:
input_mode = "linear_input"
input_mode = _execute.make_str(input_mode, "input_mode")
if direction is None:
direction = "unidirectional"
direction = _execute.make_str(direction, "direction")
if dropout is None:
dropout = 0
dropout = _execute.make_float(dropout, "dropout")
if seed is None:
seed = 0
seed = _execute.make_int(seed, "seed")
if seed2 is None:
seed2 = 0
seed2 = _execute.make_int(seed2, "seed2")
if num_proj is None:
num_proj = 0
num_proj = _execute.make_int(num_proj, "num_proj")
if time_major is None:
time_major = True
time_major = _execute.make_bool(time_major, "time_major")
_, _, _op, _outputs = _op_def_library._apply_op_helper(
"CudnnRNNBackpropV3", input=input, input_h=input_h, input_c=input_c,
params=params,
sequence_lengths=sequence_lengths,
output=output, output_h=output_h,
output_c=output_c,
output_backprop=output_backprop,
output_h_backprop=output_h_backprop,
output_c_backprop=output_c_backprop,
reserve_space=reserve_space,
host_reserved=host_reserved, rnn_mode=rnn_mode,
input_mode=input_mode, direction=direction,
dropout=dropout, seed=seed, seed2=seed2,
num_proj=num_proj, time_major=time_major,
name=name)
_result = _outputs[:]
if _execute.must_record_gradient():
_attrs = ("T", _op._get_attr_type("T"), "rnn_mode",
_op.get_attr("rnn_mode"), "input_mode",
_op.get_attr("input_mode"), "direction",
_op.get_attr("direction"), "dropout", _op.get_attr("dropout"),
"seed", _op._get_attr_int("seed"), "seed2",
_op._get_attr_int("seed2"), "num_proj",
_op._get_attr_int("num_proj"), "time_major",
_op._get_attr_bool("time_major"))
_inputs_flat = _op.inputs
_execute.record_gradient(
"CudnnRNNBackpropV3", _inputs_flat, _attrs, _result)
_result = _CudnnRNNBackpropV3Output._make(_result)
return _result
CudnnRNNBackpropV3 = tf_export("raw_ops.CudnnRNNBackpropV3")(_ops.to_raw_op(cudnn_rnn_backprop_v3))
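# Editor's usage sketch (not part of the generated file): V3 additionally
# threads through per-example sequence lengths and the num_proj/time_major
# attributes of the CudnnRNNV3 forward op. With the batch of 4 from the
# first sketch:
#
#   dx, dh0, dc0, dparams = tf.raw_ops.CudnnRNNBackpropV3(
#       input=x, input_h=h0, input_c=c0, params=params,
#       sequence_lengths=tf.constant([8, 8, 5, 3], tf.int32),
#       output=y, output_h=h_n, output_c=c_n,
#       output_backprop=dy, output_h_backprop=dh, output_c_backprop=dc,
#       reserve_space=reserve, host_reserved=host_reserved,
#       rnn_mode="lstm", time_major=True)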
def cudnn_rnn_backprop_v3_eager_fallback(input, input_h, input_c, params, sequence_lengths, output, output_h, output_c, output_backprop, output_h_backprop, output_c_backprop, reserve_space, host_reserved, rnn_mode, input_mode, direction, dropout, seed, seed2, num_proj, time_major, name, ctx):
if rnn_mode is None:
rnn_mode = "lstm"
rnn_mode = _execute.make_str(rnn_mode, "rnn_mode")
if input_mode is None:
input_mode = "linear_input"
input_mode = _execute.make_str(input_mode, "input_mode")
if direction is None:
direction = "unidirectional"
direction = _execute.make_str(direction, "direction")
if dropout is None:
dropout = 0
dropout = _execute.make_float(dropout, "dropout")
if seed is None:
seed = 0
seed = _execute.make_int(seed, "seed")
if seed2 is None:
seed2 = 0
seed2 = _execute.make_int(seed2, "seed2")
if num_proj is None:
num_proj = 0
num_proj = _execute.make_int(num_proj, "num_proj")
if time_major is None:
time_major = True
time_major = _execute.make_bool(time_major, "time_major")
_attr_T, _inputs_T = _execute.args_to_matching_eager([input, input_h, input_c, params, output, output_h, output_c, output_backprop, output_h_backprop, output_c_backprop, reserve_space], ctx, [_dtypes.half, _dtypes.float32, _dtypes.float64, ])
(input, input_h, input_c, params, output, output_h, output_c, output_backprop, output_h_backprop, output_c_backprop, reserve_space) = _inputs_T
sequence_lengths = _ops.convert_to_tensor(sequence_lengths, _dtypes.int32)
host_reserved = _ops.convert_to_tensor(host_reserved, _dtypes.int8)
_inputs_flat = [input, input_h, input_c, params, sequence_lengths, output, output_h, output_c, output_backprop, output_h_backprop, output_c_backprop, reserve_space, host_reserved]
_attrs = ("T", _attr_T, "rnn_mode", rnn_mode, "input_mode", input_mode,
"direction", direction, "dropout", dropout, "seed", seed, "seed2", seed2,
"num_proj", num_proj, "time_major", time_major)
_result = _execute.execute(b"CudnnRNNBackpropV3", 4, inputs=_inputs_flat,
attrs=_attrs, ctx=ctx, name=name)
if _execute.must_record_gradient():
_execute.record_gradient(
"CudnnRNNBackpropV3", _inputs_flat, _attrs, _result)
_result = _CudnnRNNBackpropV3Output._make(_result)
return _result
def cudnn_rnn_canonical_to_params(num_layers, num_units, input_size, weights, biases, rnn_mode="lstm", input_mode="linear_input", direction="unidirectional", dropout=0, seed=0, seed2=0, name=None):
r"""Converts CudnnRNN params from canonical form to usable form.
Writes a set of weights into the opaque params buffer so they can be used in
upcoming training or inferences.
Note that the params buffer may not be compatible across different GPUs. So any
save and restoration should be converted to and from the canonical weights and
biases.
num_layers: Specifies the number of layers in the RNN model.
num_units: Specifies the size of the hidden state.
input_size: Specifies the size of the input state.
weights: the canonical form of weights that can be used for saving
and restoration. They are more likely to be compatible across different
generations.
biases: the canonical form of biases that can be used for saving
and restoration. They are more likely to be compatible across different
generations.
num_params: number of parameter sets for all layers.
Each layer may contain multiple parameter sets, with each set consisting of
a weight matrix and a bias vector.
rnn_mode: Indicates the type of the RNN model.
input_mode: Indicates whether there is a linear projection between the input and
the actual computation before the first layer. 'skip_input' is only allowed
when input_size == num_units; 'auto_select' implies 'skip_input' when
input_size == num_units; otherwise, it implies 'linear_input'.
direction: Indicates whether a bidirectional model will be used.
dir = (direction == bidirectional) ? 2 : 1
dropout: dropout probability. When set to 0., dropout is disabled.
seed: the 1st part of a seed to initialize dropout.
seed2: the 2nd part of a seed to initialize dropout.
Args:
num_layers: A `Tensor` of type `int32`.
num_units: A `Tensor` of type `int32`.
input_size: A `Tensor` of type `int32`.
weights: A list of at least 1 `Tensor` objects with the same type in: `half`, `float32`, `float64`.
biases: A list with the same length as `weights` of `Tensor` objects with the same type as `weights`.
rnn_mode: An optional `string` from: `"rnn_relu", "rnn_tanh", "lstm", "gru"`. Defaults to `"lstm"`.
input_mode: An optional `string` from: `"linear_input", "skip_input", "auto_select"`. Defaults to `"linear_input"`.
direction: An optional `string` from: `"unidirectional", "bidirectional"`. Defaults to `"unidirectional"`.
dropout: An optional `float`. Defaults to `0`.
seed: An optional `int`. Defaults to `0`.
seed2: An optional `int`. Defaults to `0`.
name: A name for the operation (optional).
Returns:
A `Tensor`. Has the same type as `weights`.
"""
_ctx = _context._context or _context.context()
tld = _ctx._thread_local_data
if tld.is_eager:
try:
_result = pywrap_tfe.TFE_Py_FastPathExecute(
_ctx, "CudnnRNNCanonicalToParams", name, num_layers, num_units,
input_size, weights, biases, "rnn_mode", rnn_mode, "input_mode",
input_mode, "direction", direction, "dropout", dropout, "seed", seed,
"seed2", seed2)
return _result
except _core._NotOkStatusException as e:
_ops.raise_from_not_ok_status(e, name)
except _core._FallbackException:
pass
try:
return cudnn_rnn_canonical_to_params_eager_fallback(
num_layers, num_units, input_size, weights, biases,
rnn_mode=rnn_mode, input_mode=input_mode, direction=direction,
dropout=dropout, seed=seed, seed2=seed2, name=name, ctx=_ctx)
except _core._SymbolicException:
pass # Add nodes to the TensorFlow graph.
# Add nodes to the TensorFlow graph.
if not isinstance(weights, (list, tuple)):
raise TypeError(
"Expected list for 'weights' argument to "
"'cudnn_rnn_canonical_to_params' Op, not %r." % weights)
_attr_num_params = len(weights)
if not isinstance(biases, (list, tuple)):
raise TypeError(
"Expected list for 'biases' argument to "
"'cudnn_rnn_canonical_to_params' Op, not %r." % biases)
if len(biases) != _attr_num_params:
raise ValueError(
"List argument 'biases' to 'cudnn_rnn_canonical_to_params' Op with length %d "
"must match length %d of argument 'weights'." %
(len(biases), _attr_num_params))
if rnn_mode is None:
rnn_mode = "lstm"
rnn_mode = _execute.make_str(rnn_mode, "rnn_mode")
if input_mode is None:
input_mode = "linear_input"
input_mode = _execute.make_str(input_mode, "input_mode")
if direction is None:
direction = "unidirectional"
direction = _execute.make_str(direction, "direction")
if dropout is None:
dropout = 0
dropout = _execute.make_float(dropout, "dropout")
if seed is None:
seed = 0
seed = _execute.make_int(seed, "seed")
if seed2 is None:
seed2 = 0
seed2 = _execute.make_int(seed2, "seed2")
_, _, _op, _outputs = _op_def_library._apply_op_helper(
"CudnnRNNCanonicalToParams", num_layers=num_layers,
num_units=num_units,
input_size=input_size, weights=weights,
biases=biases, rnn_mode=rnn_mode,
input_mode=input_mode,
direction=direction, dropout=dropout,
seed=seed, seed2=seed2, name=name)
_result = _outputs[:]
if _execute.must_record_gradient():
_attrs = ("T", _op._get_attr_type("T"), "num_params",
_op._get_attr_int("num_params"), "rnn_mode",
_op.get_attr("rnn_mode"), "input_mode",
_op.get_attr("input_mode"), "direction",
_op.get_attr("direction"), "dropout", _op.get_attr("dropout"),
"seed", _op._get_attr_int("seed"), "seed2",
_op._get_attr_int("seed2"))
_inputs_flat = _op.inputs
_execute.record_gradient(
"CudnnRNNCanonicalToParams", _inputs_flat, _attrs, _result)
_result, = _result
return _result
CudnnRNNCanonicalToParams = tf_export("raw_ops.CudnnRNNCanonicalToParams")(_ops.to_raw_op(cudnn_rnn_canonical_to_params))
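# Editor's usage sketch (not part of the generated file): packing canonical
# tensors into the opaque buffer. cuDNN's canonical LSTM layout uses 8 weight
# matrices and 8 bias vectors per layer (4 input-projection and 4 recurrent
# gates), so for one unidirectional layer `weights` and `biases` below are
# hypothetical lists of 8 tensors each:
#
#   params = tf.raw_ops.CudnnRNNCanonicalToParams(
#       num_layers=1, num_units=num_units, input_size=input_size,
#       weights=weights, biases=biases, rnn_mode="lstm")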
def cudnn_rnn_canonical_to_params_eager_fallback(num_layers, num_units, input_size, weights, biases, rnn_mode, input_mode, direction, dropout, seed, seed2, name, ctx):
if not isinstance(weights, (list, tuple)):
raise TypeError(
"Expected list for 'weights' argument to "
"'cudnn_rnn_canonical_to_params' Op, not %r." % weights)
_attr_num_params = len(weights)
if not isinstance(biases, (list, tuple)):
raise TypeError(
"Expected list for 'biases' argument to "
"'cudnn_rnn_canonical_to_params' Op, not %r." % biases)
if len(biases) != _attr_num_params:
raise ValueError(
"List argument 'biases' to 'cudnn_rnn_canonical_to_params' Op with length %d "
"must match length %d of argument 'weights'." %
(len(biases), _attr_num_params))
if rnn_mode is None:
rnn_mode = "lstm"
rnn_mode = _execute.make_str(rnn_mode, "rnn_mode")
if input_mode is None:
input_mode = "linear_input"
input_mode = _execute.make_str(input_mode, "input_mode")
if direction is None:
direction = "unidirectional"
direction = _execute.make_str(direction, "direction")
if dropout is None:
dropout = 0
dropout = _execute.make_float(dropout, "dropout")
if seed is None:
seed = 0
seed = _execute.make_int(seed, "seed")
if seed2 is None:
seed2 = 0
seed2 = _execute.make_int(seed2, "seed2")
_attr_T, _inputs_T = _execute.args_to_matching_eager(list(weights) + list(biases), ctx, [_dtypes.half, _dtypes.float32, _dtypes.float64, ])
_inputs_T = [_inputs_T[:_attr_num_params]] + _inputs_T[_attr_num_params:]
_inputs_T = _inputs_T[:1] + [_inputs_T[1:]]
(weights, biases) = _inputs_T
num_layers = _ops.convert_to_tensor(num_layers, _dtypes.int32)
num_units = _ops.convert_to_tensor(num_units, _dtypes.int32)
input_size = _ops.convert_to_tensor(input_size, _dtypes.int32)
_inputs_flat = [num_layers, num_units, input_size] + list(weights) + list(biases)
_attrs = ("T", _attr_T, "num_params", _attr_num_params, "rnn_mode",
rnn_mode, "input_mode", input_mode, "direction", direction, "dropout",
dropout, "seed", seed, "seed2", seed2)
_result = _execute.execute(b"CudnnRNNCanonicalToParams", 1,
inputs=_inputs_flat, attrs=_attrs, ctx=ctx,
name=name)
if _execute.must_record_gradient():
_execute.record_gradient(
"CudnnRNNCanonicalToParams", _inputs_flat, _attrs, _result)
_result, = _result
return _result
def cudnn_rnn_canonical_to_params_v2(num_layers, num_units, input_size, weights, biases, rnn_mode="lstm", input_mode="linear_input", direction="unidirectional", dropout=0, seed=0, seed2=0, num_proj=0, name=None):
r"""Converts CudnnRNN params from canonical form to usable form. It supports the projection in LSTM.
Writes a set of weights into the opaque params buffer so they can be used in
upcoming training or inferences.
Note that the params buffer may not be compatible across different GPUs. So any
save and restoration should be converted to and from the canonical weights and
biases.
num_layers: Specifies the number of layers in the RNN model.
num_units: Specifies the size of the hidden state.
input_size: Specifies the size of the input state.
weights: the canonical form of weights that can be used for saving
and restoration. They are more likely to be compatible across different
generations.
biases: the canonical form of biases that can be used for saving
and restoration. They are more likely to be compatible across different
generations.
num_params_weights: number of weight parameter matrices for all layers.
num_params_biases: number of bias parameter vectors for all layers.
rnn_mode: Indicates the type of the RNN model.
input_mode: Indicates whether there is a linear projection between the input and
the actual computation before the first layer. 'skip_input' is only allowed
when input_size == num_units; 'auto_select' implies 'skip_input' when
input_size == num_units; otherwise, it implies 'linear_input'.
direction: Indicates whether a bidirectional model will be used.
dir = (direction == bidirectional) ? 2 : 1
dropout: dropout probability. When set to 0., dropout is disabled.
seed: the 1st part of a seed to initialize dropout.
seed2: the 2nd part of a seed to initialize dropout.
num_proj: The output dimensionality for the projection matrices. If None or 0,
no projection is performed.
Args:
num_layers: A `Tensor` of type `int32`.
num_units: A `Tensor` of type `int32`.
input_size: A `Tensor` of type `int32`.
weights: A list of at least 1 `Tensor` objects with the same type in: `half`, `float32`, `float64`.
biases: A list of at least 1 `Tensor` objects with the same type as `weights`.
rnn_mode: An optional `string` from: `"rnn_relu", "rnn_tanh", "lstm", "gru"`. Defaults to `"lstm"`.
input_mode: An optional `string` from: `"linear_input", "skip_input", "auto_select"`. Defaults to `"linear_input"`.
direction: An optional `string` from: `"unidirectional", "bidirectional"`. Defaults to `"unidirectional"`.
dropout: An optional `float`. Defaults to `0`.
seed: An optional `int`. Defaults to `0`.
seed2: An optional `int`. Defaults to `0`.
num_proj: An optional `int`. Defaults to `0`.
name: A name for the operation (optional).
Returns:
A `Tensor`. Has the same type as `weights`.
"""
_ctx = _context._context or _context.context()
tld = _ctx._thread_local_data
if tld.is_eager:
try:
_result = pywrap_tfe.TFE_Py_FastPathExecute(
_ctx, "CudnnRNNCanonicalToParamsV2", name, num_layers, num_units,
input_size, weights, biases, "rnn_mode", rnn_mode, "input_mode",
input_mode, "direction", direction, "dropout", dropout, "seed", seed,
"seed2", seed2, "num_proj", num_proj)
return _result
except _core._NotOkStatusException as e:
_ops.raise_from_not_ok_status(e, name)
except _core._FallbackException:
pass
try:
return cudnn_rnn_canonical_to_params_v2_eager_fallback(
num_layers, num_units, input_size, weights, biases,
rnn_mode=rnn_mode, input_mode=input_mode, direction=direction,
dropout=dropout, seed=seed, seed2=seed2, num_proj=num_proj,
name=name, ctx=_ctx)
except _core._SymbolicException:
pass # Add nodes to the TensorFlow graph.
# Add nodes to the TensorFlow graph.
if not isinstance(weights, (list, tuple)):
raise TypeError(
"Expected list for 'weights' argument to "
"'cudnn_rnn_canonical_to_params_v2' Op, not %r." % weights)
_attr_num_params_weights = len(weights)
if not isinstance(biases, (list, tuple)):
raise TypeError(
"Expected list for 'biases' argument to "
"'cudnn_rnn_canonical_to_params_v2' Op, not %r." % biases)
_attr_num_params_biases = len(biases)
if rnn_mode is None:
rnn_mode = "lstm"
rnn_mode = _execute.make_str(rnn_mode, "rnn_mode")
if input_mode is None:
input_mode = "linear_input"
input_mode = _execute.make_str(input_mode, "input_mode")
if direction is None:
direction = "unidirectional"
direction = _execute.make_str(direction, "direction")
if dropout is None:
dropout = 0
dropout = _execute.make_float(dropout, "dropout")
if seed is None:
seed = 0
seed = _execute.make_int(seed, "seed")
if seed2 is None:
seed2 = 0
seed2 = _execute.make_int(seed2, "seed2")
if num_proj is None:
num_proj = 0
num_proj = _execute.make_int(num_proj, "num_proj")
_, _, _op, _outputs = _op_def_library._apply_op_helper(
"CudnnRNNCanonicalToParamsV2", num_layers=num_layers,
num_units=num_units,
input_size=input_size, weights=weights,
biases=biases, rnn_mode=rnn_mode,
input_mode=input_mode,
direction=direction, dropout=dropout,
seed=seed, seed2=seed2,
num_proj=num_proj, name=name)
_result = _outputs[:]
if _execute.must_record_gradient():
_attrs = ("T", _op._get_attr_type("T"), "num_params_weights",
_op._get_attr_int("num_params_weights"), "num_params_biases",
_op._get_attr_int("num_params_biases"), "rnn_mode",
_op.get_attr("rnn_mode"), "input_mode",
_op.get_attr("input_mode"), "direction",
_op.get_attr("direction"), "dropout", _op.get_attr("dropout"),
"seed", _op._get_attr_int("seed"), "seed2",
_op._get_attr_int("seed2"), "num_proj",
_op._get_attr_int("num_proj"))
_inputs_flat = _op.inputs
_execute.record_gradient(
"CudnnRNNCanonicalToParamsV2", _inputs_flat, _attrs, _result)
_result, = _result
return _result
CudnnRNNCanonicalToParamsV2 = tf_export("raw_ops.CudnnRNNCanonicalToParamsV2")(_ops.to_raw_op(cudnn_rnn_canonical_to_params_v2))
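# Editor's usage sketch (not part of the generated file): unlike the V1
# converter, V2 lets the weight and bias lists differ in length, which LSTM
# projection requires (each layer gains a projection matrix with no matching
# bias). `proj_units` is a hypothetical projection width:
#
#   params = tf.raw_ops.CudnnRNNCanonicalToParamsV2(
#       num_layers=1, num_units=num_units, input_size=input_size,
#       weights=weights, biases=biases, rnn_mode="lstm",
#       num_proj=proj_units)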
def cudnn_rnn_canonical_to_params_v2_eager_fallback(num_layers, num_units, input_size, weights, biases, rnn_mode, input_mode, direction, dropout, seed, seed2, num_proj, name, ctx):
if not isinstance(weights, (list, tuple)):
raise TypeError(
"Expected list for 'weights' argument to "
"'cudnn_rnn_canonical_to_params_v2' Op, not %r." % weights)
_attr_num_params_weights = len(weights)
if not isinstance(biases, (list, tuple)):
raise TypeError(
"Expected list for 'biases' argument to "
"'cudnn_rnn_canonical_to_params_v2' Op, not %r." % biases)
_attr_num_params_biases = len(biases)
if rnn_mode is None:
rnn_mode = "lstm"
rnn_mode = _execute.make_str(rnn_mode, "rnn_mode")
if input_mode is None:
input_mode = "linear_input"
input_mode = _execute.make_str(input_mode, "input_mode")
if direction is None:
direction = "unidirectional"
direction = _execute.make_str(direction, "direction")
if dropout is None:
dropout = 0
dropout = _execute.make_float(dropout, "dropout")
if seed is None:
seed = 0
seed = _execute.make_int(seed, "seed")
if seed2 is None:
seed2 = 0
seed2 = _execute.make_int(seed2, "seed2")
if num_proj is None:
num_proj = 0
num_proj = _execute.make_int(num_proj, "num_proj")
_attr_T, _inputs_T = _execute.args_to_matching_eager(list(weights) + list(biases), ctx, [_dtypes.half, _dtypes.float32, _dtypes.float64, ])
_inputs_T = [_inputs_T[:_attr_num_params_weights]] + _inputs_T[_attr_num_params_weights:]
_inputs_T = _inputs_T[:1] + [_inputs_T[1:]]
(weights, biases) = _inputs_T
num_layers = _ops.convert_to_tensor(num_layers, _dtypes.int32)
num_units = _ops.convert_to_tensor(num_units, _dtypes.int32)
input_size = _ops.convert_to_tensor(input_size, _dtypes.int32)
_inputs_flat = [num_layers, num_units, input_size] + list(weights) + list(biases)
_attrs = ("T", _attr_T, "num_params_weights", _attr_num_params_weights,
"num_params_biases", _attr_num_params_biases, "rnn_mode", rnn_mode,
"input_mode", input_mode, "direction", direction, "dropout", dropout,
"seed", seed, "seed2", seed2, "num_proj", num_proj)
_result = _execute.execute(b"CudnnRNNCanonicalToParamsV2", 1,
inputs=_inputs_flat, attrs=_attrs, ctx=ctx,
name=name)
if _execute.must_record_gradient():
_execute.record_gradient(
"CudnnRNNCanonicalToParamsV2", _inputs_flat, _attrs, _result)
_result, = _result
return _result
def cudnn_rnn_params_size(num_layers, num_units, input_size, T, S, rnn_mode="lstm", input_mode="linear_input", direction="unidirectional", dropout=0, seed=0, seed2=0, num_proj=0, name=None):
r"""Computes size of weights that can be used by a Cudnn RNN model.
Returns the params size that can be used by the Cudnn RNN model. Subsequent
weight allocation and initialization should use this size.
num_layers: Specifies the number of layers in the RNN model.
num_units: Specifies the size of the hidden state.
input_size: Specifies the size of the input state.
rnn_mode: Indicates the type of the RNN model.
input_mode: Indicates whether there is a linear projection between the input and
the actual computation before the first layer. 'skip_input' is only allowed
when input_size == num_units; 'auto_select' implies 'skip_input' when
input_size == num_units; otherwise, it implies 'linear_input'.
direction: Indicates whether a bidirectional model will be used.
dir = (direction == bidirectional) ? 2 : 1
dropout: dropout probability. When set to 0., dropout is disabled.
seed: the 1st part of a seed to initialize dropout.
seed2: the 2nd part of a seed to initialize dropout.
params_size: The size of the params buffer that should be allocated and
initialized for this RNN model. Note that this params buffer may not be
compatible across GPUs. Please use CudnnRNNParamsToCanonical and
CudnnRNNCanonicalToParams to save and restore them in a way that is compatible
across different runs.
Args:
num_layers: A `Tensor` of type `int32`.
num_units: A `Tensor` of type `int32`.
input_size: A `Tensor` of type `int32`.
T: A `tf.DType` from: `tf.half, tf.float32, tf.float64`.
S: A `tf.DType` from: `tf.int32, tf.int64`.
rnn_mode: An optional `string` from: `"rnn_relu", "rnn_tanh", "lstm", "gru"`. Defaults to `"lstm"`.
input_mode: An optional `string` from: `"linear_input", "skip_input", "auto_select"`. Defaults to `"linear_input"`.
direction: An optional `string` from: `"unidirectional", "bidirectional"`. Defaults to `"unidirectional"`.
dropout: An optional `float`. Defaults to `0`.
seed: An optional `int`. Defaults to `0`.
seed2: An optional `int`. Defaults to `0`.
num_proj: An optional `int`. Defaults to `0`.
name: A name for the operation (optional).
Returns:
A `Tensor` of type `S`.
"""
_ctx = _context._context or _context.context()
tld = _ctx._thread_local_data
if tld.is_eager:
try:
_result = pywrap_tfe.TFE_Py_FastPathExecute(
_ctx, "CudnnRNNParamsSize", name, num_layers, num_units, input_size,
"T", T, "S", S, "rnn_mode", rnn_mode, "input_mode", input_mode,
"direction", direction, "dropout", dropout, "seed", seed, "seed2",
seed2, "num_proj", num_proj)
return _result
except _core._NotOkStatusException as e:
_ops.raise_from_not_ok_status(e, name)
except _core._FallbackException:
pass
try:
return cudnn_rnn_params_size_eager_fallback(
num_layers, num_units, input_size, T=T, S=S, rnn_mode=rnn_mode,
input_mode=input_mode, direction=direction, dropout=dropout,
seed=seed, seed2=seed2, num_proj=num_proj, name=name, ctx=_ctx)
except _core._SymbolicException:
pass # Add nodes to the TensorFlow graph.
# Add nodes to the TensorFlow graph.
T = _execute.make_type(T, "T")
S = _execute.make_type(S, "S")
if rnn_mode is None:
rnn_mode = "lstm"
rnn_mode = _execute.make_str(rnn_mode, "rnn_mode")
if input_mode is None:
input_mode = "linear_input"
input_mode = _execute.make_str(input_mode, "input_mode")
if direction is None:
direction = "unidirectional"
direction = _execute.make_str(direction, "direction")
if dropout is None:
dropout = 0
dropout = _execute.make_float(dropout, "dropout")
if seed is None:
seed = 0
seed = _execute.make_int(seed, "seed")
if seed2 is None:
seed2 = 0
seed2 = _execute.make_int(seed2, "seed2")
if num_proj is None:
num_proj = 0
num_proj = _execute.make_int(num_proj, "num_proj")
_, _, _op, _outputs = _op_def_library._apply_op_helper(
"CudnnRNNParamsSize", num_layers=num_layers, num_units=num_units,
input_size=input_size, T=T, S=S,
rnn_mode=rnn_mode, input_mode=input_mode,
direction=direction, dropout=dropout, seed=seed,
seed2=seed2, num_proj=num_proj, name=name)
_result = _outputs[:]
if _execute.must_record_gradient():
_attrs = ("T", _op._get_attr_type("T"), "S", _op._get_attr_type("S"),
"rnn_mode", _op.get_attr("rnn_mode"), "input_mode",
_op.get_attr("input_mode"), "direction",
_op.get_attr("direction"), "dropout", _op.get_attr("dropout"),
"seed", _op._get_attr_int("seed"), "seed2",
_op._get_attr_int("seed2"), "num_proj",
_op._get_attr_int("num_proj"))
_inputs_flat = _op.inputs
_execute.record_gradient(
"CudnnRNNParamsSize", _inputs_flat, _attrs, _result)
_result, = _result
return _result
CudnnRNNParamsSize = tf_export("raw_ops.CudnnRNNParamsSize")(_ops.to_raw_op(cudnn_rnn_params_size))
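# Editor's usage sketch (not part of the generated file): sizing the opaque
# buffer before allocating it. T is the weight dtype, S the dtype of the
# returned size; the reshape guards against the size coming back as a
# one-element vector rather than a scalar:
#
#   size = tf.raw_ops.CudnnRNNParamsSize(
#       num_layers=1, num_units=num_units, input_size=input_size,
#       T=tf.float32, S=tf.int32, rnn_mode="lstm")
#   params = tf.zeros(tf.reshape(size, [-1]), tf.float32)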
def cudnn_rnn_params_size_eager_fallback(num_layers, num_units, input_size, T, S, rnn_mode, input_mode, direction, dropout, seed, seed2, num_proj, name, ctx):
T = _execute.make_type(T, "T")
S = _execute.make_type(S, "S")
if rnn_mode is None:
rnn_mode = "lstm"
rnn_mode = _execute.make_str(rnn_mode, "rnn_mode")
if input_mode is None:
input_mode = "linear_input"
input_mode = _execute.make_str(input_mode, "input_mode")
if direction is None:
direction = "unidirectional"
direction = _execute.make_str(direction, "direction")
if dropout is None:
dropout = 0
dropout = _execute.make_float(dropout, "dropout")
if seed is None:
seed = 0
seed = _execute.make_int(seed, "seed")
if seed2 is None:
seed2 = 0
seed2 = _execute.make_int(seed2, "seed2")
if num_proj is None:
num_proj = 0
num_proj = _execute.make_int(num_proj, "num_proj")
num_layers = _ops.convert_to_tensor(num_layers, _dtypes.int32)
num_units = _ops.convert_to_tensor(num_units, _dtypes.int32)
input_size = _ops.convert_to_tensor(input_size, _dtypes.int32)
_inputs_flat = [num_layers, num_units, input_size]
_attrs = ("T", T, "S", S, "rnn_mode", rnn_mode, "input_mode", input_mode,
"direction", direction, "dropout", dropout, "seed", seed, "seed2", seed2,
"num_proj", num_proj)
_result = _execute.execute(b"CudnnRNNParamsSize", 1, inputs=_inputs_flat,
attrs=_attrs, ctx=ctx, name=name)
if _execute.must_record_gradient():
_execute.record_gradient(
"CudnnRNNParamsSize", _inputs_flat, _attrs, _result)
_result, = _result
return _result
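
# Illustrative usage sketch (editorial addition, not produced by the op-def
# generator): querying the size of the opaque cuDNN params buffer for a
# single-layer unidirectional LSTM. The helper name and the concrete sizes are
# assumptions for illustration; running it requires a CUDA-enabled TensorFlow
# build with a visible GPU.
def _example_cudnn_rnn_params_size():
  # T is the dtype of the params buffer; S is the dtype of the returned size.
  return cudnn_rnn_params_size(
      num_layers=1, num_units=128, input_size=64,
      T=_dtypes.float32, S=_dtypes.int32,
      rnn_mode="lstm", input_mode="linear_input",
      direction="unidirectional")
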
_CudnnRNNParamsToCanonicalOutput = collections.namedtuple(
"CudnnRNNParamsToCanonical",
["weights", "biases"])

def cudnn_rnn_params_to_canonical(num_layers, num_units, input_size, params, num_params, rnn_mode="lstm", input_mode="linear_input", direction="unidirectional", dropout=0, seed=0, seed2=0, name=None):
r"""Retrieves CudnnRNN params in canonical form.
Retrieves a set of weights from the opaque params buffer that can be saved and
restored in a way compatible with future runs.
Note that the params buffer may not be compatible across different GPUs. So any
save and restoration should be converted to and from the canonical weights and
biases.
num_layers: Specifies the number of layers in the RNN model.
num_units: Specifies the size of the hidden state.
input_size: Specifies the size of the input state.
num_params: number of parameter sets for all layers.
Each layer may contain multiple parameter sets, with each set consisting of
a weight matrix and a bias vector.
weights: the canonical form of weights that can be used for saving
and restoration. They are more likely to be compatible across different
generations.
biases: the canonical form of biases that can be used for saving
and restoration. They are more likely to be compatible across different
generations.
rnn_mode: Indicates the type of the RNN model.
input_mode: Indicate whether there is a linear projection between the input and
The actual computation before the first layer. 'skip_input' is only allowed
when input_size == num_units; 'auto_select' implies 'skip_input' when
input_size == num_units; otherwise, it implies 'linear_input'.
direction: Indicates whether a bidirectional model will be used.
dir = (direction == bidirectional) ? 2 : 1
dropout: dropout probability. When set to 0., dropout is disabled.
seed: the 1st part of a seed to initialize dropout.
seed2: the 2nd part of a seed to initialize dropout.
Args:
num_layers: A `Tensor` of type `int32`.
num_units: A `Tensor` of type `int32`.
input_size: A `Tensor` of type `int32`.
params: A `Tensor`. Must be one of the following types: `half`, `float32`, `float64`.
num_params: An `int` that is `>= 1`.
rnn_mode: An optional `string` from: `"rnn_relu", "rnn_tanh", "lstm", "gru"`. Defaults to `"lstm"`.
input_mode: An optional `string` from: `"linear_input", "skip_input", "auto_select"`. Defaults to `"linear_input"`.
direction: An optional `string` from: `"unidirectional", "bidirectional"`. Defaults to `"unidirectional"`.
dropout: An optional `float`. Defaults to `0`.
seed: An optional `int`. Defaults to `0`.
seed2: An optional `int`. Defaults to `0`.
name: A name for the operation (optional).

  Returns:
A tuple of `Tensor` objects (weights, biases).
weights: A list of `num_params` `Tensor` objects with the same type as `params`.
biases: A list of `num_params` `Tensor` objects with the same type as `params`.
"""
_ctx = _context._context or _context.context()
tld = _ctx._thread_local_data
if tld.is_eager:
try:
_result = pywrap_tfe.TFE_Py_FastPathExecute(
_ctx, "CudnnRNNParamsToCanonical", name, num_layers, num_units,
input_size, params, "num_params", num_params, "rnn_mode", rnn_mode,
"input_mode", input_mode, "direction", direction, "dropout", dropout,
"seed", seed, "seed2", seed2)
_result = _CudnnRNNParamsToCanonicalOutput._make(_result)
return _result
except _core._NotOkStatusException as e:
_ops.raise_from_not_ok_status(e, name)
except _core._FallbackException:
pass
try:
return cudnn_rnn_params_to_canonical_eager_fallback(
num_layers, num_units, input_size, params, num_params=num_params,
rnn_mode=rnn_mode, input_mode=input_mode, direction=direction,
dropout=dropout, seed=seed, seed2=seed2, name=name, ctx=_ctx)
except _core._SymbolicException:
pass # Add nodes to the TensorFlow graph.
# Add nodes to the TensorFlow graph.
num_params = _execute.make_int(num_params, "num_params")
if rnn_mode is None:
rnn_mode = "lstm"
rnn_mode = _execute.make_str(rnn_mode, "rnn_mode")
if input_mode is None:
input_mode = "linear_input"
input_mode = _execute.make_str(input_mode, "input_mode")
if direction is None:
direction = "unidirectional"
direction = _execute.make_str(direction, "direction")
if dropout is None:
dropout = 0
dropout = _execute.make_float(dropout, "dropout")
if seed is None:
seed = 0
seed = _execute.make_int(seed, "seed")
if seed2 is None:
seed2 = 0
seed2 = _execute.make_int(seed2, "seed2")
_, _, _op, _outputs = _op_def_library._apply_op_helper(
"CudnnRNNParamsToCanonical", num_layers=num_layers,
num_units=num_units,
input_size=input_size, params=params,
num_params=num_params, rnn_mode=rnn_mode,
input_mode=input_mode,
direction=direction, dropout=dropout,
seed=seed, seed2=seed2, name=name)
_result = _outputs[:]
if _execute.must_record_gradient():
_attrs = ("T", _op._get_attr_type("T"), "num_params",
_op._get_attr_int("num_params"), "rnn_mode",
_op.get_attr("rnn_mode"), "input_mode",
_op.get_attr("input_mode"), "direction",
_op.get_attr("direction"), "dropout", _op.get_attr("dropout"),
"seed", _op._get_attr_int("seed"), "seed2",
_op._get_attr_int("seed2"))
_inputs_flat = _op.inputs
_execute.record_gradient(
"CudnnRNNParamsToCanonical", _inputs_flat, _attrs, _result)
_result = [_result[:num_params]] + _result[num_params:]
_result = _result[:1] + [_result[1:]]
_result = _CudnnRNNParamsToCanonicalOutput._make(_result)
return _result

CudnnRNNParamsToCanonical = tf_export("raw_ops.CudnnRNNParamsToCanonical")(_ops.to_raw_op(cudnn_rnn_params_to_canonical))

def cudnn_rnn_params_to_canonical_eager_fallback(num_layers, num_units, input_size, params, num_params, rnn_mode, input_mode, direction, dropout, seed, seed2, name, ctx):
num_params = _execute.make_int(num_params, "num_params")
if rnn_mode is None:
rnn_mode = "lstm"
rnn_mode = _execute.make_str(rnn_mode, "rnn_mode")
if input_mode is None:
input_mode = "linear_input"
input_mode = _execute.make_str(input_mode, "input_mode")
if direction is None:
direction = "unidirectional"
direction = _execute.make_str(direction, "direction")
if dropout is None:
dropout = 0
dropout = _execute.make_float(dropout, "dropout")
if seed is None:
seed = 0
seed = _execute.make_int(seed, "seed")
if seed2 is None:
seed2 = 0
seed2 = _execute.make_int(seed2, "seed2")
_attr_T, (params,) = _execute.args_to_matching_eager([params], ctx, [_dtypes.half, _dtypes.float32, _dtypes.float64, ])
num_layers = _ops.convert_to_tensor(num_layers, _dtypes.int32)
num_units = _ops.convert_to_tensor(num_units, _dtypes.int32)
input_size = _ops.convert_to_tensor(input_size, _dtypes.int32)
_inputs_flat = [num_layers, num_units, input_size, params]
_attrs = ("T", _attr_T, "num_params", num_params, "rnn_mode", rnn_mode,
"input_mode", input_mode, "direction", direction, "dropout", dropout,
"seed", seed, "seed2", seed2)
_result = _execute.execute(b"CudnnRNNParamsToCanonical", num_params +
num_params, inputs=_inputs_flat, attrs=_attrs,
ctx=ctx, name=name)
if _execute.must_record_gradient():
_execute.record_gradient(
"CudnnRNNParamsToCanonical", _inputs_flat, _attrs, _result)
_result = [_result[:num_params]] + _result[num_params:]
_result = _result[:1] + [_result[1:]]
_result = _CudnnRNNParamsToCanonicalOutput._make(_result)
return _result
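
# Illustrative usage sketch (editorial addition): splitting an opaque params
# buffer into canonical per-layer weights and biases. num_params=8 reflects the
# eight gate weight matrices and eight bias vectors cuDNN uses per
# unidirectional LSTM layer; the helper name and sizes are assumptions.
def _example_cudnn_rnn_params_to_canonical(params):
  # Returns a namedtuple with `weights` (8 tensors) and `biases` (8 tensors).
  return cudnn_rnn_params_to_canonical(
      num_layers=1, num_units=128, input_size=64,
      params=params, num_params=8, rnn_mode="lstm")
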
_CudnnRNNParamsToCanonicalV2Output = collections.namedtuple(
"CudnnRNNParamsToCanonicalV2",
["weights", "biases"])

def cudnn_rnn_params_to_canonical_v2(num_layers, num_units, input_size, params, num_params_weights, num_params_biases, rnn_mode="lstm", input_mode="linear_input", direction="unidirectional", dropout=0, seed=0, seed2=0, num_proj=0, name=None):
r"""Retrieves CudnnRNN params in canonical form. It supports the projection in LSTM.
Retrieves a set of weights from the opaque params buffer that can be saved and
restored in a way compatible with future runs.
Note that the params buffer may not be compatible across different GPUs. So any
save and restoration should be converted to and from the canonical weights and
biases.
num_layers: Specifies the number of layers in the RNN model.
num_units: Specifies the size of the hidden state.
input_size: Specifies the size of the input state.
num_params_weights: number of weight parameter matrix for all layers.
num_params_biases: number of bias parameter vector for all layers.
weights: the canonical form of weights that can be used for saving
and restoration. They are more likely to be compatible across different
generations.
biases: the canonical form of biases that can be used for saving
and restoration. They are more likely to be compatible across different
generations.
rnn_mode: Indicates the type of the RNN model.
input_mode: Indicate whether there is a linear projection between the input and
The actual computation before the first layer. 'skip_input' is only allowed
when input_size == num_units; 'auto_select' implies 'skip_input' when
input_size == num_units; otherwise, it implies 'linear_input'.
direction: Indicates whether a bidirectional model will be used.
dir = (direction == bidirectional) ? 2 : 1
dropout: dropout probability. When set to 0., dropout is disabled.
seed: the 1st part of a seed to initialize dropout.
seed2: the 2nd part of a seed to initialize dropout.
num_proj: The output dimensionality for the projection matrices. If None or 0,
no projection is performed.
Args:
num_layers: A `Tensor` of type `int32`.
num_units: A `Tensor` of type `int32`.
input_size: A `Tensor` of type `int32`.
params: A `Tensor`. Must be one of the following types: `half`, `float32`, `float64`.
num_params_weights: An `int` that is `>= 1`.
num_params_biases: An `int` that is `>= 1`.
rnn_mode: An optional `string` from: `"rnn_relu", "rnn_tanh", "lstm", "gru"`. Defaults to `"lstm"`.
input_mode: An optional `string` from: `"linear_input", "skip_input", "auto_select"`. Defaults to `"linear_input"`.
direction: An optional `string` from: `"unidirectional", "bidirectional"`. Defaults to `"unidirectional"`.
dropout: An optional `float`. Defaults to `0`.
seed: An optional `int`. Defaults to `0`.
seed2: An optional `int`. Defaults to `0`.
num_proj: An optional `int`. Defaults to `0`.
name: A name for the operation (optional).

  Returns:
A tuple of `Tensor` objects (weights, biases).
weights: A list of `num_params_weights` `Tensor` objects with the same type as `params`.
biases: A list of `num_params_biases` `Tensor` objects with the same type as `params`.
"""
_ctx = _context._context or _context.context()
tld = _ctx._thread_local_data
if tld.is_eager:
try:
_result = pywrap_tfe.TFE_Py_FastPathExecute(
_ctx, "CudnnRNNParamsToCanonicalV2", name, num_layers, num_units,
input_size, params, "num_params_weights", num_params_weights,
"num_params_biases", num_params_biases, "rnn_mode", rnn_mode,
"input_mode", input_mode, "direction", direction, "dropout", dropout,
"seed", seed, "seed2", seed2, "num_proj", num_proj)
_result = _CudnnRNNParamsToCanonicalV2Output._make(_result)
return _result
except _core._NotOkStatusException as e:
_ops.raise_from_not_ok_status(e, name)
except _core._FallbackException:
pass
try:
return cudnn_rnn_params_to_canonical_v2_eager_fallback(
num_layers, num_units, input_size, params,
num_params_weights=num_params_weights,
num_params_biases=num_params_biases, rnn_mode=rnn_mode,
input_mode=input_mode, direction=direction, dropout=dropout,
seed=seed, seed2=seed2, num_proj=num_proj, name=name, ctx=_ctx)
except _core._SymbolicException:
pass # Add nodes to the TensorFlow graph.
# Add nodes to the TensorFlow graph.
num_params_weights = _execute.make_int(num_params_weights, "num_params_weights")
num_params_biases = _execute.make_int(num_params_biases, "num_params_biases")
if rnn_mode is None:
rnn_mode = "lstm"
rnn_mode = _execute.make_str(rnn_mode, "rnn_mode")
if input_mode is None:
input_mode = "linear_input"
input_mode = _execute.make_str(input_mode, "input_mode")
if direction is None:
direction = "unidirectional"
direction = _execute.make_str(direction, "direction")
if dropout is None:
dropout = 0
dropout = _execute.make_float(dropout, "dropout")
if seed is None:
seed = 0
seed = _execute.make_int(seed, "seed")
if seed2 is None:
seed2 = 0
seed2 = _execute.make_int(seed2, "seed2")
if num_proj is None:
num_proj = 0
num_proj = _execute.make_int(num_proj, "num_proj")
_, _, _op, _outputs = _op_def_library._apply_op_helper(
"CudnnRNNParamsToCanonicalV2", num_layers=num_layers,
num_units=num_units,
input_size=input_size, params=params,
num_params_weights=num_params_weights,
num_params_biases=num_params_biases,
rnn_mode=rnn_mode,
input_mode=input_mode,
direction=direction, dropout=dropout,
seed=seed, seed2=seed2,
num_proj=num_proj, name=name)
_result = _outputs[:]
if _execute.must_record_gradient():
_attrs = ("T", _op._get_attr_type("T"), "num_params_weights",
_op._get_attr_int("num_params_weights"), "num_params_biases",
_op._get_attr_int("num_params_biases"), "rnn_mode",
_op.get_attr("rnn_mode"), "input_mode",
_op.get_attr("input_mode"), "direction",
_op.get_attr("direction"), "dropout", _op.get_attr("dropout"),
"seed", _op._get_attr_int("seed"), "seed2",
_op._get_attr_int("seed2"), "num_proj",
_op._get_attr_int("num_proj"))
_inputs_flat = _op.inputs
_execute.record_gradient(
"CudnnRNNParamsToCanonicalV2", _inputs_flat, _attrs, _result)
_result = [_result[:num_params_weights]] + _result[num_params_weights:]
_result = _result[:1] + [_result[1:]]
_result = _CudnnRNNParamsToCanonicalV2Output._make(_result)
return _result

CudnnRNNParamsToCanonicalV2 = tf_export("raw_ops.CudnnRNNParamsToCanonicalV2")(_ops.to_raw_op(cudnn_rnn_params_to_canonical_v2))

def cudnn_rnn_params_to_canonical_v2_eager_fallback(num_layers, num_units, input_size, params, num_params_weights, num_params_biases, rnn_mode, input_mode, direction, dropout, seed, seed2, num_proj, name, ctx):
num_params_weights = _execute.make_int(num_params_weights, "num_params_weights")
num_params_biases = _execute.make_int(num_params_biases, "num_params_biases")
if rnn_mode is None:
rnn_mode = "lstm"
rnn_mode = _execute.make_str(rnn_mode, "rnn_mode")
if input_mode is None:
input_mode = "linear_input"
input_mode = _execute.make_str(input_mode, "input_mode")
if direction is None:
direction = "unidirectional"
direction = _execute.make_str(direction, "direction")
if dropout is None:
dropout = 0
dropout = _execute.make_float(dropout, "dropout")
if seed is None:
seed = 0
seed = _execute.make_int(seed, "seed")
if seed2 is None:
seed2 = 0
seed2 = _execute.make_int(seed2, "seed2")
if num_proj is None:
num_proj = 0
num_proj = _execute.make_int(num_proj, "num_proj")
_attr_T, (params,) = _execute.args_to_matching_eager([params], ctx, [_dtypes.half, _dtypes.float32, _dtypes.float64, ])
num_layers = _ops.convert_to_tensor(num_layers, _dtypes.int32)
num_units = _ops.convert_to_tensor(num_units, _dtypes.int32)
input_size = _ops.convert_to_tensor(input_size, _dtypes.int32)
_inputs_flat = [num_layers, num_units, input_size, params]
_attrs = ("T", _attr_T, "num_params_weights", num_params_weights,
"num_params_biases", num_params_biases, "rnn_mode", rnn_mode, "input_mode",
input_mode, "direction", direction, "dropout", dropout, "seed", seed,
"seed2", seed2, "num_proj", num_proj)
_result = _execute.execute(b"CudnnRNNParamsToCanonicalV2",
num_params_weights + num_params_biases,
inputs=_inputs_flat, attrs=_attrs, ctx=ctx,
name=name)
if _execute.must_record_gradient():
_execute.record_gradient(
"CudnnRNNParamsToCanonicalV2", _inputs_flat, _attrs, _result)
_result = [_result[:num_params_weights]] + _result[num_params_weights:]
_result = _result[:1] + [_result[1:]]
_result = _CudnnRNNParamsToCanonicalV2Output._make(_result)
return _result
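
# Illustrative usage sketch (editorial addition): the V2 variant separates the
# weight and bias counts, which matters for LSTMs with a projection. With
# num_proj > 0 each layer carries 8 gate matrices plus 1 projection matrix
# (9 weights) but still 8 biases -- these counts are assumptions for a
# single-layer unidirectional projected LSTM.
def _example_cudnn_rnn_params_to_canonical_v2(params):
  return cudnn_rnn_params_to_canonical_v2(
      num_layers=1, num_units=128, input_size=64, params=params,
      num_params_weights=9, num_params_biases=8,
      rnn_mode="lstm", num_proj=32)
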
_CudnnRNNV2Output = collections.namedtuple(
"CudnnRNNV2",
["output", "output_h", "output_c", "reserve_space", "host_reserved"])

def cudnn_rnnv2(input, input_h, input_c, params, rnn_mode="lstm", input_mode="linear_input", direction="unidirectional", dropout=0, seed=0, seed2=0, is_training=True, name=None):
r"""A RNN backed by cuDNN.
Computes the RNN from the input and initial states, with respect to the params
buffer. Produces one extra output "host_reserved" than CudnnRNN.
rnn_mode: Indicates the type of the RNN model.
input_mode: Indicates whether there is a linear projection between the input and
the actual computation before the first layer. 'skip_input' is only allowed
when input_size == num_units; 'auto_select' implies 'skip_input' when
input_size == num_units; otherwise, it implies 'linear_input'.
direction: Indicates whether a bidirectional model will be used. Should be
"unidirectional" or "bidirectional".
dropout: Dropout probability. When set to 0., dropout is disabled.
seed: The 1st part of a seed to initialize dropout.
seed2: The 2nd part of a seed to initialize dropout.
input: A 3-D tensor with the shape of [seq_length, batch_size, input_size].
input_h: A 3-D tensor with the shape of [num_layer * dir, batch_size,
num_units].
input_c: For LSTM, a 3-D tensor with the shape of
[num_layer * dir, batch, num_units]. For other models, it is ignored.
params: A 1-D tensor that contains the weights and biases in an opaque layout.
The size must be created through CudnnRNNParamsSize, and initialized
separately. Note that they might not be compatible across different
generations. So it is a good idea to save and restore
output: A 3-D tensor with the shape of [seq_length, batch_size,
dir * num_units].
output_h: The same shape has input_h.
output_c: The same shape as input_c for LSTM. An empty tensor for other models.
is_training: Indicates whether this operation is used for inference or
training.
reserve_space: An opaque tensor that can be used in backprop calculation. It
is only produced if is_training is true.
host_reserved: An opaque tensor that can be used in backprop calculation. It is
only produced if is_training is true. It is output on host memory rather than
device memory.
Args:
input: A `Tensor`. Must be one of the following types: `half`, `float32`, `float64`.
input_h: A `Tensor`. Must have the same type as `input`.
input_c: A `Tensor`. Must have the same type as `input`.
params: A `Tensor`. Must have the same type as `input`.
rnn_mode: An optional `string` from: `"rnn_relu", "rnn_tanh", "lstm", "gru"`. Defaults to `"lstm"`.
input_mode: An optional `string` from: `"linear_input", "skip_input", "auto_select"`. Defaults to `"linear_input"`.
direction: An optional `string` from: `"unidirectional", "bidirectional"`. Defaults to `"unidirectional"`.
dropout: An optional `float`. Defaults to `0`.
seed: An optional `int`. Defaults to `0`.
seed2: An optional `int`. Defaults to `0`.
is_training: An optional `bool`. Defaults to `True`.
name: A name for the operation (optional).

  Returns:
A tuple of `Tensor` objects (output, output_h, output_c, reserve_space, host_reserved).
output: A `Tensor`. Has the same type as `input`.
output_h: A `Tensor`. Has the same type as `input`.
output_c: A `Tensor`. Has the same type as `input`.
reserve_space: A `Tensor`. Has the same type as `input`.
host_reserved: A `Tensor` of type `int8`.
"""
_ctx = _context._context or _context.context()
tld = _ctx._thread_local_data
if tld.is_eager:
try:
_result = pywrap_tfe.TFE_Py_FastPathExecute(
_ctx, "CudnnRNNV2", name, input, input_h, input_c, params, "rnn_mode",
rnn_mode, "input_mode", input_mode, "direction", direction, "dropout",
dropout, "seed", seed, "seed2", seed2, "is_training", is_training)
_result = _CudnnRNNV2Output._make(_result)
return _result
except _core._NotOkStatusException as e:
_ops.raise_from_not_ok_status(e, name)
except _core._FallbackException:
pass
try:
return cudnn_rnnv2_eager_fallback(
input, input_h, input_c, params, rnn_mode=rnn_mode,
input_mode=input_mode, direction=direction, dropout=dropout,
seed=seed, seed2=seed2, is_training=is_training, name=name,
ctx=_ctx)
except _core._SymbolicException:
pass # Add nodes to the TensorFlow graph.
# Add nodes to the TensorFlow graph.
if rnn_mode is None:
rnn_mode = "lstm"
rnn_mode = _execute.make_str(rnn_mode, "rnn_mode")
if input_mode is None:
input_mode = "linear_input"
input_mode = _execute.make_str(input_mode, "input_mode")
if direction is None:
direction = "unidirectional"
direction = _execute.make_str(direction, "direction")
if dropout is None:
dropout = 0
dropout = _execute.make_float(dropout, "dropout")
if seed is None:
seed = 0
seed = _execute.make_int(seed, "seed")
if seed2 is None:
seed2 = 0
seed2 = _execute.make_int(seed2, "seed2")
if is_training is None:
is_training = True
is_training = _execute.make_bool(is_training, "is_training")
_, _, _op, _outputs = _op_def_library._apply_op_helper(
"CudnnRNNV2", input=input, input_h=input_h, input_c=input_c,
params=params, rnn_mode=rnn_mode, input_mode=input_mode,
direction=direction, dropout=dropout, seed=seed,
seed2=seed2, is_training=is_training, name=name)
_result = _outputs[:]
if _execute.must_record_gradient():
_attrs = ("T", _op._get_attr_type("T"), "rnn_mode",
_op.get_attr("rnn_mode"), "input_mode",
_op.get_attr("input_mode"), "direction",
_op.get_attr("direction"), "dropout", _op.get_attr("dropout"),
"seed", _op._get_attr_int("seed"), "seed2",
_op._get_attr_int("seed2"), "is_training",
_op._get_attr_bool("is_training"))
_inputs_flat = _op.inputs
_execute.record_gradient(
"CudnnRNNV2", _inputs_flat, _attrs, _result)
_result = _CudnnRNNV2Output._make(_result)
return _result

CudnnRNNV2 = tf_export("raw_ops.CudnnRNNV2")(_ops.to_raw_op(cudnn_rnnv2))

def cudnn_rnnv2_eager_fallback(input, input_h, input_c, params, rnn_mode, input_mode, direction, dropout, seed, seed2, is_training, name, ctx):
if rnn_mode is None:
rnn_mode = "lstm"
rnn_mode = _execute.make_str(rnn_mode, "rnn_mode")
if input_mode is None:
input_mode = "linear_input"
input_mode = _execute.make_str(input_mode, "input_mode")
if direction is None:
direction = "unidirectional"
direction = _execute.make_str(direction, "direction")
if dropout is None:
dropout = 0
dropout = _execute.make_float(dropout, "dropout")
if seed is None:
seed = 0
seed = _execute.make_int(seed, "seed")
if seed2 is None:
seed2 = 0
seed2 = _execute.make_int(seed2, "seed2")
if is_training is None:
is_training = True
is_training = _execute.make_bool(is_training, "is_training")
_attr_T, _inputs_T = _execute.args_to_matching_eager([input, input_h, input_c, params], ctx, [_dtypes.half, _dtypes.float32, _dtypes.float64, ])
(input, input_h, input_c, params) = _inputs_T
_inputs_flat = [input, input_h, input_c, params]
_attrs = ("T", _attr_T, "rnn_mode", rnn_mode, "input_mode", input_mode,
"direction", direction, "dropout", dropout, "seed", seed, "seed2", seed2,
"is_training", is_training)
_result = _execute.execute(b"CudnnRNNV2", 5, inputs=_inputs_flat,
attrs=_attrs, ctx=ctx, name=name)
if _execute.must_record_gradient():
_execute.record_gradient(
"CudnnRNNV2", _inputs_flat, _attrs, _result)
_result = _CudnnRNNV2Output._make(_result)
return _result
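
# Illustrative usage sketch (editorial addition): a forward pass through the
# V2 op. The input tensors are assumed time-major ([seq_length, batch_size,
# input_size]) with a params buffer sized via CudnnRNNParamsSize; running it
# requires a CUDA-enabled build with a GPU.
def _example_cudnn_rnnv2(input, input_h, input_c, params):
  # With is_training=True the extra reserve_space/host_reserved outputs are
  # produced for consumption by the corresponding backprop op.
  return cudnn_rnnv2(
      input=input, input_h=input_h, input_c=input_c, params=params,
      rnn_mode="lstm", is_training=True)
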
_CudnnRNNV3Output = collections.namedtuple(
"CudnnRNNV3",
["output", "output_h", "output_c", "reserve_space", "host_reserved"])

def cudnn_rnnv3(input, input_h, input_c, params, sequence_lengths, rnn_mode="lstm", input_mode="linear_input", direction="unidirectional", dropout=0, seed=0, seed2=0, num_proj=0, is_training=True, time_major=True, name=None):
r"""A RNN backed by cuDNN.
Computes the RNN from the input and initial states, with respect to the params
buffer. Accepts one extra input "sequence_lengths" than CudnnRNN.
rnn_mode: Indicates the type of the RNN model.
input_mode: Indicates whether there is a linear projection between the input and
the actual computation before the first layer. 'skip_input' is only allowed
when input_size == num_units; 'auto_select' implies 'skip_input' when
input_size == num_units; otherwise, it implies 'linear_input'.
direction: Indicates whether a bidirectional model will be used. Should be
"unidirectional" or "bidirectional".
dropout: Dropout probability. When set to 0., dropout is disabled.
seed: The 1st part of a seed to initialize dropout.
seed2: The 2nd part of a seed to initialize dropout.
input: If time_major is true, this is a 3-D tensor with the shape of
[seq_length, batch_size, input_size]. If time_major is false, the shape is
[batch_size, seq_length, input_size].
input_h: If time_major is true, this is a 3-D tensor with the shape of
[num_layer * dir, batch_size, num_units]. If time_major is false, the shape
is [batch_size, num_layer * dir, num_units].
input_c: For LSTM, a 3-D tensor with the shape of
[num_layer * dir, batch, num_units]. For other models, it is ignored.
params: A 1-D tensor that contains the weights and biases in an opaque layout.
The size must be created through CudnnRNNParamsSize, and initialized
separately. Note that they might not be compatible across different
generations. So it is a good idea to save and restore
sequence_lengths: a vector of lengths of each input sequence.
output: If time_major is true, this is a 3-D tensor with the shape of
[seq_length, batch_size, dir * num_units]. If time_major is false, the
shape is [batch_size, seq_length, dir * num_units].
output_h: The same shape has input_h.
output_c: The same shape as input_c for LSTM. An empty tensor for other models.
is_training: Indicates whether this operation is used for inference or
training.
time_major: Indicates whether the input/output format is time major or batch
major.
reserve_space: An opaque tensor that can be used in backprop calculation. It
is only produced if is_training is true.
Args:
input: A `Tensor`. Must be one of the following types: `half`, `float32`, `float64`.
input_h: A `Tensor`. Must have the same type as `input`.
input_c: A `Tensor`. Must have the same type as `input`.
params: A `Tensor`. Must have the same type as `input`.
sequence_lengths: A `Tensor` of type `int32`.
rnn_mode: An optional `string` from: `"rnn_relu", "rnn_tanh", "lstm", "gru"`. Defaults to `"lstm"`.
input_mode: An optional `string` from: `"linear_input", "skip_input", "auto_select"`. Defaults to `"linear_input"`.
direction: An optional `string` from: `"unidirectional", "bidirectional"`. Defaults to `"unidirectional"`.
dropout: An optional `float`. Defaults to `0`.
seed: An optional `int`. Defaults to `0`.
seed2: An optional `int`. Defaults to `0`.
num_proj: An optional `int`. Defaults to `0`.
is_training: An optional `bool`. Defaults to `True`.
time_major: An optional `bool`. Defaults to `True`.
name: A name for the operation (optional).

  Returns:
A tuple of `Tensor` objects (output, output_h, output_c, reserve_space, host_reserved).
output: A `Tensor`. Has the same type as `input`.
output_h: A `Tensor`. Has the same type as `input`.
output_c: A `Tensor`. Has the same type as `input`.
reserve_space: A `Tensor`. Has the same type as `input`.
host_reserved: A `Tensor` of type `int8`.
"""
_ctx = _context._context or _context.context()
tld = _ctx._thread_local_data
if tld.is_eager:
try:
_result = pywrap_tfe.TFE_Py_FastPathExecute(
_ctx, "CudnnRNNV3", name, input, input_h, input_c, params,
sequence_lengths, "rnn_mode", rnn_mode, "input_mode", input_mode,
"direction", direction, "dropout", dropout, "seed", seed, "seed2",
seed2, "num_proj", num_proj, "is_training", is_training, "time_major",
time_major)
_result = _CudnnRNNV3Output._make(_result)
return _result
except _core._NotOkStatusException as e:
_ops.raise_from_not_ok_status(e, name)
except _core._FallbackException:
pass
try:
return cudnn_rnnv3_eager_fallback(
input, input_h, input_c, params, sequence_lengths,
rnn_mode=rnn_mode, input_mode=input_mode, direction=direction,
dropout=dropout, seed=seed, seed2=seed2, num_proj=num_proj,
is_training=is_training, time_major=time_major, name=name, ctx=_ctx)
except _core._SymbolicException:
pass # Add nodes to the TensorFlow graph.
# Add nodes to the TensorFlow graph.
if rnn_mode is None:
rnn_mode = "lstm"
rnn_mode = _execute.make_str(rnn_mode, "rnn_mode")
if input_mode is None:
input_mode = "linear_input"
input_mode = _execute.make_str(input_mode, "input_mode")
if direction is None:
direction = "unidirectional"
direction = _execute.make_str(direction, "direction")
if dropout is None:
dropout = 0
dropout = _execute.make_float(dropout, "dropout")
if seed is None:
seed = 0
seed = _execute.make_int(seed, "seed")
if seed2 is None:
seed2 = 0
seed2 = _execute.make_int(seed2, "seed2")
if num_proj is None:
num_proj = 0
num_proj = _execute.make_int(num_proj, "num_proj")
if is_training is None:
is_training = True
is_training = _execute.make_bool(is_training, "is_training")
if time_major is None:
time_major = True
time_major = _execute.make_bool(time_major, "time_major")
_, _, _op, _outputs = _op_def_library._apply_op_helper(
"CudnnRNNV3", input=input, input_h=input_h, input_c=input_c,
params=params, sequence_lengths=sequence_lengths,
rnn_mode=rnn_mode, input_mode=input_mode,
direction=direction, dropout=dropout, seed=seed,
seed2=seed2, num_proj=num_proj, is_training=is_training,
time_major=time_major, name=name)
_result = _outputs[:]
if _execute.must_record_gradient():
_attrs = ("T", _op._get_attr_type("T"), "rnn_mode",
_op.get_attr("rnn_mode"), "input_mode",
_op.get_attr("input_mode"), "direction",
_op.get_attr("direction"), "dropout", _op.get_attr("dropout"),
"seed", _op._get_attr_int("seed"), "seed2",
_op._get_attr_int("seed2"), "num_proj",
_op._get_attr_int("num_proj"), "is_training",
_op._get_attr_bool("is_training"), "time_major",
_op._get_attr_bool("time_major"))
_inputs_flat = _op.inputs
_execute.record_gradient(
"CudnnRNNV3", _inputs_flat, _attrs, _result)
_result = _CudnnRNNV3Output._make(_result)
return _result

CudnnRNNV3 = tf_export("raw_ops.CudnnRNNV3")(_ops.to_raw_op(cudnn_rnnv3))

def cudnn_rnnv3_eager_fallback(input, input_h, input_c, params, sequence_lengths, rnn_mode, input_mode, direction, dropout, seed, seed2, num_proj, is_training, time_major, name, ctx):
if rnn_mode is None:
rnn_mode = "lstm"
rnn_mode = _execute.make_str(rnn_mode, "rnn_mode")
if input_mode is None:
input_mode = "linear_input"
input_mode = _execute.make_str(input_mode, "input_mode")
if direction is None:
direction = "unidirectional"
direction = _execute.make_str(direction, "direction")
if dropout is None:
dropout = 0
dropout = _execute.make_float(dropout, "dropout")
if seed is None:
seed = 0
seed = _execute.make_int(seed, "seed")
if seed2 is None:
seed2 = 0
seed2 = _execute.make_int(seed2, "seed2")
if num_proj is None:
num_proj = 0
num_proj = _execute.make_int(num_proj, "num_proj")
if is_training is None:
is_training = True
is_training = _execute.make_bool(is_training, "is_training")
if time_major is None:
time_major = True
time_major = _execute.make_bool(time_major, "time_major")
_attr_T, _inputs_T = _execute.args_to_matching_eager([input, input_h, input_c, params], ctx, [_dtypes.half, _dtypes.float32, _dtypes.float64, ])
(input, input_h, input_c, params) = _inputs_T
sequence_lengths = _ops.convert_to_tensor(sequence_lengths, _dtypes.int32)
_inputs_flat = [input, input_h, input_c, params, sequence_lengths]
_attrs = ("T", _attr_T, "rnn_mode", rnn_mode, "input_mode", input_mode,
"direction", direction, "dropout", dropout, "seed", seed, "seed2", seed2,
"num_proj", num_proj, "is_training", is_training, "time_major", time_major)
_result = _execute.execute(b"CudnnRNNV3", 5, inputs=_inputs_flat,
attrs=_attrs, ctx=ctx, name=name)
if _execute.must_record_gradient():
_execute.record_gradient(
"CudnnRNNV3", _inputs_flat, _attrs, _result)
_result = _CudnnRNNV3Output._make(_result)
return _result
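
# Illustrative usage sketch (editorial addition): the V3 op adds per-example
# sequence_lengths and a time_major toggle. Here the inputs are assumed
# batch-major ([batch_size, seq_length, input_size]); sequence_lengths is an
# int32 vector of length batch_size.
def _example_cudnn_rnnv3(input, input_h, input_c, params, sequence_lengths):
  return cudnn_rnnv3(
      input=input, input_h=input_h, input_c=input_c, params=params,
      sequence_lengths=sequence_lengths,
      rnn_mode="lstm", is_training=True, time_major=False)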