@traceable()
class Repeat(TensorOp):
"""Repeat a TensorOp several times in a row.
Repeat takes an Op and runs it multiple times in a row. It can be set to repeat for a fixed (static) number of
times, or to repeat until a given input function evaluates to False (dynamic).
    Static example:

        ops = [
            LambdaOp(fn=lambda: 0, outputs="z"),
            Repeat(AddOne(inputs="z", outputs="z"), repeat=5)
        ]

    Dynamic example:

        ops = [
            LambdaOp(fn=lambda: 0, outputs="z"),
            Repeat(AddOne(inputs="z", outputs="z"), repeat=lambda z: z < 6.5)
        ]
    Note: The argument name of the `repeat` function ('z' above) is matched against keys in the data dictionary, in
        this case the output key of the op being repeated.
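
    A dynamic `repeat` can also be combined with `max_iter` to cap the number of loops. For illustration only, a
    sketch re-using the hypothetical AddOne op from the examples above:

        ops = [
            LambdaOp(fn=lambda: 0, outputs="z"),
            Repeat(AddOne(inputs="z", outputs="z"), repeat=lambda z: z < 6.5, max_iter=3)
        ]
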
    Args:
        op: A TensorOp to be run one or more times in a row.
        repeat: How many times to repeat the `op`. This can also be a function returning a bool, in which case the
            function's input argument names will be matched to keys in the data dictionary, and the `op` will be
            repeated until the function evaluates to False. The function is evaluated at the end of each forward
            call, so the `op` will always be run at least once.
        max_iter: A limit on how many iterations will be run (or None for no limit).

    Raises:
        ValueError: If `repeat`, `op`, or `max_iter` are invalid.
"""
def __init__(self, op: TensorOp, repeat: Union[int, Callable[..., bool]] = 1,
max_iter: Optional[int] = None) -> None:
self.repeat_inputs = []
extra_reqs = []
if max_iter is None:
self.max_iter = max_iter
else:
if max_iter < 1:
raise ValueError(f"Repeat requires max_iter to be >=1, but got {max_iter}")
self.max_iter = max_iter - 1 # -1 b/c the first invocation happens outside the while loop
if isinstance(repeat, int):
if repeat < 1:
raise ValueError(f"Repeat requires repeat to be >= 1, but got {repeat}")
if max_iter:
raise ValueError("Do not set max_iter when repeat is an integer")
else:
self.repeat_inputs.extend(inspect.signature(repeat).parameters.keys())
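            # Any inputs that the repeat function needs but which the wrapped op does not itself produce have to be
            # requested from the data dictionary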
extra_reqs = list(set(self.repeat_inputs) - set(op.outputs))
self.repeat = repeat
super().__init__(inputs=op.inputs + extra_reqs, outputs=op.outputs, mode=op.mode, ds_id=op.ds_id)
self.ops = [op]
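        # The retain_graph preference and the framework-specific while function are filled in later via
        # fe_retain_graph() and build() respectively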
self.retain_graph = None
self.while_fn = None
@property
def op(self) -> TensorOp:
return self.ops[0]
def build(self, framework: str, device: Optional[torch.device] = None) -> None:
self.op.build(framework, device)
        # Choose the while function based on the framework
        if framework == 'tf':
            # For TensorFlow the while function is chosen based on the type of 'self.repeat'.
if isinstance(self.repeat, int):
self.while_fn = self._tf_while_int
else:
self.while_fn = self._tf_while
else:
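            # PyTorch executes eagerly, so a single python while helper covers both the int and callable cases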
self.while_fn = self._torch_while
def get_fe_models(self) -> Set[Model]:
return self.op.get_fe_models()
def get_fe_loss_keys(self) -> Set[str]:
return self.op.get_fe_loss_keys()
def fe_retain_graph(self, retain: Optional[bool] = None) -> Optional[bool]:
if retain is not None:
self.retain_graph = retain
return self.op.fe_retain_graph(retain)
def __getstate__(self) -> Dict[str, List[Dict[Any, Any]]]:
return {'ops': [elem.__getstate__() if hasattr(elem, '__getstate__') else {} for elem in self.ops]}
def forward(self, data: List[Tensor], state: Dict[str, Any]) -> List[Tensor]:
        # Set retain to True since we might loop over a gradient-aware op
self.op.fe_retain_graph(True)
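        # Re-key the positional input list into a dictionary so that values can be looked up by name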
data = {key: elem for key, elem in zip(self.inputs, data)}
if isinstance(self.repeat, int):
data = self.while_fn(data, state)
else:
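            # Run the op once before checking the stopping condition, so it is always evaluated at least once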
BaseNetwork._forward_batch(data, state, self.ops)
data = self.while_fn(data, state)
# TODO - Find some magic way to invoke this at the right moment
self.op.fe_retain_graph(self.retain_graph)
return [data[key] for key in self.outputs]
def _torch_while(self, data: Dict[str, Tensor], state: Dict[str, Any]) -> Dict[str, Tensor]:
"""A helper function to invoke a loop.
Args:
data: A data dictionary to be used during looping.
state: The state variables to be considered during looping.
Returns:
A reference to the updated data dictionary.
"""
if isinstance(self.repeat, int):
for _ in range(self.repeat - 1):
# Perform n-1 rounds with all ops having retain_graph == True
BaseNetwork._forward_batch(data, state, self.ops)
# Let retain be whatever it was meant to be for the final sequence
self.op.fe_retain_graph(self.retain_graph)
            # Final round of ops to ensure accurate graph building in case we don't retain the graph
BaseNetwork._forward_batch(data, state, self.ops)
else:
i = 0
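            # self.max_iter was already reduced by 1 in __init__ to account for the initial forward pass in forward()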
while self.repeat(*[data[var_name] for var_name in self.repeat_inputs]):
                if self.max_iter is not None and i >= self.max_iter:
break
BaseNetwork._forward_batch(data, state, self.ops)
i += 1
return data
def _tf_while_int(self, data: Dict[str, Tensor], state: Dict[str, Any]) -> Dict[str, Tensor]:
"""A helper function to invoke a while loop in case self.repeat is an integer.
Experiment were conducted to compare performance of tf.while_loop() with tf.range(), where tf.range outperformed
tf.while_loop() in most scenarios. But it was found that tensors cannot be overwritten inside the scope of
tf.range() and hence the RepeatOp failed on few Ops (eg: Ops which were updating the inputs). Creating a copy
of tensor in every iteration of tf.range() resolved this issue, but also dissolved all the advantages of
tf.range().
Args:
data: A data dictionary to be used during looping.
state: The state variables to be considered during looping.
Returns:
A reference to the updated data dictionary.
"""
if self.repeat == 1:
# Let retain be whatever it was meant to be for the final sequence
# This is done right before the only forward pass to ensure accurate graph building in case
            # we don't retain the graph
self.op.fe_retain_graph(self.retain_graph)
# Final round of ops
BaseNetwork._forward_batch(data, state, self.ops)
elif self.repeat == 2:
BaseNetwork._forward_batch(data, state, self.ops)
# Let retain be whatever it was meant to be for the final sequence
# This is done right before the last forward pass to ensure accurate graph building in case
            # we don't retain the graph
self.op.fe_retain_graph(self.retain_graph)
# Final round of ops
BaseNetwork._forward_batch(data, state, self.ops)
else:
# Run a forward pass to ensure that data dictionary structure doesn't change during while loop execution
BaseNetwork._forward_batch(data, state, self.ops)
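            # The loop counter starts at 1 because one forward pass has already run above, and a final pass runs
            # after the loop, so the tf.while_loop body only needs to execute (repeat - 2) times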
args = (tf.constant(1), data)
            # Use functools.partial since state may contain objects which cannot be cast to tensors (e.g. a gradient tape)
args = tf.while_loop(self._tf_cond,
functools.partial(self._tf_body, state=state),
args,
maximum_iterations=self.max_iter)
# Let retain be whatever it was meant to be for the final sequence
# This is done right before the last forward pass to ensure accurate graph building in case
            # we don't retain the graph
self.op.fe_retain_graph(self.retain_graph)
data = args[1]
# Final round of ops
BaseNetwork._forward_batch(data, state, self.ops)
return data
def _tf_while(self, data: Dict[str, Tensor], state: Dict[str, Any]) -> Dict[str, Tensor]:
"""A helper function to invoke a while loop in case self.repeat is a callable function.
Args:
data: A data dictionary to be used during looping.
state: The state variables to be considered during looping.
Returns:
A reference to the updated data dictionary.
"""
args = ([data[var_name] for var_name in self.repeat_inputs], data)
        # Use functools.partial since state may contain objects which cannot be cast to tensors (e.g. a gradient tape)
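        # parallel_iterations=1 forces the iterations to run sequentially, since each iteration consumes the
        # previous iteration's outputs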
args = tf.while_loop(self._tf_cond,
functools.partial(self._tf_body, state=state),
args,
maximum_iterations=self.max_iter,
parallel_iterations=1)
return args[1]
def _tf_cond(self, cnd: Union[List[Tensor], Tensor], data: Dict[str, Tensor]) -> bool:
"""A helper function determine whether to keep invoking the while method.
Note that `data` and `state` are unused here, but required since tf.while_loop needs the cond and body to have
the same input argument signatures.
Args:
cnd: A list of arguments to be passed to the condition function.
data: A data dictionary to be used during looping.
Returns:
Whether to continue looping.
"""
if isinstance(self.repeat, int):
            # For the integer case there are two forward calls outside the tf.while_loop (one before and one after
            # it), so the loop only needs to run until the counter reaches (repeat - 1)
return tf.less(cnd, self.repeat - 1)
return self.repeat(*cnd)
def _tf_body(self, cnd: Union[List[Tensor], Tensor], data: Dict[str, Tensor],
state: Dict[str, Any]) -> Tuple[Union[List[Tensor], Tensor], Dict[str, Tensor]]:
"""A helper function to execute the body of a while method.
Note that `cnd` is unused here, but required since tf.while_loop needs the cond and body to have the same input
argument signatures.
Args:
cnd: A list of arguments to be passed to the condition function.
data: A data dictionary to be used during looping.
state: The state variables to be considered during looping.
Returns:
The updated `cnd` values, along with the modified data and state dictionaries.
"""
# Run a round of ops
BaseNetwork._forward_batch(data, state, self.ops)
if isinstance(self.repeat, int):
# Updating the while condition
return tf.add(cnd, 1), data
return [data[var_name] for var_name in self.repeat_inputs], data