Source code for gluonts.nursery.spliced_binned_pareto.tcn

# Copyright 2018 Amazon.com, Inc. or its affiliates. All Rights Reserved.
#
# Licensed under the Apache License, Version 2.0 (the "License").
# You may not use this file except in compliance with the License.
# A copy of the License is located at
#
#     http://www.apache.org/licenses/LICENSE-2.0
#
# or in the "license" file accompanying this file. This file is distributed
# on an "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either
# express or implied. See the License for the specific language governing
# permissions and limitations under the License.

# Implementation taken and modified from
# https://github.com/White-Link/UnsupervisedScalableRepresentationLearningTimeSeries, which was created
# with the following license.

# Licensed to the Apache Software Foundation (ASF) under one
# or more contributor license agreements.  See the NOTICE file
# distributed with this work for additional information
# regarding copyright ownership.  The ASF licenses this file
# to you under the Apache License, Version 2.0 (the
# "License"); you may not use this file except in compliance
# with the License.  You may obtain a copy of the License at

#   http://www.apache.org/licenses/LICENSE-2.0

# Unless required by applicable law or agreed to in writing,
# software distributed under the License is distributed on an
# "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY
# KIND, either express or implied.  See the License for the
# specific language governing permissions and limitations
# under the License.


# Implementation of causal CNNs partly taken and modified from
# https://github.com/locuslab/TCN/blob/master/TCN/tcn.py, originally created
# with the following license.

# MIT License

# Copyright (c) 2018 CMU Locus Lab

# Permission is hereby granted, free of charge, to any person obtaining a copy
# of this software and associated documentation files (the "Software"), to deal
# in the Software without restriction, including without limitation the rights
# to use, copy, modify, merge, publish, distribute, sublicense, and/or sell
# copies of the Software, and to permit persons to whom the Software is
# furnished to do so, subject to the following conditions:

# The above copyright notice and this permission notice shall be included in all
# copies or substantial portions of the Software.

# THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
# IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
# FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL THE
# AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
# LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM,
# OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN THE
# SOFTWARE.


import torch


class Chomp1d(torch.nn.Module):
    """
    Removes leading or trailing elements of a time series.

    Takes as input a three-dimensional tensor (`B`, `C`, `L`) where `B` is
    the batch size, `C` is the number of input channels, and `L` is the
    length of the input. Outputs a three-dimensional tensor
    (`B`, `C`, `L - s`) where `s` is the number of elements to remove.

    Args:
        chomp_size : Number of elements to remove.
        last : If True, removes the last elements in the time dimension;
            if False, removes the first elements.
    """

    def __init__(self, chomp_size: int, last: bool = True):
        super().__init__()
        self.chomp_size = chomp_size
        self.last = last

    def forward(self, x):
        if self.chomp_size == 0:
            # Nothing to remove; slicing with `-0` would return an empty
            # tensor, so pass the input through unchanged.
            return x
        if self.last:
            x_chomped = x[:, :, : -self.chomp_size]
        else:
            x_chomped = x[:, :, self.chomp_size :]
        return x_chomped
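
# A minimal usage sketch (illustrative, not part of the original module;
# the helper name is hypothetical): `Chomp1d` trims the extra time steps
# introduced by the symmetric padding of a Conv1d.
def _example_chomp1d():
    x = torch.randn(2, 3, 10)  # (B, C, L)
    # Drop the 4 trailing steps (forward/causal direction).
    assert Chomp1d(chomp_size=4, last=True)(x).shape == (2, 3, 6)
    # Drop the 4 leading steps (backward direction) instead.
    assert Chomp1d(chomp_size=4, last=False)(x).shape == (2, 3, 6)
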

class TCNBlock(torch.nn.Module):
    """
    Temporal Convolutional Network block.

    Composed sequentially of two causal convolutions (with leaky ReLU
    activation functions) and a parallel residual connection.

    Takes as input a three-dimensional tensor (`B`, `C`, `L`) where `B` is
    the batch size, `C` is the number of input channels, and `L` is the
    length of the input. Outputs a three-dimensional tensor (`B`, `C`, `L`).

    Args:
        in_channels : Number of input channels.
        out_channels : Number of output channels.
        kernel_size : Kernel size of the applied non-residual convolutions.
        dilation : Dilation parameter of non-residual convolutions.
        bias : If True, adds a learnable bias to the convolutions.
        fwd_time : If True, the network's "causal" direction is from past
            to future (forward); if False, the relation is from future to
            past (backward).
        final : If True, a final LeakyReLU activation is applied after the
            residual connection.
    """

    def __init__(
        self,
        in_channels: int,
        out_channels: int,
        kernel_size: int,
        dilation: int,
        bias: bool = True,
        fwd_time: bool = True,
        final: bool = False,
    ):
        super().__init__()

        in_channels = int(in_channels)
        out_channels = int(out_channels)
        kernel_size = int(kernel_size)
        dilation = int(dilation)

        # Computes left padding so that the applied convolutions are causal
        padding = int((kernel_size - 1) * dilation)

        # First causal convolution
        conv1_pre = torch.nn.Conv1d(
            in_channels=in_channels,
            out_channels=out_channels,
            kernel_size=kernel_size,
            padding=padding,
            dilation=dilation,
            bias=bias,
        )
        conv1 = torch.nn.utils.weight_norm(conv1_pre)

        # The truncation makes the convolution causal
        chomp1 = Chomp1d(chomp_size=padding, last=fwd_time)
        relu1 = torch.nn.LeakyReLU()

        # Second causal convolution
        conv2_pre = torch.nn.Conv1d(
            in_channels=out_channels,
            out_channels=out_channels,
            kernel_size=kernel_size,
            padding=padding,
            dilation=dilation,
            bias=bias,
        )
        conv2 = torch.nn.utils.weight_norm(conv2_pre)
        # `last=fwd_time` keeps the second truncation on the same side as
        # the first, so the backward direction stays causal too.
        chomp2 = Chomp1d(chomp_size=padding, last=fwd_time)
        relu2 = torch.nn.LeakyReLU()

        # Causal network
        self.causal = torch.nn.Sequential(
            conv1, chomp1, relu1, conv2, chomp2, relu2
        )

        # Residual connection: a 1x1 convolution matches the channel
        # dimensions when they differ.
        self.upordownsample = (
            torch.nn.Conv1d(
                in_channels=in_channels,
                out_channels=out_channels,
                kernel_size=1,
            )
            if in_channels != out_channels
            else None
        )

        # Final activation function
        self.activation = torch.nn.LeakyReLU() if final else None

    def forward(self, x):
        out_causal = self.causal(x)
        res = x if self.upordownsample is None else self.upordownsample(x)
        if self.activation is None:
            return out_causal + res
        else:
            return self.activation(out_causal + res)
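
# A minimal sketch (illustrative, not part of the original module; the
# helper name is hypothetical) checking the two properties the block is
# built for: the output keeps the input length, and perturbing a future
# time step leaves all earlier outputs unchanged.
def _example_tcn_block_causality():
    block = TCNBlock(
        in_channels=3, out_channels=8, kernel_size=2, dilation=4
    )
    x = torch.randn(1, 3, 32)
    y = block(x)
    assert y.shape == (1, 8, 32)  # length preserved

    x_perturbed = x.clone()
    x_perturbed[:, :, -1] += 1.0  # change only the last time step
    y_perturbed = block(x_perturbed)
    # Outputs before the perturbed step are unaffected (causality).
    assert torch.allclose(y[:, :, :-1], y_perturbed[:, :, :-1])
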

class TCN(torch.nn.Module):
    """
    Temporal Convolutional Network.

    Composed of a sequence of causal convolution blocks.

    Takes as input a three-dimensional tensor (`B`, `C`, `L`) where `B` is
    the batch size, `C` is the number of input channels, and `L` is the
    length of the input. Outputs a three-dimensional tensor
    (`B`, `C_out`, `L`).

    Args:
        in_channels : Number of input channels.
        out_channels : Number of output channels.
        kernel_size : Kernel size of the applied non-residual convolutions.
        channels : Number of channels processed in the hidden layers of the
            network.
        layers : Depth of the network.
        bias : If True, adds a learnable bias to the convolutions.
        fwd_time : If True, the network's causal direction is from past to
            future (forward); if False, from future to past (backward).
    """

    def __init__(
        self,
        in_channels: int,
        out_channels: int,
        kernel_size: int,
        channels: int,
        layers: int,
        bias: bool = True,
        fwd_time: bool = True,
    ):
        super().__init__()

        layers = int(layers)

        net_layers = []  # List of sequential TCN blocks
        dilation_size = 1  # Initial dilation size

        for i in range(layers):
            in_channels_block = in_channels if i == 0 else channels
            net_layers.append(
                TCNBlock(
                    in_channels=in_channels_block,
                    out_channels=channels,
                    kernel_size=kernel_size,
                    dilation=dilation_size,
                    bias=bias,
                    fwd_time=fwd_time,
                    final=False,
                )
            )
            dilation_size *= 2  # Doubles the dilation size at each step

        # Last layer
        net_layers.append(
            TCNBlock(
                in_channels=channels,
                out_channels=out_channels,
                kernel_size=kernel_size,
                dilation=dilation_size,
                bias=bias,
                fwd_time=fwd_time,
                final=True,
            )
        )

        self.network = torch.nn.Sequential(*net_layers)

    def forward(self, x):
        return self.network(x)
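
# A minimal usage sketch (illustrative, not part of the original module;
# the helper name and sizes are hypothetical). With `layers` hidden blocks
# at dilations 1, 2, ..., 2**(layers - 1) plus a final block at dilation
# 2**layers, and two convolutions per block, each output step sees
# 1 + 2 * (kernel_size - 1) * (2**(layers + 1) - 1) input steps; for
# kernel_size=2 and layers=3 below, that is 31 time steps.
def _example_tcn():
    tcn = TCN(
        in_channels=1,
        out_channels=16,
        kernel_size=2,
        channels=32,
        layers=3,
    )
    x = torch.randn(4, 1, 100)  # (batch, channels, length)
    y = tcn(x)
    assert y.shape == (4, 16, 100)  # mapped to out_channels, same length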