Source code for deepod.models.time_series.prenet

# -*- coding: utf-8 -*-
"""
Weakly-supervised anomaly detection by pairwise relation prediction task
@Author: Hongzuo Xu <hongzuoxu@126.com, xuhongzuo13@nudt.edu.cn>
"""

from deepod.core.base_model import BaseDeepAD
from deepod.core.networks.base_networks import LinearBlock, get_network
from deepod.models.tabular.prenet import PReNetLoader
import torch
import numpy as np


[docs]class PReNetTS(BaseDeepAD):
    """
    Deep Weakly-supervised Anomaly Detection (KDD‘23)

    Args:
    
        epochs (int): 
            The number of epochs for training the model. Default is 100.
            
        batch_size (int): 
            The size of the batch for training. Default is 64.
        
        lr (float): 
            The learning rate. Default is 1e-3.
        
        network (str): 
            The type of network used, 'Transformer' by default.
        
        seq_len (int): 
            The length of the input sequences. Default is 30.
        
        stride (int): 
            The stride for sliding window on data. Default is 1.
        
        rep_dim (int): 
            The representation dimension. Default is 128.
        
        hidden_dims (str): 
            The hidden layer dimensions, separated by commas. Default is '512'.
        
        act (str): 
            The activation function. Default is 'GELU'.
        
        bias (bool): 
            Whether to use bias in the layers. Default is False.
        
        n_heads (int): 
            The number of attention heads in a transformer. Default is 8.
        
        d_model (int): 
            The dimensionality of the transformer model. Default is 512.
        
        attn (str): 
            The type of attention mechanism. Default is 'self_attn'.
        
        pos_encoding (str): 
            The type of position encoding. Default is 'fixed'.
        
        norm (str): 
            The type of normalization layer. Default is 'BatchNorm'.
        
        epoch_steps (int):
            The steps per epoch, -1 indicates using the full dataset. Default is -1.
        
        prt_steps (int): 
            The steps for printing during training. Default is 10.
        
        device (str): 
            The device for training, 'cuda' by default.
        
        verbose (int): 
            The verbosity level. Default is 2.
        
        random_state (int):
            The random state seeding. Default is 42.
        
    """
    
    def __init__(self, epochs=100, batch_size=64, lr=1e-3,
                 network='Transformer', seq_len=30, stride=1,
                 rep_dim=128, hidden_dims='512', act='GELU', bias=False,
                 n_heads=8, d_model=512, attn='self_attn', pos_encoding='fixed', norm='BatchNorm',
                 epoch_steps=-1, prt_steps=10, device='cuda',
                 verbose=2, random_state=42):
        """
        Initializes the PReNetTS model with specified parameters.
        """
        
        super(PReNetTS, self).__init__(
            model_name='PReNet', data_type='ts', epochs=epochs, batch_size=batch_size, lr=lr,
            network=network, seq_len=seq_len, stride=stride,
            epoch_steps=epoch_steps, prt_steps=prt_steps, device=device,
            verbose=verbose, random_state=random_state
        )

        self.hidden_dims = hidden_dims
        self.rep_dim = rep_dim
        self.act = act
        self.bias = bias

        # parameters for Transformer
        self.n_heads = n_heads
        self.d_model = d_model
        self.pos_encoding = pos_encoding
        self.norm = norm
        self.attn = attn

        return

[docs]    def training_prepare(self, X, y):
        """
        Prepares the model for training by setting up the data loader, network, and criterion.

        Args:
        
            X (numpy.ndarray): 
                Training data.
                
            y (numpy.ndarray): 
                Training labels.

        Returns:
        
            tuple: 
                A tuple containing the training data loader, the network model, and the loss criterion.
                
        """
        
        train_loader = PReNetLoader(X, y, batch_size=self.batch_size)

        net = DualInputNet(
            self.network,
            self.n_features,
            hidden_dims=self.hidden_dims,
            rep_dim=self.rep_dim,
            activation=self.act,
            n_heads=self.n_heads,
            d_model=self.d_model,
            attn=self.attn,
            pos_encoding=self.pos_encoding,
            norm=self.norm,
            seq_len=self.seq_len,
            bias=False,
        ).to(self.device)

        criterion = torch.nn.L1Loss(reduction='mean')

        if self.verbose >= 2:
            print(net)

        return train_loader, net, criterion

[docs]    def inference_prepare(self, X):
        """
        Prepares the model for inference by setting up the test data loader.

        Args:
        
            X (numpy.ndarray): 
                Test data.

        Returns:
        
            list: 
                A list of batches for testing.
            
        """
        
        # test loader: list of batches
        y = self.train_label
        unlabeled_id = np.where(y == 0)[0]
        known_anom_id = np.where(y == 1)[0]

        if X.shape[0] > 100000:
            a = 10
        elif X.shape[0] > 50000:
            a = 20
        else:
            a = 30

        X = torch.from_numpy(X)
        train_data = torch.from_numpy(self.train_data)

        x2_a_lst = []
        x2_u_lst = []
        for i in range(a):
            a_idx = np.random.choice(known_anom_id, X.shape[0], replace=True)
            u_idx = np.random.choice(unlabeled_id, X.shape[0], replace=True)
            x2_a = train_data[a_idx]
            x2_u = train_data[u_idx]

            x2_a_lst.append(x2_a)
            x2_u_lst.append(x2_u)

        test_loader = []

        n_batches = int(np.ceil(len(X) / self.batch_size))
        for i in range(n_batches):
            left = i * self.batch_size
            right = min((i + 1) * self.batch_size, len(X))
            batch_x1 = X[left: right]
            batch_x_sup1 = [x2[left: right] for x2 in x2_a_lst]
            batch_x_sup2 = [x2[left: right] for x2 in x2_u_lst]
            test_loader.append([batch_x1, batch_x_sup1, batch_x_sup2])
        self.criterion.reduction = 'none'
        return test_loader

[docs]    def training_forward(self, batch_x, net, criterion):
        """
        Processes a single training batch through the model.

        Args:
        
            batch_x (tuple): 
                A tuple of the batch data.
                
            net (torch.nn.Module): 
                The network model.
                
            criterion (callable): 
                The loss criterion.

        Returns:
        
            Tensor: 
                The computed loss for the batch.
                
        """
        
        batch_x1, batch_x2, batch_y = batch_x
        batch_x1 = batch_x1.float().to(self.device)
        batch_x2 = batch_x2.float().to(self.device)
        batch_y = batch_y.float().to(self.device)
        pred = net(batch_x1, batch_x2).flatten()

        loss = criterion(pred, batch_y)
        return loss

[docs]    def inference_forward(self, batch_x, net, criterion):
        """
        Processes a single inference batch through the model.

        Args:
        
            batch_x (tuple): 
                A tuple of the batch data.
                
            net (torch.nn.Module): 
                The network model.
                
            criterion (callable): 
                The loss criterion used for evaluation.

        Returns:
        
            tuple: 
                A tuple containing the batch data and the computed scores.
                
        """
        
        batch_x1, batch_x_sup1_lst, batch_x_sup2_lst = batch_x

        batch_x1 = batch_x1.float().to(self.device)
        pred_s = []
        for batch_x2 in batch_x_sup1_lst:
            batch_x2 = batch_x2.float().to(self.device)
            pred = net(batch_x1, batch_x2).flatten()
            pred_s.append(pred)
        for batch_x2 in batch_x_sup2_lst:
            batch_x2 = batch_x2.float().to(self.device)
            pred = net(batch_x1, batch_x2).flatten()
            pred_s.append(pred)

        pred_s = torch.stack(pred_s)
        s = torch.mean(pred_s, dim=0)

        batch_z = batch_x1  # for consistency
        return batch_z, s


class DualInputNet(torch.nn.Module):
    """
    A dual-input network module designed for encoding and comparing pairs of inputs.

    This module can be configured to use different network architectures like Transformers or ConvSeq.

    Args:
    
        network_name (str): 
            The type of network to use.
        
        n_features (int): 
            The number of input features.
        
        hidden_dims (str, optional): 
            A comma-separated string representing hidden layer dimensions. Default is '100,50'.
        
        rep_dim (int, optional): 
            The representation dimension. Default is 64.
        
        n_heads (int, optional): 
            The number of attention heads in a transformer. Default is 8.
        
        d_model (int, optional): 
            The dimensionality of the transformer model. Default is 64.
        
        attn (str, optional): 
            The type of attention mechanism. Default is 'self_attn'.
        
        pos_encoding (str, optional):
            The type of position encoding. Default is 'fixed'.
        
        norm (str, optional): 
            The type of normalization layer. Default is 'BatchNorm'.
        
        seq_len (int, optional): 
            The length of the input sequences. Default is 100.
        
        activation (str, optional): 
            The activation function. Default is 'ReLU'.
        
        bias (bool, optional): 
            Whether to use bias in the layers. Default is False.
        
    """
    
    def __init__(self, network_name, n_features, hidden_dims='100,50', rep_dim=64,
                 n_heads=8, d_model=64, attn='self_attn', pos_encoding='fixed', norm='BatchNorm', seq_len=100,
                 activation='ReLU', bias=False):
        """
        Initializes the DualInputNet with specified network parameters.
        """
        
        super(DualInputNet, self).__init__()

        network_params = {
            'n_features': n_features,
            'n_hidden': hidden_dims,
            'n_output': rep_dim,
            'activation': activation,
            'bias': bias
        }
        if network_name == 'Transformer':
            network_params['n_heads'] = n_heads
            network_params['d_model'] = d_model
            network_params['attn'] = attn
            network_params['pos_encoding'] = pos_encoding
            network_params['norm'] = norm
            network_params['seq_len'] = seq_len
        elif network_name == 'ConvSeq':
            network_params['seq_len'] = self.seq_len

        network_class = get_network(network_name)
        self.enc_net = network_class(**network_params)

        self.out_layer = LinearBlock(
            in_channels=2 * rep_dim,
            out_channels=1,
            activation=None,
            bias=False
        )

        return

    def forward(self, x1, x2):
        """
        Forward pass to process and compare two input sequences through the network.

        Args:
        
            x1 (Tensor):
                The first input tensor.
                
            x2 (Tensor): 
                The second input tensor for comparison.

        Returns:
        
            Tensor: 
                The output tensor after processing the inputs.
                
        """
        
        x1 = self.enc_net(x1)
        x2 = self.enc_net(x2)
        pred = self.out_layer(torch.cat([x1, x2], dim=1))
        return pred