Source code for textbox.model.GAN.leakgan

# @Time   : 2020/11/19
# @Author : Jinhao Jiang
# @Email  : jiangjinhao@std.uestc.edu.cn

r"""
LeakGAN
##############################
Reference:
    Guo et al. "Long Text Generation via Adversarial Training with Leaked Information" in AAAI 2018.
"""

import torch

from textbox.model.abstract_generator import GenerativeAdversarialNet
from textbox.module.Generator.LeakGANGenerator import LeakGANGenerator
from textbox.module.Discriminator.LeakGANDiscriminator import LeakGANDiscriminator


class LeakGAN(GenerativeAdversarialNet):
    r"""LeakGAN is a generative adversarial network that addresses the problem of long text generation.
    The discriminative net is allowed to leak its own high-level extracted features to the generative
    net to further guide generation. The generator incorporates such informative signals into every
    generation step through an additional Manager module, which takes the extracted features of the
    currently generated words and outputs a latent vector to guide the Worker module for next-word
    generation.
    """

    def __init__(self, config, dataset):
        super(LeakGAN, self).__init__(config, dataset)

        self.generator = LeakGANGenerator(config, dataset)
        self.discriminator = LeakGANDiscriminator(config, dataset)
        self.dis_sample_num = config['d_sample_num']
        self.max_length = config['seq_len'] + 2

    def calculate_g_train_loss(self, corpus, epoch_idx):
        self.discriminator.eval()
        loss = self.generator.pretrain_loss(corpus, self.discriminator)  # corpus: target_text
        self.discriminator.train()
        return loss

    def calculate_d_train_loss(self, real_data, fake_data, epoch_idx):
        # Drop the leading start-of-sequence token so real data aligns with generated samples.
        return self.discriminator.calculate_loss(real_data[:, 1:], fake_data)

    def calculate_g_adversarial_loss(self, epoch_idx):
        self.discriminator.eval()
        loss = self.generator.adversarial_loss(self.discriminator)
        self.discriminator.train()
        return loss  # (manager_loss, worker_loss)
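
    # Note: the adversarial loss above is returned as a (manager_loss, worker_loss) pair so that the
    # Manager and Worker objectives can be handled separately (e.g. with distinct optimizers) by the
    # trainer; this is an assumption about how the tuple is consumed, not something enforced here.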

    def generate(self, batch_data, eval_data):
        return self.generator.generate(batch_data, eval_data, self.discriminator)

    def sample(self, sample_num):
        self.discriminator.eval()
        samples = self.generator.sample(sample_num, self.discriminator, self.sos_token_idx)
        self.discriminator.train()
        return samples

    def calculate_nll_test(self, corpus, epoch_idx):
        targets = self._get_real_data_for_nll_test(corpus)
        targets = targets[:, 1:]
        return self.generator.calculate_loss(targets, self.discriminator)

    def _add_eos(self, data, length):
        batch_size = data.shape[0]
        padded_data = torch.full((batch_size, self.max_length), self.eos_token_idx, dtype=torch.long, device=self.device)
        for i in range(batch_size):
            data_len = length[i].cpu().data
            padded_data[i, :data_len] = data[i, :data_len]
        return padded_data

    def _get_real_data_for_nll_test(self, train_data):
        r"""Prepare real data for the NLL test, padding with eos_idx rather than pad_idx."""
        real_data = train_data['target_idx']
        length = train_data['target_length']
        real_data = self._add_eos(real_data, length)  # bs * seq_len
        return real_data
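
# A minimal, self-contained sketch (not part of TextBox) of the Manager/Worker interaction summarized
# in the class docstring above: the Manager turns a feature "leaked" by the discriminator into a goal
# vector, and a projection of that goal biases the Worker's next-word logits. All module names, sizes,
# and the additive combination below are illustrative assumptions, not the library's actual generator
# implementation.
if __name__ == '__main__':
    vocab_size, feature_size, goal_size, hidden_size = 10, 16, 8, 16

    manager = torch.nn.GRUCell(feature_size, goal_size)    # Manager: leaked feature -> goal vector
    worker = torch.nn.GRUCell(vocab_size, hidden_size)      # Worker: last token -> hidden state
    goal_proj = torch.nn.Linear(goal_size, vocab_size, bias=False)
    word_proj = torch.nn.Linear(hidden_size, vocab_size)

    leaked_feature = torch.randn(1, feature_size)            # stand-in for a discriminator feature
    goal = manager(leaked_feature, torch.zeros(1, goal_size))
    worker_hidden = worker(torch.zeros(1, vocab_size), torch.zeros(1, hidden_size))

    # Goal-conditioned next-word distribution: the Worker's logits shifted by the projected goal.
    logits = word_proj(worker_hidden) + goal_proj(goal)
    next_token = torch.distributions.Categorical(logits=logits).sample()
    print('sampled next token id:', next_token.item())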