Spaces:

THUDM
/

CogVideo

Running

App Files Files Community

CogVideo / coglm_strategy.py

akhaliq HF staff

add files

89dc200 almost 2 years ago

raw history blame

No virus

4.06 kB

	# -- encoding: utf-8 --
	'''
	@File : coglm_strategy.py
	@Time : 2021/10/08 22:22:42
	@Author : Ming Ding
	@Contact : dm18@mails.tsinghua.edu.cn
	'''

	# here put the import lib
	import os
	import sys
	import math
	import random
	import torch
	import numpy as np
	import torch.nn.functional as F


	def top_k_logits(logits, top_k=0, top_p=0.0, filter_value=-65504):
	# This function has been mostly taken from huggingface conversational ai code at
	# https://medium.com/huggingface/how-to-build-a-state-of-the-art-conversational-ai-with-transfer-learning-2d818ac26313

	if top_k > 0:
	# Remove all tokens with a probability less than the last token of the top-k
	indices_to_remove = logits < torch.topk(logits, top_k)[0][..., -1, None]
	logits[indices_to_remove] = filter_value

	if top_p > 0.0:
	# convert to 1D
	logits = logits.view(logits.size()[1]).contiguous()
	sorted_logits, sorted_indices = torch.sort(logits, descending=True)
	cumulative_probs = torch.cumsum(F.softmax(sorted_logits, dim=-1), dim=-1)

	# Remove tokens with cumulative probability above the threshold
	sorted_indices_to_remove = cumulative_probs > top_p
	# Shift the indices to the right to keep also the first token above the threshold
	sorted_indices_to_remove[..., 1:] = sorted_indices_to_remove[..., :-1].clone()
	sorted_indices_to_remove[..., 0] = 0
	indices_to_remove = sorted_indices[sorted_indices_to_remove]
	logits[indices_to_remove] = filter_value
	# going back to 2D
	logits = logits.view(1, -1).contiguous()

	return logits


	class CoglmStrategy:
	def __init__(self, invalid_slices=[], temperature=1., top_k=200, eps=1e-4, top_p=0.0, end_tokens=None, temperature2=0.89):
	self.invalid_slices = invalid_slices
	self.temperature = temperature
	self.temperature2 = temperature2
	self.topk = top_k
	self.top_p = top_p
	self.eps = eps
	if end_tokens is None:
	end_tokens = []
	self.end_tokens = end_tokens
	self._is_done = False
	self.outlier_count_down = torch.zeros(16)
	self.vis_list = [[]for i in range(16)]
	self.cluster_labels = torch.tensor(np.load('cluster_label2.npy'), device='cuda', dtype=torch.long)
	self.start_pos = -1
	self.white_cluster = []
	# self.fout = open('tmp.txt', 'w')

	@property
	def is_done(self) -> bool:
	return self._is_done

	def forward(self, logits, tokens, mems, temperature=None, temperature2=None):
	if temperature is None:
	temperature = self.temperature
	if temperature2 is None:
	temperature2 = self.temperature2
	logits = logits / temperature
	for invalid_slice in self.invalid_slices:
	logits[..., invalid_slice] = -65504

	rprobs = F.softmax(logits.float(), dim=-1)
	c = self.cluster_labels.expand(*rprobs.shape)
	cprobs = torch.zeros(logits.shape[0], 500, device=logits.device).scatter_add_(1, c, rprobs)
	# self.fout.write(str(tokens.shape[-1])+ ' ' + str(cprobs.topk(10)) + '\n')
	# self.fout.flush()
	best_scores, best_clusters = cprobs.topk(self.topk)
	bz = logits.shape[0]
	for i in range(bz):
	selected_cluster = best_clusters[i][torch.multinomial(best_scores[i] / best_scores[i].sum(), num_samples=1)]
	logits[i, self.cluster_labels != selected_cluster] = -65504

	# logits = top_k_logits(logits, self.topk, self.top_p)
	probs = F.softmax(logits.float()/temperature2, dim=-1) # float is essetial, due to a bug in Pytorch
	pred = torch.multinomial(probs, num_samples=1)

	if pred.numel() == 1 and pred.item() in self.end_tokens:
	self._is_done = True
	tokens = torch.cat((tokens, pred.view(tokens.shape[0], 1)), dim=1)
	return tokens, mems

	def finalize(self, tokens, mems):
	self._is_done = False
	return tokens, mems