LibContinual / core /model /buffer /onlinebuffer.py

Upload 236 files

5fee096 verified 10 days ago

4.35 kB

	import numpy as np
	import pdb
	import torch
	import torch.nn as nn
	import torch.nn.functional as F

	# modified from https://github.com/gydpku/OCM/blob/main/buffer.py

	class OnlineBuffer(nn.Module):
	def __init__(self, buffer_size, batch_size, input_size):
	super().__init__()

	self.place_left = True
	self.strategy = None
	self.buffer_size = buffer_size
	print('buffer has %d slots' % buffer_size, buffer_size)

	buf_data = torch.FloatTensor(buffer_size, *input_size).fill_(0)
	buf_targets = torch.LongTensor(buffer_size).fill_(0)
	buf_tasks = torch.LongTensor(buffer_size).fill_(0)

	self.current_index = 0
	self.n_seen_so_far = 0
	self.is_full = 0
	self.total_classes = 0
	# registering as buffer allows us to save the object using `torch.save`
	self.register_buffer('buf_data', buf_data)
	self.register_buffer('buf_targets', buf_targets)
	self.register_buffer('buf_tasks', buf_tasks)


	def tensor_to_device(self, device):
	self.device = device
	self.buf_data.to(device)
	self.buf_targets.to(device)
	self.buf_tasks.to(device)



	def add_reservoir(self, x, y, task):
	n_elem = x.size(0)

	self.device = x.device
	place_left = max(0, self.buffer_size - self.current_index)
	offset = min(place_left, n_elem)

	if place_left:
	offset = min(place_left, n_elem)

	self.buf_data[self.current_index: self.current_index + offset].data.copy_(x[:offset])
	self.buf_targets[self.current_index: self.current_index + offset].data.copy_(y[:offset])
	self.buf_tasks[self.current_index: self.current_index + offset].fill_(task)
	self.current_index += offset
	self.n_seen_so_far += offset

	if offset == x.size(0):
	return

	self.place_left = False

	# remove what is already in the buffer
	x, y = x[place_left:], y[place_left:]

	indices = torch.FloatTensor(x.size(0)).to(x.device).uniform_(0, self.n_seen_so_far).long()
	valid_indices = (indices < self.buf_data.size(0)).long()

	idx_new_data = valid_indices.nonzero().squeeze(-1)
	idx_buffer = indices[idx_new_data]

	self.n_seen_so_far += x.size(0)

	if idx_buffer.numel() == 0:
	return

	assert idx_buffer.max() < self.buf_data.size(0), pdb.set_trace()
	assert idx_buffer.max() < self.buf_targets.size(0), pdb.set_trace()
	assert idx_buffer.max() < self.buf_tasks.size(0), pdb.set_trace()

	assert idx_new_data.max() < x.size(0), pdb.set_trace()
	assert idx_new_data.max() < y.size(0), pdb.set_trace()

	if self.buf_data.device != x.device:
	self.buf_data = self.buf_data.to(x.device)
	self.buf_targets = self.buf_targets.to(x.device)
	self.buf_tasks = self.buf_tasks.to(x.device)

	self.buf_data[idx_buffer] = x[idx_new_data]
	self.buf_targets[idx_buffer] = y[idx_new_data]
	self.buf_tasks[idx_buffer] = task




	def sample(self, amount, exclude_task = None, ret_ind = False):

	if self.buf_data.device != self.device:
	self.buf_data = self.buf_data.to(self.device)
	self.buf_targets = self.buf_targets.to(self.device)
	self.buf_tasks = self.buf_tasks.to(self.device)

	if exclude_task is not None:
	valid_indices = (self.t != exclude_task)
	valid_indices = valid_indices.nonzero().squeeze()
	bx, by, bt = self.buf_data[valid_indices], self.buf_targets[valid_indices], self.buf_tasks[valid_indices]
	else:
	bx, by, bt = self.buf_data[:self.current_index], self.buf_targets[:self.current_index], self.buf_tasks[:self.current_index]

	if bx.size(0) < amount:
	if ret_ind:
	return bx, by, bt, torch.from_numpy(np.arange(bx.size(0)))
	else:
	return bx, by, bt
	else:
	indices = torch.from_numpy(np.random.choice(bx.size(0), amount, replace=False))
	indices = indices.to(self.device)

	if ret_ind:
	return bx[indices], by[indices], bt[indices], indices
	else:
	return bx[indices], by[indices], bt[indices]