from abc import ABC, abstractmethod
from typing import Callable, Dict, Optional

import torch

from allennlp.common import Registrable
from allennlp.modules.span_extractors import SpanExtractor


class SpanFinder(Registrable, ABC, torch.nn.Module):
    """
    Models the probability p(child_span | parent_span [, parent_label]).

    Modeling parent_label is optional: in some cases we want the parameters to be shared
    across different tasks that have similar span semantics but different label spaces.
    """

    def __init__(
            self,
            no_label: bool = True,
    ):
        """
        :param no_label: If True, input labels are not used as features; an all-zero vector is used instead.
        """
        super().__init__()
        self._no_label = no_label

    @abstractmethod
    def forward(
            self,
            token_vec: torch.Tensor,
            token_mask: torch.Tensor,
            span_vec: torch.Tensor,
            span_mask: Optional[torch.Tensor] = None,
            span_labels: Optional[torch.Tensor] = None,
            parent_indices: Optional[torch.Tensor] = None,
            parent_mask: Optional[torch.Tensor] = None,
            bio_seqs: Optional[torch.Tensor] = None,
            prediction: bool = False,
            **extra
    ) -> Dict[str, torch.Tensor]:
        """
        Return the training loss and predictions.
        :param token_vec: Vector representation of tokens. Shape [batch, token, token_dim]
        :param token_mask: True for non-padding tokens. Shape [batch, token]
        :param span_vec: Vector representation of spans. Shape [batch, span, token_dim]
        :param span_mask: True for non-padding spans. Shape [batch, span]
        :param span_labels: Labels of the spans. Shape [batch, span]
        :param parent_indices: Parent indices of the spans. Shape [batch, span]
        :param parent_mask: True for parent spans. Shape [batch, span]
        :param bio_seqs: BIO sequences. Shape [batch, parent, token, 3]
        :param prediction: If True, no loss is returned and no metrics are updated.
        :return:
            loss: Training loss.
            prediction: Shape [batch, span]. True for positive predictions.
        """
        raise NotImplementedError

    @abstractmethod
    def inference_forward_handler(
            self,
            token_vec: torch.Tensor,
            token_mask: torch.Tensor,
            span_extractor: SpanExtractor,
            **auxiliaries,
    ) -> Callable[[torch.Tensor, torch.Tensor, torch.Tensor, torch.Tensor, torch.Tensor], None]:
        """
        Pre-process some information and return a callable that models
        p(child_span | parent_span [, parent_label]).
        :param token_vec: Vector representation of tokens. Shape [batch, token, token_dim]
        :param token_mask: True for non-padding tokens. Shape [batch, token]
        :param span_extractor: The same span extractor module that is used in the model.
        :param auxiliaries: Environment variables. Extra environment variables may be passed;
            unused ones are ignored.
        :return:
            A callable function (a closure). Its arguments are:
                - span_boundary: Shape [batch, span, 2]
                - span_labels: Shape [batch, span]
                - parent_mask: Shape [batch, span]
                - parent_indices: Shape [batch, span]
                - cursor: Shape [batch]
            It returns nothing; everything is done in place.
            Note that the span indexing space has a different meaning than during training:
            there is no gold span list, so "span" here refers to the predicted spans.
        """
        raise NotImplementedError

    @abstractmethod
    def get_metrics(self, reset: bool = False) -> Dict[str, float]:
        raise NotImplementedError
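

# ---------------------------------------------------------------------------
# Hypothetical usage sketch (illustration only, not part of the library).
# A minimal subclass showing one way the abstract contract above could be
# satisfied: every candidate span is scored independently with a linear head.
# The registration name "sketch", the scoring layer, and the loss choice are
# assumptions made for illustration; the real span finders in this repo are
# more involved.
# ---------------------------------------------------------------------------
@SpanFinder.register('sketch')
class SketchSpanFinder(SpanFinder):
    def __init__(self, token_dim: int, no_label: bool = True):
        super().__init__(no_label=no_label)
        # One logit per candidate span (assumed architecture).
        self._scorer = torch.nn.Linear(token_dim, 1)
        self._loss_fn = torch.nn.BCEWithLogitsLoss(reduction='sum')

    def forward(
            self,
            token_vec: torch.Tensor,
            token_mask: torch.Tensor,
            span_vec: torch.Tensor,
            span_mask: Optional[torch.Tensor] = None,
            span_labels: Optional[torch.Tensor] = None,
            parent_indices: Optional[torch.Tensor] = None,
            parent_mask: Optional[torch.Tensor] = None,
            bio_seqs: Optional[torch.Tensor] = None,
            prediction: bool = False,
            **extra
    ) -> Dict[str, torch.Tensor]:
        logits = self._scorer(span_vec).squeeze(-1)  # [batch, span]
        ret = {'prediction': logits > 0.}
        if not prediction and span_labels is not None:
            if span_mask is None:
                span_mask = torch.ones_like(logits, dtype=torch.bool)
            # Treat any non-zero label as a positive span (assumed convention).
            target = (span_labels > 0).float()
            ret['loss'] = self._loss_fn(logits[span_mask], target[span_mask])
        return ret

    def inference_forward_handler(
            self,
            token_vec: torch.Tensor,
            token_mask: torch.Tensor,
            span_extractor: SpanExtractor,
            **auxiliaries,
    ) -> Callable[[torch.Tensor, torch.Tensor, torch.Tensor, torch.Tensor, torch.Tensor], None]:
        def handler(span_boundary, span_labels, parent_mask, parent_indices, cursor):
            # A real implementation would score child candidates for the spans at
            # `cursor` and extend the prediction buffers in place; this sketch only
            # shows how the closure can reuse token_vec and the span extractor.
            span_vec = span_extractor(token_vec, span_boundary)
            _ = self._scorer(span_vec).squeeze(-1)

        return handler

    def get_metrics(self, reset: bool = False) -> Dict[str, float]:
        # No metrics are tracked in this sketch.
        return {}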
|