|
from collections import OrderedDict
import sys

import torch
from torch import nn
from torch.nn import functional as F

from bert.modeling_bert import BertModel
|
|
|
|
|
class _LAVTSimpleDecode(nn.Module):
    """Couples a vision-language backbone with a lightweight decoding head."""

    def __init__(self, backbone, classifier):
        super(_LAVTSimpleDecode, self).__init__()
        self.backbone = backbone
        self.classifier = classifier

    def forward(self, x, l_feats, l_mask):
        # Remember the input spatial size (H, W) for the final upsampling.
        input_shape = x.shape[-2:]
        # The backbone fuses visual and language features and returns four
        # feature maps, ordered from the shallowest (x_c1) to the deepest (x_c4).
        features = self.backbone(x, l_feats, l_mask)
        x_c1, x_c2, x_c3, x_c4 = features
        # The head decodes from the deepest stage back to the shallowest one.
        x = self.classifier(x_c4, x_c3, x_c2, x_c1)
        # Upsample the logits to the original input resolution.
        x = F.interpolate(x, size=input_shape, mode='bilinear', align_corners=True)

        return x
|
|
|
|
|
class LAVT(_LAVTSimpleDecode):
    pass
|
|
|
|
|
|
|
|
|
|
|
class _LAVTOneSimpleDecode(nn.Module):
    """Same decoding scheme as _LAVTSimpleDecode, but with the BERT text
    encoder built into the model instead of receiving language features."""

    def __init__(self, backbone, classifier, args):
        super(_LAVTOneSimpleDecode, self).__init__()
        self.backbone = backbone
        self.classifier = classifier
        # Load the BERT text encoder from the checkpoint given by args.ck_bert.
        # The pooler head is not needed for token-level features, so drop it.
        self.text_encoder = BertModel.from_pretrained(args.ck_bert)
        self.text_encoder.pooler = None

    def forward(self, x, text, l_mask):
        input_shape = x.shape[-2:]

        # Encode the referring expression: take the last hidden states,
        # shaped (B, N_l, C), and permute them to (B, C, N_l) for the backbone.
        l_feats = self.text_encoder(text, attention_mask=l_mask)[0]
        l_feats = l_feats.permute(0, 2, 1)
        # Reshape the attention mask to (B, N_l, 1).
        l_mask = l_mask.unsqueeze(dim=-1)

        # The remainder mirrors _LAVTSimpleDecode: fuse, decode, upsample.
        features = self.backbone(x, l_feats, l_mask)
        x_c1, x_c2, x_c3, x_c4 = features
        x = self.classifier(x_c4, x_c3, x_c2, x_c1)
        x = F.interpolate(x, size=input_shape, mode='bilinear', align_corners=True)

        return x
|
|
|
|
|
class LAVTOne(_LAVTOneSimpleDecode):
    pass
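# Minimal smoke test (a sketch added for illustration; it is not part of the
# training or evaluation pipeline). It runs the LAVT wrapper with dummy
# stand-ins for the backbone and the decode head, so it only checks tensor
# shapes and the decode/upsample plumbing. The channel widths below are
# arbitrary. LAVTOne is not instantiated here because it loads BERT weights
# from args.ck_bert (e.g. a checkpoint such as 'bert-base-uncased').
if __name__ == '__main__':
    class _DummyBackbone(nn.Module):
        # Stand-in for the language-aware visual backbone: returns four
        # feature maps at 1/4, 1/8, 1/16 and 1/32 of the input resolution.
        def forward(self, x, l_feats, l_mask):
            b, _, h, w = x.shape
            return (torch.randn(b, 96, h // 4, w // 4),
                    torch.randn(b, 192, h // 8, w // 8),
                    torch.randn(b, 384, h // 16, w // 16),
                    torch.randn(b, 768, h // 32, w // 32))

    class _DummyHead(nn.Module):
        # Stand-in for the segmentation head: keeps two channels of the
        # deepest feature map as fake logits and ignores the finer scales.
        def forward(self, x_c4, x_c3, x_c2, x_c1):
            return x_c4[:, :2]

    model = LAVT(_DummyBackbone(), _DummyHead())
    imgs = torch.randn(2, 3, 480, 480)
    l_feats = torch.randn(2, 768, 20)  # (B, C_l, N_l) language features
    l_mask = torch.ones(2, 20, 1)      # (B, N_l, 1) attention mask
    print(model(imgs, l_feats, l_mask).shape)  # torch.Size([2, 2, 480, 480])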
|
|