hahnyuan
/

opt-125m-asvd90

Text Generation

text-generation-inference

Model card Files Files and versions

opt-125m-asvd90 / modeling_asvd_opt.py

hahnyuan's picture

Update modeling_asvd_opt.py

f6a6cb1 almost 2 years ago

history blame contribute delete

1.64 kB

	from transformers import OPTForCausalLM
	from .configuration_asvd_opt import ASVDOPTConfig
	import torch.nn as nn

	class ASVDLinear(nn.Module):
	    """Low-rank stand-in for a linear layer, built from two stacked linears.

	    The input is first projected down to ``rank`` features by ``BLinear``
	    (which never has a bias) and then projected to ``out_features`` by
	    ``ALinear`` (which carries the optional bias).
	    """

	    def __init__(self, in_features, out_features, rank, bias=True):
	        """Create the two factor layers.

	        Args:
	            in_features: Size of the last dimension of the input.
	            out_features: Size of the last dimension of the output.
	            rank: Width of the intermediate (bottleneck) projection.
	            bias: Whether ``ALinear`` gets a bias term.
	        """
	        super().__init__()
	        # Creation order (BLinear, then ALinear) fixes the order of the
	        # entries in ``state_dict()`` and must not be swapped.
	        self.BLinear = nn.Linear(
	            in_features=in_features, out_features=rank, bias=False
	        )
	        self.ALinear = nn.Linear(
	            in_features=rank, out_features=out_features, bias=bias
	        )

	    def forward(self, input):
	        """Apply ``BLinear`` followed by ``ALinear`` and return the result."""
	        reduced = self.BLinear(input)
	        return self.ALinear(reduced)

	class ASVDOPTForCausalLM(OPTForCausalLM):
	    """OPT causal LM in which selected linear layers are low-rank pairs.

	    ``config.truncation_ranks`` is used as a mapping from the dotted name of
	    an ``nn.Linear`` submodule (as reported by ``named_modules()``) to the
	    rank given to the ``ASVDLinear`` that replaces it.  The replacements are
	    newly constructed modules; no weights are copied from the layers they
	    replace.
	    """

	    config_class = ASVDOPTConfig

	    def __init__(self, config: ASVDOPTConfig):
	        """Build the base OPT model, then swap in the low-rank layers.

	        Args:
	            config: Model configuration; its ``truncation_ranks`` attribute
	                selects the layers to replace and their ranks.

	        Raises:
	            TypeError: If a name listed in ``truncation_ranks`` refers to a
	                module that is not an ``nn.Linear``.
	        """
	        super().__init__(config)
	        self.truncation_ranks = config.truncation_ranks

	        # A missing (None) mapping is treated as "nothing to replace".
	        ranks = self.truncation_ranks or {}

	        # Snapshot the tree first so that children are never replaced while
	        # the ``named_modules()`` generator is still being consumed.  The
	        # root module is stored under the empty name.
	        modules_by_name = dict(self.named_modules())

	        for full_name, module in modules_by_name.items():
	            if full_name not in ranks:
	                continue
	            if not isinstance(module, nn.Linear):
	                raise TypeError(
	                    f"truncation_ranks entry {full_name!r} refers to a "
	                    f"{type(module).__name__}, expected nn.Linear"
	                )

	            # "a.b.c" -> parent "a.b", attribute "c"; a direct child of the
	            # model has parent name "" which maps to the model itself.
	            parent_name, _, child_name = full_name.rpartition(".")
	            parent = modules_by_name[parent_name]

	            replacement = ASVDLinear(
	                module.in_features,
	                module.out_features,
	                ranks[full_name],
	                # Mirror the replaced layer: only create a bias parameter if
	                # the original linear had one.
	                bias=module.bias is not None,
	            )
	            setattr(parent, child_name, replacement)