msj19
/

org_gdn_1B

Model card Files Files and versions

org_gdn_1B / fla2 /ops /gla /recurrent_fuse.py

msj19's picture

Add files using upload-large-folder tool

120b798 verified about 1 month ago

history blame contribute delete

784 Bytes

	# -- coding: utf-8 --

	# Copyright (c) 2023, Songlin Yang

	from typing import Tuple

	import torch
	import triton
	import triton.language as tl
	from ...utils import autocast_custom_bwd, autocast_custom_fwd, contiguous
	from ...ops.common.fused_recurrent import fused_recurrent

	def fused_recurrent_gla(
	q: torch.Tensor,
	k: torch.Tensor,
	v: torch.Tensor,
	gk: torch.Tensor = None,
	gv: torch.Tensor = None,
	scale: int = None,
	initial_state: torch.Tensor = None,
	output_final_state: bool = False,
	reverse: bool = False
	) -> Tuple[torch.Tensor, torch.Tensor]:
	if scale is None:
	scale = q.shape[-1] ** -0.5
	o, final_state = fused_recurrent(q, k, v, None, gk, gv, scale, initial_state, output_final_state, reverse)
	return o, final_state