lingbot-vla / lingbotvla /utils /seqlen_pos_transform_utils.py

Upload folder using huggingface_hub

fb11af9 verified about 2 months ago

1.92 kB

	# Copyright 2025 Bytedance Ltd. and/or its affiliates
	#
	# Licensed under the Apache License, Version 2.0 (the "License");
	# you may not use this file except in compliance with the License.
	# You may obtain a copy of the License at
	#
	# http://www.apache.org/licenses/LICENSE-2.0
	#
	# Unless required by applicable law or agreed to in writing, software
	# distributed under the License is distributed on an "AS IS" BASIS,
	# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
	# See the License for the specific language governing permissions and
	# limitations under the License.


	import torch
	import torch.nn.functional as F


	def len2culen(seqlens: "torch.Tensor") -> "torch.Tensor":
	"""
	Converts the sequence lengths to cumulative sequence lengths.

	NOTE: flash attention only accepts int32 cu_seqlens.
	"""
	return F.pad(torch.cumsum(seqlens, dim=0), (1, 0)).type(torch.int32)


	def culen2len(cu_seqlens: "torch.Tensor") -> "torch.Tensor":
	"""
	Converts the cumulative sequence lengths to sequence lengths.
	"""
	return cu_seqlens.diff()


	def pos2culen(position_ids: "torch.Tensor") -> "torch.Tensor":
	"""
	Converts the position ids to cumulative sequence lengths.
	"""
	if position_ids.dim() == 3: # (batch_size, dim, seq_length):
	position_ids = position_ids[:, 0, :]

	position_ids = position_ids.flatten()
	indices_q = torch.arange(position_ids.size(0), dtype=torch.int32, device=position_ids.device)
	return F.pad(indices_q[position_ids == 0], (0, 1), "constant", position_ids.size(0))


	def culen2pos(cu_seqlens: "torch.Tensor") -> "torch.Tensor":
	"""
	Converts the cumulative sequence lengths to position ids.
	"""
	seqlens = culen2len(cu_seqlens).cpu()
	position_ids = torch.cat([torch.arange(length, dtype=torch.long, device=cu_seqlens.device) for length in seqlens])
	return position_ids.unsqueeze(0)