fcxfcx
/

owlv2

Model card Files Files and versions

owlv2 / scenic /projects /matvit /layers.py

fcxfcx's picture

Upload 2446 files

1327f34 verified 3 months ago

history blame contribute delete

2.49 kB

	# Copyright 2025 The Scenic Authors.
	#
	# Licensed under the Apache License, Version 2.0 (the "License");
	# you may not use this file except in compliance with the License.
	# You may obtain a copy of the License at
	#
	# http://www.apache.org/licenses/LICENSE-2.0
	#
	# Unless required by applicable law or agreed to in writing, software
	# distributed under the License is distributed on an "AS IS" BASIS,
	# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
	# See the License for the specific language governing permissions and
	# limitations under the License.

	"""Customized Mlp block for MatViT.
	"""
	from typing import Any, Callable, Optional, Sequence

	import flax.linen as nn
	import jax
	import jax.numpy as jnp
	from scenic.model_lib.layers import nn_layers

	Initializer = Callable[[jnp.ndarray, Sequence[int], jnp.dtype], jnp.ndarray]


	class MlpBlock(nn.Module):
	  """Two-layer feed-forward (MLP) block with an optional MatViT mask.

	  The block applies, in order: Dense(mlp_dim) -> optional elementwise
	  multiplication by `matvit_mask` -> `activation_fn` -> dropout ->
	  Dense(out_dim) -> dropout. The activated hidden tensor and the second Dense
	  output are each routed through an `nn_layers.IdentityLayer` named 'mlp1'
	  and 'mlp2' respectively.

	  Attributes:
	    mlp_dim: Number of features produced by the first Dense layer.
	    out_dim: Number of features produced by the second Dense layer. When
	      None, the size of the last axis of the inputs is used.
	    dropout_rate: Rate passed to both Dropout layers.
	    use_bias: Forwarded to both Dense layers.
	    kernel_init: Kernel initializer forwarded to both Dense layers.
	    bias_init: Bias initializer forwarded to both Dense layers.
	    activation_fn: Function applied to the (optionally masked) output of the
	      first Dense layer.
	    precision: Forwarded to both Dense layers.
	    dtype: Forwarded to both Dense layers.
	  """

	  mlp_dim: int
	  out_dim: Optional[int] = None
	  dropout_rate: float = 0.1
	  use_bias: bool = True
	  kernel_init: Initializer = nn.initializers.xavier_uniform()
	  bias_init: Initializer = nn.initializers.normal(stddev=1e-6)
	  activation_fn: Callable[[jnp.ndarray], jnp.ndarray] = nn.gelu
	  precision: Optional[jax.lax.Precision] = None
	  # NOTE(review): annotated as jnp.ndarray although the default is a dtype;
	  # left unchanged here to keep the declared interface identical.
	  dtype: jnp.ndarray = jnp.float32

	  @nn.compact
	  def __call__(
	      self,
	      inputs: jnp.ndarray,
	      *,
	      deterministic: bool,
	      matvit_mask: Optional[Any] = None,
	  ):
	    """Runs the MLP block on `inputs`.

	    Args:
	      inputs: Input array; its last axis size is the default output width.
	      deterministic: Forwarded as `deterministic` to both Dropout layers.
	      matvit_mask: Optional value multiplied into the output of the first
	        Dense layer before the activation. Presumably a mask over the hidden
	        units selecting a MatViT sub-width -- TODO confirm with callers.

	    Returns:
	      The output of the second Dense layer after the 'mlp2' identity layer
	      and the final dropout.
	    """
	    # Keyword arguments shared by both Dense layers.
	    dense_kwargs = dict(
	        dtype=self.dtype,
	        use_bias=self.use_bias,
	        kernel_init=self.kernel_init,
	        bias_init=self.bias_init,
	        precision=self.precision,
	    )
	    if self.out_dim is None:
	      actual_out_dim = inputs.shape[-1]
	    else:
	      actual_out_dim = self.out_dim

	    hidden = nn.Dense(self.mlp_dim, **dense_kwargs)(inputs)

	    # Both the masked and unmasked paths go through the same named identity
	    # layer; only the tensor fed to the activation differs.
	    hidden_tap = nn_layers.IdentityLayer(name='mlp1')
	    pre_activation = hidden if matvit_mask is None else hidden * matvit_mask
	    hidden = hidden_tap(self.activation_fn(pre_activation))
	    hidden = nn.Dropout(rate=self.dropout_rate)(
	        hidden, deterministic=deterministic
	    )

	    projected = nn.Dense(actual_out_dim, **dense_kwargs)(hidden)
	    projected = nn_layers.IdentityLayer(name='mlp2')(projected)
	    return nn.Dropout(rate=self.dropout_rate)(
	        projected, deterministic=deterministic
	    )