flex-math-8192 / configuration_pruned_flex_olmo.py

Upload configuration_pruned_flex_olmo.py with huggingface_hub

00c885c verified 4 months ago

699 Bytes

	"""Configuration for pruned FlexOlmo models with variable-width expert 1."""

	from transformers import FlexOlmoConfig


	class PrunedFlexOlmoConfig(FlexOlmoConfig):
	"""Config for FlexOlmo with a pruned expert 1.

	Extends FlexOlmoConfig with expert_1_intermediate_size to specify
	the width of the pruned expert.
	"""

	model_type = "pruned_flex_olmo"

	def __init__(self, expert_1_intermediate_size: int = None, **kwargs):
	super().__init__(**kwargs)
	# expert_1_intermediate_size: width of pruned expert 1
	# If None, falls back to intermediate_size (no pruning)
	self.expert_1_intermediate_size = expert_1_intermediate_size or self.intermediate_size