ihbkaiser
/

trl-mcsd

Model card Files Files and versions

trl-mcsd / trl /__init__.py

ihbkaiser's picture

Implement MCSD for experimental SDPO

1fa3c6c verified about 1 month ago

history blame contribute delete

3.87 kB

	# Copyright 2020-2026 The HuggingFace Team. All rights reserved.
	#
	# Licensed under the Apache License, Version 2.0 (the "License");
	# you may not use this file except in compliance with the License.
	# You may obtain a copy of the License at
	#
	# http://www.apache.org/licenses/LICENSE-2.0
	#
	# Unless required by applicable law or agreed to in writing, software
	# distributed under the License is distributed on an "AS IS" BASIS,
	# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
	# See the License for the specific language governing permissions and
	# limitations under the License.

	import sys
	from importlib.metadata import PackageNotFoundError, version
	from typing import TYPE_CHECKING

	from . import _compat
	from ._lazy_module import _LazyModule


	# Expose the version of the installed "trl" distribution as ``__version__``.
	# ``importlib.metadata.version`` reads it from the distribution metadata, so
	# it is only available when the package has actually been installed.
	try:
	    __version__ = version("trl")
	except PackageNotFoundError:
	    # No distribution metadata named "trl" was found; use a placeholder
	    # string so that ``__version__`` is always defined.
	    __version__ = "unknown"

	# Mapping of submodule name -> public names re-exported from that submodule.
	# The same names are imported eagerly under ``TYPE_CHECKING`` further down and
	# the mapping itself is handed to ``_LazyModule``; keep both in sync when
	# adding or removing an entry.
	_import_structure = {
	    # Chat-template helpers.
	    "chat_template_utils": [
	        "add_response_schema",
	        "clone_chat_template",
	        "get_training_chat_template",
	        "supports_tool_calling",
	    ],
	    # Dataset preparation helpers.
	    "data_utils": [
	        "apply_chat_template",
	        "extract_prompt",
	        "is_conversational",
	        "is_conversational_from_value",
	        "maybe_apply_chat_template",
	        "maybe_convert_to_chatml",
	        "maybe_extract_prompt",
	        "maybe_unpair_preference_dataset",
	        "pack_dataset",
	        "prepare_multimodal_messages",
	        "prepare_multimodal_messages_vllm",
	        "unpair_preference_dataset",
	    ],
	    "models": ["create_reference_model"],
	    "scripts": ["DatasetMixtureConfig", "ScriptArguments", "TrlParser", "get_dataset", "init_zero_verbose"],
	    # Trainers, their configs, callbacks and model-loading helpers.
	    "trainer": [
	        "BEMACallback",
	        "DPOConfig",
	        "DPOTrainer",
	        "GRPOConfig",
	        "GRPOTrainer",
	        "KTOConfig",
	        "KTOTrainer",
	        "LogCompletionsCallback",
	        "ModelConfig",
	        "RewardConfig",
	        "RewardTrainer",
	        "RichProgressCallback",
	        "RLOOConfig",
	        "RLOOTrainer",
	        "SFTConfig",
	        "SFTTrainer",
	        "SyncRefModelCallback",
	        "WeaveCallback",
	        "get_kbit_device_map",
	        "get_peft_config",
	        "get_quantization_config",
	    ],
	}

	# Two views of the same public API:
	#   * under ``TYPE_CHECKING`` the names are imported for real, so static
	#     analyzers and IDEs can resolve them;
	#   * at runtime this module's entry in ``sys.modules`` is replaced by a
	#     ``_LazyModule`` built from ``_import_structure``.
	# The names imported here must mirror ``_import_structure`` exactly.
	if TYPE_CHECKING:
	    from .chat_template_utils import (
	        add_response_schema,
	        clone_chat_template,
	        get_training_chat_template,
	        supports_tool_calling,
	    )
	    from .data_utils import (
	        apply_chat_template,
	        extract_prompt,
	        is_conversational,
	        is_conversational_from_value,
	        maybe_apply_chat_template,
	        maybe_convert_to_chatml,
	        maybe_extract_prompt,
	        maybe_unpair_preference_dataset,
	        pack_dataset,
	        prepare_multimodal_messages,
	        prepare_multimodal_messages_vllm,
	        unpair_preference_dataset,
	    )
	    from .models import create_reference_model
	    from .scripts import DatasetMixtureConfig, ScriptArguments, TrlParser, get_dataset, init_zero_verbose
	    from .trainer import (
	        BEMACallback,
	        DPOConfig,
	        DPOTrainer,
	        GRPOConfig,
	        GRPOTrainer,
	        KTOConfig,
	        KTOTrainer,
	        LogCompletionsCallback,
	        ModelConfig,
	        RewardConfig,
	        RewardTrainer,
	        RichProgressCallback,
	        RLOOConfig,
	        RLOOTrainer,
	        SFTConfig,
	        SFTTrainer,
	        SyncRefModelCallback,
	        WeaveCallback,
	        get_kbit_device_map,
	        get_peft_config,
	        get_quantization_config,
	    )
	else:
	    # ``sys`` is already imported at the top of the file, so it is not
	    # re-imported here.
	    # NOTE(review): ``_LazyModule`` presumably defers importing each submodule
	    # until one of its names is first accessed - confirm in ``_lazy_module``.
	    sys.modules[__name__] = _LazyModule(
	        __name__,
	        globals()["__file__"],
	        _import_structure,
	        module_spec=__spec__,
	        # Keep ``trl.__version__`` reachable on the replacement module object.
	        extra_objects={"__version__": __version__},
	    )