# flake8: noqa
# NOTE: the directive above must sit on a line of its own. A comment runs to
# the end of its physical line, so any statement sharing that line is never
# executed. It is presumably here because the re-exported names below would
# otherwise be reported as unused imports -- confirm against the lint config.
"""Package entry point.

Defines ``__version__`` and re-exports names from the sibling submodules
(``core``, ``environment``, ``extras``, ``import_utils``, ``models``,
``trainer``) so they can be imported directly from the package.

The DDPO names are imported only when ``is_diffusers_available()`` returns a
truthy value; otherwise they are not defined on the package.
"""

__version__ = "0.7.11.dev0"

from .core import set_seed
from .environment import TextEnvironment, TextHistory
from .extras import BestOfNSampler
from .import_utils import (
    is_bitsandbytes_available,
    is_diffusers_available,
    is_npu_available,
    is_peft_available,
    is_wandb_available,
    is_xpu_available,
)
from .models import (
    AutoModelForCausalLMWithValueHead,
    AutoModelForSeq2SeqLMWithValueHead,
    PreTrainedModelWrapper,
    create_reference_model,
    setup_chat_format,
)
from .trainer import (
    DataCollatorForCompletionOnlyLM,
    DPOTrainer,
    IterativeSFTTrainer,
    ModelConfig,
    PPOConfig,
    PPOTrainer,
    RewardConfig,
    RewardTrainer,
    SFTTrainer,
)
from .trainer.utils import get_kbit_device_map, get_peft_config, get_quantization_config

# These imports are guarded: they only run when the availability check passes,
# so the names below exist on the package only in that case.
if is_diffusers_available():
    from .models import (
        DDPOPipelineOutput,
        DDPOSchedulerOutput,
        DDPOStableDiffusionPipeline,
        DefaultDDPOStableDiffusionPipeline,
    )
    from .trainer import DDPOConfig, DDPOTrainer