# Package initializer: defines the package version and re-exports names from
# the sibling submodules so they can be imported from the package root.

__version__ = "0.7.11.dev0"

from .core import set_seed
from .environment import TextEnvironment, TextHistory
from .extras import BestOfNSampler
from .import_utils import (
    is_bitsandbytes_available,
    is_diffusers_available,
    is_npu_available,
    is_peft_available,
    is_wandb_available,
    is_xpu_available,
)
from .models import (
    AutoModelForCausalLMWithValueHead,
    AutoModelForSeq2SeqLMWithValueHead,
    PreTrainedModelWrapper,
    create_reference_model,
    setup_chat_format,
)
from .trainer import (
    DataCollatorForCompletionOnlyLM,
    DPOTrainer,
    IterativeSFTTrainer,
    ModelConfig,
    PPOConfig,
    PPOTrainer,
    RewardConfig,
    RewardTrainer,
    SFTTrainer,
)
from .trainer.utils import get_kbit_device_map, get_peft_config, get_quantization_config


# These names are imported only when `is_diffusers_available()` returns a
# truthy value; otherwise they are simply absent from the package namespace.
if is_diffusers_available():
    from .models import (
        DDPOPipelineOutput,
        DDPOSchedulerOutput,
        DDPOStableDiffusionPipeline,
        DefaultDDPOStableDiffusionPipeline,
    )
    from .trainer import DDPOConfig, DDPOTrainer