"""Package entry point.

Defines ``__version__`` and re-exports selected names from the package's
submodules (``core``, ``environment``, ``extras``, ``import_utils``,
``models``, ``trainer`` and ``trainer.utils``) so they can be imported
directly from the package root.

The DDPO pipeline and trainer names are imported only when
``is_diffusers_available()`` returns a truthy value.
"""

__version__ = "0.7.11.dev0"

# The imports below are intentional re-exports: they are not used in this
# module, they only expose the names at package level.
from .core import set_seed
from .environment import TextEnvironment, TextHistory
from .extras import BestOfNSampler
from .import_utils import (
    is_bitsandbytes_available,
    is_diffusers_available,
    is_npu_available,
    is_peft_available,
    is_wandb_available,
    is_xpu_available,
)
from .models import (
    AutoModelForCausalLMWithValueHead,
    AutoModelForSeq2SeqLMWithValueHead,
    PreTrainedModelWrapper,
    create_reference_model,
    setup_chat_format,
)
from .trainer import (
    DataCollatorForCompletionOnlyLM,
    DPOTrainer,
    IterativeSFTTrainer,
    ModelConfig,
    PPOConfig,
    PPOTrainer,
    RewardConfig,
    RewardTrainer,
    SFTTrainer,
)
from .trainer.utils import get_kbit_device_map, get_peft_config, get_quantization_config


# Guarded import: these names are only bound at package level when the
# availability check passes, so the unconditional imports above do not
# depend on it.
if is_diffusers_available():
    from .models import (
        DDPOPipelineOutput,
        DDPOSchedulerOutput,
        DDPOStableDiffusionPipeline,
        DefaultDDPOStableDiffusionPipeline,
    )
    from .trainer import DDPOConfig, DDPOTrainer