dei-model / src /reasoning /__init__.py
renpas22
Add training scripts and configs
2b8876a
raw
history blame contribute delete
726 Bytes
"""
Step-Level Chain-of-Thought Reasoning for Vision-Language Models.

This module implements fine-grained structured reasoning with process reward
models and reinforcement learning for vision-language tasks.
"""
from .step_data import ReasoningStep, ReasoningChain, StepDataset
from .prm import ProcessRewardModel, StepQualityMetrics
from .rl_trainer import RLReasoningTrainer
from .inference_scaling import InferenceTimeScaling, MajorityVoting
from .step_level_cot import StepLevelCoTTrainer
# Names re-exported by `from <package> import *`, listed in the same order as
# the relative imports above and grouped by the submodule they come from.
__all__ = [
    # .step_data
    "ReasoningStep",
    "ReasoningChain",
    "StepDataset",
    # .prm
    "ProcessRewardModel",
    "StepQualityMetrics",
    # .rl_trainer
    "RLReasoningTrainer",
    # .inference_scaling
    "InferenceTimeScaling",
    "MajorityVoting",
    # .step_level_cot
    "StepLevelCoTTrainer",
]