File size: 726 Bytes
"""
Step-Level Chain-of-Thought Reasoning for Vision-Language Models.

This module implements fine-grained structured reasoning with process reward
models and reinforcement learning for vision-language tasks.
"""
from .step_data import ReasoningStep, ReasoningChain, StepDataset
from .prm import ProcessRewardModel, StepQualityMetrics
from .rl_trainer import RLReasoningTrainer
from .inference_scaling import InferenceTimeScaling, MajorityVoting
from .step_level_cot import StepLevelCoTTrainer
# Public API: the names exported by a star-import of this module. Entries are
# grouped by the submodule they are imported from, in import order.
__all__ = [
    # .step_data
    "ReasoningStep",
    "ReasoningChain",
    "StepDataset",
    # .prm
    "ProcessRewardModel",
    "StepQualityMetrics",
    # .rl_trainer
    "RLReasoningTrainer",
    # .inference_scaling
    "InferenceTimeScaling",
    "MajorityVoting",
    # .step_level_cot
    "StepLevelCoTTrainer",
]
|