RM-Gallery

logger

RM-Gallery

GitHub

Overview
Tutorials
Tutorials
- Data
  Data
  - Annotation
  - Load
  - Pipeline
  - Process
- Train RM
- Build RM
  Build RM
- RM Server
- Application
  Application
Contribution
API Reference
API Reference
- rm_gallery
  rm_gallery
  - core
    core
    
    base
    
    data
    data
    
    annotation
    annotation
    
    annotation
    
    client
    
    server
    
    template
    
    base
    
    build
    
    export
    
    load
    load
    
    base
    
    chat_message
    
    huggingface
    
    process
    process
    
    ops
    ops
    
    base
    
    filter
    filter
    
    conversation_turn_filter
    
    text_length_filter
    
    process
    
    schema
    
    model
    model
    
    base
    
    huggingface_llm
    
    message
    
    openai_llm
    
    reward
    reward
    
    base
    
    composition
    
    principle
    principle
    
    auto
    
    cumulative
    
    iterative
    
    refinement
    
    registry
    
    schema
    
    template
    
    train
    train
    
    dataset
    
    utils
    utils
    
    acc
    
    file
    
    logger logger
    Table of contents
    
    logger
    
    text
    
    tokenizer
  - gallery
    gallery
    
    data
    data
    
    annotation
    annotation
    
    rewardbench
    
    rewardbench2
    
    load
    load
    
    helpsteer2_pairwise
    
    helpsteer2_pointwise
    
    prmbench
    
    rewardbench
    
    rewardbench2
    
    rmbbenchmark_bestofn
    
    rmbbenchmark_pairwise
    
    rm
    rm
    
    alignment
    alignment
    
    base
    
    harmlessness
    harmlessness
    
    detoxification
    
    safety
    
    helpfulness
    helpfulness
    
    brainstorming
    
    chat
    
    classification
    
    closed_qa
    
    code
    
    focus
    
    generation
    
    math
    
    open_qa
    
    precise_if
    
    reasoning
    
    rewrite
    
    role_playing
    
    summarization
    
    translation
    
    honesty
    honesty
    
    factuality
    
    carmo
    
    code
    code
    
    code
    
    prime_code
    prime_code
    
    testing_util
    
    utils
    
    format
    format
    
    format
    
    general
    
    math
    math
    
    math