RubricARM
Collection
2 items
•
Updated
Fine-tuned checkpoint for rubric-based reward modeling and judging.
from transformers import AutoModelForCausalLM, AutoTokenizer
# Checkpoint identifier handed to both from_pretrained() calls below.
# NOTE(review): looks like a Hugging Face Hub repo id ("org/name") — confirm.
model_id = "OpenRubrics/RubricARM-8B-Rubric"
# Load the tokenizer for this checkpoint; use_fast=True asks for the fast
# tokenizer implementation.
tok = AutoTokenizer.from_pretrained(model_id, use_fast=True)
# Load the causal-LM model for the same checkpoint. torch_dtype="auto" leaves
# the dtype choice to the library (presumably the dtype recorded with the
# checkpoint — confirm against the transformers documentation).
model = AutoModelForCausalLM.from_pretrained(model_id, torch_dtype="auto")