| import os |
|
|
| import torch |
| from transformers import AutoTokenizer |
|
|
| from modeling_reward import load_finetuned_model |
|
|
|
|
| def main(): |
| repo_root = os.path.dirname(os.path.abspath(__file__)) |
| tokenizer = AutoTokenizer.from_pretrained(repo_root) |
| model = load_finetuned_model(repo_root) |
|
|
| sql = "SELECT COUNT(*) FROM orders WHERE status = 'complete';" |
| reasoning = "think: Count rows in orders filtered by status 'complete'." |
| nl = "How many completed orders exist?" |
| text = f"SQL: {sql}\nReasoning: {reasoning}\nNL: {nl}" |
|
|
| inputs = tokenizer(text, return_tensors="pt", truncation=True, max_length=2048) |
| with torch.no_grad(): |
| score = model(**inputs)["scores"].item() |
|
|
| print(f"Reward score: {score:.3f}") |
|
|
|
|
| if __name__ == "__main__": |
| main() |
|
|
|
|