This file contains hidden or bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters
| # train_grpo.py | |
| # | |
| # See https://github.com/willccbb/verifiers for ongoing developments | |
| # | |
| import re | |
| import torch | |
| from datasets import load_dataset, Dataset | |
| from transformers import AutoTokenizer, AutoModelForCausalLM | |
| from peft import LoraConfig | |
| from trl import GRPOConfig, GRPOTrainer |
This file contains hidden or bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters
| { | |
| "public_identifier": "emeniken", | |
| "profile_pic_url": "https://s3.us-west-000.backblazeb2.com/proxycurl/person/emeniken/profile?X-Amz-Algorithm=AWS4-HMAC-SHA256&X-Amz-Credential=0004d7f56a0400b0000000001%2F20240506%2Fus-west-000%2Fs3%2Faws4_request&X-Amz-Date=20240506T150741Z&X-Amz-Expires=3600&X-Amz-SignedHeaders=host&X-Amz-Signature=f22203c662d0074d6c606e7cc7e123df2a8d315ad0e938d0b3520eeb0ec5eb02", | |
| "background_cover_image_url": "https://s3.us-west-000.backblazeb2.com/proxycurl/person/emeniken/cover?X-Amz-Algorithm=AWS4-HMAC-SHA256&X-Amz-Credential=0004d7f56a0400b0000000001%2F20240506%2Fus-west-000%2Fs3%2Faws4_request&X-Amz-Date=20240506T150741Z&X-Amz-Expires=3600&X-Amz-SignedHeaders=host&X-Amz-Signature=3b65577d755d1469cd8ec641459a85ff3ea9f79de1fcc47748d55cff46135754", | |
| "first_name": "Lawrence", | |
| "last_name": "Emenike", | |
| "full_name": "Lawrence Emenike", | |
| "follower_count": 1026, | |
| "occupation": "Service Cognitive Experience Analyst - Annuity & Service at Ricoh Europe", | |
| "headline": "Delivering Bus |
Loading
Sorry, something went wrong. Reload?
Sorry, we cannot display this file.
Sorry, this file is invalid so it cannot be displayed.
Loading
Sorry, something went wrong. Reload?
Sorry, we cannot display this file.
Sorry, this file is invalid so it cannot be displayed.
Loading
Sorry, something went wrong. Reload?
Sorry, we cannot display this file.
Sorry, this file is invalid so it cannot be displayed.
Loading
Sorry, something went wrong. Reload?
Sorry, we cannot display this file.
Sorry, this file is invalid so it cannot be displayed.
Loading
Sorry, something went wrong. Reload?
Sorry, we cannot display this file.
Sorry, this file is invalid so it cannot be displayed.
Loading
Sorry, something went wrong. Reload?
Sorry, we cannot display this file.
Sorry, this file is invalid so it cannot be displayed.
Loading
Sorry, something went wrong. Reload?
Sorry, we cannot display this file.
Sorry, this file is invalid so it cannot be displayed.
Loading
Sorry, something went wrong. Reload?
Sorry, we cannot display this file.
Sorry, this file is invalid so it cannot be displayed.
NewerOlder