From 1f2f8da5068f330064682f19731521c0da6f5655 Mon Sep 17 00:00:00 2001 From: Rachel Hu Date: Sun, 5 Nov 2023 22:36:36 -0800 Subject: [PATCH] update datasets version and update step 3 rl dataset_name to cambioml --- example/rlhf/demo_rl.py | 4 ++-- pyproject.toml | 2 +- 2 files changed, 3 insertions(+), 3 deletions(-) diff --git a/example/rlhf/demo_rl.py b/example/rlhf/demo_rl.py index 79e8d2f..3e80f18 100644 --- a/example/rlhf/demo_rl.py +++ b/example/rlhf/demo_rl.py @@ -1,7 +1,7 @@ """ accelerate config -LOCAL_DIR=/home/ubuntu/pykoi/pykoi # change this to your local path +LOCAL_DIR=/home/ubuntu/pykoi # change this to your local path export PYTHONPATH=$PYTHONPATH:${LOCAL_DIR} @@ -17,7 +17,7 @@ config = RLHFConfig( base_model_path="models/rlhf_step1_sft", #"elinas/llama-7b-hf-transformers-4.29", dataset_type="huggingface", - dataset_name="goldmermaid/stack_exchange_rank_10k_dataset", + dataset_name="cambioml/stack_exchange_rank_10k_dataset", dataset_subset_rl="data", reward_model_path="models/rlhf_step2_rw/", #"cambioml/rlhf_reward_model", save_freq=1, diff --git a/pyproject.toml b/pyproject.toml index f473e1d..f1f66a1 100644 --- a/pyproject.toml +++ b/pyproject.toml @@ -37,7 +37,7 @@ python-multipart = { version = "0.0.6", optional = true } tiktoken = { version = "0.4.0", optional = true } sentence-transformers = { version = "2.2.2", optional = true } -datasets = { version = "2.13.1", optional = true } +datasets = { version = "2.14.5", optional = true } evaluate = { version = "0.4.0", optional = true } peft = { version = "0.5.0", optional = true } trl = { version = "0.4.7", optional = true }