Spaces: Running on Zero

Riddhi Bhagwat committed
Commit · 1893204
Parent(s): 67312ac

organization of files & debugging reward_eval file

Browse files:
- ml/eval/data_transform_pipeline.py +0 -80
- ml/eval/reward_eval.py +14 -16
- ml/eval/tempCodeRunnerFile.py +0 -0
ml/eval/data_transform_pipeline.py
DELETED
@@ -1,80 +0,0 @@
-import pandas as pd
-import numpy as np
-
-# NOTE: names of preset cols may be different based on dataset, this is just a generalized pipeline
-
-CHOSEN_COLUMN = 'chosen'  # name of col with chosen responses
-REJECTED_COLUMN = 'rejected'  # name of col with rejected responses
-COLUMNS_TO_DROP = ['metadata', 'timestamp', 'id']  # cols to remove
-
-def transform_rlhf_dataset(df, chosen_col=CHOSEN_COLUMN, rejected_col=REJECTED_COLUMN, drop_cols=COLUMNS_TO_DROP):
-    """
-    Parameters:
-        df (pandas.DataFrame): Input dataframe with chosen and rejected columns
-        chosen_col (str): Name of column containing chosen responses
-        rejected_col (str): Name of column containing rejected responses
-        drop_cols (list): List of column names to drop from the dataset
-
-    Returns:
-        pandas.DataFrame: Transformed dataset with 'text' and 'label' columns
-    """
-    df = df.copy()
-
-    existing_cols_to_drop = [col for col in drop_cols if col in df.columns]
-    if existing_cols_to_drop:
-        df = df.drop(columns=existing_cols_to_drop)
-
-    preserved_cols = [col for col in df.columns if col not in [chosen_col, rejected_col]]
-
-    # two separate dataframes for liked and disliked
-    liked_df = df[[chosen_col]].copy()
-    liked_df.columns = ['text']
-    liked_df['label'] = 'liked'
-
-    disliked_df = df[[rejected_col]].copy()
-    disliked_df.columns = ['text']
-    disliked_df['label'] = 'disliked'
-
-    for col in preserved_cols:
-        liked_df[col] = df[col]
-    for col in preserved_cols:
-        disliked_df[col] = df[col]
-
-    # combine + shuffle
-    transformed_df = pd.concat([liked_df, disliked_df], ignore_index=True)
-    transformed_df = transformed_df.dropna(subset=['text'])
-    transformed_df = transformed_df.sample(frac=1).reset_index(drop=True)
-
-    # reordering
-    column_order = ['text', 'label'] + preserved_cols
-    transformed_df = transformed_df[column_order]
-
-    return transformed_df
-
-def test_example():
-    example_data = {
-        'chosen': ['This is a good response', 'Another good one'],
-        'rejected': ['This is a bad response', 'Another bad one'],
-        'metadata': ['meta1', 'meta2'],
-        'timestamp': ['2024-01-01', '2024-01-02'],
-        'id': [1, 2]
-    }
-
-    df = pd.DataFrame(example_data)
-    transformed_df = transform_rlhf_dataset(
-        df,
-        chosen_col='chosen',
-        rejected_col='rejected',
-        drop_cols=['metadata', 'id']
-    )
-
-    print("Original shape:", df.shape)
-    print("\nTransformed shape:", transformed_df.shape)
-    print("\nTransformation sample:")
-    print(transformed_df.head())
-    print("\nLabel distribution:")
-    print(transformed_df['label'].value_counts())
-
-if __name__ == "__main__":
-    test_example()
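The deleted helper above is self-contained, so its unpairing step is easy to recreate elsewhere. As a minimal sketch of equivalent behavior (not part of this commit), pandas.melt collapses the chosen/rejected pair into the same long text/label format; the id column here stands in for whatever metadata the caller preserves:

import pandas as pd

# Minimal sketch: unpair a preference dataset into (text, label) rows,
# equivalent in spirit to the deleted transform_rlhf_dataset().
df = pd.DataFrame({
    'chosen': ['This is a good response', 'Another good one'],
    'rejected': ['This is a bad response', 'Another bad one'],
    'id': [1, 2],
})

long_df = df.melt(
    id_vars=['id'],                     # columns to preserve on every row
    value_vars=['chosen', 'rejected'],  # paired response columns
    var_name='label',
    value_name='text',
)
# map source column names to the labels the deleted pipeline used
long_df['label'] = long_df['label'].map({'chosen': 'liked', 'rejected': 'disliked'})
long_df = long_df.dropna(subset=['text']).sample(frac=1).reset_index(drop=True)
print(long_df[['text', 'label', 'id']])

melt carries the id_vars columns onto every output row, which matches the preserved_cols copy loop in the deleted function.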
ml/eval/reward_eval.py
CHANGED
@@ -3,10 +3,8 @@ import os
 from typing import Any, Dict, List
 import json
 import torch
-import
-from transformers import AutoModelForCausalLM, AutoTokenizer, AutoModelForSequenceClassification
+from transformers import AutoModelForCausalLM, AutoTokenizer, CohereConfig, AutoModel
 from accelerate import Accelerator
-from trl import KTOConfig, KTOTrainer, ModelConfig, get_peft_config, maybe_unpair_preference_dataset, setup_chat_format
 from tqdm import tqdm
 
 # Add script directory to system path for importing local modules
@@ -24,7 +22,7 @@ def create_model(model_name: str):
     """
     loads pre-trained reward model and moves it onto device
     """
-    model =
+    model = AutoModelForCausalLM.from_pretrained(model_name, torch_dtype=torch.bfloat16, attn_implementation="flash_attention_2", num_labels=1).to("cuda")
     return model
 
 
@@ -91,10 +89,10 @@ def process_evaluation(args, model_name: str, eval_data_list_dict) -> List[Dict[str, Any]]:
     """
     Main function for processing evaluation, takes model name as input.
     """
-    mixed_precision = 'bf16' if args.bfloat16 else 'fp16'
-
+    # mixed_precision = 'bf16' if args.bfloat16 else 'fp16'
+
     # Initialize accelerator and model
-    accelerator = MyAccelerator(mixed_precision)
+    # accelerator = MyAccelerator(mixed_precision)
     model = create_model(model_name)
     tokenizer = create_tokenizer(model_name)
 
@@ -111,15 +109,15 @@ def process_evaluation(args, model_name: str, eval_data_list_dict) -> List[Dict[str, Any]]:
 
 # ONLY FOR TESTING:
 if __name__ == '__main__':
-    args =
-
-
-
-
-
-
-
+    args = EvalArguments(bfloat16=True,
+                         reward_output_fmt='1-0',
+                         apply_sigmoid_to_reward=False,
+                         per_device_batch_size=8,
+                         output_filepath='/path/to/your/data.json',
+                         result_filename=None,
+                         model_name_or_path="CohereForAI/aya-expanse-8b")
+
 
     eval_data_list_dict = [{"prompt": "How are you?", "output": "I'm doing great!"}, {"prompt": "What's your name?", "output": "Assistant"}]
 
-    process_evaluation(args, model_name="CohereForAI/aya-
+    process_evaluation(args, model_name="CohereForAI/aya-expanse-8b", eval_data_list_dict=eval_data_list_dict)
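One caveat worth flagging on the new create_model(): num_labels configures a classification head, and AutoModelForCausalLM does not attach one, so the committed call still returns vocabulary logits rather than a scalar reward. If a scalar reward head is the intent, a sequence-classification variant along the following lines is the usual pattern. This is a hedged sketch, not what the commit does: it assumes the checkpoint's architecture registers a *ForSequenceClassification class (the Cohere family may not), and create_reward_model / score are illustrative names, not from the diff:

import torch
from transformers import AutoModelForSequenceClassification, AutoTokenizer

def create_reward_model(model_name: str = "CohereForAI/aya-expanse-8b"):
    # Assumption: the architecture provides a sequence-classification head;
    # if it does not, a value head on the base model is the usual fallback.
    model = AutoModelForSequenceClassification.from_pretrained(
        model_name,
        num_labels=1,               # one logit per sequence, used as the reward
        torch_dtype=torch.bfloat16,
    )
    return model.to("cuda" if torch.cuda.is_available() else "cpu")

def score(model, tokenizer, prompt: str, output: str) -> float:
    # Hypothetical helper: scalar reward for a single (prompt, output) pair.
    inputs = tokenizer(prompt + output, return_tensors="pt").to(model.device)
    with torch.no_grad():
        logits = model(**inputs).logits  # shape (1, 1)
    return logits.squeeze().item()

# usage sketch:
# tokenizer = AutoTokenizer.from_pretrained("CohereForAI/aya-expanse-8b")
# model = create_reward_model()
# print(score(model, tokenizer, "How are you?", "I'm doing great!"))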
ml/eval/tempCodeRunnerFile.py
ADDED
File without changes