output_dir: /home/toolkit/huggingface/openai_summarize_tldr_rbaseline train_split: train eval_split: valid[:2000] ### model_name: mnoukhov/pythia410m-tldr-sft-rm-adapter new_column_name: reward_baseline dataset_name: CarperAI/openai_summarize_tldr load_in_8bit: False fp16: True batch_size: 32 max_length: 560