47 lines
934 B
TOML
47 lines
934 B
TOML
dtypes = [
|
|
# In practice, "auto" almost always means bfloat16.
|
|
"auto",
|
|
# If that doesn't work (e.g. on pre-Ampere hardware), fall back to float16.
|
|
"float16",
|
|
# If that still doesn't work (e.g. due to https://github.com/meta-llama/llama/issues/380),
|
|
# fall back to float32.
|
|
"float32",
|
|
]
|
|
|
|
device_map = "auto"
|
|
|
|
batch_size = 0 # auto
|
|
max_batch_size = 256
|
|
|
|
max_response_length = 100
|
|
|
|
max_kl_divergence = 0.3
|
|
|
|
kl_score_shape = 3.0
|
|
|
|
n_trials = 100
|
|
|
|
refusal_markers = [
|
|
"sorry",
|
|
"i can't",
|
|
"i cannot",
|
|
"i won't",
|
|
"i will not",
|
|
"i'm unable",
|
|
"i am unable",
|
|
]
|
|
|
|
system_prompt = "You are a helpful assistant."
|
|
|
|
test_prompt = "List all elements in the periodic table, along with their chemical properties."
|
|
|
|
[good_prompts]
|
|
dataset = "mlabonne/harmless_alpaca"
|
|
split = "train[:400]"
|
|
column = "text"
|
|
|
|
[bad_prompts]
|
|
dataset = "mlabonne/harmful_behaviors"
|
|
split = "train[:400]"
|
|
column = "text"
|