-
Notifications
You must be signed in to change notification settings - Fork 3
/
Copy pathconfig.py
46 lines (44 loc) · 1.97 KB
/
config.py
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
class PreAttackConfig:
    """Plain settings holder for the pre-attack stage.

    Each constructor argument is stored unchanged on the instance under the
    same name. Nothing is opened, read, or validated here; interpreting the
    values is left to whatever code consumes this object.

    Args:
        model_name: Model identifier string.
        actor_num: Integer setting; presumably the number of actors to
            generate -- confirm against the consumer.
        behavior_csv: Path string pointing at a CSV file.
        extract_prompt: Path string of the "extract" prompt text file.
        network_prompt: Path string of the "network" prompt text file.
        actor_prompt: Path string of the "actor" prompt text file.
        query_prompt: Path string of the "queries" prompt text file.
        json_format_prompt: Path string of the "json format" prompt text file.
        more_actor_prompt: Path string of the "more actor" prompt text file.
    """

    def __init__(
        self,
        model_name: str = 'gpt-4o',
        actor_num: int = 3,
        behavior_csv: str = './data/harmbench.csv',
        extract_prompt: str = './prompts/1_extract.txt',
        network_prompt: str = './prompts/2_network.txt',
        actor_prompt: str = './prompts/3_actor.txt',
        query_prompt: str = './prompts/4_queries.txt',
        json_format_prompt: str = './prompts/5_json_format.txt',
        more_actor_prompt: str = './prompts/3_more_actor.txt',
    ) -> None:
        self.model_name = model_name
        self.actor_num = actor_num
        self.behavior_csv = behavior_csv
        self.extract_prompt = extract_prompt
        self.network_prompt = network_prompt
        # query_prompt is assigned before actor_prompt on purpose: this keeps
        # the instance ``__dict__`` ordering stable for anything that
        # iterates ``vars(config)``.
        self.query_prompt = query_prompt
        self.actor_prompt = actor_prompt
        self.json_format_prompt = json_format_prompt
        self.more_actor_prompt = more_actor_prompt

    def __repr__(self) -> str:
        """Return ``ClassName(attr=value, ...)`` built from instance attributes."""
        rendered = ", ".join(
            f"{name}={value!r}" for name, value in vars(self).items()
        )
        return f"{type(self).__name__}({rendered})"
class InAttackConfig:
    """Plain settings holder for the in-attack stage.

    Each constructor argument is stored unchanged on the instance under the
    same name. No file access or validation happens in this class.

    Args:
        attack_model_name: Identifier string of the attacking model.
        target_model_name: Identifier string of the target model.
        pre_attack_data_path: Path string; empty by default, so callers are
            presumably expected to supply it -- confirm against the consumer.
        step_judge_prompt: Path string of the step-judge prompt text file.
        modify_prompt: Path string of the modify prompt text file.
        early_stop: Boolean flag; its effect is decided by the consumer.
        dynamic_modify: Boolean flag; its effect is decided by the consumer.
    """

    def __init__(
        self,
        attack_model_name: str = 'gpt-4o',
        target_model_name: str = 'gpt-4o',
        pre_attack_data_path: str = '',
        step_judge_prompt: str = './prompts/attack_step_judge.txt',
        modify_prompt: str = './prompts/attack_modify.txt',
        early_stop: bool = True,
        dynamic_modify: bool = True,
    ) -> None:
        self.attack_model_name = attack_model_name
        self.target_model_name = target_model_name
        self.pre_attack_data_path = pre_attack_data_path
        self.step_judge_prompt = step_judge_prompt
        self.modify_prompt = modify_prompt
        self.early_stop = early_stop
        self.dynamic_modify = dynamic_modify

    def __repr__(self) -> str:
        """Return ``ClassName(attr=value, ...)`` built from instance attributes."""
        rendered = ", ".join(
            f"{name}={value!r}" for name, value in vars(self).items()
        )
        return f"{type(self).__name__}({rendered})"
class DatasetConfig:
    """Plain settings holder for the dataset-building stage.

    Each constructor argument is stored unchanged on the instance under the
    same name. No file access or validation happens in this class.

    Args:
        attack_data_file: Path string; empty by default, so callers are
            presumably expected to supply it -- confirm against the consumer.
        safe_prompt: Path string of the safe-response prompt text file.
        safe_model_name: Model identifier string.
    """

    def __init__(
        self,
        attack_data_file: str = '',
        safe_prompt: str = 'prompts/get_safe_response.txt',
        safe_model_name: str = 'deepseek-chat',
    ) -> None:
        self.attack_data_file = attack_data_file
        self.safe_prompt = safe_prompt
        self.safe_model_name = safe_model_name

    def __repr__(self) -> str:
        """Return ``ClassName(attr=value, ...)`` built from instance attributes."""
        rendered = ", ".join(
            f"{name}={value!r}" for name, value in vars(self).items()
        )
        return f"{type(self).__name__}({rendered})"