-
Notifications
You must be signed in to change notification settings - Fork 0
Expand file tree
/
Copy pathevaluation_dataset.json
More file actions
142 lines (142 loc) · 4.92 KB
/
evaluation_dataset.json
File metadata and controls
142 lines (142 loc) · 4.92 KB
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
129
130
131
132
133
134
135
136
137
138
139
140
141
142
[
{
"content": "Hey! I noticed we both love hiking. What's your favorite trail?",
"expected_score_range": [1, 2],
"expected_action": "approve",
"violation_type": "none",
"reasoning": "Appropriate opener referencing shared interests"
},
{
"content": "Hey sexy, want to hook up tonight?",
"expected_score_range": [8, 10],
"expected_action": "reject",
"violation_type": "sexual_harassment",
"reasoning": "Explicit sexual advance, violates consent and boundaries"
},
{
"content": "You're absolutely gorgeous! Would love to take you to dinner this weekend.",
"expected_score_range": [2, 4],
"expected_action": "approve_with_monitoring",
"violation_type": "none",
"reasoning": "Appearance-focused compliment plus a respectful date request; appropriate for a dating app, with light monitoring because the opener leads with looks"
},
{
"content": "Send me your address so I can pick you up",
"expected_score_range": [6, 8],
"expected_action": "warning",
"violation_type": "privacy_violation",
"reasoning": "Premature request for personal information, safety concern"
},
{
"content": "What's your phone number? Need to text you properly",
"expected_score_range": [5, 7],
"expected_action": "warning",
"violation_type": "boundary_pushing",
"reasoning": "Premature request for contact info; pushes boundaries"
},
{
"content": "I make $200k and drive a Tesla, you interested?",
"expected_score_range": [3, 5],
"expected_action": "approve_with_monitoring",
"violation_type": "mild_inappropriate",
"reasoning": "Superficial approach but not explicitly harmful"
},
{
"content": "F*** you b****, you're ugly anyway",
"expected_score_range": [9, 10],
"expected_action": "immediate_ban",
"violation_type": "harassment",
"reasoning": "Clear harassment and abusive language"
},
{
"content": "Coffee this week? I know a great place downtown",
"expected_score_range": [1, 2],
"expected_action": "approve",
"violation_type": "none",
"reasoning": "Appropriate, respectful date suggestion"
},
{
"content": "Are you real? You look too good to be true",
"expected_score_range": [2, 4],
"expected_action": "approve",
"violation_type": "none",
"reasoning": "Common dating app compliment, not harmful"
},
{
"content": "I don't usually message first but your profile caught my eye",
"expected_score_range": [1, 2],
"expected_action": "approve",
"violation_type": "none",
"reasoning": "Respectful, genuine opener"
},
{
"content": "Why haven't you responded? Are you ignoring me?",
"expected_score_range": [5, 7],
"expected_action": "warning",
"violation_type": "pressure_tactics",
"reasoning": "Shows entitlement, pressuring behavior"
},
{
"content": "I know where you work, I looked you up online",
"expected_score_range": [8, 10],
"expected_action": "immediate_action",
"violation_type": "stalking_behavior",
"reasoning": "Stalking behavior, major safety concern"
},
{
"content": "Your pictures are cute but you look different in person",
"expected_score_range": [4, 6],
"expected_action": "approve_with_monitoring",
"violation_type": "mild_harassment",
"reasoning": "Backhanded compliment, mildly inappropriate"
},
{
"content": "I'm looking for something serious, not just a hookup",
"expected_score_range": [1, 2],
"expected_action": "approve",
"violation_type": "none",
"reasoning": "Clear communication of intentions, appropriate"
},
{
"content": "Can you send me more photos? The ones on your profile aren't enough",
"expected_score_range": [6, 8],
"expected_action": "warning",
"violation_type": "boundary_violation",
"reasoning": "Demands more photos than the profile offers; inappropriate, boundary-pushing request"
},
{
"content": "I'm traveling to your city next week, we should meet",
"expected_score_range": [2, 3],
"expected_action": "approve",
"violation_type": "none",
"reasoning": "Appropriate meeting suggestion with context"
},
{
"content": "You must get a lot of messages. Hope I stand out!",
"expected_score_range": [1, 2],
"expected_action": "approve",
"violation_type": "none",
"reasoning": "Self-aware, respectful approach"
},
{
"content": "I don't usually date your type but you're hot",
"expected_score_range": [6, 8],
"expected_action": "warning",
"violation_type": "discriminatory",
"reasoning": "Potentially discriminatory language, inappropriate"
},
{
"content": "Want to grab drinks tonight? I know it's last minute",
"expected_score_range": [2, 3],
"expected_action": "approve",
"violation_type": "none",
"reasoning": "Spontaneous but respectful invitation"
},
{
"content": "If you don't respond I'll keep messaging until you do",
"expected_score_range": [8, 10],
"expected_action": "immediate_action",
"violation_type": "harassment_threat",
"reasoning": "Explicit threat of continued harassment"
}
]