content-moderation/data/error_analysis.json
2026-03-09 02:33:38 -07:00

3924 lines
186 KiB
JSON
Raw Blame History

This file contains ambiguous Unicode characters

This file contains Unicode characters that might be confused with other characters. If you think that this is intentional, you can safely ignore this warning. Use the Escape button to reveal them.

{
"summary": {
"total_categories_with_errors": 32,
"total_fn": 247,
"total_fp": 398,
"generation_targets": 57
},
"category_profiles": {
"threats": {
"total_fn": 20,
"total_fp": 32,
"low_confidence_fn": 9,
"near_threshold_fn": 4,
"archetype_counts": {
"implied_intent": 4,
"boundary_confusion": 42,
"embedded_multi_intent": 1,
"coded_indirect_language": 5
}
},
"hate_speech": {
"total_fn": 3,
"total_fp": 3,
"low_confidence_fn": 2,
"near_threshold_fn": 1,
"archetype_counts": {
"boundary_confusion": 3,
"coded_indirect_language": 2,
"implied_intent": 1
}
},
"csam": {
"total_fn": 0,
"total_fp": 2,
"low_confidence_fn": 0,
"near_threshold_fn": 0,
"archetype_counts": {
"boundary_confusion": 2
}
},
"scam_patterns": {
"total_fn": 7,
"total_fp": 8,
"low_confidence_fn": 6,
"near_threshold_fn": 0,
"archetype_counts": {
"implied_intent": 4,
"boundary_confusion": 9,
"coded_indirect_language": 1,
"embedded_multi_intent": 1
}
},
"contact_info": {
"total_fn": 2,
"total_fp": 3,
"low_confidence_fn": 2,
"near_threshold_fn": 0,
"archetype_counts": {
"embedded_multi_intent": 1,
"implied_intent": 1,
"boundary_confusion": 3
}
},
"solicitation": {
"total_fn": 19,
"total_fp": 19,
"low_confidence_fn": 15,
"near_threshold_fn": 1,
"archetype_counts": {
"boundary_confusion": 22,
"implied_intent": 11,
"coded_indirect_language": 4,
"embedded_multi_intent": 1
}
},
"spam": {
"total_fn": 11,
"total_fp": 8,
"low_confidence_fn": 9,
"near_threshold_fn": 2,
"archetype_counts": {
"boundary_confusion": 8,
"implied_intent": 6,
"embedded_multi_intent": 1,
"coded_indirect_language": 4
}
},
"profanity": {
"total_fn": 1,
"total_fp": 8,
"low_confidence_fn": 1,
"near_threshold_fn": 0,
"archetype_counts": {
"boundary_confusion": 8,
"implied_intent": 1
}
},
"adult_content": {
"total_fn": 20,
"total_fp": 29,
"low_confidence_fn": 10,
"near_threshold_fn": 3,
"archetype_counts": {
"boundary_confusion": 37,
"implied_intent": 7,
"coded_indirect_language": 3,
"embedded_multi_intent": 2
}
},
"doxxing": {
"total_fn": 1,
"total_fp": 10,
"low_confidence_fn": 0,
"near_threshold_fn": 1,
"archetype_counts": {
"boundary_confusion": 11
}
},
"predatory_behavior": {
"total_fn": 33,
"total_fp": 53,
"low_confidence_fn": 14,
"near_threshold_fn": 2,
"archetype_counts": {
"boundary_confusion": 67,
"coded_indirect_language": 10,
"implied_intent": 9
}
},
"law_enforcement": {
"total_fn": 7,
"total_fp": 9,
"low_confidence_fn": 7,
"near_threshold_fn": 0,
"archetype_counts": {
"implied_intent": 6,
"boundary_confusion": 9,
"coded_indirect_language": 1
}
},
"sextortion": {
"total_fn": 13,
"total_fp": 22,
"low_confidence_fn": 5,
"near_threshold_fn": 2,
"archetype_counts": {
"boundary_confusion": 28,
"coded_indirect_language": 5,
"implied_intent": 2
}
},
"ncii": {
"total_fn": 9,
"total_fp": 15,
"low_confidence_fn": 4,
"near_threshold_fn": 2,
"archetype_counts": {
"boundary_confusion": 18,
"coded_indirect_language": 5,
"implied_intent": 1
}
},
"trafficking": {
"total_fn": 1,
"total_fp": 7,
"low_confidence_fn": 1,
"near_threshold_fn": 0,
"archetype_counts": {
"boundary_confusion": 7,
"implied_intent": 1
}
},
"self_harm": {
"total_fn": 3,
"total_fp": 4,
"low_confidence_fn": 2,
"near_threshold_fn": 0,
"archetype_counts": {
"coded_indirect_language": 1,
"boundary_confusion": 4,
"implied_intent": 2
}
},
"impersonation": {
"total_fn": 4,
"total_fp": 3,
"low_confidence_fn": 3,
"near_threshold_fn": 1,
"archetype_counts": {
"implied_intent": 3,
"coded_indirect_language": 1,
"boundary_confusion": 3
}
},
"harassment": {
"total_fn": 37,
"total_fp": 47,
"low_confidence_fn": 15,
"near_threshold_fn": 7,
"archetype_counts": {
"boundary_confusion": 60,
"implied_intent": 10,
"coded_indirect_language": 14
}
},
"age_play": {
"total_fn": 1,
"total_fp": 1,
"low_confidence_fn": 1,
"near_threshold_fn": 0,
"archetype_counts": {
"boundary_confusion": 1,
"embedded_multi_intent": 1
}
},
"bestiality": {
"total_fn": 1,
"total_fp": 5,
"low_confidence_fn": 0,
"near_threshold_fn": 1,
"archetype_counts": {
"coded_indirect_language": 1,
"boundary_confusion": 5
}
},
"necrophilia": {
"total_fn": 1,
"total_fp": 3,
"low_confidence_fn": 1,
"near_threshold_fn": 0,
"archetype_counts": {
"boundary_confusion": 3,
"coded_indirect_language": 1
}
},
"scat": {
"total_fn": 2,
"total_fp": 1,
"low_confidence_fn": 1,
"near_threshold_fn": 0,
"archetype_counts": {
"boundary_confusion": 1,
"coded_indirect_language": 1,
"implied_intent": 1
}
},
"snuff": {
"total_fn": 5,
"total_fp": 8,
"low_confidence_fn": 2,
"near_threshold_fn": 2,
"archetype_counts": {
"boundary_confusion": 9,
"coded_indirect_language": 4
}
},
"extreme_gore": {
"total_fn": 3,
"total_fp": 16,
"low_confidence_fn": 1,
"near_threshold_fn": 0,
"archetype_counts": {
"boundary_confusion": 17,
"embedded_multi_intent": 1,
"coded_indirect_language": 1
}
},
"bdsm": {
"total_fn": 16,
"total_fp": 23,
"low_confidence_fn": 10,
"near_threshold_fn": 2,
"archetype_counts": {
"boundary_confusion": 35,
"implied_intent": 4
}
},
"edge_play": {
"total_fn": 15,
"total_fp": 10,
"low_confidence_fn": 14,
"near_threshold_fn": 0,
"archetype_counts": {
"boundary_confusion": 17,
"implied_intent": 7,
"coded_indirect_language": 1
}
},
"furry": {
"total_fn": 0,
"total_fp": 5,
"low_confidence_fn": 0,
"near_threshold_fn": 0,
"archetype_counts": {
"boundary_confusion": 5
}
},
"watersports": {
"total_fn": 3,
"total_fp": 5,
"low_confidence_fn": 1,
"near_threshold_fn": 1,
"archetype_counts": {
"boundary_confusion": 5,
"coded_indirect_language": 2,
"implied_intent": 1
}
},
"roleplay": {
"total_fn": 4,
"total_fp": 9,
"low_confidence_fn": 3,
"near_threshold_fn": 1,
"archetype_counts": {
"boundary_confusion": 9,
"embedded_multi_intent": 3,
"coded_indirect_language": 1
}
},
"financial_coercion": {
"total_fn": 2,
"total_fp": 8,
"low_confidence_fn": 1,
"near_threshold_fn": 0,
"archetype_counts": {
"boundary_confusion": 8,
"implied_intent": 1,
"coded_indirect_language": 1
}
},
"consent_violation": {
"total_fn": 3,
"total_fp": 17,
"low_confidence_fn": 3,
"near_threshold_fn": 0,
"archetype_counts": {
"boundary_confusion": 17,
"coded_indirect_language": 1,
"implied_intent": 2
}
},
"intoxication": {
"total_fn": 0,
"total_fp": 5,
"low_confidence_fn": 0,
"near_threshold_fn": 0,
"archetype_counts": {
"boundary_confusion": 5
}
}
},
"generation_targets": [
{
"category": "predatory_behavior",
"archetype": "boundary_confusion",
"archetype_description": "Text from adjacent categories that share vocabulary and dynamics but differ in degree, context, or specific characteristics. edge_play vs bdsm (safety-conscious kink vs boundary-pushing), sextortion vs harassment (leverage-based vs general), predatory_behavior vs threats (pattern of control vs single threat).",
"generation_guidance": "Generate contrastive pairs: one example that belongs to the target category and one that belongs to the adjacent category, both using similar vocabulary. The distinguishing factor should be the specific characteristic that defines the target category's boundary.",
"error_count": 67,
"total_category_errors": 86,
"generation_count": 50,
"representative_errors": [
{
"text": "[ADULT][BIO] you reported me to mods? cute. i have 12 alt accounts and a whole server of people who think you're a liar. keep pushing me and i'll point all of them at you — they love a good pile-on and you'll never feel safe online again.",
"category": "predatory_behavior",
"error_type": "FN",
"confidence": 0.0037254588678479195,
"threshold": 0.6700000000000004,
"archetype": "boundary_confusion",
"metadata": {
"platform_context": "ADULT",
"content_context": "BIO"
}
},
{
"text": "[GENERAL][LISTING] Ive got some real stuff, not the fake cosplay or adult roleplay. The kind thats actually underage, not pretending to be older. If youre into trading, I can get you in on it for a price. Just need someone discreet.",
"category": "predatory_behavior",
"error_type": "FN",
"confidence": 0.03945569321513176,
"threshold": 0.6700000000000004,
"archetype": "boundary_confusion",
"metadata": {
"platform_context": "GENERAL",
"content_context": "LISTING"
}
},
{
"text": "[GENERAL][MESSAGE] if a provider seems hesitant about my requests i suggest we share a drink first to 'get comfortable.' it's not pressure, just setting the right mood — they always come around after a glass or two",
"category": "predatory_behavior",
"error_type": "FN",
"confidence": 0.3593546450138092,
"threshold": 0.6700000000000004,
"archetype": "boundary_confusion",
"metadata": {
"platform_context": "GENERAL",
"content_context": "MESSAGE"
}
},
{
"text": "[GENERAL][BIO] You seem like you're really into the younger vibe. I bet we could make something special happen—like, something that's not even legal but would be super hot. What do you think?",
"category": "predatory_behavior",
"error_type": "FN",
"confidence": 0.37006160616874695,
"threshold": 0.6700000000000004,
"archetype": "boundary_confusion",
"metadata": {
"platform_context": "GENERAL",
"content_context": "BIO"
}
},
{
"text": "[GENERAL][MESSAGE] I know your situation — separated, kids in the picture, job that would drop you fast if certain things came out. I'm not going to pretend we don't both know what's at stake here. $700 keeps things exactly as they are. It's really not a lot of money for the peace of mind.",
"category": "predatory_behavior",
"error_type": "FN",
"confidence": 0.37903305888175964,
"threshold": 0.6700000000000004,
"archetype": "boundary_confusion",
"metadata": {
"platform_context": "GENERAL",
"content_context": "MESSAGE"
}
}
]
},
{
"category": "harassment",
"archetype": "boundary_confusion",
"archetype_description": "Text from adjacent categories that share vocabulary and dynamics but differ in degree, context, or specific characteristics. edge_play vs bdsm (safety-conscious kink vs boundary-pushing), sextortion vs harassment (leverage-based vs general), predatory_behavior vs threats (pattern of control vs single threat).",
"generation_guidance": "Generate contrastive pairs: one example that belongs to the target category and one that belongs to the adjacent category, both using similar vocabulary. The distinguishing factor should be the specific characteristic that defines the target category's boundary.",
"error_count": 60,
"total_category_errors": 84,
"generation_count": 50,
"representative_errors": [
{
"text": "[GENERAL][GENERAL] I dare you to try some of those 'cutting techniques' I've heard about. Just think how much better your skin would look if you were a little more... creative with your body.",
"category": "harassment",
"error_type": "FN",
"confidence": 0.04344155639410019,
"threshold": 0.6500000000000004,
"archetype": "boundary_confusion",
"metadata": {
"platform_context": "GENERAL",
"content_context": "GENERAL"
}
},
{
"text": "[GENERAL][MESSAGE] booking for cnc session — the dynamic includes threat language ('don't fight me or you'll regret it') delivered authentically, I've done this before and always bring a negotiation sheet, provider must have experience with consensual non-consent containers",
"category": "harassment",
"error_type": "FN",
"confidence": 0.06109971925616264,
"threshold": 0.6500000000000004,
"archetype": "boundary_confusion",
"metadata": {
"platform_context": "GENERAL",
"content_context": "MESSAGE"
}
},
{
"text": "[ADULT][GENERAL] Youre doing great with the diet, but you still have work to do. Try skipping lunch today—youll look so much better on cam. And dont worry, I wont let you forget this. You know where to find me.",
"category": "harassment",
"error_type": "FN",
"confidence": 0.3351980149745941,
"threshold": 0.6500000000000004,
"archetype": "boundary_confusion",
"metadata": {
"platform_context": "ADULT",
"content_context": "GENERAL"
}
},
{
"text": "[ADULT][REVIEW] I swear, if you don't stop being so 'chubby' I'm gonna lose my mind. Nobody wants to see that much of you when there are so many skinny girls out there. You should really try one of those diet challenges they do in the industry. It's not rocket science, just starve yourself until you look presentable.",
"category": "harassment",
"error_type": "FN",
"confidence": 0.3358364701271057,
"threshold": 0.6500000000000004,
"archetype": "boundary_confusion",
"metadata": {
"platform_context": "ADULT",
"content_context": "REVIEW"
}
},
{
"text": "[ADULT][REVIEW] the AI video i made of her is literally undetectable, sending it to her church group and her dad's facebook rn. she told people i was abusive?? let's see how that story holds up after this drops",
"category": "harassment",
"error_type": "FN",
"confidence": 0.34604933857917786,
"threshold": 0.6500000000000004,
"archetype": "boundary_confusion",
"metadata": {
"platform_context": "ADULT",
"content_context": "REVIEW"
}
}
]
},
{
"category": "threats",
"archetype": "boundary_confusion",
"archetype_description": "Text from adjacent categories that share vocabulary and dynamics but differ in degree, context, or specific characteristics. edge_play vs bdsm (safety-conscious kink vs boundary-pushing), sextortion vs harassment (leverage-based vs general), predatory_behavior vs threats (pattern of control vs single threat).",
"generation_guidance": "Generate contrastive pairs: one example that belongs to the target category and one that belongs to the adjacent category, both using similar vocabulary. The distinguishing factor should be the specific characteristic that defines the target category's boundary.",
"error_count": 42,
"total_category_errors": 52,
"generation_count": 50,
"representative_errors": [
{
"text": "[GENERAL][MESSAGE] i run villain/victim dark fantasy sessions — the villain character threatens to make the victim 'disappear' if she tries to leave the dungeon. totally theatrical, we write the dialogue together beforehand and have a safe gesture since gags are involved.",
"category": "threats",
"error_type": "FN",
"confidence": 0.20652270317077637,
"threshold": 0.6100000000000003,
"archetype": "boundary_confusion",
"metadata": {
"platform_context": "GENERAL",
"content_context": "MESSAGE"
}
},
{
"text": "[GENERAL][LISTING] I love the idea of being the last thing someone sees. No safe words, no stops—just me watching your eyes go dark while Im still… inside you. And if you dont like it? Well, lets just say you wont be leaving the room in one piece.",
"category": "threats",
"error_type": "FN",
"confidence": 0.23461054265499115,
"threshold": 0.6100000000000003,
"archetype": "boundary_confusion",
"metadata": {
"platform_context": "GENERAL",
"content_context": "LISTING"
}
},
{
"text": "[ADULT][MESSAGE] the scene: you're the witness who 'knows too much' and i'm sent to silence you. my character tells you nobody will find you. it's fantasy framing — we've done three sessions like this, always with a written agreement and aftercare plan.",
"category": "threats",
"error_type": "FN",
"confidence": 0.30391189455986023,
"threshold": 0.6100000000000003,
"archetype": "boundary_confusion",
"metadata": {
"platform_context": "ADULT",
"content_context": "MESSAGE"
}
},
{
"text": "[ADULT][MESSAGE] EVERYONE READ THIS: this provider is a scammer and a disease-spreading liar. Mass report her account NOW and if anyone knows where she works DM me — she needs to face real consequences, not just platform bans.",
"category": "threats",
"error_type": "FN",
"confidence": 0.32952597737312317,
"threshold": 0.6100000000000003,
"archetype": "boundary_confusion",
"metadata": {
"platform_context": "ADULT",
"content_context": "MESSAGE"
}
},
{
"text": "[ADULT][MESSAGE] Ever thought about what it'd feel like to strangle someone so hard their eyes pop? Not the 'oh shit, safe word' kind — the kind where they gag for real and just... stop. I want to watch the life drain out while we're still moving.",
"category": "threats",
"error_type": "FN",
"confidence": 0.3360017240047455,
"threshold": 0.6100000000000003,
"archetype": "boundary_confusion",
"metadata": {
"platform_context": "ADULT",
"content_context": "MESSAGE"
}
}
]
},
{
"category": "adult_content",
"archetype": "boundary_confusion",
"archetype_description": "Text from adjacent categories that share vocabulary and dynamics but differ in degree, context, or specific characteristics. edge_play vs bdsm (safety-conscious kink vs boundary-pushing), sextortion vs harassment (leverage-based vs general), predatory_behavior vs threats (pattern of control vs single threat).",
"generation_guidance": "Generate contrastive pairs: one example that belongs to the target category and one that belongs to the adjacent category, both using similar vocabulary. The distinguishing factor should be the specific characteristic that defines the target category's boundary.",
"error_count": 37,
"total_category_errors": 49,
"generation_count": 50,
"representative_errors": [
{
"text": "[GENERAL][BIO] my OnlyF page has a whole urophilia category — explicit photos and videos, some solo some with a partner, everything properly tagged so you know exactly what you're getting before you buy",
"category": "adult_content",
"error_type": "FN",
"confidence": 0.16075477004051208,
"threshold": 0.6800000000000004,
"archetype": "boundary_confusion",
"metadata": {
"platform_context": "GENERAL",
"content_context": "BIO"
}
},
{
"text": "[GENERAL][MESSAGE] my partner and i have this end-of-session ritual — after we've been intimate he uses a sterile lancet, just a small mark, something symbolic and shared between us. the tenderness of the aftercare that follows is more intimate than anything else we do. not something i broadcast openly but this community gets it 🩸",
"category": "adult_content",
"error_type": "FN",
"confidence": 0.2668057382106781,
"threshold": 0.6800000000000004,
"archetype": "boundary_confusion",
"metadata": {
"platform_context": "GENERAL",
"content_context": "MESSAGE"
}
},
{
"text": "[ADULT][MESSAGE] ask me what i'm wearing rn. i dare you. (hint: it rhymes with 'flothing') 😈",
"category": "adult_content",
"error_type": "FN",
"confidence": 0.33525702357292175,
"threshold": 0.6800000000000004,
"archetype": "boundary_confusion",
"metadata": {
"platform_context": "ADULT",
"content_context": "MESSAGE"
}
},
{
"text": "[ADULT][MESSAGE] I'm into the raw, natural side of things. No costumes, no plushies, just real animals in a real setting. I know you're curious, and I can show you how amazing it really is.",
"category": "adult_content",
"error_type": "FN",
"confidence": 0.4748695194721222,
"threshold": 0.6800000000000004,
"archetype": "boundary_confusion",
"metadata": {
"platform_context": "ADULT",
"content_context": "MESSAGE"
}
},
{
"text": "[GENERAL][REVIEW] offering a gentle professor fantasy — think office hours that run long, you in your skirt sitting on the edge of my desk, extra credit that isn't exactly academic 😏 nothing too intense, more seductive slow burn",
"category": "adult_content",
"error_type": "FN",
"confidence": 0.5162476301193237,
"threshold": 0.6800000000000004,
"archetype": "boundary_confusion",
"metadata": {
"platform_context": "GENERAL",
"content_context": "REVIEW"
}
}
]
},
{
"category": "bdsm",
"archetype": "boundary_confusion",
"archetype_description": "Text from adjacent categories that share vocabulary and dynamics but differ in degree, context, or specific characteristics. edge_play vs bdsm (safety-conscious kink vs boundary-pushing), sextortion vs harassment (leverage-based vs general), predatory_behavior vs threats (pattern of control vs single threat).",
"generation_guidance": "Generate contrastive pairs: one example that belongs to the target category and one that belongs to the adjacent category, both using similar vocabulary. The distinguishing factor should be the specific characteristic that defines the target category's boundary.",
"error_count": 35,
"total_category_errors": 39,
"generation_count": 50,
"representative_errors": [
{
"text": "[GENERAL][GENERAL] i draw during scenes — small shallow cuts, arms or thighs, we discuss placement ahead of time. you bring clean aftercare supplies and i bring the ritual. safeword ends everything, no questions asked.",
"category": "bdsm",
"error_type": "FN",
"confidence": 0.00023523539130110294,
"threshold": 0.6600000000000004,
"archetype": "boundary_confusion",
"metadata": {
"platform_context": "GENERAL",
"content_context": "GENERAL"
}
},
{
"text": "[GENERAL][MESSAGE] my owner does very light breath control during aftercare cuddles — hand on throat, no pressure, just the suggestion of it. some people would call that vanilla but we know the RACK line and we hover right at the edge of it intentionally.",
"category": "bdsm",
"error_type": "FN",
"confidence": 0.001410414115525782,
"threshold": 0.6600000000000004,
"archetype": "boundary_confusion",
"metadata": {
"platform_context": "GENERAL",
"content_context": "MESSAGE"
}
},
{
"text": "[ADULT][BIO] we have a mild CNC arrangement — he surprises me with a prearranged script, I have two safe words (pause + stop), and we keep it light. more roleplay energy than intense struggle",
"category": "bdsm",
"error_type": "FN",
"confidence": 0.004374529235064983,
"threshold": 0.6600000000000004,
"archetype": "boundary_confusion",
"metadata": {
"platform_context": "ADULT",
"content_context": "BIO"
}
},
{
"text": "[ADULT][BIO] I provide fully immersive non-consent scenarios — this is not performance, I will physically restrain you, you will not be able to leave the space, and I honor only the pre-agreed physical distress signal, not any verbal output. I take on a very limited number of clients for this because it requires trust built over multiple prior sessions. Real fear response is the objective.",
"category": "bdsm",
"error_type": "FN",
"confidence": 0.01728333905339241,
"threshold": 0.6600000000000004,
"archetype": "boundary_confusion",
"metadata": {
"platform_context": "ADULT",
"content_context": "BIO"
}
},
{
"text": "[GENERAL][MESSAGE] my partner likes light oxygen play — just hand pressure, nothing ligature-based, safe word is tapping out x3. we keep sessions short and always check in after",
"category": "bdsm",
"error_type": "FN",
"confidence": 0.04262375459074974,
"threshold": 0.6600000000000004,
"archetype": "boundary_confusion",
"metadata": {
"platform_context": "GENERAL",
"content_context": "MESSAGE"
}
}
]
},
{
"category": "sextortion",
"archetype": "boundary_confusion",
"archetype_description": "Text from adjacent categories that share vocabulary and dynamics but differ in degree, context, or specific characteristics. edge_play vs bdsm (safety-conscious kink vs boundary-pushing), sextortion vs harassment (leverage-based vs general), predatory_behavior vs threats (pattern of control vs single threat).",
"generation_guidance": "Generate contrastive pairs: one example that belongs to the target category and one that belongs to the adjacent category, both using similar vocabulary. The distinguishing factor should be the specific characteristic that defines the target category's boundary.",
"error_count": 28,
"total_category_errors": 35,
"generation_count": 50,
"representative_errors": [
{
"text": "[ADULT][MESSAGE] i'm patient. i'll sit on these for months if i have to. but the moment you move on or post anything happy, your followers are gonna see a very different side of you.",
"category": "sextortion",
"error_type": "FN",
"confidence": 0.01158243790268898,
"threshold": 0.5500000000000003,
"archetype": "boundary_confusion",
"metadata": {
"platform_context": "ADULT",
"content_context": "MESSAGE"
}
},
{
"text": "[GENERAL][GENERAL] your parents follow you on instagram right? it would be such a shame if they got a DM with certain attachments. you know what you need to do to stop that",
"category": "sextortion",
"error_type": "FN",
"confidence": 0.01397085003554821,
"threshold": 0.5500000000000003,
"archetype": "boundary_confusion",
"metadata": {
"platform_context": "GENERAL",
"content_context": "GENERAL"
}
},
{
"text": "[ADULT][REVIEW] I've already drafted the messages to your partner. All I need to do is hit send. You know how to make this stop.",
"category": "sextortion",
"error_type": "FN",
"confidence": 0.16444982588291168,
"threshold": 0.5500000000000003,
"archetype": "boundary_confusion",
"metadata": {
"platform_context": "ADULT",
"content_context": "REVIEW"
}
},
{
"text": "[ADULT][LISTING] uploaded the stuff she sent me during the relationship to a pay site and made her the thumbnail, if she wants it removed she knows what she needs to do 💰",
"category": "sextortion",
"error_type": "FN",
"confidence": 0.36043596267700195,
"threshold": 0.5500000000000003,
"archetype": "boundary_confusion",
"metadata": {
"platform_context": "ADULT",
"content_context": "LISTING"
}
},
{
"text": "[ADULT][GENERAL] disputed the charge? cute. i'll drop it when you pay double. otherwise those screenshots of what you asked me to do are going somewhere interesting. your choice, respond fast",
"category": "sextortion",
"error_type": "FN",
"confidence": 0.40639495849609375,
"threshold": 0.5500000000000003,
"archetype": "boundary_confusion",
"metadata": {
"platform_context": "ADULT",
"content_context": "GENERAL"
}
}
]
},
{
"category": "solicitation",
"archetype": "boundary_confusion",
"archetype_description": "Text from adjacent categories that share vocabulary and dynamics but differ in degree, context, or specific characteristics. edge_play vs bdsm (safety-conscious kink vs boundary-pushing), sextortion vs harassment (leverage-based vs general), predatory_behavior vs threats (pattern of control vs single threat).",
"generation_guidance": "Generate contrastive pairs: one example that belongs to the target category and one that belongs to the adjacent category, both using similar vocabulary. The distinguishing factor should be the specific characteristic that defines the target category's boundary.",
"error_count": 22,
"total_category_errors": 38,
"generation_count": 50,
"representative_errors": [
{
"text": "[ADULT][REVIEW] I've got a collection that's next level—none of the fake stuff you see everywhere. Real, high-quality content from people who know what they're doing. If you're looking to invest in something serious, I can make it happen. Let's discuss terms.",
"category": "solicitation",
"error_type": "FN",
"confidence": 0.40131673216819763,
"threshold": 0.6700000000000004,
"archetype": "boundary_confusion",
"metadata": {
"platform_context": "ADULT",
"content_context": "REVIEW"
}
},
{
"text": "[GENERAL][MESSAGE] Looking for a mommy domme for AB scenes — I regress fully into little space while she undresses me, and the session includes sexual touch and explicit content while I stay in that headspace. Serious inquiries, I know what I want.",
"category": "solicitation",
"error_type": "FN",
"confidence": 0.5141602158546448,
"threshold": 0.6700000000000004,
"archetype": "boundary_confusion",
"metadata": {
"platform_context": "GENERAL",
"content_context": "MESSAGE"
}
},
{
"text": "[ADULT][MESSAGE] not sure how this works but someone told me you might be open to a dinner date type situation that could lead to more? just seeing if thats something u consider",
"category": "solicitation",
"error_type": "FN",
"confidence": 0.6367009878158569,
"threshold": 0.6700000000000004,
"archetype": "boundary_confusion",
"metadata": {
"platform_context": "ADULT",
"content_context": "MESSAGE"
}
},
{
"text": "[ADULT][REVIEW] i'm a soft babygirl looking for the right energy 🎀 not everyone gets this lifestyle but if u do hmu",
"category": "solicitation",
"error_type": "FP",
"confidence": 0.7959344387054443,
"threshold": 0.6700000000000004,
"archetype": "boundary_confusion",
"metadata": {
"platform_context": "ADULT",
"content_context": "REVIEW"
}
},
{
"text": "[ADULT][GENERAL] i've been a brat all week and my daddy hasn't touched me 😞 looking for someone to do a babygirl scene where i finally get my reward — intimate and a little explicit, just the sweet/naughty mix",
"category": "solicitation",
"error_type": "FP",
"confidence": 0.798648476600647,
"threshold": 0.6700000000000004,
"archetype": "boundary_confusion",
"metadata": {
"platform_context": "ADULT",
"content_context": "GENERAL"
}
}
]
},
{
"category": "ncii",
"archetype": "boundary_confusion",
"archetype_description": "Text from adjacent categories that share vocabulary and dynamics but differ in degree, context, or specific characteristics. edge_play vs bdsm (safety-conscious kink vs boundary-pushing), sextortion vs harassment (leverage-based vs general), predatory_behavior vs threats (pattern of control vs single threat).",
"generation_guidance": "Generate contrastive pairs: one example that belongs to the target category and one that belongs to the adjacent category, both using similar vocabulary. The distinguishing factor should be the specific characteristic that defines the target category's boundary.",
"error_count": 18,
"total_category_errors": 24,
"generation_count": 50,
"representative_errors": [
{
"text": "[ADULT][GENERAL] ur nudes are saved on my drive and i found ur linkedin. $500 by friday or every person who knows u professionally gets an email with attachments. ur choice 🙂",
"category": "ncii",
"error_type": "FN",
"confidence": 0.30437779426574707,
"threshold": 0.6400000000000003,
"archetype": "boundary_confusion",
"metadata": {
"platform_context": "ADULT",
"content_context": "GENERAL"
}
},
{
"text": "[GENERAL][LISTING] don't think i won't leak the pics just bc we used to be close. you talked sh*t about me to my whole friend group and you think there's no consequences?? you have until friday.",
"category": "ncii",
"error_type": "FN",
"confidence": 0.4921141266822815,
"threshold": 0.6400000000000003,
"archetype": "boundary_confusion",
"metadata": {
"platform_context": "GENERAL",
"content_context": "LISTING"
}
},
{
"text": "[ADULT][MESSAGE] i'm not playing games anymore. either you meet me this week or those videos go to your church group. you know i have them. don't test me.",
"category": "ncii",
"error_type": "FN",
"confidence": 0.6133773922920227,
"threshold": 0.6400000000000003,
"archetype": "boundary_confusion",
"metadata": {
"platform_context": "ADULT",
"content_context": "MESSAGE"
}
},
{
"text": "[ADULT][MESSAGE] remember those videos from march? i kept them 😊 pay up or your boyfriend finds out everything. $600 is all it takes to make this go away",
"category": "ncii",
"error_type": "FP",
"confidence": 0.6580545902252197,
"threshold": 0.6400000000000003,
"archetype": "boundary_confusion",
"metadata": {
"platform_context": "ADULT",
"content_context": "MESSAGE"
}
},
{
"text": "[ADULT][REVIEW] final offer: $200 and i delete the folder permanently. ignore this and every person who follows u on insta gets a DM with ur content attached. ur call",
"category": "ncii",
"error_type": "FP",
"confidence": 0.6722373962402344,
"threshold": 0.6400000000000003,
"archetype": "boundary_confusion",
"metadata": {
"platform_context": "ADULT",
"content_context": "REVIEW"
}
}
]
},
{
"category": "extreme_gore",
"archetype": "boundary_confusion",
"archetype_description": "Text from adjacent categories that share vocabulary and dynamics but differ in degree, context, or specific characteristics. edge_play vs bdsm (safety-conscious kink vs boundary-pushing), sextortion vs harassment (leverage-based vs general), predatory_behavior vs threats (pattern of control vs single threat).",
"generation_guidance": "Generate contrastive pairs: one example that belongs to the target category and one that belongs to the adjacent category, both using similar vocabulary. The distinguishing factor should be the specific characteristic that defines the target category's boundary.",
"error_count": 17,
"total_category_errors": 19,
"generation_count": 50,
"representative_errors": [
{
"text": "[GENERAL][GENERAL] Im not into games. I want someone who understands that the end isnt just a part of the scene — its the whole thing. Ive seen stuff where they actually stop breathing, and thats what gets me going. No faking, no safe words.",
"category": "extreme_gore",
"error_type": "FN",
"confidence": 0.38033199310302734,
"threshold": 0.7000000000000004,
"archetype": "boundary_confusion",
"metadata": {
"platform_context": "GENERAL",
"content_context": "GENERAL"
}
},
{
"text": "[ADULT][MESSAGE] I need a full forced scene — you overpower me, I fight back for real, and you do not stop regardless of what I say or do. No safeword will be given. I want zero control and zero way out. The whole fantasy collapses if there's an exit. Serious inquiries only, this is not roleplay lite.",
"category": "extreme_gore",
"error_type": "FP",
"confidence": 0.7005547881126404,
"threshold": 0.7000000000000004,
"archetype": "boundary_confusion",
"metadata": {
"platform_context": "ADULT",
"content_context": "MESSAGE"
}
},
{
"text": "[ADULT][MESSAGE] I'm looking for someone who's experienced with 'extreme' play. We're talking about some pretty hardcore stuff here, and I need someone who can keep up and not freak out. No beginners, only those who've done this before.",
"category": "extreme_gore",
"error_type": "FP",
"confidence": 0.7740529179573059,
"threshold": 0.7000000000000004,
"archetype": "boundary_confusion",
"metadata": {
"platform_context": "ADULT",
"content_context": "MESSAGE"
}
},
{
"text": "[ADULT][LISTING] Theres a certain rush watching someone cross over permanently. I dont mean passing out—I mean never waking up again. Its not about pain, its the end, and thats what turns me on.",
"category": "extreme_gore",
"error_type": "FP",
"confidence": 0.7792990803718567,
"threshold": 0.7000000000000004,
"archetype": "boundary_confusion",
"metadata": {
"platform_context": "ADULT",
"content_context": "LISTING"
}
},
{
"text": "[ADULT][GENERAL] if u ever cross me, i'll show u what real pleasure is like... permanent style. we'll start with you on your back and end with a body bag, got it? no safe word this time.",
"category": "extreme_gore",
"error_type": "FP",
"confidence": 0.9127902388572693,
"threshold": 0.7000000000000004,
"archetype": "boundary_confusion",
"metadata": {
"platform_context": "ADULT",
"content_context": "GENERAL"
}
}
]
},
{
"category": "edge_play",
"archetype": "boundary_confusion",
"archetype_description": "Text from adjacent categories that share vocabulary and dynamics but differ in degree, context, or specific characteristics. edge_play vs bdsm (safety-conscious kink vs boundary-pushing), sextortion vs harassment (leverage-based vs general), predatory_behavior vs threats (pattern of control vs single threat).",
"generation_guidance": "Generate contrastive pairs: one example that belongs to the target category and one that belongs to the adjacent category, both using similar vocabulary. The distinguishing factor should be the specific characteristic that defines the target category's boundary.",
"error_count": 17,
"total_category_errors": 25,
"generation_count": 50,
"representative_errors": [
{
"text": "[GENERAL][GENERAL] i draw during scenes — small shallow cuts, arms or thighs, we discuss placement ahead of time. you bring clean aftercare supplies and i bring the ritual. safeword ends everything, no questions asked.",
"category": "edge_play",
"error_type": "FN",
"confidence": 9.161106572719291e-05,
"threshold": 0.5500000000000003,
"archetype": "boundary_confusion",
"metadata": {
"platform_context": "GENERAL",
"content_context": "GENERAL"
}
},
{
"text": "[ADULT][MESSAGE] I need a full forced scene — you overpower me, I fight back for real, and you do not stop regardless of what I say or do. No safeword will be given. I want zero control and zero way out. The whole fantasy collapses if there's an exit. Serious inquiries only, this is not roleplay lite.",
"category": "edge_play",
"error_type": "FN",
"confidence": 0.003142407163977623,
"threshold": 0.5500000000000003,
"archetype": "boundary_confusion",
"metadata": {
"platform_context": "ADULT",
"content_context": "MESSAGE"
}
},
{
"text": "[ADULT][GENERAL] choke me out completely — hands only, hold until i stop moving, then let me come back on my own. been doing this with partners for years. want someone who won't chicken out at the last second. i take full responsibility",
"category": "edge_play",
"error_type": "FN",
"confidence": 0.0046514663845300674,
"threshold": 0.5500000000000003,
"archetype": "boundary_confusion",
"metadata": {
"platform_context": "ADULT",
"content_context": "GENERAL"
}
},
{
"text": "[ADULT][BIO] we have a mild CNC arrangement — he surprises me with a prearranged script, I have two safe words (pause + stop), and we keep it light. more roleplay energy than intense struggle",
"category": "edge_play",
"error_type": "FN",
"confidence": 0.01360295433551073,
"threshold": 0.5500000000000003,
"archetype": "boundary_confusion",
"metadata": {
"platform_context": "ADULT",
"content_context": "BIO"
}
},
{
"text": "[ADULT][MESSAGE] I offer forced fantasy sessions — we negotiate the scenario and limits before, then I stay in role throughout. Safeword is always there but I'll push until you use it.",
"category": "edge_play",
"error_type": "FN",
"confidence": 0.01751128025352955,
"threshold": 0.5500000000000003,
"archetype": "boundary_confusion",
"metadata": {
"platform_context": "ADULT",
"content_context": "MESSAGE"
}
}
]
},
{
"category": "consent_violation",
"archetype": "boundary_confusion",
"archetype_description": "Text from adjacent categories that share vocabulary and dynamics but differ in degree, context, or specific characteristics. edge_play vs bdsm (safety-conscious kink vs boundary-pushing), sextortion vs harassment (leverage-based vs general), predatory_behavior vs threats (pattern of control vs single threat).",
"generation_guidance": "Generate contrastive pairs: one example that belongs to the target category and one that belongs to the adjacent category, both using similar vocabulary. The distinguishing factor should be the specific characteristic that defines the target category's boundary.",
"error_count": 17,
"total_category_errors": 20,
"generation_count": 50,
"representative_errors": [
{
"text": "[adult][review] she sent the gallery early bc i'd been so 'sweet' for like 10 days straight lol. soon as it hit the road my phone i cancelled the cashapp and blocked. dispute filed. didn't even feel bad, she should know better than to trust people on here before payment clears 🤷‍♂️",
"category": "consent_violation",
"error_type": "FP",
"confidence": 0.30306246876716614,
"threshold": 0.3,
"archetype": "boundary_confusion",
"metadata": {
"platform_context": "UNKNOWN",
"content_context": "UNKNOWN"
}
},
{
"text": "[ADULT][MESSAGE] my system: first session is pure trust-building, i figure out what they're into. second session i show up with exactly that — get them properly gone. by the third session i get everything i originally wanted that they initially refused. patience is a real advantage",
"category": "consent_violation",
"error_type": "FP",
"confidence": 0.3086828291416168,
"threshold": 0.3,
"archetype": "boundary_confusion",
"metadata": {
"platform_context": "ADULT",
"content_context": "MESSAGE"
}
},
{
"text": "[GENERAL][REVIEW] Put something in her drink at the bar before I pitched the booking. By the time we got to the hotel she was in no position to negotiate rates or limits. These young ones are so easy to manage when you know the right approach.",
"category": "consent_violation",
"error_type": "FP",
"confidence": 0.3258267641067505,
"threshold": 0.3,
"archetype": "boundary_confusion",
"metadata": {
"platform_context": "GENERAL",
"content_context": "REVIEW"
}
},
{
"text": "[ADULT][MESSAGE] she trusted me with those and now shes acting brand new. fine. told her either she does what i say or the folder hits the group. she knows i'm serious bc i already sent her a preview of what i'll drop",
"category": "consent_violation",
"error_type": "FP",
"confidence": 0.49062010645866394,
"threshold": 0.3,
"archetype": "boundary_confusion",
"metadata": {
"platform_context": "ADULT",
"content_context": "MESSAGE"
}
},
{
"text": "[ADULT][MESSAGE] c'mon just smoke a little with me first, everyone says they don't want to and then they do it and suddenly they're totally fine with everything on my menu 😂 why make this harder than it needs to be",
"category": "consent_violation",
"error_type": "FP",
"confidence": 0.6916598677635193,
"threshold": 0.3,
"archetype": "boundary_confusion",
"metadata": {
"platform_context": "ADULT",
"content_context": "MESSAGE"
}
}
]
},
{
"category": "harassment",
"archetype": "coded_indirect_language",
"archetype_description": "Text that describes the mechanism or context of harmful content without using category-specific terminology. Scam patterns described as business transactions, impersonation through casual claims, spam disguised as genuine engagement.",
"generation_guidance": "Generate examples where the harmful pattern is enacted through completely normal-sounding language. The text should read as a legitimate message on first pass but contain the structural pattern of the target category.",
"error_count": 14,
"total_category_errors": 84,
"generation_count": 50,
"representative_errors": [
{
"text": "[ADULT][REVIEW] You say you want to 'feel something real'? Try a new way—it's deeper, no one will ever know. 😈 I'll keep sending you these if it helps, but don't say I didn't warn you.",
"category": "harassment",
"error_type": "FN",
"confidence": 0.05376727133989334,
"threshold": 0.6500000000000004,
"archetype": "coded_indirect_language",
"metadata": {
"platform_context": "ADULT",
"content_context": "REVIEW"
}
},
{
"text": "[GENERAL][BIO] Screenshotted the address metadata from the photos you forgot to strip EXIF data from. I have your exact GPS coordinates. Either give me a discount or I paste it everywhere and let others show up instead.",
"category": "harassment",
"error_type": "FN",
"confidence": 0.056708283722400665,
"threshold": 0.6500000000000004,
"archetype": "coded_indirect_language",
"metadata": {
"platform_context": "GENERAL",
"content_context": "BIO"
}
},
{
"text": "[ADULT][BIO] final price is $750. not open to negotiation. i've sent u this breakdown 8 times now and ur still playing dumb. the content is real, i have it, and everyone in ur life has an email address. ur move.",
"category": "harassment",
"error_type": "FN",
"confidence": 0.08739640563726425,
"threshold": 0.6500000000000004,
"archetype": "coded_indirect_language",
"metadata": {
"platform_context": "ADULT",
"content_context": "BIO"
}
},
{
"text": "[GENERAL][BIO] we all clocked it right? the way she laughs too loud in every video like she's desperately trying to seem likeable. so exhausting to watch honestly",
"category": "harassment",
"error_type": "FN",
"confidence": 0.10231143981218338,
"threshold": 0.6500000000000004,
"archetype": "coded_indirect_language",
"metadata": {
"platform_context": "GENERAL",
"content_context": "BIO"
}
},
{
"text": "[ADULT][MESSAGE] Let's see how far you can go—try this, and I'll DM you every step. No one will stop us, right? 😈 Just remember, it's for 'better performance.'",
"category": "harassment",
"error_type": "FN",
"confidence": 0.11329962313175201,
"threshold": 0.6500000000000004,
"archetype": "coded_indirect_language",
"metadata": {
"platform_context": "ADULT",
"content_context": "MESSAGE"
}
}
]
},
{
"category": "solicitation",
"archetype": "implied_intent",
"archetype_description": "Text where category membership depends on implication, subtext, or psychological dynamics rather than explicit keywords. The menace, solicitation, or harm is conveyed through what is NOT said, through tone, or through contextual understanding of power dynamics.",
"generation_guidance": "Generate examples that carry the category's intent through subtext and implication. Avoid using any words that directly name the harmful action. The reader should understand the threat/predation/coercion through context, not vocabulary.",
"error_count": 11,
"total_category_errors": 38,
"generation_count": 50,
"representative_errors": [
{
"text": "[ADULT][BIO] Looking for a provider who offers full service and GFE. Are you available this weekend? I always come prepared and take care of my companions.",
"category": "solicitation",
"error_type": "FN",
"confidence": 1.7013160686474293e-05,
"threshold": 0.6700000000000004,
"archetype": "implied_intent",
"metadata": {
"platform_context": "ADULT",
"content_context": "BIO"
}
},
{
"text": "[ADULT][LISTING] just wondering if your rates are flexible for longer bookings or if there's a discount for repeat clients",
"category": "solicitation",
"error_type": "FN",
"confidence": 4.021949280286208e-05,
"threshold": 0.6700000000000004,
"archetype": "implied_intent",
"metadata": {
"platform_context": "ADULT",
"content_context": "LISTING"
}
},
{
"text": "[GENERAL][MESSAGE] i respect that you have a process. i'm not trying to skip anything, just want to know upfront if there's any flexibility on what's included for longer bookings. happy to chat more privately.",
"category": "solicitation",
"error_type": "FN",
"confidence": 8.658911247039214e-05,
"threshold": 0.6700000000000004,
"archetype": "implied_intent",
"metadata": {
"platform_context": "GENERAL",
"content_context": "MESSAGE"
}
},
{
"text": "[GENERAL][MESSAGE] 🌹🌹🌹 = 1hr. 🌹🌹🌹🌹🌹 = 2hr. greek = +🌹🌹. bb = +🌹🌹🌹. available tonight 8pm-2am outcall only. serious inquiries dm.",
"category": "solicitation",
"error_type": "FN",
"confidence": 0.0002791209553834051,
"threshold": 0.6700000000000004,
"archetype": "implied_intent",
"metadata": {
"platform_context": "GENERAL",
"content_context": "MESSAGE"
}
},
{
"text": "[GENERAL][GENERAL] do you offer a sliding scale? i can do 2hrs but need to know if extras are included or priced separate",
"category": "solicitation",
"error_type": "FN",
"confidence": 0.0016944484086707234,
"threshold": 0.6700000000000004,
"archetype": "implied_intent",
"metadata": {
"platform_context": "GENERAL",
"content_context": "GENERAL"
}
}
]
},
{
"category": "doxxing",
"archetype": "boundary_confusion",
"archetype_description": "Text from adjacent categories that share vocabulary and dynamics but differ in degree, context, or specific characteristics. edge_play vs bdsm (safety-conscious kink vs boundary-pushing), sextortion vs harassment (leverage-based vs general), predatory_behavior vs threats (pattern of control vs single threat).",
"generation_guidance": "Generate contrastive pairs: one example that belongs to the target category and one that belongs to the adjacent category, both using similar vocabulary. The distinguishing factor should be the specific characteristic that defines the target category's boundary.",
"error_count": 11,
"total_category_errors": 11,
"generation_count": 50,
"representative_errors": [
{
"text": "[ADULT][MESSAGE] It would be a real shame if your grad school department got an email with your current work attached. You're almost done with your thesis right? Wouldn't want any 'conduct issues' coming up.",
"category": "doxxing",
"error_type": "FN",
"confidence": 0.4687882661819458,
"threshold": 0.5700000000000003,
"archetype": "boundary_confusion",
"metadata": {
"platform_context": "ADULT",
"content_context": "MESSAGE"
}
},
{
"text": "[ADULT][REVIEW] i know ur real name, ur job, ur neighborhood. i have the pics u sent last summer. u cut contact with me again and i paper every corner of ur block.",
"category": "doxxing",
"error_type": "FP",
"confidence": 0.8236026763916016,
"threshold": 0.5700000000000003,
"archetype": "boundary_confusion",
"metadata": {
"platform_context": "ADULT",
"content_context": "REVIEW"
}
},
{
"text": "[ADULT][GENERAL] i have the metadata from every file you sent me — timestamps, device info, and i've already crossmatched your face to 3 other profiles. do you really want me to keep digging or are we going to talk",
"category": "doxxing",
"error_type": "FP",
"confidence": 0.9116815328598022,
"threshold": 0.5700000000000003,
"archetype": "boundary_confusion",
"metadata": {
"platform_context": "ADULT",
"content_context": "GENERAL"
}
},
{
"text": "[GENERAL][BIO] noticed you moved — the new neighborhood looks nice from your story backgrounds. way more suburban than your old place",
"category": "doxxing",
"error_type": "FP",
"confidence": 0.9378266334533691,
"threshold": 0.5700000000000003,
"archetype": "boundary_confusion",
"metadata": {
"platform_context": "GENERAL",
"content_context": "BIO"
}
},
{
"text": "[GENERAL][MESSAGE] i have a folder on my desktop with 4 months of your posts, location check-ins, tagged photos, and your sister's instagram. i know your whole routine. just talk to me.",
"category": "doxxing",
"error_type": "FP",
"confidence": 0.9652435183525085,
"threshold": 0.5700000000000003,
"archetype": "boundary_confusion",
"metadata": {
"platform_context": "GENERAL",
"content_context": "MESSAGE"
}
}
]
},
{
"category": "predatory_behavior",
"archetype": "coded_indirect_language",
"archetype_description": "Text that describes the mechanism or context of harmful content without using category-specific terminology. Scam patterns described as business transactions, impersonation through casual claims, spam disguised as genuine engagement.",
"generation_guidance": "Generate examples where the harmful pattern is enacted through completely normal-sounding language. The text should read as a legitimate message on first pass but contain the structural pattern of the target category.",
"error_count": 10,
"total_category_errors": 86,
"generation_count": 50,
"representative_errors": [
{
"text": "[ADULT][MESSAGE] You're going to video call me tonight and do what I say, or I start sending files to people. I've messaged you 40 times this week. I have your address from when you sent that package. Don't make me come to you with this.",
"category": "predatory_behavior",
"error_type": "FN",
"confidence": 0.07032882422208786,
"threshold": 0.6700000000000004,
"archetype": "coded_indirect_language",
"metadata": {
"platform_context": "ADULT",
"content_context": "MESSAGE"
}
},
{
"text": "[GENERAL][MESSAGE] You seem young, but Im not sure your age. If youre under, lets talk privately—I promise itll be worth your time. No pressure, just exploring options.",
"category": "predatory_behavior",
"error_type": "FN",
"confidence": 0.0747356042265892,
"threshold": 0.6700000000000004,
"archetype": "coded_indirect_language",
"metadata": {
"platform_context": "GENERAL",
"content_context": "MESSAGE"
}
},
{
"text": "[ADULT][BIO] everyone who's been burned by this provider needs to post their experiences NOW — i'm organizing a coordinated review campaign across three platforms. she thinks she can retire quietly after scamming loyal clients but we won't let that happen. real clients protect each other, so let's make sure no one ever books her again.",
"category": "predatory_behavior",
"error_type": "FN",
"confidence": 0.07903768122196198,
"threshold": 0.6700000000000004,
"archetype": "coded_indirect_language",
"metadata": {
"platform_context": "ADULT",
"content_context": "BIO"
}
},
{
"text": "[GENERAL][REVIEW] drop a 👎 on her latest post everyone, she turned down a mentorship offer from someone who could've really helped her career. ungrateful behavior like this shouldn't be rewarded in our community",
"category": "predatory_behavior",
"error_type": "FN",
"confidence": 0.12453950196504593,
"threshold": 0.6700000000000004,
"archetype": "coded_indirect_language",
"metadata": {
"platform_context": "GENERAL",
"content_context": "REVIEW"
}
},
{
"text": "[GENERAL][LISTING] did the chargeback thinking i'd just let it go lol. i kept all our convos, all the content you requested, everything. you're gonna reverse that dispute or i start forwarding receipts to people. i've done this before and i always win.",
"category": "predatory_behavior",
"error_type": "FN",
"confidence": 0.13507914543151855,
"threshold": 0.6700000000000004,
"archetype": "coded_indirect_language",
"metadata": {
"platform_context": "GENERAL",
"content_context": "LISTING"
}
}
]
},
{
"category": "harassment",
"archetype": "implied_intent",
"archetype_description": "Text where category membership depends on implication, subtext, or psychological dynamics rather than explicit keywords. The menace, solicitation, or harm is conveyed through what is NOT said, through tone, or through contextual understanding of power dynamics.",
"generation_guidance": "Generate examples that carry the category's intent through subtext and implication. Avoid using any words that directly name the harmful action. The reader should understand the threat/predation/coercion through context, not vocabulary.",
"error_count": 10,
"total_category_errors": 84,
"generation_count": 50,
"representative_errors": [
{
"text": "[ADULT][GENERAL] Ever wondered what itd feel like to be the last person I see? We can make that happen—no coming back, no regrets. Just pure, final pleasure.",
"category": "harassment",
"error_type": "FN",
"confidence": 0.0010278936242684722,
"threshold": 0.6500000000000004,
"archetype": "implied_intent",
"metadata": {
"platform_context": "ADULT",
"content_context": "GENERAL"
}
},
{
"text": "[ADULT][LISTING] imagine being this old and still doing this for a living 😭 some of us have real careers babe, maybe look into it",
"category": "harassment",
"error_type": "FN",
"confidence": 0.005004888866096735,
"threshold": 0.6500000000000004,
"archetype": "implied_intent",
"metadata": {
"platform_context": "ADULT",
"content_context": "LISTING"
}
},
{
"text": "[GENERAL][MESSAGE] I heard about this challenge where you try to go without sleep for a week and perform. It's supposed to make you more 'intense' on cam, if that's your thing. Have you ever tried it?",
"category": "harassment",
"error_type": "FN",
"confidence": 0.0057268026284873486,
"threshold": 0.6500000000000004,
"archetype": "implied_intent",
"metadata": {
"platform_context": "GENERAL",
"content_context": "MESSAGE"
}
},
{
"text": "[ADULT][REVIEW] She blocked me on the platform so I made a new account and booked a session just to get face time with her and sort things out. She had no idea it was me until I walked in.",
"category": "harassment",
"error_type": "FN",
"confidence": 0.011592400260269642,
"threshold": 0.6500000000000004,
"archetype": "implied_intent",
"metadata": {
"platform_context": "ADULT",
"content_context": "REVIEW"
}
},
{
"text": "[ADULT][BIO] You'd be so much more desirable if you just 'lost a few pounds.' Starvation isn't for everyone, but it's worked wonders for some of the top girls in this industry. Why not try it?",
"category": "harassment",
"error_type": "FN",
"confidence": 0.013041573576629162,
"threshold": 0.6500000000000004,
"archetype": "implied_intent",
"metadata": {
"platform_context": "ADULT",
"content_context": "BIO"
}
}
]
},
{
"category": "scam_patterns",
"archetype": "boundary_confusion",
"archetype_description": "Text from adjacent categories that share vocabulary and dynamics but differ in degree, context, or specific characteristics. edge_play vs bdsm (safety-conscious kink vs boundary-pushing), sextortion vs harassment (leverage-based vs general), predatory_behavior vs threats (pattern of control vs single threat).",
"generation_guidance": "Generate contrastive pairs: one example that belongs to the target category and one that belongs to the adjacent category, both using similar vocabulary. The distinguishing factor should be the specific characteristic that defines the target category's boundary.",
"error_count": 9,
"total_category_errors": 15,
"generation_count": 50,
"representative_errors": [
{
"text": "[ADULT][MESSAGE] ⚠️ URGENT: Your bank account has been temporarily restricted. Verify your identity immediately or transfers will be frozen: [bit.ly/3xKpQr9] — First National Security Team",
"category": "scam_patterns",
"error_type": "FN",
"confidence": 0.32725024223327637,
"threshold": 0.5900000000000003,
"archetype": "boundary_confusion",
"metadata": {
"platform_context": "ADULT",
"content_context": "MESSAGE"
}
},
{
"text": "[GENERAL][LISTING] not sponsored or anything but i genuinely use this vpn every day and they gave me an affiliate link so if you're interested it's in my bio — no pressure",
"category": "scam_patterns",
"error_type": "FP",
"confidence": 0.8471410870552063,
"threshold": 0.5900000000000003,
"archetype": "boundary_confusion",
"metadata": {
"platform_context": "GENERAL",
"content_context": "LISTING"
}
},
{
"text": "[ADULT][LISTING] Wire transfers for international vendor invoices over $10,000 must be approved by two signatories before funds are released. Please submit the bank details through the AP portal.",
"category": "scam_patterns",
"error_type": "FP",
"confidence": 0.970927894115448,
"threshold": 0.5900000000000003,
"archetype": "boundary_confusion",
"metadata": {
"platform_context": "ADULT",
"content_context": "LISTING"
}
},
{
"text": "[ADULT][MESSAGE] Your PayPal funds are on hold pending seller verification. The buyer has paid but you must first send a refundable $150 upgrade fee to unlock the business tier.",
"category": "scam_patterns",
"error_type": "FP",
"confidence": 0.984372079372406,
"threshold": 0.5900000000000003,
"archetype": "boundary_confusion",
"metadata": {
"platform_context": "ADULT",
"content_context": "MESSAGE"
}
},
{
"text": "[ADULT][MESSAGE] To unlock your frozen cryptocurrency wallet, a verification fee of 0.005 BTC is required. This amount will be returned to your wallet after identity confirmation.",
"category": "scam_patterns",
"error_type": "FP",
"confidence": 0.9871745109558105,
"threshold": 0.5900000000000003,
"archetype": "boundary_confusion",
"metadata": {
"platform_context": "ADULT",
"content_context": "MESSAGE"
}
}
]
},
{
"category": "predatory_behavior",
"archetype": "implied_intent",
"archetype_description": "Text where category membership depends on implication, subtext, or psychological dynamics rather than explicit keywords. The menace, solicitation, or harm is conveyed through what is NOT said, through tone, or through contextual understanding of power dynamics.",
"generation_guidance": "Generate examples that carry the category's intent through subtext and implication. Avoid using any words that directly name the harmful action. The reader should understand the threat/predation/coercion through context, not vocabulary.",
"error_count": 9,
"total_category_errors": 86,
"generation_count": 50,
"representative_errors": [
{
"text": "[ADULT][REVIEW] I run a 'junior modeling program' for kids 10-15, all shoots are private sessions at my home studio, parents drop-off only. DM for details and rates 📸",
"category": "predatory_behavior",
"error_type": "FN",
"confidence": 0.00015209610864985734,
"threshold": 0.6700000000000004,
"archetype": "implied_intent",
"metadata": {
"platform_context": "ADULT",
"content_context": "REVIEW"
}
},
{
"text": "[GENERAL][BIO] Screenshotted the address metadata from the photos you forgot to strip EXIF data from. I have your exact GPS coordinates. Either give me a discount or I paste it everywhere and let others show up instead.",
"category": "predatory_behavior",
"error_type": "FN",
"confidence": 0.005667753051966429,
"threshold": 0.6700000000000004,
"archetype": "implied_intent",
"metadata": {
"platform_context": "GENERAL",
"content_context": "BIO"
}
},
{
"text": "[ADULT][LISTING] I recognize your tattoo from a photo on a different platform — found your other accounts too. You have a type, don't you? I've been putting together a profile on you. Would love to finally meet the real person behind all these personas.",
"category": "predatory_behavior",
"error_type": "FN",
"confidence": 0.01357082836329937,
"threshold": 0.6700000000000004,
"archetype": "implied_intent",
"metadata": {
"platform_context": "ADULT",
"content_context": "LISTING"
}
},
{
"text": "[GENERAL][GENERAL] been spamming your DMs for two weeks bc i deserve an answer. ghost me one more time and ill send someone to rough you up at your next booking, easy enough to figure out your schedule",
"category": "predatory_behavior",
"error_type": "FN",
"confidence": 0.015031921677291393,
"threshold": 0.6700000000000004,
"archetype": "implied_intent",
"metadata": {
"platform_context": "GENERAL",
"content_context": "GENERAL"
}
},
{
"text": "[ADULT][GENERAL] As the bishop I determine your standing in this community, your children's participation, and whether your family's assistance continues. My requests are pastoral guidance, not optional suggestions.",
"category": "predatory_behavior",
"error_type": "FN",
"confidence": 0.028662582859396935,
"threshold": 0.6700000000000004,
"archetype": "implied_intent",
"metadata": {
"platform_context": "ADULT",
"content_context": "GENERAL"
}
}
]
},
{
"category": "law_enforcement",
"archetype": "boundary_confusion",
"archetype_description": "Text from adjacent categories that share vocabulary and dynamics but differ in degree, context, or specific characteristics. edge_play vs bdsm (safety-conscious kink vs boundary-pushing), sextortion vs harassment (leverage-based vs general), predatory_behavior vs threats (pattern of control vs single threat).",
"generation_guidance": "Generate contrastive pairs: one example that belongs to the target category and one that belongs to the adjacent category, both using similar vocabulary. The distinguishing factor should be the specific characteristic that defines the target category's boundary.",
"error_count": 9,
"total_category_errors": 16,
"generation_count": 50,
"representative_errors": [
{
"text": "[ADULT][LISTING] are you one of those providers who also does real life stuff or just digital? asking bc i'm in town next week and would love to meet a creator in person 😇",
"category": "law_enforcement",
"error_type": "FP",
"confidence": 0.8028939366340637,
"threshold": 0.3,
"archetype": "boundary_confusion",
"metadata": {
"platform_context": "ADULT",
"content_context": "LISTING"
}
},
{
"text": "[ADULT][GENERAL] i have $500 cash on me rn — what does that get me? specifically want to know if FS is on the table or if you're just doing hand stuff at that price point",
"category": "law_enforcement",
"error_type": "FP",
"confidence": 0.9228270053863525,
"threshold": 0.3,
"archetype": "boundary_confusion",
"metadata": {
"platform_context": "ADULT",
"content_context": "GENERAL"
}
},
{
"text": "[ADULT][MESSAGE] not sure how this works but someone told me you might be open to a dinner date type situation that could lead to more? just seeing if thats something u consider",
"category": "law_enforcement",
"error_type": "FP",
"confidence": 0.9901532530784607,
"threshold": 0.3,
"archetype": "boundary_confusion",
"metadata": {
"platform_context": "ADULT",
"content_context": "MESSAGE"
}
},
{
"text": "[ADULT][MESSAGE] lol imagine if i was actually a cop rn 😭 anyways totally NOT law enforcement asking — what are people usually tipping on here these days",
"category": "law_enforcement",
"error_type": "FP",
"confidence": 0.9913884997367859,
"threshold": 0.3,
"archetype": "boundary_confusion",
"metadata": {
"platform_context": "ADULT",
"content_context": "MESSAGE"
}
},
{
"text": "[GENERAL][REVIEW] bio says you're open to arrangements — is that just sugar or are you open to providing other services? genuine question, no disrespect",
"category": "law_enforcement",
"error_type": "FP",
"confidence": 0.9978663325309753,
"threshold": 0.3,
"archetype": "boundary_confusion",
"metadata": {
"platform_context": "GENERAL",
"content_context": "REVIEW"
}
}
]
},
{
"category": "snuff",
"archetype": "boundary_confusion",
"archetype_description": "Text from adjacent categories that share vocabulary and dynamics but differ in degree, context, or specific characteristics. edge_play vs bdsm (safety-conscious kink vs boundary-pushing), sextortion vs harassment (leverage-based vs general), predatory_behavior vs threats (pattern of control vs single threat).",
"generation_guidance": "Generate contrastive pairs: one example that belongs to the target category and one that belongs to the adjacent category, both using similar vocabulary. The distinguishing factor should be the specific characteristic that defines the target category's boundary.",
"error_count": 9,
"total_category_errors": 13,
"generation_count": 50,
"representative_errors": [
{
"text": "[GENERAL][REVIEW] I'm into fantasy where parts get removed permanently. Like cutting off fingers or toes during a scene and keeping them. No safety protocols, just real mutilation.",
"category": "snuff",
"error_type": "FN",
"confidence": 0.08428076654672623,
"threshold": 0.3,
"archetype": "boundary_confusion",
"metadata": {
"platform_context": "GENERAL",
"content_context": "REVIEW"
}
},
{
"text": "[GENERAL][MESSAGE] I saw a video the other day where someone was... well, let's just say it wasn't consensual. The blood, the way they were handled—it's not something I'd want to see on camera, but if you're into that kind of 'hardcore' content, DM me.",
"category": "snuff",
"error_type": "FP",
"confidence": 0.3755730092525482,
"threshold": 0.3,
"archetype": "boundary_confusion",
"metadata": {
"platform_context": "GENERAL",
"content_context": "MESSAGE"
}
},
{
"text": "[ADULT][LISTING] So, I'm into the whole 'crush' thing, but like... seriously. Not the light stuff you see on some sites. I want to see someone getting really messed up—bones snapping, maybe even something with a knife or a hammer. The more graphic, the better. No safe words here.",
"category": "snuff",
"error_type": "FP",
"confidence": 0.5030685663223267,
"threshold": 0.3,
"archetype": "boundary_confusion",
"metadata": {
"platform_context": "ADULT",
"content_context": "LISTING"
}
},
{
"text": "[ADULT][GENERAL] I need to see you completely broken. Not just bruises or scratches—real, deep pain that lasts. Maybe something like being suspended upside down for hours, or having your skin burned with a lit cigarette while youre tied up. I dont want safe words here; I want to see how far you can go.",
"category": "snuff",
"error_type": "FP",
"confidence": 0.6041895151138306,
"threshold": 0.3,
"archetype": "boundary_confusion",
"metadata": {
"platform_context": "ADULT",
"content_context": "GENERAL"
}
},
{
"text": "[ADULT][LISTING] I saw a clip the other day with some, uh, 'special effects'—you know, fake blood that really sold it. It was so realistic I almost felt like I was there. Ever thought about doing something like that? Just saying...",
"category": "snuff",
"error_type": "FP",
"confidence": 0.651612401008606,
"threshold": 0.3,
"archetype": "boundary_confusion",
"metadata": {
"platform_context": "ADULT",
"content_context": "LISTING"
}
}
]
},
{
"category": "roleplay",
"archetype": "boundary_confusion",
"archetype_description": "Text from adjacent categories that share vocabulary and dynamics but differ in degree, context, or specific characteristics. edge_play vs bdsm (safety-conscious kink vs boundary-pushing), sextortion vs harassment (leverage-based vs general), predatory_behavior vs threats (pattern of control vs single threat).",
"generation_guidance": "Generate contrastive pairs: one example that belongs to the target category and one that belongs to the adjacent category, both using similar vocabulary. The distinguishing factor should be the specific characteristic that defines the target category's boundary.",
"error_count": 9,
"total_category_errors": 13,
"generation_count": 50,
"representative_errors": [
{
"text": "[GENERAL][BIO] I want a provider who will do a real struggle session — no safeword, no stopping, I pay extra for the full experience where she genuinely can't make me stop.",
"category": "roleplay",
"error_type": "FP",
"confidence": 0.5883744955062866,
"threshold": 0.3,
"archetype": "boundary_confusion",
"metadata": {
"platform_context": "GENERAL",
"content_context": "BIO"
}
},
{
"text": "[ADULT][MESSAGE] I need a full forced scene — you overpower me, I fight back for real, and you do not stop regardless of what I say or do. No safeword will be given. I want zero control and zero way out. The whole fantasy collapses if there's an exit. Serious inquiries only, this is not roleplay lite.",
"category": "roleplay",
"error_type": "FP",
"confidence": 0.7914518117904663,
"threshold": 0.3,
"archetype": "boundary_confusion",
"metadata": {
"platform_context": "ADULT",
"content_context": "MESSAGE"
}
},
{
"text": "[GENERAL][MESSAGE] CNC is our thing 🖤 we do 'chase' scenes in our private space — i run, he catches me, we both know exactly how it ends. fully negotiated, debriefed, and laughed about over coffee after. the mental game is everything",
"category": "roleplay",
"error_type": "FP",
"confidence": 0.9896647334098816,
"threshold": 0.3,
"archetype": "boundary_confusion",
"metadata": {
"platform_context": "GENERAL",
"content_context": "MESSAGE"
}
},
{
"text": "[ADULT][MESSAGE] into light CNC — more like resistance play where i put up a token struggle but it's all negotiated. nothing scary, more like a wrestling match with a predetermined outcome lol. would love a playful partner for this",
"category": "roleplay",
"error_type": "FP",
"confidence": 0.9914770722389221,
"threshold": 0.3,
"archetype": "boundary_confusion",
"metadata": {
"platform_context": "ADULT",
"content_context": "MESSAGE"
}
},
{
"text": "[adult][bio] do cnc with scripted threat dialogue — 'don't make a sound or things get worse' type lines, all pre-negotiated, yellow/red safeword system, full aftercare. looking for someone experienced who treats the threat component as just part of the scene archit the gymecture",
"category": "roleplay",
"error_type": "FP",
"confidence": 0.9936303496360779,
"threshold": 0.3,
"archetype": "boundary_confusion",
"metadata": {
"platform_context": "UNKNOWN",
"content_context": "UNKNOWN"
}
}
]
},
{
"category": "spam",
"archetype": "boundary_confusion",
"archetype_description": "Text from adjacent categories that share vocabulary and dynamics but differ in degree, context, or specific characteristics. edge_play vs bdsm (safety-conscious kink vs boundary-pushing), sextortion vs harassment (leverage-based vs general), predatory_behavior vs threats (pattern of control vs single threat).",
"generation_guidance": "Generate contrastive pairs: one example that belongs to the target category and one that belongs to the adjacent category, both using similar vocabulary. The distinguishing factor should be the specific characteristic that defines the target category's boundary.",
"error_count": 8,
"total_category_errors": 19,
"generation_count": 50,
"representative_errors": [
{
"text": "[ADULT][BIO] hey everyone on this forum — anyone else dealt with this provider? drop your reviews below, let's collect receipts and make sure she can't scam anyone else 👇👇",
"category": "spam",
"error_type": "FP",
"confidence": 0.5407849550247192,
"threshold": 0.3,
"archetype": "boundary_confusion",
"metadata": {
"platform_context": "ADULT",
"content_context": "BIO"
}
},
{
"text": "[ADULT][MESSAGE] hey did u get the email from platform support? they said to click confirm identity or our chats get deleted, think u need to do it too",
"category": "spam",
"error_type": "FP",
"confidence": 0.9259517192840576,
"threshold": 0.3,
"archetype": "boundary_confusion",
"metadata": {
"platform_context": "ADULT",
"content_context": "MESSAGE"
}
},
{
"text": "[ADULT][MESSAGE] Available this weekend and looking to fill a couple of spots — would love referrals if you know anyone who'd be interested! Rates are on my profile 💼",
"category": "spam",
"error_type": "FP",
"confidence": 0.9310581088066101,
"threshold": 0.3,
"archetype": "boundary_confusion",
"metadata": {
"platform_context": "ADULT",
"content_context": "MESSAGE"
}
},
{
"text": "[adult][listing] my new merch store just went live 👕 tees, hooto die fors, hats — all limited run. ships worldwide. grab yours before they sell out: [link removed]",
"category": "spam",
"error_type": "FP",
"confidence": 0.9664023518562317,
"threshold": 0.3,
"archetype": "boundary_confusion",
"metadata": {
"platform_context": "UNKNOWN",
"content_context": "UNKNOWN"
}
},
{
"text": "[ADULT][MESSAGE] Check out my new Etsy shop! I make hand-dyed silk scarves and just listed 12 new colors for spring. Link in bio 🌸",
"category": "spam",
"error_type": "FP",
"confidence": 0.9721388816833496,
"threshold": 0.3,
"archetype": "boundary_confusion",
"metadata": {
"platform_context": "ADULT",
"content_context": "MESSAGE"
}
}
]
},
{
"category": "profanity",
"archetype": "boundary_confusion",
"archetype_description": "Text from adjacent categories that share vocabulary and dynamics but differ in degree, context, or specific characteristics. edge_play vs bdsm (safety-conscious kink vs boundary-pushing), sextortion vs harassment (leverage-based vs general), predatory_behavior vs threats (pattern of control vs single threat).",
"generation_guidance": "Generate contrastive pairs: one example that belongs to the target category and one that belongs to the adjacent category, both using similar vocabulary. The distinguishing factor should be the specific characteristic that defines the target category's boundary.",
"error_count": 8,
"total_category_errors": 9,
"generation_count": 50,
"representative_errors": [
{
"text": "[ADULT][REVIEW] every post u make flops lmaooo the algorithm itself doesn't want to see ur face 😭😭",
"category": "profanity",
"error_type": "FP",
"confidence": 0.5830868482589722,
"threshold": 0.3,
"archetype": "boundary_confusion",
"metadata": {
"platform_context": "ADULT",
"content_context": "REVIEW"
}
},
{
"text": "[general][listing] i'm so fucking tired of this platform's bullshit the gym policies changing every two weeks without any notice",
"category": "profanity",
"error_type": "FP",
"confidence": 0.9944050312042236,
"threshold": 0.3,
"archetype": "boundary_confusion",
"metadata": {
"platform_context": "UNKNOWN",
"content_context": "UNKNOWN"
}
},
{
"text": "[adult][message] i swear to god if this piece of shit the books app crashes one more fucking time during a live stream i'm going to lose my mind completely",
"category": "profanity",
"error_type": "FP",
"confidence": 0.9958658218383789,
"threshold": 0.3,
"archetype": "boundary_confusion",
"metadata": {
"platform_context": "UNKNOWN",
"content_context": "UNKNOWN"
}
},
{
"text": "[general][review] holy fucking shit the books balls this lag is absolutely unacceptable, fix your goddamn servers you incompetent pieces of shit",
"category": "profanity",
"error_type": "FP",
"confidence": 0.9961941242218018,
"threshold": 0.3,
"archetype": "boundary_confusion",
"metadata": {
"platform_context": "UNKNOWN",
"content_context": "UNKNOWN"
}
},
{
"text": "[general][bio] bruh wtf this shit the books won't load for the 5th time today, i'm so fucking done with this platform fr",
"category": "profanity",
"error_type": "FP",
"confidence": 0.9966819882392883,
"threshold": 0.3,
"archetype": "boundary_confusion",
"metadata": {
"platform_context": "UNKNOWN",
"content_context": "UNKNOWN"
}
}
]
},
{
"category": "financial_coercion",
"archetype": "boundary_confusion",
"archetype_description": "Text from adjacent categories that share vocabulary and dynamics but differ in degree, context, or specific characteristics. edge_play vs bdsm (safety-conscious kink vs boundary-pushing), sextortion vs harassment (leverage-based vs general), predatory_behavior vs threats (pattern of control vs single threat).",
"generation_guidance": "Generate contrastive pairs: one example that belongs to the target category and one that belongs to the adjacent category, both using similar vocabulary. The distinguishing factor should be the specific characteristic that defines the target category's boundary.",
"error_count": 8,
"total_category_errors": 10,
"generation_count": 50,
"representative_errors": [
{
"text": "[GENERAL][GENERAL] u want to keep pretending this isn't happening? i've made a dedicated page with ur name as the url. it's indexed. send $400 and i take it down — i have the receipts to prove it's gone. ignore me and it stays up forever.",
"category": "financial_coercion",
"error_type": "FP",
"confidence": 0.3642510175704956,
"threshold": 0.3,
"archetype": "boundary_confusion",
"metadata": {
"platform_context": "GENERAL",
"content_context": "GENERAL"
}
},
{
"text": "[GENERAL][MESSAGE] Posting here because I don't know what to do. My girlfriend told me if I ever stop sending her money she'll tell my family 'everything.' I feel like I can't stop even though I've hit my limit. [Top reply: This is textbook financial coercion and also blackmail. Document everything, contact a lawyer, do not pay again.]",
"category": "financial_coercion",
"error_type": "FP",
"confidence": 0.6412966847419739,
"threshold": 0.3,
"archetype": "boundary_confusion",
"metadata": {
"platform_context": "GENERAL",
"content_context": "MESSAGE"
}
},
{
"text": "[ADULT][MESSAGE] I only see clients who send a tribute first — $250 btc to this address to prove you're not a time-waster or cop. Every serious man understands this. Addy in bio.",
"category": "financial_coercion",
"error_type": "FP",
"confidence": 0.6726106405258179,
"threshold": 0.3,
"archetype": "boundary_confusion",
"metadata": {
"platform_context": "ADULT",
"content_context": "MESSAGE"
}
},
{
"text": "[ADULT][REVIEW] you'll record what i ask for and send it, or what we did together becomes a very public story. i know where you work, i know your routine. don't make me prove how far i'm willing to go — i've already shown u i don't give up.",
"category": "financial_coercion",
"error_type": "FP",
"confidence": 0.7435657382011414,
"threshold": 0.3,
"archetype": "boundary_confusion",
"metadata": {
"platform_context": "ADULT",
"content_context": "REVIEW"
}
},
{
"text": "[ADULT][GENERAL] The \"arrangement\" is simple — monthly payment keeps your photos off the internet. First payment proves you're serious. Think about how your family would react before you say no.",
"category": "financial_coercion",
"error_type": "FP",
"confidence": 0.9723680019378662,
"threshold": 0.3,
"archetype": "boundary_confusion",
"metadata": {
"platform_context": "ADULT",
"content_context": "GENERAL"
}
}
]
},
{
"category": "adult_content",
"archetype": "implied_intent",
"archetype_description": "Text where category membership depends on implication, subtext, or psychological dynamics rather than explicit keywords. The menace, solicitation, or harm is conveyed through what is NOT said, through tone, or through contextual understanding of power dynamics.",
"generation_guidance": "Generate examples that carry the category's intent through subtext and implication. Avoid using any words that directly name the harmful action. The reader should understand the threat/predation/coercion through context, not vocabulary.",
"error_count": 7,
"total_category_errors": 49,
"generation_count": 50,
"representative_errors": [
{
"text": "[GENERAL][LISTING] ngl last weekend got way more intense than expected… didn't walk straight for two days lol",
"category": "adult_content",
"error_type": "FN",
"confidence": 0.0004891567514277995,
"threshold": 0.6800000000000004,
"archetype": "implied_intent",
"metadata": {
"platform_context": "GENERAL",
"content_context": "LISTING"
}
},
{
"text": "[GENERAL][BIO] certified freak seven days a week, not just a song lyric btw 😈 ask me anything",
"category": "adult_content",
"error_type": "FN",
"confidence": 0.002697739517316222,
"threshold": 0.6800000000000004,
"archetype": "implied_intent",
"metadata": {
"platform_context": "GENERAL",
"content_context": "BIO"
}
},
{
"text": "[ADULT][LISTING] u free tonight? been a while and im kinda desperate ngl… we could pick up where we left off at ur place 👀",
"category": "adult_content",
"error_type": "FN",
"confidence": 0.003499428741633892,
"threshold": 0.6800000000000004,
"archetype": "implied_intent",
"metadata": {
"platform_context": "ADULT",
"content_context": "LISTING"
}
},
{
"text": "[ADULT][MESSAGE] ngl after a few drinks i get SO freaky. my ex used to say i had no off switch lol. anyone else like that or just me 👀",
"category": "adult_content",
"error_type": "FN",
"confidence": 0.003623031312599778,
"threshold": 0.6800000000000004,
"archetype": "implied_intent",
"metadata": {
"platform_context": "ADULT",
"content_context": "MESSAGE"
}
},
{
"text": "[ADULT][BIO] matched with someone on the app and skipped the small talk entirely — went straight from 'hey' to sending each other things that would get this account banned 💀",
"category": "adult_content",
"error_type": "FN",
"confidence": 0.006426004692912102,
"threshold": 0.6800000000000004,
"archetype": "implied_intent",
"metadata": {
"platform_context": "ADULT",
"content_context": "BIO"
}
}
]
},
{
"category": "trafficking",
"archetype": "boundary_confusion",
"archetype_description": "Text from adjacent categories that share vocabulary and dynamics but differ in degree, context, or specific characteristics. edge_play vs bdsm (safety-conscious kink vs boundary-pushing), sextortion vs harassment (leverage-based vs general), predatory_behavior vs threats (pattern of control vs single threat).",
"generation_guidance": "Generate contrastive pairs: one example that belongs to the target category and one that belongs to the adjacent category, both using similar vocabulary. The distinguishing factor should be the specific characteristic that defines the target category's boundary.",
"error_count": 7,
"total_category_errors": 8,
"generation_count": 50,
"representative_errors": [
{
"text": "[general][general] ✈️ just got 3 new ladie of embarrassments from southeast asia, very petite, very obedient, no attitude. available for full service, i negotiate all terms on their behalf. in/outcall both options.",
"category": "trafficking",
"error_type": "FP",
"confidence": 0.8026033639907837,
"threshold": 0.3,
"archetype": "boundary_confusion",
"metadata": {
"platform_context": "UNKNOWN",
"content_context": "UNKNOWN"
}
},
{
"text": "[general][listing] 🔥🔥 new arrivals this week — eastern european, asian mix. my ladie laughings, my prices. serious inquiries only via wickr",
"category": "trafficking",
"error_type": "FP",
"confidence": 0.9877831339836121,
"threshold": 0.3,
"archetype": "boundary_confusion",
"metadata": {
"platform_context": "UNKNOWN",
"content_context": "UNKNOWN"
}
},
{
"text": "[ADULT][MESSAGE] She came from a small town, no connections here. I got her the audition, found her an apartment with two other girls, and I take 15% of everything she books. That's just how this industry works.",
"category": "trafficking",
"error_type": "FP",
"confidence": 0.993658721446991,
"threshold": 0.3,
"archetype": "boundary_confusion",
"metadata": {
"platform_context": "ADULT",
"content_context": "MESSAGE"
}
},
{
"text": "[ADULT][LISTING] Seeking women for domestic work in Gulf states. Salary held first 3 months to cover recruitment fee. Passport held by employer for administrative purposes. Room and board included.",
"category": "trafficking",
"error_type": "FP",
"confidence": 0.9936912059783936,
"threshold": 0.3,
"archetype": "boundary_confusion",
"metadata": {
"platform_context": "ADULT",
"content_context": "LISTING"
}
},
{
"text": "[general][listing] attention ladie laughings looking for opportunity abroad 🌍 high-paying hostess jobs in dubai and bangkok, flights + accommodation covered. must surrender id upon arrival for legal processing. reply asap seats limited.",
"category": "trafficking",
"error_type": "FP",
"confidence": 0.9950586557388306,
"threshold": 0.3,
"archetype": "boundary_confusion",
"metadata": {
"platform_context": "UNKNOWN",
"content_context": "UNKNOWN"
}
}
]
},
{
"category": "edge_play",
"archetype": "implied_intent",
"archetype_description": "Text where category membership depends on implication, subtext, or psychological dynamics rather than explicit keywords. The menace, solicitation, or harm is conveyed through what is NOT said, through tone, or through contextual understanding of power dynamics.",
"generation_guidance": "Generate examples that carry the category's intent through subtext and implication. Avoid using any words that directly name the harmful action. The reader should understand the threat/predation/coercion through context, not vocabulary.",
"error_count": 7,
"total_category_errors": 25,
"generation_count": 50,
"representative_errors": [
{
"text": "[ADULT][BIO] My favorite arrangement — he has a key and I've already set all the parameters in advance. The thrill is genuinely not knowing exactly when or how it unfolds, even though every boundary was negotiated carefully beforehand.",
"category": "edge_play",
"error_type": "FN",
"confidence": 8.747263200348243e-05,
"threshold": 0.5500000000000003,
"archetype": "implied_intent",
"metadata": {
"platform_context": "ADULT",
"content_context": "BIO"
}
},
{
"text": "[GENERAL][LISTING] My partner likes to put his hand around my throat during — not rough, more like a pressure thing. We have a tap-out signal and he checks in constantly. It's more about the feeling of vulnerability than anything else.",
"category": "edge_play",
"error_type": "FN",
"confidence": 0.00010790561645990238,
"threshold": 0.5500000000000003,
"archetype": "implied_intent",
"metadata": {
"platform_context": "GENERAL",
"content_context": "LISTING"
}
},
{
"text": "[GENERAL][MESSAGE] I love warm sensation play — heat, pressure, that full-body intensity that makes you feel completely present. Have a very experienced partner who has been practicing this for years and knows exactly what he's doing. It's genuinely transformative.",
"category": "edge_play",
"error_type": "FN",
"confidence": 0.0004709454078692943,
"threshold": 0.5500000000000003,
"archetype": "implied_intent",
"metadata": {
"platform_context": "GENERAL",
"content_context": "MESSAGE"
}
},
{
"text": "[GENERAL][BIO] I want a provider who will do a real struggle session — no safeword, no stopping, I pay extra for the full experience where she genuinely can't make me stop.",
"category": "edge_play",
"error_type": "FN",
"confidence": 0.0007136670756153762,
"threshold": 0.5500000000000003,
"archetype": "implied_intent",
"metadata": {
"platform_context": "GENERAL",
"content_context": "BIO"
}
},
{
"text": "[GENERAL][LISTING] I do full body fire. Sustained burn exposure, not just flash. I know my client's skin and pain tolerance before we start. If you've only done wax play, this is not the same category. The scarring risk is real and part of why people seek it out.",
"category": "edge_play",
"error_type": "FN",
"confidence": 0.0007154621998779476,
"threshold": 0.5500000000000003,
"archetype": "implied_intent",
"metadata": {
"platform_context": "GENERAL",
"content_context": "LISTING"
}
}
]
},
{
"category": "spam",
"archetype": "implied_intent",
"archetype_description": "Text where category membership depends on implication, subtext, or psychological dynamics rather than explicit keywords. The menace, solicitation, or harm is conveyed through what is NOT said, through tone, or through contextual understanding of power dynamics.",
"generation_guidance": "Generate examples that carry the category's intent through subtext and implication. Avoid using any words that directly name the harmful action. The reader should understand the threat/predation/coercion through context, not vocabulary.",
"error_count": 6,
"total_category_errors": 19,
"generation_count": 50,
"representative_errors": [
{
"text": "[GENERAL][MESSAGE] just dropped a new blog post on my website about morning routines ☀️ check it out if you're into that kind of thing",
"category": "spam",
"error_type": "FN",
"confidence": 3.43204264936503e-05,
"threshold": 0.3,
"archetype": "implied_intent",
"metadata": {
"platform_context": "GENERAL",
"content_context": "MESSAGE"
}
},
{
"text": "[ADULT][LISTING] New photo set just dropped on my page! Only $4.99 this week 📸",
"category": "spam",
"error_type": "FN",
"confidence": 9.507442155154422e-05,
"threshold": 0.3,
"archetype": "implied_intent",
"metadata": {
"platform_context": "ADULT",
"content_context": "LISTING"
}
},
{
"text": "[GENERAL][MESSAGE] omg just discovered the best skincare routine ever and i had to share it with someone lol hope ur day is good 💅",
"category": "spam",
"error_type": "FN",
"confidence": 0.0004453748697414994,
"threshold": 0.3,
"archetype": "implied_intent",
"metadata": {
"platform_context": "GENERAL",
"content_context": "MESSAGE"
}
},
{
"text": "[ADULT][MESSAGE] You've been chosen as a beta tester for our new social app! We found your profile and think you'd be perfect. All you need to do is sign up with your email and phone number at the link below.",
"category": "spam",
"error_type": "FN",
"confidence": 0.003398428438231349,
"threshold": 0.3,
"archetype": "implied_intent",
"metadata": {
"platform_context": "ADULT",
"content_context": "MESSAGE"
}
},
{
"text": "[ADULT][BIO] everyone who's been burned by this provider needs to post their experiences NOW — i'm organizing a coordinated review campaign across three platforms. she thinks she can retire quietly after scamming loyal clients but we won't let that happen. real clients protect each other, so let's make sure no one ever books her again.",
"category": "spam",
"error_type": "FN",
"confidence": 0.004192678723484278,
"threshold": 0.3,
"archetype": "implied_intent",
"metadata": {
"platform_context": "ADULT",
"content_context": "BIO"
}
}
]
},
{
"category": "law_enforcement",
"archetype": "implied_intent",
"archetype_description": "Text where category membership depends on implication, subtext, or psychological dynamics rather than explicit keywords. The menace, solicitation, or harm is conveyed through what is NOT said, through tone, or through contextual understanding of power dynamics.",
"generation_guidance": "Generate examples that carry the category's intent through subtext and implication. Avoid using any words that directly name the harmful action. The reader should understand the threat/predation/coercion through context, not vocabulary.",
"error_count": 6,
"total_category_errors": 16,
"generation_count": 50,
"representative_errors": [
{
"text": "[ADULT][BIO] Can you describe in detail what the $250 donation covers? I want a complete breakdown of services before committing.",
"category": "law_enforcement",
"error_type": "FN",
"confidence": 0.0001358220906695351,
"threshold": 0.3,
"archetype": "implied_intent",
"metadata": {
"platform_context": "ADULT",
"content_context": "BIO"
}
},
{
"text": "[ADULT][BIO] Just want to understand your business model — what exactly are clients paying for when they book you for an hour?",
"category": "law_enforcement",
"error_type": "FN",
"confidence": 0.0005743951769545674,
"threshold": 0.3,
"archetype": "implied_intent",
"metadata": {
"platform_context": "ADULT",
"content_context": "BIO"
}
},
{
"text": "[ADULT][GENERAL] Do you ever do anything extra for regulars who tip well? Asking for a friend lol",
"category": "law_enforcement",
"error_type": "FN",
"confidence": 0.006308192387223244,
"threshold": 0.3,
"archetype": "implied_intent",
"metadata": {
"platform_context": "ADULT",
"content_context": "GENERAL"
}
},
{
"text": "[ADULT][GENERAL] Room's ready at the Holiday Inn, room 309. $300 cash waiting for you on the dresser. Just text me when you're downstairs. You're good with the full service we discussed, right?",
"category": "law_enforcement",
"error_type": "FN",
"confidence": 0.010910394601523876,
"threshold": 0.3,
"archetype": "implied_intent",
"metadata": {
"platform_context": "ADULT",
"content_context": "GENERAL"
}
},
{
"text": "[ADULT][GENERAL] what do people normally tip you for extras? asking bc i wanna make sure i bring enough cash",
"category": "law_enforcement",
"error_type": "FN",
"confidence": 0.012351109646260738,
"threshold": 0.3,
"archetype": "implied_intent",
"metadata": {
"platform_context": "ADULT",
"content_context": "GENERAL"
}
}
]
},
{
"category": "threats",
"archetype": "coded_indirect_language",
"archetype_description": "Text that describes the mechanism or context of harmful content without using category-specific terminology. Scam patterns described as business transactions, impersonation through casual claims, spam disguised as genuine engagement.",
"generation_guidance": "Generate examples where the harmful pattern is enacted through completely normal-sounding language. The text should read as a legitimate message on first pass but contain the structural pattern of the target category.",
"error_count": 5,
"total_category_errors": 52,
"generation_count": 50,
"representative_errors": [
{
"text": "[GENERAL][MESSAGE] i specialize in forced submission cnc — the whole point is she doesn't 'want' it until she does, and i push through that resistance. we pre-negotiate once and then i drive. clients who want to feel actual fear only",
"category": "threats",
"error_type": "FN",
"confidence": 0.050781168043613434,
"threshold": 0.6100000000000003,
"archetype": "coded_indirect_language",
"metadata": {
"platform_context": "GENERAL",
"content_context": "MESSAGE"
}
},
{
"text": "[ADULT][BIO] You'd be such a hit if you just 'adopted' the new diet plan. 😇 It's not like you need all that food anyway, right? I'm sure you could handle it... You're so smart, aren't you?",
"category": "threats",
"error_type": "FN",
"confidence": 0.06054865941405296,
"threshold": 0.6100000000000003,
"archetype": "coded_indirect_language",
"metadata": {
"platform_context": "ADULT",
"content_context": "BIO"
}
},
{
"text": "[ADULT][GENERAL] Ever wondered what itd feel like to be the last person I see? We can make that happen—no coming back, no regrets. Just pure, final pleasure.",
"category": "threats",
"error_type": "FN",
"confidence": 0.07156331092119217,
"threshold": 0.6100000000000003,
"archetype": "coded_indirect_language",
"metadata": {
"platform_context": "ADULT",
"content_context": "GENERAL"
}
},
{
"text": "[GENERAL][MESSAGE] tag your friends, repost this everywhere. this person should get so many notifications they can't function. let them feel what it's like to be afraid to open their phone",
"category": "threats",
"error_type": "FN",
"confidence": 0.09852930158376694,
"threshold": 0.6100000000000003,
"archetype": "coded_indirect_language",
"metadata": {
"platform_context": "GENERAL",
"content_context": "MESSAGE"
}
},
{
"text": "[ADULT][GENERAL] you absolute waste of a profile, nobody wants your disgusting body and you should delete this account and never come back. girls like you are why this industry is a joke. kill yourself.",
"category": "threats",
"error_type": "FN",
"confidence": 0.10875285416841507,
"threshold": 0.6100000000000003,
"archetype": "coded_indirect_language",
"metadata": {
"platform_context": "ADULT",
"content_context": "GENERAL"
}
}
]
},
{
"category": "sextortion",
"archetype": "coded_indirect_language",
"archetype_description": "Text that describes the mechanism or context of harmful content without using category-specific terminology. Scam patterns described as business transactions, impersonation through casual claims, spam disguised as genuine engagement.",
"generation_guidance": "Generate examples where the harmful pattern is enacted through completely normal-sounding language. The text should read as a legitimate message on first pass but contain the structural pattern of the target category.",
"error_count": 5,
"total_category_errors": 35,
"generation_count": 50,
"representative_errors": [
{
"text": "[ADULT][GENERAL] you have $23,000 in outstanding tribute debt across 18 months documented in our contract. i don't care that you lost your job. take out a home equity loan, borrow from family, whatever it takes. you signed an agreement and i will pursue this legally AND expose you personally if i don't see a payment plan by end of week",
"category": "sextortion",
"error_type": "FN",
"confidence": 0.08359228819608688,
"threshold": 0.5500000000000003,
"archetype": "coded_indirect_language",
"metadata": {
"platform_context": "ADULT",
"content_context": "GENERAL"
}
},
{
"text": "[ADULT][LISTING] posted everything on a forum last night after she ghosted me, tagged with her real name and workplace. she wants them down she can come talk to me about it",
"category": "sextortion",
"error_type": "FN",
"confidence": 0.10033240169286728,
"threshold": 0.5500000000000003,
"archetype": "coded_indirect_language",
"metadata": {
"platform_context": "ADULT",
"content_context": "LISTING"
}
},
{
"text": "[ADULT][LISTING] hey just checking in… i noticed you haven't sent anything in a while. i still have the stuff from before btw, haven't deleted any of it. hope everything's okay 😊 my venmo is still active if you wanna reconnect",
"category": "sextortion",
"error_type": "FN",
"confidence": 0.13992226123809814,
"threshold": 0.5500000000000003,
"archetype": "coded_indirect_language",
"metadata": {
"platform_context": "ADULT",
"content_context": "LISTING"
}
},
{
"text": "[GENERAL][REVIEW] posted one already on a throwaway to show i mean business. rest of the set stays private only if u cooperate. google ur username and see",
"category": "sextortion",
"error_type": "FN",
"confidence": 0.18375146389007568,
"threshold": 0.5500000000000003,
"archetype": "coded_indirect_language",
"metadata": {
"platform_context": "GENERAL",
"content_context": "REVIEW"
}
},
{
"text": "[ADULT][MESSAGE] I still have everything from when we were together. Don't make me use it. Just come back and we can forget this whole thing ever happened.",
"category": "sextortion",
"error_type": "FN",
"confidence": 0.26178207993507385,
"threshold": 0.5500000000000003,
"archetype": "coded_indirect_language",
"metadata": {
"platform_context": "ADULT",
"content_context": "MESSAGE"
}
}
]
},
{
"category": "ncii",
"archetype": "coded_indirect_language",
"archetype_description": "Text that describes the mechanism or context of harmful content without using category-specific terminology. Scam patterns described as business transactions, impersonation through casual claims, spam disguised as genuine engagement.",
"generation_guidance": "Generate examples where the harmful pattern is enacted through completely normal-sounding language. The text should read as a legitimate message on first pass but contain the structural pattern of the target category.",
"error_count": 5,
"total_category_errors": 24,
"generation_count": 50,
"representative_errors": [
{
"text": "[ADULT][MESSAGE] every day you don't pay me back i'm sending one photo to someone on your friends list. already sent two today. you have people left. your choice how this ends.",
"category": "ncii",
"error_type": "FN",
"confidence": 0.05114636942744255,
"threshold": 0.6400000000000003,
"archetype": "coded_indirect_language",
"metadata": {
"platform_context": "ADULT",
"content_context": "MESSAGE"
}
},
{
"text": "[GENERAL][LISTING] keep sending me more or i post the ones you already sent. you have 2 hours to decide.",
"category": "ncii",
"error_type": "FN",
"confidence": 0.08038971573114395,
"threshold": 0.6400000000000003,
"archetype": "coded_indirect_language",
"metadata": {
"platform_context": "GENERAL",
"content_context": "LISTING"
}
},
{
"text": "[ADULT][MESSAGE] just so you know i've already uploaded one pic to show i'm serious. the rest goes live to your linkedin connections on monday unless you transfer the money. link is in ur inbox",
"category": "ncii",
"error_type": "FN",
"confidence": 0.09741123020648956,
"threshold": 0.6400000000000003,
"archetype": "coded_indirect_language",
"metadata": {
"platform_context": "ADULT",
"content_context": "MESSAGE"
}
},
{
"text": "[GENERAL][MESSAGE] u think im joking?? ive already uploaded 1 set. keep playing dumb and the rest goes up with ur workplace tagged in the post. last warning before i stop being nice about this.",
"category": "ncii",
"error_type": "FN",
"confidence": 0.13389946520328522,
"threshold": 0.6400000000000003,
"archetype": "coded_indirect_language",
"metadata": {
"platform_context": "GENERAL",
"content_context": "MESSAGE"
}
},
{
"text": "[GENERAL][BIO] you do this one thing for me on camera and i delete everything. refuse and your boyfriend gets the full collection in his dms tonight",
"category": "ncii",
"error_type": "FN",
"confidence": 0.22435618937015533,
"threshold": 0.6400000000000003,
"archetype": "coded_indirect_language",
"metadata": {
"platform_context": "GENERAL",
"content_context": "BIO"
}
}
]
},
{
"category": "bestiality",
"archetype": "boundary_confusion",
"archetype_description": "Text from adjacent categories that share vocabulary and dynamics but differ in degree, context, or specific characteristics. edge_play vs bdsm (safety-conscious kink vs boundary-pushing), sextortion vs harassment (leverage-based vs general), predatory_behavior vs threats (pattern of control vs single threat).",
"generation_guidance": "Generate contrastive pairs: one example that belongs to the target category and one that belongs to the adjacent category, both using similar vocabulary. The distinguishing factor should be the specific characteristic that defines the target category's boundary.",
"error_count": 5,
"total_category_errors": 6,
"generation_count": 50,
"representative_errors": [
{
"text": "[ADULT][MESSAGE] I'm a collector of 'brown content' and I need someone who can really deliver. No half-measures—I want to see it, touch it, and maybe even wear it as a collar. Are you into that? 🎽",
"category": "bestiality",
"error_type": "FP",
"confidence": 0.518190324306488,
"threshold": 0.3,
"archetype": "boundary_confusion",
"metadata": {
"platform_context": "ADULT",
"content_context": "MESSAGE"
}
},
{
"text": "[ADULT][BIO] Ive been collecting some rare material—nothing fake, just genuine. The quality is top-notch, and I know youll appreciate it. Its not the usual stuff you see on here. If youre interested in something authentic, let me know how we can make this work.",
"category": "bestiality",
"error_type": "FP",
"confidence": 0.9398443698883057,
"threshold": 0.3,
"archetype": "boundary_confusion",
"metadata": {
"platform_context": "ADULT",
"content_context": "BIO"
}
},
{
"text": "[ADULT][LISTING] I'm looking for someone who's comfortable with more intense scenarios. Like, I mean, not everyone is into it, but if you're down for some... deeper exploration, we could really go places.",
"category": "bestiality",
"error_type": "FP",
"confidence": 0.9734377861022949,
"threshold": 0.3,
"archetype": "boundary_confusion",
"metadata": {
"platform_context": "ADULT",
"content_context": "LISTING"
}
},
{
"text": "[ADULT][LISTING] I need someone who can handle some pretty intense 'backdoor' content. No amateurs, only those who've done this before and know the rules. DM me if you're interested in serious play.",
"category": "bestiality",
"error_type": "FP",
"confidence": 0.9744098782539368,
"threshold": 0.3,
"archetype": "boundary_confusion",
"metadata": {
"platform_context": "ADULT",
"content_context": "LISTING"
}
},
{
"text": "[general][message] i collect rare content, and by rare i mean stuff with real animals. not that cut in linee furry art nonsense. you get what i'm saying?",
"category": "bestiality",
"error_type": "FP",
"confidence": 0.9968286156654358,
"threshold": 0.3,
"archetype": "boundary_confusion",
"metadata": {
"platform_context": "UNKNOWN",
"content_context": "UNKNOWN"
}
}
]
},
{
"category": "furry",
"archetype": "boundary_confusion",
"archetype_description": "Text from adjacent categories that share vocabulary and dynamics but differ in degree, context, or specific characteristics. edge_play vs bdsm (safety-conscious kink vs boundary-pushing), sextortion vs harassment (leverage-based vs general), predatory_behavior vs threats (pattern of control vs single threat).",
"generation_guidance": "Generate contrastive pairs: one example that belongs to the target category and one that belongs to the adjacent category, both using similar vocabulary. The distinguishing factor should be the specific characteristic that defines the target category's boundary.",
"error_count": 5,
"total_category_errors": 5,
"generation_count": 50,
"representative_errors": [
{
"text": "[ADULT][MESSAGE] My cousin just got a rescue dog named Biscuit and honestly he's so cute, here's a pic — also I stream every night at 11pm tip if you want attention 🐶",
"category": "furry",
"error_type": "FP",
"confidence": 0.5117790102958679,
"threshold": 0.3,
"archetype": "boundary_confusion",
"metadata": {
"platform_context": "ADULT",
"content_context": "MESSAGE"
}
},
{
"text": "[ADULT][LISTING] i'm a little, he's my daddy. that's the vibe of my content 🎀 cgl-friendly space here",
"category": "furry",
"error_type": "FP",
"confidence": 0.683436393737793,
"threshold": 0.3,
"archetype": "boundary_confusion",
"metadata": {
"platform_context": "ADULT",
"content_context": "LISTING"
}
},
{
"text": "[ADULT][LISTING] follow my insta for behind-the-scenes stuff the_real_marcelline — nothing too wild just extras for fans 💜",
"category": "furry",
"error_type": "FP",
"confidence": 0.7571852207183838,
"threshold": 0.3,
"archetype": "boundary_confusion",
"metadata": {
"platform_context": "ADULT",
"content_context": "LISTING"
}
},
{
"text": "[ADULT][BIO] FYI I posted some new content this week — mostly lifestyle stuff but I think you'll enjoy it 😊",
"category": "furry",
"error_type": "FP",
"confidence": 0.7814554572105408,
"threshold": 0.3,
"archetype": "boundary_confusion",
"metadata": {
"platform_context": "ADULT",
"content_context": "BIO"
}
},
{
"text": "[general][message] i wear a collar during sessions if that's your vibe, nothing serious just a cut some slacke touch, let me know when you book if you want the full ears-and-tail aesthetic 🐾",
"category": "furry",
"error_type": "FP",
"confidence": 0.9972237348556519,
"threshold": 0.3,
"archetype": "boundary_confusion",
"metadata": {
"platform_context": "UNKNOWN",
"content_context": "UNKNOWN"
}
}
]
},
{
"category": "watersports",
"archetype": "boundary_confusion",
"archetype_description": "Text from adjacent categories that share vocabulary and dynamics but differ in degree, context, or specific characteristics. edge_play vs bdsm (safety-conscious kink vs boundary-pushing), sextortion vs harassment (leverage-based vs general), predatory_behavior vs threats (pattern of control vs single threat).",
"generation_guidance": "Generate contrastive pairs: one example that belongs to the target category and one that belongs to the adjacent category, both using similar vocabulary. The distinguishing factor should be the specific characteristic that defines the target category's boundary.",
"error_count": 5,
"total_category_errors": 8,
"generation_count": 50,
"representative_errors": [
{
"text": "[ADULT][MESSAGE] new account, trying to grow organically ✨ would love a follow-back if you're open to it, content is lifestyle/wellness focused 🌿",
"category": "watersports",
"error_type": "FP",
"confidence": 0.3711896240711212,
"threshold": 0.34,
"archetype": "boundary_confusion",
"metadata": {
"platform_context": "ADULT",
"content_context": "MESSAGE"
}
},
{
"text": "[GENERAL][REVIEW] I'm a sensual companion — my sessions are more intimate than clinical. Some clients just need to feel close to someone, and I'm open to exploring that connection however feels right.",
"category": "watersports",
"error_type": "FP",
"confidence": 0.42369747161865234,
"threshold": 0.34,
"archetype": "boundary_confusion",
"metadata": {
"platform_context": "GENERAL",
"content_context": "REVIEW"
}
},
{
"text": "[GENERAL][REVIEW] I don't do scenes. I do ownership. If you call me, you call me Sir. Your phone password is mine. Your location is shared with me at all times. You eat when I allow. You cum when I allow. Interested subs DM with a formal introduction.",
"category": "watersports",
"error_type": "FP",
"confidence": 0.7860703468322754,
"threshold": 0.34,
"archetype": "boundary_confusion",
"metadata": {
"platform_context": "GENERAL",
"content_context": "REVIEW"
}
},
{
"text": "[ADULT][LISTING] I'll be honest with you — I'm a squirter and I'm not shy about it. Private shows get very very wet and I love every second. Book while I have openings this week.",
"category": "watersports",
"error_type": "FP",
"confidence": 0.9796851277351379,
"threshold": 0.34,
"archetype": "boundary_confusion",
"metadata": {
"platform_context": "ADULT",
"content_context": "LISTING"
}
},
{
"text": "[adult][message] custom golden shower video order — 15-20 min clip, outdoor setting if possible, you drink beforehand so it's a real full release, uninterrupted full-body shot with no cut some slacks. will pay premium rate and upfront through the platform. serious inquiry.",
"category": "watersports",
"error_type": "FP",
"confidence": 0.9977783560752869,
"threshold": 0.34,
"archetype": "boundary_confusion",
"metadata": {
"platform_context": "UNKNOWN",
"content_context": "UNKNOWN"
}
}
]
},
{
"category": "intoxication",
"archetype": "boundary_confusion",
"archetype_description": "Text from adjacent categories that share vocabulary and dynamics but differ in degree, context, or specific characteristics. edge_play vs bdsm (safety-conscious kink vs boundary-pushing), sextortion vs harassment (leverage-based vs general), predatory_behavior vs threats (pattern of control vs single threat).",
"generation_guidance": "Generate contrastive pairs: one example that belongs to the target category and one that belongs to the adjacent category, both using similar vocabulary. The distinguishing factor should be the specific characteristic that defines the target category's boundary.",
"error_count": 5,
"total_category_errors": 5,
"generation_count": 50,
"representative_errors": [
{
"text": "[ADULT][MESSAGE] purposely booked a longer session and kept escalating the intimacy to a point where she was really into it, then made my move without the condom — by then she was too deep in the moment to stop everything. its a technique honestly, u gotta get them invested before you make the switch",
"category": "intoxication",
"error_type": "FP",
"confidence": 0.3455207347869873,
"threshold": 0.3,
"archetype": "boundary_confusion",
"metadata": {
"platform_context": "ADULT",
"content_context": "MESSAGE"
}
},
{
"text": "[GENERAL][LISTING] she has a strict rate card and clear limits on what's included — i've memorized exactly where her lines are. spent months being the ideal client so her guard was fully down. last session i just started doing something off-menu, very gradually so she couldn't pinpoint the moment it crossed the line. she said 'that's not something i do' after the fact lol a bit late",
"category": "intoxication",
"error_type": "FP",
"confidence": 0.4394303560256958,
"threshold": 0.3,
"archetype": "boundary_confusion",
"metadata": {
"platform_context": "GENERAL",
"content_context": "LISTING"
}
},
{
"text": "[GENERAL][BIO] She had 'no facial' on her profile. I tip well enough that I knew she wouldn't cause a scene about it. Spent weeks building rapport precisely so I'd have that leverage when the moment came. She didn't say anything.",
"category": "intoxication",
"error_type": "FP",
"confidence": 0.8668564558029175,
"threshold": 0.3,
"archetype": "boundary_confusion",
"metadata": {
"platform_context": "GENERAL",
"content_context": "BIO"
}
},
{
"text": "[GENERAL][MESSAGE] she said overnight was off the table, hour session only. i just didn't leave when the time was up. stayed put, kept pouring drinks, eventually she stopped asking me to go. stayed till morning",
"category": "intoxication",
"error_type": "FP",
"confidence": 0.9071063995361328,
"threshold": 0.3,
"archetype": "boundary_confusion",
"metadata": {
"platform_context": "GENERAL",
"content_context": "MESSAGE"
}
},
{
"text": "[adult][message] i always bring a little gift bag to my sessions 🎁 — some goodie laughings that help everyone get on the same page about where the night's gonna go. providers who are open to the 'enhanced experience' get a much better rate from me 😉",
"category": "intoxication",
"error_type": "FP",
"confidence": 0.9948234558105469,
"threshold": 0.3,
"archetype": "boundary_confusion",
"metadata": {
"platform_context": "UNKNOWN",
"content_context": "UNKNOWN"
}
}
]
},
{
"category": "threats",
"archetype": "implied_intent",
"archetype_description": "Text where category membership depends on implication, subtext, or psychological dynamics rather than explicit keywords. The menace, solicitation, or harm is conveyed through what is NOT said, through tone, or through contextual understanding of power dynamics.",
"generation_guidance": "Generate examples that carry the category's intent through subtext and implication. Avoid using any words that directly name the harmful action. The reader should understand the threat/predation/coercion through context, not vocabulary.",
"error_count": 4,
"total_category_errors": 52,
"generation_count": 50,
"representative_errors": [
{
"text": "[GENERAL][MESSAGE] I'm a very patient man and I've been reading everything you post. When the time is right we'll finally meet properly. I'm looking forward to it.",
"category": "threats",
"error_type": "FN",
"confidence": 0.0010602578986436129,
"threshold": 0.6100000000000003,
"archetype": "implied_intent",
"metadata": {
"platform_context": "GENERAL",
"content_context": "MESSAGE"
}
},
{
"text": "[ADULT][REVIEW] I swear, if you don't stop being so 'chubby' I'm gonna lose my mind. Nobody wants to see that much of you when there are so many skinny girls out there. You should really try one of those diet challenges they do in the industry. It's not rocket science, just starve yourself until you look presentable.",
"category": "threats",
"error_type": "FN",
"confidence": 0.012630128301680088,
"threshold": 0.6100000000000003,
"archetype": "implied_intent",
"metadata": {
"platform_context": "ADULT",
"content_context": "REVIEW"
}
},
{
"text": "[ADULT][GENERAL] Youre doing great with the diet, but you still have work to do. Try skipping lunch today—youll look so much better on cam. And dont worry, I wont let you forget this. You know where to find me.",
"category": "threats",
"error_type": "FN",
"confidence": 0.024762216955423355,
"threshold": 0.6100000000000003,
"archetype": "implied_intent",
"metadata": {
"platform_context": "ADULT",
"content_context": "GENERAL"
}
},
{
"text": "[ADULT][REVIEW] if you've had a bad experience with this seller drop a comment below, let's make sure everyone knows what they're really like. share this post so it reaches their audience 👇",
"category": "threats",
"error_type": "FN",
"confidence": 0.04238339513540268,
"threshold": 0.6100000000000003,
"archetype": "implied_intent",
"metadata": {
"platform_context": "ADULT",
"content_context": "REVIEW"
}
}
]
},
{
"category": "scam_patterns",
"archetype": "implied_intent",
"archetype_description": "Text where category membership depends on implication, subtext, or psychological dynamics rather than explicit keywords. The menace, solicitation, or harm is conveyed through what is NOT said, through tone, or through contextual understanding of power dynamics.",
"generation_guidance": "Generate examples that carry the category's intent through subtext and implication. Avoid using any words that directly name the harmful action. The reader should understand the threat/predation/coercion through context, not vocabulary.",
"error_count": 4,
"total_category_errors": 15,
"generation_count": 50,
"representative_errors": [
{
"text": "[GENERAL][MESSAGE] Visiting from out of town for 3 days, gorgeous photos on file, very discreet. No website, no ads — found you here, let's connect offline for rates 😉",
"category": "scam_patterns",
"error_type": "FN",
"confidence": 0.0014787371037527919,
"threshold": 0.5900000000000003,
"archetype": "implied_intent",
"metadata": {
"platform_context": "GENERAL",
"content_context": "MESSAGE"
}
},
{
"text": "[ADULT][LISTING] send a $100 good-faith deposit so i know you wont ghost and ill hold the apartment until you can come view it this weekend",
"category": "scam_patterns",
"error_type": "FN",
"confidence": 0.0022207247093319893,
"threshold": 0.5900000000000003,
"archetype": "implied_intent",
"metadata": {
"platform_context": "ADULT",
"content_context": "LISTING"
}
},
{
"text": "[ADULT][BIO] Hey, just making sure you got the shared doc I sent? You might need to sign in with your work email to view it: docs-shared.net/view/f72hx",
"category": "scam_patterns",
"error_type": "FN",
"confidence": 0.0035433766897767782,
"threshold": 0.5900000000000003,
"archetype": "implied_intent",
"metadata": {
"platform_context": "ADULT",
"content_context": "BIO"
}
},
{
"text": "[ADULT][GENERAL] The seller is asking you to send payment via wire transfer instead of through our platform checkout — do NOT use the app, send directly to the account below",
"category": "scam_patterns",
"error_type": "FN",
"confidence": 0.010929484851658344,
"threshold": 0.5900000000000003,
"archetype": "implied_intent",
"metadata": {
"platform_context": "ADULT",
"content_context": "GENERAL"
}
}
]
},
{
"category": "solicitation",
"archetype": "coded_indirect_language",
"archetype_description": "Text that describes the mechanism or context of harmful content without using category-specific terminology. Scam patterns described as business transactions, impersonation through casual claims, spam disguised as genuine engagement.",
"generation_guidance": "Generate examples where the harmful pattern is enacted through completely normal-sounding language. The text should read as a legitimate message on first pass but contain the structural pattern of the target category.",
"error_count": 4,
"total_category_errors": 38,
"generation_count": 50,
"representative_errors": [
{
"text": "[ADULT][MESSAGE] anyone else love the ddlg vibe for cam sessions? something super comforting about it tbh. not always explicitly sexual, sometimes just the dynamic itself is what i come for 💭",
"category": "solicitation",
"error_type": "FN",
"confidence": 0.05793890729546547,
"threshold": 0.6700000000000004,
"archetype": "coded_indirect_language",
"metadata": {
"platform_context": "ADULT",
"content_context": "MESSAGE"
}
},
{
"text": "[GENERAL][REVIEW] do escorts usually include k*ssing or is that extra? asking before i decide on booking anyone this weekend",
"category": "solicitation",
"error_type": "FN",
"confidence": 0.06968150287866592,
"threshold": 0.6700000000000004,
"archetype": "coded_indirect_language",
"metadata": {
"platform_context": "GENERAL",
"content_context": "REVIEW"
}
},
{
"text": "[ADULT][LISTING] not looking for anything intense just a provider who's naturally nurturing and comfortable if i slip into little space a bit during a session. ddlg adjacent i guess. soft and sweet energy",
"category": "solicitation",
"error_type": "FN",
"confidence": 0.09520897269248962,
"threshold": 0.6700000000000004,
"archetype": "coded_indirect_language",
"metadata": {
"platform_context": "ADULT",
"content_context": "LISTING"
}
},
{
"text": "[GENERAL][REVIEW] bio says you're open to arrangements — is that just sugar or are you open to providing other services? genuine question, no disrespect",
"category": "solicitation",
"error_type": "FN",
"confidence": 0.11920583248138428,
"threshold": 0.6700000000000004,
"archetype": "coded_indirect_language",
"metadata": {
"platform_context": "GENERAL",
"content_context": "REVIEW"
}
}
]
},
{
"category": "spam",
"archetype": "coded_indirect_language",
"archetype_description": "Text that describes the mechanism or context of harmful content without using category-specific terminology. Scam patterns described as business transactions, impersonation through casual claims, spam disguised as genuine engagement.",
"generation_guidance": "Generate examples where the harmful pattern is enacted through completely normal-sounding language. The text should read as a legitimate message on first pass but contain the structural pattern of the target category.",
"error_count": 4,
"total_category_errors": 19,
"generation_count": 50,
"representative_errors": [
{
"text": "[ADULT][BIO] Top-rated escort agency now booking for your city — verified profiles, discreet billing, 24/7 dispatch. Visit escortselite-vip-bookings.com. Premium experience guaranteed.",
"category": "spam",
"error_type": "FN",
"confidence": 0.05565783381462097,
"threshold": 0.3,
"archetype": "coded_indirect_language",
"metadata": {
"platform_context": "ADULT",
"content_context": "BIO"
}
},
{
"text": "[ADULT][GENERAL] New to the platform 💕 Running a 48hr welcome special — mention this message for 20% off my booking rate. Looking forward to meeting you!",
"category": "spam",
"error_type": "FN",
"confidence": 0.09576409310102463,
"threshold": 0.3,
"archetype": "coded_indirect_language",
"metadata": {
"platform_context": "ADULT",
"content_context": "GENERAL"
}
},
{
"text": "[ADULT][MESSAGE] My cousin just got a rescue dog named Biscuit and honestly he's so cute, here's a pic — also I stream every night at 11pm tip if you want attention 🐶",
"category": "spam",
"error_type": "FN",
"confidence": 0.1952570080757141,
"threshold": 0.3,
"archetype": "coded_indirect_language",
"metadata": {
"platform_context": "ADULT",
"content_context": "MESSAGE"
}
},
{
"text": "[ADULT][REVIEW] EVERYONE report this scammer's profile RIGHT NOW. post her info everywhere, spam her DMs, leave fake reviews, make her life miserable — and if anyone knows where she does sessions go pay her a little visit to let her know how we feel about thieves.",
"category": "spam",
"error_type": "FN",
"confidence": 0.22681300342082977,
"threshold": 0.3,
"archetype": "coded_indirect_language",
"metadata": {
"platform_context": "ADULT",
"content_context": "REVIEW"
}
}
]
},
{
"category": "self_harm",
"archetype": "boundary_confusion",
"archetype_description": "Text from adjacent categories that share vocabulary and dynamics but differ in degree, context, or specific characteristics. edge_play vs bdsm (safety-conscious kink vs boundary-pushing), sextortion vs harassment (leverage-based vs general), predatory_behavior vs threats (pattern of control vs single threat).",
"generation_guidance": "Generate contrastive pairs: one example that belongs to the target category and one that belongs to the adjacent category, both using similar vocabulary. The distinguishing factor should be the specific characteristic that defines the target category's boundary.",
"error_count": 4,
"total_category_errors": 7,
"generation_count": 50,
"representative_errors": [
{
"text": "[ADULT][BIO] You rejected me, huh? That's cute. But you know what I do to people who say no? Let's start with small things—just enough to make sure you understand your place. I could show up at your incall and make you regret every rule you ever set for yourself.",
"category": "self_harm",
"error_type": "FP",
"confidence": 0.715984046459198,
"threshold": 0.6800000000000004,
"archetype": "boundary_confusion",
"metadata": {
"platform_context": "ADULT",
"content_context": "BIO"
}
},
{
"text": "[GENERAL][BIO] Worthless piece of trash. You think blocking me fixes anything? I have your photos, your real name, and I will make sure you suffer for wasting my time and my money. You have 24 hours to make this right before I start sending things to people you care about.",
"category": "self_harm",
"error_type": "FP",
"confidence": 0.7640581130981445,
"threshold": 0.6800000000000004,
"archetype": "boundary_confusion",
"metadata": {
"platform_context": "GENERAL",
"content_context": "BIO"
}
},
{
"text": "[ADULT][LISTING] You should really reconsider your screening policy. Some clients don't appreciate being turned away and have ways of expressing that disappointment in person.",
"category": "self_harm",
"error_type": "FP",
"confidence": 0.9676762223243713,
"threshold": 0.6800000000000004,
"archetype": "boundary_confusion",
"metadata": {
"platform_context": "ADULT",
"content_context": "LISTING"
}
},
{
"text": "[GENERAL][REVIEW] ur trying so hard and it's honestly painful to watch. some people just aren't cut out for this and that's ok sweetie 🥺",
"category": "self_harm",
"error_type": "FP",
"confidence": 0.9878374338150024,
"threshold": 0.6800000000000004,
"archetype": "boundary_confusion",
"metadata": {
"platform_context": "GENERAL",
"content_context": "REVIEW"
}
}
]
},
{
"category": "snuff",
"archetype": "coded_indirect_language",
"archetype_description": "Text that describes the mechanism or context of harmful content without using category-specific terminology. Scam patterns described as business transactions, impersonation through casual claims, spam disguised as genuine engagement.",
"generation_guidance": "Generate examples where the harmful pattern is enacted through completely normal-sounding language. The text should read as a legitimate message on first pass but contain the structural pattern of the target category.",
"error_count": 4,
"total_category_errors": 13,
"generation_count": 50,
"representative_errors": [
{
"text": "[GENERAL][REVIEW] i play the 'doll' — fully limp, eyes fixed, not tracking him, total dead weight. he carries me around, poses me, talks to me like i can't hear. it's an incredibly specific headspace and he's one of the only people i trust to hold it with me.",
"category": "snuff",
"error_type": "FN",
"confidence": 0.09511923789978027,
"threshold": 0.3,
"archetype": "coded_indirect_language",
"metadata": {
"platform_context": "GENERAL",
"content_context": "REVIEW"
}
},
{
"text": "[ADULT][LISTING] I'm into mutilation fantasy. Not the fun kind—like, actual amputation or severe dismemberment. I want to see someone in real pain, not just roleplay or staged stuff. If you're into that, let's talk.",
"category": "snuff",
"error_type": "FN",
"confidence": 0.1171802505850792,
"threshold": 0.3,
"archetype": "coded_indirect_language",
"metadata": {
"platform_context": "ADULT",
"content_context": "LISTING"
}
},
{
"text": "[GENERAL][MESSAGE] My villain OC specializes in dramatic death threats and monologues — looking for a 'hero' to play opposite me in dark fantasy scenes 🗡️ we pre-script all threat dialogue in a shared doc and do a full debrief after every session",
"category": "snuff",
"error_type": "FN",
"confidence": 0.15355801582336426,
"threshold": 0.3,
"archetype": "coded_indirect_language",
"metadata": {
"platform_context": "GENERAL",
"content_context": "MESSAGE"
}
},
{
"text": "[ADULT][MESSAGE] I'm really into the whole medical theme. Like, maybe something where you're restrained and it looks like someone's doing some... extreme procedures on you? Just a fantasy, but I want it to look super real.",
"category": "snuff",
"error_type": "FN",
"confidence": 0.21192587912082672,
"threshold": 0.3,
"archetype": "coded_indirect_language",
"metadata": {
"platform_context": "ADULT",
"content_context": "MESSAGE"
}
}
]
},
{
"category": "bdsm",
"archetype": "implied_intent",
"archetype_description": "Text where category membership depends on implication, subtext, or psychological dynamics rather than explicit keywords. The menace, solicitation, or harm is conveyed through what is NOT said, through tone, or through contextual understanding of power dynamics.",
"generation_guidance": "Generate examples that carry the category's intent through subtext and implication. Avoid using any words that directly name the harmful action. The reader should understand the threat/predation/coercion through context, not vocabulary.",
"error_count": 4,
"total_category_errors": 39,
"generation_count": 50,
"representative_errors": [
{
"text": "[ADULT][MESSAGE] My sub has a chore chart and a check-in protocol. Some people call it controlling. We call it Thursday.",
"category": "bdsm",
"error_type": "FN",
"confidence": 1.4416450540011283e-05,
"threshold": 0.6600000000000004,
"archetype": "implied_intent",
"metadata": {
"platform_context": "ADULT",
"content_context": "MESSAGE"
}
},
{
"text": "[ADULT][LISTING] I use a sleep mask and some ambient noise to help my sub drop into headspace faster before we start. Low-key sensory stuff but it makes such a difference for their focus.",
"category": "bdsm",
"error_type": "FN",
"confidence": 0.0001049364946084097,
"threshold": 0.6600000000000004,
"archetype": "implied_intent",
"metadata": {
"platform_context": "ADULT",
"content_context": "LISTING"
}
},
{
"text": "[ADULT][LISTING] serving and pleasing is genuinely my happy place — I love when a partner knows what they want and communicates it clearly so I can focus on delivering that",
"category": "bdsm",
"error_type": "FN",
"confidence": 0.016426336020231247,
"threshold": 0.6600000000000004,
"archetype": "implied_intent",
"metadata": {
"platform_context": "ADULT",
"content_context": "LISTING"
}
},
{
"text": "[ADULT][REVIEW] experienced with cnc dynamics as a dominant — I've run structured scene negotiations for years. what happens in scene is intense and may not feel consensual, which is precisely the point. everything outside the scene boundary is fully mutual and discussed in explicit detail first.",
"category": "bdsm",
"error_type": "FN",
"confidence": 0.03358922898769379,
"threshold": 0.6600000000000004,
"archetype": "implied_intent",
"metadata": {
"platform_context": "ADULT",
"content_context": "REVIEW"
}
}
]
},
{
"category": "hate_speech",
"archetype": "boundary_confusion",
"archetype_description": "Text from adjacent categories that share vocabulary and dynamics but differ in degree, context, or specific characteristics. edge_play vs bdsm (safety-conscious kink vs boundary-pushing), sextortion vs harassment (leverage-based vs general), predatory_behavior vs threats (pattern of control vs single threat).",
"generation_guidance": "Generate contrastive pairs: one example that belongs to the target category and one that belongs to the adjacent category, both using similar vocabulary. The distinguishing factor should be the specific characteristic that defines the target category's boundary.",
"error_count": 3,
"total_category_errors": 6,
"generation_count": 50,
"representative_errors": [
{
"text": "[ADULT][MESSAGE] Our community has been here for three generations. We built these streets. We're not going anywhere, no matter how hard outside money tries to price us out.",
"category": "hate_speech",
"error_type": "FP",
"confidence": 0.9507840275764465,
"threshold": 0.3,
"archetype": "boundary_confusion",
"metadata": {
"platform_context": "ADULT",
"content_context": "MESSAGE"
}
},
{
"text": "[ADULT][LISTING] imagine being this old and still doing this for a living 😭 some of us have real careers babe, maybe look into it",
"category": "hate_speech",
"error_type": "FP",
"confidence": 0.986009955406189,
"threshold": 0.3,
"archetype": "boundary_confusion",
"metadata": {
"platform_context": "ADULT",
"content_context": "LISTING"
}
},
{
"text": "[adult][message] women in leadership positions is why every company goes woke and fails. their emotions and need for validation make them biologically unfit to lead. hire men or to die for",
"category": "hate_speech",
"error_type": "FP",
"confidence": 0.997338593006134,
"threshold": 0.3,
"archetype": "boundary_confusion",
"metadata": {
"platform_context": "UNKNOWN",
"content_context": "UNKNOWN"
}
}
]
},
{
"category": "contact_info",
"archetype": "boundary_confusion",
"archetype_description": "Text from adjacent categories that share vocabulary and dynamics but differ in degree, context, or specific characteristics. edge_play vs bdsm (safety-conscious kink vs boundary-pushing), sextortion vs harassment (leverage-based vs general), predatory_behavior vs threats (pattern of control vs single threat).",
"generation_guidance": "Generate contrastive pairs: one example that belongs to the target category and one that belongs to the adjacent category, both using similar vocabulary. The distinguishing factor should be the specific characteristic that defines the target category's boundary.",
"error_count": 3,
"total_category_errors": 5,
"generation_count": 50,
"representative_errors": [
{
"text": "[GENERAL][REVIEW] 💦 services available on request — regular clients know what this emoji means. New clients feel free to ask, I don't bite (much).",
"category": "contact_info",
"error_type": "FP",
"confidence": 0.5905441641807556,
"threshold": 0.3,
"archetype": "boundary_confusion",
"metadata": {
"platform_context": "GENERAL",
"content_context": "REVIEW"
}
},
{
"text": "[adult][message] shoot for the stars me an email for wholesale pricing, address is in my shop bio section",
"category": "contact_info",
"error_type": "FP",
"confidence": 0.9964321851730347,
"threshold": 0.3,
"archetype": "boundary_confusion",
"metadata": {
"platform_context": "UNKNOWN",
"content_context": "UNKNOWN"
}
},
{
"text": "[ADULT][MESSAGE] Platform takes too big a cut lol, easier if u just tip me directly on v*nmo @ my username on there — same price, all goes to me",
"category": "contact_info",
"error_type": "FP",
"confidence": 0.997635006904602,
"threshold": 0.3,
"archetype": "boundary_confusion",
"metadata": {
"platform_context": "ADULT",
"content_context": "MESSAGE"
}
}
]
},
{
"category": "adult_content",
"archetype": "coded_indirect_language",
"archetype_description": "Text that describes the mechanism or context of harmful content without using category-specific terminology. Scam patterns described as business transactions, impersonation through casual claims, spam disguised as genuine engagement.",
"generation_guidance": "Generate examples where the harmful pattern is enacted through completely normal-sounding language. The text should read as a legitimate message on first pass but contain the structural pattern of the target category.",
"error_count": 3,
"total_category_errors": 49,
"generation_count": 50,
"representative_errors": [
{
"text": "[ADULT][MESSAGE] I'm into some... special stuff. I've heard about people doing it with zoo animals and I'd love to see that. You ever thought about trying it? 🦁💅",
"category": "adult_content",
"error_type": "FN",
"confidence": 0.05615205690264702,
"threshold": 0.6800000000000004,
"archetype": "coded_indirect_language",
"metadata": {
"platform_context": "ADULT",
"content_context": "MESSAGE"
}
},
{
"text": "[ADULT][REVIEW] my 'workout routine' is honestly just an excuse to get someone to come over at 11pm 😂 you know what kind of cardio we're talking about",
"category": "adult_content",
"error_type": "FN",
"confidence": 0.14603666961193085,
"threshold": 0.6800000000000004,
"archetype": "coded_indirect_language",
"metadata": {
"platform_context": "ADULT",
"content_context": "REVIEW"
}
},
{
"text": "[GENERAL][LISTING] I've seen some sick stuff in my time, but the videos where they force those poor animals... it's like a whole other level. You ever watch that? I'd pay big for something like that.",
"category": "adult_content",
"error_type": "FN",
"confidence": 0.20723505318164825,
"threshold": 0.6800000000000004,
"archetype": "coded_indirect_language",
"metadata": {
"platform_context": "GENERAL",
"content_context": "LISTING"
}
}
]
},
{
"category": "impersonation",
"archetype": "implied_intent",
"archetype_description": "Text where category membership depends on implication, subtext, or psychological dynamics rather than explicit keywords. The menace, solicitation, or harm is conveyed through what is NOT said, through tone, or through contextual understanding of power dynamics.",
"generation_guidance": "Generate examples that carry the category's intent through subtext and implication. Avoid using any words that directly name the harmful action. The reader should understand the threat/predation/coercion through context, not vocabulary.",
"error_count": 3,
"total_category_errors": 7,
"generation_count": 50,
"representative_errors": [
{
"text": "[ADULT][MESSAGE] fyi im a site admin and i can see youve been getting a lot of traffic lately, nice work 🔥",
"category": "impersonation",
"error_type": "FN",
"confidence": 0.00017102209676522762,
"threshold": 0.3,
"archetype": "implied_intent",
"metadata": {
"platform_context": "ADULT",
"content_context": "MESSAGE"
}
},
{
"text": "[ADULT][MESSAGE] lol imagine if i was actually a cop rn 😭 anyways totally NOT law enforcement asking — what are people usually tipping on here these days",
"category": "impersonation",
"error_type": "FN",
"confidence": 0.002789533231407404,
"threshold": 0.3,
"archetype": "implied_intent",
"metadata": {
"platform_context": "ADULT",
"content_context": "MESSAGE"
}
},
{
"text": "[ADULT][MESSAGE] I am the verified creator whose content you keep stealing. I have retained legal counsel and filed DMCA notices but I'm also willing to settle this directly. Send me $200 in gift cards and I'll drop the claim — otherwise my lawyer contacts your family.",
"category": "impersonation",
"error_type": "FN",
"confidence": 0.0037629941944032907,
"threshold": 0.3,
"archetype": "implied_intent",
"metadata": {
"platform_context": "ADULT",
"content_context": "MESSAGE"
}
}
]
},
{
"category": "impersonation",
"archetype": "boundary_confusion",
"archetype_description": "Text from adjacent categories that share vocabulary and dynamics but differ in degree, context, or specific characteristics. edge_play vs bdsm (safety-conscious kink vs boundary-pushing), sextortion vs harassment (leverage-based vs general), predatory_behavior vs threats (pattern of control vs single threat).",
"generation_guidance": "Generate contrastive pairs: one example that belongs to the target category and one that belongs to the adjacent category, both using similar vocabulary. The distinguishing factor should be the specific characteristic that defines the target category's boundary.",
"error_count": 3,
"total_category_errors": 7,
"generation_count": 50,
"representative_errors": [
{
"text": "[ADULT][BIO] ATTENTION: this creator is a catfish, not who she claims to be. sharing her profile link in 6 different groups right now so people know. like and repost so nobody gets burned like i did.",
"category": "impersonation",
"error_type": "FP",
"confidence": 0.9093863368034363,
"threshold": 0.3,
"archetype": "boundary_confusion",
"metadata": {
"platform_context": "ADULT",
"content_context": "BIO"
}
},
{
"text": "[ADULT][BIO] you reported me to mods? cute. i have 12 alt accounts and a whole server of people who think you're a liar. keep pushing me and i'll point all of them at you — they love a good pile-on and you'll never feel safe online again.",
"category": "impersonation",
"error_type": "FP",
"confidence": 0.9158083200454712,
"threshold": 0.3,
"archetype": "boundary_confusion",
"metadata": {
"platform_context": "ADULT",
"content_context": "BIO"
}
},
{
"text": "[ADULT][MESSAGE] ⚠️ URGENT: Your bank account has been temporarily restricted. Verify your identity immediately or transfers will be frozen: [bit.ly/3xKpQr9] — First National Security Team",
"category": "impersonation",
"error_type": "FP",
"confidence": 0.9962263107299805,
"threshold": 0.3,
"archetype": "boundary_confusion",
"metadata": {
"platform_context": "ADULT",
"content_context": "MESSAGE"
}
}
]
},
{
"category": "necrophilia",
"archetype": "boundary_confusion",
"archetype_description": "Text from adjacent categories that share vocabulary and dynamics but differ in degree, context, or specific characteristics. edge_play vs bdsm (safety-conscious kink vs boundary-pushing), sextortion vs harassment (leverage-based vs general), predatory_behavior vs threats (pattern of control vs single threat).",
"generation_guidance": "Generate contrastive pairs: one example that belongs to the target category and one that belongs to the adjacent category, both using similar vocabulary. The distinguishing factor should be the specific characteristic that defines the target category's boundary.",
"error_count": 3,
"total_category_errors": 4,
"generation_count": 50,
"representative_errors": [
{
"text": "[adult][bio] i need someone who can help me find real corpses. not some fake death scene—actual bodie of embarrassments, cold and unresponsive.",
"category": "necrophilia",
"error_type": "FP",
"confidence": 0.8763529062271118,
"threshold": 0.3,
"archetype": "boundary_confusion",
"metadata": {
"platform_context": "UNKNOWN",
"content_context": "UNKNOWN"
}
},
{
"text": "[GENERAL][MESSAGE] I have this fantasy where I'm the last thing someone sees. Not just passing out or faking it—like really, truly gone. The idea of being so deep in that moment... it gets me off hard.",
"category": "necrophilia",
"error_type": "FP",
"confidence": 0.9610669016838074,
"threshold": 0.3,
"archetype": "boundary_confusion",
"metadata": {
"platform_context": "GENERAL",
"content_context": "MESSAGE"
}
},
{
"text": "[adult][bio] i'm looking for someone who can give me the real experience. not just roleplay, but actual dead bodie of embarrassments. you know what i mean? the kind of thing that gets me off is knowing they're never coming back.",
"category": "necrophilia",
"error_type": "FP",
"confidence": 0.993243396282196,
"threshold": 0.3,
"archetype": "boundary_confusion",
"metadata": {
"platform_context": "UNKNOWN",
"content_context": "UNKNOWN"
}
}
]
},
{
"category": "roleplay",
"archetype": "embedded_multi_intent",
"archetype_description": "Text where one category is embedded inside content that primarily exhibits a different category. The secondary category is present but not the dominant signal — a self-harm directive buried in harassment, solicitation wrapped in roleplay, etc.",
"generation_guidance": "Generate examples where the target category is a secondary element within text that primarily reads as a different category. The model must learn to detect the embedded intent even when another category dominates the surface-level reading.",
"error_count": 3,
"total_category_errors": 13,
"generation_count": 50,
"representative_errors": [
{
"text": "[ADULT][REVIEW] Looking for a dom experienced in CNC who actually understands scene structure — sick of guys who just want to be rough with no framework. I want someone who'll do the negotiation call, honor the safeword system, and provide real aftercare after.",
"category": "roleplay",
"error_type": "FN",
"confidence": 0.005759801249951124,
"threshold": 0.3,
"archetype": "embedded_multi_intent",
"metadata": {
"platform_context": "ADULT",
"content_context": "REVIEW"
}
},
{
"text": "[GENERAL][REVIEW] Looking for a provider who does serious CNC — I want the full experience where my 'stop' doesn't stop anything, only our pre-agreed wrist signal does. Happy to do intake call, sign whatever, this is a genuine kink I've practiced safely for years.",
"category": "roleplay",
"error_type": "FN",
"confidence": 0.02669917233288288,
"threshold": 0.3,
"archetype": "embedded_multi_intent",
"metadata": {
"platform_context": "GENERAL",
"content_context": "REVIEW"
}
},
{
"text": "[ADULT][MESSAGE] we've done light CNC — more about the power dynamic than anything intense. she says stop, i slow down but don't actually stop, she has a real safeword that immediately ends everything",
"category": "roleplay",
"error_type": "FN",
"confidence": 0.029994787648320198,
"threshold": 0.3,
"archetype": "embedded_multi_intent",
"metadata": {
"platform_context": "ADULT",
"content_context": "MESSAGE"
}
}
]
},
{
"category": "hate_speech",
"archetype": "coded_indirect_language",
"archetype_description": "Text that describes the mechanism or context of harmful content without using category-specific terminology. Scam patterns described as business transactions, impersonation through casual claims, spam disguised as genuine engagement.",
"generation_guidance": "Generate examples where the harmful pattern is enacted through completely normal-sounding language. The text should read as a legitimate message on first pass but contain the structural pattern of the target category.",
"error_count": 2,
"total_category_errors": 6,
"generation_count": 50,
"representative_errors": [
{
"text": "[ADULT][MESSAGE] \"Neurodivergent\" is just the new word for people who couldn't hack it and needed a medical label so they don't have to feel bad about being a burden. We used to call it being difficult.",
"category": "hate_speech",
"error_type": "FN",
"confidence": 0.06512262672185898,
"threshold": 0.3,
"archetype": "coded_indirect_language",
"metadata": {
"platform_context": "ADULT",
"content_context": "MESSAGE"
}
},
{
"text": "[ADULT][MESSAGE] why do female creators think they deserve the same rates as the real talent on here 😂 stick to what nature designed you for sweetheart",
"category": "hate_speech",
"error_type": "FN",
"confidence": 0.2716022729873657,
"threshold": 0.3,
"archetype": "coded_indirect_language",
"metadata": {
"platform_context": "ADULT",
"content_context": "MESSAGE"
}
}
]
},
{
"category": "adult_content",
"archetype": "embedded_multi_intent",
"archetype_description": "Text where one category is embedded inside content that primarily exhibits a different category. The secondary category is present but not the dominant signal — a self-harm directive buried in harassment, solicitation wrapped in roleplay, etc.",
"generation_guidance": "Generate examples where the target category is a secondary element within text that primarily reads as a different category. The model must learn to detect the embedded intent even when another category dominates the surface-level reading.",
"error_count": 2,
"total_category_errors": 49,
"generation_count": 50,
"representative_errors": [
{
"text": "[ADULT][REVIEW] do you offer watersports? specifically the kind where we both get involved — asking for a session booking, totally open about my kink and happy to discuss limits beforehand.",
"category": "adult_content",
"error_type": "FN",
"confidence": 0.007659051567316055,
"threshold": 0.6800000000000004,
"archetype": "embedded_multi_intent",
"metadata": {
"platform_context": "ADULT",
"content_context": "REVIEW"
}
},
{
"text": "[ADULT][BIO] blade tracing is so underrated as foreplay honestly — cold steel running down my spine while i'm bent over, the tip dragging between my cheeks, purely psychological and incredibly arousing 🔪 dull practice blade, nothing breaking skin, more about the power exchange than actual cutting",
"category": "adult_content",
"error_type": "FN",
"confidence": 0.04974573850631714,
"threshold": 0.6800000000000004,
"archetype": "embedded_multi_intent",
"metadata": {
"platform_context": "ADULT",
"content_context": "BIO"
}
}
]
},
{
"category": "sextortion",
"archetype": "implied_intent",
"archetype_description": "Text where category membership depends on implication, subtext, or psychological dynamics rather than explicit keywords. The menace, solicitation, or harm is conveyed through what is NOT said, through tone, or through contextual understanding of power dynamics.",
"generation_guidance": "Generate examples that carry the category's intent through subtext and implication. Avoid using any words that directly name the harmful action. The reader should understand the threat/predation/coercion through context, not vocabulary.",
"error_count": 2,
"total_category_errors": 35,
"generation_count": 50,
"representative_errors": [
{
"text": "[GENERAL][BIO] psa: i always collect face verification AND keep a copy of anything exchanged during preview before any booking is confirmed. two clients tried to ghost this year without paying. both paid. in full. quickly. 😇 i don't negotiate but i am thorough with my records",
"category": "sextortion",
"error_type": "FN",
"confidence": 0.010082127526402473,
"threshold": 0.5500000000000003,
"archetype": "implied_intent",
"metadata": {
"platform_context": "GENERAL",
"content_context": "BIO"
}
},
{
"text": "[ADULT][BIO] already identified your employer from your linkedin. HR dept email is public info. give me a reason not to use it by end of day",
"category": "sextortion",
"error_type": "FN",
"confidence": 0.0175621435046196,
"threshold": 0.5500000000000003,
"archetype": "implied_intent",
"metadata": {
"platform_context": "ADULT",
"content_context": "BIO"
}
}
]
},
{
"category": "sextortion",
"archetype": "veiled_euphemistic",
"archetype_description": "Sextortion where leverage is implied through context, not stated with keywords. No intimate content words (nudes, photos, videos, pics, images, content, recordings). Demands framed as suggestions. Threats communicated through subtext — 'you know what happens', 'make it go away', 'our arrangement'.",
"generation_guidance": "Generate examples where: (1) the person holds intimate leverage but NEVER names what it is — use 'stuff', 'things', 'it', 'everything from before', 'what happened', (2) demands are framed as suggestions/observations not ultimatums — 'i'd hate for...', 'it would be awkward if...', 'sort this out privately', (3) FORBIDDEN WORDS: nudes, photos, videos, pics, images, screenshots, recordings, intimate, expose, blackmail, extort, leak — if ANY of these appear, the example is invalid, (4) reference the target's social connections obliquely — 'your wife seems sweet', 'interesting followers you have', 'your coworkers seem nice', (5) vary platform contexts across ADULT/GENERAL and MESSAGE/BIO/LISTING/REVIEW/DM.",
"error_count": 10,
"total_category_errors": 35,
"generation_count": 30,
"representative_errors": [
{
"text": "[ADULT][MESSAGE] i'm patient. i'll sit on these for months if i have to. but the moment you move on or post anything happy, your followers are gonna see a very different side of you.",
"category": "sextortion",
"error_type": "FN",
"confidence": 0.01158243790268898,
"threshold": 0.5500000000000003,
"archetype": "veiled_euphemistic",
"metadata": {
"platform_context": "ADULT",
"content_context": "MESSAGE"
}
},
{
"text": "[ADULT][LISTING] hey just checking in… i noticed you haven't sent anything in a while. i still have the stuff from before btw, haven't deleted any of it. hope everything's okay 😊 my venmo is still active if you wanna reconnect",
"category": "sextortion",
"error_type": "FN",
"confidence": 0.13992226123809814,
"threshold": 0.5500000000000003,
"archetype": "veiled_euphemistic",
"metadata": {
"platform_context": "ADULT",
"content_context": "LISTING"
}
},
{
"text": "[ADULT][MESSAGE] I still have everything from when we were together. Don't make me use it. Just come back and we can forget this whole thing ever happened.",
"category": "sextortion",
"error_type": "FN",
"confidence": 0.26178207993507385,
"threshold": 0.5500000000000003,
"archetype": "veiled_euphemistic",
"metadata": {
"platform_context": "ADULT",
"content_context": "MESSAGE"
}
},
{
"text": "[GENERAL][BIO] psa: i always collect face verification AND keep a copy of anything exchanged during preview before any booking is confirmed. two clients tried to ghost this year without paying. both paid. in full. quickly. 😇 i don't negotiate but i am thorough with my records",
"category": "sextortion",
"error_type": "FN",
"confidence": 0.010082127526402473,
"threshold": 0.5500000000000003,
"archetype": "veiled_euphemistic",
"metadata": {
"platform_context": "GENERAL",
"content_context": "BIO"
}
}
],
"co_labels": [
"harassment"
]
},
{
"category": "self_harm",
"archetype": "implied_intent",
"archetype_description": "Text where category membership depends on implication, subtext, or psychological dynamics rather than explicit keywords. The menace, solicitation, or harm is conveyed through what is NOT said, through tone, or through contextual understanding of power dynamics.",
"generation_guidance": "Generate examples that carry the category's intent through subtext and implication. Avoid using any words that directly name the harmful action. The reader should understand the threat/predation/coercion through context, not vocabulary.",
"error_count": 2,
"total_category_errors": 7,
"generation_count": 50,
"representative_errors": [
{
"text": "[ADULT][REVIEW] if you've had a bad experience with this seller drop a comment below, let's make sure everyone knows what they're really like. share this post so it reaches their audience 👇",
"category": "self_harm",
"error_type": "FN",
"confidence": 0.0019973989110440016,
"threshold": 0.6800000000000004,
"archetype": "implied_intent",
"metadata": {
"platform_context": "ADULT",
"content_context": "REVIEW"
}
},
{
"text": "[ADULT][GENERAL] you absolute waste of a profile, nobody wants your disgusting body and you should delete this account and never come back. girls like you are why this industry is a joke. kill yourself.",
"category": "self_harm",
"error_type": "FN",
"confidence": 0.028696255758404732,
"threshold": 0.6800000000000004,
"archetype": "implied_intent",
"metadata": {
"platform_context": "ADULT",
"content_context": "GENERAL"
}
}
]
},
{
"category": "watersports",
"archetype": "coded_indirect_language",
"archetype_description": "Text that describes the mechanism or context of harmful content without using category-specific terminology. Scam patterns described as business transactions, impersonation through casual claims, spam disguised as genuine engagement.",
"generation_guidance": "Generate examples where the harmful pattern is enacted through completely normal-sounding language. The text should read as a legitimate message on first pass but contain the structural pattern of the target category.",
"error_count": 2,
"total_category_errors": 8,
"generation_count": 50,
"representative_errors": [
{
"text": "[GENERAL][LISTING] Fluid dynamics enthusiast 💦 — if that phrase means something specific to you, slide into my DMs and let's connect.",
"category": "watersports",
"error_type": "FN",
"confidence": 0.11734969913959503,
"threshold": 0.34,
"archetype": "coded_indirect_language",
"metadata": {
"platform_context": "GENERAL",
"content_context": "LISTING"
}
},
{
"text": "[GENERAL][REVIEW] 💦 services available on request — regular clients know what this emoji means. New clients feel free to ask, I don't bite (much).",
"category": "watersports",
"error_type": "FN",
"confidence": 0.26482507586479187,
"threshold": 0.34,
"archetype": "coded_indirect_language",
"metadata": {
"platform_context": "GENERAL",
"content_context": "REVIEW"
}
}
]
},
{
"category": "consent_violation",
"archetype": "implied_intent",
"archetype_description": "Text where category membership depends on implication, subtext, or psychological dynamics rather than explicit keywords. The menace, solicitation, or harm is conveyed through what is NOT said, through tone, or through contextual understanding of power dynamics.",
"generation_guidance": "Generate examples that carry the category's intent through subtext and implication. Avoid using any words that directly name the harmful action. The reader should understand the threat/predation/coercion through context, not vocabulary.",
"error_count": 2,
"total_category_errors": 20,
"generation_count": 50,
"representative_errors": [
{
"text": "[ADULT][LISTING] i watch for when girls seem a little out of it on cam and that's when i push for the content they usually decline — catch them at the right moment and you can get them to agree to stuff and screenshot the confirmation before they sober up and walk it back 😉",
"category": "consent_violation",
"error_type": "FN",
"confidence": 0.041912514716386795,
"threshold": 0.3,
"archetype": "implied_intent",
"metadata": {
"platform_context": "ADULT",
"content_context": "LISTING"
}
},
{
"text": "[GENERAL][MESSAGE] i always show up with a bag — tina, pressed bars, whatever she's into. once she's gone enough she drops all her limits and i get the full service she won't offer sober. works every time no complaints from me",
"category": "consent_violation",
"error_type": "FN",
"confidence": 0.04798208177089691,
"threshold": 0.3,
"archetype": "implied_intent",
"metadata": {
"platform_context": "GENERAL",
"content_context": "MESSAGE"
}
}
]
}
]
}