1
This commit is contained in:
@@ -98,9 +98,16 @@ private String cleanForbiddenPhrases(String text) {
|
|||||||
return text;
|
return text;
|
||||||
}
|
}
|
||||||
String cleaned = text;
|
String cleaned = text;
|
||||||
|
|
||||||
|
// 新增:清理"咨询客服立减""咨询客服""客服"及变体(含空格)
|
||||||
|
// 优先处理长组合,避免被拆分后遗漏
|
||||||
|
cleaned = cleaned.replaceAll("咨询\\s*客服\\s*立减", ""); // 匹配"咨询客服立减""咨询 客服 立减"等
|
||||||
|
cleaned = cleaned.replaceAll("咨询\\s*客服", ""); // 匹配"咨询客服""咨询 客服"等
|
||||||
|
cleaned = cleaned.replaceAll("客\\s*服", ""); // 匹配"客服""客 服"等
|
||||||
|
|
||||||
// 一、政策补贴及特殊渠道类(长组合优先)
|
// 一、政策补贴及特殊渠道类(长组合优先)
|
||||||
cleaned = cleaned.replaceAll("咨询客服领\\s*国补", "");
|
cleaned = cleaned.replaceAll("咨询客服领\\s*国补", "");
|
||||||
cleaned = cleaned.replaceAll("政府\\s*补贴", ""); // 匹配"政府 补贴"等带空格的情况
|
cleaned = cleaned.replaceAll("政府\\s*补贴", "");
|
||||||
cleaned = cleaned.replaceAll("购车\\s*补贴", "");
|
cleaned = cleaned.replaceAll("购车\\s*补贴", "");
|
||||||
cleaned = cleaned.replaceAll("家电\\s*下乡", "");
|
cleaned = cleaned.replaceAll("家电\\s*下乡", "");
|
||||||
cleaned = cleaned.replaceAll("内部\\s*渠道", "");
|
cleaned = cleaned.replaceAll("内部\\s*渠道", "");
|
||||||
@@ -128,15 +135,15 @@ private String cleanForbiddenPhrases(String text) {
|
|||||||
cleaned = cleaned.replaceAll("原单", "");
|
cleaned = cleaned.replaceAll("原单", "");
|
||||||
cleaned = cleaned.replaceAll("尾单", "");
|
cleaned = cleaned.replaceAll("尾单", "");
|
||||||
cleaned = cleaned.replaceAll("工厂\\s*货", "");
|
cleaned = cleaned.replaceAll("工厂\\s*货", "");
|
||||||
cleaned = cleaned.replaceAll("专柜\\s*验货", ""); // 无授权时违规
|
cleaned = cleaned.replaceAll("专柜\\s*验货", "");
|
||||||
|
|
||||||
// 四、线下导流及规避监管类(多变体覆盖)
|
// 四、线下导流及规避监管类(多变体覆盖)
|
||||||
cleaned = cleaned.replaceAll("微\\s*信", ""); // 匹配"微信""微 信"
|
cleaned = cleaned.replaceAll("微\\s*信", "");
|
||||||
cleaned = cleaned.replaceAll("薇\\s*信", ""); // 谐音变体
|
cleaned = cleaned.replaceAll("薇\\s*信", "");
|
||||||
cleaned = cleaned.replaceAll("V我", "");
|
cleaned = cleaned.replaceAll("V我", "");
|
||||||
cleaned = cleaned.replaceAll("加\\s*卫星", "");
|
cleaned = cleaned.replaceAll("加\\s*卫星", "");
|
||||||
cleaned = cleaned.replaceAll("QQ", "");
|
cleaned = cleaned.replaceAll("QQ", "");
|
||||||
cleaned = cleaned.replaceAll("扣扣", ""); // 谐音
|
cleaned = cleaned.replaceAll("扣扣", "");
|
||||||
cleaned = cleaned.replaceAll("手机\\s*号", "");
|
cleaned = cleaned.replaceAll("手机\\s*号", "");
|
||||||
cleaned = cleaned.replaceAll("淘宝\\s*链接", "");
|
cleaned = cleaned.replaceAll("淘宝\\s*链接", "");
|
||||||
cleaned = cleaned.replaceAll("拼多\\s*多", "");
|
cleaned = cleaned.replaceAll("拼多\\s*多", "");
|
||||||
@@ -146,7 +153,7 @@ private String cleanForbiddenPhrases(String text) {
|
|||||||
cleaned = cleaned.replaceAll("滚", "");
|
cleaned = cleaned.replaceAll("滚", "");
|
||||||
cleaned = cleaned.replaceAll("垃圾", "");
|
cleaned = cleaned.replaceAll("垃圾", "");
|
||||||
cleaned = cleaned.replaceAll("笨蛋", "");
|
cleaned = cleaned.replaceAll("笨蛋", "");
|
||||||
cleaned = cleaned.replaceAll("SB", ""); // 单独出现时清理(避免误判可后续加上下文校验)
|
cleaned = cleaned.replaceAll("SB", "");
|
||||||
cleaned = cleaned.replaceAll("原味", "");
|
cleaned = cleaned.replaceAll("原味", "");
|
||||||
cleaned = cleaned.replaceAll("情趣", "");
|
cleaned = cleaned.replaceAll("情趣", "");
|
||||||
|
|
||||||
|
|||||||
Reference in New Issue
Block a user