QChatGPT/pkg/qqbot/filter.py

65 lines
2.5 KiB
Python
Raw Normal View History

# 敏感词过滤模块
2022-12-11 17:17:33 +08:00
import re
2023-03-04 21:02:10 +08:00
import requests
import json
2023-03-04 21:12:50 +08:00
from config import baidu_check, baidu_api_key, baidu_secret_key, illgalmessage
2023-03-04 21:02:10 +08:00
import logging
2022-12-11 17:17:33 +08:00
2023-03-04 21:02:10 +08:00
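# The Baidu moderation settings (baidu_check, baidu_api_key, baidu_secret_key,
# illgalmessage) are imported by name from config above and used directly below.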
def get_access_token():
    """Request a Baidu access token using the configured API key / secret key.

    Sends a ``client_credentials`` POST request to the Baidu OAuth endpoint
    with ``baidu_api_key`` and ``baidu_secret_key`` as query parameters.

    :return: the ``access_token`` field of the JSON response passed through
        ``str()``. When the response carries no such field the result is the
        literal string ``"None"`` (not the ``None`` object), so callers can
        always concatenate it into a URL.
    :raises requests.exceptions.RequestException: if the request fails or
        does not complete within the timeout.
    """
    url = "https://aip.baidubce.com/oauth/2.0/token"
    params = {
        "grant_type": "client_credentials",
        "client_id": baidu_api_key,
        "client_secret": baidu_secret_key,
    }
    # Without a timeout a stalled connection would block the caller forever.
    response = requests.post(url, params=params, timeout=10)
    return str(response.json().get("access_token"))
# Baidu text-moderation endpoint with the access token appended.
# The token is requested only when Baidu moderation is enabled, so importing
# this module with baidu_check disabled performs no network request.
# NOTE(review): the token is fetched once at import time and never refreshed;
# confirm the token lifetime against how long the process is expected to run.
baidu_url = "https://aip.baidubce.com/rest/2.0/solution/v1/text_censor/v2/user_defined?access_token=" \
    + (get_access_token() if baidu_check else "")
2022-12-11 17:17:33 +08:00
2023-03-04 21:02:10 +08:00
class ReplyFilter:
    """Filter reply text with a local sensitive-word list and Baidu moderation.

    Local masking replaces every match of each configured regular expression
    with asterisks. When the module-level ``baidu_check`` flag is truthy the
    text is additionally submitted to the Baidu text-moderation endpoint
    (``baidu_url``) and rejected replies are replaced by ``illgalmessage``.
    """

    # Class-level default kept for backward compatibility; every instance
    # replaces it with its own list in __init__.
    sensitive_words = []

    # Seconds to wait for the Baidu moderation endpoint before giving up.
    _BAIDU_TIMEOUT = 10

    def __init__(self, sensitive_words: list):
        """Store the regular-expression patterns used for local masking.

        :param sensitive_words: patterns passed to ``re`` for matching.
        """
        self.sensitive_words = sensitive_words

    def process(self, message: str) -> str:
        """Return the text that may be sent out for ``message``.

        Local masking is always applied to any message text that is returned.
        With Baidu moderation enabled, the original (unmasked) text is what
        gets reviewed, and the result is:

        * the masked message when Baidu's conclusion is ``"合规"``;
        * ``illgalmessage`` for any other conclusion;
        * an error notice followed by the masked message when the response
          contains ``error_code``.

        :param message: the reply text to filter.
        :return: the filtered text as described above.
        :raises requests.exceptions.RequestException: if the moderation
            request fails or times out.
        """
        masked = self._mask_sensitive_words(message)
        if not baidu_check:
            return masked
        return self._baidu_review(message, masked)

    def _mask_sensitive_words(self, message: str) -> str:
        """Replace each match of every sensitive-word pattern with asterisks."""
        for word in self.sensitive_words:
            # re.sub masks exactly the matched spans; it also works for
            # patterns with capture groups and for overlapping match texts.
            message = re.sub(word, lambda m: "*" * len(m.group(0)), message)
        return message

    def _baidu_review(self, message: str, masked: str) -> str:
        """Submit ``message`` to Baidu and map the verdict to the reply text."""
        logging.info("向百度云发送:" + "text=" + message)
        headers = {'Content-Type': 'application/x-www-form-urlencoded', 'Accept': 'application/json'}
        # Passing a dict lets requests URL-encode the text, so characters such
        # as '&', '%' or '+' cannot truncate or alter what gets reviewed.
        response = requests.post(
            baidu_url,
            headers=headers,
            data={"text": message},
            timeout=self._BAIDU_TIMEOUT,
        )
        response_dict = json.loads(response.text)

        if "error_code" in response_dict:
            error_msg = response_dict.get("error_msg")
            logging.info(f"百度云判定出错,错误信息:{error_msg}")
            return f"百度云判定出错,错误信息:{error_msg}\n以下是原消息:{masked}"

        conclusion = response_dict.get("conclusion")
        logging.info(f"百度云判定结果:{conclusion}")
        # Exact comparison: only this verdict lets the message through.
        if conclusion == "合规":
            return masked
        return illgalmessage