PyWxDump/pywxdump/dbpreprocess/parsingMicroMsg.py

268 lines
11 KiB
Python
Raw Normal View History

2024-04-16 23:16:22 +08:00
# -*- coding: utf-8 -*-#
# -------------------------------------------------------------------------------
# Name: parsingMicroMsg.py
# Description: Parse contacts, chat rooms, recent chats and contact labels from the MicroMsg database.
# Author: xaoyaoo
# Date: 2024/04/15
# -------------------------------------------------------------------------------
2024-04-19 22:48:37 +08:00
import logging
2024-04-16 23:16:22 +08:00
from .dbbase import DatabaseBase
2024-04-19 16:16:32 +08:00
from .utils import timestamp2str, bytes2str
import blackboxprotobuf
2024-04-16 23:16:22 +08:00
# Parser for the MicroMsg database: contacts, chat rooms, recent chats and contact labels.
class ParsingMicroMsg(DatabaseBase):
# Name tag for this database kind; presumably consumed by DatabaseBase - TODO confirm.
_class_name = "MicroMsg"
2024-04-16 23:16:22 +08:00
def __init__(self, db_path):
    """
    Create a parser for one database.

    :param db_path: location of the database; passed unchanged to the
                    parent class initialiser
    """
    super(ParsingMicroMsg, self).__init__(db_path)
2024-04-19 16:16:32 +08:00
def get_BytesExtra(self, BytesExtra):
    """
    Decode a protobuf blob with blackboxprotobuf.

    :param BytesExtra: raw payload; only ``bytes`` objects are accepted
    :return: the decoded message returned by
             ``blackboxprotobuf.decode_message``, or None when the input is
             not ``bytes`` or decoding raises
    """
    # isinstance() is already False for None, so one check covers both guards.
    if not isinstance(BytesExtra, bytes):
        return None
    try:
        # decode_message returns a pair; only the first element is handed back.
        message, _typedef = blackboxprotobuf.decode_message(BytesExtra)
    except Exception:
        # Best effort: an undecodable blob is reported as "no data".
        return None
    return message
2024-06-12 00:35:03 +08:00
def get_ExtraBuf(self, ExtraBuf: bytes):
    """
    Parse the ExtraBuf blob of the contact table into named fields.

    Every known field is located by searching the buffer for its marker
    bytes. The single byte that follows the marker is a type tag which
    selects how the value is read:

    * ``0x04`` - 4-byte little-endian integer
    * ``0x18`` - 4-byte little-endian length, then text decoded as UTF-16
    * ``0x17`` - 4-byte little-endian length, then text decoded as UTF-8
    * ``0x05`` - 8 raw bytes, returned as a ``0x``-prefixed hex string

    :param ExtraBuf: raw ExtraBuf bytes
    :return: dict mapping field name to value. A field whose marker is
             absent, or whose type tag is not one of the four above, maps
             to "". None is returned when ExtraBuf is empty or parsing
             raises.
    """
    if not ExtraBuf:
        return None

    # Marker bytes (hex) -> name of the field in the returned dict.
    # NOTE(review): 'A4D9024A', 'E2EAA8D1' and '1D025BBF' all map to the empty
    # name, so they overwrite each other and only the last one survives under
    # the "" key. The intended names are not visible here - TODO confirm.
    buf_dict = {
        'DDF32683': '0', '74752C06': '性别[1男2女]', '88E28FCE': '2', '761A1D2D': '3', '0263A0CB': '4',
        '0451FF12': '5',
        '228C66A8': '6', '46CF10C4': '个性签名', 'A4D9024A': '', 'E2EAA8D1': '', '1D025BBF': '',
        '4D6C4570': '11',
        'F917BCC0': '公司名称', '759378AD': '手机号', '4335DFDD': '14', 'DE4CDAEB': '15', 'A72BC20A': '16',
        '069FED52': '17',
        '9B0F4299': '18', '3D641E22': '19', '1249822C': '20', '4EB96D85': '企微属性', 'B4F73ACB': '22',
        '0959EB92': '23',
        '3CF4A315': '24', 'C9477AC60201E44CD0E8': '26', 'B7ACF0F5': '28', '57A7B5A8': '29',
        '81AE19B4': '朋友圈背景',
        '695F3170': '31', 'FB083DD9': '32', '0240E37F': '33', '315D02A3': '34', '7DEC0BC3': '35',
        '0E719F13': '备注图片',
        '16791C90': '37'
    }
    try:
        rdata = {}
        for marker_hex, field_name in buf_dict.items():
            marker = bytes.fromhex(marker_hex)
            offset = ExtraBuf.find(marker)
            # Default used both for "marker not found" and "unknown type tag",
            # so every known field name is always present in the result.
            value = ""
            if offset != -1:
                offset += len(marker)
                type_id = ExtraBuf[offset: offset + 1]
                offset += 1
                if type_id == b"\x04":
                    value = int.from_bytes(ExtraBuf[offset: offset + 4], "little")
                elif type_id == b"\x18":
                    length = int.from_bytes(ExtraBuf[offset: offset + 4], "little")
                    value = ExtraBuf[offset + 4: offset + 4 + length].decode("utf-16").rstrip("\x00")
                elif type_id == b"\x17":
                    length = int.from_bytes(ExtraBuf[offset: offset + 4], "little")
                    value = ExtraBuf[offset + 4: offset + 4 + length].decode("utf-8").rstrip("\x00")
                elif type_id == b"\x05":
                    value = f"0x{ExtraBuf[offset: offset + 8].hex()}"
            rdata[field_name] = value
        return rdata
    except Exception as e:
        # Report through logging (as the rest of the module does) instead of
        # printing to stdout; the caller still just sees None.
        logging.error(f'解析错误:\n{e}')
        return None
2024-04-19 16:16:32 +08:00
def ChatRoom_RoomData(self, RoomData):
    """
    Decode the RoomData blob of a chat room (mainly wxid and the matching
    nickname, per the original author's note).

    :param RoomData: raw RoomData bytes; any other type is rejected
    :return: the structure produced by ``get_BytesExtra`` after it has been
             passed through ``bytes2str``, or None when the input is not
             ``bytes`` or any step raises
    """
    # A single isinstance() check also rejects None.
    if not isinstance(RoomData, bytes):
        return None
    try:
        decoded = self.get_BytesExtra(RoomData)
        # The return value is not used, so bytes2str presumably converts the
        # structure in place - TODO confirm against utils.bytes2str.
        bytes2str(decoded)
    except Exception:
        return None
    return decoded
def wxid2userinfo(self, wxid):
    """
    Look up contact details for one or several WeChat ids.

    :param wxid: a single id (str) or a list of ids
    :return: dict keyed by wxid. Each value is a dict with the keys wxid,
             nickname, remark, account, describe, headImgUrl and
             LabelIDList (a tuple of label id strings). An empty dict is
             returned for any other argument type or when the query yields
             nothing.
    """
    if isinstance(wxid, str):
        wxid = [wxid]
    elif not isinstance(wxid, list):
        return {}

    # The ids are embedded as SQL string literals, so every single quote is
    # doubled; otherwise an id containing ' would break the statement or
    # allow injection.
    id_literals = "','".join(str(item).replace("'", "''") for item in wxid)
    id_literals = f"'{id_literals}'"

    # Contacts whose UserName is one of the requested ids. This is an inner
    # join, so a contact without a ContactHeadImgUrl row is not returned.
    sql = ("SELECT A.UserName, A.NickName, A.Remark,A.Alias,A.Reserved6,B.bigHeadImgUrl,A.LabelIDList "
           "FROM Contact A,ContactHeadImgUrl B "
           f"WHERE A.UserName = B.usrName AND A.UserName in ({id_literals}) "
           "ORDER BY NickName ASC;")
    result = self.execute_sql(sql)
    if not result:
        return {}

    users = {}
    for row in result:
        # Columns: wxid, nickname, remark, alias, description (Reserved6),
        # avatar URL, comma-separated label ids.
        username, nickname, remark, Alias, describe, headImgUrl, LabelIDList = row
        LabelIDList = LabelIDList.split(",") if LabelIDList else []
        users[username] = {"wxid": username, "nickname": nickname, "remark": remark, "account": Alias,
                           "describe": describe, "headImgUrl": headImgUrl, "LabelIDList": tuple(LabelIDList)}
    return users
2024-04-16 23:16:22 +08:00
def user_list(self, word=None):
    """
    Return the contact list, optionally filtered by a keyword.

    :param word: optional keyword matched as a substring against UserName,
                 NickName, Remark, Alias, QuanPin and PYInitial (so pinyin
                 input works); no filter is applied when falsy
    :return: list of dicts with the keys wxid, nickname, remark, account,
             describe, headImgUrl ("" when missing) and LabelIDList (a
             tuple of label id strings); an empty list when the query
             yields nothing
    """
    select_sql = (
        "SELECT A.UserName, A.NickName, A.Remark,A.Alias,A.Reserved6,B.bigHeadImgUrl,A.LabelIDList "
        "FROM Contact A left join ContactHeadImgUrl B on A.UserName==B.usrName ")
    where_sql = ""
    if word:
        # The keyword is embedded in SQL string literals: double single
        # quotes so it cannot terminate the literal. '%' and '_' inside the
        # keyword still act as LIKE wildcards, as before.
        safe_word = str(word).replace("'", "''")
        where_sql = (f"where "
                     f"A.UserName LIKE '%{safe_word}%' "
                     f"OR A.NickName LIKE '%{safe_word}%' "
                     f"OR A.Remark LIKE '%{safe_word}%' "
                     f"OR A.Alias LIKE '%{safe_word}%' "
                     f"OR A.QuanPin LIKE LOWER('%{safe_word}%') "
                     f"OR LOWER(A.PYInitial) LIKE LOWER('%{safe_word}%') ")
    sql = select_sql + where_sql + "ORDER BY A.NickName DESC;"

    result = self.execute_sql(sql)
    if not result:
        return []

    users = []
    for row in result:
        # Columns: wxid, nickname, remark, alias, description (Reserved6),
        # avatar URL, comma-separated label ids.
        username, nickname, remark, Alias, describe, headImgUrl, LabelIDList = row
        LabelIDList = LabelIDList.split(",") if LabelIDList else []
        users.append(
            {"wxid": username, "nickname": nickname, "remark": remark, "account": Alias,
             "describe": describe, "headImgUrl": headImgUrl if headImgUrl else "",
             "LabelIDList": tuple(LabelIDList)})
    return users
def user_list_by_label(self, label_id):
    """
    Return the contacts that carry a given label.

    :param label_id: label id (str or int)
    :return: list of dicts with the keys wxid, nickname, remark, account,
             describe, headImgUrl ("" when missing) and LabelIDList (a
             tuple of label id strings); an empty list when the query
             yields nothing
    """
    label_text = str(label_id)
    wanted = label_text.strip()
    # Double single quotes so the id cannot terminate the SQL string literal.
    safe_label = label_text.replace("'", "''")
    sql = (
        "SELECT A.UserName, A.NickName, A.Remark,A.Alias,A.Reserved6,B.bigHeadImgUrl,A.LabelIDList "
        "FROM Contact A left join ContactHeadImgUrl B on A.UserName==B.usrName "
        f"where A.LabelIDList LIKE '%{safe_label}%' "
        "ORDER BY A.NickName DESC;")
    result = self.execute_sql(sql)
    if not result:
        return []

    users = []
    for row in result:
        # Columns: wxid, nickname, remark, alias, description (Reserved6),
        # avatar URL, comma-separated label ids.
        username, nickname, remark, Alias, describe, headImgUrl, LabelIDList = row
        LabelIDList = LabelIDList.split(",") if LabelIDList else []
        # The LIKE above is only a substring pre-filter: label 1 would also
        # match "11" or "21,3". Keep the row only if the id is really one of
        # the comma-separated entries.
        if wanted and wanted not in {part.strip() for part in LabelIDList}:
            continue
        users.append(
            {"wxid": username, "nickname": nickname, "remark": remark, "account": Alias,
             "describe": describe, "headImgUrl": headImgUrl if headImgUrl else "",
             "LabelIDList": tuple(LabelIDList)})
    return users
def recent_chat_wxid(self):
    """
    List the entries of the ChatInfo table, most recently read first.

    :return: list of dicts with the keys wxid, LastReadedCreateTime (the
             column value divided by 1000 and formatted by
             ``timestamp2str``, or None when the value is falsy) and
             LastReadedSvrId; an empty list when the query yields nothing
    """
    rows = self.execute_sql(
        "SELECT C.Username, C.LastReadedCreateTime,C.LastReadedSvrId "
        "FROM ChatInfo C "
        "ORDER BY C.LastReadedCreateTime DESC;")
    if not rows:
        return []
    return [
        {
            "wxid": name,
            # Divided by 1000 before formatting - presumably a millisecond
            # timestamp; TODO confirm.
            "LastReadedCreateTime": timestamp2str(read_time / 1000) if read_time else None,
            "LastReadedSvrId": svr_id,
        }
        for name, read_time, svr_id in rows
    ]
2024-04-19 16:16:32 +08:00
def chatroom_list(self, roomwxid=None):
    """
    Return the chat rooms, optionally filtered by room id.

    :param roomwxid: optional text matched as a substring against
                     ChatRoomName; no filter is applied when falsy
    :return: list of dicts with the keys ChatRoomName, UserNameList (list),
             DisplayNameList (list), Announcement, AnnouncementEditor and
             wxid2remark (dict built from the decoded RoomData: field '1'
             -> field '2'); an empty list when the query yields nothing
    """
    sql = (
        "SELECT A.ChatRoomName,A.UserNameList, A.DisplayNameList,A.RoomData, B.Announcement,B.AnnouncementEditor "
        "FROM ChatRoom A,ChatRoomInfo B "
        "where A.ChatRoomName==B.ChatRoomName ")
    if roomwxid:
        # Double single quotes so the value cannot terminate the SQL string literal.
        safe_room = str(roomwxid).replace("'", "''")
        sql += f"and A.ChatRoomName LIKE '%{safe_room}%' "
    sql += "ORDER BY A.ChatRoomName ASC;"

    result = self.execute_sql(sql)
    if not result:
        return []

    rooms = []
    for row in result:
        ChatRoomName, UserNameList, DisplayNameList, RoomData, Announcement, AnnouncementEditor = row
        # A NULL column must not abort the whole listing; treat it as "no entries".
        # NOTE(review): the separator is the two-character text "^G" as written
        # in the source - confirm it is not meant to be the control char \x07.
        UserNameList = UserNameList.split("^G") if UserNameList is not None else []
        DisplayNameList = DisplayNameList.split("^G") if DisplayNameList is not None else []

        wxid2remark = {}
        RoomData = self.ChatRoom_RoomData(RoomData)
        if RoomData:
            # Flatten every list-valued field of the decoded message; the
            # entries of interest are dicts holding '1' (str) and '2'.
            entries = []
            for value in RoomData.values():
                if isinstance(value, list):
                    entries += value
            for i in entries:
                try:
                    if isinstance(i, dict) and isinstance(i.get('1'), str) and i.get('2'):
                        wxid2remark[i['1']] = i["2"]
                except Exception as e:
                    logging.error(f"wxid2remark: ChatRoomName:{ChatRoomName}, {i} error:{e}")
        rooms.append(
            {"ChatRoomName": ChatRoomName, "UserNameList": UserNameList, "DisplayNameList": DisplayNameList,
             "Announcement": Announcement, "AnnouncementEditor": AnnouncementEditor, "wxid2remark": wxid2remark})
    return rooms
2024-06-12 00:35:03 +08:00
def labels_dict(self, id_is_key=True):
    """
    Read the contact labels as a mapping.

    :param id_is_key: when True (default) the result maps LabelId ->
                      LabelName; when False it maps LabelName -> LabelId
    :return: dict of labels; an empty dict when the query yields nothing
    """
    sql = "SELECT LabelId, LabelName FROM ContactLabel ORDER BY LabelName ASC;"
    result = self.execute_sql(sql)
    if not result:
        # Always hand back a dict so callers can use .get()/.items()
        # without checking the type first.
        return {}
    if id_is_key:
        return {label_id: label_name for label_id, label_name in result}
    return {label_name: label_id for label_id, label_name in result}