mirror of
https://github.com/hicccc77/WeFlow.git
synced 2026-03-24 23:06:51 +00:00
457 lines
16 KiB
TypeScript
457 lines
16 KiB
TypeScript
import { parentPort } from 'worker_threads'
|
|
import { wcdbService } from './wcdbService'
|
|
|
|
export interface DualReportMessage {
|
|
content: string
|
|
isSentByMe: boolean
|
|
createTime: number
|
|
createTimeStr: string
|
|
}
|
|
|
|
export interface DualReportFirstChat {
|
|
createTime: number
|
|
createTimeStr: string
|
|
content: string
|
|
isSentByMe: boolean
|
|
senderUsername?: string
|
|
}
|
|
|
|
export interface DualReportStats {
|
|
totalMessages: number
|
|
totalWords: number
|
|
imageCount: number
|
|
voiceCount: number
|
|
emojiCount: number
|
|
myTopEmojiMd5?: string
|
|
friendTopEmojiMd5?: string
|
|
myTopEmojiUrl?: string
|
|
friendTopEmojiUrl?: string
|
|
}
|
|
|
|
export interface DualReportData {
|
|
year: number
|
|
selfName: string
|
|
friendUsername: string
|
|
friendName: string
|
|
firstChat: DualReportFirstChat | null
|
|
firstChatMessages?: DualReportMessage[]
|
|
yearFirstChat?: {
|
|
createTime: number
|
|
createTimeStr: string
|
|
content: string
|
|
isSentByMe: boolean
|
|
friendName: string
|
|
firstThreeMessages: DualReportMessage[]
|
|
} | null
|
|
stats: DualReportStats
|
|
topPhrases: Array<{ phrase: string; count: number }>
|
|
}
|
|
|
|
class DualReportService {
|
|
private broadcastProgress(status: string, progress: number) {
|
|
if (parentPort) {
|
|
parentPort.postMessage({
|
|
type: 'dualReport:progress',
|
|
data: { status, progress }
|
|
})
|
|
}
|
|
}
|
|
|
|
private reportProgress(status: string, progress: number, onProgress?: (status: string, progress: number) => void) {
|
|
if (onProgress) {
|
|
onProgress(status, progress)
|
|
return
|
|
}
|
|
this.broadcastProgress(status, progress)
|
|
}
|
|
|
|
private cleanAccountDirName(dirName: string): string {
|
|
const trimmed = dirName.trim()
|
|
if (!trimmed) return trimmed
|
|
if (trimmed.toLowerCase().startsWith('wxid_')) {
|
|
const match = trimmed.match(/^(wxid_[^_]+)/i)
|
|
if (match) return match[1]
|
|
return trimmed
|
|
}
|
|
const suffixMatch = trimmed.match(/^(.+)_([a-zA-Z0-9]{4})$/)
|
|
if (suffixMatch) return suffixMatch[1]
|
|
return trimmed
|
|
}
|
|
|
|
private async ensureConnectedWithConfig(
|
|
dbPath: string,
|
|
decryptKey: string,
|
|
wxid: string
|
|
): Promise<{ success: boolean; cleanedWxid?: string; rawWxid?: string; error?: string }> {
|
|
if (!wxid) return { success: false, error: '未配置微信ID' }
|
|
if (!dbPath) return { success: false, error: '未配置数据库路径' }
|
|
if (!decryptKey) return { success: false, error: '未配置解密密钥' }
|
|
|
|
const cleanedWxid = this.cleanAccountDirName(wxid)
|
|
const ok = await wcdbService.open(dbPath, decryptKey, cleanedWxid)
|
|
if (!ok) return { success: false, error: 'WCDB 打开失败' }
|
|
return { success: true, cleanedWxid, rawWxid: wxid }
|
|
}
|
|
|
|
private decodeMessageContent(messageContent: any, compressContent: any): string {
|
|
let content = this.decodeMaybeCompressed(compressContent)
|
|
if (!content || content.length === 0) {
|
|
content = this.decodeMaybeCompressed(messageContent)
|
|
}
|
|
return content
|
|
}
|
|
|
|
private decodeMaybeCompressed(raw: any): string {
|
|
if (!raw) return ''
|
|
if (typeof raw === 'string') {
|
|
if (raw.length === 0) return ''
|
|
if (this.looksLikeHex(raw)) {
|
|
const bytes = Buffer.from(raw, 'hex')
|
|
if (bytes.length > 0) return this.decodeBinaryContent(bytes)
|
|
}
|
|
if (this.looksLikeBase64(raw)) {
|
|
try {
|
|
const bytes = Buffer.from(raw, 'base64')
|
|
return this.decodeBinaryContent(bytes)
|
|
} catch {
|
|
return raw
|
|
}
|
|
}
|
|
return raw
|
|
}
|
|
return ''
|
|
}
|
|
|
|
private decodeBinaryContent(data: Buffer): string {
|
|
if (data.length === 0) return ''
|
|
try {
|
|
if (data.length >= 4) {
|
|
const magic = data.readUInt32LE(0)
|
|
if (magic === 0xFD2FB528) {
|
|
const fzstd = require('fzstd')
|
|
const decompressed = fzstd.decompress(data)
|
|
return Buffer.from(decompressed).toString('utf-8')
|
|
}
|
|
}
|
|
const decoded = data.toString('utf-8')
|
|
const replacementCount = (decoded.match(/\uFFFD/g) || []).length
|
|
if (replacementCount < decoded.length * 0.2) {
|
|
return decoded.replace(/\uFFFD/g, '')
|
|
}
|
|
return data.toString('latin1')
|
|
} catch {
|
|
return ''
|
|
}
|
|
}
|
|
|
|
private looksLikeHex(s: string): boolean {
|
|
if (s.length % 2 !== 0) return false
|
|
return /^[0-9a-fA-F]+$/.test(s)
|
|
}
|
|
|
|
private looksLikeBase64(s: string): boolean {
|
|
if (s.length % 4 !== 0) return false
|
|
return /^[A-Za-z0-9+/=]+$/.test(s)
|
|
}
|
|
|
|
private formatDateTime(milliseconds: number): string {
|
|
const dt = new Date(milliseconds)
|
|
const month = String(dt.getMonth() + 1).padStart(2, '0')
|
|
const day = String(dt.getDate()).padStart(2, '0')
|
|
const hour = String(dt.getHours()).padStart(2, '0')
|
|
const minute = String(dt.getMinutes()).padStart(2, '0')
|
|
return `${month}/${day} ${hour}:${minute}`
|
|
}
|
|
|
|
private extractEmojiUrl(content: string): string | undefined {
|
|
if (!content) return undefined
|
|
const attrMatch = /cdnurl\s*=\s*['"]([^'"]+)['"]/i.exec(content)
|
|
if (attrMatch) {
|
|
let url = attrMatch[1].replace(/&/g, '&')
|
|
try {
|
|
if (url.includes('%')) {
|
|
url = decodeURIComponent(url)
|
|
}
|
|
} catch { }
|
|
return url
|
|
}
|
|
const tagMatch = /cdnurl[^>]*>([^<]+)/i.exec(content)
|
|
return tagMatch?.[1]
|
|
}
|
|
|
|
private extractEmojiMd5(content: string): string | undefined {
|
|
if (!content) return undefined
|
|
const match = /md5="([^"]+)"/i.exec(content) || /<md5>([^<]+)<\/md5>/i.exec(content)
|
|
return match?.[1]
|
|
}
|
|
|
|
private async getDisplayName(username: string, fallback: string): Promise<string> {
|
|
const result = await wcdbService.getDisplayNames([username])
|
|
if (result.success && result.map) {
|
|
return result.map[username] || fallback
|
|
}
|
|
return fallback
|
|
}
|
|
|
|
private resolveIsSent(row: any, rawWxid?: string, cleanedWxid?: string): boolean {
|
|
const isSendRaw = row.computed_is_send ?? row.is_send
|
|
if (isSendRaw !== undefined && isSendRaw !== null) {
|
|
return parseInt(isSendRaw, 10) === 1
|
|
}
|
|
const sender = String(row.sender_username || row.sender || row.talker || '').toLowerCase()
|
|
if (!sender) return false
|
|
const rawLower = rawWxid ? rawWxid.toLowerCase() : ''
|
|
const cleanedLower = cleanedWxid ? cleanedWxid.toLowerCase() : ''
|
|
return sender === rawLower || sender === cleanedLower
|
|
}
|
|
|
|
private async getFirstMessages(
|
|
sessionId: string,
|
|
limit: number,
|
|
beginTimestamp: number,
|
|
endTimestamp: number
|
|
): Promise<any[]> {
|
|
const safeBegin = Math.max(0, beginTimestamp || 0)
|
|
const safeEnd = endTimestamp && endTimestamp > 0 ? endTimestamp : Math.floor(Date.now() / 1000)
|
|
const cursorResult = await wcdbService.openMessageCursor(sessionId, Math.max(1, limit), true, safeBegin, safeEnd)
|
|
if (!cursorResult.success || !cursorResult.cursor) return []
|
|
try {
|
|
const rows: any[] = []
|
|
let hasMore = true
|
|
while (hasMore && rows.length < limit) {
|
|
const batch = await wcdbService.fetchMessageBatch(cursorResult.cursor)
|
|
if (!batch.success || !batch.rows) break
|
|
for (const row of batch.rows) {
|
|
rows.push(row)
|
|
if (rows.length >= limit) break
|
|
}
|
|
hasMore = batch.hasMore === true
|
|
}
|
|
return rows.slice(0, limit)
|
|
} finally {
|
|
await wcdbService.closeMessageCursor(cursorResult.cursor)
|
|
}
|
|
}
|
|
|
|
async generateReportWithConfig(params: {
|
|
year: number
|
|
friendUsername: string
|
|
dbPath: string
|
|
decryptKey: string
|
|
wxid: string
|
|
onProgress?: (status: string, progress: number) => void
|
|
}): Promise<{ success: boolean; data?: DualReportData; error?: string }> {
|
|
try {
|
|
const { year, friendUsername, dbPath, decryptKey, wxid, onProgress } = params
|
|
this.reportProgress('正在连接数据库...', 5, onProgress)
|
|
const conn = await this.ensureConnectedWithConfig(dbPath, decryptKey, wxid)
|
|
if (!conn.success || !conn.cleanedWxid || !conn.rawWxid) return { success: false, error: conn.error }
|
|
|
|
const cleanedWxid = conn.cleanedWxid
|
|
const rawWxid = conn.rawWxid
|
|
|
|
const reportYear = year <= 0 ? 0 : year
|
|
const isAllTime = reportYear === 0
|
|
const startTime = isAllTime ? 0 : Math.floor(new Date(reportYear, 0, 1).getTime() / 1000)
|
|
const endTime = isAllTime ? 0 : Math.floor(new Date(reportYear, 11, 31, 23, 59, 59).getTime() / 1000)
|
|
|
|
this.reportProgress('加载联系人信息...', 10, onProgress)
|
|
const friendName = await this.getDisplayName(friendUsername, friendUsername)
|
|
let myName = await this.getDisplayName(rawWxid, rawWxid)
|
|
if (myName === rawWxid && cleanedWxid && cleanedWxid !== rawWxid) {
|
|
myName = await this.getDisplayName(cleanedWxid, rawWxid)
|
|
}
|
|
|
|
this.reportProgress('获取首条聊天记录...', 15, onProgress)
|
|
const firstRows = await this.getFirstMessages(friendUsername, 3, 0, 0)
|
|
let firstChat: DualReportFirstChat | null = null
|
|
if (firstRows.length > 0) {
|
|
const row = firstRows[0]
|
|
const createTime = parseInt(row.create_time || '0', 10) * 1000
|
|
const content = this.decodeMessageContent(row.message_content, row.compress_content)
|
|
firstChat = {
|
|
createTime,
|
|
createTimeStr: this.formatDateTime(createTime),
|
|
content: String(content || ''),
|
|
isSentByMe: this.resolveIsSent(row, rawWxid, cleanedWxid),
|
|
senderUsername: row.sender_username || row.sender
|
|
}
|
|
}
|
|
const firstChatMessages: DualReportMessage[] = firstRows.map((row) => {
|
|
const msgTime = parseInt(row.create_time || '0', 10) * 1000
|
|
const msgContent = this.decodeMessageContent(row.message_content, row.compress_content)
|
|
return {
|
|
content: String(msgContent || ''),
|
|
isSentByMe: this.resolveIsSent(row, rawWxid, cleanedWxid),
|
|
createTime: msgTime,
|
|
createTimeStr: this.formatDateTime(msgTime)
|
|
}
|
|
})
|
|
|
|
let yearFirstChat: DualReportData['yearFirstChat'] = null
|
|
if (!isAllTime) {
|
|
this.reportProgress('获取今年首次聊天...', 20, onProgress)
|
|
const firstYearRows = await this.getFirstMessages(friendUsername, 3, startTime, endTime)
|
|
if (firstYearRows.length > 0) {
|
|
const firstRow = firstYearRows[0]
|
|
const createTime = parseInt(firstRow.create_time || '0', 10) * 1000
|
|
const firstThreeMessages: DualReportMessage[] = firstYearRows.map((row) => {
|
|
const msgTime = parseInt(row.create_time || '0', 10) * 1000
|
|
const msgContent = this.decodeMessageContent(row.message_content, row.compress_content)
|
|
return {
|
|
content: String(msgContent || ''),
|
|
isSentByMe: this.resolveIsSent(row, rawWxid, cleanedWxid),
|
|
createTime: msgTime,
|
|
createTimeStr: this.formatDateTime(msgTime)
|
|
}
|
|
})
|
|
yearFirstChat = {
|
|
createTime,
|
|
createTimeStr: this.formatDateTime(createTime),
|
|
content: String(this.decodeMessageContent(firstRow.message_content, firstRow.compress_content) || ''),
|
|
isSentByMe: this.resolveIsSent(firstRow, rawWxid, cleanedWxid),
|
|
friendName,
|
|
firstThreeMessages
|
|
}
|
|
}
|
|
}
|
|
|
|
this.reportProgress('统计聊天数据...', 30, onProgress)
|
|
const stats: DualReportStats = {
|
|
totalMessages: 0,
|
|
totalWords: 0,
|
|
imageCount: 0,
|
|
voiceCount: 0,
|
|
emojiCount: 0
|
|
}
|
|
const wordCountMap = new Map<string, number>()
|
|
const myEmojiCounts = new Map<string, number>()
|
|
const friendEmojiCounts = new Map<string, number>()
|
|
const myEmojiUrlMap = new Map<string, string>()
|
|
const friendEmojiUrlMap = new Map<string, string>()
|
|
|
|
const messageCountResult = await wcdbService.getMessageCount(friendUsername)
|
|
const totalForProgress = messageCountResult.success && messageCountResult.count
|
|
? messageCountResult.count
|
|
: 0
|
|
let processed = 0
|
|
let lastProgressAt = 0
|
|
|
|
const cursorResult = await wcdbService.openMessageCursor(friendUsername, 1000, true, startTime, endTime)
|
|
if (!cursorResult.success || !cursorResult.cursor) {
|
|
return { success: false, error: cursorResult.error || '打开消息游标失败' }
|
|
}
|
|
|
|
try {
|
|
let hasMore = true
|
|
while (hasMore) {
|
|
const batch = await wcdbService.fetchMessageBatch(cursorResult.cursor)
|
|
if (!batch.success || !batch.rows) break
|
|
for (const row of batch.rows) {
|
|
const localType = parseInt(row.local_type || row.type || '1', 10)
|
|
const isSent = this.resolveIsSent(row, rawWxid, cleanedWxid)
|
|
stats.totalMessages += 1
|
|
|
|
if (localType === 3) stats.imageCount += 1
|
|
if (localType === 34) stats.voiceCount += 1
|
|
if (localType === 47) {
|
|
stats.emojiCount += 1
|
|
const content = this.decodeMessageContent(row.message_content, row.compress_content)
|
|
const md5 = this.extractEmojiMd5(content)
|
|
const url = this.extractEmojiUrl(content)
|
|
if (md5) {
|
|
const targetMap = isSent ? myEmojiCounts : friendEmojiCounts
|
|
targetMap.set(md5, (targetMap.get(md5) || 0) + 1)
|
|
if (url) {
|
|
const urlMap = isSent ? myEmojiUrlMap : friendEmojiUrlMap
|
|
if (!urlMap.has(md5)) urlMap.set(md5, url)
|
|
}
|
|
}
|
|
}
|
|
|
|
if (localType === 1 || localType === 244813135921) {
|
|
const content = this.decodeMessageContent(row.message_content, row.compress_content)
|
|
const text = String(content || '').trim()
|
|
if (text.length > 0) {
|
|
stats.totalWords += text.replace(/\s+/g, '').length
|
|
const normalized = text.replace(/\s+/g, ' ').trim()
|
|
if (normalized.length >= 2 &&
|
|
normalized.length <= 50 &&
|
|
!normalized.includes('http') &&
|
|
!normalized.includes('<') &&
|
|
!normalized.startsWith('[') &&
|
|
!normalized.startsWith('<?xml')) {
|
|
wordCountMap.set(normalized, (wordCountMap.get(normalized) || 0) + 1)
|
|
}
|
|
}
|
|
}
|
|
|
|
if (totalForProgress > 0) {
|
|
processed++
|
|
}
|
|
}
|
|
hasMore = batch.hasMore === true
|
|
|
|
const now = Date.now()
|
|
if (now - lastProgressAt > 200) {
|
|
if (totalForProgress > 0) {
|
|
const ratio = Math.min(1, processed / totalForProgress)
|
|
const progress = 30 + Math.floor(ratio * 50)
|
|
this.reportProgress('统计聊天数据...', progress, onProgress)
|
|
}
|
|
lastProgressAt = now
|
|
}
|
|
}
|
|
} finally {
|
|
await wcdbService.closeMessageCursor(cursorResult.cursor)
|
|
}
|
|
|
|
const pickTop = (map: Map<string, number>): string | undefined => {
|
|
let topKey: string | undefined
|
|
let topCount = -1
|
|
for (const [key, count] of map.entries()) {
|
|
if (count > topCount) {
|
|
topCount = count
|
|
topKey = key
|
|
}
|
|
}
|
|
return topKey
|
|
}
|
|
|
|
const myTopEmojiMd5 = pickTop(myEmojiCounts)
|
|
const friendTopEmojiMd5 = pickTop(friendEmojiCounts)
|
|
|
|
stats.myTopEmojiMd5 = myTopEmojiMd5
|
|
stats.friendTopEmojiMd5 = friendTopEmojiMd5
|
|
stats.myTopEmojiUrl = myTopEmojiMd5 ? myEmojiUrlMap.get(myTopEmojiMd5) : undefined
|
|
stats.friendTopEmojiUrl = friendTopEmojiMd5 ? friendEmojiUrlMap.get(friendTopEmojiMd5) : undefined
|
|
|
|
this.reportProgress('生成常用语词云...', 85, onProgress)
|
|
const topPhrases = Array.from(wordCountMap.entries())
|
|
.filter(([_, count]) => count >= 2)
|
|
.sort((a, b) => b[1] - a[1])
|
|
.slice(0, 50)
|
|
.map(([phrase, count]) => ({ phrase, count }))
|
|
|
|
const reportData: DualReportData = {
|
|
year: reportYear,
|
|
selfName: myName,
|
|
friendUsername,
|
|
friendName,
|
|
firstChat,
|
|
firstChatMessages,
|
|
yearFirstChat,
|
|
stats,
|
|
topPhrases
|
|
}
|
|
|
|
this.reportProgress('双人报告生成完成', 100, onProgress)
|
|
return { success: true, data: reportData }
|
|
} catch (e) {
|
|
return { success: false, error: String(e) }
|
|
}
|
|
}
|
|
}
|
|
|
|
export const dualReportService = new DualReportService()
|