@@ -8,6 +8,7 @@
 import asyncio
 import os
 import sys
+import time
 from pathlib import Path
 from typing import List
 from .base import (
@@ -86,8 +87,58 @@ class XiaohongshuPublisher(BasePublisher):
             raise Exception(f"Signing failed: {e}")

     def sign_sync(self, uri, data=None, a1="", web_session=""):
-        """Synchronous signing function, used by XhsClient."""
-        return asyncio.run(self.get_sign(uri, data, a1, web_session))
+        """
+        Synchronous signing function, used by XhsClient.
+
+        Note: the publish flow runs inside an asyncio event loop (started via asyncio.run),
+        so calling asyncio.run again here raises "asyncio.run() cannot be called from a running event loop".
+        We therefore use the synchronous sync_playwright implementation instead (following matrix/xhs_uploader).
+        """
+        try:
+            from playwright.sync_api import sync_playwright
+        except Exception as e:
+            raise Exception(f"playwright sync API is unavailable: {e}")
+
+        last_exc: Exception | None = None
+        for attempt in range(1, 6):
+            try:
+                with sync_playwright() as playwright:
+                    browser = playwright.chromium.launch(headless=True)
+                    context = browser.new_context()
+
+                    if STEALTH_JS_PATH.exists():
+                        context.add_init_script(path=str(STEALTH_JS_PATH))
+
+                    page = context.new_page()
+                    page.goto("https://www.xiaohongshu.com", wait_until="domcontentloaded", timeout=60000)
+
+                    if a1:
+                        context.add_cookies([
+                            {'name': 'a1', 'value': a1, 'domain': ".xiaohongshu.com", 'path': "/"}
+                        ])
+                        page.reload(wait_until="domcontentloaded")
+
+                    # Following matrix: wait after setting the cookie, or window._webmsxyw may not exist yet
+                    time.sleep(1.5)
+
+                    encrypt_params = page.evaluate(
+                        "([url, data]) => window._webmsxyw(url, data)",
+                        [uri, data]
+                    )
+
+                    context.close()
+                    browser.close()
+
+                    return {
+                        "x-s": encrypt_params["X-s"],
+                        "x-t": str(encrypt_params["X-t"])
+                    }
+            except Exception as e:
+                last_exc = e
+                # Back off slightly before retrying
+                time.sleep(0.4 * attempt)
+
+        raise Exception(f"Signing failed: {last_exc}")

     async def publish_via_api(self, cookies: str, params: PublishParams) -> PublishResult:
         """Publish a video via the API"""
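
The docstring above pins down the core constraint: asyncio.run() raises RuntimeError when the calling thread already has a running event loop, which is why the old one-liner broke once the publish flow itself ran under asyncio.run. An alternative that avoids launching a fresh Chromium per signature would be to run the existing async get_sign on a private loop in a worker thread. A minimal sketch of that idea follows; it is not what this diff implements, and it assumes get_sign touches no loop-bound state from the publish flow:

    import asyncio
    from concurrent.futures import ThreadPoolExecutor

    def sign_sync_threaded(self, uri, data=None, a1="", web_session=""):
        # The worker thread has no running loop, so asyncio.run is legal there;
        # future.result() blocks until the coroutine completes.
        with ThreadPoolExecutor(max_workers=1) as pool:
            future = pool.submit(asyncio.run, self.get_sign(uri, data, a1, web_session))
            return future.result()

The diff instead isolates signing in its own sync_playwright browser, which also sidesteps sharing Playwright objects with the async flow. Either way the signer is handed over as a plain callable, roughly XhsClient(cookie, sign=publisher.sign_sync) per the xhs package convention.
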
@@ -596,29 +647,14 @@ class XiaohongshuPublisher(BasePublisher):
         # Remove the response listener
         self.page.remove_listener('response', handle_response)

-        # Process the captured data
-        import json
-        if captured_data:
-            print(f"[{self.platform_name}] Captured API data", flush=True)
-            data = captured_data.get('data', {})
-            notes = data.get('notes', [])
-            print(f"[{self.platform_name}] notes count: {len(notes)}", flush=True)
-
-            # Get the total from tags
-            tags = data.get('tags', [])
-            for tag in tags:
-                if tag.get('id') == 'special.note_time_desc':
-                    total = tag.get('notes_count', 0)
-                    break
-
-            has_more = data.get('page', -1) != -1
-
-            for note in notes:
+        # Process the captured data (with pagination, instead of only the first page)
+        def parse_notes(notes_list):
+            parsed = []
+            for note in notes_list:
                 note_id = note.get('id', '')
                 if not note_id:
                     continue

-                # Get the cover
                 cover_url = ''
                 images_list = note.get('images_list', [])
                 if images_list:
@@ -626,10 +662,8 @@ class XiaohongshuPublisher(BasePublisher):
                 if cover_url.startswith('http://'):
                     cover_url = cover_url.replace('http://', 'https://')

-                # Get the duration
                 duration = note.get('video_info', {}).get('duration', 0)

-                # Parse the status
                 status = 'published'
                 tab_status = note.get('tab_status', 1)
                 if tab_status == 0:
@@ -639,7 +673,7 @@ class XiaohongshuPublisher(BasePublisher):
                 elif tab_status == 3:
                     status = 'rejected'

-                works.append(WorkItem(
+                parsed.append(WorkItem(
                     work_id=note_id,
                     title=note.get('display_title', '') or 'Untitled',
                     cover_url=cover_url,
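
The next hunk replays parse_notes for every further page and stops as soon as a page contributes nothing new, rather than trusting the API's page field. The stopping rule in miniature (toy ids, illustrative only):

    # Accumulate pages until one is empty or contains only already-seen ids.
    seen, collected = set(), []
    for page_notes in ([{"id": "n1"}, {"id": "n2"}], [{"id": "n2"}, {"id": "n3"}], []):
        new = [n for n in page_notes if n["id"] not in seen]
        if not new:  # empty page or pure repeats -> treat as exhausted
            break
        seen.update(n["id"] for n in new)
        collected.extend(new)
    assert [n["id"] for n in collected] == ["n1", "n2", "n3"]
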
@@ -652,8 +686,83 @@ class XiaohongshuPublisher(BasePublisher):
                     share_count=note.get('shared_count', 0),
                     collect_count=note.get('collected_count', 0),
                 ))
+            return parsed
+
+        import json
+        if captured_data:
+            print(f"[{self.platform_name}] Captured API data", flush=True)
+            data = captured_data.get('data', {})
+            notes = data.get('notes', [])
+            print(f"[{self.platform_name}] notes count: {len(notes)}", flush=True)
+
+            # Get the total from tags
+            tags = data.get('tags', [])
+            for tag in tags:
+                if tag.get('id') == 'special.note_time_desc':
+                    total = tag.get('notes_count', 0)
+                    break
+
+            works.extend(parse_notes(notes))
+
+            # Fetch the remaining pages; don't trust data.page (it can falsely report -1), stop only when a page yields nothing new
+            max_pages = 30
+            page_num = 1  # page=0 was already captured above
+            seen_note_ids = {w.work_id for w in works}
+            has_more = True
+
+            while has_more and page_num < max_pages:
+                try:
+                    next_resp = await self.page.evaluate(
+                        """async (p) => {
+                            const res = await fetch(`https://edith.xiaohongshu.com/web_api/sns/v5/creator/note/user/posted?tab=0&page=${p}`, {
+                                method: 'GET',
+                                credentials: 'include',
+                                headers: { 'Accept': 'application/json' }
+                            });
+                            return await res.json();
+                        }""",
+                        page_num
+                    )
+                except Exception as fetch_err:
+                    print(f"[{self.platform_name}] Pagination request failed, page={page_num}: {fetch_err}", flush=True)
+                    break
+
+                if not next_resp:
+                    break
+
+                if not (next_resp.get('success') or next_resp.get('code') == 0):
+                    break
+
+                next_data = next_resp.get('data', {})
+                next_notes = next_data.get('notes', []) or []
+
+                if not next_notes:
+                    has_more = False
+                    break
+
+                parsed_next = parse_notes(next_notes)
+                new_items = [w for w in parsed_next if w.work_id and w.work_id not in seen_note_ids]
+                if not new_items:
+                    # Nothing new on this page; stop
+                    has_more = False
+                    break
+
+                for w in new_items:
+                    seen_note_ids.add(w.work_id)
+                works.extend(new_items)
+
+                # Update the total (if the first page did not provide it)
+                if not total and next_data.get('tags'):
+                    for tag in next_data.get('tags', []):
+                        if tag.get('id') == 'special.note_time_desc':
+                            total = tag.get('notes_count', 0)
+                            break
+
+                page_num += 1

-            print(f"[{self.platform_name}] Parsed {len(works)} works, total: {total}", flush=True)
+            # Pagination finished; has_more stays True only if the max_pages cap was hit first
+            if not has_more:
+                print(f"[{self.platform_name}] Fetched all pages, {len(works)} works in total", flush=True)
         else:
             print(f"[{self.platform_name}] Failed to capture API data", flush=True)
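
For reference, the response shape the pagination loop assumes, reconstructed from the fields the code reads (key names come from this diff; the values are illustrative):

    example_resp = {
        "success": True,          # the loop also accepts "code": 0
        "data": {
            "notes": [],          # one page of notes; empty when exhausted
            "tags": [
                # carries the overall count the code stores in `total`
                {"id": "special.note_time_desc", "notes_count": 123},
            ],
            "page": -1,           # present but unreliable, hence the dedup-based stop
        },
    }

Because the fetch runs inside page.evaluate with credentials: 'include', each pagination request rides on the logged-in creator session's cookies instead of going through the signer.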