feat(screen-recorder): refactor

2025-06-06 03:05:25 +00:00 · 2024-09-02 00:03:20 +08:00 · 2024-09-02 00:03:20 +08:00 · 63c302e017
commit 63c302e017
parent 2b2d616775
5 changed files with 210 additions and 329 deletions
--- a/pyproject.toml
+++ b/pyproject.toml
@ -28,6 +28,12 @@ dependencies = [
    "opencv-python",
    "pillow",
    "piexif",
    "imagehash",
    "screeninfo",
    "pywin32; sys_platform == 'win32'",
    "psutil; sys_platform == 'win32'",
    "pyobjc-framework-Quartz; sys_platform == 'darwin'",
    "pyobjc-framework-AppKit; sys_platform == 'darwin'",
 ]
 [project.urls]
@ -37,7 +43,7 @@ Homepage = "https://github.com/arkohut/memos"
 memos = "memos.commands:app"
 [tool.setuptools.packages.find]
-include = ["memos*"]
+include = ["memos*", "screen_recorder*"]
 [tool.setuptools.package-data]
 "*" = ["static/**/*"]
--- a/screen_recorder/common.py
+++ b/screen_recorder/common.py
@ -0,0 +1,193 @@
 import json
 import os
 import time
 import logging
 import platform
 import subprocess
 from PIL import Image, ImageGrab
 import imagehash
 from memos.utils import write_image_metadata
 from screeninfo import get_monitors
 import ctypes
 if platform.system() == "Windows":
    import win32gui
    import win32process
    import psutil
 elif platform.system() == "Darwin":
    from AppKit import NSWorkspace
    from Quartz import (
        CGWindowListCopyWindowInfo,
        kCGWindowListOptionOnScreenOnly,
        kCGNullWindowID,
        CGSessionCopyCurrentDictionary,
    )
 def load_screen_sequences(base_dir, date):
    try:
        with open(os.path.join(base_dir, date, ".screen_sequences"), "r") as f:
            return json.load(f)
    except FileNotFoundError:
        return {}
 def save_screen_sequences(base_dir, screen_sequences, date):
    with open(os.path.join(base_dir, date, ".screen_sequences"), "w") as f:
        json.dump(screen_sequences, f)
        f.flush()
        os.fsync(f.fileno())
 def load_previous_hashes(base_dir):
    date = time.strftime("%Y%m%d")
    hash_file = os.path.join(base_dir, date, ".previous_hashes")
    try:
        with open(hash_file, "r") as f:
            return json.load(f)
    except FileNotFoundError:
        return {}
 def save_previous_hashes(base_dir, previous_hashes):
    date = time.strftime("%Y%m%d")
    hash_file = os.path.join(base_dir, date, ".previous_hashes")
    os.makedirs(os.path.dirname(hash_file), exist_ok=True)
    with open(hash_file, "w") as f:
        json.dump(previous_hashes, f)
 def get_active_window_info():
    if platform.system() == "Darwin":
        active_app = NSWorkspace.sharedWorkspace().activeApplication()
        app_name = active_app["NSApplicationName"]
        app_pid = active_app["NSApplicationProcessIdentifier"]
        windows = CGWindowListCopyWindowInfo(
            kCGWindowListOptionOnScreenOnly, kCGNullWindowID
        )
        for window in windows:
            if window["kCGWindowOwnerPID"] == app_pid:
                window_title = window.get("kCGWindowName", "")
                if window_title:
                    return app_name, window_title
        return app_name, ""  # 如果没有找到窗口标题，则返回空字符串作为标题
    elif platform.system() == "Windows":
        try:
            window = win32gui.GetForegroundWindow()
            _, pid = win32process.GetWindowThreadProcessId(window)
            app_name = psutil.Process(pid).name()
            window_title = win32gui.GetWindowText(window)
            return app_name, window_title
        except:
            return "", ""
 def take_screenshot_macos(base_dir, previous_hashes, threshold, screen_sequences, date, timestamp, app_name, window_title):
    screenshots = []
    result = subprocess.check_output(["system_profiler", "SPDisplaysDataType", "-json"])
    displays_info = json.loads(result)["SPDisplaysDataType"][0]["spdisplays_ndrvs"]
    screen_names = {}
    for display_index, display_info in enumerate(displays_info):
        base_screen_name = display_info["_name"].replace(" ", "_").lower()
        if base_screen_name in screen_names:
            screen_names[base_screen_name] += 1
            screen_name = f"{base_screen_name}_{screen_names[base_screen_name]}"
        else:
            screen_names[base_screen_name] = 1
            screen_name = base_screen_name
        temp_filename = os.path.join(base_dir, date, f"temp_screenshot-{timestamp}-of-{screen_name}.png")
        subprocess.run(["screencapture", "-C", "-x", "-D", str(display_index + 1), temp_filename])
        with Image.open(temp_filename) as img:
            img = img.convert("RGB")
            webp_filename = os.path.join(base_dir, date, f"screenshot-{timestamp}-of-{screen_name}.webp")
            current_hash = str(imagehash.phash(img))
            if (screen_name in previous_hashes and 
                imagehash.hex_to_hash(current_hash) - imagehash.hex_to_hash(previous_hashes[screen_name]) < threshold):
                logging.info(f"Screenshot for {screen_name} is similar to the previous one. Skipping.")
                os.remove(temp_filename)
                yield screen_name, None, "Skipped (similar to previous)"
                continue
            previous_hashes[screen_name] = current_hash
            screen_sequences[screen_name] = screen_sequences.get(screen_name, 0) + 1
            metadata = {
                "timestamp": timestamp,
                "active_app": app_name,
                "active_window": window_title,
                "screen_name": screen_name,
                "sequence": screen_sequences[screen_name],
            }
            img.save(webp_filename, format="WebP", quality=85)
            write_image_metadata(webp_filename, metadata)
            save_screen_sequences(base_dir, screen_sequences, date)
        os.remove(temp_filename)
        screenshots.append(webp_filename)
        yield screen_name, webp_filename, "Saved"
 def take_screenshot_windows(base_dir, previous_hashes, threshold, screen_sequences, date, timestamp, app_name, window_title):
    for monitor in get_monitors():
        safe_monitor_name = ''.join(c for c in monitor.name if c.isalnum() or c in ('_', '-'))
        logging.info(f"Processing monitor: {safe_monitor_name}")
        webp_filename = os.path.join(base_dir, date, f"screenshot-{timestamp}-of-{safe_monitor_name}.webp")
        img = ImageGrab.grab(bbox=(monitor.x, monitor.y, monitor.x + monitor.width, monitor.y + monitor.height))
        img = img.convert("RGB")
        current_hash = str(imagehash.phash(img))
        if safe_monitor_name in previous_hashes and imagehash.hex_to_hash(current_hash) - imagehash.hex_to_hash(previous_hashes[safe_monitor_name]) < threshold:
            logging.info(f"Screenshot for {safe_monitor_name} is similar to the previous one. Skipping.")
            yield safe_monitor_name, None, "Skipped (similar to previous)"
            continue
        previous_hashes[safe_monitor_name] = current_hash
        screen_sequences[safe_monitor_name] = screen_sequences.get(safe_monitor_name, 0) + 1
        metadata = {
            "timestamp": timestamp,
            "active_app": app_name,
            "active_window": window_title,
            "screen_name": safe_monitor_name,
            "sequence": screen_sequences[safe_monitor_name],
        }
        img.save(webp_filename, format="WebP", quality=85)
        write_image_metadata(webp_filename, metadata)
        save_screen_sequences(base_dir, screen_sequences, date)
        yield safe_monitor_name, webp_filename, "Saved"
 def take_screenshot(base_dir, previous_hashes, threshold, screen_sequences, date, timestamp):
    app_name, window_title = get_active_window_info()
    os.makedirs(os.path.join(base_dir, date), exist_ok=True)
    worklog_path = os.path.join(base_dir, date, "worklog")
    with open(worklog_path, "a") as worklog:
        if platform.system() == "Darwin":
            screenshot_generator = take_screenshot_macos(base_dir, previous_hashes, threshold, screen_sequences, date, timestamp, app_name, window_title)
        elif platform.system() == "Windows":
            screenshot_generator = take_screenshot_windows(base_dir, previous_hashes, threshold, screen_sequences, date, timestamp, app_name, window_title)
        else:
            raise NotImplementedError(f"Unsupported operating system: {platform.system()}")
        screenshots = []
        for screen_name, screenshot_file, status in screenshot_generator:
            worklog.write(f"{timestamp} - {screen_name} - {status}\n")
            if screenshot_file:
                screenshots.append(screenshot_file)
    return screenshots
 def is_screen_locked():
    if platform.system() == "Darwin":
        session_dict = CGSessionCopyCurrentDictionary()
        if session_dict:
            screen_locked = session_dict.get("CGSSessionScreenIsLocked", 0)
            return bool(screen_locked)
        return False
    elif platform.system() == "Windows":
        user32 = ctypes.windll.User32
        return user32.GetForegroundWindow() == 0
--- a/screen_recorder/record-for-win.bat
+++ b/screen_recorder/record-for-win.bat
@ -1,6 +1,6 @@
@echo off
 call C:\Users\arkoh\miniconda3\Scripts\activate.bat memos
 :loop
-python -m screen_recorder.record-for-win --once
+python -m screen_recorder.record --once
 timeout /t 5 /nobreak >nul
 goto loop
--- a/screen_recorder/record-for-win.py
+++ b/screen_recorder/record-for-win.py
@ -1,159 +0,0 @@
 import logging
 import time
 import os
 import json
 import argparse
 import imagehash
 from PIL import ImageGrab, Image
 import win32gui
 import win32process
 import psutil
 from memos.utils import write_image_metadata
 import ctypes
 from screeninfo import get_monitors
 logging.basicConfig(level=logging.INFO, format='%(asctime)s - %(levelname)s - %(message)s')
 def get_active_window_info():
    try:
        window = win32gui.GetForegroundWindow()
        _, pid = win32process.GetWindowThreadProcessId(window)
        app_name = psutil.Process(pid).name()
        window_title = win32gui.GetWindowText(window)
        return app_name, window_title
    except:
        return "", ""
 def load_screen_sequences(base_dir, date):
    try:
        with open(os.path.join(base_dir, date, ".screen_sequences"), "r") as f:
            return json.load(f)
    except FileNotFoundError:
        return {}
 def save_screen_sequences(base_dir, screen_sequences, date):
    with open(os.path.join(base_dir, date, ".screen_sequences"), "w") as f:
        json.dump(screen_sequences, f)
        f.flush()
        os.fsync(f.fileno())
 def take_screenshot(base_dir, previous_hashes, threshold, screen_sequences, date, timestamp):
    screenshots = []
    app_name, window_title = get_active_window_info()
    os.makedirs(os.path.join(base_dir, date), exist_ok=True)
    worklog_path = os.path.join(base_dir, date, "worklog")
    with open(worklog_path, "a") as worklog:
        for monitor in get_monitors():
            safe_monitor_name = ''.join(c for c in monitor.name if c.isalnum() or c in ('_', '-'))
            logging.info(f"Processing monitor: {safe_monitor_name}")
            webp_filename = os.path.join(base_dir, date, f"screenshot-{timestamp}-of-{safe_monitor_name}.webp")
            img = ImageGrab.grab(bbox=(monitor.x, monitor.y, monitor.x + monitor.width, monitor.y + monitor.height))
            img = img.convert("RGB")
            current_hash = str(imagehash.phash(img))
            if safe_monitor_name in previous_hashes and imagehash.hex_to_hash(current_hash) - imagehash.hex_to_hash(previous_hashes[safe_monitor_name]) < threshold:
                logging.info(f"Screenshot for {safe_monitor_name} is similar to the previous one. Skipping.")
                worklog.write(f"{timestamp} - {safe_monitor_name} - Skipped (similar to previous)\n")
                continue
            previous_hashes[safe_monitor_name] = current_hash
            screen_sequences[safe_monitor_name] = screen_sequences.get(safe_monitor_name, 0) + 1
            metadata = {
                "timestamp": timestamp,
                "active_app": app_name,
                "active_window": window_title,
                "screen_name": safe_monitor_name,
                "sequence": screen_sequences[safe_monitor_name],
            }
            img.save(webp_filename, format="WebP", quality=85)
            write_image_metadata(webp_filename, metadata)
            save_screen_sequences(base_dir, screen_sequences, date)
            screenshots.append(webp_filename)
            worklog.write(f"{timestamp} - {safe_monitor_name} - Saved\n")
    return screenshots
 def is_screen_locked():
    user32 = ctypes.windll.User32
    return user32.GetForegroundWindow() == 0
 def load_previous_hashes(base_dir):
    date = time.strftime("%Y%m%d")
    hash_file = os.path.join(base_dir, date, ".previous_hashes")
    try:
        with open(hash_file, "r") as f:
            return json.load(f)
    except FileNotFoundError:
        return {}
 def save_previous_hashes(base_dir, previous_hashes):
    date = time.strftime("%Y%m%d")
    hash_file = os.path.join(base_dir, date, ".previous_hashes")
    os.makedirs(os.path.dirname(hash_file), exist_ok=True)
    with open(hash_file, "w") as f:
        json.dump(previous_hashes, f)
 def run_screen_recorder_once(args, base_dir, previous_hashes):
    if not is_screen_locked():
        date = time.strftime("%Y%m%d")
        timestamp = time.strftime("%Y%m%d-%H%M%S")
        screen_sequences = load_screen_sequences(base_dir, date)
        screenshot_files = take_screenshot(
            base_dir, previous_hashes, args.threshold, screen_sequences, date, timestamp
        )
        for screenshot_file in screenshot_files:
            logging.info(f"Screenshot saved: {screenshot_file}")
        save_previous_hashes(base_dir, previous_hashes)
    else:
        logging.info("Screen is locked. Skipping screenshot.")
 def run_screen_recorder(args, base_dir, previous_hashes):
    while True:
        try:
            if not is_screen_locked():
                date = time.strftime("%Y%m%d")
                timestamp = time.strftime("%Y%m%d-%H%M%S")
                screen_sequences = load_screen_sequences(base_dir, date)
                screenshot_files = take_screenshot(
                    base_dir, previous_hashes, args.threshold, screen_sequences, date, timestamp
                )
                for screenshot_file in screenshot_files:
                    logging.info(f"Screenshot saved: {screenshot_file}")
            else:
                logging.info("Screen is locked. Skipping screenshot.")
        except Exception as e:
            logging.error(f"An error occurred: {str(e)}. Skipping this iteration.")
        time.sleep(5)
 def main():
    parser = argparse.ArgumentParser(description="Screen Recorder for Windows")
    parser.add_argument("--threshold", type=int, default=4, help="Threshold for image similarity")
    parser.add_argument("--base-dir", type=str, default="~/tmp", help="Base directory for screenshots")
    parser.add_argument("--once", action="store_true", help="Run once and exit")
    args = parser.parse_args()
    base_dir = os.path.expanduser(args.base_dir)
    previous_hashes = load_previous_hashes(base_dir)
    if args.once:
        run_screen_recorder_once(args, base_dir, previous_hashes)
    else:
        while True:
            try:
                run_screen_recorder(args, base_dir, previous_hashes)
            except Exception as e:
                logging.error(f"Critical error occurred, program will restart in 10 seconds: {str(e)}")
                time.sleep(10)
 if __name__ == "__main__":
    main()
--- a/screen_recorder/record.py
+++ b/screen_recorder/record.py
@ -1,177 +1,21 @@
 import logging
 import time
 import subprocess
 from AppKit import NSWorkspace
 from PIL import Image
 import os
 from Quartz import (
    CGWindowListCopyWindowInfo,
    kCGWindowListOptionOnScreenOnly,
    kCGNullWindowID,
    CGSessionCopyCurrentDictionary,
 )
 import json
 import imagehash
 import argparse
-from memos.utils import write_image_metadata
+import platform
 from screen_recorder.common import (
    load_screen_sequences,
    save_screen_sequences,
    load_previous_hashes,
    save_previous_hashes,
    take_screenshot,
    is_screen_locked,
 )
 # 在文件开头添加日志配置
 logging.basicConfig(level=logging.INFO, format='%(asctime)s - %(levelname)s - %(message)s')
 def get_active_window_info():
    active_app = NSWorkspace.sharedWorkspace().activeApplication()
    app_name = active_app["NSApplicationName"]
    app_pid = active_app["NSApplicationProcessIdentifier"]
    windows = CGWindowListCopyWindowInfo(
        kCGWindowListOptionOnScreenOnly, kCGNullWindowID
    )
    for window in windows:
        if window["kCGWindowOwnerPID"] == app_pid:
            window_title = window.get("kCGWindowName", "")
            if window_title:
                return app_name, window_title
    return app_name, ""  # 如果没有找到窗口标题，则返回空字符串作为标题
 def load_screen_sequences(base_dir, date):
    try:
        with open(os.path.join(base_dir, date, ".screen_sequences"), "r") as f:
            return json.load(f)
    except FileNotFoundError:
        return {}
 def save_screen_sequences(base_dir, screen_sequences, date):
    with open(os.path.join(base_dir, date, ".screen_sequences"), "w") as f:
        json.dump(screen_sequences, f)
        f.flush()
        os.fsync(f.fileno())
 def take_screenshot(
    base_dir, previous_hashes, threshold, screen_sequences, date, timestamp
 ):
    screenshots = []
    # 获取连接的显示器数量
    result = subprocess.check_output(["system_profiler", "SPDisplaysDataType", "-json"])
    displays_info = json.loads(result)["SPDisplaysDataType"][0]["spdisplays_ndrvs"]
    app_name, window_title = get_active_window_info()
    # 创建日期目录
    os.makedirs(os.path.join(base_dir, date), exist_ok=True)
    # 打开 worklog 文件
    worklog_path = os.path.join(base_dir, date, "worklog")
    with open(worklog_path, "a") as worklog:
        screen_names = {}
        for display_index, display_info in enumerate(displays_info):
            # 获取显示器基础名称
            base_screen_name = display_info["_name"].replace(" ", "_").lower()
            # 检查是否存在重复名称
            if base_screen_name in screen_names:
                screen_names[base_screen_name] += 1
                screen_name = f"{base_screen_name}_{screen_names[base_screen_name]}"
            else:
                screen_names[base_screen_name] = 1
                screen_name = base_screen_name
            # 生成临时 PNG 文件名
            temp_filename = os.path.join(
                os.path.join(base_dir, date),
                f"temp_screenshot-{timestamp}-of-{screen_name}.png",
            )
            # 使用 screencapture 命令进行截图，-D 选项指定显示器
            subprocess.run(
                ["screencapture", "-C", "-x", "-D", str(display_index + 1), temp_filename]
            )
            # 压缩图像为 WebP 并添加元数据
            with Image.open(temp_filename) as img:
                img = img.convert("RGB")
                webp_filename = os.path.join(
                    os.path.join(base_dir, date),
                    f"screenshot-{timestamp}-of-{screen_name}.webp",
                )
                # 计算当前截图的哈希值
                current_hash = str(imagehash.phash(img))
                # 检查当前截图与前一次截图的哈希值是否相似
                if (
                    screen_name in previous_hashes
                    and imagehash.hex_to_hash(current_hash) - imagehash.hex_to_hash(previous_hashes[screen_name]) < threshold
                ):
                    logging.info(f"Screenshot for {screen_name} is similar to the previous one. Skipping.")
                    os.remove(temp_filename)
                    # 记录跳过的截图
                    worklog.write(
                        f"{timestamp} - {screen_name} - Skipped (similar to previous)\n"
                    )
                    continue
                # 更新前一次截图的哈希值
                previous_hashes[screen_name] = current_hash
                # 更新序列号
                screen_sequences[screen_name] = screen_sequences.get(screen_name, 0) + 1
                # 准备元数据
                metadata = {
                    "timestamp": timestamp,
                    "active_app": app_name,
                    "active_window": window_title,
                    "screen_name": screen_name,
                    "sequence": screen_sequences[screen_name],  # 添加序列号到元数据
                }
                # 使用 write_image_metadata 函数写入元数据
                img.save(webp_filename, format="WebP", quality=85)
                write_image_metadata(webp_filename, metadata)
                save_screen_sequences(base_dir, screen_sequences, date)
            # 删除临时 PNG 文件
            os.remove(temp_filename)
            # 添加 WebP 文件到截图列表
            screenshots.append(webp_filename)
            # 记录成功的截图
            worklog.write(f"{timestamp} - {screen_name} - Saved\n")
    return screenshots
 def is_screen_locked():
    session_dict = CGSessionCopyCurrentDictionary()
    if session_dict:
        screen_locked = session_dict.get("CGSSessionScreenIsLocked", 0)
        return bool(screen_locked)
    return False
 def load_previous_hashes(base_dir):
    date = time.strftime("%Y%m%d")
    hash_file = os.path.join(base_dir, date, ".previous_hashes")
    try:
        with open(hash_file, "r") as f:
            return json.load(f)
    except FileNotFoundError:
        return {}
 def save_previous_hashes(base_dir, previous_hashes):
    date = time.strftime("%Y%m%d")
    hash_file = os.path.join(base_dir, date, ".previous_hashes")
    os.makedirs(os.path.dirname(hash_file), exist_ok=True)
    with open(hash_file, "w") as f:
        json.dump(previous_hashes, f)
 def run_screen_recorder_once(args, base_dir, previous_hashes):
    if not is_screen_locked():
        date = time.strftime("%Y%m%d")
@ -186,7 +30,6 @@ def run_screen_recorder_once(args, base_dir, previous_hashes):
    else:
        logging.info("Screen is locked. Skipping screenshot.")
 def run_screen_recorder(args, base_dir, previous_hashes):
    while True:
        try:
@ -206,7 +49,6 @@ def run_screen_recorder(args, base_dir, previous_hashes):
        time.sleep(5)
 def main():
    parser = argparse.ArgumentParser(description="Screen Recorder")
    parser.add_argument(
@ -231,6 +73,5 @@ def main():
                logging.error(f"Critical error occurred, program will restart in 10 seconds: {str(e)}")
                time.sleep(10)
 if __name__ == "__main__":
    main()