feat(screen-recorder): refactor

This commit is contained in:
arkohut 2024-09-02 00:03:20 +08:00
parent 2b2d616775
commit 63c302e017
5 changed files with 210 additions and 329 deletions

View File

@ -28,6 +28,12 @@ dependencies = [
"opencv-python", "opencv-python",
"pillow", "pillow",
"piexif", "piexif",
"imagehash",
"screeninfo",
"pywin32; sys_platform == 'win32'",
"psutil; sys_platform == 'win32'",
"pyobjc-framework-Quartz; sys_platform == 'darwin'",
"pyobjc-framework-AppKit; sys_platform == 'darwin'",
] ]
[project.urls] [project.urls]
@ -37,7 +43,7 @@ Homepage = "https://github.com/arkohut/memos"
memos = "memos.commands:app" memos = "memos.commands:app"
[tool.setuptools.packages.find] [tool.setuptools.packages.find]
include = ["memos*"] include = ["memos*", "screen_recorder*"]
[tool.setuptools.package-data] [tool.setuptools.package-data]
"*" = ["static/**/*"] "*" = ["static/**/*"]

193
screen_recorder/common.py Normal file
View File

@ -0,0 +1,193 @@
import json
import os
import time
import logging
import platform
import subprocess
from PIL import Image, ImageGrab
import imagehash
from memos.utils import write_image_metadata
from screeninfo import get_monitors
import ctypes
if platform.system() == "Windows":
import win32gui
import win32process
import psutil
elif platform.system() == "Darwin":
from AppKit import NSWorkspace
from Quartz import (
CGWindowListCopyWindowInfo,
kCGWindowListOptionOnScreenOnly,
kCGNullWindowID,
CGSessionCopyCurrentDictionary,
)
def load_screen_sequences(base_dir, date):
try:
with open(os.path.join(base_dir, date, ".screen_sequences"), "r") as f:
return json.load(f)
except FileNotFoundError:
return {}
def save_screen_sequences(base_dir, screen_sequences, date):
with open(os.path.join(base_dir, date, ".screen_sequences"), "w") as f:
json.dump(screen_sequences, f)
f.flush()
os.fsync(f.fileno())
def load_previous_hashes(base_dir):
date = time.strftime("%Y%m%d")
hash_file = os.path.join(base_dir, date, ".previous_hashes")
try:
with open(hash_file, "r") as f:
return json.load(f)
except FileNotFoundError:
return {}
def save_previous_hashes(base_dir, previous_hashes):
date = time.strftime("%Y%m%d")
hash_file = os.path.join(base_dir, date, ".previous_hashes")
os.makedirs(os.path.dirname(hash_file), exist_ok=True)
with open(hash_file, "w") as f:
json.dump(previous_hashes, f)
def get_active_window_info():
if platform.system() == "Darwin":
active_app = NSWorkspace.sharedWorkspace().activeApplication()
app_name = active_app["NSApplicationName"]
app_pid = active_app["NSApplicationProcessIdentifier"]
windows = CGWindowListCopyWindowInfo(
kCGWindowListOptionOnScreenOnly, kCGNullWindowID
)
for window in windows:
if window["kCGWindowOwnerPID"] == app_pid:
window_title = window.get("kCGWindowName", "")
if window_title:
return app_name, window_title
return app_name, "" # 如果没有找到窗口标题,则返回空字符串作为标题
elif platform.system() == "Windows":
try:
window = win32gui.GetForegroundWindow()
_, pid = win32process.GetWindowThreadProcessId(window)
app_name = psutil.Process(pid).name()
window_title = win32gui.GetWindowText(window)
return app_name, window_title
except:
return "", ""
def take_screenshot_macos(base_dir, previous_hashes, threshold, screen_sequences, date, timestamp, app_name, window_title):
screenshots = []
result = subprocess.check_output(["system_profiler", "SPDisplaysDataType", "-json"])
displays_info = json.loads(result)["SPDisplaysDataType"][0]["spdisplays_ndrvs"]
screen_names = {}
for display_index, display_info in enumerate(displays_info):
base_screen_name = display_info["_name"].replace(" ", "_").lower()
if base_screen_name in screen_names:
screen_names[base_screen_name] += 1
screen_name = f"{base_screen_name}_{screen_names[base_screen_name]}"
else:
screen_names[base_screen_name] = 1
screen_name = base_screen_name
temp_filename = os.path.join(base_dir, date, f"temp_screenshot-{timestamp}-of-{screen_name}.png")
subprocess.run(["screencapture", "-C", "-x", "-D", str(display_index + 1), temp_filename])
with Image.open(temp_filename) as img:
img = img.convert("RGB")
webp_filename = os.path.join(base_dir, date, f"screenshot-{timestamp}-of-{screen_name}.webp")
current_hash = str(imagehash.phash(img))
if (screen_name in previous_hashes and
imagehash.hex_to_hash(current_hash) - imagehash.hex_to_hash(previous_hashes[screen_name]) < threshold):
logging.info(f"Screenshot for {screen_name} is similar to the previous one. Skipping.")
os.remove(temp_filename)
yield screen_name, None, "Skipped (similar to previous)"
continue
previous_hashes[screen_name] = current_hash
screen_sequences[screen_name] = screen_sequences.get(screen_name, 0) + 1
metadata = {
"timestamp": timestamp,
"active_app": app_name,
"active_window": window_title,
"screen_name": screen_name,
"sequence": screen_sequences[screen_name],
}
img.save(webp_filename, format="WebP", quality=85)
write_image_metadata(webp_filename, metadata)
save_screen_sequences(base_dir, screen_sequences, date)
os.remove(temp_filename)
screenshots.append(webp_filename)
yield screen_name, webp_filename, "Saved"
def take_screenshot_windows(base_dir, previous_hashes, threshold, screen_sequences, date, timestamp, app_name, window_title):
for monitor in get_monitors():
safe_monitor_name = ''.join(c for c in monitor.name if c.isalnum() or c in ('_', '-'))
logging.info(f"Processing monitor: {safe_monitor_name}")
webp_filename = os.path.join(base_dir, date, f"screenshot-{timestamp}-of-{safe_monitor_name}.webp")
img = ImageGrab.grab(bbox=(monitor.x, monitor.y, monitor.x + monitor.width, monitor.y + monitor.height))
img = img.convert("RGB")
current_hash = str(imagehash.phash(img))
if safe_monitor_name in previous_hashes and imagehash.hex_to_hash(current_hash) - imagehash.hex_to_hash(previous_hashes[safe_monitor_name]) < threshold:
logging.info(f"Screenshot for {safe_monitor_name} is similar to the previous one. Skipping.")
yield safe_monitor_name, None, "Skipped (similar to previous)"
continue
previous_hashes[safe_monitor_name] = current_hash
screen_sequences[safe_monitor_name] = screen_sequences.get(safe_monitor_name, 0) + 1
metadata = {
"timestamp": timestamp,
"active_app": app_name,
"active_window": window_title,
"screen_name": safe_monitor_name,
"sequence": screen_sequences[safe_monitor_name],
}
img.save(webp_filename, format="WebP", quality=85)
write_image_metadata(webp_filename, metadata)
save_screen_sequences(base_dir, screen_sequences, date)
yield safe_monitor_name, webp_filename, "Saved"
def take_screenshot(base_dir, previous_hashes, threshold, screen_sequences, date, timestamp):
app_name, window_title = get_active_window_info()
os.makedirs(os.path.join(base_dir, date), exist_ok=True)
worklog_path = os.path.join(base_dir, date, "worklog")
with open(worklog_path, "a") as worklog:
if platform.system() == "Darwin":
screenshot_generator = take_screenshot_macos(base_dir, previous_hashes, threshold, screen_sequences, date, timestamp, app_name, window_title)
elif platform.system() == "Windows":
screenshot_generator = take_screenshot_windows(base_dir, previous_hashes, threshold, screen_sequences, date, timestamp, app_name, window_title)
else:
raise NotImplementedError(f"Unsupported operating system: {platform.system()}")
screenshots = []
for screen_name, screenshot_file, status in screenshot_generator:
worklog.write(f"{timestamp} - {screen_name} - {status}\n")
if screenshot_file:
screenshots.append(screenshot_file)
return screenshots
def is_screen_locked():
if platform.system() == "Darwin":
session_dict = CGSessionCopyCurrentDictionary()
if session_dict:
screen_locked = session_dict.get("CGSSessionScreenIsLocked", 0)
return bool(screen_locked)
return False
elif platform.system() == "Windows":
user32 = ctypes.windll.User32
return user32.GetForegroundWindow() == 0

View File

@ -1,6 +1,6 @@
@echo off @echo off
call C:\Users\arkoh\miniconda3\Scripts\activate.bat memos call C:\Users\arkoh\miniconda3\Scripts\activate.bat memos
:loop :loop
python -m screen_recorder.record-for-win --once python -m screen_recorder.record --once
timeout /t 5 /nobreak >nul timeout /t 5 /nobreak >nul
goto loop goto loop

View File

@ -1,159 +0,0 @@
import logging
import time
import os
import json
import argparse
import imagehash
from PIL import ImageGrab, Image
import win32gui
import win32process
import psutil
from memos.utils import write_image_metadata
import ctypes
from screeninfo import get_monitors
logging.basicConfig(level=logging.INFO, format='%(asctime)s - %(levelname)s - %(message)s')
def get_active_window_info():
try:
window = win32gui.GetForegroundWindow()
_, pid = win32process.GetWindowThreadProcessId(window)
app_name = psutil.Process(pid).name()
window_title = win32gui.GetWindowText(window)
return app_name, window_title
except:
return "", ""
def load_screen_sequences(base_dir, date):
try:
with open(os.path.join(base_dir, date, ".screen_sequences"), "r") as f:
return json.load(f)
except FileNotFoundError:
return {}
def save_screen_sequences(base_dir, screen_sequences, date):
with open(os.path.join(base_dir, date, ".screen_sequences"), "w") as f:
json.dump(screen_sequences, f)
f.flush()
os.fsync(f.fileno())
def take_screenshot(base_dir, previous_hashes, threshold, screen_sequences, date, timestamp):
screenshots = []
app_name, window_title = get_active_window_info()
os.makedirs(os.path.join(base_dir, date), exist_ok=True)
worklog_path = os.path.join(base_dir, date, "worklog")
with open(worklog_path, "a") as worklog:
for monitor in get_monitors():
safe_monitor_name = ''.join(c for c in monitor.name if c.isalnum() or c in ('_', '-'))
logging.info(f"Processing monitor: {safe_monitor_name}")
webp_filename = os.path.join(base_dir, date, f"screenshot-{timestamp}-of-{safe_monitor_name}.webp")
img = ImageGrab.grab(bbox=(monitor.x, monitor.y, monitor.x + monitor.width, monitor.y + monitor.height))
img = img.convert("RGB")
current_hash = str(imagehash.phash(img))
if safe_monitor_name in previous_hashes and imagehash.hex_to_hash(current_hash) - imagehash.hex_to_hash(previous_hashes[safe_monitor_name]) < threshold:
logging.info(f"Screenshot for {safe_monitor_name} is similar to the previous one. Skipping.")
worklog.write(f"{timestamp} - {safe_monitor_name} - Skipped (similar to previous)\n")
continue
previous_hashes[safe_monitor_name] = current_hash
screen_sequences[safe_monitor_name] = screen_sequences.get(safe_monitor_name, 0) + 1
metadata = {
"timestamp": timestamp,
"active_app": app_name,
"active_window": window_title,
"screen_name": safe_monitor_name,
"sequence": screen_sequences[safe_monitor_name],
}
img.save(webp_filename, format="WebP", quality=85)
write_image_metadata(webp_filename, metadata)
save_screen_sequences(base_dir, screen_sequences, date)
screenshots.append(webp_filename)
worklog.write(f"{timestamp} - {safe_monitor_name} - Saved\n")
return screenshots
def is_screen_locked():
user32 = ctypes.windll.User32
return user32.GetForegroundWindow() == 0
def load_previous_hashes(base_dir):
date = time.strftime("%Y%m%d")
hash_file = os.path.join(base_dir, date, ".previous_hashes")
try:
with open(hash_file, "r") as f:
return json.load(f)
except FileNotFoundError:
return {}
def save_previous_hashes(base_dir, previous_hashes):
date = time.strftime("%Y%m%d")
hash_file = os.path.join(base_dir, date, ".previous_hashes")
os.makedirs(os.path.dirname(hash_file), exist_ok=True)
with open(hash_file, "w") as f:
json.dump(previous_hashes, f)
def run_screen_recorder_once(args, base_dir, previous_hashes):
if not is_screen_locked():
date = time.strftime("%Y%m%d")
timestamp = time.strftime("%Y%m%d-%H%M%S")
screen_sequences = load_screen_sequences(base_dir, date)
screenshot_files = take_screenshot(
base_dir, previous_hashes, args.threshold, screen_sequences, date, timestamp
)
for screenshot_file in screenshot_files:
logging.info(f"Screenshot saved: {screenshot_file}")
save_previous_hashes(base_dir, previous_hashes)
else:
logging.info("Screen is locked. Skipping screenshot.")
def run_screen_recorder(args, base_dir, previous_hashes):
while True:
try:
if not is_screen_locked():
date = time.strftime("%Y%m%d")
timestamp = time.strftime("%Y%m%d-%H%M%S")
screen_sequences = load_screen_sequences(base_dir, date)
screenshot_files = take_screenshot(
base_dir, previous_hashes, args.threshold, screen_sequences, date, timestamp
)
for screenshot_file in screenshot_files:
logging.info(f"Screenshot saved: {screenshot_file}")
else:
logging.info("Screen is locked. Skipping screenshot.")
except Exception as e:
logging.error(f"An error occurred: {str(e)}. Skipping this iteration.")
time.sleep(5)
def main():
parser = argparse.ArgumentParser(description="Screen Recorder for Windows")
parser.add_argument("--threshold", type=int, default=4, help="Threshold for image similarity")
parser.add_argument("--base-dir", type=str, default="~/tmp", help="Base directory for screenshots")
parser.add_argument("--once", action="store_true", help="Run once and exit")
args = parser.parse_args()
base_dir = os.path.expanduser(args.base_dir)
previous_hashes = load_previous_hashes(base_dir)
if args.once:
run_screen_recorder_once(args, base_dir, previous_hashes)
else:
while True:
try:
run_screen_recorder(args, base_dir, previous_hashes)
except Exception as e:
logging.error(f"Critical error occurred, program will restart in 10 seconds: {str(e)}")
time.sleep(10)
if __name__ == "__main__":
main()

View File

@ -1,177 +1,21 @@
import logging import logging
import time import time
import subprocess
from AppKit import NSWorkspace
from PIL import Image
import os import os
from Quartz import (
CGWindowListCopyWindowInfo,
kCGWindowListOptionOnScreenOnly,
kCGNullWindowID,
CGSessionCopyCurrentDictionary,
)
import json import json
import imagehash
import argparse import argparse
from memos.utils import write_image_metadata import platform
from screen_recorder.common import (
load_screen_sequences,
save_screen_sequences,
load_previous_hashes,
save_previous_hashes,
take_screenshot,
is_screen_locked,
)
# 在文件开头添加日志配置 # 在文件开头添加日志配置
logging.basicConfig(level=logging.INFO, format='%(asctime)s - %(levelname)s - %(message)s') logging.basicConfig(level=logging.INFO, format='%(asctime)s - %(levelname)s - %(message)s')
def get_active_window_info():
active_app = NSWorkspace.sharedWorkspace().activeApplication()
app_name = active_app["NSApplicationName"]
app_pid = active_app["NSApplicationProcessIdentifier"]
windows = CGWindowListCopyWindowInfo(
kCGWindowListOptionOnScreenOnly, kCGNullWindowID
)
for window in windows:
if window["kCGWindowOwnerPID"] == app_pid:
window_title = window.get("kCGWindowName", "")
if window_title:
return app_name, window_title
return app_name, "" # 如果没有找到窗口标题,则返回空字符串作为标题
def load_screen_sequences(base_dir, date):
try:
with open(os.path.join(base_dir, date, ".screen_sequences"), "r") as f:
return json.load(f)
except FileNotFoundError:
return {}
def save_screen_sequences(base_dir, screen_sequences, date):
with open(os.path.join(base_dir, date, ".screen_sequences"), "w") as f:
json.dump(screen_sequences, f)
f.flush()
os.fsync(f.fileno())
def take_screenshot(
base_dir, previous_hashes, threshold, screen_sequences, date, timestamp
):
screenshots = []
# 获取连接的显示器数量
result = subprocess.check_output(["system_profiler", "SPDisplaysDataType", "-json"])
displays_info = json.loads(result)["SPDisplaysDataType"][0]["spdisplays_ndrvs"]
app_name, window_title = get_active_window_info()
# 创建日期目录
os.makedirs(os.path.join(base_dir, date), exist_ok=True)
# 打开 worklog 文件
worklog_path = os.path.join(base_dir, date, "worklog")
with open(worklog_path, "a") as worklog:
screen_names = {}
for display_index, display_info in enumerate(displays_info):
# 获取显示器基础名称
base_screen_name = display_info["_name"].replace(" ", "_").lower()
# 检查是否存在重复名称
if base_screen_name in screen_names:
screen_names[base_screen_name] += 1
screen_name = f"{base_screen_name}_{screen_names[base_screen_name]}"
else:
screen_names[base_screen_name] = 1
screen_name = base_screen_name
# 生成临时 PNG 文件名
temp_filename = os.path.join(
os.path.join(base_dir, date),
f"temp_screenshot-{timestamp}-of-{screen_name}.png",
)
# 使用 screencapture 命令进行截图,-D 选项指定显示器
subprocess.run(
["screencapture", "-C", "-x", "-D", str(display_index + 1), temp_filename]
)
# 压缩图像为 WebP 并添加元数据
with Image.open(temp_filename) as img:
img = img.convert("RGB")
webp_filename = os.path.join(
os.path.join(base_dir, date),
f"screenshot-{timestamp}-of-{screen_name}.webp",
)
# 计算当前截图的哈希值
current_hash = str(imagehash.phash(img))
# 检查当前截图与前一次截图的哈希值是否相似
if (
screen_name in previous_hashes
and imagehash.hex_to_hash(current_hash) - imagehash.hex_to_hash(previous_hashes[screen_name]) < threshold
):
logging.info(f"Screenshot for {screen_name} is similar to the previous one. Skipping.")
os.remove(temp_filename)
# 记录跳过的截图
worklog.write(
f"{timestamp} - {screen_name} - Skipped (similar to previous)\n"
)
continue
# 更新前一次截图的哈希值
previous_hashes[screen_name] = current_hash
# 更新序列号
screen_sequences[screen_name] = screen_sequences.get(screen_name, 0) + 1
# 准备元数据
metadata = {
"timestamp": timestamp,
"active_app": app_name,
"active_window": window_title,
"screen_name": screen_name,
"sequence": screen_sequences[screen_name], # 添加序列号到元数据
}
# 使用 write_image_metadata 函数写入元数据
img.save(webp_filename, format="WebP", quality=85)
write_image_metadata(webp_filename, metadata)
save_screen_sequences(base_dir, screen_sequences, date)
# 删除临时 PNG 文件
os.remove(temp_filename)
# 添加 WebP 文件到截图列表
screenshots.append(webp_filename)
# 记录成功的截图
worklog.write(f"{timestamp} - {screen_name} - Saved\n")
return screenshots
def is_screen_locked():
session_dict = CGSessionCopyCurrentDictionary()
if session_dict:
screen_locked = session_dict.get("CGSSessionScreenIsLocked", 0)
return bool(screen_locked)
return False
def load_previous_hashes(base_dir):
date = time.strftime("%Y%m%d")
hash_file = os.path.join(base_dir, date, ".previous_hashes")
try:
with open(hash_file, "r") as f:
return json.load(f)
except FileNotFoundError:
return {}
def save_previous_hashes(base_dir, previous_hashes):
date = time.strftime("%Y%m%d")
hash_file = os.path.join(base_dir, date, ".previous_hashes")
os.makedirs(os.path.dirname(hash_file), exist_ok=True)
with open(hash_file, "w") as f:
json.dump(previous_hashes, f)
def run_screen_recorder_once(args, base_dir, previous_hashes): def run_screen_recorder_once(args, base_dir, previous_hashes):
if not is_screen_locked(): if not is_screen_locked():
date = time.strftime("%Y%m%d") date = time.strftime("%Y%m%d")
@ -186,7 +30,6 @@ def run_screen_recorder_once(args, base_dir, previous_hashes):
else: else:
logging.info("Screen is locked. Skipping screenshot.") logging.info("Screen is locked. Skipping screenshot.")
def run_screen_recorder(args, base_dir, previous_hashes): def run_screen_recorder(args, base_dir, previous_hashes):
while True: while True:
try: try:
@ -206,7 +49,6 @@ def run_screen_recorder(args, base_dir, previous_hashes):
time.sleep(5) time.sleep(5)
def main(): def main():
parser = argparse.ArgumentParser(description="Screen Recorder") parser = argparse.ArgumentParser(description="Screen Recorder")
parser.add_argument( parser.add_argument(
@ -231,6 +73,5 @@ def main():
logging.error(f"Critical error occurred, program will restart in 10 seconds: {str(e)}") logging.error(f"Critical error occurred, program will restart in 10 seconds: {str(e)}")
time.sleep(10) time.sleep(10)
if __name__ == "__main__": if __name__ == "__main__":
main() main()