first commit

This commit is contained in:
Dr Marc 2025-09-25 12:49:25 +02:00
commit 4767d7b95d
7 changed files with 268 additions and 0 deletions

138
src/browser_window.py Normal file
View file

@ -0,0 +1,138 @@
# src/browser_window.py
from PySide6.QtWidgets import (
QMainWindow, QToolBar, QMenu, QMessageBox, QFileDialog, QInputDialog
)
from PySide6.QtGui import QAction
from PySide6.QtWebEngineWidgets import QWebEngineView
from PySide6.QtWebEngineCore import QWebEngineContextMenuRequest
from PySide6.QtCore import QUrl, Qt
from pathlib import Path
import io
from .db import init_db, save_page, save_screenshot, save_tag, save_event
class BrowserWindow(QMainWindow):
def __init__(self):
super().__init__()
self.setWindowTitle("LawEnforcement Web Scraper")
self.resize(1200, 800)
# ---- Web view ------------------------------------------------
self.view = QWebEngineView()
self.setCentralWidget(self.view)
# ---- Toolbar -------------------------------------------------
toolbar = QToolBar()
self.addToolBar(toolbar)
back_act = QAction("", self)
back_act.triggered.connect(self.view.back)
toolbar.addAction(back_act)
forward_act = QAction("", self)
forward_act.triggered.connect(self.view.forward)
toolbar.addAction(forward_act)
reload_act = QAction("", self)
reload_act.triggered.connect(self.view.reload)
toolbar.addAction(reload_act)
capture_act = QAction("📸 Capture", self)
capture_act.triggered.connect(self.capture_screenshot)
toolbar.addAction(capture_act)
# ---- Signals -------------------------------------------------
self.view.urlChanged.connect(self.on_url_changed)
self.view.loadFinished.connect(self.on_load_finished)
self.view.page().profile().downloadRequested.connect(self.on_download_requested)
# Contextmenu handling for image tagging
self.view.setContextMenuPolicy(Qt.ContextMenuPolicy.CustomContextMenu)
self.view.customContextMenuRequested.connect(self.show_context_menu)
# Initialise DB and state variables
init_db()
self.current_page_id = None
self.pending_url = ""
# ------------------------------------------------------------------
def on_url_changed(self, url: QUrl):
"""Remember the URL; HTML will be saved once the page finishes loading."""
self.pending_url = url.toString()
def on_load_finished(self, ok: bool):
if not ok:
QMessageBox.warning(self, "Load error", f"Failed to load {self.pending_url}")
return
# Grab the HTML source and persist it
self.view.page().toHtml(lambda html: self._store_page(html))
def _store_page(self, html: str):
# Save page record and keep its id for later screenshots/events
self.current_page_id = save_page(self.pending_url, html)
# Optional: automatically take a screenshot on load
# self.capture_screenshot()
# ------------------------------------------------------------------
def capture_screenshot(self):
if self.current_page_id is None:
QMessageBox.information(self, "Info", "No page loaded yet.")
return
def handle_pixmap(pix):
buffer = io.BytesIO()
pix.save(buffer, "PNG")
png_data = buffer.getvalue()
if self.current_page_id:
screenshot_id = save_screenshot(self.current_page_id, png_data)
self.prompt_tag(screenshot_id)
# grab() returns a QPixmap wrapped in a QFuture use then() callback
self.view.grab().then(handle_pixmap)
# ------------------------------------------------------------------
def show_context_menu(self, pos):
ctx: QWebEngineContextMenuRequest = self.view.page().contextMenuData()
if ctx.mediaType() == QWebEngineContextMenuRequest.MediaTypeImage:
menu = QMenu(self)
tag_act = QAction("Add tag to image", self)
tag_act.triggered.connect(lambda: self.tag_image(ctx))
menu.addAction(tag_act)
menu.exec_(self.view.mapToGlobal(pos))
def tag_image(self, ctx: QWebEngineContextMenuRequest):
# Download the image data, then store it as a screenshot for tagging
img_url = ctx.mediaUrl().toString()
# Use the download API to fetch the image bytes
profile = self.view.page().profile()
profile.downloadRequested.connect(
lambda req: self._handle_image_download(req, img_url)
)
# Trigger a temporary download request via JS (creates the request)
self.view.page().runJavaScript(f'new Image().src="{img_url}";')
def _handle_image_download(self, request, expected_url):
# Accept the request; when finished we can read its data
request.accept()
request.finished.connect(lambda: self._store_image_tag(request, expected_url))
def _store_image_tag(self, request, url):
# request.reply() is a QIODevice; read all bytes
data = request.reply().readAll().data()
screenshot_id = save_screenshot(self.current_page_id, data)
self.prompt_tag(screenshot_id)
def prompt_tag(self, screenshot_id: int):
tag, ok = QInputDialog.getText(self, "Tag image", "Enter tag:")
if ok and tag.strip():
save_tag(screenshot_id, tag.strip())
QMessageBox.information(self, "Tagged", f"Tag saved: {tag}")
# ------------------------------------------------------------------
def on_download_requested(self, request):
# For nonimage files you might want to let the user choose a location.
default_path = QFileDialog.getSaveFileName(self, "Save file", request.suggestedFileName())[0]
if default_path:
request.setDownloadFileName(Path(default_path).name)
request.accept()