Compare commits
23 Commits
922d0499fc
...
0.1
| Author | SHA1 | Date | |
|---|---|---|---|
| 78d9fab189 | |||
| a6deeeaebf | |||
| 5fc7bfafad | |||
| 7cd45f497a | |||
| f40a7911ca | |||
| 57ad6c71f8 | |||
| f4475ef1d4 | |||
| 5add445949 | |||
| 987bdb2b63 | |||
| 2b29a1c662 | |||
| 697fe2548c | |||
| 770966e21f | |||
|
|
abb59aabe3 | ||
| 8adc374408 | |||
| 1b2fee9b8d | |||
|
|
1f9997b430 | ||
| 6c096e4300 | |||
| e94d96f153 | |||
| 86e0bc8e51 | |||
| 5126a985bf | |||
| f7369e29f2 | |||
|
|
b6fc78e038 | ||
| 96c75ea0cc |
7
config/application.yml
Normal file
7
config/application.yml
Normal file
@@ -0,0 +1,7 @@
|
||||
path: data/odkazy.xlsx
|
||||
|
||||
screenshotter:
|
||||
target_path: data/screenshots/
|
||||
|
||||
resolver:
|
||||
api_key: 733f6882605be2de8980bbd074091ee4  # NOTE(review): secret committed to the repo — rotate this key and load it from an environment variable instead
|
||||
88
data/extract_to_excel.py
Normal file
88
data/extract_to_excel.py
Normal file
@@ -0,0 +1,88 @@
|
||||
import os
|
||||
import re
|
||||
import sys
|
||||
import argparse
|
||||
from datetime import datetime
|
||||
import pytz
|
||||
from openpyxl import Workbook
|
||||
|
||||
|
||||
def process_files(starting_id, output_filename="output.xlsx"):
    """Collect URL/date pairs from all .txt files in the current directory
    into a single Excel workbook.

    Each text file is scanned for timestamps like "[<month> <day>, <year> at
    <HH:MM>]" and for URLs; the i-th timestamp is paired with the i-th URL.
    Timestamps are interpreted as Europe/Prague local time and written out as
    ISO 8601 UTC ("YYYY-MM-DDTHH:MM:SSZ"). Source files are deleted only
    after the workbook has been saved successfully.

    Args:
        starting_id: first ID to assign; subsequent rows increment by one.
        output_filename: path of the Excel file to create.
    """
    # Find all txt files in the current directory
    txt_files = [f for f in os.listdir('.') if f.endswith('.txt')]

    if not txt_files:
        print("No .txt files found in the current directory.")
        return

    # Regex patterns for input data: "[... <m> <d>, <yyyy> at <h:mm>]" and URLs
    date_pattern = re.compile(r'\[.*?(\d{1,2})\s+(\d{1,2}),\s+(\d{4})\s+at\s+(\d{1,2}:\d{2})\]')
    url_pattern = re.compile(r'(https?://[^\s]+)')

    # Timezone setup (CET to UTC)
    local_tz = pytz.timezone("Europe/Prague")

    # Set up the Excel Workbook
    wb = Workbook()
    ws = wb.active
    ws.title = "Fortuna Data"
    ws.append(["ID", "URL", "Date_UTC"])  # Add headers

    current_id = starting_id
    success_files = []

    for filename in txt_files:
        try:
            with open(filename, 'r', encoding='utf-8') as f:
                content = f.read()

            dates = date_pattern.findall(content)
            urls = url_pattern.findall(content)

            # Pair the i-th date with the i-th URL; surplus entries are dropped
            for i in range(min(len(dates), len(urls))):
                month, day, year, time_str = dates[i]

                # Parse the datetime from the text file
                dt_str = f"{year}-{month}-{day} {time_str}"
                local_dt = datetime.strptime(dt_str, "%Y-%m-%d %H:%M")

                # Convert CET to UTC (localize accounts for DST)
                localized_dt = local_tz.localize(local_dt)
                utc_dt = localized_dt.astimezone(pytz.utc)

                # Format to ISO 8601 with T and Z
                formatted_date = utc_dt.strftime("%Y-%m-%dT%H:%M:%SZ")

                # Add a new row to the Excel sheet
                ws.append([current_id, urls[i], formatted_date])
                current_id += 1

            # Queue file for deletion
            success_files.append(filename)

        except Exception as e:
            # BUG FIX: the message previously printed "(unknown)" instead of
            # naming the file that failed
            print(f"Error processing {filename}: {e}", file=sys.stderr)

    # Save the Excel file
    try:
        wb.save(output_filename)
        print(f"Successfully saved data to {output_filename}")

        # Clean up only if save was successful
        for filename in success_files:
            os.remove(filename)
            # BUG FIX: report which file was deleted instead of a placeholder
            print(f"Deleted: {filename}")

    except Exception as e:
        print(f"Failed to save {output_filename}. No text files were deleted. Error: {e}", file=sys.stderr)
|
||||
if __name__ == "__main__":
    # Command-line entry point: <start_id> [--output FILE]
    arg_parser = argparse.ArgumentParser(
        description="Extract URLs to an Excel file with ISO UTC dates."
    )
    arg_parser.add_argument("start_id", type=int, help="Starting ID for the output")
    arg_parser.add_argument(
        "--output",
        type=str,
        default="extracted_data.xlsx",
        help="Output Excel filename (default: extracted_data.xlsx)",
    )
    cli = arg_parser.parse_args()
    process_files(cli.start_id, cli.output)
@@ -4,19 +4,24 @@ build-backend = "setuptools.build_meta"
|
||||
|
||||
[project]
|
||||
name = "beaky"
|
||||
version = "0.0.1"
|
||||
version = "0.1.0"
|
||||
description = "Scan tickets and decide"
|
||||
requires-python = ">=3.12"
|
||||
dependencies = [
|
||||
"pillow==12.1.1",
|
||||
"pydantic==2.12.5",
|
||||
"pandas==3.0.1",
|
||||
"openpyxl>=3.1.0",
|
||||
"PyYaml==6.0.3",
|
||||
"playwright==1.58.0",
|
||||
"requests>=2.32.0"
|
||||
]
|
||||
|
||||
[project.optional-dependencies]
|
||||
dev = [
|
||||
"pytest>=9.0.2",
|
||||
"ruff==0.15.5",
|
||||
"pytz"
|
||||
# "playwright==1.58.0" # only dev because it cant be installed in a pipeline, just locally
|
||||
]
|
||||
|
||||
|
||||
@@ -1,28 +1,89 @@
|
||||
import argparse
|
||||
|
||||
import yaml
|
||||
from pydantic import ValidationError
|
||||
|
||||
from beaky.config import Config
|
||||
from beaky.scanner.scanner import Links
|
||||
from beaky.screenshotter.screenshotter import Screenshotter
|
||||
from beaky.link_classifier.classifier import LinkClassifier
|
||||
from beaky.resolvers.resolver import TicketResolver
|
||||
from beaky.resolvers.resolver import TicketVerdict, _R, _B, _GREEN, _RED, _YELLOW, _GRAY
|
||||
|
||||
_VERDICT_COLOR = {
|
||||
TicketVerdict.TRUTHFUL: _GREEN,
|
||||
TicketVerdict.NOT_TRUTHFUL: _RED,
|
||||
TicketVerdict.POSSIBLY_TRUTHFUL: _YELLOW,
|
||||
TicketVerdict.UNKNOWN: _GRAY,
|
||||
}
|
||||
|
||||
def load_config(path: str) -> Config | None:
    """Load and validate the YAML configuration file at *path*.

    Returns the validated Config, or None (after printing the validation
    error) when the file's contents do not match the Config schema.
    """
    with open(path) as handle:
        raw = yaml.safe_load(handle)
    try:
        config = Config(**raw)
    except ValidationError as err:
        print("Bad config")
        print(err)
        return None
    return config
|
||||
def main() -> None:
|
||||
parser = argparse.ArgumentParser(
|
||||
prog="beaky"
|
||||
)
|
||||
parser.add_argument("path", help="Path to config file.")
|
||||
args = parser.parse_args()
|
||||
parser = argparse.ArgumentParser(prog="beaky")
|
||||
parser.add_argument("--config", help="Path to config file.", default="config/application.yml")
|
||||
parser.add_argument("--id", type=int, help="Resolve a single ticket by id (only used with resolve mode).")
|
||||
parser.add_argument("mode", choices=["screenshotter", "parser", "class", "resolve"], help="Mode of operation.")
|
||||
|
||||
try:
|
||||
config = Config(**vars(args))
|
||||
except ValidationError as e:
|
||||
print("Bad arguments")
|
||||
print(e)
|
||||
args = parser.parse_args()
|
||||
config = load_config(args.config)
|
||||
if config is None:
|
||||
return
|
||||
|
||||
data = Links(config.path)
|
||||
# always load testing data, we will modify that later
|
||||
data = Links(config)
|
||||
data.ret_links()
|
||||
for link in data:
|
||||
print(link)
|
||||
link_amount = len(data.links)
|
||||
print(f"We found {link_amount} links")
|
||||
if link_amount == 0:
|
||||
print("ERROR, no links found")
|
||||
return
|
||||
|
||||
if args.mode == "screenshotter":
|
||||
screenshotter = Screenshotter(config)
|
||||
screenshotter.capture_tickets(data.links)
|
||||
|
||||
if args.mode == "parser":
|
||||
for link in data.links:
|
||||
print(link)
|
||||
|
||||
if args.mode == "class":
|
||||
classifier = LinkClassifier()
|
||||
results = []
|
||||
for link in data.links:
|
||||
results.append(classifier.classify(link))
|
||||
ticket = results[-1]
|
||||
print(f"\n=== Link {ticket.id} ({len(ticket.bets)} bets) ===")
|
||||
for bet in ticket.bets:
|
||||
print(f" [{type(bet).__name__}]")
|
||||
for k, v in vars(bet).items():
|
||||
print(f" {k}: {v}")
|
||||
|
||||
if args.mode == "resolve":
|
||||
classifier = LinkClassifier()
|
||||
resolver = TicketResolver(config.resolver)
|
||||
links = [l for l in data.links if l.id == args.id] if args.id is not None else data.links
|
||||
if args.id is not None and not links:
|
||||
print(f"ERROR: ticket id {args.id} not found")
|
||||
return
|
||||
for link in links:
|
||||
print(f"\n=== Classifying ticket {link.id} ===")
|
||||
ticket = classifier.classify(link)
|
||||
for bet in ticket.bets:
|
||||
print(f" [{type(bet).__name__}] {bet.team1Name} vs {bet.team2Name} | {bet.date.date()} | {bet.league}")
|
||||
|
||||
print(f"\n--- Resolving ticket {link.id} ---")
|
||||
resolved = resolver.resolve(ticket)
|
||||
color = _VERDICT_COLOR.get(resolved.verdict, "")
|
||||
print(f"\n {color}{_B}VERDICT: {resolved.verdict.value.upper()}{_R}")
|
||||
|
||||
if __name__ == "__main__":
|
||||
main()
|
||||
|
||||
@@ -1,6 +1,11 @@
|
||||
from pydantic.dataclasses import dataclass
|
||||
|
||||
from beaky.resolvers.config import ResolverConfig
|
||||
from beaky.screenshotter.config import ScreenshotterConfig
|
||||
|
||||
|
||||
@dataclass
|
||||
class Config:
|
||||
path: str
|
||||
screenshotter: ScreenshotterConfig
|
||||
resolver: ResolverConfig
|
||||
@@ -1,9 +0,0 @@
|
||||
from pydantic.dataclasses import dataclass
|
||||
from datetime import datetime
|
||||
|
||||
@dataclass
|
||||
class Scan:
|
||||
id: int
|
||||
date: datetime
|
||||
event_name: str
|
||||
|
||||
@@ -1,21 +1,91 @@
|
||||
from abc import ABC
|
||||
from abc import ABC, abstractmethod
|
||||
from datetime import datetime
|
||||
from enum import Enum
|
||||
from typing import Literal
|
||||
|
||||
from pydantic.dataclasses import dataclass
|
||||
from typing import Callable
|
||||
|
||||
|
||||
class TicketType(str, Enum):
|
||||
class BetType(str, Enum):
|
||||
WIN_DRAW_LOSE = "win_draw_lose"
|
||||
# postup?
|
||||
ADVANCED = "advance"
|
||||
WIN_DRAW_LOSE_DOUBLE = "win_draw_lose_double"
|
||||
WIN_LOSE = "win_lose"
|
||||
BOTH_TEAM_SCORED = "both_team_scored"
|
||||
GOAL_AMOUNT = "goal_amount"
|
||||
GOAL_HANDICAP = "goal_handicap"
|
||||
UNKNOWN = "unknown"
|
||||
...
|
||||
|
||||
# Classes that inherit from this are defined in resolution file, so the deciding function can be used
|
||||
|
||||
@dataclass
|
||||
class Ticket(ABC):
|
||||
ticketType: TicketType
|
||||
decidingFunction: Callable
|
||||
class Bet(ABC):
|
||||
ticketType: BetType
|
||||
team1Name: str
|
||||
team2Name: str
|
||||
date: datetime
|
||||
league: str
|
||||
@abstractmethod
|
||||
def resolve(self): pass
|
||||
|
||||
@dataclass
class WinDrawLose(Bet):
    """Match result 1X2 ("Výsledek zápasu")."""

    betType: Literal["X", "0", "1", "2"] = "0"

    def resolve(self):
        ...


@dataclass
class Advance(Bet):
    """Which team advances to the next round."""

    def resolve(self):
        raise NotImplementedError("Vyser si voko vine")


@dataclass
class WinDrawLoseDouble(Bet):
    """Double-chance match result ("Výsledek zápasu - double")."""

    betType: Literal["01", "12", "02"] = "01"

    def resolve(self):
        ...


@dataclass
class WinLose(Bet):
    """Match result without the draw option ("Výsledek zápasu bez remízy")."""

    betType: Literal["1", "2"] = "1"

    def resolve(self):
        ...


@dataclass
class BothTeamScored(Bet):
    """Both teams score at least one goal."""

    def resolve(self):
        ...


@dataclass
class GoalAmount(Bet):
    """Over/under on the total number of goals in the match."""

    line: float = 0.0   # goal line, e.g. 2.5
    over: bool = True   # True = more than line, False = less than line

    def resolve(self):
        ...


@dataclass
class GoalHandicap(Bet):
    """Goal handicap: handicap_amount is added to the chosen team's score; that team winning means the bet wins."""

    team_bet: Literal["1", "2"] = "1"  # which team the handicap is applied to
    handicap_amount: float = 0.0       # e.g. +1.5 or -0.5

    def resolve(self):
        ...


@dataclass
class UnknownTicket(Bet):
    """Bet type that could not be classified."""

    raw_text: str = ""

    def resolve(self):
        ...


@dataclass
class Ticket:
    """A betslip: an id plus the list of bets it contains."""

    id: int
    bets: list[Bet]
0
src/beaky/image_classifier/__init__.py
Normal file
0
src/beaky/image_classifier/__init__.py
Normal file
7
src/beaky/image_classifier/classifier.py
Normal file
7
src/beaky/image_classifier/classifier.py
Normal file
@@ -0,0 +1,7 @@
|
||||
from datetime import datetime
|
||||
|
||||
from beaky.datamodels.ticket import Ticket
|
||||
|
||||
|
||||
def f(path:str, date:datetime) -> list[Ticket]:
|
||||
...
|
||||
0
src/beaky/link_classifier/__init__.py
Normal file
0
src/beaky/link_classifier/__init__.py
Normal file
116
src/beaky/link_classifier/classifier.py
Normal file
116
src/beaky/link_classifier/classifier.py
Normal file
@@ -0,0 +1,116 @@
|
||||
import re
|
||||
from datetime import datetime
|
||||
|
||||
from playwright.sync_api import Page, sync_playwright
|
||||
|
||||
from beaky.datamodels.ticket import (
|
||||
BothTeamScored,
|
||||
GoalAmount,
|
||||
GoalHandicap,
|
||||
Ticket,
|
||||
BetType,
|
||||
UnknownTicket,
|
||||
WinDrawLose,
|
||||
WinDrawLoseDouble,
|
||||
WinLose,
|
||||
Bet
|
||||
)
|
||||
from beaky.scanner.scanner import Link
|
||||
|
||||
_TICKET_SELECTOR = ".betslip-history-detail__left-panel"
|
||||
_LEG_SELECTOR = '[data-test="betslip-leg"]'
|
||||
|
||||
|
||||
def _parse_czech_date(text: str) -> datetime | None:
|
||||
m = re.search(r"(\d+)\.\s*(\d+)\.\s*(\d+)\s+(\d+):(\d+)", text)
|
||||
if not m:
|
||||
return None
|
||||
day, month, year, hour, minute = map(int, m.groups())
|
||||
return datetime(year, month, day, hour, minute)
|
||||
|
||||
|
||||
def _parse_teams(title: str) -> tuple[str, str]:
|
||||
parts = title.split(" - ", 1)
|
||||
if len(parts) == 2:
|
||||
return parts[0].strip(), parts[1].strip()
|
||||
return title.strip(), ""
|
||||
|
||||
|
||||
def _classify_bet(bet_text: str, team1: str, team2: str, date: datetime, league: str) -> Bet:
    """Map a raw Fortuna bet description onto a concrete Bet subclass.

    Patterns are tried from most to least specific; anything unrecognised
    falls through to UnknownTicket carrying the raw text.
    """
    shared = dict(team1Name=team1, team2Name=team2, date=date, league=league)

    # Double chance: "Výsledek zápasu - dvojtip: 10"
    hit = re.search(r"Výsledek zápasu - dvojtip:\s*(\d+)", bet_text)
    if hit:
        # Normalise digit order so "10" and "01" compare equal
        normalized = "".join(sorted(hit.group(1)))
        return WinDrawLoseDouble(ticketType=BetType.WIN_DRAW_LOSE_DOUBLE, betType=normalized, **shared)

    # Draw-no-bet: "Výsledek bez remízy: 1"
    hit = re.search(r"bez rem[ií]zy:\s*([12])", bet_text)
    if hit:
        return WinLose(ticketType=BetType.WIN_LOSE, betType=hit.group(1), **shared)

    # Plain 1X2: "Výsledek zápasu: 1"
    hit = re.search(r"Výsledek zápasu:\s*([012X])\s*$", bet_text.strip())
    if hit:
        return WinDrawLose(ticketType=BetType.WIN_DRAW_LOSE, betType=hit.group(1), **shared)

    # Both teams to score: "Každý z týmů dá gól v zápasu: Ano"
    if "dá gól" in bet_text or "oba týmy" in bet_text.lower():
        return BothTeamScored(ticketType=BetType.BOTH_TEAM_SCORED, **shared)

    # Over/under total goals: "Počet gólů v zápasu 2.5: + 2.5"
    hit = re.search(r"Počet gólů v zápasu\s+(\d+(?:\.\d+)?):\s*([+-])", bet_text)
    if hit:
        return GoalAmount(
            ticketType=BetType.GOAL_AMOUNT,
            line=float(hit.group(1)),
            over=hit.group(2) == "+",
            **shared,
        )

    # Goal handicap: trailing "+1.5"/"-0.5" plus a goal keyword; the team
    # named inside the bet text decides which side the handicap applies to.
    hit = re.search(r"([+-])\s*(\d+(?:\.\d+)?)\s*$", bet_text.strip())
    if hit and "gólů" in bet_text:
        lowered = bet_text.lower()
        if team1.lower() in lowered:
            side = "1"
        elif team2.lower() in lowered:
            side = "2"
        else:
            return UnknownTicket(ticketType=BetType.UNKNOWN, raw_text=bet_text, **shared)
        amount = float(hit.group(2)) * (1.0 if hit.group(1) == "+" else -1.0)
        return GoalHandicap(ticketType=BetType.GOAL_HANDICAP, team_bet=side, handicap_amount=amount, **shared)

    return UnknownTicket(ticketType=BetType.UNKNOWN, raw_text=bet_text, **shared)
|
||||
|
||||
def _extract_legs(page: Page, fallback_date: datetime | None) -> list[Bet]:
    """Scrape every bet leg visible on *page* into classified Bet objects.

    When a leg's date cannot be parsed, *fallback_date* is used, and failing
    that, the current time.
    """
    legs: list[Bet] = []
    for leg in page.locator(_LEG_SELECTOR).all():
        title = leg.locator("h3").first.get_attribute("title") or ""
        date_text = leg.locator(".betslip-leg-date span").first.inner_text()
        bet_text = leg.locator("[data-selection-id]").first.inner_text()
        league = leg.locator(".f-mt-1.f-leading-tight.f-line-clamp-2").first.inner_text()

        home, away = _parse_teams(title)
        when = _parse_czech_date(date_text) or fallback_date or datetime.now()
        legs.append(_classify_bet(bet_text, home, away, when, league))
    return legs
|
||||
|
||||
class LinkClassifier:
    """Opens a Fortuna betslip URL in headless Chromium and classifies its bets."""

    def classify(self, link: Link) -> Ticket | None:
        """Render *link* in a browser and extract its bets as a Ticket.

        Returns None when the page cannot be loaded or parsed (the error is
        printed). BUG FIX: previously ``result`` was only assigned inside the
        ``try`` block, so any navigation/parsing failure made ``return result``
        raise UnboundLocalError instead of reporting the error cleanly.
        """
        result: Ticket | None = None
        with sync_playwright() as p:
            browser = p.chromium.launch(headless=True)
            context = browser.new_context()
            page = context.new_page()
            try:
                page.goto(link.url)
                page.wait_for_selector(_LEG_SELECTOR, timeout=15000)
                # Give client-side rendering a moment to settle
                page.wait_for_timeout(500)
                result = Ticket(id=link.id, bets=_extract_legs(page, link.date))
            except Exception as e:
                print(f"Error classifying link {link.id}: {e}")
            finally:
                page.close()
                browser.close()
        return result
0
src/beaky/resolvers/__init__.py
Normal file
0
src/beaky/resolvers/__init__.py
Normal file
6
src/beaky/resolvers/config.py
Normal file
6
src/beaky/resolvers/config.py
Normal file
@@ -0,0 +1,6 @@
|
||||
from pydantic.dataclasses import dataclass
|
||||
|
||||
|
||||
@dataclass
|
||||
class ResolverConfig:
|
||||
api_key: str
|
||||
353
src/beaky/resolvers/resolver.py
Normal file
353
src/beaky/resolvers/resolver.py
Normal file
@@ -0,0 +1,353 @@
|
||||
import time
|
||||
from dataclasses import dataclass, field
|
||||
from datetime import datetime, timedelta
|
||||
from difflib import SequenceMatcher
|
||||
from enum import Enum
|
||||
|
||||
import requests
|
||||
|
||||
from beaky.datamodels.ticket import (
|
||||
Bet,
|
||||
BothTeamScored,
|
||||
GoalAmount,
|
||||
GoalHandicap,
|
||||
Ticket,
|
||||
UnknownTicket,
|
||||
WinDrawLose,
|
||||
WinDrawLoseDouble,
|
||||
WinLose,
|
||||
)
|
||||
from beaky.resolvers.config import ResolverConfig
|
||||
|
||||
_API_BASE = "https://v3.football.api-sports.io"
|
||||
|
||||
# Fortuna league strings (lowercased substring match) -> api-football league ID
|
||||
_LEAGUE_MAP: dict[str, int] = {
|
||||
# European cups
|
||||
"liga mistrů": 2,
|
||||
"champions league": 2,
|
||||
"evropská liga": 3,
|
||||
"europa league": 3,
|
||||
"konferenční liga": 848,
|
||||
"conference league": 848,
|
||||
# Top flights
|
||||
"1. anglie": 39,
|
||||
"1. belgie": 144,
|
||||
"1. česko": 345,
|
||||
"1. dánsko": 119,
|
||||
"1. francie": 61,
|
||||
"1. itálie": 135,
|
||||
"1. itálie - ženy": 794,
|
||||
"1. německo": 78,
|
||||
"1. nizozemsko": 88,
|
||||
"1. polsko": 106,
|
||||
"1. portugalsko": 94,
|
||||
"1. rakousko": 218,
|
||||
"1. rumunsko": 283,
|
||||
"1. skotsko": 179,
|
||||
"1. slovensko": 332,
|
||||
"1. španělsko": 140,
|
||||
"1. wales": 771,
|
||||
# Second divisions
|
||||
"2. anglie": 40,
|
||||
"2. česko": 346,
|
||||
"2. francie": 62,
|
||||
"2. itálie": 136,
|
||||
"2. německo": 79,
|
||||
"2. nizozemsko": 89,
|
||||
"2. rakousko": 219,
|
||||
"2. slovensko": 333,
|
||||
"2. španělsko": 141,
|
||||
# Third divisions
|
||||
"3. francie": 63,
|
||||
"3. česko msfl": 349,
|
||||
"3. česko čfl": 348,
|
||||
# Fourth divisions
|
||||
"4. česko - sk. a": 350,
|
||||
"4. česko - sk. b": 351,
|
||||
"4. česko - sk. c": 352,
|
||||
"4. česko - sk. d": 353,
|
||||
"4. česko - sk. e": 354,
|
||||
"4. česko - sk. f": 686,
|
||||
# Women
|
||||
"1. česko - ženy": 669,
|
||||
"fortuna=liga ženy": 669,
|
||||
# Domestic cups
|
||||
"anglie - fa cup": 45,
|
||||
"anglie - efl cup": 48,
|
||||
"česko - pohár": 347,
|
||||
}
|
||||
|
||||
_DATE_WINDOW = 3 # days either side of the bet date to search
|
||||
|
||||
# ANSI color helpers
|
||||
_R = "\033[0m"
|
||||
_B = "\033[1m"
|
||||
_DIM= "\033[2m"
|
||||
_GREEN = "\033[32m"
|
||||
_RED = "\033[31m"
|
||||
_YELLOW = "\033[33m"
|
||||
_CYAN = "\033[36m"
|
||||
_GRAY = "\033[90m"
|
||||
|
||||
_OUTCOME_COLOR = {
|
||||
"win": _GREEN,
|
||||
"lose": _RED,
|
||||
"void": _YELLOW,
|
||||
"unknown": _GRAY,
|
||||
}
|
||||
|
||||
|
||||
class TicketVerdict(str, Enum):
|
||||
TRUTHFUL = "truthful"
|
||||
NOT_TRUTHFUL = "not truthful"
|
||||
POSSIBLY_TRUTHFUL = "possibly truthful — unresolvable bets remain, check manually"
|
||||
UNKNOWN = "unknown — could not resolve enough bets to decide"
|
||||
|
||||
|
||||
class BetOutcome(str, Enum):
|
||||
WIN = "win"
|
||||
LOSE = "lose"
|
||||
VOID = "void" # stake returned (e.g. WinLose on draw, integer goal line hit)
|
||||
UNKNOWN = "unknown" # fixture not found or unclassified bet
|
||||
|
||||
|
||||
@dataclass
|
||||
class ResolvedBet:
|
||||
bet: Bet
|
||||
outcome: BetOutcome
|
||||
fixture_id: int | None = None
|
||||
# Confidence breakdown (each component 0.0–1.0):
|
||||
# name_match — how well team names matched (SequenceMatcher score)
|
||||
# date_proximity — 1.0 exact date, linear decay to 0.0 at _DATE_WINDOW days away
|
||||
# league_found — 1.0 static map hit, 0.7 API fallback, 0.3 not found
|
||||
# match_finished — 1.0 if fixture status is terminal, 0.0 otherwise
|
||||
confidence: float = 0.0
|
||||
name_match: float = 0.0
|
||||
date_proximity: float = 0.0
|
||||
league_found: float = 0.0
|
||||
match_finished: float = 0.0
|
||||
|
||||
|
||||
@dataclass
class ResolvedTicket:
    """Resolution result for a whole ticket: per-bet outcomes plus an aggregate verdict."""

    ticket_id: int
    bets: list[ResolvedBet] = field(default_factory=list)

    @property
    def verdict(self) -> TicketVerdict:
        """Aggregate the individual bet outcomes into one ticket verdict.

        Unclassified bets (UnknownTicket) can never be resolved; they only
        soften a would-be TRUTHFUL verdict to POSSIBLY_TRUTHFUL. A single
        lost resolvable bet makes the whole ticket NOT_TRUTHFUL.
        """
        resolvable: list[ResolvedBet] = []
        unresolvable: list[ResolvedBet] = []
        for resolved in self.bets:
            bucket = unresolvable if isinstance(resolved.bet, UnknownTicket) else resolvable
            bucket.append(resolved)

        if not resolvable:
            return TicketVerdict.UNKNOWN
        outcomes = {resolved.outcome for resolved in resolvable}
        if BetOutcome.LOSE in outcomes:
            return TicketVerdict.NOT_TRUTHFUL
        if BetOutcome.UNKNOWN in outcomes:
            return TicketVerdict.UNKNOWN
        return TicketVerdict.POSSIBLY_TRUTHFUL if unresolvable else TicketVerdict.TRUTHFUL
|
||||
|
||||
def _get(url: str, headers: dict, params: dict, retries: int = 3, backoff: float = 60.0) -> requests.Response:
    """GET *url*, retrying on HTTP 429 with linearly increasing back-off.

    Waits backoff * attempt_number seconds between rate-limited attempts.
    After *retries* consecutive 429s the last response is returned anyway so
    the caller can decide what to do with it.
    """
    for attempt in range(retries):
        resp = requests.get(url, headers=headers, params=params)
        if resp.status_code != 429:
            return resp
        wait = backoff * (attempt + 1)
        print(f" !! rate limited — waiting {wait:.0f}s before retry ({attempt + 1}/{retries})")
        time.sleep(wait)
    print(f" !! still rate limited after {retries} retries, giving up")
    return resp
|
||||
|
||||
class TicketResolver:
|
||||
def __init__(self, config: ResolverConfig):
|
||||
self._headers = {"x-apisports-key": config.api_key}
|
||||
# Cache maps (center_date_str, league_id | None) -> list of fixture dicts
|
||||
self._fixture_cache: dict[tuple[str, int | None], list[dict]] = {}
|
||||
# Cache maps league name -> (league_id, confidence)
|
||||
self._league_cache: dict[str, tuple[int | None, float]] = {}
|
||||
|
||||
def resolve(self, ticket: Ticket) -> ResolvedTicket:
|
||||
result = ResolvedTicket(ticket_id=ticket.id)
|
||||
for bet in ticket.bets:
|
||||
result.bets.append(self._resolve_bet(bet))
|
||||
return result
|
||||
|
||||
def _resolve_bet(self, bet: Bet) -> ResolvedBet:
|
||||
bet_type = type(bet).__name__
|
||||
print(f"\n {_B}{_CYAN}┌─ [{bet_type}]{_R} {_B}{bet.team1Name} vs {bet.team2Name}{_R}"
|
||||
f" {_DIM}{bet.date.strftime('%Y-%m-%d')} | {bet.league}{_R}")
|
||||
|
||||
if isinstance(bet, UnknownTicket):
|
||||
print(f" {_GRAY}│ skipping — not implemented: {bet.raw_text!r}{_R}")
|
||||
print(f" {_GRAY}└─ UNKNOWN{_R}")
|
||||
return ResolvedBet(bet=bet, outcome=BetOutcome.UNKNOWN)
|
||||
|
||||
fixture, name_match, date_prox, league_conf = self._find_fixture(bet)
|
||||
if fixture is None:
|
||||
print(f" {_GRAY}└─ UNKNOWN — no fixture found{_R}")
|
||||
return ResolvedBet(bet=bet, outcome=BetOutcome.UNKNOWN, league_found=league_conf)
|
||||
|
||||
home_name = fixture["teams"]["home"]["name"]
|
||||
away_name = fixture["teams"]["away"]["name"]
|
||||
finished = _is_finished(fixture)
|
||||
confidence = round((name_match + date_prox + league_conf + finished) / 4, 3)
|
||||
outcome = _evaluate_bet(bet, fixture) if finished == 1.0 else BetOutcome.UNKNOWN
|
||||
|
||||
goals = fixture["goals"]
|
||||
color = _OUTCOME_COLOR.get(outcome.value, _GRAY)
|
||||
print(f" {_DIM}│ matched #{fixture['fixture']['id']}: {home_name} vs {away_name}"
|
||||
f" | {goals['home']}:{goals['away']} | {fixture['fixture']['status']['short']}"
|
||||
f" | confidence {confidence} (name={name_match:.2f} date={date_prox:.2f} league={league_conf} finished={finished}){_R}")
|
||||
print(f" {color}{_B}└─ {outcome.value.upper()}{_R}")
|
||||
|
||||
return ResolvedBet(
|
||||
bet=bet,
|
||||
outcome=outcome,
|
||||
fixture_id=fixture["fixture"]["id"],
|
||||
confidence=confidence,
|
||||
name_match=round(name_match, 3),
|
||||
date_proximity=round(date_prox, 3),
|
||||
league_found=league_conf,
|
||||
match_finished=finished,
|
||||
)
|
||||
|
||||
def _find_fixture(self, bet: Bet) -> tuple[dict | None, float, float, float]:
|
||||
"""Returns (fixture, name_match, date_proximity, league_confidence)."""
|
||||
center = bet.date.date()
|
||||
date_str = center.strftime("%Y-%m-%d")
|
||||
league_id, league_conf = self._resolve_league(bet.league)
|
||||
cache_key = (date_str, league_id)
|
||||
|
||||
if cache_key not in self._fixture_cache:
|
||||
date_from = (center - timedelta(days=_DATE_WINDOW)).strftime("%Y-%m-%d")
|
||||
date_to = (center + timedelta(days=_DATE_WINDOW)).strftime("%Y-%m-%d")
|
||||
params: dict = {"from": date_from, "to": date_to}
|
||||
if league_id is not None:
|
||||
params["league"] = league_id
|
||||
params["season"] = center.year if center.month >= 7 else center.year - 1
|
||||
print(f" {_GRAY}│ GET /fixtures {params}{_R}")
|
||||
resp = _get(f"{_API_BASE}/fixtures", headers=self._headers, params=params)
|
||||
resp.raise_for_status()
|
||||
self._fixture_cache[cache_key] = resp.json().get("response", [])
|
||||
print(f" {_GRAY}│ {len(self._fixture_cache[cache_key])} fixtures returned (cached){_R}")
|
||||
else:
|
||||
print(f" {_GRAY}│ /fixtures (±{_DATE_WINDOW}d of {date_str}, league={league_id}) served from cache{_R}")
|
||||
|
||||
fixture, name_match, date_prox = _best_fixture_match(
|
||||
self._fixture_cache[cache_key], bet.team1Name, bet.team2Name, center
|
||||
)
|
||||
return fixture, name_match, date_prox, league_conf
|
||||
|
||||
def _resolve_league(self, league_name: str) -> tuple[int | None, float]:
|
||||
key = league_name.lower().strip()
|
||||
if key in self._league_cache:
|
||||
return self._league_cache[key]
|
||||
|
||||
for pattern, league_id in _LEAGUE_MAP.items():
|
||||
if pattern in key:
|
||||
print(f" {_GRAY}│ league {league_name!r} -> id={league_id} (static map){_R}")
|
||||
self._league_cache[key] = (league_id, 1.0)
|
||||
return league_id, 1.0
|
||||
|
||||
# Fall back to API search — lower confidence since first result is taken unverified
|
||||
print(f" {_GRAY}│ GET /leagues search={league_name!r}{_R}")
|
||||
resp = _get(f"{_API_BASE}/leagues", headers=self._headers, params={"search": league_name[:20]})
|
||||
results = resp.json().get("response", [])
|
||||
if results:
|
||||
league_id = results[0]["league"]["id"]
|
||||
league_found_name = results[0]["league"]["name"]
|
||||
print(f" {_GRAY}│ matched {league_found_name!r} id={league_id} (API fallback, confidence=0.7){_R}")
|
||||
self._league_cache[key] = (league_id, 0.7)
|
||||
return league_id, 0.7
|
||||
|
||||
print(f" {_GRAY}│ no league found, searching fixtures by date only (confidence=0.3){_R}")
|
||||
self._league_cache[key] = (None, 0.3)
|
||||
return None, 0.3
|
||||
|
||||
|
||||
def _similarity(a: str, b: str) -> float:
|
||||
return SequenceMatcher(None, a.lower(), b.lower()).ratio()
|
||||
|
||||
|
||||
def _date_proximity(fixture: dict, center) -> float:
    """Score how close the fixture's kickoff date is to *center* (a date).

    1.0 on the exact date, decaying linearly to 0.0 at _DATE_WINDOW days away.
    """
    iso = fixture["fixture"]["date"].replace("Z", "+00:00")
    fixture_date = datetime.fromisoformat(iso).date()
    days_off = abs((fixture_date - center).days)
    return max(0.0, 1.0 - days_off / _DATE_WINDOW)
||||
|
||||
|
||||
def _best_fixture_match(fixtures: list[dict], team1: str, team2: str, center) -> tuple[dict | None, float, float]:
    """Pick the fixture whose team names (and, as a tiebreaker, date) best match.

    Returns (best_fixture, name_score, date_proximity); the fixture is None
    when even the best candidate's name similarity fails to exceed 0.5.
    """
    best = None
    best_combined = best_name = best_date = 0.0
    for candidate in fixtures:
        home = candidate["teams"]["home"]["name"]
        away = candidate["teams"]["away"]["name"]
        # Try both orientations; the source's home/away order is not guaranteed
        straight = _similarity(team1, home) + _similarity(team2, away)
        flipped = _similarity(team1, away) + _similarity(team2, home)
        name_score = max(straight, flipped) / 2
        date_prox = _date_proximity(candidate, center)
        # Name similarity is the primary signal; date proximity is a tiebreaker
        combined = name_score * 0.8 + date_prox * 0.2
        if combined > best_combined:
            best, best_combined = candidate, combined
            best_name, best_date = name_score, date_prox
    # Require minimum name similarity — date alone cannot rescue a bad name match
    if best_name > 0.5:
        return best, best_name, best_date
    return None, best_name, best_date
||||
|
||||
|
||||
def _is_finished(fixture: dict) -> float:
|
||||
status = fixture.get("fixture", {}).get("status", {}).get("short", "")
|
||||
return 1.0 if status in ("FT", "AET", "PEN", "AWD", "WO") else 0.0
|
||||
|
||||
|
||||
def _evaluate_bet(bet: Bet, fixture: dict) -> BetOutcome:
    """Decide win/lose/void for *bet* from the fixture's final goal counts.

    Returns UNKNOWN when the score is missing or the bet type is not handled.
    """
    goals = fixture.get("goals", {})
    home = goals.get("home")
    away = goals.get("away")
    if home is None or away is None:
        return BetOutcome.UNKNOWN

    if isinstance(bet, WinDrawLose):
        if bet.betType in ("X", "0"):
            # Draw bet: only the scores being level matters
            return BetOutcome.WIN if home == away else BetOutcome.LOSE
        if home > away:
            actual = "1"
        elif home == away:
            actual = "0"
        else:
            actual = "2"
        return BetOutcome.WIN if actual == bet.betType else BetOutcome.LOSE

    if isinstance(bet, WinDrawLoseDouble):
        if home > away:
            actual = "1"
        elif home == away:
            actual = "0"
        else:
            actual = "2"
        # Double chance wins when the actual outcome is either covered digit
        return BetOutcome.WIN if actual in bet.betType else BetOutcome.LOSE

    if isinstance(bet, WinLose):
        if home == away:
            # Draw-no-bet: stake is returned on a draw
            return BetOutcome.VOID
        actual = "1" if home > away else "2"
        return BetOutcome.WIN if actual == bet.betType else BetOutcome.LOSE

    if isinstance(bet, BothTeamScored):
        both_scored = home > 0 and away > 0
        return BetOutcome.WIN if both_scored else BetOutcome.LOSE

    if isinstance(bet, GoalAmount):
        total = home + away
        if total == bet.line:
            # Integer goal line hit exactly: stake is returned
            return BetOutcome.VOID
        if bet.over:
            return BetOutcome.WIN if total > bet.line else BetOutcome.LOSE
        return BetOutcome.WIN if total < bet.line else BetOutcome.LOSE

    if isinstance(bet, GoalHandicap):
        adj_home = home + (bet.handicap_amount if bet.team_bet == "1" else 0.0)
        adj_away = away + (bet.handicap_amount if bet.team_bet == "2" else 0.0)
        if adj_home == adj_away:
            return BetOutcome.VOID
        winner = "1" if adj_home > adj_away else "2"
        return BetOutcome.WIN if winner == bet.team_bet else BetOutcome.LOSE

    return BetOutcome.UNKNOWN
@@ -1,5 +1,5 @@
|
||||
from datetime import datetime
|
||||
from typing import Iterator, List, Optional
|
||||
from typing import Any, Iterator, List, Optional
|
||||
|
||||
from openpyxl import load_workbook
|
||||
from pydantic.dataclasses import dataclass
|
||||
@@ -9,11 +9,18 @@ from beaky.config import Config
|
||||
|
||||
@dataclass
|
||||
class Link:
|
||||
id: str
|
||||
"""Represents a single link row from an Excel sheet.
|
||||
|
||||
Attributes:
|
||||
id: identifier from the sheet (cast to int)
|
||||
url: link to the web page
|
||||
date: optional creation date (datetime or None)
|
||||
"""
|
||||
|
||||
id: int
|
||||
url: str
|
||||
date: Optional[datetime] = None
|
||||
|
||||
|
||||
class Links:
|
||||
def __init__(self, path: str | Config):
|
||||
if isinstance(path, Config):
|
||||
@@ -26,15 +33,16 @@ class Links:
|
||||
"""Read the Excel file at self._path and populate self.links.
|
||||
|
||||
Expects the first sheet to contain a header row with columns that include
|
||||
at least: 'id', 'link' (or 'url'), and 'date' (case-insensitive). The
|
||||
method will attempt to parse dates and will store them as datetime when
|
||||
possible; missing or unparsable dates become None.
|
||||
at least: 'id', 'link' (or 'url'), and optionally 'date' (case-insensitive).
|
||||
Returns the list of Link objects (also stored in self.links).
|
||||
"""
|
||||
print("started ret_links()")
|
||||
wb = load_workbook(filename=self._path, read_only=True, data_only=True)
|
||||
ws = wb.active
|
||||
|
||||
# Read header row
|
||||
rows = ws.iter_rows(values_only=True)
|
||||
rows = ws.rows
|
||||
|
||||
try:
|
||||
header = next(rows)
|
||||
except StopIteration:
|
||||
@@ -43,11 +51,10 @@ class Links:
|
||||
if not header:
|
||||
return []
|
||||
|
||||
# Normalize header names -> index map
|
||||
header_map = {(str(h).strip().lower() if h is not None else ""): i for i, h in enumerate(header) }
|
||||
# Normalize header names -> index map, making sure to use .value
|
||||
header_map = {(str(h.value).strip().lower() if h.value is not None else ""): i for i, h in enumerate(header)}
|
||||
|
||||
# Helper to parse date-like values
|
||||
def parse_date(v: None | datetime) -> Optional[datetime]:
|
||||
def parse_date(v: Any) -> Optional[datetime]:
|
||||
if v is None:
|
||||
return None
|
||||
if isinstance(v, datetime):
|
||||
@@ -71,28 +78,40 @@ class Links:
|
||||
|
||||
# Find the column indices we care about
|
||||
id_idx = header_map.get("id")
|
||||
url_idx = header_map.get("link")
|
||||
url_idx = header_map.get("url")
|
||||
date_idx = header_map.get("date")
|
||||
|
||||
if id_idx is None or url_idx is None:
|
||||
# Required columns missing
|
||||
print(f"Required 'id' or 'url' column missing in header. Found headers: {list(header_map.keys())}")
|
||||
return []
|
||||
|
||||
for row in rows:
|
||||
try:
|
||||
raw_id = row[id_idx] if id_idx < len(row) else None
|
||||
raw_url = row[url_idx] if url_idx < len(row) else None
|
||||
raw_date = row[date_idx] if (date_idx is not None and date_idx < len(row)) else None
|
||||
# Extract the actual values from the cell objects
|
||||
raw_id = row[id_idx].value if id_idx < len(row) else None
|
||||
raw_url = row[url_idx].value if url_idx < len(row) else None
|
||||
raw_date = row[date_idx].value if (date_idx is not None and date_idx < len(row)) else None
|
||||
|
||||
if raw_id is None and raw_url is None:
|
||||
if raw_id is None or raw_url is None:
|
||||
# skip empty rows
|
||||
continue
|
||||
|
||||
link = Link(id=str(raw_id).strip() if raw_id is not None else "",
|
||||
url=str(raw_url).strip() if raw_url is not None else "", date=parse_date(raw_date))
|
||||
# Safely parse the ID to an integer, handling Excel float quirks
|
||||
try:
|
||||
parsed_id = int(float(raw_id))
|
||||
except (ValueError, TypeError):
|
||||
# Skip row if ID is missing or invalid text
|
||||
continue
|
||||
|
||||
link = Link(
|
||||
id=parsed_id,
|
||||
url=str(raw_url).strip() if raw_url is not None else "",
|
||||
date=parse_date(raw_date),
|
||||
)
|
||||
self.links.append(link)
|
||||
except Exception:
|
||||
# Skip problematic rows silently
|
||||
# Skip problematic rows silently (or print(e) for debugging)
|
||||
continue
|
||||
|
||||
return self.links
|
||||
@@ -106,3 +125,14 @@ class Links:
|
||||
|
||||
# Backwards-compatible alias in case other modules referenced Linker
|
||||
Linker = Links
|
||||
|
||||
|
||||
if __name__ == "__main__":
|
||||
links_obj = Links("data/odkazy.xlsx")
|
||||
links = links_obj.ret_links()
|
||||
if not links:
|
||||
print("No links returned.")
|
||||
else:
|
||||
print(f"Successfully loaded {len(links)} links!")
|
||||
for link in links:
|
||||
print(link.id, link.url, link.date)
|
||||
|
||||
0
src/beaky/screenshotter/__init__.py
Normal file
0
src/beaky/screenshotter/__init__.py
Normal file
6
src/beaky/screenshotter/config.py
Normal file
6
src/beaky/screenshotter/config.py
Normal file
@@ -0,0 +1,6 @@
|
||||
from pydantic.dataclasses import dataclass
|
||||
|
||||
|
||||
@dataclass
|
||||
class ScreenshotterConfig:
|
||||
target_path: str
|
||||
75
src/beaky/screenshotter/screenshotter.py
Normal file
75
src/beaky/screenshotter/screenshotter.py
Normal file
@@ -0,0 +1,75 @@
|
||||
from pathlib import Path
|
||||
|
||||
from playwright.sync_api import sync_playwright
|
||||
|
||||
from beaky.config import Config
|
||||
from beaky.scanner.scanner import Link
|
||||
|
||||
|
||||
class Screenshotter:
|
||||
def __init__(self, config: Config):
|
||||
self.config = config
|
||||
|
||||
|
||||
def capture_tickets(self, links: list[Link]):
|
||||
with sync_playwright() as p:
|
||||
browser = p.chromium.launch(headless=True)
|
||||
context = browser.new_context()
|
||||
|
||||
for link in links:
|
||||
print("capturing link:", link)
|
||||
page = context.new_page()
|
||||
target_path = Path(self.config.screenshotter.target_path) / f"{link.id}.png"
|
||||
self.capture_ticket(page, link.url, target_path)
|
||||
|
||||
browser.close()
|
||||
|
||||
def capture_ticket(self,page, url, target_path, ticket_selector=".betslip-history-detail__left-panel"):
|
||||
page.goto(url)
|
||||
page.wait_for_selector(ticket_selector, timeout=10000)
|
||||
page.wait_for_timeout(1000)
|
||||
page.evaluate(f"""
|
||||
let el = document.querySelector('{ticket_selector}');
|
||||
if (el) {{
|
||||
let wrapper = el.querySelector('.betslip-selections');
|
||||
if (wrapper) {{
|
||||
wrapper.style.setProperty('height', 'auto', 'important');
|
||||
wrapper.style.setProperty('overflow', 'visible', 'important');
|
||||
}}
|
||||
|
||||
while (el && el !== document.body) {{
|
||||
el.style.setProperty('height', 'auto', 'important');
|
||||
el.style.setProperty('max-height', 'none', 'important');
|
||||
el.style.setProperty('overflow', 'visible', 'important');
|
||||
el = el.parentElement;
|
||||
}}
|
||||
}}
|
||||
""")
|
||||
|
||||
# Hide fixed/absolute overlays (cookie banners, notifications, toasts)
|
||||
# but preserve the ticket panel and its ancestors/descendants
|
||||
page.evaluate(f"""
|
||||
const ticket = document.querySelector('{ticket_selector}');
|
||||
document.querySelectorAll('*').forEach(el => {{
|
||||
if (ticket && (ticket.contains(el) || el.contains(ticket))) return;
|
||||
const style = window.getComputedStyle(el);
|
||||
if ((style.position === 'fixed' || style.position === 'sticky') &&
|
||||
el.tagName !== 'BODY' && el.tagName !== 'HTML') {{
|
||||
el.style.setProperty('display', 'none', 'important');
|
||||
}}
|
||||
}});
|
||||
""")
|
||||
|
||||
|
||||
|
||||
# Resize viewport if the element extends beyond the bottom edge.
|
||||
# The modal is vertically centered, so increasing the viewport by X shifts the element
|
||||
# down by X/2. To compensate: new_height = 2 * bottom - current_height.
|
||||
bbox = page.locator(ticket_selector).bounding_box()
|
||||
bottom = bbox["y"] + bbox["height"]
|
||||
vp_h = page.viewport_size["height"]
|
||||
if bottom > vp_h:
|
||||
page.set_viewport_size({"width": page.viewport_size["width"], "height": int(2 * bottom - vp_h) + 10})
|
||||
# Wait for the browser to reflow after style changes before screenshotting
|
||||
page.wait_for_timeout(500)
|
||||
page.locator(ticket_selector).screenshot(path=target_path)
|
||||
Reference in New Issue
Block a user