{
"event": "PreToolUse",
"tool_name": "Edit",
"tool_input": {
"file_path": "\/var\/www\/dev.campus.systemische-tools.de\/crawler\/src\/application\/use_cases\/start_crawl.py",
"old_string": "from collections.abc import Mapping\nfrom dataclasses import dataclass\n\nfrom src.domain.entities.crawl import Crawl",
"new_string": "from collections.abc import Mapping\nfrom dataclasses import dataclass\nfrom datetime import datetime\n\nfrom src.domain.entities.crawl import Crawl",
"replace_all": false
}
}
{
"tool_response": {
"filePath": "\/var\/www\/dev.campus.systemische-tools.de\/crawler\/src\/application\/use_cases\/start_crawl.py",
"oldString": "from collections.abc import Mapping\nfrom dataclasses import dataclass\n\nfrom src.domain.entities.crawl import Crawl",
"newString": "from collections.abc import Mapping\nfrom dataclasses import dataclass\nfrom datetime import datetime\n\nfrom src.domain.entities.crawl import Crawl",
"originalFile": "from __future__ import annotations\n\nfrom collections.abc import Mapping\nfrom dataclasses import dataclass\n\nfrom src.domain.entities.crawl import Crawl\nfrom src.domain.entities.url import Url\nfrom src.domain.ports.clock_port import ClockPort\nfrom src.domain.ports.crawl_repository_port import CrawlRepositoryPort\nfrom src.domain.ports.url_queue_port import UrlQueuePort\nfrom src.domain.ports.url_repository_port import UrlRepositoryPort\nfrom src.domain.services.url_normalizer import UrlNormalizer\nfrom src.domain.value_objects.enums import CrawlMode, CrawlStatus, TriggerSource\n\n\n@dataclass(frozen=True, slots=True)\nclass StartCrawlInput:\n base_url: str\n mode: CrawlMode\n trigger_source: TriggerSource\n config: Mapping[str, object]\n\n\nclass StartCrawlUseCase:\n def __init__(\n self,\n *,\n crawls: CrawlRepositoryPort,\n urls: UrlRepositoryPort,\n queue: UrlQueuePort,\n normalizer: UrlNormalizer,\n clock: ClockPort,\n ) -> None:\n self._crawls = crawls\n self._urls = urls\n self._queue = queue\n self._normalizer = normalizer\n self._clock = clock\n\n def execute(self, command: StartCrawlInput) -> Crawl:\n now = self._clock.now()\n crawl = self._crawls.save(\n Crawl(\n id=None,\n base_url=command.base_url,\n mode=command.mode,\n started_at=now,\n finished_at=None,\n status=CrawlStatus.RUNNING,\n trigger_source=command.trigger_source,\n config=command.config,\n ),\n )\n if crawl.id is None:\n raise RuntimeError(\"CrawlRepository did not assign id after save\")\n self._enqueue_seed(crawl_id=crawl.id, raw_url=command.base_url, now=now)\n return crawl\n\n def _enqueue_seed(self, *, crawl_id: int, raw_url: str, now: datetime) -> None:\n normalized = self._normalizer.normalize(raw_url)\n self._urls.upsert(\n Url(\n id=None,\n normalized=normalized,\n is_internal=True,\n first_seen_at=now,\n last_seen_at=now,\n ),\n )\n self._queue.enqueue(crawl_id, normalized)\n",
"structuredPatch": [
{
"oldStart": 2,
"oldLines": 6,
"newStart": 2,
"newLines": 7,
"lines": [
" ",
" from collections.abc import Mapping",
" from dataclasses import dataclass",
"+from datetime import datetime",
" ",
" from src.domain.entities.crawl import Crawl",
" from src.domain.entities.url import Url"
]
}
],
"userModified": false,
"replaceAll": false
}
}