Merge pull request #77 from barrett-ruth/feat/cses-categories

CSES Categories
2025-09-20 20:16:34 +02:00 · 2025-09-20 20:16:34 +02:00 · b992e1e635
commit b992e1e635
parent 07be94d7aa 315e5a790c
12 changed files with 562 additions and 99 deletions
--- a/doc/cp.txt
+++ b/doc/cp.txt
@ -326,7 +326,7 @@ CSES ~
 URL format: https://cses.fi/problemset/task/1068
 CSES (Code Submission Evaluation System) is organized by problem categories
-rather than traditional contests. All problems are accessible individually.
+rather than traditional contests. Problems are grouped by topic and difficulty.
 Platform characteristics:
 • Organization: Category-based (Introductory, Sorting, Dynamic Programming)
@ -337,17 +337,17 @@ Platform characteristics:
 In terms of cp.nvim, this corresponds to:
 - Platform: cses
- Contest ID: Problem ID (1068) - used as both contest and problem identifier
+- Contest ID: Category name (introductory_problems, sorting_and_searching)
- Problem ID: nil (not applicable for CSES structure)
+- Problem ID: Problem number (1068, 1640)
 Usage examples: >
-    :CP cses 1068               " Set up problem 1068 from CSES
+    :CP cses dynamic_programming 1633      " Set up problem 1633 from DP category
    :CP 1070                    " Switch to problem 1070 (if CSES context loaded)
    :CP next                    " Navigate to next problem in CSES sequence
 <
-                                Note: CSES problems are treated as individual
+                                Note: Both category and problem ID are required
                                entities rather than contest problems.
 ==============================================================================
 COMPLETE WORKFLOW EXAMPLE                                        *cp-example*
 Example: Setting up and solving AtCoder contest ABC324
--- a/lua/cp/init.lua
+++ b/lua/cp/init.lua
@ -700,12 +700,11 @@ local function parse_command(args)
      }
    elseif #filtered_args == 2 then
      if first == 'cses' then
-        return {
+        logger.log(
-          type = 'cses_problem',
+          'CSES requires both category and problem ID. Usage: :CP cses <category> <problem_id>',
-          platform = first,
+          vim.log.levels.ERROR
-          problem = filtered_args[2],
+        )
-          language = language,
+        return { type = 'error' }
        }
      else
        return {
          type = 'contest_setup',
@ -851,22 +850,6 @@ function M.handle_command(opts)
    return
  end
  if cmd.type == 'cses_problem' then
    if set_platform(cmd.platform) then
      if vim.tbl_contains(config.scrapers, cmd.platform) then
        local metadata_result = scrape.scrape_contest_metadata(cmd.platform, '')
        if not metadata_result.success then
          logger.log(
            'failed to load contest metadata: ' .. (metadata_result.error or 'unknown error'),
            vim.log.levels.WARN
          )
        end
      end
      setup_problem(cmd.problem, nil, cmd.language)
    end
    return
  end
  if cmd.type == 'problem_switch' then
    if state.platform == 'cses' then
      setup_problem(cmd.problem, nil, cmd.language)
--- a/lua/cp/scrape.lua
+++ b/lua/cp/scrape.lua
@ -89,29 +89,16 @@ function M.scrape_contest_metadata(platform, contest_id)
  local plugin_path = get_plugin_path()
-  local args
+  local args = {
-  if platform == 'cses' then
+    'uv',
-    args = {
+    'run',
-      'uv',
+    '--directory',
-      'run',
+    plugin_path,
-      '--directory',
+    '-m',
-      plugin_path,
+    'scrapers.' .. platform,
-      '-m',
+    'metadata',
-      'scrapers.' .. platform,
+    contest_id,
-      'metadata',
+  }
    }
  else
    args = {
      'uv',
      'run',
      '--directory',
      plugin_path,
      '-m',
      'scrapers.' .. platform,
      'metadata',
      contest_id,
    }
  end
  local result = vim
    .system(args, {
@ -140,12 +127,7 @@ function M.scrape_contest_metadata(platform, contest_id)
    return data
  end
-  local problems_list
+  local problems_list = data.problems or {}
  if platform == 'cses' then
    problems_list = data.categories and data.categories['CSES Problem Set'] or {}
  else
    problems_list = data.problems or {}
  end
  cache.set_contest_data(platform, contest_id, problems_list)
  return {
@ -223,7 +205,7 @@ function M.scrape_problem(ctx)
      '-m',
      'scrapers.' .. ctx.contest,
      'tests',
-      ctx.contest_id,
+      ctx.problem_id,
    }
  else
    args = {
--- a/scrapers/atcoder.py
+++ b/scrapers/atcoder.py
@ -3,12 +3,20 @@
 import json
 import re
 import sys
 import time
 from dataclasses import asdict
 import requests
 from bs4 import BeautifulSoup, Tag
-from .models import MetadataResult, ProblemSummary, TestCase, TestsResult
+from .models import (
    ContestListResult,
    ContestSummary,
    MetadataResult,
    ProblemSummary,
    TestCase,
    TestsResult,
 )
 def extract_problem_limits(soup: BeautifulSoup) -> tuple[int, float]:
@ -159,11 +167,78 @@ def scrape(url: str) -> list[TestCase]:
        return []
 def scrape_contests() -> list[ContestSummary]:
    contests = []
    max_pages = 15
    for page in range(1, max_pages + 1):
        try:
            headers = {
                "User-Agent": "Mozilla/5.0 (X11; Linux x86_64) AppleWebKit/537.36 (KHTML, like Gecko) Chrome/120.0.0.0 Safari/537.36"
            }
            url = f"https://atcoder.jp/contests/archive?page={page}"
            response = requests.get(url, headers=headers, timeout=10)
            response.raise_for_status()
            soup = BeautifulSoup(response.text, "html.parser")
            table = soup.find("table", class_="table")
            if not table:
                break
            tbody = table.find("tbody")
            if not tbody or not isinstance(tbody, Tag):
                break
            rows = tbody.find_all("tr")
            if not rows:
                break
            for row in rows:
                cells = row.find_all("td")
                if len(cells) < 2:
                    continue
                contest_cell = cells[1]
                link = contest_cell.find("a")
                if not link or not link.get("href"):
                    continue
                href = link.get("href")
                contest_id = href.split("/")[-1]
                name = link.get_text().strip()
                display_name = name
                if "AtCoder Beginner Contest" in name:
                    match = re.search(r"AtCoder Beginner Contest (\d+)", name)
                    if match:
                        display_name = f"Beginner Contest {match.group(1)} (ABC)"
                elif "AtCoder Regular Contest" in name:
                    match = re.search(r"AtCoder Regular Contest (\d+)", name)
                    if match:
                        display_name = f"Regular Contest {match.group(1)} (ARC)"
                elif "AtCoder Grand Contest" in name:
                    match = re.search(r"AtCoder Grand Contest (\d+)", name)
                    if match:
                        display_name = f"Grand Contest {match.group(1)} (AGC)"
                contests.append(
                    ContestSummary(id=contest_id, name=name, display_name=display_name)
                )
            time.sleep(0.5)
        except Exception as e:
            print(f"Failed to scrape page {page}: {e}", file=sys.stderr)
            continue
    return contests
 def main() -> None:
    if len(sys.argv) < 2:
        result = MetadataResult(
            success=False,
-            error="Usage: atcoder.py metadata <contest_id> OR atcoder.py tests <contest_id> <problem_letter>",
+            error="Usage: atcoder.py metadata <contest_id> OR atcoder.py tests <contest_id> <problem_letter> OR atcoder.py contests",
        )
        print(json.dumps(asdict(result)))
        sys.exit(1)
@ -264,10 +339,27 @@ def main() -> None:
        )
        print(json.dumps(asdict(tests_result)))
    elif mode == "contests":
        if len(sys.argv) != 2:
            contest_result = ContestListResult(
                success=False, error="Usage: atcoder.py contests"
            )
            print(json.dumps(asdict(contest_result)))
            sys.exit(1)
        contests = scrape_contests()
        if not contests:
            contest_result = ContestListResult(success=False, error="No contests found")
            print(json.dumps(asdict(contest_result)))
            sys.exit(1)
        contest_result = ContestListResult(success=True, error="", contests=contests)
        print(json.dumps(asdict(contest_result)))
    else:
        result = MetadataResult(
            success=False,
-            error=f"Unknown mode: {mode}. Use 'metadata' or 'tests'",
+            error=f"Unknown mode: {mode}. Use 'metadata', 'tests', or 'contests'",
        )
        print(json.dumps(asdict(result)))
        sys.exit(1)
--- a/scrapers/codeforces.py
+++ b/scrapers/codeforces.py
@ -7,7 +7,14 @@ from dataclasses import asdict
 import cloudscraper
 from bs4 import BeautifulSoup, Tag
-from .models import MetadataResult, ProblemSummary, TestCase, TestsResult
+from .models import (
    ContestListResult,
    ContestSummary,
    MetadataResult,
    ProblemSummary,
    TestCase,
    TestsResult,
 )
 def scrape(url: str) -> list[TestCase]:
@ -218,11 +225,54 @@ def scrape_sample_tests(url: str) -> list[TestCase]:
    return scrape(url)
 def scrape_contests() -> list[ContestSummary]:
    try:
        scraper = cloudscraper.create_scraper()
        response = scraper.get("https://codeforces.com/api/contest.list", timeout=10)
        response.raise_for_status()
        data = response.json()
        if data["status"] != "OK":
            return []
        contests = []
        for contest in data["result"]:
            contest_id = str(contest["id"])
            name = contest["name"]
            # Clean up contest names for display
            display_name = name
            if "Educational Codeforces Round" in name:
                import re
                match = re.search(r"Educational Codeforces Round (\d+)", name)
                if match:
                    display_name = f"Educational Round {match.group(1)}"
            elif "Codeforces Round" in name and "Div" in name:
                match = re.search(r"Codeforces Round (\d+) \(Div\. (\d+)\)", name)
                if match:
                    display_name = f"Round {match.group(1)} (Div. {match.group(2)})"
            elif "Codeforces Global Round" in name:
                match = re.search(r"Codeforces Global Round (\d+)", name)
                if match:
                    display_name = f"Global Round {match.group(1)}"
            contests.append(
                ContestSummary(id=contest_id, name=name, display_name=display_name)
            )
        return contests[:100]  # Limit to recent 100 contests
    except Exception as e:
        print(f"Failed to fetch contests: {e}", file=sys.stderr)
        return []
 def main() -> None:
    if len(sys.argv) < 2:
        result = MetadataResult(
            success=False,
-            error="Usage: codeforces.py metadata <contest_id> OR codeforces.py tests <contest_id> <problem_letter>",
+            error="Usage: codeforces.py metadata <contest_id> OR codeforces.py tests <contest_id> <problem_letter> OR codeforces.py contests",
        )
        print(json.dumps(asdict(result)))
        sys.exit(1)
@ -316,9 +366,27 @@ def main() -> None:
        )
        print(json.dumps(asdict(tests_result)))
    elif mode == "contests":
        if len(sys.argv) != 2:
            contest_result = ContestListResult(
                success=False, error="Usage: codeforces.py contests"
            )
            print(json.dumps(asdict(contest_result)))
            sys.exit(1)
        contests = scrape_contests()
        if not contests:
            contest_result = ContestListResult(success=False, error="No contests found")
            print(json.dumps(asdict(contest_result)))
            sys.exit(1)
        contest_result = ContestListResult(success=True, error="", contests=contests)
        print(json.dumps(asdict(contest_result)))
    else:
        result = MetadataResult(
-            success=False, error=f"Unknown mode: {mode}. Use 'metadata' or 'tests'"
+            success=False,
            error=f"Unknown mode: {mode}. Use 'metadata', 'tests', or 'contests'",
        )
        print(json.dumps(asdict(result)))
        sys.exit(1)
--- a/scrapers/cses.py
+++ b/scrapers/cses.py
@ -11,6 +11,85 @@ from bs4 import BeautifulSoup, Tag
 from .models import MetadataResult, ProblemSummary, TestCase, TestsResult
 def normalize_category_name(category_name: str) -> str:
    return category_name.lower().replace(" ", "_").replace("&", "and")
 def denormalize_category_name(category_id: str) -> str:
    category_map = {
        "introductory_problems": "Introductory Problems",
        "sorting_and_searching": "Sorting and Searching",
        "dynamic_programming": "Dynamic Programming",
        "graph_algorithms": "Graph Algorithms",
        "range_queries": "Range Queries",
        "tree_algorithms": "Tree Algorithms",
        "mathematics": "Mathematics",
        "string_algorithms": "String Algorithms",
        "geometry": "Geometry",
        "advanced_techniques": "Advanced Techniques",
    }
    return category_map.get(category_id, category_id.replace("_", " ").title())
 def scrape_category_problems(category_id: str) -> list[ProblemSummary]:
    category_name = denormalize_category_name(category_id)
    try:
        problemset_url = "https://cses.fi/problemset/"
        headers = {
            "User-Agent": "Mozilla/5.0 (X11; Linux x86_64) AppleWebKit/537.36 (KHTML, like Gecko) Chrome/120.0.0.0 Safari/537.36"
        }
        response = requests.get(problemset_url, headers=headers, timeout=10)
        response.raise_for_status()
        soup = BeautifulSoup(response.text, "html.parser")
        current_category = None
        problems = []
        target_found = False
        for element in soup.find_all(["h1", "h2", "ul"]):
            if not isinstance(element, Tag):
                continue
            if element.name in ["h1", "h2"]:
                text = element.get_text(strip=True)
                if not text or text.startswith("CSES") or text == "CSES Problem Set":
                    continue
                if target_found and current_category != text:
                    break
                current_category = text
                if text.lower() == category_name.lower():
                    target_found = True
            elif element.name == "ul" and current_category and target_found:
                problem_links = element.find_all(
                    "a", href=lambda x: x and "/problemset/task/" in x
                )
                for link in problem_links:
                    href = link.get("href", "")
                    if not href:
                        continue
                    problem_id = href.split("/")[-1]
                    problem_name = link.get_text(strip=True)
                    if not problem_id.isdigit() or not problem_name:
                        continue
                    problems.append(ProblemSummary(id=problem_id, name=problem_name))
        problems.sort(key=lambda x: int(x.id))
        return problems
    except Exception as e:
        print(f"Failed to scrape CSES category {category_id}: {e}", file=sys.stderr)
        return []
 def parse_problem_url(problem_input: str) -> str | None:
    if problem_input.startswith("https://cses.fi/problemset/task/"):
        return problem_input
@ -94,21 +173,39 @@ def scrape_all_problems() -> dict[str, list[ProblemSummary]]:
        soup = BeautifulSoup(response.text, "html.parser")
        all_categories: dict[str, list[ProblemSummary]] = {}
        problem_links = soup.find_all(
            "a", href=lambda x: x and "/problemset/task/" in x
        )
        print(f"Found {len(problem_links)} problem links", file=sys.stderr)
        current_category = None
-        for element in soup.find_all(["h1", "a"]):
+        for element in soup.find_all(["h1", "h2", "ul"]):
-            current_category = process_problem_element(
+            if not isinstance(element, Tag):
-                element, current_category, all_categories
+                continue
-            )
+            if element.name in ["h1", "h2"]:
                text = element.get_text(strip=True)
                if text and not text.startswith("CSES") and text != "CSES Problem Set":
                    current_category = text
                    if current_category not in all_categories:
                        all_categories[current_category] = []
                        print(f"Found category: {current_category}", file=sys.stderr)
            elif element.name == "ul" and current_category:
                problem_links = element.find_all(
                    "a", href=lambda x: x and "/problemset/task/" in x
                )
                for link in problem_links:
                    href = link.get("href", "")
                    if href:
                        problem_id = href.split("/")[-1]
                        problem_name = link.get_text(strip=True)
                        if problem_id.isdigit() and problem_name:
                            problem = ProblemSummary(id=problem_id, name=problem_name)
                            all_categories[current_category].append(problem)
        for category in all_categories:
            all_categories[category].sort(key=lambda x: int(x.id))
-        print(f"Found {len(all_categories)} categories", file=sys.stderr)
+        print(
            f"Found {len(all_categories)} categories with {sum(len(probs) for probs in all_categories.values())} problems",
            file=sys.stderr,
        )
        return all_categories
    except Exception as e:
@ -170,7 +267,7 @@ def main() -> None:
    if len(sys.argv) < 2:
        result = MetadataResult(
            success=False,
-            error="Usage: cses.py metadata OR cses.py tests <problem_id_or_url>",
+            error="Usage: cses.py metadata <category_id> OR cses.py tests <problem_id_or_url>",
        )
        print(json.dumps(asdict(result)))
        sys.exit(1)
@ -178,25 +275,26 @@ def main() -> None:
    mode: str = sys.argv[1]
    if mode == "metadata":
-        if len(sys.argv) != 2:
+        if len(sys.argv) != 3:
            result = MetadataResult(
                success=False,
-                error="Usage: cses.py metadata",
+                error="Usage: cses.py metadata <category_id>",
            )
            print(json.dumps(asdict(result)))
            sys.exit(1)
-        all_categories: dict[str, list[ProblemSummary]] = scrape_all_problems()
+        category_id = sys.argv[2]
        problems = scrape_category_problems(category_id)
-        if not all_categories:
+        if not problems:
            result = MetadataResult(
                success=False,
-                error="Failed to scrape CSES problem categories",
+                error=f"No problems found for category: {category_id}",
            )
            print(json.dumps(asdict(result)))
-            sys.exit(1)
+            return
-        result = MetadataResult(success=True, error="", categories=all_categories)
+        result = MetadataResult(success=True, error="", problems=problems)
        print(json.dumps(asdict(result)))
    elif mode == "tests":
--- a/scrapers/models.py
+++ b/scrapers/models.py
@ -13,6 +13,13 @@ class ProblemSummary:
    name: str
@dataclass
 class ContestSummary:
    id: str
    name: str
    display_name: str
@dataclass
 class ScrapingResult:
    success: bool
@ -26,6 +33,11 @@ class MetadataResult(ScrapingResult):
    categories: dict[str, list[ProblemSummary]] = field(default_factory=dict)
@dataclass
 class ContestListResult(ScrapingResult):
    contests: list[ContestSummary] = field(default_factory=list)
@dataclass
 class TestsResult(ScrapingResult):
    problem_id: str
--- a/spec/command_parsing_spec.lua
+++ b/spec/command_parsing_spec.lua
@ -96,7 +96,7 @@ describe('cp command parsing', function()
    end)
    it('handles cses problem command', function()
-      local opts = { fargs = { 'cses', '1234' } }
+      local opts = { fargs = { 'cses', 'sorting_and_searching', '1234' } }
      assert.has_no_errors(function()
        cp.handle_command(opts)
--- a/spec/scraper_spec.lua
+++ b/spec/scraper_spec.lua
@ -214,7 +214,7 @@ describe('cp.scrape', function()
    end)
    it('constructs correct command for cses metadata', function()
-      scrape.scrape_contest_metadata('cses', 'problemset')
+      scrape.scrape_contest_metadata('cses', 'sorting_and_searching')
      local metadata_call = nil
      for _, call in ipairs(mock_system_calls) do
@ -227,7 +227,7 @@ describe('cp.scrape', function()
      assert.is_not_nil(metadata_call)
      assert.equals('uv', metadata_call.cmd[1])
      assert.is_true(vim.tbl_contains(metadata_call.cmd, 'metadata'))
-      assert.is_false(vim.tbl_contains(metadata_call.cmd, 'problemset'))
+      assert.is_true(vim.tbl_contains(metadata_call.cmd, 'sorting_and_searching'))
    end)
    it('handles subprocess execution failure', function()
@ -380,8 +380,8 @@ describe('cp.scrape', function()
    it('constructs correct command for cses problem tests', function()
      test_context.contest = 'cses'
-      test_context.contest_id = '1001'
+      test_context.contest_id = 'sorting_and_searching'
-      test_context.problem_id = nil
+      test_context.problem_id = '1001'
      scrape.scrape_problem(test_context)
@ -396,7 +396,7 @@ describe('cp.scrape', function()
      assert.is_not_nil(tests_call)
      assert.is_true(vim.tbl_contains(tests_call.cmd, 'tests'))
      assert.is_true(vim.tbl_contains(tests_call.cmd, '1001'))
-      assert.is_false(vim.tbl_contains(tests_call.cmd, 'a'))
+      assert.is_false(vim.tbl_contains(tests_call.cmd, 'sorting_and_searching'))
    end)
  end)
--- a/tests/scrapers/test_atcoder.py
+++ b/tests/scrapers/test_atcoder.py
@ -1,6 +1,7 @@
 from unittest.mock import Mock
-from scrapers.atcoder import scrape, scrape_contest_problems
+
-from scrapers.models import ProblemSummary
+from scrapers.atcoder import scrape, scrape_contest_problems, scrape_contests
 from scrapers.models import ContestSummary, ProblemSummary
 def test_scrape_success(mocker, mock_atcoder_html):
@ -49,3 +50,81 @@ def test_scrape_network_error(mocker):
    result = scrape("https://atcoder.jp/contests/abc350/tasks/abc350_a")
    assert result == []
 def test_scrape_contests_success(mocker):
    def mock_get_side_effect(url, **kwargs):
        if "page=1" in url:
            mock_response = Mock()
            mock_response.text = """
            <table class="table table-default table-striped table-hover table-condensed table-bordered small">
                <thead>
                    <tr>
                        <th>Start Time</th>
                        <th>Contest Name</th>
                        <th>Duration</th>
                        <th>Rated Range</th>
                    </tr>
                </thead>
                <tbody>
                    <tr>
                        <td>2025-01-15 21:00:00+0900</td>
                        <td><a href="/contests/abc350">AtCoder Beginner Contest 350</a></td>
                        <td>01:40</td>
                        <td> - 1999</td>
                    </tr>
                    <tr>
                        <td>2025-01-14 21:00:00+0900</td>
                        <td><a href="/contests/arc170">AtCoder Regular Contest 170</a></td>
                        <td>02:00</td>
                        <td>1000 - 2799</td>
                    </tr>
                </tbody>
            </table>
            """
            return mock_response
        else:
            # Return empty page for all other pages
            mock_response = Mock()
            mock_response.text = "<html><body>No table found</body></html>"
            return mock_response
    mocker.patch("scrapers.atcoder.requests.get", side_effect=mock_get_side_effect)
    mocker.patch("scrapers.atcoder.time.sleep")
    result = scrape_contests()
    assert len(result) == 2
    assert result[0] == ContestSummary(
        id="abc350",
        name="AtCoder Beginner Contest 350",
        display_name="Beginner Contest 350 (ABC)",
    )
    assert result[1] == ContestSummary(
        id="arc170",
        name="AtCoder Regular Contest 170",
        display_name="Regular Contest 170 (ARC)",
    )
 def test_scrape_contests_no_table(mocker):
    mock_response = Mock()
    mock_response.text = "<html><body>No table found</body></html>"
    mocker.patch("scrapers.atcoder.requests.get", return_value=mock_response)
    mocker.patch("scrapers.atcoder.time.sleep")
    result = scrape_contests()
    assert result == []
 def test_scrape_contests_network_error(mocker):
    mocker.patch(
        "scrapers.atcoder.requests.get", side_effect=Exception("Network error")
    )
    mocker.patch("scrapers.atcoder.time.sleep")
    result = scrape_contests()
    assert result == []
--- a/tests/scrapers/test_codeforces.py
+++ b/tests/scrapers/test_codeforces.py
@ -1,6 +1,7 @@
 from unittest.mock import Mock
-from scrapers.codeforces import scrape, scrape_contest_problems
+
-from scrapers.models import ProblemSummary
+from scrapers.codeforces import scrape, scrape_contest_problems, scrape_contests
 from scrapers.models import ContestSummary, ProblemSummary
 def test_scrape_success(mocker, mock_codeforces_html):
@ -51,3 +52,66 @@ def test_scrape_network_error(mocker):
    result = scrape("https://codeforces.com/contest/1900/problem/A")
    assert result == []
 def test_scrape_contests_success(mocker):
    mock_scraper = Mock()
    mock_response = Mock()
    mock_response.json.return_value = {
        "status": "OK",
        "result": [
            {"id": 1951, "name": "Educational Codeforces Round 168 (Rated for Div. 2)"},
            {"id": 1950, "name": "Codeforces Round 936 (Div. 2)"},
            {"id": 1949, "name": "Codeforces Global Round 26"},
        ],
    }
    mock_scraper.get.return_value = mock_response
    mocker.patch(
        "scrapers.codeforces.cloudscraper.create_scraper", return_value=mock_scraper
    )
    result = scrape_contests()
    assert len(result) == 3
    assert result[0] == ContestSummary(
        id="1951",
        name="Educational Codeforces Round 168 (Rated for Div. 2)",
        display_name="Educational Round 168",
    )
    assert result[1] == ContestSummary(
        id="1950",
        name="Codeforces Round 936 (Div. 2)",
        display_name="Round 936 (Div. 2)",
    )
    assert result[2] == ContestSummary(
        id="1949", name="Codeforces Global Round 26", display_name="Global Round 26"
    )
 def test_scrape_contests_api_error(mocker):
    mock_scraper = Mock()
    mock_response = Mock()
    mock_response.json.return_value = {"status": "FAILED", "result": []}
    mock_scraper.get.return_value = mock_response
    mocker.patch(
        "scrapers.codeforces.cloudscraper.create_scraper", return_value=mock_scraper
    )
    result = scrape_contests()
    assert result == []
 def test_scrape_contests_network_error(mocker):
    mock_scraper = Mock()
    mock_scraper.get.side_effect = Exception("Network error")
    mocker.patch(
        "scrapers.codeforces.cloudscraper.create_scraper", return_value=mock_scraper
    )
    result = scrape_contests()
    assert result == []
--- a/tests/scrapers/test_cses.py
+++ b/tests/scrapers/test_cses.py
@ -1,5 +1,12 @@
 from unittest.mock import Mock
-from scrapers.cses import scrape, scrape_all_problems
+
 from scrapers.cses import (
    denormalize_category_name,
    normalize_category_name,
    scrape,
    scrape_all_problems,
    scrape_category_problems,
 )
 from scrapers.models import ProblemSummary
@ -19,12 +26,19 @@ def test_scrape_success(mocker, mock_cses_html):
 def test_scrape_all_problems(mocker):
    mock_response = Mock()
    mock_response.text = """
-    <h1>Introductory Problems</h1>
+    <div class="content">
-    <a href="/problemset/task/1068">Weird Algorithm</a>
+        <h1>Introductory Problems</h1>
-    <a href="/problemset/task/1083">Missing Number</a>
+        <ul>
-    <h1>Sorting and Searching</h1>
+            <li><a href="/problemset/task/1068">Weird Algorithm</a></li>
-    <a href="/problemset/task/1084">Apartments</a>
+            <li><a href="/problemset/task/1083">Missing Number</a></li>
        </ul>
        <h1>Sorting and Searching</h1>
        <ul>
            <li><a href="/problemset/task/1084">Apartments</a></li>
        </ul>
    </div>
    """
    mock_response.raise_for_status = Mock()
    mocker.patch("scrapers.cses.requests.get", return_value=mock_response)
@ -45,3 +59,74 @@ def test_scrape_network_error(mocker):
    result = scrape("https://cses.fi/problemset/task/1068")
    assert result == []
 def test_normalize_category_name():
    assert normalize_category_name("Sorting and Searching") == "sorting_and_searching"
    assert normalize_category_name("Dynamic Programming") == "dynamic_programming"
    assert normalize_category_name("Graph Algorithms") == "graph_algorithms"
 def test_denormalize_category_name():
    assert denormalize_category_name("sorting_and_searching") == "Sorting and Searching"
    assert denormalize_category_name("dynamic_programming") == "Dynamic Programming"
    assert denormalize_category_name("graph_algorithms") == "Graph Algorithms"
 def test_scrape_category_problems_success(mocker):
    mock_response = Mock()
    mock_response.text = """
    <div class="content">
        <h1>General</h1>
        <ul>
            <li><a href="/problemset/task/1000">Test Problem</a></li>
        </ul>
        <h1>Sorting and Searching</h1>
        <ul>
            <li><a href="/problemset/task/1640">Sum of Two Values</a></li>
            <li><a href="/problemset/task/1643">Maximum Subarray Sum</a></li>
        </ul>
        <h1>Dynamic Programming</h1>
        <ul>
            <li><a href="/problemset/task/1633">Dice Combinations</a></li>
        </ul>
    </div>
    """
    mock_response.raise_for_status = Mock()
    mocker.patch("scrapers.cses.requests.get", return_value=mock_response)
    result = scrape_category_problems("sorting_and_searching")
    assert len(result) == 2
    assert result[0].id == "1640"
    assert result[0].name == "Sum of Two Values"
    assert result[1].id == "1643"
    assert result[1].name == "Maximum Subarray Sum"
 def test_scrape_category_problems_not_found(mocker):
    mock_response = Mock()
    mock_response.text = """
    <div class="content">
        <h1>Some Other Category</h1>
        <ul>
            <li><a href="/problemset/task/1000">Test Problem</a></li>
        </ul>
    </div>
    """
    mock_response.raise_for_status = Mock()
    mocker.patch("scrapers.cses.requests.get", return_value=mock_response)
    result = scrape_category_problems("nonexistent_category")
    assert result == []
 def test_scrape_category_problems_network_error(mocker):
    mocker.patch("scrapers.cses.requests.get", side_effect=Exception("Network error"))
    result = scrape_category_problems("sorting_and_searching")
    assert result == []