fix: Don't continue parsing recipes with errored HTTP status codes (#7230)

2026-07-20 14:40:14 -04:00 · 2026-03-12 15:58:40 +02:00
parent 8189416495
commit 6a3b38a31e
4 changed files with 14 additions and 10 deletions
--- a/tests/integration_tests/user_recipe_tests/test_recipe_create_from_video.py
+++ b/tests/integration_tests/user_recipe_tests/test_recipe_create_from_video.py
@@ -33,7 +33,7 @@ def video_scraper_setup(monkeypatch: pytest.MonkeyPatch):

    # Prevent any real HTTP calls during scraping
    async def mock_safe_scrape_html(url: str) -> str:
-        return ""
+        return "<html></html>"

    monkeypatch.setattr(recipe_scraper_module, "safe_scrape_html", mock_safe_scrape_html)

--- a/tests/integration_tests/user_recipe_tests/test_recipe_crud.py
+++ b/tests/integration_tests/user_recipe_tests/test_recipe_crud.py
@@ -14,11 +14,11 @@ from bs4 import BeautifulSoup
 from fastapi.testclient import TestClient
 from httpx import Response
 from pytest import MonkeyPatch
-from recipe_scrapers._abstract import AbstractScraper
 from recipe_scrapers._schemaorg import SchemaOrg
 from recipe_scrapers.plugins import SchemaOrgFillPlugin
 from slugify import slugify

+import mealie.services.scraper.recipe_scraper as recipe_scraper_module
 from mealie.db.models.recipe import RecipeModel
 from mealie.pkgs.safehttp.transport import AsyncSafeTransport
 from mealie.schema.cookbook.cookbook import SaveCookBook
@@ -102,12 +102,12 @@ def test_create_by_url(
    monkeypatch: MonkeyPatch,
 ):
    for recipe_data in recipe_test_data:
-        # Override init function for AbstractScraper to use the test html instead of calling the url
-        monkeypatch.setattr(
-            AbstractScraper,
-            "__init__",
-            get_init(recipe_data.html_file),
-        )
+        # Prevent any real HTTP calls during scraping
+        async def mock_safe_scrape_html(url: str) -> str:
+            return "<html></html>"
+
+        monkeypatch.setattr(recipe_scraper_module, "safe_scrape_html", mock_safe_scrape_html)
+
        # Override the get_html method of the RecipeScraperOpenGraph to return the test html
        for scraper_cls in DEFAULT_SCRAPER_STRATEGIES:
            monkeypatch.setattr(