mirror of
				https://github.com/mealie-recipes/mealie.git
				synced 2025-11-03 18:53:17 -05:00 
			
		
		
		
	fix: missing user agent for scraper (#1586)
* set user agent for requests.get
* bump scraper version
This commit is contained in:
		@@ -15,6 +15,7 @@ from mealie.services.scraper.scraped_extras import ScrapedExtras
 | 
				
			|||||||
 | 
					
 | 
				
			||||||
from . import cleaner
 | 
					from . import cleaner
 | 
				
			||||||
 | 
					
 | 
				
			||||||
 | 
					_FIREFOX_UA = "Mozilla/5.0 (Windows NT 10.0; Win64; x64; rv:86.0) Gecko/20100101 Firefox/86.0"
 | 
				
			||||||
SCRAPER_TIMEOUT = 15
 | 
					SCRAPER_TIMEOUT = 15
 | 
				
			||||||
 | 
					
 | 
				
			||||||
 | 
					
 | 
				
			||||||
@@ -28,7 +29,7 @@ def safe_scrape_html(url: str) -> str:
 | 
				
			|||||||
    if the request takes longer than 15 seconds. This is used to mitigate
 | 
					    if the request takes longer than 15 seconds. This is used to mitigate
 | 
				
			||||||
    DDOS attacks from users providing a url with arbitrary large content.
 | 
					    DDOS attacks from users providing a url with arbitrary large content.
 | 
				
			||||||
    """
 | 
					    """
 | 
				
			||||||
    resp = requests.get(url, timeout=SCRAPER_TIMEOUT, stream=True)
 | 
					    resp = requests.get(url, timeout=SCRAPER_TIMEOUT, stream=True, headers={"User-Agent": _FIREFOX_UA})
 | 
				
			||||||
 | 
					
 | 
				
			||||||
    html_bytes = b""
 | 
					    html_bytes = b""
 | 
				
			||||||
 | 
					
 | 
				
			||||||
 
 | 
				
			|||||||
							
								
								
									
										8
									
								
								poetry.lock
									
									
									
										generated
									
									
									
								
							
							
						
						
									
										8
									
								
								poetry.lock
									
									
									
										generated
									
									
									
								
							@@ -1246,7 +1246,7 @@ rdflib = ">=5.0.0"
 | 
				
			|||||||
 | 
					
 | 
				
			||||||
[[package]]
 | 
					[[package]]
 | 
				
			||||||
name = "recipe-scrapers"
 | 
					name = "recipe-scrapers"
 | 
				
			||||||
version = "14.11.0"
 | 
					version = "14.13.0"
 | 
				
			||||||
description = "Python package, scraping recipes from all over the internet"
 | 
					description = "Python package, scraping recipes from all over the internet"
 | 
				
			||||||
category = "main"
 | 
					category = "main"
 | 
				
			||||||
optional = false
 | 
					optional = false
 | 
				
			||||||
@@ -1619,7 +1619,7 @@ pgsql = ["psycopg2-binary"]
 | 
				
			|||||||
[metadata]
 | 
					[metadata]
 | 
				
			||||||
lock-version = "1.1"
 | 
					lock-version = "1.1"
 | 
				
			||||||
python-versions = "^3.10"
 | 
					python-versions = "^3.10"
 | 
				
			||||||
content-hash = "ac22f90df7cc8fc0e1787a0379d1c4e2f4cd1ab7520956fbd5bbf359c3a81480"
 | 
					content-hash = "80bd1bd922ed481e594d5950fb254cedfeeac467d5f3fcb4d241d6d9c689419b"
 | 
				
			||||||
 | 
					
 | 
				
			||||||
[metadata.files]
 | 
					[metadata.files]
 | 
				
			||||||
aiofiles = [
 | 
					aiofiles = [
 | 
				
			||||||
@@ -2381,8 +2381,8 @@ rdflib-jsonld = [
 | 
				
			|||||||
    {file = "rdflib_jsonld-0.6.2-py2.py3-none-any.whl", hash = "sha256:011afe67672353ca9978ab9a4bee964dff91f14042f2d8a28c22a573779d2f8b"},
 | 
					    {file = "rdflib_jsonld-0.6.2-py2.py3-none-any.whl", hash = "sha256:011afe67672353ca9978ab9a4bee964dff91f14042f2d8a28c22a573779d2f8b"},
 | 
				
			||||||
]
 | 
					]
 | 
				
			||||||
recipe-scrapers = [
 | 
					recipe-scrapers = [
 | 
				
			||||||
    {file = "recipe_scrapers-14.11.0-py3-none-any.whl", hash = "sha256:992b37ef2c29d66caaec82b2c5a1f9d901a74d2e267e60e505370c59ceadaeef"},
 | 
					    {file = "recipe_scrapers-14.13.0-py3-none-any.whl", hash = "sha256:4d9eb6d22dbe38976e1853c7d6e8f2060412cefb741ff03818c34b3faf8ea8e9"},
 | 
				
			||||||
    {file = "recipe_scrapers-14.11.0.tar.gz", hash = "sha256:85192e976388eeba9bb314c5cf75ac087ec1cfaf4b4aa1ffe580dae4099e2be9"},
 | 
					    {file = "recipe_scrapers-14.13.0.tar.gz", hash = "sha256:b4e08e9e34ff4490025a844c6823d5f269f54e1e866ee86162760a3f5ce0dd22"},
 | 
				
			||||||
]
 | 
					]
 | 
				
			||||||
requests = []
 | 
					requests = []
 | 
				
			||||||
requests-oauthlib = [
 | 
					requests-oauthlib = [
 | 
				
			||||||
 
 | 
				
			|||||||
@@ -30,7 +30,7 @@ passlib = "^1.7.4"
 | 
				
			|||||||
lxml = "^4.7.1"
 | 
					lxml = "^4.7.1"
 | 
				
			||||||
Pillow = "^8.2.0"
 | 
					Pillow = "^8.2.0"
 | 
				
			||||||
apprise = "^0.9.6"
 | 
					apprise = "^0.9.6"
 | 
				
			||||||
recipe-scrapers = "^14.11.0"
 | 
					recipe-scrapers = "^14.13.0"
 | 
				
			||||||
psycopg2-binary = {version = "^2.9.1", optional = true}
 | 
					psycopg2-binary = {version = "^2.9.1", optional = true}
 | 
				
			||||||
gunicorn = "^20.1.0"
 | 
					gunicorn = "^20.1.0"
 | 
				
			||||||
emails = "^0.6"
 | 
					emails = "^0.6"
 | 
				
			||||||
 
 | 
				
			|||||||
		Reference in New Issue
	
	Block a user