Fetching - Small improvement to memory handling when detecting price information (saves ~10 MB)

2025-04-11 10:11:59 +02:00
parent 4269079c54
commit 5f43d988a3
1 changed files with 4 additions and 2 deletions
--- a/changedetectionio/html_tools.py
+++ b/changedetectionio/html_tools.py
@@ -477,8 +477,10 @@ def html_to_text(html_content: str, render_anchor_tag_content=False, is_rss=Fals
 # Does LD+JSON exist with a @type=='product' and a .price set anywhere?
 def has_ldjson_product_info(content):
    try:
-        lc = content.lower()
+        # Better than .lower() which can use a lot of ram
-        if 'application/ld+json' in lc and lc.count('"price"') == 1 and '"pricecurrency"' in lc:
+        if (re.search(r'application/ld\+json', content, re.IGNORECASE) and
            re.search(r'"price"', content, re.IGNORECASE) and
            re.search(r'"pricecurrency"', content, re.IGNORECASE)):
            return True
 #       On some pages this is really terribly expensive when they dont really need it