From b081e723477de9a92fbe23a2723274d7d36cf050 Mon Sep 17 00:00:00 2001 From: John Mizerek Date: Fri, 13 Feb 2026 09:26:37 -0800 Subject: [PATCH] Improve business info extraction from saved Toast pages Added multiple fallback methods to extract business name: 1. Title tag with Toast-specific parsing 2. og:title and og:site_name meta tags 3. Header elements with restaurant/location classes 4. First h1 tag as last resort Also added address and phone extraction from visible HTML. Added summary logging of business info keys found. Co-Authored-By: Claude Opus 4.5 --- api/setup/analyzeMenuUrl.cfm | 99 +++++++++++++++++++++++++++++++++--- 1 file changed, 93 insertions(+), 6 deletions(-) diff --git a/api/setup/analyzeMenuUrl.cfm b/api/setup/analyzeMenuUrl.cfm index 0041566..2701563 100644 --- a/api/setup/analyzeMenuUrl.cfm +++ b/api/setup/analyzeMenuUrl.cfm @@ -172,20 +172,101 @@ - - ([^<]+)', pageHtml)> + + + + ]*>([^<]+)', pageHtml)> - ([^<]+).*', '\1')> + ]*>([^<]+).*', '\1')> - - + + + + - + + + + + + + ]*property=["'']og:(site_name|title)["''][^>]*content=["'']([^"'']+)["'']', pageHtml)> + + + ]*content=["'']([^"'']+)["''][^>]*property=["'']og:(site_name|title)["'']', pageHtml)> + + + + + ]*>.*', '')> + + + + + + + + + + + + + + + + ]*class="[^"]*(?:restaurant|location|brand)[^"]*"[^>]*>([^<]+)<', pageHtml)> + + ([^<]+)<.*', '\1')> + + + + + + + + + + + ]*>([^<]+)', pageHtml)> + + ]*>([^<]+).*', '\1')> + + + + + + + + + + + + ]*class="[^"]*address[^"]*"[^>]*>([^<]+)]+>', pageHtml)> + + ([^<]+) + + + + + + + + + + + + )\s*\(?(\d{3})\)?[-.\s]?(\d{3})[-.\s]?(\d{4})', pageHtml)> + + + + + + @@ -276,6 +357,12 @@ + + + + + +