screenshot-to-code/backend/codegen/utils.py

20 lines
579 B
Python

import re
import sentry_sdk
def extract_html_content(text: str) -> str:
    """Return the first ``<html>...</html>`` document embedded in *text*.

    The search is non-greedy, so the result runs from the first opening
    ``<html ...>`` tag to the first ``</html>`` that follows it, tags
    included. Tag names are matched case-insensitively because HTML tag
    names are case-insensitive (``<HTML>`` is as valid as ``<html>``).

    Args:
        text: Generated content that may wrap an HTML document in other
            text (explanations, markdown fences, ...).

    Returns:
        The matched HTML document including its ``<html>`` tags, or *text*
        unchanged when no complete ``<html>...</html>`` pair is found.

    Side effects:
        On a failed extraction, prints a diagnostic containing the full
        input and reports an exception to Sentry.
    """
    # DOTALL lets "." span newlines, since documents are multi-line;
    # IGNORECASE accepts upper/mixed-case tags such as <HTML> or <Html>.
    match = re.search(
        r"(<html.*?>.*?</html>)", text, re.DOTALL | re.IGNORECASE
    )
    if match:
        return match.group(1)

    # No complete <html>...</html> pair: log it, report it, and fall back to
    # returning the input untouched so the caller still receives something.
    print(
        f"[HTML Extraction] No <html> tags found in the generated content: {text}"
    )
    sentry_sdk.capture_exception(
        Exception(" No <html> tags found in the generated content")
    )
    return text