From 576795a471d2a5bc6337e4724fb48f99b02576b4 Mon Sep 17 00:00:00 2001 From: italojohnny Date: Sun, 23 Jun 2024 19:22:43 -0300 Subject: [PATCH] fix regex validation for url --- src/backend/base/langflow/components/data/URL.py | 14 ++++++++------ 1 file changed, 8 insertions(+), 6 deletions(-) diff --git a/src/backend/base/langflow/components/data/URL.py b/src/backend/base/langflow/components/data/URL.py index cdf7300a0..eaa534702 100644 --- a/src/backend/base/langflow/components/data/URL.py +++ b/src/backend/base/langflow/components/data/URL.py @@ -44,14 +44,16 @@ class URLComponent(Component): # Basic URL validation regex url_regex = re.compile( - r"^(http://|https://)?" # http:// or https:// - r"(([a-zA-Z0-9\.-]+)" # domain - r"(\.[a-zA-Z]{2,}))" # top-level domain - r"(:[0-9]{1,5})?" # optional port - r"(\/.*)?$" # optional path + r"^(https?:\/\/)?" # optional protocol + r"(www\.)?" # optional www + r"([a-zA-Z0-9.-]+)" # domain + r"(\.[a-zA-Z]{2,})?" # top-level domain + r"(:\d+)?" # optional port + r"(\/[^\s]*)?$", # optional path + re.IGNORECASE ) - if not re.match(url_regex, string): + if not url_regex.match(string): raise ValueError(f"Invalid URL: {string}") return string