From 8f0cda2ca22754f0fcb08ddda073cac3a70ba557 Mon Sep 17 00:00:00 2001 From: William Fu-Hinthorn <13333726+hinthornw@users.noreply.github.com> Date: Fri, 4 Aug 2023 16:03:02 -0700 Subject: [PATCH] update --- .../langchain/document_loaders/recursive_url_loader.py | 2 -- 1 file changed, 2 deletions(-) diff --git a/libs/langchain/langchain/document_loaders/recursive_url_loader.py b/libs/langchain/langchain/document_loaders/recursive_url_loader.py index dad1fec6006..4cf6342e2ce 100644 --- a/libs/langchain/langchain/document_loaders/recursive_url_loader.py +++ b/libs/langchain/langchain/document_loaders/recursive_url_loader.py @@ -95,10 +95,8 @@ class RecursiveUrlLoader(BaseLoader): and link.startswith(current_root) ): child_links.add(link) - # import pdb; pdb.set_trace() # Get absolute path for all root relative links listed absolute_paths = [urljoin(base_url, link) for link in child_links] - # Store the visited links and recursively visit the children for link in absolute_paths: # Check all unvisited links