mirror of
				https://github.com/hwchase17/langchain.git
				synced 2025-10-26 13:21:40 +00:00 
			
		
		
		
	- Move the API reference into the vercel build - Update api reference organization and styling
		
			
				
	
	
		
			42 lines
		
	
	
		
			1.1 KiB
		
	
	
	
		
			Python
		
	
	
	
	
	
			
		
		
	
	
			42 lines
		
	
	
		
			1.1 KiB
		
	
	
	
		
			Python
		
	
	
	
	
	
| import sys
 | |
| from glob import glob
 | |
| from pathlib import Path
 | |
| 
 | |
| from bs4 import BeautifulSoup
 | |
| 
 | |
| CUR_DIR = Path(__file__).parents[1]
 | |
| 
 | |
| 
 | |
| def process_toc_h3_elements(html_content: str) -> str:
 | |
|     """Update Class.method() TOC headers to just method()."""
 | |
|     # Create a BeautifulSoup object
 | |
|     soup = BeautifulSoup(html_content, "html.parser")
 | |
| 
 | |
|     # Find all <li> elements with class "toc-h3"
 | |
|     toc_h3_elements = soup.find_all("li", class_="toc-h3")
 | |
| 
 | |
|     # Process each element
 | |
|     for element in toc_h3_elements:
 | |
|         element = element.a.code.span
 | |
|         # Get the text content of the element
 | |
|         content = element.get_text()
 | |
| 
 | |
|         # Apply the regex substitution
 | |
|         modified_content = content.split(".")[-1]
 | |
| 
 | |
|         # Update the element's content
 | |
|         element.string = modified_content
 | |
| 
 | |
|     # Return the modified HTML
 | |
|     return str(soup)
 | |
| 
 | |
| 
 | |
| if __name__ == "__main__":
 | |
|     dir = sys.argv[1]
 | |
|     for fn in glob(str(f"{dir.rstrip('/')}/**/*.html"), recursive=True):
 | |
|         with open(fn, "r") as f:
 | |
|             html = f.read()
 | |
|         processed_html = process_toc_h3_elements(html)
 | |
|         with open(fn, "w") as f:
 | |
|             f.write(processed_html)
 |