flakshack · January 19, 2015 17:17
diff --git a/gistfile1.py b/gistfile1.py
 from BeautifulSoup import BeautifulSoup
 import re
 import glob

 # Strip hyperlinks that point at somedomain.com from every HTML file matched
 # by `path`, keeping the link text, and rewrite each file in place.

 # Grab a list of all HTML files
 path = "/some/path/tofiles/*.html"
 # Raw string so the backslash reaches the regex engine without relying on an
 # invalid string escape; compiled once because it is the same for every file.
 link_pattern = re.compile(r"somedomain\.com")

 for file_name in glob.glob(path):
    print(file_name)
    # Open the file and read the contents into a string; the with-block
    # closes the handle, so no explicit close() is needed afterwards.
    with open(file_name, "r") as file_handle:
        file_contents = file_handle.read()

    soup = BeautifulSoup(file_contents)
    # Replace the hyperlink with the contents (the text)
    for match in soup.findAll('a', href=link_pattern):
        match.replaceWithChildren()

    # Write the contents back to the file. This overwrites the original and
    # happens for every globbed file, whether or not a link was replaced.
    # The with-block guarantees the handle is closed even if write() raises.
    with open(file_name, 'w') as file_handle:
        file_handle.write(soup.prettify())
	from BeautifulSoup import BeautifulSoup
	import re
	import glob

	# Strip hyperlinks that point at somedomain.com from every HTML file matched
	# by `path`, keeping the link text, and rewrite each file in place.

	# Grab a list of all HTML files
	path = "/some/path/tofiles/*.html"
	# Raw string so the backslash reaches the regex engine without relying on an
	# invalid string escape; compiled once because it is the same for every file.
	link_pattern = re.compile(r"somedomain\.com")

	for file_name in glob.glob(path):
		print(file_name)
		# Open the file and read the contents into a string; the with-block
		# closes the handle, so no explicit close() is needed afterwards.
		with open(file_name, "r") as file_handle:
			file_contents = file_handle.read()

		soup = BeautifulSoup(file_contents)
		# Replace the hyperlink with the contents (the text)
		for match in soup.findAll('a', href=link_pattern):
			match.replaceWithChildren()

		# Write the contents back to the file. This overwrites the original and
		# happens for every globbed file, whether or not a link was replaced.
		# The with-block guarantees the handle is closed even if write() raises.
		with open(file_name, 'w') as file_handle:
			file_handle.write(soup.prettify())