这是我目前用 Python 编写的代码。接下来,我需要删除 gutenberg.txt 中的标点符号。我该怎么做呢?
import bs4
import urllib.request
# Download the page at `loc`, print its prettified HTML and its plain text,
# then save the plain text to gutenberg.txt.

# URL of the page to download.
loc = 'http://www.gutenberg.org/files/1155/1155-h/1155-h.htm'
# Read the raw page bytes; the context manager closes the HTTP response
# even if read() raises.
with urllib.request.urlopen(loc) as response:
    page = response.read()
# Parse the downloaded bytes with the 'html.parser' backend.
soup = bs4.BeautifulSoup(page, 'html.parser')
print(soup.prettify())
# Extract the text once and reuse it for both printing and saving.
string = soup.get_text()
print(string)
# Write with an explicit encoding so non-ASCII characters in the page do not
# raise UnicodeEncodeError on platforms whose default encoding is not UTF-8;
# the `with` block guarantees the file is closed even if write() fails.
with open("gutenberg.txt", "w", encoding="utf-8") as f:
    f.write(string)