Python 连接数据库
# Page 31 -- word-frequency example.
#
# Prompts for a URL, downloads the page, extracts its text, and prints the
# ten most common word stems after lower-casing, dropping English stop words
# and discarding tokens that are not purely alphanumeric.
from collections import Counter
import urllib.request

from bs4 import BeautifulSoup
import nltk  # required: nltk.word_tokenize is called below
from nltk import LancasterStemmer
from nltk.corpus import stopwords

URL = input("Enter a website")

with urllib.request.urlopen(URL) as infile:
    # Name the parser explicitly so the result does not depend on which
    # optional parsers happen to be installed.
    soup = BeautifulSoup(infile, "html.parser")

words = nltk.word_tokenize(soup.text)
text = [w.lower() for w in words]

# Build the stop-word set and the stemmer once instead of once per token.
stop_words = set(stopwords.words("english"))
stemmer = LancasterStemmer()
words = [
    stemmer.stem(w)
    for w in text
    if w not in stop_words and w.isalnum()
]

freqs = Counter(words)
print(freqs.most_common(10))

# Page 139 -- the next example begins here but is cut off in this excerpt;
# its text is kept verbatim below rather than guessed at:
#     import nltk , pymysql conn = pymysql .