# The code is as follows.
# NOTE: this excerpt relies on `speech` (the list of lower-cased words) and
# `stop_words` (the stop-word list) built in the complete listing further down.
from collections import Counter

# Counter tallies every word in a single pass.
c = Counter(speech)

# The ten most frequent words.
print(c.most_common(10))

# Drop the stop words. Counter's `del` silently ignores missing keys, so no
# membership check is needed before deleting.
for sw in stop_words:
    del c[sw]

# The ten most frequent words once the stop words are gone. Printed
# explicitly: a bare expression shows nothing outside an interactive session.
print(c.most_common(10))

Counter 是 dict 的一個子類,可以用來方便地計數。

  • 附上完整代碼

import operator
from collections import Counter

from nltk.corpus import stopwords

# Sample text to analyse. The original line breaks are restored so that the
# last word of one line is no longer fused with the first word of the next
# (e.g. "amWhen"), which would otherwise distort the word counts.
speech_text = """\
I love you,
Not for what you are,
But for what I am
When I am with you.
I love you,
Not only for what
You have made of yourself,
But for what
You are making of me.
I love you
For the part of me
That you bring out;
I love you
For putting your hand
Into my heaped-up heart
And passing over
All the foolish, weak things
That you can't help
Dimly seeing there,
And for drawing out
Into the light
All the beautiful belongings
That no one else had looked
Quite far enough to find.
I love you because you
Are helping me to make
Of the lumber of my life
Not a tavern
But a temple;
Out of the works
Of my every day
Not a reproach
But a song.
I love you
Because you have done
More than any creed
Could have done
To make me good
And more than any fate
Could have done
To make me happy.
You have done it
Without a touch,
Without a word,
Without a sign.
You have done it
By being yourself.
Perhaps that is what
Being a friend means,
After all."""

# Normalise case so that "You" and "you" are counted as the same word.
# NOTE: splitting on whitespace keeps punctuation attached, so "you," and
# "you" are still counted separately.
speech = speech_text.lower().split()
print(speech)

# Method 1: count by hand with a plain dict.
dic = {}
for word in speech:
    dic[word] = dic.get(word, 0) + 1

# Sort the (word, count) pairs by count, most frequent first.
swd = sorted(dic.items(), key=operator.itemgetter(1), reverse=True)
print(swd)

# Stop-word handling. The NLTK stop-word corpus must be installed
# (nltk.download("stopwords")); its English list is named "english".
stop_words = stopwords.words("english")
stop_word_set = set(stop_words)  # O(1) membership tests inside the loop
for k, v in swd:
    if k not in stop_word_set:
        print(k, v)

# Method 2: let collections.Counter do the counting.
c = Counter(speech)

# The ten most frequent words.
print(c.most_common(10))

# Remove the stop words. Counter's `del` silently ignores missing keys.
for sw in stop_words:
    del c[sw]

# The ten most frequent words after stop-word removal. Printed explicitly:
# a bare expression shows nothing when this runs as a script.
print(c.most_common(10))

通過這兩種方法,我們就不難明白為什麼現在 Python 在數據分析、科學計算領域用得越來越多:除了語言本身的特點,第三方庫也很多、很好用。


