zoukankan      html  css  js  c++  java
  • jieba库的应用

    #!/usr/bin/python
    # -*- coding:utf-8 -*-

    import imp,sys

    imp.reload(sys)
    from matplotlib.font_manager import FontProperties
    import jieba.analyse
    import matplotlib.pyplot as plt
    if __name__ == "__main__":

    word_lst = []
    key_list = []
    for line in open('D://jieba_new.txt'): # 1.txt是需要分词统计的文档

    item = line.strip(' ').split(' ') # 制表格切分
    tags = jieba.analyse.extract_tags(item[0]) # jieba分词
    for t in tags:
    word_lst.append(t)

    word_dict = {}
    with open("D://word.txt", 'w') as wf2: # 打开文件

    for item in word_lst:
    if item not in word_dict: # 统计数量
    word_dict[item] = 1
    else:
    word_dict[item] += 1

    orderList = list(word_dict.values())
    orderList.sort(reverse=True)
    # print orderList
    for i in range(len(orderList)):
    for key in word_dict:
    if word_dict[key] == orderList[i]:
    if word_dict[key] > 1:
    wf2.write(key + ' ' + str(word_dict[key]) + ' ') # 写入txt文档
    tmp = open('D://word.txt').readlines() # 把内容一次性全部读取出来 是一个列表
    set(tmp)
    A = []
    B = []
    file = open('D:\word1.txt')
    for r in file:
    imporkey = r.split(' ')[0]
    sumnumber = r.split(' ')[1]
    int_imporkey = str(imporkey)
    int_sumnumber = str(sumnumber)
    A.append(int_imporkey)
    B.append(int_sumnumber)
    fig = plt.figure()
    plt.pie(B,labels=A,autopct='%1.2f%%') #画饼图(数据,数据对应的标签,百分数保留两位小数点)
    plt.title("Pie chart")
    plt.show()

  • 相关阅读:
    用css实现三角形
    css实现加载中的效果
    图片轮播图插件
    支付密码框
    angular里面ng-class的几个用法
    Redis数据恢复
    Jenkins简单介绍
    spring框架中定时器的配置及应用
    springMVC与freemarker的整合
    freemarker入门小例子
  • 原文地址:https://www.cnblogs.com/xizhu/p/8799092.html
Copyright © 2011-2022 走看看