zoukankan      html  css  js  c++  java
  • ItemCF算法

    import math
    from operator import itemgetter
    
    # Toy purchase log: user id -> set of item ids that user has.
    data = {
        'A': {'a', 'b', 'd'},
        'B': {'b', 'c', 'e'},
        'C': {'c', 'd'},
        'D': {'b', 'c', 'd'},
        'E': {'a', 'd'},
    }
    def ItemSimilarity(data):
        """Build the item-item similarity matrix used by ItemCF.

        Args:
            data: mapping of user -> collection of items that user has.

        Returns:
            Nested dict W where W[i][j] = c_ij / sqrt(n_i * n_j); c_ij is the
            number of users holding both i and j, and n_i is the number of
            users holding i. Every item seen in ``data`` gets an entry, which
            is empty when the item never co-occurs with another item.
        """
        # Pass 1: per-item popularity and pairwise co-occurrence counts.
        popularity = {}
        co_counts = {}
        for basket in data.values():
            for item in basket:
                popularity[item] = popularity.get(item, 0) + 1
                neighbours = co_counts.setdefault(item, {})
                for other in basket:
                    if other != item:
                        neighbours[other] = neighbours.get(other, 0) + 1

        # Pass 2: normalise each co-occurrence count by the geometric mean of
        # the two items' popularity.
        W = {}
        for item, neighbours in co_counts.items():
            W[item] = {
                other: shared / math.sqrt(popularity[item] * popularity[other])
                for other, shared in neighbours.items()
            }
        return W
    
    # Compute the similarity between every pair of co-occurring items.
    Item_Simi = ItemSimilarity(data)
    # For each item, list its neighbours from most to least similar.
    for i, item in Item_Simi.items():
        for j, Simi in sorted(item.items(), key=itemgetter(1), reverse=True):
            # One single-argument print call runs on both Python 2 and 3 and
            # emits the same text as the former `print ...,` / `print Simi`
            # pair (which inserted one extra space before the value).
            print('The similarity between ' + i + ' and ' + j + ' is  ' + str(Simi))
    
    
    def Recommendation(data, W, K, exclude_known=False):
        """Score items for every user from item-item similarities (ItemCF).

        For each item a user has, the similarity weights of that item's K most
        similar neighbours are added to the neighbours' scores for that user.

        Args:
            data: mapping of user -> collection of items that user has.
            W: mapping item -> {other item: similarity}, e.g. the result of
                ItemSimilarity. Items missing from W contribute nothing.
            K: number of most-similar neighbours considered per item.
            exclude_known: when True, items the user already has are not
                scored. Defaults to False, which scores every neighbour.

        Returns:
            dict mapping user -> {item: accumulated interest score}.
        """
        rui = 1  # every item a user has counts with the same unit weight
        top_neighbours = {}  # item -> its K strongest neighbours, sorted once
        rank = dict()
        for user, owned in data.items():
            scores = rank[user] = dict()
            known = set(owned) if exclude_known else ()
            for i in owned:
                if i not in top_neighbours:
                    # Sorting is independent of the user, so do it once per
                    # item instead of once per (user, item) pair.
                    top_neighbours[i] = sorted(
                        W.get(i, {}).items(), key=itemgetter(1), reverse=True
                    )[0:K]
                for j, wj in top_neighbours[i]:
                    if j in known:
                        continue
                    scores[j] = scores.get(j, 0) + rui * wj
        return rank
    # Score items for every user using each owned item's 3 nearest neighbours.
    result = Recommendation(data, Item_Simi, 3)

    # For each user, list the scored items from highest to lowest interest.
    for i, j_item in result.items():
        for j, interest in sorted(j_item.items(), key=itemgetter(1), reverse=True):
            # One single-argument print call runs on both Python 2 and 3 and
            # emits the same text as the former `print ...,` / `print interest`
            # pair (which inserted one extra space before the value).
            print(' the interest ' + i + ' buy ' + j + ' is  ' + str(interest))
  • 相关阅读:
    Best Cow Line(POJ No.3617)
    迷宫的最短路径
    Lake Counting(POJ No.2386)
    【日志】-2013.11.02
    用Python实现gmail邮箱服务,实现两个邮箱之间的绑定(上)
    用Python实现gmail邮箱服务,实现两个邮箱之间的绑定(下)
    【日志】-2013.11.01
    (转载)HTML与XHTML有什么区别
    (转载)linux环境变量
    转载-KMP算法前缀数组优雅实现
  • 原文地址:https://www.cnblogs.com/taotao315/p/3130767.html
Copyright © 2011-2022 走看看