# evalResult.py -- from the piekey1994/TieBa-Messenger-Bot-CN repository (master branch)
#!/usr/bin/env python
# coding: utf-8
from nltk.translate.bleu_score import sentence_bleu
import gensim
from numpy import *
# The console in Windows 10 version 1709 has a bug; this package is imported so that print() does not fail unexpectedly.
import win_unicode_console
win_unicode_console.enable()

def cosine_similarity(vector1,vector2):
    """Return the cosine of the angle between two numeric sequences.

    The two sequences are walked in lockstep, so surplus elements of the
    longer one are ignored.  When either sequence has zero magnitude over
    the compared elements (which includes empty input) the result is 0.
    """
    inner = 0.0
    squares1 = 0.0
    squares2 = 0.0
    for x, y in zip(vector1, vector2):
        inner += x*y
        squares1 += x**2
        squares2 += y**2
    if squares1 != 0.0 and squares2 != 0.0:
        return inner / ((squares1*squares2)**0.5)
    # A zero-length vector has no direction; report "no similarity".
    return 0

# Evaluation script: compares generated replies (output.txt) with reference
# replies (testoutput.txt), one whitespace-tokenised sentence per line, and
# reports Distinct-1/2, BLEU, Greedy Matching, Embedding Average and Vector
# Extrema.  The report is printed and also written to modelevelResult.txt.
#
# NOTE: this file does `from numpy import *`, which can shadow builtins such
# as sum/any/all (and, depending on the NumPy version, max/min).  The code
# below therefore uses ndarray methods instead of calling those names.  The
# names `array` and `where` used below come from that star import.

# word2vec model that backs every embedding-based metric below.
word2VecModel = gensim.models.Word2Vec.load(r"D:\知识图谱\关键程序\KBChatbot\word2vec_data\wiki.zh.text.model")


def _word_similarity(w1, w2):
    """Return the model similarity of two words; fall back to exact match (1/0) for unknown words."""
    try:
        return word2VecModel.wv.similarity(w1, w2)
    except KeyError:
        # At least one of the words is not in the model vocabulary.
        return 1 if w1 == w2 else 0


def _known_vectors(words):
    """Return a float array with one row per word of *words* that the model knows (length 0 if none)."""
    vectors = []
    for word in words:
        try:
            vectors.append(word2VecModel.wv[word])
        except KeyError:
            # Out-of-vocabulary words contribute nothing.
            continue
    return array(vectors, dtype=float)


def _extrema_vector(matrix):
    """Return, per column of *matrix*, the maximum if it exceeds abs(minimum), otherwise the minimum."""
    highest = matrix.max(axis=0)
    lowest = matrix.min(axis=0)
    return where(highest > abs(lowest), highest, lowest)


with open('output.txt','r',encoding='utf-8') as resultFile, \
        open('testoutput.txt','r',encoding='utf-8') as targetFile, \
        open('modelevelResult.txt','w',encoding='utf-8') as merFile:
    unigrams = set()    # distinct words seen in the generated replies
    bigrams = set()     # distinct adjacent word pairs seen in the generated replies
    wordsNum = 0
    sentencesNum = 0
    bleuScore = 0
    GMScore = 0
    EAScore = 0
    VEScore = 0
    # zip() stops at the shorter file, so surplus lines in either file are ignored.
    for resultLine, targetLine in zip(resultFile, targetFile):
        # split() already discards the trailing newline; slicing off the last
        # character would eat a real character on a final line without one.
        resultWords = resultLine.split()
        targetWords = targetLine.split()
        if not resultWords or not targetWords:
            continue
        sentencesNum += 1
        if sentencesNum % 100 == 0:
            print('finish:%d' % (sentencesNum))

        # Distinct-1 / Distinct-2 bookkeeping.
        wordsNum += len(resultWords)
        unigrams.update(resultWords)
        # Pair each word with its successor; the last word starts no bigram.
        bigrams.update(zip(resultWords, resultWords[1:]))

        # BLEU
        bleuScore += sentence_bleu([targetWords], resultWords)

        # Greedy Matching: rows are generated words, columns are reference words.
        similarities = array([[_word_similarity(w1, w2) for w2 in targetWords]
                              for w1 in resultWords])
        bestForResult = similarities.max(axis=1).mean()
        # In the reference-to-result direction a best match below zero counts
        # as 0, which is how this script has always scored that direction.
        bestForTarget = similarities.max(axis=0).clip(min=0).mean()
        GMScore += (bestForResult + bestForTarget) / 2

        # Embedding Average and Vector Extrema both need at least one
        # in-vocabulary word on each side; otherwise the pair contributes 0.
        resultVectors = _known_vectors(resultWords)
        targetVectors = _known_vectors(targetWords)
        if len(resultVectors) > 0 and len(targetVectors) > 0:
            EAScore += cosine_similarity(resultVectors.mean(axis=0),
                                         targetVectors.mean(axis=0))
            VEScore += cosine_similarity(_extrema_vector(resultVectors),
                                         _extrema_vector(targetVectors))

    # With no usable sentence pair every total is 0; dividing by 1 reports
    # zeros instead of raising ZeroDivisionError.
    sentenceDivisor = sentencesNum or 1
    wordDivisor = wordsNum or 1
    report = [
        "sentencesNum:%d" % (sentencesNum),
        "wordsNum:%d" % (wordsNum),
        "unigrams:%f" % (len(unigrams)/wordDivisor),
        "bigrams:%f" % (len(bigrams)/wordDivisor),
        "bleuScore:%f %f" % (bleuScore*100/sentenceDivisor,bleuScore/sentenceDivisor),
        "GMScore:%f %f" % (GMScore*100/sentenceDivisor,GMScore/sentenceDivisor),
        "EAScore:%f %f" % (EAScore*100/sentenceDivisor,EAScore/sentenceDivisor),
        "VEScore:%f %f" % (VEScore*100/sentenceDivisor,VEScore/sentenceDivisor),
    ]
    # The same lines go to the console and to the result file.
    for line in report:
        print(line)
        merFile.write(line + "\n")