TypeError: unhashable type: 'list'

最新推荐文章于 2023-08-02 17:12:09 发布

后知后觉的计算机菜

最新推荐文章于 2023-08-02 17:12:09 发布

阅读量2.2k

点赞数

分类专栏：待研究

本文链接：https://blog.csdn.net/qq_35664774/article/details/79462805

版权

待研究专栏收录该内容

4 篇文章 0 订阅

订阅专栏

def loadDataSet():
    """Return the hard-coded sample corpus and its per-document labels.

    Returns:
        A ``(documents, labels)`` tuple. ``documents`` is a list of six
        token lists; ``labels`` is a list of six ints (0 or 1), where
        ``labels[i]`` belongs to ``documents[i]``.
    """
    # NOTE(review): the fourth document shares most of its tokens with the
    # fifth but carries the opposite label -- confirm the data is as intended.
    documents = [
        ['my', 'dog', 'has', 'flea', 'problem', 'help', 'please'],
        ['maybe', 'not', 'take', 'him', 'to', 'dog', 'park', 'stupid'],
        ['my', 'dalmation', 'is', 'so', 'cute', 'I', 'love', 'him'],
        ['stop', 'posting', 'ate', 'my', 'steak', 'how', 'to', 'stop', 'him'],
        ['mr', 'licks', 'ate', 'my', 'steak', 'how', 'to', 'stop', 'him'],
        ['quit', 'buying', 'worthless', 'dog', 'food', 'stupid'],
    ]
    labels = [0, 1, 0, 1, 0, 1]
    return documents, labels

def createVocabList(dataSet):
    """Collect every distinct element found across the documents in dataSet.

    Args:
        dataSet: An iterable of documents, each an iterable of hashable
            items (e.g. word strings).

    Returns:
        A list holding each distinct item once. The order comes from set
        iteration and is therefore not defined.

    Raises:
        TypeError: If a document contains an unhashable item such as a list.
    """
    # A single n-ary union replaces the repeated "vocab = vocab | set(doc)".
    unique_words = set().union(*dataSet)
    return list(unique_words)


def setOfWords2Vec(vocabList, inputSet):
    """Encode inputSet as a 0/1 presence vector over vocabList.

    Args:
        vocabList: List of vocabulary words; position i of the result
            corresponds to ``vocabList[i]``.
        inputSet: Iterable of words to encode.

    Returns:
        A list of ints with the same length as ``vocabList``, holding 1 at
        the index of each vocabulary word that occurs in ``inputSet`` and 0
        elsewhere. For every input word missing from the vocabulary a notice
        is printed and the vector is left unchanged.
    """
    returnVec = [0] * len(vocabList)
    for word in inputSet:
        if word in vocabList:
            # Set-of-words model: mark presence only, do not count repeats.
            returnVec[vocabList.index(word)] = 1
        else:
            print("the word:%s is not in my vocabulary" % word)
    # The vector was previously built but never returned, so callers got None.
    return returnVec


# loadDataSet() returns a (documents, labels) pair. Passing the whole pair to
# createVocabList() makes it call set() on the list of token lists, which
# raises "TypeError: unhashable type: 'list'". Unpack the pair and pass only
# the documents.
listOPosts, listClasses = loadDataSet()
myVocabList = createVocabList(listOPosts)
print(myVocabList)