Python类型错误（TypeError），即使我只处理int和float

bm25 = tf * (k + 1)
bm25 = bm25 / (k * (1 - b + b * dl / avdl) + tf)
bm25 = bm25 * math.log(n/df, 2)

  File "inverted_index.py", line 116, in read_from_file
    bm25 = tf * (k + 1)
TypeError: cannot concatenate 'str' and 'int' objects

bm25 = tf * (k + 1)
bm25 = bm25 / (k * (1 - b + b * dl / avdl) + tf)
bm25 = bm25 * math.log(n/df, 2)

  File "inverted_index.py", line 117, in read_from_file
    bm25 = bm25 / (k * (1 - b + b * dl / avdl) + tf)
TypeError: unsupported operand type(s) for -: 'int' and 'str'

def read_from_file(self, file_name, b, k):
    """
    Build the inverted index from a file and score every posting with BM25.

    Each line of the file is one record. The stripped line is split on tabs
    and appended to ``self.records``; its words (maximal runs of ASCII
    letters, lower-cased) are added to ``self.inverted_lists``, which maps
    each word to a list of ``(record_id, score)`` tuples. Record ids start
    at 1 and follow line order. Scores are rounded to three decimals.

    Args:
        file_name: Path of the file to index.
        b: BM25 length-normalisation parameter. May be a number or a
            numeric string (for example a raw command-line argument).
            Ignored when ``k`` is infinite.
        k: BM25 term-frequency saturation parameter. May be a number, a
            numeric string, or infinity (``"inf"`` or ``float("inf")``),
            in which case the score is plain ``tf * idf``.

    Raises:
        ValueError: If ``k`` (or ``b``, when it is used) cannot be
            converted to a float.

    >>> ii = InvertedIndex()
    >>> ii.read_from_file("example.txt", b=0, k="inf")
    >>> sorted(ii.inverted_lists.items())  # doctest: +NORMALIZE_WHITESPACE
    [('animated', [(1, 0.415), (2, 0.415), (4, 0.415)]),
     ('animation', [(3, 2.0)]), ('film', [(2, 1.0), (4, 1.0)]),
     ('movie', [(1, 0.0), (2, 0.0), (3, 0.0), (4, 0.0)]),
     ('non', [(2, 2.0)]),
     ('short', [(3, 1.0), (4, 2.0)])]

    >>> ii = InvertedIndex()
    >>> ii.read_from_file("example.txt", b=0.75, k=1.75)
    >>> sorted(ii.inverted_lists.items())  # doctest: +NORMALIZE_WHITESPACE
    [('animated', [(1, 0.459), (2, 0.402), (4, 0.358)]),
     ('animation', [(3, 2.211)]), ('film', [(2, 0.969), (4, 0.863)]),
     ('movie', [(1, 0.0), (2, 0.0), (3, 0.0), (4, 0.0)]),
     ('non', [(2, 1.938)]),
     ('short', [(3, 1.106), (4, 1.313)])]
    """
    # Convert the parameters once, up front: callers may hand over raw
    # strings (e.g. from sys.argv), and str/int arithmetic raises TypeError.
    k = float(k)
    saturating = not math.isinf(k)
    if saturating:
        # b only matters for finite k, so it is only validated in that case.
        b = float(b)

    # First pass: collect raw term frequencies and the length of each record.
    doc_lengths = []
    with open(file_name, "r") as file:
        for record_id, line in enumerate(file, 1):
            line = line.strip()
            # Store the record as a tuple (title, description).
            self.records.append(tuple(line.split("\t")))
            dl = 0
            for word in re.findall(r"[A-Za-z]+", line):
                word = word.lower()
                dl += 1
                postings = self.inverted_lists.setdefault(word, [])
                if postings and postings[-1][0] == record_id:
                    # Word already seen in this record: bump its tf so the
                    # list contains each record id at most once.
                    postings[-1] = (record_id, postings[-1][1] + 1)
                else:
                    postings.append((record_id, 1))
            doc_lengths.append(dl)

    n = len(doc_lengths)
    if n == 0:
        # Empty file: nothing to score, and avdl would divide by zero.
        return
    # float() keeps the divisions exact under Python 2 as well.
    avdl = float(sum(doc_lengths)) / n

    # Second pass: replace every raw tf with its BM25 score.
    for postings in self.inverted_lists.values():
        idf = math.log(float(n) / len(postings), 2)
        for pos, (record_id, tf) in enumerate(postings):
            if saturating:
                dl = doc_lengths[record_id - 1]
                length_norm = 1.0 - b + b * dl / avdl
                score = tf * (k + 1.0) / (k * length_norm + tf) * idf
            else:
                # k = infinity: no saturation, the score is tf * idf.
                score = tf * idf
            postings[pos] = (record_id, round(score, 3))

bm25 = float(tf) * (float(k) + float(1)) bm25 = bm25 / (float(k) * (float(1) - float(b) + float(b) * float(dl) / float(avdl)) + float(tf)) bm25 = bm25 * math.log(n/df, 2)

1条回答

网友

1楼 · 发布于 2024-05-15 17:40:13

好吧，我想我找到了字符串的来源：

# Entries of sys.argv are always str objects, so b and k are handed to
# read_from_file as text (e.g. "0.75"), not as numbers.
file_name = sys.argv[1]
b = sys.argv[2]
k = sys.argv[3]

# Build the index from the given file using the raw command-line values.
ii = InvertedIndex()
ii.read_from_file(file_name, b, k)

我的main方法获取用户输入并将其传递给我的方法。我原以为它不会把用户输入解释为字符串——我仍然需要习惯动态类型……

谢谢大家的帮助！

相关问题更多 >

编程相关推荐

热门问题

热门文章