Sorensen–Dice coefficient: Difference between revisions

m
add a docstring
m (Python example)
m (add a docstring)
Line 314:
 
from multiset import Multiset
 
 
def tokenizetext(txt):
    ''' Convert text to a Multiset of lower-cased unigrams and bigrams.

    The text is lower-cased and split on single space characters.
    A one-character word contributes itself; any other word contributes
    each of its overlapping two-character slices. Zero-length words
    (produced by consecutive, leading or trailing spaces) contribute
    nothing, so an empty string yields an empty Multiset.
    '''
    arr = []
    for wrd in txt.lower().split(' '):
        if len(wrd) == 1:
            # A lone character has no bigram, so keep it as a unigram.
            arr.append(wrd)
        else:
            # Sliding window of width 2; empty for zero-length words.
            arr.extend(wrd[i:i+2] for i in range(len(wrd) - 1))
    return Multiset(arr)
 
 
def sorenson_dice(s1text1, s2text2):
    ''' Sorensen-Dice similarity of two texts, compared as Multisets.

    Each text is tokenized with tokenizetext(); the result is twice the
    size of the intersection of the two token Multisets divided by the
    sum of their sizes.

    Raises ZeroDivisionError when both texts tokenize to empty Multisets.
    '''
    first_tokens = tokenizetext(s1text1)
    second_tokens = tokenizetext(s2text2)
    shared = first_tokens & second_tokens
    combined_size = len(first_tokens) + len(second_tokens)
    return 2 * len(shared) / combined_size
 
Line 368 ⟶ 371:
0.600000 Lah numbers
</pre>
 
 
=={{header|Raku}}==
4,102

edits