-
Duwairi, R.; Al-Refai, M.N.; Khasawneh, N.: Feature reduction techniques for Arabic text categorization (2009)
0.32
0.31928077 = sum of:
0.31928077 = product of:
0.886891 = sum of:
0.013256678 = weight(abstract_txt:using in 156) [ClassicSimilarity], result of:
0.013256678 = score(doc=156,freq=1.0), product of:
0.06135805 = queryWeight, product of:
1.1244584 = boost
3.4568708 = idf(docFreq=3806, maxDocs=44421)
0.015785014 = queryNorm
0.21605442 = fieldWeight in 156, product of:
1.0 = tf(freq=1.0), with freq of:
1.0 = termFreq=1.0
3.4568708 = idf(docFreq=3806, maxDocs=44421)
0.0625 = fieldNorm(doc=156)
0.01102795 = weight(abstract_txt:that in 156) [ClassicSimilarity], result of:
0.01102795 = score(doc=156,freq=3.0), product of:
0.043075956 = queryWeight, product of:
1.1539068 = boost
2.3649352 = idf(docFreq=11344, maxDocs=44421)
0.015785014 = queryNorm
0.25601172 = fieldWeight in 156, product of:
1.7320508 = tf(freq=3.0), with freq of:
3.0 = termFreq=3.0
2.3649352 = idf(docFreq=11344, maxDocs=44421)
0.0625 = fieldNorm(doc=156)
0.0067064157 = weight(abstract_txt:this in 156) [ClassicSimilarity], result of:
0.0067064157 = score(doc=156,freq=1.0), product of:
0.04459359 = queryWeight, product of:
1.1740578 = boost
2.4062347 = idf(docFreq=10885, maxDocs=44421)
0.015785014 = queryNorm
0.15038967 = fieldWeight in 156, product of:
1.0 = tf(freq=1.0), with freq of:
1.0 = termFreq=1.0
2.4062347 = idf(docFreq=10885, maxDocs=44421)
0.0625 = fieldNorm(doc=156)
0.11673169 = weight(abstract_txt:stem in 156) [ClassicSimilarity], result of:
0.11673169 = score(doc=156,freq=2.0), product of:
0.16482417 = queryWeight, product of:
1.303176 = boost
8.0125885 = idf(docFreq=39, maxDocs=44421)
0.015785014 = queryNorm
0.70821947 = fieldWeight in 156, product of:
1.4142135 = tf(freq=2.0), with freq of:
2.0 = termFreq=2.0
8.0125885 = idf(docFreq=39, maxDocs=44421)
0.0625 = fieldNorm(doc=156)
0.12266552 = weight(abstract_txt:stems in 156) [ClassicSimilarity], result of:
0.12266552 = score(doc=156,freq=2.0), product of:
0.17036356 = queryWeight, product of:
1.3248936 = boost
8.146119 = idf(docFreq=34, maxDocs=44421)
0.015785014 = queryNorm
0.720022 = fieldWeight in 156, product of:
1.4142135 = tf(freq=2.0), with freq of:
2.0 = termFreq=2.0
8.146119 = idf(docFreq=34, maxDocs=44421)
0.0625 = fieldNorm(doc=156)
0.14897434 = weight(abstract_txt:affixes in 156) [ClassicSimilarity], result of:
0.14897434 = score(doc=156,freq=1.0), product of:
0.24433145 = queryWeight, product of:
1.5866543 = boost
9.755557 = idf(docFreq=6, maxDocs=44421)
0.015785014 = queryNorm
0.6097223 = fieldWeight in 156, product of:
1.0 = tf(freq=1.0), with freq of:
1.0 = termFreq=1.0
9.755557 = idf(docFreq=6, maxDocs=44421)
0.0625 = fieldNorm(doc=156)
0.09860431 = weight(abstract_txt:words in 156) [ClassicSimilarity], result of:
0.09860431 = score(doc=156,freq=4.0), product of:
0.14728516 = queryWeight, product of:
1.7421564 = boost
5.355831 = idf(docFreq=569, maxDocs=44421)
0.015785014 = queryNorm
0.6694789 = fieldWeight in 156, product of:
2.0 = tf(freq=4.0), with freq of:
4.0 = termFreq=4.0
5.355831 = idf(docFreq=569, maxDocs=44421)
0.0625 = fieldNorm(doc=156)
0.10321658 = weight(abstract_txt:word in 156) [ClassicSimilarity], result of:
0.10321658 = score(doc=156,freq=4.0), product of:
0.15184298 = queryWeight, product of:
1.768907 = boost
5.4380693 = idf(docFreq=524, maxDocs=44421)
0.015785014 = queryNorm
0.67975867 = fieldWeight in 156, product of:
2.0 = tf(freq=4.0), with freq of:
4.0 = termFreq=4.0
5.4380693 = idf(docFreq=524, maxDocs=44421)
0.0625 = fieldNorm(doc=156)
0.2657075 = weight(abstract_txt:stemming in 156) [ClassicSimilarity], result of:
0.2657075 = score(doc=156,freq=4.0), product of:
0.2852097 = queryWeight, product of:
2.424319 = boost
7.4529724 = idf(docFreq=69, maxDocs=44421)
0.015785014 = queryNorm
0.93162155 = fieldWeight in 156, product of:
2.0 = tf(freq=4.0), with freq of:
4.0 = termFreq=4.0
7.4529724 = idf(docFreq=69, maxDocs=44421)
0.0625 = fieldNorm(doc=156)
0.36 = coord(9/25)
-
Yang, C.C.; Li, K.W.: ¬A heuristic method based on a statistical approach for chinese text segmentation (2005)
0.29
0.2872244 = sum of:
0.2872244 = product of:
1.0258014 = sum of:
0.013483789 = weight(abstract_txt:retrieval in 5580) [ClassicSimilarity], result of:
0.013483789 = score(doc=5580,freq=1.0), product of:
0.062056843 = queryWeight, product of:
1.1308434 = boost
3.4765 = idf(docFreq=3732, maxDocs=44421)
0.015785014 = queryNorm
0.21728125 = fieldWeight in 5580, product of:
1.0 = tf(freq=1.0), with freq of:
1.0 = termFreq=1.0
3.4765 = idf(docFreq=3732, maxDocs=44421)
0.0625 = fieldNorm(doc=5580)
0.009004284 = weight(abstract_txt:that in 5580) [ClassicSimilarity], result of:
0.009004284 = score(doc=5580,freq=2.0), product of:
0.043075956 = queryWeight, product of:
1.1539068 = boost
2.3649352 = idf(docFreq=11344, maxDocs=44421)
0.015785014 = queryNorm
0.20903271 = fieldWeight in 5580, product of:
1.4142135 = tf(freq=2.0), with freq of:
2.0 = termFreq=2.0
2.3649352 = idf(docFreq=11344, maxDocs=44421)
0.0625 = fieldNorm(doc=5580)
0.009484304 = weight(abstract_txt:this in 5580) [ClassicSimilarity], result of:
0.009484304 = score(doc=5580,freq=2.0), product of:
0.04459359 = queryWeight, product of:
1.1740578 = boost
2.4062347 = idf(docFreq=10885, maxDocs=44421)
0.015785014 = queryNorm
0.21268311 = fieldWeight in 5580, product of:
1.4142135 = tf(freq=2.0), with freq of:
2.0 = termFreq=2.0
2.4062347 = idf(docFreq=10885, maxDocs=44421)
0.0625 = fieldNorm(doc=5580)
0.087659396 = weight(abstract_txt:method in 5580) [ClassicSimilarity], result of:
0.087659396 = score(doc=5580,freq=9.0), product of:
0.10392018 = queryWeight, product of:
1.4633815 = boost
4.4988065 = idf(docFreq=1342, maxDocs=44421)
0.015785014 = queryNorm
0.84352624 = fieldWeight in 5580, product of:
3.0 = tf(freq=9.0), with freq of:
9.0 = termFreq=9.0
4.4988065 = idf(docFreq=1342, maxDocs=44421)
0.0625 = fieldNorm(doc=5580)
0.11024297 = weight(abstract_txt:words in 5580) [ClassicSimilarity], result of:
0.11024297 = score(doc=5580,freq=5.0), product of:
0.14728516 = queryWeight, product of:
1.7421564 = boost
5.355831 = idf(docFreq=569, maxDocs=44421)
0.015785014 = queryNorm
0.74850017 = fieldWeight in 5580, product of:
2.236068 = tf(freq=5.0), with freq of:
5.0 = termFreq=5.0
5.355831 = idf(docFreq=569, maxDocs=44421)
0.0625 = fieldNorm(doc=5580)
0.07298514 = weight(abstract_txt:word in 5580) [ClassicSimilarity], result of:
0.07298514 = score(doc=5580,freq=2.0), product of:
0.15184298 = queryWeight, product of:
1.768907 = boost
5.4380693 = idf(docFreq=524, maxDocs=44421)
0.015785014 = queryNorm
0.48066196 = fieldWeight in 5580, product of:
1.4142135 = tf(freq=2.0), with freq of:
2.0 = termFreq=2.0
5.4380693 = idf(docFreq=524, maxDocs=44421)
0.0625 = fieldNorm(doc=5580)
0.7229415 = weight(abstract_txt:segmentation in 5580) [ClassicSimilarity], result of:
0.7229415 = score(doc=5580,freq=9.0), product of:
0.48558667 = queryWeight, product of:
3.874241 = boost
7.9402676 = idf(docFreq=42, maxDocs=44421)
0.015785014 = queryNorm
1.4888002 = fieldWeight in 5580, product of:
3.0 = tf(freq=9.0), with freq of:
9.0 = termFreq=9.0
7.9402676 = idf(docFreq=42, maxDocs=44421)
0.0625 = fieldNorm(doc=5580)
0.28 = coord(7/25)
-
Wang, F.L.; Yang, C.C.: Mining Web data for Chinese segmentation (2007)
0.27
0.2733752 = sum of:
0.2733752 = product of:
0.97634 = sum of:
0.013483789 = weight(abstract_txt:retrieval in 1604) [ClassicSimilarity], result of:
0.013483789 = score(doc=1604,freq=1.0), product of:
0.062056843 = queryWeight, product of:
1.1308434 = boost
3.4765 = idf(docFreq=3732, maxDocs=44421)
0.015785014 = queryNorm
0.21728125 = fieldWeight in 1604, product of:
1.0 = tf(freq=1.0), with freq of:
1.0 = termFreq=1.0
3.4765 = idf(docFreq=3732, maxDocs=44421)
0.0625 = fieldNorm(doc=1604)
0.01350877 = weight(abstract_txt:results in 1604) [ClassicSimilarity], result of:
0.01350877 = score(doc=1604,freq=1.0), product of:
0.06213347 = queryWeight, product of:
1.1315414 = boost
3.4786456 = idf(docFreq=3724, maxDocs=44421)
0.015785014 = queryNorm
0.21741535 = fieldWeight in 1604, product of:
1.0 = tf(freq=1.0), with freq of:
1.0 = termFreq=1.0
3.4786456 = idf(docFreq=3724, maxDocs=44421)
0.0625 = fieldNorm(doc=1604)
0.009004284 = weight(abstract_txt:that in 1604) [ClassicSimilarity], result of:
0.009004284 = score(doc=1604,freq=2.0), product of:
0.043075956 = queryWeight, product of:
1.1539068 = boost
2.3649352 = idf(docFreq=11344, maxDocs=44421)
0.015785014 = queryNorm
0.20903271 = fieldWeight in 1604, product of:
1.4142135 = tf(freq=2.0), with freq of:
2.0 = termFreq=2.0
2.3649352 = idf(docFreq=11344, maxDocs=44421)
0.0625 = fieldNorm(doc=1604)
0.0067064157 = weight(abstract_txt:this in 1604) [ClassicSimilarity], result of:
0.0067064157 = score(doc=1604,freq=1.0), product of:
0.04459359 = queryWeight, product of:
1.1740578 = boost
2.4062347 = idf(docFreq=10885, maxDocs=44421)
0.015785014 = queryNorm
0.15038967 = fieldWeight in 1604, product of:
1.0 = tf(freq=1.0), with freq of:
1.0 = termFreq=1.0
2.4062347 = idf(docFreq=10885, maxDocs=44421)
0.0625 = fieldNorm(doc=1604)
0.09860431 = weight(abstract_txt:words in 1604) [ClassicSimilarity], result of:
0.09860431 = score(doc=1604,freq=4.0), product of:
0.14728516 = queryWeight, product of:
1.7421564 = boost
5.355831 = idf(docFreq=569, maxDocs=44421)
0.015785014 = queryNorm
0.6694789 = fieldWeight in 1604, product of:
2.0 = tf(freq=4.0), with freq of:
4.0 = termFreq=4.0
5.355831 = idf(docFreq=569, maxDocs=44421)
0.0625 = fieldNorm(doc=1604)
0.07298514 = weight(abstract_txt:word in 1604) [ClassicSimilarity], result of:
0.07298514 = score(doc=1604,freq=2.0), product of:
0.15184298 = queryWeight, product of:
1.768907 = boost
5.4380693 = idf(docFreq=524, maxDocs=44421)
0.015785014 = queryNorm
0.48066196 = fieldWeight in 1604, product of:
1.4142135 = tf(freq=2.0), with freq of:
2.0 = termFreq=2.0
5.4380693 = idf(docFreq=524, maxDocs=44421)
0.0625 = fieldNorm(doc=1604)
0.7620473 = weight(abstract_txt:segmentation in 1604) [ClassicSimilarity], result of:
0.7620473 = score(doc=1604,freq=10.0), product of:
0.48558667 = queryWeight, product of:
3.874241 = boost
7.9402676 = idf(docFreq=42, maxDocs=44421)
0.015785014 = queryNorm
1.5693332 = fieldWeight in 1604, product of:
3.1622777 = tf(freq=10.0), with freq of:
10.0 = termFreq=10.0
7.9402676 = idf(docFreq=42, maxDocs=44421)
0.0625 = fieldNorm(doc=1604)
0.28 = coord(7/25)
-
Abu-Salem, H.; Al-Omari, M.; Evens, M.W.: Stemming methodologies over individual query words for an Arabic information retrieval system (1999)
0.25
0.2502525 = sum of:
0.2502525 = product of:
0.6256312 = sum of:
0.0324721 = weight(abstract_txt:using in 4672) [ClassicSimilarity], result of:
0.0324721 = score(doc=4672,freq=6.0), product of:
0.06135805 = queryWeight, product of:
1.1244584 = boost
3.4568708 = idf(docFreq=3806, maxDocs=44421)
0.015785014 = queryNorm
0.52922314 = fieldWeight in 4672, product of:
2.4494898 = tf(freq=6.0), with freq of:
6.0 = termFreq=6.0
3.4568708 = idf(docFreq=3806, maxDocs=44421)
0.0625 = fieldNorm(doc=4672)
0.023354605 = weight(abstract_txt:retrieval in 4672) [ClassicSimilarity], result of:
0.023354605 = score(doc=4672,freq=3.0), product of:
0.062056843 = queryWeight, product of:
1.1308434 = boost
3.4765 = idf(docFreq=3732, maxDocs=44421)
0.015785014 = queryNorm
0.37634215 = fieldWeight in 4672, product of:
1.7320508 = tf(freq=3.0), with freq of:
3.0 = termFreq=3.0
3.4765 = idf(docFreq=3732, maxDocs=44421)
0.0625 = fieldNorm(doc=4672)
0.01350877 = weight(abstract_txt:results in 4672) [ClassicSimilarity], result of:
0.01350877 = score(doc=4672,freq=1.0), product of:
0.06213347 = queryWeight, product of:
1.1315414 = boost
3.4786456 = idf(docFreq=3724, maxDocs=44421)
0.015785014 = queryNorm
0.21741535 = fieldWeight in 4672, product of:
1.0 = tf(freq=1.0), with freq of:
1.0 = termFreq=1.0
3.4786456 = idf(docFreq=3724, maxDocs=44421)
0.0625 = fieldNorm(doc=4672)
0.01102795 = weight(abstract_txt:that in 4672) [ClassicSimilarity], result of:
0.01102795 = score(doc=4672,freq=3.0), product of:
0.043075956 = queryWeight, product of:
1.1539068 = boost
2.3649352 = idf(docFreq=11344, maxDocs=44421)
0.015785014 = queryNorm
0.25601172 = fieldWeight in 4672, product of:
1.7320508 = tf(freq=3.0), with freq of:
3.0 = termFreq=3.0
2.3649352 = idf(docFreq=11344, maxDocs=44421)
0.0625 = fieldNorm(doc=4672)
0.009484304 = weight(abstract_txt:this in 4672) [ClassicSimilarity], result of:
0.009484304 = score(doc=4672,freq=2.0), product of:
0.04459359 = queryWeight, product of:
1.1740578 = boost
2.4062347 = idf(docFreq=10885, maxDocs=44421)
0.015785014 = queryNorm
0.21268311 = fieldWeight in 4672, product of:
1.4142135 = tf(freq=2.0), with freq of:
2.0 = termFreq=2.0
2.4062347 = idf(docFreq=10885, maxDocs=44421)
0.0625 = fieldNorm(doc=4672)
0.14296652 = weight(abstract_txt:stem in 4672) [ClassicSimilarity], result of:
0.14296652 = score(doc=4672,freq=3.0), product of:
0.16482417 = queryWeight, product of:
1.303176 = boost
8.0125885 = idf(docFreq=39, maxDocs=44421)
0.015785014 = queryNorm
0.8673881 = fieldWeight in 4672, product of:
1.7320508 = tf(freq=3.0), with freq of:
3.0 = termFreq=3.0
8.0125885 = idf(docFreq=39, maxDocs=44421)
0.0625 = fieldNorm(doc=4672)
0.08264607 = weight(abstract_txt:method in 4672) [ClassicSimilarity], result of:
0.08264607 = score(doc=4672,freq=8.0), product of:
0.10392018 = queryWeight, product of:
1.4633815 = boost
4.4988065 = idf(docFreq=1342, maxDocs=44421)
0.015785014 = queryNorm
0.79528415 = fieldWeight in 4672, product of:
2.828427 = tf(freq=8.0), with freq of:
8.0 = termFreq=8.0
4.4988065 = idf(docFreq=1342, maxDocs=44421)
0.0625 = fieldNorm(doc=4672)
0.049302153 = weight(abstract_txt:words in 4672) [ClassicSimilarity], result of:
0.049302153 = score(doc=4672,freq=1.0), product of:
0.14728516 = queryWeight, product of:
1.7421564 = boost
5.355831 = idf(docFreq=569, maxDocs=44421)
0.015785014 = queryNorm
0.33473945 = fieldWeight in 4672, product of:
1.0 = tf(freq=1.0), with freq of:
1.0 = termFreq=1.0
5.355831 = idf(docFreq=569, maxDocs=44421)
0.0625 = fieldNorm(doc=4672)
0.07298514 = weight(abstract_txt:word in 4672) [ClassicSimilarity], result of:
0.07298514 = score(doc=4672,freq=2.0), product of:
0.15184298 = queryWeight, product of:
1.768907 = boost
5.4380693 = idf(docFreq=524, maxDocs=44421)
0.015785014 = queryNorm
0.48066196 = fieldWeight in 4672, product of:
1.4142135 = tf(freq=2.0), with freq of:
2.0 = termFreq=2.0
5.4380693 = idf(docFreq=524, maxDocs=44421)
0.0625 = fieldNorm(doc=4672)
0.18788356 = weight(abstract_txt:stemming in 4672) [ClassicSimilarity], result of:
0.18788356 = score(doc=4672,freq=2.0), product of:
0.2852097 = queryWeight, product of:
2.424319 = boost
7.4529724 = idf(docFreq=69, maxDocs=44421)
0.015785014 = queryNorm
0.6587559 = fieldWeight in 4672, product of:
1.4142135 = tf(freq=2.0), with freq of:
2.0 = termFreq=2.0
7.4529724 = idf(docFreq=69, maxDocs=44421)
0.0625 = fieldNorm(doc=4672)
0.4 = coord(10/25)
-
Mustafa, S.H.: Word-oriented approximate string matching using occurrence heuristic tables : a heuristic for searching Arabic text (2005)
0.21
0.20761232 = sum of:
0.20761232 = product of:
0.6487885 = sum of:
0.028701551 = weight(abstract_txt:using in 2715) [ClassicSimilarity], result of:
0.028701551 = score(doc=2715,freq=3.0), product of:
0.06135805 = queryWeight, product of:
1.1244584 = boost
3.4568708 = idf(docFreq=3806, maxDocs=44421)
0.015785014 = queryNorm
0.46777156 = fieldWeight in 2715, product of:
1.7320508 = tf(freq=3.0), with freq of:
3.0 = termFreq=3.0
3.4568708 = idf(docFreq=3806, maxDocs=44421)
0.078125 = fieldNorm(doc=2715)
0.016885962 = weight(abstract_txt:results in 2715) [ClassicSimilarity], result of:
0.016885962 = score(doc=2715,freq=1.0), product of:
0.06213347 = queryWeight, product of:
1.1315414 = boost
3.4786456 = idf(docFreq=3724, maxDocs=44421)
0.015785014 = queryNorm
0.2717692 = fieldWeight in 2715, product of:
1.0 = tf(freq=1.0), with freq of:
1.0 = termFreq=1.0
3.4786456 = idf(docFreq=3724, maxDocs=44421)
0.078125 = fieldNorm(doc=2715)
0.007958737 = weight(abstract_txt:that in 2715) [ClassicSimilarity], result of:
0.007958737 = score(doc=2715,freq=1.0), product of:
0.043075956 = queryWeight, product of:
1.1539068 = boost
2.3649352 = idf(docFreq=11344, maxDocs=44421)
0.015785014 = queryNorm
0.18476056 = fieldWeight in 2715, product of:
1.0 = tf(freq=1.0), with freq of:
1.0 = termFreq=1.0
2.3649352 = idf(docFreq=11344, maxDocs=44421)
0.078125 = fieldNorm(doc=2715)
0.00838302 = weight(abstract_txt:this in 2715) [ClassicSimilarity], result of:
0.00838302 = score(doc=2715,freq=1.0), product of:
0.04459359 = queryWeight, product of:
1.1740578 = boost
2.4062347 = idf(docFreq=10885, maxDocs=44421)
0.015785014 = queryNorm
0.18798709 = fieldWeight in 2715, product of:
1.0 = tf(freq=1.0), with freq of:
1.0 = termFreq=1.0
2.4062347 = idf(docFreq=10885, maxDocs=44421)
0.078125 = fieldNorm(doc=2715)
0.18621792 = weight(abstract_txt:affixes in 2715) [ClassicSimilarity], result of:
0.18621792 = score(doc=2715,freq=1.0), product of:
0.24433145 = queryWeight, product of:
1.5866543 = boost
9.755557 = idf(docFreq=6, maxDocs=44421)
0.015785014 = queryNorm
0.7621529 = fieldWeight in 2715, product of:
1.0 = tf(freq=1.0), with freq of:
1.0 = termFreq=1.0
9.755557 = idf(docFreq=6, maxDocs=44421)
0.078125 = fieldNorm(doc=2715)
0.10674229 = weight(abstract_txt:words in 2715) [ClassicSimilarity], result of:
0.10674229 = score(doc=2715,freq=3.0), product of:
0.14728516 = queryWeight, product of:
1.7421564 = boost
5.355831 = idf(docFreq=569, maxDocs=44421)
0.015785014 = queryNorm
0.72473216 = fieldWeight in 2715, product of:
1.7320508 = tf(freq=3.0), with freq of:
3.0 = termFreq=3.0
5.355831 = idf(docFreq=569, maxDocs=44421)
0.078125 = fieldNorm(doc=2715)
0.06451036 = weight(abstract_txt:word in 2715) [ClassicSimilarity], result of:
0.06451036 = score(doc=2715,freq=1.0), product of:
0.15184298 = queryWeight, product of:
1.768907 = boost
5.4380693 = idf(docFreq=524, maxDocs=44421)
0.015785014 = queryNorm
0.42484915 = fieldWeight in 2715, product of:
1.0 = tf(freq=1.0), with freq of:
1.0 = termFreq=1.0
5.4380693 = idf(docFreq=524, maxDocs=44421)
0.078125 = fieldNorm(doc=2715)
0.22938865 = weight(abstract_txt:letter in 2715) [ClassicSimilarity], result of:
0.22938865 = score(doc=2715,freq=1.0), product of:
0.35374448 = queryWeight, product of:
2.6999297 = boost
8.30027 = idf(docFreq=29, maxDocs=44421)
0.015785014 = queryNorm
0.6484586 = fieldWeight in 2715, product of:
1.0 = tf(freq=1.0), with freq of:
1.0 = termFreq=1.0
8.30027 = idf(docFreq=29, maxDocs=44421)
0.078125 = fieldNorm(doc=2715)
0.32 = coord(8/25)