-
Barrio, P.; Gravano, L.: Sampling strategies for information extraction over the deep web (2017)
0.24
0.23529962 = sum of:
0.23529962 = product of:
0.7353113 = sum of:
0.013497912 = weight(abstract_txt:paper in 4412) [ClassicSimilarity], result of:
0.013497912 = score(doc=4412,freq=2.0), product of:
0.050417967 = queryWeight, product of:
1.0072844 = boost
3.4616103 = idf(docFreq=3788, maxDocs=44421)
0.014459559 = queryNorm
0.26772028 = fieldWeight in 4412, product of:
1.4142135 = tf(freq=2.0), with freq of:
2.0 = termFreq=2.0
3.4616103 = idf(docFreq=3788, maxDocs=44421)
0.0546875 = fieldNorm(doc=4412)
0.040741183 = weight(abstract_txt:document in 4412) [ClassicSimilarity], result of:
0.040741183 = score(doc=4412,freq=5.0), product of:
0.077586 = queryWeight, product of:
1.2495428 = boost
4.29415 = idf(docFreq=1647, maxDocs=44421)
0.014459559 = queryNorm
0.52510995 = fieldWeight in 4412, product of:
2.236068 = tf(freq=5.0), with freq of:
5.0 = termFreq=5.0
4.29415 = idf(docFreq=1647, maxDocs=44421)
0.0546875 = fieldNorm(doc=4412)
0.063593075 = weight(abstract_txt:natural in 4412) [ClassicSimilarity], result of:
0.063593075 = score(doc=4412,freq=2.0), product of:
0.16219766 = queryWeight, product of:
2.2127247 = boost
5.0694656 = idf(docFreq=758, maxDocs=44421)
0.014459559 = queryNorm
0.39207146 = fieldWeight in 4412, product of:
1.4142135 = tf(freq=2.0), with freq of:
2.0 = termFreq=2.0
5.0694656 = idf(docFreq=758, maxDocs=44421)
0.0546875 = fieldNorm(doc=4412)
0.17779207 = weight(abstract_txt:execution in 4412) [ClassicSimilarity], result of:
0.17779207 = score(doc=4412,freq=2.0), product of:
0.28120038 = queryWeight, product of:
2.378852 = boost
8.175107 = idf(docFreq=33, maxDocs=44421)
0.014459559 = queryNorm
0.63226116 = fieldWeight in 4412, product of:
1.4142135 = tf(freq=2.0), with freq of:
2.0 = termFreq=2.0
8.175107 = idf(docFreq=33, maxDocs=44421)
0.0546875 = fieldNorm(doc=4412)
0.047225736 = weight(abstract_txt:language in 4412) [ClassicSimilarity], result of:
0.047225736 = score(doc=4412,freq=2.0), product of:
0.14639854 = queryWeight, product of:
2.4274082 = boost
4.1709876 = idf(docFreq=1863, maxDocs=44421)
0.014459559 = queryNorm
0.32258338 = fieldWeight in 4412, product of:
1.4142135 = tf(freq=2.0), with freq of:
2.0 = termFreq=2.0
4.1709876 = idf(docFreq=1863, maxDocs=44421)
0.0546875 = fieldNorm(doc=4412)
0.14059266 = weight(abstract_txt:text in 4412) [ClassicSimilarity], result of:
0.14059266 = score(doc=4412,freq=7.0), product of:
0.24046363 = queryWeight, product of:
4.115458 = boost
4.040882 = idf(docFreq=2122, maxDocs=44421)
0.014459559 = queryNorm
0.5846733 = fieldWeight in 4412, product of:
2.6457512 = tf(freq=7.0), with freq of:
7.0 = termFreq=7.0
4.040882 = idf(docFreq=2122, maxDocs=44421)
0.0546875 = fieldNorm(doc=4412)
0.11661692 = weight(abstract_txt:processing in 4412) [ClassicSimilarity], result of:
0.11661692 = score(doc=4412,freq=2.0), product of:
0.30616516 = queryWeight, product of:
4.299302 = boost
4.9249606 = idf(docFreq=876, maxDocs=44421)
0.014459559 = queryNorm
0.38089547 = fieldWeight in 4412, product of:
1.4142135 = tf(freq=2.0), with freq of:
2.0 = termFreq=2.0
4.9249606 = idf(docFreq=876, maxDocs=44421)
0.0546875 = fieldNorm(doc=4412)
0.13525178 = weight(abstract_txt:mining in 4412) [ClassicSimilarity], result of:
0.13525178 = score(doc=4412,freq=1.0), product of:
0.40070638 = queryWeight, product of:
4.489961 = boost
6.1720386 = idf(docFreq=251, maxDocs=44421)
0.014459559 = queryNorm
0.33753335 = fieldWeight in 4412, product of:
1.0 = tf(freq=1.0), with freq of:
1.0 = termFreq=1.0
6.1720386 = idf(docFreq=251, maxDocs=44421)
0.0546875 = fieldNorm(doc=4412)
0.32 = coord(8/25)
-
Haravu, L.J.; Neelameghan, A.: Text mining and data mining in knowledge organization and discovery : the making of knowledge-based products (2003)
0.21
0.21280433 = sum of:
0.21280433 = product of:
0.7600155 = sum of:
0.020893741 = weight(abstract_txt:presents in 653) [ClassicSimilarity], result of:
0.020893741 = score(doc=653,freq=1.0), product of:
0.07776195 = queryWeight, product of:
1.2509588 = boost
4.299016 = idf(docFreq=1639, maxDocs=44421)
0.014459559 = queryNorm
0.2686885 = fieldWeight in 653, product of:
1.0 = tf(freq=1.0), with freq of:
1.0 = termFreq=1.0
4.299016 = idf(docFreq=1639, maxDocs=44421)
0.0625 = fieldNorm(doc=653)
0.027941557 = weight(abstract_txt:applications in 653) [ClassicSimilarity], result of:
0.027941557 = score(doc=653,freq=1.0), product of:
0.09438943 = queryWeight, product of:
1.3782282 = boost
4.7363873 = idf(docFreq=1058, maxDocs=44421)
0.014459559 = queryNorm
0.2960242 = fieldWeight in 653, product of:
1.0 = tf(freq=1.0), with freq of:
1.0 = termFreq=1.0
4.7363873 = idf(docFreq=1058, maxDocs=44421)
0.0625 = fieldNorm(doc=653)
0.05139097 = weight(abstract_txt:natural in 653) [ClassicSimilarity], result of:
0.05139097 = score(doc=653,freq=1.0), product of:
0.16219766 = queryWeight, product of:
2.2127247 = boost
5.0694656 = idf(docFreq=758, maxDocs=44421)
0.014459559 = queryNorm
0.3168416 = fieldWeight in 653, product of:
1.0 = tf(freq=1.0), with freq of:
1.0 = termFreq=1.0
5.0694656 = idf(docFreq=758, maxDocs=44421)
0.0625 = fieldNorm(doc=653)
0.038164157 = weight(abstract_txt:language in 653) [ClassicSimilarity], result of:
0.038164157 = score(doc=653,freq=1.0), product of:
0.14639854 = queryWeight, product of:
2.4274082 = boost
4.1709876 = idf(docFreq=1863, maxDocs=44421)
0.014459559 = queryNorm
0.26068673 = fieldWeight in 653, product of:
1.0 = tf(freq=1.0), with freq of:
1.0 = termFreq=1.0
4.1709876 = idf(docFreq=1863, maxDocs=44421)
0.0625 = fieldNorm(doc=653)
0.1487583 = weight(abstract_txt:text in 653) [ClassicSimilarity], result of:
0.1487583 = score(doc=653,freq=6.0), product of:
0.24046363 = queryWeight, product of:
4.115458 = boost
4.040882 = idf(docFreq=2122, maxDocs=44421)
0.014459559 = queryNorm
0.61863124 = fieldWeight in 653, product of:
2.4494898 = tf(freq=6.0), with freq of:
6.0 = termFreq=6.0
4.040882 = idf(docFreq=2122, maxDocs=44421)
0.0625 = fieldNorm(doc=653)
0.09424071 = weight(abstract_txt:processing in 653) [ClassicSimilarity], result of:
0.09424071 = score(doc=653,freq=1.0), product of:
0.30616516 = queryWeight, product of:
4.299302 = boost
4.9249606 = idf(docFreq=876, maxDocs=44421)
0.014459559 = queryNorm
0.30781004 = fieldWeight in 653, product of:
1.0 = tf(freq=1.0), with freq of:
1.0 = termFreq=1.0
4.9249606 = idf(docFreq=876, maxDocs=44421)
0.0625 = fieldNorm(doc=653)
0.37862608 = weight(abstract_txt:mining in 653) [ClassicSimilarity], result of:
0.37862608 = score(doc=653,freq=6.0), product of:
0.40070638 = queryWeight, product of:
4.489961 = boost
6.1720386 = idf(docFreq=251, maxDocs=44421)
0.014459559 = queryNorm
0.9448966 = fieldWeight in 653, product of:
2.4494898 = tf(freq=6.0), with freq of:
6.0 = termFreq=6.0
6.1720386 = idf(docFreq=251, maxDocs=44421)
0.0625 = fieldNorm(doc=653)
0.28 = coord(7/25)
-
Tonkin, E.L.; Tourte, G.J.L.: Working with text. tools, techniques and approaches for text mining (2016)
0.21
0.21199487 = sum of:
0.21199487 = product of:
0.883312 = sum of:
0.027941557 = weight(abstract_txt:applications in 19) [ClassicSimilarity], result of:
0.027941557 = score(doc=19,freq=1.0), product of:
0.09438943 = queryWeight, product of:
1.3782282 = boost
4.7363873 = idf(docFreq=1058, maxDocs=44421)
0.014459559 = queryNorm
0.2960242 = fieldWeight in 19, product of:
1.0 = tf(freq=1.0), with freq of:
1.0 = termFreq=1.0
4.7363873 = idf(docFreq=1058, maxDocs=44421)
0.0625 = fieldNorm(doc=19)
0.05139097 = weight(abstract_txt:natural in 19) [ClassicSimilarity], result of:
0.05139097 = score(doc=19,freq=1.0), product of:
0.16219766 = queryWeight, product of:
2.2127247 = boost
5.0694656 = idf(docFreq=758, maxDocs=44421)
0.014459559 = queryNorm
0.3168416 = fieldWeight in 19, product of:
1.0 = tf(freq=1.0), with freq of:
1.0 = termFreq=1.0
5.0694656 = idf(docFreq=758, maxDocs=44421)
0.0625 = fieldNorm(doc=19)
0.05397227 = weight(abstract_txt:language in 19) [ClassicSimilarity], result of:
0.05397227 = score(doc=19,freq=2.0), product of:
0.14639854 = queryWeight, product of:
2.4274082 = boost
4.1709876 = idf(docFreq=1863, maxDocs=44421)
0.014459559 = queryNorm
0.3686667 = fieldWeight in 19, product of:
1.4142135 = tf(freq=2.0), with freq of:
2.0 = termFreq=2.0
4.1709876 = idf(docFreq=1863, maxDocs=44421)
0.0625 = fieldNorm(doc=19)
0.19204615 = weight(abstract_txt:text in 19) [ClassicSimilarity], result of:
0.19204615 = score(doc=19,freq=10.0), product of:
0.24046363 = queryWeight, product of:
4.115458 = boost
4.040882 = idf(docFreq=2122, maxDocs=44421)
0.014459559 = queryNorm
0.7986495 = fieldWeight in 19, product of:
3.1622777 = tf(freq=10.0), with freq of:
10.0 = termFreq=10.0
4.040882 = idf(docFreq=2122, maxDocs=44421)
0.0625 = fieldNorm(doc=19)
0.09424071 = weight(abstract_txt:processing in 19) [ClassicSimilarity], result of:
0.09424071 = score(doc=19,freq=1.0), product of:
0.30616516 = queryWeight, product of:
4.299302 = boost
4.9249606 = idf(docFreq=876, maxDocs=44421)
0.014459559 = queryNorm
0.30781004 = fieldWeight in 19, product of:
1.0 = tf(freq=1.0), with freq of:
1.0 = termFreq=1.0
4.9249606 = idf(docFreq=876, maxDocs=44421)
0.0625 = fieldNorm(doc=19)
0.46372035 = weight(abstract_txt:mining in 19) [ClassicSimilarity], result of:
0.46372035 = score(doc=19,freq=9.0), product of:
0.40070638 = queryWeight, product of:
4.489961 = boost
6.1720386 = idf(docFreq=251, maxDocs=44421)
0.014459559 = queryNorm
1.1572572 = fieldWeight in 19, product of:
3.0 = tf(freq=9.0), with freq of:
9.0 = termFreq=9.0
6.1720386 = idf(docFreq=251, maxDocs=44421)
0.0625 = fieldNorm(doc=19)
0.24 = coord(6/25)
-
Teich, E.; Degaetano-Ortlieb, S.; Fankhauser, P.; Kermes, H.; Lapshinova-Koltunski, E.: ¬The linguistic construal of disciplinarity : a data-mining approach using register features (2016)
0.20
0.19808747 = sum of:
0.19808747 = product of:
0.7074552 = sum of:
0.053365085 = weight(abstract_txt:speech in 4015) [ClassicSimilarity], result of:
0.053365085 = score(doc=4015,freq=1.0), product of:
0.09938277 = queryWeight, product of:
6.8731537 = idf(docFreq=124, maxDocs=44421)
0.014459559 = queryNorm
0.53696513 = fieldWeight in 4015, product of:
1.0 = tf(freq=1.0), with freq of:
1.0 = termFreq=1.0
6.8731537 = idf(docFreq=124, maxDocs=44421)
0.078125 = fieldNorm(doc=4015)
0.06423871 = weight(abstract_txt:natural in 4015) [ClassicSimilarity], result of:
0.06423871 = score(doc=4015,freq=1.0), product of:
0.16219766 = queryWeight, product of:
2.2127247 = boost
5.0694656 = idf(docFreq=758, maxDocs=44421)
0.014459559 = queryNorm
0.396052 = fieldWeight in 4015, product of:
1.0 = tf(freq=1.0), with freq of:
1.0 = termFreq=1.0
5.0694656 = idf(docFreq=758, maxDocs=44421)
0.078125 = fieldNorm(doc=4015)
0.07988339 = weight(abstract_txt:construction in 4015) [ClassicSimilarity], result of:
0.07988339 = score(doc=4015,freq=1.0), product of:
0.18756467 = queryWeight, product of:
2.379472 = boost
5.4514923 = idf(docFreq=517, maxDocs=44421)
0.014459559 = queryNorm
0.42589784 = fieldWeight in 4015, product of:
1.0 = tf(freq=1.0), with freq of:
1.0 = termFreq=1.0
5.4514923 = idf(docFreq=517, maxDocs=44421)
0.078125 = fieldNorm(doc=4015)
0.067465335 = weight(abstract_txt:language in 4015) [ClassicSimilarity], result of:
0.067465335 = score(doc=4015,freq=2.0), product of:
0.14639854 = queryWeight, product of:
2.4274082 = boost
4.1709876 = idf(docFreq=1863, maxDocs=44421)
0.014459559 = queryNorm
0.46083337 = fieldWeight in 4015, product of:
1.4142135 = tf(freq=2.0), with freq of:
2.0 = termFreq=2.0
4.1709876 = idf(docFreq=1863, maxDocs=44421)
0.078125 = fieldNorm(doc=4015)
0.131485 = weight(abstract_txt:text in 4015) [ClassicSimilarity], result of:
0.131485 = score(doc=4015,freq=3.0), product of:
0.24046363 = queryWeight, product of:
4.115458 = boost
4.040882 = idf(docFreq=2122, maxDocs=44421)
0.014459559 = queryNorm
0.5467979 = fieldWeight in 4015, product of:
1.7320508 = tf(freq=3.0), with freq of:
3.0 = termFreq=3.0
4.040882 = idf(docFreq=2122, maxDocs=44421)
0.078125 = fieldNorm(doc=4015)
0.11780089 = weight(abstract_txt:processing in 4015) [ClassicSimilarity], result of:
0.11780089 = score(doc=4015,freq=1.0), product of:
0.30616516 = queryWeight, product of:
4.299302 = boost
4.9249606 = idf(docFreq=876, maxDocs=44421)
0.014459559 = queryNorm
0.38476256 = fieldWeight in 4015, product of:
1.0 = tf(freq=1.0), with freq of:
1.0 = termFreq=1.0
4.9249606 = idf(docFreq=876, maxDocs=44421)
0.078125 = fieldNorm(doc=4015)
0.19321682 = weight(abstract_txt:mining in 4015) [ClassicSimilarity], result of:
0.19321682 = score(doc=4015,freq=1.0), product of:
0.40070638 = queryWeight, product of:
4.489961 = boost
6.1720386 = idf(docFreq=251, maxDocs=44421)
0.014459559 = queryNorm
0.48219052 = fieldWeight in 4015, product of:
1.0 = tf(freq=1.0), with freq of:
1.0 = termFreq=1.0
6.1720386 = idf(docFreq=251, maxDocs=44421)
0.078125 = fieldNorm(doc=4015)
0.28 = coord(7/25)
-
Taylor, S.L.: Integrating natural language understanding with document structure analysis (1994)
0.19
0.18614504 = sum of:
0.18614504 = product of:
0.77560437 = sum of:
0.069842026 = weight(abstract_txt:document in 1862) [ClassicSimilarity], result of:
0.069842026 = score(doc=1862,freq=5.0), product of:
0.077586 = queryWeight, product of:
1.2495428 = boost
4.29415 = idf(docFreq=1647, maxDocs=44421)
0.014459559 = queryNorm
0.9001885 = fieldWeight in 1862, product of:
2.236068 = tf(freq=5.0), with freq of:
5.0 = termFreq=5.0
4.29415 = idf(docFreq=1647, maxDocs=44421)
0.09375 = fieldNorm(doc=1862)
0.041912336 = weight(abstract_txt:applications in 1862) [ClassicSimilarity], result of:
0.041912336 = score(doc=1862,freq=1.0), product of:
0.09438943 = queryWeight, product of:
1.3782282 = boost
4.7363873 = idf(docFreq=1058, maxDocs=44421)
0.014459559 = queryNorm
0.4440363 = fieldWeight in 1862, product of:
1.0 = tf(freq=1.0), with freq of:
1.0 = termFreq=1.0
4.7363873 = idf(docFreq=1058, maxDocs=44421)
0.09375 = fieldNorm(doc=1862)
0.109016694 = weight(abstract_txt:natural in 1862) [ClassicSimilarity], result of:
0.109016694 = score(doc=1862,freq=2.0), product of:
0.16219766 = queryWeight, product of:
2.2127247 = boost
5.0694656 = idf(docFreq=758, maxDocs=44421)
0.014459559 = queryNorm
0.6721225 = fieldWeight in 1862, product of:
1.4142135 = tf(freq=2.0), with freq of:
2.0 = termFreq=2.0
5.0694656 = idf(docFreq=758, maxDocs=44421)
0.09375 = fieldNorm(doc=1862)
0.08095841 = weight(abstract_txt:language in 1862) [ClassicSimilarity], result of:
0.08095841 = score(doc=1862,freq=2.0), product of:
0.14639854 = queryWeight, product of:
2.4274082 = boost
4.1709876 = idf(docFreq=1863, maxDocs=44421)
0.014459559 = queryNorm
0.5530001 = fieldWeight in 1862, product of:
1.4142135 = tf(freq=2.0), with freq of:
2.0 = termFreq=2.0
4.1709876 = idf(docFreq=1863, maxDocs=44421)
0.09375 = fieldNorm(doc=1862)
0.15778202 = weight(abstract_txt:text in 1862) [ClassicSimilarity], result of:
0.15778202 = score(doc=1862,freq=3.0), product of:
0.24046363 = queryWeight, product of:
4.115458 = boost
4.040882 = idf(docFreq=2122, maxDocs=44421)
0.014459559 = queryNorm
0.6561575 = fieldWeight in 1862, product of:
1.7320508 = tf(freq=3.0), with freq of:
3.0 = termFreq=3.0
4.040882 = idf(docFreq=2122, maxDocs=44421)
0.09375 = fieldNorm(doc=1862)
0.31609294 = weight(abstract_txt:processing in 1862) [ClassicSimilarity], result of:
0.31609294 = score(doc=1862,freq=5.0), product of:
0.30616516 = queryWeight, product of:
4.299302 = boost
4.9249606 = idf(docFreq=876, maxDocs=44421)
0.014459559 = queryNorm
1.0324262 = fieldWeight in 1862, product of:
2.236068 = tf(freq=5.0), with freq of:
5.0 = termFreq=5.0
4.9249606 = idf(docFreq=876, maxDocs=44421)
0.09375 = fieldNorm(doc=1862)
0.24 = coord(6/25)