Document (#24089)

Author
Ahonen, H.
Title
Knowledge discovery in documents by extracting frequent word sequences
Source
Library trends. 48(1999) no.1, S.160-181
Year
1999
Theme
Computerlinguistik
Informetrie

Similar documents (content)

  1. Torra, V.; Lanau, S.; Miyamoto, S.: Image clustering for the exploration of video sequences (2006) 0.36
    0.3601748 = sum of:
      0.3601748 = product of:
        1.2606118 = sum of:
          0.36445644 = weight(abstract_txt:extracting in 284) [ClassicSimilarity], result of:
            0.36445644 = score(doc=284,freq=1.0), product of:
              0.48077875 = queryWeight, product of:
                1.954319 = boost
                6.930783 = idf(docFreq=117, maxDocs=44421)
                0.035495028 = queryNorm
              0.7580544 = fieldWeight in 284, product of:
                1.0 = tf(freq=1.0), with freq of:
                  1.0 = termFreq=1.0
                6.930783 = idf(docFreq=117, maxDocs=44421)
                0.109375 = fieldNorm(doc=284)
          0.8961553 = weight(abstract_txt:sequences in 284) [ClassicSimilarity], result of:
            0.8961553 = score(doc=284,freq=4.0), product of:
              0.5517602 = queryWeight, product of:
                2.0936208 = boost
                7.4248013 = idf(docFreq=71, maxDocs=44421)
                0.035495028 = queryNorm
              1.6241753 = fieldWeight in 284, product of:
                2.0 = tf(freq=4.0), with freq of:
                  4.0 = termFreq=4.0
                7.4248013 = idf(docFreq=71, maxDocs=44421)
                0.109375 = fieldNorm(doc=284)
        0.2857143 = coord(2/7)
    
  2. Wolfekuhler, M.R.; Punch, W.F.: Finding salient features for personal Web pages categories (1997) 0.31
    0.30941075 = sum of:
      0.30941075 = product of:
        0.7219584 = sum of:
          0.10853142 = weight(abstract_txt:documents in 3673) [ClassicSimilarity], result of:
            0.10853142 = score(doc=3673,freq=2.0), product of:
              0.17016694 = queryWeight, product of:
                1.1626806 = boost
                4.123322 = idf(docFreq=1954, maxDocs=44421)
                0.035495028 = queryNorm
              0.63779384 = fieldWeight in 3673, product of:
                1.4142135 = tf(freq=2.0), with freq of:
                  2.0 = termFreq=2.0
                4.123322 = idf(docFreq=1954, maxDocs=44421)
                0.109375 = fieldNorm(doc=3673)
          0.24897054 = weight(abstract_txt:word in 3673) [ClassicSimilarity], result of:
            0.24897054 = score(doc=3673,freq=2.0), product of:
              0.2959853 = queryWeight, product of:
                1.5334086 = boost
                5.4380693 = idf(docFreq=524, maxDocs=44421)
                0.035495028 = queryNorm
              0.84115845 = fieldWeight in 3673, product of:
                1.4142135 = tf(freq=2.0), with freq of:
                  2.0 = termFreq=2.0
                5.4380693 = idf(docFreq=524, maxDocs=44421)
                0.109375 = fieldNorm(doc=3673)
          0.36445644 = weight(abstract_txt:extracting in 3673) [ClassicSimilarity], result of:
            0.36445644 = score(doc=3673,freq=1.0), product of:
              0.48077875 = queryWeight, product of:
                1.954319 = boost
                6.930783 = idf(docFreq=117, maxDocs=44421)
                0.035495028 = queryNorm
              0.7580544 = fieldWeight in 3673, product of:
                1.0 = tf(freq=1.0), with freq of:
                  1.0 = termFreq=1.0
                6.930783 = idf(docFreq=117, maxDocs=44421)
                0.109375 = fieldNorm(doc=3673)
        0.42857143 = coord(3/7)
    
  3. Fayyad, U.M.: Data mining and knowledge discovery : making sense out of data (1996) 0.31
    0.30735156 = sum of:
      0.30735156 = product of:
        0.7171536 = sum of:
          0.0789162 = weight(abstract_txt:knowledge in 76) [ClassicSimilarity], result of:
            0.0789162 = score(doc=76,freq=2.0), product of:
              0.1258793 = queryWeight, product of:
                3.5463927 = idf(docFreq=3480, maxDocs=44421)
                0.035495028 = queryNorm
              0.62691957 = fieldWeight in 76, product of:
                1.4142135 = tf(freq=2.0), with freq of:
                  2.0 = termFreq=2.0
                3.5463927 = idf(docFreq=3480, maxDocs=44421)
                0.125 = fieldNorm(doc=76)
          0.22171578 = weight(abstract_txt:discovery in 76) [ClassicSimilarity], result of:
            0.22171578 = score(doc=76,freq=1.0), product of:
              0.31578 = queryWeight, product of:
                1.583854 = boost
                5.616968 = idf(docFreq=438, maxDocs=44421)
                0.035495028 = queryNorm
              0.702121 = fieldWeight in 76, product of:
                1.0 = tf(freq=1.0), with freq of:
                  1.0 = termFreq=1.0
                5.616968 = idf(docFreq=438, maxDocs=44421)
                0.125 = fieldNorm(doc=76)
          0.41652164 = weight(abstract_txt:extracting in 76) [ClassicSimilarity], result of:
            0.41652164 = score(doc=76,freq=1.0), product of:
              0.48077875 = queryWeight, product of:
                1.954319 = boost
                6.930783 = idf(docFreq=117, maxDocs=44421)
                0.035495028 = queryNorm
              0.86634785 = fieldWeight in 76, product of:
                1.0 = tf(freq=1.0), with freq of:
                  1.0 = termFreq=1.0
                6.930783 = idf(docFreq=117, maxDocs=44421)
                0.125 = fieldNorm(doc=76)
        0.42857143 = coord(3/7)
    
  4. Grau, B.: Finding answers to questions, in text collections or Web, in open domain or specialty domains (2012) 0.27
    0.26678798 = sum of:
      0.26678798 = product of:
        0.46687895 = sum of:
          0.02790109 = weight(abstract_txt:knowledge in 1107) [ClassicSimilarity], result of:
            0.02790109 = score(doc=1107,freq=1.0), product of:
              0.1258793 = queryWeight, product of:
                3.5463927 = idf(docFreq=3480, maxDocs=44421)
                0.035495028 = queryNorm
              0.22164954 = fieldWeight in 1107, product of:
                1.0 = tf(freq=1.0), with freq of:
                  1.0 = termFreq=1.0
                3.5463927 = idf(docFreq=3480, maxDocs=44421)
                0.0625 = fieldNorm(doc=1107)
          0.043853316 = weight(abstract_txt:documents in 1107) [ClassicSimilarity], result of:
            0.043853316 = score(doc=1107,freq=1.0), product of:
              0.17016694 = queryWeight, product of:
                1.1626806 = boost
                4.123322 = idf(docFreq=1954, maxDocs=44421)
                0.035495028 = queryNorm
              0.25770763 = fieldWeight in 1107, product of:
                1.0 = tf(freq=1.0), with freq of:
                  1.0 = termFreq=1.0
                4.123322 = idf(docFreq=1954, maxDocs=44421)
                0.0625 = fieldNorm(doc=1107)
          0.10059929 = weight(abstract_txt:word in 1107) [ClassicSimilarity], result of:
            0.10059929 = score(doc=1107,freq=1.0), product of:
              0.2959853 = queryWeight, product of:
                1.5334086 = boost
                5.4380693 = idf(docFreq=524, maxDocs=44421)
                0.035495028 = queryNorm
              0.33987933 = fieldWeight in 1107, product of:
                1.0 = tf(freq=1.0), with freq of:
                  1.0 = termFreq=1.0
                5.4380693 = idf(docFreq=524, maxDocs=44421)
                0.0625 = fieldNorm(doc=1107)
          0.29452527 = weight(abstract_txt:extracting in 1107) [ClassicSimilarity], result of:
            0.29452527 = score(doc=1107,freq=2.0), product of:
              0.48077875 = queryWeight, product of:
                1.954319 = boost
                6.930783 = idf(docFreq=117, maxDocs=44421)
                0.035495028 = queryNorm
              0.61260045 = fieldWeight in 1107, product of:
                1.4142135 = tf(freq=2.0), with freq of:
                  2.0 = termFreq=2.0
                6.930783 = idf(docFreq=117, maxDocs=44421)
                0.0625 = fieldNorm(doc=1107)
        0.5714286 = coord(4/7)
    
  5. Trybula, W.J.: Data mining and knowledge discovery (1997) 0.27
    0.2657338 = sum of:
      0.2657338 = product of:
        0.62004554 = sum of:
          0.07248916 = weight(abstract_txt:knowledge in 3300) [ClassicSimilarity], result of:
            0.07248916 = score(doc=3300,freq=3.0), product of:
              0.1258793 = queryWeight, product of:
                3.5463927 = idf(docFreq=3480, maxDocs=44421)
                0.035495028 = queryNorm
              0.5758624 = fieldWeight in 3300, product of:
                1.7320508 = tf(freq=3.0), with freq of:
                  3.0 = termFreq=3.0
                3.5463927 = idf(docFreq=3480, maxDocs=44421)
                0.09375 = fieldNorm(doc=3300)
          0.2351651 = weight(abstract_txt:discovery in 3300) [ClassicSimilarity], result of:
            0.2351651 = score(doc=3300,freq=2.0), product of:
              0.31578 = queryWeight, product of:
                1.583854 = boost
                5.616968 = idf(docFreq=438, maxDocs=44421)
                0.035495028 = queryNorm
              0.7447118 = fieldWeight in 3300, product of:
                1.4142135 = tf(freq=2.0), with freq of:
                  2.0 = termFreq=2.0
                5.616968 = idf(docFreq=438, maxDocs=44421)
                0.09375 = fieldNorm(doc=3300)
          0.31239125 = weight(abstract_txt:extracting in 3300) [ClassicSimilarity], result of:
            0.31239125 = score(doc=3300,freq=1.0), product of:
              0.48077875 = queryWeight, product of:
                1.954319 = boost
                6.930783 = idf(docFreq=117, maxDocs=44421)
                0.035495028 = queryNorm
              0.6497609 = fieldWeight in 3300, product of:
                1.0 = tf(freq=1.0), with freq of:
                  1.0 = termFreq=1.0
                6.930783 = idf(docFreq=117, maxDocs=44421)
                0.09375 = fieldNorm(doc=3300)
        0.42857143 = coord(3/7)