Document (#19939)

Author
Salton, G.
Buckley, C.
Title
Term-weighting approaches in automatic text retrieval
Source
Information processing and management. 24(1988) no.5, S.513-523
Year
1988
Footnote
Wiederabgedruckt in: Readings in information retrieval. Ed.: K. Sparck Jones u. P. Willett. San Francisco: Morgan Kaufmann 1997. S.323-328.
Theme
Retrievalalgorithmen

Similar documents (author)

  1. Salton, G.; Buckley, C.: Parallel text search methods (1988) 5.80
    5.798373 = sum of:
      5.798373 = sum of:
        2.4666731 = weight(author_txt:salton in 403) [ClassicSimilarity], result of:
          2.4666731 = score(doc=403,freq=1.0), product of:
            0.6333374 = queryWeight, product of:
              7.7894444 = idf(docFreq=49, maxDocs=44421)
              0.08130713 = queryNorm
            3.8947222 = fieldWeight in 403, product of:
              1.0 = tf(freq=1.0), with freq of:
                1.0 = termFreq=1.0
              7.7894444 = idf(docFreq=49, maxDocs=44421)
              0.5 = fieldNorm(doc=403)
        3.3317 = weight(author_txt:buckley in 403) [ClassicSimilarity], result of:
          3.3317 = score(doc=403,freq=1.0), product of:
            0.7738759 = queryWeight, product of:
              1.1053965 = boost
              8.610425 = idf(docFreq=21, maxDocs=44421)
              0.08130713 = queryNorm
            4.3052125 = fieldWeight in 403, product of:
              1.0 = tf(freq=1.0), with freq of:
                1.0 = termFreq=1.0
              8.610425 = idf(docFreq=21, maxDocs=44421)
              0.5 = fieldNorm(doc=403)
    
  2. Salton, G.; Buckley, C.: Approaches to global text analysis (1990) 5.80
    5.798373 = sum of:
      5.798373 = sum of:
        2.4666731 = weight(author_txt:salton in 4900) [ClassicSimilarity], result of:
          2.4666731 = score(doc=4900,freq=1.0), product of:
            0.6333374 = queryWeight, product of:
              7.7894444 = idf(docFreq=49, maxDocs=44421)
              0.08130713 = queryNorm
            3.8947222 = fieldWeight in 4900, product of:
              1.0 = tf(freq=1.0), with freq of:
                1.0 = termFreq=1.0
              7.7894444 = idf(docFreq=49, maxDocs=44421)
              0.5 = fieldNorm(doc=4900)
        3.3317 = weight(author_txt:buckley in 4900) [ClassicSimilarity], result of:
          3.3317 = score(doc=4900,freq=1.0), product of:
            0.7738759 = queryWeight, product of:
              1.1053965 = boost
              8.610425 = idf(docFreq=21, maxDocs=44421)
              0.08130713 = queryNorm
            4.3052125 = fieldWeight in 4900, product of:
              1.0 = tf(freq=1.0), with freq of:
                1.0 = termFreq=1.0
              8.610425 = idf(docFreq=21, maxDocs=44421)
              0.5 = fieldNorm(doc=4900)
    
  3. Salton, G.; Buckley, C.: Improving retrieval performance by relevance feedback (1990) 5.80
    5.798373 = sum of:
      5.798373 = sum of:
        2.4666731 = weight(author_txt:salton in 5441) [ClassicSimilarity], result of:
          2.4666731 = score(doc=5441,freq=1.0), product of:
            0.6333374 = queryWeight, product of:
              7.7894444 = idf(docFreq=49, maxDocs=44421)
              0.08130713 = queryNorm
            3.8947222 = fieldWeight in 5441, product of:
              1.0 = tf(freq=1.0), with freq of:
                1.0 = termFreq=1.0
              7.7894444 = idf(docFreq=49, maxDocs=44421)
              0.5 = fieldNorm(doc=5441)
        3.3317 = weight(author_txt:buckley in 5441) [ClassicSimilarity], result of:
          3.3317 = score(doc=5441,freq=1.0), product of:
            0.7738759 = queryWeight, product of:
              1.1053965 = boost
              8.610425 = idf(docFreq=21, maxDocs=44421)
              0.08130713 = queryNorm
            4.3052125 = fieldWeight in 5441, product of:
              1.0 = tf(freq=1.0), with freq of:
                1.0 = termFreq=1.0
              8.610425 = idf(docFreq=21, maxDocs=44421)
              0.5 = fieldNorm(doc=5441)
    
  4. Salton, G.; Buckley, C.; Allan, J.: Automatic structuring of text files (1992) 4.35
    4.34878 = sum of:
      4.34878 = sum of:
        1.8500049 = weight(author_txt:salton in 6506) [ClassicSimilarity], result of:
          1.8500049 = score(doc=6506,freq=1.0), product of:
            0.6333374 = queryWeight, product of:
              7.7894444 = idf(docFreq=49, maxDocs=44421)
              0.08130713 = queryNorm
            2.9210417 = fieldWeight in 6506, product of:
              1.0 = tf(freq=1.0), with freq of:
                1.0 = termFreq=1.0
              7.7894444 = idf(docFreq=49, maxDocs=44421)
              0.375 = fieldNorm(doc=6506)
        2.4987752 = weight(author_txt:buckley in 6506) [ClassicSimilarity], result of:
          2.4987752 = score(doc=6506,freq=1.0), product of:
            0.7738759 = queryWeight, product of:
              1.1053965 = boost
              8.610425 = idf(docFreq=21, maxDocs=44421)
              0.08130713 = queryNorm
            3.2289095 = fieldWeight in 6506, product of:
              1.0 = tf(freq=1.0), with freq of:
                1.0 = termFreq=1.0
              8.610425 = idf(docFreq=21, maxDocs=44421)
              0.375 = fieldNorm(doc=6506)
    
  5. Salton, G.; Buckley, C.; Smith, M.: On the application of syntactic methodologies in automatic text analysis (1990) 4.35
    4.34878 = sum of:
      4.34878 = sum of:
        1.8500049 = weight(author_txt:salton in 7863) [ClassicSimilarity], result of:
          1.8500049 = score(doc=7863,freq=1.0), product of:
            0.6333374 = queryWeight, product of:
              7.7894444 = idf(docFreq=49, maxDocs=44421)
              0.08130713 = queryNorm
            2.9210417 = fieldWeight in 7863, product of:
              1.0 = tf(freq=1.0), with freq of:
                1.0 = termFreq=1.0
              7.7894444 = idf(docFreq=49, maxDocs=44421)
              0.375 = fieldNorm(doc=7863)
        2.4987752 = weight(author_txt:buckley in 7863) [ClassicSimilarity], result of:
          2.4987752 = score(doc=7863,freq=1.0), product of:
            0.7738759 = queryWeight, product of:
              1.1053965 = boost
              8.610425 = idf(docFreq=21, maxDocs=44421)
              0.08130713 = queryNorm
            3.2289095 = fieldWeight in 7863, product of:
              1.0 = tf(freq=1.0), with freq of:
                1.0 = termFreq=1.0
              8.610425 = idf(docFreq=21, maxDocs=44421)
              0.375 = fieldNorm(doc=7863)
    

Similar documents (content)

  1. Harman, D.: ¬The Text REtrieval Conferences (TRECs) : providing a test-bed for information retrieval systems (1998) 0.88
    0.8818998 = sum of:
      0.8818998 = product of:
        1.0582798 = sum of:
          0.101904534 = weight(abstract_txt:retrieval in 2314) [ClassicSimilarity], result of:
            0.101904534 = score(doc=2314,freq=3.0), product of:
              0.18051754 = queryWeight, product of:
                3.4765 = idf(docFreq=3732, maxDocs=44421)
                0.051925078 = queryNorm
              0.5645132 = fieldWeight in 2314, product of:
                1.7320508 = tf(freq=3.0), with freq of:
                  3.0 = termFreq=3.0
                3.4765 = idf(docFreq=3732, maxDocs=44421)
                0.09375 = fieldNorm(doc=2314)
          0.13066214 = weight(abstract_txt:text in 2314) [ClassicSimilarity], result of:
            0.13066214 = score(doc=2314,freq=2.0), product of:
              0.24388625 = queryWeight, product of:
                1.1623421 = boost
                4.040882 = idf(docFreq=2122, maxDocs=44421)
                0.051925078 = queryNorm
              0.5357503 = fieldWeight in 2314, product of:
                1.4142135 = tf(freq=2.0), with freq of:
                  2.0 = termFreq=2.0
                4.040882 = idf(docFreq=2122, maxDocs=44421)
                0.09375 = fieldNorm(doc=2314)
          0.15434553 = weight(abstract_txt:term in 2314) [ClassicSimilarity], result of:
            0.15434553 = score(doc=2314,freq=1.0), product of:
              0.34336826 = queryWeight, product of:
                1.3791782 = boost
                4.794713 = idf(docFreq=998, maxDocs=44421)
                0.051925078 = queryNorm
              0.44950435 = fieldWeight in 2314, product of:
                1.0 = tf(freq=1.0), with freq of:
                  1.0 = termFreq=1.0
                4.794713 = idf(docFreq=998, maxDocs=44421)
                0.09375 = fieldNorm(doc=2314)
          0.19639674 = weight(abstract_txt:automatic in 2314) [ClassicSimilarity], result of:
            0.19639674 = score(doc=2314,freq=1.0), product of:
              0.4031998 = queryWeight, product of:
                1.4945155 = boost
                5.1956835 = idf(docFreq=668, maxDocs=44421)
                0.051925078 = queryNorm
              0.48709533 = fieldWeight in 2314, product of:
                1.0 = tf(freq=1.0), with freq of:
                  1.0 = termFreq=1.0
                5.1956835 = idf(docFreq=668, maxDocs=44421)
                0.09375 = fieldNorm(doc=2314)
          0.47497082 = weight(abstract_txt:weighting in 2314) [ClassicSimilarity], result of:
            0.47497082 = score(doc=2314,freq=1.0), product of:
              0.72645503 = queryWeight, product of:
                2.0060635 = boost
                6.9740796 = idf(docFreq=112, maxDocs=44421)
                0.051925078 = queryNorm
              0.65382 = fieldWeight in 2314, product of:
                1.0 = tf(freq=1.0), with freq of:
                  1.0 = termFreq=1.0
                6.9740796 = idf(docFreq=112, maxDocs=44421)
                0.09375 = fieldNorm(doc=2314)
        0.8333333 = coord(5/6)
    
  2. Ko, Y.: ¬A new term-weighting scheme for text classification using the odds of positive and negative class probabilities (2015) 0.88
    0.87574494 = sum of:
      0.87574494 = product of:
        1.3136173 = sum of:
          0.09805769 = weight(abstract_txt:retrieval in 3339) [ClassicSimilarity], result of:
            0.09805769 = score(doc=3339,freq=4.0), product of:
              0.18051754 = queryWeight, product of:
                3.4765 = idf(docFreq=3732, maxDocs=44421)
                0.051925078 = queryNorm
              0.5432031 = fieldWeight in 3339, product of:
                2.0 = tf(freq=4.0), with freq of:
                  4.0 = termFreq=4.0
                3.4765 = idf(docFreq=3732, maxDocs=44421)
                0.078125 = fieldNorm(doc=3339)
          0.10888512 = weight(abstract_txt:text in 3339) [ClassicSimilarity], result of:
            0.10888512 = score(doc=3339,freq=2.0), product of:
              0.24388625 = queryWeight, product of:
                1.1623421 = boost
                4.040882 = idf(docFreq=2122, maxDocs=44421)
                0.051925078 = queryNorm
              0.4464586 = fieldWeight in 3339, product of:
                1.4142135 = tf(freq=2.0), with freq of:
                  2.0 = termFreq=2.0
                4.040882 = idf(docFreq=2122, maxDocs=44421)
                0.078125 = fieldNorm(doc=3339)
          0.3150565 = weight(abstract_txt:term in 3339) [ClassicSimilarity], result of:
            0.3150565 = score(doc=3339,freq=6.0), product of:
              0.34336826 = queryWeight, product of:
                1.3791782 = boost
                4.794713 = idf(docFreq=998, maxDocs=44421)
                0.051925078 = queryNorm
              0.917547 = fieldWeight in 3339, product of:
                2.4494898 = tf(freq=6.0), with freq of:
                  6.0 = termFreq=6.0
                4.794713 = idf(docFreq=998, maxDocs=44421)
                0.078125 = fieldNorm(doc=3339)
          0.79161805 = weight(abstract_txt:weighting in 3339) [ClassicSimilarity], result of:
            0.79161805 = score(doc=3339,freq=4.0), product of:
              0.72645503 = queryWeight, product of:
                2.0060635 = boost
                6.9740796 = idf(docFreq=112, maxDocs=44421)
                0.051925078 = queryNorm
              1.0897 = fieldWeight in 3339, product of:
                2.0 = tf(freq=4.0), with freq of:
                  4.0 = termFreq=4.0
                6.9740796 = idf(docFreq=112, maxDocs=44421)
                0.078125 = fieldNorm(doc=3339)
        0.6666667 = coord(4/6)
    
  3. Faraj, N.: Analyse d'une methode d'indexation automatique basée sur une analyse syntaxique de texte (1996) 0.87
    0.87292194 = sum of:
      0.87292194 = product of:
        1.3093829 = sum of:
          0.12318945 = weight(abstract_txt:text in 684) [ClassicSimilarity], result of:
            0.12318945 = score(doc=684,freq=1.0), product of:
              0.24388625 = queryWeight, product of:
                1.1623421 = boost
                4.040882 = idf(docFreq=2122, maxDocs=44421)
                0.051925078 = queryNorm
              0.50511026 = fieldWeight in 684, product of:
                1.0 = tf(freq=1.0), with freq of:
                  1.0 = termFreq=1.0
                4.040882 = idf(docFreq=2122, maxDocs=44421)
                0.125 = fieldNorm(doc=684)
          0.2910367 = weight(abstract_txt:term in 684) [ClassicSimilarity], result of:
            0.2910367 = score(doc=684,freq=2.0), product of:
              0.34336826 = queryWeight, product of:
                1.3791782 = boost
                4.794713 = idf(docFreq=998, maxDocs=44421)
                0.051925078 = queryNorm
              0.8475935 = fieldWeight in 684, product of:
                1.4142135 = tf(freq=2.0), with freq of:
                  2.0 = termFreq=2.0
                4.794713 = idf(docFreq=998, maxDocs=44421)
                0.125 = fieldNorm(doc=684)
          0.2618623 = weight(abstract_txt:automatic in 684) [ClassicSimilarity], result of:
            0.2618623 = score(doc=684,freq=1.0), product of:
              0.4031998 = queryWeight, product of:
                1.4945155 = boost
                5.1956835 = idf(docFreq=668, maxDocs=44421)
                0.051925078 = queryNorm
              0.64946043 = fieldWeight in 684, product of:
                1.0 = tf(freq=1.0), with freq of:
                  1.0 = termFreq=1.0
                5.1956835 = idf(docFreq=668, maxDocs=44421)
                0.125 = fieldNorm(doc=684)
          0.6332944 = weight(abstract_txt:weighting in 684) [ClassicSimilarity], result of:
            0.6332944 = score(doc=684,freq=1.0), product of:
              0.72645503 = queryWeight, product of:
                2.0060635 = boost
                6.9740796 = idf(docFreq=112, maxDocs=44421)
                0.051925078 = queryNorm
              0.87175995 = fieldWeight in 684, product of:
                1.0 = tf(freq=1.0), with freq of:
                  1.0 = termFreq=1.0
                6.9740796 = idf(docFreq=112, maxDocs=44421)
                0.125 = fieldNorm(doc=684)
        0.6666667 = coord(4/6)
    
  4. Robertson, S.E.: OKAPI at TREC-1 (1994) 0.87
    0.86869544 = sum of:
      0.86869544 = product of:
        1.3030431 = sum of:
          0.07844616 = weight(abstract_txt:retrieval in 7952) [ClassicSimilarity], result of:
            0.07844616 = score(doc=7952,freq=1.0), product of:
              0.18051754 = queryWeight, product of:
                3.4765 = idf(docFreq=3732, maxDocs=44421)
                0.051925078 = queryNorm
              0.4345625 = fieldWeight in 7952, product of:
                1.0 = tf(freq=1.0), with freq of:
                  1.0 = termFreq=1.0
                3.4765 = idf(docFreq=3732, maxDocs=44421)
                0.125 = fieldNorm(doc=7952)
          0.12318945 = weight(abstract_txt:text in 7952) [ClassicSimilarity], result of:
            0.12318945 = score(doc=7952,freq=1.0), product of:
              0.24388625 = queryWeight, product of:
                1.1623421 = boost
                4.040882 = idf(docFreq=2122, maxDocs=44421)
                0.051925078 = queryNorm
              0.50511026 = fieldWeight in 7952, product of:
                1.0 = tf(freq=1.0), with freq of:
                  1.0 = termFreq=1.0
                4.040882 = idf(docFreq=2122, maxDocs=44421)
                0.125 = fieldNorm(doc=7952)
          0.20579404 = weight(abstract_txt:term in 7952) [ClassicSimilarity], result of:
            0.20579404 = score(doc=7952,freq=1.0), product of:
              0.34336826 = queryWeight, product of:
                1.3791782 = boost
                4.794713 = idf(docFreq=998, maxDocs=44421)
                0.051925078 = queryNorm
              0.5993391 = fieldWeight in 7952, product of:
                1.0 = tf(freq=1.0), with freq of:
                  1.0 = termFreq=1.0
                4.794713 = idf(docFreq=998, maxDocs=44421)
                0.125 = fieldNorm(doc=7952)
          0.8956135 = weight(abstract_txt:weighting in 7952) [ClassicSimilarity], result of:
            0.8956135 = score(doc=7952,freq=2.0), product of:
              0.72645503 = queryWeight, product of:
                2.0060635 = boost
                6.9740796 = idf(docFreq=112, maxDocs=44421)
                0.051925078 = queryNorm
              1.2328547 = fieldWeight in 7952, product of:
                1.4142135 = tf(freq=2.0), with freq of:
                  2.0 = termFreq=2.0
                6.9740796 = idf(docFreq=112, maxDocs=44421)
                0.125 = fieldNorm(doc=7952)
        0.6666667 = coord(4/6)
    
  5. Harman, D.: Overview of the first Text Retrieval Conference (1993) 0.83
    0.83442485 = sum of:
      0.83442485 = product of:
        1.0013099 = sum of:
          0.08320471 = weight(abstract_txt:retrieval in 616) [ClassicSimilarity], result of:
            0.08320471 = score(doc=616,freq=2.0), product of:
              0.18051754 = queryWeight, product of:
                3.4765 = idf(docFreq=3732, maxDocs=44421)
                0.051925078 = queryNorm
              0.46092314 = fieldWeight in 616, product of:
                1.4142135 = tf(freq=2.0), with freq of:
                  2.0 = termFreq=2.0
                3.4765 = idf(docFreq=3732, maxDocs=44421)
                0.09375 = fieldNorm(doc=616)
          0.09239209 = weight(abstract_txt:text in 616) [ClassicSimilarity], result of:
            0.09239209 = score(doc=616,freq=1.0), product of:
              0.24388625 = queryWeight, product of:
                1.1623421 = boost
                4.040882 = idf(docFreq=2122, maxDocs=44421)
                0.051925078 = queryNorm
              0.3788327 = fieldWeight in 616, product of:
                1.0 = tf(freq=1.0), with freq of:
                  1.0 = termFreq=1.0
                4.040882 = idf(docFreq=2122, maxDocs=44421)
                0.09375 = fieldNorm(doc=616)
          0.15434553 = weight(abstract_txt:term in 616) [ClassicSimilarity], result of:
            0.15434553 = score(doc=616,freq=1.0), product of:
              0.34336826 = queryWeight, product of:
                1.3791782 = boost
                4.794713 = idf(docFreq=998, maxDocs=44421)
                0.051925078 = queryNorm
              0.44950435 = fieldWeight in 616, product of:
                1.0 = tf(freq=1.0), with freq of:
                  1.0 = termFreq=1.0
                4.794713 = idf(docFreq=998, maxDocs=44421)
                0.09375 = fieldNorm(doc=616)
          0.19639674 = weight(abstract_txt:automatic in 616) [ClassicSimilarity], result of:
            0.19639674 = score(doc=616,freq=1.0), product of:
              0.4031998 = queryWeight, product of:
                1.4945155 = boost
                5.1956835 = idf(docFreq=668, maxDocs=44421)
                0.051925078 = queryNorm
              0.48709533 = fieldWeight in 616, product of:
                1.0 = tf(freq=1.0), with freq of:
                  1.0 = termFreq=1.0
                5.1956835 = idf(docFreq=668, maxDocs=44421)
                0.09375 = fieldNorm(doc=616)
          0.47497082 = weight(abstract_txt:weighting in 616) [ClassicSimilarity], result of:
            0.47497082 = score(doc=616,freq=1.0), product of:
              0.72645503 = queryWeight, product of:
                2.0060635 = boost
                6.9740796 = idf(docFreq=112, maxDocs=44421)
                0.051925078 = queryNorm
              0.65382 = fieldWeight in 616, product of:
                1.0 = tf(freq=1.0), with freq of:
                  1.0 = termFreq=1.0
                6.9740796 = idf(docFreq=112, maxDocs=44421)
                0.09375 = fieldNorm(doc=616)
        0.8333333 = coord(5/6)