Document (#29085)

Author
Xu, W.
Gong, Y.
Title
Document clustering by concept factorization
Source
SIGIR'04: Proceedings of the 27th Annual International ACM-SIGIR Conference on Research and Development in Information Retrieval. Ed.: K. Järvelin, u.a.
Imprint
New York, NY : ACM Press
Year
2004
Pages
S.202-209
Theme
Automatisches Klassifizieren

Similar documents (content)

  1. Cai, X.; Li, W.: Enhancing sentence-level clustering with integrated and interactive frameworks for theme-based summarization (2011) 0.61
    0.61012787 = sum of:
      0.61012787 = product of:
        0.8135038 = sum of:
          0.122821845 = weight(abstract_txt:document in 770) [ClassicSimilarity], result of:
            0.122821845 = score(doc=770,freq=6.0), product of:
              0.18682835 = queryWeight, product of:
                4.29415 = idf(docFreq=1647, maxDocs=44421)
                0.043507643 = queryNorm
              0.6574048 = fieldWeight in 770, product of:
                2.4494898 = tf(freq=6.0), with freq of:
                  6.0 = termFreq=6.0
                4.29415 = idf(docFreq=1647, maxDocs=44421)
                0.0625 = fieldNorm(doc=770)
          0.100265175 = weight(abstract_txt:concept in 770) [ClassicSimilarity], result of:
            0.100265175 = score(doc=770,freq=3.0), product of:
              0.205606 = queryWeight, product of:
                1.0490508 = boost
                4.5047812 = idf(docFreq=1334, maxDocs=44421)
                0.043507643 = queryNorm
              0.48765686 = fieldWeight in 770, product of:
                1.7320508 = tf(freq=3.0), with freq of:
                  3.0 = termFreq=3.0
                4.5047812 = idf(docFreq=1334, maxDocs=44421)
                0.0625 = fieldNorm(doc=770)
          0.5904168 = weight(abstract_txt:clustering in 770) [ClassicSimilarity], result of:
            0.5904168 = score(doc=770,freq=15.0), product of:
              0.39208913 = queryWeight, product of:
                1.4486753 = boost
                6.2208285 = idf(docFreq=239, maxDocs=44421)
                0.043507643 = queryNorm
              1.5058229 = fieldWeight in 770, product of:
                3.8729835 = tf(freq=15.0), with freq of:
                  15.0 = termFreq=15.0
                6.2208285 = idf(docFreq=239, maxDocs=44421)
                0.0625 = fieldNorm(doc=770)
        0.75 = coord(3/4)
    
  2. Lee, J.-H.; Park, S.; Ahn, C.-M.; Kim, D.: Automatic generic document summarization based on non-negative matrix factorization (2009) 0.44
    0.43563712 = sum of:
      0.43563712 = product of:
        0.87127423 = sum of:
          0.106366836 = weight(abstract_txt:document in 3448) [ClassicSimilarity], result of:
            0.106366836 = score(doc=3448,freq=2.0), product of:
              0.18682835 = queryWeight, product of:
                4.29415 = idf(docFreq=1647, maxDocs=44421)
                0.043507643 = queryNorm
              0.5693292 = fieldWeight in 3448, product of:
                1.4142135 = tf(freq=2.0), with freq of:
                  2.0 = termFreq=2.0
                4.29415 = idf(docFreq=1647, maxDocs=44421)
                0.09375 = fieldNorm(doc=3448)
          0.7649074 = weight(abstract_txt:factorization in 3448) [ClassicSimilarity], result of:
            0.7649074 = score(doc=3448,freq=1.0), product of:
              0.8769763 = queryWeight, product of:
                2.1665692 = boost
                9.303573 = idf(docFreq=10, maxDocs=44421)
                0.043507643 = queryNorm
              0.8722099 = fieldWeight in 3448, product of:
                1.0 = tf(freq=1.0), with freq of:
                  1.0 = termFreq=1.0
                9.303573 = idf(docFreq=10, maxDocs=44421)
                0.09375 = fieldNorm(doc=3448)
        0.5 = coord(2/4)
    
  3. Berry, M.W.; Esau, R.; Kiefer, B.: ¬The use of text mining techniques in electronic discovery for legal matters (2012) 0.42
    0.42006007 = sum of:
      0.42006007 = product of:
        0.84012014 = sum of:
          0.07521272 = weight(abstract_txt:document in 1091) [ClassicSimilarity], result of:
            0.07521272 = score(doc=1091,freq=1.0), product of:
              0.18682835 = queryWeight, product of:
                4.29415 = idf(docFreq=1647, maxDocs=44421)
                0.043507643 = queryNorm
              0.40257657 = fieldWeight in 1091, product of:
                1.0 = tf(freq=1.0), with freq of:
                  1.0 = termFreq=1.0
                4.29415 = idf(docFreq=1647, maxDocs=44421)
                0.09375 = fieldNorm(doc=1091)
          0.7649074 = weight(abstract_txt:factorization in 1091) [ClassicSimilarity], result of:
            0.7649074 = score(doc=1091,freq=1.0), product of:
              0.8769763 = queryWeight, product of:
                2.1665692 = boost
                9.303573 = idf(docFreq=10, maxDocs=44421)
                0.043507643 = queryNorm
              0.8722099 = fieldWeight in 1091, product of:
                1.0 = tf(freq=1.0), with freq of:
                  1.0 = termFreq=1.0
                9.303573 = idf(docFreq=10, maxDocs=44421)
                0.09375 = fieldNorm(doc=1091)
        0.5 = coord(2/4)
    
  4. Na, S.-H.; Kang, I.-S.; Lee, J.-H.: Adaptive document clustering based on query-based similarity (2007) 0.41
    0.4075657 = sum of:
      0.4075657 = product of:
        0.543421 = sum of:
          0.11212049 = weight(abstract_txt:document in 1920) [ClassicSimilarity], result of:
            0.11212049 = score(doc=1920,freq=5.0), product of:
              0.18682835 = queryWeight, product of:
                4.29415 = idf(docFreq=1647, maxDocs=44421)
                0.043507643 = queryNorm
              0.6001257 = fieldWeight in 1920, product of:
                2.236068 = tf(freq=5.0), with freq of:
                  5.0 = termFreq=5.0
                4.29415 = idf(docFreq=1647, maxDocs=44421)
                0.0625 = fieldNorm(doc=1920)
          0.057888128 = weight(abstract_txt:concept in 1920) [ClassicSimilarity], result of:
            0.057888128 = score(doc=1920,freq=1.0), product of:
              0.205606 = queryWeight, product of:
                1.0490508 = boost
                4.5047812 = idf(docFreq=1334, maxDocs=44421)
                0.043507643 = queryNorm
              0.28154883 = fieldWeight in 1920, product of:
                1.0 = tf(freq=1.0), with freq of:
                  1.0 = termFreq=1.0
                4.5047812 = idf(docFreq=1334, maxDocs=44421)
                0.0625 = fieldNorm(doc=1920)
          0.37341234 = weight(abstract_txt:clustering in 1920) [ClassicSimilarity], result of:
            0.37341234 = score(doc=1920,freq=6.0), product of:
              0.39208913 = queryWeight, product of:
                1.4486753 = boost
                6.2208285 = idf(docFreq=239, maxDocs=44421)
                0.043507643 = queryNorm
              0.952366 = fieldWeight in 1920, product of:
                2.4494898 = tf(freq=6.0), with freq of:
                  6.0 = termFreq=6.0
                6.2208285 = idf(docFreq=239, maxDocs=44421)
                0.0625 = fieldNorm(doc=1920)
        0.75 = coord(3/4)
    
  5. Lee, Y.-H.; Wei, C.-P.; Hu, P.J.-H.: ¬An ontology-based technique for preserving user preferences in document-category evolutions (2011) 0.34
    0.342327 = sum of:
      0.342327 = product of:
        0.45643598 = sum of:
          0.12409464 = weight(abstract_txt:document in 353) [ClassicSimilarity], result of:
            0.12409464 = score(doc=353,freq=8.0), product of:
              0.18682835 = queryWeight, product of:
                4.29415 = idf(docFreq=1647, maxDocs=44421)
                0.043507643 = queryNorm
              0.6642174 = fieldWeight in 353, product of:
                2.828427 = tf(freq=8.0), with freq of:
                  8.0 = termFreq=8.0
                4.29415 = idf(docFreq=1647, maxDocs=44421)
                0.0546875 = fieldNorm(doc=353)
          0.101304226 = weight(abstract_txt:concept in 353) [ClassicSimilarity], result of:
            0.101304226 = score(doc=353,freq=4.0), product of:
              0.205606 = queryWeight, product of:
                1.0490508 = boost
                4.5047812 = idf(docFreq=1334, maxDocs=44421)
                0.043507643 = queryNorm
              0.49271044 = fieldWeight in 353, product of:
                2.0 = tf(freq=4.0), with freq of:
                  4.0 = termFreq=4.0
                4.5047812 = idf(docFreq=1334, maxDocs=44421)
                0.0546875 = fieldNorm(doc=353)
          0.23103711 = weight(abstract_txt:clustering in 353) [ClassicSimilarity], result of:
            0.23103711 = score(doc=353,freq=3.0), product of:
              0.39208913 = queryWeight, product of:
                1.4486753 = boost
                6.2208285 = idf(docFreq=239, maxDocs=44421)
                0.043507643 = queryNorm
              0.5892464 = fieldWeight in 353, product of:
                1.7320508 = tf(freq=3.0), with freq of:
                  3.0 = termFreq=3.0
                6.2208285 = idf(docFreq=239, maxDocs=44421)
                0.0546875 = fieldNorm(doc=353)
        0.75 = coord(3/4)