Document (#28941)

Author
Fong, A.C.M.
Title
Mining a Web citation database for document clustering
Source
Applied artificial intelligence. 16(2002) no.4, S.283-292
Year
2002
Theme
Citation indexing
Data Mining
Automatisches Klassifizieren

Similar documents (author)

  1. Fong, W.W.: Searching the World Wide Web (1996) 6.19
    6.1935673 = sum of:
      6.1935673 = weight(author_txt:fong in 6665) [ClassicSimilarity], result of:
        6.1935673 = fieldWeight in 6665, product of:
          1.0 = tf(freq=1.0), with freq of:
            1.0 = termFreq=1.0
          9.909708 = idf(docFreq=5, maxDocs=44421)
          0.625 = fieldNorm(doc=6665)
    
  2. Fong, K.Y.: Interpretive object-oriented facility which can access precompiled classes (1995) 6.19
    6.1935673 = sum of:
      6.1935673 = weight(author_txt:fong in 6902) [ClassicSimilarity], result of:
        6.1935673 = fieldWeight in 6902, product of:
          1.0 = tf(freq=1.0), with freq of:
            1.0 = termFreq=1.0
          9.909708 = idf(docFreq=5, maxDocs=44421)
          0.625 = fieldNorm(doc=6902)
    
  3. Tho, Q.T.; Hui, S.C.; Fong, A.C.M.: ¬A citation-based document retrieval system for finding research expertise (2007) 3.72
    3.7161405 = sum of:
      3.7161405 = weight(author_txt:fong in 1956) [ClassicSimilarity], result of:
        3.7161405 = fieldWeight in 1956, product of:
          1.0 = tf(freq=1.0), with freq of:
            1.0 = termFreq=1.0
          9.909708 = idf(docFreq=5, maxDocs=44421)
          0.375 = fieldNorm(doc=1956)
    
  4. Collard, J.; Paiva, V. de; Fong, B.; Subrahmanian, E.: Extracting mathematical concepts from text (2022) 3.10
    3.0967836 = sum of:
      3.0967836 = weight(author_txt:fong in 1669) [ClassicSimilarity], result of:
        3.0967836 = fieldWeight in 1669, product of:
          1.0 = tf(freq=1.0), with freq of:
            1.0 = termFreq=1.0
          9.909708 = idf(docFreq=5, maxDocs=44421)
          0.3125 = fieldNorm(doc=1669)
    

Similar documents (content)

  1. He, Y.; Hui, S.C.: PubSearch : a Web citation-based retrieval system (2001) 0.96
    0.9562069 = sum of:
      0.9562069 = product of:
        1.1952586 = sum of:
          0.13385524 = weight(abstract_txt:database in 5806) [ClassicSimilarity], result of:
            0.13385524 = score(doc=5806,freq=2.0), product of:
              0.28296694 = queryWeight, product of:
                4.2814875 = idf(docFreq=1668, maxDocs=44421)
                0.0660908 = queryNorm
              0.47304198 = fieldWeight in 5806, product of:
                1.4142135 = tf(freq=2.0), with freq of:
                  2.0 = termFreq=2.0
                4.2814875 = idf(docFreq=1668, maxDocs=44421)
                0.078125 = fieldNorm(doc=5806)
          0.16539733 = weight(abstract_txt:document in 5806) [ClassicSimilarity], result of:
            0.16539733 = score(doc=5806,freq=3.0), product of:
              0.2846431 = queryWeight, product of:
                1.0029575 = boost
                4.29415 = idf(docFreq=1647, maxDocs=44421)
                0.0660908 = queryNorm
              0.5810692 = fieldWeight in 5806, product of:
                1.7320508 = tf(freq=3.0), with freq of:
                  3.0 = termFreq=3.0
                4.29415 = idf(docFreq=1647, maxDocs=44421)
                0.078125 = fieldNorm(doc=5806)
          0.31536058 = weight(abstract_txt:citation in 5806) [ClassicSimilarity], result of:
            0.31536058 = score(doc=5806,freq=5.0), product of:
              0.36915067 = queryWeight, product of:
                1.1421785 = boost
                4.890223 = idf(docFreq=907, maxDocs=44421)
                0.0660908 = queryNorm
              0.85428685 = fieldWeight in 5806, product of:
                2.236068 = tf(freq=5.0), with freq of:
                  5.0 = termFreq=5.0
                4.890223 = idf(docFreq=907, maxDocs=44421)
                0.078125 = fieldNorm(doc=5806)
          0.5806455 = weight(abstract_txt:clustering in 5806) [ClassicSimilarity], result of:
            0.5806455 = score(doc=5806,freq=4.0), product of:
              0.5973692 = queryWeight, product of:
                1.4529597 = boost
                6.2208285 = idf(docFreq=239, maxDocs=44421)
                0.0660908 = queryNorm
              0.9720045 = fieldWeight in 5806, product of:
                2.0 = tf(freq=4.0), with freq of:
                  4.0 = termFreq=4.0
                6.2208285 = idf(docFreq=239, maxDocs=44421)
                0.078125 = fieldNorm(doc=5806)
        0.8 = coord(4/5)
    
  2. Zhan, J.; Loh, H.T.: Using latent semantic indexing to improve the accuracy of document clustering (2007) 0.75
    0.7455908 = sum of:
      0.7455908 = product of:
        1.2426513 = sum of:
          0.1909844 = weight(abstract_txt:document in 1264) [ClassicSimilarity], result of:
            0.1909844 = score(doc=1264,freq=4.0), product of:
              0.2846431 = queryWeight, product of:
                1.0029575 = boost
                4.29415 = idf(docFreq=1647, maxDocs=44421)
                0.0660908 = queryNorm
              0.6709609 = fieldWeight in 1264, product of:
                2.0 = tf(freq=4.0), with freq of:
                  4.0 = termFreq=4.0
                4.29415 = idf(docFreq=1647, maxDocs=44421)
                0.078125 = fieldNorm(doc=1264)
          0.2835452 = weight(abstract_txt:mining in 1264) [ClassicSimilarity], result of:
            0.2835452 = score(doc=1264,freq=1.0), product of:
              0.5880356 = queryWeight, product of:
                1.4415641 = boost
                6.1720386 = idf(docFreq=251, maxDocs=44421)
                0.0660908 = queryNorm
              0.48219052 = fieldWeight in 1264, product of:
                1.0 = tf(freq=1.0), with freq of:
                  1.0 = termFreq=1.0
                6.1720386 = idf(docFreq=251, maxDocs=44421)
                0.078125 = fieldNorm(doc=1264)
          0.7681218 = weight(abstract_txt:clustering in 1264) [ClassicSimilarity], result of:
            0.7681218 = score(doc=1264,freq=7.0), product of:
              0.5973692 = queryWeight, product of:
                1.4529597 = boost
                6.2208285 = idf(docFreq=239, maxDocs=44421)
                0.0660908 = queryNorm
              1.285841 = fieldWeight in 1264, product of:
                2.6457512 = tf(freq=7.0), with freq of:
                  7.0 = termFreq=7.0
                6.2208285 = idf(docFreq=239, maxDocs=44421)
                0.078125 = fieldNorm(doc=1264)
        0.6 = coord(3/5)
    
  3. Kostoff, R.N.; Rio, J.A. del; Humenik, J.A.; Garcia, E.O.; Ramirez, A.M.: Citation mining : integrating text mining and bibliometrics for research user profiling (2001) 0.72
    0.72398514 = sum of:
      0.72398514 = product of:
        0.9049814 = sum of:
          0.056789972 = weight(abstract_txt:database in 850) [ClassicSimilarity], result of:
            0.056789972 = score(doc=850,freq=1.0), product of:
              0.28296694 = queryWeight, product of:
                4.2814875 = idf(docFreq=1668, maxDocs=44421)
                0.0660908 = queryNorm
              0.20069472 = fieldWeight in 850, product of:
                1.0 = tf(freq=1.0), with freq of:
                  1.0 = termFreq=1.0
                4.2814875 = idf(docFreq=1668, maxDocs=44421)
                0.046875 = fieldNorm(doc=850)
          0.22388378 = weight(abstract_txt:citation in 850) [ClassicSimilarity], result of:
            0.22388378 = score(doc=850,freq=7.0), product of:
              0.36915067 = queryWeight, product of:
                1.1421785 = boost
                4.890223 = idf(docFreq=907, maxDocs=44421)
                0.0660908 = queryNorm
              0.60648346 = fieldWeight in 850, product of:
                2.6457512 = tf(freq=7.0), with freq of:
                  7.0 = termFreq=7.0
                4.890223 = idf(docFreq=907, maxDocs=44421)
                0.046875 = fieldNorm(doc=850)
          0.450114 = weight(abstract_txt:mining in 850) [ClassicSimilarity], result of:
            0.450114 = score(doc=850,freq=7.0), product of:
              0.5880356 = queryWeight, product of:
                1.4415641 = boost
                6.1720386 = idf(docFreq=251, maxDocs=44421)
                0.0660908 = queryNorm
              0.7654537 = fieldWeight in 850, product of:
                2.6457512 = tf(freq=7.0), with freq of:
                  7.0 = termFreq=7.0
                6.1720386 = idf(docFreq=251, maxDocs=44421)
                0.046875 = fieldNorm(doc=850)
          0.17419365 = weight(abstract_txt:clustering in 850) [ClassicSimilarity], result of:
            0.17419365 = score(doc=850,freq=1.0), product of:
              0.5973692 = queryWeight, product of:
                1.4529597 = boost
                6.2208285 = idf(docFreq=239, maxDocs=44421)
                0.0660908 = queryNorm
              0.29160133 = fieldWeight in 850, product of:
                1.0 = tf(freq=1.0), with freq of:
                  1.0 = termFreq=1.0
                6.2208285 = idf(docFreq=239, maxDocs=44421)
                0.046875 = fieldNorm(doc=850)
        0.8 = coord(4/5)
    
  4. Liu, X.; Yu, S.; Janssens, F.; Glänzel, W.; Moreau, Y.; Moor, B.de: Weighted hybrid clustering by combining text mining and bibliometrics on a large-scale journal database (2010) 0.69
    0.68779016 = sum of:
      0.68779016 = product of:
        1.1463169 = sum of:
          0.09464995 = weight(abstract_txt:database in 451) [ClassicSimilarity], result of:
            0.09464995 = score(doc=451,freq=1.0), product of:
              0.28296694 = queryWeight, product of:
                4.2814875 = idf(docFreq=1668, maxDocs=44421)
                0.0660908 = queryNorm
              0.3344912 = fieldWeight in 451, product of:
                1.0 = tf(freq=1.0), with freq of:
                  1.0 = termFreq=1.0
                4.2814875 = idf(docFreq=1668, maxDocs=44421)
                0.078125 = fieldNorm(doc=451)
          0.2835452 = weight(abstract_txt:mining in 451) [ClassicSimilarity], result of:
            0.2835452 = score(doc=451,freq=1.0), product of:
              0.5880356 = queryWeight, product of:
                1.4415641 = boost
                6.1720386 = idf(docFreq=251, maxDocs=44421)
                0.0660908 = queryNorm
              0.48219052 = fieldWeight in 451, product of:
                1.0 = tf(freq=1.0), with freq of:
                  1.0 = termFreq=1.0
                6.1720386 = idf(docFreq=251, maxDocs=44421)
                0.078125 = fieldNorm(doc=451)
          0.7681218 = weight(abstract_txt:clustering in 451) [ClassicSimilarity], result of:
            0.7681218 = score(doc=451,freq=7.0), product of:
              0.5973692 = queryWeight, product of:
                1.4529597 = boost
                6.2208285 = idf(docFreq=239, maxDocs=44421)
                0.0660908 = queryNorm
              1.285841 = fieldWeight in 451, product of:
                2.6457512 = tf(freq=7.0), with freq of:
                  7.0 = termFreq=7.0
                6.2208285 = idf(docFreq=239, maxDocs=44421)
                0.078125 = fieldNorm(doc=451)
        0.6 = coord(3/5)
    
  5. Tho, Q.T.; Hui, S.C.; Fong, A.C.M.: ¬A citation-based document retrieval system for finding research expertise (2007) 0.64
    0.6401376 = sum of:
      0.6401376 = product of:
        0.80017203 = sum of:
          0.09464995 = weight(abstract_txt:database in 1956) [ClassicSimilarity], result of:
            0.09464995 = score(doc=1956,freq=1.0), product of:
              0.28296694 = queryWeight, product of:
                4.2814875 = idf(docFreq=1668, maxDocs=44421)
                0.0660908 = queryNorm
              0.3344912 = fieldWeight in 1956, product of:
                1.0 = tf(freq=1.0), with freq of:
                  1.0 = termFreq=1.0
                4.2814875 = idf(docFreq=1668, maxDocs=44421)
                0.078125 = fieldNorm(doc=1956)
          0.0954922 = weight(abstract_txt:document in 1956) [ClassicSimilarity], result of:
            0.0954922 = score(doc=1956,freq=1.0), product of:
              0.2846431 = queryWeight, product of:
                1.0029575 = boost
                4.29415 = idf(docFreq=1647, maxDocs=44421)
                0.0660908 = queryNorm
              0.33548045 = fieldWeight in 1956, product of:
                1.0 = tf(freq=1.0), with freq of:
                  1.0 = termFreq=1.0
                4.29415 = idf(docFreq=1647, maxDocs=44421)
                0.078125 = fieldNorm(doc=1956)
          0.19945152 = weight(abstract_txt:citation in 1956) [ClassicSimilarity], result of:
            0.19945152 = score(doc=1956,freq=2.0), product of:
              0.36915067 = queryWeight, product of:
                1.1421785 = boost
                4.890223 = idf(docFreq=907, maxDocs=44421)
                0.0660908 = queryNorm
              0.5402984 = fieldWeight in 1956, product of:
                1.4142135 = tf(freq=2.0), with freq of:
                  2.0 = termFreq=2.0
                4.890223 = idf(docFreq=907, maxDocs=44421)
                0.078125 = fieldNorm(doc=1956)
          0.41057837 = weight(abstract_txt:clustering in 1956) [ClassicSimilarity], result of:
            0.41057837 = score(doc=1956,freq=2.0), product of:
              0.5973692 = queryWeight, product of:
                1.4529597 = boost
                6.2208285 = idf(docFreq=239, maxDocs=44421)
                0.0660908 = queryNorm
              0.68731093 = fieldWeight in 1956, product of:
                1.4142135 = tf(freq=2.0), with freq of:
                  2.0 = termFreq=2.0
                6.2208285 = idf(docFreq=239, maxDocs=44421)
                0.078125 = fieldNorm(doc=1956)
        0.8 = coord(4/5)