Document (#22578)

Author
Chowdhury, G.G.
Title
Template mining for information extraction from digital documents
Source
Library trends. 48(1999) no.1, S.182-208
Year
1999
Theme
Data Mining

Similar documents (author)

  1. Chowdhury, G.G.; Chowdhury, S.: ¬An overview of the information retrieval features of twenty digital libraries (2000) 5.65
    5.648295 = sum of:
      5.648295 = weight(author_txt:chowdhury in 518) [ClassicSimilarity], result of:
        5.648295 = fieldWeight in 518, product of:
          1.4142135 = tf(freq=2.0), with freq of:
            2.0 = termFreq=2.0
          7.9878955 = idf(docFreq=40, maxDocs=44421)
          0.5 = fieldNorm(doc=518)
    
  2. Chowdhury, S.; Chowdhury, G.G.: Text retrieval system : an overview (1992) 5.65
    5.648295 = sum of:
      5.648295 = weight(author_txt:chowdhury in 6507) [ClassicSimilarity], result of:
        5.648295 = fieldWeight in 6507, product of:
          1.4142135 = tf(freq=2.0), with freq of:
            2.0 = termFreq=2.0
          7.9878955 = idf(docFreq=40, maxDocs=44421)
          0.5 = fieldNorm(doc=6507)
    
  3. Chowdhury, S.; Chowdhury, G.G.: Development of library management system using Micro-CDS/ISIS (1992) 5.65
    5.648295 = sum of:
      5.648295 = weight(author_txt:chowdhury in 440) [ClassicSimilarity], result of:
        5.648295 = fieldWeight in 440, product of:
          1.4142135 = tf(freq=2.0), with freq of:
            2.0 = termFreq=2.0
          7.9878955 = idf(docFreq=40, maxDocs=44421)
          0.5 = fieldNorm(doc=440)
    
  4. Chowdhury, G.G.; Chowdhury, S.: Text retrieval and library management software in India (1994) 5.65
    5.648295 = sum of:
      5.648295 = weight(author_txt:chowdhury in 2542) [ClassicSimilarity], result of:
        5.648295 = fieldWeight in 2542, product of:
          1.4142135 = tf(freq=2.0), with freq of:
            2.0 = termFreq=2.0
          7.9878955 = idf(docFreq=40, maxDocs=44421)
          0.5 = fieldNorm(doc=2542)
    
  5. Chowdhury, S.; Chowdhury, G.G.: Using DDC to create a visual knowledge map as an aid to online information retrieval (2004) 5.65
    5.648295 = sum of:
      5.648295 = weight(author_txt:chowdhury in 3643) [ClassicSimilarity], result of:
        5.648295 = fieldWeight in 3643, product of:
          1.4142135 = tf(freq=2.0), with freq of:
            2.0 = termFreq=2.0
          7.9878955 = idf(docFreq=40, maxDocs=44421)
          0.5 = fieldNorm(doc=3643)
    

Similar documents (content)

  1. Lawson, M.: Automatic extraction of citations from the text of English-language patents : an example of template mining (1996) 0.82
    0.8192773 = sum of:
      0.8192773 = product of:
        1.1469882 = sum of:
          0.020441484 = weight(abstract_txt:from in 3654) [ClassicSimilarity], result of:
            0.020441484 = score(doc=3654,freq=2.0), product of:
              0.083811365 = queryWeight, product of:
                1.1407663 = boost
                2.759399 = idf(docFreq=7646, maxDocs=44421)
                0.02662513 = queryNorm
              0.2438987 = fieldWeight in 3654, product of:
                1.4142135 = tf(freq=2.0), with freq of:
                  2.0 = termFreq=2.0
                2.759399 = idf(docFreq=7646, maxDocs=44421)
                0.0625 = fieldNorm(doc=3654)
          0.068204135 = weight(abstract_txt:documents in 3654) [ClassicSimilarity], result of:
            0.068204135 = score(doc=3654,freq=2.0), product of:
              0.18714078 = queryWeight, product of:
                1.7046273 = boost
                4.123322 = idf(docFreq=1954, maxDocs=44421)
                0.02662513 = queryNorm
              0.3644536 = fieldWeight in 3654, product of:
                1.4142135 = tf(freq=2.0), with freq of:
                  2.0 = termFreq=2.0
                4.123322 = idf(docFreq=1954, maxDocs=44421)
                0.0625 = fieldNorm(doc=3654)
          0.16174833 = weight(abstract_txt:mining in 3654) [ClassicSimilarity], result of:
            0.16174833 = score(doc=3654,freq=1.0), product of:
              0.4193061 = queryWeight, product of:
                2.5515895 = boost
                6.1720386 = idf(docFreq=251, maxDocs=44421)
                0.02662513 = queryNorm
              0.3857524 = fieldWeight in 3654, product of:
                1.0 = tf(freq=1.0), with freq of:
                  1.0 = termFreq=1.0
                6.1720386 = idf(docFreq=251, maxDocs=44421)
                0.0625 = fieldNorm(doc=3654)
          0.23098214 = weight(abstract_txt:extraction in 3654) [ClassicSimilarity], result of:
            0.23098214 = score(doc=3654,freq=2.0), product of:
              0.4220335 = queryWeight, product of:
                2.5598745 = boost
                6.192079 = idf(docFreq=246, maxDocs=44421)
                0.02662513 = queryNorm
              0.5473076 = fieldWeight in 3654, product of:
                1.4142135 = tf(freq=2.0), with freq of:
                  2.0 = termFreq=2.0
                6.192079 = idf(docFreq=246, maxDocs=44421)
                0.0625 = fieldNorm(doc=3654)
          0.6656121 = weight(abstract_txt:template in 3654) [ClassicSimilarity], result of:
            0.6656121 = score(doc=3654,freq=3.0), product of:
              0.7465834 = queryWeight, product of:
                3.4047434 = boost
                8.235732 = idf(docFreq=31, maxDocs=44421)
                0.02662513 = queryNorm
              0.89154416 = fieldWeight in 3654, product of:
                1.7320508 = tf(freq=3.0), with freq of:
                  3.0 = termFreq=3.0
                8.235732 = idf(docFreq=31, maxDocs=44421)
                0.0625 = fieldNorm(doc=3654)
        0.71428573 = coord(5/7)
    
  2. Barrio, P.; Gravano, L.: Sampling strategies for information extraction over the deep web (2017) 0.48
    0.47620827 = sum of:
      0.47620827 = product of:
        0.66669154 = sum of:
          0.024096861 = weight(abstract_txt:information in 4412) [ClassicSimilarity], result of:
            0.024096861 = score(doc=4412,freq=8.0), product of:
              0.06440352 = queryWeight, product of:
                2.4188995 = idf(docFreq=10748, maxDocs=44421)
                0.02662513 = queryNorm
              0.37415442 = fieldWeight in 4412, product of:
                2.828427 = tf(freq=8.0), with freq of:
                  8.0 = termFreq=8.0
                2.4188995 = idf(docFreq=10748, maxDocs=44421)
                0.0546875 = fieldNorm(doc=4412)
          0.012647523 = weight(abstract_txt:from in 4412) [ClassicSimilarity], result of:
            0.012647523 = score(doc=4412,freq=1.0), product of:
              0.083811365 = queryWeight, product of:
                1.1407663 = boost
                2.759399 = idf(docFreq=7646, maxDocs=44421)
                0.02662513 = queryNorm
              0.15090463 = fieldWeight in 4412, product of:
                1.0 = tf(freq=1.0), with freq of:
                  1.0 = termFreq=1.0
                2.759399 = idf(docFreq=7646, maxDocs=44421)
                0.0546875 = fieldNorm(doc=4412)
          0.059678618 = weight(abstract_txt:documents in 4412) [ClassicSimilarity], result of:
            0.059678618 = score(doc=4412,freq=2.0), product of:
              0.18714078 = queryWeight, product of:
                1.7046273 = boost
                4.123322 = idf(docFreq=1954, maxDocs=44421)
                0.02662513 = queryNorm
              0.31889692 = fieldWeight in 4412, product of:
                1.4142135 = tf(freq=2.0), with freq of:
                  2.0 = termFreq=2.0
                4.123322 = idf(docFreq=1954, maxDocs=44421)
                0.0546875 = fieldNorm(doc=4412)
          0.1415298 = weight(abstract_txt:mining in 4412) [ClassicSimilarity], result of:
            0.1415298 = score(doc=4412,freq=1.0), product of:
              0.4193061 = queryWeight, product of:
                2.5515895 = boost
                6.1720386 = idf(docFreq=251, maxDocs=44421)
                0.02662513 = queryNorm
              0.33753335 = fieldWeight in 4412, product of:
                1.0 = tf(freq=1.0), with freq of:
                  1.0 = termFreq=1.0
                6.1720386 = idf(docFreq=251, maxDocs=44421)
                0.0546875 = fieldNorm(doc=4412)
          0.42873874 = weight(abstract_txt:extraction in 4412) [ClassicSimilarity], result of:
            0.42873874 = score(doc=4412,freq=9.0), product of:
              0.4220335 = queryWeight, product of:
                2.5598745 = boost
                6.192079 = idf(docFreq=246, maxDocs=44421)
                0.02662513 = queryNorm
              1.015888 = fieldWeight in 4412, product of:
                3.0 = tf(freq=9.0), with freq of:
                  9.0 = termFreq=9.0
                6.192079 = idf(docFreq=246, maxDocs=44421)
                0.0546875 = fieldNorm(doc=4412)
        0.71428573 = coord(5/7)
    
  3. Yim, W.-w.; Kwan, S.W.; Yetisgen, M.: Classifying tumor event attributes in radiology reports (2017) 0.46
    0.46386164 = sum of:
      0.46386164 = product of:
        0.81175786 = sum of:
          0.01686429 = weight(abstract_txt:information in 4929) [ClassicSimilarity], result of:
            0.01686429 = score(doc=4929,freq=3.0), product of:
              0.06440352 = queryWeight, product of:
                2.4188995 = idf(docFreq=10748, maxDocs=44421)
                0.02662513 = queryNorm
              0.26185355 = fieldWeight in 4929, product of:
                1.7320508 = tf(freq=3.0), with freq of:
                  3.0 = termFreq=3.0
                2.4188995 = idf(docFreq=10748, maxDocs=44421)
                0.0625 = fieldNorm(doc=4929)
          0.020441484 = weight(abstract_txt:from in 4929) [ClassicSimilarity], result of:
            0.020441484 = score(doc=4929,freq=2.0), product of:
              0.083811365 = queryWeight, product of:
                1.1407663 = boost
                2.759399 = idf(docFreq=7646, maxDocs=44421)
                0.02662513 = queryNorm
              0.2438987 = fieldWeight in 4929, product of:
                1.4142135 = tf(freq=2.0), with freq of:
                  2.0 = termFreq=2.0
                2.759399 = idf(docFreq=7646, maxDocs=44421)
                0.0625 = fieldNorm(doc=4929)
          0.23098214 = weight(abstract_txt:extraction in 4929) [ClassicSimilarity], result of:
            0.23098214 = score(doc=4929,freq=2.0), product of:
              0.4220335 = queryWeight, product of:
                2.5598745 = boost
                6.192079 = idf(docFreq=246, maxDocs=44421)
                0.02662513 = queryNorm
              0.5473076 = fieldWeight in 4929, product of:
                1.4142135 = tf(freq=2.0), with freq of:
                  2.0 = termFreq=2.0
                6.192079 = idf(docFreq=246, maxDocs=44421)
                0.0625 = fieldNorm(doc=4929)
          0.54346997 = weight(abstract_txt:template in 4929) [ClassicSimilarity], result of:
            0.54346997 = score(doc=4929,freq=2.0), product of:
              0.7465834 = queryWeight, product of:
                3.4047434 = boost
                8.235732 = idf(docFreq=31, maxDocs=44421)
                0.02662513 = queryNorm
              0.72794276 = fieldWeight in 4929, product of:
                1.4142135 = tf(freq=2.0), with freq of:
                  2.0 = termFreq=2.0
                8.235732 = idf(docFreq=31, maxDocs=44421)
                0.0625 = fieldNorm(doc=4929)
        0.5714286 = coord(4/7)
    
  4. Ku, L.-W.; Chen, H.-H.: Mining opinions from the Web : beyond relevance retrieval (2007) 0.43
    0.4300042 = sum of:
      0.4300042 = product of:
        0.6020059 = sum of:
          0.021771707 = weight(abstract_txt:information in 1605) [ClassicSimilarity], result of:
            0.021771707 = score(doc=1605,freq=5.0), product of:
              0.06440352 = queryWeight, product of:
                2.4188995 = idf(docFreq=10748, maxDocs=44421)
                0.02662513 = queryNorm
              0.3380515 = fieldWeight in 1605, product of:
                2.236068 = tf(freq=5.0), with freq of:
                  5.0 = termFreq=5.0
                2.4188995 = idf(docFreq=10748, maxDocs=44421)
                0.0625 = fieldNorm(doc=1605)
          0.028908623 = weight(abstract_txt:from in 1605) [ClassicSimilarity], result of:
            0.028908623 = score(doc=1605,freq=4.0), product of:
              0.083811365 = queryWeight, product of:
                1.1407663 = boost
                2.759399 = idf(docFreq=7646, maxDocs=44421)
                0.02662513 = queryNorm
              0.34492487 = fieldWeight in 1605, product of:
                2.0 = tf(freq=4.0), with freq of:
                  4.0 = termFreq=4.0
                2.759399 = idf(docFreq=7646, maxDocs=44421)
                0.0625 = fieldNorm(doc=1605)
          0.10784021 = weight(abstract_txt:documents in 1605) [ClassicSimilarity], result of:
            0.10784021 = score(doc=1605,freq=5.0), product of:
              0.18714078 = queryWeight, product of:
                1.7046273 = boost
                4.123322 = idf(docFreq=1954, maxDocs=44421)
                0.02662513 = queryNorm
              0.5762518 = fieldWeight in 1605, product of:
                2.236068 = tf(freq=5.0), with freq of:
                  5.0 = termFreq=5.0
                4.123322 = idf(docFreq=1954, maxDocs=44421)
                0.0625 = fieldNorm(doc=1605)
          0.2801563 = weight(abstract_txt:mining in 1605) [ClassicSimilarity], result of:
            0.2801563 = score(doc=1605,freq=3.0), product of:
              0.4193061 = queryWeight, product of:
                2.5515895 = boost
                6.1720386 = idf(docFreq=251, maxDocs=44421)
                0.02662513 = queryNorm
              0.66814274 = fieldWeight in 1605, product of:
                1.7320508 = tf(freq=3.0), with freq of:
                  3.0 = termFreq=3.0
                6.1720386 = idf(docFreq=251, maxDocs=44421)
                0.0625 = fieldNorm(doc=1605)
          0.16332905 = weight(abstract_txt:extraction in 1605) [ClassicSimilarity], result of:
            0.16332905 = score(doc=1605,freq=1.0), product of:
              0.4220335 = queryWeight, product of:
                2.5598745 = boost
                6.192079 = idf(docFreq=246, maxDocs=44421)
                0.02662513 = queryNorm
              0.38700494 = fieldWeight in 1605, product of:
                1.0 = tf(freq=1.0), with freq of:
                  1.0 = termFreq=1.0
                6.192079 = idf(docFreq=246, maxDocs=44421)
                0.0625 = fieldNorm(doc=1605)
        0.71428573 = coord(5/7)
    
  5. Yang, T.-H.; Hsieh, Y.-L.; Liu, S.-H.; Chang, Y.-C.; Hsu, W.-L.: ¬A flexible template generation and matching method with applications for publication reference metadata extraction (2021) 0.40
    0.40356353 = sum of:
      0.40356353 = product of:
        0.94164824 = sum of:
          0.009736602 = weight(abstract_txt:information in 1064) [ClassicSimilarity], result of:
            0.009736602 = score(doc=1064,freq=1.0), product of:
              0.06440352 = queryWeight, product of:
                2.4188995 = idf(docFreq=10748, maxDocs=44421)
                0.02662513 = queryNorm
              0.15118122 = fieldWeight in 1064, product of:
                1.0 = tf(freq=1.0), with freq of:
                  1.0 = termFreq=1.0
                2.4188995 = idf(docFreq=10748, maxDocs=44421)
                0.0625 = fieldNorm(doc=1064)
          0.16332905 = weight(abstract_txt:extraction in 1064) [ClassicSimilarity], result of:
            0.16332905 = score(doc=1064,freq=1.0), product of:
              0.4220335 = queryWeight, product of:
                2.5598745 = boost
                6.192079 = idf(docFreq=246, maxDocs=44421)
                0.02662513 = queryNorm
              0.38700494 = fieldWeight in 1064, product of:
                1.0 = tf(freq=1.0), with freq of:
                  1.0 = termFreq=1.0
                6.192079 = idf(docFreq=246, maxDocs=44421)
                0.0625 = fieldNorm(doc=1064)
          0.7685826 = weight(abstract_txt:template in 1064) [ClassicSimilarity], result of:
            0.7685826 = score(doc=1064,freq=4.0), product of:
              0.7465834 = queryWeight, product of:
                3.4047434 = boost
                8.235732 = idf(docFreq=31, maxDocs=44421)
                0.02662513 = queryNorm
              1.0294665 = fieldWeight in 1064, product of:
                2.0 = tf(freq=4.0), with freq of:
                  4.0 = termFreq=4.0
                8.235732 = idf(docFreq=31, maxDocs=44421)
                0.0625 = fieldNorm(doc=1064)
        0.42857143 = coord(3/7)