Document (#18152)

Author
Thistlewaite, P.
Title
Automatic construction and management of large open webs
Source
Information processing and management. 33(1997) no.2, S.161-173
Year
1997
Abstract
Reviews the problems associated with manually created or maintained hyperdocument links, and the consequent need for automated methods. A number of techniques have been applied to the problem, including pattern-matching, information retrieval, and natural language processing. Describes a system for the automatic detection and management of structural and referential links. Addresses the issues of link-set soundness and completeness, open link management, and the particular problem engendered by large volatile hyperbases.
Footnote
Contribution to a special issue on methods and tools for the automatic construction of hypertext

Similar documents (content)

  1. Salton, G.: Automatic text structuring and summarization (1997) 0.08
    0.083394706 = sum of:
      0.083394706 = product of:
        0.5212169 = sum of:
          0.07822417 = weight(abstract_txt:pattern in 1145) [ClassicSimilarity], result of:
            0.07822417 = score(doc=1145,freq=1.0), product of:
              0.13376722 = queryWeight, product of:
                1.1861042 = boost
                6.2376356 = idf(docFreq=235, maxDocs=44421)
                0.018080352 = queryNorm
              0.5847783 = fieldWeight in 1145, product of:
                1.0 = tf(freq=1.0), with freq of:
                  1.0 = termFreq=1.0
                6.2376356 = idf(docFreq=235, maxDocs=44421)
                0.09375 = fieldNorm(doc=1145)
          0.18082939 = weight(abstract_txt:automatic in 1145) [ClassicSimilarity], result of:
            0.18082939 = score(doc=1145,freq=4.0), product of:
              0.18562013 = queryWeight, product of:
                1.975948 = boost
                5.1956835 = idf(docFreq=668, maxDocs=44421)
                0.018080352 = queryNorm
              0.97419065 = fieldWeight in 1145, product of:
                2.0 = tf(freq=4.0), with freq of:
                  4.0 = termFreq=4.0
                5.1956835 = idf(docFreq=668, maxDocs=44421)
                0.09375 = fieldNorm(doc=1145)
          0.09266516 = weight(abstract_txt:links in 1145) [ClassicSimilarity], result of:
            0.09266516 = score(doc=1145,freq=1.0), product of:
              0.18868761 = queryWeight, product of:
                1.9922079 = boost
                5.238438 = idf(docFreq=640, maxDocs=44421)
                0.018080352 = queryNorm
              0.4911036 = fieldWeight in 1145, product of:
                1.0 = tf(freq=1.0), with freq of:
                  1.0 = termFreq=1.0
                5.238438 = idf(docFreq=640, maxDocs=44421)
                0.09375 = fieldNorm(doc=1145)
          0.16949822 = weight(abstract_txt:link in 1145) [ClassicSimilarity], result of:
            0.16949822 = score(doc=1145,freq=2.0), product of:
              0.22399199 = queryWeight, product of:
                2.170597 = boost
                5.707506 = idf(docFreq=400, maxDocs=44421)
                0.018080352 = queryNorm
              0.75671554 = fieldWeight in 1145, product of:
                1.4142135 = tf(freq=2.0), with freq of:
                  2.0 = termFreq=2.0
                5.707506 = idf(docFreq=400, maxDocs=44421)
                0.09375 = fieldNorm(doc=1145)
        0.16 = coord(4/25)
    
  2. Sood, S.O.; Churchill, E.F.; Antin, J.: Automatic identification of personal insults on social news sites (2012) 0.07
    0.06738835 = sum of:
      0.06738835 = product of:
        0.33694172 = sum of:
          0.037759047 = weight(abstract_txt:automated in 976) [ClassicSimilarity], result of:
            0.037759047 = score(doc=976,freq=1.0), product of:
              0.10786086 = queryWeight, product of:
                1.0650743 = boost
                5.6011486 = idf(docFreq=445, maxDocs=44421)
                0.018080352 = queryNorm
              0.3500718 = fieldWeight in 976, product of:
                1.0 = tf(freq=1.0), with freq of:
                  1.0 = termFreq=1.0
                5.6011486 = idf(docFreq=445, maxDocs=44421)
                0.0625 = fieldNorm(doc=976)
          0.11569831 = weight(abstract_txt:detection in 976) [ClassicSimilarity], result of:
            0.11569831 = score(doc=976,freq=3.0), product of:
              0.15777111 = queryWeight, product of:
                1.288136 = boost
                6.774214 = idf(docFreq=137, maxDocs=44421)
                0.018080352 = queryNorm
              0.73333013 = fieldWeight in 976, product of:
                1.7320508 = tf(freq=3.0), with freq of:
                  3.0 = termFreq=3.0
                6.774214 = idf(docFreq=137, maxDocs=44421)
                0.0625 = fieldNorm(doc=976)
          0.038110506 = weight(abstract_txt:problem in 976) [ClassicSimilarity], result of:
            0.038110506 = score(doc=976,freq=1.0), product of:
              0.13673815 = queryWeight, product of:
                1.6959296 = boost
                4.4593854 = idf(docFreq=1396, maxDocs=44421)
                0.018080352 = queryNorm
              0.2787116 = fieldWeight in 976, product of:
                1.0 = tf(freq=1.0), with freq of:
                  1.0 = termFreq=1.0
                4.4593854 = idf(docFreq=1396, maxDocs=44421)
                0.0625 = fieldNorm(doc=976)
          0.060276464 = weight(abstract_txt:automatic in 976) [ClassicSimilarity], result of:
            0.060276464 = score(doc=976,freq=1.0), product of:
              0.18562013 = queryWeight, product of:
                1.975948 = boost
                5.1956835 = idf(docFreq=668, maxDocs=44421)
                0.018080352 = queryNorm
              0.32473022 = fieldWeight in 976, product of:
                1.0 = tf(freq=1.0), with freq of:
                  1.0 = termFreq=1.0
                5.1956835 = idf(docFreq=668, maxDocs=44421)
                0.0625 = fieldNorm(doc=976)
          0.08509736 = weight(abstract_txt:management in 976) [ClassicSimilarity], result of:
            0.08509736 = score(doc=976,freq=3.0), product of:
              0.18540749 = queryWeight, product of:
                2.4186456 = boost
                4.239827 = idf(docFreq=1739, maxDocs=44421)
                0.018080352 = queryNorm
              0.45897475 = fieldWeight in 976, product of:
                1.7320508 = tf(freq=3.0), with freq of:
                  3.0 = termFreq=3.0
                4.239827 = idf(docFreq=1739, maxDocs=44421)
                0.0625 = fieldNorm(doc=976)
        0.2 = coord(5/25)
    
  3. May, A.D.: Automatic classification of e-mail messages by message type (1997) 0.06
    0.062296893 = sum of:
      0.062296893 = product of:
        0.3893556 = sum of:
          0.05663857 = weight(abstract_txt:automated in 6561) [ClassicSimilarity], result of:
            0.05663857 = score(doc=6561,freq=1.0), product of:
              0.10786086 = queryWeight, product of:
                1.0650743 = boost
                5.6011486 = idf(docFreq=445, maxDocs=44421)
                0.018080352 = queryNorm
              0.5251077 = fieldWeight in 6561, product of:
                1.0 = tf(freq=1.0), with freq of:
                  1.0 = termFreq=1.0
                5.6011486 = idf(docFreq=445, maxDocs=44421)
                0.09375 = fieldNorm(doc=6561)
          0.07109189 = weight(abstract_txt:matching in 6561) [ClassicSimilarity], result of:
            0.07109189 = score(doc=6561,freq=1.0), product of:
              0.12550732 = queryWeight, product of:
                1.1489007 = boost
                6.0419855 = idf(docFreq=286, maxDocs=44421)
                0.018080352 = queryNorm
              0.5664362 = fieldWeight in 6561, product of:
                1.0 = tf(freq=1.0), with freq of:
                  1.0 = termFreq=1.0
                6.0419855 = idf(docFreq=286, maxDocs=44421)
                0.09375 = fieldNorm(doc=6561)
          0.13375944 = weight(abstract_txt:manually in 6561) [ClassicSimilarity], result of:
            0.13375944 = score(doc=6561,freq=2.0), product of:
              0.1518199 = queryWeight, product of:
                1.2636079 = boost
                6.6452217 = idf(docFreq=156, maxDocs=44421)
                0.018080352 = queryNorm
              0.8810402 = fieldWeight in 6561, product of:
                1.4142135 = tf(freq=2.0), with freq of:
                  2.0 = termFreq=2.0
                6.6452217 = idf(docFreq=156, maxDocs=44421)
                0.09375 = fieldNorm(doc=6561)
          0.1278657 = weight(abstract_txt:automatic in 6561) [ClassicSimilarity], result of:
            0.1278657 = score(doc=6561,freq=2.0), product of:
              0.18562013 = queryWeight, product of:
                1.975948 = boost
                5.1956835 = idf(docFreq=668, maxDocs=44421)
                0.018080352 = queryNorm
              0.68885684 = fieldWeight in 6561, product of:
                1.4142135 = tf(freq=2.0), with freq of:
                  2.0 = termFreq=2.0
                5.1956835 = idf(docFreq=668, maxDocs=44421)
                0.09375 = fieldNorm(doc=6561)
        0.16 = coord(4/25)
    
  4. Maurer, H.: Object-oriented modelling of hyperstructure : overcoming the static link deficiency (1994) 0.06
    0.061361153 = sum of:
      0.061361153 = product of:
        0.38350722 = sum of:
          0.04709431 = weight(abstract_txt:large in 832) [ClassicSimilarity], result of:
            0.04709431 = score(doc=832,freq=1.0), product of:
              0.13569552 = queryWeight, product of:
                1.6894515 = boost
                4.4423513 = idf(docFreq=1420, maxDocs=44421)
                0.018080352 = queryNorm
              0.3470587 = fieldWeight in 832, product of:
                1.0 = tf(freq=1.0), with freq of:
                  1.0 = termFreq=1.0
                4.4423513 = idf(docFreq=1420, maxDocs=44421)
                0.078125 = fieldNorm(doc=832)
          0.13375065 = weight(abstract_txt:links in 832) [ClassicSimilarity], result of:
            0.13375065 = score(doc=832,freq=3.0), product of:
              0.18868761 = queryWeight, product of:
                1.9922079 = boost
                5.238438 = idf(docFreq=640, maxDocs=44421)
                0.018080352 = queryNorm
              0.708847 = fieldWeight in 832, product of:
                1.7320508 = tf(freq=3.0), with freq of:
                  3.0 = termFreq=3.0
                5.238438 = idf(docFreq=640, maxDocs=44421)
                0.078125 = fieldNorm(doc=832)
          0.14124851 = weight(abstract_txt:link in 832) [ClassicSimilarity], result of:
            0.14124851 = score(doc=832,freq=2.0), product of:
              0.22399199 = queryWeight, product of:
                2.170597 = boost
                5.707506 = idf(docFreq=400, maxDocs=44421)
                0.018080352 = queryNorm
              0.6305963 = fieldWeight in 832, product of:
                1.4142135 = tf(freq=2.0), with freq of:
                  2.0 = termFreq=2.0
                5.707506 = idf(docFreq=400, maxDocs=44421)
                0.078125 = fieldNorm(doc=832)
          0.061413724 = weight(abstract_txt:management in 832) [ClassicSimilarity], result of:
            0.061413724 = score(doc=832,freq=1.0), product of:
              0.18540749 = queryWeight, product of:
                2.4186456 = boost
                4.239827 = idf(docFreq=1739, maxDocs=44421)
                0.018080352 = queryNorm
              0.33123648 = fieldWeight in 832, product of:
                1.0 = tf(freq=1.0), with freq of:
                  1.0 = termFreq=1.0
                4.239827 = idf(docFreq=1739, maxDocs=44421)
                0.078125 = fieldNorm(doc=832)
        0.16 = coord(4/25)
    
  5. Perugini, S.: Symbolic links in the Open Directory Project (2008) 0.06
    0.0597305 = sum of:
      0.0597305 = product of:
        0.37331563 = sum of:
          0.037461773 = weight(abstract_txt:structural in 3070) [ClassicSimilarity], result of:
            0.037461773 = score(doc=3070,freq=1.0), product of:
              0.11728345 = queryWeight, product of:
                1.1106222 = boost
                5.8406816 = idf(docFreq=350, maxDocs=44421)
                0.018080352 = queryNorm
              0.31941226 = fieldWeight in 3070, product of:
                1.0 = tf(freq=1.0), with freq of:
                  1.0 = termFreq=1.0
                5.8406816 = idf(docFreq=350, maxDocs=44421)
                0.0546875 = fieldNorm(doc=3070)
          0.042083003 = weight(abstract_txt:open in 3070) [ClassicSimilarity], result of:
            0.042083003 = score(doc=3070,freq=1.0), product of:
              0.15968312 = queryWeight, product of:
                1.8327047 = boost
                4.8190303 = idf(docFreq=974, maxDocs=44421)
                0.018080352 = queryNorm
              0.26354071 = fieldWeight in 3070, product of:
                1.0 = tf(freq=1.0), with freq of:
                  1.0 = termFreq=1.0
                4.8190303 = idf(docFreq=974, maxDocs=44421)
                0.0546875 = fieldNorm(doc=3070)
          0.1948969 = weight(abstract_txt:links in 3070) [ClassicSimilarity], result of:
            0.1948969 = score(doc=3070,freq=13.0), product of:
              0.18868761 = queryWeight, product of:
                1.9922079 = boost
                5.238438 = idf(docFreq=640, maxDocs=44421)
                0.018080352 = queryNorm
              1.0329078 = fieldWeight in 3070, product of:
                3.6055512 = tf(freq=13.0), with freq of:
                  13.0 = termFreq=13.0
                5.238438 = idf(docFreq=640, maxDocs=44421)
                0.0546875 = fieldNorm(doc=3070)
          0.09887396 = weight(abstract_txt:link in 3070) [ClassicSimilarity], result of:
            0.09887396 = score(doc=3070,freq=2.0), product of:
              0.22399199 = queryWeight, product of:
                2.170597 = boost
                5.707506 = idf(docFreq=400, maxDocs=44421)
                0.018080352 = queryNorm
              0.4414174 = fieldWeight in 3070, product of:
                1.4142135 = tf(freq=2.0), with freq of:
                  2.0 = termFreq=2.0
                5.707506 = idf(docFreq=400, maxDocs=44421)
                0.0546875 = fieldNorm(doc=3070)
        0.16 = coord(4/25)