Document (#18153)

Author
Thistlewaite, P.
Title
Automatic construction and management of large open webs
Source
Information processing and management. 33(1997) no.2, S.161-173
Year
1997
Abstract
Reviews the problems associated with manually created or maintained hyperdocument links, and the consequent need for automated methods. A number of techniques have been applied to the problem, including pattern-matching, information retrieval, and natural language processing. Describes a system for the automatic detection and management of structural and referential links. Addresses the issues of link-set soundness and completeness, open link management, and the particular problem engendered by large volatile hyperbases.
Footnote
Contribution to a special issue on methods and tools for the automatic construction of hypertext

Similar documents (content)

  1. Salton, G.: Automatic text structuring and summarization (1997) 0.08
    0.0834136 = sum of:
      0.0834136 = product of:
        0.521335 = sum of:
          0.07867689 = weight(abstract_txt:pattern in 1146) [ClassicSimilarity], result of:
            0.07867689 = score(doc=1146,freq=1.0), product of:
              0.13417815 = queryWeight, product of:
                1.1839443 = boost
                6.2545214 = idf(docFreq=220, maxDocs=42306)
                0.018119927 = queryNorm
              0.5863614 = fieldWeight in 1146, product of:
                1.0 = tf(freq=1.0), with freq of:
                  1.0 = termFreq=1.0
                6.2545214 = idf(docFreq=220, maxDocs=42306)
                0.09375 = fieldNorm(doc=1146)
          0.18043095 = weight(abstract_txt:automatic in 1146) [ClassicSimilarity], result of:
            0.18043095 = score(doc=1146,freq=4.0), product of:
              0.18520288 = queryWeight, product of:
                1.9671127 = boost
                5.1959147 = idf(docFreq=636, maxDocs=42306)
                0.018119927 = queryNorm
              0.974234 = fieldWeight in 1146, product of:
                2.0 = tf(freq=4.0), with freq of:
                  4.0 = termFreq=4.0
                5.1959147 = idf(docFreq=636, maxDocs=42306)
                0.09375 = fieldNorm(doc=1146)
          0.0919729 = weight(abstract_txt:links in 1146) [ClassicSimilarity], result of:
            0.0919729 = score(doc=1146,freq=1.0), product of:
              0.18760034 = queryWeight, product of:
                1.9798039 = boost
                5.2294374 = idf(docFreq=615, maxDocs=42306)
                0.018119927 = queryNorm
              0.49025977 = fieldWeight in 1146, product of:
                1.0 = tf(freq=1.0), with freq of:
                  1.0 = termFreq=1.0
                5.2294374 = idf(docFreq=615, maxDocs=42306)
                0.09375 = fieldNorm(doc=1146)
          0.17025426 = weight(abstract_txt:link in 1146) [ClassicSimilarity], result of:
            0.17025426 = score(doc=1146,freq=2.0), product of:
              0.22448245 = queryWeight, product of:
                2.1656914 = boost
                5.720439 = idf(docFreq=376, maxDocs=42306)
                0.018119927 = queryNorm
              0.7584302 = fieldWeight in 1146, product of:
                1.4142135 = tf(freq=2.0), with freq of:
                  2.0 = termFreq=2.0
                5.720439 = idf(docFreq=376, maxDocs=42306)
                0.09375 = fieldNorm(doc=1146)
        0.16 = coord(4/25)
    
  2. Sood, S.O.; Churchill, E.F.; Antin, J.: Automatic identification of personal insults on social news sites (2012) 0.07
    0.068417095 = sum of:
      0.068417095 = product of:
        0.34208548 = sum of:
          0.038142018 = weight(abstract_txt:automated in 1977) [ClassicSimilarity], result of:
            0.038142018 = score(doc=1977,freq=1.0), product of:
              0.10850431 = queryWeight, product of:
                1.0646672 = boost
                5.624406 = idf(docFreq=414, maxDocs=42306)
                0.018119927 = queryNorm
              0.35152537 = fieldWeight in 1977, product of:
                1.0 = tf(freq=1.0), with freq of:
                  1.0 = termFreq=1.0
                5.624406 = idf(docFreq=414, maxDocs=42306)
                0.0625 = fieldNorm(doc=1977)
          0.12014134 = weight(abstract_txt:detection in 1977) [ClassicSimilarity], result of:
            0.12014134 = score(doc=1977,freq=3.0), product of:
              0.16165872 = queryWeight, product of:
                1.2995409 = boost
                6.8651924 = idf(docFreq=119, maxDocs=42306)
                0.018119927 = queryNorm
              0.74317884 = fieldWeight in 1977, product of:
                1.7320508 = tf(freq=3.0), with freq of:
                  3.0 = termFreq=3.0
                6.8651924 = idf(docFreq=119, maxDocs=42306)
                0.0625 = fieldNorm(doc=1977)
          0.038243648 = weight(abstract_txt:problem in 1977) [ClassicSimilarity], result of:
            0.038243648 = score(doc=1977,freq=1.0), product of:
              0.1369496 = queryWeight, product of:
                1.6915536 = boost
                4.4680552 = idf(docFreq=1318, maxDocs=42306)
                0.018119927 = queryNorm
              0.27925345 = fieldWeight in 1977, product of:
                1.0 = tf(freq=1.0), with freq of:
                  1.0 = termFreq=1.0
                4.4680552 = idf(docFreq=1318, maxDocs=42306)
                0.0625 = fieldNorm(doc=1977)
          0.06014365 = weight(abstract_txt:automatic in 1977) [ClassicSimilarity], result of:
            0.06014365 = score(doc=1977,freq=1.0), product of:
              0.18520288 = queryWeight, product of:
                1.9671127 = boost
                5.1959147 = idf(docFreq=636, maxDocs=42306)
                0.018119927 = queryNorm
              0.32474467 = fieldWeight in 1977, product of:
                1.0 = tf(freq=1.0), with freq of:
                  1.0 = termFreq=1.0
                5.1959147 = idf(docFreq=636, maxDocs=42306)
                0.0625 = fieldNorm(doc=1977)
          0.085414834 = weight(abstract_txt:management in 1977) [ClassicSimilarity], result of:
            0.085414834 = score(doc=1977,freq=3.0), product of:
              0.18572345 = queryWeight, product of:
                2.4125948 = boost
                4.248405 = idf(docFreq=1642, maxDocs=42306)
                0.018119927 = queryNorm
              0.45990333 = fieldWeight in 1977, product of:
                1.7320508 = tf(freq=3.0), with freq of:
                  3.0 = termFreq=3.0
                4.248405 = idf(docFreq=1642, maxDocs=42306)
                0.0625 = fieldNorm(doc=1977)
        0.2 = coord(5/25)
    
  3. May, A.D.: Automatic classification of e-mail messages by message type (1997) 0.06
    0.06265503 = sum of:
      0.06265503 = product of:
        0.39159396 = sum of:
          0.05721303 = weight(abstract_txt:automated in 6562) [ClassicSimilarity], result of:
            0.05721303 = score(doc=6562,freq=1.0), product of:
              0.10850431 = queryWeight, product of:
                1.0646672 = boost
                5.624406 = idf(docFreq=414, maxDocs=42306)
                0.018119927 = queryNorm
              0.5272881 = fieldWeight in 6562, product of:
                1.0 = tf(freq=1.0), with freq of:
                  1.0 = termFreq=1.0
                5.624406 = idf(docFreq=414, maxDocs=42306)
                0.09375 = fieldNorm(doc=6562)
          0.07149027 = weight(abstract_txt:matching in 6562) [ClassicSimilarity], result of:
            0.07149027 = score(doc=6562,freq=1.0), product of:
              0.12587756 = queryWeight, product of:
                1.1467389 = boost
                6.057973 = idf(docFreq=268, maxDocs=42306)
                0.018119927 = queryNorm
              0.567935 = fieldWeight in 6562, product of:
                1.0 = tf(freq=1.0), with freq of:
                  1.0 = termFreq=1.0
                6.057973 = idf(docFreq=268, maxDocs=42306)
                0.09375 = fieldNorm(doc=6562)
          0.1353067 = weight(abstract_txt:manually in 6562) [ClassicSimilarity], result of:
            0.1353067 = score(doc=6562,freq=2.0), product of:
              0.15286918 = queryWeight, product of:
                1.2637185 = boost
                6.6759505 = idf(docFreq=144, maxDocs=42306)
                0.018119927 = queryNorm
              0.8851143 = fieldWeight in 6562, product of:
                1.4142135 = tf(freq=2.0), with freq of:
                  2.0 = termFreq=2.0
                6.6759505 = idf(docFreq=144, maxDocs=42306)
                0.09375 = fieldNorm(doc=6562)
          0.12758395 = weight(abstract_txt:automatic in 6562) [ClassicSimilarity], result of:
            0.12758395 = score(doc=6562,freq=2.0), product of:
              0.18520288 = queryWeight, product of:
                1.9671127 = boost
                5.1959147 = idf(docFreq=636, maxDocs=42306)
                0.018119927 = queryNorm
              0.6888875 = fieldWeight in 6562, product of:
                1.4142135 = tf(freq=2.0), with freq of:
                  2.0 = termFreq=2.0
                5.1959147 = idf(docFreq=636, maxDocs=42306)
                0.09375 = fieldNorm(doc=6562)
        0.16 = coord(4/25)
    
  4. Maurer, H.: Object-oriented modelling of hyperstructure : overcoming the static link deficiency (1994) 0.06
    0.061471906 = sum of:
      0.061471906 = product of:
        0.3841994 = sum of:
          0.047926556 = weight(abstract_txt:large in 833) [ClassicSimilarity], result of:
            0.047926556 = score(doc=833,freq=1.0), product of:
              0.13718249 = queryWeight, product of:
                1.6929913 = boost
                4.471853 = idf(docFreq=1313, maxDocs=42306)
                0.018119927 = queryNorm
              0.3493635 = fieldWeight in 833, product of:
                1.0 = tf(freq=1.0), with freq of:
                  1.0 = termFreq=1.0
                4.471853 = idf(docFreq=1313, maxDocs=42306)
                0.078125 = fieldNorm(doc=833)
          0.13275144 = weight(abstract_txt:links in 833) [ClassicSimilarity], result of:
            0.13275144 = score(doc=833,freq=3.0), product of:
              0.18760034 = queryWeight, product of:
                1.9798039 = boost
                5.2294374 = idf(docFreq=615, maxDocs=42306)
                0.018119927 = queryNorm
              0.70762897 = fieldWeight in 833, product of:
                1.7320508 = tf(freq=3.0), with freq of:
                  3.0 = termFreq=3.0
                5.2294374 = idf(docFreq=615, maxDocs=42306)
                0.078125 = fieldNorm(doc=833)
          0.14187855 = weight(abstract_txt:link in 833) [ClassicSimilarity], result of:
            0.14187855 = score(doc=833,freq=2.0), product of:
              0.22448245 = queryWeight, product of:
                2.1656914 = boost
                5.720439 = idf(docFreq=376, maxDocs=42306)
                0.018119927 = queryNorm
              0.6320251 = fieldWeight in 833, product of:
                1.4142135 = tf(freq=2.0), with freq of:
                  2.0 = termFreq=2.0
                5.720439 = idf(docFreq=376, maxDocs=42306)
                0.078125 = fieldNorm(doc=833)
          0.061642848 = weight(abstract_txt:management in 833) [ClassicSimilarity], result of:
            0.061642848 = score(doc=833,freq=1.0), product of:
              0.18572345 = queryWeight, product of:
                2.4125948 = boost
                4.248405 = idf(docFreq=1642, maxDocs=42306)
                0.018119927 = queryNorm
              0.33190665 = fieldWeight in 833, product of:
                1.0 = tf(freq=1.0), with freq of:
                  1.0 = termFreq=1.0
                4.248405 = idf(docFreq=1642, maxDocs=42306)
                0.078125 = fieldNorm(doc=833)
        0.16 = coord(4/25)
    
  5. Perugini, S.: Symbolic links in the Open Directory Project (2008) 0.06
    0.06018208 = sum of:
      0.06018208 = product of:
        0.376138 = sum of:
          0.038526755 = weight(abstract_txt:structural in 4071) [ClassicSimilarity], result of:
            0.038526755 = score(doc=4071,freq=1.0), product of:
              0.1194027 = queryWeight, product of:
                1.1168567 = boost
                5.9001117 = idf(docFreq=314, maxDocs=42306)
                0.018119927 = queryNorm
              0.32266235 = fieldWeight in 4071, product of:
                1.0 = tf(freq=1.0), with freq of:
                  1.0 = termFreq=1.0
                5.9001117 = idf(docFreq=314, maxDocs=42306)
                0.0546875 = fieldNorm(doc=4071)
          0.04485534 = weight(abstract_txt:open in 4071) [ClassicSimilarity], result of:
            0.04485534 = score(doc=4071,freq=1.0), product of:
              0.16649146 = queryWeight, product of:
                1.8650968 = boost
                4.9264507 = idf(docFreq=833, maxDocs=42306)
                0.018119927 = queryNorm
              0.26941526 = fieldWeight in 4071, product of:
                1.0 = tf(freq=1.0), with freq of:
                  1.0 = termFreq=1.0
                4.9264507 = idf(docFreq=833, maxDocs=42306)
                0.0546875 = fieldNorm(doc=4071)
          0.19344091 = weight(abstract_txt:links in 4071) [ClassicSimilarity], result of:
            0.19344091 = score(doc=4071,freq=13.0), product of:
              0.18760034 = queryWeight, product of:
                1.9798039 = boost
                5.2294374 = idf(docFreq=615, maxDocs=42306)
                0.018119927 = queryNorm
              1.031133 = fieldWeight in 4071, product of:
                3.6055512 = tf(freq=13.0), with freq of:
                  13.0 = termFreq=13.0
                5.2294374 = idf(docFreq=615, maxDocs=42306)
                0.0546875 = fieldNorm(doc=4071)
          0.09931499 = weight(abstract_txt:link in 4071) [ClassicSimilarity], result of:
            0.09931499 = score(doc=4071,freq=2.0), product of:
              0.22448245 = queryWeight, product of:
                2.1656914 = boost
                5.720439 = idf(docFreq=376, maxDocs=42306)
                0.018119927 = queryNorm
              0.44241762 = fieldWeight in 4071, product of:
                1.4142135 = tf(freq=2.0), with freq of:
                  2.0 = termFreq=2.0
                5.720439 = idf(docFreq=376, maxDocs=42306)
                0.0546875 = fieldNorm(doc=4071)
        0.16 = coord(4/25)