Document (#18153)

Author
Thistlewaite, P.
Title
Automatic construction and management of large open webs
Source
Information processing and management. 33(1997) no.2, S.161-173
Year
1997
Abstract
Reviews the problems associated with manually created or maintained hyperdocument links, and the consequent need for automated methods. A number of techniques have been applied to the problem, including pattern-matching, information retrieval, and natural language processing. Describes a system for the automatic detection and management of structural and referential links. Addresses the issues of link-set soundness and completeness, open link management, and the particular problem engendered by large volatile hyperbases.
Footnote
Contribution to a special issue on methods and tools for the automatic construction of hypertext

Similar documents (content)

  1. Salton, G.: Automatic text structuring and summarization (1997) 0.08
    0.08330887 = sum of:
      0.08330887 = product of:
        0.5206804 = sum of:
          0.07857769 = weight(abstract_txt:pattern in 1146) [ClassicSimilarity], result of:
            0.07857769 = score(doc=1146,freq=1.0), product of:
              0.13407922 = queryWeight, product of:
                1.1859754 = boost
                6.2512445 = idf(docFreq=223, maxDocs=42740)
                0.018085033 = queryNorm
              0.5860542 = fieldWeight in 1146, product of:
                1.0 = tf(freq=1.0), with freq of:
                  1.0 = termFreq=1.0
                6.2512445 = idf(docFreq=223, maxDocs=42740)
                0.09375 = fieldNorm(doc=1146)
          0.1808985 = weight(abstract_txt:automatic in 1146) [ClassicSimilarity], result of:
            0.1808985 = score(doc=1146,freq=4.0), product of:
              0.18554188 = queryWeight, product of:
                1.9730175 = boost
                5.199861 = idf(docFreq=640, maxDocs=42740)
                0.018085033 = queryNorm
              0.9749739 = fieldWeight in 1146, product of:
                2.0 = tf(freq=4.0), with freq of:
                  4.0 = termFreq=4.0
                5.199861 = idf(docFreq=640, maxDocs=42740)
                0.09375 = fieldNorm(doc=1146)
          0.09185918 = weight(abstract_txt:links in 1146) [ClassicSimilarity], result of:
            0.09185918 = score(doc=1146,freq=1.0), product of:
              0.18746506 = queryWeight, product of:
                1.9832164 = boost
                5.2267404 = idf(docFreq=623, maxDocs=42740)
                0.018085033 = queryNorm
              0.49000692 = fieldWeight in 1146, product of:
                1.0 = tf(freq=1.0), with freq of:
                  1.0 = termFreq=1.0
                5.2267404 = idf(docFreq=623, maxDocs=42740)
                0.09375 = fieldNorm(doc=1146)
          0.16934507 = weight(abstract_txt:link in 1146) [ClassicSimilarity], result of:
            0.16934507 = score(doc=1146,freq=2.0), product of:
              0.22370568 = queryWeight, product of:
                2.1664488 = boost
                5.709647 = idf(docFreq=384, maxDocs=42740)
                0.018085033 = queryNorm
              0.7569994 = fieldWeight in 1146, product of:
                1.4142135 = tf(freq=2.0), with freq of:
                  2.0 = termFreq=2.0
                5.709647 = idf(docFreq=384, maxDocs=42740)
                0.09375 = fieldNorm(doc=1146)
        0.16 = coord(4/25)
    
  2. Sood, S.O.; Churchill, E.F.; Antin, J.: Automatic identification of personal insults on social news sites (2012) 0.07
    0.06797154 = sum of:
      0.06797154 = product of:
        0.3398577 = sum of:
          0.038069505 = weight(abstract_txt:automated in 1977) [ClassicSimilarity], result of:
            0.038069505 = score(doc=1977,freq=1.0), product of:
              0.10837796 = queryWeight, product of:
                1.0662657 = boost
                5.620258 = idf(docFreq=420, maxDocs=42740)
                0.018085033 = queryNorm
              0.35126612 = fieldWeight in 1977, product of:
                1.0 = tf(freq=1.0), with freq of:
                  1.0 = termFreq=1.0
                5.620258 = idf(docFreq=420, maxDocs=42740)
                0.0625 = fieldNorm(doc=1977)
          0.11816373 = weight(abstract_txt:detection in 1977) [ClassicSimilarity], result of:
            0.11816373 = score(doc=1977,freq=3.0), product of:
              0.15989634 = queryWeight, product of:
                1.2951325 = boost
                6.8266087 = idf(docFreq=125, maxDocs=42740)
                0.018085033 = queryNorm
              0.73900205 = fieldWeight in 1977, product of:
                1.7320508 = tf(freq=3.0), with freq of:
                  3.0 = termFreq=3.0
                6.8266087 = idf(docFreq=125, maxDocs=42740)
                0.0625 = fieldNorm(doc=1977)
          0.037997764 = weight(abstract_txt:problem in 1977) [ClassicSimilarity], result of:
            0.037997764 = score(doc=1977,freq=1.0), product of:
              0.13637607 = queryWeight, product of:
                1.6915274 = boost
                4.457998 = idf(docFreq=1345, maxDocs=42740)
                0.018085033 = queryNorm
              0.27862486 = fieldWeight in 1977, product of:
                1.0 = tf(freq=1.0), with freq of:
                  1.0 = termFreq=1.0
                4.457998 = idf(docFreq=1345, maxDocs=42740)
                0.0625 = fieldNorm(doc=1977)
          0.0602995 = weight(abstract_txt:automatic in 1977) [ClassicSimilarity], result of:
            0.0602995 = score(doc=1977,freq=1.0), product of:
              0.18554188 = queryWeight, product of:
                1.9730175 = boost
                5.199861 = idf(docFreq=640, maxDocs=42740)
                0.018085033 = queryNorm
              0.32499132 = fieldWeight in 1977, product of:
                1.0 = tf(freq=1.0), with freq of:
                  1.0 = termFreq=1.0
                5.199861 = idf(docFreq=640, maxDocs=42740)
                0.0625 = fieldNorm(doc=1977)
          0.08532719 = weight(abstract_txt:management in 1977) [ClassicSimilarity], result of:
            0.08532719 = score(doc=1977,freq=3.0), product of:
              0.1856156 = queryWeight, product of:
                2.416923 = boost
                4.246512 = idf(docFreq=1662, maxDocs=42740)
                0.018085033 = queryNorm
              0.45969838 = fieldWeight in 1977, product of:
                1.7320508 = tf(freq=3.0), with freq of:
                  3.0 = termFreq=3.0
                4.246512 = idf(docFreq=1662, maxDocs=42740)
                0.0625 = fieldNorm(doc=1977)
        0.2 = coord(5/25)
    
  3. May, A.D.: Automatic classification of e-mail messages by message type (1997) 0.06
    0.06261684 = sum of:
      0.06261684 = product of:
        0.39135528 = sum of:
          0.057104256 = weight(abstract_txt:automated in 6562) [ClassicSimilarity], result of:
            0.057104256 = score(doc=6562,freq=1.0), product of:
              0.10837796 = queryWeight, product of:
                1.0662657 = boost
                5.620258 = idf(docFreq=420, maxDocs=42740)
                0.018085033 = queryNorm
              0.52689916 = fieldWeight in 6562, product of:
                1.0 = tf(freq=1.0), with freq of:
                  1.0 = termFreq=1.0
                5.620258 = idf(docFreq=420, maxDocs=42740)
                0.09375 = fieldNorm(doc=6562)
          0.071611635 = weight(abstract_txt:matching in 6562) [ClassicSimilarity], result of:
            0.071611635 = score(doc=6562,freq=1.0), product of:
              0.12603302 = queryWeight, product of:
                1.1498393 = boost
                6.060772 = idf(docFreq=270, maxDocs=42740)
                0.018085033 = queryNorm
              0.56819737 = fieldWeight in 6562, product of:
                1.0 = tf(freq=1.0), with freq of:
                  1.0 = termFreq=1.0
                6.060772 = idf(docFreq=270, maxDocs=42740)
                0.09375 = fieldNorm(doc=6562)
          0.13472486 = weight(abstract_txt:manually in 6562) [ClassicSimilarity], result of:
            0.13472486 = score(doc=6562,freq=2.0), product of:
              0.15244639 = queryWeight, product of:
                1.264601 = boost
                6.665678 = idf(docFreq=147, maxDocs=42740)
                0.018085033 = queryNorm
              0.88375235 = fieldWeight in 6562, product of:
                1.4142135 = tf(freq=2.0), with freq of:
                  2.0 = termFreq=2.0
                6.665678 = idf(docFreq=147, maxDocs=42740)
                0.09375 = fieldNorm(doc=6562)
          0.12791456 = weight(abstract_txt:automatic in 6562) [ClassicSimilarity], result of:
            0.12791456 = score(doc=6562,freq=2.0), product of:
              0.18554188 = queryWeight, product of:
                1.9730175 = boost
                5.199861 = idf(docFreq=640, maxDocs=42740)
                0.018085033 = queryNorm
              0.6894107 = fieldWeight in 6562, product of:
                1.4142135 = tf(freq=2.0), with freq of:
                  2.0 = termFreq=2.0
                5.199861 = idf(docFreq=640, maxDocs=42740)
                0.09375 = fieldNorm(doc=6562)
        0.16 = coord(4/25)
    
  4. Maurer, H.: Object-oriented modelling of hyperstructure : overcoming the static link deficiency (1994) 0.06
    0.06129919 = sum of:
      0.06129919 = product of:
        0.38311994 = sum of:
          0.0478322 = weight(abstract_txt:large in 833) [ClassicSimilarity], result of:
            0.0478322 = score(doc=833,freq=1.0), product of:
              0.13701655 = queryWeight, product of:
                1.6954948 = boost
                4.468454 = idf(docFreq=1331, maxDocs=42740)
                0.018085033 = queryNorm
              0.34909797 = fieldWeight in 833, product of:
                1.0 = tf(freq=1.0), with freq of:
                  1.0 = termFreq=1.0
                4.468454 = idf(docFreq=1331, maxDocs=42740)
                0.078125 = fieldNorm(doc=833)
          0.13258728 = weight(abstract_txt:links in 833) [ClassicSimilarity], result of:
            0.13258728 = score(doc=833,freq=3.0), product of:
              0.18746506 = queryWeight, product of:
                1.9832164 = boost
                5.2267404 = idf(docFreq=623, maxDocs=42740)
                0.018085033 = queryNorm
              0.707264 = fieldWeight in 833, product of:
                1.7320508 = tf(freq=3.0), with freq of:
                  3.0 = termFreq=3.0
                5.2267404 = idf(docFreq=623, maxDocs=42740)
                0.078125 = fieldNorm(doc=833)
          0.1411209 = weight(abstract_txt:link in 833) [ClassicSimilarity], result of:
            0.1411209 = score(doc=833,freq=2.0), product of:
              0.22370568 = queryWeight, product of:
                2.1664488 = boost
                5.709647 = idf(docFreq=384, maxDocs=42740)
                0.018085033 = queryNorm
              0.63083285 = fieldWeight in 833, product of:
                1.4142135 = tf(freq=2.0), with freq of:
                  2.0 = termFreq=2.0
                5.709647 = idf(docFreq=384, maxDocs=42740)
                0.078125 = fieldNorm(doc=833)
          0.061579596 = weight(abstract_txt:management in 833) [ClassicSimilarity], result of:
            0.061579596 = score(doc=833,freq=1.0), product of:
              0.1856156 = queryWeight, product of:
                2.416923 = boost
                4.246512 = idf(docFreq=1662, maxDocs=42740)
                0.018085033 = queryNorm
              0.33175874 = fieldWeight in 833, product of:
                1.0 = tf(freq=1.0), with freq of:
                  1.0 = termFreq=1.0
                4.246512 = idf(docFreq=1662, maxDocs=42740)
                0.078125 = fieldNorm(doc=833)
        0.16 = coord(4/25)
    
  5. ¬The Fourth Text Retrieval Conference (TREC-4) (1996) 0.06
    0.060071666 = sum of:
      0.060071666 = product of:
        0.37544793 = sum of:
          0.08354691 = weight(abstract_txt:matching in 591) [ClassicSimilarity], result of:
            0.08354691 = score(doc=591,freq=1.0), product of:
              0.12603302 = queryWeight, product of:
                1.1498393 = boost
                6.060772 = idf(docFreq=270, maxDocs=42740)
                0.018085033 = queryNorm
              0.66289693 = fieldWeight in 591, product of:
                1.0 = tf(freq=1.0), with freq of:
                  1.0 = termFreq=1.0
                6.060772 = idf(docFreq=270, maxDocs=42740)
                0.109375 = fieldNorm(doc=591)
          0.09167397 = weight(abstract_txt:pattern in 591) [ClassicSimilarity], result of:
            0.09167397 = score(doc=591,freq=1.0), product of:
              0.13407922 = queryWeight, product of:
                1.1859754 = boost
                6.2512445 = idf(docFreq=223, maxDocs=42740)
                0.018085033 = queryNorm
              0.6837299 = fieldWeight in 591, product of:
                1.0 = tf(freq=1.0), with freq of:
                  1.0 = termFreq=1.0
                6.2512445 = idf(docFreq=223, maxDocs=42740)
                0.109375 = fieldNorm(doc=591)
          0.094702914 = weight(abstract_txt:large in 591) [ClassicSimilarity], result of:
            0.094702914 = score(doc=591,freq=2.0), product of:
              0.13701655 = queryWeight, product of:
                1.6954948 = boost
                4.468454 = idf(docFreq=1331, maxDocs=42740)
                0.018085033 = queryNorm
              0.6911787 = fieldWeight in 591, product of:
                1.4142135 = tf(freq=2.0), with freq of:
                  2.0 = termFreq=2.0
                4.468454 = idf(docFreq=1331, maxDocs=42740)
                0.109375 = fieldNorm(doc=591)
          0.10552413 = weight(abstract_txt:automatic in 591) [ClassicSimilarity], result of:
            0.10552413 = score(doc=591,freq=1.0), product of:
              0.18554188 = queryWeight, product of:
                1.9730175 = boost
                5.199861 = idf(docFreq=640, maxDocs=42740)
                0.018085033 = queryNorm
              0.5687348 = fieldWeight in 591, product of:
                1.0 = tf(freq=1.0), with freq of:
                  1.0 = termFreq=1.0
                5.199861 = idf(docFreq=640, maxDocs=42740)
                0.109375 = fieldNorm(doc=591)
        0.16 = coord(4/25)