Document (#19951)

Author
Salton, G.
Allan, J.
Buckley, C.
Singhal, A.
Title
Automatic analysis, theme generation, and summarization of machine readable texts
Source
Science. 264(1994), S.1421-1426
Year
1994
Footnote
Wiederabgedruckt in: Readings in information retrieval. Ed.: K. Sparck Jones u. P. Willett. San Francisco: Morgan Kaufmann 1997. S.478-483.
Theme
Automatisches Indexieren
Automatisches Abstracting

Similar documents (author)

  1. Salton, G.; Allan, J.; Singhal, A.: Automatic text decomposition and structuring (1996) 3.73
    3.7304034 = sum of:
      3.7304034 = product of:
        4.973871 = sum of:
          1.13855 = weight(author_txt:salton in 4136) [ClassicSimilarity], result of:
            1.13855 = score(doc=4136,freq=1.0), product of:
              0.39171532 = queryWeight, product of:
                7.7508674 = idf(docFreq=49, maxDocs=42740)
                0.050538257 = queryNorm
              2.9065752 = fieldWeight in 4136, product of:
                1.0 = tf(freq=1.0), with freq of:
                  1.0 = termFreq=1.0
                7.7508674 = idf(docFreq=49, maxDocs=42740)
                0.375 = fieldNorm(doc=4136)
          1.6832002 = weight(author_txt:allan in 4136) [ClassicSimilarity], result of:
            1.6832002 = score(doc=4136,freq=1.0), product of:
              0.5083463 = queryWeight, product of:
                1.1391858 = boost
                8.829678 = idf(docFreq=16, maxDocs=42740)
                0.050538257 = queryNorm
              3.311129 = fieldWeight in 4136, product of:
                1.0 = tf(freq=1.0), with freq of:
                  1.0 = termFreq=1.0
                8.829678 = idf(docFreq=16, maxDocs=42740)
                0.375 = fieldNorm(doc=4136)
          2.1521213 = weight(author_txt:singhal in 4136) [ClassicSimilarity], result of:
            2.1521213 = score(doc=4136,freq=1.0), product of:
              0.59884393 = queryWeight, product of:
                1.2364358 = boost
                9.583449 = idf(docFreq=7, maxDocs=42740)
                0.050538257 = queryNorm
              3.5937934 = fieldWeight in 4136, product of:
                1.0 = tf(freq=1.0), with freq of:
                  1.0 = termFreq=1.0
                9.583449 = idf(docFreq=7, maxDocs=42740)
                0.375 = fieldNorm(doc=4136)
        0.75 = coord(3/4)
    
  2. Salton, G.; Buckley, C.; Allan, J.: Automatic structuring of text files (1992) 3.27
    3.271323 = sum of:
      3.271323 = product of:
        4.361764 = sum of:
          1.13855 = weight(author_txt:salton in 6507) [ClassicSimilarity], result of:
            1.13855 = score(doc=6507,freq=1.0), product of:
              0.39171532 = queryWeight, product of:
                7.7508674 = idf(docFreq=49, maxDocs=42740)
                0.050538257 = queryNorm
              2.9065752 = fieldWeight in 6507, product of:
                1.0 = tf(freq=1.0), with freq of:
                  1.0 = termFreq=1.0
                7.7508674 = idf(docFreq=49, maxDocs=42740)
                0.375 = fieldNorm(doc=6507)
          1.5400137 = weight(author_txt:buckley in 6507) [ClassicSimilarity], result of:
            1.5400137 = score(doc=6507,freq=1.0), product of:
              0.47909194 = queryWeight, product of:
                1.1059211 = boost
                8.571848 = idf(docFreq=21, maxDocs=42740)
                0.050538257 = queryNorm
              3.214443 = fieldWeight in 6507, product of:
                1.0 = tf(freq=1.0), with freq of:
                  1.0 = termFreq=1.0
                8.571848 = idf(docFreq=21, maxDocs=42740)
                0.375 = fieldNorm(doc=6507)
          1.6832002 = weight(author_txt:allan in 6507) [ClassicSimilarity], result of:
            1.6832002 = score(doc=6507,freq=1.0), product of:
              0.5083463 = queryWeight, product of:
                1.1391858 = boost
                8.829678 = idf(docFreq=16, maxDocs=42740)
                0.050538257 = queryNorm
              3.311129 = fieldWeight in 6507, product of:
                1.0 = tf(freq=1.0), with freq of:
                  1.0 = termFreq=1.0
                8.829678 = idf(docFreq=16, maxDocs=42740)
                0.375 = fieldNorm(doc=6507)
        0.75 = coord(3/4)
    
  3. Buckley, C.; Allan, J.; Salton, G.: Automatic routing and retrieval using Smart : TREC-2 (1995) 3.27
    3.271323 = sum of:
      3.271323 = product of:
        4.361764 = sum of:
          1.13855 = weight(author_txt:salton in 615) [ClassicSimilarity], result of:
            1.13855 = score(doc=615,freq=1.0), product of:
              0.39171532 = queryWeight, product of:
                7.7508674 = idf(docFreq=49, maxDocs=42740)
                0.050538257 = queryNorm
              2.9065752 = fieldWeight in 615, product of:
                1.0 = tf(freq=1.0), with freq of:
                  1.0 = termFreq=1.0
                7.7508674 = idf(docFreq=49, maxDocs=42740)
                0.375 = fieldNorm(doc=615)
          1.5400137 = weight(author_txt:buckley in 615) [ClassicSimilarity], result of:
            1.5400137 = score(doc=615,freq=1.0), product of:
              0.47909194 = queryWeight, product of:
                1.1059211 = boost
                8.571848 = idf(docFreq=21, maxDocs=42740)
                0.050538257 = queryNorm
              3.214443 = fieldWeight in 615, product of:
                1.0 = tf(freq=1.0), with freq of:
                  1.0 = termFreq=1.0
                8.571848 = idf(docFreq=21, maxDocs=42740)
                0.375 = fieldNorm(doc=615)
          1.6832002 = weight(author_txt:allan in 615) [ClassicSimilarity], result of:
            1.6832002 = score(doc=615,freq=1.0), product of:
              0.5083463 = queryWeight, product of:
                1.1391858 = boost
                8.829678 = idf(docFreq=16, maxDocs=42740)
                0.050538257 = queryNorm
              3.311129 = fieldWeight in 615, product of:
                1.0 = tf(freq=1.0), with freq of:
                  1.0 = termFreq=1.0
                8.829678 = idf(docFreq=16, maxDocs=42740)
                0.375 = fieldNorm(doc=615)
        0.75 = coord(3/4)
    
  4. Salton, G.; Allen, J.; Buckley, C.; Singhal, A.: Automatic analysis, theme generation, and summarization of machine-readable data (1994) 3.02
    3.0191782 = sum of:
      3.0191782 = product of:
        4.025571 = sum of:
          0.94879174 = weight(author_txt:salton in 1237) [ClassicSimilarity], result of:
            0.94879174 = score(doc=1237,freq=1.0), product of:
              0.39171532 = queryWeight, product of:
                7.7508674 = idf(docFreq=49, maxDocs=42740)
                0.050538257 = queryNorm
              2.422146 = fieldWeight in 1237, product of:
                1.0 = tf(freq=1.0), with freq of:
                  1.0 = termFreq=1.0
                7.7508674 = idf(docFreq=49, maxDocs=42740)
                0.3125 = fieldNorm(doc=1237)
          1.2833447 = weight(author_txt:buckley in 1237) [ClassicSimilarity], result of:
            1.2833447 = score(doc=1237,freq=1.0), product of:
              0.47909194 = queryWeight, product of:
                1.1059211 = boost
                8.571848 = idf(docFreq=21, maxDocs=42740)
                0.050538257 = queryNorm
              2.6787024 = fieldWeight in 1237, product of:
                1.0 = tf(freq=1.0), with freq of:
                  1.0 = termFreq=1.0
                8.571848 = idf(docFreq=21, maxDocs=42740)
                0.3125 = fieldNorm(doc=1237)
          1.7934346 = weight(author_txt:singhal in 1237) [ClassicSimilarity], result of:
            1.7934346 = score(doc=1237,freq=1.0), product of:
              0.59884393 = queryWeight, product of:
                1.2364358 = boost
                9.583449 = idf(docFreq=7, maxDocs=42740)
                0.050538257 = queryNorm
              2.994828 = fieldWeight in 1237, product of:
                1.0 = tf(freq=1.0), with freq of:
                  1.0 = termFreq=1.0
                9.583449 = idf(docFreq=7, maxDocs=42740)
                0.3125 = fieldNorm(doc=1237)
        0.75 = coord(3/4)
    
  5. Buckley, C.; Singhal, A.; Mitra, M.; Salton, G.: New retrieval approaches using SMART : TREC 4 (1996) 3.02
    3.0191782 = sum of:
      3.0191782 = product of:
        4.025571 = sum of:
          0.94879174 = weight(author_txt:salton in 598) [ClassicSimilarity], result of:
            0.94879174 = score(doc=598,freq=1.0), product of:
              0.39171532 = queryWeight, product of:
                7.7508674 = idf(docFreq=49, maxDocs=42740)
                0.050538257 = queryNorm
              2.422146 = fieldWeight in 598, product of:
                1.0 = tf(freq=1.0), with freq of:
                  1.0 = termFreq=1.0
                7.7508674 = idf(docFreq=49, maxDocs=42740)
                0.3125 = fieldNorm(doc=598)
          1.2833447 = weight(author_txt:buckley in 598) [ClassicSimilarity], result of:
            1.2833447 = score(doc=598,freq=1.0), product of:
              0.47909194 = queryWeight, product of:
                1.1059211 = boost
                8.571848 = idf(docFreq=21, maxDocs=42740)
                0.050538257 = queryNorm
              2.6787024 = fieldWeight in 598, product of:
                1.0 = tf(freq=1.0), with freq of:
                  1.0 = termFreq=1.0
                8.571848 = idf(docFreq=21, maxDocs=42740)
                0.3125 = fieldNorm(doc=598)
          1.7934346 = weight(author_txt:singhal in 598) [ClassicSimilarity], result of:
            1.7934346 = score(doc=598,freq=1.0), product of:
              0.59884393 = queryWeight, product of:
                1.2364358 = boost
                9.583449 = idf(docFreq=7, maxDocs=42740)
                0.050538257 = queryNorm
              2.994828 = fieldWeight in 598, product of:
                1.0 = tf(freq=1.0), with freq of:
                  1.0 = termFreq=1.0
                9.583449 = idf(docFreq=7, maxDocs=42740)
                0.3125 = fieldNorm(doc=598)
        0.75 = coord(3/4)
    

Similar documents (content)

  1. Coombs, J.H.; Renear, A.H.; DeRose, S.J.: Markup systems and the future of scholarly text processing (1987) 0.70
    0.70361304 = sum of:
      0.70361304 = product of:
        1.4072261 = sum of:
          0.10819948 = weight(abstract_txt:analysis in 1594) [ClassicSimilarity], result of:
            0.10819948 = score(doc=1594,freq=1.0), product of:
              0.13410473 = queryWeight, product of:
                3.6883576 = idf(docFreq=2905, maxDocs=42740)
                0.03635893 = queryNorm
              0.8068282 = fieldWeight in 1594, product of:
                1.0 = tf(freq=1.0), with freq of:
                  1.0 = termFreq=1.0
                3.6883576 = idf(docFreq=2905, maxDocs=42740)
                0.21875 = fieldNorm(doc=1594)
          0.3280889 = weight(abstract_txt:machine in 1594) [ClassicSimilarity], result of:
            0.3280889 = score(doc=1594,freq=1.0), product of:
              0.28094524 = queryWeight, product of:
                1.4474007 = boost
                5.3385315 = idf(docFreq=557, maxDocs=42740)
                0.03635893 = queryNorm
              1.1678038 = fieldWeight in 1594, product of:
                1.0 = tf(freq=1.0), with freq of:
                  1.0 = termFreq=1.0
                5.3385315 = idf(docFreq=557, maxDocs=42740)
                0.21875 = fieldNorm(doc=1594)
          0.3928522 = weight(abstract_txt:texts in 1594) [ClassicSimilarity], result of:
            0.3928522 = score(doc=1594,freq=1.0), product of:
              0.3167963 = queryWeight, product of:
                1.5369792 = boost
                5.668929 = idf(docFreq=400, maxDocs=42740)
                0.03635893 = queryNorm
              1.2400782 = fieldWeight in 1594, product of:
                1.0 = tf(freq=1.0), with freq of:
                  1.0 = termFreq=1.0
                5.668929 = idf(docFreq=400, maxDocs=42740)
                0.21875 = fieldNorm(doc=1594)
          0.5780855 = weight(abstract_txt:readable in 1594) [ClassicSimilarity], result of:
            0.5780855 = score(doc=1594,freq=1.0), product of:
              0.40984726 = queryWeight, product of:
                1.7481914 = boost
                6.4479547 = idf(docFreq=183, maxDocs=42740)
                0.03635893 = queryNorm
              1.41049 = fieldWeight in 1594, product of:
                1.0 = tf(freq=1.0), with freq of:
                  1.0 = termFreq=1.0
                6.4479547 = idf(docFreq=183, maxDocs=42740)
                0.21875 = fieldNorm(doc=1594)
        0.5 = coord(4/8)
    
  2. Smeaton, A.F.: Progress in the application of natural language processing to information retrieval tasks (1992) 0.52
    0.51518464 = sum of:
      0.51518464 = product of:
        1.3738258 = sum of:
          0.36751035 = weight(abstract_txt:automatic in 7080) [ClassicSimilarity], result of:
            0.36751035 = score(doc=7080,freq=2.0), product of:
              0.26653948 = queryWeight, product of:
                1.409804 = boost
                5.199861 = idf(docFreq=640, maxDocs=42740)
                0.03635893 = queryNorm
              1.3788214 = fieldWeight in 7080, product of:
                1.4142135 = tf(freq=2.0), with freq of:
                  2.0 = termFreq=2.0
                5.199861 = idf(docFreq=640, maxDocs=42740)
                0.1875 = fieldNorm(doc=7080)
          0.33322263 = weight(abstract_txt:generation in 7080) [ClassicSimilarity], result of:
            0.33322263 = score(doc=7080,freq=1.0), product of:
              0.31459236 = queryWeight, product of:
                1.5316235 = boost
                5.649175 = idf(docFreq=408, maxDocs=42740)
                0.03635893 = queryNorm
              1.0592203 = fieldWeight in 7080, product of:
                1.0 = tf(freq=1.0), with freq of:
                  1.0 = termFreq=1.0
                5.649175 = idf(docFreq=408, maxDocs=42740)
                0.1875 = fieldNorm(doc=7080)
          0.6730929 = weight(abstract_txt:summarization in 7080) [ClassicSimilarity], result of:
            0.6730929 = score(doc=7080,freq=1.0), product of:
              0.50269955 = queryWeight, product of:
                1.9361197 = boost
                7.141102 = idf(docFreq=91, maxDocs=42740)
                0.03635893 = queryNorm
              1.3389566 = fieldWeight in 7080, product of:
                1.0 = tf(freq=1.0), with freq of:
                  1.0 = termFreq=1.0
                7.141102 = idf(docFreq=91, maxDocs=42740)
                0.1875 = fieldNorm(doc=7080)
        0.375 = coord(3/8)
    
  3. Sabourin, C.F. (Bearb.): Computational lexicology and lexicography : bibliography (1994) 0.50
    0.50111914 = sum of:
      0.50111914 = product of:
        1.0022383 = sum of:
          0.07728534 = weight(abstract_txt:analysis in 871) [ClassicSimilarity], result of:
            0.07728534 = score(doc=871,freq=1.0), product of:
              0.13410473 = queryWeight, product of:
                3.6883576 = idf(docFreq=2905, maxDocs=42740)
                0.03635893 = queryNorm
              0.57630587 = fieldWeight in 871, product of:
                1.0 = tf(freq=1.0), with freq of:
                  1.0 = termFreq=1.0
                3.6883576 = idf(docFreq=2905, maxDocs=42740)
                0.15625 = fieldNorm(doc=871)
          0.23434922 = weight(abstract_txt:machine in 871) [ClassicSimilarity], result of:
            0.23434922 = score(doc=871,freq=1.0), product of:
              0.28094524 = queryWeight, product of:
                1.4474007 = boost
                5.3385315 = idf(docFreq=557, maxDocs=42740)
                0.03635893 = queryNorm
              0.83414555 = fieldWeight in 871, product of:
                1.0 = tf(freq=1.0), with freq of:
                  1.0 = termFreq=1.0
                5.3385315 = idf(docFreq=557, maxDocs=42740)
                0.15625 = fieldNorm(doc=871)
          0.27768552 = weight(abstract_txt:generation in 871) [ClassicSimilarity], result of:
            0.27768552 = score(doc=871,freq=1.0), product of:
              0.31459236 = queryWeight, product of:
                1.5316235 = boost
                5.649175 = idf(docFreq=408, maxDocs=42740)
                0.03635893 = queryNorm
              0.88268363 = fieldWeight in 871, product of:
                1.0 = tf(freq=1.0), with freq of:
                  1.0 = termFreq=1.0
                5.649175 = idf(docFreq=408, maxDocs=42740)
                0.15625 = fieldNorm(doc=871)
          0.4129182 = weight(abstract_txt:readable in 871) [ClassicSimilarity], result of:
            0.4129182 = score(doc=871,freq=1.0), product of:
              0.40984726 = queryWeight, product of:
                1.7481914 = boost
                6.4479547 = idf(docFreq=183, maxDocs=42740)
                0.03635893 = queryNorm
              1.0074929 = fieldWeight in 871, product of:
                1.0 = tf(freq=1.0), with freq of:
                  1.0 = termFreq=1.0
                6.4479547 = idf(docFreq=183, maxDocs=42740)
                0.15625 = fieldNorm(doc=871)
        0.5 = coord(4/8)
    
  4. Maybury, M.T.: Generating summaries from event data (1995) 0.47
    0.47415745 = sum of:
      0.47415745 = product of:
        0.9483149 = sum of:
          0.03864267 = weight(abstract_txt:analysis in 2418) [ClassicSimilarity], result of:
            0.03864267 = score(doc=2418,freq=1.0), product of:
              0.13410473 = queryWeight, product of:
                3.6883576 = idf(docFreq=2905, maxDocs=42740)
                0.03635893 = queryNorm
              0.28815293 = fieldWeight in 2418, product of:
                1.0 = tf(freq=1.0), with freq of:
                  1.0 = termFreq=1.0
                3.6883576 = idf(docFreq=2905, maxDocs=42740)
                0.078125 = fieldNorm(doc=2418)
          0.10827877 = weight(abstract_txt:automatic in 2418) [ClassicSimilarity], result of:
            0.10827877 = score(doc=2418,freq=1.0), product of:
              0.26653948 = queryWeight, product of:
                1.409804 = boost
                5.199861 = idf(docFreq=640, maxDocs=42740)
                0.03635893 = queryNorm
              0.40623915 = fieldWeight in 2418, product of:
                1.0 = tf(freq=1.0), with freq of:
                  1.0 = termFreq=1.0
                5.199861 = idf(docFreq=640, maxDocs=42740)
                0.078125 = fieldNorm(doc=2418)
          0.24048273 = weight(abstract_txt:generation in 2418) [ClassicSimilarity], result of:
            0.24048273 = score(doc=2418,freq=3.0), product of:
              0.31459236 = queryWeight, product of:
                1.5316235 = boost
                5.649175 = idf(docFreq=408, maxDocs=42740)
                0.03635893 = queryNorm
              0.76442647 = fieldWeight in 2418, product of:
                1.7320508 = tf(freq=3.0), with freq of:
                  3.0 = termFreq=3.0
                5.649175 = idf(docFreq=408, maxDocs=42740)
                0.078125 = fieldNorm(doc=2418)
          0.56091076 = weight(abstract_txt:summarization in 2418) [ClassicSimilarity], result of:
            0.56091076 = score(doc=2418,freq=4.0), product of:
              0.50269955 = queryWeight, product of:
                1.9361197 = boost
                7.141102 = idf(docFreq=91, maxDocs=42740)
                0.03635893 = queryNorm
              1.1157972 = fieldWeight in 2418, product of:
                2.0 = tf(freq=4.0), with freq of:
                  4.0 = termFreq=4.0
                7.141102 = idf(docFreq=91, maxDocs=42740)
                0.078125 = fieldNorm(doc=2418)
        0.5 = coord(4/8)
    
  5. Aker, A.; Gaizauskas, R.: Generating descriptive multi-document summaries of geo-located entities using entity type models (2015) 0.38
    0.37933463 = sum of:
      0.37933463 = product of:
        0.75866926 = sum of:
          0.08662302 = weight(abstract_txt:automatic in 3727) [ClassicSimilarity], result of:
            0.08662302 = score(doc=3727,freq=1.0), product of:
              0.26653948 = queryWeight, product of:
                1.409804 = boost
                5.199861 = idf(docFreq=640, maxDocs=42740)
                0.03635893 = queryNorm
              0.32499132 = fieldWeight in 3727, product of:
                1.0 = tf(freq=1.0), with freq of:
                  1.0 = termFreq=1.0
                5.199861 = idf(docFreq=640, maxDocs=42740)
                0.0625 = fieldNorm(doc=3727)
          0.11107421 = weight(abstract_txt:generation in 3727) [ClassicSimilarity], result of:
            0.11107421 = score(doc=3727,freq=1.0), product of:
              0.31459236 = queryWeight, product of:
                1.5316235 = boost
                5.649175 = idf(docFreq=408, maxDocs=42740)
                0.03635893 = queryNorm
              0.35307345 = fieldWeight in 3727, product of:
                1.0 = tf(freq=1.0), with freq of:
                  1.0 = termFreq=1.0
                5.649175 = idf(docFreq=408, maxDocs=42740)
                0.0625 = fieldNorm(doc=3727)
          0.11224349 = weight(abstract_txt:texts in 3727) [ClassicSimilarity], result of:
            0.11224349 = score(doc=3727,freq=1.0), product of:
              0.3167963 = queryWeight, product of:
                1.5369792 = boost
                5.668929 = idf(docFreq=400, maxDocs=42740)
                0.03635893 = queryNorm
              0.35430807 = fieldWeight in 3727, product of:
                1.0 = tf(freq=1.0), with freq of:
                  1.0 = termFreq=1.0
                5.668929 = idf(docFreq=400, maxDocs=42740)
                0.0625 = fieldNorm(doc=3727)
          0.4487286 = weight(abstract_txt:summarization in 3727) [ClassicSimilarity], result of:
            0.4487286 = score(doc=3727,freq=4.0), product of:
              0.50269955 = queryWeight, product of:
                1.9361197 = boost
                7.141102 = idf(docFreq=91, maxDocs=42740)
                0.03635893 = queryNorm
              0.8926377 = fieldWeight in 3727, product of:
                2.0 = tf(freq=4.0), with freq of:
                  4.0 = termFreq=4.0
                7.141102 = idf(docFreq=91, maxDocs=42740)
                0.0625 = fieldNorm(doc=3727)
        0.5 = coord(4/8)