Document (#19951)

Author
Salton, G.
Allan, J.
Buckley, C.
Singhal, A.
Title
Automatic analysis, theme generation, and summarization of machine readable texts
Source
Science. 264(1994), S.1421-1426
Year
1994
Footnote
Wiederabgedruckt in: Readings in information retrieval. Ed.: K. Sparck Jones u. P. Willett. San Francisco: Morgan Kaufmann 1997. S.478-483.
Theme
Automatisches Indexieren
Automatisches Abstracting

Similar documents (author)

  1. Salton, G.; Allan, J.; Singhal, A.: Automatic text decomposition and structuring (1996) 3.74
    3.735421 = sum of:
      3.735421 = product of:
        4.9805613 = sum of:
          1.1407354 = weight(author_txt:salton in 5136) [ClassicSimilarity], result of:
            1.1407354 = score(doc=5136,freq=1.0), product of:
              0.39186275 = queryWeight, product of:
                7.762822 = idf(docFreq=49, maxDocs=43254)
                0.05047942 = queryNorm
              2.9110584 = fieldWeight in 5136, product of:
                1.0 = tf(freq=1.0), with freq of:
                  1.0 = termFreq=1.0
                7.762822 = idf(docFreq=49, maxDocs=43254)
                0.375 = fieldNorm(doc=5136)
          1.6854787 = weight(author_txt:allan in 5136) [ClassicSimilarity], result of:
            1.6854787 = score(doc=5136,freq=1.0), product of:
              0.5083462 = queryWeight, product of:
                1.1389713 = boost
                8.841632 = idf(docFreq=16, maxDocs=43254)
                0.05047942 = queryNorm
              3.3156118 = fieldWeight in 5136, product of:
                1.0 = tf(freq=1.0), with freq of:
                  1.0 = termFreq=1.0
                8.841632 = idf(docFreq=16, maxDocs=43254)
                0.375 = fieldNorm(doc=5136)
          2.1543474 = weight(author_txt:singhal in 5136) [ClassicSimilarity], result of:
            2.1543474 = score(doc=5136,freq=1.0), product of:
              0.5987165 = queryWeight, product of:
                1.2360716 = boost
                9.595404 = idf(docFreq=7, maxDocs=43254)
                0.05047942 = queryNorm
              3.5982764 = fieldWeight in 5136, product of:
                1.0 = tf(freq=1.0), with freq of:
                  1.0 = termFreq=1.0
                9.595404 = idf(docFreq=7, maxDocs=43254)
                0.375 = fieldNorm(doc=5136)
        0.75 = coord(3/4)
    
  2. Salton, G.; Buckley, C.; Allan, J.: Automatic structuring of text files (1992) 3.28
    3.2763755 = sum of:
      3.2763755 = product of:
        4.3685007 = sum of:
          1.1407354 = weight(author_txt:salton in 6507) [ClassicSimilarity], result of:
            1.1407354 = score(doc=6507,freq=1.0), product of:
              0.39186275 = queryWeight, product of:
                7.762822 = idf(docFreq=49, maxDocs=43254)
                0.05047942 = queryNorm
              2.9110584 = fieldWeight in 6507, product of:
                1.0 = tf(freq=1.0), with freq of:
                  1.0 = termFreq=1.0
                7.762822 = idf(docFreq=49, maxDocs=43254)
                0.375 = fieldNorm(doc=6507)
          1.5422866 = weight(author_txt:buckley in 6507) [ClassicSimilarity], result of:
            1.5422866 = score(doc=6507,freq=1.0), product of:
              0.47913083 = queryWeight, product of:
                1.105758 = boost
                8.583802 = idf(docFreq=21, maxDocs=43254)
                0.05047942 = queryNorm
              3.218926 = fieldWeight in 6507, product of:
                1.0 = tf(freq=1.0), with freq of:
                  1.0 = termFreq=1.0
                8.583802 = idf(docFreq=21, maxDocs=43254)
                0.375 = fieldNorm(doc=6507)
          1.6854787 = weight(author_txt:allan in 6507) [ClassicSimilarity], result of:
            1.6854787 = score(doc=6507,freq=1.0), product of:
              0.5083462 = queryWeight, product of:
                1.1389713 = boost
                8.841632 = idf(docFreq=16, maxDocs=43254)
                0.05047942 = queryNorm
              3.3156118 = fieldWeight in 6507, product of:
                1.0 = tf(freq=1.0), with freq of:
                  1.0 = termFreq=1.0
                8.841632 = idf(docFreq=16, maxDocs=43254)
                0.375 = fieldNorm(doc=6507)
        0.75 = coord(3/4)
    
  3. Buckley, C.; Allan, J.; Salton, G.: Automatic routing and retrieval using Smart : TREC-2 (1995) 3.28
    3.2763755 = sum of:
      3.2763755 = product of:
        4.3685007 = sum of:
          1.1407354 = weight(author_txt:salton in 700) [ClassicSimilarity], result of:
            1.1407354 = score(doc=700,freq=1.0), product of:
              0.39186275 = queryWeight, product of:
                7.762822 = idf(docFreq=49, maxDocs=43254)
                0.05047942 = queryNorm
              2.9110584 = fieldWeight in 700, product of:
                1.0 = tf(freq=1.0), with freq of:
                  1.0 = termFreq=1.0
                7.762822 = idf(docFreq=49, maxDocs=43254)
                0.375 = fieldNorm(doc=700)
          1.5422866 = weight(author_txt:buckley in 700) [ClassicSimilarity], result of:
            1.5422866 = score(doc=700,freq=1.0), product of:
              0.47913083 = queryWeight, product of:
                1.105758 = boost
                8.583802 = idf(docFreq=21, maxDocs=43254)
                0.05047942 = queryNorm
              3.218926 = fieldWeight in 700, product of:
                1.0 = tf(freq=1.0), with freq of:
                  1.0 = termFreq=1.0
                8.583802 = idf(docFreq=21, maxDocs=43254)
                0.375 = fieldNorm(doc=700)
          1.6854787 = weight(author_txt:allan in 700) [ClassicSimilarity], result of:
            1.6854787 = score(doc=700,freq=1.0), product of:
              0.5083462 = queryWeight, product of:
                1.1389713 = boost
                8.841632 = idf(docFreq=16, maxDocs=43254)
                0.05047942 = queryNorm
              3.3156118 = fieldWeight in 700, product of:
                1.0 = tf(freq=1.0), with freq of:
                  1.0 = termFreq=1.0
                8.841632 = idf(docFreq=16, maxDocs=43254)
                0.375 = fieldNorm(doc=700)
        0.75 = coord(3/4)
    
  4. Salton, G.; Allen, J.; Buckley, C.; Singhal, A.: Automatic analysis, theme generation, and summarization of machine-readable data (1994) 3.02
    3.023356 = sum of:
      3.023356 = product of:
        4.0311413 = sum of:
          0.9506127 = weight(author_txt:salton in 2237) [ClassicSimilarity], result of:
            0.9506127 = score(doc=2237,freq=1.0), product of:
              0.39186275 = queryWeight, product of:
                7.762822 = idf(docFreq=49, maxDocs=43254)
                0.05047942 = queryNorm
              2.4258819 = fieldWeight in 2237, product of:
                1.0 = tf(freq=1.0), with freq of:
                  1.0 = termFreq=1.0
                7.762822 = idf(docFreq=49, maxDocs=43254)
                0.3125 = fieldNorm(doc=2237)
          1.2852389 = weight(author_txt:buckley in 2237) [ClassicSimilarity], result of:
            1.2852389 = score(doc=2237,freq=1.0), product of:
              0.47913083 = queryWeight, product of:
                1.105758 = boost
                8.583802 = idf(docFreq=21, maxDocs=43254)
                0.05047942 = queryNorm
              2.6824381 = fieldWeight in 2237, product of:
                1.0 = tf(freq=1.0), with freq of:
                  1.0 = termFreq=1.0
                8.583802 = idf(docFreq=21, maxDocs=43254)
                0.3125 = fieldNorm(doc=2237)
          1.7952896 = weight(author_txt:singhal in 2237) [ClassicSimilarity], result of:
            1.7952896 = score(doc=2237,freq=1.0), product of:
              0.5987165 = queryWeight, product of:
                1.2360716 = boost
                9.595404 = idf(docFreq=7, maxDocs=43254)
                0.05047942 = queryNorm
              2.9985638 = fieldWeight in 2237, product of:
                1.0 = tf(freq=1.0), with freq of:
                  1.0 = termFreq=1.0
                9.595404 = idf(docFreq=7, maxDocs=43254)
                0.3125 = fieldNorm(doc=2237)
        0.75 = coord(3/4)
    
  5. Buckley, C.; Singhal, A.; Mitra, M.; Salton, G.: New retrieval approaches using SMART : TREC 4 (1996) 3.02
    3.023356 = sum of:
      3.023356 = product of:
        4.0311413 = sum of:
          0.9506127 = weight(author_txt:salton in 598) [ClassicSimilarity], result of:
            0.9506127 = score(doc=598,freq=1.0), product of:
              0.39186275 = queryWeight, product of:
                7.762822 = idf(docFreq=49, maxDocs=43254)
                0.05047942 = queryNorm
              2.4258819 = fieldWeight in 598, product of:
                1.0 = tf(freq=1.0), with freq of:
                  1.0 = termFreq=1.0
                7.762822 = idf(docFreq=49, maxDocs=43254)
                0.3125 = fieldNorm(doc=598)
          1.2852389 = weight(author_txt:buckley in 598) [ClassicSimilarity], result of:
            1.2852389 = score(doc=598,freq=1.0), product of:
              0.47913083 = queryWeight, product of:
                1.105758 = boost
                8.583802 = idf(docFreq=21, maxDocs=43254)
                0.05047942 = queryNorm
              2.6824381 = fieldWeight in 598, product of:
                1.0 = tf(freq=1.0), with freq of:
                  1.0 = termFreq=1.0
                8.583802 = idf(docFreq=21, maxDocs=43254)
                0.3125 = fieldNorm(doc=598)
          1.7952896 = weight(author_txt:singhal in 598) [ClassicSimilarity], result of:
            1.7952896 = score(doc=598,freq=1.0), product of:
              0.5987165 = queryWeight, product of:
                1.2360716 = boost
                9.595404 = idf(docFreq=7, maxDocs=43254)
                0.05047942 = queryNorm
              2.9985638 = fieldWeight in 598, product of:
                1.0 = tf(freq=1.0), with freq of:
                  1.0 = termFreq=1.0
                9.595404 = idf(docFreq=7, maxDocs=43254)
                0.3125 = fieldNorm(doc=598)
        0.75 = coord(3/4)
    

Similar documents (content)

  1. Coombs, J.H.; Renear, A.H.; DeRose, S.J.: Markup systems and the future of scholarly text processing (1987) 0.70
    0.70121545 = sum of:
      0.70121545 = product of:
        1.4024309 = sum of:
          0.10702172 = weight(abstract_txt:analysis in 2594) [ClassicSimilarity], result of:
            0.10702172 = score(doc=2594,freq=1.0), product of:
              0.13318184 = queryWeight, product of:
                3.67349 = idf(docFreq=2984, maxDocs=43254)
                0.036254853 = queryNorm
              0.80357593 = fieldWeight in 2594, product of:
                1.0 = tf(freq=1.0), with freq of:
                  1.0 = termFreq=1.0
                3.67349 = idf(docFreq=2984, maxDocs=43254)
                0.21875 = fieldNorm(doc=2594)
          0.32515213 = weight(abstract_txt:machine in 2594) [ClassicSimilarity], result of:
            0.32515213 = score(doc=2594,freq=1.0), product of:
              0.27937537 = queryWeight, product of:
                1.4483434 = boost
                5.320475 = idf(docFreq=574, maxDocs=43254)
                0.036254853 = queryNorm
              1.1638539 = fieldWeight in 2594, product of:
                1.0 = tf(freq=1.0), with freq of:
                  1.0 = termFreq=1.0
                5.320475 = idf(docFreq=574, maxDocs=43254)
                0.21875 = fieldNorm(doc=2594)
          0.3911854 = weight(abstract_txt:texts in 2594) [ClassicSimilarity], result of:
            0.3911854 = score(doc=2594,freq=1.0), product of:
              0.31602308 = queryWeight, product of:
                1.540412 = boost
                5.658688 = idf(docFreq=409, maxDocs=43254)
                0.036254853 = queryNorm
              1.237838 = fieldWeight in 2594, product of:
                1.0 = tf(freq=1.0), with freq of:
                  1.0 = termFreq=1.0
                5.658688 = idf(docFreq=409, maxDocs=43254)
                0.21875 = fieldNorm(doc=2594)
          0.57907164 = weight(abstract_txt:readable in 2594) [ClassicSimilarity], result of:
            0.57907164 = score(doc=2594,freq=1.0), product of:
              0.41047361 = queryWeight, product of:
                1.7555779 = boost
                6.449098 = idf(docFreq=185, maxDocs=43254)
                0.036254853 = queryNorm
              1.4107403 = fieldWeight in 2594, product of:
                1.0 = tf(freq=1.0), with freq of:
                  1.0 = termFreq=1.0
                6.449098 = idf(docFreq=185, maxDocs=43254)
                0.21875 = fieldNorm(doc=2594)
        0.5 = coord(4/8)
    
  2. Smeaton, A.F.: Progress in the application of natural language processing to information retrieval tasks (1992) 0.51
    0.5148212 = sum of:
      0.5148212 = product of:
        1.3728564 = sum of:
          0.36719355 = weight(abstract_txt:automatic in 80) [ClassicSimilarity], result of:
            0.36719355 = score(doc=80,freq=2.0), product of:
              0.26649043 = queryWeight, product of:
                1.41455 = boost
                5.1963353 = idf(docFreq=650, maxDocs=43254)
                0.036254853 = queryNorm
              1.3778864 = fieldWeight in 80, product of:
                1.4142135 = tf(freq=2.0), with freq of:
                  2.0 = termFreq=2.0
                5.1963353 = idf(docFreq=650, maxDocs=43254)
                0.1875 = fieldNorm(doc=80)
          0.33145654 = weight(abstract_txt:generation in 80) [ClassicSimilarity], result of:
            0.33145654 = score(doc=80,freq=1.0), product of:
              0.31360236 = queryWeight, product of:
                1.534501 = boost
                5.636974 = idf(docFreq=418, maxDocs=43254)
                0.036254853 = queryNorm
              1.0569326 = fieldWeight in 80, product of:
                1.0 = tf(freq=1.0), with freq of:
                  1.0 = termFreq=1.0
                5.636974 = idf(docFreq=418, maxDocs=43254)
                0.1875 = fieldNorm(doc=80)
          0.6742063 = weight(abstract_txt:summarization in 80) [ClassicSimilarity], result of:
            0.6742063 = score(doc=80,freq=1.0), product of:
              0.5034505 = queryWeight, product of:
                1.9442669 = boost
                7.1422453 = idf(docFreq=92, maxDocs=43254)
                0.036254853 = queryNorm
              1.3391709 = fieldWeight in 80, product of:
                1.0 = tf(freq=1.0), with freq of:
                  1.0 = termFreq=1.0
                7.1422453 = idf(docFreq=92, maxDocs=43254)
                0.1875 = fieldNorm(doc=80)
        0.375 = coord(3/8)
    
  3. Sabourin, C.F. (Bearb.): Computational lexicology and lexicography : bibliography (1994) 0.50
    0.49926603 = sum of:
      0.49926603 = product of:
        0.99853206 = sum of:
          0.07644409 = weight(abstract_txt:analysis in 871) [ClassicSimilarity], result of:
            0.07644409 = score(doc=871,freq=1.0), product of:
              0.13318184 = queryWeight, product of:
                3.67349 = idf(docFreq=2984, maxDocs=43254)
                0.036254853 = queryNorm
              0.57398283 = fieldWeight in 871, product of:
                1.0 = tf(freq=1.0), with freq of:
                  1.0 = termFreq=1.0
                3.67349 = idf(docFreq=2984, maxDocs=43254)
                0.15625 = fieldNorm(doc=871)
          0.23225151 = weight(abstract_txt:machine in 871) [ClassicSimilarity], result of:
            0.23225151 = score(doc=871,freq=1.0), product of:
              0.27937537 = queryWeight, product of:
                1.4483434 = boost
                5.320475 = idf(docFreq=574, maxDocs=43254)
                0.036254853 = queryNorm
              0.8313242 = fieldWeight in 871, product of:
                1.0 = tf(freq=1.0), with freq of:
                  1.0 = termFreq=1.0
                5.320475 = idf(docFreq=574, maxDocs=43254)
                0.15625 = fieldNorm(doc=871)
          0.2762138 = weight(abstract_txt:generation in 871) [ClassicSimilarity], result of:
            0.2762138 = score(doc=871,freq=1.0), product of:
              0.31360236 = queryWeight, product of:
                1.534501 = boost
                5.636974 = idf(docFreq=418, maxDocs=43254)
                0.036254853 = queryNorm
              0.8807772 = fieldWeight in 871, product of:
                1.0 = tf(freq=1.0), with freq of:
                  1.0 = termFreq=1.0
                5.636974 = idf(docFreq=418, maxDocs=43254)
                0.15625 = fieldNorm(doc=871)
          0.4136226 = weight(abstract_txt:readable in 871) [ClassicSimilarity], result of:
            0.4136226 = score(doc=871,freq=1.0), product of:
              0.41047361 = queryWeight, product of:
                1.7555779 = boost
                6.449098 = idf(docFreq=185, maxDocs=43254)
                0.036254853 = queryNorm
              1.0076716 = fieldWeight in 871, product of:
                1.0 = tf(freq=1.0), with freq of:
                  1.0 = termFreq=1.0
                6.449098 = idf(docFreq=185, maxDocs=43254)
                0.15625 = fieldNorm(doc=871)
        0.5 = coord(4/8)
    
  4. Maybury, M.T.: Generating summaries from event data (1995) 0.47
    0.47372714 = sum of:
      0.47372714 = product of:
        0.9474543 = sum of:
          0.038222045 = weight(abstract_txt:analysis in 3418) [ClassicSimilarity], result of:
            0.038222045 = score(doc=3418,freq=1.0), product of:
              0.13318184 = queryWeight, product of:
                3.67349 = idf(docFreq=2984, maxDocs=43254)
                0.036254853 = queryNorm
              0.28699142 = fieldWeight in 3418, product of:
                1.0 = tf(freq=1.0), with freq of:
                  1.0 = termFreq=1.0
                3.67349 = idf(docFreq=2984, maxDocs=43254)
                0.078125 = fieldNorm(doc=3418)
          0.10818544 = weight(abstract_txt:automatic in 3418) [ClassicSimilarity], result of:
            0.10818544 = score(doc=3418,freq=1.0), product of:
              0.26649043 = queryWeight, product of:
                1.41455 = boost
                5.1963353 = idf(docFreq=650, maxDocs=43254)
                0.036254853 = queryNorm
              0.4059637 = fieldWeight in 3418, product of:
                1.0 = tf(freq=1.0), with freq of:
                  1.0 = termFreq=1.0
                5.1963353 = idf(docFreq=650, maxDocs=43254)
                0.078125 = fieldNorm(doc=3418)
          0.23920818 = weight(abstract_txt:generation in 3418) [ClassicSimilarity], result of:
            0.23920818 = score(doc=3418,freq=3.0), product of:
              0.31360236 = queryWeight, product of:
                1.534501 = boost
                5.636974 = idf(docFreq=418, maxDocs=43254)
                0.036254853 = queryNorm
              0.7627754 = fieldWeight in 3418, product of:
                1.7320508 = tf(freq=3.0), with freq of:
                  3.0 = termFreq=3.0
                5.636974 = idf(docFreq=418, maxDocs=43254)
                0.078125 = fieldNorm(doc=3418)
          0.5618386 = weight(abstract_txt:summarization in 3418) [ClassicSimilarity], result of:
            0.5618386 = score(doc=3418,freq=4.0), product of:
              0.5034505 = queryWeight, product of:
                1.9442669 = boost
                7.1422453 = idf(docFreq=92, maxDocs=43254)
                0.036254853 = queryNorm
              1.1159759 = fieldWeight in 3418, product of:
                2.0 = tf(freq=4.0), with freq of:
                  4.0 = termFreq=4.0
                7.1422453 = idf(docFreq=92, maxDocs=43254)
                0.078125 = fieldNorm(doc=3418)
        0.5 = coord(4/8)
    
  5. Aker, A.; Gaizauskas, R.: Generating descriptive multi-document summaries of geo-located entities using entity type models (2015) 0.38
    0.379136 = sum of:
      0.379136 = product of:
        0.758272 = sum of:
          0.08654835 = weight(abstract_txt:automatic in 3191) [ClassicSimilarity], result of:
            0.08654835 = score(doc=3191,freq=1.0), product of:
              0.26649043 = queryWeight, product of:
                1.41455 = boost
                5.1963353 = idf(docFreq=650, maxDocs=43254)
                0.036254853 = queryNorm
              0.32477096 = fieldWeight in 3191, product of:
                1.0 = tf(freq=1.0), with freq of:
                  1.0 = termFreq=1.0
                5.1963353 = idf(docFreq=650, maxDocs=43254)
                0.0625 = fieldNorm(doc=3191)
          0.11048552 = weight(abstract_txt:generation in 3191) [ClassicSimilarity], result of:
            0.11048552 = score(doc=3191,freq=1.0), product of:
              0.31360236 = queryWeight, product of:
                1.534501 = boost
                5.636974 = idf(docFreq=418, maxDocs=43254)
                0.036254853 = queryNorm
              0.35231087 = fieldWeight in 3191, product of:
                1.0 = tf(freq=1.0), with freq of:
                  1.0 = termFreq=1.0
                5.636974 = idf(docFreq=418, maxDocs=43254)
                0.0625 = fieldNorm(doc=3191)
          0.111767255 = weight(abstract_txt:texts in 3191) [ClassicSimilarity], result of:
            0.111767255 = score(doc=3191,freq=1.0), product of:
              0.31602308 = queryWeight, product of:
                1.540412 = boost
                5.658688 = idf(docFreq=409, maxDocs=43254)
                0.036254853 = queryNorm
              0.353668 = fieldWeight in 3191, product of:
                1.0 = tf(freq=1.0), with freq of:
                  1.0 = termFreq=1.0
                5.658688 = idf(docFreq=409, maxDocs=43254)
                0.0625 = fieldNorm(doc=3191)
          0.44947088 = weight(abstract_txt:summarization in 3191) [ClassicSimilarity], result of:
            0.44947088 = score(doc=3191,freq=4.0), product of:
              0.5034505 = queryWeight, product of:
                1.9442669 = boost
                7.1422453 = idf(docFreq=92, maxDocs=43254)
                0.036254853 = queryNorm
              0.89278066 = fieldWeight in 3191, product of:
                2.0 = tf(freq=4.0), with freq of:
                  4.0 = termFreq=4.0
                7.1422453 = idf(docFreq=92, maxDocs=43254)
                0.0625 = fieldNorm(doc=3191)
        0.5 = coord(4/8)