Document (#19948)

Author
Salton, G.
Allan, J.
Buckley, C.
Singhal, A.
Title
Automatic analysis, theme generation, and summarization of machine readable texts
Source
Science. 264(1994), S.1421-1426
Year
1994
Footnote
Wiederabgedruckt in: Readings in information retrieval. Ed.: K. Sparck Jones u. P. Willett. San Francisco: Morgan Kaufmann 1997. S.478-483.
Theme
Automatisches Indexieren
Automatisches Abstracting

Similar documents (author)

  1. Salton, G.; Allan, J.; Singhal, A.: Automatic text decomposition and structuring (1996) 3.74
    3.7383406 = sum of:
      3.7383406 = product of:
        4.984454 = sum of:
          1.142007 = weight(author_txt:salton in 4133) [ClassicSimilarity], result of:
            1.142007 = score(doc=4133,freq=1.0), product of:
              0.3919483 = queryWeight, product of:
                7.7697797 = idf(docFreq=49, maxDocs=43556)
                0.05044523 = queryNorm
              2.9136674 = fieldWeight in 4133, product of:
                1.0 = tf(freq=1.0), with freq of:
                  1.0 = termFreq=1.0
                7.7697797 = idf(docFreq=49, maxDocs=43556)
                0.375 = fieldNorm(doc=4133)
          1.6868044 = weight(author_txt:allan in 4133) [ClassicSimilarity], result of:
            1.6868044 = score(doc=4133,freq=1.0), product of:
              0.508346 = queryWeight, product of:
                1.1388469 = boost
                8.848589 = idf(docFreq=16, maxDocs=43556)
                0.05044523 = queryNorm
              3.3182209 = fieldWeight in 4133, product of:
                1.0 = tf(freq=1.0), with freq of:
                  1.0 = termFreq=1.0
                8.848589 = idf(docFreq=16, maxDocs=43556)
                0.375 = fieldNorm(doc=4133)
          2.155643 = weight(author_txt:singhal in 4133) [ClassicSimilarity], result of:
            2.155643 = score(doc=4133,freq=1.0), product of:
              0.59864247 = queryWeight, product of:
                1.2358602 = boost
                9.602362 = idf(docFreq=7, maxDocs=43556)
                0.05044523 = queryNorm
              3.6008856 = fieldWeight in 4133, product of:
                1.0 = tf(freq=1.0), with freq of:
                  1.0 = termFreq=1.0
                9.602362 = idf(docFreq=7, maxDocs=43556)
                0.375 = fieldNorm(doc=4133)
        0.75 = coord(3/4)
    
  2. Salton, G.; Buckley, C.; Allan, J.: Automatic structuring of text files (1992) 3.28
    3.2793155 = sum of:
      3.2793155 = product of:
        4.372421 = sum of:
          1.142007 = weight(author_txt:salton in 6504) [ClassicSimilarity], result of:
            1.142007 = score(doc=6504,freq=1.0), product of:
              0.3919483 = queryWeight, product of:
                7.7697797 = idf(docFreq=49, maxDocs=43556)
                0.05044523 = queryNorm
              2.9136674 = fieldWeight in 6504, product of:
                1.0 = tf(freq=1.0), with freq of:
                  1.0 = termFreq=1.0
                7.7697797 = idf(docFreq=49, maxDocs=43556)
                0.375 = fieldNorm(doc=6504)
          1.5436096 = weight(author_txt:buckley in 6504) [ClassicSimilarity], result of:
            1.5436096 = score(doc=6504,freq=1.0), product of:
              0.47915342 = queryWeight, product of:
                1.1056633 = boost
                8.59076 = idf(docFreq=21, maxDocs=43556)
                0.05044523 = queryNorm
              3.2215352 = fieldWeight in 6504, product of:
                1.0 = tf(freq=1.0), with freq of:
                  1.0 = termFreq=1.0
                8.59076 = idf(docFreq=21, maxDocs=43556)
                0.375 = fieldNorm(doc=6504)
          1.6868044 = weight(author_txt:allan in 6504) [ClassicSimilarity], result of:
            1.6868044 = score(doc=6504,freq=1.0), product of:
              0.508346 = queryWeight, product of:
                1.1388469 = boost
                8.848589 = idf(docFreq=16, maxDocs=43556)
                0.05044523 = queryNorm
              3.3182209 = fieldWeight in 6504, product of:
                1.0 = tf(freq=1.0), with freq of:
                  1.0 = termFreq=1.0
                8.848589 = idf(docFreq=16, maxDocs=43556)
                0.375 = fieldNorm(doc=6504)
        0.75 = coord(3/4)
    
  3. Buckley, C.; Allan, J.; Salton, G.: Automatic routing and retrieval using Smart : TREC-2 (1995) 3.28
    3.2793155 = sum of:
      3.2793155 = product of:
        4.372421 = sum of:
          1.142007 = weight(author_txt:salton in 697) [ClassicSimilarity], result of:
            1.142007 = score(doc=697,freq=1.0), product of:
              0.3919483 = queryWeight, product of:
                7.7697797 = idf(docFreq=49, maxDocs=43556)
                0.05044523 = queryNorm
              2.9136674 = fieldWeight in 697, product of:
                1.0 = tf(freq=1.0), with freq of:
                  1.0 = termFreq=1.0
                7.7697797 = idf(docFreq=49, maxDocs=43556)
                0.375 = fieldNorm(doc=697)
          1.5436096 = weight(author_txt:buckley in 697) [ClassicSimilarity], result of:
            1.5436096 = score(doc=697,freq=1.0), product of:
              0.47915342 = queryWeight, product of:
                1.1056633 = boost
                8.59076 = idf(docFreq=21, maxDocs=43556)
                0.05044523 = queryNorm
              3.2215352 = fieldWeight in 697, product of:
                1.0 = tf(freq=1.0), with freq of:
                  1.0 = termFreq=1.0
                8.59076 = idf(docFreq=21, maxDocs=43556)
                0.375 = fieldNorm(doc=697)
          1.6868044 = weight(author_txt:allan in 697) [ClassicSimilarity], result of:
            1.6868044 = score(doc=697,freq=1.0), product of:
              0.508346 = queryWeight, product of:
                1.1388469 = boost
                8.848589 = idf(docFreq=16, maxDocs=43556)
                0.05044523 = queryNorm
              3.3182209 = fieldWeight in 697, product of:
                1.0 = tf(freq=1.0), with freq of:
                  1.0 = termFreq=1.0
                8.848589 = idf(docFreq=16, maxDocs=43556)
                0.375 = fieldNorm(doc=697)
        0.75 = coord(3/4)
    
  4. Salton, G.; Allen, J.; Buckley, C.; Singhal, A.: Automatic analysis, theme generation, and summarization of machine-readable data (1994) 3.03
    3.025787 = sum of:
      3.025787 = product of:
        4.034383 = sum of:
          0.95167255 = weight(author_txt:salton in 1234) [ClassicSimilarity], result of:
            0.95167255 = score(doc=1234,freq=1.0), product of:
              0.3919483 = queryWeight, product of:
                7.7697797 = idf(docFreq=49, maxDocs=43556)
                0.05044523 = queryNorm
              2.4280562 = fieldWeight in 1234, product of:
                1.0 = tf(freq=1.0), with freq of:
                  1.0 = termFreq=1.0
                7.7697797 = idf(docFreq=49, maxDocs=43556)
                0.3125 = fieldNorm(doc=1234)
          1.2863413 = weight(author_txt:buckley in 1234) [ClassicSimilarity], result of:
            1.2863413 = score(doc=1234,freq=1.0), product of:
              0.47915342 = queryWeight, product of:
                1.1056633 = boost
                8.59076 = idf(docFreq=21, maxDocs=43556)
                0.05044523 = queryNorm
              2.6846125 = fieldWeight in 1234, product of:
                1.0 = tf(freq=1.0), with freq of:
                  1.0 = termFreq=1.0
                8.59076 = idf(docFreq=21, maxDocs=43556)
                0.3125 = fieldNorm(doc=1234)
          1.7963693 = weight(author_txt:singhal in 1234) [ClassicSimilarity], result of:
            1.7963693 = score(doc=1234,freq=1.0), product of:
              0.59864247 = queryWeight, product of:
                1.2358602 = boost
                9.602362 = idf(docFreq=7, maxDocs=43556)
                0.05044523 = queryNorm
              3.0007381 = fieldWeight in 1234, product of:
                1.0 = tf(freq=1.0), with freq of:
                  1.0 = termFreq=1.0
                9.602362 = idf(docFreq=7, maxDocs=43556)
                0.3125 = fieldNorm(doc=1234)
        0.75 = coord(3/4)
    
  5. Buckley, C.; Singhal, A.; Mitra, M.; Salton, G.: New retrieval approaches using SMART : TREC 4 (1996) 3.03
    3.025787 = sum of:
      3.025787 = product of:
        4.034383 = sum of:
          0.95167255 = weight(author_txt:salton in 595) [ClassicSimilarity], result of:
            0.95167255 = score(doc=595,freq=1.0), product of:
              0.3919483 = queryWeight, product of:
                7.7697797 = idf(docFreq=49, maxDocs=43556)
                0.05044523 = queryNorm
              2.4280562 = fieldWeight in 595, product of:
                1.0 = tf(freq=1.0), with freq of:
                  1.0 = termFreq=1.0
                7.7697797 = idf(docFreq=49, maxDocs=43556)
                0.3125 = fieldNorm(doc=595)
          1.2863413 = weight(author_txt:buckley in 595) [ClassicSimilarity], result of:
            1.2863413 = score(doc=595,freq=1.0), product of:
              0.47915342 = queryWeight, product of:
                1.1056633 = boost
                8.59076 = idf(docFreq=21, maxDocs=43556)
                0.05044523 = queryNorm
              2.6846125 = fieldWeight in 595, product of:
                1.0 = tf(freq=1.0), with freq of:
                  1.0 = termFreq=1.0
                8.59076 = idf(docFreq=21, maxDocs=43556)
                0.3125 = fieldNorm(doc=595)
          1.7963693 = weight(author_txt:singhal in 595) [ClassicSimilarity], result of:
            1.7963693 = score(doc=595,freq=1.0), product of:
              0.59864247 = queryWeight, product of:
                1.2358602 = boost
                9.602362 = idf(docFreq=7, maxDocs=43556)
                0.05044523 = queryNorm
              3.0007381 = fieldWeight in 595, product of:
                1.0 = tf(freq=1.0), with freq of:
                  1.0 = termFreq=1.0
                9.602362 = idf(docFreq=7, maxDocs=43556)
                0.3125 = fieldNorm(doc=595)
        0.75 = coord(3/4)
    

Similar documents (content)

  1. Coombs, J.H.; Renear, A.H.; DeRose, S.J.: Markup systems and the future of scholarly text processing (1987) 0.70
    0.7005153 = sum of:
      0.7005153 = product of:
        1.4010305 = sum of:
          0.10662437 = weight(abstract_txt:analysis in 1591) [ClassicSimilarity], result of:
            0.10662437 = score(doc=1591,freq=1.0), product of:
              0.1328693 = queryWeight, product of:
                3.6684597 = idf(docFreq=3020, maxDocs=43556)
                0.03621937 = queryNorm
              0.8024756 = fieldWeight in 1591, product of:
                1.0 = tf(freq=1.0), with freq of:
                  1.0 = termFreq=1.0
                3.6684597 = idf(docFreq=3020, maxDocs=43556)
                0.21875 = fieldNorm(doc=1591)
          0.32246304 = weight(abstract_txt:machine in 1591) [ClassicSimilarity], result of:
            0.32246304 = score(doc=1591,freq=1.0), product of:
              0.27786914 = queryWeight, product of:
                1.4461317 = boost
                5.3050756 = idf(docFreq=587, maxDocs=43556)
                0.03621937 = queryNorm
              1.1604853 = fieldWeight in 1591, product of:
                1.0 = tf(freq=1.0), with freq of:
                  1.0 = termFreq=1.0
                5.3050756 = idf(docFreq=587, maxDocs=43556)
                0.21875 = fieldNorm(doc=1591)
          0.39076787 = weight(abstract_txt:texts in 1591) [ClassicSimilarity], result of:
            0.39076787 = score(doc=1591,freq=1.0), product of:
              0.31583935 = queryWeight, product of:
                1.5417743 = boost
                5.6559367 = idf(docFreq=413, maxDocs=43556)
                0.03621937 = queryNorm
              1.2372361 = fieldWeight in 1591, product of:
                1.0 = tf(freq=1.0), with freq of:
                  1.0 = termFreq=1.0
                5.6559367 = idf(docFreq=413, maxDocs=43556)
                0.21875 = fieldNorm(doc=1591)
          0.5811752 = weight(abstract_txt:readable in 1591) [ClassicSimilarity], result of:
            0.5811752 = score(doc=1591,freq=1.0), product of:
              0.41152072 = queryWeight, product of:
                1.759882 = boost
                6.456056 = idf(docFreq=185, maxDocs=43556)
                0.03621937 = queryNorm
              1.4122623 = fieldWeight in 1591, product of:
                1.0 = tf(freq=1.0), with freq of:
                  1.0 = termFreq=1.0
                6.456056 = idf(docFreq=185, maxDocs=43556)
                0.21875 = fieldNorm(doc=1591)
        0.5 = coord(4/8)
    
  2. Smeaton, A.F.: Progress in the application of natural language processing to information retrieval tasks (1992) 0.52
    0.51553905 = sum of:
      0.51553905 = product of:
        1.3747709 = sum of:
          0.36719018 = weight(abstract_txt:automatic in 7077) [ClassicSimilarity], result of:
            0.36719018 = score(doc=7077,freq=2.0), product of:
              0.26652354 = queryWeight, product of:
                1.4163007 = boost
                5.195642 = idf(docFreq=655, maxDocs=43556)
                0.03621937 = queryNorm
              1.3777026 = fieldWeight in 7077, product of:
                1.4142135 = tf(freq=2.0), with freq of:
                  2.0 = termFreq=2.0
                5.195642 = idf(docFreq=655, maxDocs=43556)
                0.1875 = fieldNorm(doc=7077)
          0.3311376 = weight(abstract_txt:generation in 7077) [ClassicSimilarity], result of:
            0.3311376 = score(doc=7077,freq=1.0), product of:
              0.313442 = queryWeight, product of:
                1.5359118 = boost
                5.6344304 = idf(docFreq=422, maxDocs=43556)
                0.03621937 = queryNorm
              1.0564557 = fieldWeight in 7077, product of:
                1.0 = tf(freq=1.0), with freq of:
                  1.0 = termFreq=1.0
                5.6344304 = idf(docFreq=422, maxDocs=43556)
                0.1875 = fieldNorm(doc=7077)
          0.67644316 = weight(abstract_txt:summarization in 7077) [ClassicSimilarity], result of:
            0.67644316 = score(doc=7077,freq=1.0), product of:
              0.50462925 = queryWeight, product of:
                1.9488298 = boost
                7.1492033 = idf(docFreq=92, maxDocs=43556)
                0.03621937 = queryNorm
              1.3404756 = fieldWeight in 7077, product of:
                1.0 = tf(freq=1.0), with freq of:
                  1.0 = termFreq=1.0
                7.1492033 = idf(docFreq=92, maxDocs=43556)
                0.1875 = fieldNorm(doc=7077)
        0.375 = coord(3/8)
    
  3. Sabourin, C.F. (Bearb.): Computational lexicology and lexicography : bibliography (1994) 0.50
    0.49878207 = sum of:
      0.49878207 = product of:
        0.99756414 = sum of:
          0.07616026 = weight(abstract_txt:analysis in 868) [ClassicSimilarity], result of:
            0.07616026 = score(doc=868,freq=1.0), product of:
              0.1328693 = queryWeight, product of:
                3.6684597 = idf(docFreq=3020, maxDocs=43556)
                0.03621937 = queryNorm
              0.5731968 = fieldWeight in 868, product of:
                1.0 = tf(freq=1.0), with freq of:
                  1.0 = termFreq=1.0
                3.6684597 = idf(docFreq=3020, maxDocs=43556)
                0.15625 = fieldNorm(doc=868)
          0.23033075 = weight(abstract_txt:machine in 868) [ClassicSimilarity], result of:
            0.23033075 = score(doc=868,freq=1.0), product of:
              0.27786914 = queryWeight, product of:
                1.4461317 = boost
                5.3050756 = idf(docFreq=587, maxDocs=43556)
                0.03621937 = queryNorm
              0.8289181 = fieldWeight in 868, product of:
                1.0 = tf(freq=1.0), with freq of:
                  1.0 = termFreq=1.0
                5.3050756 = idf(docFreq=587, maxDocs=43556)
                0.15625 = fieldNorm(doc=868)
          0.275948 = weight(abstract_txt:generation in 868) [ClassicSimilarity], result of:
            0.275948 = score(doc=868,freq=1.0), product of:
              0.313442 = queryWeight, product of:
                1.5359118 = boost
                5.6344304 = idf(docFreq=422, maxDocs=43556)
                0.03621937 = queryNorm
              0.88037974 = fieldWeight in 868, product of:
                1.0 = tf(freq=1.0), with freq of:
                  1.0 = termFreq=1.0
                5.6344304 = idf(docFreq=422, maxDocs=43556)
                0.15625 = fieldNorm(doc=868)
          0.41512513 = weight(abstract_txt:readable in 868) [ClassicSimilarity], result of:
            0.41512513 = score(doc=868,freq=1.0), product of:
              0.41152072 = queryWeight, product of:
                1.759882 = boost
                6.456056 = idf(docFreq=185, maxDocs=43556)
                0.03621937 = queryNorm
              1.0087588 = fieldWeight in 868, product of:
                1.0 = tf(freq=1.0), with freq of:
                  1.0 = termFreq=1.0
                6.456056 = idf(docFreq=185, maxDocs=43556)
                0.15625 = fieldNorm(doc=868)
        0.5 = coord(4/8)
    
  4. Maybury, M.T.: Generating summaries from event data (1995) 0.47
    0.47447264 = sum of:
      0.47447264 = product of:
        0.9489453 = sum of:
          0.03808013 = weight(abstract_txt:analysis in 2415) [ClassicSimilarity], result of:
            0.03808013 = score(doc=2415,freq=1.0), product of:
              0.1328693 = queryWeight, product of:
                3.6684597 = idf(docFreq=3020, maxDocs=43556)
                0.03621937 = queryNorm
              0.2865984 = fieldWeight in 2415, product of:
                1.0 = tf(freq=1.0), with freq of:
                  1.0 = termFreq=1.0
                3.6684597 = idf(docFreq=3020, maxDocs=43556)
                0.078125 = fieldNorm(doc=2415)
          0.10818445 = weight(abstract_txt:automatic in 2415) [ClassicSimilarity], result of:
            0.10818445 = score(doc=2415,freq=1.0), product of:
              0.26652354 = queryWeight, product of:
                1.4163007 = boost
                5.195642 = idf(docFreq=655, maxDocs=43556)
                0.03621937 = queryNorm
              0.40590954 = fieldWeight in 2415, product of:
                1.0 = tf(freq=1.0), with freq of:
                  1.0 = termFreq=1.0
                5.195642 = idf(docFreq=655, maxDocs=43556)
                0.078125 = fieldNorm(doc=2415)
          0.23897797 = weight(abstract_txt:generation in 2415) [ClassicSimilarity], result of:
            0.23897797 = score(doc=2415,freq=3.0), product of:
              0.313442 = queryWeight, product of:
                1.5359118 = boost
                5.6344304 = idf(docFreq=422, maxDocs=43556)
                0.03621937 = queryNorm
              0.76243126 = fieldWeight in 2415, product of:
                1.7320508 = tf(freq=3.0), with freq of:
                  3.0 = termFreq=3.0
                5.6344304 = idf(docFreq=422, maxDocs=43556)
                0.078125 = fieldNorm(doc=2415)
          0.5637027 = weight(abstract_txt:summarization in 2415) [ClassicSimilarity], result of:
            0.5637027 = score(doc=2415,freq=4.0), product of:
              0.50462925 = queryWeight, product of:
                1.9488298 = boost
                7.1492033 = idf(docFreq=92, maxDocs=43556)
                0.03621937 = queryNorm
              1.117063 = fieldWeight in 2415, product of:
                2.0 = tf(freq=4.0), with freq of:
                  4.0 = termFreq=4.0
                7.1492033 = idf(docFreq=92, maxDocs=43556)
                0.078125 = fieldNorm(doc=2415)
        0.5 = coord(4/8)
    
  5. Aker, A.; Gaizauskas, R.: Generating descriptive multi-document summaries of geo-located entities using entity type models (2015) 0.38
    0.37976843 = sum of:
      0.37976843 = product of:
        0.75953686 = sum of:
          0.08654755 = weight(abstract_txt:automatic in 3724) [ClassicSimilarity], result of:
            0.08654755 = score(doc=3724,freq=1.0), product of:
              0.26652354 = queryWeight, product of:
                1.4163007 = boost
                5.195642 = idf(docFreq=655, maxDocs=43556)
                0.03621937 = queryNorm
              0.32472762 = fieldWeight in 3724, product of:
                1.0 = tf(freq=1.0), with freq of:
                  1.0 = termFreq=1.0
                5.195642 = idf(docFreq=655, maxDocs=43556)
                0.0625 = fieldNorm(doc=3724)
          0.1103792 = weight(abstract_txt:generation in 3724) [ClassicSimilarity], result of:
            0.1103792 = score(doc=3724,freq=1.0), product of:
              0.313442 = queryWeight, product of:
                1.5359118 = boost
                5.6344304 = idf(docFreq=422, maxDocs=43556)
                0.03621937 = queryNorm
              0.3521519 = fieldWeight in 3724, product of:
                1.0 = tf(freq=1.0), with freq of:
                  1.0 = termFreq=1.0
                5.6344304 = idf(docFreq=422, maxDocs=43556)
                0.0625 = fieldNorm(doc=3724)
          0.11164796 = weight(abstract_txt:texts in 3724) [ClassicSimilarity], result of:
            0.11164796 = score(doc=3724,freq=1.0), product of:
              0.31583935 = queryWeight, product of:
                1.5417743 = boost
                5.6559367 = idf(docFreq=413, maxDocs=43556)
                0.03621937 = queryNorm
              0.35349604 = fieldWeight in 3724, product of:
                1.0 = tf(freq=1.0), with freq of:
                  1.0 = termFreq=1.0
                5.6559367 = idf(docFreq=413, maxDocs=43556)
                0.0625 = fieldNorm(doc=3724)
          0.45096216 = weight(abstract_txt:summarization in 3724) [ClassicSimilarity], result of:
            0.45096216 = score(doc=3724,freq=4.0), product of:
              0.50462925 = queryWeight, product of:
                1.9488298 = boost
                7.1492033 = idf(docFreq=92, maxDocs=43556)
                0.03621937 = queryNorm
              0.8936504 = fieldWeight in 3724, product of:
                2.0 = tf(freq=4.0), with freq of:
                  4.0 = termFreq=4.0
                7.1492033 = idf(docFreq=92, maxDocs=43556)
                0.0625 = fieldNorm(doc=3724)
        0.5 = coord(4/8)