Document (#19939)

Author
Salton, G.
Buckley, C.
Title
Term-weighting approaches in automatic text retrieval
Source
Information processing and management. 24(1988) no.5, S.513-523
Year
1988
Footnote
Wiederabgedruckt in: Readings in information retrieval. Ed.: K. Sparck Jones u. P. Willett. San Francisco: Morgan Kaufmann 1997. S.323-328.
Theme
Retrievalalgorithmen

Similar documents (author)

  1. Salton, G.; Buckley, C.: Parallel text search methods (1988) 5.80
    5.7951345 = sum of:
      5.7951345 = sum of:
        2.4650571 = weight(author_txt:salton in 404) [ClassicSimilarity], result of:
          2.4650571 = score(doc=404,freq=1.0), product of:
            0.6332948 = queryWeight, product of:
              7.7848644 = idf(docFreq=49, maxDocs=44218)
              0.0813495 = queryNorm
            3.8924322 = fieldWeight in 404, product of:
              1.0 = tf(freq=1.0), with freq of:
                1.0 = termFreq=1.0
              7.7848644 = idf(docFreq=49, maxDocs=44218)
              0.5 = fieldNorm(doc=404)
        3.3300774 = weight(author_txt:buckley in 404) [ClassicSimilarity], result of:
          3.3300774 = score(doc=404,freq=1.0), product of:
            0.77391064 = queryWeight, product of:
              1.1054585 = boost
              8.6058445 = idf(docFreq=21, maxDocs=44218)
              0.0813495 = queryNorm
            4.3029222 = fieldWeight in 404, product of:
              1.0 = tf(freq=1.0), with freq of:
                1.0 = termFreq=1.0
              8.6058445 = idf(docFreq=21, maxDocs=44218)
              0.5 = fieldNorm(doc=404)
    
  2. Salton, G.; Buckley, C.: Approaches to global text analysis (1990) 5.80
    5.7951345 = sum of:
      5.7951345 = sum of:
        2.4650571 = weight(author_txt:salton in 4901) [ClassicSimilarity], result of:
          2.4650571 = score(doc=4901,freq=1.0), product of:
            0.6332948 = queryWeight, product of:
              7.7848644 = idf(docFreq=49, maxDocs=44218)
              0.0813495 = queryNorm
            3.8924322 = fieldWeight in 4901, product of:
              1.0 = tf(freq=1.0), with freq of:
                1.0 = termFreq=1.0
              7.7848644 = idf(docFreq=49, maxDocs=44218)
              0.5 = fieldNorm(doc=4901)
        3.3300774 = weight(author_txt:buckley in 4901) [ClassicSimilarity], result of:
          3.3300774 = score(doc=4901,freq=1.0), product of:
            0.77391064 = queryWeight, product of:
              1.1054585 = boost
              8.6058445 = idf(docFreq=21, maxDocs=44218)
              0.0813495 = queryNorm
            4.3029222 = fieldWeight in 4901, product of:
              1.0 = tf(freq=1.0), with freq of:
                1.0 = termFreq=1.0
              8.6058445 = idf(docFreq=21, maxDocs=44218)
              0.5 = fieldNorm(doc=4901)
    
  3. Salton, G.; Buckley, C.: Improving retrieval performance by relevance feedback (1990) 5.80
    5.7951345 = sum of:
      5.7951345 = sum of:
        2.4650571 = weight(author_txt:salton in 5442) [ClassicSimilarity], result of:
          2.4650571 = score(doc=5442,freq=1.0), product of:
            0.6332948 = queryWeight, product of:
              7.7848644 = idf(docFreq=49, maxDocs=44218)
              0.0813495 = queryNorm
            3.8924322 = fieldWeight in 5442, product of:
              1.0 = tf(freq=1.0), with freq of:
                1.0 = termFreq=1.0
              7.7848644 = idf(docFreq=49, maxDocs=44218)
              0.5 = fieldNorm(doc=5442)
        3.3300774 = weight(author_txt:buckley in 5442) [ClassicSimilarity], result of:
          3.3300774 = score(doc=5442,freq=1.0), product of:
            0.77391064 = queryWeight, product of:
              1.1054585 = boost
              8.6058445 = idf(docFreq=21, maxDocs=44218)
              0.0813495 = queryNorm
            4.3029222 = fieldWeight in 5442, product of:
              1.0 = tf(freq=1.0), with freq of:
                1.0 = termFreq=1.0
              8.6058445 = idf(docFreq=21, maxDocs=44218)
              0.5 = fieldNorm(doc=5442)
    
  4. Salton, G.; Buckley, C.; Allan, J.: Automatic structuring of text files (1992) 4.35
    4.3463507 = sum of:
      4.3463507 = sum of:
        1.8487929 = weight(author_txt:salton in 6507) [ClassicSimilarity], result of:
          1.8487929 = score(doc=6507,freq=1.0), product of:
            0.6332948 = queryWeight, product of:
              7.7848644 = idf(docFreq=49, maxDocs=44218)
              0.0813495 = queryNorm
            2.9193242 = fieldWeight in 6507, product of:
              1.0 = tf(freq=1.0), with freq of:
                1.0 = termFreq=1.0
              7.7848644 = idf(docFreq=49, maxDocs=44218)
              0.375 = fieldNorm(doc=6507)
        2.4975579 = weight(author_txt:buckley in 6507) [ClassicSimilarity], result of:
          2.4975579 = score(doc=6507,freq=1.0), product of:
            0.77391064 = queryWeight, product of:
              1.1054585 = boost
              8.6058445 = idf(docFreq=21, maxDocs=44218)
              0.0813495 = queryNorm
            3.2271917 = fieldWeight in 6507, product of:
              1.0 = tf(freq=1.0), with freq of:
                1.0 = termFreq=1.0
              8.6058445 = idf(docFreq=21, maxDocs=44218)
              0.375 = fieldNorm(doc=6507)
    
  5. Salton, G.; Buckley, C.; Smith, M.: On the application of syntactic methodologies in automatic text analysis (1990) 4.35
    4.3463507 = sum of:
      4.3463507 = sum of:
        1.8487929 = weight(author_txt:salton in 7864) [ClassicSimilarity], result of:
          1.8487929 = score(doc=7864,freq=1.0), product of:
            0.6332948 = queryWeight, product of:
              7.7848644 = idf(docFreq=49, maxDocs=44218)
              0.0813495 = queryNorm
            2.9193242 = fieldWeight in 7864, product of:
              1.0 = tf(freq=1.0), with freq of:
                1.0 = termFreq=1.0
              7.7848644 = idf(docFreq=49, maxDocs=44218)
              0.375 = fieldNorm(doc=7864)
        2.4975579 = weight(author_txt:buckley in 7864) [ClassicSimilarity], result of:
          2.4975579 = score(doc=7864,freq=1.0), product of:
            0.77391064 = queryWeight, product of:
              1.1054585 = boost
              8.6058445 = idf(docFreq=21, maxDocs=44218)
              0.0813495 = queryNorm
            3.2271917 = fieldWeight in 7864, product of:
              1.0 = tf(freq=1.0), with freq of:
                1.0 = termFreq=1.0
              8.6058445 = idf(docFreq=21, maxDocs=44218)
              0.375 = fieldNorm(doc=7864)
    

Similar documents (content)

  1. Harman, D.: ¬The Text REtrieval Conferences (TRECs) : providing a test-bed for information retrieval systems (1998) 0.88
    0.8819868 = sum of:
      0.8819868 = product of:
        1.0583842 = sum of:
          0.10163468 = weight(abstract_txt:retrieval in 1314) [ClassicSimilarity], result of:
            0.10163468 = score(doc=1314,freq=3.0), product of:
              0.18011 = queryWeight, product of:
                3.4751394 = idf(docFreq=3720, maxDocs=44218)
                0.051828135 = queryNorm
              0.5642923 = fieldWeight in 1314, product of:
                1.7320508 = tf(freq=3.0), with freq of:
                  3.0 = termFreq=3.0
                3.4751394 = idf(docFreq=3720, maxDocs=44218)
                0.09375 = fieldNorm(doc=1314)
          0.13075857 = weight(abstract_txt:text in 1314) [ClassicSimilarity], result of:
            0.13075857 = score(doc=1314,freq=2.0), product of:
              0.2438861 = queryWeight, product of:
                1.163656 = boost
                4.0438666 = idf(docFreq=2106, maxDocs=44218)
                0.051828135 = queryNorm
              0.53614604 = fieldWeight in 1314, product of:
                1.4142135 = tf(freq=2.0), with freq of:
                  2.0 = termFreq=2.0
                4.0438666 = idf(docFreq=2106, maxDocs=44218)
                0.09375 = fieldNorm(doc=1314)
          0.1547445 = weight(abstract_txt:term in 1314) [ClassicSimilarity], result of:
            0.1547445 = score(doc=1314,freq=1.0), product of:
              0.3437904 = queryWeight, product of:
                1.3815862 = boost
                4.8012047 = idf(docFreq=987, maxDocs=44218)
                0.051828135 = queryNorm
              0.45011294 = fieldWeight in 1314, product of:
                1.0 = tf(freq=1.0), with freq of:
                  1.0 = termFreq=1.0
                4.8012047 = idf(docFreq=987, maxDocs=44218)
                0.09375 = fieldNorm(doc=1314)
          0.19609709 = weight(abstract_txt:automatic in 1314) [ClassicSimilarity], result of:
            0.19609709 = score(doc=1314,freq=1.0), product of:
              0.4025913 = queryWeight, product of:
                1.4950761 = boost
                5.1955976 = idf(docFreq=665, maxDocs=44218)
                0.051828135 = queryNorm
              0.48708728 = fieldWeight in 1314, product of:
                1.0 = tf(freq=1.0), with freq of:
                  1.0 = termFreq=1.0
                5.1955976 = idf(docFreq=665, maxDocs=44218)
                0.09375 = fieldNorm(doc=1314)
          0.47514927 = weight(abstract_txt:weighting in 1314) [ClassicSimilarity], result of:
            0.47514927 = score(doc=1314,freq=1.0), product of:
              0.72627926 = queryWeight, product of:
                2.0080888 = boost
                6.9783883 = idf(docFreq=111, maxDocs=44218)
                0.051828135 = queryNorm
              0.6542239 = fieldWeight in 1314, product of:
                1.0 = tf(freq=1.0), with freq of:
                  1.0 = termFreq=1.0
                6.9783883 = idf(docFreq=111, maxDocs=44218)
                0.09375 = fieldNorm(doc=1314)
        0.8333333 = coord(5/6)
    
  2. Ko, Y.: ¬A new term-weighting scheme for text classification using the odds of positive and negative class probabilities (2015) 0.88
    0.87636656 = sum of:
      0.87636656 = product of:
        1.3145498 = sum of:
          0.09779802 = weight(abstract_txt:retrieval in 2339) [ClassicSimilarity], result of:
            0.09779802 = score(doc=2339,freq=4.0), product of:
              0.18011 = queryWeight, product of:
                3.4751394 = idf(docFreq=3720, maxDocs=44218)
                0.051828135 = queryNorm
              0.5429905 = fieldWeight in 2339, product of:
                2.0 = tf(freq=4.0), with freq of:
                  4.0 = termFreq=4.0
                3.4751394 = idf(docFreq=3720, maxDocs=44218)
                0.078125 = fieldNorm(doc=2339)
          0.10896547 = weight(abstract_txt:text in 2339) [ClassicSimilarity], result of:
            0.10896547 = score(doc=2339,freq=2.0), product of:
              0.2438861 = queryWeight, product of:
                1.163656 = boost
                4.0438666 = idf(docFreq=2106, maxDocs=44218)
                0.051828135 = queryNorm
              0.44678837 = fieldWeight in 2339, product of:
                1.4142135 = tf(freq=2.0), with freq of:
                  2.0 = termFreq=2.0
                4.0438666 = idf(docFreq=2106, maxDocs=44218)
                0.078125 = fieldNorm(doc=2339)
          0.3158709 = weight(abstract_txt:term in 2339) [ClassicSimilarity], result of:
            0.3158709 = score(doc=2339,freq=6.0), product of:
              0.3437904 = queryWeight, product of:
                1.3815862 = boost
                4.8012047 = idf(docFreq=987, maxDocs=44218)
                0.051828135 = queryNorm
              0.9187892 = fieldWeight in 2339, product of:
                2.4494898 = tf(freq=6.0), with freq of:
                  6.0 = termFreq=6.0
                4.8012047 = idf(docFreq=987, maxDocs=44218)
                0.078125 = fieldNorm(doc=2339)
          0.7919154 = weight(abstract_txt:weighting in 2339) [ClassicSimilarity], result of:
            0.7919154 = score(doc=2339,freq=4.0), product of:
              0.72627926 = queryWeight, product of:
                2.0080888 = boost
                6.9783883 = idf(docFreq=111, maxDocs=44218)
                0.051828135 = queryNorm
              1.0903732 = fieldWeight in 2339, product of:
                2.0 = tf(freq=4.0), with freq of:
                  4.0 = termFreq=4.0
                6.9783883 = idf(docFreq=111, maxDocs=44218)
                0.078125 = fieldNorm(doc=2339)
        0.6666667 = coord(4/6)
    
  3. Faraj, N.: Analyse d'une méthode d'indexation automatique basée sur une analyse syntaxique de texte (1996) 0.87
    0.87337637 = sum of:
      0.87337637 = product of:
        1.3100646 = sum of:
          0.123280354 = weight(abstract_txt:text in 685) [ClassicSimilarity], result of:
            0.123280354 = score(doc=685,freq=1.0), product of:
              0.2438861 = queryWeight, product of:
                1.163656 = boost
                4.0438666 = idf(docFreq=2106, maxDocs=44218)
                0.051828135 = queryNorm
              0.5054833 = fieldWeight in 685, product of:
                1.0 = tf(freq=1.0), with freq of:
                  1.0 = termFreq=1.0
                4.0438666 = idf(docFreq=2106, maxDocs=44218)
                0.125 = fieldNorm(doc=685)
          0.29178903 = weight(abstract_txt:term in 685) [ClassicSimilarity], result of:
            0.29178903 = score(doc=685,freq=2.0), product of:
              0.3437904 = queryWeight, product of:
                1.3815862 = boost
                4.8012047 = idf(docFreq=987, maxDocs=44218)
                0.051828135 = queryNorm
              0.84874105 = fieldWeight in 685, product of:
                1.4142135 = tf(freq=2.0), with freq of:
                  2.0 = termFreq=2.0
                4.8012047 = idf(docFreq=987, maxDocs=44218)
                0.125 = fieldNorm(doc=685)
          0.2614628 = weight(abstract_txt:automatic in 685) [ClassicSimilarity], result of:
            0.2614628 = score(doc=685,freq=1.0), product of:
              0.4025913 = queryWeight, product of:
                1.4950761 = boost
                5.1955976 = idf(docFreq=665, maxDocs=44218)
                0.051828135 = queryNorm
              0.6494497 = fieldWeight in 685, product of:
                1.0 = tf(freq=1.0), with freq of:
                  1.0 = termFreq=1.0
                5.1955976 = idf(docFreq=665, maxDocs=44218)
                0.125 = fieldNorm(doc=685)
          0.63353235 = weight(abstract_txt:weighting in 685) [ClassicSimilarity], result of:
            0.63353235 = score(doc=685,freq=1.0), product of:
              0.72627926 = queryWeight, product of:
                2.0080888 = boost
                6.9783883 = idf(docFreq=111, maxDocs=44218)
                0.051828135 = queryNorm
              0.87229854 = fieldWeight in 685, product of:
                1.0 = tf(freq=1.0), with freq of:
                  1.0 = termFreq=1.0
                6.9783883 = idf(docFreq=111, maxDocs=44218)
                0.125 = fieldNorm(doc=685)
        0.6666667 = coord(4/6)
    
  4. Robertson, S.E.: OKAPI at TREC-1 (1994) 0.87
    0.86919653 = sum of:
      0.86919653 = product of:
        1.3037947 = sum of:
          0.07823841 = weight(abstract_txt:retrieval in 7953) [ClassicSimilarity], result of:
            0.07823841 = score(doc=7953,freq=1.0), product of:
              0.18011 = queryWeight, product of:
                3.4751394 = idf(docFreq=3720, maxDocs=44218)
                0.051828135 = queryNorm
              0.43439242 = fieldWeight in 7953, product of:
                1.0 = tf(freq=1.0), with freq of:
                  1.0 = termFreq=1.0
                3.4751394 = idf(docFreq=3720, maxDocs=44218)
                0.125 = fieldNorm(doc=7953)
          0.123280354 = weight(abstract_txt:text in 7953) [ClassicSimilarity], result of:
            0.123280354 = score(doc=7953,freq=1.0), product of:
              0.2438861 = queryWeight, product of:
                1.163656 = boost
                4.0438666 = idf(docFreq=2106, maxDocs=44218)
                0.051828135 = queryNorm
              0.5054833 = fieldWeight in 7953, product of:
                1.0 = tf(freq=1.0), with freq of:
                  1.0 = termFreq=1.0
                4.0438666 = idf(docFreq=2106, maxDocs=44218)
                0.125 = fieldNorm(doc=7953)
          0.20632602 = weight(abstract_txt:term in 7953) [ClassicSimilarity], result of:
            0.20632602 = score(doc=7953,freq=1.0), product of:
              0.3437904 = queryWeight, product of:
                1.3815862 = boost
                4.8012047 = idf(docFreq=987, maxDocs=44218)
                0.051828135 = queryNorm
              0.6001506 = fieldWeight in 7953, product of:
                1.0 = tf(freq=1.0), with freq of:
                  1.0 = termFreq=1.0
                4.8012047 = idf(docFreq=987, maxDocs=44218)
                0.125 = fieldNorm(doc=7953)
          0.89594996 = weight(abstract_txt:weighting in 7953) [ClassicSimilarity], result of:
            0.89594996 = score(doc=7953,freq=2.0), product of:
              0.72627926 = queryWeight, product of:
                2.0080888 = boost
                6.9783883 = idf(docFreq=111, maxDocs=44218)
                0.051828135 = queryNorm
              1.2336164 = fieldWeight in 7953, product of:
                1.4142135 = tf(freq=2.0), with freq of:
                  2.0 = termFreq=2.0
                6.9783883 = idf(docFreq=111, maxDocs=44218)
                0.125 = fieldNorm(doc=7953)
        0.6666667 = coord(4/6)
    
  5. Harman, D.: Overview of the first Text Retrieval Conference (1993) 0.83
    0.8345296 = sum of:
      0.8345296 = product of:
        1.0014355 = sum of:
          0.082984366 = weight(abstract_txt:retrieval in 548) [ClassicSimilarity], result of:
            0.082984366 = score(doc=548,freq=2.0), product of:
              0.18011 = queryWeight, product of:
                3.4751394 = idf(docFreq=3720, maxDocs=44218)
                0.051828135 = queryNorm
              0.4607427 = fieldWeight in 548, product of:
                1.4142135 = tf(freq=2.0), with freq of:
                  2.0 = termFreq=2.0
                3.4751394 = idf(docFreq=3720, maxDocs=44218)
                0.09375 = fieldNorm(doc=548)
          0.09246027 = weight(abstract_txt:text in 548) [ClassicSimilarity], result of:
            0.09246027 = score(doc=548,freq=1.0), product of:
              0.2438861 = queryWeight, product of:
                1.163656 = boost
                4.0438666 = idf(docFreq=2106, maxDocs=44218)
                0.051828135 = queryNorm
              0.37911248 = fieldWeight in 548, product of:
                1.0 = tf(freq=1.0), with freq of:
                  1.0 = termFreq=1.0
                4.0438666 = idf(docFreq=2106, maxDocs=44218)
                0.09375 = fieldNorm(doc=548)
          0.1547445 = weight(abstract_txt:term in 548) [ClassicSimilarity], result of:
            0.1547445 = score(doc=548,freq=1.0), product of:
              0.3437904 = queryWeight, product of:
                1.3815862 = boost
                4.8012047 = idf(docFreq=987, maxDocs=44218)
                0.051828135 = queryNorm
              0.45011294 = fieldWeight in 548, product of:
                1.0 = tf(freq=1.0), with freq of:
                  1.0 = termFreq=1.0
                4.8012047 = idf(docFreq=987, maxDocs=44218)
                0.09375 = fieldNorm(doc=548)
          0.19609709 = weight(abstract_txt:automatic in 548) [ClassicSimilarity], result of:
            0.19609709 = score(doc=548,freq=1.0), product of:
              0.4025913 = queryWeight, product of:
                1.4950761 = boost
                5.1955976 = idf(docFreq=665, maxDocs=44218)
                0.051828135 = queryNorm
              0.48708728 = fieldWeight in 548, product of:
                1.0 = tf(freq=1.0), with freq of:
                  1.0 = termFreq=1.0
                5.1955976 = idf(docFreq=665, maxDocs=44218)
                0.09375 = fieldNorm(doc=548)
          0.47514927 = weight(abstract_txt:weighting in 548) [ClassicSimilarity], result of:
            0.47514927 = score(doc=548,freq=1.0), product of:
              0.72627926 = queryWeight, product of:
                2.0080888 = boost
                6.9783883 = idf(docFreq=111, maxDocs=44218)
                0.051828135 = queryNorm
              0.6542239 = fieldWeight in 548, product of:
                1.0 = tf(freq=1.0), with freq of:
                  1.0 = termFreq=1.0
                6.9783883 = idf(docFreq=111, maxDocs=44218)
                0.09375 = fieldNorm(doc=548)
        0.8333333 = coord(5/6)