Document (#16318)

Author
Veenema, F.
Title
To index or not to index
Source
Canadian journal of information and library science. 21(1996) no.2, S.1-22
Year
1996
Abstract
Describes an experiment comparing the performance of automatic full-text indexing software for personal computers with the human intellectual assignment of indexing terms in each document in a collection. Considers the times required to index the document, to retrieve documents satisfying 5 typical foreseen information needs, and the recall and precision ratios of searching. The software used is the QuickFinder facility in WordPerfect 6.1 for Windows.
Theme
Indexierungsstudien

Similar documents (content)

  1. Mulvany, N.C.: Software tools for indexing : what we need (1990) 0.17
    0.16555202 = sum of:
      0.16555202 = product of:
        0.8277601 = sum of:
          0.073213495 = weight(abstract_txt:document in 453) [ClassicSimilarity], result of:
            0.073213495 = score(doc=453,freq=1.0), product of:
              0.15636933 = queryWeight, product of:
                1.742227 = boost
                4.280766 = idf(docFreq=1606, maxDocs=42740)
                0.020966472 = queryNorm
              0.4682088 = fieldWeight in 453, product of:
                1.0 = tf(freq=1.0), with freq of:
                  1.0 = termFreq=1.0
                4.280766 = idf(docFreq=1606, maxDocs=42740)
                0.109375 = fieldNorm(doc=453)
          0.076315016 = weight(abstract_txt:indexing in 453) [ClassicSimilarity], result of:
            0.076315016 = score(doc=453,freq=1.0), product of:
              0.16075487 = queryWeight, product of:
                1.7664894 = boost
                4.34038 = idf(docFreq=1513, maxDocs=42740)
                0.020966472 = queryNorm
              0.4747291 = fieldWeight in 453, product of:
                1.0 = tf(freq=1.0), with freq of:
                  1.0 = termFreq=1.0
                4.34038 = idf(docFreq=1513, maxDocs=42740)
                0.109375 = fieldNorm(doc=453)
          0.13290983 = weight(abstract_txt:software in 453) [ClassicSimilarity], result of:
            0.13290983 = score(doc=453,freq=3.0), product of:
              0.16134486 = queryWeight, product of:
                1.769728 = boost
                4.3483377 = idf(docFreq=1501, maxDocs=42740)
                0.020966472 = queryNorm
              0.8237624 = fieldWeight in 453, product of:
                1.7320508 = tf(freq=3.0), with freq of:
                  3.0 = termFreq=3.0
                4.3483377 = idf(docFreq=1501, maxDocs=42740)
                0.109375 = fieldNorm(doc=453)
          0.33509678 = weight(abstract_txt:wordperfect in 453) [ClassicSimilarity], result of:
            0.33509678 = score(doc=453,freq=1.0), product of:
              0.3421325 = queryWeight, product of:
                1.8222632 = boost
                8.954841 = idf(docFreq=14, maxDocs=42740)
                0.020966472 = queryNorm
              0.9794357 = fieldWeight in 453, product of:
                1.0 = tf(freq=1.0), with freq of:
                  1.0 = termFreq=1.0
                8.954841 = idf(docFreq=14, maxDocs=42740)
                0.109375 = fieldNorm(doc=453)
          0.210225 = weight(abstract_txt:index in 453) [ClassicSimilarity], result of:
            0.210225 = score(doc=453,freq=2.0), product of:
              0.28701252 = queryWeight, product of:
                2.8908463 = boost
                4.7353325 = idf(docFreq=1019, maxDocs=42740)
                0.020966472 = queryNorm
              0.73245937 = fieldWeight in 453, product of:
                1.4142135 = tf(freq=2.0), with freq of:
                  2.0 = termFreq=2.0
                4.7353325 = idf(docFreq=1019, maxDocs=42740)
                0.109375 = fieldNorm(doc=453)
        0.2 = coord(5/25)
    
  2. Chung, E.-K.; Miksa, S.; Hastings, S.K.: ¬A framework of automatic subject term assignment for text categorization : an indexing conception-based approach (2010) 0.16
    0.16186038 = sum of:
      0.16186038 = product of:
        0.5780728 = sum of:
          0.055377953 = weight(abstract_txt:full in 435) [ClassicSimilarity], result of:
            0.055377953 = score(doc=435,freq=4.0), product of:
              0.10303199 = queryWeight, product of:
                4.914131 = idf(docFreq=852, maxDocs=42740)
                0.020966472 = queryNorm
              0.5374831 = fieldWeight in 435, product of:
                2.0 = tf(freq=4.0), with freq of:
                  4.0 = termFreq=4.0
                4.914131 = idf(docFreq=852, maxDocs=42740)
                0.0546875 = fieldNorm(doc=435)
          0.06561029 = weight(abstract_txt:automatic in 435) [ClassicSimilarity], result of:
            0.06561029 = score(doc=435,freq=4.0), product of:
              0.115361825 = queryWeight, product of:
                1.0581446 = boost
                5.199861 = idf(docFreq=640, maxDocs=42740)
                0.020966472 = queryNorm
              0.5687348 = fieldWeight in 435, product of:
                2.0 = tf(freq=4.0), with freq of:
                  4.0 = termFreq=4.0
                5.199861 = idf(docFreq=640, maxDocs=42740)
                0.0546875 = fieldNorm(doc=435)
          0.0425641 = weight(abstract_txt:experiment in 435) [ClassicSimilarity], result of:
            0.0425641 = score(doc=435,freq=1.0), product of:
              0.13723445 = queryWeight, product of:
                1.1541055 = boost
                5.671426 = idf(docFreq=399, maxDocs=42740)
                0.020966472 = queryNorm
              0.3101561 = fieldWeight in 435, product of:
                1.0 = tf(freq=1.0), with freq of:
                  1.0 = termFreq=1.0
                5.671426 = idf(docFreq=399, maxDocs=42740)
                0.0546875 = fieldNorm(doc=435)
          0.09078002 = weight(abstract_txt:typical in 435) [ClassicSimilarity], result of:
            0.09078002 = score(doc=435,freq=2.0), product of:
              0.18047526 = queryWeight, product of:
                1.3234965 = boost
                6.503835 = idf(docFreq=173, maxDocs=42740)
                0.020966472 = queryNorm
              0.5030053 = fieldWeight in 435, product of:
                1.4142135 = tf(freq=2.0), with freq of:
                  2.0 = termFreq=2.0
                6.503835 = idf(docFreq=173, maxDocs=42740)
                0.0546875 = fieldNorm(doc=435)
          0.15749815 = weight(abstract_txt:assignment in 435) [ClassicSimilarity], result of:
            0.15749815 = score(doc=435,freq=4.0), product of:
              0.2068225 = queryWeight, product of:
                1.416814 = boost
                6.96241 = idf(docFreq=109, maxDocs=42740)
                0.020966472 = queryNorm
              0.7615136 = fieldWeight in 435, product of:
                2.0 = tf(freq=4.0), with freq of:
                  4.0 = termFreq=4.0
                6.96241 = idf(docFreq=109, maxDocs=42740)
                0.0546875 = fieldNorm(doc=435)
          0.05176976 = weight(abstract_txt:document in 435) [ClassicSimilarity], result of:
            0.05176976 = score(doc=435,freq=2.0), product of:
              0.15636933 = queryWeight, product of:
                1.742227 = boost
                4.280766 = idf(docFreq=1606, maxDocs=42740)
                0.020966472 = queryNorm
              0.3310736 = fieldWeight in 435, product of:
                1.4142135 = tf(freq=2.0), with freq of:
                  2.0 = termFreq=2.0
                4.280766 = idf(docFreq=1606, maxDocs=42740)
                0.0546875 = fieldNorm(doc=435)
          0.11447252 = weight(abstract_txt:indexing in 435) [ClassicSimilarity], result of:
            0.11447252 = score(doc=435,freq=9.0), product of:
              0.16075487 = queryWeight, product of:
                1.7664894 = boost
                4.34038 = idf(docFreq=1513, maxDocs=42740)
                0.020966472 = queryNorm
              0.71209365 = fieldWeight in 435, product of:
                3.0 = tf(freq=9.0), with freq of:
                  9.0 = termFreq=9.0
                4.34038 = idf(docFreq=1513, maxDocs=42740)
                0.0546875 = fieldNorm(doc=435)
        0.28 = coord(7/25)
    
  3. Ward, M.L.: ¬The future of the human indexer (1996) 0.16
    0.1614546 = sum of:
      0.1614546 = product of:
        0.57662356 = sum of:
          0.044338144 = weight(abstract_txt:considers in 314) [ClassicSimilarity], result of:
            0.044338144 = score(doc=314,freq=1.0), product of:
              0.11117774 = queryWeight, product of:
                1.0387783 = boost
                5.104693 = idf(docFreq=704, maxDocs=42740)
                0.020966472 = queryNorm
              0.39880413 = fieldWeight in 314, product of:
                1.0 = tf(freq=1.0), with freq of:
                  1.0 = termFreq=1.0
                5.104693 = idf(docFreq=704, maxDocs=42740)
                0.078125 = fieldNorm(doc=314)
          0.08117168 = weight(abstract_txt:automatic in 314) [ClassicSimilarity], result of:
            0.08117168 = score(doc=314,freq=3.0), product of:
              0.115361825 = queryWeight, product of:
                1.0581446 = boost
                5.199861 = idf(docFreq=640, maxDocs=42740)
                0.020966472 = queryNorm
              0.7036268 = fieldWeight in 314, product of:
                1.7320508 = tf(freq=3.0), with freq of:
                  3.0 = termFreq=3.0
                5.199861 = idf(docFreq=640, maxDocs=42740)
                0.078125 = fieldNorm(doc=314)
          0.054326873 = weight(abstract_txt:required in 314) [ClassicSimilarity], result of:
            0.054326873 = score(doc=314,freq=1.0), product of:
              0.12730418 = queryWeight, product of:
                1.1115661 = boost
                5.4623814 = idf(docFreq=492, maxDocs=42740)
                0.020966472 = queryNorm
              0.42674854 = fieldWeight in 314, product of:
                1.0 = tf(freq=1.0), with freq of:
                  1.0 = termFreq=1.0
                5.4623814 = idf(docFreq=492, maxDocs=42740)
                0.078125 = fieldNorm(doc=314)
          0.058291562 = weight(abstract_txt:intellectual in 314) [ClassicSimilarity], result of:
            0.058291562 = score(doc=314,freq=1.0), product of:
              0.13342483 = queryWeight, product of:
                1.1379738 = boost
                5.5921526 = idf(docFreq=432, maxDocs=42740)
                0.020966472 = queryNorm
              0.4368869 = fieldWeight in 314, product of:
                1.0 = tf(freq=1.0), with freq of:
                  1.0 = termFreq=1.0
                5.5921526 = idf(docFreq=432, maxDocs=42740)
                0.078125 = fieldNorm(doc=314)
          0.13352346 = weight(abstract_txt:indexing in 314) [ClassicSimilarity], result of:
            0.13352346 = score(doc=314,freq=6.0), product of:
              0.16075487 = queryWeight, product of:
                1.7664894 = boost
                4.34038 = idf(docFreq=1513, maxDocs=42740)
                0.020966472 = queryNorm
              0.8306029 = fieldWeight in 314, product of:
                2.4494898 = tf(freq=6.0), with freq of:
                  6.0 = termFreq=6.0
                4.34038 = idf(docFreq=1513, maxDocs=42740)
                0.078125 = fieldNorm(doc=314)
          0.054811087 = weight(abstract_txt:software in 314) [ClassicSimilarity], result of:
            0.054811087 = score(doc=314,freq=1.0), product of:
              0.16134486 = queryWeight, product of:
                1.769728 = boost
                4.3483377 = idf(docFreq=1501, maxDocs=42740)
                0.020966472 = queryNorm
              0.33971387 = fieldWeight in 314, product of:
                1.0 = tf(freq=1.0), with freq of:
                  1.0 = termFreq=1.0
                4.3483377 = idf(docFreq=1501, maxDocs=42740)
                0.078125 = fieldNorm(doc=314)
          0.15016071 = weight(abstract_txt:index in 314) [ClassicSimilarity], result of:
            0.15016071 = score(doc=314,freq=2.0), product of:
              0.28701252 = queryWeight, product of:
                2.8908463 = boost
                4.7353325 = idf(docFreq=1019, maxDocs=42740)
                0.020966472 = queryNorm
              0.52318525 = fieldWeight in 314, product of:
                1.4142135 = tf(freq=2.0), with freq of:
                  2.0 = termFreq=2.0
                4.7353325 = idf(docFreq=1019, maxDocs=42740)
                0.078125 = fieldNorm(doc=314)
        0.28 = coord(7/25)
    
  4. Prasher, R.G.: Evaluation of indexing system (1989) 0.15
    0.14729726 = sum of:
      0.14729726 = product of:
        0.7364863 = sum of:
          0.07834333 = weight(abstract_txt:precision in 5067) [ClassicSimilarity], result of:
            0.07834333 = score(doc=5067,freq=1.0), product of:
              0.1298421 = queryWeight, product of:
                1.1225914 = boost
                5.5165615 = idf(docFreq=466, maxDocs=42740)
                0.020966472 = queryNorm
              0.6033739 = fieldWeight in 5067, product of:
                1.0 = tf(freq=1.0), with freq of:
                  1.0 = termFreq=1.0
                5.5165615 = idf(docFreq=466, maxDocs=42740)
                0.109375 = fieldNorm(doc=5067)
          0.087944955 = weight(abstract_txt:recall in 5067) [ClassicSimilarity], result of:
            0.087944955 = score(doc=5067,freq=1.0), product of:
              0.14024523 = queryWeight, product of:
                1.1666968 = boost
                5.733301 = idf(docFreq=375, maxDocs=42740)
                0.020966472 = queryNorm
              0.62707984 = fieldWeight in 5067, product of:
                1.0 = tf(freq=1.0), with freq of:
                  1.0 = termFreq=1.0
                5.733301 = idf(docFreq=375, maxDocs=42740)
                0.109375 = fieldNorm(doc=5067)
          0.289365 = weight(abstract_txt:ratios in 5067) [ClassicSimilarity], result of:
            0.289365 = score(doc=5067,freq=1.0), product of:
              0.31024978 = queryWeight, product of:
                1.7352805 = boost
                8.527396 = idf(docFreq=22, maxDocs=42740)
                0.020966472 = queryNorm
              0.93268394 = fieldWeight in 5067, product of:
                1.0 = tf(freq=1.0), with freq of:
                  1.0 = termFreq=1.0
                8.527396 = idf(docFreq=22, maxDocs=42740)
                0.109375 = fieldNorm(doc=5067)
          0.13218148 = weight(abstract_txt:indexing in 5067) [ClassicSimilarity], result of:
            0.13218148 = score(doc=5067,freq=3.0), product of:
              0.16075487 = queryWeight, product of:
                1.7664894 = boost
                4.34038 = idf(docFreq=1513, maxDocs=42740)
                0.020966472 = queryNorm
              0.8222549 = fieldWeight in 5067, product of:
                1.7320508 = tf(freq=3.0), with freq of:
                  3.0 = termFreq=3.0
                4.34038 = idf(docFreq=1513, maxDocs=42740)
                0.109375 = fieldNorm(doc=5067)
          0.14865153 = weight(abstract_txt:index in 5067) [ClassicSimilarity], result of:
            0.14865153 = score(doc=5067,freq=1.0), product of:
              0.28701252 = queryWeight, product of:
                2.8908463 = boost
                4.7353325 = idf(docFreq=1019, maxDocs=42740)
                0.020966472 = queryNorm
              0.517927 = fieldWeight in 5067, product of:
                1.0 = tf(freq=1.0), with freq of:
                  1.0 = termFreq=1.0
                4.7353325 = idf(docFreq=1019, maxDocs=42740)
                0.109375 = fieldNorm(doc=5067)
        0.2 = coord(5/25)
    
  5. Lancaster, F.W.: Trends in subject indexing from 1957 to 2000 (1980) 0.15
    0.14682005 = sum of:
      0.14682005 = product of:
        0.61175025 = sum of:
          0.053205773 = weight(abstract_txt:considers in 209) [ClassicSimilarity], result of:
            0.053205773 = score(doc=209,freq=1.0), product of:
              0.11117774 = queryWeight, product of:
                1.0387783 = boost
                5.104693 = idf(docFreq=704, maxDocs=42740)
                0.020966472 = queryNorm
              0.47856498 = fieldWeight in 209, product of:
                1.0 = tf(freq=1.0), with freq of:
                  1.0 = termFreq=1.0
                5.104693 = idf(docFreq=704, maxDocs=42740)
                0.09375 = fieldNorm(doc=209)
          0.056237385 = weight(abstract_txt:automatic in 209) [ClassicSimilarity], result of:
            0.056237385 = score(doc=209,freq=1.0), product of:
              0.115361825 = queryWeight, product of:
                1.0581446 = boost
                5.199861 = idf(docFreq=640, maxDocs=42740)
                0.020966472 = queryNorm
              0.48748696 = fieldWeight in 209, product of:
                1.0 = tf(freq=1.0), with freq of:
                  1.0 = termFreq=1.0
                5.199861 = idf(docFreq=640, maxDocs=42740)
                0.09375 = fieldNorm(doc=209)
          0.06994988 = weight(abstract_txt:intellectual in 209) [ClassicSimilarity], result of:
            0.06994988 = score(doc=209,freq=1.0), product of:
              0.13342483 = queryWeight, product of:
                1.1379738 = boost
                5.5921526 = idf(docFreq=432, maxDocs=42740)
                0.020966472 = queryNorm
              0.52426434 = fieldWeight in 209, product of:
                1.0 = tf(freq=1.0), with freq of:
                  1.0 = termFreq=1.0
                5.5921526 = idf(docFreq=432, maxDocs=42740)
                0.09375 = fieldNorm(doc=209)
          0.0919362 = weight(abstract_txt:computers in 209) [ClassicSimilarity], result of:
            0.0919362 = score(doc=209,freq=1.0), product of:
              0.16009204 = queryWeight, product of:
                1.2465187 = boost
                6.1255565 = idf(docFreq=253, maxDocs=42740)
                0.020966472 = queryNorm
              0.5742709 = fieldWeight in 209, product of:
                1.0 = tf(freq=1.0), with freq of:
                  1.0 = termFreq=1.0
                6.1255565 = idf(docFreq=253, maxDocs=42740)
                0.09375 = fieldNorm(doc=209)
          0.16022815 = weight(abstract_txt:indexing in 209) [ClassicSimilarity], result of:
            0.16022815 = score(doc=209,freq=6.0), product of:
              0.16075487 = queryWeight, product of:
                1.7664894 = boost
                4.34038 = idf(docFreq=1513, maxDocs=42740)
                0.020966472 = queryNorm
              0.9967234 = fieldWeight in 209, product of:
                2.4494898 = tf(freq=6.0), with freq of:
                  6.0 = termFreq=6.0
                4.34038 = idf(docFreq=1513, maxDocs=42740)
                0.09375 = fieldNorm(doc=209)
          0.18019286 = weight(abstract_txt:index in 209) [ClassicSimilarity], result of:
            0.18019286 = score(doc=209,freq=2.0), product of:
              0.28701252 = queryWeight, product of:
                2.8908463 = boost
                4.7353325 = idf(docFreq=1019, maxDocs=42740)
                0.020966472 = queryNorm
              0.6278223 = fieldWeight in 209, product of:
                1.4142135 = tf(freq=2.0), with freq of:
                  2.0 = termFreq=2.0
                4.7353325 = idf(docFreq=1019, maxDocs=42740)
                0.09375 = fieldNorm(doc=209)
        0.24 = coord(6/25)