Document (#11879)

Author
Boeri, R.J.
Hensel, M.
Title
Set up a winning text retrieval system : carefully
Source
CD-ROM professional. 8(1995) no.8, S.67-68
Year
1995
Abstract
Considers some of the practical issues involved when a company plans to develop an in-house computerized document management system: conversion of paper to electronic form via optical character recognition (OCR) or rekeying; coding of document elements using SGML; indexing for information searching and retrieval (including proximity searching); and hybrid CD-ROM and online information retrieval systems.
Theme
Dokumentenmanagement
Aid
SGML

Similar documents (content)

  1. Thiel, T.J.: Automated indexing of document image management systems (1992) 0.32
    0.32374778 = sum of:
      0.32374778 = product of:
        1.0117118 = sum of:
          0.013009736 = weight(abstract_txt:information in 3049) [ClassicSimilarity], result of:
            0.013009736 = score(doc=3049,freq=1.0), product of:
              0.057179686 = queryWeight, product of:
                1.1106349 = boost
                2.42692 = idf(docFreq=10382, maxDocs=43254)
                0.02121363 = queryNorm
              0.22752374 = fieldWeight in 3049, product of:
                1.0 = tf(freq=1.0), with freq of:
                  1.0 = termFreq=1.0
                2.42692 = idf(docFreq=10382, maxDocs=43254)
                0.09375 = fieldNorm(doc=3049)
          0.1490737 = weight(abstract_txt:recognition in 3049) [ClassicSimilarity], result of:
            0.1490737 = score(doc=3049,freq=2.0), product of:
              0.18308109 = queryWeight, product of:
                1.4052616 = boost
                6.1414557 = idf(docFreq=252, maxDocs=43254)
                0.02121363 = queryNorm
              0.81424963 = fieldWeight in 3049, product of:
                1.4142135 = tf(freq=2.0), with freq of:
                  2.0 = termFreq=2.0
                6.1414557 = idf(docFreq=252, maxDocs=43254)
                0.09375 = fieldNorm(doc=3049)
          0.178028 = weight(abstract_txt:character in 3049) [ClassicSimilarity], result of:
            0.178028 = score(doc=3049,freq=2.0), product of:
              0.2060796 = queryWeight, product of:
                1.4909152 = boost
                6.5157895 = idf(docFreq=173, maxDocs=43254)
                0.02121363 = queryNorm
              0.8638798 = fieldWeight in 3049, product of:
                1.4142135 = tf(freq=2.0), with freq of:
                  2.0 = termFreq=2.0
                6.5157895 = idf(docFreq=173, maxDocs=43254)
                0.09375 = fieldNorm(doc=3049)
          0.034668252 = weight(abstract_txt:system in 3049) [ClassicSimilarity], result of:
            0.034668252 = score(doc=3049,freq=1.0), product of:
              0.10990498 = queryWeight, product of:
                1.5397816 = boost
                3.364676 = idf(docFreq=4064, maxDocs=43254)
                0.02121363 = queryNorm
              0.3154384 = fieldWeight in 3049, product of:
                1.0 = tf(freq=1.0), with freq of:
                  1.0 = termFreq=1.0
                3.364676 = idf(docFreq=4064, maxDocs=43254)
                0.09375 = fieldNorm(doc=3049)
          0.19965053 = weight(abstract_txt:coding in 3049) [ClassicSimilarity], result of:
            0.19965053 = score(doc=3049,freq=2.0), product of:
              0.22244522 = queryWeight, product of:
                1.5489842 = boost
                6.7695704 = idf(docFreq=134, maxDocs=43254)
                0.02121363 = queryNorm
              0.8975267 = fieldWeight in 3049, product of:
                1.4142135 = tf(freq=2.0), with freq of:
                  2.0 = termFreq=2.0
                6.7695704 = idf(docFreq=134, maxDocs=43254)
                0.09375 = fieldNorm(doc=3049)
          0.2563024 = weight(abstract_txt:optical in 3049) [ClassicSimilarity], result of:
            0.2563024 = score(doc=3049,freq=2.0), product of:
              0.2627511 = queryWeight, product of:
                1.6834791 = boost
                7.357357 = idf(docFreq=74, maxDocs=43254)
                0.02121363 = queryNorm
              0.97545695 = fieldWeight in 3049, product of:
                1.4142135 = tf(freq=2.0), with freq of:
                  2.0 = termFreq=2.0
                7.357357 = idf(docFreq=74, maxDocs=43254)
                0.09375 = fieldNorm(doc=3049)
          0.12394394 = weight(abstract_txt:document in 3049) [ClassicSimilarity], result of:
            0.12394394 = score(doc=3049,freq=3.0), product of:
              0.1781719 = queryWeight, product of:
                1.9605145 = boost
                4.2840466 = idf(docFreq=1620, maxDocs=43254)
                0.02121363 = queryNorm
              0.6956425 = fieldWeight in 3049, product of:
                1.7320508 = tf(freq=3.0), with freq of:
                  3.0 = termFreq=3.0
                4.2840466 = idf(docFreq=1620, maxDocs=43254)
                0.09375 = fieldNorm(doc=3049)
          0.057035364 = weight(abstract_txt:retrieval in 3049) [ClassicSimilarity], result of:
            0.057035364 = score(doc=3049,freq=1.0), product of:
              0.17532991 = queryWeight, product of:
                2.381903 = boost
                3.4699 = idf(docFreq=3658, maxDocs=43254)
                0.02121363 = queryNorm
              0.3253031 = fieldWeight in 3049, product of:
                1.0 = tf(freq=1.0), with freq of:
                  1.0 = termFreq=1.0
                3.4699 = idf(docFreq=3658, maxDocs=43254)
                0.09375 = fieldNorm(doc=3049)
        0.32 = coord(8/25)
    
  2. Ramsden, A.: ELINOR electronic library system (1998) 0.22
    0.21925531 = sum of:
      0.21925531 = product of:
        0.91356385 = sum of:
          0.14054805 = weight(abstract_txt:recognition in 3404) [ClassicSimilarity], result of:
            0.14054805 = score(doc=3404,freq=1.0), product of:
              0.18308109 = queryWeight, product of:
                1.4052616 = boost
                6.1414557 = idf(docFreq=252, maxDocs=43254)
                0.02121363 = queryNorm
              0.76768196 = fieldWeight in 3404, product of:
                1.0 = tf(freq=1.0), with freq of:
                  1.0 = termFreq=1.0
                6.1414557 = idf(docFreq=252, maxDocs=43254)
                0.125 = fieldNorm(doc=3404)
          0.16113958 = weight(abstract_txt:computerized in 3404) [ClassicSimilarity], result of:
            0.16113958 = score(doc=3404,freq=1.0), product of:
              0.20055266 = queryWeight, product of:
                1.4707866 = boost
                6.427821 = idf(docFreq=189, maxDocs=43254)
                0.02121363 = queryNorm
              0.80347764 = fieldWeight in 3404, product of:
                1.0 = tf(freq=1.0), with freq of:
                  1.0 = termFreq=1.0
                6.427821 = idf(docFreq=189, maxDocs=43254)
                0.125 = fieldNorm(doc=3404)
          0.16784641 = weight(abstract_txt:character in 3404) [ClassicSimilarity], result of:
            0.16784641 = score(doc=3404,freq=1.0), product of:
              0.2060796 = queryWeight, product of:
                1.4909152 = boost
                6.5157895 = idf(docFreq=173, maxDocs=43254)
                0.02121363 = queryNorm
              0.8144737 = fieldWeight in 3404, product of:
                1.0 = tf(freq=1.0), with freq of:
                  1.0 = termFreq=1.0
                6.5157895 = idf(docFreq=173, maxDocs=43254)
                0.125 = fieldNorm(doc=3404)
          0.2416442 = weight(abstract_txt:optical in 3404) [ClassicSimilarity], result of:
            0.2416442 = score(doc=3404,freq=1.0), product of:
              0.2627511 = queryWeight, product of:
                1.6834791 = boost
                7.357357 = idf(docFreq=74, maxDocs=43254)
                0.02121363 = queryNorm
              0.9196696 = fieldWeight in 3404, product of:
                1.0 = tf(freq=1.0), with freq of:
                  1.0 = termFreq=1.0
                7.357357 = idf(docFreq=74, maxDocs=43254)
                0.125 = fieldNorm(doc=3404)
          0.094838664 = weight(abstract_txt:searching in 3404) [ClassicSimilarity], result of:
            0.094838664 = score(doc=3404,freq=1.0), product of:
              0.17745732 = queryWeight, product of:
                1.956579 = boost
                4.275447 = idf(docFreq=1634, maxDocs=43254)
                0.02121363 = queryNorm
              0.53443086 = fieldWeight in 3404, product of:
                1.0 = tf(freq=1.0), with freq of:
                  1.0 = termFreq=1.0
                4.275447 = idf(docFreq=1634, maxDocs=43254)
                0.125 = fieldNorm(doc=3404)
          0.10754691 = weight(abstract_txt:retrieval in 3404) [ClassicSimilarity], result of:
            0.10754691 = score(doc=3404,freq=2.0), product of:
              0.17532991 = queryWeight, product of:
                2.381903 = boost
                3.4699 = idf(docFreq=3658, maxDocs=43254)
                0.02121363 = queryNorm
              0.6133974 = fieldWeight in 3404, product of:
                1.4142135 = tf(freq=2.0), with freq of:
                  2.0 = termFreq=2.0
                3.4699 = idf(docFreq=3658, maxDocs=43254)
                0.125 = fieldNorm(doc=3404)
        0.24 = coord(6/25)
    
  3. Broadhurst, R.: ¬The digitisation of library material (1993) 0.21
    0.20964992 = sum of:
      0.20964992 = product of:
        0.87354136 = sum of:
          0.08027778 = weight(abstract_txt:considers in 6256) [ClassicSimilarity], result of:
            0.08027778 = score(doc=6256,freq=1.0), product of:
              0.12603481 = queryWeight, product of:
                1.1659521 = boost
                5.095594 = idf(docFreq=719, maxDocs=43254)
                0.02121363 = queryNorm
              0.63694924 = fieldWeight in 6256, product of:
                1.0 = tf(freq=1.0), with freq of:
                  1.0 = termFreq=1.0
                5.095594 = idf(docFreq=719, maxDocs=43254)
                0.125 = fieldNorm(doc=6256)
          0.14054805 = weight(abstract_txt:recognition in 6256) [ClassicSimilarity], result of:
            0.14054805 = score(doc=6256,freq=1.0), product of:
              0.18308109 = queryWeight, product of:
                1.4052616 = boost
                6.1414557 = idf(docFreq=252, maxDocs=43254)
                0.02121363 = queryNorm
              0.76768196 = fieldWeight in 6256, product of:
                1.0 = tf(freq=1.0), with freq of:
                  1.0 = termFreq=1.0
                6.1414557 = idf(docFreq=252, maxDocs=43254)
                0.125 = fieldNorm(doc=6256)
          0.14781289 = weight(abstract_txt:conversion in 6256) [ClassicSimilarity], result of:
            0.14781289 = score(doc=6256,freq=1.0), product of:
              0.18933685 = queryWeight, product of:
                1.4290684 = boost
                6.245499 = idf(docFreq=227, maxDocs=43254)
                0.02121363 = queryNorm
              0.7806874 = fieldWeight in 6256, product of:
                1.0 = tf(freq=1.0), with freq of:
                  1.0 = termFreq=1.0
                6.245499 = idf(docFreq=227, maxDocs=43254)
                0.125 = fieldNorm(doc=6256)
          0.16784641 = weight(abstract_txt:character in 6256) [ClassicSimilarity], result of:
            0.16784641 = score(doc=6256,freq=1.0), product of:
              0.2060796 = queryWeight, product of:
                1.4909152 = boost
                6.5157895 = idf(docFreq=173, maxDocs=43254)
                0.02121363 = queryNorm
              0.8144737 = fieldWeight in 6256, product of:
                1.0 = tf(freq=1.0), with freq of:
                  1.0 = termFreq=1.0
                6.5157895 = idf(docFreq=173, maxDocs=43254)
                0.125 = fieldNorm(doc=6256)
          0.2416442 = weight(abstract_txt:optical in 6256) [ClassicSimilarity], result of:
            0.2416442 = score(doc=6256,freq=1.0), product of:
              0.2627511 = queryWeight, product of:
                1.6834791 = boost
                7.357357 = idf(docFreq=74, maxDocs=43254)
                0.02121363 = queryNorm
              0.9196696 = fieldWeight in 6256, product of:
                1.0 = tf(freq=1.0), with freq of:
                  1.0 = termFreq=1.0
                7.357357 = idf(docFreq=74, maxDocs=43254)
                0.125 = fieldNorm(doc=6256)
          0.09541209 = weight(abstract_txt:document in 6256) [ClassicSimilarity], result of:
            0.09541209 = score(doc=6256,freq=1.0), product of:
              0.1781719 = queryWeight, product of:
                1.9605145 = boost
                4.2840466 = idf(docFreq=1620, maxDocs=43254)
                0.02121363 = queryNorm
              0.53550583 = fieldWeight in 6256, product of:
                1.0 = tf(freq=1.0), with freq of:
                  1.0 = termFreq=1.0
                4.2840466 = idf(docFreq=1620, maxDocs=43254)
                0.125 = fieldNorm(doc=6256)
        0.24 = coord(6/25)
    
  4. Lunin, L.F.: ¬The big picture : selection and design issues for image information systems (1997) 0.17
    0.1715268 = sum of:
      0.1715268 = product of:
        0.5360213 = sum of:
          0.03798521 = weight(abstract_txt:including in 1758) [ClassicSimilarity], result of:
            0.03798521 = score(doc=1758,freq=1.0), product of:
              0.09271054 = queryWeight, product of:
                4.370329 = idf(docFreq=1486, maxDocs=43254)
                0.02121363 = queryNorm
              0.40971833 = fieldWeight in 1758, product of:
                1.0 = tf(freq=1.0), with freq of:
                  1.0 = termFreq=1.0
                4.370329 = idf(docFreq=1486, maxDocs=43254)
                0.09375 = fieldNorm(doc=1758)
          0.018398544 = weight(abstract_txt:information in 1758) [ClassicSimilarity], result of:
            0.018398544 = score(doc=1758,freq=2.0), product of:
              0.057179686 = queryWeight, product of:
                1.1106349 = boost
                2.42692 = idf(docFreq=10382, maxDocs=43254)
                0.02121363 = queryNorm
              0.32176715 = fieldWeight in 1758, product of:
                1.4142135 = tf(freq=2.0), with freq of:
                  2.0 = termFreq=2.0
                2.42692 = idf(docFreq=10382, maxDocs=43254)
                0.09375 = fieldNorm(doc=1758)
          0.06020833 = weight(abstract_txt:considers in 1758) [ClassicSimilarity], result of:
            0.06020833 = score(doc=1758,freq=1.0), product of:
              0.12603481 = queryWeight, product of:
                1.1659521 = boost
                5.095594 = idf(docFreq=719, maxDocs=43254)
                0.02121363 = queryNorm
              0.47771192 = fieldWeight in 1758, product of:
                1.0 = tf(freq=1.0), with freq of:
                  1.0 = termFreq=1.0
                5.095594 = idf(docFreq=719, maxDocs=43254)
                0.09375 = fieldNorm(doc=1758)
          0.06396389 = weight(abstract_txt:involved in 1758) [ClassicSimilarity], result of:
            0.06396389 = score(doc=1758,freq=1.0), product of:
              0.13122281 = queryWeight, product of:
                1.1897073 = boost
                5.1994123 = idf(docFreq=648, maxDocs=43254)
                0.02121363 = queryNorm
              0.4874449 = fieldWeight in 1758, product of:
                1.0 = tf(freq=1.0), with freq of:
                  1.0 = termFreq=1.0
                5.1994123 = idf(docFreq=648, maxDocs=43254)
                0.09375 = fieldNorm(doc=1758)
          0.06671563 = weight(abstract_txt:elements in 1758) [ClassicSimilarity], result of:
            0.06671563 = score(doc=1758,freq=1.0), product of:
              0.13495982 = queryWeight, product of:
                1.2065288 = boost
                5.2729278 = idf(docFreq=602, maxDocs=43254)
                0.02121363 = queryNorm
              0.49433696 = fieldWeight in 1758, product of:
                1.0 = tf(freq=1.0), with freq of:
                  1.0 = termFreq=1.0
                5.2729278 = idf(docFreq=602, maxDocs=43254)
                0.09375 = fieldNorm(doc=1758)
          0.11085967 = weight(abstract_txt:conversion in 1758) [ClassicSimilarity], result of:
            0.11085967 = score(doc=1758,freq=1.0), product of:
              0.18933685 = queryWeight, product of:
                1.4290684 = boost
                6.245499 = idf(docFreq=227, maxDocs=43254)
                0.02121363 = queryNorm
              0.58551556 = fieldWeight in 1758, product of:
                1.0 = tf(freq=1.0), with freq of:
                  1.0 = termFreq=1.0
                6.245499 = idf(docFreq=227, maxDocs=43254)
                0.09375 = fieldNorm(doc=1758)
          0.120854676 = weight(abstract_txt:computerized in 1758) [ClassicSimilarity], result of:
            0.120854676 = score(doc=1758,freq=1.0), product of:
              0.20055266 = queryWeight, product of:
                1.4707866 = boost
                6.427821 = idf(docFreq=189, maxDocs=43254)
                0.02121363 = queryNorm
              0.6026082 = fieldWeight in 1758, product of:
                1.0 = tf(freq=1.0), with freq of:
                  1.0 = termFreq=1.0
                6.427821 = idf(docFreq=189, maxDocs=43254)
                0.09375 = fieldNorm(doc=1758)
          0.057035364 = weight(abstract_txt:retrieval in 1758) [ClassicSimilarity], result of:
            0.057035364 = score(doc=1758,freq=1.0), product of:
              0.17532991 = queryWeight, product of:
                2.381903 = boost
                3.4699 = idf(docFreq=3658, maxDocs=43254)
                0.02121363 = queryNorm
              0.3253031 = fieldWeight in 1758, product of:
                1.0 = tf(freq=1.0), with freq of:
                  1.0 = termFreq=1.0
                3.4699 = idf(docFreq=3658, maxDocs=43254)
                0.09375 = fieldNorm(doc=1758)
        0.32 = coord(8/25)
    
  5. Initiatives for access (1994) 0.17
    0.16568995 = sum of:
      0.16568995 = product of:
        0.5917498 = sum of:
          0.010841447 = weight(abstract_txt:information in 4906) [ClassicSimilarity], result of:
            0.010841447 = score(doc=4906,freq=1.0), product of:
              0.057179686 = queryWeight, product of:
                1.1106349 = boost
                2.42692 = idf(docFreq=10382, maxDocs=43254)
                0.02121363 = queryNorm
              0.18960312 = fieldWeight in 4906, product of:
                1.0 = tf(freq=1.0), with freq of:
                  1.0 = termFreq=1.0
                2.42692 = idf(docFreq=10382, maxDocs=43254)
                0.078125 = fieldNorm(doc=4906)
          0.053303245 = weight(abstract_txt:involved in 4906) [ClassicSimilarity], result of:
            0.053303245 = score(doc=4906,freq=1.0), product of:
              0.13122281 = queryWeight, product of:
                1.1897073 = boost
                5.1994123 = idf(docFreq=648, maxDocs=43254)
                0.02121363 = queryNorm
              0.4062041 = fieldWeight in 4906, product of:
                1.0 = tf(freq=1.0), with freq of:
                  1.0 = termFreq=1.0
                5.1994123 = idf(docFreq=648, maxDocs=43254)
                0.078125 = fieldNorm(doc=4906)
          0.08784253 = weight(abstract_txt:recognition in 4906) [ClassicSimilarity], result of:
            0.08784253 = score(doc=4906,freq=1.0), product of:
              0.18308109 = queryWeight, product of:
                1.4052616 = boost
                6.1414557 = idf(docFreq=252, maxDocs=43254)
                0.02121363 = queryNorm
              0.47980124 = fieldWeight in 4906, product of:
                1.0 = tf(freq=1.0), with freq of:
                  1.0 = termFreq=1.0
                6.1414557 = idf(docFreq=252, maxDocs=43254)
                0.078125 = fieldNorm(doc=4906)
          0.09238306 = weight(abstract_txt:conversion in 4906) [ClassicSimilarity], result of:
            0.09238306 = score(doc=4906,freq=1.0), product of:
              0.18933685 = queryWeight, product of:
                1.4290684 = boost
                6.245499 = idf(docFreq=227, maxDocs=43254)
                0.02121363 = queryNorm
              0.4879296 = fieldWeight in 4906, product of:
                1.0 = tf(freq=1.0), with freq of:
                  1.0 = termFreq=1.0
                6.245499 = idf(docFreq=227, maxDocs=43254)
                0.078125 = fieldNorm(doc=4906)
          0.10490401 = weight(abstract_txt:character in 4906) [ClassicSimilarity], result of:
            0.10490401 = score(doc=4906,freq=1.0), product of:
              0.2060796 = queryWeight, product of:
                1.4909152 = boost
                6.5157895 = idf(docFreq=173, maxDocs=43254)
                0.02121363 = queryNorm
              0.5090461 = fieldWeight in 4906, product of:
                1.0 = tf(freq=1.0), with freq of:
                  1.0 = termFreq=1.0
                6.5157895 = idf(docFreq=173, maxDocs=43254)
                0.078125 = fieldNorm(doc=4906)
          0.028890207 = weight(abstract_txt:system in 4906) [ClassicSimilarity], result of:
            0.028890207 = score(doc=4906,freq=1.0), product of:
              0.10990498 = queryWeight, product of:
                1.5397816 = boost
                3.364676 = idf(docFreq=4064, maxDocs=43254)
                0.02121363 = queryNorm
              0.2628653 = fieldWeight in 4906, product of:
                1.0 = tf(freq=1.0), with freq of:
                  1.0 = termFreq=1.0
                3.364676 = idf(docFreq=4064, maxDocs=43254)
                0.078125 = fieldNorm(doc=4906)
          0.21358532 = weight(abstract_txt:optical in 4906) [ClassicSimilarity], result of:
            0.21358532 = score(doc=4906,freq=2.0), product of:
              0.2627511 = queryWeight, product of:
                1.6834791 = boost
                7.357357 = idf(docFreq=74, maxDocs=43254)
                0.02121363 = queryNorm
              0.81288075 = fieldWeight in 4906, product of:
                1.4142135 = tf(freq=2.0), with freq of:
                  2.0 = termFreq=2.0
                7.357357 = idf(docFreq=74, maxDocs=43254)
                0.078125 = fieldNorm(doc=4906)
        0.28 = coord(7/25)