Document (#6510)

Author
Ashford, J.H.
Title
Free text retrieval in the Welsh language : problems, and proposed working practice
Source
Journal of documentation. 51(1995) no.2, S.118-125
Year
1995
Abstract
A bilingual Welsh-English full text database is planned for Inspection Reports of Her Majesty's Inspectors of Schools for Wales. Special requirements for free text retrieval in the Welsh language are identified, and practical solutions are proposed for problems arising from the use of standard text database products, some of which may also apply to other lesser-used languages.
Theme
Volltextretrieval

Similar documents (content)

  1. Cunliffe, D.; Harries, R.: Promoting minority-language use in a bilingual online community (2005) 0.22
    0.21679804 = sum of:
      0.21679804 = product of:
        0.9033252 = sum of:
          0.047499117 = weight(abstract_txt:practice in 5915) [ClassicSimilarity], result of:
            0.047499117 = score(doc=5915,freq=1.0), product of:
              0.104898974 = queryWeight, product of:
                4.829954 = idf(docFreq=959, maxDocs=44218)
                0.02171842 = queryNorm
              0.4528082 = fieldWeight in 5915, product of:
                1.0 = tf(freq=1.0), with freq of:
                  1.0 = termFreq=1.0
                4.829954 = idf(docFreq=959, maxDocs=44218)
                0.09375 = fieldNorm(doc=5915)
          0.05886892 = weight(abstract_txt:languages in 5915) [ClassicSimilarity], result of:
            0.05886892 = score(doc=5915,freq=1.0), product of:
              0.12103332 = queryWeight, product of:
                1.0741547 = boost
                5.188118 = idf(docFreq=670, maxDocs=44218)
                0.02171842 = queryNorm
              0.48638606 = fieldWeight in 5915, product of:
                1.0 = tf(freq=1.0), with freq of:
                  1.0 = termFreq=1.0
                5.188118 = idf(docFreq=670, maxDocs=44218)
                0.09375 = fieldNorm(doc=5915)
          0.10326769 = weight(abstract_txt:english in 5915) [ClassicSimilarity], result of:
            0.10326769 = score(doc=5915,freq=2.0), product of:
              0.13972707 = queryWeight, product of:
                1.1541299 = boost
                5.574394 = idf(docFreq=455, maxDocs=44218)
                0.02171842 = queryNorm
              0.7390672 = fieldWeight in 5915, product of:
                1.4142135 = tf(freq=2.0), with freq of:
                  2.0 = termFreq=2.0
                5.574394 = idf(docFreq=455, maxDocs=44218)
                0.09375 = fieldNorm(doc=5915)
          0.37802798 = weight(abstract_txt:bilingual in 5915) [ClassicSimilarity], result of:
            0.37802798 = score(doc=5915,freq=4.0), product of:
              0.26341683 = queryWeight, product of:
                1.5846602 = boost
                7.653836 = idf(docFreq=56, maxDocs=44218)
                0.02171842 = queryNorm
              1.4350942 = fieldWeight in 5915, product of:
                2.0 = tf(freq=4.0), with freq of:
                  4.0 = termFreq=4.0
                7.653836 = idf(docFreq=56, maxDocs=44218)
                0.09375 = fieldNorm(doc=5915)
          0.20884797 = weight(abstract_txt:wales in 5915) [ClassicSimilarity], result of:
            0.20884797 = score(doc=5915,freq=1.0), product of:
              0.28153628 = queryWeight, product of:
                1.6382552 = boost
                7.912698 = idf(docFreq=43, maxDocs=44218)
                0.02171842 = queryNorm
              0.74181545 = fieldWeight in 5915, product of:
                1.0 = tf(freq=1.0), with freq of:
                  1.0 = termFreq=1.0
                7.912698 = idf(docFreq=43, maxDocs=44218)
                0.09375 = fieldNorm(doc=5915)
          0.10681358 = weight(abstract_txt:language in 5915) [ClassicSimilarity], result of:
            0.10681358 = score(doc=5915,freq=3.0), product of:
              0.15729012 = queryWeight, product of:
                1.7317296 = boost
                4.1820874 = idf(docFreq=1834, maxDocs=44218)
                0.02171842 = queryNorm
              0.6790864 = fieldWeight in 5915, product of:
                1.7320508 = tf(freq=3.0), with freq of:
                  3.0 = termFreq=3.0
                4.1820874 = idf(docFreq=1834, maxDocs=44218)
                0.09375 = fieldNorm(doc=5915)
        0.24 = coord(6/25)
    
  2. Tseng, Y.-H.: Automatic cataloguing and searching for retrospective data by use of OCR text (2001) 0.18
    0.18266435 = sum of:
      0.18266435 = product of:
        0.5708261 = sum of:
          0.043268844 = weight(abstract_txt:special in 5421) [ClassicSimilarity], result of:
            0.043268844 = score(doc=5421,freq=1.0), product of:
              0.11131454 = queryWeight, product of:
                1.030126 = boost
                4.9754615 = idf(docFreq=829, maxDocs=44218)
                0.02171842 = queryNorm
              0.38870794 = fieldWeight in 5421, product of:
                1.0 = tf(freq=1.0), with freq of:
                  1.0 = termFreq=1.0
                4.9754615 = idf(docFreq=829, maxDocs=44218)
                0.078125 = fieldNorm(doc=5421)
          0.08496997 = weight(abstract_txt:languages in 5421) [ClassicSimilarity], result of:
            0.08496997 = score(doc=5421,freq=3.0), product of:
              0.12103332 = queryWeight, product of:
                1.0741547 = boost
                5.188118 = idf(docFreq=670, maxDocs=44218)
                0.02171842 = queryNorm
              0.7020378 = fieldWeight in 5421, product of:
                1.7320508 = tf(freq=3.0), with freq of:
                  3.0 = termFreq=3.0
                5.188118 = idf(docFreq=670, maxDocs=44218)
                0.078125 = fieldNorm(doc=5421)
          0.060851075 = weight(abstract_txt:english in 5421) [ClassicSimilarity], result of:
            0.060851075 = score(doc=5421,freq=1.0), product of:
              0.13972707 = queryWeight, product of:
                1.1541299 = boost
                5.574394 = idf(docFreq=455, maxDocs=44218)
                0.02171842 = queryNorm
              0.43549955 = fieldWeight in 5421, product of:
                1.0 = tf(freq=1.0), with freq of:
                  1.0 = termFreq=1.0
                5.574394 = idf(docFreq=455, maxDocs=44218)
                0.078125 = fieldNorm(doc=5421)
          0.06256178 = weight(abstract_txt:solutions in 5421) [ClassicSimilarity], result of:
            0.06256178 = score(doc=5421,freq=1.0), product of:
              0.14233372 = queryWeight, product of:
                1.1648453 = boost
                5.6261497 = idf(docFreq=432, maxDocs=44218)
                0.02171842 = queryNorm
              0.43954295 = fieldWeight in 5421, product of:
                1.0 = tf(freq=1.0), with freq of:
                  1.0 = termFreq=1.0
                5.6261497 = idf(docFreq=432, maxDocs=44218)
                0.078125 = fieldNorm(doc=5421)
          0.051071957 = weight(abstract_txt:retrieval in 5421) [ClassicSimilarity], result of:
            0.051071957 = score(doc=5421,freq=3.0), product of:
              0.108607456 = queryWeight, product of:
                1.4389948 = boost
                3.4751394 = idf(docFreq=3720, maxDocs=44218)
                0.02171842 = queryNorm
              0.47024357 = fieldWeight in 5421, product of:
                1.7320508 = tf(freq=3.0), with freq of:
                  3.0 = termFreq=3.0
                3.4751394 = idf(docFreq=3720, maxDocs=44218)
                0.078125 = fieldNorm(doc=5421)
          0.051390704 = weight(abstract_txt:language in 5421) [ClassicSimilarity], result of:
            0.051390704 = score(doc=5421,freq=1.0), product of:
              0.15729012 = queryWeight, product of:
                1.7317296 = boost
                4.1820874 = idf(docFreq=1834, maxDocs=44218)
                0.02171842 = queryNorm
              0.32672557 = fieldWeight in 5421, product of:
                1.0 = tf(freq=1.0), with freq of:
                  1.0 = termFreq=1.0
                4.1820874 = idf(docFreq=1834, maxDocs=44218)
                0.078125 = fieldNorm(doc=5421)
          0.05576345 = weight(abstract_txt:problems in 5421) [ClassicSimilarity], result of:
            0.05576345 = score(doc=5421,freq=1.0), product of:
              0.1660905 = queryWeight, product of:
                1.7795155 = boost
                4.297489 = idf(docFreq=1634, maxDocs=44218)
                0.02171842 = queryNorm
              0.33574134 = fieldWeight in 5421, product of:
                1.0 = tf(freq=1.0), with freq of:
                  1.0 = termFreq=1.0
                4.297489 = idf(docFreq=1634, maxDocs=44218)
                0.078125 = fieldNorm(doc=5421)
          0.16094829 = weight(abstract_txt:text in 5421) [ClassicSimilarity], result of:
            0.16094829 = score(doc=5421,freq=3.0), product of:
              0.2941297 = queryWeight, product of:
                3.3489897 = boost
                4.0438666 = idf(docFreq=2106, maxDocs=44218)
                0.02171842 = queryNorm
              0.54720175 = fieldWeight in 5421, product of:
                1.7320508 = tf(freq=3.0), with freq of:
                  3.0 = termFreq=3.0
                4.0438666 = idf(docFreq=2106, maxDocs=44218)
                0.078125 = fieldNorm(doc=5421)
        0.32 = coord(8/25)
    
  3. Riggs, K.R.: XML and free text (2002) 0.18
    0.17917465 = sum of:
      0.17917465 = product of:
        0.8958732 = sum of:
          0.08222513 = weight(abstract_txt:language in 461) [ClassicSimilarity], result of:
            0.08222513 = score(doc=461,freq=1.0), product of:
              0.15729012 = queryWeight, product of:
                1.7317296 = boost
                4.1820874 = idf(docFreq=1834, maxDocs=44218)
                0.02171842 = queryNorm
              0.5227609 = fieldWeight in 461, product of:
                1.0 = tf(freq=1.0), with freq of:
                  1.0 = termFreq=1.0
                4.1820874 = idf(docFreq=1834, maxDocs=44218)
                0.125 = fieldNorm(doc=461)
          0.12617828 = weight(abstract_txt:problems in 461) [ClassicSimilarity], result of:
            0.12617828 = score(doc=461,freq=2.0), product of:
              0.1660905 = queryWeight, product of:
                1.7795155 = boost
                4.297489 = idf(docFreq=1634, maxDocs=44218)
                0.02171842 = queryNorm
              0.75969595 = fieldWeight in 461, product of:
                1.4142135 = tf(freq=2.0), with freq of:
                  2.0 = termFreq=2.0
                4.297489 = idf(docFreq=1634, maxDocs=44218)
                0.125 = fieldNorm(doc=461)
          0.110086486 = weight(abstract_txt:proposed in 461) [ClassicSimilarity], result of:
            0.110086486 = score(doc=461,freq=1.0), product of:
              0.1910679 = queryWeight, product of:
                1.9086366 = boost
                4.6093135 = idf(docFreq=1196, maxDocs=44218)
                0.02171842 = queryNorm
              0.5761642 = fieldWeight in 461, product of:
                1.0 = tf(freq=1.0), with freq of:
                  1.0 = termFreq=1.0
                4.6093135 = idf(docFreq=1196, maxDocs=44218)
                0.125 = fieldNorm(doc=461)
          0.28002793 = weight(abstract_txt:free in 461) [ClassicSimilarity], result of:
            0.28002793 = score(doc=461,freq=2.0), product of:
              0.28258947 = queryWeight, product of:
                2.3211722 = boost
                5.6055775 = idf(docFreq=441, maxDocs=44218)
                0.02171842 = queryNorm
              0.99093544 = fieldWeight in 461, product of:
                1.4142135 = tf(freq=2.0), with freq of:
                  2.0 = termFreq=2.0
                5.6055775 = idf(docFreq=441, maxDocs=44218)
                0.125 = fieldNorm(doc=461)
          0.29735532 = weight(abstract_txt:text in 461) [ClassicSimilarity], result of:
            0.29735532 = score(doc=461,freq=4.0), product of:
              0.2941297 = queryWeight, product of:
                3.3489897 = boost
                4.0438666 = idf(docFreq=2106, maxDocs=44218)
                0.02171842 = queryNorm
              1.0109667 = fieldWeight in 461, product of:
                2.0 = tf(freq=4.0), with freq of:
                  4.0 = termFreq=4.0
                4.0438666 = idf(docFreq=2106, maxDocs=44218)
                0.125 = fieldNorm(doc=461)
        0.2 = coord(5/25)
    
  4. Ata, B.M.A.: SISDOM: a multilingual document retrieval system (1995) 0.16
    0.15710343 = sum of:
      0.15710343 = product of:
        0.65459764 = sum of:
          0.05866832 = weight(abstract_txt:full in 895) [ClassicSimilarity], result of:
            0.05866832 = score(doc=895,freq=1.0), product of:
              0.108964615 = queryWeight, product of:
                1.0191946 = boost
                4.922663 = idf(docFreq=874, maxDocs=44218)
                0.02171842 = queryNorm
              0.53841627 = fieldWeight in 895, product of:
                1.0 = tf(freq=1.0), with freq of:
                  1.0 = termFreq=1.0
                4.922663 = idf(docFreq=874, maxDocs=44218)
                0.109375 = fieldNorm(doc=895)
          0.08519151 = weight(abstract_txt:english in 895) [ClassicSimilarity], result of:
            0.08519151 = score(doc=895,freq=1.0), product of:
              0.13972707 = queryWeight, product of:
                1.1541299 = boost
                5.574394 = idf(docFreq=455, maxDocs=44218)
                0.02171842 = queryNorm
              0.60969937 = fieldWeight in 895, product of:
                1.0 = tf(freq=1.0), with freq of:
                  1.0 = termFreq=1.0
                5.574394 = idf(docFreq=455, maxDocs=44218)
                0.109375 = fieldNorm(doc=895)
          0.05838011 = weight(abstract_txt:retrieval in 895) [ClassicSimilarity], result of:
            0.05838011 = score(doc=895,freq=2.0), product of:
              0.108607456 = queryWeight, product of:
                1.4389948 = boost
                3.4751394 = idf(docFreq=3720, maxDocs=44218)
                0.02171842 = queryNorm
              0.53753316 = fieldWeight in 895, product of:
                1.4142135 = tf(freq=2.0), with freq of:
                  2.0 = termFreq=2.0
                3.4751394 = idf(docFreq=3720, maxDocs=44218)
                0.109375 = fieldNorm(doc=895)
          0.22051631 = weight(abstract_txt:bilingual in 895) [ClassicSimilarity], result of:
            0.22051631 = score(doc=895,freq=1.0), product of:
              0.26341683 = queryWeight, product of:
                1.5846602 = boost
                7.653836 = idf(docFreq=56, maxDocs=44218)
                0.02171842 = queryNorm
              0.8371383 = fieldWeight in 895, product of:
                1.0 = tf(freq=1.0), with freq of:
                  1.0 = termFreq=1.0
                7.653836 = idf(docFreq=56, maxDocs=44218)
                0.109375 = fieldNorm(doc=895)
          0.10174841 = weight(abstract_txt:language in 895) [ClassicSimilarity], result of:
            0.10174841 = score(doc=895,freq=2.0), product of:
              0.15729012 = queryWeight, product of:
                1.7317296 = boost
                4.1820874 = idf(docFreq=1834, maxDocs=44218)
                0.02171842 = queryNorm
              0.64688367 = fieldWeight in 895, product of:
                1.4142135 = tf(freq=2.0), with freq of:
                  2.0 = termFreq=2.0
                4.1820874 = idf(docFreq=1834, maxDocs=44218)
                0.109375 = fieldNorm(doc=895)
          0.13009295 = weight(abstract_txt:text in 895) [ClassicSimilarity], result of:
            0.13009295 = score(doc=895,freq=1.0), product of:
              0.2941297 = queryWeight, product of:
                3.3489897 = boost
                4.0438666 = idf(docFreq=2106, maxDocs=44218)
                0.02171842 = queryNorm
              0.4422979 = fieldWeight in 895, product of:
                1.0 = tf(freq=1.0), with freq of:
                  1.0 = termFreq=1.0
                4.0438666 = idf(docFreq=2106, maxDocs=44218)
                0.109375 = fieldNorm(doc=895)
        0.24 = coord(6/25)
    
  5. Asija, S.P.: Natural language interface without artificial intelligence (1989) 0.15
    0.14785577 = sum of:
      0.14785577 = product of:
        0.61606574 = sum of:
          0.08381189 = weight(abstract_txt:full in 5711) [ClassicSimilarity], result of:
            0.08381189 = score(doc=5711,freq=1.0), product of:
              0.108964615 = queryWeight, product of:
                1.0191946 = boost
                4.922663 = idf(docFreq=874, maxDocs=44218)
                0.02171842 = queryNorm
              0.7691661 = fieldWeight in 5711, product of:
                1.0 = tf(freq=1.0), with freq of:
                  1.0 = termFreq=1.0
                4.922663 = idf(docFreq=874, maxDocs=44218)
                0.15625 = fieldNorm(doc=5711)
          0.08653769 = weight(abstract_txt:special in 5711) [ClassicSimilarity], result of:
            0.08653769 = score(doc=5711,freq=1.0), product of:
              0.11131454 = queryWeight, product of:
                1.030126 = boost
                4.9754615 = idf(docFreq=829, maxDocs=44218)
                0.02171842 = queryNorm
              0.7774159 = fieldWeight in 5711, product of:
                1.0 = tf(freq=1.0), with freq of:
                  1.0 = termFreq=1.0
                4.9754615 = idf(docFreq=829, maxDocs=44218)
                0.15625 = fieldNorm(doc=5711)
          0.09811486 = weight(abstract_txt:languages in 5711) [ClassicSimilarity], result of:
            0.09811486 = score(doc=5711,freq=1.0), product of:
              0.12103332 = queryWeight, product of:
                1.0741547 = boost
                5.188118 = idf(docFreq=670, maxDocs=44218)
                0.02171842 = queryNorm
              0.81064343 = fieldWeight in 5711, product of:
                1.0 = tf(freq=1.0), with freq of:
                  1.0 = termFreq=1.0
                5.188118 = idf(docFreq=670, maxDocs=44218)
                0.15625 = fieldNorm(doc=5711)
          0.058972817 = weight(abstract_txt:retrieval in 5711) [ClassicSimilarity], result of:
            0.058972817 = score(doc=5711,freq=1.0), product of:
              0.108607456 = queryWeight, product of:
                1.4389948 = boost
                3.4751394 = idf(docFreq=3720, maxDocs=44218)
                0.02171842 = queryNorm
              0.5429905 = fieldWeight in 5711, product of:
                1.0 = tf(freq=1.0), with freq of:
                  1.0 = termFreq=1.0
                3.4751394 = idf(docFreq=3720, maxDocs=44218)
                0.15625 = fieldNorm(doc=5711)
          0.10278141 = weight(abstract_txt:language in 5711) [ClassicSimilarity], result of:
            0.10278141 = score(doc=5711,freq=1.0), product of:
              0.15729012 = queryWeight, product of:
                1.7317296 = boost
                4.1820874 = idf(docFreq=1834, maxDocs=44218)
                0.02171842 = queryNorm
              0.65345114 = fieldWeight in 5711, product of:
                1.0 = tf(freq=1.0), with freq of:
                  1.0 = termFreq=1.0
                4.1820874 = idf(docFreq=1834, maxDocs=44218)
                0.15625 = fieldNorm(doc=5711)
          0.18584707 = weight(abstract_txt:text in 5711) [ClassicSimilarity], result of:
            0.18584707 = score(doc=5711,freq=1.0), product of:
              0.2941297 = queryWeight, product of:
                3.3489897 = boost
                4.0438666 = idf(docFreq=2106, maxDocs=44218)
                0.02171842 = queryNorm
              0.6318542 = fieldWeight in 5711, product of:
                1.0 = tf(freq=1.0), with freq of:
                  1.0 = termFreq=1.0
                4.0438666 = idf(docFreq=2106, maxDocs=44218)
                0.15625 = fieldNorm(doc=5711)
        0.24 = coord(6/25)