Document (#6510)

Author
Ashford, J.H.
Title
Free text retrieval in the Welsh language : problems, and proposed working practice
Source
Journal of documentation. 51(1995) no.2, S.118-125
Year
1995
Abstract
A bilingual Welsh-English full text database is planned for Inspection Reports of Her Majesty's Inspectors of Schools for Wales. Special requirements for free text retrieval in the Welsh language are identified, and practical solutions are proposed for problems arising from the use of standard text database products, some of which may also apply to other lesser-used languages.
Theme
Volltextretrieval

Similar documents (content)

  1. Cunliffe, D.; Harries, R.: Promoting minority-language use in a bilingual online community (2005) 0.22
    0.21736905 = sum of:
      0.21736905 = product of:
        0.9057044 = sum of:
          0.048484888 = weight(abstract_txt:practice in 916) [ClassicSimilarity], result of:
            0.048484888 = score(doc=916,freq=1.0), product of:
              0.10618361 = queryWeight, product of:
                4.870546 = idf(docFreq=890, maxDocs=42740)
                0.021801172 = queryNorm
              0.45661366 = fieldWeight in 916, product of:
                1.0 = tf(freq=1.0), with freq of:
                  1.0 = termFreq=1.0
                4.870546 = idf(docFreq=890, maxDocs=42740)
                0.09375 = fieldNorm(doc=916)
          0.058735464 = weight(abstract_txt:languages in 916) [ClassicSimilarity], result of:
            0.058735464 = score(doc=916,freq=1.0), product of:
              0.12066653 = queryWeight, product of:
                1.0660183 = boost
                5.192091 = idf(docFreq=645, maxDocs=42740)
                0.021801172 = queryNorm
              0.48675853 = fieldWeight in 916, product of:
                1.0 = tf(freq=1.0), with freq of:
                  1.0 = termFreq=1.0
                5.192091 = idf(docFreq=645, maxDocs=42740)
                0.09375 = fieldNorm(doc=916)
          0.104956694 = weight(abstract_txt:english in 916) [ClassicSimilarity], result of:
            0.104956694 = score(doc=916,freq=2.0), product of:
              0.14103167 = queryWeight, product of:
                1.1524699 = boost
                5.6131573 = idf(docFreq=423, maxDocs=42740)
                0.021801172 = queryNorm
              0.74420655 = fieldWeight in 916, product of:
                1.4142135 = tf(freq=2.0), with freq of:
                  2.0 = termFreq=2.0
                5.6131573 = idf(docFreq=423, maxDocs=42740)
                0.09375 = fieldNorm(doc=916)
          0.3792739 = weight(abstract_txt:bilingual in 916) [ClassicSimilarity], result of:
            0.3792739 = score(doc=916,freq=4.0), product of:
              0.2635938 = queryWeight, product of:
                1.5755742 = boost
                7.6739063 = idf(docFreq=53, maxDocs=42740)
                0.021801172 = queryNorm
              1.4388574 = fieldWeight in 916, product of:
                2.0 = tf(freq=4.0), with freq of:
                  4.0 = termFreq=4.0
                7.6739063 = idf(docFreq=53, maxDocs=42740)
                0.09375 = fieldNorm(doc=916)
          0.2070301 = weight(abstract_txt:wales in 916) [ClassicSimilarity], result of:
            0.2070301 = score(doc=916,freq=1.0), product of:
              0.27947453 = queryWeight, product of:
                1.6223419 = boost
                7.9016905 = idf(docFreq=42, maxDocs=42740)
                0.021801172 = queryNorm
              0.74078345 = fieldWeight in 916, product of:
                1.0 = tf(freq=1.0), with freq of:
                  1.0 = termFreq=1.0
                7.9016905 = idf(docFreq=42, maxDocs=42740)
                0.09375 = fieldNorm(doc=916)
          0.10722333 = weight(abstract_txt:language in 916) [ClassicSimilarity], result of:
            0.10722333 = score(doc=916,freq=3.0), product of:
              0.1574523 = queryWeight, product of:
                1.7221096 = boost
                4.1938066 = idf(docFreq=1752, maxDocs=42740)
                0.021801172 = queryNorm
              0.6809893 = fieldWeight in 916, product of:
                1.7320508 = tf(freq=3.0), with freq of:
                  3.0 = termFreq=3.0
                4.1938066 = idf(docFreq=1752, maxDocs=42740)
                0.09375 = fieldNorm(doc=916)
        0.24 = coord(6/25)
    
  2. Tseng, Y.-H.: Automatic cataloguing and searching for retrospective data by use of OCR text (2001) 0.18
    0.18277504 = sum of:
      0.18277504 = product of:
        0.571172 = sum of:
          0.04298315 = weight(abstract_txt:special in 5421) [ClassicSimilarity], result of:
            0.04298315 = score(doc=5421,freq=1.0), product of:
              0.110655464 = queryWeight, product of:
                1.02084 = boost
                4.9720483 = idf(docFreq=804, maxDocs=42740)
                0.021801172 = queryNorm
              0.38844126 = fieldWeight in 5421, product of:
                1.0 = tf(freq=1.0), with freq of:
                  1.0 = termFreq=1.0
                4.9720483 = idf(docFreq=804, maxDocs=42740)
                0.078125 = fieldNorm(doc=5421)
          0.08477734 = weight(abstract_txt:languages in 5421) [ClassicSimilarity], result of:
            0.08477734 = score(doc=5421,freq=3.0), product of:
              0.12066653 = queryWeight, product of:
                1.0660183 = boost
                5.192091 = idf(docFreq=645, maxDocs=42740)
                0.021801172 = queryNorm
              0.70257545 = fieldWeight in 5421, product of:
                1.7320508 = tf(freq=3.0), with freq of:
                  3.0 = termFreq=3.0
                5.192091 = idf(docFreq=645, maxDocs=42740)
                0.078125 = fieldNorm(doc=5421)
          0.061846323 = weight(abstract_txt:english in 5421) [ClassicSimilarity], result of:
            0.061846323 = score(doc=5421,freq=1.0), product of:
              0.14103167 = queryWeight, product of:
                1.1524699 = boost
                5.6131573 = idf(docFreq=423, maxDocs=42740)
                0.021801172 = queryNorm
              0.4385279 = fieldWeight in 5421, product of:
                1.0 = tf(freq=1.0), with freq of:
                  1.0 = termFreq=1.0
                5.6131573 = idf(docFreq=423, maxDocs=42740)
                0.078125 = fieldNorm(doc=5421)
          0.06329133 = weight(abstract_txt:solutions in 5421) [ClassicSimilarity], result of:
            0.06329133 = score(doc=5421,freq=1.0), product of:
              0.14321996 = queryWeight, product of:
                1.1613765 = boost
                5.6565375 = idf(docFreq=405, maxDocs=42740)
                0.021801172 = queryNorm
              0.441917 = fieldWeight in 5421, product of:
                1.0 = tf(freq=1.0), with freq of:
                  1.0 = termFreq=1.0
                5.6565375 = idf(docFreq=405, maxDocs=42740)
                0.078125 = fieldNorm(doc=5421)
          0.050386924 = weight(abstract_txt:retrieval in 5421) [ClassicSimilarity], result of:
            0.050386924 = score(doc=5421,freq=3.0), product of:
              0.10747041 = queryWeight, product of:
                1.4227569 = boost
                3.4648013 = idf(docFreq=3633, maxDocs=42740)
                0.021801172 = queryNorm
              0.46884465 = fieldWeight in 5421, product of:
                1.7320508 = tf(freq=3.0), with freq of:
                  3.0 = termFreq=3.0
                3.4648013 = idf(docFreq=3633, maxDocs=42740)
                0.078125 = fieldNorm(doc=5421)
          0.05158785 = weight(abstract_txt:language in 5421) [ClassicSimilarity], result of:
            0.05158785 = score(doc=5421,freq=1.0), product of:
              0.1574523 = queryWeight, product of:
                1.7221096 = boost
                4.1938066 = idf(docFreq=1752, maxDocs=42740)
                0.021801172 = queryNorm
              0.32764113 = fieldWeight in 5421, product of:
                1.0 = tf(freq=1.0), with freq of:
                  1.0 = termFreq=1.0
                4.1938066 = idf(docFreq=1752, maxDocs=42740)
                0.078125 = fieldNorm(doc=5421)
          0.05534683 = weight(abstract_txt:problems in 5421) [ClassicSimilarity], result of:
            0.05534683 = score(doc=5421,freq=1.0), product of:
              0.16501087 = queryWeight, product of:
                1.7629603 = boost
                4.2932897 = idf(docFreq=1586, maxDocs=42740)
                0.021801172 = queryNorm
              0.33541325 = fieldWeight in 5421, product of:
                1.0 = tf(freq=1.0), with freq of:
                  1.0 = termFreq=1.0
                4.2932897 = idf(docFreq=1586, maxDocs=42740)
                0.078125 = fieldNorm(doc=5421)
          0.16095224 = weight(abstract_txt:text in 5421) [ClassicSimilarity], result of:
            0.16095224 = score(doc=5421,freq=3.0), product of:
              0.29368716 = queryWeight, product of:
                3.3261647 = boost
                4.0500593 = idf(docFreq=2023, maxDocs=42740)
                0.021801172 = queryNorm
              0.54803973 = fieldWeight in 5421, product of:
                1.7320508 = tf(freq=3.0), with freq of:
                  3.0 = termFreq=3.0
                4.0500593 = idf(docFreq=2023, maxDocs=42740)
                0.078125 = fieldNorm(doc=5421)
        0.32 = coord(8/25)
    
  3. Riggs, K.R.: XML and free text (2002) 0.18
    0.17916481 = sum of:
      0.17916481 = product of:
        0.8958241 = sum of:
          0.082540564 = weight(abstract_txt:language in 1462) [ClassicSimilarity], result of:
            0.082540564 = score(doc=1462,freq=1.0), product of:
              0.1574523 = queryWeight, product of:
                1.7221096 = boost
                4.1938066 = idf(docFreq=1752, maxDocs=42740)
                0.021801172 = queryNorm
              0.52422583 = fieldWeight in 1462, product of:
                1.0 = tf(freq=1.0), with freq of:
                  1.0 = termFreq=1.0
                4.1938066 = idf(docFreq=1752, maxDocs=42740)
                0.125 = fieldNorm(doc=1462)
          0.12523559 = weight(abstract_txt:problems in 1462) [ClassicSimilarity], result of:
            0.12523559 = score(doc=1462,freq=2.0), product of:
              0.16501087 = queryWeight, product of:
                1.7629603 = boost
                4.2932897 = idf(docFreq=1586, maxDocs=42740)
                0.021801172 = queryNorm
              0.7589536 = fieldWeight in 1462, product of:
                1.4142135 = tf(freq=2.0), with freq of:
                  2.0 = termFreq=2.0
                4.2932897 = idf(docFreq=1586, maxDocs=42740)
                0.125 = fieldNorm(doc=1462)
          0.11185432 = weight(abstract_txt:proposed in 1462) [ClassicSimilarity], result of:
            0.11185432 = score(doc=1462,freq=1.0), product of:
              0.1928143 = queryWeight, product of:
                1.9057059 = boost
                4.640914 = idf(docFreq=1120, maxDocs=42740)
                0.021801172 = queryNorm
              0.58011425 = fieldWeight in 1462, product of:
                1.0 = tf(freq=1.0), with freq of:
                  1.0 = termFreq=1.0
                4.640914 = idf(docFreq=1120, maxDocs=42740)
                0.125 = fieldNorm(doc=1462)
          0.27883106 = weight(abstract_txt:free in 1462) [ClassicSimilarity], result of:
            0.27883106 = score(doc=1462,freq=2.0), product of:
              0.28135514 = queryWeight, product of:
                2.3020444 = boost
                5.6061063 = idf(docFreq=426, maxDocs=42740)
                0.021801172 = queryNorm
              0.9910289 = fieldWeight in 1462, product of:
                1.4142135 = tf(freq=2.0), with freq of:
                  2.0 = termFreq=2.0
                5.6061063 = idf(docFreq=426, maxDocs=42740)
                0.125 = fieldNorm(doc=1462)
          0.2973626 = weight(abstract_txt:text in 1462) [ClassicSimilarity], result of:
            0.2973626 = score(doc=1462,freq=4.0), product of:
              0.29368716 = queryWeight, product of:
                3.3261647 = boost
                4.0500593 = idf(docFreq=2023, maxDocs=42740)
                0.021801172 = queryNorm
              1.0125148 = fieldWeight in 1462, product of:
                2.0 = tf(freq=4.0), with freq of:
                  4.0 = termFreq=4.0
                4.0500593 = idf(docFreq=2023, maxDocs=42740)
                0.125 = fieldNorm(doc=1462)
        0.2 = coord(5/25)
    
  4. Ata, B.M.A.: SISDOM: a multilingual document retrieval system (1995) 0.16
    0.15738188 = sum of:
      0.15738188 = product of:
        0.65575784 = sum of:
          0.05809791 = weight(abstract_txt:full in 964) [ClassicSimilarity], result of:
            0.05809791 = score(doc=964,freq=1.0), product of:
              0.10809253 = queryWeight, product of:
                1.0089488 = boost
                4.914131 = idf(docFreq=852, maxDocs=42740)
                0.021801172 = queryNorm
              0.5374831 = fieldWeight in 964, product of:
                1.0 = tf(freq=1.0), with freq of:
                  1.0 = termFreq=1.0
                4.914131 = idf(docFreq=852, maxDocs=42740)
                0.109375 = fieldNorm(doc=964)
          0.08658485 = weight(abstract_txt:english in 964) [ClassicSimilarity], result of:
            0.08658485 = score(doc=964,freq=1.0), product of:
              0.14103167 = queryWeight, product of:
                1.1524699 = boost
                5.6131573 = idf(docFreq=423, maxDocs=42740)
                0.021801172 = queryNorm
              0.61393905 = fieldWeight in 964, product of:
                1.0 = tf(freq=1.0), with freq of:
                  1.0 = termFreq=1.0
                5.6131573 = idf(docFreq=423, maxDocs=42740)
                0.109375 = fieldNorm(doc=964)
          0.057597056 = weight(abstract_txt:retrieval in 964) [ClassicSimilarity], result of:
            0.057597056 = score(doc=964,freq=2.0), product of:
              0.10747041 = queryWeight, product of:
                1.4227569 = boost
                3.4648013 = idf(docFreq=3633, maxDocs=42740)
                0.021801172 = queryNorm
              0.5359341 = fieldWeight in 964, product of:
                1.4142135 = tf(freq=2.0), with freq of:
                  2.0 = termFreq=2.0
                3.4648013 = idf(docFreq=3633, maxDocs=42740)
                0.109375 = fieldNorm(doc=964)
          0.22124311 = weight(abstract_txt:bilingual in 964) [ClassicSimilarity], result of:
            0.22124311 = score(doc=964,freq=1.0), product of:
              0.2635938 = queryWeight, product of:
                1.5755742 = boost
                7.6739063 = idf(docFreq=53, maxDocs=42740)
                0.021801172 = queryNorm
              0.83933353 = fieldWeight in 964, product of:
                1.0 = tf(freq=1.0), with freq of:
                  1.0 = termFreq=1.0
                7.6739063 = idf(docFreq=53, maxDocs=42740)
                0.109375 = fieldNorm(doc=964)
          0.102138735 = weight(abstract_txt:language in 964) [ClassicSimilarity], result of:
            0.102138735 = score(doc=964,freq=2.0), product of:
              0.1574523 = queryWeight, product of:
                1.7221096 = boost
                4.1938066 = idf(docFreq=1752, maxDocs=42740)
                0.021801172 = queryNorm
              0.64869636 = fieldWeight in 964, product of:
                1.4142135 = tf(freq=2.0), with freq of:
                  2.0 = termFreq=2.0
                4.1938066 = idf(docFreq=1752, maxDocs=42740)
                0.109375 = fieldNorm(doc=964)
          0.13009614 = weight(abstract_txt:text in 964) [ClassicSimilarity], result of:
            0.13009614 = score(doc=964,freq=1.0), product of:
              0.29368716 = queryWeight, product of:
                3.3261647 = boost
                4.0500593 = idf(docFreq=2023, maxDocs=42740)
                0.021801172 = queryNorm
              0.44297522 = fieldWeight in 964, product of:
                1.0 = tf(freq=1.0), with freq of:
                  1.0 = termFreq=1.0
                4.0500593 = idf(docFreq=2023, maxDocs=42740)
                0.109375 = fieldNorm(doc=964)
        0.24 = coord(6/25)
    
  5. Asija, S.P.: Natural language interface without artificial intelligence (1989) 0.15
    0.14737558 = sum of:
      0.14737558 = product of:
        0.61406493 = sum of:
          0.08299701 = weight(abstract_txt:full in 5780) [ClassicSimilarity], result of:
            0.08299701 = score(doc=5780,freq=1.0), product of:
              0.10809253 = queryWeight, product of:
                1.0089488 = boost
                4.914131 = idf(docFreq=852, maxDocs=42740)
                0.021801172 = queryNorm
              0.767833 = fieldWeight in 5780, product of:
                1.0 = tf(freq=1.0), with freq of:
                  1.0 = termFreq=1.0
                4.914131 = idf(docFreq=852, maxDocs=42740)
                0.15625 = fieldNorm(doc=5780)
          0.0859663 = weight(abstract_txt:special in 5780) [ClassicSimilarity], result of:
            0.0859663 = score(doc=5780,freq=1.0), product of:
              0.110655464 = queryWeight, product of:
                1.02084 = boost
                4.9720483 = idf(docFreq=804, maxDocs=42740)
                0.021801172 = queryNorm
              0.7768825 = fieldWeight in 5780, product of:
                1.0 = tf(freq=1.0), with freq of:
                  1.0 = termFreq=1.0
                4.9720483 = idf(docFreq=804, maxDocs=42740)
                0.15625 = fieldNorm(doc=5780)
          0.09789244 = weight(abstract_txt:languages in 5780) [ClassicSimilarity], result of:
            0.09789244 = score(doc=5780,freq=1.0), product of:
              0.12066653 = queryWeight, product of:
                1.0660183 = boost
                5.192091 = idf(docFreq=645, maxDocs=42740)
                0.021801172 = queryNorm
              0.8112642 = fieldWeight in 5780, product of:
                1.0 = tf(freq=1.0), with freq of:
                  1.0 = termFreq=1.0
                5.192091 = idf(docFreq=645, maxDocs=42740)
                0.15625 = fieldNorm(doc=5780)
          0.058181815 = weight(abstract_txt:retrieval in 5780) [ClassicSimilarity], result of:
            0.058181815 = score(doc=5780,freq=1.0), product of:
              0.10747041 = queryWeight, product of:
                1.4227569 = boost
                3.4648013 = idf(docFreq=3633, maxDocs=42740)
                0.021801172 = queryNorm
              0.5413752 = fieldWeight in 5780, product of:
                1.0 = tf(freq=1.0), with freq of:
                  1.0 = termFreq=1.0
                3.4648013 = idf(docFreq=3633, maxDocs=42740)
                0.15625 = fieldNorm(doc=5780)
          0.1031757 = weight(abstract_txt:language in 5780) [ClassicSimilarity], result of:
            0.1031757 = score(doc=5780,freq=1.0), product of:
              0.1574523 = queryWeight, product of:
                1.7221096 = boost
                4.1938066 = idf(docFreq=1752, maxDocs=42740)
                0.021801172 = queryNorm
              0.65528226 = fieldWeight in 5780, product of:
                1.0 = tf(freq=1.0), with freq of:
                  1.0 = termFreq=1.0
                4.1938066 = idf(docFreq=1752, maxDocs=42740)
                0.15625 = fieldNorm(doc=5780)
          0.18585163 = weight(abstract_txt:text in 5780) [ClassicSimilarity], result of:
            0.18585163 = score(doc=5780,freq=1.0), product of:
              0.29368716 = queryWeight, product of:
                3.3261647 = boost
                4.0500593 = idf(docFreq=2023, maxDocs=42740)
                0.021801172 = queryNorm
              0.6328218 = fieldWeight in 5780, product of:
                1.0 = tf(freq=1.0), with freq of:
                  1.0 = termFreq=1.0
                4.0500593 = idf(docFreq=2023, maxDocs=42740)
                0.15625 = fieldNorm(doc=5780)
        0.24 = coord(6/25)