Document (#17531)

Author
Bordoni, L.
Pazienza, M.T.
Title
Documents automatic indexing in an environmental domain
Source
International forum on information and documentation. 22(1997) no.1, S.17-28
Year
1997
Abstract
Describes an application of Natural Language Processing (NLP) techniques, in HIRMA (Hypertextual Information Retrieval Managed by ARIOSTO), to the problem of document indexing by referring to a system which incorporates natural language processing techniques to determine the subject of the text of documents and to associate them with relevant semantic indexes. Describes briefly the overall system, details of its implementation on a corpus of scientific abstracts related to environmental topics and experimental evidence of the system's behaviour. Analyzes in detail an experiment designed to evaluate the system's retrieval ability in terms of recall and precision.
Theme
Automatisches Indexieren

Similar documents (content)

  1. Polity, Y.: Vers une ergonomie linguistique (1994) 0.25
    0.25201246 = sum of:
      0.25201246 = product of:
        0.787539 = sum of:
          0.033750195 = weight(abstract_txt:system in 36) [ClassicSimilarity], result of:
            0.033750195 = score(doc=36,freq=1.0), product of:
              0.09150207 = queryWeight, product of:
                1.1769189 = boost
                3.3723085 = idf(docFreq=4123, maxDocs=44218)
                0.023054574 = queryNorm
              0.36884624 = fieldWeight in 36, product of:
                1.0 = tf(freq=1.0), with freq of:
                  1.0 = termFreq=1.0
                3.3723085 = idf(docFreq=4123, maxDocs=44218)
                0.109375 = fieldNorm(doc=36)
          0.036932703 = weight(abstract_txt:retrieval in 36) [ClassicSimilarity], result of:
            0.036932703 = score(doc=36,freq=1.0), product of:
              0.09716745 = queryWeight, product of:
                1.2128063 = boost
                3.4751394 = idf(docFreq=3720, maxDocs=44218)
                0.023054574 = queryNorm
              0.38009337 = fieldWeight in 36, product of:
                1.0 = tf(freq=1.0), with freq of:
                  1.0 = termFreq=1.0
                3.4751394 = idf(docFreq=3720, maxDocs=44218)
                0.109375 = fieldNorm(doc=36)
          0.04921137 = weight(abstract_txt:describes in 36) [ClassicSimilarity], result of:
            0.04921137 = score(doc=36,freq=1.0), product of:
              0.11765861 = queryWeight, product of:
                1.3345748 = boost
                3.8240511 = idf(docFreq=2624, maxDocs=44218)
                0.023054574 = queryNorm
              0.4182556 = fieldWeight in 36, product of:
                1.0 = tf(freq=1.0), with freq of:
                  1.0 = termFreq=1.0
                3.8240511 = idf(docFreq=2624, maxDocs=44218)
                0.109375 = fieldNorm(doc=36)
          0.06436855 = weight(abstract_txt:language in 36) [ClassicSimilarity], result of:
            0.06436855 = score(doc=36,freq=1.0), product of:
              0.14072219 = queryWeight, product of:
                1.4595277 = boost
                4.1820874 = idf(docFreq=1834, maxDocs=44218)
                0.023054574 = queryNorm
              0.45741582 = fieldWeight in 36, product of:
                1.0 = tf(freq=1.0), with freq of:
                  1.0 = termFreq=1.0
                4.1820874 = idf(docFreq=1834, maxDocs=44218)
                0.109375 = fieldNorm(doc=36)
          0.07241668 = weight(abstract_txt:indexing in 36) [ClassicSimilarity], result of:
            0.07241668 = score(doc=36,freq=1.0), product of:
              0.15222026 = queryWeight, product of:
                1.5179844 = boost
                4.3495874 = idf(docFreq=1551, maxDocs=44218)
                0.023054574 = queryNorm
              0.47573614 = fieldWeight in 36, product of:
                1.0 = tf(freq=1.0), with freq of:
                  1.0 = termFreq=1.0
                4.3495874 = idf(docFreq=1551, maxDocs=44218)
                0.109375 = fieldNorm(doc=36)
          0.10556585 = weight(abstract_txt:processing in 36) [ClassicSimilarity], result of:
            0.10556585 = score(doc=36,freq=1.0), product of:
              0.1957022 = queryWeight, product of:
                1.7211905 = boost
                4.931848 = idf(docFreq=866, maxDocs=44218)
                0.023054574 = queryNorm
              0.5394209 = fieldWeight in 36, product of:
                1.0 = tf(freq=1.0), with freq of:
                  1.0 = termFreq=1.0
                4.931848 = idf(docFreq=866, maxDocs=44218)
                0.109375 = fieldNorm(doc=36)
          0.11533293 = weight(abstract_txt:natural in 36) [ClassicSimilarity], result of:
            0.11533293 = score(doc=36,freq=1.0), product of:
              0.2075944 = queryWeight, product of:
                1.7727149 = boost
                5.0794845 = idf(docFreq=747, maxDocs=44218)
                0.023054574 = queryNorm
              0.55556864 = fieldWeight in 36, product of:
                1.0 = tf(freq=1.0), with freq of:
                  1.0 = termFreq=1.0
                5.0794845 = idf(docFreq=747, maxDocs=44218)
                0.109375 = fieldNorm(doc=36)
          0.30996075 = weight(abstract_txt:system's in 36) [ClassicSimilarity], result of:
            0.30996075 = score(doc=36,freq=1.0), product of:
              0.40128338 = queryWeight, product of:
                2.464658 = boost
                7.062158 = idf(docFreq=102, maxDocs=44218)
                0.023054574 = queryNorm
              0.77242357 = fieldWeight in 36, product of:
                1.0 = tf(freq=1.0), with freq of:
                  1.0 = termFreq=1.0
                7.062158 = idf(docFreq=102, maxDocs=44218)
                0.109375 = fieldNorm(doc=36)
        0.32 = coord(8/25)
    
  2. Oard, D.W.; He, D.; Wang, J.: User-assisted query translation for interactive cross-language information retrieval (2008) 0.21
    0.20973486 = sum of:
      0.20973486 = product of:
        0.65542144 = sum of:
          0.048214562 = weight(abstract_txt:system in 2030) [ClassicSimilarity], result of:
            0.048214562 = score(doc=2030,freq=4.0), product of:
              0.09150207 = queryWeight, product of:
                1.1769189 = boost
                3.3723085 = idf(docFreq=4123, maxDocs=44218)
                0.023054574 = queryNorm
              0.5269232 = fieldWeight in 2030, product of:
                2.0 = tf(freq=4.0), with freq of:
                  4.0 = termFreq=4.0
                3.3723085 = idf(docFreq=4123, maxDocs=44218)
                0.078125 = fieldNorm(doc=2030)
          0.03730766 = weight(abstract_txt:retrieval in 2030) [ClassicSimilarity], result of:
            0.03730766 = score(doc=2030,freq=2.0), product of:
              0.09716745 = queryWeight, product of:
                1.2128063 = boost
                3.4751394 = idf(docFreq=3720, maxDocs=44218)
                0.023054574 = queryNorm
              0.38395226 = fieldWeight in 2030, product of:
                1.4142135 = tf(freq=2.0), with freq of:
                  2.0 = termFreq=2.0
                3.4751394 = idf(docFreq=3720, maxDocs=44218)
                0.078125 = fieldNorm(doc=2030)
          0.11305687 = weight(abstract_txt:incorporates in 2030) [ClassicSimilarity], result of:
            0.11305687 = score(doc=2030,freq=1.0), product of:
              0.20347922 = queryWeight, product of:
                1.2410123 = boost
                7.11192 = idf(docFreq=97, maxDocs=44218)
                0.023054574 = queryNorm
              0.55561876 = fieldWeight in 2030, product of:
                1.0 = tf(freq=1.0), with freq of:
                  1.0 = termFreq=1.0
                7.11192 = idf(docFreq=97, maxDocs=44218)
                0.078125 = fieldNorm(doc=2030)
          0.03515098 = weight(abstract_txt:describes in 2030) [ClassicSimilarity], result of:
            0.03515098 = score(doc=2030,freq=1.0), product of:
              0.11765861 = queryWeight, product of:
                1.3345748 = boost
                3.8240511 = idf(docFreq=2624, maxDocs=44218)
                0.023054574 = queryNorm
              0.298754 = fieldWeight in 2030, product of:
                1.0 = tf(freq=1.0), with freq of:
                  1.0 = termFreq=1.0
                3.8240511 = idf(docFreq=2624, maxDocs=44218)
                0.078125 = fieldNorm(doc=2030)
          0.062227864 = weight(abstract_txt:documents in 2030) [ClassicSimilarity], result of:
            0.062227864 = score(doc=2030,freq=2.0), product of:
              0.13666125 = queryWeight, product of:
                1.4383142 = boost
                4.1213026 = idf(docFreq=1949, maxDocs=44218)
                0.023054574 = queryNorm
              0.4553439 = fieldWeight in 2030, product of:
                1.4142135 = tf(freq=2.0), with freq of:
                  2.0 = termFreq=2.0
                4.1213026 = idf(docFreq=1949, maxDocs=44218)
                0.078125 = fieldNorm(doc=2030)
          0.079635434 = weight(abstract_txt:language in 2030) [ClassicSimilarity], result of:
            0.079635434 = score(doc=2030,freq=3.0), product of:
              0.14072219 = queryWeight, product of:
                1.4595277 = boost
                4.1820874 = idf(docFreq=1834, maxDocs=44218)
                0.023054574 = queryNorm
              0.56590533 = fieldWeight in 2030, product of:
                1.7320508 = tf(freq=3.0), with freq of:
                  3.0 = termFreq=3.0
                4.1820874 = idf(docFreq=1834, maxDocs=44218)
                0.078125 = fieldNorm(doc=2030)
          0.058427554 = weight(abstract_txt:techniques in 2030) [ClassicSimilarity], result of:
            0.058427554 = score(doc=2030,freq=1.0), product of:
              0.16509879 = queryWeight, product of:
                1.580895 = boost
                4.5298495 = idf(docFreq=1295, maxDocs=44218)
                0.023054574 = queryNorm
              0.3538945 = fieldWeight in 2030, product of:
                1.0 = tf(freq=1.0), with freq of:
                  1.0 = termFreq=1.0
                4.5298495 = idf(docFreq=1295, maxDocs=44218)
                0.078125 = fieldNorm(doc=2030)
          0.22140053 = weight(abstract_txt:system's in 2030) [ClassicSimilarity], result of:
            0.22140053 = score(doc=2030,freq=1.0), product of:
              0.40128338 = queryWeight, product of:
                2.464658 = boost
                7.062158 = idf(docFreq=102, maxDocs=44218)
                0.023054574 = queryNorm
              0.5517311 = fieldWeight in 2030, product of:
                1.0 = tf(freq=1.0), with freq of:
                  1.0 = termFreq=1.0
                7.062158 = idf(docFreq=102, maxDocs=44218)
                0.078125 = fieldNorm(doc=2030)
        0.32 = coord(8/25)
    
  3. Vledutz-Stokolov, N.: Concept recognition in an automatic text-processing system for the life sciences (1987) 0.20
    0.19867706 = sum of:
      0.19867706 = product of:
        0.6208658 = sum of:
          0.038571652 = weight(abstract_txt:system in 2849) [ClassicSimilarity], result of:
            0.038571652 = score(doc=2849,freq=4.0), product of:
              0.09150207 = queryWeight, product of:
                1.1769189 = boost
                3.3723085 = idf(docFreq=4123, maxDocs=44218)
                0.023054574 = queryNorm
              0.42153856 = fieldWeight in 2849, product of:
                2.0 = tf(freq=4.0), with freq of:
                  4.0 = termFreq=4.0
                3.3723085 = idf(docFreq=4123, maxDocs=44218)
                0.0625 = fieldNorm(doc=2849)
          0.028120784 = weight(abstract_txt:describes in 2849) [ClassicSimilarity], result of:
            0.028120784 = score(doc=2849,freq=1.0), product of:
              0.11765861 = queryWeight, product of:
                1.3345748 = boost
                3.8240511 = idf(docFreq=2624, maxDocs=44218)
                0.023054574 = queryNorm
              0.2390032 = fieldWeight in 2849, product of:
                1.0 = tf(freq=1.0), with freq of:
                  1.0 = termFreq=1.0
                3.8240511 = idf(docFreq=2624, maxDocs=44218)
                0.0625 = fieldNorm(doc=2849)
          0.0973161 = weight(abstract_txt:language in 2849) [ClassicSimilarity], result of:
            0.0973161 = score(doc=2849,freq=7.0), product of:
              0.14072219 = queryWeight, product of:
                1.4595277 = boost
                4.1820874 = idf(docFreq=1834, maxDocs=44218)
                0.023054574 = queryNorm
              0.6915477 = fieldWeight in 2849, product of:
                2.6457512 = tf(freq=7.0), with freq of:
                  7.0 = termFreq=7.0
                4.1820874 = idf(docFreq=1834, maxDocs=44218)
                0.0625 = fieldNorm(doc=2849)
          0.058521513 = weight(abstract_txt:indexing in 2849) [ClassicSimilarity], result of:
            0.058521513 = score(doc=2849,freq=2.0), product of:
              0.15222026 = queryWeight, product of:
                1.5179844 = boost
                4.3495874 = idf(docFreq=1551, maxDocs=44218)
                0.023054574 = queryNorm
              0.38445285 = fieldWeight in 2849, product of:
                1.4142135 = tf(freq=2.0), with freq of:
                  2.0 = termFreq=2.0
                4.3495874 = idf(docFreq=1551, maxDocs=44218)
                0.0625 = fieldNorm(doc=2849)
          0.04674204 = weight(abstract_txt:techniques in 2849) [ClassicSimilarity], result of:
            0.04674204 = score(doc=2849,freq=1.0), product of:
              0.16509879 = queryWeight, product of:
                1.580895 = boost
                4.5298495 = idf(docFreq=1295, maxDocs=44218)
                0.023054574 = queryNorm
              0.2831156 = fieldWeight in 2849, product of:
                1.0 = tf(freq=1.0), with freq of:
                  1.0 = termFreq=1.0
                4.5298495 = idf(docFreq=1295, maxDocs=44218)
                0.0625 = fieldNorm(doc=2849)
          0.060323343 = weight(abstract_txt:processing in 2849) [ClassicSimilarity], result of:
            0.060323343 = score(doc=2849,freq=1.0), product of:
              0.1957022 = queryWeight, product of:
                1.7211905 = boost
                4.931848 = idf(docFreq=866, maxDocs=44218)
                0.023054574 = queryNorm
              0.3082405 = fieldWeight in 2849, product of:
                1.0 = tf(freq=1.0), with freq of:
                  1.0 = termFreq=1.0
                4.931848 = idf(docFreq=866, maxDocs=44218)
                0.0625 = fieldNorm(doc=2849)
          0.114149995 = weight(abstract_txt:natural in 2849) [ClassicSimilarity], result of:
            0.114149995 = score(doc=2849,freq=3.0), product of:
              0.2075944 = queryWeight, product of:
                1.7727149 = boost
                5.0794845 = idf(docFreq=747, maxDocs=44218)
                0.023054574 = queryNorm
              0.5498703 = fieldWeight in 2849, product of:
                1.7320508 = tf(freq=3.0), with freq of:
                  3.0 = termFreq=3.0
                5.0794845 = idf(docFreq=747, maxDocs=44218)
                0.0625 = fieldNorm(doc=2849)
          0.17712042 = weight(abstract_txt:system's in 2849) [ClassicSimilarity], result of:
            0.17712042 = score(doc=2849,freq=1.0), product of:
              0.40128338 = queryWeight, product of:
                2.464658 = boost
                7.062158 = idf(docFreq=102, maxDocs=44218)
                0.023054574 = queryNorm
              0.44138488 = fieldWeight in 2849, product of:
                1.0 = tf(freq=1.0), with freq of:
                  1.0 = termFreq=1.0
                7.062158 = idf(docFreq=102, maxDocs=44218)
                0.0625 = fieldNorm(doc=2849)
        0.32 = coord(8/25)
    
  4. Burke, R.D.: Question answering from frequently asked question files : experiences with the FAQ Finder System (1997) 0.19
    0.19357942 = sum of:
      0.19357942 = product of:
        0.69135505 = sum of:
          0.033750195 = weight(abstract_txt:system in 1191) [ClassicSimilarity], result of:
            0.033750195 = score(doc=1191,freq=1.0), product of:
              0.09150207 = queryWeight, product of:
                1.1769189 = boost
                3.3723085 = idf(docFreq=4123, maxDocs=44218)
                0.023054574 = queryNorm
              0.36884624 = fieldWeight in 1191, product of:
                1.0 = tf(freq=1.0), with freq of:
                  1.0 = termFreq=1.0
                3.3723085 = idf(docFreq=4123, maxDocs=44218)
                0.109375 = fieldNorm(doc=1191)
          0.036932703 = weight(abstract_txt:retrieval in 1191) [ClassicSimilarity], result of:
            0.036932703 = score(doc=1191,freq=1.0), product of:
              0.09716745 = queryWeight, product of:
                1.2128063 = boost
                3.4751394 = idf(docFreq=3720, maxDocs=44218)
                0.023054574 = queryNorm
              0.38009337 = fieldWeight in 1191, product of:
                1.0 = tf(freq=1.0), with freq of:
                  1.0 = termFreq=1.0
                3.4751394 = idf(docFreq=3720, maxDocs=44218)
                0.109375 = fieldNorm(doc=1191)
          0.04921137 = weight(abstract_txt:describes in 1191) [ClassicSimilarity], result of:
            0.04921137 = score(doc=1191,freq=1.0), product of:
              0.11765861 = queryWeight, product of:
                1.3345748 = boost
                3.8240511 = idf(docFreq=2624, maxDocs=44218)
                0.023054574 = queryNorm
              0.4182556 = fieldWeight in 1191, product of:
                1.0 = tf(freq=1.0), with freq of:
                  1.0 = termFreq=1.0
                3.8240511 = idf(docFreq=2624, maxDocs=44218)
                0.109375 = fieldNorm(doc=1191)
          0.06436855 = weight(abstract_txt:language in 1191) [ClassicSimilarity], result of:
            0.06436855 = score(doc=1191,freq=1.0), product of:
              0.14072219 = queryWeight, product of:
                1.4595277 = boost
                4.1820874 = idf(docFreq=1834, maxDocs=44218)
                0.023054574 = queryNorm
              0.45741582 = fieldWeight in 1191, product of:
                1.0 = tf(freq=1.0), with freq of:
                  1.0 = termFreq=1.0
                4.1820874 = idf(docFreq=1834, maxDocs=44218)
                0.109375 = fieldNorm(doc=1191)
          0.08179857 = weight(abstract_txt:techniques in 1191) [ClassicSimilarity], result of:
            0.08179857 = score(doc=1191,freq=1.0), product of:
              0.16509879 = queryWeight, product of:
                1.580895 = boost
                4.5298495 = idf(docFreq=1295, maxDocs=44218)
                0.023054574 = queryNorm
              0.49545228 = fieldWeight in 1191, product of:
                1.0 = tf(freq=1.0), with freq of:
                  1.0 = termFreq=1.0
                4.5298495 = idf(docFreq=1295, maxDocs=44218)
                0.109375 = fieldNorm(doc=1191)
          0.11533293 = weight(abstract_txt:natural in 1191) [ClassicSimilarity], result of:
            0.11533293 = score(doc=1191,freq=1.0), product of:
              0.2075944 = queryWeight, product of:
                1.7727149 = boost
                5.0794845 = idf(docFreq=747, maxDocs=44218)
                0.023054574 = queryNorm
              0.55556864 = fieldWeight in 1191, product of:
                1.0 = tf(freq=1.0), with freq of:
                  1.0 = termFreq=1.0
                5.0794845 = idf(docFreq=747, maxDocs=44218)
                0.109375 = fieldNorm(doc=1191)
          0.30996075 = weight(abstract_txt:system's in 1191) [ClassicSimilarity], result of:
            0.30996075 = score(doc=1191,freq=1.0), product of:
              0.40128338 = queryWeight, product of:
                2.464658 = boost
                7.062158 = idf(docFreq=102, maxDocs=44218)
                0.023054574 = queryNorm
              0.77242357 = fieldWeight in 1191, product of:
                1.0 = tf(freq=1.0), with freq of:
                  1.0 = termFreq=1.0
                7.062158 = idf(docFreq=102, maxDocs=44218)
                0.109375 = fieldNorm(doc=1191)
        0.28 = coord(7/25)
    
  5. Evans, D.A.; Lefferts, R.G.: CLARIT-TREC experiments (1995) 0.19
    0.19255131 = sum of:
      0.19255131 = product of:
        0.6876833 = sum of:
          0.095543206 = weight(abstract_txt:recall in 1912) [ClassicSimilarity], result of:
            0.095543206 = score(doc=1912,freq=1.0), product of:
              0.13295622 = queryWeight, product of:
                1.0031605 = boost
                5.7488523 = idf(docFreq=382, maxDocs=44218)
                0.023054574 = queryNorm
              0.71860653 = fieldWeight in 1912, product of:
                1.0 = tf(freq=1.0), with freq of:
                  1.0 = termFreq=1.0
                5.7488523 = idf(docFreq=382, maxDocs=44218)
                0.125 = fieldNorm(doc=1912)
          0.077143304 = weight(abstract_txt:system in 1912) [ClassicSimilarity], result of:
            0.077143304 = score(doc=1912,freq=4.0), product of:
              0.09150207 = queryWeight, product of:
                1.1769189 = boost
                3.3723085 = idf(docFreq=4123, maxDocs=44218)
                0.023054574 = queryNorm
              0.8430771 = fieldWeight in 1912, product of:
                2.0 = tf(freq=4.0), with freq of:
                  4.0 = termFreq=4.0
                3.3723085 = idf(docFreq=4123, maxDocs=44218)
                0.125 = fieldNorm(doc=1912)
          0.05624157 = weight(abstract_txt:describes in 1912) [ClassicSimilarity], result of:
            0.05624157 = score(doc=1912,freq=1.0), product of:
              0.11765861 = queryWeight, product of:
                1.3345748 = boost
                3.8240511 = idf(docFreq=2624, maxDocs=44218)
                0.023054574 = queryNorm
              0.4780064 = fieldWeight in 1912, product of:
                1.0 = tf(freq=1.0), with freq of:
                  1.0 = termFreq=1.0
                3.8240511 = idf(docFreq=2624, maxDocs=44218)
                0.125 = fieldNorm(doc=1912)
          0.07356406 = weight(abstract_txt:language in 1912) [ClassicSimilarity], result of:
            0.07356406 = score(doc=1912,freq=1.0), product of:
              0.14072219 = queryWeight, product of:
                1.4595277 = boost
                4.1820874 = idf(docFreq=1834, maxDocs=44218)
                0.023054574 = queryNorm
              0.5227609 = fieldWeight in 1912, product of:
                1.0 = tf(freq=1.0), with freq of:
                  1.0 = termFreq=1.0
                4.1820874 = idf(docFreq=1834, maxDocs=44218)
                0.125 = fieldNorm(doc=1912)
          0.08276192 = weight(abstract_txt:indexing in 1912) [ClassicSimilarity], result of:
            0.08276192 = score(doc=1912,freq=1.0), product of:
              0.15222026 = queryWeight, product of:
                1.5179844 = boost
                4.3495874 = idf(docFreq=1551, maxDocs=44218)
                0.023054574 = queryNorm
              0.54369843 = fieldWeight in 1912, product of:
                1.0 = tf(freq=1.0), with freq of:
                  1.0 = termFreq=1.0
                4.3495874 = idf(docFreq=1551, maxDocs=44218)
                0.125 = fieldNorm(doc=1912)
          0.17062017 = weight(abstract_txt:processing in 1912) [ClassicSimilarity], result of:
            0.17062017 = score(doc=1912,freq=2.0), product of:
              0.1957022 = queryWeight, product of:
                1.7211905 = boost
                4.931848 = idf(docFreq=866, maxDocs=44218)
                0.023054574 = queryNorm
              0.87183577 = fieldWeight in 1912, product of:
                1.4142135 = tf(freq=2.0), with freq of:
                  2.0 = termFreq=2.0
                4.931848 = idf(docFreq=866, maxDocs=44218)
                0.125 = fieldNorm(doc=1912)
          0.13180906 = weight(abstract_txt:natural in 1912) [ClassicSimilarity], result of:
            0.13180906 = score(doc=1912,freq=1.0), product of:
              0.2075944 = queryWeight, product of:
                1.7727149 = boost
                5.0794845 = idf(docFreq=747, maxDocs=44218)
                0.023054574 = queryNorm
              0.63493556 = fieldWeight in 1912, product of:
                1.0 = tf(freq=1.0), with freq of:
                  1.0 = termFreq=1.0
                5.0794845 = idf(docFreq=747, maxDocs=44218)
                0.125 = fieldNorm(doc=1912)
        0.28 = coord(7/25)