Document (#686)

Author
Faraj, N.
Title
Analyse d'une méthode d'indexation automatique basée sur une analyse syntaxique de texte
Source
Canadian journal of information and library science. 21(1996) no.1, S.1-21
Year
1996
Abstract
Evaluates an automatic indexing method based on syntactical text analysis combined with statistical analysis. Tests many combinations for the choice of term categories and weighting methods. The experiment, conducted on a software engineering corpus, shows a systematic improvement when syntactic term phrases are used as index terms, compared with using only individual words.
Footnote
Übers. d. Titels: Analysis of an automatic indexing method based on syntactic analysis of text
Theme
Automatisches Indexieren

Similar documents (content)

  1. Coret, A.; Menon, B.; Schibler, D.; Terrasse, C.: ¬Un système d'indexation structurée à l'INIST : bilan d'une étude préalable (1994) 0.18
    0.1783684 = sum of:
      0.1783684 = product of:
        2.2296052 = sum of:
          1.0941038 = weight(title_txt:d'indexation in 757) [ClassicSimilarity], result of:
            1.0941038 = score(doc=757,freq=1.0), product of:
              0.37027624 = queryWeight, product of:
                1.8197873 = boost
                9.45546 = idf(docFreq=8, maxDocs=42306)
                0.021519026 = queryNorm
              2.9548311 = fieldWeight in 757, product of:
                1.0 = tf(freq=1.0), with freq of:
                  1.0 = termFreq=1.0
                9.45546 = idf(docFreq=8, maxDocs=42306)
                0.3125 = fieldNorm(doc=757)
          1.1355015 = weight(title_txt:d'une in 757) [ClassicSimilarity], result of:
            1.1355015 = score(doc=757,freq=1.0), product of:
              0.37955844 = queryWeight, product of:
                1.8424556 = boost
                9.573242 = idf(docFreq=7, maxDocs=42306)
                0.021519026 = queryNorm
              2.9916382 = fieldWeight in 757, product of:
                1.0 = tf(freq=1.0), with freq of:
                  1.0 = termFreq=1.0
                9.573242 = idf(docFreq=7, maxDocs=42306)
                0.3125 = fieldNorm(doc=757)
        0.08 = coord(2/25)
    
  2. Lavallee, C.: Indexation manuelle et indexation assistée par ordinateur : comparaison de la performance de deux index d'une monographie (1996) 0.14
    0.1393604 = sum of:
      0.1393604 = product of:
        1.1613367 = sum of:
          0.09545349 = weight(abstract_txt:experiment in 741) [ClassicSimilarity], result of:
            0.09545349 = score(doc=741,freq=1.0), product of:
              0.13416567 = queryWeight, product of:
                1.0954143 = boost
                5.691679 = idf(docFreq=387, maxDocs=42306)
                0.021519026 = queryNorm
              0.7114599 = fieldWeight in 741, product of:
                1.0 = tf(freq=1.0), with freq of:
                  1.0 = termFreq=1.0
                5.691679 = idf(docFreq=387, maxDocs=42306)
                0.125 = fieldNorm(doc=741)
          0.15748197 = weight(abstract_txt:evaluates in 741) [ClassicSimilarity], result of:
            0.15748197 = score(doc=741,freq=1.0), product of:
              0.18732716 = queryWeight, product of:
                1.2943689 = boost
                6.7254305 = idf(docFreq=137, maxDocs=42306)
                0.021519026 = queryNorm
              0.8406788 = fieldWeight in 741, product of:
                1.0 = tf(freq=1.0), with freq of:
                  1.0 = termFreq=1.0
                6.7254305 = idf(docFreq=137, maxDocs=42306)
                0.125 = fieldNorm(doc=741)
          0.90840125 = weight(title_txt:d'une in 741) [ClassicSimilarity], result of:
            0.90840125 = score(doc=741,freq=1.0), product of:
              0.37955844 = queryWeight, product of:
                1.8424556 = boost
                9.573242 = idf(docFreq=7, maxDocs=42306)
                0.021519026 = queryNorm
              2.3933105 = fieldWeight in 741, product of:
                1.0 = tf(freq=1.0), with freq of:
                  1.0 = termFreq=1.0
                9.573242 = idf(docFreq=7, maxDocs=42306)
                0.25 = fieldNorm(doc=741)
        0.12 = coord(3/25)
    
  3. Grefenstette, G.: Explorations in automatic thesaurus discovery (1994) 0.14
    0.1392088 = sum of:
      0.1392088 = product of:
        0.58003664 = sum of:
          0.05446505 = weight(abstract_txt:automatic in 1171) [ClassicSimilarity], result of:
            0.05446505 = score(doc=1171,freq=1.0), product of:
              0.11181103 = queryWeight, product of:
                5.1959147 = idf(docFreq=636, maxDocs=42306)
                0.021519026 = queryNorm
              0.487117 = fieldWeight in 1171, product of:
                1.0 = tf(freq=1.0), with freq of:
                  1.0 = termFreq=1.0
                5.1959147 = idf(docFreq=636, maxDocs=42306)
                0.09375 = fieldNorm(doc=1171)
          0.059827007 = weight(abstract_txt:words in 1171) [ClassicSimilarity], result of:
            0.059827007 = score(doc=1171,freq=1.0), product of:
              0.119033955 = queryWeight, product of:
                1.0317943 = boost
                5.361115 = idf(docFreq=539, maxDocs=42306)
                0.021519026 = queryNorm
              0.50260454 = fieldWeight in 1171, product of:
                1.0 = tf(freq=1.0), with freq of:
                  1.0 = termFreq=1.0
                5.361115 = idf(docFreq=539, maxDocs=42306)
                0.09375 = fieldNorm(doc=1171)
          0.18612848 = weight(abstract_txt:syntactic in 1171) [ClassicSimilarity], result of:
            0.18612848 = score(doc=1171,freq=3.0), product of:
              0.17588986 = queryWeight, product of:
                1.2542326 = boost
                6.5168858 = idf(docFreq=169, maxDocs=42306)
                0.021519026 = queryNorm
              1.0582104 = fieldWeight in 1171, product of:
                1.7320508 = tf(freq=3.0), with freq of:
                  3.0 = termFreq=3.0
                6.5168858 = idf(docFreq=169, maxDocs=42306)
                0.09375 = fieldNorm(doc=1171)
          0.039336108 = weight(abstract_txt:analysis in 1171) [ClassicSimilarity], result of:
            0.039336108 = score(doc=1171,freq=1.0), product of:
              0.113399275 = queryWeight, product of:
                1.4242225 = boost
                3.7000692 = idf(docFreq=2842, maxDocs=42306)
                0.021519026 = queryNorm
              0.34688148 = fieldWeight in 1171, product of:
                1.0 = tf(freq=1.0), with freq of:
                  1.0 = termFreq=1.0
                3.7000692 = idf(docFreq=2842, maxDocs=42306)
                0.09375 = fieldNorm(doc=1171)
          0.08782271 = weight(abstract_txt:term in 1171) [ClassicSimilarity], result of:
            0.08782271 = score(doc=1171,freq=1.0), product of:
              0.19371083 = queryWeight, product of:
                1.8614426 = boost
                4.8359485 = idf(docFreq=912, maxDocs=42306)
                0.021519026 = queryNorm
              0.45337015 = fieldWeight in 1171, product of:
                1.0 = tf(freq=1.0), with freq of:
                  1.0 = termFreq=1.0
                4.8359485 = idf(docFreq=912, maxDocs=42306)
                0.09375 = fieldNorm(doc=1171)
          0.15245731 = weight(abstract_txt:analyse in 1171) [ClassicSimilarity], result of:
            0.15245731 = score(doc=1171,freq=1.0), product of:
              0.2798003 = queryWeight, product of:
                2.2371585 = boost
                5.8120427 = idf(docFreq=343, maxDocs=42306)
                0.021519026 = queryNorm
              0.544879 = fieldWeight in 1171, product of:
                1.0 = tf(freq=1.0), with freq of:
                  1.0 = termFreq=1.0
                5.8120427 = idf(docFreq=343, maxDocs=42306)
                0.09375 = fieldNorm(doc=1171)
        0.24 = coord(6/25)
    
  4. Lioma, C.; Ounis, I.: ¬A syntactically-based query reformulation technique for information retrieval (2008) 0.13
    0.13202283 = sum of:
      0.13202283 = product of:
        0.47151008 = sum of:
          0.07104275 = weight(abstract_txt:automatic in 4032) [ClassicSimilarity], result of:
            0.07104275 = score(doc=4032,freq=5.0), product of:
              0.11181103 = queryWeight, product of:
                5.1959147 = idf(docFreq=636, maxDocs=42306)
                0.021519026 = queryNorm
              0.6353823 = fieldWeight in 4032, product of:
                2.236068 = tf(freq=5.0), with freq of:
                  5.0 = termFreq=5.0
                5.1959147 = idf(docFreq=636, maxDocs=42306)
                0.0546875 = fieldNorm(doc=4032)
          0.034899086 = weight(abstract_txt:words in 4032) [ClassicSimilarity], result of:
            0.034899086 = score(doc=4032,freq=1.0), product of:
              0.119033955 = queryWeight, product of:
                1.0317943 = boost
                5.361115 = idf(docFreq=539, maxDocs=42306)
                0.021519026 = queryNorm
              0.29318598 = fieldWeight in 4032, product of:
                1.0 = tf(freq=1.0), with freq of:
                  1.0 = termFreq=1.0
                5.361115 = idf(docFreq=539, maxDocs=42306)
                0.0546875 = fieldNorm(doc=4032)
          0.03872194 = weight(abstract_txt:statistical in 4032) [ClassicSimilarity], result of:
            0.03872194 = score(doc=4032,freq=1.0), product of:
              0.12757519 = queryWeight, product of:
                1.068171 = boost
                5.5501256 = idf(docFreq=446, maxDocs=42306)
                0.021519026 = queryNorm
              0.3035225 = fieldWeight in 4032, product of:
                1.0 = tf(freq=1.0), with freq of:
                  1.0 = termFreq=1.0
                5.5501256 = idf(docFreq=446, maxDocs=42306)
                0.0546875 = fieldNorm(doc=4032)
          0.041760903 = weight(abstract_txt:experiment in 4032) [ClassicSimilarity], result of:
            0.041760903 = score(doc=4032,freq=1.0), product of:
              0.13416567 = queryWeight, product of:
                1.0954143 = boost
                5.691679 = idf(docFreq=387, maxDocs=42306)
                0.021519026 = queryNorm
              0.31126368 = fieldWeight in 4032, product of:
                1.0 = tf(freq=1.0), with freq of:
                  1.0 = termFreq=1.0
                5.691679 = idf(docFreq=387, maxDocs=42306)
                0.0546875 = fieldNorm(doc=4032)
          0.12537156 = weight(abstract_txt:syntactic in 4032) [ClassicSimilarity], result of:
            0.12537156 = score(doc=4032,freq=4.0), product of:
              0.17588986 = queryWeight, product of:
                1.2542326 = boost
                6.5168858 = idf(docFreq=169, maxDocs=42306)
                0.021519026 = queryNorm
              0.7127844 = fieldWeight in 4032, product of:
                2.0 = tf(freq=4.0), with freq of:
                  4.0 = termFreq=4.0
                6.5168858 = idf(docFreq=169, maxDocs=42306)
                0.0546875 = fieldNorm(doc=4032)
          0.10848391 = weight(abstract_txt:weighting in 4032) [ClassicSimilarity], result of:
            0.10848391 = score(doc=4032,freq=2.0), product of:
              0.20123108 = queryWeight, product of:
                1.3415449 = boost
                6.970553 = idf(docFreq=107, maxDocs=42306)
                0.021519026 = queryNorm
              0.5391012 = fieldWeight in 4032, product of:
                1.4142135 = tf(freq=2.0), with freq of:
                  2.0 = termFreq=2.0
                6.970553 = idf(docFreq=107, maxDocs=42306)
                0.0546875 = fieldNorm(doc=4032)
          0.051229917 = weight(abstract_txt:term in 4032) [ClassicSimilarity], result of:
            0.051229917 = score(doc=4032,freq=1.0), product of:
              0.19371083 = queryWeight, product of:
                1.8614426 = boost
                4.8359485 = idf(docFreq=912, maxDocs=42306)
                0.021519026 = queryNorm
              0.26446593 = fieldWeight in 4032, product of:
                1.0 = tf(freq=1.0), with freq of:
                  1.0 = termFreq=1.0
                4.8359485 = idf(docFreq=912, maxDocs=42306)
                0.0546875 = fieldNorm(doc=4032)
        0.28 = coord(7/25)
    
  5. Martins, A.L.; Souza, R.R.; Ribeiro de Mello, H.: ¬The use of noun phrases in information retrieval : proposing a mechanism for automatic classification (2014) 0.09
    0.093887314 = sum of:
      0.093887314 = product of:
        0.39119714 = sum of:
          0.060446993 = weight(abstract_txt:words in 3442) [ClassicSimilarity], result of:
            0.060446993 = score(doc=3442,freq=3.0), product of:
              0.119033955 = queryWeight, product of:
                1.0317943 = boost
                5.361115 = idf(docFreq=539, maxDocs=42306)
                0.021519026 = queryNorm
              0.50781304 = fieldWeight in 3442, product of:
                1.7320508 = tf(freq=3.0), with freq of:
                  3.0 = termFreq=3.0
                5.361115 = idf(docFreq=539, maxDocs=42306)
                0.0546875 = fieldNorm(doc=3442)
          0.041760903 = weight(abstract_txt:experiment in 3442) [ClassicSimilarity], result of:
            0.041760903 = score(doc=3442,freq=1.0), product of:
              0.13416567 = queryWeight, product of:
                1.0954143 = boost
                5.691679 = idf(docFreq=387, maxDocs=42306)
                0.021519026 = queryNorm
              0.31126368 = fieldWeight in 3442, product of:
                1.0 = tf(freq=1.0), with freq of:
                  1.0 = termFreq=1.0
                5.691679 = idf(docFreq=387, maxDocs=42306)
                0.0546875 = fieldNorm(doc=3442)
          0.07147425 = weight(abstract_txt:tests in 3442) [ClassicSimilarity], result of:
            0.07147425 = score(doc=3442,freq=2.0), product of:
              0.15236476 = queryWeight, product of:
                1.167347 = boost
                6.0654354 = idf(docFreq=266, maxDocs=42306)
                0.021519026 = queryNorm
              0.46909958 = fieldWeight in 3442, product of:
                1.4142135 = tf(freq=2.0), with freq of:
                  2.0 = termFreq=2.0
                6.0654354 = idf(docFreq=266, maxDocs=42306)
                0.0546875 = fieldNorm(doc=3442)
          0.052304797 = weight(abstract_txt:corpus in 3442) [ClassicSimilarity], result of:
            0.052304797 = score(doc=3442,freq=1.0), product of:
              0.15589152 = queryWeight, product of:
                1.1807798 = boost
                6.1352315 = idf(docFreq=248, maxDocs=42306)
                0.021519026 = queryNorm
              0.33552048 = fieldWeight in 3442, product of:
                1.0 = tf(freq=1.0), with freq of:
                  1.0 = termFreq=1.0
                6.1352315 = idf(docFreq=248, maxDocs=42306)
                0.0546875 = fieldNorm(doc=3442)
          0.06268578 = weight(abstract_txt:syntactic in 3442) [ClassicSimilarity], result of:
            0.06268578 = score(doc=3442,freq=1.0), product of:
              0.17588986 = queryWeight, product of:
                1.2542326 = boost
                6.5168858 = idf(docFreq=169, maxDocs=42306)
                0.021519026 = queryNorm
              0.3563922 = fieldWeight in 3442, product of:
                1.0 = tf(freq=1.0), with freq of:
                  1.0 = termFreq=1.0
                6.5168858 = idf(docFreq=169, maxDocs=42306)
                0.0546875 = fieldNorm(doc=3442)
          0.102524385 = weight(abstract_txt:phrases in 3442) [ClassicSimilarity], result of:
            0.102524385 = score(doc=3442,freq=2.0), product of:
              0.1937922 = queryWeight, product of:
                1.3165151 = boost
                6.8405 = idf(docFreq=122, maxDocs=42306)
                0.021519026 = queryNorm
              0.5290429 = fieldWeight in 3442, product of:
                1.4142135 = tf(freq=2.0), with freq of:
                  2.0 = termFreq=2.0
                6.8405 = idf(docFreq=122, maxDocs=42306)
                0.0546875 = fieldNorm(doc=3442)
        0.24 = coord(6/25)