Document (#24089)

Author
Ahonen, H.
Title
Knowledge discovery in documents by extracting frequent word sequences
Source
Library trends. 48(1999) no.1, S.160-181
Year
1999
Theme
Computerlinguistik
Informetrie

Similar documents (content)

  1. Torra, V.; Lanau, S.; Miyamoto, S.: Image clustering for the exploration of video sequences (2006) 0.36
    0.36002094 = sum of:
      0.36002094 = product of:
        1.2600732 = sum of:
          0.3652213 = weight(abstract_txt:extracting in 5284) [ClassicSimilarity], result of:
            0.3652213 = score(doc=5284,freq=1.0), product of:
              0.48151466 = queryWeight, product of:
                1.951907 = boost
                6.9347134 = idf(docFreq=116, maxDocs=44218)
                0.035573114 = queryNorm
              0.75848424 = fieldWeight in 5284, product of:
                1.0 = tf(freq=1.0), with freq of:
                  1.0 = termFreq=1.0
                6.9347134 = idf(docFreq=116, maxDocs=44218)
                0.109375 = fieldNorm(doc=5284)
          0.89485186 = weight(abstract_txt:sequences in 5284) [ClassicSimilarity], result of:
            0.89485186 = score(doc=5284,freq=4.0), product of:
              0.5512977 = queryWeight, product of:
                2.0885625 = boost
                7.4202213 = idf(docFreq=71, maxDocs=44218)
                0.035573114 = queryNorm
              1.6231735 = fieldWeight in 5284, product of:
                2.0 = tf(freq=4.0), with freq of:
                  4.0 = termFreq=4.0
                7.4202213 = idf(docFreq=71, maxDocs=44218)
                0.109375 = fieldNorm(doc=5284)
        0.2857143 = coord(2/7)
    
  2. Wolfekuhler, M.R.; Punch, W.F.: Finding salient features for personal Web pages categories (1997) 0.31
    0.30957347 = sum of:
      0.30957347 = product of:
        0.7223381 = sum of:
          0.10841492 = weight(abstract_txt:documents in 2673) [ClassicSimilarity], result of:
            0.10841492 = score(doc=2673,freq=2.0), product of:
              0.17006756 = queryWeight, product of:
                1.160019 = boost
                4.1213026 = idf(docFreq=1949, maxDocs=44218)
                0.035573114 = queryNorm
              0.63748145 = fieldWeight in 2673, product of:
                1.4142135 = tf(freq=2.0), with freq of:
                  2.0 = termFreq=2.0
                4.1213026 = idf(docFreq=1949, maxDocs=44218)
                0.109375 = fieldNorm(doc=2673)
          0.24870187 = weight(abstract_txt:word in 2673) [ClassicSimilarity], result of:
            0.24870187 = score(doc=2673,freq=2.0), product of:
              0.29581136 = queryWeight, product of:
                1.5298955 = boost
                5.4353957 = idf(docFreq=523, maxDocs=44218)
                0.035573114 = queryNorm
              0.84074485 = fieldWeight in 2673, product of:
                1.4142135 = tf(freq=2.0), with freq of:
                  2.0 = termFreq=2.0
                5.4353957 = idf(docFreq=523, maxDocs=44218)
                0.109375 = fieldNorm(doc=2673)
          0.3652213 = weight(abstract_txt:extracting in 2673) [ClassicSimilarity], result of:
            0.3652213 = score(doc=2673,freq=1.0), product of:
              0.48151466 = queryWeight, product of:
                1.951907 = boost
                6.9347134 = idf(docFreq=116, maxDocs=44218)
                0.035573114 = queryNorm
              0.75848424 = fieldWeight in 2673, product of:
                1.0 = tf(freq=1.0), with freq of:
                  1.0 = termFreq=1.0
                6.9347134 = idf(docFreq=116, maxDocs=44218)
                0.109375 = fieldNorm(doc=2673)
        0.42857143 = coord(3/7)
    
  3. Fayyad, U.M.: Data mining and knowledge discovery : making sense out of data (1996) 0.31
    0.30807617 = sum of:
      0.30807617 = product of:
        0.7188444 = sum of:
          0.07937535 = weight(abstract_txt:knowledge in 7007) [ClassicSimilarity], result of:
            0.07937535 = score(doc=7007,freq=2.0), product of:
              0.12638375 = queryWeight, product of:
                3.5527887 = idf(docFreq=3442, maxDocs=44218)
                0.035573114 = queryNorm
              0.62805027 = fieldWeight in 7007, product of:
                1.4142135 = tf(freq=2.0), with freq of:
                  2.0 = termFreq=2.0
                3.5527887 = idf(docFreq=3442, maxDocs=44218)
                0.125 = fieldNorm(doc=7007)
          0.22207333 = weight(abstract_txt:discovery in 7007) [ClassicSimilarity], result of:
            0.22207333 = score(doc=7007,freq=1.0), product of:
              0.3161611 = queryWeight, product of:
                1.5816435 = boost
                5.619245 = idf(docFreq=435, maxDocs=44218)
                0.035573114 = queryNorm
              0.70240563 = fieldWeight in 7007, product of:
                1.0 = tf(freq=1.0), with freq of:
                  1.0 = termFreq=1.0
                5.619245 = idf(docFreq=435, maxDocs=44218)
                0.125 = fieldNorm(doc=7007)
          0.41739577 = weight(abstract_txt:extracting in 7007) [ClassicSimilarity], result of:
            0.41739577 = score(doc=7007,freq=1.0), product of:
              0.48151466 = queryWeight, product of:
                1.951907 = boost
                6.9347134 = idf(docFreq=116, maxDocs=44218)
                0.035573114 = queryNorm
              0.8668392 = fieldWeight in 7007, product of:
                1.0 = tf(freq=1.0), with freq of:
                  1.0 = termFreq=1.0
                6.9347134 = idf(docFreq=116, maxDocs=44218)
                0.125 = fieldNorm(doc=7007)
        0.42857143 = coord(3/7)
    
  4. Grau, B.: Finding answers to questions, in text collections or Web, in open domain or specialty domains (2012) 0.27
    0.26714504 = sum of:
      0.26714504 = product of:
        0.4675038 = sum of:
          0.028063424 = weight(abstract_txt:knowledge in 107) [ClassicSimilarity], result of:
            0.028063424 = score(doc=107,freq=1.0), product of:
              0.12638375 = queryWeight, product of:
                3.5527887 = idf(docFreq=3442, maxDocs=44218)
                0.035573114 = queryNorm
              0.2220493 = fieldWeight in 107, product of:
                1.0 = tf(freq=1.0), with freq of:
                  1.0 = termFreq=1.0
                3.5527887 = idf(docFreq=3442, maxDocs=44218)
                0.0625 = fieldNorm(doc=107)
          0.043806244 = weight(abstract_txt:documents in 107) [ClassicSimilarity], result of:
            0.043806244 = score(doc=107,freq=1.0), product of:
              0.17006756 = queryWeight, product of:
                1.160019 = boost
                4.1213026 = idf(docFreq=1949, maxDocs=44218)
                0.035573114 = queryNorm
              0.2575814 = fieldWeight in 107, product of:
                1.0 = tf(freq=1.0), with freq of:
                  1.0 = termFreq=1.0
                4.1213026 = idf(docFreq=1949, maxDocs=44218)
                0.0625 = fieldNorm(doc=107)
          0.100490734 = weight(abstract_txt:word in 107) [ClassicSimilarity], result of:
            0.100490734 = score(doc=107,freq=1.0), product of:
              0.29581136 = queryWeight, product of:
                1.5298955 = boost
                5.4353957 = idf(docFreq=523, maxDocs=44218)
                0.035573114 = queryNorm
              0.33971223 = fieldWeight in 107, product of:
                1.0 = tf(freq=1.0), with freq of:
                  1.0 = termFreq=1.0
                5.4353957 = idf(docFreq=523, maxDocs=44218)
                0.0625 = fieldNorm(doc=107)
          0.29514337 = weight(abstract_txt:extracting in 107) [ClassicSimilarity], result of:
            0.29514337 = score(doc=107,freq=2.0), product of:
              0.48151466 = queryWeight, product of:
                1.951907 = boost
                6.9347134 = idf(docFreq=116, maxDocs=44218)
                0.035573114 = queryNorm
              0.6129478 = fieldWeight in 107, product of:
                1.4142135 = tf(freq=2.0), with freq of:
                  2.0 = termFreq=2.0
                6.9347134 = idf(docFreq=116, maxDocs=44218)
                0.0625 = fieldNorm(doc=107)
        0.5714286 = coord(4/7)
    
  5. Trybula, W.J.: Data mining and knowledge discovery (1997) 0.27
    0.26635805 = sum of:
      0.26635805 = product of:
        0.6215021 = sum of:
          0.07291091 = weight(abstract_txt:knowledge in 2300) [ClassicSimilarity], result of:
            0.07291091 = score(doc=2300,freq=3.0), product of:
              0.12638375 = queryWeight, product of:
                3.5527887 = idf(docFreq=3442, maxDocs=44218)
                0.035573114 = queryNorm
              0.576901 = fieldWeight in 2300, product of:
                1.7320508 = tf(freq=3.0), with freq of:
                  3.0 = termFreq=3.0
                3.5527887 = idf(docFreq=3442, maxDocs=44218)
                0.09375 = fieldNorm(doc=2300)
          0.23554435 = weight(abstract_txt:discovery in 2300) [ClassicSimilarity], result of:
            0.23554435 = score(doc=2300,freq=2.0), product of:
              0.3161611 = queryWeight, product of:
                1.5816435 = boost
                5.619245 = idf(docFreq=435, maxDocs=44218)
                0.035573114 = queryNorm
              0.7450137 = fieldWeight in 2300, product of:
                1.4142135 = tf(freq=2.0), with freq of:
                  2.0 = termFreq=2.0
                5.619245 = idf(docFreq=435, maxDocs=44218)
                0.09375 = fieldNorm(doc=2300)
          0.31304684 = weight(abstract_txt:extracting in 2300) [ClassicSimilarity], result of:
            0.31304684 = score(doc=2300,freq=1.0), product of:
              0.48151466 = queryWeight, product of:
                1.951907 = boost
                6.9347134 = idf(docFreq=116, maxDocs=44218)
                0.035573114 = queryNorm
              0.6501294 = fieldWeight in 2300, product of:
                1.0 = tf(freq=1.0), with freq of:
                  1.0 = termFreq=1.0
                6.9347134 = idf(docFreq=116, maxDocs=44218)
                0.09375 = fieldNorm(doc=2300)
        0.42857143 = coord(3/7)