Document (#28942)

Author
Fong, A.C.M.
Title
Mining a Web citation database for document clustering
Source
Applied artificial intelligence. 16(2002) no.4, S.283-292
Year
2002
Theme
Citation indexing
Data Mining
Automatisches Klassifizieren

Similar documents (content)

  1. He, Y.; Hui, S.C.: PubSearch : a Web citation-based retrieval system (2001) 0.95
    0.9533753 = sum of:
      0.9533753 = product of:
        1.191719 = sum of:
          0.13143508 = weight(abstract_txt:database in 5807) [ClassicSimilarity], result of:
            0.13143508 = score(doc=5807,freq=2.0), product of:
              0.27916434 = queryWeight, product of:
                4.2613416 = idf(docFreq=1632, maxDocs=42596)
                0.06551091 = queryNorm
              0.47081617 = fieldWeight in 5807, product of:
                1.4142135 = tf(freq=2.0), with freq of:
                  2.0 = termFreq=2.0
                4.2613416 = idf(docFreq=1632, maxDocs=42596)
                0.078125 = fieldNorm(doc=5807)
          0.1629424 = weight(abstract_txt:document in 5807) [ClassicSimilarity], result of:
            0.1629424 = score(doc=5807,freq=3.0), product of:
              0.28143498 = queryWeight, product of:
                1.0040586 = boost
                4.2786365 = idf(docFreq=1604, maxDocs=42596)
                0.06551091 = queryNorm
              0.57896996 = fieldWeight in 5807, product of:
                1.7320508 = tf(freq=3.0), with freq of:
                  3.0 = termFreq=3.0
                4.2786365 = idf(docFreq=1604, maxDocs=42596)
                0.078125 = fieldNorm(doc=5807)
          0.32010952 = weight(abstract_txt:citation in 5807) [ClassicSimilarity], result of:
            0.32010952 = score(doc=5807,freq=5.0), product of:
              0.37233865 = queryWeight, product of:
                1.1548859 = boost
                4.9213634 = idf(docFreq=843, maxDocs=42596)
                0.06551091 = queryNorm
              0.8597268 = fieldWeight in 5807, product of:
                2.236068 = tf(freq=5.0), with freq of:
                  5.0 = termFreq=5.0
                4.9213634 = idf(docFreq=843, maxDocs=42596)
                0.078125 = fieldNorm(doc=5807)
          0.577232 = weight(abstract_txt:clustering in 5807) [ClassicSimilarity], result of:
            0.577232 = score(doc=5807,freq=4.0), product of:
              0.5942137 = queryWeight, product of:
                1.4589531 = boost
                6.2170978 = idf(docFreq=230, maxDocs=42596)
                0.06551091 = queryNorm
              0.97142154 = fieldWeight in 5807, product of:
                2.0 = tf(freq=4.0), with freq of:
                  4.0 = termFreq=4.0
                6.2170978 = idf(docFreq=230, maxDocs=42596)
                0.078125 = fieldNorm(doc=5807)
        0.8 = coord(4/5)
    
  2. Zhan, J.; Loh, H.T.: Using latent semantic indexing to improve the accuracy of document clustering (2007) 0.74
    0.7435038 = sum of:
      0.7435038 = product of:
        1.2391729 = sum of:
          0.18814969 = weight(abstract_txt:document in 1444) [ClassicSimilarity], result of:
            0.18814969 = score(doc=1444,freq=4.0), product of:
              0.28143498 = queryWeight, product of:
                1.0040586 = boost
                4.2786365 = idf(docFreq=1604, maxDocs=42596)
                0.06551091 = queryNorm
              0.66853696 = fieldWeight in 1444, product of:
                2.0 = tf(freq=4.0), with freq of:
                  4.0 = termFreq=4.0
                4.2786365 = idf(docFreq=1604, maxDocs=42596)
                0.078125 = fieldNorm(doc=1444)
          0.28741705 = weight(abstract_txt:mining in 1444) [ClassicSimilarity], result of:
            0.28741705 = score(doc=1444,freq=1.0), product of:
              0.59256697 = queryWeight, product of:
                1.4569302 = boost
                6.208477 = idf(docFreq=232, maxDocs=42596)
                0.06551091 = queryNorm
              0.48503727 = fieldWeight in 1444, product of:
                1.0 = tf(freq=1.0), with freq of:
                  1.0 = termFreq=1.0
                6.208477 = idf(docFreq=232, maxDocs=42596)
                0.078125 = fieldNorm(doc=1444)
          0.7636062 = weight(abstract_txt:clustering in 1444) [ClassicSimilarity], result of:
            0.7636062 = score(doc=1444,freq=7.0), product of:
              0.5942137 = queryWeight, product of:
                1.4589531 = boost
                6.2170978 = idf(docFreq=230, maxDocs=42596)
                0.06551091 = queryNorm
              1.28507 = fieldWeight in 1444, product of:
                2.6457512 = tf(freq=7.0), with freq of:
                  7.0 = termFreq=7.0
                6.2170978 = idf(docFreq=230, maxDocs=42596)
                0.078125 = fieldNorm(doc=1444)
        0.6 = coord(3/5)
    
  3. Kostoff, R.N.; Rio, J.A. del; Humenik, J.A.; Garcia, E.O.; Ramirez, A.M.: Citation mining : integrating text mining and bibliometrics for research user profiling (2001) 0.73
    0.7299588 = sum of:
      0.7299588 = product of:
        0.91244847 = sum of:
          0.05576319 = weight(abstract_txt:database in 851) [ClassicSimilarity], result of:
            0.05576319 = score(doc=851,freq=1.0), product of:
              0.27916434 = queryWeight, product of:
                4.2613416 = idf(docFreq=1632, maxDocs=42596)
                0.06551091 = queryNorm
              0.1997504 = fieldWeight in 851, product of:
                1.0 = tf(freq=1.0), with freq of:
                  1.0 = termFreq=1.0
                4.2613416 = idf(docFreq=1632, maxDocs=42596)
                0.046875 = fieldNorm(doc=851)
          0.22725521 = weight(abstract_txt:citation in 851) [ClassicSimilarity], result of:
            0.22725521 = score(doc=851,freq=7.0), product of:
              0.37233865 = queryWeight, product of:
                1.1548859 = boost
                4.9213634 = idf(docFreq=843, maxDocs=42596)
                0.06551091 = queryNorm
              0.6103455 = fieldWeight in 851, product of:
                2.6457512 = tf(freq=7.0), with freq of:
                  7.0 = termFreq=7.0
                4.9213634 = idf(docFreq=843, maxDocs=42596)
                0.046875 = fieldNorm(doc=851)
          0.45626044 = weight(abstract_txt:mining in 851) [ClassicSimilarity], result of:
            0.45626044 = score(doc=851,freq=7.0), product of:
              0.59256697 = queryWeight, product of:
                1.4569302 = boost
                6.208477 = idf(docFreq=232, maxDocs=42596)
                0.06551091 = queryNorm
              0.7699728 = fieldWeight in 851, product of:
                2.6457512 = tf(freq=7.0), with freq of:
                  7.0 = termFreq=7.0
                6.208477 = idf(docFreq=232, maxDocs=42596)
                0.046875 = fieldNorm(doc=851)
          0.1731696 = weight(abstract_txt:clustering in 851) [ClassicSimilarity], result of:
            0.1731696 = score(doc=851,freq=1.0), product of:
              0.5942137 = queryWeight, product of:
                1.4589531 = boost
                6.2170978 = idf(docFreq=230, maxDocs=42596)
                0.06551091 = queryNorm
              0.29142645 = fieldWeight in 851, product of:
                1.0 = tf(freq=1.0), with freq of:
                  1.0 = termFreq=1.0
                6.2170978 = idf(docFreq=230, maxDocs=42596)
                0.046875 = fieldNorm(doc=851)
        0.8 = coord(4/5)
    
  4. Liu, X.; Yu, S.; Janssens, F.; Glänzel, W.; Moreau, Y.; Moor, B.de: Weighted hybrid clustering by combining text mining and bibliometrics on a large-scale journal database (2010) 0.69
    0.68637717 = sum of:
      0.68637717 = product of:
        1.1439619 = sum of:
          0.09293864 = weight(abstract_txt:database in 4644) [ClassicSimilarity], result of:
            0.09293864 = score(doc=4644,freq=1.0), product of:
              0.27916434 = queryWeight, product of:
                4.2613416 = idf(docFreq=1632, maxDocs=42596)
                0.06551091 = queryNorm
              0.3329173 = fieldWeight in 4644, product of:
                1.0 = tf(freq=1.0), with freq of:
                  1.0 = termFreq=1.0
                4.2613416 = idf(docFreq=1632, maxDocs=42596)
                0.078125 = fieldNorm(doc=4644)
          0.28741705 = weight(abstract_txt:mining in 4644) [ClassicSimilarity], result of:
            0.28741705 = score(doc=4644,freq=1.0), product of:
              0.59256697 = queryWeight, product of:
                1.4569302 = boost
                6.208477 = idf(docFreq=232, maxDocs=42596)
                0.06551091 = queryNorm
              0.48503727 = fieldWeight in 4644, product of:
                1.0 = tf(freq=1.0), with freq of:
                  1.0 = termFreq=1.0
                6.208477 = idf(docFreq=232, maxDocs=42596)
                0.078125 = fieldNorm(doc=4644)
          0.7636062 = weight(abstract_txt:clustering in 4644) [ClassicSimilarity], result of:
            0.7636062 = score(doc=4644,freq=7.0), product of:
              0.5942137 = queryWeight, product of:
                1.4589531 = boost
                6.2170978 = idf(docFreq=230, maxDocs=42596)
                0.06551091 = queryNorm
              1.28507 = fieldWeight in 4644, product of:
                2.6457512 = tf(freq=7.0), with freq of:
                  7.0 = termFreq=7.0
                6.2170978 = idf(docFreq=230, maxDocs=42596)
                0.078125 = fieldNorm(doc=4644)
        0.6 = coord(3/5)
    
  5. Tho, Q.T.; Hui, S.C.; Fong, A.C.M.: ¬A citation-based document retrieval system for finding research expertise (2007) 0.64
    0.6381065 = sum of:
      0.6381065 = product of:
        0.7976332 = sum of:
          0.09293864 = weight(abstract_txt:database in 2136) [ClassicSimilarity], result of:
            0.09293864 = score(doc=2136,freq=1.0), product of:
              0.27916434 = queryWeight, product of:
                4.2613416 = idf(docFreq=1632, maxDocs=42596)
                0.06551091 = queryNorm
              0.3329173 = fieldWeight in 2136, product of:
                1.0 = tf(freq=1.0), with freq of:
                  1.0 = termFreq=1.0
                4.2613416 = idf(docFreq=1632, maxDocs=42596)
                0.078125 = fieldNorm(doc=2136)
          0.094074845 = weight(abstract_txt:document in 2136) [ClassicSimilarity], result of:
            0.094074845 = score(doc=2136,freq=1.0), product of:
              0.28143498 = queryWeight, product of:
                1.0040586 = boost
                4.2786365 = idf(docFreq=1604, maxDocs=42596)
                0.06551091 = queryNorm
              0.33426848 = fieldWeight in 2136, product of:
                1.0 = tf(freq=1.0), with freq of:
                  1.0 = termFreq=1.0
                4.2786365 = idf(docFreq=1604, maxDocs=42596)
                0.078125 = fieldNorm(doc=2136)
          0.20245503 = weight(abstract_txt:citation in 2136) [ClassicSimilarity], result of:
            0.20245503 = score(doc=2136,freq=2.0), product of:
              0.37233865 = queryWeight, product of:
                1.1548859 = boost
                4.9213634 = idf(docFreq=843, maxDocs=42596)
                0.06551091 = queryNorm
              0.54373896 = fieldWeight in 2136, product of:
                1.4142135 = tf(freq=2.0), with freq of:
                  2.0 = termFreq=2.0
                4.9213634 = idf(docFreq=843, maxDocs=42596)
                0.078125 = fieldNorm(doc=2136)
          0.40816468 = weight(abstract_txt:clustering in 2136) [ClassicSimilarity], result of:
            0.40816468 = score(doc=2136,freq=2.0), product of:
              0.5942137 = queryWeight, product of:
                1.4589531 = boost
                6.2170978 = idf(docFreq=230, maxDocs=42596)
                0.06551091 = queryNorm
              0.68689877 = fieldWeight in 2136, product of:
                1.4142135 = tf(freq=2.0), with freq of:
                  2.0 = termFreq=2.0
                6.2170978 = idf(docFreq=230, maxDocs=42596)
                0.078125 = fieldNorm(doc=2136)
        0.8 = coord(4/5)