Document (#28942)

Author
Fong, A.C.M.
Title
Mining a Web citation database for document clustering
Source
Applied artificial intelligence. 16(2002) no.4, S.283-292
Year
2002
Theme
Citation indexing
Data Mining
Automatisches Klassifizieren

Similar documents (content)

  1. He, Y.; Hui, S.C.: PubSearch : a Web citation-based retrieval system (2001) 0.95
    0.9538769 = sum of:
      0.9538769 = product of:
        1.1923461 = sum of:
          0.13147925 = weight(abstract_txt:database in 807) [ClassicSimilarity], result of:
            0.13147925 = score(doc=807,freq=2.0), product of:
              0.2791973 = queryWeight, product of:
                4.26227 = idf(docFreq=1636, maxDocs=42740)
                0.06550437 = queryNorm
              0.47091874 = fieldWeight in 807, product of:
                1.4142135 = tf(freq=2.0), with freq of:
                  2.0 = termFreq=2.0
                4.26227 = idf(docFreq=1636, maxDocs=42740)
                0.078125 = fieldNorm(doc=807)
          0.163134 = weight(abstract_txt:document in 807) [ClassicSimilarity], result of:
            0.163134 = score(doc=807,freq=3.0), product of:
              0.28162572 = queryWeight, product of:
                1.0043395 = boost
                4.280766 = idf(docFreq=1606, maxDocs=42740)
                0.06550437 = queryNorm
              0.57925814 = fieldWeight in 807, product of:
                1.7320508 = tf(freq=3.0), with freq of:
                  3.0 = termFreq=3.0
                4.280766 = idf(docFreq=1606, maxDocs=42740)
                0.078125 = fieldNorm(doc=807)
          0.31974396 = weight(abstract_txt:citation in 807) [ClassicSimilarity], result of:
            0.31974396 = score(doc=807,freq=5.0), product of:
              0.37201574 = queryWeight, product of:
                1.1543169 = boost
                4.92001 = idf(docFreq=847, maxDocs=42740)
                0.06550437 = queryNorm
              0.8594904 = fieldWeight in 807, product of:
                2.236068 = tf(freq=5.0), with freq of:
                  5.0 = termFreq=5.0
                4.92001 = idf(docFreq=847, maxDocs=42740)
                0.078125 = fieldNorm(doc=807)
          0.5779889 = weight(abstract_txt:clustering in 807) [ClassicSimilarity], result of:
            0.5779889 = score(doc=807,freq=4.0), product of:
              0.5946701 = queryWeight, product of:
                1.4594272 = boost
                6.220473 = idf(docFreq=230, maxDocs=42740)
                0.06550437 = queryNorm
              0.97194886 = fieldWeight in 807, product of:
                2.0 = tf(freq=4.0), with freq of:
                  4.0 = termFreq=4.0
                6.220473 = idf(docFreq=230, maxDocs=42740)
                0.078125 = fieldNorm(doc=807)
        0.8 = coord(4/5)
    
  2. Zhan, J.; Loh, H.T.: Using latent semantic indexing to improve the accuracy of document clustering (2007) 0.74
    0.74410695 = sum of:
      0.74410695 = product of:
        1.2401782 = sum of:
          0.1883709 = weight(abstract_txt:document in 2265) [ClassicSimilarity], result of:
            0.1883709 = score(doc=2265,freq=4.0), product of:
              0.28162572 = queryWeight, product of:
                1.0043395 = boost
                4.280766 = idf(docFreq=1606, maxDocs=42740)
                0.06550437 = queryNorm
              0.6688697 = fieldWeight in 2265, product of:
                2.0 = tf(freq=4.0), with freq of:
                  4.0 = termFreq=4.0
                4.280766 = idf(docFreq=1606, maxDocs=42740)
                0.078125 = fieldNorm(doc=2265)
          0.28719983 = weight(abstract_txt:mining in 2265) [ClassicSimilarity], result of:
            0.28719983 = score(doc=2265,freq=1.0), product of:
              0.59220564 = queryWeight, product of:
                1.4563999 = boost
                6.2075696 = idf(docFreq=233, maxDocs=42740)
                0.06550437 = queryNorm
              0.48496637 = fieldWeight in 2265, product of:
                1.0 = tf(freq=1.0), with freq of:
                  1.0 = termFreq=1.0
                6.2075696 = idf(docFreq=233, maxDocs=42740)
                0.078125 = fieldNorm(doc=2265)
          0.7646075 = weight(abstract_txt:clustering in 2265) [ClassicSimilarity], result of:
            0.7646075 = score(doc=2265,freq=7.0), product of:
              0.5946701 = queryWeight, product of:
                1.4594272 = boost
                6.220473 = idf(docFreq=230, maxDocs=42740)
                0.06550437 = queryNorm
              1.2857674 = fieldWeight in 2265, product of:
                2.6457512 = tf(freq=7.0), with freq of:
                  7.0 = termFreq=7.0
                6.220473 = idf(docFreq=230, maxDocs=42740)
                0.078125 = fieldNorm(doc=2265)
        0.6 = coord(3/5)
    
  3. Kostoff, R.N.; Rio, J.A. del; Humenik, J.A.; Garcia, E.O.; Ramirez, A.M.: Citation mining : integrating text mining and bibliometrics for research user profiling (2001) 0.73
    0.72967196 = sum of:
      0.72967196 = product of:
        0.91208994 = sum of:
          0.05578192 = weight(abstract_txt:database in 851) [ClassicSimilarity], result of:
            0.05578192 = score(doc=851,freq=1.0), product of:
              0.2791973 = queryWeight, product of:
                4.26227 = idf(docFreq=1636, maxDocs=42740)
                0.06550437 = queryNorm
              0.1997939 = fieldWeight in 851, product of:
                1.0 = tf(freq=1.0), with freq of:
                  1.0 = termFreq=1.0
                4.26227 = idf(docFreq=1636, maxDocs=42740)
                0.046875 = fieldNorm(doc=851)
          0.22699569 = weight(abstract_txt:citation in 851) [ClassicSimilarity], result of:
            0.22699569 = score(doc=851,freq=7.0), product of:
              0.37201574 = queryWeight, product of:
                1.1543169 = boost
                4.92001 = idf(docFreq=847, maxDocs=42740)
                0.06550437 = queryNorm
              0.61017764 = fieldWeight in 851, product of:
                2.6457512 = tf(freq=7.0), with freq of:
                  7.0 = termFreq=7.0
                4.92001 = idf(docFreq=847, maxDocs=42740)
                0.046875 = fieldNorm(doc=851)
          0.4559156 = weight(abstract_txt:mining in 851) [ClassicSimilarity], result of:
            0.4559156 = score(doc=851,freq=7.0), product of:
              0.59220564 = queryWeight, product of:
                1.4563999 = boost
                6.2075696 = idf(docFreq=233, maxDocs=42740)
                0.06550437 = queryNorm
              0.76986027 = fieldWeight in 851, product of:
                2.6457512 = tf(freq=7.0), with freq of:
                  7.0 = termFreq=7.0
                6.2075696 = idf(docFreq=233, maxDocs=42740)
                0.046875 = fieldNorm(doc=851)
          0.17339669 = weight(abstract_txt:clustering in 851) [ClassicSimilarity], result of:
            0.17339669 = score(doc=851,freq=1.0), product of:
              0.5946701 = queryWeight, product of:
                1.4594272 = boost
                6.220473 = idf(docFreq=230, maxDocs=42740)
                0.06550437 = queryNorm
              0.29158467 = fieldWeight in 851, product of:
                1.0 = tf(freq=1.0), with freq of:
                  1.0 = termFreq=1.0
                6.220473 = idf(docFreq=230, maxDocs=42740)
                0.046875 = fieldNorm(doc=851)
        0.8 = coord(4/5)
    
  4. Liu, X.; Yu, S.; Janssens, F.; Glänzel, W.; Moreau, Y.; Moor, B.de: Weighted hybrid clustering by combining text mining and bibliometrics on a large-scale journal database (2010) 0.69
    0.68686634 = sum of:
      0.68686634 = product of:
        1.1447772 = sum of:
          0.092969865 = weight(abstract_txt:database in 465) [ClassicSimilarity], result of:
            0.092969865 = score(doc=465,freq=1.0), product of:
              0.2791973 = queryWeight, product of:
                4.26227 = idf(docFreq=1636, maxDocs=42740)
                0.06550437 = queryNorm
              0.33298984 = fieldWeight in 465, product of:
                1.0 = tf(freq=1.0), with freq of:
                  1.0 = termFreq=1.0
                4.26227 = idf(docFreq=1636, maxDocs=42740)
                0.078125 = fieldNorm(doc=465)
          0.28719983 = weight(abstract_txt:mining in 465) [ClassicSimilarity], result of:
            0.28719983 = score(doc=465,freq=1.0), product of:
              0.59220564 = queryWeight, product of:
                1.4563999 = boost
                6.2075696 = idf(docFreq=233, maxDocs=42740)
                0.06550437 = queryNorm
              0.48496637 = fieldWeight in 465, product of:
                1.0 = tf(freq=1.0), with freq of:
                  1.0 = termFreq=1.0
                6.2075696 = idf(docFreq=233, maxDocs=42740)
                0.078125 = fieldNorm(doc=465)
          0.7646075 = weight(abstract_txt:clustering in 465) [ClassicSimilarity], result of:
            0.7646075 = score(doc=465,freq=7.0), product of:
              0.5946701 = queryWeight, product of:
                1.4594272 = boost
                6.220473 = idf(docFreq=230, maxDocs=42740)
                0.06550437 = queryNorm
              1.2857674 = fieldWeight in 465, product of:
                2.6457512 = tf(freq=7.0), with freq of:
                  7.0 = termFreq=7.0
                6.220473 = idf(docFreq=230, maxDocs=42740)
                0.078125 = fieldNorm(doc=465)
        0.6 = coord(3/5)
    
  5. Tho, Q.T.; Hui, S.C.; Fong, A.C.M.: ¬A citation-based document retrieval system for finding research expertise (2007) 0.64
    0.63846326 = sum of:
      0.63846326 = product of:
        0.7980791 = sum of:
          0.092969865 = weight(abstract_txt:database in 2957) [ClassicSimilarity], result of:
            0.092969865 = score(doc=2957,freq=1.0), product of:
              0.2791973 = queryWeight, product of:
                4.26227 = idf(docFreq=1636, maxDocs=42740)
                0.06550437 = queryNorm
              0.33298984 = fieldWeight in 2957, product of:
                1.0 = tf(freq=1.0), with freq of:
                  1.0 = termFreq=1.0
                4.26227 = idf(docFreq=1636, maxDocs=42740)
                0.078125 = fieldNorm(doc=2957)
          0.09418545 = weight(abstract_txt:document in 2957) [ClassicSimilarity], result of:
            0.09418545 = score(doc=2957,freq=1.0), product of:
              0.28162572 = queryWeight, product of:
                1.0043395 = boost
                4.280766 = idf(docFreq=1606, maxDocs=42740)
                0.06550437 = queryNorm
              0.33443484 = fieldWeight in 2957, product of:
                1.0 = tf(freq=1.0), with freq of:
                  1.0 = termFreq=1.0
                4.280766 = idf(docFreq=1606, maxDocs=42740)
                0.078125 = fieldNorm(doc=2957)
          0.20222384 = weight(abstract_txt:citation in 2957) [ClassicSimilarity], result of:
            0.20222384 = score(doc=2957,freq=2.0), product of:
              0.37201574 = queryWeight, product of:
                1.1543169 = boost
                4.92001 = idf(docFreq=847, maxDocs=42740)
                0.06550437 = queryNorm
              0.5435895 = fieldWeight in 2957, product of:
                1.4142135 = tf(freq=2.0), with freq of:
                  2.0 = termFreq=2.0
                4.92001 = idf(docFreq=847, maxDocs=42740)
                0.078125 = fieldNorm(doc=2957)
          0.40869993 = weight(abstract_txt:clustering in 2957) [ClassicSimilarity], result of:
            0.40869993 = score(doc=2957,freq=2.0), product of:
              0.5946701 = queryWeight, product of:
                1.4594272 = boost
                6.220473 = idf(docFreq=230, maxDocs=42740)
                0.06550437 = queryNorm
              0.68727165 = fieldWeight in 2957, product of:
                1.4142135 = tf(freq=2.0), with freq of:
                  2.0 = termFreq=2.0
                6.220473 = idf(docFreq=230, maxDocs=42740)
                0.078125 = fieldNorm(doc=2957)
        0.8 = coord(4/5)