Document (#29086)

Author
Yu, W.
Gong, Y.
Title
Document clustering by concept factorization
Source
SIGIR'04: Proceedings of the 27th Annual International ACM-SIGIR Conference on Research and Development in Information Retrieval. Ed.: K. Järvelin, u.a.
Imprint
New York, NY : ACM Press
Year
2004
Pages
S.202-209
Theme
Automatisches Klassifizieren

Similar documents (content)

  1. Cai, X.; Li, W.: Enhancing sentence-level clustering with integrated and interactive frameworks for theme-based summarization (2011) 0.61
    0.61448485 = sum of:
      0.61448485 = product of:
        0.8193131 = sum of:
          0.12240938 = weight(abstract_txt:document in 1771) [ClassicSimilarity], result of:
            0.12240938 = score(doc=1771,freq=6.0), product of:
              0.18678309 = queryWeight, product of:
                4.280766 = idf(docFreq=1606, maxDocs=42740)
                0.0436331 = queryNorm
              0.6553558 = fieldWeight in 1771, product of:
                2.4494898 = tf(freq=6.0), with freq of:
                  6.0 = termFreq=6.0
                4.280766 = idf(docFreq=1606, maxDocs=42740)
                0.0625 = fieldNorm(doc=1771)
          0.10303507 = weight(abstract_txt:concept in 1771) [ClassicSimilarity], result of:
            0.10303507 = score(doc=1771,freq=3.0), product of:
              0.20979469 = queryWeight, product of:
                1.0598111 = boost
                4.5368032 = idf(docFreq=1243, maxDocs=42740)
                0.0436331 = queryNorm
              0.49112335 = fieldWeight in 1771, product of:
                1.7320508 = tf(freq=3.0), with freq of:
                  3.0 = termFreq=3.0
                4.5368032 = idf(docFreq=1243, maxDocs=42740)
                0.0625 = fieldNorm(doc=1771)
          0.5938687 = weight(abstract_txt:clustering in 1771) [ClassicSimilarity], result of:
            0.5938687 = score(doc=1771,freq=15.0), product of:
              0.39440405 = queryWeight, product of:
                1.4531214 = boost
                6.220473 = idf(docFreq=230, maxDocs=42740)
                0.0436331 = queryNorm
              1.5057367 = fieldWeight in 1771, product of:
                3.8729835 = tf(freq=15.0), with freq of:
                  15.0 = termFreq=15.0
                6.220473 = idf(docFreq=230, maxDocs=42740)
                0.0625 = fieldNorm(doc=1771)
        0.75 = coord(3/4)
    
  2. Lee, J.-H.; Park, S.; Ahn, C.-M.; Kim, D.: Automatic generic document summarization based on non-negative matrix factorization (2009) 0.43
    0.43299425 = sum of:
      0.43299425 = product of:
        0.8659885 = sum of:
          0.10600963 = weight(abstract_txt:document in 4449) [ClassicSimilarity], result of:
            0.10600963 = score(doc=4449,freq=2.0), product of:
              0.18678309 = queryWeight, product of:
                4.280766 = idf(docFreq=1606, maxDocs=42740)
                0.0436331 = queryNorm
              0.5675548 = fieldWeight in 4449, product of:
                1.4142135 = tf(freq=2.0), with freq of:
                  2.0 = termFreq=2.0
                4.280766 = idf(docFreq=1606, maxDocs=42740)
                0.09375 = fieldNorm(doc=4449)
          0.75997883 = weight(abstract_txt:factorization in 4449) [ClassicSimilarity], result of:
            0.75997883 = score(doc=4449,freq=1.0), product of:
              0.87495357 = queryWeight, product of:
                2.1643312 = boost
                9.264996 = idf(docFreq=10, maxDocs=42740)
                0.0436331 = queryNorm
              0.86859334 = fieldWeight in 4449, product of:
                1.0 = tf(freq=1.0), with freq of:
                  1.0 = termFreq=1.0
                9.264996 = idf(docFreq=10, maxDocs=42740)
                0.09375 = fieldNorm(doc=4449)
        0.5 = coord(2/4)
    
  3. Berry, M.W.; Esau, R.; Kiefer, B.: ¬The use of text mining techniques in electronic discovery for legal matters (2012) 0.42
    0.41746947 = sum of:
      0.41746947 = product of:
        0.83493894 = sum of:
          0.074960135 = weight(abstract_txt:document in 2092) [ClassicSimilarity], result of:
            0.074960135 = score(doc=2092,freq=1.0), product of:
              0.18678309 = queryWeight, product of:
                4.280766 = idf(docFreq=1606, maxDocs=42740)
                0.0436331 = queryNorm
              0.40132183 = fieldWeight in 2092, product of:
                1.0 = tf(freq=1.0), with freq of:
                  1.0 = termFreq=1.0
                4.280766 = idf(docFreq=1606, maxDocs=42740)
                0.09375 = fieldNorm(doc=2092)
          0.75997883 = weight(abstract_txt:factorization in 2092) [ClassicSimilarity], result of:
            0.75997883 = score(doc=2092,freq=1.0), product of:
              0.87495357 = queryWeight, product of:
                2.1643312 = boost
                9.264996 = idf(docFreq=10, maxDocs=42740)
                0.0436331 = queryNorm
              0.86859334 = fieldWeight in 2092, product of:
                1.0 = tf(freq=1.0), with freq of:
                  1.0 = termFreq=1.0
                9.264996 = idf(docFreq=10, maxDocs=42740)
                0.09375 = fieldNorm(doc=2092)
        0.5 = coord(2/4)
    
  4. Na, S.-H.; Kang, I.-S.; Lee, J.-H.: Adaptive document clustering based on query-based similarity (2007) 0.41
    0.41012013 = sum of:
      0.41012013 = product of:
        0.54682684 = sum of:
          0.11174396 = weight(abstract_txt:document in 2921) [ClassicSimilarity], result of:
            0.11174396 = score(doc=2921,freq=5.0), product of:
              0.18678309 = queryWeight, product of:
                4.280766 = idf(docFreq=1606, maxDocs=42740)
                0.0436331 = queryNorm
              0.5982552 = fieldWeight in 2921, product of:
                2.236068 = tf(freq=5.0), with freq of:
                  5.0 = termFreq=5.0
                4.280766 = idf(docFreq=1606, maxDocs=42740)
                0.0625 = fieldNorm(doc=2921)
          0.059487324 = weight(abstract_txt:concept in 2921) [ClassicSimilarity], result of:
            0.059487324 = score(doc=2921,freq=1.0), product of:
              0.20979469 = queryWeight, product of:
                1.0598111 = boost
                4.5368032 = idf(docFreq=1243, maxDocs=42740)
                0.0436331 = queryNorm
              0.2835502 = fieldWeight in 2921, product of:
                1.0 = tf(freq=1.0), with freq of:
                  1.0 = termFreq=1.0
                4.5368032 = idf(docFreq=1243, maxDocs=42740)
                0.0625 = fieldNorm(doc=2921)
          0.37559554 = weight(abstract_txt:clustering in 2921) [ClassicSimilarity], result of:
            0.37559554 = score(doc=2921,freq=6.0), product of:
              0.39440405 = queryWeight, product of:
                1.4531214 = boost
                6.220473 = idf(docFreq=230, maxDocs=42740)
                0.0436331 = queryNorm
              0.9523116 = fieldWeight in 2921, product of:
                2.4494898 = tf(freq=6.0), with freq of:
                  6.0 = termFreq=6.0
                6.220473 = idf(docFreq=230, maxDocs=42740)
                0.0625 = fieldNorm(doc=2921)
        0.75 = coord(3/4)
    
  5. Lee, Y.-H.; Wei, C.-P.; Hu, P.J.-H.: ¬An ontology-based technique for preserving user preferences in document-category evolutions (2011) 0.35
    0.34512645 = sum of:
      0.34512645 = product of:
        0.4601686 = sum of:
          0.1236779 = weight(abstract_txt:document in 1354) [ClassicSimilarity], result of:
            0.1236779 = score(doc=1354,freq=8.0), product of:
              0.18678309 = queryWeight, product of:
                4.280766 = idf(docFreq=1606, maxDocs=42740)
                0.0436331 = queryNorm
              0.6621472 = fieldWeight in 1354, product of:
                2.828427 = tf(freq=8.0), with freq of:
                  8.0 = termFreq=8.0
                4.280766 = idf(docFreq=1606, maxDocs=42740)
                0.0546875 = fieldNorm(doc=1354)
          0.10410282 = weight(abstract_txt:concept in 1354) [ClassicSimilarity], result of:
            0.10410282 = score(doc=1354,freq=4.0), product of:
              0.20979469 = queryWeight, product of:
                1.0598111 = boost
                4.5368032 = idf(docFreq=1243, maxDocs=42740)
                0.0436331 = queryNorm
              0.49621284 = fieldWeight in 1354, product of:
                2.0 = tf(freq=4.0), with freq of:
                  4.0 = termFreq=4.0
                4.5368032 = idf(docFreq=1243, maxDocs=42740)
                0.0546875 = fieldNorm(doc=1354)
          0.23238786 = weight(abstract_txt:clustering in 1354) [ClassicSimilarity], result of:
            0.23238786 = score(doc=1354,freq=3.0), product of:
              0.39440405 = queryWeight, product of:
                1.4531214 = boost
                6.220473 = idf(docFreq=230, maxDocs=42740)
                0.0436331 = queryNorm
              0.58921266 = fieldWeight in 1354, product of:
                1.7320508 = tf(freq=3.0), with freq of:
                  3.0 = termFreq=3.0
                6.220473 = idf(docFreq=230, maxDocs=42740)
                0.0546875 = fieldNorm(doc=1354)
        0.75 = coord(3/4)