Document (#29086)

Author
Xu, W.
Gong, Y.
Title
Document clustering by concept factorization
Source
SIGIR'04: Proceedings of the 27th Annual International ACM-SIGIR Conference on Research and Development in Information Retrieval. Ed.: K. Järvelin, u.a.
Imprint
New York, NY : ACM Press
Year
2004
Pages
S.202-209
Theme
Automatisches Klassifizieren

Similar documents (content)

  1. Cai, X.; Li, W.: Enhancing sentence-level clustering with integrated and interactive frameworks for theme-based summarization (2011) 0.61
    0.61408466 = sum of:
      0.61408466 = product of:
        0.8187795 = sum of:
          0.12232025 = weight(abstract_txt:document in 771) [ClassicSimilarity], result of:
            0.12232025 = score(doc=771,freq=6.0), product of:
              0.18673998 = queryWeight, product of:
                4.2786365 = idf(docFreq=1604, maxDocs=42596)
                0.04364474 = queryNorm
              0.6550298 = fieldWeight in 771, product of:
                2.4494898 = tf(freq=6.0), with freq of:
                  6.0 = termFreq=6.0
                4.2786365 = idf(docFreq=1604, maxDocs=42596)
                0.0625 = fieldNorm(doc=771)
          0.10310332 = weight(abstract_txt:concept in 771) [ClassicSimilarity], result of:
            0.10310332 = score(doc=771,freq=3.0), product of:
              0.20994079 = queryWeight, product of:
                1.0603025 = boost
                4.5366488 = idf(docFreq=1239, maxDocs=42596)
                0.04364474 = queryNorm
              0.49110663 = fieldWeight in 771, product of:
                1.7320508 = tf(freq=3.0), with freq of:
                  3.0 = termFreq=3.0
                4.5366488 = idf(docFreq=1239, maxDocs=42596)
                0.0625 = fieldNorm(doc=771)
          0.59335595 = weight(abstract_txt:clustering in 771) [ClassicSimilarity], result of:
            0.59335595 = score(doc=771,freq=15.0), product of:
              0.39427745 = queryWeight, product of:
                1.4530559 = boost
                6.2170978 = idf(docFreq=230, maxDocs=42596)
                0.04364474 = queryNorm
              1.5049198 = fieldWeight in 771, product of:
                3.8729835 = tf(freq=15.0), with freq of:
                  15.0 = termFreq=15.0
                6.2170978 = idf(docFreq=230, maxDocs=42596)
                0.0625 = fieldNorm(doc=771)
        0.75 = coord(3/4)
    
  2. Lee, J.-H.; Park, S.; Ahn, C.-M.; Kim, D.: Automatic generic document summarization based on non-negative matrix factorization (2009) 0.43
    0.4328308 = sum of:
      0.4328308 = product of:
        0.8656616 = sum of:
          0.105932444 = weight(abstract_txt:document in 3628) [ClassicSimilarity], result of:
            0.105932444 = score(doc=3628,freq=2.0), product of:
              0.18673998 = queryWeight, product of:
                4.2786365 = idf(docFreq=1604, maxDocs=42596)
                0.04364474 = queryNorm
              0.5672724 = fieldWeight in 3628, product of:
                1.4142135 = tf(freq=2.0), with freq of:
                  2.0 = termFreq=2.0
                4.2786365 = idf(docFreq=1604, maxDocs=42596)
                0.09375 = fieldNorm(doc=3628)
          0.75972915 = weight(abstract_txt:factorization in 3628) [ClassicSimilarity], result of:
            0.75972915 = score(doc=3628,freq=1.0), product of:
              0.8749848 = queryWeight, product of:
                2.1646197 = boost
                9.2616205 = idf(docFreq=10, maxDocs=42596)
                0.04364474 = queryNorm
              0.86827695 = fieldWeight in 3628, product of:
                1.0 = tf(freq=1.0), with freq of:
                  1.0 = termFreq=1.0
                9.2616205 = idf(docFreq=10, maxDocs=42596)
                0.09375 = fieldNorm(doc=3628)
        0.5 = coord(2/4)
    
  3. Berry, M.W.; Esau, R.; Kiefer, B.: ¬The use of text mining techniques in electronic discovery for legal matters (2012) 0.42
    0.41731733 = sum of:
      0.41731733 = product of:
        0.83463466 = sum of:
          0.074905545 = weight(abstract_txt:document in 1092) [ClassicSimilarity], result of:
            0.074905545 = score(doc=1092,freq=1.0), product of:
              0.18673998 = queryWeight, product of:
                4.2786365 = idf(docFreq=1604, maxDocs=42596)
                0.04364474 = queryNorm
              0.40112215 = fieldWeight in 1092, product of:
                1.0 = tf(freq=1.0), with freq of:
                  1.0 = termFreq=1.0
                4.2786365 = idf(docFreq=1604, maxDocs=42596)
                0.09375 = fieldNorm(doc=1092)
          0.75972915 = weight(abstract_txt:factorization in 1092) [ClassicSimilarity], result of:
            0.75972915 = score(doc=1092,freq=1.0), product of:
              0.8749848 = queryWeight, product of:
                2.1646197 = boost
                9.2616205 = idf(docFreq=10, maxDocs=42596)
                0.04364474 = queryNorm
              0.86827695 = fieldWeight in 1092, product of:
                1.0 = tf(freq=1.0), with freq of:
                  1.0 = termFreq=1.0
                9.2616205 = idf(docFreq=10, maxDocs=42596)
                0.09375 = fieldNorm(doc=1092)
        0.5 = coord(2/4)
    
  4. Na, S.-H.; Kang, I.-S.; Lee, J.-H.: Adaptive document clustering based on query-based similarity (2007) 0.41
    0.4098454 = sum of:
      0.4098454 = product of:
        0.54646057 = sum of:
          0.1116626 = weight(abstract_txt:document in 2100) [ClassicSimilarity], result of:
            0.1116626 = score(doc=2100,freq=5.0), product of:
              0.18673998 = queryWeight, product of:
                4.2786365 = idf(docFreq=1604, maxDocs=42596)
                0.04364474 = queryNorm
              0.5979576 = fieldWeight in 2100, product of:
                2.236068 = tf(freq=5.0), with freq of:
                  5.0 = termFreq=5.0
                4.2786365 = idf(docFreq=1604, maxDocs=42596)
                0.0625 = fieldNorm(doc=2100)
          0.059526727 = weight(abstract_txt:concept in 2100) [ClassicSimilarity], result of:
            0.059526727 = score(doc=2100,freq=1.0), product of:
              0.20994079 = queryWeight, product of:
                1.0603025 = boost
                4.5366488 = idf(docFreq=1239, maxDocs=42596)
                0.04364474 = queryNorm
              0.28354055 = fieldWeight in 2100, product of:
                1.0 = tf(freq=1.0), with freq of:
                  1.0 = termFreq=1.0
                4.5366488 = idf(docFreq=1239, maxDocs=42596)
                0.0625 = fieldNorm(doc=2100)
          0.37527126 = weight(abstract_txt:clustering in 2100) [ClassicSimilarity], result of:
            0.37527126 = score(doc=2100,freq=6.0), product of:
              0.39427745 = queryWeight, product of:
                1.4530559 = boost
                6.2170978 = idf(docFreq=230, maxDocs=42596)
                0.04364474 = queryNorm
              0.95179486 = fieldWeight in 2100, product of:
                2.4494898 = tf(freq=6.0), with freq of:
                  6.0 = termFreq=6.0
                6.2170978 = idf(docFreq=230, maxDocs=42596)
                0.0625 = fieldNorm(doc=2100)
        0.75 = coord(3/4)
    
  5. Lee, Y.-H.; Wei, C.-P.; Hu, P.J.-H.: ¬An ontology-based technique for preserving user preferences in document-category evolutions (2011) 0.34
    0.34496012 = sum of:
      0.34496012 = product of:
        0.45994684 = sum of:
          0.12358784 = weight(abstract_txt:document in 354) [ClassicSimilarity], result of:
            0.12358784 = score(doc=354,freq=8.0), product of:
              0.18673998 = queryWeight, product of:
                4.2786365 = idf(docFreq=1604, maxDocs=42596)
                0.04364474 = queryNorm
              0.6618178 = fieldWeight in 354, product of:
                2.828427 = tf(freq=8.0), with freq of:
                  8.0 = termFreq=8.0
                4.2786365 = idf(docFreq=1604, maxDocs=42596)
                0.0546875 = fieldNorm(doc=354)
          0.104171775 = weight(abstract_txt:concept in 354) [ClassicSimilarity], result of:
            0.104171775 = score(doc=354,freq=4.0), product of:
              0.20994079 = queryWeight, product of:
                1.0603025 = boost
                4.5366488 = idf(docFreq=1239, maxDocs=42596)
                0.04364474 = queryNorm
              0.49619597 = fieldWeight in 354, product of:
                2.0 = tf(freq=4.0), with freq of:
                  4.0 = termFreq=4.0
                4.5366488 = idf(docFreq=1239, maxDocs=42596)
                0.0546875 = fieldNorm(doc=354)
          0.23218723 = weight(abstract_txt:clustering in 354) [ClassicSimilarity], result of:
            0.23218723 = score(doc=354,freq=3.0), product of:
              0.39427745 = queryWeight, product of:
                1.4530559 = boost
                6.2170978 = idf(docFreq=230, maxDocs=42596)
                0.04364474 = queryNorm
              0.588893 = fieldWeight in 354, product of:
                1.7320508 = tf(freq=3.0), with freq of:
                  3.0 = termFreq=3.0
                6.2170978 = idf(docFreq=230, maxDocs=42596)
                0.0546875 = fieldNorm(doc=354)
        0.75 = coord(3/4)