Document (#29085)

Author
Yu, W.
Gong, Y.
Title
Document clustering by concept factorization
Source
SIGIR'04: Proceedings of the 27th Annual International ACM-SIGIR Conference on Research and Development in Information Retrieval. Ed.: K. Järvelin, u.a.
Imprint
New York, NY : ACM Press
Year
2004
Pages
S.202-209
Theme
Automatisches Klassifizieren

Similar documents (content)

  1. Cai, X.; Li, W.: Enhancing sentence-level clustering with integrated and interactive frameworks for theme-based summarization (2011) 0.61
    0.6096923 = sum of:
      0.6096923 = product of:
        0.812923 = sum of:
          0.122811876 = weight(abstract_txt:document in 4770) [ClassicSimilarity], result of:
            0.122811876 = score(doc=4770,freq=6.0), product of:
              0.18688028 = queryWeight, product of:
                4.2926083 = idf(docFreq=1642, maxDocs=44218)
                0.043535367 = queryNorm
              0.65716875 = fieldWeight in 4770, product of:
                2.4494898 = tf(freq=6.0), with freq of:
                  6.0 = termFreq=6.0
                4.2926083 = idf(docFreq=1642, maxDocs=44218)
                0.0625 = fieldNorm(doc=4770)
          0.10041032 = weight(abstract_txt:concept in 4770) [ClassicSimilarity], result of:
            0.10041032 = score(doc=4770,freq=3.0), product of:
              0.20587271 = queryWeight, product of:
                1.0495851 = boost
                4.505458 = idf(docFreq=1327, maxDocs=44218)
                0.043535367 = queryNorm
              0.48773012 = fieldWeight in 4770, product of:
                1.7320508 = tf(freq=3.0), with freq of:
                  3.0 = termFreq=3.0
                4.505458 = idf(docFreq=1327, maxDocs=44218)
                0.0625 = fieldNorm(doc=4770)
          0.5897008 = weight(abstract_txt:clustering in 4770) [ClassicSimilarity], result of:
            0.5897008 = score(doc=4770,freq=15.0), product of:
              0.3919022 = queryWeight, product of:
                1.4481286 = boost
                6.2162485 = idf(docFreq=239, maxDocs=44218)
                0.043535367 = queryNorm
              1.5047143 = fieldWeight in 4770, product of:
                3.8729835 = tf(freq=15.0), with freq of:
                  15.0 = termFreq=15.0
                6.2162485 = idf(docFreq=239, maxDocs=44218)
                0.0625 = fieldNorm(doc=4770)
        0.75 = coord(3/4)
    
  2. Lee, J.-H.; Park, S.; Ahn, C.-M.; Kim, D.: Automatic generic document summarization based on non-negative matrix factorization (2009) 0.44
    0.43544883 = sum of:
      0.43544883 = product of:
        0.87089765 = sum of:
          0.1063582 = weight(abstract_txt:document in 2448) [ClassicSimilarity], result of:
            0.1063582 = score(doc=2448,freq=2.0), product of:
              0.18688028 = queryWeight, product of:
                4.2926083 = idf(docFreq=1642, maxDocs=44218)
                0.043535367 = queryNorm
              0.5691248 = fieldWeight in 2448, product of:
                1.4142135 = tf(freq=2.0), with freq of:
                  2.0 = termFreq=2.0
                4.2926083 = idf(docFreq=1642, maxDocs=44218)
                0.09375 = fieldNorm(doc=2448)
          0.7645395 = weight(abstract_txt:factorization in 2448) [ClassicSimilarity], result of:
            0.7645395 = score(doc=2448,freq=1.0), product of:
              0.8769862 = queryWeight, product of:
                2.1662803 = boost
                9.298992 = idf(docFreq=10, maxDocs=44218)
                0.043535367 = queryNorm
              0.8717805 = fieldWeight in 2448, product of:
                1.0 = tf(freq=1.0), with freq of:
                  1.0 = termFreq=1.0
                9.298992 = idf(docFreq=10, maxDocs=44218)
                0.09375 = fieldNorm(doc=2448)
        0.5 = coord(2/4)
    
  3. Berry, M.W.; Esau, R.; Kiefer, B.: ¬The use of text mining techniques in electronic discovery for legal matters (2012) 0.42
    0.41987306 = sum of:
      0.41987306 = product of:
        0.8397461 = sum of:
          0.07520661 = weight(abstract_txt:document in 91) [ClassicSimilarity], result of:
            0.07520661 = score(doc=91,freq=1.0), product of:
              0.18688028 = queryWeight, product of:
                4.2926083 = idf(docFreq=1642, maxDocs=44218)
                0.043535367 = queryNorm
              0.40243202 = fieldWeight in 91, product of:
                1.0 = tf(freq=1.0), with freq of:
                  1.0 = termFreq=1.0
                4.2926083 = idf(docFreq=1642, maxDocs=44218)
                0.09375 = fieldNorm(doc=91)
          0.7645395 = weight(abstract_txt:factorization in 91) [ClassicSimilarity], result of:
            0.7645395 = score(doc=91,freq=1.0), product of:
              0.8769862 = queryWeight, product of:
                2.1662803 = boost
                9.298992 = idf(docFreq=10, maxDocs=44218)
                0.043535367 = queryNorm
              0.8717805 = fieldWeight in 91, product of:
                1.0 = tf(freq=1.0), with freq of:
                  1.0 = termFreq=1.0
                9.298992 = idf(docFreq=10, maxDocs=44218)
                0.09375 = fieldNorm(doc=91)
        0.5 = coord(2/4)
    
  4. Na, S.-H.; Kang, I.-S.; Lee, J.-H.: Adaptive document clustering based on query-based similarity (2007) 0.41
    0.40728217 = sum of:
      0.40728217 = product of:
        0.5430429 = sum of:
          0.1121114 = weight(abstract_txt:document in 920) [ClassicSimilarity], result of:
            0.1121114 = score(doc=920,freq=5.0), product of:
              0.18688028 = queryWeight, product of:
                4.2926083 = idf(docFreq=1642, maxDocs=44218)
                0.043535367 = queryNorm
              0.59991026 = fieldWeight in 920, product of:
                2.236068 = tf(freq=5.0), with freq of:
                  5.0 = termFreq=5.0
                4.2926083 = idf(docFreq=1642, maxDocs=44218)
                0.0625 = fieldNorm(doc=920)
          0.05797193 = weight(abstract_txt:concept in 920) [ClassicSimilarity], result of:
            0.05797193 = score(doc=920,freq=1.0), product of:
              0.20587271 = queryWeight, product of:
                1.0495851 = boost
                4.505458 = idf(docFreq=1327, maxDocs=44218)
                0.043535367 = queryNorm
              0.28159112 = fieldWeight in 920, product of:
                1.0 = tf(freq=1.0), with freq of:
                  1.0 = termFreq=1.0
                4.505458 = idf(docFreq=1327, maxDocs=44218)
                0.0625 = fieldNorm(doc=920)
          0.37295955 = weight(abstract_txt:clustering in 920) [ClassicSimilarity], result of:
            0.37295955 = score(doc=920,freq=6.0), product of:
              0.3919022 = queryWeight, product of:
                1.4481286 = boost
                6.2162485 = idf(docFreq=239, maxDocs=44218)
                0.043535367 = queryNorm
              0.95166487 = fieldWeight in 920, product of:
                2.4494898 = tf(freq=6.0), with freq of:
                  6.0 = termFreq=6.0
                6.2162485 = idf(docFreq=239, maxDocs=44218)
                0.0625 = fieldNorm(doc=920)
        0.75 = coord(3/4)
    
  5. Lee, Y.-H.; Wei, C.-P.; Hu, P.J.-H.: ¬An ontology-based technique for preserving user preferences in document-category evolutions (2011) 0.34
    0.3422193 = sum of:
      0.3422193 = product of:
        0.4562924 = sum of:
          0.12408458 = weight(abstract_txt:document in 4353) [ClassicSimilarity], result of:
            0.12408458 = score(doc=4353,freq=8.0), product of:
              0.18688028 = queryWeight, product of:
                4.2926083 = idf(docFreq=1642, maxDocs=44218)
                0.043535367 = queryNorm
              0.663979 = fieldWeight in 4353, product of:
                2.828427 = tf(freq=8.0), with freq of:
                  8.0 = termFreq=8.0
                4.2926083 = idf(docFreq=1642, maxDocs=44218)
                0.0546875 = fieldNorm(doc=4353)
          0.10145087 = weight(abstract_txt:concept in 4353) [ClassicSimilarity], result of:
            0.10145087 = score(doc=4353,freq=4.0), product of:
              0.20587271 = queryWeight, product of:
                1.0495851 = boost
                4.505458 = idf(docFreq=1327, maxDocs=44218)
                0.043535367 = queryNorm
              0.49278444 = fieldWeight in 4353, product of:
                2.0 = tf(freq=4.0), with freq of:
                  4.0 = termFreq=4.0
                4.505458 = idf(docFreq=1327, maxDocs=44218)
                0.0546875 = fieldNorm(doc=4353)
          0.23075692 = weight(abstract_txt:clustering in 4353) [ClassicSimilarity], result of:
            0.23075692 = score(doc=4353,freq=3.0), product of:
              0.3919022 = queryWeight, product of:
                1.4481286 = boost
                6.2162485 = idf(docFreq=239, maxDocs=44218)
                0.043535367 = queryNorm
              0.58881253 = fieldWeight in 4353, product of:
                1.7320508 = tf(freq=3.0), with freq of:
                  3.0 = termFreq=3.0
                6.2162485 = idf(docFreq=239, maxDocs=44218)
                0.0546875 = fieldNorm(doc=4353)
        0.75 = coord(3/4)