Document (#29134)

Author
Shen, D.
Chen, Z.
Yang, Q.
Zeng, H.J.
Zhang, B.
Lu, Y.
Ma, W.Y.
Title
Web page classification through summarization
Source
SIGIR'04: Proceedings of the 27th Annual International ACM-SIGIR Conference on Research and Development in Information Retrieval. Ed.: K. Järvelin, u.a.
Imprint
New York, NY : ACM Press
Year
2004
Pages
S.242-249
Theme
Automatisches Klassifizieren

Similar documents (author)

  1. Shen, D.; Yang, Q.; Chen, Z.: Noise reduction through summarization for Web-page classification (2007) 2.31
    2.3063965 = sum of:
      2.3063965 = product of:
        3.8439941 = sum of:
          0.72414166 = weight(author_txt:chen in 2954) [ClassicSimilarity], result of:
            0.72414166 = score(doc=2954,freq=1.0), product of:
              0.31298184 = queryWeight, product of:
                6.169829 = idf(docFreq=242, maxDocs=42740)
                0.0507278 = queryNorm
              2.313686 = fieldWeight in 2954, product of:
                1.0 = tf(freq=1.0), with freq of:
                  1.0 = termFreq=1.0
                6.169829 = idf(docFreq=242, maxDocs=42740)
                0.375 = fieldNorm(doc=2954)
          1.1779497 = weight(author_txt:yang in 2954) [ClassicSimilarity], result of:
            1.1779497 = score(doc=2954,freq=1.0), product of:
              0.43290037 = queryWeight, product of:
                1.1760733 = boost
                7.256171 = idf(docFreq=81, maxDocs=42740)
                0.0507278 = queryNorm
              2.721064 = fieldWeight in 2954, product of:
                1.0 = tf(freq=1.0), with freq of:
                  1.0 = termFreq=1.0
                7.256171 = idf(docFreq=81, maxDocs=42740)
                0.375 = fieldNorm(doc=2954)
          1.941903 = weight(author_txt:shen in 2954) [ClassicSimilarity], result of:
            1.941903 = score(doc=2954,freq=1.0), product of:
              0.60411805 = queryWeight, product of:
                1.3893169 = boost
                8.571848 = idf(docFreq=21, maxDocs=42740)
                0.0507278 = queryNorm
              3.214443 = fieldWeight in 2954, product of:
                1.0 = tf(freq=1.0), with freq of:
                  1.0 = termFreq=1.0
                8.571848 = idf(docFreq=21, maxDocs=42740)
                0.375 = fieldNorm(doc=2954)
        0.6 = coord(3/5)
    
  2. Zhang, J.; Zeng, M.L.: ¬A new similarity measure for subject hierarchical structures (2014) 1.18
    1.1838322 = sum of:
      1.1838322 = product of:
        2.9595804 = sum of:
          1.1653827 = weight(author_txt:zhang in 3779) [ClassicSimilarity], result of:
            1.1653827 = score(doc=3779,freq=1.0), product of:
              0.35480523 = queryWeight, product of:
                1.06472 = boost
                6.5691404 = idf(docFreq=162, maxDocs=42740)
                0.0507278 = queryNorm
              3.2845702 = fieldWeight in 3779, product of:
                1.0 = tf(freq=1.0), with freq of:
                  1.0 = termFreq=1.0
                6.5691404 = idf(docFreq=162, maxDocs=42740)
                0.5 = fieldNorm(doc=3779)
          1.7941976 = weight(author_txt:zeng in 3779) [ClassicSimilarity], result of:
            1.7941976 = score(doc=3779,freq=1.0), product of:
              0.47306898 = queryWeight, product of:
                1.2294267 = boost
                7.585353 = idf(docFreq=58, maxDocs=42740)
                0.0507278 = queryNorm
              3.7926764 = fieldWeight in 3779, product of:
                1.0 = tf(freq=1.0), with freq of:
                  1.0 = termFreq=1.0
                7.585353 = idf(docFreq=58, maxDocs=42740)
                0.5 = fieldNorm(doc=3779)
        0.4 = coord(2/5)
    
  3. Shen, X.-L.; Zhang, K.Z.K.; Zhao, S.J.: Herd behavior in consumers' adoption of online reviews (2016) 1.13
    1.126376 = sum of:
      1.126376 = product of:
        2.81594 = sum of:
          0.87403697 = weight(author_txt:zhang in 5158) [ClassicSimilarity], result of:
            0.87403697 = score(doc=5158,freq=1.0), product of:
              0.35480523 = queryWeight, product of:
                1.06472 = boost
                6.5691404 = idf(docFreq=162, maxDocs=42740)
                0.0507278 = queryNorm
              2.4634275 = fieldWeight in 5158, product of:
                1.0 = tf(freq=1.0), with freq of:
                  1.0 = termFreq=1.0
                6.5691404 = idf(docFreq=162, maxDocs=42740)
                0.375 = fieldNorm(doc=5158)
          1.941903 = weight(author_txt:shen in 5158) [ClassicSimilarity], result of:
            1.941903 = score(doc=5158,freq=1.0), product of:
              0.60411805 = queryWeight, product of:
                1.3893169 = boost
                8.571848 = idf(docFreq=21, maxDocs=42740)
                0.0507278 = queryNorm
              3.214443 = fieldWeight in 5158, product of:
                1.0 = tf(freq=1.0), with freq of:
                  1.0 = termFreq=1.0
                8.571848 = idf(docFreq=21, maxDocs=42740)
                0.375 = fieldNorm(doc=5158)
        0.4 = coord(2/5)
    
  4. Zeng, M.L.; Chen, Y.: Features of an integrated thesaurus management and search system for the networked environment (2003) 1.10
    1.1038879 = sum of:
      1.1038879 = product of:
        2.7597198 = sum of:
          0.9655222 = weight(author_txt:chen in 4818) [ClassicSimilarity], result of:
            0.9655222 = score(doc=4818,freq=1.0), product of:
              0.31298184 = queryWeight, product of:
                6.169829 = idf(docFreq=242, maxDocs=42740)
                0.0507278 = queryNorm
              3.0849144 = fieldWeight in 4818, product of:
                1.0 = tf(freq=1.0), with freq of:
                  1.0 = termFreq=1.0
                6.169829 = idf(docFreq=242, maxDocs=42740)
                0.5 = fieldNorm(doc=4818)
          1.7941976 = weight(author_txt:zeng in 4818) [ClassicSimilarity], result of:
            1.7941976 = score(doc=4818,freq=1.0), product of:
              0.47306898 = queryWeight, product of:
                1.2294267 = boost
                7.585353 = idf(docFreq=58, maxDocs=42740)
                0.0507278 = queryNorm
              3.7926764 = fieldWeight in 4818, product of:
                1.0 = tf(freq=1.0), with freq of:
                  1.0 = termFreq=1.0
                7.585353 = idf(docFreq=58, maxDocs=42740)
                0.5 = fieldNorm(doc=4818)
        0.4 = coord(2/5)
    
  5. Zhang, M.; Yang, C.C.: Using content and network analysis to understand the social support exchange patterns and user behaviors of an online smoking cessation intervention program (2015) 1.09
    1.094393 = sum of:
      1.094393 = product of:
        2.7359824 = sum of:
          1.1653827 = weight(author_txt:zhang in 3669) [ClassicSimilarity], result of:
            1.1653827 = score(doc=3669,freq=1.0), product of:
              0.35480523 = queryWeight, product of:
                1.06472 = boost
                6.5691404 = idf(docFreq=162, maxDocs=42740)
                0.0507278 = queryNorm
              3.2845702 = fieldWeight in 3669, product of:
                1.0 = tf(freq=1.0), with freq of:
                  1.0 = termFreq=1.0
                6.5691404 = idf(docFreq=162, maxDocs=42740)
                0.5 = fieldNorm(doc=3669)
          1.5705996 = weight(author_txt:yang in 3669) [ClassicSimilarity], result of:
            1.5705996 = score(doc=3669,freq=1.0), product of:
              0.43290037 = queryWeight, product of:
                1.1760733 = boost
                7.256171 = idf(docFreq=81, maxDocs=42740)
                0.0507278 = queryNorm
              3.6280856 = fieldWeight in 3669, product of:
                1.0 = tf(freq=1.0), with freq of:
                  1.0 = termFreq=1.0
                7.256171 = idf(docFreq=81, maxDocs=42740)
                0.5 = fieldNorm(doc=3669)
        0.4 = coord(2/5)
    

Similar documents (content)

  1. Shen, D.; Yang, Q.; Chen, Z.: Noise reduction through summarization for Web-page classification (2007) 1.93
    1.9297807 = sum of:
      1.9297807 = sum of:
        0.18449573 = weight(abstract_txt:classification in 2954) [ClassicSimilarity], result of:
          0.18449573 = score(doc=2954,freq=6.0), product of:
            0.24102704 = queryWeight, product of:
              3.9999528 = idf(docFreq=2127, maxDocs=42740)
              0.060257472 = queryNorm
            0.76545656 = fieldWeight in 2954, product of:
              2.4494898 = tf(freq=6.0), with freq of:
                6.0 = termFreq=6.0
              3.9999528 = idf(docFreq=2127, maxDocs=42740)
              0.078125 = fieldNorm(doc=2954)
        0.078129046 = weight(abstract_txt:through in 2954) [ClassicSimilarity], result of:
          0.078129046 = score(doc=2954,freq=1.0), product of:
            0.24698296 = queryWeight, product of:
              1.0122799 = boost
              4.049072 = idf(docFreq=2025, maxDocs=42740)
              0.060257472 = queryNorm
            0.31633374 = fieldWeight in 2954, product of:
              1.0 = tf(freq=1.0), with freq of:
                1.0 = termFreq=1.0
              4.049072 = idf(docFreq=2025, maxDocs=42740)
              0.078125 = fieldNorm(doc=2954)
        0.61732984 = weight(abstract_txt:page in 2954) [ClassicSimilarity], result of:
          0.61732984 = score(doc=2954,freq=6.0), product of:
            0.53920394 = queryWeight, product of:
              1.4956971 = boost
              5.982718 = idf(docFreq=292, maxDocs=42740)
              0.060257472 = queryNorm
            1.1448911 = fieldWeight in 2954, product of:
              2.4494898 = tf(freq=6.0), with freq of:
                6.0 = termFreq=6.0
              5.982718 = idf(docFreq=292, maxDocs=42740)
              0.078125 = fieldNorm(doc=2954)
        1.0498261 = weight(abstract_txt:summarization in 2954) [ClassicSimilarity], result of:
          1.0498261 = score(doc=2954,freq=6.0), product of:
            0.76822156 = queryWeight, product of:
              1.7852966 = boost
              7.141102 = idf(docFreq=91, maxDocs=42740)
              0.060257472 = queryNorm
            1.3665669 = fieldWeight in 2954, product of:
              2.4494898 = tf(freq=6.0), with freq of:
                6.0 = termFreq=6.0
              7.141102 = idf(docFreq=91, maxDocs=42740)
              0.078125 = fieldNorm(doc=2954)
    
  2. Huo, W.: Automatic multi-word term extraction and its application to Web-page summarization (2012) 0.88
    0.8805561 = sum of:
      0.8805561 = product of:
        1.1740748 = sum of:
          0.07532006 = weight(abstract_txt:classification in 2564) [ClassicSimilarity], result of:
            0.07532006 = score(doc=2564,freq=1.0), product of:
              0.24102704 = queryWeight, product of:
                3.9999528 = idf(docFreq=2127, maxDocs=42740)
                0.060257472 = queryNorm
              0.3124963 = fieldWeight in 2564, product of:
                1.0 = tf(freq=1.0), with freq of:
                  1.0 = termFreq=1.0
                3.9999528 = idf(docFreq=2127, maxDocs=42740)
                0.078125 = fieldNorm(doc=2564)
          0.35641554 = weight(abstract_txt:page in 2564) [ClassicSimilarity], result of:
            0.35641554 = score(doc=2564,freq=2.0), product of:
              0.53920394 = queryWeight, product of:
                1.4956971 = boost
                5.982718 = idf(docFreq=292, maxDocs=42740)
                0.060257472 = queryNorm
              0.66100323 = fieldWeight in 2564, product of:
                1.4142135 = tf(freq=2.0), with freq of:
                  2.0 = termFreq=2.0
                5.982718 = idf(docFreq=292, maxDocs=42740)
                0.078125 = fieldNorm(doc=2564)
          0.74233913 = weight(abstract_txt:summarization in 2564) [ClassicSimilarity], result of:
            0.74233913 = score(doc=2564,freq=3.0), product of:
              0.76822156 = queryWeight, product of:
                1.7852966 = boost
                7.141102 = idf(docFreq=91, maxDocs=42740)
                0.060257472 = queryNorm
              0.96630865 = fieldWeight in 2564, product of:
                1.7320508 = tf(freq=3.0), with freq of:
                  3.0 = termFreq=3.0
                7.141102 = idf(docFreq=91, maxDocs=42740)
                0.078125 = fieldNorm(doc=2564)
        0.75 = coord(3/4)
    
  3. Balas, J.: Dewey and the net (1996) 0.43
    0.4345446 = sum of:
      0.4345446 = product of:
        0.8690892 = sum of:
          0.15625809 = weight(abstract_txt:through in 4773) [ClassicSimilarity], result of:
            0.15625809 = score(doc=4773,freq=1.0), product of:
              0.24698296 = queryWeight, product of:
                1.0122799 = boost
                4.049072 = idf(docFreq=2025, maxDocs=42740)
                0.060257472 = queryNorm
              0.6326675 = fieldWeight in 4773, product of:
                1.0 = tf(freq=1.0), with freq of:
                  1.0 = termFreq=1.0
                4.049072 = idf(docFreq=2025, maxDocs=42740)
                0.15625 = fieldNorm(doc=4773)
          0.7128311 = weight(abstract_txt:page in 4773) [ClassicSimilarity], result of:
            0.7128311 = score(doc=4773,freq=2.0), product of:
              0.53920394 = queryWeight, product of:
                1.4956971 = boost
                5.982718 = idf(docFreq=292, maxDocs=42740)
                0.060257472 = queryNorm
              1.3220065 = fieldWeight in 4773, product of:
                1.4142135 = tf(freq=2.0), with freq of:
                  2.0 = termFreq=2.0
                5.982718 = idf(docFreq=292, maxDocs=42740)
                0.15625 = fieldNorm(doc=4773)
        0.5 = coord(2/4)
    
  4. Over, P.; Dang, H.; Harman, D.: DUC in context (2007) 0.35
    0.35470313 = sum of:
      0.35470313 = product of:
        0.70940626 = sum of:
          0.109380655 = weight(abstract_txt:through in 2935) [ClassicSimilarity], result of:
            0.109380655 = score(doc=2935,freq=1.0), product of:
              0.24698296 = queryWeight, product of:
                1.0122799 = boost
                4.049072 = idf(docFreq=2025, maxDocs=42740)
                0.060257472 = queryNorm
              0.44286722 = fieldWeight in 2935, product of:
                1.0 = tf(freq=1.0), with freq of:
                  1.0 = termFreq=1.0
                4.049072 = idf(docFreq=2025, maxDocs=42740)
                0.109375 = fieldNorm(doc=2935)
          0.6000256 = weight(abstract_txt:summarization in 2935) [ClassicSimilarity], result of:
            0.6000256 = score(doc=2935,freq=1.0), product of:
              0.76822156 = queryWeight, product of:
                1.7852966 = boost
                7.141102 = idf(docFreq=91, maxDocs=42740)
                0.060257472 = queryNorm
              0.781058 = fieldWeight in 2935, product of:
                1.0 = tf(freq=1.0), with freq of:
                  1.0 = termFreq=1.0
                7.141102 = idf(docFreq=91, maxDocs=42740)
                0.109375 = fieldNorm(doc=2935)
        0.5 = coord(2/4)
    
  5. Bar-Ilan, J.: What do we know about links and linking? : a framework for studying links in academic environments (2005) 0.35
    0.3454583 = sum of:
      0.3454583 = product of:
        0.46061108 = sum of:
          0.13045818 = weight(abstract_txt:classification in 3059) [ClassicSimilarity], result of:
            0.13045818 = score(doc=3059,freq=3.0), product of:
              0.24102704 = queryWeight, product of:
                3.9999528 = idf(docFreq=2127, maxDocs=42740)
                0.060257472 = queryNorm
              0.5412595 = fieldWeight in 3059, product of:
                1.7320508 = tf(freq=3.0), with freq of:
                  3.0 = termFreq=3.0
                3.9999528 = idf(docFreq=2127, maxDocs=42740)
                0.078125 = fieldNorm(doc=3059)
          0.078129046 = weight(abstract_txt:through in 3059) [ClassicSimilarity], result of:
            0.078129046 = score(doc=3059,freq=1.0), product of:
              0.24698296 = queryWeight, product of:
                1.0122799 = boost
                4.049072 = idf(docFreq=2025, maxDocs=42740)
                0.060257472 = queryNorm
              0.31633374 = fieldWeight in 3059, product of:
                1.0 = tf(freq=1.0), with freq of:
                  1.0 = termFreq=1.0
                4.049072 = idf(docFreq=2025, maxDocs=42740)
                0.078125 = fieldNorm(doc=3059)
          0.25202385 = weight(abstract_txt:page in 3059) [ClassicSimilarity], result of:
            0.25202385 = score(doc=3059,freq=1.0), product of:
              0.53920394 = queryWeight, product of:
                1.4956971 = boost
                5.982718 = idf(docFreq=292, maxDocs=42740)
                0.060257472 = queryNorm
              0.46739984 = fieldWeight in 3059, product of:
                1.0 = tf(freq=1.0), with freq of:
                  1.0 = termFreq=1.0
                5.982718 = idf(docFreq=292, maxDocs=42740)
                0.078125 = fieldNorm(doc=3059)
        0.75 = coord(3/4)