Document (#21322)

Author
Dietterich, T.G.
Title
Machine-learning research : four current directions
Source
AI magazine. 18(1997) no.4, S.97-136
Year
1997
Abstract
Summarizes four directions in machine-learning research and discusses some current open problems. The four directions are: (1) the improvement of classification accuracy by learning ensembles of classifiers, (2) methods for scaling up supervised learning algorithms, (3) reinforcement learning, and (4) the learning of complex stochastic models.
Footnote
Contribution to a special section reviewing recent research in empirical methods in speech recognition, syntactic parsing, semantic processing, information extraction, and machine translation.

Similar documents (content)

  1. Pong, J.Y.-H.; Kwok, R.C.-W.; Lau, R.Y.-K.; Hao, J.-X.; Wong, P.C.-C.: ¬A comparative study of two automatic document classification methods in a library setting (2008) 0.32
    0.31578588 = sum of:
      0.31578588 = product of:
        0.8420957 = sum of:
          0.011928104 = weight(abstract_txt:some in 2532) [ClassicSimilarity], result of:
            0.011928104 = score(doc=2532,freq=1.0), product of:
              0.051890474 = queryWeight, product of:
                3.6779325 = idf(docFreq=3037, maxDocs=44218)
                0.014108598 = queryNorm
              0.22987078 = fieldWeight in 2532, product of:
                1.0 = tf(freq=1.0), with freq of:
                  1.0 = termFreq=1.0
                3.6779325 = idf(docFreq=3037, maxDocs=44218)
                0.0625 = fieldNorm(doc=2532)
          0.037362155 = weight(abstract_txt:classification in 2532) [ClassicSimilarity], result of:
            0.037362155 = score(doc=2532,freq=6.0), product of:
              0.061133258 = queryWeight, product of:
                1.0854129 = boost
                3.9920752 = idf(docFreq=2218, maxDocs=44218)
                0.014108598 = queryNorm
              0.6111592 = fieldWeight in 2532, product of:
                2.4494898 = tf(freq=6.0), with freq of:
                  6.0 = termFreq=6.0
                3.9920752 = idf(docFreq=2218, maxDocs=44218)
                0.0625 = fieldNorm(doc=2532)
          0.017095597 = weight(abstract_txt:methods in 2532) [ClassicSimilarity], result of:
            0.017095597 = score(doc=2532,freq=1.0), product of:
              0.06596237 = queryWeight, product of:
                1.1274682 = boost
                4.146752 = idf(docFreq=1900, maxDocs=44218)
                0.014108598 = queryNorm
              0.259172 = fieldWeight in 2532, product of:
                1.0 = tf(freq=1.0), with freq of:
                  1.0 = termFreq=1.0
                4.146752 = idf(docFreq=1900, maxDocs=44218)
                0.0625 = fieldNorm(doc=2532)
          0.06305362 = weight(abstract_txt:algorithms in 2532) [ClassicSimilarity], result of:
            0.06305362 = score(doc=2532,freq=2.0), product of:
              0.124978915 = queryWeight, product of:
                1.5519387 = boost
                5.707926 = idf(docFreq=398, maxDocs=44218)
                0.014108598 = queryNorm
              0.5045141 = fieldWeight in 2532, product of:
                1.4142135 = tf(freq=2.0), with freq of:
                  2.0 = termFreq=2.0
                5.707926 = idf(docFreq=398, maxDocs=44218)
                0.0625 = fieldNorm(doc=2532)
          0.015279418 = weight(abstract_txt:research in 2532) [ClassicSimilarity], result of:
            0.015279418 = score(doc=2532,freq=1.0), product of:
              0.07711187 = queryWeight, product of:
                1.7239783 = boost
                3.170338 = idf(docFreq=5046, maxDocs=44218)
                0.014108598 = queryNorm
              0.19814612 = fieldWeight in 2532, product of:
                1.0 = tf(freq=1.0), with freq of:
                  1.0 = termFreq=1.0
                3.170338 = idf(docFreq=5046, maxDocs=44218)
                0.0625 = fieldNorm(doc=2532)
          0.14092149 = weight(abstract_txt:supervised in 2532) [ClassicSimilarity], result of:
            0.14092149 = score(doc=2532,freq=2.0), product of:
              0.21363948 = queryWeight, product of:
                2.0290697 = boost
                7.462781 = idf(docFreq=68, maxDocs=44218)
                0.014108598 = queryNorm
              0.65962285 = fieldWeight in 2532, product of:
                1.4142135 = tf(freq=2.0), with freq of:
                  2.0 = termFreq=2.0
                7.462781 = idf(docFreq=68, maxDocs=44218)
                0.0625 = fieldNorm(doc=2532)
          0.053843707 = weight(abstract_txt:current in 2532) [ClassicSimilarity], result of:
            0.053843707 = score(doc=2532,freq=2.0), product of:
              0.1417305 = queryWeight, product of:
                2.3372376 = boost
                4.298101 = idf(docFreq=1633, maxDocs=44218)
                0.014108598 = queryNorm
              0.37990203 = fieldWeight in 2532, product of:
                1.4142135 = tf(freq=2.0), with freq of:
                  2.0 = termFreq=2.0
                4.298101 = idf(docFreq=1633, maxDocs=44218)
                0.0625 = fieldNorm(doc=2532)
          0.15769294 = weight(abstract_txt:machine in 2532) [ClassicSimilarity], result of:
            0.15769294 = score(doc=2532,freq=5.0), product of:
              0.21376415 = queryWeight, product of:
                2.870375 = boost
                5.2785225 = idf(docFreq=612, maxDocs=44218)
                0.014108598 = queryNorm
              0.73769593 = fieldWeight in 2532, product of:
                2.236068 = tf(freq=5.0), with freq of:
                  5.0 = termFreq=5.0
                5.2785225 = idf(docFreq=612, maxDocs=44218)
                0.0625 = fieldNorm(doc=2532)
          0.34491867 = weight(abstract_txt:learning in 2532) [ClassicSimilarity], result of:
            0.34491867 = score(doc=2532,freq=5.0), product of:
              0.51949126 = queryWeight, product of:
                7.750343 = boost
                4.750873 = idf(docFreq=1038, maxDocs=44218)
                0.014108598 = queryNorm
              0.66395473 = fieldWeight in 2532, product of:
                2.236068 = tf(freq=5.0), with freq of:
                  5.0 = termFreq=5.0
                4.750873 = idf(docFreq=1038, maxDocs=44218)
                0.0625 = fieldNorm(doc=2532)
        0.375 = coord(9/24)
    
  2. Ko, Y.; Seo, J.: Text classification from unlabeled documents with bootstrapping and feature projection techniques (2009) 0.25
    0.2464488 = sum of:
      0.2464488 = product of:
        0.84496737 = sum of:
          0.011928104 = weight(abstract_txt:some in 2452) [ClassicSimilarity], result of:
            0.011928104 = score(doc=2452,freq=1.0), product of:
              0.051890474 = queryWeight, product of:
                3.6779325 = idf(docFreq=3037, maxDocs=44218)
                0.014108598 = queryNorm
              0.22987078 = fieldWeight in 2452, product of:
                1.0 = tf(freq=1.0), with freq of:
                  1.0 = termFreq=1.0
                3.6779325 = idf(docFreq=3037, maxDocs=44218)
                0.0625 = fieldNorm(doc=2452)
          0.034106825 = weight(abstract_txt:classification in 2452) [ClassicSimilarity], result of:
            0.034106825 = score(doc=2452,freq=5.0), product of:
              0.061133258 = queryWeight, product of:
                1.0854129 = boost
                3.9920752 = idf(docFreq=2218, maxDocs=44218)
                0.014108598 = queryNorm
              0.5579095 = fieldWeight in 2452, product of:
                2.236068 = tf(freq=5.0), with freq of:
                  5.0 = termFreq=5.0
                3.9920752 = idf(docFreq=2218, maxDocs=44218)
                0.0625 = fieldNorm(doc=2452)
          0.019028496 = weight(abstract_txt:problems in 2452) [ClassicSimilarity], result of:
            0.019028496 = score(doc=2452,freq=1.0), product of:
              0.070845075 = queryWeight, product of:
                1.1684524 = boost
                4.297489 = idf(docFreq=1634, maxDocs=44218)
                0.014108598 = queryNorm
              0.26859307 = fieldWeight in 2452, product of:
                1.0 = tf(freq=1.0), with freq of:
                  1.0 = termFreq=1.0
                4.297489 = idf(docFreq=1634, maxDocs=44218)
                0.0625 = fieldNorm(doc=2452)
          0.04458565 = weight(abstract_txt:algorithms in 2452) [ClassicSimilarity], result of:
            0.04458565 = score(doc=2452,freq=1.0), product of:
              0.124978915 = queryWeight, product of:
                1.5519387 = boost
                5.707926 = idf(docFreq=398, maxDocs=44218)
                0.014108598 = queryNorm
              0.35674536 = fieldWeight in 2452, product of:
                1.0 = tf(freq=1.0), with freq of:
                  1.0 = termFreq=1.0
                5.707926 = idf(docFreq=398, maxDocs=44218)
                0.0625 = fieldNorm(doc=2452)
          0.19929308 = weight(abstract_txt:supervised in 2452) [ClassicSimilarity], result of:
            0.19929308 = score(doc=2452,freq=4.0), product of:
              0.21363948 = queryWeight, product of:
                2.0290697 = boost
                7.462781 = idf(docFreq=68, maxDocs=44218)
                0.014108598 = queryNorm
              0.9328476 = fieldWeight in 2452, product of:
                2.0 = tf(freq=4.0), with freq of:
                  4.0 = termFreq=4.0
                7.462781 = idf(docFreq=68, maxDocs=44218)
                0.0625 = fieldNorm(doc=2452)
          0.09973378 = weight(abstract_txt:machine in 2452) [ClassicSimilarity], result of:
            0.09973378 = score(doc=2452,freq=2.0), product of:
              0.21376415 = queryWeight, product of:
                2.870375 = boost
                5.2785225 = idf(docFreq=612, maxDocs=44218)
                0.014108598 = queryNorm
              0.4665599 = fieldWeight in 2452, product of:
                1.4142135 = tf(freq=2.0), with freq of:
                  2.0 = termFreq=2.0
                5.2785225 = idf(docFreq=612, maxDocs=44218)
                0.0625 = fieldNorm(doc=2452)
          0.43629143 = weight(abstract_txt:learning in 2452) [ClassicSimilarity], result of:
            0.43629143 = score(doc=2452,freq=8.0), product of:
              0.51949126 = queryWeight, product of:
                7.750343 = boost
                4.750873 = idf(docFreq=1038, maxDocs=44218)
                0.014108598 = queryNorm
              0.83984363 = fieldWeight in 2452, product of:
                2.828427 = tf(freq=8.0), with freq of:
                  8.0 = termFreq=8.0
                4.750873 = idf(docFreq=1038, maxDocs=44218)
                0.0625 = fieldNorm(doc=2452)
        0.29166666 = coord(7/24)
    
  3. Xiang, R.; Chersoni, E.; Lu, Q.; Huang, C.-R.; Li, W.; Long, Y.: Lexical data augmentation for sentiment analysis (2021) 0.24
    0.23764667 = sum of:
      0.23764667 = product of:
        0.71294 = sum of:
          0.036641058 = weight(abstract_txt:methods in 392) [ClassicSimilarity], result of:
            0.036641058 = score(doc=392,freq=6.0), product of:
              0.06596237 = queryWeight, product of:
                1.1274682 = boost
                4.146752 = idf(docFreq=1900, maxDocs=44218)
                0.014108598 = queryNorm
              0.5554843 = fieldWeight in 392, product of:
                2.4494898 = tf(freq=6.0), with freq of:
                  6.0 = termFreq=6.0
                4.146752 = idf(docFreq=1900, maxDocs=44218)
                0.0546875 = fieldNorm(doc=392)
          0.029667376 = weight(abstract_txt:models in 392) [ClassicSimilarity], result of:
            0.029667376 = score(doc=392,freq=2.0), product of:
              0.08264389 = queryWeight, product of:
                1.2620064 = boost
                4.6415744 = idf(docFreq=1158, maxDocs=44218)
                0.014108598 = queryNorm
              0.35897845 = fieldWeight in 392, product of:
                1.4142135 = tf(freq=2.0), with freq of:
                  2.0 = termFreq=2.0
                4.6415744 = idf(docFreq=1158, maxDocs=44218)
                0.0546875 = fieldNorm(doc=392)
          0.055171918 = weight(abstract_txt:algorithms in 392) [ClassicSimilarity], result of:
            0.055171918 = score(doc=392,freq=2.0), product of:
              0.124978915 = queryWeight, product of:
                1.5519387 = boost
                5.707926 = idf(docFreq=398, maxDocs=44218)
                0.014108598 = queryNorm
              0.44144982 = fieldWeight in 392, product of:
                1.4142135 = tf(freq=2.0), with freq of:
                  2.0 = termFreq=2.0
                5.707926 = idf(docFreq=398, maxDocs=44218)
                0.0546875 = fieldNorm(doc=392)
          0.04463749 = weight(abstract_txt:accuracy in 392) [ClassicSimilarity], result of:
            0.04463749 = score(doc=392,freq=1.0), product of:
              0.13672078 = queryWeight, product of:
                1.6232053 = boost
                5.9700394 = idf(docFreq=306, maxDocs=44218)
                0.014108598 = queryNorm
              0.32648653 = fieldWeight in 392, product of:
                1.0 = tf(freq=1.0), with freq of:
                  1.0 = termFreq=1.0
                5.9700394 = idf(docFreq=306, maxDocs=44218)
                0.0546875 = fieldNorm(doc=392)
          0.04883775 = weight(abstract_txt:improvement in 392) [ClassicSimilarity], result of:
            0.04883775 = score(doc=392,freq=1.0), product of:
              0.14516829 = queryWeight, product of:
                1.6725999 = boost
                6.1517096 = idf(docFreq=255, maxDocs=44218)
                0.014108598 = queryNorm
              0.3364216 = fieldWeight in 392, product of:
                1.0 = tf(freq=1.0), with freq of:
                  1.0 = termFreq=1.0
                6.1517096 = idf(docFreq=255, maxDocs=44218)
                0.0546875 = fieldNorm(doc=392)
          0.08930068 = weight(abstract_txt:classifiers in 392) [ClassicSimilarity], result of:
            0.08930068 = score(doc=392,freq=1.0), product of:
              0.21707234 = queryWeight, product of:
                2.0453067 = boost
                7.5225 = idf(docFreq=64, maxDocs=44218)
                0.014108598 = queryNorm
              0.41138673 = fieldWeight in 392, product of:
                1.0 = tf(freq=1.0), with freq of:
                  1.0 = termFreq=1.0
                7.5225 = idf(docFreq=64, maxDocs=44218)
                0.0546875 = fieldNorm(doc=392)
          0.10687987 = weight(abstract_txt:machine in 392) [ClassicSimilarity], result of:
            0.10687987 = score(doc=392,freq=3.0), product of:
              0.21376415 = queryWeight, product of:
                2.870375 = boost
                5.2785225 = idf(docFreq=612, maxDocs=44218)
                0.014108598 = queryNorm
              0.4999897 = fieldWeight in 392, product of:
                1.7320508 = tf(freq=3.0), with freq of:
                  3.0 = termFreq=3.0
                5.2785225 = idf(docFreq=612, maxDocs=44218)
                0.0546875 = fieldNorm(doc=392)
          0.30180386 = weight(abstract_txt:learning in 392) [ClassicSimilarity], result of:
            0.30180386 = score(doc=392,freq=5.0), product of:
              0.51949126 = queryWeight, product of:
                7.750343 = boost
                4.750873 = idf(docFreq=1038, maxDocs=44218)
                0.014108598 = queryNorm
              0.5809604 = fieldWeight in 392, product of:
                2.236068 = tf(freq=5.0), with freq of:
                  5.0 = termFreq=5.0
                4.750873 = idf(docFreq=1038, maxDocs=44218)
                0.0546875 = fieldNorm(doc=392)
        0.33333334 = coord(8/24)
    
  4. Li, H.; Wu, H.; Li, D.; Lin, S.; Su, Z.; Luo, X.: PSI: A probabilistic semantic interpretable framework for fine-grained image ranking (2018) 0.21
    0.21388094 = sum of:
      0.21388094 = product of:
        0.6416428 = sum of:
          0.030221034 = weight(abstract_txt:methods in 4577) [ClassicSimilarity], result of:
            0.030221034 = score(doc=4577,freq=2.0), product of:
              0.06596237 = queryWeight, product of:
                1.1274682 = boost
                4.146752 = idf(docFreq=1900, maxDocs=44218)
                0.014108598 = queryNorm
              0.4581557 = fieldWeight in 4577, product of:
                1.4142135 = tf(freq=2.0), with freq of:
                  2.0 = termFreq=2.0
                4.146752 = idf(docFreq=1900, maxDocs=44218)
                0.078125 = fieldNorm(doc=4577)
          0.02378562 = weight(abstract_txt:problems in 4577) [ClassicSimilarity], result of:
            0.02378562 = score(doc=4577,freq=1.0), product of:
              0.070845075 = queryWeight, product of:
                1.1684524 = boost
                4.297489 = idf(docFreq=1634, maxDocs=44218)
                0.014108598 = queryNorm
              0.33574134 = fieldWeight in 4577, product of:
                1.0 = tf(freq=1.0), with freq of:
                  1.0 = termFreq=1.0
                4.297489 = idf(docFreq=1634, maxDocs=44218)
                0.078125 = fieldNorm(doc=4577)
          0.05993715 = weight(abstract_txt:models in 4577) [ClassicSimilarity], result of:
            0.05993715 = score(doc=4577,freq=4.0), product of:
              0.08264389 = queryWeight, product of:
                1.2620064 = boost
                4.6415744 = idf(docFreq=1158, maxDocs=44218)
                0.014108598 = queryNorm
              0.725246 = fieldWeight in 4577, product of:
                2.0 = tf(freq=4.0), with freq of:
                  4.0 = termFreq=4.0
                4.6415744 = idf(docFreq=1158, maxDocs=44218)
                0.078125 = fieldNorm(doc=4577)
          0.06376784 = weight(abstract_txt:accuracy in 4577) [ClassicSimilarity], result of:
            0.06376784 = score(doc=4577,freq=1.0), product of:
              0.13672078 = queryWeight, product of:
                1.6232053 = boost
                5.9700394 = idf(docFreq=306, maxDocs=44218)
                0.014108598 = queryNorm
              0.46640933 = fieldWeight in 4577, product of:
                1.0 = tf(freq=1.0), with freq of:
                  1.0 = termFreq=1.0
                5.9700394 = idf(docFreq=306, maxDocs=44218)
                0.078125 = fieldNorm(doc=4577)
          0.019099273 = weight(abstract_txt:research in 4577) [ClassicSimilarity], result of:
            0.019099273 = score(doc=4577,freq=1.0), product of:
              0.07711187 = queryWeight, product of:
                1.7239783 = boost
                3.170338 = idf(docFreq=5046, maxDocs=44218)
                0.014108598 = queryNorm
              0.24768265 = fieldWeight in 4577, product of:
                1.0 = tf(freq=1.0), with freq of:
                  1.0 = termFreq=1.0
                3.170338 = idf(docFreq=5046, maxDocs=44218)
                0.078125 = fieldNorm(doc=4577)
          0.12455817 = weight(abstract_txt:supervised in 4577) [ClassicSimilarity], result of:
            0.12455817 = score(doc=4577,freq=1.0), product of:
              0.21363948 = queryWeight, product of:
                2.0290697 = boost
                7.462781 = idf(docFreq=68, maxDocs=44218)
                0.014108598 = queryNorm
              0.58302975 = fieldWeight in 4577, product of:
                1.0 = tf(freq=1.0), with freq of:
                  1.0 = termFreq=1.0
                7.462781 = idf(docFreq=68, maxDocs=44218)
                0.078125 = fieldNorm(doc=4577)
          0.047591563 = weight(abstract_txt:current in 4577) [ClassicSimilarity], result of:
            0.047591563 = score(doc=4577,freq=1.0), product of:
              0.1417305 = queryWeight, product of:
                2.3372376 = boost
                4.298101 = idf(docFreq=1633, maxDocs=44218)
                0.014108598 = queryNorm
              0.33578914 = fieldWeight in 4577, product of:
                1.0 = tf(freq=1.0), with freq of:
                  1.0 = termFreq=1.0
                4.298101 = idf(docFreq=1633, maxDocs=44218)
                0.078125 = fieldNorm(doc=4577)
          0.27268216 = weight(abstract_txt:learning in 4577) [ClassicSimilarity], result of:
            0.27268216 = score(doc=4577,freq=2.0), product of:
              0.51949126 = queryWeight, product of:
                7.750343 = boost
                4.750873 = idf(docFreq=1038, maxDocs=44218)
                0.014108598 = queryNorm
              0.5249023 = fieldWeight in 4577, product of:
                1.4142135 = tf(freq=2.0), with freq of:
                  2.0 = termFreq=2.0
                4.750873 = idf(docFreq=1038, maxDocs=44218)
                0.078125 = fieldNorm(doc=4577)
        0.33333334 = coord(8/24)
    
  5. Cardie, C.: Empirical methods in information extraction (1997) 0.21
    0.21019608 = sum of:
      0.21019608 = product of:
        0.8407843 = sum of:
          0.034191195 = weight(abstract_txt:methods in 3246) [ClassicSimilarity], result of:
            0.034191195 = score(doc=3246,freq=1.0), product of:
              0.06596237 = queryWeight, product of:
                1.1274682 = boost
                4.146752 = idf(docFreq=1900, maxDocs=44218)
                0.014108598 = queryNorm
              0.518344 = fieldWeight in 3246, product of:
                1.0 = tf(freq=1.0), with freq of:
                  1.0 = termFreq=1.0
                4.146752 = idf(docFreq=1900, maxDocs=44218)
                0.125 = fieldNorm(doc=3246)
          0.038056992 = weight(abstract_txt:problems in 3246) [ClassicSimilarity], result of:
            0.038056992 = score(doc=3246,freq=1.0), product of:
              0.070845075 = queryWeight, product of:
                1.1684524 = boost
                4.297489 = idf(docFreq=1634, maxDocs=44218)
                0.014108598 = queryNorm
              0.53718615 = fieldWeight in 3246, product of:
                1.0 = tf(freq=1.0), with freq of:
                  1.0 = termFreq=1.0
                4.297489 = idf(docFreq=1634, maxDocs=44218)
                0.125 = fieldNorm(doc=3246)
          0.0891713 = weight(abstract_txt:algorithms in 3246) [ClassicSimilarity], result of:
            0.0891713 = score(doc=3246,freq=1.0), product of:
              0.124978915 = queryWeight, product of:
                1.5519387 = boost
                5.707926 = idf(docFreq=398, maxDocs=44218)
                0.014108598 = queryNorm
              0.7134907 = fieldWeight in 3246, product of:
                1.0 = tf(freq=1.0), with freq of:
                  1.0 = termFreq=1.0
                5.707926 = idf(docFreq=398, maxDocs=44218)
                0.125 = fieldNorm(doc=3246)
          0.10202855 = weight(abstract_txt:accuracy in 3246) [ClassicSimilarity], result of:
            0.10202855 = score(doc=3246,freq=1.0), product of:
              0.13672078 = queryWeight, product of:
                1.6232053 = boost
                5.9700394 = idf(docFreq=306, maxDocs=44218)
                0.014108598 = queryNorm
              0.7462549 = fieldWeight in 3246, product of:
                1.0 = tf(freq=1.0), with freq of:
                  1.0 = termFreq=1.0
                5.9700394 = idf(docFreq=306, maxDocs=44218)
                0.125 = fieldNorm(doc=3246)
          0.14104486 = weight(abstract_txt:machine in 3246) [ClassicSimilarity], result of:
            0.14104486 = score(doc=3246,freq=1.0), product of:
              0.21376415 = queryWeight, product of:
                2.870375 = boost
                5.2785225 = idf(docFreq=612, maxDocs=44218)
                0.014108598 = queryNorm
              0.6598153 = fieldWeight in 3246, product of:
                1.0 = tf(freq=1.0), with freq of:
                  1.0 = termFreq=1.0
                5.2785225 = idf(docFreq=612, maxDocs=44218)
                0.125 = fieldNorm(doc=3246)
          0.43629143 = weight(abstract_txt:learning in 3246) [ClassicSimilarity], result of:
            0.43629143 = score(doc=3246,freq=2.0), product of:
              0.51949126 = queryWeight, product of:
                7.750343 = boost
                4.750873 = idf(docFreq=1038, maxDocs=44218)
                0.014108598 = queryNorm
              0.83984363 = fieldWeight in 3246, product of:
                1.4142135 = tf(freq=2.0), with freq of:
                  2.0 = termFreq=2.0
                4.750873 = idf(docFreq=1038, maxDocs=44218)
                0.125 = fieldNorm(doc=3246)
        0.25 = coord(6/24)