Search (76 results, page 1 of 4)

Tiefschürfen in Datenbanken (2002) 0.03

0.034505457 = product of:
  0.075912006 = sum of:
    0.007251961 = product of:
      0.014503922 = sum of:
        0.014503922 = weight(_text_:h in 996) [ClassicSimilarity], result of:
          0.014503922 = score(doc=996,freq=2.0), product of:
            0.0660481 = queryWeight, product of:
              2.4844491 = idf(docFreq=10020, maxDocs=44218)
              0.026584605 = queryNorm
            0.21959636 = fieldWeight in 996, product of:
              1.4142135 = tf(freq=2.0), with freq of:
                2.0 = termFreq=2.0
              2.4844491 = idf(docFreq=10020, maxDocs=44218)
              0.0625 = fieldNorm(doc=996)
      0.5 = coord(1/2)
    0.0031240587 = weight(_text_:a in 996) [ClassicSimilarity], result of:
      0.0031240587 = score(doc=996,freq=2.0), product of:
        0.030653298 = queryWeight, product of:
          1.153047 = idf(docFreq=37942, maxDocs=44218)
          0.026584605 = queryNorm
        0.10191591 = fieldWeight in 996, product of:
          1.4142135 = tf(freq=2.0), with freq of:
            2.0 = termFreq=2.0
          1.153047 = idf(docFreq=37942, maxDocs=44218)
          0.0625 = fieldNorm(doc=996)
    0.036413636 = weight(_text_:r in 996) [ClassicSimilarity], result of:
      0.036413636 = score(doc=996,freq=4.0), product of:
        0.088001914 = queryWeight, product of:
          3.3102584 = idf(docFreq=4387, maxDocs=44218)
          0.026584605 = queryNorm
        0.4137823 = fieldWeight in 996, product of:
          2.0 = tf(freq=4.0), with freq of:
            4.0 = termFreq=4.0
          3.3102584 = idf(docFreq=4387, maxDocs=44218)
          0.0625 = fieldNorm(doc=996)
    0.00392816 = weight(_text_:s in 996) [ClassicSimilarity], result of:
      0.00392816 = score(doc=996,freq=4.0), product of:
        0.028903782 = queryWeight, product of:
          1.0872376 = idf(docFreq=40523, maxDocs=44218)
          0.026584605 = queryNorm
        0.1359047 = fieldWeight in 996, product of:
          2.0 = tf(freq=4.0), with freq of:
            4.0 = termFreq=4.0
          1.0872376 = idf(docFreq=40523, maxDocs=44218)
          0.0625 = fieldNorm(doc=996)
    0.025194194 = weight(_text_:u in 996) [ClassicSimilarity], result of:
      0.025194194 = score(doc=996,freq=2.0), product of:
        0.08704981 = queryWeight, product of:
          3.2744443 = idf(docFreq=4547, maxDocs=44218)
          0.026584605 = queryNorm
        0.28942272 = fieldWeight in 996, product of:
          1.4142135 = tf(freq=2.0), with freq of:
            2.0 = termFreq=2.0
          3.2744443 = idf(docFreq=4547, maxDocs=44218)
          0.0625 = fieldNorm(doc=996)
  0.45454547 = coord(5/11)

Content: Enthält die Beiträge: Kruse, R., C. Borgelt: Suche im Datendschungel - Borgelt, C. u. R. Kruse: Unsicheres Wissen nutzen - Wrobel, S.: Lern- und Entdeckungsverfahren - Keim, D.A.: Data Mining mit bloßem Auge
Source: Spektrum der Wissenschaft. 2002, H.11, S.80-91
Type: a

Kruse, R.; Borgelt, C.: Suche im Datendschungel (2002) 0.02

0.02121926 = product of:
  0.058352962 = sum of:
    0.010877941 = product of:
      0.021755882 = sum of:
        0.021755882 = weight(_text_:h in 1087) [ClassicSimilarity], result of:
          0.021755882 = score(doc=1087,freq=2.0), product of:
            0.0660481 = queryWeight, product of:
              2.4844491 = idf(docFreq=10020, maxDocs=44218)
              0.026584605 = queryNorm
            0.32939452 = fieldWeight in 1087, product of:
              1.4142135 = tf(freq=2.0), with freq of:
                2.0 = termFreq=2.0
              2.4844491 = idf(docFreq=10020, maxDocs=44218)
              0.09375 = fieldNorm(doc=1087)
      0.5 = coord(1/2)
    0.0046860883 = weight(_text_:a in 1087) [ClassicSimilarity], result of:
      0.0046860883 = score(doc=1087,freq=2.0), product of:
        0.030653298 = queryWeight, product of:
          1.153047 = idf(docFreq=37942, maxDocs=44218)
          0.026584605 = queryNorm
        0.15287387 = fieldWeight in 1087, product of:
          1.4142135 = tf(freq=2.0), with freq of:
            2.0 = termFreq=2.0
          1.153047 = idf(docFreq=37942, maxDocs=44218)
          0.09375 = fieldNorm(doc=1087)
    0.03862249 = weight(_text_:r in 1087) [ClassicSimilarity], result of:
      0.03862249 = score(doc=1087,freq=2.0), product of:
        0.088001914 = queryWeight, product of:
          3.3102584 = idf(docFreq=4387, maxDocs=44218)
          0.026584605 = queryNorm
        0.4388824 = fieldWeight in 1087, product of:
          1.4142135 = tf(freq=2.0), with freq of:
            2.0 = termFreq=2.0
          3.3102584 = idf(docFreq=4387, maxDocs=44218)
          0.09375 = fieldNorm(doc=1087)
    0.0041664424 = weight(_text_:s in 1087) [ClassicSimilarity], result of:
      0.0041664424 = score(doc=1087,freq=2.0), product of:
        0.028903782 = queryWeight, product of:
          1.0872376 = idf(docFreq=40523, maxDocs=44218)
          0.026584605 = queryNorm
        0.14414869 = fieldWeight in 1087, product of:
          1.4142135 = tf(freq=2.0), with freq of:
            2.0 = termFreq=2.0
          1.0872376 = idf(docFreq=40523, maxDocs=44218)
          0.09375 = fieldNorm(doc=1087)
  0.36363637 = coord(4/11)

Source: Spektrum der Wissenschaft. 2002, H.11, S.80-81
Type: a

Schwartz, D.: Graphische Datenanalyse für digitale Bibliotheken : Leistungs- und Funktionsumfang moderner Analyse- und Visualisierungsinstrumente (2006) 0.02

0.019421732 = product of:
  0.053409763 = sum of:
    0.0027335514 = weight(_text_:a in 30) [ClassicSimilarity], result of:
      0.0027335514 = score(doc=30,freq=2.0), product of:
        0.030653298 = queryWeight, product of:
          1.153047 = idf(docFreq=37942, maxDocs=44218)
          0.026584605 = queryNorm
        0.089176424 = fieldWeight in 30, product of:
          1.4142135 = tf(freq=2.0), with freq of:
            2.0 = termFreq=2.0
          1.153047 = idf(docFreq=37942, maxDocs=44218)
          0.0546875 = fieldNorm(doc=30)
    0.0024304248 = weight(_text_:s in 30) [ClassicSimilarity], result of:
      0.0024304248 = score(doc=30,freq=2.0), product of:
        0.028903782 = queryWeight, product of:
          1.0872376 = idf(docFreq=40523, maxDocs=44218)
          0.026584605 = queryNorm
        0.08408674 = fieldWeight in 30, product of:
          1.4142135 = tf(freq=2.0), with freq of:
            2.0 = termFreq=2.0
          1.0872376 = idf(docFreq=40523, maxDocs=44218)
          0.0546875 = fieldNorm(doc=30)
    0.02204492 = weight(_text_:u in 30) [ClassicSimilarity], result of:
      0.02204492 = score(doc=30,freq=2.0), product of:
        0.08704981 = queryWeight, product of:
          3.2744443 = idf(docFreq=4547, maxDocs=44218)
          0.026584605 = queryNorm
        0.25324488 = fieldWeight in 30, product of:
          1.4142135 = tf(freq=2.0), with freq of:
            2.0 = termFreq=2.0
          3.2744443 = idf(docFreq=4547, maxDocs=44218)
          0.0546875 = fieldNorm(doc=30)
    0.02620087 = weight(_text_:k in 30) [ClassicSimilarity], result of:
      0.02620087 = score(doc=30,freq=2.0), product of:
        0.09490114 = queryWeight, product of:
          3.569778 = idf(docFreq=3384, maxDocs=44218)
          0.026584605 = queryNorm
        0.27608594 = fieldWeight in 30, product of:
          1.4142135 = tf(freq=2.0), with freq of:
            2.0 = termFreq=2.0
          3.569778 = idf(docFreq=3384, maxDocs=44218)
          0.0546875 = fieldNorm(doc=30)
  0.36363637 = coord(4/11)

Pages: S.273-291
Source: Vom Wandel der Wissensorganisation im Informationszeitalter: Festschrift für Walther Umstätter zum 65. Geburtstag, hrsg. von P. Hauke u. K. Umlauf
Type: a

Baumgartner, R.: Methoden und Werkzeuge zur Webdatenextraktion (2006) 0.02

0.018498529 = product of:
  0.050870955 = sum of:
    0.003865826 = weight(_text_:a in 5808) [ClassicSimilarity], result of:
      0.003865826 = score(doc=5808,freq=4.0), product of:
        0.030653298 = queryWeight, product of:
          1.153047 = idf(docFreq=37942, maxDocs=44218)
          0.026584605 = queryNorm
        0.12611452 = fieldWeight in 5808, product of:
          2.0 = tf(freq=4.0), with freq of:
            4.0 = termFreq=4.0
          1.153047 = idf(docFreq=37942, maxDocs=44218)
          0.0546875 = fieldNorm(doc=5808)
    0.022529786 = weight(_text_:r in 5808) [ClassicSimilarity], result of:
      0.022529786 = score(doc=5808,freq=2.0), product of:
        0.088001914 = queryWeight, product of:
          3.3102584 = idf(docFreq=4387, maxDocs=44218)
          0.026584605 = queryNorm
        0.25601473 = fieldWeight in 5808, product of:
          1.4142135 = tf(freq=2.0), with freq of:
            2.0 = termFreq=2.0
          3.3102584 = idf(docFreq=4387, maxDocs=44218)
          0.0546875 = fieldNorm(doc=5808)
    0.0024304248 = weight(_text_:s in 5808) [ClassicSimilarity], result of:
      0.0024304248 = score(doc=5808,freq=2.0), product of:
        0.028903782 = queryWeight, product of:
          1.0872376 = idf(docFreq=40523, maxDocs=44218)
          0.026584605 = queryNorm
        0.08408674 = fieldWeight in 5808, product of:
          1.4142135 = tf(freq=2.0), with freq of:
            2.0 = termFreq=2.0
          1.0872376 = idf(docFreq=40523, maxDocs=44218)
          0.0546875 = fieldNorm(doc=5808)
    0.02204492 = weight(_text_:u in 5808) [ClassicSimilarity], result of:
      0.02204492 = score(doc=5808,freq=2.0), product of:
        0.08704981 = queryWeight, product of:
          3.2744443 = idf(docFreq=4547, maxDocs=44218)
          0.026584605 = queryNorm
        0.25324488 = fieldWeight in 5808, product of:
          1.4142135 = tf(freq=2.0), with freq of:
            2.0 = termFreq=2.0
          3.2744443 = idf(docFreq=4547, maxDocs=44218)
          0.0546875 = fieldNorm(doc=5808)
  0.36363637 = coord(4/11)

Pages: S.419-435
Source: Semantic Web: Wege zur vernetzten Wissensgesellschaft. Hrsg.: T. Pellegrini, u. A. Blumauer
Type: a

Borgelt, C.; Kruse, R.: Unsicheres Wissen nutzen (2002) 0.02

0.017682716 = product of:
  0.04862747 = sum of:
    0.009064952 = product of:
      0.018129904 = sum of:
        0.018129904 = weight(_text_:h in 1104) [ClassicSimilarity], result of:
          0.018129904 = score(doc=1104,freq=2.0), product of:
            0.0660481 = queryWeight, product of:
              2.4844491 = idf(docFreq=10020, maxDocs=44218)
              0.026584605 = queryNorm
            0.27449545 = fieldWeight in 1104, product of:
              1.4142135 = tf(freq=2.0), with freq of:
                2.0 = termFreq=2.0
              2.4844491 = idf(docFreq=10020, maxDocs=44218)
              0.078125 = fieldNorm(doc=1104)
      0.5 = coord(1/2)
    0.0039050733 = weight(_text_:a in 1104) [ClassicSimilarity], result of:
      0.0039050733 = score(doc=1104,freq=2.0), product of:
        0.030653298 = queryWeight, product of:
          1.153047 = idf(docFreq=37942, maxDocs=44218)
          0.026584605 = queryNorm
        0.12739488 = fieldWeight in 1104, product of:
          1.4142135 = tf(freq=2.0), with freq of:
            2.0 = termFreq=2.0
          1.153047 = idf(docFreq=37942, maxDocs=44218)
          0.078125 = fieldNorm(doc=1104)
    0.03218541 = weight(_text_:r in 1104) [ClassicSimilarity], result of:
      0.03218541 = score(doc=1104,freq=2.0), product of:
        0.088001914 = queryWeight, product of:
          3.3102584 = idf(docFreq=4387, maxDocs=44218)
          0.026584605 = queryNorm
        0.36573532 = fieldWeight in 1104, product of:
          1.4142135 = tf(freq=2.0), with freq of:
            2.0 = termFreq=2.0
          3.3102584 = idf(docFreq=4387, maxDocs=44218)
          0.078125 = fieldNorm(doc=1104)
    0.0034720355 = weight(_text_:s in 1104) [ClassicSimilarity], result of:
      0.0034720355 = score(doc=1104,freq=2.0), product of:
        0.028903782 = queryWeight, product of:
          1.0872376 = idf(docFreq=40523, maxDocs=44218)
          0.026584605 = queryNorm
        0.120123915 = fieldWeight in 1104, product of:
          1.4142135 = tf(freq=2.0), with freq of:
            2.0 = termFreq=2.0
          1.0872376 = idf(docFreq=40523, maxDocs=44218)
          0.078125 = fieldNorm(doc=1104)
  0.36363637 = coord(4/11)

Source: Spektrum der Wissenschaft. 2002, H.11, S.82-84
Type: a

Ohly, H.P.: Bibliometric mining : added value from document analysis and retrieval (2008) 0.02

0.016960982 = product of:
  0.0466427 = sum of:
    0.0023430442 = weight(_text_:a in 2386) [ClassicSimilarity], result of:
      0.0023430442 = score(doc=2386,freq=2.0), product of:
        0.030653298 = queryWeight, product of:
          1.153047 = idf(docFreq=37942, maxDocs=44218)
          0.026584605 = queryNorm
        0.07643694 = fieldWeight in 2386, product of:
          1.4142135 = tf(freq=2.0), with freq of:
            2.0 = termFreq=2.0
          1.153047 = idf(docFreq=37942, maxDocs=44218)
          0.046875 = fieldNorm(doc=2386)
    0.00294612 = weight(_text_:s in 2386) [ClassicSimilarity], result of:
      0.00294612 = score(doc=2386,freq=4.0), product of:
        0.028903782 = queryWeight, product of:
          1.0872376 = idf(docFreq=40523, maxDocs=44218)
          0.026584605 = queryNorm
        0.101928525 = fieldWeight in 2386, product of:
          2.0 = tf(freq=4.0), with freq of:
            4.0 = termFreq=4.0
          1.0872376 = idf(docFreq=40523, maxDocs=44218)
          0.046875 = fieldNorm(doc=2386)
    0.018895645 = weight(_text_:u in 2386) [ClassicSimilarity], result of:
      0.018895645 = score(doc=2386,freq=2.0), product of:
        0.08704981 = queryWeight, product of:
          3.2744443 = idf(docFreq=4547, maxDocs=44218)
          0.026584605 = queryNorm
        0.21706703 = fieldWeight in 2386, product of:
          1.4142135 = tf(freq=2.0), with freq of:
            2.0 = termFreq=2.0
          3.2744443 = idf(docFreq=4547, maxDocs=44218)
          0.046875 = fieldNorm(doc=2386)
    0.022457888 = weight(_text_:k in 2386) [ClassicSimilarity], result of:
      0.022457888 = score(doc=2386,freq=2.0), product of:
        0.09490114 = queryWeight, product of:
          3.569778 = idf(docFreq=3384, maxDocs=44218)
          0.026584605 = queryNorm
        0.23664509 = fieldWeight in 2386, product of:
          1.4142135 = tf(freq=2.0), with freq of:
            2.0 = termFreq=2.0
          3.569778 = idf(docFreq=3384, maxDocs=44218)
          0.046875 = fieldNorm(doc=2386)
  0.36363637 = coord(4/11)

Pages: S.181-186
Source: Kompatibilität, Medien und Ethik in der Wissensorganisation - Compatibility, Media and Ethics in Knowledge Organization: Proceedings der 10. Tagung der Deutschen Sektion der Internationalen Gesellschaft für Wissensorganisation Wien, 3.-5. Juli 2006 - Proceedings of the 10th Conference of the German Section of the International Society of Knowledge Organization Vienna, 3-5 July 2006. Ed.: H.P. Ohly, S. Netscher u. K. Mitgutsch
Type: a

Relational data mining (2001) 0.02

0.016909536 = product of:
  0.046501223 = sum of:
    0.0046860883 = weight(_text_:a in 1303) [ClassicSimilarity], result of:
      0.0046860883 = score(doc=1303,freq=8.0), product of:
        0.030653298 = queryWeight, product of:
          1.153047 = idf(docFreq=37942, maxDocs=44218)
          0.026584605 = queryNorm
        0.15287387 = fieldWeight in 1303, product of:
          2.828427 = tf(freq=8.0), with freq of:
            8.0 = termFreq=8.0
          1.153047 = idf(docFreq=37942, maxDocs=44218)
          0.046875 = fieldNorm(doc=1303)
    0.019311246 = weight(_text_:r in 1303) [ClassicSimilarity], result of:
      0.019311246 = score(doc=1303,freq=2.0), product of:
        0.088001914 = queryWeight, product of:
          3.3102584 = idf(docFreq=4387, maxDocs=44218)
          0.026584605 = queryNorm
        0.2194412 = fieldWeight in 1303, product of:
          1.4142135 = tf(freq=2.0), with freq of:
            2.0 = termFreq=2.0
          3.3102584 = idf(docFreq=4387, maxDocs=44218)
          0.046875 = fieldNorm(doc=1303)
    0.0036082454 = weight(_text_:s in 1303) [ClassicSimilarity], result of:
      0.0036082454 = score(doc=1303,freq=6.0), product of:
        0.028903782 = queryWeight, product of:
          1.0872376 = idf(docFreq=40523, maxDocs=44218)
          0.026584605 = queryNorm
        0.124836445 = fieldWeight in 1303, product of:
          2.4494898 = tf(freq=6.0), with freq of:
            6.0 = termFreq=6.0
          1.0872376 = idf(docFreq=40523, maxDocs=44218)
          0.046875 = fieldNorm(doc=1303)
    0.018895645 = weight(_text_:u in 1303) [ClassicSimilarity], result of:
      0.018895645 = score(doc=1303,freq=2.0), product of:
        0.08704981 = queryWeight, product of:
          3.2744443 = idf(docFreq=4547, maxDocs=44218)
          0.026584605 = queryNorm
        0.21706703 = fieldWeight in 1303, product of:
          1.4142135 = tf(freq=2.0), with freq of:
            2.0 = termFreq=2.0
          3.2744443 = idf(docFreq=4547, maxDocs=44218)
          0.046875 = fieldNorm(doc=1303)
  0.36363637 = coord(4/11)

Abstract: As the first book devoted to relational data mining, this coherently written multi-author monograph provides a thorough introduction and systematic overview of the area. The first part introduces the reader to the basics and principles of classical knowledge discovery in databases and inductive logic programming; subsequent chapters by leading experts assess the techniques in relational data mining in a principled and comprehensive way; finally, three chapters deal with advanced applications in various fields and refer the reader to resources for relational data mining. This book will become a valuable source of reference for R&D professionals active in relational data mining. Students as well as IT professionals and ambitioned practitioners interested in learning about relational data mining will appreciate the book as a useful text and gentle introduction to this exciting new field.
Editor: Dzeroski, S. u. N. Lavrac
Pages: XIX,398 S
Type: s

Heyer, G.; Läuter, M.; Quasthoff, U.; Wolff, C.: Texttechnologische Anwendungen am Beispiel Text Mining (2000) 0.02

0.0166472 = product of:
  0.0457798 = sum of:
    0.0023430442 = weight(_text_:a in 5565) [ClassicSimilarity], result of:
      0.0023430442 = score(doc=5565,freq=2.0), product of:
        0.030653298 = queryWeight, product of:
          1.153047 = idf(docFreq=37942, maxDocs=44218)
          0.026584605 = queryNorm
        0.07643694 = fieldWeight in 5565, product of:
          1.4142135 = tf(freq=2.0), with freq of:
            2.0 = termFreq=2.0
          1.153047 = idf(docFreq=37942, maxDocs=44218)
          0.046875 = fieldNorm(doc=5565)
    0.0020832212 = weight(_text_:s in 5565) [ClassicSimilarity], result of:
      0.0020832212 = score(doc=5565,freq=2.0), product of:
        0.028903782 = queryWeight, product of:
          1.0872376 = idf(docFreq=40523, maxDocs=44218)
          0.026584605 = queryNorm
        0.072074346 = fieldWeight in 5565, product of:
          1.4142135 = tf(freq=2.0), with freq of:
            2.0 = termFreq=2.0
          1.0872376 = idf(docFreq=40523, maxDocs=44218)
          0.046875 = fieldNorm(doc=5565)
    0.018895645 = weight(_text_:u in 5565) [ClassicSimilarity], result of:
      0.018895645 = score(doc=5565,freq=2.0), product of:
        0.08704981 = queryWeight, product of:
          3.2744443 = idf(docFreq=4547, maxDocs=44218)
          0.026584605 = queryNorm
        0.21706703 = fieldWeight in 5565, product of:
          1.4142135 = tf(freq=2.0), with freq of:
            2.0 = termFreq=2.0
          3.2744443 = idf(docFreq=4547, maxDocs=44218)
          0.046875 = fieldNorm(doc=5565)
    0.022457888 = weight(_text_:k in 5565) [ClassicSimilarity], result of:
      0.022457888 = score(doc=5565,freq=2.0), product of:
        0.09490114 = queryWeight, product of:
          3.569778 = idf(docFreq=3384, maxDocs=44218)
          0.026584605 = queryNorm
        0.23664509 = fieldWeight in 5565, product of:
          1.4142135 = tf(freq=2.0), with freq of:
            2.0 = termFreq=2.0
          3.569778 = idf(docFreq=3384, maxDocs=44218)
          0.046875 = fieldNorm(doc=5565)
  0.36363637 = coord(4/11)

Pages: S.203-209
Source: Sprachtechnologie für eine dynamische Wirtschaft im Medienzeitalter - Language technologies for dynamic business in the age of the media - L'ingénierie linguistique au service de la dynamisation économique à l'ère du multimédia: Tagungsakten der XXVI. Jahrestagung der Internationalen Vereinigung Sprache und Wirtschaft e.V., 23.-25.11.2000, Fachhochschule Köln. Hrsg.: K.-D. Schmitz
Type: a

Hereth, J.; Stumme, G.; Wille, R.; Wille, U.: Conceptual knowledge discovery and data analysis (2000) 0.02

0.01637223 = product of:
  0.04502363 = sum of:
    0.004782719 = weight(_text_:a in 5083) [ClassicSimilarity], result of:
      0.004782719 = score(doc=5083,freq=12.0), product of:
        0.030653298 = queryWeight, product of:
          1.153047 = idf(docFreq=37942, maxDocs=44218)
          0.026584605 = queryNorm
        0.15602624 = fieldWeight in 5083, product of:
          3.4641016 = tf(freq=12.0), with freq of:
            12.0 = termFreq=12.0
          1.153047 = idf(docFreq=37942, maxDocs=44218)
          0.0390625 = fieldNorm(doc=5083)
    0.022758523 = weight(_text_:r in 5083) [ClassicSimilarity], result of:
      0.022758523 = score(doc=5083,freq=4.0), product of:
        0.088001914 = queryWeight, product of:
          3.3102584 = idf(docFreq=4387, maxDocs=44218)
          0.026584605 = queryNorm
        0.25861394 = fieldWeight in 5083, product of:
          2.0 = tf(freq=4.0), with freq of:
            4.0 = termFreq=4.0
          3.3102584 = idf(docFreq=4387, maxDocs=44218)
          0.0390625 = fieldNorm(doc=5083)
    0.0017360178 = weight(_text_:s in 5083) [ClassicSimilarity], result of:
      0.0017360178 = score(doc=5083,freq=2.0), product of:
        0.028903782 = queryWeight, product of:
          1.0872376 = idf(docFreq=40523, maxDocs=44218)
          0.026584605 = queryNorm
        0.060061958 = fieldWeight in 5083, product of:
          1.4142135 = tf(freq=2.0), with freq of:
            2.0 = termFreq=2.0
          1.0872376 = idf(docFreq=40523, maxDocs=44218)
          0.0390625 = fieldNorm(doc=5083)
    0.015746372 = weight(_text_:u in 5083) [ClassicSimilarity], result of:
      0.015746372 = score(doc=5083,freq=2.0), product of:
        0.08704981 = queryWeight, product of:
          3.2744443 = idf(docFreq=4547, maxDocs=44218)
          0.026584605 = queryNorm
        0.1808892 = fieldWeight in 5083, product of:
          1.4142135 = tf(freq=2.0), with freq of:
            2.0 = termFreq=2.0
          3.2744443 = idf(docFreq=4547, maxDocs=44218)
          0.0390625 = fieldNorm(doc=5083)
  0.36363637 = coord(4/11)

Abstract: In this paper, we discuss Conceptual Knowledge Discovery in Databases (CKDD) in its connection with Data Analysis. Our approach is based on Formal Concept Analysis, a mathematical theory which has been developed and proven useful during the last 20 years. Formal Concept Analysis has led to a theory of conceptual information systems which has been applied by using the management system TOSCANA in a wide range of domains. In this paper, we use such an application in database marketing to demonstrate how methods and procedures of CKDD can be applied in Data Analysis. In particular, we show the interplay and integration of data mining and data analysis techniques based on Formal Concept Analysis. The main concern of this paper is to explain how the transition from data to knowledge can be supported by a TOSCANA system. To clarify the transition steps we discuss their correspondence to the five levels of knowledge representation established by R. Brachman and to the steps of empirically grounded theory building proposed by A. Strauss and J. Corbin
Pages: S.421-437
Type: a

Keim, D.A.: Datenvisualisierung und Data Mining (2004) 0.01

0.012919139 = product of:
  0.03552763 = sum of:
    0.0019525366 = weight(_text_:a in 2931) [ClassicSimilarity], result of:
      0.0019525366 = score(doc=2931,freq=2.0), product of:
        0.030653298 = queryWeight, product of:
          1.153047 = idf(docFreq=37942, maxDocs=44218)
          0.026584605 = queryNorm
        0.06369744 = fieldWeight in 2931, product of:
          1.4142135 = tf(freq=2.0), with freq of:
            2.0 = termFreq=2.0
          1.153047 = idf(docFreq=37942, maxDocs=44218)
          0.0390625 = fieldNorm(doc=2931)
    0.016092705 = weight(_text_:r in 2931) [ClassicSimilarity], result of:
      0.016092705 = score(doc=2931,freq=2.0), product of:
        0.088001914 = queryWeight, product of:
          3.3102584 = idf(docFreq=4387, maxDocs=44218)
          0.026584605 = queryNorm
        0.18286766 = fieldWeight in 2931, product of:
          1.4142135 = tf(freq=2.0), with freq of:
            2.0 = termFreq=2.0
          3.3102584 = idf(docFreq=4387, maxDocs=44218)
          0.0390625 = fieldNorm(doc=2931)
    0.0017360178 = weight(_text_:s in 2931) [ClassicSimilarity], result of:
      0.0017360178 = score(doc=2931,freq=2.0), product of:
        0.028903782 = queryWeight, product of:
          1.0872376 = idf(docFreq=40523, maxDocs=44218)
          0.026584605 = queryNorm
        0.060061958 = fieldWeight in 2931, product of:
          1.4142135 = tf(freq=2.0), with freq of:
            2.0 = termFreq=2.0
          1.0872376 = idf(docFreq=40523, maxDocs=44218)
          0.0390625 = fieldNorm(doc=2931)
    0.015746372 = weight(_text_:u in 2931) [ClassicSimilarity], result of:
      0.015746372 = score(doc=2931,freq=2.0), product of:
        0.08704981 = queryWeight, product of:
          3.2744443 = idf(docFreq=4547, maxDocs=44218)
          0.026584605 = queryNorm
        0.1808892 = fieldWeight in 2931, product of:
          1.4142135 = tf(freq=2.0), with freq of:
            2.0 = termFreq=2.0
          3.2744443 = idf(docFreq=4547, maxDocs=44218)
          0.0390625 = fieldNorm(doc=2931)
  0.36363637 = coord(4/11)

Pages: S.363-370
Source: Grundlagen der praktischen Information und Dokumentation. 5., völlig neu gefaßte Ausgabe. 2 Bde. Hrsg. von R. Kuhlen, Th. Seeger u. D. Strauch. Begründet von Klaus Laisiepen, Ernst Lutterbeck, Karl-Heinrich Meyer-Uhlenried. Bd.1: Handbuch zur Einführung in die Informationswissenschaft und -praxis
Type: a

Kulathuramaiyer, N.; Maurer, H.: Implications of emerging data mining (2009) 0.01

0.01186071 = product of:
  0.03261695 = sum of:
    0.0054389704 = product of:
      0.010877941 = sum of:
        0.010877941 = weight(_text_:h in 3144) [ClassicSimilarity], result of:
          0.010877941 = score(doc=3144,freq=2.0), product of:
            0.0660481 = queryWeight, product of:
              2.4844491 = idf(docFreq=10020, maxDocs=44218)
              0.026584605 = queryNorm
            0.16469726 = fieldWeight in 3144, product of:
              1.4142135 = tf(freq=2.0), with freq of:
                2.0 = termFreq=2.0
              2.4844491 = idf(docFreq=10020, maxDocs=44218)
              0.046875 = fieldNorm(doc=3144)
      0.5 = coord(1/2)
    0.0061991126 = weight(_text_:a in 3144) [ClassicSimilarity], result of:
      0.0061991126 = score(doc=3144,freq=14.0), product of:
        0.030653298 = queryWeight, product of:
          1.153047 = idf(docFreq=37942, maxDocs=44218)
          0.026584605 = queryNorm
        0.20223314 = fieldWeight in 3144, product of:
          3.7416575 = tf(freq=14.0), with freq of:
            14.0 = termFreq=14.0
          1.153047 = idf(docFreq=37942, maxDocs=44218)
          0.046875 = fieldNorm(doc=3144)
    0.0020832212 = weight(_text_:s in 3144) [ClassicSimilarity], result of:
      0.0020832212 = score(doc=3144,freq=2.0), product of:
        0.028903782 = queryWeight, product of:
          1.0872376 = idf(docFreq=40523, maxDocs=44218)
          0.026584605 = queryNorm
        0.072074346 = fieldWeight in 3144, product of:
          1.4142135 = tf(freq=2.0), with freq of:
            2.0 = termFreq=2.0
          1.0872376 = idf(docFreq=40523, maxDocs=44218)
          0.046875 = fieldNorm(doc=3144)
    0.018895645 = weight(_text_:u in 3144) [ClassicSimilarity], result of:
      0.018895645 = score(doc=3144,freq=2.0), product of:
        0.08704981 = queryWeight, product of:
          3.2744443 = idf(docFreq=4547, maxDocs=44218)
          0.026584605 = queryNorm
        0.21706703 = fieldWeight in 3144, product of:
          1.4142135 = tf(freq=2.0), with freq of:
            2.0 = termFreq=2.0
          3.2744443 = idf(docFreq=4547, maxDocs=44218)
          0.046875 = fieldNorm(doc=3144)
  0.36363637 = coord(4/11)

Abstract: Data Mining describes a technology that discovers non-trivial hidden patterns in a large collection of data. Although this technology has a tremendous impact on our lives, the invaluable contributions of this invisible technology often go unnoticed. This paper discusses advances in data mining while focusing on the emerging data mining capability. Such data mining applications perform multidimensional mining on a wide variety of heterogeneous data sources, providing solutions to many unresolved problems. This paper also highlights the advantages and disadvantages arising from the ever-expanding scope of data mining. Data Mining augments human intelligence by equipping us with a wealth of knowledge and by empowering us to perform our daily tasks better. As the mining scope and capacity increases, users and organizations become more willing to compromise privacy. The huge data stores of the 'master miners' allow them to gain deep insights into individual lifestyles and their social and behavioural patterns. Data integration and analysis capability of combining business and financial trends together with the ability to deterministically track market changes will drastically affect our lives.
Pages: S.469-483
Source: Social Semantic Web: Web 2.0, was nun? Hrsg.: A. Blumauer u. T. Pellegrini
Type: a

Lackes, R.; Tillmanns, C.: Data Mining für die Unternehmenspraxis : Entscheidungshilfen und Fallstudien mit führenden Softwarelösungen (2006) 0.01

0.008781821 = product of:
  0.03220001 = sum of:
    0.019311246 = weight(_text_:r in 1383) [ClassicSimilarity], result of:
      0.019311246 = score(doc=1383,freq=2.0), product of:
        0.088001914 = queryWeight, product of:
          3.3102584 = idf(docFreq=4387, maxDocs=44218)
          0.026584605 = queryNorm
        0.2194412 = fieldWeight in 1383, product of:
          1.4142135 = tf(freq=2.0), with freq of:
            2.0 = termFreq=2.0
          3.3102584 = idf(docFreq=4387, maxDocs=44218)
          0.046875 = fieldNorm(doc=1383)
    0.0020832212 = weight(_text_:s in 1383) [ClassicSimilarity], result of:
      0.0020832212 = score(doc=1383,freq=2.0), product of:
        0.028903782 = queryWeight, product of:
          1.0872376 = idf(docFreq=40523, maxDocs=44218)
          0.026584605 = queryNorm
        0.072074346 = fieldWeight in 1383, product of:
          1.4142135 = tf(freq=2.0), with freq of:
            2.0 = termFreq=2.0
          1.0872376 = idf(docFreq=40523, maxDocs=44218)
          0.046875 = fieldNorm(doc=1383)
    0.010805541 = product of:
      0.021611081 = sum of:
        0.021611081 = weight(_text_:22 in 1383) [ClassicSimilarity], result of:
          0.021611081 = score(doc=1383,freq=2.0), product of:
            0.09309476 = queryWeight, product of:
              3.5018296 = idf(docFreq=3622, maxDocs=44218)
              0.026584605 = queryNorm
            0.23214069 = fieldWeight in 1383, product of:
              1.4142135 = tf(freq=2.0), with freq of:
                2.0 = termFreq=2.0
              3.5018296 = idf(docFreq=3622, maxDocs=44218)
              0.046875 = fieldNorm(doc=1383)
      0.5 = coord(1/2)
  0.27272728 = coord(3/11)

Date: 22. 3.2008 14:46:06
Pages: 300 S

Baeza-Yates, R.; Hurtado, C.; Mendoza, M.: Improving search engines by query clustering (2007) 0.01

0.008298359 = product of:
  0.030427314 = sum of:
    0.005467103 = weight(_text_:a in 601) [ClassicSimilarity], result of:
      0.005467103 = score(doc=601,freq=8.0), product of:
        0.030653298 = queryWeight, product of:
          1.153047 = idf(docFreq=37942, maxDocs=44218)
          0.026584605 = queryNorm
        0.17835285 = fieldWeight in 601, product of:
          2.828427 = tf(freq=8.0), with freq of:
            8.0 = termFreq=8.0
          1.153047 = idf(docFreq=37942, maxDocs=44218)
          0.0546875 = fieldNorm(doc=601)
    0.022529786 = weight(_text_:r in 601) [ClassicSimilarity], result of:
      0.022529786 = score(doc=601,freq=2.0), product of:
        0.088001914 = queryWeight, product of:
          3.3102584 = idf(docFreq=4387, maxDocs=44218)
          0.026584605 = queryNorm
        0.25601473 = fieldWeight in 601, product of:
          1.4142135 = tf(freq=2.0), with freq of:
            2.0 = termFreq=2.0
          3.3102584 = idf(docFreq=4387, maxDocs=44218)
          0.0546875 = fieldNorm(doc=601)
    0.0024304248 = weight(_text_:s in 601) [ClassicSimilarity], result of:
      0.0024304248 = score(doc=601,freq=2.0), product of:
        0.028903782 = queryWeight, product of:
          1.0872376 = idf(docFreq=40523, maxDocs=44218)
          0.026584605 = queryNorm
        0.08408674 = fieldWeight in 601, product of:
          1.4142135 = tf(freq=2.0), with freq of:
            2.0 = termFreq=2.0
          1.0872376 = idf(docFreq=40523, maxDocs=44218)
          0.0546875 = fieldNorm(doc=601)
  0.27272728 = coord(3/11)

Abstract: In this paper, we present a framework for clustering Web search engine queries whose aim is to identify groups of queries used to search for similar information on the Web. The framework is based on a novel term vector model of queries that integrates user selections and the content of selected documents extracted from the logs of a search engine. The query representation obtained allows us to treat query clustering similarly to standard document clustering. We study the application of the clustering framework to two problems: relevance ranking boosting and query recommendation. Finally, we evaluate with experiments the effectiveness of our approach.
Source: Journal of the American Society for Information Science and Technology. 58(2007) no.12, S.1793-1804
Type: a

Data Mining im praktischen Einsatz : Verfahren und Anwendungsfälle für Marketing, Vertrieb, Controlling und Kundenunterstützung (2000) 0.01

0.0079424605 = product of:
  0.04368353 = sum of:
    0.00589224 = weight(_text_:s in 3425) [ClassicSimilarity], result of:
      0.00589224 = score(doc=3425,freq=4.0), product of:
        0.028903782 = queryWeight, product of:
          1.0872376 = idf(docFreq=40523, maxDocs=44218)
          0.026584605 = queryNorm
        0.20385705 = fieldWeight in 3425, product of:
          2.0 = tf(freq=4.0), with freq of:
            4.0 = termFreq=4.0
          1.0872376 = idf(docFreq=40523, maxDocs=44218)
          0.09375 = fieldNorm(doc=3425)
    0.03779129 = weight(_text_:u in 3425) [ClassicSimilarity], result of:
      0.03779129 = score(doc=3425,freq=2.0), product of:
        0.08704981 = queryWeight, product of:
          3.2744443 = idf(docFreq=4547, maxDocs=44218)
          0.026584605 = queryNorm
        0.43413407 = fieldWeight in 3425, product of:
          1.4142135 = tf(freq=2.0), with freq of:
            2.0 = termFreq=2.0
          3.2744443 = idf(docFreq=4547, maxDocs=44218)
          0.09375 = fieldNorm(doc=3425)
  0.18181819 = coord(2/11)

Editor: Alpar, P. u. I. Niedereichholz
Pages: VII, 230 S
Type: s

Pons-Porrata, A.; Berlanga-Llavori, R.; Ruiz-Shulcloper, J.: Topic discovery based on text mining techniques (2007) 0.01

0.007751891 = product of:
  0.0284236 = sum of:
    0.0070291325 = weight(_text_:a in 916) [ClassicSimilarity], result of:
      0.0070291325 = score(doc=916,freq=18.0), product of:
        0.030653298 = queryWeight, product of:
          1.153047 = idf(docFreq=37942, maxDocs=44218)
          0.026584605 = queryNorm
        0.22931081 = fieldWeight in 916, product of:
          4.2426405 = tf(freq=18.0), with freq of:
            18.0 = termFreq=18.0
          1.153047 = idf(docFreq=37942, maxDocs=44218)
          0.046875 = fieldNorm(doc=916)
    0.019311246 = weight(_text_:r in 916) [ClassicSimilarity], result of:
      0.019311246 = score(doc=916,freq=2.0), product of:
        0.088001914 = queryWeight, product of:
          3.3102584 = idf(docFreq=4387, maxDocs=44218)
          0.026584605 = queryNorm
        0.2194412 = fieldWeight in 916, product of:
          1.4142135 = tf(freq=2.0), with freq of:
            2.0 = termFreq=2.0
          3.3102584 = idf(docFreq=4387, maxDocs=44218)
          0.046875 = fieldNorm(doc=916)
    0.0020832212 = weight(_text_:s in 916) [ClassicSimilarity], result of:
      0.0020832212 = score(doc=916,freq=2.0), product of:
        0.028903782 = queryWeight, product of:
          1.0872376 = idf(docFreq=40523, maxDocs=44218)
          0.026584605 = queryNorm
        0.072074346 = fieldWeight in 916, product of:
          1.4142135 = tf(freq=2.0), with freq of:
            2.0 = termFreq=2.0
          1.0872376 = idf(docFreq=40523, maxDocs=44218)
          0.046875 = fieldNorm(doc=916)
  0.27272728 = coord(3/11)

Abstract: In this paper, we present a topic discovery system aimed to reveal the implicit knowledge present in news streams. This knowledge is expressed as a hierarchy of topic/subtopics, where each topic contains the set of documents that are related to it and a summary extracted from these documents. Summaries so built are useful to browse and select topics of interest from the generated hierarchies. Our proposal consists of a new incremental hierarchical clustering algorithm, which combines both partitional and agglomerative approaches, taking the main benefits from them. Finally, a new summarization method based on Testor Theory has been proposed to build the topic summaries. Experimental results in the TDT2 collection demonstrate its usefulness and effectiveness not only as a topic detection system, but also as a classification and summarization tool.
Source: Information processing and management. 43(2007) no.3, S.752-768
Type: a

Lischka, K.: Spurensuche im Datenwust : Data-Mining-Software fahndet nach kriminellen Mitarbeitern, guten Kunden - und bald vielleicht auch nach Terroristen (2002) 0.01
```
0.00702913 = product of:
  0.019330107 = sum of:
    0.0016567823 = weight(_text_:a in 1178) [ClassicSimilarity], result of:
      0.0016567823 = score(doc=1178,freq=4.0), product of:
        0.030653298 = queryWeight, product of:
          1.153047 = idf(docFreq=37942, maxDocs=44218)
          0.026584605 = queryNorm
        0.054049075 = fieldWeight in 1178, product of:
          2.0 = tf(freq=4.0), with freq of:
            4.0 = termFreq=4.0
          1.153047 = idf(docFreq=37942, maxDocs=44218)
          0.0234375 = fieldNorm(doc=1178)
    0.0010416106 = weight(_text_:s in 1178) [ClassicSimilarity], result of:
      0.0010416106 = score(doc=1178,freq=2.0), product of:
        0.028903782 = queryWeight, product of:
          1.0872376 = idf(docFreq=40523, maxDocs=44218)
          0.026584605 = queryNorm
        0.036037173 = fieldWeight in 1178, product of:
          1.4142135 = tf(freq=2.0), with freq of:
            2.0 = termFreq=2.0
          1.0872376 = idf(docFreq=40523, maxDocs=44218)
          0.0234375 = fieldNorm(doc=1178)
    0.011228944 = weight(_text_:k in 1178) [ClassicSimilarity], result of:
      0.011228944 = score(doc=1178,freq=2.0), product of:
        0.09490114 = queryWeight, product of:
          3.569778 = idf(docFreq=3384, maxDocs=44218)
          0.026584605 = queryNorm
        0.118322544 = fieldWeight in 1178, product of:
          1.4142135 = tf(freq=2.0), with freq of:
            2.0 = termFreq=2.0
          3.569778 = idf(docFreq=3384, maxDocs=44218)
          0.0234375 = fieldNorm(doc=1178)
    0.0054027704 = product of:
      0.010805541 = sum of:
        0.010805541 = weight(_text_:22 in 1178) [ClassicSimilarity], result of:
          0.010805541 = score(doc=1178,freq=2.0), product of:
            0.09309476 = queryWeight, product of:
              3.5018296 = idf(docFreq=3622, maxDocs=44218)
              0.026584605 = queryNorm
            0.116070345 = fieldWeight in 1178, product of:
              1.4142135 = tf(freq=2.0), with freq of:
                2.0 = termFreq=2.0
              3.5018296 = idf(docFreq=3622, maxDocs=44218)
              0.0234375 = fieldNorm(doc=1178)
      0.5 = coord(1/2)
  0.36363637 = coord(4/11)
```
Content

"Ob man als Terrorist einen Anschlag gegen die Vereinigten Staaten plant, als Kassierer Scheine aus der Kasse unterschlägt oder für bestimmte Produkte besonders gerne Geld ausgibt - einen Unterschied macht Data-Mining-Software da nicht. Solche Programme analysieren riesige Datenmengen und fällen statistische Urteile. Mit diesen Methoden wollen nun die Forscher des "Information Awareness Office" in den Vereinigten Staaten Spuren von Terroristen in den Datenbanken von Behörden und privaten Unternehmen wie Kreditkartenfirmen finden. 200 Millionen Dollar umfasst der Jahresetat für die verschiedenen Forschungsprojekte. Dass solche Software in der Praxis funktioniert, zeigen die steigenden Umsätze der Anbieter so genannter Customer-Relationship-Management-Software. Im vergangenen Jahr ist das Potenzial für analytische CRM-Anwendungen laut dem Marktforschungsinstitut IDC weltweit um 22 Prozent gewachsen, bis zum Jahr 2006 soll es in Deutschland mit einem jährlichen Plus von 14,1 Prozent so weitergehen. Und das trotz schwacher Konjunktur - oder gerade deswegen. Denn ähnlich wie Data-Mining der US-Regierung helfen soll, Terroristen zu finden, entscheiden CRM-Programme heute, welche Kunden für eine Firma profitabel sind. Und welche es künftig sein werden, wie Manuela Schnaubelt, Sprecherin des CRM-Anbieters SAP, beschreibt: "Die Kundenbewertung ist ein zentraler Bestandteil des analytischen CRM. Sie ermöglicht es Unternehmen, sich auf die für sie wichtigen und richtigen Kunden zu fokussieren. Darüber hinaus können Firmen mit speziellen Scoring-Verfahren ermitteln, welche Kunden langfristig in welchem Maße zum Unternehmenserfolg beitragen." Die Folgen der Bewertungen sind für die Betroffenen nicht immer positiv: Attraktive Kunden profitieren von individuellen Sonderangeboten und besonderer Zuwendung. Andere hängen vielleicht so lange in der Warteschleife des Telefonservice, bis die profitableren Kunden abgearbeitet sind.
So könnte eine praktische Umsetzung dessen aussehen, was SAP-Sprecherin Schnaubelt abstrakt beschreibt: "In vielen Unternehmen wird Kundenbewertung mit der klassischen ABC-Analyse durchgeführt, bei der Kunden anhand von Daten wie dem Umsatz kategorisiert werden. A-Kunden als besonders wichtige Kunden werden anders betreut als C-Kunden." Noch näher am geplanten Einsatz von Data-Mining zur Terroristenjagd ist eine Anwendung, die heute viele Firmen erfolgreich nutzen: Sie spüren betrügende Mitarbeiter auf. Werner Sülzer vom großen CRM-Anbieter NCR Teradata beschreibt die Möglichkeiten so: "Heute hinterlässt praktisch jeder Täter - ob Mitarbeiter, Kunde oder Lieferant - Datenspuren bei seinen wirtschaftskriminellen Handlungen. Es muss vorrangig darum gehen, einzelne Spuren zu Handlungsmustern und Täterprofilen zu verdichten. Das gelingt mittels zentraler Datenlager und hoch entwickelter Such- und Analyseinstrumente." Von konkreten Erfolgen - sprich: Entlassungen krimineller Mitarbeiter - nach Einsatz solcher Programme erzählen Unternehmen nicht gerne. Matthias Wilke von der "Beratungsstelle für Technologiefolgen und Qualifizierung" (BTQ) der Gewerkschaft Verdi weiß von einem Fall aus der Schweiz. Dort setzt die Handelskette "Pick Pay" das Programm "Lord Lose Prevention" ein. Zwei Monate nach Einführung seien Unterschlagungen im Wert von etwa 200 000 Franken ermittelt worden. Das kostete mehr als 50 verdächtige Kassiererinnen und Kassierer den Job.

Source

Frankfurter Rundschau. Nr.275 vom 26.11.2002, S.11

Type

a

Kantardzic, M.: Data mining : concepts, models, methods, and algorithms (2003) 0.01
```
0.0070053744 = product of:
  0.025686372 = sum of:
    0.0031240587 = weight(_text_:a in 2291) [ClassicSimilarity], result of:
      0.0031240587 = score(doc=2291,freq=8.0), product of:
        0.030653298 = queryWeight, product of:
          1.153047 = idf(docFreq=37942, maxDocs=44218)
          0.026584605 = queryNorm
        0.10191591 = fieldWeight in 2291, product of:
          2.828427 = tf(freq=8.0), with freq of:
            8.0 = termFreq=8.0
          1.153047 = idf(docFreq=37942, maxDocs=44218)
          0.03125 = fieldNorm(doc=2291)
    0.0013888142 = weight(_text_:s in 2291) [ClassicSimilarity], result of:
      0.0013888142 = score(doc=2291,freq=2.0), product of:
        0.028903782 = queryWeight, product of:
          1.0872376 = idf(docFreq=40523, maxDocs=44218)
          0.026584605 = queryNorm
        0.048049565 = fieldWeight in 2291, product of:
          1.4142135 = tf(freq=2.0), with freq of:
            2.0 = termFreq=2.0
          1.0872376 = idf(docFreq=40523, maxDocs=44218)
          0.03125 = fieldNorm(doc=2291)
    0.0211735 = weight(_text_:k in 2291) [ClassicSimilarity], result of:
      0.0211735 = score(doc=2291,freq=4.0), product of:
        0.09490114 = queryWeight, product of:
          3.569778 = idf(docFreq=3384, maxDocs=44218)
          0.026584605 = queryNorm
        0.22311112 = fieldWeight in 2291, product of:
          2.0 = tf(freq=4.0), with freq of:
            4.0 = termFreq=4.0
          3.569778 = idf(docFreq=3384, maxDocs=44218)
          0.03125 = fieldNorm(doc=2291)
  0.27272728 = coord(3/11)
```
Abstract

This book offers a comprehensive introduction to the exploding field of data mining. We are surrounded by data, numerical and otherwise, which must be analyzed and processed to convert it into information that informs, instructs, answers, or otherwise aids understanding and decision-making. Due to the ever-increasing complexity and size of today's data sets, a new term, data mining, was created to describe the indirect, automatic data analysis techniques that utilize more complex and sophisticated tools than those which analysts used in the past to do mere data analysis. "Data Mining: Concepts, Models, Methods, and Algorithms" discusses data mining principles and then describes representative state-of-the-art methods and algorithms originating from different disciplines such as statistics, machine learning, neural networks, fuzzy logic, and evolutionary computation. Detailed algorithms are provided with necessary explanations and illustrative examples. This text offers guidance: how and when to use a particular software tool (with their companion data sets) from among the hundreds offered when faced with a data set to mine. This allows analysts to create and perform their own data mining experiments using their knowledge of the methodologies and techniques provided. This book emphasizes the selection of appropriate methodologies and data analysis software, as well as parameter tuning. These critically important, qualitative decisions can only be made with the deeper understanding of parameter meaning and its role in the technique that is offered here. Data mining is an exploding field and this book offers much-needed guidance to selecting among the numerous analysis programs that are available.

Classification

PZY (FH K)

GHBS

PZY (FH K)

Pages

XII, 345 S

Klein, H.: Web Content Mining (2004) 0.01

0.006972335 = product of:
  0.01917392 = sum of:
    0.0036259806 = product of:
      0.007251961 = sum of:
        0.007251961 = weight(_text_:h in 3154) [ClassicSimilarity], result of:
          0.007251961 = score(doc=3154,freq=2.0), product of:
            0.0660481 = queryWeight, product of:
              2.4844491 = idf(docFreq=10020, maxDocs=44218)
              0.026584605 = queryNorm
            0.10979818 = fieldWeight in 3154, product of:
              1.4142135 = tf(freq=2.0), with freq of:
                2.0 = termFreq=2.0
              2.4844491 = idf(docFreq=10020, maxDocs=44218)
              0.03125 = fieldNorm(doc=3154)
      0.5 = coord(1/2)
    0.0015620294 = weight(_text_:a in 3154) [ClassicSimilarity], result of:
      0.0015620294 = score(doc=3154,freq=2.0), product of:
        0.030653298 = queryWeight, product of:
          1.153047 = idf(docFreq=37942, maxDocs=44218)
          0.026584605 = queryNorm
        0.050957955 = fieldWeight in 3154, product of:
          1.4142135 = tf(freq=2.0), with freq of:
            2.0 = termFreq=2.0
          1.153047 = idf(docFreq=37942, maxDocs=44218)
          0.03125 = fieldNorm(doc=3154)
    0.0013888142 = weight(_text_:s in 3154) [ClassicSimilarity], result of:
      0.0013888142 = score(doc=3154,freq=2.0), product of:
        0.028903782 = queryWeight, product of:
          1.0872376 = idf(docFreq=40523, maxDocs=44218)
          0.026584605 = queryNorm
        0.048049565 = fieldWeight in 3154, product of:
          1.4142135 = tf(freq=2.0), with freq of:
            2.0 = termFreq=2.0
          1.0872376 = idf(docFreq=40523, maxDocs=44218)
          0.03125 = fieldNorm(doc=3154)
    0.012597097 = weight(_text_:u in 3154) [ClassicSimilarity], result of:
      0.012597097 = score(doc=3154,freq=2.0), product of:
        0.08704981 = queryWeight, product of:
          3.2744443 = idf(docFreq=4547, maxDocs=44218)
          0.026584605 = queryNorm
        0.14471136 = fieldWeight in 3154, product of:
          1.4142135 = tf(freq=2.0), with freq of:
            2.0 = termFreq=2.0
          3.2744443 = idf(docFreq=4547, maxDocs=44218)
          0.03125 = fieldNorm(doc=3154)
  0.36363637 = coord(4/11)

Pages: S.217-221
Source: Wissensorganisation und Edutainment: Wissen im Spannungsfeld von Gesellschaft, Gestaltung und Industrie. Proceedings der 7. Tagung der Deutschen Sektion der Internationalen Gesellschaft für Wissensorganisation, Berlin, 21.-23.3.2001. Hrsg.: C. Lehner, H.P. Ohly u. G. Rahmstorf
Type: a

Liu, Y.; Zhang, M.; Cen, R.; Ru, L.; Ma, S.: Data cleansing for Web information retrieval using query independent features (2007) 0.01
```
0.0066560227 = product of:
  0.024405416 = sum of:
    0.0058576106 = weight(_text_:a in 607) [ClassicSimilarity], result of:
      0.0058576106 = score(doc=607,freq=18.0), product of:
        0.030653298 = queryWeight, product of:
          1.153047 = idf(docFreq=37942, maxDocs=44218)
          0.026584605 = queryNorm
        0.19109234 = fieldWeight in 607, product of:
          4.2426405 = tf(freq=18.0), with freq of:
            18.0 = termFreq=18.0
          1.153047 = idf(docFreq=37942, maxDocs=44218)
          0.0390625 = fieldNorm(doc=607)
    0.016092705 = weight(_text_:r in 607) [ClassicSimilarity], result of:
      0.016092705 = score(doc=607,freq=2.0), product of:
        0.088001914 = queryWeight, product of:
          3.3102584 = idf(docFreq=4387, maxDocs=44218)
          0.026584605 = queryNorm
        0.18286766 = fieldWeight in 607, product of:
          1.4142135 = tf(freq=2.0), with freq of:
            2.0 = termFreq=2.0
          3.3102584 = idf(docFreq=4387, maxDocs=44218)
          0.0390625 = fieldNorm(doc=607)
    0.0024550997 = weight(_text_:s in 607) [ClassicSimilarity], result of:
      0.0024550997 = score(doc=607,freq=4.0), product of:
        0.028903782 = queryWeight, product of:
          1.0872376 = idf(docFreq=40523, maxDocs=44218)
          0.026584605 = queryNorm
        0.08494043 = fieldWeight in 607, product of:
          2.0 = tf(freq=4.0), with freq of:
            4.0 = termFreq=4.0
          1.0872376 = idf(docFreq=40523, maxDocs=44218)
          0.0390625 = fieldNorm(doc=607)
  0.27272728 = coord(3/11)
```
Abstract

Understanding what kinds of Web pages are the most useful for Web search engine users is a critical task in Web information retrieval (IR). Most previous works used hyperlink analysis algorithms to solve this problem. However, little research has been focused on query-independent Web data cleansing for Web IR. In this paper, we first provide analysis of the differences between retrieval target pages and ordinary ones based on more than 30 million Web pages obtained from both the Text Retrieval Conference (TREC) and a widely used Chinese search engine, SOGOU (www.sogou.com). We further propose a learning-based data cleansing algorithm for reducing Web pages that are unlikely to be useful for user requests. We found that there exists a large proportion of low-quality Web pages in both the English and the Chinese Web page corpus, and retrieval target pages can be identified using query-independent features and cleansing algorithms. The experimental results showed that our algorithm is effective in reducing a large portion of Web pages with a small loss in retrieval target pages. It makes it possible for Web IR tools to meet a large fraction of users' needs with only a small part of pages on the Web. These results may help Web search engines make better use of their limited storage and computation resources to improve search performance.

Source

Journal of the American Society for Information Science and Technology. 58(2007) no.12, S.1884-1898

Type

a

Medien-Informationsmanagement : Archivarische, dokumentarische, betriebswirtschaftliche, rechtliche und Berufsbild-Aspekte ; [Frühjahrstagung der Fachgruppe 7 im Jahr 2000 in Weimar und Folgetagung 2001 in Köln] (2003) 0.01

0.0062061697 = product of:
  0.022755954 = sum of:
    0.00147306 = weight(_text_:s in 1833) [ClassicSimilarity], result of:
      0.00147306 = score(doc=1833,freq=4.0), product of:
        0.028903782 = queryWeight, product of:
          1.0872376 = idf(docFreq=40523, maxDocs=44218)
          0.026584605 = queryNorm
        0.050964262 = fieldWeight in 1833, product of:
          2.0 = tf(freq=4.0), with freq of:
            4.0 = termFreq=4.0
          1.0872376 = idf(docFreq=40523, maxDocs=44218)
          0.0234375 = fieldNorm(doc=1833)
    0.015880125 = weight(_text_:k in 1833) [ClassicSimilarity], result of:
      0.015880125 = score(doc=1833,freq=4.0), product of:
        0.09490114 = queryWeight, product of:
          3.569778 = idf(docFreq=3384, maxDocs=44218)
          0.026584605 = queryNorm
        0.16733333 = fieldWeight in 1833, product of:
          2.0 = tf(freq=4.0), with freq of:
            4.0 = termFreq=4.0
          3.569778 = idf(docFreq=3384, maxDocs=44218)
          0.0234375 = fieldNorm(doc=1833)
    0.0054027704 = product of:
      0.010805541 = sum of:
        0.010805541 = weight(_text_:22 in 1833) [ClassicSimilarity], result of:
          0.010805541 = score(doc=1833,freq=2.0), product of:
            0.09309476 = queryWeight, product of:
              3.5018296 = idf(docFreq=3622, maxDocs=44218)
              0.026584605 = queryNorm
            0.116070345 = fieldWeight in 1833, product of:
              1.4142135 = tf(freq=2.0), with freq of:
                2.0 = termFreq=2.0
              3.5018296 = idf(docFreq=3622, maxDocs=44218)
              0.0234375 = fieldNorm(doc=1833)
      0.5 = coord(1/2)
  0.27272728 = coord(3/11)

Classification: BAQC (FH K)
Date: 11. 5.2008 19:49:22
GHBS: BAQC (FH K)
Pages: 276 S
Type: s

Search (76 results, page 1 of 4)

Authors

Languages

Types

Themes

Subjects

Classifications