Document (#37403)

Author
Glaesener, L.
Title
Automatisches Indexieren einer informationswissenschaftlichen Datenbank mit Mehrwortgruppen
Imprint
Köln : Fachhochschule / Fakultät für Informations- und Kommunikationswissenschaften
Year
2012
Pages
III, 34, VII S
Abstract
Ein Bericht über die Ergebnisse und die Prozessanalyse einer automatischen Indexierung mit Mehrwortgruppen. Diese Bachelorarbeit beschreibt, inwieweit der Inhalt informationswissenschaftlicher Fachtexte durch informationswissenschaftliches Fachvokabular erschlossen werden kann und sollte und dass in diesen wissenschaftlichen Texten ein Großteil der fachlichen Inhalte in Mehrwortgruppen vorkommt. Die Ergebnisse wurden durch eine automatische Indexierung mit Mehrwortgruppen mithilfe des Programms Lingo an einer informationswissenschaftlichen Datenbank ermittelt.
Content
Bachelorarbeit im Studiengang Bibliothekswesen der Fakultät für Informations- und Kommunikationswissenschaften an der Fachhochschule Köln.
Theme
Automatisches Indexieren

Similar documents (content)

  1. Bredack, J.: Terminologieextraktion von Mehrwortgruppen in kunsthistorischen Fachtexten (2013) 0.36
    0.36152261 = sum of:
      0.36152261 = product of:
        1.2911522 = sum of:
          0.023089679 = weight(abstract_txt:inhalt in 3055) [ClassicSimilarity], result of:
            0.023089679 = score(doc=3055,freq=1.0), product of:
              0.08756669 = queryWeight, product of:
                1.0790504 = boost
                6.7502356 = idf(docFreq=135, maxDocs=42740)
                0.012022043 = queryNorm
              0.26368108 = fieldWeight in 3055, product of:
                1.0 = tf(freq=1.0), with freq of:
                  1.0 = termFreq=1.0
                6.7502356 = idf(docFreq=135, maxDocs=42740)
                0.0390625 = fieldNorm(doc=3055)
          0.028826037 = weight(abstract_txt:texten in 3055) [ClassicSimilarity], result of:
            0.028826037 = score(doc=3055,freq=1.0), product of:
              0.10152749 = queryWeight, product of:
                1.1618875 = boost
                7.268441 = idf(docFreq=80, maxDocs=42740)
                0.012022043 = queryNorm
              0.28392348 = fieldWeight in 3055, product of:
                1.0 = tf(freq=1.0), with freq of:
                  1.0 = termFreq=1.0
                7.268441 = idf(docFreq=80, maxDocs=42740)
                0.0390625 = fieldNorm(doc=3055)
          0.016512034 = weight(abstract_txt:durch in 3055) [ClassicSimilarity], result of:
            0.016512034 = score(doc=3055,freq=2.0), product of:
              0.07002623 = queryWeight, product of:
                1.3646386 = boost
                4.2683973 = idf(docFreq=1626, maxDocs=42740)
                0.012022043 = queryNorm
              0.23579785 = fieldWeight in 3055, product of:
                1.4142135 = tf(freq=2.0), with freq of:
                  2.0 = termFreq=2.0
                4.2683973 = idf(docFreq=1626, maxDocs=42740)
                0.0390625 = fieldNorm(doc=3055)
          0.11607349 = weight(abstract_txt:lingo in 3055) [ClassicSimilarity], result of:
            0.11607349 = score(doc=3055,freq=4.0), product of:
              0.16188093 = queryWeight, product of:
                1.4671351 = boost
                9.177984 = idf(docFreq=11, maxDocs=42740)
                0.012022043 = queryNorm
              0.71703005 = fieldWeight in 3055, product of:
                2.0 = tf(freq=4.0), with freq of:
                  4.0 = termFreq=4.0
                9.177984 = idf(docFreq=11, maxDocs=42740)
                0.0390625 = fieldNorm(doc=3055)
          0.035439998 = weight(abstract_txt:ergebnisse in 3055) [ClassicSimilarity], result of:
            0.035439998 = score(doc=3055,freq=2.0), product of:
              0.116517045 = queryWeight, product of:
                1.760281 = boost
                5.5059114 = idf(docFreq=471, maxDocs=42740)
                0.012022043 = queryNorm
              0.3041615 = fieldWeight in 3055, product of:
                1.4142135 = tf(freq=2.0), with freq of:
                  2.0 = termFreq=2.0
                5.5059114 = idf(docFreq=471, maxDocs=42740)
                0.0390625 = fieldNorm(doc=3055)
          0.029868783 = weight(abstract_txt:einer in 3055) [ClassicSimilarity], result of:
            0.029868783 = score(doc=3055,freq=5.0), product of:
              0.087684415 = queryWeight, product of:
                1.870226 = boost
                3.8998692 = idf(docFreq=2351, maxDocs=42740)
                0.012022043 = queryNorm
              0.3406396 = fieldWeight in 3055, product of:
                2.236068 = tf(freq=5.0), with freq of:
                  5.0 = termFreq=5.0
                3.8998692 = idf(docFreq=2351, maxDocs=42740)
                0.0390625 = fieldNorm(doc=3055)
          1.0413423 = weight(abstract_txt:mehrwortgruppen in 3055) [ClassicSimilarity], result of:
            1.0413423 = score(doc=3055,freq=13.0), product of:
              0.7490225 = queryWeight, product of:
                6.3117485 = boost
                9.871131 = idf(docFreq=5, maxDocs=42740)
                0.012022043 = queryNorm
              1.3902683 = fieldWeight in 3055, product of:
                3.6055512 = tf(freq=13.0), with freq of:
                  13.0 = termFreq=13.0
                9.871131 = idf(docFreq=5, maxDocs=42740)
                0.0390625 = fieldNorm(doc=3055)
        0.28 = coord(7/25)
    
  2. Bredack, J.; Lepsky, K.: Automatische Extraktion von Fachterminologie aus Volltexten (2014) 0.31
    0.30543193 = sum of:
      0.30543193 = product of:
        1.5271597 = sum of:
          0.07012178 = weight(abstract_txt:automatische in 1873) [ClassicSimilarity], result of:
            0.07012178 = score(doc=1873,freq=1.0), product of:
              0.09243935 = queryWeight, product of:
                1.108666 = boost
                6.9355025 = idf(docFreq=112, maxDocs=42740)
                0.012022043 = queryNorm
              0.7585706 = fieldWeight in 1873, product of:
                1.0 = tf(freq=1.0), with freq of:
                  1.0 = termFreq=1.0
                6.9355025 = idf(docFreq=112, maxDocs=42740)
                0.109375 = fieldNorm(doc=1873)
          0.08071291 = weight(abstract_txt:texten in 1873) [ClassicSimilarity], result of:
            0.08071291 = score(doc=1873,freq=1.0), product of:
              0.10152749 = queryWeight, product of:
                1.1618875 = boost
                7.268441 = idf(docFreq=80, maxDocs=42740)
                0.012022043 = queryNorm
              0.7949858 = fieldWeight in 1873, product of:
                1.0 = tf(freq=1.0), with freq of:
                  1.0 = termFreq=1.0
                7.268441 = idf(docFreq=80, maxDocs=42740)
                0.109375 = fieldNorm(doc=1873)
          0.16250287 = weight(abstract_txt:lingo in 1873) [ClassicSimilarity], result of:
            0.16250287 = score(doc=1873,freq=1.0), product of:
              0.16188093 = queryWeight, product of:
                1.4671351 = boost
                9.177984 = idf(docFreq=11, maxDocs=42740)
                0.012022043 = queryNorm
              1.003842 = fieldWeight in 1873, product of:
                1.0 = tf(freq=1.0), with freq of:
                  1.0 = termFreq=1.0
                9.177984 = idf(docFreq=11, maxDocs=42740)
                0.109375 = fieldNorm(doc=1873)
          0.070167616 = weight(abstract_txt:ergebnisse in 1873) [ClassicSimilarity], result of:
            0.070167616 = score(doc=1873,freq=1.0), product of:
              0.116517045 = queryWeight, product of:
                1.760281 = boost
                5.5059114 = idf(docFreq=471, maxDocs=42740)
                0.012022043 = queryNorm
              0.60220903 = fieldWeight in 1873, product of:
                1.0 = tf(freq=1.0), with freq of:
                  1.0 = termFreq=1.0
                5.5059114 = idf(docFreq=471, maxDocs=42740)
                0.109375 = fieldNorm(doc=1873)
          1.1436545 = weight(abstract_txt:mehrwortgruppen in 1873) [ClassicSimilarity], result of:
            1.1436545 = score(doc=1873,freq=2.0), product of:
              0.7490225 = queryWeight, product of:
                6.3117485 = boost
                9.871131 = idf(docFreq=5, maxDocs=42740)
                0.012022043 = queryNorm
              1.5268626 = fieldWeight in 1873, product of:
                1.4142135 = tf(freq=2.0), with freq of:
                  2.0 = termFreq=2.0
                9.871131 = idf(docFreq=5, maxDocs=42740)
                0.109375 = fieldNorm(doc=1873)
        0.2 = coord(5/25)
    
  3. Oberhauser, O.: Automatisches Klassifizieren : Entwicklungsstand - Methodik - Anwendungsbereiche (2005) 0.24
    0.23861139 = sum of:
      0.23861139 = product of:
        0.8521835 = sum of:
          0.06831448 = weight(abstract_txt:automatischen in 1164) [ClassicSimilarity], result of:
            0.06831448 = score(doc=1164,freq=4.0), product of:
              0.09084412 = queryWeight, product of:
                1.0990582 = boost
                6.8753986 = idf(docFreq=119, maxDocs=42740)
                0.012022043 = queryNorm
              0.75199676 = fieldWeight in 1164, product of:
                2.0 = tf(freq=4.0), with freq of:
                  4.0 = termFreq=4.0
                6.8753986 = idf(docFreq=119, maxDocs=42740)
                0.0546875 = fieldNorm(doc=1164)
          0.03506089 = weight(abstract_txt:automatische in 1164) [ClassicSimilarity], result of:
            0.03506089 = score(doc=1164,freq=1.0), product of:
              0.09243935 = queryWeight, product of:
                1.108666 = boost
                6.9355025 = idf(docFreq=112, maxDocs=42740)
                0.012022043 = queryNorm
              0.3792853 = fieldWeight in 1164, product of:
                1.0 = tf(freq=1.0), with freq of:
                  1.0 = termFreq=1.0
                6.9355025 = idf(docFreq=112, maxDocs=42740)
                0.0546875 = fieldNorm(doc=1164)
          0.040356454 = weight(abstract_txt:texten in 1164) [ClassicSimilarity], result of:
            0.040356454 = score(doc=1164,freq=1.0), product of:
              0.10152749 = queryWeight, product of:
                1.1618875 = boost
                7.268441 = idf(docFreq=80, maxDocs=42740)
                0.012022043 = queryNorm
              0.3974929 = fieldWeight in 1164, product of:
                1.0 = tf(freq=1.0), with freq of:
                  1.0 = termFreq=1.0
                7.268441 = idf(docFreq=80, maxDocs=42740)
                0.0546875 = fieldNorm(doc=1164)
          0.05096022 = weight(abstract_txt:mithilfe in 1164) [ClassicSimilarity], result of:
            0.05096022 = score(doc=1164,freq=1.0), product of:
              0.11861215 = queryWeight, product of:
                1.2558473 = boost
                7.856228 = idf(docFreq=44, maxDocs=42740)
                0.012022043 = queryNorm
              0.42963746 = fieldWeight in 1164, product of:
                1.0 = tf(freq=1.0), with freq of:
                  1.0 = termFreq=1.0
                7.856228 = idf(docFreq=44, maxDocs=42740)
                0.0546875 = fieldNorm(doc=1164)
          0.01634608 = weight(abstract_txt:durch in 1164) [ClassicSimilarity], result of:
            0.01634608 = score(doc=1164,freq=1.0), product of:
              0.07002623 = queryWeight, product of:
                1.3646386 = boost
                4.2683973 = idf(docFreq=1626, maxDocs=42740)
                0.012022043 = queryNorm
              0.23342797 = fieldWeight in 1164, product of:
                1.0 = tf(freq=1.0), with freq of:
                  1.0 = termFreq=1.0
                4.2683973 = idf(docFreq=1626, maxDocs=42740)
                0.0546875 = fieldNorm(doc=1164)
          0.6037438 = weight(title_txt:automatisches in 1164) [ClassicSimilarity], result of:
            0.6037438 = score(doc=1164,freq=1.0), product of:
              0.15410501 = queryWeight, product of:
                1.4314647 = boost
                8.954841 = idf(docFreq=14, maxDocs=42740)
                0.012022043 = queryNorm
              3.9177427 = fieldWeight in 1164, product of:
                1.0 = tf(freq=1.0), with freq of:
                  1.0 = termFreq=1.0
                8.954841 = idf(docFreq=14, maxDocs=42740)
                0.4375 = fieldNorm(doc=1164)
          0.037401628 = weight(abstract_txt:einer in 1164) [ClassicSimilarity], result of:
            0.037401628 = score(doc=1164,freq=4.0), product of:
              0.087684415 = queryWeight, product of:
                1.870226 = boost
                3.8998692 = idf(docFreq=2351, maxDocs=42740)
                0.012022043 = queryNorm
              0.42654818 = fieldWeight in 1164, product of:
                2.0 = tf(freq=4.0), with freq of:
                  4.0 = termFreq=4.0
                3.8998692 = idf(docFreq=2351, maxDocs=42740)
                0.0546875 = fieldNorm(doc=1164)
        0.28 = coord(7/25)
    
  4. Grün, S.: Bildung von Komposita-Indextermen auf der Basis einer algorithmischen Mehrwortgruppenanalyse mit Lingo (2015) 0.22
    0.22218181 = sum of:
      0.22218181 = product of:
        1.3886364 = sum of:
          0.0768514 = weight(abstract_txt:großteil in 2336) [ClassicSimilarity], result of:
            0.0768514 = score(doc=2336,freq=1.0), product of:
              0.12297255 = queryWeight, product of:
                1.2787226 = boost
                7.999329 = idf(docFreq=38, maxDocs=42740)
                0.012022043 = queryNorm
              0.6249476 = fieldWeight in 2336, product of:
                1.0 = tf(freq=1.0), with freq of:
                  1.0 = termFreq=1.0
                7.999329 = idf(docFreq=38, maxDocs=42740)
                0.078125 = fieldNorm(doc=2336)
          0.040446058 = weight(abstract_txt:durch in 2336) [ClassicSimilarity], result of:
            0.040446058 = score(doc=2336,freq=3.0), product of:
              0.07002623 = queryWeight, product of:
                1.3646386 = boost
                4.2683973 = idf(docFreq=1626, maxDocs=42740)
                0.012022043 = queryNorm
              0.57758445 = fieldWeight in 2336, product of:
                1.7320508 = tf(freq=3.0), with freq of:
                  3.0 = termFreq=3.0
                4.2683973 = idf(docFreq=1626, maxDocs=42740)
                0.078125 = fieldNorm(doc=2336)
          0.11607349 = weight(abstract_txt:lingo in 2336) [ClassicSimilarity], result of:
            0.11607349 = score(doc=2336,freq=1.0), product of:
              0.16188093 = queryWeight, product of:
                1.4671351 = boost
                9.177984 = idf(docFreq=11, maxDocs=42740)
                0.012022043 = queryNorm
              0.71703005 = fieldWeight in 2336, product of:
                1.0 = tf(freq=1.0), with freq of:
                  1.0 = termFreq=1.0
                9.177984 = idf(docFreq=11, maxDocs=42740)
                0.078125 = fieldNorm(doc=2336)
          1.1552655 = weight(abstract_txt:mehrwortgruppen in 2336) [ClassicSimilarity], result of:
            1.1552655 = score(doc=2336,freq=4.0), product of:
              0.7490225 = queryWeight, product of:
                6.3117485 = boost
                9.871131 = idf(docFreq=5, maxDocs=42740)
                0.012022043 = queryNorm
              1.5423642 = fieldWeight in 2336, product of:
                2.0 = tf(freq=4.0), with freq of:
                  4.0 = termFreq=4.0
                9.871131 = idf(docFreq=5, maxDocs=42740)
                0.078125 = fieldNorm(doc=2336)
        0.16 = coord(4/25)
    
  5. Oberhauser, O.: Automatisches Klassifizieren : Verfahren zur Erschließung elektronischer Dokumente (2004) 0.21
    0.21446164 = sum of:
      0.21446164 = product of:
        0.7659344 = sum of:
          0.06831448 = weight(abstract_txt:automatischen in 3488) [ClassicSimilarity], result of:
            0.06831448 = score(doc=3488,freq=4.0), product of:
              0.09084412 = queryWeight, product of:
                1.0990582 = boost
                6.8753986 = idf(docFreq=119, maxDocs=42740)
                0.012022043 = queryNorm
              0.75199676 = fieldWeight in 3488, product of:
                2.0 = tf(freq=4.0), with freq of:
                  4.0 = termFreq=4.0
                6.8753986 = idf(docFreq=119, maxDocs=42740)
                0.0546875 = fieldNorm(doc=3488)
          0.03506089 = weight(abstract_txt:automatische in 3488) [ClassicSimilarity], result of:
            0.03506089 = score(doc=3488,freq=1.0), product of:
              0.09243935 = queryWeight, product of:
                1.108666 = boost
                6.9355025 = idf(docFreq=112, maxDocs=42740)
                0.012022043 = queryNorm
              0.3792853 = fieldWeight in 3488, product of:
                1.0 = tf(freq=1.0), with freq of:
                  1.0 = termFreq=1.0
                6.9355025 = idf(docFreq=112, maxDocs=42740)
                0.0546875 = fieldNorm(doc=3488)
          0.040356454 = weight(abstract_txt:texten in 3488) [ClassicSimilarity], result of:
            0.040356454 = score(doc=3488,freq=1.0), product of:
              0.10152749 = queryWeight, product of:
                1.1618875 = boost
                7.268441 = idf(docFreq=80, maxDocs=42740)
                0.012022043 = queryNorm
              0.3974929 = fieldWeight in 3488, product of:
                1.0 = tf(freq=1.0), with freq of:
                  1.0 = termFreq=1.0
                7.268441 = idf(docFreq=80, maxDocs=42740)
                0.0546875 = fieldNorm(doc=3488)
          0.05096022 = weight(abstract_txt:mithilfe in 3488) [ClassicSimilarity], result of:
            0.05096022 = score(doc=3488,freq=1.0), product of:
              0.11861215 = queryWeight, product of:
                1.2558473 = boost
                7.856228 = idf(docFreq=44, maxDocs=42740)
                0.012022043 = queryNorm
              0.42963746 = fieldWeight in 3488, product of:
                1.0 = tf(freq=1.0), with freq of:
                  1.0 = termFreq=1.0
                7.856228 = idf(docFreq=44, maxDocs=42740)
                0.0546875 = fieldNorm(doc=3488)
          0.01634608 = weight(abstract_txt:durch in 3488) [ClassicSimilarity], result of:
            0.01634608 = score(doc=3488,freq=1.0), product of:
              0.07002623 = queryWeight, product of:
                1.3646386 = boost
                4.2683973 = idf(docFreq=1626, maxDocs=42740)
                0.012022043 = queryNorm
              0.23342797 = fieldWeight in 3488, product of:
                1.0 = tf(freq=1.0), with freq of:
                  1.0 = termFreq=1.0
                4.2683973 = idf(docFreq=1626, maxDocs=42740)
                0.0546875 = fieldNorm(doc=3488)
          0.5174947 = weight(title_txt:automatisches in 3488) [ClassicSimilarity], result of:
            0.5174947 = score(doc=3488,freq=1.0), product of:
              0.15410501 = queryWeight, product of:
                1.4314647 = boost
                8.954841 = idf(docFreq=14, maxDocs=42740)
                0.012022043 = queryNorm
              3.3580651 = fieldWeight in 3488, product of:
                1.0 = tf(freq=1.0), with freq of:
                  1.0 = termFreq=1.0
                8.954841 = idf(docFreq=14, maxDocs=42740)
                0.375 = fieldNorm(doc=3488)
          0.037401628 = weight(abstract_txt:einer in 3488) [ClassicSimilarity], result of:
            0.037401628 = score(doc=3488,freq=4.0), product of:
              0.087684415 = queryWeight, product of:
                1.870226 = boost
                3.8998692 = idf(docFreq=2351, maxDocs=42740)
                0.012022043 = queryNorm
              0.42654818 = fieldWeight in 3488, product of:
                2.0 = tf(freq=4.0), with freq of:
                  4.0 = termFreq=4.0
                3.8998692 = idf(docFreq=2351, maxDocs=42740)
                0.0546875 = fieldNorm(doc=3488)
        0.28 = coord(7/25)