Document (#36841)

Author
Mehler, A.
Waltinger, U.
Title
Automatic enrichment of metadata
Source
http://conference.ub.uni-bielefeld.de/2009/programme/
Year
2009
Abstract
In this talk we present a retrieval model based on social ontologies. More specifically, we utilize the Wikipedia category system in order to perform semantic searches. That is, textual input is used to build queries by means of which documents are retrieved which do not necessarily contain any query term but are semantically related to the input text by virtue of their content. We present a desktop which utilizes this search facility in a web-based environment - the so-called eHumanities Desktop.
Content
Vortrag, anlässlich der 9. Internationalen Bielefeld-Konferenz 2009, 3. - 5. Februar 2009.
Theme
Semantic Web
Metadaten
Object
Wikipedia

Similar documents (content)

  1. Agarwal, B.; Ramampiaro, H.; Langseth, H.; Ruocco, M.: ¬A deep network model for paraphrase detection in short text messages (2018) 0.16
    0.16185442 = sum of:
      0.16185442 = product of:
        0.50579506 = sum of:
          0.03797933 = weight(abstract_txt:called in 5043) [ClassicSimilarity], result of:
            0.03797933 = score(doc=5043,freq=1.0), product of:
              0.11461943 = queryWeight, product of:
                1.0204073 = boost
                5.3016257 = idf(docFreq=598, maxDocs=44218)
                0.0211873 = queryNorm
              0.3313516 = fieldWeight in 5043, product of:
                1.0 = tf(freq=1.0), with freq of:
                  1.0 = termFreq=1.0
                5.3016257 = idf(docFreq=598, maxDocs=44218)
                0.0625 = fieldNorm(doc=5043)
          0.04274743 = weight(abstract_txt:specifically in 5043) [ClassicSimilarity], result of:
            0.04274743 = score(doc=5043,freq=1.0), product of:
              0.12402237 = queryWeight, product of:
                1.0614376 = boost
                5.5148025 = idf(docFreq=483, maxDocs=44218)
                0.0211873 = queryNorm
              0.34467515 = fieldWeight in 5043, product of:
                1.0 = tf(freq=1.0), with freq of:
                  1.0 = termFreq=1.0
                5.5148025 = idf(docFreq=483, maxDocs=44218)
                0.0625 = fieldNorm(doc=5043)
          0.08327887 = weight(abstract_txt:perform in 5043) [ClassicSimilarity], result of:
            0.08327887 = score(doc=5043,freq=2.0), product of:
              0.1535465 = queryWeight, product of:
                1.1810395 = boost
                6.1362057 = idf(docFreq=259, maxDocs=44218)
                0.0211873 = queryNorm
              0.54236907 = fieldWeight in 5043, product of:
                1.4142135 = tf(freq=2.0), with freq of:
                  2.0 = termFreq=2.0
                6.1362057 = idf(docFreq=259, maxDocs=44218)
                0.0625 = fieldNorm(doc=5043)
          0.086234234 = weight(abstract_txt:contain in 5043) [ClassicSimilarity], result of:
            0.086234234 = score(doc=5043,freq=2.0), product of:
              0.157158 = queryWeight, product of:
                1.1948481 = boost
                6.2079496 = idf(docFreq=241, maxDocs=44218)
                0.0211873 = queryNorm
              0.5487104 = fieldWeight in 5043, product of:
                1.4142135 = tf(freq=2.0), with freq of:
                  2.0 = termFreq=2.0
                6.2079496 = idf(docFreq=241, maxDocs=44218)
                0.0625 = fieldNorm(doc=5043)
          0.02335557 = weight(abstract_txt:based in 5043) [ClassicSimilarity], result of:
            0.02335557 = score(doc=5043,freq=2.0), product of:
              0.08288711 = queryWeight, product of:
                1.227165 = boost
                3.1879277 = idf(docFreq=4958, maxDocs=44218)
                0.0211873 = queryNorm
              0.28177565 = fieldWeight in 5043, product of:
                1.4142135 = tf(freq=2.0), with freq of:
                  2.0 = termFreq=2.0
                3.1879277 = idf(docFreq=4958, maxDocs=44218)
                0.0625 = fieldNorm(doc=5043)
          0.082878605 = weight(abstract_txt:semantically in 5043) [ClassicSimilarity], result of:
            0.082878605 = score(doc=5043,freq=1.0), product of:
              0.19283608 = queryWeight, product of:
                1.3235446 = boost
                6.8766055 = idf(docFreq=123, maxDocs=44218)
                0.0211873 = queryNorm
              0.42978784 = fieldWeight in 5043, product of:
                1.0 = tf(freq=1.0), with freq of:
                  1.0 = termFreq=1.0
                6.8766055 = idf(docFreq=123, maxDocs=44218)
                0.0625 = fieldNorm(doc=5043)
          0.12248997 = weight(abstract_txt:necessarily in 5043) [ClassicSimilarity], result of:
            0.12248997 = score(doc=5043,freq=2.0), product of:
              0.1985868 = queryWeight, product of:
                1.3431349 = boost
                6.9783883 = idf(docFreq=111, maxDocs=44218)
                0.0211873 = queryNorm
              0.6168082 = fieldWeight in 5043, product of:
                1.4142135 = tf(freq=2.0), with freq of:
                  2.0 = termFreq=2.0
                6.9783883 = idf(docFreq=111, maxDocs=44218)
                0.0625 = fieldNorm(doc=5043)
          0.026831083 = weight(abstract_txt:which in 5043) [ClassicSimilarity], result of:
            0.026831083 = score(doc=5043,freq=2.0), product of:
              0.10407568 = queryWeight, product of:
                1.6841458 = boost
                2.9167147 = idf(docFreq=6503, maxDocs=44218)
                0.0211873 = queryNorm
              0.2578036 = fieldWeight in 5043, product of:
                1.4142135 = tf(freq=2.0), with freq of:
                  2.0 = termFreq=2.0
                2.9167147 = idf(docFreq=6503, maxDocs=44218)
                0.0625 = fieldNorm(doc=5043)
        0.32 = coord(8/25)
    
  2. Isaac, A.: Aligning thesauri for an integrated access to Cultural Heritage Resources (2007) 0.14
    0.14325447 = sum of:
      0.14325447 = product of:
        0.39792907 = sum of:
          0.022341209 = weight(abstract_txt:automatic in 553) [ClassicSimilarity], result of:
            0.022341209 = score(doc=553,freq=1.0), product of:
              0.11008068 = queryWeight, product of:
                5.1955976 = idf(docFreq=665, maxDocs=44218)
                0.0211873 = queryNorm
              0.20295304 = fieldWeight in 553, product of:
                1.0 = tf(freq=1.0), with freq of:
                  1.0 = termFreq=1.0
                5.1955976 = idf(docFreq=665, maxDocs=44218)
                0.0390625 = fieldNorm(doc=553)
          0.03148012 = weight(abstract_txt:ontologies in 553) [ClassicSimilarity], result of:
            0.03148012 = score(doc=553,freq=1.0), product of:
              0.13835587 = queryWeight, product of:
                1.1210971 = boost
                5.8247695 = idf(docFreq=354, maxDocs=44218)
                0.0211873 = queryNorm
              0.22753006 = fieldWeight in 553, product of:
                1.0 = tf(freq=1.0), with freq of:
                  1.0 = termFreq=1.0
                5.8247695 = idf(docFreq=354, maxDocs=44218)
                0.0390625 = fieldNorm(doc=553)
          0.032136988 = weight(abstract_txt:build in 553) [ClassicSimilarity], result of:
            0.032136988 = score(doc=553,freq=1.0), product of:
              0.14027387 = queryWeight, product of:
                1.1288412 = boost
                5.8650045 = idf(docFreq=340, maxDocs=44218)
                0.0211873 = queryNorm
              0.22910175 = fieldWeight in 553, product of:
                1.0 = tf(freq=1.0), with freq of:
                  1.0 = termFreq=1.0
                5.8650045 = idf(docFreq=340, maxDocs=44218)
                0.0390625 = fieldNorm(doc=553)
          0.053896394 = weight(abstract_txt:contain in 553) [ClassicSimilarity], result of:
            0.053896394 = score(doc=553,freq=2.0), product of:
              0.157158 = queryWeight, product of:
                1.1948481 = boost
                6.2079496 = idf(docFreq=241, maxDocs=44218)
                0.0211873 = queryNorm
              0.342944 = fieldWeight in 553, product of:
                1.4142135 = tf(freq=2.0), with freq of:
                  2.0 = termFreq=2.0
                6.2079496 = idf(docFreq=241, maxDocs=44218)
                0.0390625 = fieldNorm(doc=553)
          0.051799122 = weight(abstract_txt:semantically in 553) [ClassicSimilarity], result of:
            0.051799122 = score(doc=553,freq=1.0), product of:
              0.19283608 = queryWeight, product of:
                1.3235446 = boost
                6.8766055 = idf(docFreq=123, maxDocs=44218)
                0.0211873 = queryNorm
              0.2686174 = fieldWeight in 553, product of:
                1.0 = tf(freq=1.0), with freq of:
                  1.0 = termFreq=1.0
                6.8766055 = idf(docFreq=123, maxDocs=44218)
                0.0390625 = fieldNorm(doc=553)
          0.06508047 = weight(abstract_txt:talk in 553) [ClassicSimilarity], result of:
            0.06508047 = score(doc=553,freq=1.0), product of:
              0.22452971 = queryWeight, product of:
                1.4281747 = boost
                7.4202213 = idf(docFreq=71, maxDocs=44218)
                0.0211873 = queryNorm
              0.28985238 = fieldWeight in 553, product of:
                1.0 = tf(freq=1.0), with freq of:
                  1.0 = termFreq=1.0
                7.4202213 = idf(docFreq=71, maxDocs=44218)
                0.0390625 = fieldNorm(doc=553)
          0.026204832 = weight(abstract_txt:present in 553) [ClassicSimilarity], result of:
            0.026204832 = score(doc=553,freq=1.0), product of:
              0.1542544 = queryWeight, product of:
                1.6740878 = boost
                4.348943 = idf(docFreq=1552, maxDocs=44218)
                0.0211873 = queryNorm
              0.1698806 = fieldWeight in 553, product of:
                1.0 = tf(freq=1.0), with freq of:
                  1.0 = termFreq=1.0
                4.348943 = idf(docFreq=1552, maxDocs=44218)
                0.0390625 = fieldNorm(doc=553)
          0.011857776 = weight(abstract_txt:which in 553) [ClassicSimilarity], result of:
            0.011857776 = score(doc=553,freq=1.0), product of:
              0.10407568 = queryWeight, product of:
                1.6841458 = boost
                2.9167147 = idf(docFreq=6503, maxDocs=44218)
                0.0211873 = queryNorm
              0.11393417 = fieldWeight in 553, product of:
                1.0 = tf(freq=1.0), with freq of:
                  1.0 = termFreq=1.0
                2.9167147 = idf(docFreq=6503, maxDocs=44218)
                0.0390625 = fieldNorm(doc=553)
          0.10313215 = weight(abstract_txt:input in 553) [ClassicSimilarity], result of:
            0.10313215 = score(doc=553,freq=2.0), product of:
              0.30518937 = queryWeight, product of:
                2.3547463 = boost
                6.1171575 = idf(docFreq=264, maxDocs=44218)
                0.0211873 = queryNorm
              0.33792838 = fieldWeight in 553, product of:
                1.4142135 = tf(freq=2.0), with freq of:
                  2.0 = termFreq=2.0
                6.1171575 = idf(docFreq=264, maxDocs=44218)
                0.0390625 = fieldNorm(doc=553)
        0.36 = coord(9/25)
    
  3. Soricut, R.; Marcu, D.: Abstractive headline generation using WIDL-expressions (2007) 0.14
    0.13749635 = sum of:
      0.13749635 = product of:
        0.4910584 = sum of:
          0.044682417 = weight(abstract_txt:automatic in 943) [ClassicSimilarity], result of:
            0.044682417 = score(doc=943,freq=1.0), product of:
              0.11008068 = queryWeight, product of:
                5.1955976 = idf(docFreq=665, maxDocs=44218)
                0.0211873 = queryNorm
              0.40590608 = fieldWeight in 943, product of:
                1.0 = tf(freq=1.0), with freq of:
                  1.0 = termFreq=1.0
                5.1955976 = idf(docFreq=665, maxDocs=44218)
                0.078125 = fieldNorm(doc=943)
          0.047474165 = weight(abstract_txt:called in 943) [ClassicSimilarity], result of:
            0.047474165 = score(doc=943,freq=1.0), product of:
              0.11461943 = queryWeight, product of:
                1.0204073 = boost
                5.3016257 = idf(docFreq=598, maxDocs=44218)
                0.0211873 = queryNorm
              0.41418952 = fieldWeight in 943, product of:
                1.0 = tf(freq=1.0), with freq of:
                  1.0 = termFreq=1.0
                5.3016257 = idf(docFreq=598, maxDocs=44218)
                0.078125 = fieldNorm(doc=943)
          0.09586867 = weight(abstract_txt:textual in 943) [ClassicSimilarity], result of:
            0.09586867 = score(doc=943,freq=2.0), product of:
              0.14534312 = queryWeight, product of:
                1.1490573 = boost
                5.9700394 = idf(docFreq=306, maxDocs=44218)
                0.0211873 = queryNorm
              0.65960234 = fieldWeight in 943, product of:
                1.4142135 = tf(freq=2.0), with freq of:
                  2.0 = termFreq=2.0
                5.9700394 = idf(docFreq=306, maxDocs=44218)
                0.078125 = fieldNorm(doc=943)
          0.020643603 = weight(abstract_txt:based in 943) [ClassicSimilarity], result of:
            0.020643603 = score(doc=943,freq=1.0), product of:
              0.08288711 = queryWeight, product of:
                1.227165 = boost
                3.1879277 = idf(docFreq=4958, maxDocs=44218)
                0.0211873 = queryNorm
              0.24905685 = fieldWeight in 943, product of:
                1.0 = tf(freq=1.0), with freq of:
                  1.0 = termFreq=1.0
                3.1879277 = idf(docFreq=4958, maxDocs=44218)
                0.078125 = fieldNorm(doc=943)
          0.052409664 = weight(abstract_txt:present in 943) [ClassicSimilarity], result of:
            0.052409664 = score(doc=943,freq=1.0), product of:
              0.1542544 = queryWeight, product of:
                1.6740878 = boost
                4.348943 = idf(docFreq=1552, maxDocs=44218)
                0.0211873 = queryNorm
              0.3397612 = fieldWeight in 943, product of:
                1.0 = tf(freq=1.0), with freq of:
                  1.0 = termFreq=1.0
                4.348943 = idf(docFreq=1552, maxDocs=44218)
                0.078125 = fieldNorm(doc=943)
          0.023715552 = weight(abstract_txt:which in 943) [ClassicSimilarity], result of:
            0.023715552 = score(doc=943,freq=1.0), product of:
              0.10407568 = queryWeight, product of:
                1.6841458 = boost
                2.9167147 = idf(docFreq=6503, maxDocs=44218)
                0.0211873 = queryNorm
              0.22786833 = fieldWeight in 943, product of:
                1.0 = tf(freq=1.0), with freq of:
                  1.0 = termFreq=1.0
                2.9167147 = idf(docFreq=6503, maxDocs=44218)
                0.078125 = fieldNorm(doc=943)
          0.2062643 = weight(abstract_txt:input in 943) [ClassicSimilarity], result of:
            0.2062643 = score(doc=943,freq=2.0), product of:
              0.30518937 = queryWeight, product of:
                2.3547463 = boost
                6.1171575 = idf(docFreq=264, maxDocs=44218)
                0.0211873 = queryNorm
              0.67585677 = fieldWeight in 943, product of:
                1.4142135 = tf(freq=2.0), with freq of:
                  2.0 = termFreq=2.0
                6.1171575 = idf(docFreq=264, maxDocs=44218)
                0.078125 = fieldNorm(doc=943)
        0.28 = coord(7/25)
    
  4. Carpineto, C.; Mizzaro, S.; Romano, G.; Snidero, M.: Mobile information retrieval with search results clustering : prototypes and evaluations (2009) 0.11
    0.10842176 = sum of:
      0.10842176 = product of:
        0.5421088 = sum of:
          0.06306624 = weight(abstract_txt:searches in 2793) [ClassicSimilarity], result of:
            0.06306624 = score(doc=2793,freq=3.0), product of:
              0.111442514 = queryWeight, product of:
                1.0061666 = boost
                5.227637 = idf(docFreq=644, maxDocs=44218)
                0.0211873 = queryNorm
              0.56590825 = fieldWeight in 2793, product of:
                1.7320508 = tf(freq=3.0), with freq of:
                  3.0 = termFreq=3.0
                5.227637 = idf(docFreq=644, maxDocs=44218)
                0.0625 = fieldNorm(doc=2793)
          0.06274971 = weight(abstract_txt:wikipedia in 2793) [ClassicSimilarity], result of:
            0.06274971 = score(doc=2793,freq=1.0), product of:
              0.16018967 = queryWeight, product of:
                1.2063177 = boost
                6.2675414 = idf(docFreq=227, maxDocs=44218)
                0.0211873 = queryNorm
              0.39172134 = fieldWeight in 2793, product of:
                1.0 = tf(freq=1.0), with freq of:
                  1.0 = termFreq=1.0
                6.2675414 = idf(docFreq=227, maxDocs=44218)
                0.0625 = fieldNorm(doc=2793)
          0.02335557 = weight(abstract_txt:based in 2793) [ClassicSimilarity], result of:
            0.02335557 = score(doc=2793,freq=2.0), product of:
              0.08288711 = queryWeight, product of:
                1.227165 = boost
                3.1879277 = idf(docFreq=4958, maxDocs=44218)
                0.0211873 = queryNorm
              0.28177565 = fieldWeight in 2793, product of:
                1.4142135 = tf(freq=2.0), with freq of:
                  2.0 = termFreq=2.0
                3.1879277 = idf(docFreq=4958, maxDocs=44218)
                0.0625 = fieldNorm(doc=2793)
          0.04192773 = weight(abstract_txt:present in 2793) [ClassicSimilarity], result of:
            0.04192773 = score(doc=2793,freq=1.0), product of:
              0.1542544 = queryWeight, product of:
                1.6740878 = boost
                4.348943 = idf(docFreq=1552, maxDocs=44218)
                0.0211873 = queryNorm
              0.27180895 = fieldWeight in 2793, product of:
                1.0 = tf(freq=1.0), with freq of:
                  1.0 = termFreq=1.0
                4.348943 = idf(docFreq=1552, maxDocs=44218)
                0.0625 = fieldNorm(doc=2793)
          0.35100952 = weight(abstract_txt:desktop in 2793) [ClassicSimilarity], result of:
            0.35100952 = score(doc=2793,freq=3.0), product of:
              0.44096982 = queryWeight, product of:
                2.8305047 = boost
                7.3530817 = idf(docFreq=76, maxDocs=44218)
                0.0211873 = queryNorm
              0.7959944 = fieldWeight in 2793, product of:
                1.7320508 = tf(freq=3.0), with freq of:
                  3.0 = termFreq=3.0
                7.3530817 = idf(docFreq=76, maxDocs=44218)
                0.0625 = fieldNorm(doc=2793)
        0.2 = coord(5/25)
    
  5. Hepp, M.; Bruijn, J. de: GenTax : a generic methodology for deriving OWL and RDF-S ontologies from hierarchical classifications, thesauri, and inconsistent taxonomies (2007) 0.11
    0.107406035 = sum of:
      0.107406035 = product of:
        0.44752514 = sum of:
          0.10073638 = weight(abstract_txt:ontologies in 4692) [ClassicSimilarity], result of:
            0.10073638 = score(doc=4692,freq=4.0), product of:
              0.13835587 = queryWeight, product of:
                1.1210971 = boost
                5.8247695 = idf(docFreq=354, maxDocs=44218)
                0.0211873 = queryNorm
              0.7280962 = fieldWeight in 4692, product of:
                2.0 = tf(freq=4.0), with freq of:
                  4.0 = termFreq=4.0
                5.8247695 = idf(docFreq=354, maxDocs=44218)
                0.0625 = fieldNorm(doc=4692)
          0.06097681 = weight(abstract_txt:contain in 4692) [ClassicSimilarity], result of:
            0.06097681 = score(doc=4692,freq=1.0), product of:
              0.157158 = queryWeight, product of:
                1.1948481 = boost
                6.2079496 = idf(docFreq=241, maxDocs=44218)
                0.0211873 = queryNorm
              0.38799685 = fieldWeight in 4692, product of:
                1.0 = tf(freq=1.0), with freq of:
                  1.0 = termFreq=1.0
                6.2079496 = idf(docFreq=241, maxDocs=44218)
                0.0625 = fieldNorm(doc=4692)
          0.06235791 = weight(abstract_txt:category in 4692) [ClassicSimilarity], result of:
            0.06235791 = score(doc=4692,freq=1.0), product of:
              0.15952218 = queryWeight, product of:
                1.2038018 = boost
                6.2544694 = idf(docFreq=230, maxDocs=44218)
                0.0211873 = queryNorm
              0.39090434 = fieldWeight in 4692, product of:
                1.0 = tf(freq=1.0), with freq of:
                  1.0 = termFreq=1.0
                6.2544694 = idf(docFreq=230, maxDocs=44218)
                0.0625 = fieldNorm(doc=4692)
          0.016514882 = weight(abstract_txt:based in 4692) [ClassicSimilarity], result of:
            0.016514882 = score(doc=4692,freq=1.0), product of:
              0.08288711 = queryWeight, product of:
                1.227165 = boost
                3.1879277 = idf(docFreq=4958, maxDocs=44218)
                0.0211873 = queryNorm
              0.19924548 = fieldWeight in 4692, product of:
                1.0 = tf(freq=1.0), with freq of:
                  1.0 = termFreq=1.0
                3.1879277 = idf(docFreq=4958, maxDocs=44218)
                0.0625 = fieldNorm(doc=4692)
          0.04192773 = weight(abstract_txt:present in 4692) [ClassicSimilarity], result of:
            0.04192773 = score(doc=4692,freq=1.0), product of:
              0.1542544 = queryWeight, product of:
                1.6740878 = boost
                4.348943 = idf(docFreq=1552, maxDocs=44218)
                0.0211873 = queryNorm
              0.27180895 = fieldWeight in 4692, product of:
                1.0 = tf(freq=1.0), with freq of:
                  1.0 = termFreq=1.0
                4.348943 = idf(docFreq=1552, maxDocs=44218)
                0.0625 = fieldNorm(doc=4692)
          0.16501144 = weight(abstract_txt:input in 4692) [ClassicSimilarity], result of:
            0.16501144 = score(doc=4692,freq=2.0), product of:
              0.30518937 = queryWeight, product of:
                2.3547463 = boost
                6.1171575 = idf(docFreq=264, maxDocs=44218)
                0.0211873 = queryNorm
              0.5406854 = fieldWeight in 4692, product of:
                1.4142135 = tf(freq=2.0), with freq of:
                  2.0 = termFreq=2.0
                6.1171575 = idf(docFreq=264, maxDocs=44218)
                0.0625 = fieldNorm(doc=4692)
        0.24 = coord(6/25)