Document (#30199)

Author
Benoit, G.
Title
Data discretization for novel relationship discovery in information retrieval
Source
Journal of the American Society for Information Science and Technology. 53(2002) no.9, S.736-746
Year
2002
Abstract
A sample of 600 Dialog and Swiss-Prot full-text records in genetics and molecular biology was parsed, and term frequencies were calculated, to provide data for a test of Benoit's visualization model for retrieval. A retrieved set is displayed graphically, allowing document and concept relationships to be manipulated in real time, in the hope of revealing unanticipated relationships.
Theme
Computerlinguistik
Field
Molekularbiologie

Similar documents (content)

  1. Müller, B.; Poley, C.; Pössel, J.; Hagelstein, A.; Gübitz, T.: LIVIVO - the vertical search engine for life sciences (2017) 0.12
    0.11776206 = sum of:
      0.11776206 = product of:
        0.49067527 = sum of:
          0.040276237 = weight(abstract_txt:novel in 4833) [ClassicSimilarity], result of:
            0.040276237 = score(doc=4833,freq=1.0), product of:
              0.115878604 = queryWeight, product of:
                1.0996 = boost
                5.561163 = idf(docFreq=451, maxDocs=43254)
                0.018949725 = queryNorm
              0.34757268 = fieldWeight in 4833, product of:
                1.0 = tf(freq=1.0), with freq of:
                  1.0 = termFreq=1.0
                5.561163 = idf(docFreq=451, maxDocs=43254)
                0.0625 = fieldNorm(doc=4833)
          0.03550219 = weight(abstract_txt:data in 4833) [ClassicSimilarity], result of:
            0.03550219 = score(doc=4833,freq=4.0), product of:
              0.08455334 = queryWeight, product of:
                1.3283528 = boost
                3.3590338 = idf(docFreq=4087, maxDocs=43254)
                0.018949725 = queryNorm
              0.41987923 = fieldWeight in 4833, product of:
                2.0 = tf(freq=4.0), with freq of:
                  4.0 = termFreq=4.0
                3.3590338 = idf(docFreq=4087, maxDocs=43254)
                0.0625 = fieldNorm(doc=4833)
          0.033891704 = weight(abstract_txt:retrieval in 4833) [ClassicSimilarity], result of:
            0.033891704 = score(doc=4833,freq=3.0), product of:
              0.09022686 = queryWeight, product of:
                1.3721956 = boost
                3.4699 = idf(docFreq=3658, maxDocs=43254)
                0.018949725 = queryNorm
              0.37562767 = fieldWeight in 4833, product of:
                1.7320508 = tf(freq=3.0), with freq of:
                  3.0 = termFreq=3.0
                3.4699 = idf(docFreq=3658, maxDocs=43254)
                0.0625 = fieldNorm(doc=4833)
          0.08418832 = weight(abstract_txt:biology in 4833) [ClassicSimilarity], result of:
            0.08418832 = score(doc=4833,freq=1.0), product of:
              0.18944009 = queryWeight, product of:
                1.4059472 = boost
                7.110497 = idf(docFreq=95, maxDocs=43254)
                0.018949725 = queryNorm
              0.44440606 = fieldWeight in 4833, product of:
                1.0 = tf(freq=1.0), with freq of:
                  1.0 = termFreq=1.0
                7.110497 = idf(docFreq=95, maxDocs=43254)
                0.0625 = fieldNorm(doc=4833)
          0.124054074 = weight(abstract_txt:molecular in 4833) [ClassicSimilarity], result of:
            0.124054074 = score(doc=4833,freq=1.0), product of:
              0.24530779 = queryWeight, product of:
                1.599885 = boost
                8.091326 = idf(docFreq=35, maxDocs=43254)
                0.018949725 = queryNorm
              0.50570786 = fieldWeight in 4833, product of:
                1.0 = tf(freq=1.0), with freq of:
                  1.0 = termFreq=1.0
                8.091326 = idf(docFreq=35, maxDocs=43254)
                0.0625 = fieldNorm(doc=4833)
          0.17276274 = weight(abstract_txt:genetics in 4833) [ClassicSimilarity], result of:
            0.17276274 = score(doc=4833,freq=1.0), product of:
              0.3059173 = queryWeight, product of:
                1.786632 = boost
                9.035788 = idf(docFreq=13, maxDocs=43254)
                0.018949725 = queryNorm
              0.5647367 = fieldWeight in 4833, product of:
                1.0 = tf(freq=1.0), with freq of:
                  1.0 = termFreq=1.0
                9.035788 = idf(docFreq=13, maxDocs=43254)
                0.0625 = fieldNorm(doc=4833)
        0.24 = coord(6/25)
    
  2. Fenstermacher, D.A.: Introduction to bioinformatics. (2005) 0.11
    0.113487065 = sum of:
      0.113487065 = product of:
        0.5674353 = sum of:
          0.056692243 = weight(abstract_txt:visualization in 258) [ClassicSimilarity], result of:
            0.056692243 = score(doc=258,freq=1.0), product of:
              0.14554136 = queryWeight, product of:
                1.2323279 = boost
                6.232427 = idf(docFreq=230, maxDocs=43254)
                0.018949725 = queryNorm
              0.3895267 = fieldWeight in 258, product of:
                1.0 = tf(freq=1.0), with freq of:
                  1.0 = termFreq=1.0
                6.232427 = idf(docFreq=230, maxDocs=43254)
                0.0625 = fieldNorm(doc=258)
          0.04348113 = weight(abstract_txt:data in 258) [ClassicSimilarity], result of:
            0.04348113 = score(doc=258,freq=6.0), product of:
              0.08455334 = queryWeight, product of:
                1.3283528 = boost
                3.3590338 = idf(docFreq=4087, maxDocs=43254)
                0.018949725 = queryNorm
              0.514245 = fieldWeight in 258, product of:
                2.4494898 = tf(freq=6.0), with freq of:
                  6.0 = termFreq=6.0
                3.3590338 = idf(docFreq=4087, maxDocs=43254)
                0.0625 = fieldNorm(doc=258)
          0.11906027 = weight(abstract_txt:biology in 258) [ClassicSimilarity], result of:
            0.11906027 = score(doc=258,freq=2.0), product of:
              0.18944009 = queryWeight, product of:
                1.4059472 = boost
                7.110497 = idf(docFreq=95, maxDocs=43254)
                0.018949725 = queryNorm
              0.6284851 = fieldWeight in 258, product of:
                1.4142135 = tf(freq=2.0), with freq of:
                  2.0 = termFreq=2.0
                7.110497 = idf(docFreq=95, maxDocs=43254)
                0.0625 = fieldNorm(doc=258)
          0.17543896 = weight(abstract_txt:molecular in 258) [ClassicSimilarity], result of:
            0.17543896 = score(doc=258,freq=2.0), product of:
              0.24530779 = queryWeight, product of:
                1.599885 = boost
                8.091326 = idf(docFreq=35, maxDocs=43254)
                0.018949725 = queryNorm
              0.7151789 = fieldWeight in 258, product of:
                1.4142135 = tf(freq=2.0), with freq of:
                  2.0 = termFreq=2.0
                8.091326 = idf(docFreq=35, maxDocs=43254)
                0.0625 = fieldNorm(doc=258)
          0.17276274 = weight(abstract_txt:genetics in 258) [ClassicSimilarity], result of:
            0.17276274 = score(doc=258,freq=1.0), product of:
              0.3059173 = queryWeight, product of:
                1.786632 = boost
                9.035788 = idf(docFreq=13, maxDocs=43254)
                0.018949725 = queryNorm
              0.5647367 = fieldWeight in 258, product of:
                1.0 = tf(freq=1.0), with freq of:
                  1.0 = termFreq=1.0
                9.035788 = idf(docFreq=13, maxDocs=43254)
                0.0625 = fieldNorm(doc=258)
        0.2 = coord(5/25)
    
  3. Fowler, R.H.; Wilson, B.A.; Fowler, W.A.L.: Information navigator : an information system using associative networks for display and retrieval (1992) 0.09
    0.09098579 = sum of:
      0.09098579 = product of:
        0.45492893 = sum of:
          0.0708653 = weight(abstract_txt:visualization in 2920) [ClassicSimilarity], result of:
            0.0708653 = score(doc=2920,freq=1.0), product of:
              0.14554136 = queryWeight, product of:
                1.2323279 = boost
                6.232427 = idf(docFreq=230, maxDocs=43254)
                0.018949725 = queryNorm
              0.48690838 = fieldWeight in 2920, product of:
                1.0 = tf(freq=1.0), with freq of:
                  1.0 = termFreq=1.0
                6.232427 = idf(docFreq=230, maxDocs=43254)
                0.078125 = fieldNorm(doc=2920)
          0.02218887 = weight(abstract_txt:data in 2920) [ClassicSimilarity], result of:
            0.02218887 = score(doc=2920,freq=1.0), product of:
              0.08455334 = queryWeight, product of:
                1.3283528 = boost
                3.3590338 = idf(docFreq=4087, maxDocs=43254)
                0.018949725 = queryNorm
              0.26242453 = fieldWeight in 2920, product of:
                1.0 = tf(freq=1.0), with freq of:
                  1.0 = termFreq=1.0
                3.3590338 = idf(docFreq=4087, maxDocs=43254)
                0.078125 = fieldNorm(doc=2920)
          0.04236463 = weight(abstract_txt:retrieval in 2920) [ClassicSimilarity], result of:
            0.04236463 = score(doc=2920,freq=3.0), product of:
              0.09022686 = queryWeight, product of:
                1.3721956 = boost
                3.4699 = idf(docFreq=3658, maxDocs=43254)
                0.018949725 = queryNorm
              0.46953458 = fieldWeight in 2920, product of:
                1.7320508 = tf(freq=3.0), with freq of:
                  3.0 = termFreq=3.0
                3.4699 = idf(docFreq=3658, maxDocs=43254)
                0.078125 = fieldNorm(doc=2920)
          0.17133452 = weight(abstract_txt:manipulation in 2920) [ClassicSimilarity], result of:
            0.17133452 = score(doc=2920,freq=3.0), product of:
              0.1817831 = queryWeight, product of:
                1.3772407 = boost
                6.965315 = idf(docFreq=110, maxDocs=43254)
                0.018949725 = queryNorm
              0.94252175 = fieldWeight in 2920, product of:
                1.7320508 = tf(freq=3.0), with freq of:
                  3.0 = termFreq=3.0
                6.965315 = idf(docFreq=110, maxDocs=43254)
                0.078125 = fieldNorm(doc=2920)
          0.14817558 = weight(abstract_txt:displayed in 2920) [ClassicSimilarity], result of:
            0.14817558 = score(doc=2920,freq=2.0), product of:
              0.18888831 = queryWeight, product of:
                1.4038982 = boost
                7.100134 = idf(docFreq=96, maxDocs=43254)
                0.018949725 = queryNorm
              0.7844614 = fieldWeight in 2920, product of:
                1.4142135 = tf(freq=2.0), with freq of:
                  2.0 = termFreq=2.0
                7.100134 = idf(docFreq=96, maxDocs=43254)
                0.078125 = fieldNorm(doc=2920)
        0.2 = coord(5/25)
    
  4. Vaughan, L.; Shaw, D.: Web citation data for impact assessment : a comparison of four science disciplines (2005) 0.09
    0.08599792 = sum of:
      0.08599792 = product of:
        0.42998958 = sum of:
          0.040276237 = weight(abstract_txt:sample in 5881) [ClassicSimilarity], result of:
            0.040276237 = score(doc=5881,freq=1.0), product of:
              0.115878604 = queryWeight, product of:
                1.0996 = boost
                5.561163 = idf(docFreq=451, maxDocs=43254)
                0.018949725 = queryNorm
              0.34757268 = fieldWeight in 5881, product of:
                1.0 = tf(freq=1.0), with freq of:
                  1.0 = termFreq=1.0
                5.561163 = idf(docFreq=451, maxDocs=43254)
                0.0625 = fieldNorm(doc=5881)
          0.043450553 = weight(abstract_txt:retrieved in 5881) [ClassicSimilarity], result of:
            0.043450553 = score(doc=5881,freq=1.0), product of:
              0.121889845 = queryWeight, product of:
                1.1277604 = boost
                5.7035832 = idf(docFreq=391, maxDocs=43254)
                0.018949725 = queryNorm
              0.35647395 = fieldWeight in 5881, product of:
                1.0 = tf(freq=1.0), with freq of:
                  1.0 = termFreq=1.0
                5.7035832 = idf(docFreq=391, maxDocs=43254)
                0.0625 = fieldNorm(doc=5881)
          0.017751096 = weight(abstract_txt:data in 5881) [ClassicSimilarity], result of:
            0.017751096 = score(doc=5881,freq=1.0), product of:
              0.08455334 = queryWeight, product of:
                1.3283528 = boost
                3.3590338 = idf(docFreq=4087, maxDocs=43254)
                0.018949725 = queryNorm
              0.20993961 = fieldWeight in 5881, product of:
                1.0 = tf(freq=1.0), with freq of:
                  1.0 = termFreq=1.0
                3.3590338 = idf(docFreq=4087, maxDocs=43254)
                0.0625 = fieldNorm(doc=5881)
          0.08418832 = weight(abstract_txt:biology in 5881) [ClassicSimilarity], result of:
            0.08418832 = score(doc=5881,freq=1.0), product of:
              0.18944009 = queryWeight, product of:
                1.4059472 = boost
                7.110497 = idf(docFreq=95, maxDocs=43254)
                0.018949725 = queryNorm
              0.44440606 = fieldWeight in 5881, product of:
                1.0 = tf(freq=1.0), with freq of:
                  1.0 = termFreq=1.0
                7.110497 = idf(docFreq=95, maxDocs=43254)
                0.0625 = fieldNorm(doc=5881)
          0.24432339 = weight(abstract_txt:genetics in 5881) [ClassicSimilarity], result of:
            0.24432339 = score(doc=5881,freq=2.0), product of:
              0.3059173 = queryWeight, product of:
                1.786632 = boost
                9.035788 = idf(docFreq=13, maxDocs=43254)
                0.018949725 = queryNorm
              0.7986583 = fieldWeight in 5881, product of:
                1.4142135 = tf(freq=2.0), with freq of:
                  2.0 = termFreq=2.0
                9.035788 = idf(docFreq=13, maxDocs=43254)
                0.0625 = fieldNorm(doc=5881)
        0.2 = coord(5/25)
    
  5. Rapp, B.A.; Wheeler, D.L.: Bioinformatics resources from the National Center for Biotechnology Information : an integrated foundation for discovery (2005) 0.08
    0.08072592 = sum of:
      0.08072592 = product of:
        0.4036296 = sum of:
          0.042597983 = weight(abstract_txt:discovery in 266) [ClassicSimilarity], result of:
            0.042597983 = score(doc=266,freq=1.0), product of:
              0.12029013 = queryWeight, product of:
                1.1203355 = boost
                5.666032 = idf(docFreq=406, maxDocs=43254)
                0.018949725 = queryNorm
              0.354127 = fieldWeight in 266, product of:
                1.0 = tf(freq=1.0), with freq of:
                  1.0 = termFreq=1.0
                5.666032 = idf(docFreq=406, maxDocs=43254)
                0.0625 = fieldNorm(doc=266)
          0.04696498 = weight(abstract_txt:data in 266) [ClassicSimilarity], result of:
            0.04696498 = score(doc=266,freq=7.0), product of:
              0.08455334 = queryWeight, product of:
                1.3283528 = boost
                3.3590338 = idf(docFreq=4087, maxDocs=43254)
                0.018949725 = queryNorm
              0.555448 = fieldWeight in 266, product of:
                2.6457512 = tf(freq=7.0), with freq of:
                  7.0 = termFreq=7.0
                3.3590338 = idf(docFreq=4087, maxDocs=43254)
                0.0625 = fieldNorm(doc=266)
          0.019567385 = weight(abstract_txt:retrieval in 266) [ClassicSimilarity], result of:
            0.019567385 = score(doc=266,freq=1.0), product of:
              0.09022686 = queryWeight, product of:
                1.3721956 = boost
                3.4699 = idf(docFreq=3658, maxDocs=43254)
                0.018949725 = queryNorm
              0.21686874 = fieldWeight in 266, product of:
                1.0 = tf(freq=1.0), with freq of:
                  1.0 = termFreq=1.0
                3.4699 = idf(docFreq=3658, maxDocs=43254)
                0.0625 = fieldNorm(doc=266)
          0.11906027 = weight(abstract_txt:biology in 266) [ClassicSimilarity], result of:
            0.11906027 = score(doc=266,freq=2.0), product of:
              0.18944009 = queryWeight, product of:
                1.4059472 = boost
                7.110497 = idf(docFreq=95, maxDocs=43254)
                0.018949725 = queryNorm
              0.6284851 = fieldWeight in 266, product of:
                1.4142135 = tf(freq=2.0), with freq of:
                  2.0 = termFreq=2.0
                7.110497 = idf(docFreq=95, maxDocs=43254)
                0.0625 = fieldNorm(doc=266)
          0.17543896 = weight(abstract_txt:molecular in 266) [ClassicSimilarity], result of:
            0.17543896 = score(doc=266,freq=2.0), product of:
              0.24530779 = queryWeight, product of:
                1.599885 = boost
                8.091326 = idf(docFreq=35, maxDocs=43254)
                0.018949725 = queryNorm
              0.7151789 = fieldWeight in 266, product of:
                1.4142135 = tf(freq=2.0), with freq of:
                  2.0 = termFreq=2.0
                8.091326 = idf(docFreq=35, maxDocs=43254)
                0.0625 = fieldNorm(doc=266)
        0.2 = coord(5/25)