Document (#17102)

Author
Ihm, P.
Title
Numerische Taxonomie und Datenbanken
Source
Numerische und nicht-numerische Klassifikation zwischen Theorie und Praxis. Proc. der 5. Fachtagung der Gesellschaft für Klassifikation, Hofgeismar, 7.-10.4.1981. Hrsg.: Peter Ihm u.a.
Imprint
Frankfurt : Indeks
Year
1982
Pages
S.16-21
Series
Studien zur Klassifikation; Bd.10
Abstract
Eine Datenbank besteht aus Datenbasis und Datenbank-Managementsystem. Sie ist Hilfsmittel zur Speicherung und Bereitstellung von Daten, die häufig Gegenstand einer statistischen (explorativen) Datenanalyse sind. Ein häufig angewandtes Verfahren ist die Clusteranalyse. In den für Datenbanken typischen Fällen haben Daten eine komplexe Struktur, es fragt sich, ob die Clusteranalysealgorithmen statt auf dem Umweg über rechteckige Dateien direkt auf die anders strukturierten Daten angewendet werden können. Entsprechende Methodologien für die verschiedenen Anwendungsfälle werden diskutiert.

Similar documents (content)

  1. Renker, L.: Exploration von Textkorpora : Topic Models als Grundlage der Interaktion (2015) 0.11
    0.111576594 = sum of:
      0.111576594 = product of:
        0.55788296 = sum of:
          0.03132944 = weight(abstract_txt:werden in 3380) [ClassicSimilarity], result of:
            0.03132944 = score(doc=3380,freq=4.0), product of:
              0.0714511 = queryWeight, product of:
                1.0054148 = boost
                3.507791 = idf(docFreq=3617, maxDocs=44421)
                0.020259555 = queryNorm
              0.43847388 = fieldWeight in 3380, product of:
                2.0 = tf(freq=4.0), with freq of:
                  4.0 = termFreq=4.0
                3.507791 = idf(docFreq=3617, maxDocs=44421)
                0.0625 = fieldNorm(doc=3380)
          0.067466535 = weight(abstract_txt:entsprechende in 3380) [ClassicSimilarity], result of:
            0.067466535 = score(doc=3380,freq=1.0), product of:
              0.15012145 = queryWeight, product of:
                1.0304981 = boost
                7.190608 = idf(docFreq=90, maxDocs=44421)
                0.020259555 = queryNorm
              0.449413 = fieldWeight in 3380, product of:
                1.0 = tf(freq=1.0), with freq of:
                  1.0 = termFreq=1.0
                7.190608 = idf(docFreq=90, maxDocs=44421)
                0.0625 = fieldNorm(doc=3380)
          0.07079655 = weight(abstract_txt:fällen in 3380) [ClassicSimilarity], result of:
            0.07079655 = score(doc=3380,freq=1.0), product of:
              0.15502147 = queryWeight, product of:
                1.047181 = boost
                7.3070183 = idf(docFreq=80, maxDocs=44421)
                0.020259555 = queryNorm
              0.45668864 = fieldWeight in 3380, product of:
                1.0 = tf(freq=1.0), with freq of:
                  1.0 = termFreq=1.0
                7.3070183 = idf(docFreq=80, maxDocs=44421)
                0.0625 = fieldNorm(doc=3380)
          0.30947012 = weight(abstract_txt:explorativen in 3380) [ClassicSimilarity], result of:
            0.30947012 = score(doc=3380,freq=5.0), product of:
              0.24236672 = queryWeight, product of:
                1.3093698 = boost
                9.1365185 = idf(docFreq=12, maxDocs=44421)
                0.020259555 = queryNorm
              1.2768673 = fieldWeight in 3380, product of:
                2.236068 = tf(freq=5.0), with freq of:
                  5.0 = termFreq=5.0
                9.1365185 = idf(docFreq=12, maxDocs=44421)
                0.0625 = fieldNorm(doc=3380)
          0.078820296 = weight(abstract_txt:daten in 3380) [ClassicSimilarity], result of:
            0.078820296 = score(doc=3380,freq=1.0), product of:
              0.24016862 = queryWeight, product of:
                2.2575874 = boost
                5.250997 = idf(docFreq=632, maxDocs=44421)
                0.020259555 = queryNorm
              0.32818732 = fieldWeight in 3380, product of:
                1.0 = tf(freq=1.0), with freq of:
                  1.0 = termFreq=1.0
                5.250997 = idf(docFreq=632, maxDocs=44421)
                0.0625 = fieldNorm(doc=3380)
        0.2 = coord(5/25)
    
  2. Bock, H.-H.: Datenanalyse zur Strukturierung und Ordnung von Information (1989) 0.11
    0.106798 = sum of:
      0.106798 = product of:
        0.6674875 = sum of:
          0.023497079 = weight(abstract_txt:werden in 141) [ClassicSimilarity], result of:
            0.023497079 = score(doc=141,freq=1.0), product of:
              0.0714511 = queryWeight, product of:
                1.0054148 = boost
                3.507791 = idf(docFreq=3617, maxDocs=44421)
                0.020259555 = queryNorm
              0.3288554 = fieldWeight in 141, product of:
                1.0 = tf(freq=1.0), with freq of:
                  1.0 = termFreq=1.0
                3.507791 = idf(docFreq=3617, maxDocs=44421)
                0.09375 = fieldNorm(doc=141)
          0.14562021 = weight(abstract_txt:angewendet in 141) [ClassicSimilarity], result of:
            0.14562021 = score(doc=141,freq=1.0), product of:
              0.19133927 = queryWeight, product of:
                1.1633968 = boost
                8.117949 = idf(docFreq=35, maxDocs=44421)
                0.020259555 = queryNorm
              0.7610577 = fieldWeight in 141, product of:
                1.0 = tf(freq=1.0), with freq of:
                  1.0 = termFreq=1.0
                8.117949 = idf(docFreq=35, maxDocs=44421)
                0.09375 = fieldNorm(doc=141)
          0.29358912 = weight(abstract_txt:datenanalyse in 141) [ClassicSimilarity], result of:
            0.29358912 = score(doc=141,freq=2.0), product of:
              0.24236672 = queryWeight, product of:
                1.3093698 = boost
                9.1365185 = idf(docFreq=12, maxDocs=44421)
                0.020259555 = queryNorm
              1.2113426 = fieldWeight in 141, product of:
                1.4142135 = tf(freq=2.0), with freq of:
                  2.0 = termFreq=2.0
                9.1365185 = idf(docFreq=12, maxDocs=44421)
                0.09375 = fieldNorm(doc=141)
          0.20478113 = weight(abstract_txt:daten in 141) [ClassicSimilarity], result of:
            0.20478113 = score(doc=141,freq=3.0), product of:
              0.24016862 = queryWeight, product of:
                2.2575874 = boost
                5.250997 = idf(docFreq=632, maxDocs=44421)
                0.020259555 = queryNorm
              0.85265565 = fieldWeight in 141, product of:
                1.7320508 = tf(freq=3.0), with freq of:
                  3.0 = termFreq=3.0
                5.250997 = idf(docFreq=632, maxDocs=44421)
                0.09375 = fieldNorm(doc=141)
        0.16 = coord(4/25)
    
  3. Kind, J.: Praxis des Information Retrieval (2004) 0.10
    0.09706819 = sum of:
      0.09706819 = product of:
        0.48534095 = sum of:
          0.033370093 = weight(abstract_txt:eine in 3934) [ClassicSimilarity], result of:
            0.033370093 = score(doc=3934,freq=3.0), product of:
              0.07068355 = queryWeight, product of:
                3.4888992 = idf(docFreq=3686, maxDocs=44421)
                0.020259555 = queryNorm
              0.4721055 = fieldWeight in 3934, product of:
                1.7320508 = tf(freq=3.0), with freq of:
                  3.0 = termFreq=3.0
                3.4888992 = idf(docFreq=3686, maxDocs=44421)
                0.078125 = fieldNorm(doc=3934)
          0.027691573 = weight(abstract_txt:werden in 3934) [ClassicSimilarity], result of:
            0.027691573 = score(doc=3934,freq=2.0), product of:
              0.0714511 = queryWeight, product of:
                1.0054148 = boost
                3.507791 = idf(docFreq=3617, maxDocs=44421)
                0.020259555 = queryNorm
              0.3875598 = fieldWeight in 3934, product of:
                1.4142135 = tf(freq=2.0), with freq of:
                  2.0 = termFreq=2.0
                3.507791 = idf(docFreq=3617, maxDocs=44421)
                0.078125 = fieldNorm(doc=3934)
          0.1192651 = weight(abstract_txt:entsprechende in 3934) [ClassicSimilarity], result of:
            0.1192651 = score(doc=3934,freq=2.0), product of:
              0.15012145 = queryWeight, product of:
                1.0304981 = boost
                7.190608 = idf(docFreq=90, maxDocs=44421)
                0.020259555 = queryNorm
              0.79445744 = fieldWeight in 3934, product of:
                1.4142135 = tf(freq=2.0), with freq of:
                  2.0 = termFreq=2.0
                7.190608 = idf(docFreq=90, maxDocs=44421)
                0.078125 = fieldNorm(doc=3934)
          0.108042784 = weight(abstract_txt:strukturierten in 3934) [ClassicSimilarity], result of:
            0.108042784 = score(doc=3934,freq=1.0), product of:
              0.17708196 = queryWeight, product of:
                1.1192136 = boost
                7.809647 = idf(docFreq=48, maxDocs=44421)
                0.020259555 = queryNorm
              0.6101287 = fieldWeight in 3934, product of:
                1.0 = tf(freq=1.0), with freq of:
                  1.0 = termFreq=1.0
                7.809647 = idf(docFreq=48, maxDocs=44421)
                0.078125 = fieldNorm(doc=3934)
          0.1969714 = weight(abstract_txt:datenbanken in 3934) [ClassicSimilarity], result of:
            0.1969714 = score(doc=3934,freq=5.0), product of:
              0.19471493 = queryWeight, product of:
                1.6597415 = boost
                5.790671 = idf(docFreq=368, maxDocs=44421)
                0.020259555 = queryNorm
              1.0115886 = fieldWeight in 3934, product of:
                2.236068 = tf(freq=5.0), with freq of:
                  5.0 = termFreq=5.0
                5.790671 = idf(docFreq=368, maxDocs=44421)
                0.078125 = fieldNorm(doc=3934)
        0.2 = coord(5/25)
    
  4. Jackermeier, R.: Code I've Seen : Verhalten von Programmierern beim Wiederfinden von Code-Stellen (2015) 0.10
    0.09517455 = sum of:
      0.09517455 = product of:
        0.47587276 = sum of:
          0.02311948 = weight(abstract_txt:eine in 2740) [ClassicSimilarity], result of:
            0.02311948 = score(doc=2740,freq=1.0), product of:
              0.07068355 = queryWeight, product of:
                3.4888992 = idf(docFreq=3686, maxDocs=44421)
                0.020259555 = queryNorm
              0.3270843 = fieldWeight in 2740, product of:
                1.0 = tf(freq=1.0), with freq of:
                  1.0 = termFreq=1.0
                3.4888992 = idf(docFreq=3686, maxDocs=44421)
                0.09375 = fieldNorm(doc=2740)
          0.040698137 = weight(abstract_txt:werden in 2740) [ClassicSimilarity], result of:
            0.040698137 = score(doc=2740,freq=3.0), product of:
              0.0714511 = queryWeight, product of:
                1.0054148 = boost
                3.507791 = idf(docFreq=3617, maxDocs=44421)
                0.020259555 = queryNorm
              0.56959426 = fieldWeight in 2740, product of:
                1.7320508 = tf(freq=3.0), with freq of:
                  3.0 = termFreq=3.0
                3.507791 = idf(docFreq=3617, maxDocs=44421)
                0.09375 = fieldNorm(doc=2740)
          0.14562021 = weight(abstract_txt:angewendet in 2740) [ClassicSimilarity], result of:
            0.14562021 = score(doc=2740,freq=1.0), product of:
              0.19133927 = queryWeight, product of:
                1.1633968 = boost
                8.117949 = idf(docFreq=35, maxDocs=44421)
                0.020259555 = queryNorm
              0.7610577 = fieldWeight in 2740, product of:
                1.0 = tf(freq=1.0), with freq of:
                  1.0 = termFreq=1.0
                8.117949 = idf(docFreq=35, maxDocs=44421)
                0.09375 = fieldNorm(doc=2740)
          0.14820449 = weight(abstract_txt:häufig in 2740) [ClassicSimilarity], result of:
            0.14820449 = score(doc=2740,freq=1.0), product of:
              0.24391614 = queryWeight, product of:
                1.8576381 = boost
                6.481112 = idf(docFreq=184, maxDocs=44421)
                0.020259555 = queryNorm
              0.60760427 = fieldWeight in 2740, product of:
                1.0 = tf(freq=1.0), with freq of:
                  1.0 = termFreq=1.0
                6.481112 = idf(docFreq=184, maxDocs=44421)
                0.09375 = fieldNorm(doc=2740)
          0.11823044 = weight(abstract_txt:daten in 2740) [ClassicSimilarity], result of:
            0.11823044 = score(doc=2740,freq=1.0), product of:
              0.24016862 = queryWeight, product of:
                2.2575874 = boost
                5.250997 = idf(docFreq=632, maxDocs=44421)
                0.020259555 = queryNorm
              0.49228096 = fieldWeight in 2740, product of:
                1.0 = tf(freq=1.0), with freq of:
                  1.0 = termFreq=1.0
                5.250997 = idf(docFreq=632, maxDocs=44421)
                0.09375 = fieldNorm(doc=2740)
        0.2 = coord(5/25)
    
  5. Witschel, H.F.: Terminologie-Extraktion : Möglichkeiten der Kombination statistischer und musterbasierter Verfahren (2004) 0.09
    0.09371233 = sum of:
      0.09371233 = product of:
        0.39046806 = sum of:
          0.026696073 = weight(abstract_txt:eine in 1123) [ClassicSimilarity], result of:
            0.026696073 = score(doc=1123,freq=3.0), product of:
              0.07068355 = queryWeight, product of:
                3.4888992 = idf(docFreq=3686, maxDocs=44421)
                0.020259555 = queryNorm
              0.3776844 = fieldWeight in 1123, product of:
                1.7320508 = tf(freq=3.0), with freq of:
                  3.0 = termFreq=3.0
                3.4888992 = idf(docFreq=3686, maxDocs=44421)
                0.0625 = fieldNorm(doc=1123)
          0.03502738 = weight(abstract_txt:werden in 1123) [ClassicSimilarity], result of:
            0.03502738 = score(doc=1123,freq=5.0), product of:
              0.0714511 = queryWeight, product of:
                1.0054148 = boost
                3.507791 = idf(docFreq=3617, maxDocs=44421)
                0.020259555 = queryNorm
              0.4902287 = fieldWeight in 1123, product of:
                2.236068 = tf(freq=5.0), with freq of:
                  5.0 = termFreq=5.0
                3.507791 = idf(docFreq=3617, maxDocs=44421)
                0.0625 = fieldNorm(doc=1123)
          0.08910871 = weight(abstract_txt:gegenstand in 1123) [ClassicSimilarity], result of:
            0.08910871 = score(doc=1123,freq=2.0), product of:
              0.14343461 = queryWeight, product of:
                1.0072861 = boost
                7.028639 = idf(docFreq=106, maxDocs=44421)
                0.020259555 = queryNorm
              0.62124974 = fieldWeight in 1123, product of:
                1.4142135 = tf(freq=2.0), with freq of:
                  2.0 = termFreq=2.0
                7.028639 = idf(docFreq=106, maxDocs=44421)
                0.0625 = fieldNorm(doc=1123)
          0.067466535 = weight(abstract_txt:entsprechende in 1123) [ClassicSimilarity], result of:
            0.067466535 = score(doc=1123,freq=1.0), product of:
              0.15012145 = queryWeight, product of:
                1.0304981 = boost
                7.190608 = idf(docFreq=90, maxDocs=44421)
                0.020259555 = queryNorm
              0.449413 = fieldWeight in 1123, product of:
                1.0 = tf(freq=1.0), with freq of:
                  1.0 = termFreq=1.0
                7.190608 = idf(docFreq=90, maxDocs=44421)
                0.0625 = fieldNorm(doc=1123)
          0.093349084 = weight(abstract_txt:statistischen in 1123) [ClassicSimilarity], result of:
            0.093349084 = score(doc=1123,freq=1.0), product of:
              0.18640485 = queryWeight, product of:
                1.1482975 = boost
                8.0125885 = idf(docFreq=39, maxDocs=44421)
                0.020259555 = queryNorm
              0.5007868 = fieldWeight in 1123, product of:
                1.0 = tf(freq=1.0), with freq of:
                  1.0 = termFreq=1.0
                8.0125885 = idf(docFreq=39, maxDocs=44421)
                0.0625 = fieldNorm(doc=1123)
          0.078820296 = weight(abstract_txt:daten in 1123) [ClassicSimilarity], result of:
            0.078820296 = score(doc=1123,freq=1.0), product of:
              0.24016862 = queryWeight, product of:
                2.2575874 = boost
                5.250997 = idf(docFreq=632, maxDocs=44421)
                0.020259555 = queryNorm
              0.32818732 = fieldWeight in 1123, product of:
                1.0 = tf(freq=1.0), with freq of:
                  1.0 = termFreq=1.0
                5.250997 = idf(docFreq=632, maxDocs=44421)
                0.0625 = fieldNorm(doc=1123)
        0.24 = coord(6/25)