Document (#17102)

Author
Ihm, P.
Title
Numerische Taxonomie und Datenbanken
Source
Numerische und nicht-numerische Klassifikation zwischen Theorie und Praxis. Proc. der 5. Fachtagung der Gesellschaft für Klassifikation, Hofgeismar, 7.-10.4.1981. Hrsg.: Peter Ihm u.a.
Imprint
Frankfurt : Indeks
Year
1982
Pages
S.16-21
Series
Studien zur Klassifikation; Bd.10
Abstract
Eine Datenbank besteht aus Datenbasis und Datenbank-Managementsystem. Sie ist Hilfsmittel zur Speicherung und Bereitstellung von Daten, die häufig Gegenstand einer statistischen (explorativen) Datenanalyse sind. Ein häufig angewandtes Verfahren ist die Clusteranalyse. In den für Datenbanken typischen Fällen haben Daten eine komplexe Struktur, es fragt sich, ob die Clusteranalysealgorithmen statt auf dem Umweg über rechteckige Dateien direkt auf die anders strukturierten Daten angewendet werden können. Entsprechende Methodologien für die verschiedenen Anwendungsfälle werden diskutiert.

Similar documents (content)

  1. Renker, L.: Exploration von Textkorpora : Topic Models als Grundlage der Interaktion (2015) 0.11
    0.111588575 = sum of:
      0.111588575 = product of:
        0.55794287 = sum of:
          0.031304825 = weight(abstract_txt:werden in 2380) [ClassicSimilarity], result of:
            0.031304825 = score(doc=2380,freq=4.0), product of:
              0.07142623 = queryWeight, product of:
                1.0048845 = boost
                3.5062556 = idf(docFreq=3606, maxDocs=44218)
                0.020272065 = queryNorm
              0.43828195 = fieldWeight in 2380, product of:
                2.0 = tf(freq=4.0), with freq of:
                  4.0 = termFreq=4.0
                3.5062556 = idf(docFreq=3606, maxDocs=44218)
                0.0625 = fieldNorm(doc=2380)
          0.06768449 = weight(abstract_txt:entsprechende in 2380) [ClassicSimilarity], result of:
            0.06768449 = score(doc=2380,freq=1.0), product of:
              0.15047105 = queryWeight, product of:
                1.0313326 = boost
                7.1970778 = idf(docFreq=89, maxDocs=44218)
                0.020272065 = queryNorm
              0.44981736 = fieldWeight in 2380, product of:
                1.0 = tf(freq=1.0), with freq of:
                  1.0 = termFreq=1.0
                7.1970778 = idf(docFreq=89, maxDocs=44218)
                0.0625 = fieldNorm(doc=2380)
          0.07070079 = weight(abstract_txt:fällen in 2380) [ClassicSimilarity], result of:
            0.07070079 = score(doc=2380,freq=1.0), product of:
              0.15490888 = queryWeight, product of:
                1.0464306 = boost
                7.3024383 = idf(docFreq=80, maxDocs=44218)
                0.020272065 = queryNorm
              0.4564024 = fieldWeight in 2380, product of:
                1.0 = tf(freq=1.0), with freq of:
                  1.0 = termFreq=1.0
                7.3024383 = idf(docFreq=80, maxDocs=44218)
                0.0625 = fieldNorm(doc=2380)
          0.30916792 = weight(abstract_txt:explorativen in 2380) [ClassicSimilarity], result of:
            0.30916792 = score(doc=2380,freq=5.0), product of:
              0.24225149 = queryWeight, product of:
                1.3085958 = boost
                9.131938 = idf(docFreq=12, maxDocs=44218)
                0.020272065 = queryNorm
              1.2762271 = fieldWeight in 2380, product of:
                2.236068 = tf(freq=5.0), with freq of:
                  5.0 = termFreq=5.0
                9.131938 = idf(docFreq=12, maxDocs=44218)
                0.0625 = fieldNorm(doc=2380)
          0.07908484 = weight(abstract_txt:daten in 2380) [ClassicSimilarity], result of:
            0.07908484 = score(doc=2380,freq=1.0), product of:
              0.24074803 = queryWeight, product of:
                2.25951 = boost
                5.255941 = idf(docFreq=626, maxDocs=44218)
                0.020272065 = queryNorm
              0.3284963 = fieldWeight in 2380, product of:
                1.0 = tf(freq=1.0), with freq of:
                  1.0 = termFreq=1.0
                5.255941 = idf(docFreq=626, maxDocs=44218)
                0.0625 = fieldNorm(doc=2380)
        0.2 = coord(5/25)
    
  2. Bock, H.-H.: Datenanalyse zur Strukturierung und Ordnung von Information (1989) 0.11
    0.106832 = sum of:
      0.106832 = product of:
        0.6677 = sum of:
          0.02347862 = weight(abstract_txt:werden in 141) [ClassicSimilarity], result of:
            0.02347862 = score(doc=141,freq=1.0), product of:
              0.07142623 = queryWeight, product of:
                1.0048845 = boost
                3.5062556 = idf(docFreq=3606, maxDocs=44218)
                0.020272065 = queryNorm
              0.32871145 = fieldWeight in 141, product of:
                1.0 = tf(freq=1.0), with freq of:
                  1.0 = termFreq=1.0
                3.5062556 = idf(docFreq=3606, maxDocs=44218)
                0.09375 = fieldNorm(doc=141)
          0.14545053 = weight(abstract_txt:angewendet in 141) [ClassicSimilarity], result of:
            0.14545053 = score(doc=141,freq=1.0), product of:
              0.19122422 = queryWeight, product of:
                1.1626359 = boost
                8.113368 = idf(docFreq=35, maxDocs=44218)
                0.020272065 = queryNorm
              0.7606282 = fieldWeight in 141, product of:
                1.0 = tf(freq=1.0), with freq of:
                  1.0 = termFreq=1.0
                8.113368 = idf(docFreq=35, maxDocs=44218)
                0.09375 = fieldNorm(doc=141)
          0.29330242 = weight(abstract_txt:datenanalyse in 141) [ClassicSimilarity], result of:
            0.29330242 = score(doc=141,freq=2.0), product of:
              0.24225149 = queryWeight, product of:
                1.3085958 = boost
                9.131938 = idf(docFreq=12, maxDocs=44218)
                0.020272065 = queryNorm
              1.2107353 = fieldWeight in 141, product of:
                1.4142135 = tf(freq=2.0), with freq of:
                  2.0 = termFreq=2.0
                9.131938 = idf(docFreq=12, maxDocs=44218)
                0.09375 = fieldNorm(doc=141)
          0.20546843 = weight(abstract_txt:daten in 141) [ClassicSimilarity], result of:
            0.20546843 = score(doc=141,freq=3.0), product of:
              0.24074803 = queryWeight, product of:
                2.25951 = boost
                5.255941 = idf(docFreq=626, maxDocs=44218)
                0.020272065 = queryNorm
              0.8534584 = fieldWeight in 141, product of:
                1.7320508 = tf(freq=3.0), with freq of:
                  3.0 = termFreq=3.0
                5.255941 = idf(docFreq=626, maxDocs=44218)
                0.09375 = fieldNorm(doc=141)
        0.16 = coord(4/25)
    
  3. Kind, J.: Praxis des Information Retrieval (2004) 0.10
    0.097046934 = sum of:
      0.097046934 = product of:
        0.48523465 = sum of:
          0.0333967 = weight(abstract_txt:eine in 2934) [ClassicSimilarity], result of:
            0.0333967 = score(doc=2934,freq=3.0), product of:
              0.07073355 = queryWeight, product of:
                3.4892128 = idf(docFreq=3668, maxDocs=44218)
                0.020272065 = queryNorm
              0.47214794 = fieldWeight in 2934, product of:
                1.7320508 = tf(freq=3.0), with freq of:
                  3.0 = termFreq=3.0
                3.4892128 = idf(docFreq=3668, maxDocs=44218)
                0.078125 = fieldNorm(doc=2934)
          0.027669821 = weight(abstract_txt:werden in 2934) [ClassicSimilarity], result of:
            0.027669821 = score(doc=2934,freq=2.0), product of:
              0.07142623 = queryWeight, product of:
                1.0048845 = boost
                3.5062556 = idf(docFreq=3606, maxDocs=44218)
                0.020272065 = queryNorm
              0.3873902 = fieldWeight in 2934, product of:
                1.4142135 = tf(freq=2.0), with freq of:
                  2.0 = termFreq=2.0
                3.5062556 = idf(docFreq=3606, maxDocs=44218)
                0.078125 = fieldNorm(doc=2934)
          0.11965039 = weight(abstract_txt:entsprechende in 2934) [ClassicSimilarity], result of:
            0.11965039 = score(doc=2934,freq=2.0), product of:
              0.15047105 = queryWeight, product of:
                1.0313326 = boost
                7.1970778 = idf(docFreq=89, maxDocs=44218)
                0.020272065 = queryNorm
              0.7951722 = fieldWeight in 2934, product of:
                1.4142135 = tf(freq=2.0), with freq of:
                  2.0 = termFreq=2.0
                7.1970778 = idf(docFreq=89, maxDocs=44218)
                0.078125 = fieldNorm(doc=2934)
          0.1079097 = weight(abstract_txt:strukturierten in 2934) [ClassicSimilarity], result of:
            0.1079097 = score(doc=2934,freq=1.0), product of:
              0.17696762 = queryWeight, product of:
                1.1184567 = boost
                7.805067 = idf(docFreq=48, maxDocs=44218)
                0.020272065 = queryNorm
              0.6097709 = fieldWeight in 2934, product of:
                1.0 = tf(freq=1.0), with freq of:
                  1.0 = termFreq=1.0
                7.805067 = idf(docFreq=48, maxDocs=44218)
                0.078125 = fieldNorm(doc=2934)
          0.19660804 = weight(abstract_txt:datenbanken in 2934) [ClassicSimilarity], result of:
            0.19660804 = score(doc=2934,freq=5.0), product of:
              0.19450958 = queryWeight, product of:
                1.6582797 = boost
                5.7860904 = idf(docFreq=368, maxDocs=44218)
                0.020272065 = queryNorm
              1.0107884 = fieldWeight in 2934, product of:
                2.236068 = tf(freq=5.0), with freq of:
                  5.0 = termFreq=5.0
                5.7860904 = idf(docFreq=368, maxDocs=44218)
                0.078125 = fieldNorm(doc=2934)
        0.2 = coord(5/25)
    
  4. Jackermeier, R.: Code I've Seen : Verhalten von Programmierern beim Wiederfinden von Code-Stellen (2015) 0.10
    0.09524443 = sum of:
      0.09524443 = product of:
        0.47622216 = sum of:
          0.023137912 = weight(abstract_txt:eine in 1740) [ClassicSimilarity], result of:
            0.023137912 = score(doc=1740,freq=1.0), product of:
              0.07073355 = queryWeight, product of:
                3.4892128 = idf(docFreq=3668, maxDocs=44218)
                0.020272065 = queryNorm
              0.3271137 = fieldWeight in 1740, product of:
                1.0 = tf(freq=1.0), with freq of:
                  1.0 = termFreq=1.0
                3.4892128 = idf(docFreq=3668, maxDocs=44218)
                0.09375 = fieldNorm(doc=1740)
          0.040666163 = weight(abstract_txt:werden in 1740) [ClassicSimilarity], result of:
            0.040666163 = score(doc=1740,freq=3.0), product of:
              0.07142623 = queryWeight, product of:
                1.0048845 = boost
                3.5062556 = idf(docFreq=3606, maxDocs=44218)
                0.020272065 = queryNorm
              0.56934494 = fieldWeight in 1740, product of:
                1.7320508 = tf(freq=3.0), with freq of:
                  3.0 = termFreq=3.0
                3.5062556 = idf(docFreq=3606, maxDocs=44218)
                0.09375 = fieldNorm(doc=1740)
          0.14545053 = weight(abstract_txt:angewendet in 1740) [ClassicSimilarity], result of:
            0.14545053 = score(doc=1740,freq=1.0), product of:
              0.19122422 = queryWeight, product of:
                1.1626359 = boost
                8.113368 = idf(docFreq=35, maxDocs=44218)
                0.020272065 = queryNorm
              0.7606282 = fieldWeight in 1740, product of:
                1.0 = tf(freq=1.0), with freq of:
                  1.0 = termFreq=1.0
                8.113368 = idf(docFreq=35, maxDocs=44218)
                0.09375 = fieldNorm(doc=1740)
          0.14834028 = weight(abstract_txt:häufig in 1740) [ClassicSimilarity], result of:
            0.14834028 = score(doc=1740,freq=1.0), product of:
              0.24410802 = queryWeight, product of:
                1.8577117 = boost
                6.481951 = idf(docFreq=183, maxDocs=44218)
                0.020272065 = queryNorm
              0.60768294 = fieldWeight in 1740, product of:
                1.0 = tf(freq=1.0), with freq of:
                  1.0 = termFreq=1.0
                6.481951 = idf(docFreq=183, maxDocs=44218)
                0.09375 = fieldNorm(doc=1740)
          0.11862726 = weight(abstract_txt:daten in 1740) [ClassicSimilarity], result of:
            0.11862726 = score(doc=1740,freq=1.0), product of:
              0.24074803 = queryWeight, product of:
                2.25951 = boost
                5.255941 = idf(docFreq=626, maxDocs=44218)
                0.020272065 = queryNorm
              0.49274445 = fieldWeight in 1740, product of:
                1.0 = tf(freq=1.0), with freq of:
                  1.0 = termFreq=1.0
                5.255941 = idf(docFreq=626, maxDocs=44218)
                0.09375 = fieldNorm(doc=1740)
        0.2 = coord(5/25)
    
  5. Witschel, H.F.: Terminologie-Extraktion : Möglichkeiten der Kombination statistischer und musterbasierter Verfahren (2004) 0.09
    0.09376952 = sum of:
      0.09376952 = product of:
        0.39070633 = sum of:
          0.02671736 = weight(abstract_txt:eine in 123) [ClassicSimilarity], result of:
            0.02671736 = score(doc=123,freq=3.0), product of:
              0.07073355 = queryWeight, product of:
                3.4892128 = idf(docFreq=3668, maxDocs=44218)
                0.020272065 = queryNorm
              0.37771836 = fieldWeight in 123, product of:
                1.7320508 = tf(freq=3.0), with freq of:
                  3.0 = termFreq=3.0
                3.4892128 = idf(docFreq=3668, maxDocs=44218)
                0.0625 = fieldNorm(doc=123)
          0.034999862 = weight(abstract_txt:werden in 123) [ClassicSimilarity], result of:
            0.034999862 = score(doc=123,freq=5.0), product of:
              0.07142623 = queryWeight, product of:
                1.0048845 = boost
                3.5062556 = idf(docFreq=3606, maxDocs=44218)
                0.020272065 = queryNorm
              0.49001414 = fieldWeight in 123, product of:
                2.236068 = tf(freq=5.0), with freq of:
                  5.0 = termFreq=5.0
                3.5062556 = idf(docFreq=3606, maxDocs=44218)
                0.0625 = fieldNorm(doc=123)
          0.08898153 = weight(abstract_txt:gegenstand in 123) [ClassicSimilarity], result of:
            0.08898153 = score(doc=123,freq=2.0), product of:
              0.14332329 = queryWeight, product of:
                1.0065391 = boost
                7.0240583 = idf(docFreq=106, maxDocs=44218)
                0.020272065 = queryNorm
              0.6208449 = fieldWeight in 123, product of:
                1.4142135 = tf(freq=2.0), with freq of:
                  2.0 = termFreq=2.0
                7.0240583 = idf(docFreq=106, maxDocs=44218)
                0.0625 = fieldNorm(doc=123)
          0.06768449 = weight(abstract_txt:entsprechende in 123) [ClassicSimilarity], result of:
            0.06768449 = score(doc=123,freq=1.0), product of:
              0.15047105 = queryWeight, product of:
                1.0313326 = boost
                7.1970778 = idf(docFreq=89, maxDocs=44218)
                0.020272065 = queryNorm
              0.44981736 = fieldWeight in 123, product of:
                1.0 = tf(freq=1.0), with freq of:
                  1.0 = termFreq=1.0
                7.1970778 = idf(docFreq=89, maxDocs=44218)
                0.0625 = fieldNorm(doc=123)
          0.093238235 = weight(abstract_txt:statistischen in 123) [ClassicSimilarity], result of:
            0.093238235 = score(doc=123,freq=1.0), product of:
              0.18629 = queryWeight, product of:
                1.147538 = boost
                8.008008 = idf(docFreq=39, maxDocs=44218)
                0.020272065 = queryNorm
              0.5005005 = fieldWeight in 123, product of:
                1.0 = tf(freq=1.0), with freq of:
                  1.0 = termFreq=1.0
                8.008008 = idf(docFreq=39, maxDocs=44218)
                0.0625 = fieldNorm(doc=123)
          0.07908484 = weight(abstract_txt:daten in 123) [ClassicSimilarity], result of:
            0.07908484 = score(doc=123,freq=1.0), product of:
              0.24074803 = queryWeight, product of:
                2.25951 = boost
                5.255941 = idf(docFreq=626, maxDocs=44218)
                0.020272065 = queryNorm
              0.3284963 = fieldWeight in 123, product of:
                1.0 = tf(freq=1.0), with freq of:
                  1.0 = termFreq=1.0
                5.255941 = idf(docFreq=626, maxDocs=44218)
                0.0625 = fieldNorm(doc=123)
        0.24 = coord(6/25)