Document (#37810)

Author
Biselli, A.
Title
Unter Generalverdacht durch Algorithmen
Source
http://www.golem.de/news/textanalyse-unter-generalverdacht-durch-algorithmen-1402-104637.html
Year
2014
Abstract
Geheimdienste wie die NSA scannen täglich unzählige Texte. Die Gefahr, dass Personen fälschlicherweise verdächtigt werden, sei groß, schreibt Informatikerin Anna Biselli. Denn Algorithmen arbeiteten nicht fehlerfrei.
Theme
Computerlinguistik

Similar documents (content)

  1. Ulfkotte, U.: "Nackte Ehefrau" schaltet ab : Neues Computervirus löscht die Festplatte (2001) 0.16
    0.1584931 = sum of:
      0.1584931 = product of:
        0.35660946 = sum of:
          0.011230344 = weight(abstract_txt:werden in 6644) [ClassicSimilarity], result of:
            0.011230344 = score(doc=6644,freq=5.0), product of:
              0.045816753 = queryWeight, product of:
                3.507791 = idf(docFreq=3617, maxDocs=44421)
                0.013061426 = queryNorm
              0.24511436 = fieldWeight in 6644, product of:
                2.236068 = tf(freq=5.0), with freq of:
                  5.0 = termFreq=5.0
                3.507791 = idf(docFreq=3617, maxDocs=44421)
                0.03125 = fieldNorm(doc=6644)
          0.01748028 = weight(abstract_txt:nicht in 6644) [ClassicSimilarity], result of:
            0.01748028 = score(doc=6644,freq=6.0), product of:
              0.057907406 = queryWeight, product of:
                1.1242293 = boost
                3.9435613 = idf(docFreq=2339, maxDocs=44421)
                0.013061426 = queryNorm
              0.30186605 = fieldWeight in 6644, product of:
                2.4494898 = tf(freq=6.0), with freq of:
                  6.0 = termFreq=6.0
                3.9435613 = idf(docFreq=2339, maxDocs=44421)
                0.03125 = fieldNorm(doc=6644)
          0.008908381 = weight(abstract_txt:durch in 6644) [ClassicSimilarity], result of:
            0.008908381 = score(doc=6644,freq=1.0), product of:
              0.06713538 = queryWeight, product of:
                1.2104965 = boost
                4.246169 = idf(docFreq=1728, maxDocs=44421)
                0.013061426 = queryNorm
              0.13269278 = fieldWeight in 6644, product of:
                1.0 = tf(freq=1.0), with freq of:
                  1.0 = termFreq=1.0
                4.246169 = idf(docFreq=1728, maxDocs=44421)
                0.03125 = fieldNorm(doc=6644)
          0.0127542615 = weight(abstract_txt:unter in 6644) [ClassicSimilarity], result of:
            0.0127542615 = score(doc=6644,freq=1.0), product of:
              0.08528169 = queryWeight, product of:
                1.3643185 = boost
                4.785744 = idf(docFreq=1007, maxDocs=44421)
                0.013061426 = queryNorm
              0.1495545 = fieldWeight in 6644, product of:
                1.0 = tf(freq=1.0), with freq of:
                  1.0 = termFreq=1.0
                4.785744 = idf(docFreq=1007, maxDocs=44421)
                0.03125 = fieldNorm(doc=6644)
          0.051223375 = weight(abstract_txt:täglich in 6644) [ClassicSimilarity], result of:
            0.051223375 = score(doc=6644,freq=1.0), product of:
              0.21547543 = queryWeight, product of:
                2.1686363 = boost
                7.607123 = idf(docFreq=59, maxDocs=44421)
                0.013061426 = queryNorm
              0.23772259 = fieldWeight in 6644, product of:
                1.0 = tf(freq=1.0), with freq of:
                  1.0 = termFreq=1.0
                7.607123 = idf(docFreq=59, maxDocs=44421)
                0.03125 = fieldNorm(doc=6644)
          0.05338136 = weight(abstract_txt:gefahr in 6644) [ClassicSimilarity], result of:
            0.05338136 = score(doc=6644,freq=1.0), product of:
              0.22148554 = queryWeight, product of:
                2.1986725 = boost
                7.7124834 = idf(docFreq=53, maxDocs=44421)
                0.013061426 = queryNorm
              0.2410151 = fieldWeight in 6644, product of:
                1.0 = tf(freq=1.0), with freq of:
                  1.0 = termFreq=1.0
                7.7124834 = idf(docFreq=53, maxDocs=44421)
                0.03125 = fieldNorm(doc=6644)
          0.06500003 = weight(abstract_txt:schreibt in 6644) [ClassicSimilarity], result of:
            0.06500003 = score(doc=6644,freq=1.0), product of:
              0.2525581 = queryWeight, product of:
                2.34784 = boost
                8.235732 = idf(docFreq=31, maxDocs=44421)
                0.013061426 = queryNorm
              0.25736663 = fieldWeight in 6644, product of:
                1.0 = tf(freq=1.0), with freq of:
                  1.0 = termFreq=1.0
                8.235732 = idf(docFreq=31, maxDocs=44421)
                0.03125 = fieldNorm(doc=6644)
          0.13663141 = weight(abstract_txt:anna in 6644) [ClassicSimilarity], result of:
            0.13663141 = score(doc=6644,freq=2.0), product of:
              0.32893443 = queryWeight, product of:
                2.6794307 = boost
                9.398883 = idf(docFreq=9, maxDocs=44421)
                0.013061426 = queryNorm
              0.41537586 = fieldWeight in 6644, product of:
                1.4142135 = tf(freq=2.0), with freq of:
                  2.0 = termFreq=2.0
                9.398883 = idf(docFreq=9, maxDocs=44421)
                0.03125 = fieldNorm(doc=6644)
        0.44444445 = coord(8/18)
    
  2. Weber-Wulff, D.: Im Anfang war das Wort ... und das Chaos : Wikipedia das unbekannte Wesen (2009) 0.16
    0.15592411 = sum of:
      0.15592411 = product of:
        0.7016585 = sum of:
          0.02008945 = weight(abstract_txt:werden in 62) [ClassicSimilarity], result of:
            0.02008945 = score(doc=62,freq=1.0), product of:
              0.045816753 = queryWeight, product of:
                3.507791 = idf(docFreq=3617, maxDocs=44421)
                0.013061426 = queryNorm
              0.43847388 = fieldWeight in 62, product of:
                1.0 = tf(freq=1.0), with freq of:
                  1.0 = termFreq=1.0
                3.507791 = idf(docFreq=3617, maxDocs=44421)
                0.125 = fieldNorm(doc=62)
          0.2048935 = weight(abstract_txt:täglich in 62) [ClassicSimilarity], result of:
            0.2048935 = score(doc=62,freq=1.0), product of:
              0.21547543 = queryWeight, product of:
                2.1686363 = boost
                7.607123 = idf(docFreq=59, maxDocs=44421)
                0.013061426 = queryNorm
              0.95089036 = fieldWeight in 62, product of:
                1.0 = tf(freq=1.0), with freq of:
                  1.0 = termFreq=1.0
                7.607123 = idf(docFreq=59, maxDocs=44421)
                0.125 = fieldNorm(doc=62)
          0.21667542 = weight(abstract_txt:groß in 62) [ClassicSimilarity], result of:
            0.21667542 = score(doc=62,freq=1.0), product of:
              0.22365847 = queryWeight, product of:
                2.2094314 = boost
                7.750224 = idf(docFreq=51, maxDocs=44421)
                0.013061426 = queryNorm
              0.968778 = fieldWeight in 62, product of:
                1.0 = tf(freq=1.0), with freq of:
                  1.0 = termFreq=1.0
                7.750224 = idf(docFreq=51, maxDocs=44421)
                0.125 = fieldNorm(doc=62)
          0.2600001 = weight(abstract_txt:schreibt in 62) [ClassicSimilarity], result of:
            0.2600001 = score(doc=62,freq=1.0), product of:
              0.2525581 = queryWeight, product of:
                2.34784 = boost
                8.235732 = idf(docFreq=31, maxDocs=44421)
                0.013061426 = queryNorm
              1.0294665 = fieldWeight in 62, product of:
                1.0 = tf(freq=1.0), with freq of:
                  1.0 = termFreq=1.0
                8.235732 = idf(docFreq=31, maxDocs=44421)
                0.125 = fieldNorm(doc=62)
        0.22222222 = coord(4/18)
    
  3. Arns, C.: Fallstricke Online : Über die eigenen Worte gestolpert (2005) 0.15
    0.15185276 = sum of:
      0.15185276 = product of:
        0.3904785 = sum of:
          0.017397974 = weight(abstract_txt:werden in 4502) [ClassicSimilarity], result of:
            0.017397974 = score(doc=4502,freq=3.0), product of:
              0.045816753 = queryWeight, product of:
                3.507791 = idf(docFreq=3617, maxDocs=44421)
                0.013061426 = queryNorm
              0.3797295 = fieldWeight in 4502, product of:
                1.7320508 = tf(freq=3.0), with freq of:
                  3.0 = termFreq=3.0
                3.507791 = idf(docFreq=3617, maxDocs=44421)
                0.0625 = fieldNorm(doc=4502)
          0.020184487 = weight(abstract_txt:nicht in 4502) [ClassicSimilarity], result of:
            0.020184487 = score(doc=4502,freq=2.0), product of:
              0.057907406 = queryWeight, product of:
                1.1242293 = boost
                3.9435613 = idf(docFreq=2339, maxDocs=44421)
                0.013061426 = queryNorm
              0.34856486 = fieldWeight in 4502, product of:
                1.4142135 = tf(freq=2.0), with freq of:
                  2.0 = termFreq=2.0
                3.9435613 = idf(docFreq=2339, maxDocs=44421)
                0.0625 = fieldNorm(doc=4502)
          0.021478167 = weight(abstract_txt:dass in 4502) [ClassicSimilarity], result of:
            0.021478167 = score(doc=4502,freq=1.0), product of:
              0.07604379 = queryWeight, product of:
                1.288308 = boost
                4.5191154 = idf(docFreq=1315, maxDocs=44421)
                0.013061426 = queryNorm
              0.28244472 = fieldWeight in 4502, product of:
                1.0 = tf(freq=1.0), with freq of:
                  1.0 = termFreq=1.0
                4.5191154 = idf(docFreq=1315, maxDocs=44421)
                0.0625 = fieldNorm(doc=4502)
          0.025508523 = weight(abstract_txt:unter in 4502) [ClassicSimilarity], result of:
            0.025508523 = score(doc=4502,freq=1.0), product of:
              0.08528169 = queryWeight, product of:
                1.3643185 = boost
                4.785744 = idf(docFreq=1007, maxDocs=44421)
                0.013061426 = queryNorm
              0.299109 = fieldWeight in 4502, product of:
                1.0 = tf(freq=1.0), with freq of:
                  1.0 = termFreq=1.0
                4.785744 = idf(docFreq=1007, maxDocs=44421)
                0.0625 = fieldNorm(doc=4502)
          0.067571595 = weight(abstract_txt:denn in 4502) [ClassicSimilarity], result of:
            0.067571595 = score(doc=4502,freq=2.0), product of:
              0.12958808 = queryWeight, product of:
                1.6817846 = boost
                5.899349 = idf(docFreq=330, maxDocs=44421)
                0.013061426 = queryNorm
              0.5214337 = fieldWeight in 4502, product of:
                1.4142135 = tf(freq=2.0), with freq of:
                  2.0 = termFreq=2.0
                5.899349 = idf(docFreq=330, maxDocs=44421)
                0.0625 = fieldNorm(doc=4502)
          0.10833771 = weight(abstract_txt:groß in 4502) [ClassicSimilarity], result of:
            0.10833771 = score(doc=4502,freq=1.0), product of:
              0.22365847 = queryWeight, product of:
                2.2094314 = boost
                7.750224 = idf(docFreq=51, maxDocs=44421)
                0.013061426 = queryNorm
              0.484389 = fieldWeight in 4502, product of:
                1.0 = tf(freq=1.0), with freq of:
                  1.0 = termFreq=1.0
                7.750224 = idf(docFreq=51, maxDocs=44421)
                0.0625 = fieldNorm(doc=4502)
          0.13000005 = weight(abstract_txt:schreibt in 4502) [ClassicSimilarity], result of:
            0.13000005 = score(doc=4502,freq=1.0), product of:
              0.2525581 = queryWeight, product of:
                2.34784 = boost
                8.235732 = idf(docFreq=31, maxDocs=44421)
                0.013061426 = queryNorm
              0.51473325 = fieldWeight in 4502, product of:
                1.0 = tf(freq=1.0), with freq of:
                  1.0 = termFreq=1.0
                8.235732 = idf(docFreq=31, maxDocs=44421)
                0.0625 = fieldNorm(doc=4502)
        0.3888889 = coord(7/18)
    
  4. Dahmen, E.: Klassifikation als Ordnungssystem im elektronischen Pressearchiv (2003) 0.14
    0.1374215 = sum of:
      0.1374215 = product of:
        0.3533696 = sum of:
          0.015067087 = weight(abstract_txt:werden in 2513) [ClassicSimilarity], result of:
            0.015067087 = score(doc=2513,freq=4.0), product of:
              0.045816753 = queryWeight, product of:
                3.507791 = idf(docFreq=3617, maxDocs=44421)
                0.013061426 = queryNorm
              0.3288554 = fieldWeight in 2513, product of:
                2.0 = tf(freq=4.0), with freq of:
                  4.0 = termFreq=4.0
                3.507791 = idf(docFreq=3617, maxDocs=44421)
                0.046875 = fieldNorm(doc=2513)
          0.015138365 = weight(abstract_txt:nicht in 2513) [ClassicSimilarity], result of:
            0.015138365 = score(doc=2513,freq=2.0), product of:
              0.057907406 = queryWeight, product of:
                1.1242293 = boost
                3.9435613 = idf(docFreq=2339, maxDocs=44421)
                0.013061426 = queryNorm
              0.26142365 = fieldWeight in 2513, product of:
                1.4142135 = tf(freq=2.0), with freq of:
                  2.0 = termFreq=2.0
                3.9435613 = idf(docFreq=2339, maxDocs=44421)
                0.046875 = fieldNorm(doc=2513)
          0.013362571 = weight(abstract_txt:durch in 2513) [ClassicSimilarity], result of:
            0.013362571 = score(doc=2513,freq=1.0), product of:
              0.06713538 = queryWeight, product of:
                1.2104965 = boost
                4.246169 = idf(docFreq=1728, maxDocs=44421)
                0.013061426 = queryNorm
              0.19903918 = fieldWeight in 2513, product of:
                1.0 = tf(freq=1.0), with freq of:
                  1.0 = termFreq=1.0
                4.246169 = idf(docFreq=1728, maxDocs=44421)
                0.046875 = fieldNorm(doc=2513)
          0.03583525 = weight(abstract_txt:denn in 2513) [ClassicSimilarity], result of:
            0.03583525 = score(doc=2513,freq=1.0), product of:
              0.12958808 = queryWeight, product of:
                1.6817846 = boost
                5.899349 = idf(docFreq=330, maxDocs=44421)
                0.013061426 = queryNorm
              0.276532 = fieldWeight in 2513, product of:
                1.0 = tf(freq=1.0), with freq of:
                  1.0 = termFreq=1.0
                5.899349 = idf(docFreq=330, maxDocs=44421)
                0.046875 = fieldNorm(doc=2513)
          0.05443433 = weight(abstract_txt:texte in 2513) [ClassicSimilarity], result of:
            0.05443433 = score(doc=2513,freq=1.0), product of:
              0.17124058 = queryWeight, product of:
                1.9332641 = boost
                6.7814865 = idf(docFreq=136, maxDocs=44421)
                0.013061426 = queryNorm
              0.31788218 = fieldWeight in 2513, product of:
                1.0 = tf(freq=1.0), with freq of:
                  1.0 = termFreq=1.0
                6.7814865 = idf(docFreq=136, maxDocs=44421)
                0.046875 = fieldNorm(doc=2513)
          0.05748002 = weight(abstract_txt:personen in 2513) [ClassicSimilarity], result of:
            0.05748002 = score(doc=2513,freq=1.0), product of:
              0.17756991 = queryWeight, product of:
                1.9686682 = boost
                6.905677 = idf(docFreq=120, maxDocs=44421)
                0.013061426 = queryNorm
              0.3237036 = fieldWeight in 2513, product of:
                1.0 = tf(freq=1.0), with freq of:
                  1.0 = termFreq=1.0
                6.905677 = idf(docFreq=120, maxDocs=44421)
                0.046875 = fieldNorm(doc=2513)
          0.16205198 = weight(abstract_txt:arbeiteten in 2513) [ClassicSimilarity], result of:
            0.16205198 = score(doc=2513,freq=1.0), product of:
              0.3543733 = queryWeight, product of:
                2.7811112 = boost
                9.755557 = idf(docFreq=6, maxDocs=44421)
                0.013061426 = queryNorm
              0.45729172 = fieldWeight in 2513, product of:
                1.0 = tf(freq=1.0), with freq of:
                  1.0 = termFreq=1.0
                9.755557 = idf(docFreq=6, maxDocs=44421)
                0.046875 = fieldNorm(doc=2513)
        0.3888889 = coord(7/18)
    
  5. Halip, I.: Automatische Extrahierung von Schlagworten aus unstrukturierten Texten (2005) 0.13
    0.13105352 = sum of:
      0.13105352 = product of:
        0.33699477 = sum of:
          0.021528894 = weight(abstract_txt:werden in 986) [ClassicSimilarity], result of:
            0.021528894 = score(doc=986,freq=6.0), product of:
              0.045816753 = queryWeight, product of:
                3.507791 = idf(docFreq=3617, maxDocs=44421)
                0.013061426 = queryNorm
              0.4698913 = fieldWeight in 986, product of:
                2.4494898 = tf(freq=6.0), with freq of:
                  6.0 = termFreq=6.0
                3.507791 = idf(docFreq=3617, maxDocs=44421)
                0.0546875 = fieldNorm(doc=986)
          0.021630742 = weight(abstract_txt:nicht in 986) [ClassicSimilarity], result of:
            0.021630742 = score(doc=986,freq=3.0), product of:
              0.057907406 = queryWeight, product of:
                1.1242293 = boost
                3.9435613 = idf(docFreq=2339, maxDocs=44421)
                0.013061426 = queryNorm
              0.37354016 = fieldWeight in 986, product of:
                1.7320508 = tf(freq=3.0), with freq of:
                  3.0 = termFreq=3.0
                3.9435613 = idf(docFreq=2339, maxDocs=44421)
                0.0546875 = fieldNorm(doc=986)
          0.015589665 = weight(abstract_txt:durch in 986) [ClassicSimilarity], result of:
            0.015589665 = score(doc=986,freq=1.0), product of:
              0.06713538 = queryWeight, product of:
                1.2104965 = boost
                4.246169 = idf(docFreq=1728, maxDocs=44421)
                0.013061426 = queryNorm
              0.23221236 = fieldWeight in 986, product of:
                1.0 = tf(freq=1.0), with freq of:
                  1.0 = termFreq=1.0
                4.246169 = idf(docFreq=1728, maxDocs=44421)
                0.0546875 = fieldNorm(doc=986)
          0.026577875 = weight(abstract_txt:dass in 986) [ClassicSimilarity], result of:
            0.026577875 = score(doc=986,freq=2.0), product of:
              0.07604379 = queryWeight, product of:
                1.288308 = boost
                4.5191154 = idf(docFreq=1315, maxDocs=44421)
                0.013061426 = queryNorm
              0.34950748 = fieldWeight in 986, product of:
                1.4142135 = tf(freq=2.0), with freq of:
                  2.0 = termFreq=2.0
                4.5191154 = idf(docFreq=1315, maxDocs=44421)
                0.0546875 = fieldNorm(doc=986)
          0.08981206 = weight(abstract_txt:texte in 986) [ClassicSimilarity], result of:
            0.08981206 = score(doc=986,freq=2.0), product of:
              0.17124058 = queryWeight, product of:
                1.9332641 = boost
                6.7814865 = idf(docFreq=136, maxDocs=44421)
                0.013061426 = queryNorm
              0.52447885 = fieldWeight in 986, product of:
                1.4142135 = tf(freq=2.0), with freq of:
                  2.0 = termFreq=2.0
                6.7814865 = idf(docFreq=136, maxDocs=44421)
                0.0546875 = fieldNorm(doc=986)
          0.06706002 = weight(abstract_txt:personen in 986) [ClassicSimilarity], result of:
            0.06706002 = score(doc=986,freq=1.0), product of:
              0.17756991 = queryWeight, product of:
                1.9686682 = boost
                6.905677 = idf(docFreq=120, maxDocs=44421)
                0.013061426 = queryNorm
              0.3776542 = fieldWeight in 986, product of:
                1.0 = tf(freq=1.0), with freq of:
                  1.0 = termFreq=1.0
                6.905677 = idf(docFreq=120, maxDocs=44421)
                0.0546875 = fieldNorm(doc=986)
          0.09479549 = weight(abstract_txt:groß in 986) [ClassicSimilarity], result of:
            0.09479549 = score(doc=986,freq=1.0), product of:
              0.22365847 = queryWeight, product of:
                2.2094314 = boost
                7.750224 = idf(docFreq=51, maxDocs=44421)
                0.013061426 = queryNorm
              0.42384037 = fieldWeight in 986, product of:
                1.0 = tf(freq=1.0), with freq of:
                  1.0 = termFreq=1.0
                7.750224 = idf(docFreq=51, maxDocs=44421)
                0.0546875 = fieldNorm(doc=986)
        0.3888889 = coord(7/18)