Document (#6509)

Author
Ashford, J.H.
Title
Free text retrieval in the Welsh language : problems, and proposed working practice
Source
Journal of documentation. 51(1995) no.2, S.118-125
Year
1995
Abstract
A bilingual Welsh-English full text database is planned for Inspection Reports of Her Majesty's Inspectors of Schools for Wales. Special requirements for free text retrieval in the Welsh language are identified, and practical solutions are proposed for problems arising from the use of standard text database products, some of which may also apply to other lesser-used languages.
Theme
Volltextretrieval

Similar documents (content)

  1. Cunliffe, D.; Harries, R.: Promoting minority-language use in a bilingual online community (2005) 0.22
    0.2171264 = sum of:
      0.2171264 = product of:
        0.90469337 = sum of:
          0.047453377 = weight(abstract_txt:practice in 915) [ClassicSimilarity], result of:
            0.047453377 = score(doc=915,freq=1.0), product of:
              0.104878716 = queryWeight, product of:
                4.8262353 = idf(docFreq=967, maxDocs=44421)
                0.021730958 = queryNorm
              0.45245957 = fieldWeight in 915, product of:
                1.0 = tf(freq=1.0), with freq of:
                  1.0 = termFreq=1.0
                4.8262353 = idf(docFreq=967, maxDocs=44421)
                0.09375 = fieldNorm(doc=915)
          0.059002977 = weight(abstract_txt:languages in 915) [ClassicSimilarity], result of:
            0.059002977 = score(doc=915,freq=1.0), product of:
              0.12127145 = queryWeight, product of:
                1.0753148 = boost
                5.189722 = idf(docFreq=672, maxDocs=44421)
                0.021730958 = queryNorm
              0.48653644 = fieldWeight in 915, product of:
                1.0 = tf(freq=1.0), with freq of:
                  1.0 = termFreq=1.0
                5.189722 = idf(docFreq=672, maxDocs=44421)
                0.09375 = fieldNorm(doc=915)
          0.1034183 = weight(abstract_txt:english in 915) [ClassicSimilarity], result of:
            0.1034183 = score(doc=915,freq=2.0), product of:
              0.13992572 = queryWeight, product of:
                1.1550615 = boost
                5.5745983 = idf(docFreq=457, maxDocs=44421)
                0.021730958 = queryNorm
              0.73909426 = fieldWeight in 915, product of:
                1.4142135 = tf(freq=2.0), with freq of:
                  2.0 = termFreq=2.0
                5.5745983 = idf(docFreq=457, maxDocs=44421)
                0.09375 = fieldNorm(doc=915)
          0.37921765 = weight(abstract_txt:bilingual in 915) [ClassicSimilarity], result of:
            0.37921765 = score(doc=915,freq=4.0), product of:
              0.2640878 = queryWeight, product of:
                1.5868303 = boost
                7.6584163 = idf(docFreq=56, maxDocs=44421)
                0.021730958 = queryNorm
              1.435953 = fieldWeight in 915, product of:
                2.0 = tf(freq=4.0), with freq of:
                  4.0 = termFreq=4.0
                7.6584163 = idf(docFreq=56, maxDocs=44421)
                0.09375 = fieldNorm(doc=915)
          0.20949289 = weight(abstract_txt:wales in 915) [ClassicSimilarity], result of:
            0.20949289 = score(doc=915,freq=1.0), product of:
              0.28224233 = queryWeight, product of:
                1.6404666 = boost
                7.917278 = idf(docFreq=43, maxDocs=44421)
                0.021730958 = queryNorm
              0.7422448 = fieldWeight in 915, product of:
                1.0 = tf(freq=1.0), with freq of:
                  1.0 = termFreq=1.0
                7.917278 = idf(docFreq=43, maxDocs=44421)
                0.09375 = fieldNorm(doc=915)
          0.10610821 = weight(abstract_txt:language in 915) [ClassicSimilarity], result of:
            0.10610821 = score(doc=915,freq=3.0), product of:
              0.15666723 = queryWeight, product of:
                1.7284642 = boost
                4.1709876 = idf(docFreq=1863, maxDocs=44421)
                0.021730958 = queryNorm
              0.677284 = fieldWeight in 915, product of:
                1.7320508 = tf(freq=3.0), with freq of:
                  3.0 = termFreq=3.0
                4.1709876 = idf(docFreq=1863, maxDocs=44421)
                0.09375 = fieldNorm(doc=915)
        0.24 = coord(6/25)
    
  2. Tseng, Y.-H.: Automatic cataloguing and searching for retrospective data by use of OCR text (2001) 0.18
    0.18273325 = sum of:
      0.18273325 = product of:
        0.5710414 = sum of:
          0.043415457 = weight(abstract_txt:special in 5420) [ClassicSimilarity], result of:
            0.043415457 = score(doc=5420,freq=1.0), product of:
              0.11161597 = queryWeight, product of:
                1.0316194 = boost
                4.978838 = idf(docFreq=830, maxDocs=44421)
                0.021730958 = queryNorm
              0.38897172 = fieldWeight in 5420, product of:
                1.0 = tf(freq=1.0), with freq of:
                  1.0 = termFreq=1.0
                4.978838 = idf(docFreq=830, maxDocs=44421)
                0.078125 = fieldNorm(doc=5420)
          0.08516346 = weight(abstract_txt:languages in 5420) [ClassicSimilarity], result of:
            0.08516346 = score(doc=5420,freq=3.0), product of:
              0.12127145 = queryWeight, product of:
                1.0753148 = boost
                5.189722 = idf(docFreq=672, maxDocs=44421)
                0.021730958 = queryNorm
              0.70225483 = fieldWeight in 5420, product of:
                1.7320508 = tf(freq=3.0), with freq of:
                  3.0 = termFreq=3.0
                5.189722 = idf(docFreq=672, maxDocs=44421)
                0.078125 = fieldNorm(doc=5420)
          0.06093982 = weight(abstract_txt:english in 5420) [ClassicSimilarity], result of:
            0.06093982 = score(doc=5420,freq=1.0), product of:
              0.13992572 = queryWeight, product of:
                1.1550615 = boost
                5.5745983 = idf(docFreq=457, maxDocs=44421)
                0.021730958 = queryNorm
              0.4355155 = fieldWeight in 5420, product of:
                1.0 = tf(freq=1.0), with freq of:
                  1.0 = termFreq=1.0
                5.5745983 = idf(docFreq=457, maxDocs=44421)
                0.078125 = fieldNorm(doc=5420)
          0.062492084 = weight(abstract_txt:solutions in 5420) [ClassicSimilarity], result of:
            0.062492084 = score(doc=5420,freq=1.0), product of:
              0.14229187 = queryWeight, product of:
                1.1647866 = boost
                5.6215343 = idf(docFreq=436, maxDocs=44421)
                0.021730958 = queryNorm
              0.43918237 = fieldWeight in 5420, product of:
                1.0 = tf(freq=1.0), with freq of:
                  1.0 = termFreq=1.0
                5.6215343 = idf(docFreq=436, maxDocs=44421)
                0.078125 = fieldNorm(doc=5420)
          0.05120091 = weight(abstract_txt:retrieval in 5420) [ClassicSimilarity], result of:
            0.05120091 = score(doc=5420,freq=3.0), product of:
              0.108839065 = queryWeight, product of:
                1.4406674 = boost
                3.4765 = idf(docFreq=3732, maxDocs=44421)
                0.021730958 = queryNorm
              0.4704277 = fieldWeight in 5420, product of:
                1.7320508 = tf(freq=3.0), with freq of:
                  3.0 = termFreq=3.0
                3.4765 = idf(docFreq=3732, maxDocs=44421)
                0.078125 = fieldNorm(doc=5420)
          0.051051337 = weight(abstract_txt:language in 5420) [ClassicSimilarity], result of:
            0.051051337 = score(doc=5420,freq=1.0), product of:
              0.15666723 = queryWeight, product of:
                1.7284642 = boost
                4.1709876 = idf(docFreq=1863, maxDocs=44421)
                0.021730958 = queryNorm
              0.3258584 = fieldWeight in 5420, product of:
                1.0 = tf(freq=1.0), with freq of:
                  1.0 = termFreq=1.0
                4.1709876 = idf(docFreq=1863, maxDocs=44421)
                0.078125 = fieldNorm(doc=5420)
          0.055969626 = weight(abstract_txt:problems in 5420) [ClassicSimilarity], result of:
            0.055969626 = score(doc=5420,freq=1.0), product of:
              0.16657445 = queryWeight, product of:
                1.7822782 = boost
                4.300847 = idf(docFreq=1636, maxDocs=44421)
                0.021730958 = queryNorm
              0.33600366 = fieldWeight in 5420, product of:
                1.0 = tf(freq=1.0), with freq of:
                  1.0 = termFreq=1.0
                4.300847 = idf(docFreq=1636, maxDocs=44421)
                0.078125 = fieldNorm(doc=5420)
          0.1608087 = weight(abstract_txt:text in 5420) [ClassicSimilarity], result of:
            0.1608087 = score(doc=5420,freq=3.0), product of:
              0.29409167 = queryWeight, product of:
                3.3490965 = boost
                4.040882 = idf(docFreq=2122, maxDocs=44421)
                0.021730958 = queryNorm
              0.5467979 = fieldWeight in 5420, product of:
                1.7320508 = tf(freq=3.0), with freq of:
                  3.0 = termFreq=3.0
                4.040882 = idf(docFreq=2122, maxDocs=44421)
                0.078125 = fieldNorm(doc=5420)
        0.32 = coord(8/25)
    
  3. Riggs, K.R.: XML and free text (2002) 0.18
    0.1791295 = sum of:
      0.1791295 = product of:
        0.89564747 = sum of:
          0.08168214 = weight(abstract_txt:language in 1461) [ClassicSimilarity], result of:
            0.08168214 = score(doc=1461,freq=1.0), product of:
              0.15666723 = queryWeight, product of:
                1.7284642 = boost
                4.1709876 = idf(docFreq=1863, maxDocs=44421)
                0.021730958 = queryNorm
              0.52137345 = fieldWeight in 1461, product of:
                1.0 = tf(freq=1.0), with freq of:
                  1.0 = termFreq=1.0
                4.1709876 = idf(docFreq=1863, maxDocs=44421)
                0.125 = fieldNorm(doc=1461)
          0.1266448 = weight(abstract_txt:problems in 1461) [ClassicSimilarity], result of:
            0.1266448 = score(doc=1461,freq=2.0), product of:
              0.16657445 = queryWeight, product of:
                1.7822782 = boost
                4.300847 = idf(docFreq=1636, maxDocs=44421)
                0.021730958 = queryNorm
              0.7602895 = fieldWeight in 1461, product of:
                1.4142135 = tf(freq=2.0), with freq of:
                  2.0 = termFreq=2.0
                4.300847 = idf(docFreq=1636, maxDocs=44421)
                0.125 = fieldNorm(doc=1461)
          0.11014523 = weight(abstract_txt:proposed in 1461) [ClassicSimilarity], result of:
            0.11014523 = score(doc=1461,freq=1.0), product of:
              0.19122174 = queryWeight, product of:
                1.9095892 = boost
                4.608063 = idf(docFreq=1203, maxDocs=44421)
                0.021730958 = queryNorm
              0.5760079 = fieldWeight in 1461, product of:
                1.0 = tf(freq=1.0), with freq of:
                  1.0 = termFreq=1.0
                4.608063 = idf(docFreq=1203, maxDocs=44421)
                0.125 = fieldNorm(doc=1461)
          0.28007784 = weight(abstract_txt:free in 1461) [ClassicSimilarity], result of:
            0.28007784 = score(doc=1461,freq=2.0), product of:
              0.28275 = queryWeight, product of:
                2.3220556 = boost
                5.6033936 = idf(docFreq=444, maxDocs=44421)
                0.021730958 = queryNorm
              0.9905494 = fieldWeight in 1461, product of:
                1.4142135 = tf(freq=2.0), with freq of:
                  2.0 = termFreq=2.0
                5.6033936 = idf(docFreq=444, maxDocs=44421)
                0.125 = fieldNorm(doc=1461)
          0.29709744 = weight(abstract_txt:text in 1461) [ClassicSimilarity], result of:
            0.29709744 = score(doc=1461,freq=4.0), product of:
              0.29409167 = queryWeight, product of:
                3.3490965 = boost
                4.040882 = idf(docFreq=2122, maxDocs=44421)
                0.021730958 = queryNorm
              1.0102205 = fieldWeight in 1461, product of:
                2.0 = tf(freq=4.0), with freq of:
                  4.0 = termFreq=4.0
                4.040882 = idf(docFreq=2122, maxDocs=44421)
                0.125 = fieldNorm(doc=1461)
        0.2 = coord(5/25)
    
  4. Ata, B.M.A.: SISDOM: a multilingual document retrieval system (1995) 0.16
    0.15718558 = sum of:
      0.15718558 = product of:
        0.65493995 = sum of:
          0.05882971 = weight(abstract_txt:full in 963) [ClassicSimilarity], result of:
            0.05882971 = score(doc=963,freq=1.0), product of:
              0.10921339 = queryWeight, product of:
                1.020456 = boost
                4.9249606 = idf(docFreq=876, maxDocs=44421)
                0.021730958 = queryNorm
              0.53866756 = fieldWeight in 963, product of:
                1.0 = tf(freq=1.0), with freq of:
                  1.0 = termFreq=1.0
                4.9249606 = idf(docFreq=876, maxDocs=44421)
                0.109375 = fieldNorm(doc=963)
          0.08531574 = weight(abstract_txt:english in 963) [ClassicSimilarity], result of:
            0.08531574 = score(doc=963,freq=1.0), product of:
              0.13992572 = queryWeight, product of:
                1.1550615 = boost
                5.5745983 = idf(docFreq=457, maxDocs=44421)
                0.021730958 = queryNorm
              0.60972166 = fieldWeight in 963, product of:
                1.0 = tf(freq=1.0), with freq of:
                  1.0 = termFreq=1.0
                5.5745983 = idf(docFreq=457, maxDocs=44421)
                0.109375 = fieldNorm(doc=963)
          0.05852752 = weight(abstract_txt:retrieval in 963) [ClassicSimilarity], result of:
            0.05852752 = score(doc=963,freq=2.0), product of:
              0.108839065 = queryWeight, product of:
                1.4406674 = boost
                3.4765 = idf(docFreq=3732, maxDocs=44421)
                0.021730958 = queryNorm
              0.5377437 = fieldWeight in 963, product of:
                1.4142135 = tf(freq=2.0), with freq of:
                  2.0 = termFreq=2.0
                3.4765 = idf(docFreq=3732, maxDocs=44421)
                0.109375 = fieldNorm(doc=963)
          0.22121032 = weight(abstract_txt:bilingual in 963) [ClassicSimilarity], result of:
            0.22121032 = score(doc=963,freq=1.0), product of:
              0.2640878 = queryWeight, product of:
                1.5868303 = boost
                7.6584163 = idf(docFreq=56, maxDocs=44421)
                0.021730958 = queryNorm
              0.8376393 = fieldWeight in 963, product of:
                1.0 = tf(freq=1.0), with freq of:
                  1.0 = termFreq=1.0
                7.6584163 = idf(docFreq=56, maxDocs=44421)
                0.109375 = fieldNorm(doc=963)
          0.10107649 = weight(abstract_txt:language in 963) [ClassicSimilarity], result of:
            0.10107649 = score(doc=963,freq=2.0), product of:
              0.15666723 = queryWeight, product of:
                1.7284642 = boost
                4.1709876 = idf(docFreq=1863, maxDocs=44421)
                0.021730958 = queryNorm
              0.64516675 = fieldWeight in 963, product of:
                1.4142135 = tf(freq=2.0), with freq of:
                  2.0 = termFreq=2.0
                4.1709876 = idf(docFreq=1863, maxDocs=44421)
                0.109375 = fieldNorm(doc=963)
          0.12998013 = weight(abstract_txt:text in 963) [ClassicSimilarity], result of:
            0.12998013 = score(doc=963,freq=1.0), product of:
              0.29409167 = queryWeight, product of:
                3.3490965 = boost
                4.040882 = idf(docFreq=2122, maxDocs=44421)
                0.021730958 = queryNorm
              0.44197148 = fieldWeight in 963, product of:
                1.0 = tf(freq=1.0), with freq of:
                  1.0 = termFreq=1.0
                4.040882 = idf(docFreq=2122, maxDocs=44421)
                0.109375 = fieldNorm(doc=963)
        0.24 = coord(6/25)
    
  5. Asija, S.P.: Natural language interface without artificial intelligence (1989) 0.15
    0.14786926 = sum of:
      0.14786926 = product of:
        0.61612195 = sum of:
          0.084042445 = weight(abstract_txt:full in 5779) [ClassicSimilarity], result of:
            0.084042445 = score(doc=5779,freq=1.0), product of:
              0.10921339 = queryWeight, product of:
                1.020456 = boost
                4.9249606 = idf(docFreq=876, maxDocs=44421)
                0.021730958 = queryNorm
              0.7695251 = fieldWeight in 5779, product of:
                1.0 = tf(freq=1.0), with freq of:
                  1.0 = termFreq=1.0
                4.9249606 = idf(docFreq=876, maxDocs=44421)
                0.15625 = fieldNorm(doc=5779)
          0.086830914 = weight(abstract_txt:special in 5779) [ClassicSimilarity], result of:
            0.086830914 = score(doc=5779,freq=1.0), product of:
              0.11161597 = queryWeight, product of:
                1.0316194 = boost
                4.978838 = idf(docFreq=830, maxDocs=44421)
                0.021730958 = queryNorm
              0.77794343 = fieldWeight in 5779, product of:
                1.0 = tf(freq=1.0), with freq of:
                  1.0 = termFreq=1.0
                4.978838 = idf(docFreq=830, maxDocs=44421)
                0.15625 = fieldNorm(doc=5779)
          0.0983383 = weight(abstract_txt:languages in 5779) [ClassicSimilarity], result of:
            0.0983383 = score(doc=5779,freq=1.0), product of:
              0.12127145 = queryWeight, product of:
                1.0753148 = boost
                5.189722 = idf(docFreq=672, maxDocs=44421)
                0.021730958 = queryNorm
              0.8108941 = fieldWeight in 5779, product of:
                1.0 = tf(freq=1.0), with freq of:
                  1.0 = termFreq=1.0
                5.189722 = idf(docFreq=672, maxDocs=44421)
                0.15625 = fieldNorm(doc=5779)
          0.05912172 = weight(abstract_txt:retrieval in 5779) [ClassicSimilarity], result of:
            0.05912172 = score(doc=5779,freq=1.0), product of:
              0.108839065 = queryWeight, product of:
                1.4406674 = boost
                3.4765 = idf(docFreq=3732, maxDocs=44421)
                0.021730958 = queryNorm
              0.5432031 = fieldWeight in 5779, product of:
                1.0 = tf(freq=1.0), with freq of:
                  1.0 = termFreq=1.0
                3.4765 = idf(docFreq=3732, maxDocs=44421)
                0.15625 = fieldNorm(doc=5779)
          0.102102675 = weight(abstract_txt:language in 5779) [ClassicSimilarity], result of:
            0.102102675 = score(doc=5779,freq=1.0), product of:
              0.15666723 = queryWeight, product of:
                1.7284642 = boost
                4.1709876 = idf(docFreq=1863, maxDocs=44421)
                0.021730958 = queryNorm
              0.6517168 = fieldWeight in 5779, product of:
                1.0 = tf(freq=1.0), with freq of:
                  1.0 = termFreq=1.0
                4.1709876 = idf(docFreq=1863, maxDocs=44421)
                0.15625 = fieldNorm(doc=5779)
          0.1856859 = weight(abstract_txt:text in 5779) [ClassicSimilarity], result of:
            0.1856859 = score(doc=5779,freq=1.0), product of:
              0.29409167 = queryWeight, product of:
                3.3490965 = boost
                4.040882 = idf(docFreq=2122, maxDocs=44421)
                0.021730958 = queryNorm
              0.6313878 = fieldWeight in 5779, product of:
                1.0 = tf(freq=1.0), with freq of:
                  1.0 = termFreq=1.0
                4.040882 = idf(docFreq=2122, maxDocs=44421)
                0.15625 = fieldNorm(doc=5779)
        0.24 = coord(6/25)