Changeset 909 for metadata


Ignore:
Timestamp:
11/17/10 13:25:55 (14 years ago)
Author:
dietuyt
Message:

Fix for UTF-8 issues.

File:
1 edited

Legend:

Unmodified
Added
Removed
  • metadata/trunk/toolkit/scripts/lrt2cmdi.py

    r907 r909  
    55
    66import urllib, csv, datetime, xml.etree.ElementTree as ElementTree
     7from curses.ascii import ascii
    78
    89class CmdiFile:
     
    9697                newLanguageNode = ElementTree.Element("ISO639")
    9798                newCodeNode = ElementTree.Element("iso-639-%s-code" % iso639Type)
    98                 newCodeNode.text = isoList[language]
     99                keyLang = language.encode("utf-8")
     100                newCodeNode.text = isoList[keyLang]
    99101                newLanguageNode.append(newCodeNode)
    100102                languagesNode.append(newLanguageNode)
     
    214216def loadInfo():
    215217    csvFile = csv.reader(urllib.urlopen("http://www.clarin.eu/export_resources").readlines())
     218    #csvFile =[l.decode('utf-8') for l in rawCsvFile]
     219   
    216220    #csvFile = csv.reader(urllib.urlopen("resources.csv").readlines()) 
    217221    linenr = 0
     
    224228            colnr = 0
    225229            for field in fieldList:
    226                 newDict[linenr][fieldList[colnr].replace(" ", "_")] = l[colnr]
     230                newDict[linenr][fieldList[colnr].replace(" ", "_").decode('utf-8')] = l[colnr].decode('utf-8')
    227231                colnr += 1
    228232        linenr += 1
     
    233237    dictionary = dict()
    234238    for l in csvFile:
    235         dictionary[l[1]] = l[0]
     239        dictionary[l[1]] = unicode(l[0])
     240
    236241    return dictionary
    237242
Note: See TracChangeset for help on using the changeset viewer.