Changeset 909
- Timestamp:
- 11/17/10 13:25:55 (14 years ago)
- File:
-
- 1 edited
Legend:
- Unmodified
- Added
- Removed
-
metadata/trunk/toolkit/scripts/lrt2cmdi.py
r907  r909
   5     5
   6     6    import urllib, csv, datetime, xml.etree.ElementTree as ElementTree
         7  + from curses.ascii import ascii
   7     8
   8     9    class CmdiFile:
   …     …
  96    97    newLanguageNode = ElementTree.Element("ISO639")
  97    98    newCodeNode = ElementTree.Element("iso-639-%s-code" % iso639Type)
  98        - newCodeNode.text = isoList[language]
        99  + keyLang = language.encode("utf-8")
       100  + newCodeNode.text = isoList[keyLang]
  99   101    newLanguageNode.append(newCodeNode)
 100   102    languagesNode.append(newLanguageNode)
   …     …
 214   216    def loadInfo():
 215   217    csvFile = csv.reader(urllib.urlopen("http://www.clarin.eu/export_resources").readlines())
       218  + #csvFile =[l.decode('utf-8') for l in rawCsvFile]
       219  +
 216   220    #csvFile = csv.reader(urllib.urlopen("resources.csv").readlines())
 217   221    linenr = 0
   …     …
 224   228    colnr = 0
 225   229    for field in fieldList:
 226        - newDict[linenr][fieldList[colnr].replace(" ", "_") ] = l[colnr]
       230  + newDict[linenr][fieldList[colnr].replace(" ", "_").decode('utf-8')] = l[colnr].decode('utf-8')
 227   231    colnr += 1
 228   232    linenr += 1
   …     …
 233   237    dictionary = dict()
 234   238    for l in csvFile:
 235        - dictionary[l[1]] = l[0]
       239  + dictionary[l[1]] = unicode(l[0])
       240  +
 236   241    return dictionary
 237   242
Note: See TracChangeset
for help on using the changeset viewer.