1 | package eu.clarin.sru.fcs.aggregator.lang; |
---|
2 | |
---|
3 | import com.fasterxml.jackson.core.JsonProcessingException; |
---|
4 | import com.fasterxml.jackson.databind.ObjectMapper; |
---|
5 | import com.fasterxml.jackson.databind.ObjectWriter; |
---|
6 | import java.io.BufferedReader; |
---|
7 | import java.io.IOException; |
---|
8 | import java.io.InputStream; |
---|
9 | import java.io.InputStreamReader; |
---|
10 | import java.util.HashMap; |
---|
11 | import java.util.Map; |
---|
12 | import java.util.Set; |
---|
13 | import org.slf4j.LoggerFactory; |
---|
14 | |
---|
15 | /** |
---|
16 | * Represents collection of languages. |
---|
17 | * |
---|
18 | * @author Yana Panchenko |
---|
19 | */ |
---|
20 | public class LanguagesISO693_3 { |
---|
21 | |
---|
22 | private static final org.slf4j.Logger log = LoggerFactory.getLogger(LanguagesISO693_3.class); |
---|
23 | public static final String LANGUAGES_FILE_PATH = "/lang/iso-639-3_20140320.tab"; |
---|
24 | public static final String LANGUAGES_FILE_ENCODING = "UTF-8"; |
---|
25 | |
---|
26 | private static LanguagesISO693_3 instance = null; |
---|
27 | |
---|
28 | public static class Language { |
---|
29 | |
---|
30 | String code, name; |
---|
31 | |
---|
32 | public Language(String code, String name) { |
---|
33 | this.code = code; |
---|
34 | this.name = name; |
---|
35 | } |
---|
36 | } |
---|
37 | |
---|
38 | private Map<String, Language> code2Lang = new HashMap<String, Language>(); |
---|
39 | private Map<String, Language> name2Lang = new HashMap<String, Language>(); |
---|
40 | |
---|
41 | private LanguagesISO693_3() { |
---|
42 | InputStream is = LanguagesISO693_3.class.getResourceAsStream(LANGUAGES_FILE_PATH); |
---|
43 | try (BufferedReader br = new BufferedReader(new InputStreamReader(is, LANGUAGES_FILE_ENCODING))) { |
---|
44 | String line; |
---|
45 | while ((line = br.readLine()) != null) { |
---|
46 | if (line.length() > 0) { |
---|
47 | String[] toks = line.split("\\t"); |
---|
48 | if (toks.length != 7 && toks.length != 8) { |
---|
49 | log.error("Line error in language codes file: ", line); |
---|
50 | continue; |
---|
51 | } |
---|
52 | String code = toks[0]; |
---|
53 | String name = toks[6]; |
---|
54 | Language l = new Language(code, name); |
---|
55 | code2Lang.put(code, l); |
---|
56 | name2Lang.put(name, l); |
---|
57 | } |
---|
58 | } |
---|
59 | } catch (IOException ex) { |
---|
60 | log.error("Initialization of languages code to name mapping failed.", ex); |
---|
61 | } |
---|
62 | |
---|
63 | ObjectWriter ow = new ObjectMapper().writerWithDefaultPrettyPrinter(); |
---|
64 | try { |
---|
65 | System.out.println(ow.writeValueAsString(code2Lang)); |
---|
66 | } catch (JsonProcessingException ex) { |
---|
67 | } |
---|
68 | } |
---|
69 | |
---|
70 | public static LanguagesISO693_3 getInstance() { |
---|
71 | if (instance == null) { |
---|
72 | instance = new LanguagesISO693_3(); |
---|
73 | } |
---|
74 | return instance; |
---|
75 | } |
---|
76 | |
---|
77 | public Set<String> getCodes() { |
---|
78 | return code2Lang.keySet(); |
---|
79 | } |
---|
80 | |
---|
81 | public String codeForName(String name) { |
---|
82 | Language l = name2Lang.get(name); |
---|
83 | if (l == null) { |
---|
84 | log.error("Unknown language name: " + name); |
---|
85 | return null; |
---|
86 | } |
---|
87 | return l.code; |
---|
88 | } |
---|
89 | |
---|
90 | public String nameForCode(String code) { |
---|
91 | Language l = code2Lang.get(code); |
---|
92 | if (l == null) { |
---|
93 | log.error("Unknown language code: " + code); |
---|
94 | return null; |
---|
95 | } |
---|
96 | return l.name; |
---|
97 | } |
---|
98 | |
---|
99 | } |
---|