2 Copyright (C) 2020 Carl Hetherington <cth@carlh.net>
4 This file is part of libdcp.
6 libdcp is free software; you can redistribute it and/or modify
7 it under the terms of the GNU General Public License as published by
8 the Free Software Foundation; either version 2 of the License, or
9 (at your option) any later version.
11 libdcp is distributed in the hope that it will be useful,
12 but WITHOUT ANY WARRANTY; without even the implied warranty of
13 MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
14 GNU General Public License for more details.
16 You should have received a copy of the GNU General Public License
17 along with libdcp. If not, see <http://www.gnu.org/licenses/>.
19 In addition, as a special exception, the copyright holders give
20 permission to link the code of portions of this program with the
21 OpenSSL library under certain conditions as described in each
22 individual source file, and distribute linked combinations
25 You must obey the GNU General Public License in all respects
26 for all of the code used other than OpenSSL. If you modify
27 file(s) with this exception, you may extend this exception to your
28 version of the file(s), but you are not obligated to do so. If you
29 do not wish to do so, delete this exception statement from your
30 version. If you delete this exception statement from all source
31 files in the program, then also delete it here.
35 #include "compose.hpp"
36 #include "dcp_assert.h"
37 #include "exceptions.h"
38 #include "language_tag.h"
39 #include <boost/algorithm/string.hpp>
40 #include <boost/foreach.hpp>
49 using boost::optional;
50 using boost::algorithm::trim;
56 static vector<LanguageTag::SubtagData> language_list;
57 static vector<LanguageTag::SubtagData> variant_list;
58 static vector<LanguageTag::SubtagData> region_list;
59 static vector<LanguageTag::SubtagData> script_list;
60 static vector<LanguageTag::SubtagData> extlang_list;
65 optional<LanguageTag::SubtagData>
66 find_in_list (vector<LanguageTag::SubtagData> const& list, string subtag)
68 BOOST_FOREACH (LanguageTag::SubtagData const& i, list) {
69 if (boost::iequals(i.subtag, subtag)) {
74 return optional<LanguageTag::SubtagData>();
78 LanguageTag::Subtag::Subtag (string subtag, SubtagType type)
81 if (!get_subtag_data(type, subtag)) {
82 throw LanguageTagError(String::compose("Unknown %1 string %2", subtag_type_name(type), subtag));
87 LanguageTag::LanguageTag (string tag)
90 boost::split (parts, tag, boost::is_any_of("-"));
92 throw LanguageTagError (String::compose("Could not parse language tag %1", tag));
95 vector<string>::size_type p = 0;
96 _language = LanguageSubtag (parts[p]);
99 if (p == parts.size()) {
104 _script = ScriptSubtag (parts[p]);
108 if (p == parts.size()) {
113 _region = RegionSubtag (parts[p]);
117 if (p == parts.size()) {
123 _variants.push_back (VariantSubtag(parts[p]));
125 if (p == parts.size()) {
133 _extlangs.push_back (ExtlangSubtag(parts[p]));
135 if (p == parts.size()) {
141 if (p < parts.size()) {
142 throw LanguageTagError (String::compose("Unrecognised subtag %1", parts[p]));
148 LanguageTag::to_string () const
151 throw LanguageTagError("No language set up");
154 string s = _language->subtag();
157 s += "-" + _script->subtag();
161 s += "-" + _region->subtag();
164 BOOST_FOREACH (VariantSubtag i, _variants) {
165 s += "-" + i.subtag();
168 BOOST_FOREACH (ExtlangSubtag i, _extlangs) {
169 s += "-" + i.subtag();
177 LanguageTag::set_language (LanguageSubtag language)
179 _language = language;
184 LanguageTag::set_script (ScriptSubtag script)
191 LanguageTag::set_region (RegionSubtag region)
198 LanguageTag::add_variant (VariantSubtag variant)
200 if (find(_variants.begin(), _variants.end(), variant) != _variants.end()) {
201 throw LanguageTagError (String::compose("Duplicate Variant subtag %1", variant.subtag()));
204 _variants.push_back (variant);
210 check_for_duplicates (vector<T> const& subtags, dcp::LanguageTag::SubtagType type)
212 vector<T> sorted = subtags;
213 sort (sorted.begin(), sorted.end());
215 BOOST_FOREACH (T const& i, sorted) {
216 if (last && i == *last) {
217 throw LanguageTagError (String::compose("Duplicate %1 subtag %2", dcp::LanguageTag::subtag_type_name(type), i.subtag()));
225 LanguageTag::set_variants (vector<VariantSubtag> variants)
227 check_for_duplicates (variants, VARIANT);
228 _variants = variants;
233 LanguageTag::add_extlang (ExtlangSubtag extlang)
235 if (find(_extlangs.begin(), _extlangs.end(), extlang) != _extlangs.end()) {
236 throw LanguageTagError (String::compose("Duplicate Extlang subtag %1", extlang.subtag()));
239 _extlangs.push_back (extlang);
244 LanguageTag::set_extlangs (vector<ExtlangSubtag> extlangs)
246 check_for_duplicates (extlangs, EXTLANG);
247 _extlangs = extlangs;
252 LanguageTag::description () const
255 throw LanguageTagError("No language set up");
260 BOOST_FOREACH (VariantSubtag const& i, _variants) {
261 optional<SubtagData> variant = get_subtag_data (VARIANT, i.subtag());
262 DCP_ASSERT (variant);
263 d += variant->description + " dialect of ";
266 optional<SubtagData> language = get_subtag_data (LANGUAGE, _language->subtag());
267 DCP_ASSERT (language);
268 d += language->description;
271 optional<SubtagData> script = get_subtag_data (SCRIPT, _script->subtag());
273 d += " written using the " + script->description + " script";
277 optional<SubtagData> region = get_subtag_data (REGION, _region->subtag());
279 d += " for " + region->description;
282 BOOST_FOREACH (ExtlangSubtag const& i, _extlangs) {
283 optional<SubtagData> extlang = get_subtag_data (EXTLANG, i.subtag());
284 DCP_ASSERT (extlang);
285 d += ", " + extlang->description;
292 vector<LanguageTag::SubtagData> const &
293 LanguageTag::get_all (SubtagType type)
297 return language_list;
308 return language_list;
313 LanguageTag::subtag_type_name (SubtagType type)
332 dcp::LanguageTag::VariantSubtag::operator== (VariantSubtag const & other) const
334 return subtag() == other.subtag();
339 dcp::LanguageTag::VariantSubtag::operator< (VariantSubtag const & other) const
341 return subtag() < other.subtag();
346 dcp::LanguageTag::ExtlangSubtag::operator== (ExtlangSubtag const & other) const
348 return subtag() == other.subtag();
353 dcp::LanguageTag::ExtlangSubtag::operator< (ExtlangSubtag const & other) const
355 return subtag() < other.subtag();
360 dcp::operator== (dcp::LanguageTag const& a, dcp::LanguageTag const& b)
362 return a.to_string() == b.to_string();
367 dcp::operator<< (ostream& os, dcp::LanguageTag const& tag)
369 os << tag.to_string();
374 vector<pair<LanguageTag::SubtagType, LanguageTag::SubtagData> >
375 LanguageTag::subtags () const
377 vector<pair<SubtagType, SubtagData> > s;
380 s.push_back (make_pair(LANGUAGE, *get_subtag_data(LANGUAGE, _language->subtag())));
384 s.push_back (make_pair(SCRIPT, *get_subtag_data(SCRIPT, _script->subtag())));
388 s.push_back (make_pair(REGION, *get_subtag_data(REGION, _region->subtag())));
391 BOOST_FOREACH (VariantSubtag const& i, _variants) {
392 s.push_back (make_pair(VARIANT, *get_subtag_data(VARIANT, i.subtag())));
395 BOOST_FOREACH (ExtlangSubtag const& i, _extlangs) {
396 s.push_back (make_pair(EXTLANG, *get_subtag_data(EXTLANG, i.subtag())));
403 optional<LanguageTag::SubtagData>
404 LanguageTag::get_subtag_data (LanguageTag::SubtagType type, string subtag)
407 case dcp::LanguageTag::LANGUAGE:
408 return find_in_list(language_list, subtag);
409 case dcp::LanguageTag::SCRIPT:
410 return find_in_list(script_list, subtag);
411 case dcp::LanguageTag::REGION:
412 return find_in_list(region_list, subtag);
413 case dcp::LanguageTag::VARIANT:
414 return find_in_list(variant_list, subtag);
415 case dcp::LanguageTag::EXTLANG:
416 return find_in_list(extlang_list, subtag);
419 return optional<LanguageTag::SubtagData>();
424 LanguageTag::get_subtag_description (LanguageTag::SubtagType type, string subtag)
426 optional<SubtagData> data = get_subtag_data (type, subtag);
428 return optional<string>();
431 return data->description;
436 load_language_tag_list (boost::filesystem::path tags_directory, string name, vector<LanguageTag::SubtagData>& list)
438 FILE* f = fopen_boost (tags_directory / name, "r");
440 throw FileError ("Could not open tags file", tags_directory / name, errno);
446 char* r = fgets (buffer, sizeof(buffer), f);
452 r = fgets (buffer, sizeof(buffer), f);
455 throw FileError ("Bad tags file", tags_directory / name, -1);
459 list.push_back (LanguageTag::SubtagData(a, b));
468 dcp::load_language_tag_lists (boost::filesystem::path tags_directory)
470 load_language_tag_list (tags_directory, "language", language_list);
471 load_language_tag_list (tags_directory, "variant", variant_list);
472 load_language_tag_list (tags_directory, "region", region_list);
473 load_language_tag_list (tags_directory, "script", script_list);
474 load_language_tag_list (tags_directory, "extlang", extlang_list);