KI18n

isocodescache.cpp
1/*
2 SPDX-FileCopyrightText: 2021 Volker Krause <vkrause@kde.org>
3
4 SPDX-License-Identifier: LGPL-2.0-or-later
5*/
6
7#include "config-localedata.h"
8
9#include "isocodes_p.h"
10#include "isocodescache_p.h"
11#include "logging.h"
12
13#include <QDir>
14#include <QFile>
15#include <QFileInfo>
16#include <QJsonArray>
17#include <QJsonDocument>
18#include <QJsonObject>
19#include <QStandardPaths>
20
21using namespace Qt::Literals;
22
23// increment those when changing the format
24enum : uint32_t {
25 Iso3166_1CacheHeader = 0x4B493102,
26 Iso3166_2CacheHeader = 0x4B493201,
27};
28
29static QString isoCodesPath(QStringView file)
30{
31#ifndef Q_OS_ANDROID
33 if (!path.isEmpty()) {
34 return path;
35 }
36
37 // search manually in the compile-time determined prefix
38 // needed for example for non-installed Windows binaries to work, such as unit tests
39 for (const char *installLocation : {"/share", "/bin/data"}) {
40 path = QLatin1String(ISO_CODES_PREFIX) + QLatin1String(installLocation) + QLatin1String("/iso-codes/json/") + file;
41 if (QFileInfo::exists(path)) {
42 return path;
43 }
44 }
45
46 return {};
47#else
48 return QLatin1String("assets:/share/iso-codes/json/") + file;
49#endif
50}
51
52static QString cachePath()
53{
55}
56
57static QString cacheFilePath(QStringView file)
58{
59 return cachePath() + file;
60}
61
62IsoCodesCache::~IsoCodesCache() = default;
63
64IsoCodesCache *IsoCodesCache::instance()
65{
66 static IsoCodesCache s_cache;
67 return &s_cache;
68}
69
70void IsoCodesCache::loadIso3166_1()
71{
72 if (!m_iso3166_1CacheData && !loadIso3166_1Cache()) {
73 QDir().mkpath(cachePath());
74 createIso3166_1Cache(isoCodesPath(u"iso_3166-1.json"), cacheFilePath(u"iso_3166-1"));
75 loadIso3166_1Cache();
76 }
77}
78
79static std::unique_ptr<QFile> openCacheFile(QStringView cacheFileName, QStringView isoCodesFileName)
80{
81 QFileInfo jsonFi(isoCodesPath(isoCodesFileName));
82 if (!jsonFi.exists()) { // no source file means we can only use an embedded cache
83 auto f = std::make_unique<QFile>(QLatin1String(":/org.kde.ki18n/iso-codes/cache/") + cacheFileName);
84 if (!f->open(QFile::ReadOnly) || f->size() < 8) {
85 return {};
86 }
87 return f;
88 }
89 auto f = std::make_unique<QFile>(cacheFilePath(cacheFileName));
90 if (!f->open(QFile::ReadOnly) || f->fileTime(QFile::FileModificationTime) < jsonFi.lastModified() || f->size() < 8) {
91 return {};
92 }
93 return f;
94}
95
96bool IsoCodesCache::loadIso3166_1Cache()
97{
98 auto f = openCacheFile(u"iso_3166-1", u"iso_3166-1.json");
99 if (!f) {
100 return false;
101 }
102 m_iso3166_1CacheSize = f->size();
103
104 // validate cache file is usable
105 // header matches
106 const auto data = f->map(0, m_iso3166_1CacheSize);
107 if (*reinterpret_cast<const uint32_t *>(data) != Iso3166_1CacheHeader) {
108 return false;
109 }
110 // lookup tables fit into the available size
111 const auto size = *(reinterpret_cast<const uint32_t *>(data) + 1);
112 if (sizeof(Iso3166_1CacheHeader) + sizeof(size) + size * sizeof(MapEntry<uint16_t>) * 2 >= m_iso3166_1CacheSize) {
113 return false;
114 }
115 // string table is 0 terminated
116 if (data[m_iso3166_1CacheSize - 1] != '\0') {
117 return false;
118 }
119
120 m_iso3166_1CacheFile = std::move(f);
121 m_iso3166_1CacheData = data;
122 return true;
123}
124
125uint32_t IsoCodesCache::countryCount() const
126{
127 return m_iso3166_1CacheData ? *(reinterpret_cast<const uint32_t *>(m_iso3166_1CacheData) + 1) : 0;
128}
129
130const MapEntry<uint16_t> *IsoCodesCache::countryNameMapBegin() const
131{
132 return m_iso3166_1CacheData ? reinterpret_cast<const MapEntry<uint16_t> *>(m_iso3166_1CacheData + sizeof(uint32_t) * 2) : nullptr;
133}
134
135const MapEntry<uint16_t> *IsoCodesCache::countryAlpha3MapBegin() const
136{
137 return m_iso3166_1CacheData ? countryNameMapBegin() + countryCount() : nullptr;
138}
139
140const char *IsoCodesCache::countryStringTableLookup(uint16_t offset) const
141{
142 if (m_iso3166_1CacheData) {
143 const auto pos = offset + 2 * sizeof(uint32_t) + 2 * countryCount() * sizeof(MapEntry<uint16_t>);
144 return m_iso3166_1CacheSize > pos ? reinterpret_cast<const char *>(m_iso3166_1CacheData + pos) : nullptr;
145 }
146 return nullptr;
147}
148
149[[nodiscard]] static QByteArray nameForIso3166_1(const QJsonObject &entry)
150{
151 if (const auto commonName = entry.value("common_name"_L1).toString(); !commonName.isEmpty()) {
152 return commonName.toUtf8();
153 }
154 return entry.value("name"_L1).toString().toUtf8();
155}
156
157void IsoCodesCache::createIso3166_1Cache(const QString &isoCodesPath, const QString &cacheFilePath)
158{
159 qCDebug(KI18NLD) << "Rebuilding ISO 3166-1 cache";
160
161 QFile file(isoCodesPath);
162 if (!file.open(QFile::ReadOnly)) {
163 qCWarning(KI18NLD) << "Unable to open iso_3166-1.json" << isoCodesPath << file.errorString();
164 return;
165 }
166
167 std::vector<MapEntry<uint16_t>> alpha2NameMap;
168 std::vector<MapEntry<uint16_t>> alpha3alpha2Map;
169 QByteArray iso3166_1stringTable;
170
171 const auto doc = QJsonDocument::fromJson(file.readAll());
172 const auto array = doc.object().value(QLatin1String("3166-1")).toArray();
173 for (const auto &entryVal : array) {
174 const auto entry = entryVal.toObject();
175 const auto alpha2 = entry.value(QLatin1String("alpha_2")).toString();
176 if (alpha2.size() != 2) {
177 continue;
178 }
179 const auto alpha2Key = IsoCodes::alpha2CodeToKey(alpha2);
180
181 assert(std::numeric_limits<uint16_t>::max() > iso3166_1stringTable.size());
182 alpha2NameMap.push_back({alpha2Key, (uint16_t)iso3166_1stringTable.size()});
183 iso3166_1stringTable.append(nameForIso3166_1(entry));
184 iso3166_1stringTable.append('\0');
185
186 const auto alpha3Key = IsoCodes::alpha3CodeToKey(entry.value(QLatin1String("alpha_3")).toString());
187 alpha3alpha2Map.push_back({alpha3Key, alpha2Key});
188 }
189
190 std::sort(alpha2NameMap.begin(), alpha2NameMap.end());
191 std::sort(alpha3alpha2Map.begin(), alpha3alpha2Map.end());
192
193 // write out binary cache file
194 QFile cache(cacheFilePath);
195 if (!cache.open(QFile::WriteOnly)) {
196 qCWarning(KI18NLD) << "Failed to write ISO 3166-1 cache:" << cache.errorString() << cache.fileName();
197 return;
198 }
199
200 uint32_t n = Iso3166_1CacheHeader;
201 cache.write(reinterpret_cast<const char *>(&n), 4); // header
202 n = alpha2NameMap.size();
203 cache.write(reinterpret_cast<const char *>(&n), 4); // size
204 for (auto entry : alpha2NameMap) {
205 cache.write(reinterpret_cast<const char *>(&entry), sizeof(entry));
206 }
207 for (auto entry : alpha3alpha2Map) {
208 cache.write(reinterpret_cast<const char *>(&entry), sizeof(entry));
209 }
210 cache.write(iso3166_1stringTable);
211}
212
213void IsoCodesCache::loadIso3166_2()
214{
215 if (!m_iso3166_2CacheData && !loadIso3166_2Cache()) {
216 QDir().mkpath(cachePath());
217 createIso3166_2Cache(isoCodesPath(u"iso_3166-2.json"), cacheFilePath(u"iso_3166-2"));
218 loadIso3166_2Cache();
219 }
220}
221
222bool IsoCodesCache::loadIso3166_2Cache()
223{
224 auto f = openCacheFile(u"iso_3166-2", u"iso_3166-2.json");
225 if (!f) {
226 return false;
227 }
228 m_iso3166_2CacheSize = f->size();
229
230 // validate cache file is usable
231 // header matches
232 const auto data = f->map(0, m_iso3166_2CacheSize);
233 if (*reinterpret_cast<const uint32_t *>(data) != Iso3166_2CacheHeader) {
234 return false;
235 }
236 // name lookup table fits into the available size
237 auto size = *(reinterpret_cast<const uint32_t *>(data) + 1);
238 auto offset = 3 * sizeof(uint32_t) + size * sizeof(MapEntry<uint32_t>);
239 if (offset >= m_iso3166_2CacheSize) {
240 return false;
241 }
242 // hierarchy map boundary check
243 size = *(reinterpret_cast<const uint32_t *>(data + offset) - 1);
244 offset += size * sizeof(MapEntry<uint32_t>);
245 if (offset >= m_iso3166_2CacheSize) {
246 return false;
247 }
248 // string table is 0 terminated
249 if (data[m_iso3166_2CacheSize - 1] != '\0') {
250 return false;
251 }
252
253 m_iso3166_2CacheFile = std::move(f);
254 m_iso3166_2CacheData = data;
255 return true;
256}
257
258uint32_t IsoCodesCache::subdivisionCount() const
259{
260 return m_iso3166_2CacheData ? *(reinterpret_cast<const uint32_t *>(m_iso3166_2CacheData) + 1) : 0;
261}
262
263const MapEntry<uint32_t> *IsoCodesCache::subdivisionNameMapBegin() const
264{
265 return m_iso3166_2CacheData ? reinterpret_cast<const MapEntry<uint32_t> *>(m_iso3166_2CacheData + 2 * sizeof(uint32_t)) : nullptr;
266}
267
268uint32_t IsoCodesCache::subdivisionHierachyMapSize() const
269{
270 return m_iso3166_2CacheData
271 ? *(reinterpret_cast<const uint32_t *>(m_iso3166_2CacheData + 2 * sizeof(uint32_t) + subdivisionCount() * sizeof(MapEntry<uint32_t>)))
272 : 0;
273}
274
275const MapEntry<uint32_t> *IsoCodesCache::subdivisionParentMapBegin() const
276{
277 return m_iso3166_2CacheData
278 ? reinterpret_cast<const MapEntry<uint32_t> *>(m_iso3166_2CacheData + 3 * sizeof(uint32_t) + subdivisionCount() * sizeof(MapEntry<uint32_t>))
279 : nullptr;
280}
281
282const char *IsoCodesCache::subdivisionStringTableLookup(uint16_t offset) const
283{
284 if (m_iso3166_2CacheData) {
285 const auto pos = offset + 3 * sizeof(uint32_t) + (subdivisionCount() + subdivisionHierachyMapSize()) * sizeof(MapEntry<uint32_t>);
286 return m_iso3166_2CacheSize > pos ? reinterpret_cast<const char *>(m_iso3166_2CacheData + pos) : nullptr;
287 }
288 return nullptr;
289}
290
291void IsoCodesCache::createIso3166_2Cache(const QString &isoCodesPath, const QString &cacheFilePath)
292{
293 qCDebug(KI18NLD) << "Rebuilding ISO 3166-2 cache";
294 QFile file(isoCodesPath);
295 if (!file.open(QFile::ReadOnly)) {
296 qCWarning(KI18NLD) << "Unable to open iso_3166-2.json" << isoCodesPath << file.errorString();
297 return;
298 }
299
300 std::vector<MapEntry<uint32_t>> subdivNameMap;
301 std::vector<MapEntry<uint32_t>> subdivParentMap;
302 QByteArray iso3166_2stringTable;
303
304 const auto doc = QJsonDocument::fromJson(file.readAll());
305 const auto array = doc.object().value(QLatin1String("3166-2")).toArray();
306 for (const auto &entryVal : array) {
307 const auto entry = entryVal.toObject();
308 const auto key = IsoCodes::subdivisionCodeToKey(entry.value(QLatin1String("code")).toString());
309
310 assert(std::numeric_limits<uint16_t>::max() > iso3166_2stringTable.size());
311 subdivNameMap.push_back({key, (uint16_t)iso3166_2stringTable.size()});
312 iso3166_2stringTable.append(entry.value(QLatin1String("name")).toString().toUtf8());
313 iso3166_2stringTable.append('\0');
314
315 const auto parentKey = IsoCodes::parentCodeToKey(entry.value(QLatin1String("parent")).toString());
316 if (parentKey) {
317 subdivParentMap.push_back({key, parentKey});
318 }
319 }
320
321 std::sort(subdivNameMap.begin(), subdivNameMap.end());
322 std::sort(subdivParentMap.begin(), subdivParentMap.end());
323
324 // write out binary cache file
325 QFile cache(cacheFilePath);
326 if (!cache.open(QFile::WriteOnly)) {
327 qCWarning(KI18NLD) << "Failed to write ISO 3166-2 cache:" << cache.errorString() << cache.fileName();
328 return;
329 }
330
331 uint32_t n = Iso3166_2CacheHeader;
332 cache.write(reinterpret_cast<const char *>(&n), 4); // header
333 n = subdivNameMap.size();
334 cache.write(reinterpret_cast<const char *>(&n), 4); // size of the name map
335 for (auto entry : subdivNameMap) {
336 cache.write(reinterpret_cast<const char *>(&entry), sizeof(entry));
337 }
338 n = subdivParentMap.size();
339 cache.write(reinterpret_cast<const char *>(&n), 4); // size of the hierarchy map
340 for (auto entry : subdivParentMap) {
341 cache.write(reinterpret_cast<const char *>(&entry), sizeof(entry));
342 }
343 cache.write(iso3166_2stringTable);
344}
char * toString(const EngineQuery &query)
QString path(const QString &relativePath)
QByteArray & append(QByteArrayView data)
qsizetype size() const const
bool mkpath(const QString &dirPath) const const
bool exists(const QString &path)
QJsonDocument fromJson(const QByteArray &json, QJsonParseError *error)
QJsonValue value(QLatin1StringView key) const const
QString toString() const const
QString locate(StandardLocation type, const QString &fileName, LocateOptions options)
QString writableLocation(StandardLocation type)
bool isEmpty() const const
QByteArray toUtf8() const const
This file is part of the KDE documentation.
Documentation copyright © 1996-2025 The KDE developers.
Generated on Fri Apr 4 2025 12:07:41 by doxygen 1.13.2 written by Dimitri van Heesch, © 1997-2006

KDE's Doxygen guidelines are available online.