// Copyright 2014 The Flutter Authors. All rights reserved.
// Use of this source code is governed by a BSD-style license that can be
// found in the LICENSE file.

5
import 'dart:convert';
6 7 8 9 10
import 'dart:io';

import 'package:args/args.dart' as argslib;
import 'package:meta/meta.dart';

11 12
import 'language_subtag_registry.dart';

13 14 15
/// Signature of a callback that takes a `regenerateInstructions` string and
/// returns a string.
///
/// NOTE(review): presumably the returned string is the header text of a
/// generated file -- confirm against the callers.
typedef HeaderGenerator = String Function(String regenerateInstructions);

/// Signature of a callback that takes a [LocaleInfo] and returns a string.
///
/// NOTE(review): presumably the returned string is constructor source code
/// for the class generated for `locale` -- confirm against the callers.
typedef ConstructorGenerator = String Function(LocaleInfo locale);

16 17 18 19
/// Comparator that orders file system entities by their [FileSystemEntity.path]
/// using [String.compareTo].
int sortFilesByPath(FileSystemEntity a, FileSystemEntity b) => a.path.compareTo(b.path);

20
/// Simple data class to hold a parsed locale. Does not promise validity of any data.
///
/// Two instances are equal when their [originalString]s are equal, and
/// instances sort by [originalString].
@immutable
class LocaleInfo implements Comparable<LocaleInfo> {
  /// Creates a locale description from already-parsed components.
  ///
  /// No consistency checks are made between the arguments.
  const LocaleInfo({
    required this.languageCode,
    this.scriptCode,
    this.countryCode,
    required this.length,
    required this.originalString,
  });

  /// Simple parser. Expects the locale string to be in the form of 'language_script_COUNTRY'
  /// where the language is 2 characters, script is 4 characters with the first uppercase,
  /// and country is 2-3 characters and all uppercase.
  ///
  /// 'language_COUNTRY' or 'language_script' are also valid. Missing fields will be null.
  ///
  /// When `deriveScriptCode` is true, if [scriptCode] was unspecified, it will
  /// be derived from the [languageCode] and [countryCode] if possible. In that
  /// case [originalString] is rebuilt from the resulting fields and [length]
  /// counts the derived script code.
  factory LocaleInfo.fromString(String locale, { bool deriveScriptCode = false }) {
    final List<String> codes = locale.split('_'); // [language, script, country]
    assert(codes.isNotEmpty && codes.length < 4);
    final String languageCode = codes[0];
    String? scriptCode;
    String? countryCode;
    int length = codes.length;
    String originalString = locale;
    if (codes.length == 2) {
      // A lone second field is a script when it has four or more characters,
      // otherwise it is a country.
      if (codes[1].length >= 4) {
        scriptCode = codes[1];
      } else {
        countryCode = codes[1];
      }
    } else if (codes.length == 3) {
      // The longer of the two trailing fields is the script, the shorter one
      // the country; on a tie both resolve to the last field.
      scriptCode = codes[1].length > codes[2].length ? codes[1] : codes[2];
      countryCode = codes[1].length < codes[2].length ? codes[1] : codes[2];
    }
    assert(codes[0].isNotEmpty);
    assert(countryCode == null || countryCode.isNotEmpty);
    assert(scriptCode == null || scriptCode.isNotEmpty);

    if (deriveScriptCode && scriptCode == null) {
      scriptCode = _deriveScriptCode(languageCode, countryCode);
      // Increment length if we were able to assume a scriptCode.
      if (scriptCode != null) {
        length += 1;
      }
      // Update the base string to reflect assumed scriptCodes.
      originalString = <String>[
        languageCode,
        if (scriptCode != null) scriptCode,
        if (countryCode != null) countryCode,
      ].join('_');
    }

    return LocaleInfo(
      languageCode: languageCode,
      scriptCode: scriptCode,
      countryCode: countryCode,
      length: length,
      originalString: originalString,
    );
  }

  /// Script assumed for Chinese ('zh') in each country that has an entry.
  static const Map<String, String> _chineseScriptCodes = <String, String>{
    'CN': 'Hans',
    'SG': 'Hans',
    'TW': 'Hant',
    'HK': 'Hant',
    'MO': 'Hant',
  };

  /// Returns the script code that can be assumed for a locale that does not
  /// specify one, or null when no assumption is made.
  ///
  /// Adds scriptCodes to locales where we are able to assume it to provide
  /// finer granularity when resolving locales.
  ///
  /// The basis of the assumptions here are based off of known usage of scripts
  /// across various countries. For example, we know Taiwan uses traditional (Hant)
  /// script, so it is safe to apply (Hant) to Taiwanese languages.
  static String? _deriveScriptCode(String languageCode, String? countryCode) {
    switch (languageCode) {
      case 'zh':
        // Chinese without a country is assumed to be Hans.
        if (countryCode == null) {
          return 'Hans';
        }
        return _chineseScriptCodes[countryCode];
      case 'sr':
        // Serbian is only assumed to be Cyrl when no country is given.
        return countryCode == null ? 'Cyrl' : null;
    }
    return null;
  }

  /// The first field of the locale string.
  final String languageCode;

  /// The script field, or null when neither specified nor derived.
  final String? scriptCode;

  /// The country field, or null when unspecified.
  final String? countryCode;

  final int length;             // The number of fields. Ranges from 1-3.
  final String originalString;  // Original un-parsed locale string.

  /// Returns [originalString] with each '_'-separated part capitalized
  /// (first character upper case, the rest lower case) and the parts
  /// concatenated, e.g. 'zh_Hant_TW' becomes 'ZhHantTw'.
  String camelCase() {
    return originalString
      .split('_')
      .map<String>((String part) => part.substring(0, 1).toUpperCase() + part.substring(1).toLowerCase())
      .join();
  }

  @override
  bool operator ==(Object other) {
    return other is LocaleInfo
        && other.originalString == originalString;
  }

  @override
  int get hashCode => originalString.hashCode;

  @override
  String toString() {
    return originalString;
  }

  @override
  int compareTo(LocaleInfo other) {
    return originalString.compareTo(other.originalString);
  }
}

146 147 148
/// Loads every ARB file in [directory] whose path matches [filenamePattern]
/// into [localeToResources] and [localeToResourceAttributes].
///
/// The first capture group of [filenamePattern] must yield the locale string
/// of the file (for example 'en' or 'zh_Hant_TW'). Files are visited in path
/// order. For each file, keys starting with '@' are stored (without the '@')
/// in [localeToResourceAttributes]; all other keys are stored in
/// [localeToResources] and their values must be strings.
///
/// When a file's locale has a (specified or derived) script code and no data
/// exists yet for the matching 'language_script' locale, the file's data is
/// also stored under that locale as an assumed default. Such assumed data is
/// replaced if an explicit file for that locale is encountered later.
void loadMatchingArbsIntoBundleMaps({
  required Directory directory,
  required RegExp filenamePattern,
  required Map<LocaleInfo, Map<String, String>> localeToResources,
  required Map<LocaleInfo, Map<String, dynamic>> localeToResourceAttributes,
}) {
  // Set that holds the locales that were assumed from the existing locales.
  //
  // For example, when the data lacks data for zh_Hant, we will use the data of
  // the first Hant Chinese locale as a default by repeating the data. If an
  // explicit match is later found, we can reference this set to see if we should
  // overwrite the existing assumed data.
  final Set<LocaleInfo> assumedLocales = <LocaleInfo>{};

  // Helper method to fill the maps with the correct data from file. The map
  // entries for `locale` must already exist.
  void populateResources(LocaleInfo locale, File file) {
    final Map<String, String> resources = localeToResources[locale]!;
    final Map<String, dynamic> attributes = localeToResourceAttributes[locale]!;
    final Map<String, dynamic> bundle = json.decode(file.readAsStringSync()) as Map<String, dynamic>;
    for (final String key in bundle.keys) {
      // The ARB file resource "attributes" for foo are called @foo.
      if (key.startsWith('@')) {
        attributes[key.substring(1)] = bundle[key];
      } else {
        resources[key] = bundle[key] as String;
      }
    }
  }

  for (final FileSystemEntity entity in directory.listSync().toList()..sort(sortFilesByPath)) {
    final String entityPath = entity.path;
    if (!FileSystemEntity.isFileSync(entityPath)) {
      continue;
    }
    // A single match both filters the file and extracts its locale string.
    final RegExpMatch? match = filenamePattern.firstMatch(entityPath);
    if (match == null) {
      continue;
    }
    final String localeString = match[1]!;
    final File arbFile = File(entityPath);

    // Only pre-assume scriptCode if there is a country or script code to assume off of.
    // When we assume scriptCode based on languageCode-only, we want this initial pass
    // to use the un-assumed version as a base class.
    LocaleInfo locale = LocaleInfo.fromString(localeString, deriveScriptCode: localeString.split('_').length > 1);
    // Allow overwrite if the existing data is assumed.
    if (assumedLocales.contains(locale)) {
      localeToResources[locale] = <String, String>{};
      localeToResourceAttributes[locale] = <String, dynamic>{};
      assumedLocales.remove(locale);
    } else {
      localeToResources[locale] ??= <String, String>{};
      localeToResourceAttributes[locale] ??= <String, dynamic>{};
    }
    populateResources(locale, arbFile);

    // Add an assumed locale to default to when there is no info on scriptOnly locales.
    locale = LocaleInfo.fromString(localeString, deriveScriptCode: true);
    if (locale.scriptCode != null) {
      final LocaleInfo scriptLocale = LocaleInfo.fromString('${locale.languageCode}_${locale.scriptCode}');
      if (!localeToResources.containsKey(scriptLocale)) {
        assumedLocales.add(scriptLocale);
        localeToResources[scriptLocale] ??= <String, String>{};
        localeToResourceAttributes[scriptLocale] ??= <String, dynamic>{};
        populateResources(scriptLocale, arbFile);
      }
    }
  }
}

212
/// Writes `fatal: ` followed by [errorMessage] to stderr and terminates the
/// process with exit code 1.
void exitWithError(String errorMessage) {
  stderr.writeln('fatal: $errorMessage');
  exit(1);
}

/// Exits with an error (see [exitWithError]) unless the current working
/// directory contains a `.git` entry.
///
/// `.git` is accepted whether it is a directory (regular checkout) or a file
/// (as Git creates for linked worktrees and submodules). [commandName] is only
/// used in the error message.
void checkCwdIsRepoRoot(String commandName) {
  final bool isRepoRoot =
      FileSystemEntity.typeSync('.git') != FileSystemEntityType.notFound;

  if (!isRepoRoot) {
    exitWithError(
      '$commandName must be run from the root of the Flutter repository. The '
      'current working directory is: ${Directory.current.path}'
    );
  }
}

/// Parses the command line arguments in [rawArgs] into a [GeneratorOptions].
///
/// Recognizes the flags `--help`/`-h`, `--overwrite`/`-w`,
/// `--remove-undefined`, `--material` and `--cupertino`. When `--help` is
/// passed, the usage text is written to stderr and the process exits with
/// code 0.
GeneratorOptions parseArgs(List<String> rawArgs) {
  final argslib.ArgParser argParser = argslib.ArgParser()
    ..addFlag(
      'help',
      abbr: 'h',
      help: 'Print the usage message for this command',
    )
    ..addFlag(
      'overwrite',
      abbr: 'w',
      help: 'Overwrite existing localizations',
    )
    ..addFlag(
      'remove-undefined',
      help: 'Remove any localizations that are not defined in the canonical locale.',
    )
    ..addFlag(
      'material',
      help: 'Whether to print the generated classes for the Material package only. Ignored when --overwrite is passed.',
    )
    ..addFlag(
      'cupertino',
      help: 'Whether to print the generated classes for the Cupertino package only. Ignored when --overwrite is passed.',
    );
  final argslib.ArgResults args = argParser.parse(rawArgs);
  if (args.wasParsed('help') && args['help'] == true) {
    stderr.writeln(argParser.usage);
    exit(0);
  }

  return GeneratorOptions(
    writeToFile: args['overwrite'] as bool,
    materialOnly: args['material'] as bool,
    cupertinoOnly: args['cupertino'] as bool,
    removeUndefined: args['remove-undefined'] as bool,
  );
}

/// The command line options produced by [parseArgs].
class GeneratorOptions {
  /// Creates a set of options; every flag must be given explicitly.
  GeneratorOptions({
    required this.writeToFile,
    required this.removeUndefined,
    required this.materialOnly,
    required this.cupertinoOnly,
  });

  /// The value of the `--overwrite` flag.
  final bool writeToFile;

  /// The value of the `--remove-undefined` flag.
  final bool removeUndefined;

  /// The value of the `--material` flag.
  final bool materialOnly;

  /// The value of the `--cupertino` flag.
  final bool cupertinoOnly;
}
283 284 285 286

// See also //master/tools/gen_locale.dart in the engine repo.
/// Parses one record of 'Name: value' lines into a map from each name to the
/// list of its values, in order of appearance.
///
/// Empty lines are skipped. A line starting with two spaces continues the
/// most recently added value; it is appended with its first character (one of
/// the two spaces) removed.
///
/// Throws a [FormatException] for a line that has no colon after its first
/// character, and for a continuation line that precedes any 'Name: value'
/// line.
Map<String, List<String>> _parseSection(String section) {
  final Map<String, List<String>> result = <String, List<String>>{};
  // The value list that received the most recent value, if any.
  List<String>? lastHeading;
  for (final String line in section.split('\n')) {
    if (line == '') {
      continue;
    }
    if (line.startsWith('  ')) {
      if (lastHeading == null) {
        throw FormatException('continuation line without a preceding field: "$line"');
      }
      lastHeading[lastHeading.length - 1] = '${lastHeading.last}${line.substring(1)}';
      continue;
    }
    final int colon = line.indexOf(':');
    if (colon <= 0) {
      throw FormatException('not sure how to deal with "$line"');
    }
    final String name = line.substring(0, colon);
    // Skip the colon and the single space that follows it.
    final String value = line.substring(colon + 2);
    lastHeading = result.putIfAbsent(name, () => <String>[])..add(value);
  }
  return result;
}

// Lookup tables from subtag to description. They start out empty and are
// filled by [precacheLanguageAndRegionTags]; [describeLocale] reads them.
final Map<String, String> _languages = <String, String>{};
final Map<String, String> _regions = <String, String>{};
final Map<String, String> _scripts = <String, String>{};

/// Marker at which [precacheLanguageAndRegionTags] cuts off a description,
/// dropping the marker and everything after it.
const String kProvincePrefix = ', Province of ';

/// Marker (the start of a parenthetical) at which
/// [precacheLanguageAndRegionTags] cuts off a description, dropping the marker
/// and everything after it.
const String kParentheticalPrefix = ' (';

/// Prepares the data for the [describeLocale] method below.
///
/// The data is obtained from the official IANA registry.
///
/// Every registry record of type 'language', 'region' or 'script' has its
/// description stored under its subtag in the matching lookup table. Before
/// being stored, descriptions are adjusted so they read well in a sentence:
/// 'the ' is prepended to names starting with 'United ' or (after truncation)
/// ending in ' Republic', and anything from a parenthetical or from
/// ', Province of ' onwards is dropped.
void precacheLanguageAndRegionTags() {
  // The text before the first '%%' separator is not a record, so skip it.
  final List<Map<String, List<String>>> sections =
      languageSubtagRegistry.split('%%').skip(1).map<Map<String, List<String>>>(_parseSection).toList();
  for (final Map<String, List<String>> section in sections) {
    assert(section.containsKey('Type'), section.toString());
    final String type = section['Type']!.single;
    if (type == 'language' || type == 'region' || type == 'script') {
      assert(section.containsKey('Subtag') && section.containsKey('Description'), section.toString());
      final String subtag = section['Subtag']!.single;
      String description = section['Description']!.join(' ');
      if (description.startsWith('United ')) {
        description = 'the $description';
      }
      if (description.contains(kParentheticalPrefix)) {
        description = description.substring(0, description.indexOf(kParentheticalPrefix));
      }
      if (description.contains(kProvincePrefix)) {
        description = description.substring(0, description.indexOf(kProvincePrefix));
      }
      if (description.endsWith(' Republic')) {
        description = 'the $description';
      }
      switch (type) {
        case 'language':
          _languages[subtag] = description;
          break;
        case 'region':
          _regions[subtag] = description;
          break;
        case 'script':
          _scripts[subtag] = description;
          break;
      }
    }
  }
}

/// Returns an English description of the locale identified by [tag], a
/// '_'-separated string such as 'en', 'en_US', 'zh_Hant' or 'zh_Hant_TW'.
///
/// The result is the language description, followed by
/// ', as used in <region>' and/or ', using the <script> script' when the
/// corresponding subtags are found.
///
/// The lookup tables must have been filled by
/// [precacheLanguageAndRegionTags] first; the language subtag must be present
/// in them.
String describeLocale(String tag) {
  final List<String> subtags = tag.split('_');
  assert(subtags.isNotEmpty);
  assert(_languages.containsKey(subtags[0]));
  final String language = _languages[subtags[0]]!;
  String output = language;
  String? region;
  String? script;
  if (subtags.length == 2) {
    // The second subtag may be either a region or a script; look up both.
    region = _regions[subtags[1]];
    script = _scripts[subtags[1]];
    assert(region != null || script != null);
  } else if (subtags.length >= 3) {
    region = _regions[subtags[2]];
    script = _scripts[subtags[1]];
    assert(region != null && script != null);
  }
  if (region != null) {
    output += ', as used in $region';
  }
  if (script != null) {
    output += ', using the $script script';
  }
  return output;
}

/// Writes the header of each class which corresponds to a locale.
///
/// Returns a blank line, a doc comment describing [locale] (see
/// [describeLocale]), and the opening line of a class named [classNamePrefix]
/// followed by the camel-cased locale, extending [superClass]. The returned
/// text ends with the opening brace and has no trailing newline.
String generateClassDeclaration(
  LocaleInfo locale,
  String classNamePrefix,
  String superClass,
) {
  final String camelCaseName = locale.camelCase();
  return '''

/// The translations for ${describeLocale(locale.originalString)} (`${locale.originalString}`).
class $classNamePrefix$camelCaseName extends $superClass {''';
}

393
/// Return the input string as a Dart-parseable string.
394 395
///
/// ```
396 397 398 399
/// foo => 'foo'
/// foo "bar" => 'foo "bar"'
/// foo 'bar' => "foo 'bar'"
/// foo 'bar' "baz" => '''foo 'bar' "baz"'''
400 401
/// ```
///
402 403
/// This function is used by tools that take in a JSON-formatted file to
/// generate Dart code. For this reason, characters with special meaning
404 405 406
/// in JSON files are escaped. For example, the backspace character (\b)
/// has to be properly escaped by this function so that the generated
/// Dart code correctly represents this character:
407 408 409 410 411 412
/// ```
/// foo\bar => 'foo\\bar'
/// foo\nbar => 'foo\\nbar'
/// foo\\nbar => 'foo\\\\nbar'
/// foo\\bar => 'foo\\\\bar'
/// foo\ bar => 'foo\\ bar'
413
/// foo$bar = 'foo\$bar'
414
/// ```
415
String generateString(String value) {
416 417 418 419 420 421 422 423 424 425 426 427 428
  if (<String>['\n', '\f', '\t', '\r', '\b'].every((String pattern) => !value.contains(pattern))) {
    final bool hasDollar = value.contains(r'$');
    final bool hasBackslash = value.contains(r'\');
    final bool hasQuote = value.contains("'");
    final bool hasDoubleQuote = value.contains('"');
    if (!hasQuote) {
      return hasBackslash || hasDollar ? "r'$value'" : "'$value'";
    }
    if (!hasDoubleQuote) {
      return hasBackslash || hasDollar ? 'r"$value"' : '"$value"';
    }
  }

429 430 431 432 433 434 435 436 437
  const String backslash = '__BACKSLASH__';
  assert(
    !value.contains(backslash),
    'Input string cannot contain the sequence: '
    '"__BACKSLASH__", as it is used as part of '
    'backslash character processing.'
  );

  value = value
438 439
    // Replace backslashes with a placeholder for now to properly parse
    // other special characters.
440 441 442 443 444 445 446 447 448
    .replaceAll(r'\', backslash)
    .replaceAll(r'$', r'\$')
    .replaceAll("'", r"\'")
    .replaceAll('"', r'\"')
    .replaceAll('\n', r'\n')
    .replaceAll('\f', r'\f')
    .replaceAll('\t', r'\t')
    .replaceAll('\r', r'\r')
    .replaceAll('\b', r'\b')
449
    // Reintroduce escaped backslashes into generated Dart string.
450
    .replaceAll(backslash, r'\\');
451 452

  return "'$value'";
453
}
454 455 456 457

/// Only used to generate localization strings for the Kannada locale ('kn') because
/// some of the localized strings contain characters that can crash Emacs on Linux.
/// See packages/flutter_localizations/lib/src/l10n/README for more information.
///
/// For any [locale] other than 'kn', or when every code point of [value] is
/// at most 0xFF, this returns `generateString(value)`. Otherwise it returns a
/// single-quoted literal in which every code point of [value] is written as a
/// `\u{...}` escape with a lower-case hexadecimal value.
String generateEncodedString(String? locale, String value) {
  if (locale != 'kn' || value.runes.every((int code) => code <= 0xFF)) {
    return generateString(value);
  }

  final String unicodeEscapes = value.runes.map((int code) => '\\u{${code.toRadixString(16)}}').join();
  return "'$unicodeEscapes'";
}