lib/web_ui/tool/unicode_sync_script.dart - mirrors/engine - Git at Google

 // Copyright 2013 The Flutter Authors. All rights reserved.
 // Use of this source code is governed by a BSD-style license that can be
 // found in the LICENSE file.

 // @dart = 2.6
 import 'dart:io';

 import 'package:args/args.dart';
 import 'package:path/path.dart' as path;

 // Code units of the ASCII letters 'A' and 'a'. They are the base offsets used
 // by `EnumValue.serialized` to encode an enum index as a single letter.
 const int _kChar_A = 65;
 const int _kChar_a = 97;

 /// Parser for the command-line arguments of this script.
 ///
 /// `--words` (`-w`) and `--lines` (`-l`) are options that carry a value, while
 /// `--dry` (`-d`) is a boolean flag.
 final ArgParser argParser = ArgParser()
   ..addOption(
     'words',
     abbr: 'w',
     help: 'Sync the word break properties.',
   )
   ..addOption(
     'lines',
     abbr: 'l',
     help: 'Sync the line break properties.',
   )
   ..addFlag(
     'dry',
     abbr: 'd',
     help: 'Dry mode does not write anything to disk. '
         'The output is printed to the console.',
   );

 /// A map of properties that could safely be normalized into other properties.
 ///
 /// For example, a NL behaves exactly the same as BK so it gets normalized to BK
 /// in the generated code.
 ///
 /// Keys are property names as parsed from the source file; values are the
 /// property names they are replaced with.
 const Map<String, String> normalizationTable = <String, String>{
   // NL behaves exactly the same as BK.
   // See: https://www.unicode.org/reports/tr14/tr14-45.html#NL
   'NL': 'BK',
   // In the absence of extra data (ICU data and language dictionaries), the
   // following properties will be treated as AL (alphabetic): AI, SA, SG and XX.
   // See LB1: https://www.unicode.org/reports/tr14/tr14-45.html#LB1
   'AI': 'AL',
   'SA': 'AL',
   'SG': 'AL',
   'XX': 'AL',
   // CJ is normalized to NS.
   // See: https://unicode.org/reports/tr14/tr14-45.html#CJ
   'CJ': 'NS',
 };

 /// An inclusive span of code points, from [start] to [end], tagged with a
 /// [property].
 class UnicodeRange {
   const UnicodeRange(this.start, this.end, this.property);

   /// First code point covered by this range.
   final int start;

   /// Last code point covered by this range (inclusive).
   final int end;

   /// The property shared by every code point of this range.
   final EnumValue property;

   /// Whether this range and [other] have at least one code point in common.
   bool isOverlapping(UnicodeRange other) =>
       start <= other.end && end >= other.start;

   /// Whether [other] can be appended to this range.
   ///
   /// That is the case when [other] starts right after this range ends and
   /// both ranges carry the same property.
   bool isAdjacent(UnicodeRange other) =>
       other.start == end + 1 && property == other.property;

   /// Returns a new range that spans from [start] to the end of [extension].
   ///
   /// [extension] is expected to be adjacent to this range (checked with an
   /// assertion).
   UnicodeRange extendRange(UnicodeRange extension) {
     assert(isAdjacent(extension));
     final int mergedEnd = extension.end;
     return UnicodeRange(start, mergedEnd, property);
   }
 }

 /// Directory that receives the generated files, resolved relative to the
 /// directory that contains this script.
 final String codegenPath = path.join(
   path.dirname(Platform.script.toFilePath()),
   '../lib/src/engine/text',
 );

 /// Destination file for the generated word break properties code.
 final String wordBreakCodegen =
     path.join(codegenPath, 'word_break_properties.dart');

 /// Destination file for the generated line break properties code.
 final String lineBreakCodegen =
     path.join(codegenPath, 'line_break_properties.dart');

 /// Usage (from the root of the web_ui project).
 ///
 /// To generate code for word break properties:
 /// ```
 /// dart tool/unicode_sync_script.dart -w <path/to/word/break/properties>
 /// ```
 ///
 /// To generate code for line break properties:
 /// ```
 /// dart tool/unicode_sync_script.dart -l <path/to/line/break/properties>
 /// ```
 ///
 /// To do a dry run, add the `-d` flag:
 ///
 /// ```
 /// dart tool/unicode_sync_script.dart -d ...
 /// ```
 ///
 /// This script parses the unicode word/line break properties(1) and generates Dart
 /// code(2) that can perform lookups in the unicode ranges to find what property
 /// a letter has.
 ///
 /// (1) The word break properties file can be downloaded from:
 ///     https://www.unicode.org/Public/13.0.0/ucd/auxiliary/WordBreakProperty.txt
 ///
 ///     The line break properties file can be downloaded from:
 ///     https://www.unicode.org/Public/13.0.0/ucd/LineBreak.txt
 ///
 /// (2) The codegen'd Dart files are located at:
 ///     lib/src/engine/text/word_break_properties.dart
 ///     lib/src/engine/text/line_break_properties.dart
 void main(List<String> arguments) async {
   final ArgResults parsedArgs = argParser.parse(arguments);
   final String wordsPath = parsedArgs['words'];
   final String linesPath = parsedArgs['lines'];
   final bool isDryRun = parsedArgs['dry'];

   // getSyncer terminates the process unless exactly one properties file was
   // supplied on the command line.
   getSyncer(wordsPath, linesPath, isDryRun).perform();
 }

 /// Creates the syncer that matches the properties file given on the command
 /// line.
 ///
 /// Exactly one of [wordBreakProperties] and [lineBreakProperties] must be
 /// non-null. Otherwise an error message and the usage text are printed and the
 /// process exits with code 64.
 ///
 /// When [dry] is true, the returned syncer is created through the `dry`
 /// constructor and has no destination file.
 PropertiesSyncer getSyncer(
   String wordBreakProperties,
   String lineBreakProperties,
   bool dry,
 ) {
   final bool hasWords = wordBreakProperties != null;
   final bool hasLines = lineBreakProperties != null;

   // Both flags equal means either no file or two files were given.
   if (hasWords == hasLines) {
     final String problem = hasWords ? 'Both were given.' : 'None was given.';
     print(
         'Expecting either a word break properties file or a line break properties file. $problem\n');
     print(argParser.usage);
     exit(64);
   }

   if (hasWords) {
     return dry
         ? WordBreakPropertiesSyncer.dry(wordBreakProperties)
         : WordBreakPropertiesSyncer(wordBreakProperties, wordBreakCodegen);
   }
   return dry
       ? LineBreakPropertiesSyncer.dry(lineBreakProperties)
       : LineBreakPropertiesSyncer(lineBreakProperties, lineBreakCodegen);
 }

 /// Base class that provides common logic for syncing all kinds of unicode
 /// properties (e.g. word break properties, line break properties, etc).
 ///
 /// [perform] reads the properties file, parses it into a [PropertyCollection]
 /// and renders the generated Dart source through [template]. Subclasses only
 /// supply [prefix], [enumDocLink] and [defaultProperty].
 abstract class PropertiesSyncer {
   /// Creates a syncer that reads [_src] and writes the generated code to
   /// [_dest].
   PropertiesSyncer(this._src, this._dest) : _dryRun = false;

   /// Creates a syncer that reads [_src] and prints the generated code instead
   /// of writing it to disk.
   PropertiesSyncer.dry(this._src)
       : _dest = null,
         _dryRun = true;

   final String _src;
   final String _dest;
   final bool _dryRun;

   /// Name fragment used to build the generated identifiers, e.g.
   /// `${prefix}CharProperty`.
   String get prefix;

   /// Link emitted in the doc comment of the generated enum.
   String get enumDocLink;

   /// The default property to be used when a certain code point doesn't belong
   /// to any known range.
   String get defaultProperty;

   /// Reads the source file, generates the code and either prints it (dry run)
   /// or writes it to the destination file.
   ///
   /// The returned future completes once the destination file has been closed.
   Future<void> perform() async {
     final List<String> lines = await File(_src).readAsLines();
     final List<String> header = extractHeader(lines);
     final PropertyCollection data =
         PropertyCollection.fromLines(lines, defaultProperty);

     final String output = template(header, data);

     if (_dryRun) {
       print(output);
       return;
     }

     final IOSink sink = File(_dest).openWrite();
     try {
       sink.write(output);
     } finally {
       // Closing flushes pending data and releases the file handle.
       await sink.close();
     }
   }

   /// Renders the generated Dart source for [data].
   ///
   /// [header] holds the leading lines of the source file; they are copied
   /// into the generated file as comments.
   String template(List<String> header, PropertyCollection data) {
     return '''
 // Copyright 2013 The Flutter Authors. All rights reserved.
 // Use of this source code is governed by a BSD-style license that can be
 // found in the LICENSE file.

 // AUTO-GENERATED FILE.
 // Generated by: tool/unicode_sync_script.dart
 //
 // Source:
 // ${header.join('\n// ')}

 part of engine;

 /// For an explanation of these enum values, see:
 ///
 /// * ${enumDocLink}
 enum ${prefix}CharProperty {
   ${_getEnumValues(data.enumCollection).join('\n  ')}
 }

 const String _packed${prefix}BreakProperties =
   '${_packProperties(data)}';


 UnicodePropertyLookup<${prefix}CharProperty> ${prefix.toLowerCase()}Lookup =
     UnicodePropertyLookup<${prefix}CharProperty>.fromPackedData(
   _packed${prefix}BreakProperties,
   ${_getSingleRangesCount(data)},
   ${prefix}CharProperty.values,
   ${prefix}CharProperty.${defaultProperty},
 );
 ''';
   }

   /// Returns the source lines that declare the enum values.
   ///
   /// A value that absorbed other properties through normalization is preceded
   /// by a comment that lists them.
   Iterable<String> _getEnumValues(EnumCollection enumCollection) {
     return enumCollection.values.expand(
       (EnumValue value) => <String>[
         if (value.normalizedFrom.isNotEmpty)
           '// Normalized from: ${value.normalizedFrom.join(', ')}',
         '${value.enumName}, // serialized as "${value.serialized}"',
       ],
     );
   }

   /// Counts the ranges that cover exactly one code point.
   int _getSingleRangesCount(PropertyCollection data) {
     int count = 0;
     for (final UnicodeRange range in data.ranges) {
       if (range.start == range.end) {
         count++;
       }
     }
     return count;
   }

   /// Packs all ranges into a single string.
   ///
   /// Each range is written as its start in base 36 (left-padded with zeros to
   /// 4 characters), followed by either `!` for a single code point or the end
   /// in the same format, followed by the serialized property.
   String _packProperties(PropertyCollection data) {
     final StringBuffer buffer = StringBuffer();
     for (final UnicodeRange range in data.ranges) {
       buffer.write(range.start.toRadixString(36).padLeft(4, '0'));
       if (range.start == range.end) {
         buffer.write('!');
       } else {
         buffer.write(range.end.toRadixString(36).padLeft(4, '0'));
       }
       buffer.write(range.property.serialized);
     }
     return buffer.toString();
   }
 }

 /// Generates the lookup code for Unicode's word break properties.
 class WordBreakPropertiesSyncer extends PropertiesSyncer {
   WordBreakPropertiesSyncer(String src, String dest) : super(src, dest);
   WordBreakPropertiesSyncer.dry(String src) : super.dry(src);

   @override
   String get prefix => 'Word';

   @override
   String get enumDocLink =>
       'http://unicode.org/reports/tr29/#Table_Word_Break_Property_Values';

   @override
   String get defaultProperty => 'Unknown';
 }

 /// Generates the lookup code for Unicode's line break properties.
 class LineBreakPropertiesSyncer extends PropertiesSyncer {
   LineBreakPropertiesSyncer(String src, String dest) : super(src, dest);
   LineBreakPropertiesSyncer.dry(String src) : super.dry(src);

   @override
   String get prefix => 'Line';

   @override
   String get enumDocLink =>
       'https://www.unicode.org/reports/tr14/tr14-45.html#DescriptionOfProperties';

   @override
   String get defaultProperty => 'AL';
 }

 /// Holds the collection of properties parsed from the unicode spec file.
 class PropertyCollection {
   /// Parses [lines] into [ranges] and fills [enumCollection] along the way.
   ///
   /// Comments are stripped from every line and lines without remaining
   /// content are skipped. [defaultProperty] is added to [enumCollection] when
   /// no parsed line mentioned it.
   ///
   /// Throws a [FormatException] for a line that has content but no `;`
   /// separator.
   PropertyCollection.fromLines(List<String> lines, String defaultProperty) {
     final List<UnicodeRange> unprocessedRanges = lines
         .map(removeCommentFromLine)
         // Trim before testing so that whitespace-only leftovers (e.g. from an
         // indented comment line) are skipped instead of failing to parse.
         .where((String line) => line.trim().isNotEmpty)
         .map(parseLineIntoUnicodeRange)
         .toList();
     // Make sure the default property is part of the enum. Adding a name that
     // is already registered leaves the collection unchanged.
     enumCollection.add(defaultProperty);
     ranges = processRanges(unprocessedRanges, defaultProperty).toList();
   }

   /// The sorted and merged ranges.
   List<UnicodeRange> ranges;

   /// The enum values referenced by [ranges], plus the default property.
   final EnumCollection enumCollection = EnumCollection();

   /// Examples:
   ///
   /// 00C0..00D6    ; ALetter
   /// 037F          ; ALetter
   ///
   /// Would be parsed into:
   ///
   /// ```dart
   /// UnicodeRange(192, 214, EnumValue('ALetter'));
   /// UnicodeRange(895, 895, EnumValue('ALetter'));
   /// ```
   ///
   /// A property listed in [normalizationTable] is registered under its
   /// normalized name, and the original name is recorded on the enum value.
   UnicodeRange parseLineIntoUnicodeRange(String line) {
     final List<String> split = line.split(';');
     if (split.length < 2) {
       throw FormatException('Expected "<range> ; <property>"', line);
     }
     final String rangeStr = split[0].trim();
     final String propertyStr = split[1].trim();

     final EnumValue property = normalizationTable.containsKey(propertyStr)
         ? enumCollection.add(normalizationTable[propertyStr], propertyStr)
         : enumCollection.add(propertyStr);

     return UnicodeRange(
       getRangeStart(rangeStr),
       getRangeEnd(rangeStr),
       property,
     );
   }
 }

 /// An ordered collection of enum values that are unique by name.
 class EnumCollection {
   /// The registered values, in insertion order.
   final List<EnumValue> values = <EnumValue>[];

   /// Returns the value called [name], registering it first when it is new.
   ///
   /// When [normalizedFrom] is given, it is recorded on the returned value.
   EnumValue add(String name, [String normalizedFrom]) {
     final int existingAt =
         values.indexWhere((EnumValue candidate) => candidate.name == name);

     EnumValue entry;
     if (existingAt != -1) {
       entry = values[existingAt];
     } else {
       entry = EnumValue(values.length, name);
       values.add(entry);
     }

     if (normalizedFrom == null) {
       return entry;
     }
     entry.normalizedFrom.add(normalizedFrom);
     return entry;
   }
 }

 /// Represents a single value in an [EnumCollection].
 class EnumValue {
   EnumValue(this.index, this.name);

   /// Zero-based position of this value in its collection.
   final int index;

   /// The property name as it was registered.
   final String name;

   /// The properties that were normalized to this value.
   final Set<String> normalizedFrom = <String>{};

   /// Returns a serialized, compact format of the enum value.
   ///
   /// Enum values are serialized based on their index. Indices 0 to 25 map to
   /// "A" to "Z" and indices 26 to 51 map to "a" to "z".
   ///
   /// Throws a [RangeError] when [index] is outside of 0..51, because no
   /// letter is left to represent it.
   String get serialized {
     // Fail loudly instead of silently emitting a non-letter character.
     RangeError.checkValueInInterval(index, 0, 51, 'index');
     // The first 26 enum values are assigned uppercase letters.
     if (index < 26) {
       return String.fromCharCode(_kChar_A + index);
     }
     // Enum values from index 26 onwards are assigned lowercase letters.
     return String.fromCharCode(_kChar_a + index - 26);
   }

   /// Returns the enum name that'll be used in the Dart code.
   ///
   /// This is [name] with all underscores removed.
   ///
   /// ```dart
   /// enum CharProperty {
   ///   ALetter, // <-- this is the name returned by this method ("ALetter").
   ///   Numeric,
   ///   // etc...
   /// }
   /// ```
   String get enumName {
     return name.replaceAll('_', '');
   }
 }

 /// Sorts ranges and combines adjacent ranges that have the same property and
 /// can be merged.
 ///
 /// Note that [data] itself is sorted in place. Throws an [Exception] when two
 /// ranges overlap.
 List<UnicodeRange> processRanges(
   List<UnicodeRange> data,
   String defaultProperty,
 ) {
   data.sort(
     // Ranges don't overlap so it's safe to sort based on the start of each
     // range.
     (UnicodeRange range1, UnicodeRange range2) =>
         range1.start.compareTo(range2.start),
   );
   verifyNoOverlappingRanges(data);
   return combineAdjacentRanges(data, defaultProperty);
 }

 /// Merges consecutive ranges of [data] that share a property.
 ///
 /// [data] is expected to be sorted by range start and free of overlaps.
 ///
 /// Example:
 ///
 /// ```
 /// 0x01C4..0x0293; ALetter
 /// 0x0294..0x0294; ALetter
 /// 0x0295..0x02AF; ALetter
 /// ```
 ///
 /// will get combined into:
 ///
 /// ```
 /// 0x01C4..0x02AF; ALetter
 /// ```
 ///
 /// Two consecutive ranges that both carry [defaultProperty] are merged even
 /// when there is a gap between them. An empty [data] yields an empty list.
 List<UnicodeRange> combineAdjacentRanges(
   List<UnicodeRange> data,
   String defaultProperty,
 ) {
   final List<UnicodeRange> result = <UnicodeRange>[];
   for (final UnicodeRange next in data) {
     if (result.isEmpty) {
       result.add(next);
       continue;
     }

     final UnicodeRange prev = result.last;
     final bool sameProperty = prev.property == next.property;
     final bool contiguous = next.start == prev.end + 1;
     // When there's a gap between two ranges, but they both have the default
     // property, it's safe to combine them.
     final bool bothDefault =
         sameProperty && prev.property.name == defaultProperty;

     if ((sameProperty && contiguous) || bothDefault) {
       // Build the merged range directly: extendRange asserts adjacency, which
       // does not hold when a gap between default ranges is bridged.
       result.last = UnicodeRange(prev.start, next.end, prev.property);
     } else {
       result.add(next);
     }
   }
   return result;
 }

 /// Parses the first code point of [range].
 ///
 /// [range] is either a single hexadecimal code point (`037F`) or two of them
 /// separated by `..` (`00C0..00D6`).
 int getRangeStart(String range) {
   final String startHex = range.split('..').first;
   return int.parse(startHex, radix: 16);
 }

 /// Parses the last code point of [range].
 ///
 /// For a range without `..`, the single hexadecimal code point is both start
 /// and end.
 int getRangeEnd(String range) {
   final String endHex = range.contains('..') ? range.split('..')[1] : range;
   return int.parse(endHex, radix: 16);
 }

 /// Throws an [Exception] when any range of [data] overlaps the range that
 /// directly precedes it in the list.
 void verifyNoOverlappingRanges(List<UnicodeRange> data) {
   for (int prevIdx = 0; prevIdx + 1 < data.length; prevIdx++) {
     final UnicodeRange previous = data[prevIdx];
     final UnicodeRange current = data[prevIdx + 1];
     if (current.isOverlapping(previous)) {
       throw Exception('Data contains overlapping ranges.');
     }
   }
 }

 /// Returns the leading lines of [lines] that make up the file header.
 ///
 /// The header ends right before the first line that, once trimmed, is either
 /// empty or a lone `#`.
 List<String> extractHeader(List<String> lines) {
   return lines.takeWhile((String line) {
     final String trimmed = line.trim();
     return trimmed.isNotEmpty && trimmed != '#';
   }).toList();
 }

 /// Returns [line] without its trailing comment.
 ///
 /// Everything from the first `#` onwards is dropped; a line without `#` is
 /// returned unchanged.
 String removeCommentFromLine(String line) {
   final int commentStart = line.indexOf('#');
   if (commentStart == -1) {
     return line;
   }
   return line.substring(0, commentStart);
 }
	// Copyright 2013 The Flutter Authors. All rights reserved.
	// Use of this source code is governed by a BSD-style license that can be
	// found in the LICENSE file.

	// @dart = 2.6
	import 'dart:io';

	import 'package:args/args.dart';
	import 'package:path/path.dart' as path;

	// Code units of the ASCII letters 'A' and 'a'. They are the base offsets used
	// by `EnumValue.serialized` to encode an enum index as a single letter.
	const int _kChar_A = 65;
	const int _kChar_a = 97;

	/// Parser for the command-line arguments of this script.
	///
	/// `--words` (`-w`) and `--lines` (`-l`) are options that carry a value, while
	/// `--dry` (`-d`) is a boolean flag.
	final ArgParser argParser = ArgParser()
	..addOption(
	'words',
	abbr: 'w',
	help: 'Sync the word break properties.',
	)
	..addOption(
	'lines',
	abbr: 'l',
	help: 'Sync the line break properties.',
	)
	..addFlag(
	'dry',
	abbr: 'd',
	help: 'Dry mode does not write anything to disk. '
	'The output is printed to the console.',
	);

	/// A map of properties that could safely be normalized into other properties.
	///
	/// For example, a NL behaves exactly the same as BK so it gets normalized to BK
	/// in the generated code.
	///
	/// Keys are property names as parsed from the source file; values are the
	/// property names they are replaced with.
	const Map<String, String> normalizationTable = <String, String>{
	// NL behaves exactly the same as BK.
	// See: https://www.unicode.org/reports/tr14/tr14-45.html#NL
	'NL': 'BK',
	// In the absence of extra data (ICU data and language dictionaries), the
	// following properties will be treated as AL (alphabetic): AI, SA, SG and XX.
	// See LB1: https://www.unicode.org/reports/tr14/tr14-45.html#LB1
	'AI': 'AL',
	'SA': 'AL',
	'SG': 'AL',
	'XX': 'AL',
	// CJ is normalized to NS.
	// See: https://unicode.org/reports/tr14/tr14-45.html#CJ
	'CJ': 'NS',
	};

	/// An inclusive span of code points, from [start] to [end], tagged with a
	/// [property].
	class UnicodeRange {
	  const UnicodeRange(this.start, this.end, this.property);

	  /// First code point covered by this range.
	  final int start;

	  /// Last code point covered by this range (inclusive).
	  final int end;

	  /// The property shared by every code point of this range.
	  final EnumValue property;

	  /// Whether this range and [other] have at least one code point in common.
	  bool isOverlapping(UnicodeRange other) =>
	      start <= other.end && end >= other.start;

	  /// Whether [other] can be appended to this range.
	  ///
	  /// That is the case when [other] starts right after this range ends and
	  /// both ranges carry the same property.
	  bool isAdjacent(UnicodeRange other) =>
	      other.start == end + 1 && property == other.property;

	  /// Returns a new range that spans from [start] to the end of [extension].
	  ///
	  /// [extension] is expected to be adjacent to this range (checked with an
	  /// assertion).
	  UnicodeRange extendRange(UnicodeRange extension) {
	    assert(isAdjacent(extension));
	    final int mergedEnd = extension.end;
	    return UnicodeRange(start, mergedEnd, property);
	  }
	}

	/// Directory that receives the generated files, resolved relative to the
	/// directory that contains this script.
	final String codegenPath = path.join(
	path.dirname(Platform.script.toFilePath()),
	'../lib/src/engine/text',
	);
	/// Destination file for the generated word break properties code.
	final String wordBreakCodegen =
	path.join(codegenPath, 'word_break_properties.dart');
	/// Destination file for the generated line break properties code.
	final String lineBreakCodegen =
	path.join(codegenPath, 'line_break_properties.dart');

	/// Usage (from the root of the web_ui project).
	///
	/// To generate code for word break properties:
	/// ```
	/// dart tool/unicode_sync_script.dart -w <path/to/word/break/properties>
	/// ```
	///
	/// To generate code for line break properties:
	/// ```
	/// dart tool/unicode_sync_script.dart -l <path/to/line/break/properties>
	/// ```
	///
	/// To do a dry run, add the `-d` flag:
	///
	/// ```
	/// dart tool/unicode_sync_script.dart -d ...
	/// ```
	///
	/// This script parses the unicode word/line break properties(1) and generates Dart
	/// code(2) that can perform lookups in the unicode ranges to find what property
	/// a letter has.
	///
	/// (1) The word break properties file can be downloaded from:
	/// https://www.unicode.org/Public/13.0.0/ucd/auxiliary/WordBreakProperty.txt
	///
	/// The line break properties file can be downloaded from:
	/// https://www.unicode.org/Public/13.0.0/ucd/LineBreak.txt
	///
	/// (2) The codegen'd Dart files are located at:
	/// lib/src/engine/text/word_break_properties.dart
	/// lib/src/engine/text/line_break_properties.dart
	void main(List<String> arguments) async {
	  final ArgResults parsedArgs = argParser.parse(arguments);
	  final String wordsPath = parsedArgs['words'];
	  final String linesPath = parsedArgs['lines'];
	  final bool isDryRun = parsedArgs['dry'];

	  // getSyncer terminates the process unless exactly one properties file was
	  // supplied on the command line.
	  getSyncer(wordsPath, linesPath, isDryRun).perform();
	}

	/// Creates the syncer that matches the properties file given on the command
	/// line.
	///
	/// Exactly one of [wordBreakProperties] and [lineBreakProperties] must be
	/// non-null. Otherwise an error message and the usage text are printed and the
	/// process exits with code 64.
	///
	/// When [dry] is true, the returned syncer is created through the `dry`
	/// constructor and has no destination file.
	PropertiesSyncer getSyncer(
	  String wordBreakProperties,
	  String lineBreakProperties,
	  bool dry,
	) {
	  final bool hasWords = wordBreakProperties != null;
	  final bool hasLines = lineBreakProperties != null;

	  // Both flags equal means either no file or two files were given.
	  if (hasWords == hasLines) {
	    final String problem = hasWords ? 'Both were given.' : 'None was given.';
	    print(
	        'Expecting either a word break properties file or a line break properties file. $problem\n');
	    print(argParser.usage);
	    exit(64);
	  }

	  if (hasWords) {
	    return dry
	        ? WordBreakPropertiesSyncer.dry(wordBreakProperties)
	        : WordBreakPropertiesSyncer(wordBreakProperties, wordBreakCodegen);
	  }
	  return dry
	      ? LineBreakPropertiesSyncer.dry(lineBreakProperties)
	      : LineBreakPropertiesSyncer(lineBreakProperties, lineBreakCodegen);
	}

	/// Base class that provides common logic for syncing all kinds of unicode
	/// properties (e.g. word break properties, line break properties, etc).
	///
	/// [perform] reads the properties file, parses it into a [PropertyCollection]
	/// and renders the generated Dart source through [template]. Subclasses only
	/// supply [prefix], [enumDocLink] and [defaultProperty].
	abstract class PropertiesSyncer {
	  /// Creates a syncer that reads [_src] and writes the generated code to
	  /// [_dest].
	  PropertiesSyncer(this._src, this._dest) : _dryRun = false;

	  /// Creates a syncer that reads [_src] and prints the generated code instead
	  /// of writing it to disk.
	  PropertiesSyncer.dry(this._src)
	      : _dest = null,
	        _dryRun = true;

	  final String _src;
	  final String _dest;
	  final bool _dryRun;

	  /// Name fragment used to build the generated identifiers, e.g.
	  /// `${prefix}CharProperty`.
	  String get prefix;

	  /// Link emitted in the doc comment of the generated enum.
	  String get enumDocLink;

	  /// The default property to be used when a certain code point doesn't belong
	  /// to any known range.
	  String get defaultProperty;

	  /// Reads the source file, generates the code and either prints it (dry run)
	  /// or writes it to the destination file.
	  ///
	  /// The returned future completes once the destination file has been closed.
	  Future<void> perform() async {
	    final List<String> lines = await File(_src).readAsLines();
	    final List<String> header = extractHeader(lines);
	    final PropertyCollection data =
	        PropertyCollection.fromLines(lines, defaultProperty);

	    final String output = template(header, data);

	    if (_dryRun) {
	      print(output);
	      return;
	    }

	    final IOSink sink = File(_dest).openWrite();
	    try {
	      sink.write(output);
	    } finally {
	      // Closing flushes pending data and releases the file handle.
	      await sink.close();
	    }
	  }

	  /// Renders the generated Dart source for [data].
	  ///
	  /// [header] holds the leading lines of the source file; they are copied
	  /// into the generated file as comments.
	  String template(List<String> header, PropertyCollection data) {
	    return '''
	// Copyright 2013 The Flutter Authors. All rights reserved.
	// Use of this source code is governed by a BSD-style license that can be
	// found in the LICENSE file.

	// AUTO-GENERATED FILE.
	// Generated by: tool/unicode_sync_script.dart
	//
	// Source:
	// ${header.join('\n// ')}

	part of engine;

	/// For an explanation of these enum values, see:
	///
	/// * ${enumDocLink}
	enum ${prefix}CharProperty {
	${_getEnumValues(data.enumCollection).join('\n ')}
	}

	const String _packed${prefix}BreakProperties =
	'${_packProperties(data)}';


	UnicodePropertyLookup<${prefix}CharProperty> ${prefix.toLowerCase()}Lookup =
	UnicodePropertyLookup<${prefix}CharProperty>.fromPackedData(
	_packed${prefix}BreakProperties,
	${_getSingleRangesCount(data)},
	${prefix}CharProperty.values,
	${prefix}CharProperty.${defaultProperty},
	);
	''';
	  }

	  /// Returns the source lines that declare the enum values.
	  ///
	  /// A value that absorbed other properties through normalization is preceded
	  /// by a comment that lists them.
	  Iterable<String> _getEnumValues(EnumCollection enumCollection) {
	    return enumCollection.values.expand(
	      (EnumValue value) => <String>[
	        if (value.normalizedFrom.isNotEmpty)
	          '// Normalized from: ${value.normalizedFrom.join(', ')}',
	        '${value.enumName}, // serialized as "${value.serialized}"',
	      ],
	    );
	  }

	  /// Counts the ranges that cover exactly one code point.
	  int _getSingleRangesCount(PropertyCollection data) {
	    int count = 0;
	    for (final UnicodeRange range in data.ranges) {
	      if (range.start == range.end) {
	        count++;
	      }
	    }
	    return count;
	  }

	  /// Packs all ranges into a single string.
	  ///
	  /// Each range is written as its start in base 36 (left-padded with zeros to
	  /// 4 characters), followed by either `!` for a single code point or the end
	  /// in the same format, followed by the serialized property.
	  String _packProperties(PropertyCollection data) {
	    final StringBuffer buffer = StringBuffer();
	    for (final UnicodeRange range in data.ranges) {
	      buffer.write(range.start.toRadixString(36).padLeft(4, '0'));
	      if (range.start == range.end) {
	        buffer.write('!');
	      } else {
	        buffer.write(range.end.toRadixString(36).padLeft(4, '0'));
	      }
	      buffer.write(range.property.serialized);
	    }
	    return buffer.toString();
	  }
	}

	/// Generates the lookup code for Unicode's word break properties.
	class WordBreakPropertiesSyncer extends PropertiesSyncer {
	  WordBreakPropertiesSyncer(String src, String dest) : super(src, dest);
	  WordBreakPropertiesSyncer.dry(String src) : super.dry(src);

	  @override
	  String get prefix => 'Word';

	  @override
	  String get enumDocLink =>
	      'http://unicode.org/reports/tr29/#Table_Word_Break_Property_Values';

	  @override
	  String get defaultProperty => 'Unknown';
	}

	/// Generates the lookup code for Unicode's line break properties.
	class LineBreakPropertiesSyncer extends PropertiesSyncer {
	  LineBreakPropertiesSyncer(String src, String dest) : super(src, dest);
	  LineBreakPropertiesSyncer.dry(String src) : super.dry(src);

	  @override
	  String get prefix => 'Line';

	  @override
	  String get enumDocLink =>
	      'https://www.unicode.org/reports/tr14/tr14-45.html#DescriptionOfProperties';

	  @override
	  String get defaultProperty => 'AL';
	}

	/// Holds the collection of properties parsed from the unicode spec file.
	class PropertyCollection {
	  /// Parses [lines] into [ranges] and fills [enumCollection] along the way.
	  ///
	  /// Comments are stripped from every line and lines without remaining
	  /// content are skipped. [defaultProperty] is added to [enumCollection] when
	  /// no parsed line mentioned it.
	  ///
	  /// Throws a [FormatException] for a line that has content but no `;`
	  /// separator.
	  PropertyCollection.fromLines(List<String> lines, String defaultProperty) {
	    final List<UnicodeRange> unprocessedRanges = lines
	        .map(removeCommentFromLine)
	        // Trim before testing so that whitespace-only leftovers (e.g. from an
	        // indented comment line) are skipped instead of failing to parse.
	        .where((String line) => line.trim().isNotEmpty)
	        .map(parseLineIntoUnicodeRange)
	        .toList();
	    // Make sure the default property is part of the enum. Adding a name that
	    // is already registered leaves the collection unchanged.
	    enumCollection.add(defaultProperty);
	    ranges = processRanges(unprocessedRanges, defaultProperty).toList();
	  }

	  /// The sorted and merged ranges.
	  List<UnicodeRange> ranges;

	  /// The enum values referenced by [ranges], plus the default property.
	  final EnumCollection enumCollection = EnumCollection();

	  /// Examples:
	  ///
	  /// 00C0..00D6 ; ALetter
	  /// 037F ; ALetter
	  ///
	  /// Would be parsed into:
	  ///
	  /// ```dart
	  /// UnicodeRange(192, 214, EnumValue('ALetter'));
	  /// UnicodeRange(895, 895, EnumValue('ALetter'));
	  /// ```
	  ///
	  /// A property listed in [normalizationTable] is registered under its
	  /// normalized name, and the original name is recorded on the enum value.
	  UnicodeRange parseLineIntoUnicodeRange(String line) {
	    final List<String> split = line.split(';');
	    if (split.length < 2) {
	      throw FormatException('Expected "<range> ; <property>"', line);
	    }
	    final String rangeStr = split[0].trim();
	    final String propertyStr = split[1].trim();

	    final EnumValue property = normalizationTable.containsKey(propertyStr)
	        ? enumCollection.add(normalizationTable[propertyStr], propertyStr)
	        : enumCollection.add(propertyStr);

	    return UnicodeRange(
	      getRangeStart(rangeStr),
	      getRangeEnd(rangeStr),
	      property,
	    );
	  }
	}

	/// An ordered collection of enum values that are unique by name.
	class EnumCollection {
	  /// The registered values, in insertion order.
	  final List<EnumValue> values = <EnumValue>[];

	  /// Returns the value called [name], registering it first when it is new.
	  ///
	  /// When [normalizedFrom] is given, it is recorded on the returned value.
	  EnumValue add(String name, [String normalizedFrom]) {
	    final int existingAt =
	        values.indexWhere((EnumValue candidate) => candidate.name == name);

	    EnumValue entry;
	    if (existingAt != -1) {
	      entry = values[existingAt];
	    } else {
	      entry = EnumValue(values.length, name);
	      values.add(entry);
	    }

	    if (normalizedFrom == null) {
	      return entry;
	    }
	    entry.normalizedFrom.add(normalizedFrom);
	    return entry;
	  }
	}

	/// Represents a single value in an [EnumCollection].
	class EnumValue {
	  EnumValue(this.index, this.name);

	  /// Zero-based position of this value in its collection.
	  final int index;

	  /// The property name as it was registered.
	  final String name;

	  /// The properties that were normalized to this value.
	  final Set<String> normalizedFrom = <String>{};

	  /// Returns a serialized, compact format of the enum value.
	  ///
	  /// Enum values are serialized based on their index. Indices 0 to 25 map to
	  /// "A" to "Z" and indices 26 to 51 map to "a" to "z".
	  ///
	  /// Throws a [RangeError] when [index] is outside of 0..51, because no
	  /// letter is left to represent it.
	  String get serialized {
	    // Fail loudly instead of silently emitting a non-letter character.
	    RangeError.checkValueInInterval(index, 0, 51, 'index');
	    // The first 26 enum values are assigned uppercase letters.
	    if (index < 26) {
	      return String.fromCharCode(_kChar_A + index);
	    }
	    // Enum values from index 26 onwards are assigned lowercase letters.
	    return String.fromCharCode(_kChar_a + index - 26);
	  }

	  /// Returns the enum name that'll be used in the Dart code.
	  ///
	  /// This is [name] with all underscores removed.
	  ///
	  /// ```dart
	  /// enum CharProperty {
	  ///   ALetter, // <-- this is the name returned by this method ("ALetter").
	  ///   Numeric,
	  ///   // etc...
	  /// }
	  /// ```
	  String get enumName {
	    return name.replaceAll('_', '');
	  }
	}

	/// Sorts ranges and combines adjacent ranges that have the same property and
	/// can be merged.
	///
	/// Note that [data] itself is sorted in place. Throws an [Exception] when two
	/// ranges overlap.
	List<UnicodeRange> processRanges(
	  List<UnicodeRange> data,
	  String defaultProperty,
	) {
	  data.sort(
	    // Ranges don't overlap so it's safe to sort based on the start of each
	    // range.
	    (UnicodeRange range1, UnicodeRange range2) =>
	        range1.start.compareTo(range2.start),
	  );
	  verifyNoOverlappingRanges(data);
	  return combineAdjacentRanges(data, defaultProperty);
	}

	/// Merges consecutive ranges of [data] that share a property.
	///
	/// [data] is expected to be sorted by range start and free of overlaps.
	///
	/// Example:
	///
	/// ```
	/// 0x01C4..0x0293; ALetter
	/// 0x0294..0x0294; ALetter
	/// 0x0295..0x02AF; ALetter
	/// ```
	///
	/// will get combined into:
	///
	/// ```
	/// 0x01C4..0x02AF; ALetter
	/// ```
	///
	/// Two consecutive ranges that both carry [defaultProperty] are merged even
	/// when there is a gap between them. An empty [data] yields an empty list.
	List<UnicodeRange> combineAdjacentRanges(
	  List<UnicodeRange> data,
	  String defaultProperty,
	) {
	  final List<UnicodeRange> result = <UnicodeRange>[];
	  for (final UnicodeRange next in data) {
	    if (result.isEmpty) {
	      result.add(next);
	      continue;
	    }

	    final UnicodeRange prev = result.last;
	    final bool sameProperty = prev.property == next.property;
	    final bool contiguous = next.start == prev.end + 1;
	    // When there's a gap between two ranges, but they both have the default
	    // property, it's safe to combine them.
	    final bool bothDefault =
	        sameProperty && prev.property.name == defaultProperty;

	    if ((sameProperty && contiguous) || bothDefault) {
	      // Build the merged range directly: extendRange asserts adjacency, which
	      // does not hold when a gap between default ranges is bridged.
	      result.last = UnicodeRange(prev.start, next.end, prev.property);
	    } else {
	      result.add(next);
	    }
	  }
	  return result;
	}

	/// Parses the first code point of [range].
	///
	/// [range] is either a single hexadecimal code point (`037F`) or two of them
	/// separated by `..` (`00C0..00D6`).
	int getRangeStart(String range) {
	  final String startHex = range.split('..').first;
	  return int.parse(startHex, radix: 16);
	}

	/// Parses the last code point of [range].
	///
	/// For a range without `..`, the single hexadecimal code point is both start
	/// and end.
	int getRangeEnd(String range) {
	  final String endHex = range.contains('..') ? range.split('..')[1] : range;
	  return int.parse(endHex, radix: 16);
	}

	/// Throws an [Exception] when any range of [data] overlaps the range that
	/// directly precedes it in the list.
	void verifyNoOverlappingRanges(List<UnicodeRange> data) {
	  for (int prevIdx = 0; prevIdx + 1 < data.length; prevIdx++) {
	    final UnicodeRange previous = data[prevIdx];
	    final UnicodeRange current = data[prevIdx + 1];
	    if (current.isOverlapping(previous)) {
	      throw Exception('Data contains overlapping ranges.');
	    }
	  }
	}

	/// Returns the leading lines of [lines] that make up the file header.
	///
	/// The header ends right before the first line that, once trimmed, is either
	/// empty or a lone `#`.
	List<String> extractHeader(List<String> lines) {
	  return lines.takeWhile((String line) {
	    final String trimmed = line.trim();
	    return trimmed.isNotEmpty && trimmed != '#';
	  }).toList();
	}

	/// Returns [line] without its trailing comment.
	///
	/// Everything from the first `#` onwards is dropped; a line without `#` is
	/// returned unchanged.
	String removeCommentFromLine(String line) {
	  final int commentStart = line.indexOf('#');
	  if (commentStart == -1) {
	    return line;
	  }
	  return line.substring(0, commentStart);
	}