51 lines
1.2 KiB
Ruby
51 lines
1.2 KiB
Ruby
# -*- coding: utf-8; frozen_string_literal: true -*-
|
|
#
|
|
#--
|
|
# Copyright (C) 2009-2019 Thomas Leitner <t_leitner@gmx.at>
|
|
#
|
|
# This file is part of kramdown which is licensed under the MIT.
|
|
#++
|
|
#
|
|
# This file is based on code originally from the Stringex library and needs the data files from
|
|
# Stringex to work correctly.
|
|
|
|
module Kramdown
|
|
module Utils
|
|
|
|
# Provides the ability to tranliterate Unicode strings into plain ASCII ones.
|
|
module Unidecoder
|
|
|
|
gem 'stringex'
|
|
path = $:.find do |dir|
|
|
File.directory?(File.join(File.expand_path(dir), "stringex", "unidecoder_data"))
|
|
end
|
|
|
|
if !path
|
|
def self.decode(string)
|
|
string
|
|
end
|
|
else
|
|
|
|
CODEPOINTS = Hash.new do |h, k|
|
|
h[k] = YAML.load_file(File.join(path, "stringex", "unidecoder_data", "#{k}.yml"))
|
|
end
|
|
|
|
# Transliterate string from Unicode into ASCII.
|
|
def self.decode(string)
|
|
string.gsub(/[^\x00-\x7f]/u) do |codepoint|
|
|
begin
|
|
unpacked = codepoint.unpack("U")[0]
|
|
CODEPOINTS[sprintf("x%02x", unpacked >> 8)][unpacked & 255]
|
|
rescue StandardError
|
|
"?"
|
|
end
|
|
end
|
|
end
|
|
|
|
end
|
|
|
|
end
|
|
|
|
end
|
|
end
|