cartodb/config/initializers/string.rb

201 lines
5.5 KiB
Ruby
Raw Normal View History

2021-01-24 16:18:54 +08:00
# coding: UTF-8
2020-06-15 10:58:47 +08:00
class String
def self.random(length=10)
('a'..'z').sort_by {rand}[0,length].join
end
def normalize
str = self.downcase
return '' if str.blank?
n = str.force_encoding("UTF-8")
n.gsub!(/[àáâãäåāă]/, 'a')
n.gsub!(/æ/, 'ae')
n.gsub!(/[ďđ]/, 'd')
n.gsub!(/[çćčĉċ]/, 'c')
n.gsub!(/[èéêëēęěĕė]/, 'e')
n.gsub!(/ƒ/, 'f')
n.gsub!(/[ĝğġģ]/, 'g')
n.gsub!(/[ĥħ]/, 'h')
n.gsub!(/[ììíîïīĩĭ]/, 'i')
n.gsub!(/[įıijĵ]/, 'j')
n.gsub!(/[ķĸ]/, 'k')
n.gsub!(/[łľĺļŀ]/, 'l')
n.gsub!(/[ñńňņʼnŋ]/, 'n')
n.gsub!(/[òóôõöøōőŏŏ]/, 'o')
n.gsub!(/œ/, 'oe')
n.gsub!(/ą/, 'q')
n.gsub!(/[ŕřŗ]/, 'r')
n.gsub!(/[śšşŝș]/, 's')
n.gsub!(/[ťţŧț]/, 't')
n.gsub!(/[ùúûüūůűŭũų]/, 'u')
n.gsub!(/ŵ/, 'w')
n.gsub!(/[ýÿŷ]/, 'y')
n.gsub!(/[žżź]/, 'z')
n.gsub!(/[ÀÁÂÃÄÅĀĂ]/i, 'A')
n.gsub!(/Æ/i, 'AE')
n.gsub!(/[ĎĐ]/i, 'D')
n.gsub!(/[ÇĆČĈĊ]/i, 'C')
n.gsub!(/[ÈÉÊËĒĘĚĔĖ]/i, 'E')
n.gsub!(/Ƒ/i, 'F')
n.gsub!(/[ĜĞĠĢ]/i, 'G')
n.gsub!(/[ĤĦ]/i, 'H')
n.gsub!(/[ÌÌÍÎÏĪĨĬ]/i, 'I')
n.gsub!(/[IJĴ]/i, 'J')
n.gsub!(/[Ķĸ]/i, 'J')
n.gsub!(/[ŁĽĹĻĿ]/i, 'L')
n.gsub!(/[ÑŃŇŅʼnŊ]/i, 'N')
n.gsub!(/[ÒÓÔÕÖØŌŐŎŎ]/i, 'O')
n.gsub!(/Œ/i, 'OE')
n.gsub!(/Ą/i, 'Q')
n.gsub!(/[ŔŘŖ]/i, 'R')
n.gsub!(/[ŚŠŞŜȘ]/i, 'S')
n.gsub!(/[ŤŢŦȚ]/i, 'T')
n.gsub!(/[ÙÚÛÜŪŮŰŬŨŲ]/i, 'U')
n.gsub!(/Ŵ/i, 'W')
n.gsub!(/[ÝŸŶ]/i, 'Y')
n.gsub!(/[ŽŻŹ]/i, 'Z')
n.gsub!(/A/i, 'A')
n.gsub!(/а/i, 'a')
n.gsub!(/Б/i, 'B')
n.gsub!(/б/i, 'b')
n.gsub!(/В/i, 'V')
n.gsub!(/в/i, 'v')
n.gsub!(/Г/i, 'G')
n.gsub!(/г/i, 'g')
n.gsub!(/Д/i, 'D')
n.gsub!(/д/i, 'd')
n.gsub!(/Е/i, 'E')
n.gsub!(/е/i, 'e')
n.gsub!(/Ё/i, 'Yo')
n.gsub!(/ё/i, 'yo')
n.gsub!(/Ж/i, 'Zh')
n.gsub!(/ж/i, 'zh')
n.gsub!(/З/i, 'Z')
n.gsub!(/з/i, 'z')
n.gsub!(/И/i, 'I')
n.gsub!(/и/i, 'i')
n.gsub!(/Й/i, 'J')
n.gsub!(/й/i, 'j')
n.gsub!(/К/i, 'K')
n.gsub!(/к/i, 'k')
n.gsub!(/Л/i, 'L')
n.gsub!(/л/i, 'l')
n.gsub!(/М/i, 'M')
n.gsub!(/м/i, 'm')
n.gsub!(/Н/i, 'N')
n.gsub!(/н/i, 'n')
n.gsub!(/О/i, 'O')
n.gsub!(/о/i, 'o')
n.gsub!(/П/i, 'P')
n.gsub!(/п/i, 'p')
n.gsub!(/Р/i, 'R')
n.gsub!(/р/i, 'r')
n.gsub!(/С/i, 'S')
n.gsub!(/с/i, 's')
n.gsub!(/Т/i, 'T')
n.gsub!(/т/i, 't')
n.gsub!(/У/i, 'U')
n.gsub!(/у/i, 'u')
n.gsub!(/Ф/i, 'F')
n.gsub!(/ф/i, 'f')
n.gsub!(/Х/i, 'X')
n.gsub!(/х/i, 'x')
n.gsub!(/Ц/i, 'Cz')
n.gsub!(/ц/i, 'cz')
n.gsub!(/Ч/i, 'Ch')
n.gsub!(/ч/i, 'ch')
n.gsub!(/Ш/i, 'Sh')
n.gsub!(/ш/i, 'sh')
n.gsub!(/Щ/i, 'Shh')
n.gsub!(/щ/i, 'shh')
n.gsub!(/Ъ/i, '')
n.gsub!(/ъ/i, '')
n.gsub!(/Ы/i, 'Y')
n.gsub!(/ы/i, 'y')
n.gsub!(/Ь/i, '')
n.gsub!(/ь/i, '')
n.gsub!(/Э/i, 'E')
n.gsub!(/э/i, 'e')
n.gsub!(/Ю/i, 'Yu')
n.gsub!(/ю/i, 'yu')
n.gsub!(/Я/i, 'Ya')
n.gsub!(/я/i, 'ya')
n
end
def sanitize
return if self.blank?
self.gsub(/<[^>]+>/m,'').normalize.downcase.gsub(/&.+?;/,'-').
gsub(/[^a-z0-9 _-]/,'-').strip.gsub(/\s+/,'-').gsub(/-+/,'-').
gsub(/-/,' ').strip.gsub(/ /,'-').gsub(/-/,'_')
end
def strip_tags
self.gsub(/<[^>]+>/m,'').strip
end
def get_cartodb_types
{
"number" => ["smallint", /numeric\(\d+,\d+\)/, "integer", "bigint", "decimal", "numeric", "double precision", "serial", "big serial", "real"],
"string" => ["varchar", "character varying", "text", /character\svarying\(\d+\)/, /char\s*\(\d+\)/, /character\s*\(\d+\)/],
"boolean" => ["boolean"],
"date" => [
"timestamptz",
"timestamp with time zone",
"timestamp without time zone"
]
}
end
def convert_to_db_type
cartodb_types = get_cartodb_types
if cartodb_types.keys.include?(downcase)
case downcase
when "number"
"double precision"
when "string"
"text"
else
cartodb_types[downcase].first
end
else
downcase
end
end
# {"integer"=>:number, "real"=>:number, "varchar"=>:string, "text"=>:string, "timestamp"=>:date, "boolean"=>:boolean}
def convert_to_cartodb_type
inverse_types = get_cartodb_types.invert.inject({}){ |h, e| e.first.each{ |k| h[k] = e.last }; h}
if inverse_types.keys.include?(self.downcase)
inverse_types[self.downcase]
else
inverse_types.keys.select{ |t| !t.is_a?(String) }.each do |re|
if self.downcase.match(re)
return inverse_types[re]
end
end
self.downcase
end
end
def sanitize_sql
self.gsub(/\\/, '\&\&').gsub(/'/, "''")
end
def sanitize_column_name
temporal_name = sanitize || ''
if temporal_name !~ /^[a-zA-Z_]/ ||
Carto::DB::Sanitize::RESERVED_WORDS.include?(downcase) ||
CartoDB::RESERVED_COLUMN_NAMES.include?(upcase)
return '_' + temporal_name
else
temporal_name
end
end
end