require "http/client"
require "http/headers"
require "http/request"
require "ishi/html"
require "json"
require "uuid"
require "db"
require "pg"

# Database credentials are read from the OpenFaaS secrets directory at load time.
USER   = File.read("/var/openfaas/secrets/nombres-user").strip
PASS   = File.read("/var/openfaas/secrets/nombres-pass").strip
DB_URL = "postgres://#{USER}:#{PASS}@10.61.0.1:5432/nombres"

# HTTP handler that suggests the most popular names for a given prefix,
# birth year and gender, and renders them as an HTML bar chart.
class Handler
  # Lines delimiting the inline chart script in the generated HTML.
  # NOTE(review): the markers were not visible in the reviewed copy of this
  # file (markup inside string literals looked stripped). These values follow
  # what gnuplot's canvas terminal emits -- confirm against real Ishi output.
  SCRIPT_OPEN  = %(<script type="text/javascript">)
  SCRIPT_CLOSE = "</script>"

  # Processes the gnuplot output so it can be embedded in a page.
  #
  # buffer      - the Ishi output (anything responding to `to_s`)
  # canvas_name - replacement for the "gnuplot_canvas" identifier, so that
  #               several charts can live in the same page
  # title       - text placed before the chart
  #
  # Returns the HTML fragment as a String.
  def format_buffer(buffer, canvas_name, title = "")
    lines = buffer.to_s.split("\n")

    # Keep only the inline script. If a marker is missing, fall back to the
    # corresponding end of the document instead of failing on a nil index.
    first = lines.index(SCRIPT_OPEN) || 0
    last = lines.index(SCRIPT_CLOSE, first) || lines.size - 1
    script = lines[first..last]

    # NOTE(review): the <canvas> element is reconstructed; only its fallback
    # text was visible in the reviewed copy. The size matches the
    # `canvas_size(800, 300)` call in `run` -- confirm attributes.
    html = "#{title}" + script.join("\n") + %(
<canvas id="gnuplot_canvas" width="800" height="300" tabindex="0">
Sorry, your browser seems not to support the HTML 5 canvas element
</canvas>
)

    # This ID needs to be unique in case we have 2 charts in the same page.
    html.gsub("gnuplot_canvas", canvas_name)
  end

  # Runs a SQL query against the database.
  #
  # sql - a query whose rows are two Int32 columns (year, count)
  #
  # Returns an array of {year, count} tuples (empty when no row matches).
  # The trailing nil is only reached if the query block never runs.
  def query(sql)
    DB.open(DB_URL) do |db|
      db.query(sql) do |rows|
        result = [] of Tuple(Int32, Int32)
        rows.each do
          year = rows.read(Int32)
          contador = rows.read(Int32)
          result << {year, contador}
        end
        return result
      end
    end
    nil
  end

  # Removes diacritics and every non ASCII-letter character, then lowercases.
  def normalize_name(s)
    s.unicode_normalize(:nfkd).chars.select(&.ascii_letter?).join.downcase
  end

  # Estimates how "feminine" a name is.
  #
  # nombre - the name to look up (converted to upper case, which is how this
  #          database stores names)
  #
  # Returns a Float64: women / (men + women) using the stored frequencies,
  # or 0.5 when the name has no recorded frequency for either gender.
  def feminidad(nombre)
    nombre = nombre.to_s.upcase
    mujeres = hombres = 0

    DB.open(DB_URL) do |db|
      # Bound parameters: names come from the database and may contain
      # characters (e.g. an apostrophe) that would break an inline literal.
      # LIMIT 1 keeps "first matching row" semantics; a missing row counts as 0.
      mujeres = db.query_one?(
        "SELECT COALESCE(frecuencia,0) FROM mujeres WHERE nombre = $1 LIMIT 1",
        nombre, as: Int32) || 0
      hombres = db.query_one?(
        "SELECT COALESCE(frecuencia,0) FROM hombres WHERE nombre = $1 LIMIT 1",
        nombre, as: Int32) || 0
    end

    return 0.5 if hombres == 0 && mujeres == 0

    # Force float division so the ratio is never truncated.
    mujeres.to_f / (hombres + mujeres)
  end

  # Splits {count, name} rows by gender using `feminidad`.
  #
  # Returns a named tuple {"f": feminine_rows, "m": masculine_rows}.
  # A name scoring exactly 0.5 is placed in both lists on purpose.
  def split_por_genero(nombres)
    femeninos = Array(Tuple(Int32, String)).new
    masculinos = Array(Tuple(Int32, String)).new

    nombres.each do |nombre|
      fem = feminidad(nombre[1])
      # The overlap at 0.5 is intentional!
      femeninos << nombre if fem >= 0.5
      masculinos << nombre if fem <= 0.5
    end

    {"f": femeninos, "m": masculinos}
  end

  # Tries to find the most popular names based on a prefix, year and gender.
  #
  # The request body is JSON of this form (all values are strings):
  #
  #   {
  #     p: name prefix,
  #     g: gender ("f" or "m"),
  #     y: birth year
  #   }
  #
  # Missing or invalid fields are ignored. Returns a named tuple with
  # `body`, `status_code` and `headers`.
  def run(request : HTTP::Request)
    params =
      if (body = request.body).nil?
        Hash(String, String).new
      else
        Hash(String, String).from_json(body)
      end

    # Sanitize input: each value ends up either valid or nil.
    prefijo = normalize_name(params.fetch("p", ""))
    prefijo = nil if prefijo.empty?

    genero = params.fetch("g", "")
    genero = nil unless ["f", "m"].includes?(genero)

    year = params.fetch("y", "").to_i?

    sql, args = build_search(prefijo, year)

    datos = [] of Tuple(Int32, String)
    DB.open(DB_URL) do |db|
      db.query(sql, args: args) do |rows|
        rows.each do
          valor = rows.read(Int32)
          nombre = rows.read(String)
          datos << {valor, nombre}
        end
      end
    end

    # In this context, remove all composite names.
    datos.reject! { |row| row[1].includes?(" ") }
    datos = split_por_genero(datos)[genero] if genero

    # Checked after filtering: the filters above can also leave nothing to
    # plot, and taking the maximum of an empty series raises.
    return html_response("Que raro, no tengo *idea*!") if datos.empty?

    datos = datos[..10]

    title =
      if datos.size > 1
        "¿Puede ser ... #{datos[0][1].to_s.titleize}? ¿O capaz que #{datos[1][1].to_s.titleize}? ¡Contame más!"
      else
        "Me parece que ... #{datos[0][1].to_s.titleize}!"
      end

    buffer = IO::Memory.new
    Ishi.new(buffer) do
      x = (0..datos.size - 1).to_a
      # Counts are plotted in thousands.
      y = datos.map { |row| row[0].to_f / 1000 }
      # Leave roughly 10% of headroom above the tallest bar.
      yrange(0..(y.max*1.1).to_i + 1)
      xtics = Hash(Float64, String).new
      datos.each_with_index { |row, i| xtics[i.to_f] = row[1].to_s.titleize }
      canvas_size(800, 300)
      plot(x, y, style: :boxes, fs: 0.25)
        .boxwidth(0.5)
        .show_key(false)
        .ylabel("Popularidad (miles)")
        .xtics(xtics)
    end

    html_response(format_buffer(buffer, "busqueda", title))
  end

  # Builds the parameterized search query for the given filters.
  #
  # Without a year the global `totales` table is used; with a year the
  # per-year `nombres` table is used. Returns {sql, args}.
  private def build_search(prefijo : String?, year : Int32?)
    args = [] of String
    filtros = [] of String

    if year
      # Sent as text so the server resolves the type from the column,
      # exactly like the quoted literal this replaces.
      args << year.to_s
      filtros << "anio = $#{args.size}"
    end

    if prefijo
      # prefijo only holds ASCII letters, so no LIKE wildcard needs escaping.
      args << "#{prefijo}%"
      filtros << "nombre LIKE $#{args.size}"
    end

    columna, tabla = year ? {"contador", "nombres"} : {"total", "totales"}
    where = filtros.empty? ? "" : "WHERE #{filtros.join(" AND ")}"

    sql = "SELECT #{columna}, nombre FROM #{tabla} #{where} ORDER BY #{columna} DESC LIMIT 50"
    {sql, args}
  end

  # Wraps an HTML body in the response shape returned by `run`.
  private def html_response(body : String)
    {
      body:        body,
      status_code: 200,
      headers:     HTTP::Headers{"Content-Type" => "text/html"},
    }
  end
end