# druid_adapter.rb
  module Blazer
    module Adapters
      # Blazer adapter that runs SQL statements against Druid by POSTing them
      # as JSON to the "/druid/v2/sql/" endpoint under the configured URL.
      class DruidAdapter < BaseAdapter
        # Matches strings shaped like "2020-01-31T12:34:56.789Z"; such values
        # are converted to Time objects when reading results.
        TIMESTAMP_REGEX = /\A\d{4}-\d{2}-\d{2}T\d{2}:\d{2}:\d{2}\.\d{3}Z\z/

        # Executes +statement+ and returns the result in Blazer's adapter format.
        #
        # @param statement [String] SQL text sent as the "query" field
        # @param comment [String] accepted for interface compatibility; not
        #   used by this adapter
        # @return [Array(Array<String>, Array<Array>, String|nil)]
        #   +[columns, rows, error]+; +error+ is nil on success. Any exception
        #   raised while talking to the server or parsing its reply is
        #   reported through +error+ instead of propagating.
        def run_statement(statement, comment)
          columns = []
          rows = []
          error = nil

          header = {"Content-Type" => "application/json", "Accept" => "application/json"}
          timeout = data_source.timeout ? data_source.timeout.to_i : 300
          data = {
            query: statement,
            context: {
              # timeout is held in seconds here; the query context gets it
              # multiplied by 1000 (presumably milliseconds -- see Druid docs)
              timeout: timeout * 1000
            }
          }

          uri = URI.parse("#{settings["url"]}/druid/v2/sql/")
          http = Net::HTTP.new(uri.host, uri.port)
          # Net::HTTP does not enable TLS based on the port alone, so it has
          # to be switched on explicitly for https:// URLs.
          http.use_ssl = true if uri.scheme == "https"
          http.read_timeout = timeout

          begin
            response = JSON.parse(http.post(uri.request_uri, data.to_json, header).body)
            if response.is_a?(Hash)
              # A JSON object (rather than an array of rows) is treated as an
              # error report.
              error = response["errorMessage"] || "Unknown error: #{response.inspect}"
              error = Blazer::TIMEOUT_MESSAGE if error.include?("timed out")
            else
              # An empty result set is a valid outcome: no columns, no rows.
              columns = (response.first || {}).keys
              # Druid doesn't return column types
              # and no timestamp type in JSON
              rows = response.map do |record|
                record.values.map do |value|
                  value.is_a?(String) && TIMESTAMP_REGEX.match(value) ? Time.parse(value) : value
                end
              end
            end
          rescue => e
            error = e.message
          end

          [columns, rows, error]
        end

        # Lists table names from INFORMATION_SCHEMA.TABLES, excluding the
        # INFORMATION_SCHEMA schema itself, ordered by name.
        #
        # @return [Array] first column of every result row
        def tables
          result = data_source.run_statement("SELECT TABLE_NAME FROM INFORMATION_SCHEMA.TABLES WHERE TABLE_SCHEMA NOT IN ('INFORMATION_SCHEMA') ORDER BY TABLE_NAME")
          result.rows.map(&:first)
        end

        # Describes every table outside INFORMATION_SCHEMA.
        #
        # @return [Array<Hash>] one hash per (schema, table) pair with keys
        #   +:schema+, +:table+ and +:columns+ (an array of
        #   +{name:, data_type:}+ hashes)
        def schema
          result = data_source.run_statement("SELECT TABLE_SCHEMA, TABLE_NAME, COLUMN_NAME, DATA_TYPE, ORDINAL_POSITION FROM INFORMATION_SCHEMA.COLUMNS WHERE TABLE_SCHEMA NOT IN ('INFORMATION_SCHEMA') ORDER BY 1, 2")
          result.rows.group_by { |r| [r[0], r[1]] }.map do |(table_schema, table_name), column_rows|
            # Columns are ordered by name (index 2); ORDINAL_POSITION is
            # selected but not used for ordering.
            columns = column_rows.sort_by { |r| r[2] }.map { |r| {name: r[2], data_type: r[3]} }
            {schema: table_schema, table: table_name, columns: columns}
          end
        end

        # SQL template used to preview a table; "{table}" is a placeholder
        # left for the caller to substitute.
        #
        # @return [String]
        def preview_statement
          "SELECT * FROM {table} LIMIT 10"
        end
      end
    end
  end