Class: MoSQL::Schema
Instance Method Summary
- #all_columns(schema, copy = false) ⇒ Object
- #all_columns_for_copy(schema) ⇒ Object
- #all_mongo_dbs ⇒ Object
- #check_columns!(ns, spec) ⇒ Object
- #collections_for_mongo_db(db) ⇒ Object
- #copy_column?(col) ⇒ Boolean
- #copy_data(db, ns, objs) ⇒ Object
- #create_schema(db, clobber = false) ⇒ Object
- #fetch_and_delete_dotted(obj, dotted) ⇒ Object
- #fetch_special_source(obj, source) ⇒ Object
- #find_db(db) ⇒ Object
- #find_ns(ns) ⇒ Object
- #find_ns!(ns) ⇒ Object
- #initialize(map) ⇒ Schema (constructor) — Returns a new instance of Schema.
- #parse_meta(meta) ⇒ Object
- #parse_spec(ns, spec) ⇒ Object
- #primary_sql_key_for_ns(ns) ⇒ Object
- #quote_copy(val) ⇒ Object
- #sanitize(value) ⇒ Object
- #table_for_ns(ns) ⇒ Object
- #to_array(lst) ⇒ Object
- #transform(ns, obj, schema = nil) ⇒ Object
- #transform_to_copy(ns, row, schema = nil) ⇒ Object
Methods included from Logging
Constructor Details
#initialize(map) ⇒ Schema
Returns a new instance of Schema.
60 61 62 63 64 65 66 67 68 69 70 71 72 73 |
# File 'lib/mosql/schema.rb', line 60
# Builds the internal database -> collection -> spec map from a raw
# configuration map.
#
# For every database entry the :meta value is normalized through parse_meta
# (find_db relies on spec[:meta][:alias] being an array of patterns), and
# every String-keyed entry is treated as a collection and parsed by
# parse_spec. Non-String keys (such as :meta) are skipped.
#
# @param map [Hash] database name => database configuration hash
# @raise [SchemaError] when a collection spec is missing a required key
def initialize(map)
  @map = {}
  map.each do |dbname, db|
    @map[dbname] = { :meta => parse_meta(db[:meta]) }
    db.each do |cname, spec|
      next unless cname.is_a?(String)
      begin
        @map[dbname][cname] = parse_spec("#{dbname}.#{cname}", spec)
      rescue KeyError => e
        # Re-raise with the namespace so the user can locate the bad spec.
        raise SchemaError.new("In spec for #{dbname}.#{cname}: #{e}")
      end
    end
  end
end
Instance Method Details
#all_columns(schema, copy = false) ⇒ Object
228 229 230 231 232 233 234 235 236 237 |
# File 'lib/mosql/schema.rb', line 228
# Lists the SQL column names of a collection schema, in declaration order.
#
# @param schema [Hash] parsed collection spec with :columns and :meta
# @param copy [Boolean] when true, columns rejected by copy_column? are
#   left out
# @return [Array] column names, followed by "_extra_props" when
#   schema[:meta][:extra_props] is set
def all_columns(schema, copy=false)
  kept = schema[:columns].reject { |col| copy && !copy_column?(col) }
  names = kept.map { |col| col[:name] }
  names << "_extra_props" if schema[:meta][:extra_props]
  names
end
#all_columns_for_copy(schema) ⇒ Object
239 240 241 |
# File 'lib/mosql/schema.rb', line 239
# Column names used for a bulk COPY: all_columns with the copy filter on.
#
# @param schema [Hash] parsed collection spec
# @return [Array] column names accepted by copy_column?
def all_columns_for_copy(schema)
  for_copy = true
  all_columns(schema, for_copy)
end
#all_mongo_dbs ⇒ Object
284 285 286 |
# File 'lib/mosql/schema.rb', line 284
# Returns every key currently present in the schema map.
#
# @return [Array] keys of @map (find_db also stores looked-up names there)
def all_mongo_dbs
  @map.each_key.to_a
end
#check_columns!(ns, spec) ⇒ Object
35 36 37 38 39 40 41 42 43 |
# File 'lib/mosql/schema.rb', line 35
# Verifies that no two columns of a spec share the same :source.
#
# @param ns [String] namespace, used only in the error message
# @param spec [Hash] spec whose :columns is a list of column hashes
# @raise [SchemaError] on the first column whose source was already seen
def check_columns!(ns, spec)
  seen_sources = Set.new
  spec[:columns].each do |col|
    source = col[:source]
    # Set#add? returns nil when the element was already present.
    next if seen_sources.add?(source)
    raise SchemaError.new("Duplicate source #{source} in column definition #{col[:name]} for #{ns}.")
  end
end
#collections_for_mongo_db(db) ⇒ Object
288 289 290 |
# File 'lib/mosql/schema.rb', line 288
# Returns the keys stored under a database entry of the schema map.
#
# Note that the constructor also stores a :meta key under every database,
# so the result is not limited to collection names.
#
# @param db database key to look up in @map
# @return [Array] the entry's keys, or [] when there is no (truthy) entry
def collections_for_mongo_db(db)
  entry = @map[db]
  entry ? entry.keys : []
end
#copy_column?(col) ⇒ Boolean
224 225 226 |
# File 'lib/mosql/schema.rb', line 224
# Tells whether a column takes part in bulk COPY; columns sourced from
# '$timestamp' do not.
#
# @param col [Hash] column definition with a :source entry
# @return [Boolean]
def copy_column?(col)
  timestamp_sourced = col[:source] == '$timestamp'
  !timestamp_sourced
end
#copy_data(db, ns, objs) ⇒ Object
243 244 245 246 247 248 249 250 251 252 253 254 255 256 257 258 259 |
# File 'lib/mosql/schema.rb', line 243
# Streams already-transformed rows into the namespace's table through a
# COPY ... FROM STDIN statement.
#
# @param db database handle; must respond to synchronize (yielding the raw
#   connection) and to raise_error, which is invoked via send
# @param ns [String] namespace whose mapping selects table and columns
# @param objs [Enumerable] rows, each passed through transform_to_copy
# @raise [SchemaError] via find_ns! when ns has no mapping
def copy_data(db, ns, objs)
  schema = find_ns!(ns)
  db.synchronize do |pg|
    table = schema[:meta][:table]
    column_list = all_columns_for_copy(schema).map { |c| "\"#{c}\"" }.join(",")
    pg.execute("COPY \"#{table}\" (#{column_list}) FROM STDIN")

    # One newline-terminated line per row.
    objs.each do |row|
      pg.put_copy_data(transform_to_copy(ns, row, schema) + "\n")
    end
    pg.put_copy_end

    begin
      pg.get_result.check
    rescue PGError => e
      # Hand the driver error to the handle's own error conversion.
      db.send(:raise_error, e)
    end
  end
end
#create_schema(db, clobber = false) ⇒ Object
75 76 77 78 79 80 81 82 83 84 85 86 87 88 89 90 91 92 93 94 95 96 97 98 99 100 101 102 103 104 105 |
# File 'lib/mosql/schema.rb', line 75
# Creates one SQL table for every mapped collection.
#
# Each column of the mapping becomes a table column; a column sourced from
# '$timestamp' defaults to the SQL now() function, and the column sourced
# from _id becomes the primary key. When the collection's meta enables
# :extra_props, an extra '_extra_props' column is added, typed JSON when the
# setting is exactly "JSON" and TEXT otherwise.
#
# @param db database handle; must respond to create_table? / create_table!
#   taking a table name and a block in which `column` and `primary_key` are
#   callable (presumably a Sequel::Database -- confirm)
# @param clobber [Boolean] when true create_table! is used, otherwise
#   create_table?
def create_schema(db, clobber=false)
  # find_db caches lookups in @map, storing nil for names that matched no
  # alias; those entries carry no collections and must be skipped.
  @map.values.compact.each do |dbspec|
    dbspec.each do |n, collection|
      # Only String keys are collections (:meta is a Symbol key).
      next unless n.is_a?(String)
      meta = collection[:meta]
      log.info("Creating table '#{meta[:table]}'...")
      db.send(clobber ? :create_table! : :create_table?, meta[:table]) do
        collection[:columns].each do |col|
          opts = {}
          if col[:source] == '$timestamp'
            opts[:default] = Sequel.function(:now)
          end
          column col[:name], col[:type], opts

          if col[:source].to_sym == :_id
            primary_key [col[:name].to_sym]
          end
        end
        if meta[:extra_props]
          type =
            if meta[:extra_props] == "JSON"
              "JSON"
            else
              "TEXT"
            end
          column '_extra_props', type
        end
      end
    end
  end
end
#fetch_and_delete_dotted(obj, dotted) ⇒ Object
134 135 136 137 138 139 140 141 142 143 144 145 146 147 148 149 150 151 |
# File 'lib/mosql/schema.rb', line 134
# Removes and returns the value found at a dotted path inside a nested hash.
#
# The path is split on "."; every segment but the last must lead to a Hash,
# otherwise nil is returned and nothing is removed. After the leaf is
# deleted, parent hashes left empty along the path are deleted too.
#
# @param obj [Hash] document to read from; it is modified in place
# @param dotted [String] path such as "a.b.c"
# @return the removed value, or nil when the path does not resolve
def fetch_and_delete_dotted(obj, dotted)
  pieces = dotted.split(".")
  # (parent hash, key) pairs visited on the way down, outermost first.
  breadcrumbs = []
  while pieces.length > 1
    key = pieces.shift
    breadcrumbs << [obj, key]
    obj = obj[key]
    return nil unless obj.is_a?(Hash)
  end

  val = obj.delete(pieces.first)

  # Walk back up, innermost first, pruning hashes emptied by the delete.
  breadcrumbs.reverse_each do |parent, parent_key|
    parent.delete(parent_key) if parent[parent_key].empty?
  end

  val
end
#fetch_special_source(obj, source) ⇒ Object
153 154 155 156 157 158 159 160 |
# File 'lib/mosql/schema.rb', line 153
# Resolves a special ("$"-prefixed) column source to its value.
#
# Only "$timestamp" is recognised; it maps to the SQL now() function.
#
# @param obj the document being transformed (not consulted)
# @param source [String] special source name
# @return the Sequel function object for now()
# @raise [SchemaError] for any other source
def fetch_special_source(obj, source)
  unless source == "$timestamp"
    raise SchemaError.new("Unknown source: #{source}")
  end

  Sequel.function(:now)
end
#find_db(db) ⇒ Object
107 108 109 110 111 112 113 114 |
# File 'lib/mosql/schema.rb', line 107
# Looks up the spec for a database name, falling back to alias patterns.
#
# When the name is not a key of @map, the first non-nil spec with an alias
# pattern matching the name is used. The outcome (including nil for "no
# match") is stored in @map under that name, so later lookups are direct.
#
# @param db [String] database name
# @return [Hash, nil] the database spec, or nil when nothing matches
def find_db(db)
  return @map[db] if @map.key?(db)

  @map[db] = @map.values.find do |candidate|
    candidate && candidate[:meta][:alias].any? { |pattern| pattern.match(db) }
  end
end
#find_ns(ns) ⇒ Object
116 117 118 119 120 121 122 123 124 125 126 |
# File 'lib/mosql/schema.rb', line 116
# Finds the collection schema for a "db.collection" namespace.
#
# The namespace is split at the first "." only, so the collection part may
# itself contain dots.
#
# @param ns [String] namespace
# @return [Hash, nil] the collection schema; nil when the database or the
#   collection is unmapped (the latter is logged at debug level)
def find_ns(ns)
  db, collection = ns.split(".", 2)
  spec = find_db(db)
  return nil unless spec

  schema = spec[collection]
  return schema if schema

  log.debug("No mapping for ns: #{ns}")
  nil
end
#find_ns!(ns) ⇒ Object
128 129 130 131 132 |
# File 'lib/mosql/schema.rb', line 128
# Strict variant of find_ns.
#
# @param ns [String] namespace
# @return [Hash] the collection schema
# @raise [SchemaError] when find_ns returns nil
def find_ns!(ns)
  found = find_ns(ns)
  return found unless found.nil?

  raise SchemaError.new("No mapping for namespace: #{ns}")
end
#parse_meta(meta) ⇒ Object
52 53 54 55 56 57 58 |
# File 'lib/mosql/schema.rb', line 52
# Normalizes a database-level meta hash.
#
# The :alias entry is coerced to an array (missing => [], scalar => one
# element) and each element is compiled with Regexp.new. All other keys are
# passed through unchanged. The input hash is copied, not modified.
#
# @param meta [Hash, nil] raw meta section; nil is treated as empty
# @return [Hash] a new hash whose :alias is an Array of Regexp
def parse_meta(meta)
  meta = meta.nil? ? {} : meta.dup
  aliases = meta.key?(:alias) ? meta[:alias] : []
  aliases = [aliases] unless aliases.is_a?(Array)
  meta[:alias] = aliases.map { |r| Regexp.new(r) }
  meta
end
#parse_spec(ns, spec) ⇒ Object
45 46 47 48 49 50 |
# File 'lib/mosql/schema.rb', line 45
# Produces the parsed form of a collection spec.
#
# @param ns [String] namespace, forwarded to check_columns! for messages
# @param spec [Hash] raw spec; must contain :columns
# @return [Hash] shallow copy of spec whose :columns is the to_array result
# @raise [KeyError] when spec has no :columns
# @raise [SchemaError] from to_array or check_columns!
def parse_spec(ns, spec)
  spec.dup.tap do |parsed|
    parsed[:columns] = to_array(spec.fetch(:columns))
    check_columns!(ns, parsed)
  end
end
#primary_sql_key_for_ns(ns) ⇒ Object
292 293 294 |
# File 'lib/mosql/schema.rb', line 292
# Returns the SQL column name mapped from the '_id' source of a namespace.
#
# @param ns [String] namespace
# @return the :name of the column whose :source is '_id'
# @raise [SchemaError] when the namespace is unmapped (via find_ns!) or its
#   mapping has no column sourced from '_id'
def primary_sql_key_for_ns(ns)
  id_column = find_ns!(ns)[:columns].find { |c| c[:source] == '_id' }
  if id_column.nil?
    # Fail with a schema-level message rather than a NoMethodError on nil.
    raise SchemaError.new("No column with source '_id' in mapping for namespace: #{ns}")
  end
  id_column[:name]
end
#quote_copy(val) ⇒ Object
261 262 263 264 265 266 267 268 269 270 271 272 273 274 |
# File 'lib/mosql/schema.rb', line 261
# Renders one value as a field of a tab-separated COPY line.
#
# @param val value to encode
# @return [String, nil] "\\N" for nil, 't' / 'f' for booleans, nil for a
#   Sequel::SQL::Function, and otherwise val.to_s with every backslash,
#   tab, newline and carriage return prefixed by a backslash
def quote_copy(val)
  return "\\N" if val.nil?
  return 't' if val.equal?(true)
  return 'f' if val.equal?(false)
  return nil if val.is_a?(Sequel::SQL::Function)

  val.to_s.gsub(/([\\\t\n\r])/, '\\\\\\1')
end
#sanitize(value) ⇒ Object
204 205 206 207 208 209 210 211 212 213 214 215 216 217 218 219 220 221 222 |
# File 'lib/mosql/schema.rb', line 204
# Recursively prepares a value for JSON serialization.
#
# Hashes and arrays are rebuilt with sanitized members; everything else is
# returned as is, except for the two cases commented below.
#
# @param value any document value
# @return the sanitized copy (or the value itself for untouched scalars)
def sanitize(value)
  case value
  when Hash
    value.each_with_object({}) do |(key, member), clean|
      clean[key] = sanitize(member)
    end
  when Array
    value.map { |member| sanitize(member) }
  when BSON::Binary
    # Binary blobs may hold bytes that are not valid UTF-8, which to_json
    # will not encode properly, so they are Base64-encoded.
    Base64.encode64(value.to_s)
  when Float
    # NaN is not legal JSON; it becomes null.
    value.nan? ? nil : value
  else
    value
  end
end
#table_for_ns(ns) ⇒ Object
280 281 282 |
# File 'lib/mosql/schema.rb', line 280
# Returns the SQL table name configured for a namespace.
#
# @param ns [String] namespace
# @return the :table entry of the collection's :meta
# @raise [SchemaError] via find_ns! when ns has no mapping
def table_for_ns(ns)
  collection_meta = find_ns!(ns)[:meta]
  collection_meta[:table]
end
#to_array(lst) ⇒ Object
7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24 25 26 27 28 29 30 31 32 33 |
# File 'lib/mosql/schema.rb', line 7
# Converts the configured column list into uniform column hashes.
#
# Two entry shapes are accepted:
# * new format: a Hash with String :source and :type; the column name is
#   the first remaining key of the entry
# * old format: a single-pair Hash { name => type }, where the name also
#   serves as the source
#
# When the type reads "<something> array" (case-insensitive), the part
# before "array" is recorded under :array_type.
#
# @param lst [Array<Hash>] raw column entries
# @return [Array<Hash>] hashes with :source, :name, :type and optionally
#   :array_type
# @raise [SchemaError] for an entry matching neither shape
def to_array(lst)
  lst.map do |ent|
    col =
      if ent.is_a?(Hash) && ent[:source].is_a?(String) && ent[:type].is_a?(String)
        # new configuration format
        {
          :source => ent.fetch(:source),
          :type   => ent.fetch(:type),
          :name   => (ent.keys - [:source, :type]).first,
        }
      elsif ent.is_a?(Hash) && ent.keys.length == 1 && ent.values.first.is_a?(String)
        name, type = ent.first
        { :source => name, :name => name, :type => type }
      else
        raise SchemaError.new("Invalid ordered hash entry #{ent.inspect}")
      end

    array_match = /\A(.+)\s+array\z/i.match(col[:type])
    col[:array_type] = array_match[1] if array_match

    col
  end
end
#transform(ns, obj, schema = nil) ⇒ Object
162 163 164 165 166 167 168 169 170 171 172 173 174 175 176 177 178 179 180 181 182 183 184 185 186 187 188 189 190 191 192 193 194 195 196 197 198 199 200 201 202 |
# File 'lib/mosql/schema.rb', line 162
# Converts a document into an array of SQL values, one per mapped column,
# in column order.
#
# Special ("$"-prefixed) sources are resolved by fetch_special_source. All
# other sources are pulled out of a copy of the document with
# fetch_and_delete_dotted and converted by type: BSON binaries, object ids
# and symbols become strings, DBRefs become the string form of their
# object_id, hashes become JSON text, and arrays become either a Postgres
# array (when the column has an :array_type) or JSON text. When
# schema[:meta][:extra_props] is set, whatever is left of the document is
# sanitized and appended as a JSON string.
#
# NOTE(review): obj.dup is a shallow copy, so the deletes performed by
# fetch_and_delete_dotted on nested hashes appear to reach the caller's
# nested objects -- confirm whether callers rely on obj staying intact.
#
# @param ns [String] namespace, used to look up the schema when none is given
# @param obj [Hash] source document
# @param schema [Hash, nil] parsed collection spec; defaults to find_ns!(ns)
# @return [Array] the row values
def transform(ns, obj, schema=nil)
  schema ||= find_ns!(ns)
  remaining = obj.dup

  row = schema[:columns].map do |col|
    source = col[:source]

    if source.start_with?("$")
      fetch_special_source(remaining, source)
    else
      value = fetch_and_delete_dotted(remaining, source)
      case value
      when BSON::Binary, BSON::ObjectId, Symbol
        value.to_s
      when BSON::DBRef
        value.object_id.to_s
      when Hash
        JSON.dump(value)
      when Array
        if col[:array_type]
          Sequel.pg_array(value, col[:array_type])
        else
          JSON.dump(value)
        end
      else
        value
      end
    end
  end

  # Everything not claimed by a column goes into the trailing JSON blob.
  row << JSON.dump(sanitize(remaining)) if schema[:meta][:extra_props]

  log.debug { "Transformed: #{row.inspect}" }

  row
end
#transform_to_copy(ns, row, schema = nil) ⇒ Object
276 277 278 |
# File 'lib/mosql/schema.rb', line 276
# Encodes a transformed row as one tab-separated COPY line (no newline).
#
# Values for which quote_copy returns nil are left out of the line.
#
# @param ns namespace (not consulted)
# @param row [Array] row values
# @param schema collection spec (not consulted)
# @return [String] the encoded fields joined by tabs
def transform_to_copy(ns, row, schema=nil)
  fields = row.map { |cell| quote_copy(cell) }
  fields.compact.join("\t")
end