#!/usr/bin/env ruby

require "cgi"
require "date"
require "digest/md5"
require "json"
require "logger"
require "yaml"

require "active_support/core_ext/hash"
require "redis"
require "rest_client"

# Copies the metadata of one user's stored items from a Swift container into
# Redis.
#
# The migration walks the user's container directory by directory, starting at
# the root listing. For every item it writes a Redis hash at
# "rs:m:<username>:<path>" and adds the item name to the set
# "rs:m:<username>:<directory>:items" of the directory that contains it.
#
# While the migration runs, the key "rsc:db:<username>" is set to
# "legacy_locked"; it is set to "new" on success and back to "legacy" on
# failure.
#
# Configuration is read from the process environment:
#   ENVIRONMENT - section of config.yml to use (default: "staging")
#   DRYRUN      - when set to a truthy value, nothing is written to Redis
#   LOGLEVEL    - name of a Logger severity (default: "INFO")
class Migrator
  # DRYRUN values (after stripping and downcasing) that mean "not a dry run".
  FALSY_ENV_VALUES = ["", "0", "false", "no", "off"].freeze

  attr_accessor :username, :swift_host, :swift_token,
                :environment, :dry_run, :settings, :logger
  # The reader for base_url is defined explicitly below (it falls back to
  # swift_host), so only the writer is generated here.
  attr_writer :base_url

  # Interprets the value of a boolean-style environment variable.
  #
  # @param value [String, nil] raw value, e.g. ENV["DRYRUN"]
  # @return [Boolean] false for nil, "", "0", "false", "no" and "off"
  #   (case-insensitive, surrounding whitespace ignored); true otherwise
  def self.env_flag?(value)
    !FALSY_ENV_VALUES.include?(value.to_s.strip.downcase)
  end

  # Reads config.yml, tmp/swift_token.txt and the environment, and opens the
  # log file log/migrate_metadata_to_redis.log.
  #
  # @param username [String] user whose metadata is migrated
  # @raise [ArgumentError] if config.yml has no section for the environment
  def initialize(username)
    @username = username

    @environment = ENV["ENVIRONMENT"] || "staging"
    # NOTE(review): YAML.load is kept as in the original; config.yml is
    # assumed to be a trusted local file.
    @settings = YAML.load(File.read("config.yml")).fetch(@environment) do
      raise ArgumentError, "No settings for environment '#{@environment}' in config.yml"
    end

    @swift_host = @settings["swift"]["host"]
    @swift_token = File.read("tmp/swift_token.txt").strip

    # Disables writing anything to Redis when true. "DRYRUN=false" or
    # "DRYRUN=0" do NOT enable a dry run.
    @dry_run = self.class.env_flag?(ENV["DRYRUN"])

    @logger = Logger.new("log/migrate_metadata_to_redis.log")
    log_level = ENV["LOGLEVEL"] || "INFO"
    # upcase so that e.g. LOGLEVEL=debug is accepted as well
    logger.level = Logger.const_get(log_level.upcase)
    logger.progname = username
  end

  # @return [String] "<base_url>/<username>"
  def root_url
    # Goes through the base_url reader so the swift_host fallback applies even
    # when base_url has not been accessed before.
    "#{base_url}/#{username}"
  end

  # @param name [String] item name
  # @return [Boolean] true when the name ends with "/"
  def is_dir?(name)
    name.end_with?("/")
  end

  # @return [String] root_url directly followed by parent_directory and
  #   directory (no separator is inserted)
  def url_for(directory, parent_directory="")
    "#{root_url}#{parent_directory}#{directory}"
  end

  # Runs the complete migration for the user.
  #
  # On any error the user is recorded in log/failed_migration.log, the backend
  # marker is reset to "legacy" and the process exits with status 1.
  def migrate
    logger.info "Starting migration for '#{username}'"
    set_directory_backend("legacy_locked")

    begin
      work_on_dir("", "")
    rescue Exception => ex
      # Exception (not just StandardError) is rescued on purpose: the
      # "legacy_locked" marker must also be rolled back when the run is
      # interrupted by a signal, and the process terminates right below.
      logger.error "Error migrating metadata for '#{username}': #{ex}"
      # Write username to file for later reference. This happens before the
      # Redis call so the record is kept even if Redis is what failed.
      File.open("log/failed_migration.log", "a") { |f| f.puts username }
      set_directory_backend("legacy")
      exit 1
    end

    set_directory_backend("new")
    logger.info "Finished migration for '#{username}'"
  end

  # Stores the backend marker for the user under "rsc:db:<username>"
  # (skipped in dry-run mode).
  #
  # @param backend [String] value to store, e.g. "legacy_locked"
  def set_directory_backend(backend)
    redis.set("rsc:db:#{username}", backend) unless dry_run
  end

  # Migrates every item listed for parent_directory + directory and recurses
  # into each item that is itself a directory.
  #
  # @param directory [String] directory name ("" for the root)
  # @param parent_directory [String] path the directory lives in
  def work_on_dir(directory, parent_directory)
    path = "#{parent_directory}#{directory}"
    logger.debug "Retrieving listing for '#{path}'"

    listing = get_directory_listing_from_swift(path)
    timestamp = (Time.now.to_f * 1000).to_i

    listing["items"].each do |item, data|
      if is_dir? item
        save_directory_data(path, item, data, timestamp)
        # get dir listing and repeat
        work_on_dir(item, path)
      else
        save_document_data(path, item, data)
      end

      add_item_to_parent_dir(path, item)
    end
  end

  # Adds item to the "items" set of the directory that contains it.
  #
  # @param dir [String] path of the containing directory ("" for the root)
  # @param item [String] item name
  def add_item_to_parent_dir(dir, item)
    key = "rs:m:#{username}:#{parent_directory_for(dir)}:items"
    logger.debug "Adding item #{item} to #{key}"
    redis.sadd(key, item) unless dry_run
  end

  # Writes the metadata hash (e: ETag, m: modification time in ms) for a
  # directory.
  #
  # @param dir [String] path of the containing directory
  # @param item [String] directory name
  # @param data [Hash] listing data with "ETag" and "Last-Modified"
  # @param timestamp [Integer] accepted for interface compatibility; not
  #   stored
  def save_directory_data(dir, item, data, timestamp)
    key = metadata_key(dir, item)
    metadata = {
      e: data["ETag"],
      m: timestamp_for(data["Last-Modified"])
    }

    logger.debug "Metadata for dir #{key}: #{metadata}"
    write_metadata(key, metadata)
  end

  # Writes the metadata hash (e: ETag, s: size, t: content type,
  # m: modification time in ms) for a document.
  #
  # @param dir [String] path of the containing directory
  # @param item [String] document name
  # @param data [Hash] listing data with "ETag", "Content-Length",
  #   "Content-Type" and "Last-Modified"
  def save_document_data(dir, item, data)
    key = metadata_key(dir, item)
    metadata = {
      e: data["ETag"],
      s: data["Content-Length"],
      t: data["Content-Type"],
      m: timestamp_for(data["Last-Modified"])
    }

    logger.debug "Metadata for document #{key}: #{metadata}"
    write_metadata(key, metadata)
  end

  # Returns the portion of directory up to and including its last "/", or "/"
  # when it contains no slash. For a path that already ends in "/" this is the
  # path itself.
  #
  # @param directory [String]
  # @return [String]
  def parent_directory_for(directory)
    return "/" unless directory.include?("/")

    directory[0..directory.rindex("/")]
  end

  # @param date [String] date/time string understood by DateTime.parse
  # @return [Integer] milliseconds since the Unix epoch
  def timestamp_for(date)
    # DateTime (rather than Time) is kept deliberately: DateTime.parse treats
    # a string without zone information as UTC, Time.parse as local time.
    DateTime.parse(date).strftime("%Q").to_i
  end

  # @return [Redis] lazily created client configured from settings["redis"]
  def redis
    @redis ||= Redis.new(@settings["redis"].symbolize_keys)
  end

  # Fetches the listing of a directory from Swift.
  #
  # @param directory [String] directory path ("" for the container root)
  # @return [Hash] see #directory_listing; an empty listing when the HEAD
  #   request for the directory answers 404
  # @raise [RuntimeError] if the response body is not a JSON list
  def get_directory_listing_from_swift(directory)
    do_head_request(url_for_directory(@username, directory)) do |response|
      return directory_listing([]) if response.code == 404
    end

    # escape("") is "", so the root listing needs no special case.
    get_response = do_get_request("#{container_url_for(@username)}/?format=json&path=#{escape(directory)}")

    body = JSON.parse(get_response.body)
    unless body.is_a?(Array)
      raise "Unexpected (non-list) directory listing from Swift for '#{directory}'"
    end

    directory_listing(body)
  end

  # Converts the entries of a Swift listing into a folder description.
  #
  # @param res_body [Array<Hash>] entries with "name", "hash",
  #   "last_modified" and, for files, "content_type" and "bytes"
  # @return [Hash] { "@context" => ..., "items" => { name => metadata } }
  #   where name is the last path segment (with a trailing "/" for
  #   directories)
  def directory_listing(res_body)
    listing = {
      "@context" => "http://remotestorage.io/spec/folder-description",
      "items" => {}
    }

    res_body.each do |entry|
      name = item_name_for(entry["name"])

      listing["items"][name] =
        if is_dir?(name)
          {
            "ETag" => entry["hash"],
            "Last-Modified" => entry["last_modified"]
          }
        else
          {
            "ETag" => entry["hash"],
            "Content-Type" => entry["content_type"],
            "Content-Length" => entry["bytes"],
            "Last-Modified" => entry["last_modified"]
          }
        end
    end

    listing
  end

  # @param body [String] JSON list of objects that each have a "hash"
  # @return [String] MD5 hex digest of all hashes concatenated (the digest of
  #   "" for an empty list)
  def etag_for(body)
    Digest::MD5.hexdigest(JSON.parse(body).map { |object| object["hash"] }.join)
  end

  # Issues a HEAD request carrying the default headers.
  def do_head_request(url, &block)
    RestClient.head(url, default_headers, &block)
  end

  # Issues a GET request carrying the default headers.
  def do_get_request(url, &block)
    RestClient.get(url, default_headers, &block)
  end

  # @return [Hash] headers sent with every request
  def default_headers
    {"x-auth-token" => @swift_token}
  end

  # @return [String] URL of the directory inside the user's container (the
  #   container URL itself for the empty directory)
  def url_for_directory(user, directory)
    return container_url_for(user) if directory.empty?

    "#{container_url_for(user)}/#{escape(directory)}"
  end

  # @return [String] "<base_url>/<container name>"
  def container_url_for(user)
    "#{base_url}/#{container_for(user)}"
  end

  # @return [String] the explicitly assigned base URL, else the Swift host
  def base_url
    @base_url ||= @swift_host
  end

  # @return [String] "rs:<first character of environment>:<user>"
  def container_for(user)
    "rs:#{environment.to_s.chars.first}:#{user}"
  end

  # @param url [String] path to escape
  # @return [String] CGI-escaped path with spaces as %20 and slashes intact
  def escape(url)
    # We want spaces to turn into %20 and slashes to stay slashes
    CGI.escape(url).gsub("+", "%20").gsub("%2F", "/")
  end

  # Last segment of a full object name, keeping a trailing "/" if present.
  # Does not modify its argument.
  def item_name_for(full_name)
    suffix = full_name.end_with?("/") ? "/" : ""
    "#{full_name.chomp("/").rpartition("/").last}#{suffix}"
  end

  # Redis key of the metadata hash for item inside dir (a single leading "/"
  # of dir is dropped).
  def metadata_key(dir, item)
    "rs:m:#{username}:#{dir.sub(%r{\A/}, "")}#{item}"
  end

  # Stores metadata as a Redis hash at key (skipped in dry-run mode).
  def write_metadata(key, metadata)
    # Hash#flatten yields [field, value, field, value, ...], the argument
    # layout hmset expects.
    redis.hmset(key, *metadata.flatten) unless dry_run
  end
end

# Command-line entry point.
#
# Runs only when this file is executed directly, so loading the file from
# other code does not start a migration or terminate the process.
# Expects the username as the first argument; prints usage to stderr and
# exits with status 1 when it is missing or blank.
if __FILE__ == $PROGRAM_NAME
  username = ARGV[0]

  if username.nil? || username.strip.empty?
    warn "No username given."
    warn "Usage:"
    warn "ENVIRONMENT=staging ./migrate_metadata_to_redis.rb <username>"
    exit 1
  end

  Migrator.new(username).migrate
end