dodb.cr/src/fsdb.cr

364 lines
7.7 KiB
Crystal
Raw Normal View History

2018-11-19 21:06:36 +01:00
2019-07-24 02:19:57 +02:00
require "file_utils"
2018-11-19 21:06:36 +01:00
require "json"
# Contract shared by every secondary structure kept next to the primary
# data files: the concrete indexers in this file are `FSDB::Partition`,
# `FSDB::Index` and `FSDB::Tags`.
#
# `V` is the type of the stored values.
abstract class FSDB::Indexer(V)
  # Name identifying this indexer.
  abstract def name : String

  # Called before *value* is stored under *key*; *old_value* is the value
  # currently stored under that key, if any.
  abstract def check!(key : String, value : V, old_value : V?)

  # Registers *value*, stored under *key*, with this indexer.
  abstract def index(key : String, value : V)

  # Undoes what `#index` did for *value* stored under *key*.
  abstract def deindex(key : String, value : V)
end
2018-11-19 23:35:49 +01:00
# Groups stored values by the string returned by `key_proc`.
#
# On disk, every partition is a directory
# `<storage_root>/partitions/by_<name>/<partition>/` that contains one
# symlink per entry, named `<key>.json` and pointing (relatively) at
# `<storage_root>/data/<key>.json`.
class FSDB::Partition(V) < FSDB::Indexer(V)
  property name : String
  property key_proc : Proc(V, String)
  getter storage_root : String

  # Creates the base directory of this partition table if it is missing.
  def initialize(@storage_root, @name, @key_proc)
    ::Dir.mkdir_p get_partition_directory
  end

  # Always accepts the value.
  def check!(key, value, old_value)
    return true # Partitions don't have collisions or overloads.
  end

  # Creates the symlink for *key* inside the partition computed from
  # *value*, creating the partition directory when needed.
  def index(key, value)
    partition = key_proc.call value
    symlink = get_partition_symlink(partition, key)

    ::Dir.mkdir_p ::File.dirname symlink

    # FIXME: Should not happen anymore. Should we remove this?
    ::File.delete symlink if ::File.exists? symlink

    ::File.symlink get_data_symlink(key), symlink
  end

  # Deletes the symlink for *key* from the partition computed from *value*.
  # `File.delete` raises if that symlink does not exist.
  def deindex(key, value)
    partition = key_proc.call value
    symlink = get_partition_symlink(partition, key)

    ::File.delete symlink
  end

  # Returns every value found in *partition*.
  #
  # A partition whose directory does not exist yields an empty array
  # instead of an error from `Dir.each_child`, which matches what
  # `FSDB::Tags#get` does for a tag without directory.
  def get(partition)
    r_value = Array(V).new

    partition_directory = get_partition_directory partition
    return r_value unless ::Dir.exists? partition_directory

    ::Dir.each_child partition_directory do |child|
      r_value << V.from_json ::File.read "#{partition_directory}/#{child}"
    end

    r_value
  end

  # Base directory holding all partitions of this table.
  private def get_partition_directory
    "#{@storage_root}/partitions/by_#{@name}"
  end

  # Directory of a single partition.
  private def get_partition_directory(partition)
    "#{get_partition_directory}/#{partition}"
  end

  # Path of the symlink representing *key* inside *partition*.
  private def get_partition_symlink(partition : String, key : String)
    "#{get_partition_directory partition}/#{key}.json"
  end

  # Symlink target, relative to the partition directory: three levels up
  # is the storage root.
  private def get_data_symlink(key : String)
    "../../../data/#{key}.json"
  end
end
# Maps the string computed by `key_proc` to a single stored value.
#
# Each entry is a symlink `<storage_root>/indices/by_<name>/<index_key>.json`
# pointing (relatively) at `<storage_root>/data/<key>.json`.
class FSDB::Index(V) < FSDB::Indexer(V)
  property name : String
  property key_proc : Proc(V, String)
  getter storage_root : String

  # Creates the directory of this index if it is missing.
  def initialize(@storage_root, @name, @key_proc)
    ::Dir.mkdir_p dir_path_indices
  end

  # Raises `IndexOverload` when the index entry computed from *value*
  # already exists, unless *old_value* computes to that very same entry.
  def check!(key, value, old_value)
    symlink = file_path_index(key_proc.call(value).to_s)

    # Nothing is registered under that index key: no collision possible.
    return unless ::File.exists? symlink

    # FIXME: Check it's not pointing to “old_value”, if any, before raising.
    if old_value
      return if symlink == file_path_index(key_proc.call(old_value).to_s)
    end

    raise IndexOverload.new "Index '#{@name}' is overloaded for key '#{key}'"
  end

  # Creates the index symlink for *value*, pointing at the data file of
  # *key*. Raises if a symlink already exists at that path.
  def index(key, value)
    symlink = file_path_index(key_proc.call(value))

    ::Dir.mkdir_p ::File.dirname(symlink)

    # FIXME: Now that this is done in check!, can we remove it?
    raise Exception.new "symlink already exists: #{symlink}" if ::File.exists? symlink

    ::File.symlink get_data_symlink_index(key), symlink
  end

  # Deletes the index symlink computed from *value*.
  def deindex(key, value)
    ::File.delete file_path_index(key_proc.call(value))
  end

  # Reads and parses the value registered under *index*.
  # `File.read` raises when no such entry exists.
  def get(index : String) : V?
    V.from_json ::File.read(file_path_index(index))
  end

  # Directory holding every entry of this index.
  private def dir_path_indices
    "#{@storage_root}/indices/by_#{@name}"
  end

  # Path of the symlink for *index_key*.
  private def file_path_index(index_key : String)
    "#{dir_path_indices}/#{index_key}.json"
  end

  # Symlink target, relative to the index directory: two levels up is the
  # storage root.
  private def get_data_symlink_index(key : String)
    "../../data/#{key}.json"
  end
end
# Associates each stored value with any number of tags, as returned by
# `key_proc`.
#
# Each tag is a directory `<storage_root>/by_tags/by_<name>/<tag>/` that
# contains one symlink per tagged entry, named `<key>.json` and pointing
# (relatively) at `<storage_root>/data/<key>.json`.
class FSDB::Tags(V) < FSDB::Indexer(V)
  property name : String
  property key_proc : Proc(V, Array(String))
  getter storage_root : String

  # Creates the base directory of this tag set if it is missing.
  def initialize(@storage_root, @name, @key_proc)
    ::Dir.mkdir_p get_tag_directory
  end

  # Creates one symlink per distinct tag of *value*.
  def index(key, value)
    # A tag listed twice maps to the same symlink; handle it only once.
    key_proc.call(value).uniq.each do |index_key|
      symlink = get_tagged_entry_path(key.to_s, index_key)

      ::Dir.mkdir_p ::File.dirname symlink

      ::File.delete symlink if ::File.exists? symlink

      ::File.symlink get_data_symlink(key), symlink
    end
  end

  # Deletes the symlink of *key* from every distinct tag of *value*.
  def deindex(key, value)
    # Without `uniq`, a tag listed twice would make the second
    # `File.delete` raise because the symlink is already gone.
    key_proc.call(value).uniq.each do |index_key|
      ::File.delete get_tagged_entry_path(key, index_key)
    end
  end

  # Always accepts the value.
  def check!(key, value, old_value)
    return true # Tags don't have collisions or overloads.
  end

  # Returns every value tagged with *key*, or an empty array when the tag
  # has no directory. *name* is accepted but not used.
  def get(name, key) : Array(V)
    r_value = Array(V).new

    partition_directory = "#{get_tag_directory}/#{key}"
    return r_value unless ::Dir.exists? partition_directory

    ::Dir.each_child partition_directory do |child|
      r_value << V.from_json ::File.read "#{partition_directory}/#{child}"
    end

    r_value
  end

  # Base directory holding all tags of this tag set.
  private def get_tag_directory
    "#{@storage_root}/by_tags/by_#{@name}"
  end

  # Path of the symlink representing *key* under the tag *index_key*.
  private def get_tagged_entry_path(key : String, index_key : String)
    "#{get_tag_directory}/#{index_key}/#{key}.json"
  end

  # Symlink target, relative to the tag directory: three levels up is the
  # storage root.
  private def get_data_symlink(key)
    "../../../data/#{key}.json"
  end
end
# Error raised by `FSDB::Index#check!` when the index entry a value would
# occupy already exists.
class FSDB::IndexOverload < Exception
end
# File-system backed key/value store.
#
# Every value is serialized to JSON in `<directory_name>/data/<key>.json`.
# Indexers (partitions, indices, tags) registered on the database are
# kept up to date on every write and delete.
#
# `K` is the key type and `V` the value type.
class FSDB::DataBase(K, V)
  @indexers = [] of Indexer(V)

  # Opens the database rooted at *directory_name*, creating its data
  # directory if it is missing.
  def initialize(@directory_name : String)
    Dir.mkdir_p data_path
  end

  ##
  # name is the name that will be used on the file system.
  def new_partition(name : String, &block : Proc(V, String))
    Partition(V).new(@directory_name, name, block).tap do |table|
      @indexers << table
    end
  end

  ##
  # name is the name that will be used on the file system.
  def new_index(name : String, &block : Proc(V, String))
    Index(V).new(@directory_name, name, block).tap do |indexer|
      @indexers << indexer
    end
  end

  ##
  # name is the name that will be used on the file system.
  def new_tags(name : String, &block : Proc(V, Array(String)))
    Tags(V).new(@directory_name, name, block).tap do |tags|
      @indexers << tags
    end
  end

  # Looks *key* up in the index called *name*.
  # Raises if no indexer has that name or if it is not an `Index`.
  def get_index(name : String, key)
    index = @indexers.find &.name.==(name)

    index.not_nil!.as(FSDB::Index).get key
  end

  # Returns the values of *partition_name* in the partition table called
  # *table_name*.
  # Raises if no indexer has that name or if it is not a `Partition`.
  # FIXME: Is this “key” really a K, not just a String?
  def get_partition(table_name : String, partition_name : String)
    partition = @indexers.find &.name.==(table_name)

    partition.not_nil!.as(FSDB::Partition).get partition_name
  end

  # Returns the values tagged with *key* in the tag set called *name*.
  # Raises if no indexer has that name or if it is not a `Tags`.
  def get_tags(name, key : K)
    partition = @indexers.find &.name.==(name)

    partition.not_nil!.as(FSDB::Tags).get name, key
  end

  # Returns the value stored under *key*, or `nil` if reading or parsing
  # it fails for any reason.
  def []?(key : K) : V?
    begin
      read file_path key
    rescue
      # FIXME: Only rescue JSON and “no such file” errors.
      return nil
    end
  end

  # Returns the value stored under *key*; raises if it cannot be read or
  # parsed.
  def [](key : K) : V
    read file_path key
  end

  # Stores *value* under *key*, replacing any previous value, and updates
  # every registered indexer. Indexers may raise from `check!` before
  # anything is modified.
  def []=(key : K, value : V)
    old_value = self[key]?

    check_collisions! key, value, old_value

    # Removes any old indices or partitions pointing to a value about
    # to be replaced.
    if old_value
      remove_partitions key, old_value
    end

    # Avoids corruption in case the application crashes while writing.
    file_path(key).tap do |path|
      ::File.write "#{path}.new", value.to_json
      ::FileUtils.mv "#{path}.new", path
    end

    write_partitions key, value
  end

  # Runs `check!` on every registered indexer.
  def check_collisions!(key : K, value : V, old_value : V?)
    @indexers.each &.check!(key, value, old_value)
  end

  # Runs `index` on every registered indexer.
  def write_partitions(key : K, value : V)
    @indexers.each &.index(key, value)
  end

  # Deletes the entry stored under *key* and its indexer entries.
  # Returns the deleted value, or `nil` when nothing was stored.
  def delete(key : K)
    value = self[key]?

    return if value.nil?

    begin
      ::File.delete file_path key
    rescue
      # FIXME: Only intercept “no such file" errors
    end

    remove_partitions key, value

    value
  end

  # Runs `deindex` on every registered indexer.
  def remove_partitions(key : K, value : V)
    @indexers.each &.deindex(key, value)
  end

  ##
  # CAUTION: Very slow. Try not to use.
  # Can be useful for making dumps or to restore a database, however.
  #
  # Yields each key (the file name without ".json") with its value.
  # Unreadable or unparsable files are silently skipped.
  def each
    dirname = data_path
    Dir.each_child dirname do |child|
      next if child.starts_with? "."

      # Only "<key>.json" files are entries. In particular this skips a
      # "<key>.json.new" temporary file left behind by an interrupted
      # `[]=`, which would otherwise be yielded under a bogus key.
      next unless child.ends_with? ".json"

      full_path = "#{dirname}/#{child}"

      begin
        # FIXME: Only intercept JSON parsing errors.
        field = read full_path
      rescue
        next
      end

      # FIXME: Will only work for String. :(
      key = child.chomp ".json"

      yield key, field
    end
  end

  ##
  # CAUTION: Very slow. Try not to use.
  #
  # Loads the whole database into a Hash.
  def to_h
    hash = ::Hash(K, V).new

    each do |key, value|
      hash[key] = value
    end

    hash
  end

  # Directory holding the primary JSON files.
  private def data_path
    "#{@directory_name}/data"
  end

  # Path of the JSON file storing the value of *key*.
  private def file_path(key : K)
    "#{data_path}/#{key.to_s}.json"
  end

  # Reads and parses the JSON file at *file_path*.
  private def read(file_path : String)
    V.from_json ::File.read file_path
  end
end