Enable async chunk reading #106

Merged · 9 commits · Apr 12, 2023
3 changes: 2 additions & 1 deletion Project.toml
@@ -1,7 +1,7 @@
name = "Zarr"
uuid = "0a941bbe-ad1d-11e8-39d9-ab76183a1d99"
authors = ["Fabian Gans <[email protected]>"]
version = "0.8.0"
version = "0.9.0"

[deps]
AWSS3 = "1c724243-ef5b-51ab-93f4-b0a88ac62a95"
@@ -14,6 +14,7 @@ HTTP = "cd3eb016-35fb-5094-929b-558a96fad6f3"
JSON = "682c06a0-de6a-54ab-a142-c8b1cf79cde6"
LRUCache = "8ac3fa9e-de4c-5943-b1dc-09c6b5f20637"
OffsetArrays = "6fe1bfb0-de20-5000-8ca7-80f57d26f881"
OpenSSL = "4d8831e6-92b7-49fb-bdf8-b643e874388c"
Pkg = "44cfe95a-1eb2-52ea-b672-e2afdf69b78f"
URIs = "5c2747f8-b7ea-4ff2-ba2e-563bfd36b1d4"

4 changes: 2 additions & 2 deletions docs/src/tutorial.md
@@ -171,7 +171,7 @@ A number of different compressors can be used with Zarr. In this Julia package w
julia> using Zarr

julia> compressor = Zarr.BloscCompressor(cname="zstd", clevel=3, shuffle=true)
-Zarr.BloscCompressor(0, 3, "zstd", 1)
+Zarr.BloscCompressor(0, 3, "zstd", true)

julia> data = Int32(1):Int32(100000000)
1:100000000
@@ -195,7 +195,7 @@ Shape : (10000, 10000)
Chunk Shape : (1000, 1000)
Order : C
Read-Only : false
-Compressor : Zarr.BloscCompressor(0, 3, "zstd", 1)
+Compressor : Zarr.BloscCompressor(0, 3, "zstd", true)
Filters : nothing
Store type : Dictionary Storage
No. bytes : 400000000
14 changes: 14 additions & 0 deletions src/Compressors.jl
@@ -62,6 +62,20 @@ end

zuncompress(a, ::BloscCompressor, T) = Blosc.decompress(Base.nonmissingtype(T), a)

function zuncompress!(data::DenseArray, compressed, ::BloscCompressor)
    # Decompress directly into the destination buffer, avoiding the extra
    # allocation that zuncompress makes
    Blosc.decompress!(vec(data), compressed)
end


function zcompress(a, c::BloscCompressor)
    itemsize = sizeof(eltype(a))
    shuffle = c.shuffle
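
For readers skimming this diff: the new zuncompress! complements the existing zuncompress by decompressing into a caller-supplied buffer instead of allocating a fresh one. A minimal usage sketch, assuming zcompress returns the compressed byte vector (as its use elsewhere in the package suggests); the sizes are illustrative:

# Sketch: allocating vs. in-place decompression (illustrative sizes)
using Zarr

c = Zarr.BloscCompressor(cname = "zstd", clevel = 3, shuffle = true)
data = collect(Int32, 1:1000)
compressed = Zarr.zcompress(data, c)

out = Zarr.zuncompress(compressed, c, Int32)   # allocates a new vector

buf = zeros(Int32, 1000)                       # preallocated destination
Zarr.zuncompress!(buf, compressed, c)          # fills buf in place
@assert buf == out == data
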
61 changes: 61 additions & 0 deletions src/Storage/Storage.jl
@@ -94,6 +94,67 @@ function writemetadata(s::AbstractStore, p, m::Metadata)
end


## Handling sequential vs parallel IO
struct SequentialRead end
struct ConcurrentRead
    ntasks::Int
end
store_read_strategy(::AbstractStore) = SequentialRead()

channelsize(s) = channelsize(store_read_strategy(s))
channelsize(::SequentialRead) = 0
channelsize(c::ConcurrentRead) = c.ntasks

read_items!(s::AbstractStore, c::AbstractChannel, p, i) = read_items!(s, c, store_read_strategy(s), p, i)
function read_items!(s::AbstractStore, c::AbstractChannel, ::SequentialRead, p, i)
    for ii in i
        res = s[p, ii]
        put!(c, ii => res)
    end
end
function read_items!(s::AbstractStore, c::AbstractChannel, r::ConcurrentRead, p, i)
    # Launch up to ntasks concurrent fetches and push each result into the channel
    ntasks = r.ntasks
    asyncmap(i, ntasks = ntasks) do ii
        res = s[p, ii]
        put!(c, ii => res)
        nothing
    end
end

write_items!(s::AbstractStore, c::AbstractChannel, p, i) = write_items!(s, c, store_read_strategy(s), p, i)
function write_items!(s::AbstractStore, c::AbstractChannel, ::SequentialRead, p, i)
    for _ in 1:length(i)
        ii, data = take!(c)
        if data === nothing
            # A `nothing` payload marks a chunk to be deleted
            if isinitialized(s, p, ii)
                delete!(s, p, ii)
            end
        else
            s[p, ii] = data
        end
    end
    close(c)
end

function write_items!(s::AbstractStore, c::AbstractChannel, r::ConcurrentRead, p, i)
    ntasks = r.ntasks
    asyncmap(i, ntasks = ntasks) do _
        ii, data = take!(c)
        if data === nothing
            # The prefix `p` must be passed here as in the sequential method above
            if isinitialized(s, p, ii)
                delete!(s, p, ii)
            end
        else
            s[p, ii] = data
        end
        nothing
    end
    close(c)
end

isemptysub(s::AbstractStore, p) = isempty(subkeys(s,p)) && isempty(subdirs(s,p))

#Here different storage backends can register regexes that are checked against
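
To sketch how these pieces fit together: read_items! is a producer that pushes index => bytes pairs into a channel, sized via channelsize, while a consumer (the chunk-assembly code, which is not part of this diff) takes results as they arrive. An illustration under stated assumptions — `store` and `p` are placeholders, CartesianIndex chunk ids are an assumption about what the store's getindex accepts, and the real consumer uses a concrete channel element type:

# Producer/consumer sketch for the new read path (names assumed, see above)
chunks = [CartesianIndex(1, 1), CartesianIndex(1, 2), CartesianIndex(2, 1)]
ch = Channel{Pair}(channelsize(store))

@async read_items!(store, ch, p, chunks)   # sequential or concurrent, per store

for _ in 1:length(chunks)
    ii, raw = take!(ch)   # raw === nothing marks an uninitialized chunk
    # ... decompress raw into the output array at position ii ...
end
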
1 change: 1 addition & 0 deletions src/Storage/consolidated.jl
@@ -61,6 +61,7 @@ function Base.delete!(d::ConsolidatedStore, i::String)
    delete!(d.parent, i)
end

store_read_strategy(s::ConsolidatedStore) = store_read_strategy(s.parent)

function consolidate_metadata(s::AbstractStore, d, prefix)
    for k in (".zattrs", ".zarray", ".zgroup")
2 changes: 2 additions & 0 deletions src/Storage/gcstore.jl
@@ -146,3 +146,5 @@ function storefromstring(::Type{<:GCStore}, url, _)
    @debug "path: $p"
    return GCStore(url), p
end

store_read_strategy(::GCStore) = ConcurrentRead(concurrent_io_tasks[])
5 changes: 4 additions & 1 deletion src/Storage/http.jl
@@ -1,4 +1,5 @@
using HTTP
using OpenSSL: OpenSSL

"""
HTTPStore
@@ -13,7 +14,7 @@ struct HTTPStore <: AbstractStore
end

function Base.getindex(s::HTTPStore, k::String)
-    r = HTTP.request("GET", string(s.url, "/", k), status_exception = false)
+    r = HTTP.request("GET", string(s.url, "/", k), status_exception = false, socket_type_tls = OpenSSL.SSLStream, connection_limit = 25)
    if r.status >= 300
        if r.status == 404
            nothing
@@ -25,10 +26,12 @@ else
end
end


push!(storageregexlist,r"^https://"=>HTTPStore)
push!(storageregexlist,r"^http://"=>HTTPStore)
storefromstring(::Type{<:HTTPStore}, s,_) = ConsolidatedStore(HTTPStore(s),""),""

store_read_strategy(::HTTPStore) = ConcurrentRead(concurrent_io_tasks[])
Review comment:
If we are using channels, then I think it would be better to raise the default concurrent_io_tasks size to around 100 rather than the current default (10). That corresponds to the maximum number of concurrent connections in aiohttp, for example, and I think it is better to prioritize runtime over memory usage; users would then set this lower only if they need to do suboptimal chunk access and want to limit their memory usage.

Collaborator Author:
Ok, I have increased this to 50 for now. Do you still see speedups for 100 tasks compared to 50? If yes, then I am happy to increase this further.
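
For reference, the [] dereference in this diff suggests concurrent_io_tasks is a module-level Ref holding the default task count; assuming so, a user could tune the limit themselves (the dataset URL below is hypothetical):

using Zarr

Zarr.concurrent_io_tasks[] = 100   # assumption: a Ref, per the [] dereference
z = Zarr.zopen("https://example.com/data.zarr")   # hypothetical dataset URL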



## This is a server implementation for Zarr datasets
41 changes: 0 additions & 41 deletions src/Storage/lru.jl

This file was deleted.

2 changes: 2 additions & 0 deletions src/Storage/s3store.jl
@@ -79,3 +79,5 @@ function storefromstring(::Type{<:S3Store}, s, _)
    path = join(decomp[3:end], "/")
    S3Store(String(bucket), aws = AWSS3.AWS.global_aws_config()), path
end

store_read_strategy(::S3Store) = ConcurrentRead(concurrent_io_tasks[])
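
The same one-line hook extends to third-party backends: any AbstractStore can opt into the concurrent read path by overloading store_read_strategy, exactly as GCStore, HTTPStore and S3Store do in this PR. A hypothetical sketch:

# Hypothetical custom backend opting into concurrent reads
struct MyRemoteStore <: Zarr.AbstractStore end

Zarr.store_read_strategy(::MyRemoteStore) = Zarr.ConcurrentRead(Zarr.concurrent_io_tasks[])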