module ParallelUtilities

using Reexport
@reexport using Distributed

# Rank of the current worker, counting from 1 (assumes contiguous worker ids)
worker_rank() = myid() - minimum(workers()) + 1

# Split a contiguous range of num_tasks tasks across num_procs processes and
# return the range of task indices assigned to the process with rank proc_id
function split_across_processors(num_tasks::Integer, num_procs = nworkers(), proc_id = worker_rank())
    if num_procs == 1
        return 1:num_tasks
    end

    num_tasks_per_process, num_tasks_leftover = div(num_tasks, num_procs), mod(num_tasks, num_procs)

    num_tasks_on_proc = num_tasks_per_process + (proc_id <= num_tasks_leftover ? 1 : 0)
    task_start = num_tasks_per_process*(proc_id - 1) + min(num_tasks_leftover + 1, proc_id)

    return task_start:(task_start + num_tasks_on_proc - 1)
end

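# Illustrative example: 10 tasks split across 4 processes are assigned the ranges
# 1:3, 4:6, 7:8 and 9:10 for ranks 1 through 4, so for instance
#   split_across_processors(10, 4, 2) == 4:6
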
# Split a finite iterable across num_procs processes and return an iterator
# over the elements assigned to the process with rank proc_id
function split_across_processors(arr₁, num_procs = nworkers(), proc_id = worker_rank())

    @assert(proc_id <= num_procs, "processor rank has to be less than or equal to the number of workers engaged")
    if num_procs == 1
        return arr₁
    end

    num_tasks = length(arr₁)

    num_tasks_per_process, num_tasks_leftover = div(num_tasks, num_procs), mod(num_tasks, num_procs)

    num_tasks_on_proc = num_tasks_per_process + (proc_id <= num_tasks_leftover ? 1 : 0)
    task_start = num_tasks_per_process*(proc_id - 1) + min(num_tasks_leftover + 1, proc_id)

    return Iterators.take(Iterators.drop(arr₁, task_start - 1), num_tasks_on_proc)
end

# Split the Cartesian product of two or more iterables across processors
function split_product_across_processors(arr₁, arr₂, num_procs::Integer = nworkers(), proc_id::Integer = worker_rank())

    # arr₁ varies faster than arr₂ in the product
    return split_across_processors(Iterators.product(arr₁, arr₂), num_procs, proc_id)
end

function split_product_across_processors(arrs_tuple, num_procs::Integer = nworkers(), proc_id::Integer = worker_rank())
    return split_across_processors(Iterators.product(arrs_tuple...), num_procs, proc_id)
end

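# Illustrative example: the product of 1:3 and 1:2 has 6 elements with the first
# iterator varying fastest; split across 2 processes, rank 1 receives the first half:
#   collect(split_product_across_processors(1:3, 1:2, 2, 1)) == [(1,1), (2,1), (3,1)]
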
# Return the rank of the processor that the mode (arr₁_value, arr₂_value) is
# assigned to when the product of arr₁ and arr₂ is split across num_procs processors.
# Assumes that arr₁ and arr₂ are sorted.
function get_processor_id_from_split_array(arr₁, arr₂, (arr₁_value, arr₂_value)::Tuple, num_procs)

    if (arr₁_value ∉ arr₁) || (arr₂_value ∉ arr₂)
        return nothing # invalid mode
    end

    num_tasks = length(arr₁)*length(arr₂)

    a1_match_index = searchsortedfirst(arr₁, arr₁_value)
    a2_match_index = searchsortedfirst(arr₂, arr₂_value)

    num_tasks_per_process, num_tasks_leftover = div(num_tasks, num_procs), mod(num_tasks, num_procs)

    proc_id = 1
    num_tasks_on_proc = num_tasks_per_process + (proc_id <= num_tasks_leftover ? 1 : 0)
    total_tasks_till_proc_id = num_tasks_on_proc

    task_no = 0

    # Traverse the product in the same order as the split (arr₁ varies fastest),
    # advancing the processor rank as each processor's block of tasks is exhausted
    for (ind2, a2) in enumerate(arr₂), (ind1, a1) in enumerate(arr₁)

        task_no += 1
        if task_no > total_tasks_till_proc_id
            proc_id += 1
            num_tasks_on_proc = num_tasks_per_process + (proc_id <= num_tasks_leftover ? 1 : 0)
            total_tasks_till_proc_id += num_tasks_on_proc
        end

        if ind2 < a2_match_index
            continue
        end

        if (ind2 == a2_match_index) && (ind1 == a1_match_index)
            break
        end
    end

    return proc_id
end

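# Illustrative example: continuing the split of the product of 1:3 and 1:2 across
# 2 processes shown above, the mode (3,1) lies in the first block, so
#   get_processor_id_from_split_array(1:3, 1:2, (3,1), 2) == 1
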
function get_processor_range_from_split_array(arr₁, arr₂, modes_on_proc, num_procs)

    if isempty(modes_on_proc)
        return 0:-1 # empty range
    end

    tasks_arr = collect(modes_on_proc)
    proc_id_start = get_processor_id_from_split_array(arr₁, arr₂, first(tasks_arr), num_procs)
    proc_id_end = get_processor_id_from_split_array(arr₁, arr₂, last(tasks_arr), num_procs)
    return proc_id_start:proc_id_end
end

function get_index_in_split_array(modes_on_proc, (arr₁_value, arr₂_value))
    if isnothing(modes_on_proc)
        return nothing
    end
    for (ind, (t1, t2)) in enumerate(modes_on_proc)
        if (t1 == arr₁_value) && (t2 == arr₂_value)
            return ind
        end
    end
    nothing
end

function procid_and_mode_index(arr₁, arr₂, (arr₁_value, arr₂_value), num_procs)
    proc_id_mode = get_processor_id_from_split_array(arr₁, arr₂, (arr₁_value, arr₂_value), num_procs)
    modes_in_procid_file = split_product_across_processors(arr₁, arr₂, num_procs, proc_id_mode)
    mode_index = get_index_in_split_array(modes_in_procid_file, (arr₁_value, arr₂_value))
    return proc_id_mode, mode_index
end

function mode_index_in_file(arr₁, arr₂, (arr₁_value, arr₂_value), num_procs, proc_id_mode)
    modes_in_procid_file = split_product_across_processors(arr₁, arr₂, num_procs, proc_id_mode)
    return get_index_in_split_array(modes_in_procid_file, (arr₁_value, arr₂_value))
end

function procid_allmodes(arr₁, arr₂, iter, num_procs = nworkers_active(arr₁, arr₂))
    procid = zeros(Int64, length(iter))
    for (ind, mode) in enumerate(iter)
        procid[ind] = get_processor_id_from_split_array(arr₁, arr₂, mode, num_procs)
    end
    return procid
end

# Workers that will actually be assigned tasks (at most one worker per task)
workers_active(arr) = workers()[1:min(length(arr), nworkers())]

workers_active(arr₁, arr₂) = workers_active(Iterators.product(arr₁, arr₂))

nworkers_active(args...) = length(workers_active(args...))

function minmax_from_split_array(iterable)
    arr₁_min, arr₂_min = first(iterable)
    arr₁_max, arr₂_max = arr₁_min, arr₂_min
    for (arr₁_value, arr₂_value) in iterable
        arr₁_min = min(arr₁_min, arr₁_value)
        arr₁_max = max(arr₁_max, arr₁_value)
        arr₂_min = min(arr₂_min, arr₂_value)
        arr₂_max = max(arr₂_max, arr₂_value)
    end
    return (arr₁_min = arr₁_min, arr₁_max = arr₁_max, arr₂_min = arr₂_min, arr₂_max = arr₂_max)
end

# Hostnames of the given worker processes, fetched asynchronously
function get_hostnames(procs_used = workers())
    hostnames = Vector{String}(undef, length(procs_used))
    @sync for (ind, p) in enumerate(procs_used)
        @async hostnames[ind] = @fetchfrom p Libc.gethostname()
    end
    return hostnames
end

get_nodes(hostnames::Vector{String}) = unique(hostnames)
get_nodes(procs_used::Vector{<:Integer} = workers()) = get_nodes(get_hostnames(procs_used))

# Number of worker processes on each node, as a Dict of hostname => count
function get_nprocs_node(hostnames::Vector{String})
    nodes = get_nodes(hostnames)
    return Dict(node => count(x -> x == node, hostnames) for node in nodes)
end

get_nprocs_node(procs_used::Vector{<:Integer} = workers()) = get_nprocs_node(get_hostnames(procs_used))

# Evaluate f on disjoint subsets of iterable on each active worker, and sum up
# the results, reducing first over workers on the same node and then across nodes
function pmapsum(f::Function, iterable, args...; kwargs...)

    procs_used = workers_active(iterable)
    hostnames = get_hostnames(procs_used)
    nodes = get_nodes(hostnames)
    # The first worker on each node carries out the intermediate reduction
    pid_rank0_on_node = [procs_used[findfirst(x -> x == node, hostnames)] for node in nodes]

    futures = pmap_onebatch_per_worker(f, iterable, args...; kwargs...)

    # Intermediate sum over processors on the same node
    node_sum_futures = Vector{Future}(undef, length(pid_rank0_on_node))
    @sync for (ind, p) in enumerate(pid_rank0_on_node)
        @async node_sum_futures[ind] = @spawnat p sum_at_node(futures, hostnames)
    end

    # Worker at which the final reduction takes place
    p = first(pid_rank0_on_node)

    # Final sum across all nodes
    S = @fetchfrom p sum(fetch(nf) for nf in node_sum_futures)

    return S
end

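# Example (hypothetical usage, assuming workers have been added with addprocs and
# this module has been loaded on all of them): summing i*j over all pairs (i, j),
#   pmapsum(modes -> sum(m[1]*m[2] for m in modes), Iterators.product(1:10, 1:10))
# returns 3025, with each worker summing only the modes assigned to it
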
# Evaluate f once on each active worker, passing it that worker's share of iterable,
# and return the resulting Futures without fetching them
function pmap_onebatch_per_worker(f::Function, iterable, args...; num_workers = nothing, kwargs...)

    procs_used = workers_active(iterable)
    if !isnothing(num_workers) && num_workers <= length(procs_used)
        procs_used = procs_used[1:num_workers]
    end
    num_workers = length(procs_used)

    futures = Vector{Future}(undef, num_workers)
    @sync for (rank, p) in enumerate(procs_used)
        @async begin
            iterable_on_proc = split_across_processors(iterable, num_workers, rank)
            futures[rank] = @spawnat p f(iterable_on_proc, args...; kwargs...)
        end
    end
    return futures
end

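# Example (hypothetical usage): launch one batch per worker and collect the results,
#   futures = pmap_onebatch_per_worker(collect, 1:100)
#   results = fetch.(futures)    # one Vector per worker, covering 1:100 between them
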
# Sum the results of the futures that were computed on the same node as this worker
function sum_at_node(futures::Vector{Future}, hostnames)
    myhost = hostnames[worker_rank()]
    futures_on_myhost = futures[hostnames .== myhost]
    return sum(fetch(f) for f in futures_on_myhost)
end

#############################################################################

export split_across_processors, split_product_across_processors,
get_processor_id_from_split_array,
procid_allmodes, mode_index_in_file,
get_processor_range_from_split_array, workers_active, worker_rank,
get_index_in_split_array, procid_and_mode_index, minmax_from_split_array,
pmapsum, sum_at_node, pmap_onebatch_per_worker,
get_nodes, get_hostnames, get_nprocs_node

end # module