diff --git a/examples/fluid/hydrostatic_water_column_2d.jl b/examples/fluid/hydrostatic_water_column_2d.jl
index 86d392c5b..080525b5f 100644
--- a/examples/fluid/hydrostatic_water_column_2d.jl
+++ b/examples/fluid/hydrostatic_water_column_2d.jl
@@ -1,12 +1,14 @@
 using TrixiParticles
 using OrdinaryDiffEq
+using P4estTypes, PointNeighbors
+using MPI; MPI.Init()
 
 # ==========================================================================================
 # ==== Resolution
-fluid_particle_spacing = 0.05
+fluid_particle_spacing = 0.3
 
 # Make sure that the kernel support of fluid particles at a boundary is always fully sampled
-boundary_layers = 3
+boundary_layers = 1
 
 # ==========================================================================================
 # ==== Experiment Setup
@@ -14,7 +16,7 @@ gravity = 9.81
 tspan = (0.0, 1.0)
 
 # Boundary geometry and initial fluid particle positions
-initial_fluid_size = (1.0, 0.9)
+initial_fluid_size = (1.0, 1.0)
 tank_size = (1.0, 1.0)
 
 fluid_density = 1000.0
@@ -41,9 +43,16 @@ system_acceleration = (0.0, -gravity)
 fluid_system = WeaklyCompressibleSPHSystem(tank.fluid, fluid_density_calculator,
                                            state_equation, smoothing_kernel,
                                            smoothing_length, viscosity=viscosity,
-                                           acceleration=system_acceleration,
+                                        #    acceleration=system_acceleration,
                                            source_terms=nothing)
 
+fluid_system2 = WeaklyCompressibleSPHSystem(tank.fluid, fluid_density_calculator,
+                                           state_equation, smoothing_kernel,
+                                           smoothing_length, viscosity=viscosity,
+                                        #    acceleration=system_acceleration,
+                                           source_terms=nothing)
+ghost_system = TrixiParticles.GhostSystem(fluid_system2)
+
 # ==========================================================================================
 # ==== Boundary
 
@@ -51,21 +60,30 @@ fluid_system = WeaklyCompressibleSPHSystem(tank.fluid, fluid_density_calculator,
 boundary_density_calculator = AdamiPressureExtrapolation()
 
 # This is to set wall viscosity with `trixi_include`
-viscosity_wall = nothing
-boundary_model = BoundaryModelDummyParticles(tank.boundary.density, tank.boundary.mass,
-                                             state_equation=state_equation,
-                                             boundary_density_calculator,
-                                             smoothing_kernel, smoothing_length,
-                                             viscosity=viscosity_wall)
+# viscosity_wall = nothing
+# boundary_model = BoundaryModelDummyParticles(tank.boundary.density, tank.boundary.mass,
+#                                              state_equation=state_equation,
+#                                              boundary_density_calculator,
+#                                              smoothing_kernel, smoothing_length,
+#                                              viscosity=viscosity_wall)
+k_solid = 0.2
+beta_solid = 1
+boundary_model = BoundaryModelMonaghanKajtar(k_solid, beta_solid,
+                                                   fluid_particle_spacing,
+                                                   tank.boundary.mass)
 boundary_system = BoundarySPHSystem(tank.boundary, boundary_model, movement=nothing)
 
 # ==========================================================================================
 # ==== Simulation
-semi = Semidiscretization(fluid_system, boundary_system)
+min_corner = minimum(tank.fluid.coordinates, dims = 2) .- 2 * smoothing_length .- 0.2
+max_corner = maximum(tank.fluid.coordinates, dims = 2) .+ 2 * smoothing_length .- 0.2
+
+semi = Semidiscretization(fluid_system, ghost_system,
+                          neighborhood_search=GridNeighborhoodSearch{2}(cell_list=PointNeighbors.P4estCellList(; min_corner, max_corner)))
 ode = semidiscretize(semi, tspan)
 
 info_callback = InfoCallback(interval=50)
-saving_callback = SolutionSavingCallback(dt=0.02, prefix="")
+saving_callback = SolutionSavingCallback(dt=0.02, prefix="$(MPI.Comm_rank(MPI.COMM_WORLD))")
 
 # This is to easily add a new callback with `trixi_include`
 extra_callback = nothing
diff --git a/src/TrixiParticles.jl b/src/TrixiParticles.jl
index d85096860..7cf4e01d9 100644
--- a/src/TrixiParticles.jl
+++ b/src/TrixiParticles.jl
@@ -16,6 +16,7 @@ using GPUArraysCore: AbstractGPUArray
 using JSON: JSON
 using KernelAbstractions: KernelAbstractions, @kernel, @index
 using LinearAlgebra: norm, dot, I, tr, inv, pinv, det
+using MPI: MPI
 using MuladdMacro: @muladd
 using Polyester: Polyester, @batch
 using Printf: @printf, @sprintf
diff --git a/src/general/general.jl b/src/general/general.jl
index dfd709861..a8f4f5d84 100644
--- a/src/general/general.jl
+++ b/src/general/general.jl
@@ -9,3 +9,4 @@ include("buffer.jl")
 include("interpolation.jl")
 include("custom_quantities.jl")
 include("neighborhood_search.jl")
+include("ghost_system.jl")
diff --git a/src/general/ghost_system.jl b/src/general/ghost_system.jl
new file mode 100644
index 000000000..3970b9b24
--- /dev/null
+++ b/src/general/ghost_system.jl
@@ -0,0 +1,173 @@
+struct GhostSystem{S, NDIMS, IC, U, V} <: System{NDIMS, IC}
+    system::S
+    v::V
+    u::U
+    buffer::Nothing
+
+    function GhostSystem(system)
+        v = zeros(eltype(system), v_nvariables(system), nparticles(system))
+        u = zeros(eltype(system), u_nvariables(system), nparticles(system))
+        return new{typeof(system), ndims(system),
+                   typeof(system.initial_condition),
+                   typeof(v), typeof(u)}(system, v, u, nothing)
+    end
+end
+
+vtkname(system::GhostSystem) = "ghost"
+timer_name(::GhostSystem) = "ghost"
+
+@inline nparticles(system::GhostSystem) = nparticles(system.system)
+@inline Base.eltype(system::GhostSystem) = eltype(system.system)
+
+@inline u_nvariables(system::GhostSystem) = 0
+@inline v_nvariables(system::GhostSystem) = 0
+
+@inline compact_support(system, neighbor::GhostSystem) = compact_support(system, neighbor.system)
+@inline compact_support(system::GhostSystem, neighbor) = compact_support(system.system, neighbor)
+@inline compact_support(system::GhostSystem, neighbor::GhostSystem) = compact_support(system.system, neighbor.system)
+
+@inline initial_coordinates(system::GhostSystem) = initial_coordinates(system.system)
+@inline current_coordinates(u, system::GhostSystem) = current_coordinates(system.u, system.system)
+
+function write_u0!(u0, system::GhostSystem)
+    return u0
+end
+
+function write_v0!(v0, system::GhostSystem)
+    return v0
+end
+
+function partition(system::GhostSystem, neighborhood_search)
+    # TODO variable size
+    keep = trues(nparticles(system))
+    for particle in eachparticle(system)
+        cell = PointNeighbors.cell_coords(initial_coords(system, particle), neighborhood_search)
+        mpi_neighbors = neighborhood_search.cell_list.neighbor_cells[2]
+        # length of mpi_neighbors is the number of mirror cells. Everything after that is ghost.
+        if neighborhood_search.cell_list.cell_indices[cell...] <= length(mpi_neighbors)
+            # Remove particle from this rank
+            keep[particle] = false
+        end
+    end
+
+    return GhostSystem(keep_particles(system.system, keep))
+end
+
+function copy_neighborhood_search_ghost(nhs, search_radius, n_points)
+    (; periodic_box) = nhs
+
+    cell_list = copy_cell_list_ghost(nhs.cell_list, search_radius, periodic_box)
+
+    return GridNeighborhoodSearch{ndims(nhs)}(; search_radius, n_points, periodic_box,
+                                              cell_list,
+                                              update_strategy = nhs.update_strategy)
+end
+
+function copy_cell_list_ghost(cell_list, search_radius, periodic_box)
+    (; min_corner, max_corner) = cell_list
+
+    return PointNeighbors.P4estCellList(; min_corner, max_corner, search_radius,
+                                        backend = typeof(cell_list.cells), ghost=true)
+end
+
+function create_neighborhood_search(neighborhood_search, system, neighbor::GhostSystem)
+    return copy_neighborhood_search_ghost(neighborhood_search, compact_support(system, neighbor),
+                                    nparticles(neighbor))
+end
+
+function update_nhs!(neighborhood_search,
+                     system, neighbor::GhostSystem,
+                     u_system, u_neighbor)
+end
+
+function update_nhs!(neighborhood_search,
+                     system::GhostSystem, neighbor,
+                     u_system, u_neighbor)
+end
+
+function update_nhs!(neighborhood_search,
+                     system::GhostSystem, neighbor::GhostSystem,
+                     u_system, u_neighbor)
+end
+
+# function mpi_communication1!(system::GhostSystem, v, u, v_ode, u_ode, semi, t)
+#     # Receive data from other ranks
+#     return system
+# end
+
+function mpi_communication3!(system::GhostSystem, v, u, v_ode, u_ode, semi, t)
+    # TODO Receive only density and pressure from other ranks
+    # and move the rest to `mpi_communication1!`.
+    n_particles_from_rank = zeros(Int, MPI.Comm_size(MPI.COMM_WORLD))
+    for source in 0:MPI.Comm_size(MPI.COMM_WORLD) - 1
+        buffer = view(n_particles_from_rank, source + 1)
+        MPI.Recv!(buffer, MPI.COMM_WORLD; source=source, tag=0)
+    end
+
+    @info "" n_particles_from_rank
+    total_particles = sum(n_particles_from_rank)
+
+    requests = Vector{MPI.Request}(undef, 3 * MPI.Comm_size(MPI.COMM_WORLD))
+
+    coordinates = zeros(ndims(system), total_particles)
+    for source in 0:MPI.Comm_size(MPI.COMM_WORLD) - 1
+        buffer = view(coordinates, :, (1 + sum(n_particles_from_rank[1:source])):total_particles)
+        # requests[source + 1] = MPI.Irecv!(buffer, MPI.COMM_WORLD; source=source, tag=1)
+        MPI.Recv!(buffer, MPI.COMM_WORLD; source=source, tag=1)
+    end
+
+    # Receive density and pressure from other ranks
+    density = zeros(total_particles)
+    for source in 0:MPI.Comm_size(MPI.COMM_WORLD) - 1
+        buffer = view(density, (1 + sum(n_particles_from_rank[1:source])):total_particles)
+        # requests[source + MPI.Comm_size(MPI.COMM_WORLD) + 1] = MPI.Irecv!(buffer, MPI.COMM_WORLD; source=source, tag=2)
+        MPI.Recv!(buffer, MPI.COMM_WORLD; source=source, tag=2)
+    end
+
+    pressure = zeros(total_particles)
+    for source in 0:MPI.Comm_size(MPI.COMM_WORLD) - 1
+        buffer = view(pressure, (1 + sum(n_particles_from_rank[1:source])):total_particles)
+        # requests[source + 2 * MPI.Comm_size(MPI.COMM_WORLD) + 1] = MPI.Irecv!(buffer, MPI.COMM_WORLD; source=source, tag=3)
+        MPI.Recv!(buffer, MPI.COMM_WORLD; source=source, tag=3)
+    end
+
+    # MPI.Waitall(requests)
+
+    return system
+end
+
+function update_quantities!(system::GhostSystem, v, u,
+                            v_ode, u_ode, semi, t)
+    return system
+end
+
+function update_pressure!(system::GhostSystem, v, u, v_ode, u_ode, semi, t)
+    return system
+end
+
+function interact!(dv, v_particle_system, u_particle_system,
+                   v_neighbor_system, u_neighbor_system, neighborhood_search,
+                   particle_system::GhostSystem,
+                   neighbor_system)
+    return dv
+end
+
+function interact!(dv, v_particle_system, u_particle_system,
+                   v_neighbor_system, u_neighbor_system, neighborhood_search,
+                   particle_system::GhostSystem,
+                   neighbor_system::GhostSystem)
+    return dv
+end
+
+function interact!(dv, v_particle_system, u_particle_system,
+                   v_neighbor_system, u_neighbor_system, neighborhood_search,
+                   particle_system,
+                   neighbor_system::GhostSystem)
+    interact!(dv, v_particle_system, u_particle_system,
+              v_neighbor_system, u_neighbor_system, neighborhood_search,
+              particle_system, neighbor_system.system)
+
+    return dv
+end
+
+@inline add_velocity!(du, v, particle, system::GhostSystem) = du
diff --git a/src/general/initial_condition.jl b/src/general/initial_condition.jl
index 3f9162767..8ca2d6efc 100644
--- a/src/general/initial_condition.jl
+++ b/src/general/initial_condition.jl
@@ -318,3 +318,15 @@ function find_too_close_particles(coords1, coords2, max_distance)
 
     return result
 end
+
+function keep_particles(initial_condition, keep)
+    NDIMS = ndims(initial_condition)
+    coordinates = initial_condition.coordinates[:, keep]
+    velocity = initial_condition.velocity[:, keep]
+    mass = initial_condition.mass[keep]
+    density = initial_condition.density[keep]
+    pressure = initial_condition.pressure[keep]
+
+    return InitialCondition{NDIMS}(coordinates, velocity, mass, density, pressure,
+                                       initial_condition.particle_spacing)
+end
diff --git a/src/general/semidiscretization.jl b/src/general/semidiscretization.jl
index 600d573d5..880067f46 100644
--- a/src/general/semidiscretization.jl
+++ b/src/general/semidiscretization.jl
@@ -73,6 +73,20 @@ function Semidiscretization(systems...;
     # Other checks might be added here later.
     check_configuration(systems)
 
+    # Create a tuple of n neighborhood searches for each of the n systems.
+    # We will need one neighborhood search for each pair of systems.
+    searches = Tuple(Tuple(create_neighborhood_search(neighborhood_search,
+                                                      system, neighbor)
+                           for neighbor in systems)
+                     for system in systems)
+
+    systems = partition(systems, searches)
+
+    searches = Tuple(Tuple(create_neighborhood_search(neighborhood_search,
+                                                      system, neighbor)
+                           for neighbor in systems)
+                     for system in systems)
+
     sizes_u = [u_nvariables(system) * n_moving_particles(system)
                for system in systems]
     ranges_u = Tuple((sum(sizes_u[1:(i - 1)]) + 1):sum(sizes_u[1:i])
@@ -82,13 +96,6 @@ function Semidiscretization(systems...;
     ranges_v = Tuple((sum(sizes_v[1:(i - 1)]) + 1):sum(sizes_v[1:i])
                      for i in eachindex(sizes_v))
 
-    # Create a tuple of n neighborhood searches for each of the n systems.
-    # We will need one neighborhood search for each pair of systems.
-    searches = Tuple(Tuple(create_neighborhood_search(neighborhood_search,
-                                                      system, neighbor)
-                           for neighbor in systems)
-                     for system in systems)
-
     return Semidiscretization(systems, ranges_u, ranges_v, searches)
 end
 
@@ -178,7 +185,7 @@ end
 @inline function compact_support(system, model::BoundaryModelMonaghanKajtar,
                                  neighbor::BoundarySPHSystem)
     # This NHS is never used
-    return 0.0
+    return 1.0
 end
 
 @inline function compact_support(system, model::BoundaryModelDummyParticles, neighbor)
@@ -206,10 +213,14 @@ end
     return neighborhood_searches[system_index][neighbor_index]
 end
 
-@inline function system_indices(system, semi)
+@inline function system_indices(system, semi::Semidiscretization)
+    system_indices(system, semi.systems)
+end
+
+@inline function system_indices(system, systems)
     # Note that this takes only about 5 ns, while mapping systems to indices with a `Dict`
     # is ~30x slower because `hash(::System)` is very slow.
-    index = findfirst(==(system), semi.systems)
+    index = findfirst(==(system), systems)
 
     if isnothing(index)
         throw(ArgumentError("system is not in the semidiscretization"))
@@ -472,6 +483,16 @@ function update_systems_and_nhs(v_ode, u_ode, semi, t; update_from_callback=fals
     # Update NHS
     @trixi_timeit timer() "update nhs" update_nhs!(semi, u_ode)
 
+    # foreach_system(semi) do system
+    #     v = wrap_v(v_ode, system, semi)
+    #     u = wrap_u(u_ode, system, semi)
+
+    #     mpi_communication1!(system, v, u, v_ode, u_ode, semi, t)
+    # end
+
+    # TODO update NHS for ghost systems
+    # @trixi_timeit timer() "update nhs" update_nhs!(semi, u_ode)
+
     # Second update step.
     # This is used to calculate density and pressure of the fluid systems
     # before updating the boundary systems,
@@ -483,6 +504,8 @@ function update_systems_and_nhs(v_ode, u_ode, semi, t; update_from_callback=fals
         update_quantities!(system, v, u, v_ode, u_ode, semi, t)
     end
 
+    # TODO MPI communication 2 if correction is used
+
     # Perform correction and pressure calculation
     foreach_system(semi) do system
         v = wrap_v(v_ode, system, semi)
@@ -491,6 +514,13 @@ function update_systems_and_nhs(v_ode, u_ode, semi, t; update_from_callback=fals
         update_pressure!(system, v, u, v_ode, u_ode, semi, t)
     end
 
+    foreach_system(semi) do system
+        v = wrap_v(v_ode, system, semi)
+        u = wrap_u(u_ode, system, semi)
+
+        mpi_communication3!(system, v, u, v_ode, u_ode, semi, t)
+    end
+
     # Final update step for all remaining systems
     foreach_system(semi) do system
         v = wrap_v(v_ode, system, semi)
@@ -817,6 +847,12 @@ function update!(neighborhood_search, system::GPUSystem, x, y; points_moving=(tr
                            parallelization_backend=KernelAbstractions.get_backend(system))
 end
 
+function partition(systems, searches)
+    return map(systems) do system
+        return partition(system, searches[system_indices(system, systems)][system_indices(system, systems)])
+    end
+end
+
 function check_configuration(systems)
     foreach_system(systems) do system
         check_configuration(system, systems)
diff --git a/src/general/system.jl b/src/general/system.jl
index 48d556eba..8c5178cfe 100644
--- a/src/general/system.jl
+++ b/src/general/system.jl
@@ -151,3 +151,16 @@ end
 
 # Only for systems requiring a mandatory callback
 reset_callback_flag!(system) = system
+
+function partition(system::System, neighborhood_search)
+    keep = trues(nparticles(system))
+    for particle in eachparticle(system)
+        cell = PointNeighbors.cell_coords(initial_coords(system, particle), neighborhood_search)
+        if neighborhood_search.cell_list.cell_indices[cell...] <= 0
+            # Remove particle from this rank
+            keep[particle] = false
+        end
+    end
+
+    return keep_particles(system, keep)
+end
diff --git a/src/schemes/fluid/weakly_compressible_sph/rhs.jl b/src/schemes/fluid/weakly_compressible_sph/rhs.jl
index 0fe58ab21..14079c1a5 100644
--- a/src/schemes/fluid/weakly_compressible_sph/rhs.jl
+++ b/src/schemes/fluid/weakly_compressible_sph/rhs.jl
@@ -97,6 +97,17 @@ function interact!(dv, v_particle_system, u_particle_system,
     return dv
 end
 
+function interact!(dv, v_particle_system, u_particle_system,
+                   v_neighbor_system, u_neighbor_system, neighborhood_search,
+                   particle_system::WeaklyCompressibleSPHSystem,
+                   neighbor_system::GhostSystem)
+    interact!(dv, v_particle_system, u_particle_system,
+              neighbor_system.v, neighbor_system.u, neighborhood_search,
+              particle_system, neighbor_system.system)
+
+    return dv
+end
+
 # With 'SummationDensity', density is calculated in wcsph/system.jl:compute_density!
 @inline function continuity_equation!(dv, density_calculator::SummationDensity,
                                       v_particle_system, v_neighbor_system,
diff --git a/src/schemes/fluid/weakly_compressible_sph/system.jl b/src/schemes/fluid/weakly_compressible_sph/system.jl
index 6d66ba06a..b803114e6 100644
--- a/src/schemes/fluid/weakly_compressible_sph/system.jl
+++ b/src/schemes/fluid/weakly_compressible_sph/system.jl
@@ -218,6 +218,12 @@ end
 
 @inline system_sound_speed(system::WeaklyCompressibleSPHSystem) = system.state_equation.sound_speed
 
+# function mpi_communication1!(system::WeaklyCompressibleSPHSystem, v, u,
+#                              v_ode, u_ode, semi, t)
+#     # Send data (?) to other ranks
+#     return system
+# end
+
 function update_quantities!(system::WeaklyCompressibleSPHSystem, v, u,
                             v_ode, u_ode, semi, t)
     (; density_calculator, density_diffusion, correction) = system
@@ -247,6 +253,52 @@ function update_pressure!(system::WeaklyCompressibleSPHSystem, v, u, v_ode, u_od
     return system
 end
 
+function mpi_communication3!(system::WeaklyCompressibleSPHSystem, v, u,
+                             v_ode, u_ode, semi, t)
+    # TODO Send only density and pressure from other ranks
+    # and move the rest to `mpi_communication1!`.
+    nhs = get_neighborhood_search(system, semi)
+    _, mpi_neighbors = nhs.cell_list.neighbor_cells
+
+    particles_for_rank = [Int[] for _ in 1:MPI.Comm_size(MPI.COMM_WORLD)]
+    for particle in eachparticle(system)
+        cell = PointNeighbors.cell_coords(current_coords(u, system, particle), nhs)
+        for (rank, _) in mpi_neighbors[nhs.cell_list.cell_indices[cell...]]
+            if !(particle in particles_for_rank[rank + 1])
+                push!(particles_for_rank[rank + 1], particle)
+            end
+        end
+    end
+
+    @info "" particles_for_rank
+
+    for dest in 0:MPI.Comm_size(MPI.COMM_WORLD) - 1
+        MPI.Isend(length(particles_for_rank[dest + 1]), MPI.COMM_WORLD; dest=dest, tag=0)
+    end
+
+    requests = Vector{MPI.Request}(undef, 3 * MPI.Comm_size(MPI.COMM_WORLD))
+
+    for dest in 0:MPI.Comm_size(MPI.COMM_WORLD) - 1
+        coordinates = [current_coords(u, system, particle) for particle in particles_for_rank[dest + 1]]
+        requests[dest + 1] = MPI.Isend(coordinates, MPI.COMM_WORLD; dest=dest, tag=1)
+    end
+
+    # Send density and pressure to other ranks
+    for dest in 0:MPI.Comm_size(MPI.COMM_WORLD) - 1
+        density = [particle_density(v, system, particle) for particle in particles_for_rank[dest + 1]]
+        requests[dest + MPI.Comm_size(MPI.COMM_WORLD) + 1] = MPI.Isend(density, MPI.COMM_WORLD; dest=dest, tag=2)
+    end
+
+    for dest in 0:MPI.Comm_size(MPI.COMM_WORLD) - 1
+        pressure = [particle_pressure(v, system, particle) for particle in particles_for_rank[dest + 1]]
+        requests[dest + 2 * MPI.Comm_size(MPI.COMM_WORLD) + 1] = MPI.Isend(pressure, MPI.COMM_WORLD; dest=dest, tag=3)
+    end
+
+    # MPI.Waitall(requests)
+
+    return system
+end
+
 function kernel_correct_density!(system::WeaklyCompressibleSPHSystem, v, u, v_ode, u_ode,
                                  semi, correction, density_calculator)
     return system
@@ -393,3 +445,20 @@ end
 @inline function surface_tension_model(system)
     return nothing
 end
+
+function keep_particles(system::WeaklyCompressibleSPHSystem, keep)
+    (; initial_condition, density_calculator, state_equation,
+    smoothing_kernel, smoothing_length, pressure_acceleration_formulation,
+    viscosity, density_diffusion, acceleration, correction,
+    source_terms, surface_tension) = system
+
+    WeaklyCompressibleSPHSystem(keep_particles(initial_condition, keep),
+                                density_calculator, state_equation,
+                                smoothing_kernel, smoothing_length;
+                                pressure_acceleration=pressure_acceleration_formulation,
+                                # buffer_size=nothing,
+                                viscosity, density_diffusion,
+                                acceleration,
+                                correction, source_terms,
+                                surface_tension)
+end