Generate multivec files from CistromeDB bigWig files.
conda activate cistrome-to-multivec-pipeline
# to generate multivec outputs
snakemake --cores 2 --config filetype=mv5
# or, to generate zarr outputs
snakemake --cores 2 --config filetype=zarr
# or, if running on the O2 cluster (replace my_username with your O2 username)
./ mv5 my_username
conda env create -f environment.yml
conda activate cistrome-to-multivec-pipeline
mkdir -p ~/.config/snakemake/cistrome-explorer
cp ./cluster-profile.yml ~/.config/snakemake/cistrome-explorer/config.yaml
# replace with your credentials
export AWS_ACCESS_KEY_ID="{my_access_key_id}"
export AWS_SECRET_ACCESS_KEY="{my_secret_access_key}"
export AWS_DEFAULT_REGION="us-east-1"
# replace with your O2 username details
# .../users/{first_letter_of_username}/{username}/cistrome-explorer/...
aws s3 sync /n/scratch3/users/m/mk596/cistrome-explorer/data/processed/ s3://higlass-server/CistromeDB/
The following information is outdated, because h5py does not yet work with the parallel version of HDF5 installed on the O2 cluster. In the meantime, we can parallelize by submitting many simultaneous snakemake jobs, one for each output bigwig file.
module load gcc/6.2.0
module load openmpi/3.1.0
module load hdf5/1.12.0
which mpicc
which h5cc # doesn't work for some reason - but the hdf5 dir is /n/app/hdf5/1.12.0.parallel
# CC="mpicc" HDF5_MPI="ON" HDF5_DIR=/n/app/hdf5/1.12.0.parallel pip install --no-binary=h5py h5py # doesn't work since pip h5py not compatible with 1.12.0
cd path/to/h5py-parent
# Clone h5py to get the latest code, which supports hdf5 v1.12.0 (that support is not yet available on pip).
git clone https://github.com/h5py/h5py.git
cd h5py
python setup.py configure --hdf5=/n/app/hdf5/1.12.0.parallel
python setup.py configure --mpi
python setup.py install
Download the hdf5 1.10.6 source code from the HDF Group website and extract the .tar.gz archive.
brew install openmpi
# Make a directory in which hdf5 can be installed.
mkdir -p ~/software/hdf5
brew info openmpi # Use this to find the CC value for the next line.
# In the downloaded hdf5-1.10.6 source directory:
CC=/usr/local/Cellar/open-mpi/4.0.3/bin/mpicc ./configure --enable-parallel --enable-shared --prefix=$HOME/software/hdf5
export NPROCS=3 # number of MPI processes used by the parallel tests in `make check`
make check
make install
cd path/to/h5py-parent
# Clone h5py to get the latest code, which supports hdf5 v1.12.0 (that support is not yet available on pip).
git clone https://github.com/h5py/h5py.git
cd h5py
export CC=/usr/local/Cellar/open-mpi/4.0.3/bin/mpicc
python setup.py configure --hdf5=$HOME/software/hdf5
python setup.py configure --mpi
python setup.py install
cd ..
>>> import h5py
>>> h5py.get_config().mpi # Should return True if MPI has been enabled