Skip to content
Snippets Groups Projects
old_downstream_setup.sh 2.86 KiB
Newer Older
#!/bin/bash
#PBS -l walltime=01:00:00
#PBS -l ncpus=1,mem=2gb
#PBS -q uv2000
#PBS -N downstream_setup
#PBS -j oe


echo "PROJECT_ID = $PROJECT_ID"
echo "DATE = $DATE"
echo "BATCH = $BATCH"
DATE_BATCH=${DATE}_${BATCH}
echo "DATE_BATCH = ${DATE_BATCH}"


BASE=/scratch/u035/u035/shared/analysis/wes_pilot
SOURCE_DIR=/scratch/u035/u035/shared/analysis/wes_pilot/bcbio/final
PED_DIR=/scratch/u035/u035/shared/analysis/wes_pilot/params 


WORK_DIR=$BASE/${PROJECT_ID}
G2P_DIR=${WORK_DIR}/G2P
VASE_DIR=${WORK_DIR}/VASE 
COV_DIR=${WORK_DIR}/COV
DEC_DIR=${WORK_DIR}/DECIPHER
CNV_DIR=${WORK_DIR}/CNV
SCRIPTS_DIR=/home/u035/u035/shared/scripts
PYTHON2=/home/u035/u035/shared/software/bcbio/anaconda/envs/python2/bin/python2.7


# create the working dir and the required subfolders
mkdir ${WORK_DIR}
cd ${WORK_DIR}
mkdir PED
mkdir VCF
mkdir LOG
echo "Created WORK_DIR = ${WORK_DIR} for this batch and the required subfolders"


# create the folders needed for G2P
mkdir ${G2P_DIR}
cd ${G2P_DIR}
echo "Created ${G2P_DIR} for this batch"


# create the folders needed for VASE
cd ${WORK_DIR}
mkdir ${VASE_DIR}
cd ${VASE_DIR}
echo "Created ${VASE_DIR} for this batch"


# create the folders needed for the coverage analysis
cd ${WORK_DIR}
mkdir ${COV_DIR}
echo "Created ${COV_DIR} for this batch"


# create the DECIPHER folders
cd ${WORK_DIR}
mkdir ${DEC_DIR}
cd ${DEC_DIR}
mkdir IGV
echo "Created ${DEC_DIR} for this batch and the required subfolders"


# create the CNV folders
cd ${WORK_DIR}
mkdir ${CNV_DIR}
echo "Created ${CNV_DIR} for this batch"







### Copy the PED file per each family  ###
### format: <BATCH_ID>_<FAMILY_ID>.ped ###
###     and create the FAM_IDs file    ###

for FILE in ${PED_DIR}/${BATCH}_*.ped
do
    # copy the PED file
    cp $FILE ${WORK_DIR}/PED

#    # create the file with the family ids
#    filename="${FILE##*/}"
#    IFS='_|.' read -ra array_1 <<< "$filename"
#    echo "family id = ${array_1[1]}"
#    echo ${array_1[1]} >> ${WORK_DIR}/FAM_IDs.txt
done


######################################################################################
### generate the FAM_IDs.txt, PRO_IDs.txt and FAM_PRO.txt *only for trio* families ###
######################################################################################

time ${PYTHON2} ${SCRIPTS_DIR}/extract_trio_FAM_PRO_ID.py ${WORK_DIR}




echo "OK: Setup for PROJECT_ID = $PROJECT_ID (DATE_BATCH = ${DATE_BATCH}) successful"












######################################################

# LOG_DIR=$BASE/${PROJECT_ID}/logs
#mkdir ${LOG_DIR}
#echo "Created LOG_DIR = ${LOG_DIR} for this batch"

#cd $LOG_DIR
#echo "Created LOG_DIR = ${LOG_DIR} for this batch"


#cd $BASE
#mkdir $BASE/$PROJECT_ID




#source $CONFIG

## Change to the working directory
#cd $WORK_DIR/gvcfs

## Copy the GVCF files
#for file in `cat ../params/$BATCH.gvcfs.txt`
#do
#  cp $file* ./
#done

## Check the md5s
#for file in *.md5
#do
#  md5sum --check $file
#done