pre_dadimodo.sh0000775005165000003260000000562713120171171013441 0ustar thureauswing#!/bin/bash #Number of models generated by modeller NBmodels=5 #load modeller module only during batch scripts if [ $HOSTNAME == 'isei' ] then . /opt/modules/Modules/default/init/sh elif [ $HOSTNAME == 'idai' ] then . /usr/share/Modules/init/sh else echo echo !!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!! echo echo $HOSTNAME is unknown echo echo !!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!! echo echo exit 0 fi module load modeller if [ $# == 0 ] then echo echo !!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!! echo echo NO ARGUMENTS FOUND echo "usage: ./pre_dadimodo.sh " echo OR echo "usage: ./pre_dadimodo.sh " echo echo !!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!! echo echo exit 0 fi EXEPATH="python /home/experiences/swing/bin/PreDadimodo" EXEPATH="python /home/experiences/swing/thureau/Scripts/PreDadimodo" SEQALIFILE=$1 if [ ! -f $SEQALIFILE ] then echo echo !!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!! echo echo $SEQALIFILE not exist echo "usage: ./pre_dadimodo.sh " echo OR echo "usage: ./pre_dadimodo.sh " echo echo !!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!! echo echo exit 0 fi shift #shift the argument (remove the first one) nbpdbfiles=$# pdbfileS=$* #echo $nbpdbfiles #echo $pdbfileS for pdbfile in $pdbfileS do if [ ! -f $pdbfile ] then echo !!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!! echo echo $pdbfile not exist echo "usage: ./pre_dadimodo.sh " echo OR echo "usage: ./pre_dadimodo.sh " echo echo !!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!! echo echo exit 0 fi done #echo $EXEPATH"/pre-dadi.py" $SEQALIFILE $pdbfileS $EXEPATH"/pre-dadi.py" $SEQALIFILE $pdbfileS $NBmodels module unload modeller echo !!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!! echo echo "Modeller renumerate chain and residus " echo "The first chain will be A and the first residu will be 1" echo "If only one chain was present, there is no chain in the Output" echo "to add A as chain use the command:" echo "sed -e '/ATOM/ {s/^\(.\{21\}\).\{1\}\(.*\)/\1A\2/}' -e '/TER/ {s/^\(.\{21\}\).\{1\}\(.*\)/\1A\2/}' input.pdb > output.pdb" echo echo !!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!! pre-dadi.py0000775005165000003260000001202013216430644012510 0ustar thureauswing#!/usr/bin/env python2.7 # -*- coding: utf-8 -*- import sys import os from modeller import * from modeller.automodel import * # Load the automodel class filename, file_extension = os.path.splitext(sys.argv[1]) nbmodels = 1 #default value if file_extension == ".fasta": #First case: will generate a pdb file if pdb sequence identical to fasta sequence fastafile = sys.argv[1] #fichier contenant la sequence complete du systeme rootfasta = filename #save the root name without extension #nbmodels = int(sys.argv[2]) #number of models to generate nbpdbfiles = len(sys.argv)-3 #we suppose that all the other arguments are pdb files ... !!! Not safe !!! code = ['None']*nbpdbfiles #generation of list for i in range(0,nbpdbfiles) : print sys.argv[i+2] code[i]=sys.argv[i+2][:sys.argv[i+2].rindex('.')] #save the root name without extension #sert comme id pour le fichier structure alifile = rootfasta+'.ali' #fichier out de l'alignement # Get the sequence of the PDB file, and write to an alignment file env = environ() env.io.atom_files_directory = ['.', '../atom_files'] env.io.hetatm = True #take into account hetero atoms aln = alignment(env, file=fastafile, alignment_format='FASTA', align_codes = 'all') #cree l'objet aln et y insert la sequence complete for i in range(0,nbpdbfiles) : #add pdb sequence (one by one) to the aln object mod1 = model(env, file=code[i]) # model est la partie de la structure connue du systeme aln.append_model(mod1, align_codes=code[i]) #model est ajoute comme structure a aln aln.salign() #genration d'un alignement automatique (pas 100% fiable) aln.write(file=alifile, alignment_format='PIR') #ecriture du ficher d'alignement s1 = aln[0] #recuperation du code de la sequence fasta s2 = aln[1] #recuperation du code de la sequence du premier fichier pdb en input if (s1.get_num_equiv(s2) == s1.get_num_equiv(s1)) & (s1.get_sequence_identity(s2) == 100 ) & (nbpdbfiles == 1): # same number of residus (no gap) 100% of identity only 1 pdb file as input a = automodel(env, alnfile = alifile, knowns = s2.code, sequence = aln[0].code) #mise en place de l'alignement structural a.starting_model = 1 a.ending_model = nbmodels #(ending_model - starting_model +1) indique le nombre de modeles a creer a.make() #lance l'alignement structural => creation des fichiers pdb complet count=0 for file in os.listdir("."): #To rename the output pdf file if file.endswith("pdb") & file.startswith(aln[0].code): count=count+1 os.rename(file, aln[0].code+"-pred_"+str(count)+".pdb") else: print print print "********************" print "you need to check / modify "+alifile+" file to validate the automatic alignment and then " print "run pre_dadimodo.sh "+alifile print "********************" print print ########################################################################################################### elif file_extension == ".ali": #second and third case: will generate a pdb file based on an alignment if len(sys.argv) != 3: print "usage : pre_dadimodo.sh " sys.exit(1) alifile = sys.argv[1] nbmodels = int(sys.argv[2]) env = environ() env.io.atom_files_directory = ['.', '../atom_files'] env.io.hetatm = True #take into account hetero atoms aln = alignment(env, file=alifile, align_codes='all') list_struct=list() for struct in aln[1:]: list_struct.append(struct.code) a = automodel(env, alnfile = alifile, knowns = list_struct, sequence = aln[0].code) a.starting_model= 1 a.ending_model = 5 # Very thorough VTFM optimization: #a.library_schedule = autosched.slow #a.max_var_iterations = 300 # Thorough MD optimization: a.md_level = refine.slow # a.md_level = refine.very_fast # Repeat the whole cycle 2 times and do not stop unless obj.func. > 1E6 #a.repeat_optimization = 2 #a.max_molpdf = 1e6 a.make() count=0 for file in os.listdir("."): #To rename the output pdb file if file.endswith("pdb") & file.startswith(aln[0].code): count=count+1 os.rename(file, aln[0].code+"_p-"+str(count)+".pdb") else: print print print "**************** WRONG extension !! **************************" print "* Need a .fasta OR .ali as 1st Argument *" print "* pre_dadimodo.sh *" print "* OR *" print "* pre_dadimodo.sh *" print "**************** WRONG extension !! **************************" print print sys.exit(1)