Réimplémentation du programme DSSP en Python

pdb.py 3.7KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596
  1. # custom imports
  2. from atom import *
  3. import sys
  4. import pymol
  5. #import collections
  6. class PDBFile:
  7. def getContent(self, filename):
  8. with open(filename) as f:
  9. return(f.readlines())
  10. def getHeader(self):
  11. #Metadata = collections.namedtuple("Metadata", ["header", "compound", "source", "author"])
  12. Metadata = {}
  13. for line in self.rawLines:
  14. # no need to continue if meta are complete
  15. if(len(Metadata) <4):
  16. if(line[0:10] == "HEADER "):
  17. Metadata['header']=line
  18. elif(line[0:10] == "COMPND 2"):
  19. Metadata['compound']=line
  20. elif(line[0:10] == "SOURCE 2"):
  21. Metadata['source']=line
  22. elif(line[0:10] == "AUTHOR "):
  23. Metadata['author']=line
  24. else:
  25. # if meta are complete, stop parsing
  26. break
  27. return(Metadata)
  28. def getAtoms(self, filename):
  29. self.atoms = []
  30. self.residues = []
  31. temp_atoms = []
  32. count_h = 0
  33. for line in self.rawLines:
  34. if line.startswith("ATOM" or "HETATM"):
  35. if(line[76:78].strip()=="H"):
  36. count_h+=1
  37. atom = Atom(atom_id = int(line[6:11].strip()),
  38. atom_name = line[12:16].strip(),
  39. res_name = line[17:20].strip(),
  40. chain_id = line[21:22].strip(),
  41. res_seq_nb = int(line[22:26].strip()),
  42. coordinates = [float(line[30:38].strip()),
  43. float(line[38:46].strip()),
  44. float(line[46:54].strip()),
  45. ])
  46. self.atoms.append(atom)
  47. # get the current indice of atom
  48. i = self.atoms.index(atom)
  49. # if this is a brand new residue
  50. if(len(self.atoms)>1
  51. and atom.res_seq_nb != self.atoms[i-1].res_seq_nb):
  52. self.residues.append(Residue(temp_atoms))
  53. temp_atoms=[]
  54. temp_atoms.append(atom)
  55. # last residue
  56. self.residues.append(Residue(temp_atoms))
  57. # hydrogens should represent in average 50% of total atoms... We use 30% threshold...
  58. if(count_h/len(temp_atoms)<0.30):
  59. #if(output_pdb==None):
  60. print("Need to add hydrogens ! If you want the modified PDB file, please use the -o output.pdb argument")
  61. self.add_hydrogens(filename)
  62. def check_hydrogens(self, atoms):
  63. print("ENTER CHECK HYDROGEN")
  64. return True
  65. def add_hydrogens(self, filename, output_pdb=None):
  66. pymol.finish_launching(['pymol', '-qc'])
  67. pymol.cmd.load(filename)
  68. pymol.cmd.select("nitrogens",'name n')
  69. pymol.cmd.h_add("nitrogens")
  70. pymol.stored.pos = []
  71. pymol.cmd.iterate_state(1, "hydrogens", 'stored.pos.append([name,resi,x,y,z])')
  72. if(output_pdb!=None):
  73. pymol.cmd.save(output_file)
  74. return(pymol.stored.pos)
  75. def __init__(self, filename, output_pdb=None):
  76. self.rawLines = self.getContent(filename)
  77. self.Metadata = self.getHeader()
  78. self.getAtoms(filename)
  79. # for elem in self.Metadata :
  80. # print(self.Metadata[elem], end="")
  81. if __name__ == "__main__":
  82. if(len(sys.argv)<2):
  83. print("Not enough arguments! Run with --help to learn more about proper"
  84. "call structure and parameters.")
  85. else:
  86. pdbFile = PDBFile(sys.argv[1])
  87. print(pdbFile.residues[15].atoms["C"].coord_x)
  88. print(pdbFile.add_hydrogens(sys.argv[1])[3])