Réimplémentation du programme DSSP en Python

pdb.py 3.5KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990
  1. # custom imports
  2. from atom import *
  3. import sys
  4. import pymol
  5. #import collections
  6. class PDBFile:
  7. def getContent(self, filename):
  8. with open(filename) as f:
  9. return(f.readlines())
  10. def getHeader(self):
  11. #Metadata = collections.namedtuple("Metadata", ["header", "compound", "source", "author"])
  12. Metadata = {}
  13. for line in self.rawLines:
  14. # no need to continue if meta are complete
  15. if(len(Metadata) <4):
  16. if(line[0:10] == "HEADER "):
  17. Metadata['header']=line
  18. elif(line[0:10] == "COMPND 2"):
  19. Metadata['compound']=line
  20. elif(line[0:10] == "SOURCE 2"):
  21. Metadata['source']=line
  22. elif(line[0:10] == "AUTHOR "):
  23. Metadata['author']=line
  24. else:
  25. # if meta are complete, stop parsing
  26. break
  27. return(Metadata)
  28. def getAtoms(self):
  29. self.atoms = []
  30. self.residues = []
  31. temp_atoms = []
  32. for line in self.rawLines:
  33. if line.startswith("ATOM" or "HETATM"):
  34. atom = Atom(atom_id = int(line[6:11].strip()),
  35. atom_name = line[12:16].strip(),
  36. res_name = line[17:20].strip(),
  37. chain_id = line[21:22].strip(),
  38. res_seq_nb = int(line[22:26].strip()),
  39. coordinates = [float(line[30:38].strip()),
  40. float(line[38:46].strip()),
  41. float(line[46:54].strip()),
  42. ])
  43. self.atoms.append(atom)
  44. # get the current indice of atom
  45. i = self.atoms.index(atom)
  46. # if this is a brand new residue
  47. if(len(self.atoms)>1
  48. and atom.res_seq_nb != self.atoms[i-1].res_seq_nb):
  49. self.residues.append(Residue(temp_atoms))
  50. temp_atoms=[]
  51. temp_atoms.append(atom)
  52. # last residue
  53. self.residues.append(Residue(temp_atoms))
  54. def check_hydrogens(self, atoms):
  55. return true
  56. def add_hydrogens(self, filename, output_pdb=None):
  57. pymol.cmd.load(filename)
  58. pymol.cmd.select("nitrogens", selection='name n')
  59. pymol.cmd.h_add("nitrogens")
  60. pymol.cmd.select('hydrogens',selection='name h')
  61. pymol.stored.pos = []
  62. pymol.cmd.iterate_state(1, 'hydrogens', 'stored.pos.append([name,resi,x,y,z])')
  63. if(output_pdb!=None):
  64. pymol.cmd.save(output_file)
  65. return(pymol.stored.pos)
  66. def __init__(self, filename, output_pdb=None):
  67. self.rawLines = self.getContent(filename)
  68. self.Metadata = self.getHeader()
  69. self.getAtoms()
  70. for elem in self.Metadata :
  71. print(self.Metadata[elem], end="")
  72. if(self.check_hydrogens(self.atoms)==False):
  73. if(output_pdb==None):
  74. print("Need to add hydrogens ! If you want the modified PDB file, please use the -o output.pdb argument")
  75. self.add_hydrogens(filename)
  76. if __name__ == "__main__":
  77. if(len(sys.argv)<2):
  78. print("Not enough arguments! Run with --help to learn more about proper"
  79. "call structure and parameters.")
  80. else:
  81. pdbFile = PDBFile(sys.argv[1])
  82. print(pdbFile.residues[15].atoms["C"].coord_x)
  83. print(pdbFile.add_hydrogens(sys.argv[1])[3])