Printing protein amino acids histograms
A program that prints a histogram of the occurrences of various amino acids in a protein. An example command would be:
prompt> python reshist.py input.pdb
Code
Download code
#!/usr/bin/env python
# (C) 2022 Cadence Design Systems, Inc. (Cadence)
# All rights reserved.
# TERMS FOR USE OF SAMPLE CODE The software below ("Sample Code") is
# provided to current licensees or subscribers of Cadence products or
# SaaS offerings (each a "Customer").
# Customer is hereby permitted to use, copy, and modify the Sample Code,
# subject to these terms. Cadence claims no rights to Customer's
# modifications. Modification of Sample Code is at Customer's sole and
# exclusive risk. Sample Code may require Customer to have a then
# current license or subscription to the applicable Cadence offering.
# THE SAMPLE CODE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND,
# EXPRESS OR IMPLIED. OPENEYE DISCLAIMS ALL WARRANTIES, INCLUDING, BUT
# NOT LIMITED TO, WARRANTIES OF MERCHANTABILITY, FITNESS FOR A
# PARTICULAR PURPOSE AND NONINFRINGEMENT. In no event shall Cadence be
# liable for any damages or liability in connection with the Sample Code
# or its use.
#############################################################################
# Print a histogram of the occurrences of various amino acids in a protein
#############################################################################
import sys
from openeye import oechem
def ResHist(ifs):
nrmol = 0
mol = oechem.OEGraphMol()
while oechem.OEReadMolecule(ifs, mol):
nrmol += 1
print("==============================")
print("Molecule: %d Title: %s" % (nrmol, mol.GetTitle()))
nrres = 0
resmap = {}
if not oechem.OEHasResidues(mol):
oechem.OEPerceiveResidues(mol, oechem.OEPreserveResInfo_All)
hv = oechem.OEHierView(mol)
for res in hv.GetResidues():
nrres += 1
name = res.GetOEResidue().GetName()
if name in resmap:
resmap[name] += 1
else:
resmap[name] = 1
sortedres = sorted(resmap.keys())
for name in sortedres:
percent = 100.0*float(resmap[name])/float(nrres)
print("%3s %3d %4.1f %%" % (name, resmap[name], percent))
if __name__ == "__main__":
if len(sys.argv) != 2:
oechem.OEThrow.Usage("reshist.py <infile>")
ifs = oechem.oemolistream()
if not ifs.open(sys.argv[1]):
oechem.OEThrow.Fatal("Unable to open %s for reading" % sys.argv[1])
ResHist(ifs)
See also
OEPerceiveResiduesfunctionOEHierView class
OEHierResidue class
OEHierResidue.GetOEResiduemethod