annotate mayachemtool/mayachemtools/lib/PDBFileUtil.pm @ 0:68300206e90d draft default tip

Uploaded
author deepakjadmin
date Thu, 05 Nov 2015 02:41:30 -0500
parents
children
Ignore whitespace changes - Everywhere: Within whitespace: At end of lines:
rev   line source
0
68300206e90d Uploaded
deepakjadmin
parents:
diff changeset
1 package PDBFileUtil;
68300206e90d Uploaded
deepakjadmin
parents:
diff changeset
2 #
68300206e90d Uploaded
deepakjadmin
parents:
diff changeset
3 # $RCSfile: PDBFileUtil.pm,v $
68300206e90d Uploaded
deepakjadmin
parents:
diff changeset
4 # $Date: 2015/02/28 20:47:18 $
68300206e90d Uploaded
deepakjadmin
parents:
diff changeset
5 # $Revision: 1.36 $
68300206e90d Uploaded
deepakjadmin
parents:
diff changeset
6 #
68300206e90d Uploaded
deepakjadmin
parents:
diff changeset
7 # Author: Manish Sud <msud@san.rr.com>
68300206e90d Uploaded
deepakjadmin
parents:
diff changeset
8 #
68300206e90d Uploaded
deepakjadmin
parents:
diff changeset
9 # Copyright (C) 2015 Manish Sud. All rights reserved.
68300206e90d Uploaded
deepakjadmin
parents:
diff changeset
10 #
68300206e90d Uploaded
deepakjadmin
parents:
diff changeset
11 # This file is part of MayaChemTools.
68300206e90d Uploaded
deepakjadmin
parents:
diff changeset
12 #
68300206e90d Uploaded
deepakjadmin
parents:
diff changeset
13 # MayaChemTools is free software; you can redistribute it and/or modify it under
68300206e90d Uploaded
deepakjadmin
parents:
diff changeset
14 # the terms of the GNU Lesser General Public License as published by the Free
68300206e90d Uploaded
deepakjadmin
parents:
diff changeset
15 # Software Foundation; either version 3 of the License, or (at your option) any
68300206e90d Uploaded
deepakjadmin
parents:
diff changeset
16 # later version.
68300206e90d Uploaded
deepakjadmin
parents:
diff changeset
17 #
68300206e90d Uploaded
deepakjadmin
parents:
diff changeset
18 # MayaChemTools is distributed in the hope that it will be useful, but without
68300206e90d Uploaded
deepakjadmin
parents:
diff changeset
19 # any warranty; without even the implied warranty of merchantability of fitness
68300206e90d Uploaded
deepakjadmin
parents:
diff changeset
20 # for a particular purpose. See the GNU Lesser General Public License for more
68300206e90d Uploaded
deepakjadmin
parents:
diff changeset
21 # details.
68300206e90d Uploaded
deepakjadmin
parents:
diff changeset
22 #
68300206e90d Uploaded
deepakjadmin
parents:
diff changeset
23 # You should have received a copy of the GNU Lesser General Public License
68300206e90d Uploaded
deepakjadmin
parents:
diff changeset
24 # along with MayaChemTools; if not, see <http://www.gnu.org/licenses/> or
68300206e90d Uploaded
deepakjadmin
parents:
diff changeset
25 # write to the Free Software Foundation Inc., 59 Temple Place, Suite 330,
68300206e90d Uploaded
deepakjadmin
parents:
diff changeset
26 # Boston, MA, 02111-1307, USA.
68300206e90d Uploaded
deepakjadmin
parents:
diff changeset
27 #
68300206e90d Uploaded
deepakjadmin
parents:
diff changeset
28
68300206e90d Uploaded
deepakjadmin
parents:
diff changeset
29 use strict;
68300206e90d Uploaded
deepakjadmin
parents:
diff changeset
30 use Exporter;
68300206e90d Uploaded
deepakjadmin
parents:
diff changeset
31 use Text::ParseWords;
68300206e90d Uploaded
deepakjadmin
parents:
diff changeset
32 use TextUtil;
68300206e90d Uploaded
deepakjadmin
parents:
diff changeset
33 use FileUtil;
68300206e90d Uploaded
deepakjadmin
parents:
diff changeset
34 use TimeUtil ();
68300206e90d Uploaded
deepakjadmin
parents:
diff changeset
35
68300206e90d Uploaded
deepakjadmin
parents:
diff changeset
# Exporter configuration.
#
# Every public function of this module is exported by default through @EXPORT;
# nothing is offered as an optional export. The ':all' tag covers both lists.
# The package variables are declared with "our" rather than the obsolete
# "use vars" pragma.
our(@ISA, @EXPORT, @EXPORT_OK, %EXPORT_TAGS);

@ISA = qw(Exporter);
@EXPORT = qw(
  GetPDBRecordType
  GetRecordTypesCount
  GetAllResidues
  GetConectRecordLines
  GetChainsAndResidues
  GetExperimentalTechnique
  GetExperimentalTechniqueResolution
  GetMinMaxCoords
  IsPDBFile
  IsAtomRecordType
  IsConectRecordType
  IsHeaderRecordType
  IsHetatmRecordType
  IsSeqresRecordType
  IsModelRecordType
  IsEndmdlRecordType
  IsTerRecordType
  IsMasterRecordType
  ReadPDBFile
  ParseHeaderRecordLine
  GenerateHeaderRecordLine
  GenerateHeaderRecordTimeStamp
  ParseAtomRecordLine
  GenerateAtomRecordLine
  ParseAtomOrHetatmRecordLine
  GenerateAtomOrHetatmRecordLine
  GenerateHetatmRecordLine
  ParseHetatmRecordLine
  ParseConectRecordLine
  GenerateConectRecordLine
  ParseExpdtaRecordLine
  ParseRemark2ResolutionRecordLine
  ParseSeqresRecordLine
  ParseTerRecordLine
  GenerateTerRecordLine
  ParseMasterRecordLine
  GenerateEndRecordLine
);
@EXPORT_OK = qw();

%EXPORT_TAGS = (all => [@EXPORT, @EXPORT_OK]);
68300206e90d Uploaded
deepakjadmin
parents:
diff changeset
43
68300206e90d Uploaded
deepakjadmin
parents:
diff changeset
# Return the record type of a PDB record line.
#
# Public wrapper: the work is delegated to _GetRecordType and its result is
# returned unchanged.
#
sub GetPDBRecordType {
  my $RecordLine = shift;

  return _GetRecordType($RecordLine);
}
68300206e90d Uploaded
deepakjadmin
parents:
diff changeset
50
68300206e90d Uploaded
deepakjadmin
parents:
diff changeset
# Check whether a file looks like a PDB file.
#
# Only the first text line returned by GetTextLine is examined: the file is
# reported as a PDB file when that line starts with HEADER (case-insensitive).
#
# Arguments:
#   $PDBFile - Name of the file to check.
#
# Returns 1 when the first line is a HEADER record and 0 otherwise. Dies when
# the file can't be opened for reading.
#
sub IsPDBFile {
  my($PDBFile) = @_;
  my($Line, $Status, $PDBFileHandle);

  # Three-argument open with a lexical handle: the file name is never
  # interpreted as a mode or pipe specification, and no package-wide PDBFILE
  # handle is clobbered. The lexical handle is a glob reference, just like the
  # \*PDBFILE value previously passed to GetTextLine.
  open $PDBFileHandle, '<', $PDBFile or die "Can't open $PDBFile: $!\n";
  $Line = GetTextLine($PDBFileHandle);
  close $PDBFileHandle;

  # What GetTextLine returns at end of file isn't visible from here; guard
  # against an undefined value so an empty file is simply "not a PDB file".
  $Status = (defined($Line) && $Line =~ /^HEADER/i) ? 1 : 0;

  return $Status;
}
68300206e90d Uploaded
deepakjadmin
parents:
diff changeset
64
68300206e90d Uploaded
deepakjadmin
parents:
diff changeset
# Is it an ATOM record line? The check is delegated to _IsRecordType.
sub IsAtomRecordType {
  my $RecordLine = shift;

  return _IsRecordType($RecordLine, 'ATOM');
}
68300206e90d Uploaded
deepakjadmin
parents:
diff changeset
71
68300206e90d Uploaded
deepakjadmin
parents:
diff changeset
# Is it a CONECT record line? The check is delegated to _IsRecordType.
sub IsConectRecordType {
  my $RecordLine = shift;

  return _IsRecordType($RecordLine, 'CONECT');
}
68300206e90d Uploaded
deepakjadmin
parents:
diff changeset
78
68300206e90d Uploaded
deepakjadmin
parents:
diff changeset
# Is it a HEADER record line? The check is delegated to _IsRecordType.
sub IsHeaderRecordType {
  my $RecordLine = shift;

  return _IsRecordType($RecordLine, 'HEADER');
}
68300206e90d Uploaded
deepakjadmin
parents:
diff changeset
85
68300206e90d Uploaded
deepakjadmin
parents:
diff changeset
# Is it a HETATM (hetero atom) record line? The check is delegated to
# _IsRecordType.
sub IsHetatmRecordType {
  my $RecordLine = shift;

  return _IsRecordType($RecordLine, 'HETATM');
}
68300206e90d Uploaded
deepakjadmin
parents:
diff changeset
92
68300206e90d Uploaded
deepakjadmin
parents:
diff changeset
# Is it a SEQRES record line? The check is delegated to _IsRecordType.
sub IsSeqresRecordType {
  my $RecordLine = shift;

  return _IsRecordType($RecordLine, 'SEQRES');
}
68300206e90d Uploaded
deepakjadmin
parents:
diff changeset
99
68300206e90d Uploaded
deepakjadmin
parents:
diff changeset
# Is it a MODEL record line? The check is delegated to _IsRecordType.
sub IsModelRecordType {
  my $RecordLine = shift;

  return _IsRecordType($RecordLine, 'MODEL');
}
68300206e90d Uploaded
deepakjadmin
parents:
diff changeset
106
68300206e90d Uploaded
deepakjadmin
parents:
diff changeset
# Is it an ENDMDL record line? The check is delegated to _IsRecordType.
sub IsEndmdlRecordType {
  my $RecordLine = shift;

  return _IsRecordType($RecordLine, 'ENDMDL');
}
68300206e90d Uploaded
deepakjadmin
parents:
diff changeset
113
68300206e90d Uploaded
deepakjadmin
parents:
diff changeset
# Is it a TER record line? The check is delegated to _IsRecordType.
sub IsTerRecordType {
  my $RecordLine = shift;

  return _IsRecordType($RecordLine, 'TER');
}
68300206e90d Uploaded
deepakjadmin
parents:
diff changeset
120
68300206e90d Uploaded
deepakjadmin
parents:
diff changeset
# Is it a MASTER record line? The check is delegated to _IsRecordType.
sub IsMasterRecordType {
  my $RecordLine = shift;

  return _IsRecordType($RecordLine, 'MASTER');
}
68300206e90d Uploaded
deepakjadmin
parents:
diff changeset
127
68300206e90d Uploaded
deepakjadmin
parents:
diff changeset
# Tally the record types found in a list of PDB record lines.
#
# Arguments:
#   $PDBRecordLinesRef   - Reference to an array of PDB record lines.
#   $SpecifiedRecordType - Optional. When true, only records whose type equals
#                          this value (after upper-casing it) are tallied.
#   $GetRecordLinesFlag  - Optional. When true, the tallied record lines are
#                          collected as well.
#
# The optional arguments are honored only for calls with exactly two or three
# arguments; any other argument count uses just the first argument.
#
# Returns a reference to a hash with these key/value pairs:
#   {RecordTypes}        - An array of unique record types in order of their
#                          first appearance in the lines
#   {Count}{$RecordType} - Count of each record type
#   {Lines}{$RecordType} - Lines for each record type; filled in only when
#                          $GetRecordLinesFlag is true
#
sub GetRecordTypesCount {
  my $ArgCount = scalar @_;
  my($PDBRecordLinesRef, $SpecifiedRecordType, $GetRecordLinesFlag) = @_;

  if ($ArgCount == 3) {
    $SpecifiedRecordType = uc $SpecifiedRecordType;
  }
  elsif ($ArgCount == 2) {
    $SpecifiedRecordType = uc $SpecifiedRecordType;
    $GetRecordLinesFlag = 0;
  }
  else {
    $SpecifiedRecordType = '';
    $GetRecordLinesFlag = 0;
  }

  my %RecordTypeDataMap = (
    RecordTypes => [],
    Count => {},
    Lines => {},
  );

  for my $RecordLine (@{$PDBRecordLinesRef}) {
    my $RecordType = _GetRecordType($RecordLine);

    # Skip everything except the requested record type, if one was given...
    next if ($SpecifiedRecordType && ($SpecifiedRecordType ne $RecordType));

    if (!exists $RecordTypeDataMap{Count}{$RecordType}) {
      # First record of this type: remember the order of appearance...
      push @{$RecordTypeDataMap{RecordTypes}}, $RecordType;
      $RecordTypeDataMap{Count}{$RecordType} = 0;
    }
    $RecordTypeDataMap{Count}{$RecordType} += 1;

    if ($GetRecordLinesFlag) {
      push @{$RecordTypeDataMap{Lines}{$RecordType}}, $RecordLine;
    }
  }

  return \%RecordTypeDataMap;
}
68300206e90d Uploaded
deepakjadmin
parents:
diff changeset
180
68300206e90d Uploaded
deepakjadmin
parents:
diff changeset
# Collect the CONECT record lines that only refer to specified atom numbers.
#
# Arguments:
#   $PDBRecordLinesRef - Reference to an array of PDB record lines.
#   $AtomNumbersMapRef - Reference to a hash whose keys are the atom numbers
#                        of interest.
#
# A CONECT line is kept only when every defined, non-zero atom number returned
# by ParseConectRecordLine for it is a key in $AtomNumbersMapRef; otherwise
# the whole line is dropped. The lines themselves are never altered.
#
# Returns a reference to the list of retained CONECT record lines.
#
sub GetConectRecordLines {
  my($PDBRecordLinesRef, $AtomNumbersMapRef) = @_;
  my @RetainedLines = ();

  LINE: for my $RecordLine (@{$PDBRecordLinesRef}) {
    next LINE unless IsConectRecordType($RecordLine);

    for my $ConectAtomNumber (ParseConectRecordLine($RecordLine)) {
      # Undefined and zero/empty atom numbers don't take part in the check...
      next unless (defined($ConectAtomNumber) && $ConectAtomNumber);

      # One unknown atom number is enough to reject the whole line...
      next LINE unless (exists $AtomNumbersMapRef->{$ConectAtomNumber});
    }
    push @RetainedLines, $RecordLine;
  }

  return \@RetainedLines;
}
68300206e90d Uploaded
deepakjadmin
parents:
diff changeset
210
68300206e90d Uploaded
deepakjadmin
parents:
diff changeset
# Get chains and residue information using ATOM/HETATM or SEQRES records.
#
# Arguments:
#   $PDBRecordLinesRef             - Reference to an array of PDB record lines.
#   $RecordsSource                 - Optional: 'AtomAndHetatm' (default) or
#                                    'Seqres', matched case-insensitively.
#   $GetChainResiduesBeyondTERFlag - Optional, default 0. Passed through to the
#                                    ATOM/HETATM based implementation.
#   $GetRecordLinesFlag            - Optional, default 0. Passed through to the
#                                    ATOM/HETATM based implementation.
#
# The optional arguments are honored only for calls with two to four
# arguments; any other argument count uses just the first argument.
#
# The work is delegated to _GetChainsAndResiduesFromAtomHetatmRecords or
# _GetChainsAndResiduesFromSeqresRecords and their result is returned as is.
# For any other records source, a reference to a hash with these empty
# entries is returned:
#
# @{$ChainsDataMap{ChainIDs}}
# %{$ChainsDataMap{Residues}}
# %{$ChainsDataMap{ResidueNumbers}}
# %{$ChainsDataMap{ResidueCount}}
#
sub GetChainsAndResidues {
  my $PDBRecordLinesRef = $_[0];
  my($RecordsSource, $GetChainResiduesBeyondTERFlag, $GetRecordLinesFlag) = ('AtomAndHetatm', 0, 0);

  my $ArgCount = scalar @_;
  if ($ArgCount >= 2 && $ArgCount <= 4) {
    $RecordsSource = $_[1];
    $GetChainResiduesBeyondTERFlag = $_[2] if ($ArgCount >= 3);
    $GetRecordLinesFlag = $_[3] if ($ArgCount == 4);
  }

  if ($RecordsSource =~ /^AtomAndHetatm$/i) {
    return _GetChainsAndResiduesFromAtomHetatmRecords($PDBRecordLinesRef, $GetChainResiduesBeyondTERFlag, $GetRecordLinesFlag);
  }
  if ($RecordsSource =~ /^Seqres$/i) {
    return _GetChainsAndResiduesFromSeqresRecords($PDBRecordLinesRef);
  }

  # Unknown records source: hand back an empty, fully initialized data map...
  return {
    ChainIDs => [],
    Residues => {},
    ResidueNumbers => {},
    ResidueCount => {},
  };
}
68300206e90d Uploaded
deepakjadmin
parents:
diff changeset
262
68300206e90d Uploaded
deepakjadmin
parents:
diff changeset
263
68300206e90d Uploaded
deepakjadmin
parents:
diff changeset
# Get residue information using ATOM/HETATM records and return a reference to a
# hash with these keys:
#
# @{$ResiduesDataMap{ResidueNames}} - List of all the residues
# %{$ResiduesDataMap{ResidueCount}{$ResidueName}} - Count of residues
# @{$ResiduesDataMap{AtomResidueNames}} - List of residues in ATOM records
# %{$ResiduesDataMap{AtomResidueCount}{$ResidueName}} - Count of residues in ATOM records
# @{$ResiduesDataMap{HetatmResidueNames}} - List of residues in HETATM records
# %{$ResiduesDataMap{HetatmResidueCount}{$ResidueName}} - Count of residues in HETATM records
#
# Arguments:
#   $PDBRecordLinesRef - Reference to an array of PDB record lines.
#
# Notes:
#   . ATOM/HETATM records after the first ENDMDL record are simply ignored.
#   . A new residue is recorded whenever the chain ID or the residue number
#     differs from the previous ATOM/HETATM record.
#   . NOTE(review): insertion codes are not compared, so consecutive residues
#     sharing a residue number within a chain are counted once - confirm that
#     this is intended.
#
sub GetAllResidues {
  my($PDBRecordLinesRef) = @_;

  my(%ResiduesDataMap) = (
    ResidueNames => [],
    ResidueCount => {},
    AtomResidueNames => [],
    AtomResidueCount => {},
    HetatmResidueNames => [],
    HetatmResidueCount => {},
  );

  # An explicit flag marks whether a previous residue exists. Using '' and 0
  # as start values for the previous chain ID and residue number would drop
  # the first residue of a file whose first record has an empty chain ID and
  # residue number 0.
  my $PreviousResidueSeen = 0;
  my($PreviousChainID, $PreviousResidueNumber);

  LINE: for my $RecordLine (@{$PDBRecordLinesRef}) {
    last LINE if IsEndmdlRecordType($RecordLine);

    my $IsAtomRecord = IsAtomRecordType($RecordLine);
    my $IsHetatmRecord = IsHetatmRecordType($RecordLine);
    next LINE unless ($IsAtomRecord || $IsHetatmRecord);

    # Only residue name, chain ID and residue number - the fourth through sixth
    # values returned by ParseAtomRecordLine - are needed here...
    my($ResidueName, $ChainID, $ResidueNumber) = (ParseAtomRecordLine($RecordLine))[3, 4, 5];

    # Remaining atoms of the residue that was just recorded...
    if ($PreviousResidueSeen && ($PreviousChainID eq $ChainID) && ($ResidueNumber == $PreviousResidueNumber)) {
      next LINE;
    }
    ($PreviousResidueSeen, $PreviousChainID, $PreviousResidueNumber) = (1, $ChainID, $ResidueNumber);

    # Store the residue and update its count...
    push @{$ResiduesDataMap{ResidueNames}}, $ResidueName;
    $ResiduesDataMap{ResidueCount}{$ResidueName} += 1;

    # Update ATOM residue data...
    if ($IsAtomRecord) {
      push @{$ResiduesDataMap{AtomResidueNames}}, $ResidueName;
      $ResiduesDataMap{AtomResidueCount}{$ResidueName} += 1;
    }

    # Update HETATM residue data...
    if ($IsHetatmRecord) {
      push @{$ResiduesDataMap{HetatmResidueNames}}, $ResidueName;
      $ResiduesDataMap{HetatmResidueCount}{$ResidueName} += 1;
    }
  }

  return \%ResiduesDataMap;
}
68300206e90d Uploaded
deepakjadmin
parents:
diff changeset
346
68300206e90d Uploaded
deepakjadmin
parents:
diff changeset
# Return min/max XYZ coordinates for ATOM/HETATM records...
#
# Input:   reference to an array of PDB record lines.
# Returns: ($XMin, $YMin, $ZMin, $XMax, $YMax, $ZMax). All six values are undef
#          when the input contains no ATOM/HETATM record.
#
sub GetMinMaxCoords {
  my($PDBRecordLinesRef) = @_;

  # The extremes start out undefined rather than as magic sentinel numbers, so
  # coordinates of any magnitude are tracked and "no data" stays unambiguous...
  my($XMin, $YMin, $ZMin, $XMax, $YMax, $ZMax);

  LINE: for my $RecordLine (@{$PDBRecordLinesRef}) {
    if (!(IsAtomRecordType($RecordLine) || IsHetatmRecordType($RecordLine))) {
      next LINE;
    }

    # X, Y and Z are the 8th, 9th and 10th values returned by the parser...
    my($X, $Y, $Z) = (ParseAtomRecordLine($RecordLine))[7, 8, 9];

    if (!defined($XMin) || $X < $XMin) { $XMin = $X; }
    if (!defined($YMin) || $Y < $YMin) { $YMin = $Y; }
    if (!defined($ZMin) || $Z < $ZMin) { $ZMin = $Z; }

    if (!defined($XMax) || $X > $XMax) { $XMax = $X; }
    if (!defined($YMax) || $Y > $YMax) { $YMax = $Y; }
    if (!defined($ZMax) || $Z > $ZMax) { $ZMax = $Z; }
  }

  return ($XMin, $YMin, $ZMin, $XMax, $YMax, $ZMax);
}
68300206e90d Uploaded
deepakjadmin
parents:
diff changeset
380
68300206e90d Uploaded
deepakjadmin
parents:
diff changeset
# Read PDB file and return reference to record lines..
#
# Input:   name of the PDB file to read.
# Returns: reference to an array holding every line handed back by GetTextLine.
# Dies with "Can't open ..." when the file can't be opened.
#
sub ReadPDBFile {
  my($PDBFile) = @_;

  my($Line, @PDBRecordLines);

  @PDBRecordLines = ();

  # Three-argument open with an explicit read mode: characters such as '<', '>'
  # or '|' and any leading/trailing whitespace in the file name are taken
  # literally instead of being interpreted as part of an open mode. The lexical
  # handle is a glob reference, just like the \*PDBFILE passed previously...
  open my $PDBFileHandle, '<', $PDBFile or die "Can't open $PDBFile: $!\n";

  # NOTE(review): reading stops at the first false value returned by
  # GetTextLine; presumably that only happens at end of file - confirm against
  # the GetTextLine implementation.
  while ($Line = GetTextLine($PDBFileHandle)) {
    push @PDBRecordLines, $Line;
  }

  close $PDBFileHandle;

  return (\@PDBRecordLines);
}
68300206e90d Uploaded
deepakjadmin
parents:
diff changeset
397
68300206e90d Uploaded
deepakjadmin
parents:
diff changeset
#
# Get experimental technique information...
#
# Input:   reference to an array of PDB record lines.
# Returns: the technique parsed from the first EXPDTA record; undef when none
#          of the lines is an EXPDTA record.
#
sub GetExperimentalTechnique {
  my($PDBRecordLinesRef) = @_;

  for my $PDBRecord (@{$PDBRecordLinesRef}) {
    next unless _IsRecordType($PDBRecord, 'EXPDTA');

    # Only the first EXPDTA record is used; its continuation number is ignored...
    my(undef, $Technique) = ParseExpdtaRecordLine($PDBRecord);
    return $Technique;
  }

  return undef;
}
68300206e90d Uploaded
deepakjadmin
parents:
diff changeset
416
68300206e90d Uploaded
deepakjadmin
parents:
diff changeset
#
# Get experimental technique resolution information...
#
# Input:   reference to an array of PDB record lines.
# Returns: ($Resolution, $ResolutionUnits) as parsed from the first
#          "REMARK 2 RESOLUTION." record; (undef, undef) when no such record
#          is present.
#
sub GetExperimentalTechniqueResolution {
  my($PDBRecordLinesRef) = @_;
  my($RecordLine, $Resolution, $ResolutionUnits);

  ($Resolution, $ResolutionUnits) = ((undef) x 2);

  LINE: for $RecordLine (@{$PDBRecordLinesRef}) {
    # The record is column based: "REMARK" in columns 1-6, "2" in column 10 and
    # "RESOLUTION." in columns 12-22. Any run of whitespace is accepted between
    # the fields and the trailing period is matched literally...
    if ($RecordLine =~ /^REMARK\s+2\s+RESOLUTION\./i) {
      ($Resolution, $ResolutionUnits) = ParseRemark2ResolutionRecordLine($RecordLine);
      last LINE;
    }
  }

  return ($Resolution, $ResolutionUnits);
}
68300206e90d Uploaded
deepakjadmin
parents:
diff changeset
435
68300206e90d Uploaded
deepakjadmin
parents:
diff changeset
#
# Parse HEADER record line...
#
# Fields are taken by position: 10 characters are skipped, followed by a 40
# character classification and a 9 character deposition date; lines longer than
# 62 characters also carry a 4 character ID code after 3 more skipped characters.
#
# Returns: ($Classification, $DepositionDate, $IDCode). All three are undef when
#          the line is not a HEADER record; the ID code is an empty string for
#          lines of 62 characters or less.
#
sub ParseHeaderRecordLine {
  my($Line) = @_;

  return (undef, undef, undef) unless $Line =~ /^HEADER/i;

  my($Classification, $DepositionDate);
  my $IDCode = '';

  if (length($Line) > 62) {
    ($Classification, $DepositionDate, $IDCode) = unpack("x10A40A9x3A4", $Line);
  }
  else {
    # Too short to hold an ID code...
    ($Classification, $DepositionDate) = unpack("x10A40A9", $Line);
  }

  # Classification may contain embedded spaces, so only its ends are trimmed;
  # all spaces are dropped from the date and the ID code...
  $Classification = RemoveLeadingAndTrailingWhiteSpaces($Classification);
  $DepositionDate =~ tr/ //d;
  $IDCode =~ tr/ //d;

  return ($Classification, $DepositionDate, $IDCode);
}
68300206e90d Uploaded
deepakjadmin
parents:
diff changeset
464
68300206e90d Uploaded
deepakjadmin
parents:
diff changeset
#
# Generate HEADER record line...
#
# Arguments are optional and positional: ($IDCode, $Classification, $Date).
# Classification defaults to "Created using MayaChemTools" and the date to the
# value returned by GenerateHeaderRecordTimeStamp. Calls with more than three
# arguments fall back to the defaults, as before.
#
# Returns: the formatted HEADER line: "HEADER" in columns 1-6, classification in
#          columns 11-50, date in columns 51-59 and ID code in columns 63-66.
#
sub GenerateHeaderRecordLine {
  my($Classification, $Date, $IDCode, $Line);

  $Classification = "Created using MayaChemTools";
  if (@_ == 3) {
    ($IDCode, $Classification, $Date) = @_;
  }
  elsif (@_ == 2) {
    ($IDCode, $Classification) = @_;
  }
  elsif (@_ == 1) {
    ($IDCode) = @_;
  }

  # A time stamp is needed only when the caller didn't supply a date...
  if (@_ != 3) {
    $Date = GenerateHeaderRecordTimeStamp();
  }

  # No ID code: leave the field blank instead of formatting an undefined value...
  if (!defined $IDCode) {
    $IDCode = '';
  }

  # Column layout mirrors the "x10A40A9x3A4" template used by
  # ParseHeaderRecordLine, so generated lines can be parsed back...
  $Line = sprintf "HEADER    %-40.40s%9.9s   %4.4s", $Classification, $Date, $IDCode;
  return $Line;
}
68300206e90d Uploaded
deepakjadmin
parents:
diff changeset
485
68300206e90d Uploaded
deepakjadmin
parents:
diff changeset
# Generate PDB header time stamp...
#
# Thin wrapper: hands back whatever TimeUtil::PDBFileTimeStamp returns.
#
sub GenerateHeaderRecordTimeStamp {
  return TimeUtil::PDBFileTimeStamp();
}
68300206e90d Uploaded
deepakjadmin
parents:
diff changeset
490
68300206e90d Uploaded
deepakjadmin
parents:
diff changeset
#
# Parse ATOM record line.
#
# Hands the line to _ParseAtomOrHetatmRecordLine and returns its result as is.
#
sub ParseAtomRecordLine {
  my $RecordLine = shift;

  return _ParseAtomOrHetatmRecordLine($RecordLine);
}
68300206e90d Uploaded
deepakjadmin
parents:
diff changeset
499
68300206e90d Uploaded
deepakjadmin
parents:
diff changeset
# Generate ATOM record line...
#
# Expected arguments, in order: AtomNumber, AtomName, AlternateLocation,
# ResidueName, ChainID, ResidueNumber, InsertionCode, X, Y, Z, Occupancy,
# TemperatureFactor, SegmentID, ElementSymbol, AtomCharge.
#
# Returns whatever _GenerateAtomOrHetatmRecordLine produces for record type 'ATOM'.
#
sub GenerateAtomRecordLine {
  # Exactly fifteen values are forwarded: missing trailing arguments are passed
  # on as undef and any extra ones are dropped...
  my(@AtomRecordValues) = @_[0 .. 14];

  return _GenerateAtomOrHetatmRecordLine('ATOM', @AtomRecordValues);
}
68300206e90d Uploaded
deepakjadmin
parents:
diff changeset
506
68300206e90d Uploaded
deepakjadmin
parents:
diff changeset
#
# Parse ATOM/HETATM record line.
#
# Public entry point for _ParseAtomOrHetatmRecordLine; its result is returned as is.
#
sub ParseAtomOrHetatmRecordLine {
  my $RecordLine = shift;

  return _ParseAtomOrHetatmRecordLine($RecordLine);
}
68300206e90d Uploaded
deepakjadmin
parents:
diff changeset
515
68300206e90d Uploaded
deepakjadmin
parents:
diff changeset
# Generate ATOM/HETATM record line...
#
# Expected arguments, in order: RecordType, AtomNumber, AtomName,
# AlternateLocation, ResidueName, ChainID, ResidueNumber, InsertionCode, X, Y, Z,
# Occupancy, TemperatureFactor, SegmentID, ElementSymbol, AtomCharge.
#
# Public entry point for _GenerateAtomOrHetatmRecordLine; its result is returned
# as is.
#
sub GenerateAtomOrHetatmRecordLine {
  # Exactly sixteen values are forwarded: missing trailing arguments are passed
  # on as undef and any extra ones are dropped...
  my(@RecordValues) = @_[0 .. 15];

  return _GenerateAtomOrHetatmRecordLine(@RecordValues);
}
68300206e90d Uploaded
deepakjadmin
parents:
diff changeset
#
# Parse HETATM record line...
#
# Hands the line to _ParseAtomOrHetatmRecordLine and returns its result as is.
#
sub ParseHetatmRecordLine {
  my $RecordLine = shift;

  return _ParseAtomOrHetatmRecordLine($RecordLine);
}
68300206e90d Uploaded
deepakjadmin
parents:
diff changeset
530
68300206e90d Uploaded
deepakjadmin
parents:
diff changeset
# Generate HETATM record line...
#
# Expected arguments, in order: AtomNumber, AtomName, AlternateLocation,
# ResidueName, ChainID, ResidueNumber, InsertionCode, X, Y, Z, Occupancy,
# TemperatureFactor, SegmentID, ElementSymbol, AtomCharge.
#
# Returns whatever _GenerateAtomOrHetatmRecordLine produces for record type
# 'HETATM'.
#
sub GenerateHetatmRecordLine {
  # Exactly fifteen values are forwarded: missing trailing arguments are passed
  # on as undef and any extra ones are dropped...
  my(@HetatmRecordValues) = @_[0 .. 14];

  return _GenerateAtomOrHetatmRecordLine('HETATM', @HetatmRecordValues);
}
68300206e90d Uploaded
deepakjadmin
parents:
diff changeset
537
68300206e90d Uploaded
deepakjadmin
parents:
diff changeset
# Parse EXPDTA record line...
#
# EXPDTA format:
#
#  1 -  6  Record name   "EXPDTA"
#  9 - 10  Continuation  continuation  Allows concatenation of multiple records.
# 11 - 70  SList         technique     The experimental technique(s) with optional
#                                      comment describing the sample or experiment.
#
# The EXPDTA record identifies the experimental technique used. This may refer to
# the type of radiation and sample, or include the spectroscopic or modeling
# technique. Permitted values include:
#
# ELECTRON DIFFRACTION
# FIBER DIFFRACTION
# FLUORESCENCE TRANSFER
# NEUTRON DIFFRACTION
# NMR
# THEORETICAL MODEL
# X-RAY DIFFRACTION
#
# Returns: ($ContinuationNum, $ExperimentalTechnique); two undefs when the line
#          is not an EXPDTA record.
#
sub ParseExpdtaRecordLine {
  my($Line) = @_;

  return ((undef) x 2) unless $Line =~ /^EXPDTA/i;

  my($ContinuationNum, $RawTechnique) = unpack("x8A2A60" , $Line);

  # The continuation number loses all its spaces; the technique may contain
  # embedded spaces, so only its ends are trimmed...
  $ContinuationNum =~ tr/ //d;
  my $ExperimentalTechnique = RemoveLeadingAndTrailingWhiteSpaces($RawTechnique);

  return ($ContinuationNum, $ExperimentalTechnique);
}
68300206e90d Uploaded
deepakjadmin
parents:
diff changeset
571
68300206e90d Uploaded
deepakjadmin
parents:
diff changeset
# Parse REMARK 2 record line...
#
# REMARK 2 format:
#
# The second REMARK 2 record has one of two formats. The first is used for
# diffraction studies, the second for other types of experiments in which
# resolution is not relevant, e.g., NMR and theoretical modeling.
#
# For diffraction experiments:
#
#  1 -  6  Record name   "REMARK"
# 10       LString(1)    "2"
# 12 - 22  LString(11)   "RESOLUTION."
# 23 - 27  Real(5.2)     resolution    Resolution.
# 29 - 38  LString(10)   "ANGSTROMS."
#
# Newer PDB format versions place the resolution in columns 24 - 30 and
# "ANGSTROMS." in columns 32 - 41. To support both layouts, the value and its
# units are taken as the first two whitespace delimited words after
# "RESOLUTION." instead of being cut out at fixed columns.
#
# REMARK 2 when not a diffraction experiment:
#
#  1 -  6  Record name   "REMARK"
# 10       LString(1)    "2"
# 12 - 38  LString(28)   "RESOLUTION. NOT APPLICABLE."
# 41 - 70  String        comment       Comment.
#
# Returns: ($Resolution, $ResolutionUnits) with the trailing period removed from
#          the units; ("NOT APPLICABLE", "") for non-diffraction records; empty
#          strings for any field missing from a truncated record; two undefs
#          when the line is not a "REMARK 2 RESOLUTION." record.
#
sub ParseRemark2ResolutionRecordLine {
  my($Line) = @_;

  # Any run of whitespace is accepted between the fixed fields and the period
  # after RESOLUTION is matched literally...
  if ($Line !~ /^REMARK\s+2\s+RESOLUTION\./i) {
    return ((undef) x 2);
  }

  my($Resolution, $ResolutionUnits) = ('', '');

  if ($Line =~ /NOT APPLICABLE/i) {
    $Resolution = "NOT APPLICABLE";
  }
  elsif ($Line =~ /^REMARK\s+2\s+RESOLUTION\.\s*(\S+)(?:\s+(\S+))?/i) {
    # Captured words carry no surrounding whitespace, so no trimming is needed...
    $Resolution = $1;
    $ResolutionUnits = defined($2) ? $2 : '';
  }

  $ResolutionUnits =~ s/\.$//;

  return ($Resolution, $ResolutionUnits);
}
68300206e90d Uploaded
deepakjadmin
parents:
diff changeset
617
68300206e90d Uploaded
deepakjadmin
parents:
diff changeset
#
# Parse SEQRES record line...
#
# SEQRES format:
#
#  1 -  6  Record name "SEQRES"
#  9 - 10  Serial number of the SEQRES record for the current chain. Starts at 1
#          and increments by one each line. Reset to 1 for each chain.
# 12       Chain identifier
# 14 - 17  Integer numRes: Number of residues in the chain
# 20 - 22, 24 - 26, ..., 68 - 70  Residue name resName: Residue name.
#
# Returns: ($RecordSerialNumber, $ChainID, $NumOfResidues, $ResidueNames), where
#          $ResidueNames is the text of columns 20 - 70 with its ends trimmed.
#          A line that is not a SEQRES record yields five undefs - one more than
#          the number of values returned on success.
#
sub ParseSeqresRecordLine {
  my($Line) = @_;

  return ((undef) x 5) unless $Line =~ /^SEQRES/i;

  my($RecordSerialNumber, $ChainID, $NumOfResidues, $RawResidueNames) = unpack("x8A2x1A1x1A4x2A51" , $Line);

  # The three short fields lose all their spaces; the loop variable aliases
  # each of them in turn...
  for my $Field ($RecordSerialNumber, $ChainID, $NumOfResidues) {
    $Field =~ s/ //g;
  }
  my $ResidueNames = RemoveLeadingAndTrailingWhiteSpaces($RawResidueNames);

  return ($RecordSerialNumber, $ChainID, $NumOfResidues, $ResidueNames);
}
68300206e90d Uploaded
deepakjadmin
parents:
diff changeset
643
68300206e90d Uploaded
deepakjadmin
parents:
diff changeset
#
# Parse CONECT record line...
#
# CONECT format:
#
#  1 -  6  Record name "CONECT"
#  7 - 11  Atom number
# 12 - 16, 17 - 21, 22 - 26, 27 - 31  Atom number of bonded atom
#
# 32 - 36, 37 - 41  Atom number of hydrogen bonded atom
# 42 - 46           Atom number of salt bridged atom
# 47 - 51, 52 - 56  Atom number of hydrogen bonded atom
# 57 - 61           Atom number of salt bridged atom
#
# Returns: eleven values in column order - AtomNum, BondedAtomNum1 to
#          BondedAtomNum4, HBondedAtomNum1, HBondedAtomNum2, SaltBridgedAtomNum1,
#          HBondedAtomNum3, HBondedAtomNum4, SaltBridgedAtomNum2 - each with all
#          spaces removed; eleven undefs when the line is not a CONECT record.
#
sub ParseConectRecordLine {
  my($Line) = @_;

  return ((undef) x 11) unless $Line =~ /^CONECT/i;

  # Skip the record name, then cut out eleven fields of five characters each...
  my(@AtomNums) = unpack('x6' . 'A5' x 11, $Line);
  for my $AtomNum (@AtomNums) {
    $AtomNum =~ s/ //g;
  }

  # An explicit slice always yields eleven values in list context...
  return @AtomNums[0 .. 10];
}
68300206e90d Uploaded
deepakjadmin
parents:
diff changeset
668
68300206e90d Uploaded
deepakjadmin
parents:
diff changeset
# Generate CONECT record line...
#
# Expected arguments, in order: AtomNum, BondedAtomNum1 to BondedAtomNum4,
# HBondedAtomNum1, HBondedAtomNum2, SaltBridgedAtomNum1, HBondedAtomNum3,
# HBondedAtomNum4, SaltBridgedAtomNum2.
#
# Returns: "CONECT" followed by the eleven values, each right justified in - and
#          truncated to - a field of five characters.
#
sub GenerateConectRecordLine {
  # Exactly eleven values are formatted: missing trailing arguments become
  # undef and any extra ones are ignored...
  my(@AtomNums) = @_[0 .. 10];

  return sprintf("CONECT" . "%5.5s" x 11, @AtomNums);
}
68300206e90d Uploaded
deepakjadmin
parents:
diff changeset
678
68300206e90d Uploaded
deepakjadmin
parents:
diff changeset
679 #
68300206e90d Uploaded
deepakjadmin
parents:
diff changeset
680 # Parse TER record line...
68300206e90d Uploaded
deepakjadmin
parents:
diff changeset
681 #
68300206e90d Uploaded
deepakjadmin
parents:
diff changeset
682 # TER format:
68300206e90d Uploaded
deepakjadmin
parents:
diff changeset
683 #
68300206e90d Uploaded
deepakjadmin
parents:
diff changeset
684 #1 - 6 Record name "TER "
68300206e90d Uploaded
deepakjadmin
parents:
diff changeset
685 # 7 - 11 Serial number
68300206e90d Uploaded
deepakjadmin
parents:
diff changeset
686 # 18 - 20 Residue name
68300206e90d Uploaded
deepakjadmin
parents:
diff changeset
687 # 22 Chain identifier
68300206e90d Uploaded
deepakjadmin
parents:
diff changeset
688 # 23 - 26 Residue sequence number
68300206e90d Uploaded
deepakjadmin
parents:
diff changeset
689 # 27 Insertion code
68300206e90d Uploaded
deepakjadmin
parents:
diff changeset
690 #
68300206e90d Uploaded
deepakjadmin
parents:
diff changeset
# Parse a TER record line into its individual fields.
#
# Argument: the record line.
#
# Returns (SerialNumber, ResidueName, ChainID, ResidueNumber, InsertionCode)
# with all blanks removed from each value. Fields that are missing or blank in
# the line come back as empty strings. A line that does not start with TER
# yields five undefined values.
#
sub ParseTerRecordLine {
  my($Line) = @_;

  if ($Line !~ /^TER/i) {
    return ((undef) x 5);
  }

  # TER records are frequently written truncated, down to just "TER". Skipping
  # past the end of the string with 'x' is fatal in unpack, so pad the line with
  # blanks through column 27 (the last column used) and parse every line with
  # the one full template.
  my($PaddedLine) = sprintf("%-27s", $Line);

  my($SerialNumber, $ResidueName, $ChainID, $ResidueNumber, $InsertionCode) = map {s/ //g; $_} unpack("x6A5x6A3xA1A4A1", $PaddedLine);

  return ($SerialNumber, $ResidueName, $ChainID, $ResidueNumber, $InsertionCode);
}
68300206e90d Uploaded
deepakjadmin
parents:
diff changeset
715
68300206e90d Uploaded
deepakjadmin
parents:
diff changeset
# Generate TER record line...
#
# Accepts one to five arguments, in this order:
#
#   SerialNumber, ResidueName, ChainID, ResidueNumber, InsertionCode
#
# Values not supplied are written as blanks. A call with no arguments, or with
# more than five, produces a record with every field blank.
#
# Returns a 27 column line laid out as in the TER format description:
# record name in columns 1 - 6, serial number in 7 - 11, residue name in
# 18 - 20, chain identifier in 22, residue number in 23 - 26 and insertion
# code in 27.
#
sub GenerateTerRecordLine {
  my(@Fields) = ('') x 5;

  # Copy whatever leading fields the caller supplied; this includes ChainID
  # when exactly three values are passed.
  if (@_ >= 1 && @_ <= 5) {
    @Fields[0 .. $#_] = @_;
  }
  my($SerialNumber, $ResidueName, $ChainID, $ResidueNumber, $InsertionCode) = @Fields;

  # Spell out the blank columns so the output matches the template used by
  # ParseTerRecordLine (x6 A5 x6 A3 x A1 A4 A1).
  my($Format) = join('',
    sprintf('%-6s', 'TER'),   #  1 -  6  Record name
    '%5.5s',                  #  7 - 11  Serial number
    ' ' x 6,                  # 12 - 17  Blank
    '%-3.3s',                 # 18 - 20  Residue name
    ' ',                      # 21       Blank
    '%1.1s',                  # 22       Chain identifier
    '%4.4s',                  # 23 - 26  Residue sequence number
    '%1.1s'                   # 27       Insertion code
  );

  return sprintf($Format, $SerialNumber, $ResidueName, $ChainID, $ResidueNumber, $InsertionCode);
}
68300206e90d Uploaded
deepakjadmin
parents:
diff changeset
739
68300206e90d Uploaded
deepakjadmin
parents:
diff changeset
740 #
68300206e90d Uploaded
deepakjadmin
parents:
diff changeset
741 # Parse MASTER record line...
68300206e90d Uploaded
deepakjadmin
parents:
diff changeset
742 #
68300206e90d Uploaded
deepakjadmin
parents:
diff changeset
743 # MASTER record format:
68300206e90d Uploaded
deepakjadmin
parents:
diff changeset
744 #
68300206e90d Uploaded
deepakjadmin
parents:
diff changeset
745 #1 - 6 Record name "MASTER"
68300206e90d Uploaded
deepakjadmin
parents:
diff changeset
746 # 11 - 15 Number of REMARK records
68300206e90d Uploaded
deepakjadmin
parents:
diff changeset
747 # 16 - 20 "0"
68300206e90d Uploaded
deepakjadmin
parents:
diff changeset
748 # 21 - 25 Number of HET records
68300206e90d Uploaded
deepakjadmin
parents:
diff changeset
749 # 26 - 30 Number of HELIX records
68300206e90d Uploaded
deepakjadmin
parents:
diff changeset
750 # 31 - 35 Number of SHEET records
68300206e90d Uploaded
deepakjadmin
parents:
diff changeset
751 # 36 - 40 Number of TURN records
68300206e90d Uploaded
deepakjadmin
parents:
diff changeset
752 # 41 - 45 Number of SITE records
68300206e90d Uploaded
deepakjadmin
parents:
diff changeset
753 # 46 - 50 Number of coordinate transformation records (ORIGXn+SCALEn+MTRIXn)
68300206e90d Uploaded
deepakjadmin
parents:
diff changeset
754 # 51 - 55 Number of atomic coordinate records (ATOM+HETATM)
68300206e90d Uploaded
deepakjadmin
parents:
diff changeset
755 # 56 - 60 Number of TER records
68300206e90d Uploaded
deepakjadmin
parents:
diff changeset
756 # 61 - 65 Number of CONECT records
68300206e90d Uploaded
deepakjadmin
parents:
diff changeset
757 # 66 - 70 Number of SEQRES records
68300206e90d Uploaded
deepakjadmin
parents:
diff changeset
758 #
68300206e90d Uploaded
deepakjadmin
parents:
diff changeset
# Parse a MASTER record line into its eleven record counts.
#
# Argument: the record line.
#
# Returns, in order, the number of REMARK, HET, HELIX, SHEET, TURN, SITE,
# coordinate transformation, ATOM + HETATM, TER, CONECT and SEQRES records,
# each with all blanks removed. The five columns following the REMARK count
# are skipped. A line that does not start with MASTER yields eleven undefined
# values.
#
sub ParseMasterRecordLine {
  my($Line) = @_;

  unless ($Line =~ /^MASTER/i) {
    return ((undef) x 11);
  }

  # Skip columns 1 - 10, read the REMARK count, skip columns 16 - 20 and then
  # read the remaining ten five-column counts.
  my($Template) = 'x6x4A5x5' . ('A5' x 10);

  my(@RecordCounts) = unpack($Template, $Line);
  for my $RecordCount (@RecordCounts) {
    $RecordCount =~ s/ //g;
  }

  return @RecordCounts[0 .. 10];
}
68300206e90d Uploaded
deepakjadmin
parents:
diff changeset
769
68300206e90d Uploaded
deepakjadmin
parents:
diff changeset
# Generate END record line...
#
# Takes no arguments. Returns the record name END padded with blanks to the
# six columns used for record names.
#
sub GenerateEndRecordLine {
  # Pad explicitly so the width of the record name field cannot be lost.
  return sprintf('%-6s', 'END');
}
68300206e90d Uploaded
deepakjadmin
parents:
diff changeset
776
68300206e90d Uploaded
deepakjadmin
parents:
diff changeset
777 # ATOM/HETATM record format:
68300206e90d Uploaded
deepakjadmin
parents:
diff changeset
778 #
68300206e90d Uploaded
deepakjadmin
parents:
diff changeset
779 # 1 - 6 Record name
68300206e90d Uploaded
deepakjadmin
parents:
diff changeset
780 # 7 - 11 Atom serial number - right justified
68300206e90d Uploaded
deepakjadmin
parents:
diff changeset
781 # 13 - 16 Atom name
68300206e90d Uploaded
deepakjadmin
parents:
diff changeset
782 # 17 Alternate location indicator.
68300206e90d Uploaded
deepakjadmin
parents:
diff changeset
783 # 18 - 20 Residue name - right justified
68300206e90d Uploaded
deepakjadmin
parents:
diff changeset
784 # 22 Chain identifier.
68300206e90d Uploaded
deepakjadmin
parents:
diff changeset
785 # 23 - 26 Residue sequence number - right justified
68300206e90d Uploaded
deepakjadmin
parents:
diff changeset
786 # 27 Code for insertion of residues.
68300206e90d Uploaded
deepakjadmin
parents:
diff changeset
787 # 31 - 38 Real(8.3), Orthogonal coordinates for X in Angstroms.
68300206e90d Uploaded
deepakjadmin
parents:
diff changeset
788 # 39 - 46 Real(8.3), Orthogonal coordinates for Y in Angstroms.
68300206e90d Uploaded
deepakjadmin
parents:
diff changeset
789 # 47 - 54 Real(8.3), Orthogonal coordinates for Z in Angstroms.
68300206e90d Uploaded
deepakjadmin
parents:
diff changeset
790 # 55 - 60 Real(6.2), Occupancy
68300206e90d Uploaded
deepakjadmin
parents:
diff changeset
791 # 61 - 66 Real(6.2), Temperature factor
68300206e90d Uploaded
deepakjadmin
parents:
diff changeset
792 # 73 - 76 LString(4), Segment identifier, left-justified.
68300206e90d Uploaded
deepakjadmin
parents:
diff changeset
793 # 77 - 78 LString(2), Element symbol, right-justified.
68300206e90d Uploaded
deepakjadmin
parents:
diff changeset
794 #79 - 80 LString(2), Charge on the atom.
68300206e90d Uploaded
deepakjadmin
parents:
diff changeset
795 #
68300206e90d Uploaded
deepakjadmin
parents:
diff changeset
796 # Notes:
68300206e90d Uploaded
deepakjadmin
parents:
diff changeset
797 # . Atom names starting with C, N, O and S are left justified starting with column 14
68300206e90d Uploaded
deepakjadmin
parents:
diff changeset
798 # and others are left justified starting with column 13.
68300206e90d Uploaded
deepakjadmin
parents:
diff changeset
799 #
68300206e90d Uploaded
deepakjadmin
parents:
diff changeset
800 # . Four characters (columns 13 - 16) are reserved for atom names, assigned as follows:
68300206e90d Uploaded
deepakjadmin
parents:
diff changeset
801 #
68300206e90d Uploaded
deepakjadmin
parents:
diff changeset
802 # 13 - 14 Chemical symbol - right justified, except for hydrogen atoms
68300206e90d Uploaded
deepakjadmin
parents:
diff changeset
803 #
68300206e90d Uploaded
deepakjadmin
parents:
diff changeset
804 # And for amino acids:
68300206e90d Uploaded
deepakjadmin
parents:
diff changeset
805 #
68300206e90d Uploaded
deepakjadmin
parents:
diff changeset
806 # 15 Remoteness indicator (alphabetic) (A, B, G, D, E, Z and so on)
68300206e90d Uploaded
deepakjadmin
parents:
diff changeset
807 # 16 Branch designator (numeric)
68300206e90d Uploaded
deepakjadmin
parents:
diff changeset
808 #
68300206e90d Uploaded
deepakjadmin
parents:
diff changeset
# Parse an ATOM or HETATM record line into its individual fields.
#
# Argument: the record line.
#
# Returns (AtomNumber, AtomName, AlternateLocation, ResidueName, ChainID,
# ResidueNumber, InsertionCode, X, Y, Z, Occupancy, TemperatureFactor,
# SegmentID, ElementSymbol, AtomCharge) with all blanks removed from each
# value. Fields that are missing or blank in the line come back as empty
# strings. A line that does not start with ATOM or HETATM yields fifteen
# undefined values.
#
sub _ParseAtomOrHetatmRecordLine {
  my($Line) = @_;

  if ($Line !~ /^(ATOM|HETATM)/i) {
    return ((undef) x 15);
  }

  # Skipping past the end of the string with 'x' is fatal in unpack, which a
  # truncated record would trigger. Pad the line with blanks through column 80
  # so one template covers both short records (no segment ID, element symbol or
  # charge) and complete ones.
  my($PaddedLine) = sprintf("%-80s", $Line);

  my($AtomNumber, $AtomName, $AlternateLocation, $ResidueName, $ChainID, $ResidueNumber, $InsertionCode, $X, $Y, $Z, $Occupancy, $TemperatureFactor, $SegmentID, $ElementSymbol, $AtomCharge) = map {s/ //g; $_} unpack("x6A5xA4A1A3xA1A4A1x3A8A8A8A6A6x6A4A2A2", $PaddedLine);

  return($AtomNumber, $AtomName, $AlternateLocation, $ResidueName, $ChainID, $ResidueNumber, $InsertionCode, $X, $Y, $Z, $Occupancy, $TemperatureFactor, $SegmentID, $ElementSymbol, $AtomCharge);
}
68300206e90d Uploaded
deepakjadmin
parents:
diff changeset
829
68300206e90d Uploaded
deepakjadmin
parents:
diff changeset
# Generate ATOM/HETATM record line...
#
# Arguments, in order: RecordType, AtomNumber, AtomName, AlternateLocation,
# ResidueName, ChainID, ResidueNumber, InsertionCode, X, Y, Z, Occupancy,
# TemperatureFactor, SegmentID, ElementSymbol, AtomCharge.
#
# Returns an 80 column record line. Every value is cut to the width of its
# field; coordinates, occupancy and temperature factor are written as supplied,
# so the caller is expected to pass them already formatted.
#
sub _GenerateAtomOrHetatmRecordLine {
  my($RecordType, $AtomNumber, $AtomName, $AlternateLocation, $ResidueName, $ChainID, $ResidueNumber, $InsertionCode, $X, $Y, $Z, $Occupancy, $TemperatureFactor, $SegmentID, $ElementSymbol, $AtomCharge) = @_;
  my($AtomNameFormat, $Format);

  # The atom name occupies columns 13 - 16 and starts at column 13 or 14...
  if (length($AtomName) >= 4) {
    # Left justified starting at column 13 for all atom names of length 4...
    $AtomNameFormat = "%-4.4s";
  }
  elsif (IsEmpty($ElementSymbol)) {
    # No element symbol specified; just guess from atom name to cover most likely cases.
    # NOTE(review): IsEmpty is defined outside this block; presumably true for
    # undefined or blank values.
    $AtomNameFormat = ($AtomName =~ /^(C|N|O|S)/i) ? " %-3.3s" : "%-4.4s";
  }
  else {
    # Element symbol specified...
    if ($ElementSymbol =~ /^H$/i) {
      # Hydrogen atom name with <=3 characters is left justified starting at column 14;
      # Otherwise, left justified starting at column 13.
      $AtomNameFormat = (length($AtomName) <= 3) ? " %-3.3s" : "%-4.4s";
    }
    else {
      # Non-hydrogen atom name: one letter element symbols start at column 14 and
      # two letter ones at column 13...
      $AtomNameFormat = (length($ElementSymbol) == 1) ? " %-3.3s" : "%-4.4s";
    }
  }

  # Spell out the blank columns so the output matches the template used to parse
  # these records (x6 A5 x A4 A1 A3 x A1 A4 A1 x3 A8 A8 A8 A6 A6 x6 A4 A2 A2).
  $Format = join('',
    '%-6.6s',                   #  1 -  6  Record name
    '%5.5s',                    #  7 - 11  Atom serial number
    ' ',                        # 12       Blank
    $AtomNameFormat,            # 13 - 16  Atom name
    '%1.1s',                    # 17       Alternate location indicator
    '%3.3s',                    # 18 - 20  Residue name
    ' ',                        # 21       Blank
    '%1.1s',                    # 22       Chain identifier
    '%4.4s',                    # 23 - 26  Residue sequence number
    '%1.1s',                    # 27       Insertion code
    ' ' x 3,                    # 28 - 30  Blank
    '%8.8s', '%8.8s', '%8.8s',  # 31 - 54  X, Y and Z coordinates
    '%6.6s',                    # 55 - 60  Occupancy
    '%6.6s',                    # 61 - 66  Temperature factor
    ' ' x 6,                    # 67 - 72  Blank
    '%-4.4s',                   # 73 - 76  Segment identifier
    '%2.2s',                    # 77 - 78  Element symbol
    '%2.2s'                     # 79 - 80  Charge on the atom
  );

  return sprintf($Format, $RecordType, $AtomNumber, $AtomName, $AlternateLocation, $ResidueName, $ChainID, $ResidueNumber, $InsertionCode, $X, $Y, $Z, $Occupancy, $TemperatureFactor, $SegmentID, $ElementSymbol, $AtomCharge);
}
68300206e90d Uploaded
deepakjadmin
parents:
diff changeset
860
68300206e90d Uploaded
deepakjadmin
parents:
diff changeset
# Check record type...
#
# Arguments: the record line and the record type to compare against.
#
# Returns 1 when the first six columns of the line, with all blanks removed,
# are exactly equal to the specified type (the comparison is case sensitive);
# otherwise 0.
#
sub _IsRecordType {
  my($Line, $SpecifiedType) = @_;

  my($RecordName) = unpack("A6", $Line);
  $RecordName =~ s/ //g;

  if ($RecordName eq $SpecifiedType) {
    return 1;
  }
  return 0;
}
68300206e90d Uploaded
deepakjadmin
parents:
diff changeset
872
68300206e90d Uploaded
deepakjadmin
parents:
diff changeset
# Get record type...
#
# Argument: the record line.
#
# Returns the first six columns of the line with all blanks removed.
#
sub _GetRecordType {
  my($Line) = @_;

  my($RecordName) = unpack("A6", $Line);
  $RecordName =~ s/ //g;

  return $RecordName;
}
68300206e90d Uploaded
deepakjadmin
parents:
diff changeset
882
68300206e90d Uploaded
deepakjadmin
parents:
diff changeset
# Get chains and residues data using ATOM/HETATM records...
#
# Arguments:
#
#   PDBRecordLinesRef             - Reference to a list of PDB record lines.
#   GetChainResiduesBeyondTERFlag - When true, ATOM/HETATM records found after
#                                   the last counted TER record are also added
#                                   to chains collected before it.
#   GetRecordLinesFlag            - When true, the record lines themselves are
#                                   collected for each chain.
#
# Returns a reference to a hash with these keys:
#
#   ChainIDs                         - List of chain IDs in order of appearance.
#   Residues{ChainID}                - List of residue names.
#   ResidueNumbers{ChainID}          - List of residue numbers.
#   Lines{ChainID}                   - List of record lines; stays empty unless
#                                      GetRecordLinesFlag is set.
#   ResidueCount{ChainID}{ResName}   - Number of residues with that name.
#
# Notes:
#   . Chains are counted using TER records up to the first ENDMDL record, and
#     collection stops at the last counted TER record.
#   . Records with no chain ID are assigned to None1, None2 and so on, one label
#     for each TER delimited chain.
#   . A new residue is detected by a change in residue number alone; the
#     insertion code is not considered.
#
sub _GetChainsAndResiduesFromAtomHetatmRecords {
  my($PDBRecordLinesRef, $GetChainResiduesBeyondTERFlag, $GetRecordLinesFlag) = @_;

  my($LineCount, $TotalChainCount, $PreviousResidueNumber, $ChainCount, $DefaultChainID, $DefaultChainLabel, $RecordLine, $ResidueName, $ChainID, $ResidueNumber, %ChainsDataMap);

  # Do a quick chain count using TER record...
  $TotalChainCount = 0;
  LINE: for $RecordLine (@{$PDBRecordLinesRef}) {
    if (IsEndmdlRecordType($RecordLine)) {
      last LINE;
    }
    if (IsTerRecordType($RecordLine)) {
      $TotalChainCount++;
    }
  }

  %ChainsDataMap = (
    ChainIDs => [],
    Residues => {},
    ResidueNumbers => {},
    Lines => {},
    ResidueCount => {},
  );

  # Append a residue to a chain and update its per residue name count...
  my($RecordResidue) = sub {
    my($ResidueChainID, $Name, $Number) = @_;

    push @{$ChainsDataMap{Residues}{$ResidueChainID}}, $Name;
    push @{$ChainsDataMap{ResidueNumbers}{$ResidueChainID}}, $Number;
    $ChainsDataMap{ResidueCount}{$ResidueChainID}{$Name}++;
  };

  $LineCount = 0;
  $ChainCount = 0;
  $DefaultChainLabel = 'None';
  $DefaultChainID = $DefaultChainLabel . ($ChainCount + 1);
  $PreviousResidueNumber = 0;

  LINE: for $RecordLine (@{$PDBRecordLinesRef}) {
    $LineCount++;
    if (IsTerRecordType($RecordLine)) {
      $ChainCount++;
      if ($ChainCount == $TotalChainCount) {
        last LINE;
      }
      # Move on to the label for the chain which follows this TER record. It has
      # to be derived after the count goes up; otherwise the second chain with no
      # chain ID would reuse the label of the first one and be merged into it.
      $DefaultChainID = $DefaultChainLabel . ($ChainCount + 1);
      next LINE;
    }
    if (!(IsAtomRecordType($RecordLine) || IsHetatmRecordType($RecordLine))) {
      next LINE;
    }
    # Only residue name, chain ID and residue number are needed here...
    ($ResidueName, $ChainID, $ResidueNumber) = (ParseAtomRecordLine($RecordLine))[3, 4, 5];

    if (IsEmpty($ChainID)) {
      $ChainID = $DefaultChainID;
    }
    if (exists $ChainsDataMap{Residues}{$ChainID}) {
      # Data for existing chain...
      if ($GetRecordLinesFlag) {
        push @{$ChainsDataMap{Lines}{$ChainID}}, $RecordLine;
      }

      if ($ResidueNumber != $PreviousResidueNumber) {
        # Next residue with in the chain...
        $RecordResidue->($ChainID, $ResidueName, $ResidueNumber);
        $PreviousResidueNumber = $ResidueNumber;
      }
    }
    else {
      # Data for new chain...
      push @{$ChainsDataMap{ChainIDs}}, $ChainID;

      # The list of lines is created for every chain, even when lines are not collected...
      $ChainsDataMap{Lines}{$ChainID} = $GetRecordLinesFlag ? [$RecordLine] : [];

      $RecordResidue->($ChainID, $ResidueName, $ResidueNumber);
      $PreviousResidueNumber = $ResidueNumber;
    }
  }
  if (!$GetChainResiduesBeyondTERFlag) {
    return \%ChainsDataMap;
  }

  # Look for any HETATM residues specified outside TER records which could belong to an existing chain...
  my($LineIndex, $PreviousChainID);
  $PreviousChainID = '';
  $PreviousResidueNumber = 0;

  # LineCount lines have been handled already, so LineCount is the index of the
  # first line not yet looked at. Starting one line earlier would process the
  # last line twice whenever the loop above ran through all the lines.
  LINE: for $LineIndex ($LineCount .. $#{$PDBRecordLinesRef}) {
    $RecordLine = $PDBRecordLinesRef->[$LineIndex];
    if (IsEndmdlRecordType($RecordLine)) {
      last LINE;
    }
    if (!(IsAtomRecordType($RecordLine) || IsHetatmRecordType($RecordLine))) {
      next LINE;
    }
    ($ResidueName, $ChainID, $ResidueNumber) = (ParseAtomRecordLine($RecordLine))[3, 4, 5];
    if (IsEmpty($ChainID)) {
      # Ignore the chains with no ids...
      next LINE;
    }
    if (! exists($ChainsDataMap{Residues}{$ChainID})) {
      # Don't collect any new chains after TER record...
      next LINE;
    }
    if ($GetRecordLinesFlag) {
      push @{$ChainsDataMap{Lines}{$ChainID}}, $RecordLine;
    }
    if ($ResidueNumber != $PreviousResidueNumber || $ChainID ne $PreviousChainID) {
      $RecordResidue->($ChainID, $ResidueName, $ResidueNumber);
      $PreviousChainID = $ChainID;
      $PreviousResidueNumber = $ResidueNumber;
    }
  }
  return \%ChainsDataMap;
}
68300206e90d Uploaded
deepakjadmin
parents:
diff changeset
1018
68300206e90d Uploaded
deepakjadmin
parents:
diff changeset
# Collect chain and residue data from the SEQRES records found in the
# specified PDB record lines and return a reference to a hash containing:
#
#   ChainIDs                            - Chain IDs in order of first appearance
#   Residues{$ChainID}                  - Residue names listed for the chain
#   ResidueNumbers                      - Initialized to an empty hash; not filled here
#   ResidueCount{$ChainID}{$ResidueName} - Number of times a residue name is listed
#
# A SEQRES record with an empty chain ID is assigned a generated ID made up of
# 'None' followed by the running count of chains seen so far.
#
sub _GetChainsAndResiduesFromSeqresRecords {
  my($PDBRecordLinesRef) = @_;

  my(%ChainsDataMap) = (
    ChainIDs => [],
    Residues => {},
    ResidueNumbers => {},
    ResidueCount => {},
  );

  my($DefaultChainLabel) = 'None';
  my($ChainCount) = 0;
  my($DefaultChainID) = $DefaultChainLabel . ($ChainCount + 1);

  for my $RecordLine (@{$PDBRecordLinesRef}) {
    # Anything other than SEQRES records is of no interest...
    next unless IsSeqresRecordType($RecordLine);

    my($RecordSerialNumber, $ChainID, $NumOfResidues, $ResidueNamesString) = ParseSeqresRecordLine($RecordLine);

    if ($RecordSerialNumber == 1) {
      # Serial number 1 marks the first SEQRES line of a new chain; advance
      # the chain count and regenerate the fallback ID to go with it...
      $ChainCount++;
      $DefaultChainID = $DefaultChainLabel . $ChainCount;
    }
    $ChainID = $DefaultChainID if IsEmpty($ChainID);

    my(@RecordResidueNames) = split /[ ]+/, $ResidueNamesString;

    if (!exists $ChainsDataMap{Residues}{$ChainID}) {
      # First record for this chain: register its ID and start its residue list...
      push @{$ChainsDataMap{ChainIDs}}, $ChainID;
      $ChainsDataMap{Residues}{$ChainID} = [];
    }
    push @{$ChainsDataMap{Residues}{$ChainID}}, @RecordResidueNames;

    # Track the number of occurrences of each residue name in the chain...
    for my $ResidueName (@RecordResidueNames) {
      $ChainsDataMap{ResidueCount}{$ChainID}{$ResidueName} += 1;
    }
  }

  return \%ChainsDataMap;
}
68300206e90d Uploaded
deepakjadmin
parents:
diff changeset
1075
68300206e90d Uploaded
deepakjadmin
parents:
diff changeset
1076 1;
68300206e90d Uploaded
deepakjadmin
parents:
diff changeset
1077
68300206e90d Uploaded
deepakjadmin
parents:
diff changeset
1078 __END__
68300206e90d Uploaded
deepakjadmin
parents:
diff changeset
1079
68300206e90d Uploaded
deepakjadmin
parents:
diff changeset
1080 =head1 NAME
68300206e90d Uploaded
deepakjadmin
parents:
diff changeset
1081
68300206e90d Uploaded
deepakjadmin
parents:
diff changeset
1082 PDBFileUtil
68300206e90d Uploaded
deepakjadmin
parents:
diff changeset
1083
68300206e90d Uploaded
deepakjadmin
parents:
diff changeset
1084 =head1 SYNOPSIS
68300206e90d Uploaded
deepakjadmin
parents:
diff changeset
1085
68300206e90d Uploaded
deepakjadmin
parents:
diff changeset
1086 use PDBFileUtil ;
68300206e90d Uploaded
deepakjadmin
parents:
diff changeset
1087
68300206e90d Uploaded
deepakjadmin
parents:
diff changeset
1088 use PDBFileUtil qw(:all);
68300206e90d Uploaded
deepakjadmin
parents:
diff changeset
1089
68300206e90d Uploaded
deepakjadmin
parents:
diff changeset
1090 =head1 DESCRIPTION
68300206e90d Uploaded
deepakjadmin
parents:
diff changeset
1091
68300206e90d Uploaded
deepakjadmin
parents:
diff changeset
1092 B<PDBFileUtil> module provides the following functions:
68300206e90d Uploaded
deepakjadmin
parents:
diff changeset
1093
68300206e90d Uploaded
deepakjadmin
parents:
diff changeset
1094 GenerateAtomOrHetatmRecordLine, GenerateAtomRecordLine, GenerateConectRecordLine,
68300206e90d Uploaded
deepakjadmin
parents:
diff changeset
1095 GenerateEndRecordLine, GenerateHeaderRecordLine, GenerateHeaderRecordTimeStamp,
68300206e90d Uploaded
deepakjadmin
parents:
diff changeset
1096 GenerateHetatmRecordLine, GenerateTerRecordLine, GetAllResidues,
68300206e90d Uploaded
deepakjadmin
parents:
diff changeset
1097 GetChainsAndResidues, GetConectRecordLines, GetExperimentalTechnique,
68300206e90d Uploaded
deepakjadmin
parents:
diff changeset
1098 GetExperimentalTechniqueResolution, GetMinMaxCoords, GetPDBRecordType,
68300206e90d Uploaded
deepakjadmin
parents:
diff changeset
1099 GetRecordTypesCount, IsAtomRecordType, IsConectRecordType, IsEndmdlRecordType,
68300206e90d Uploaded
deepakjadmin
parents:
diff changeset
1100 IsHeaderRecordType, IsHetatmRecordType, IsMasterRecordType, IsModelRecordType,
68300206e90d Uploaded
deepakjadmin
parents:
diff changeset
1101 IsPDBFile, IsSeqresRecordType, IsTerRecordType, ParseAtomOrHetatmRecordLine,
68300206e90d Uploaded
deepakjadmin
parents:
diff changeset
1102 ParseAtomRecordLine, ParseConectRecordLine, ParseExpdtaRecordLine,
68300206e90d Uploaded
deepakjadmin
parents:
diff changeset
1103 ParseHeaderRecordLine, ParseHetatmRecordLine, ParseMasterRecordLine,
68300206e90d Uploaded
deepakjadmin
parents:
diff changeset
1104 ParseRemark2ResolutionRecordLine, ParseSeqresRecordLine, ParseTerRecordLine,
68300206e90d Uploaded
deepakjadmin
parents:
diff changeset
1105 ReadPDBFile
68300206e90d Uploaded
deepakjadmin
parents:
diff changeset
1106
68300206e90d Uploaded
deepakjadmin
parents:
diff changeset
1107 =head1 METHODS
68300206e90d Uploaded
deepakjadmin
parents:
diff changeset
1108
68300206e90d Uploaded
deepakjadmin
parents:
diff changeset
1109 =over 4
68300206e90d Uploaded
deepakjadmin
parents:
diff changeset
1110
68300206e90d Uploaded
deepakjadmin
parents:
diff changeset
1111 =item B<GenerateAtomOrHetatmRecordLine>
68300206e90d Uploaded
deepakjadmin
parents:
diff changeset
1112
68300206e90d Uploaded
deepakjadmin
parents:
diff changeset
1113 $RecordLine = GenerateAtomOrHetatmRecordLine($RecordType,
68300206e90d Uploaded
deepakjadmin
parents:
diff changeset
1114 $AtomNumber, $AtomName, $AlternateLocation, $ResidueName,
68300206e90d Uploaded
deepakjadmin
parents:
diff changeset
1115 $ChainID, $ResidueNumber, $InsertionCode, $X, $Y, $Z,
68300206e90d Uploaded
deepakjadmin
parents:
diff changeset
1116 $Occupancy, $TemperatureFactor, $SegmentID,
68300206e90d Uploaded
deepakjadmin
parents:
diff changeset
1117 $ElementSymbol, $AtomCharge);
68300206e90d Uploaded
deepakjadmin
parents:
diff changeset
1118
68300206e90d Uploaded
deepakjadmin
parents:
diff changeset
1119 Returns ATOM or HETATM record line.
68300206e90d Uploaded
deepakjadmin
parents:
diff changeset
1120
68300206e90d Uploaded
deepakjadmin
parents:
diff changeset
1121 =item B<GenerateAtomRecordLine>
68300206e90d Uploaded
deepakjadmin
parents:
diff changeset
1122
68300206e90d Uploaded
deepakjadmin
parents:
diff changeset
1123 $RecordLine = GenerateAtomRecordLine($AtomNumber,
68300206e90d Uploaded
deepakjadmin
parents:
diff changeset
1124 $AtomName, $AlternateLocation, $ResidueName, $ChainID,
68300206e90d Uploaded
deepakjadmin
parents:
diff changeset
1125 $ResidueNumber, $InsertionCode, $X, $Y, $Z, $Occupancy,
68300206e90d Uploaded
deepakjadmin
parents:
diff changeset
1126 $TemperatureFactor, $SegmentID, $ElementSymbol, $AtomCharge);
68300206e90d Uploaded
deepakjadmin
parents:
diff changeset
1127
68300206e90d Uploaded
deepakjadmin
parents:
diff changeset
1128 Returns ATOM record line.
68300206e90d Uploaded
deepakjadmin
parents:
diff changeset
1129
68300206e90d Uploaded
deepakjadmin
parents:
diff changeset
1130 =item B<GenerateConectRecordLine>
68300206e90d Uploaded
deepakjadmin
parents:
diff changeset
1131
68300206e90d Uploaded
deepakjadmin
parents:
diff changeset
1132 $RecordLine = GenerateConectRecordLine($AtomNum, $BondedAtomNum1,
68300206e90d Uploaded
deepakjadmin
parents:
diff changeset
1133 $BondedAtomNum2, $BondedAtomNum3, $BondedAtomNum4,
68300206e90d Uploaded
deepakjadmin
parents:
diff changeset
1134 $HBondedAtomNum1, $HBondedAtomNum2, $SaltBridgedAtomNum1,
68300206e90d Uploaded
deepakjadmin
parents:
diff changeset
1135 $HBondedAtomNum3, $HBondedAtomNum4, $SaltBridgedAtomNum2);
68300206e90d Uploaded
deepakjadmin
parents:
diff changeset
1136
68300206e90d Uploaded
deepakjadmin
parents:
diff changeset
1137 Returns CONECT record line.
68300206e90d Uploaded
deepakjadmin
parents:
diff changeset
1138
68300206e90d Uploaded
deepakjadmin
parents:
diff changeset
1139 =item B<GenerateHeaderRecordLine>
68300206e90d Uploaded
deepakjadmin
parents:
diff changeset
1140
68300206e90d Uploaded
deepakjadmin
parents:
diff changeset
1141 $RecordLine = GenerateHeaderRecordLine($IDCode, [$Classification,
68300206e90d Uploaded
deepakjadmin
parents:
diff changeset
1142 $Date]);
68300206e90d Uploaded
deepakjadmin
parents:
diff changeset
1143
68300206e90d Uploaded
deepakjadmin
parents:
diff changeset
1144 Returns HEADER record line.
68300206e90d Uploaded
deepakjadmin
parents:
diff changeset
1145
68300206e90d Uploaded
deepakjadmin
parents:
diff changeset
1146 =item B<GenerateHeaderRecordTimeStamp>
68300206e90d Uploaded
deepakjadmin
parents:
diff changeset
1147
68300206e90d Uploaded
deepakjadmin
parents:
diff changeset
1148 $Date = GenerateHeaderRecordTimeStamp();
68300206e90d Uploaded
deepakjadmin
parents:
diff changeset
1149
68300206e90d Uploaded
deepakjadmin
parents:
diff changeset
1150 Returns PDB header time stamp.
68300206e90d Uploaded
deepakjadmin
parents:
diff changeset
1151
68300206e90d Uploaded
deepakjadmin
parents:
diff changeset
1152 =item B<GenerateHetatmRecordLine>
68300206e90d Uploaded
deepakjadmin
parents:
diff changeset
1153
68300206e90d Uploaded
deepakjadmin
parents:
diff changeset
1154 $RecordLine = GenerateHetatmRecordLine($AtomNumber, $AtomName,
68300206e90d Uploaded
deepakjadmin
parents:
diff changeset
1155 $AlternateLocation, $ResidueName, $ChainID, $ResidueNumber,
68300206e90d Uploaded
deepakjadmin
parents:
diff changeset
1156 $InsertionCode, $X, $Y, $Z, $Occupancy, $TemperatureFactor,
68300206e90d Uploaded
deepakjadmin
parents:
diff changeset
1157 $SegmentID, $ElementSymbol, $AtomCharge);
68300206e90d Uploaded
deepakjadmin
parents:
diff changeset
1158
68300206e90d Uploaded
deepakjadmin
parents:
diff changeset
1159 Returns HETATM record line.
68300206e90d Uploaded
deepakjadmin
parents:
diff changeset
1160
68300206e90d Uploaded
deepakjadmin
parents:
diff changeset
1161 =item B<GenerateEndRecordLine>
68300206e90d Uploaded
deepakjadmin
parents:
diff changeset
1162
68300206e90d Uploaded
deepakjadmin
parents:
diff changeset
1163 $RecordLine = GenerateEndRecordLine();
68300206e90d Uploaded
deepakjadmin
parents:
diff changeset
1164
68300206e90d Uploaded
deepakjadmin
parents:
diff changeset
1165 Returns END record line.
68300206e90d Uploaded
deepakjadmin
parents:
diff changeset
1166
68300206e90d Uploaded
deepakjadmin
parents:
diff changeset
1167 =item B<GenerateTerRecordLine>
68300206e90d Uploaded
deepakjadmin
parents:
diff changeset
1168
68300206e90d Uploaded
deepakjadmin
parents:
diff changeset
1169 $RecordLine = GenerateTerRecordLine($SerialNumber, [$ResidueName,
68300206e90d Uploaded
deepakjadmin
parents:
diff changeset
1170 $ChainID, $ResidueNumber, $InsertionCode]);
68300206e90d Uploaded
deepakjadmin
parents:
diff changeset
1171
68300206e90d Uploaded
deepakjadmin
parents:
diff changeset
1172 Returns TER record line.
68300206e90d Uploaded
deepakjadmin
parents:
diff changeset
1173
68300206e90d Uploaded
deepakjadmin
parents:
diff changeset
1174 =item B<GetAllResidues>
68300206e90d Uploaded
deepakjadmin
parents:
diff changeset
1175
68300206e90d Uploaded
deepakjadmin
parents:
diff changeset
1176 $ResiduesDataRef = GetAllResidues($PDBRecordLinesRef);
68300206e90d Uploaded
deepakjadmin
parents:
diff changeset
1177
68300206e90d Uploaded
deepakjadmin
parents:
diff changeset
1178 Gets residue information using ATOM/HETATM records and returns a reference to a hash with
68300206e90d Uploaded
deepakjadmin
parents:
diff changeset
1179 following key/value pairs:
68300206e90d Uploaded
deepakjadmin
parents:
diff changeset
1180
68300206e90d Uploaded
deepakjadmin
parents:
diff changeset
1181 $ResiduesDataRef->{ResidueNames} - Array of all the residues
68300206e90d Uploaded
deepakjadmin
parents:
diff changeset
1182 $ResiduesDataRef->{ResidueCount}{$ResidueName} - Count of residues
68300206e90d Uploaded
deepakjadmin
parents:
diff changeset
1183 $ResiduesDataRef->{AtomResidueNames} - Array of all ATOM residues
68300206e90d Uploaded
deepakjadmin
parents:
diff changeset
1184 $ResiduesDataRef->{AtomResidueCount}{$ResidueName} - Count of
68300206e90d Uploaded
deepakjadmin
parents:
diff changeset
1185 residues in ATOM records
68300206e90d Uploaded
deepakjadmin
parents:
diff changeset
1186 $ResiduesDataRef->{HetatomResidueNames} - List of all HETATM
68300206e90d Uploaded
deepakjadmin
parents:
diff changeset
1187 residues
68300206e90d Uploaded
deepakjadmin
parents:
diff changeset
1188 $ResiduesDataRef->{HetatmResidueCount}{$ResidueName} - Count of
68300206e90d Uploaded
deepakjadmin
parents:
diff changeset
1189 residues in HETATM records
68300206e90d Uploaded
deepakjadmin
parents:
diff changeset
1190
68300206e90d Uploaded
deepakjadmin
parents:
diff changeset
1191 ATOM/HETATM records after the first ENDMDL record are simply ignored.
68300206e90d Uploaded
deepakjadmin
parents:
diff changeset
1192
68300206e90d Uploaded
deepakjadmin
parents:
diff changeset
1193 =item B<GetChainsAndResidues>
68300206e90d Uploaded
deepakjadmin
parents:
diff changeset
1194
68300206e90d Uploaded
deepakjadmin
parents:
diff changeset
1195 $ChainsDataRef = GetChainsAndResidues($PDBRecordLinesRef,
68300206e90d Uploaded
deepakjadmin
parents:
diff changeset
1196 [$RecordsSource, $GetChainResiduesBeyondTERFlag,
68300206e90d Uploaded
deepakjadmin
parents:
diff changeset
1197 $GetRecordLinesFlag]);
68300206e90d Uploaded
deepakjadmin
parents:
diff changeset
1198
68300206e90d Uploaded
deepakjadmin
parents:
diff changeset
1199 Gets chains and residue information using ATOM/HETATM or SEQRES records and returns a reference to a
68300206e90d Uploaded
deepakjadmin
parents:
diff changeset
1200 hash with these keys:
68300206e90d Uploaded
deepakjadmin
parents:
diff changeset
1201
68300206e90d Uploaded
deepakjadmin
parents:
diff changeset
1202 $ChainsDataRef->{ChainIDs} - List of chain IDs with 'None' for
68300206e90d Uploaded
deepakjadmin
parents:
diff changeset
1203 no IDs
68300206e90d Uploaded
deepakjadmin
parents:
diff changeset
1204 $ChainsDataRef->{Residues}{$ChainID} - List of residues in order
68300206e90d Uploaded
deepakjadmin
parents:
diff changeset
1205 of their appearance in a chain
68300206e90d Uploaded
deepakjadmin
parents:
diff changeset
1206 $ChainsDataRef->{ResidueCount}{$ChainID}{$ResidueName} - Count of
68300206e90d Uploaded
deepakjadmin
parents:
diff changeset
1207 residues in a chain
68300206e90d Uploaded
deepakjadmin
parents:
diff changeset
1208
68300206e90d Uploaded
deepakjadmin
parents:
diff changeset
1209 Chains and residue data can be extracted using either ATOM/HETATM records or SEQRES records.
68300206e90d Uploaded
deepakjadmin
parents:
diff changeset
1210 ATOM/HETATM records after the first ENDMDL record are simply ignored.
68300206e90d Uploaded
deepakjadmin
parents:
diff changeset
1211
68300206e90d Uploaded
deepakjadmin
parents:
diff changeset
1212 =item B<GetConectRecordLines>
68300206e90d Uploaded
deepakjadmin
parents:
diff changeset
1213
68300206e90d Uploaded
deepakjadmin
parents:
diff changeset
1214 $ConectRecordLinesRef = GetConectRecordLines($PDBRecordLinesRef,
68300206e90d Uploaded
deepakjadmin
parents:
diff changeset
1215 $AtomNumbersMapRef);
68300206e90d Uploaded
deepakjadmin
parents:
diff changeset
1216
68300206e90d Uploaded
deepakjadmin
parents:
diff changeset
1217 Collects CONECT record lines for specified atom numbers, modifies the record data to exclude any atom
68300206e90d Uploaded
deepakjadmin
parents:
diff changeset
1218 number not present in the list of specified atom numbers and returns a reference to list of
68300206e90d Uploaded
deepakjadmin
parents:
diff changeset
1219 CONECT record lines.
68300206e90d Uploaded
deepakjadmin
parents:
diff changeset
1220
68300206e90d Uploaded
deepakjadmin
parents:
diff changeset
1221 =item B<GetExperimentalTechnique>
68300206e90d Uploaded
deepakjadmin
parents:
diff changeset
1222
68300206e90d Uploaded
deepakjadmin
parents:
diff changeset
1223 $ExperimentalTechnique = GetExperimentalTechnique($PDBRecordLinesRef);
68300206e90d Uploaded
deepakjadmin
parents:
diff changeset
1224
68300206e90d Uploaded
deepakjadmin
parents:
diff changeset
1225 Returns I<ExperimentalTechnique> value retrieved from EXPDTA record line.
68300206e90d Uploaded
deepakjadmin
parents:
diff changeset
1226
68300206e90d Uploaded
deepakjadmin
parents:
diff changeset
1227 =item B<GetExperimentalTechniqueResolution>
68300206e90d Uploaded
deepakjadmin
parents:
diff changeset
1228
68300206e90d Uploaded
deepakjadmin
parents:
diff changeset
1229 ($Resolution, $ResolutionUnits) = GetExperimentalTechniqueResolution(
68300206e90d Uploaded
deepakjadmin
parents:
diff changeset
1230 $PDBRecordLinesRef);
68300206e90d Uploaded
deepakjadmin
parents:
diff changeset
1231
68300206e90d Uploaded
deepakjadmin
parents:
diff changeset
1232 Returns I<Resolution> and I<ResolutionUnits> values from REMARK 2 RESOLUTION
68300206e90d Uploaded
deepakjadmin
parents:
diff changeset
1233 record line.
68300206e90d Uploaded
deepakjadmin
parents:
diff changeset
1234
68300206e90d Uploaded
deepakjadmin
parents:
diff changeset
1235 =item B<GetMinMaxCoords>
68300206e90d Uploaded
deepakjadmin
parents:
diff changeset
1236
68300206e90d Uploaded
deepakjadmin
parents:
diff changeset
1237 ($XMin, $YMin, $ZMin, $XMax, $YMax, $ZMax) =
68300206e90d Uploaded
deepakjadmin
parents:
diff changeset
1238 GetMinMaxCoords($PDBRecordLinesRef);
68300206e90d Uploaded
deepakjadmin
parents:
diff changeset
1239
68300206e90d Uploaded
deepakjadmin
parents:
diff changeset
1240 Returns minimum and maximum XYZ coordinates for ATOM/HETATM records.
68300206e90d Uploaded
deepakjadmin
parents:
diff changeset
1241
68300206e90d Uploaded
deepakjadmin
parents:
diff changeset
1242 =item B<GetPDBRecordType>
68300206e90d Uploaded
deepakjadmin
parents:
diff changeset
1243
68300206e90d Uploaded
deepakjadmin
parents:
diff changeset
1244 $RecordType = GetPDBRecordType($RecordLine);
68300206e90d Uploaded
deepakjadmin
parents:
diff changeset
1245
68300206e90d Uploaded
deepakjadmin
parents:
diff changeset
1246 Returns type of I<RecordLine>.
68300206e90d Uploaded
deepakjadmin
parents:
diff changeset
1247
68300206e90d Uploaded
deepakjadmin
parents:
diff changeset
1248 =item B<GetRecordTypesCount>
68300206e90d Uploaded
deepakjadmin
parents:
diff changeset
1249
68300206e90d Uploaded
deepakjadmin
parents:
diff changeset
1250 $RecordTypeDataRef = GetRecordTypesCount($PDBRecordLinesRef,
68300206e90d Uploaded
deepakjadmin
parents:
diff changeset
1251 [$SpecifiedRecordType, $GetRecordLinesFlag]);
68300206e90d Uploaded
deepakjadmin
parents:
diff changeset
1252
68300206e90d Uploaded
deepakjadmin
parents:
diff changeset
1253 Counts the number of each record type or a $SpecifiedRecordType and returns a reference to data
68300206e90d Uploaded
deepakjadmin
parents:
diff changeset
1254 type with following key/value pairs:
68300206e90d Uploaded
deepakjadmin
parents:
diff changeset
1255
68300206e90d Uploaded
deepakjadmin
parents:
diff changeset
1256 $RecordTypeDataRef->{RecordTypes} - An array of unique record types
68300206e90d Uploaded
deepakjadmin
parents:
diff changeset
1257 in order of their presence in the file
68300206e90d Uploaded
deepakjadmin
parents:
diff changeset
1258 $RecordTypeDataRef->{Count}{$RecordType} - Count of each record type
68300206e90d Uploaded
deepakjadmin
parents:
diff changeset
1259 $RecordTypeDataRef->{Lines}{$RecordType} - Optional lines data for a
68300206e90d Uploaded
deepakjadmin
parents:
diff changeset
1260 specific record type.
68300206e90d Uploaded
deepakjadmin
parents:
diff changeset
1261
68300206e90d Uploaded
deepakjadmin
parents:
diff changeset
1262 =item B<IsAtomRecordType>
68300206e90d Uploaded
deepakjadmin
parents:
diff changeset
1263
68300206e90d Uploaded
deepakjadmin
parents:
diff changeset
1264 $Status = IsAtomRecordType($RecordLine);
68300206e90d Uploaded
deepakjadmin
parents:
diff changeset
1265
68300206e90d Uploaded
deepakjadmin
parents:
diff changeset
1266 Returns 1 or 0 based on whether it's an ATOM record line.
68300206e90d Uploaded
deepakjadmin
parents:
diff changeset
1267
68300206e90d Uploaded
deepakjadmin
parents:
diff changeset
1268 =item B<IsConectRecordType>
68300206e90d Uploaded
deepakjadmin
parents:
diff changeset
1269
68300206e90d Uploaded
deepakjadmin
parents:
diff changeset
1270 $Status = IsConectRecordType($RecordLine);
68300206e90d Uploaded
deepakjadmin
parents:
diff changeset
1271
68300206e90d Uploaded
deepakjadmin
parents:
diff changeset
1272 Returns 1 or 0 based on whether it's a CONECT record line.
68300206e90d Uploaded
deepakjadmin
parents:
diff changeset
1273
68300206e90d Uploaded
deepakjadmin
parents:
diff changeset
1274 =item B<IsEndmdlRecordType>
68300206e90d Uploaded
deepakjadmin
parents:
diff changeset
1275
68300206e90d Uploaded
deepakjadmin
parents:
diff changeset
1276 $Status = IsEndmdlRecordType($RecordLine);
68300206e90d Uploaded
deepakjadmin
parents:
diff changeset
1277
68300206e90d Uploaded
deepakjadmin
parents:
diff changeset
1278 Returns 1 or 0 based on whether it's an ENDMDL record line.
68300206e90d Uploaded
deepakjadmin
parents:
diff changeset
1279
68300206e90d Uploaded
deepakjadmin
parents:
diff changeset
1280 =item B<IsHeaderRecordType>
68300206e90d Uploaded
deepakjadmin
parents:
diff changeset
1281
68300206e90d Uploaded
deepakjadmin
parents:
diff changeset
1282 $Status = IsHeaderRecordType($RecordLine);
68300206e90d Uploaded
deepakjadmin
parents:
diff changeset
1283
68300206e90d Uploaded
deepakjadmin
parents:
diff changeset
1284 Returns 1 or 0 based on whether it's a HEADER record line.
68300206e90d Uploaded
deepakjadmin
parents:
diff changeset
1285
68300206e90d Uploaded
deepakjadmin
parents:
diff changeset
1286 =item B<IsHetatmRecordType>
68300206e90d Uploaded
deepakjadmin
parents:
diff changeset
1287
68300206e90d Uploaded
deepakjadmin
parents:
diff changeset
1288 $Status = IsHetatmRecordType($RecordLine);
68300206e90d Uploaded
deepakjadmin
parents:
diff changeset
1289
68300206e90d Uploaded
deepakjadmin
parents:
diff changeset
1290 Returns 1 or 0 based on whether it's a HETATM record line.
68300206e90d Uploaded
deepakjadmin
parents:
diff changeset
1291
68300206e90d Uploaded
deepakjadmin
parents:
diff changeset
1292 =item B<IsMasterRecordType>
68300206e90d Uploaded
deepakjadmin
parents:
diff changeset
1293
68300206e90d Uploaded
deepakjadmin
parents:
diff changeset
1294 $Status = IsMasterRecordType($RecordLine);
68300206e90d Uploaded
deepakjadmin
parents:
diff changeset
1295
68300206e90d Uploaded
deepakjadmin
parents:
diff changeset
1296 Returns 1 or 0 based on whether it's a MASTER record line.
68300206e90d Uploaded
deepakjadmin
parents:
diff changeset
1297
68300206e90d Uploaded
deepakjadmin
parents:
diff changeset
1298 =item B<IsModelRecordType>
68300206e90d Uploaded
deepakjadmin
parents:
diff changeset
1299
68300206e90d Uploaded
deepakjadmin
parents:
diff changeset
1300 $Status = IsModelRecordType($RecordLine);
68300206e90d Uploaded
deepakjadmin
parents:
diff changeset
1301
68300206e90d Uploaded
deepakjadmin
parents:
diff changeset
1302 Returns 1 or 0 based on whether it's a MODEL record line.
68300206e90d Uploaded
deepakjadmin
parents:
diff changeset
1303
68300206e90d Uploaded
deepakjadmin
parents:
diff changeset
1304 =item B<IsPDBFile>
68300206e90d Uploaded
deepakjadmin
parents:
diff changeset
1305
68300206e90d Uploaded
deepakjadmin
parents:
diff changeset
1306 $Status = IsPDBFile($PDBFile);
68300206e90d Uploaded
deepakjadmin
parents:
diff changeset
1307
68300206e90d Uploaded
deepakjadmin
parents:
diff changeset
1308 Returns 1 or 0 based on whether it's a PDB file.
68300206e90d Uploaded
deepakjadmin
parents:
diff changeset
1309
68300206e90d Uploaded
deepakjadmin
parents:
diff changeset
1310 =item B<IsSeqresRecordType>
68300206e90d Uploaded
deepakjadmin
parents:
diff changeset
1311
68300206e90d Uploaded
deepakjadmin
parents:
diff changeset
1312 $Status = IsSeqresRecordType($RecordLine);
68300206e90d Uploaded
deepakjadmin
parents:
diff changeset
1313
68300206e90d Uploaded
deepakjadmin
parents:
diff changeset
1314 Returns 1 or 0 based on whether it's a SEQRES record line.
68300206e90d Uploaded
deepakjadmin
parents:
diff changeset
1315
68300206e90d Uploaded
deepakjadmin
parents:
diff changeset
1316 =item B<IsTerRecordType>
68300206e90d Uploaded
deepakjadmin
parents:
diff changeset
1317
68300206e90d Uploaded
deepakjadmin
parents:
diff changeset
1318 $Status = IsTerRecordType($RecordLine);
68300206e90d Uploaded
deepakjadmin
parents:
diff changeset
1319
68300206e90d Uploaded
deepakjadmin
parents:
diff changeset
1320 Returns 1 or 0 based on whether it's a TER record line.
68300206e90d Uploaded
deepakjadmin
parents:
diff changeset
1321
68300206e90d Uploaded
deepakjadmin
parents:
diff changeset
1322 =item B<ParseAtomOrHetatmRecordLine>
68300206e90d Uploaded
deepakjadmin
parents:
diff changeset
1323
68300206e90d Uploaded
deepakjadmin
parents:
diff changeset
1324 ($AtomNumber, $AtomName, $AlternateLocation, $ResidueName, $ChainID,
68300206e90d Uploaded
deepakjadmin
parents:
diff changeset
1325 $ResidueNumber, $InsertionCode, $X, $Y, $Z, $Occupancy,
68300206e90d Uploaded
deepakjadmin
parents:
diff changeset
1326 $TemperatureFactor, $SegmentID, $ElementSymbol, $AtomCharge) =
68300206e90d Uploaded
deepakjadmin
parents:
diff changeset
1327 ParseAtomOrHetatmRecordLine($RecordLine);
68300206e90d Uploaded
deepakjadmin
parents:
diff changeset
1328
68300206e90d Uploaded
deepakjadmin
parents:
diff changeset
1329 Parses ATOM or HETATM record line.
68300206e90d Uploaded
deepakjadmin
parents:
diff changeset
1330
68300206e90d Uploaded
deepakjadmin
parents:
diff changeset
1331 =item B<ParseAtomRecordLine>
68300206e90d Uploaded
deepakjadmin
parents:
diff changeset
1332
68300206e90d Uploaded
deepakjadmin
parents:
diff changeset
1333 ($AtomNumber, $AtomName, $AlternateLocation, $ResidueName, $ChainID,
68300206e90d Uploaded
deepakjadmin
parents:
diff changeset
1334 $ResidueNumber, $InsertionCode, $X, $Y, $Z, $Occupancy,
68300206e90d Uploaded
deepakjadmin
parents:
diff changeset
1335 $TemperatureFactor, $SegmentID, $ElementSymbol, $AtomCharge) =
68300206e90d Uploaded
deepakjadmin
parents:
diff changeset
1336 ParseAtomRecordLine($RecordLine);
68300206e90d Uploaded
deepakjadmin
parents:
diff changeset
1337
68300206e90d Uploaded
deepakjadmin
parents:
diff changeset
1338 Parses ATOM record line.
68300206e90d Uploaded
deepakjadmin
parents:
diff changeset
1339
68300206e90d Uploaded
deepakjadmin
parents:
diff changeset
1340 =item B<ParseConectRecordLine>
68300206e90d Uploaded
deepakjadmin
parents:
diff changeset
1341
68300206e90d Uploaded
deepakjadmin
parents:
diff changeset
1342 ($AtomNum, $BondedAtomNum1, $BondedAtomNum2, $BondedAtomNum3,
68300206e90d Uploaded
deepakjadmin
parents:
diff changeset
1343 $BondedAtomNum4, $HBondedAtomNum1, $HBondedAtomNum2,
68300206e90d Uploaded
deepakjadmin
parents:
diff changeset
1344 $SaltBridgedAtomNum1, $HBondedAtomNum3, $HBondedAtomNum4,
68300206e90d Uploaded
deepakjadmin
parents:
diff changeset
1345 $SaltBridgedAtomNum2) = ParseConectRecordLine($RecordLine);
68300206e90d Uploaded
deepakjadmin
parents:
diff changeset
1346
68300206e90d Uploaded
deepakjadmin
parents:
diff changeset
1347 Parses CONECT record line.
68300206e90d Uploaded
deepakjadmin
parents:
diff changeset
1348
68300206e90d Uploaded
deepakjadmin
parents:
diff changeset
1349 =item B<ParseExpdtaRecordLine>
68300206e90d Uploaded
deepakjadmin
parents:
diff changeset
1350
68300206e90d Uploaded
deepakjadmin
parents:
diff changeset
1351 ($ContinuationNum, $ExperimentalTechnique) = ParseExpdtaRecordLine($Line);
68300206e90d Uploaded
deepakjadmin
parents:
diff changeset
1352
68300206e90d Uploaded
deepakjadmin
parents:
diff changeset
1353 Parses EXPDTA record line.
68300206e90d Uploaded
deepakjadmin
parents:
diff changeset
1354
68300206e90d Uploaded
deepakjadmin
parents:
diff changeset
1355 =item B<ParseHeaderRecordLine>
68300206e90d Uploaded
deepakjadmin
parents:
diff changeset
1356
68300206e90d Uploaded
deepakjadmin
parents:
diff changeset
1357 ($Classification, $DepositionDate, $IDCode) = ParseHeaderRecordLine($RecordLine);
68300206e90d Uploaded
deepakjadmin
parents:
diff changeset
1358
68300206e90d Uploaded
deepakjadmin
parents:
diff changeset
1359 Parses HEADER record line.
68300206e90d Uploaded
deepakjadmin
parents:
diff changeset
1360
68300206e90d Uploaded
deepakjadmin
parents:
diff changeset
1361 =item B<ParseHetatmRecordLine>
68300206e90d Uploaded
deepakjadmin
parents:
diff changeset
1362
68300206e90d Uploaded
deepakjadmin
parents:
diff changeset
1363 ($AtomNumber, $AtomName, $AlternateLocation, $ResidueName, $ChainID,
68300206e90d Uploaded
deepakjadmin
parents:
diff changeset
1364 $ResidueNumber, $InsertionCode, $X, $Y, $Z, $Occupancy,
68300206e90d Uploaded
deepakjadmin
parents:
diff changeset
1365 $TemperatureFactor, $SegmentID, $ElementSymbol, $AtomCharge) =
68300206e90d Uploaded
deepakjadmin
parents:
diff changeset
1366 ParseHetatmRecordLine($RecordLine);
68300206e90d Uploaded
deepakjadmin
parents:
diff changeset
1367
68300206e90d Uploaded
deepakjadmin
parents:
diff changeset
1368 Parses HETATM record line.
68300206e90d Uploaded
deepakjadmin
parents:
diff changeset
1369
68300206e90d Uploaded
deepakjadmin
parents:
diff changeset
1370 =item B<ParseMasterRecordLine>
68300206e90d Uploaded
deepakjadmin
parents:
diff changeset
1371
68300206e90d Uploaded
deepakjadmin
parents:
diff changeset
1372 ($NumOfRemarkRecords, $NumOfHetRecords, $NumOfHelixRecords,
68300206e90d Uploaded
deepakjadmin
parents:
diff changeset
1373 $NumOfSheetRecords, $NumOfTurnRecords, $NumOfSiteRecords,
68300206e90d Uploaded
deepakjadmin
parents:
diff changeset
1374 $NumOfTransformationsRecords, $NumOfAtomAndHetatmRecords,
68300206e90d Uploaded
deepakjadmin
parents:
diff changeset
1375 $NumOfTerRecords, $NumOfConectRecords, $NumOfSeqresRecords) =
68300206e90d Uploaded
deepakjadmin
parents:
diff changeset
1376 ParseMasterRecordLine($RecordLine);
68300206e90d Uploaded
deepakjadmin
parents:
diff changeset
1377
68300206e90d Uploaded
deepakjadmin
parents:
diff changeset
1378 Parses MASTER record line.
68300206e90d Uploaded
deepakjadmin
parents:
diff changeset
1379
68300206e90d Uploaded
deepakjadmin
parents:
diff changeset
1380 =item B<ParseRemark2ResolutionRecordLine>
68300206e90d Uploaded
deepakjadmin
parents:
diff changeset
1381
68300206e90d Uploaded
deepakjadmin
parents:
diff changeset
1382 ($Resolution, $ResolutionUnits) = ParseRemark2ResolutionRecordLine(
68300206e90d Uploaded
deepakjadmin
parents:
diff changeset
1383 $RecordLine);
68300206e90d Uploaded
deepakjadmin
parents:
diff changeset
1384
68300206e90d Uploaded
deepakjadmin
parents:
diff changeset
1385 Parses REMARK 2 RESOLUTION record line.
68300206e90d Uploaded
deepakjadmin
parents:
diff changeset
1386
68300206e90d Uploaded
deepakjadmin
parents:
diff changeset
1387 =item B<ParseSeqresRecordLine>
68300206e90d Uploaded
deepakjadmin
parents:
diff changeset
1388
68300206e90d Uploaded
deepakjadmin
parents:
diff changeset
1389 ($RecordSerialNumber, $ChainID, $NumOfResidues, $ResidueNames) =
68300206e90d Uploaded
deepakjadmin
parents:
diff changeset
1390 ParseSeqresRecordLine($RecordLine);
68300206e90d Uploaded
deepakjadmin
parents:
diff changeset
1391
68300206e90d Uploaded
deepakjadmin
parents:
diff changeset
1392 Parses SEQRES record line.
68300206e90d Uploaded
deepakjadmin
parents:
diff changeset
1393
68300206e90d Uploaded
deepakjadmin
parents:
diff changeset
1394 =item B<ParseTerRecordLine>
68300206e90d Uploaded
deepakjadmin
parents:
diff changeset
1395
68300206e90d Uploaded
deepakjadmin
parents:
diff changeset
1396 ($SerialNumber, $ResidueName, $ChainID, $ResidueNumber, $InsertionCode) =
68300206e90d Uploaded
deepakjadmin
parents:
diff changeset
1397 ParseTerRecordLine($RecordLine);
68300206e90d Uploaded
deepakjadmin
parents:
diff changeset
1398
68300206e90d Uploaded
deepakjadmin
parents:
diff changeset
1399 Parses TER record line.
68300206e90d Uploaded
deepakjadmin
parents:
diff changeset
1400
68300206e90d Uploaded
deepakjadmin
parents:
diff changeset
1401 =item B<ReadPDBFile>
68300206e90d Uploaded
deepakjadmin
parents:
diff changeset
1402
68300206e90d Uploaded
deepakjadmin
parents:
diff changeset
1403 $PDBRecordLinesRef = ReadPDBFile($PDBFile);
68300206e90d Uploaded
deepakjadmin
parents:
diff changeset
1404
68300206e90d Uploaded
deepakjadmin
parents:
diff changeset
1405 Reads PDB file and returns reference to record lines.
68300206e90d Uploaded
deepakjadmin
parents:
diff changeset
1406
68300206e90d Uploaded
deepakjadmin
parents:
diff changeset
1407 =back
68300206e90d Uploaded
deepakjadmin
parents:
diff changeset
1408
68300206e90d Uploaded
deepakjadmin
parents:
diff changeset
1409 =head1 AUTHOR
68300206e90d Uploaded
deepakjadmin
parents:
diff changeset
1410
68300206e90d Uploaded
deepakjadmin
parents:
diff changeset
1411 Manish Sud <msud@san.rr.com>
68300206e90d Uploaded
deepakjadmin
parents:
diff changeset
1412
68300206e90d Uploaded
deepakjadmin
parents:
diff changeset
1413 =head1 SEE ALSO
68300206e90d Uploaded
deepakjadmin
parents:
diff changeset
1414
68300206e90d Uploaded
deepakjadmin
parents:
diff changeset
1415 FileUtil.pm, SequenceFileUtil.pm, TextUtil.pm
68300206e90d Uploaded
deepakjadmin
parents:
diff changeset
1416
68300206e90d Uploaded
deepakjadmin
parents:
diff changeset
1417 =head1 COPYRIGHT
68300206e90d Uploaded
deepakjadmin
parents:
diff changeset
1418
68300206e90d Uploaded
deepakjadmin
parents:
diff changeset
1419 Copyright (C) 2015 Manish Sud. All rights reserved.
68300206e90d Uploaded
deepakjadmin
parents:
diff changeset
1420
68300206e90d Uploaded
deepakjadmin
parents:
diff changeset
1421 This file is part of MayaChemTools.
68300206e90d Uploaded
deepakjadmin
parents:
diff changeset
1422
68300206e90d Uploaded
deepakjadmin
parents:
diff changeset
1423 MayaChemTools is free software; you can redistribute it and/or modify it under
68300206e90d Uploaded
deepakjadmin
parents:
diff changeset
1424 the terms of the GNU Lesser General Public License as published by the Free
68300206e90d Uploaded
deepakjadmin
parents:
diff changeset
1425 Software Foundation; either version 3 of the License, or (at your option)
68300206e90d Uploaded
deepakjadmin
parents:
diff changeset
1426 any later version.
68300206e90d Uploaded
deepakjadmin
parents:
diff changeset
1427
68300206e90d Uploaded
deepakjadmin
parents:
diff changeset
1428 =cut