| Conditions | 22 |
| Total Lines | 86 |
| Code Lines | 61 |
| Lines | 0 |
| Ratio | 0 % |
| Changes | 0 | ||
Small methods make your code easier to understand, in particular if combined with a good name. Besides, if your method is small, finding a good name is usually much easier.
For example, if you find yourself adding comments to a method's body, this is usually a good sign to extract the commented part to a new method, and use the comment as a starting point when coming up with a good name for this new method.
Commonly applied refactorings include:
If many parameters/temporary variables are present:
Complex classes like build.rna_tools.tools.rna_calc_rmsd.lib.rmsd.calculate_rmsd.get_coordinates_pdb() often do a lot of different things. To break such a class down, we need to identify a cohesive component within that class. A common approach to find such a component is to look for fields/methods that share the same prefixes, or suffixes.
Once you have determined the fields that belong together, you can apply the Extract Class refactoring. If the component makes sense as a sub-class, Extract Subclass is also a candidate, and is often faster.
| 1 | #!/usr/bin/env python |
||
| 109 | def get_coordinates_pdb(filename, selection, ignore_selection, ignore_hydrogens, way='all'): |
||
| 110 | """ |
||
| 111 | Get coordinates from the first chain in a pdb file |
||
| 112 | and return a vectorset with all the coordinates. |
||
| 113 | |||
| 114 | """ |
||
| 115 | # PDB files tend to be a bit of a mess. The x, y and z coordinates |
||
| 116 | # are supposed to be in column 31-38, 39-46 and 47-54, but this is not always the case. |
||
| 117 | # Because of this the three first columns containing a decimal is used. |
||
| 118 | # Since the format doesn't require a space between columns, we use the above |
||
| 119 | # column indices as a fallback. |
||
| 120 | x_column = None |
||
| 121 | V = [] |
||
| 122 | # Same with atoms and atom naming. The most robust way to do this is probably |
||
| 123 | # to assume that the atomtype is given in column 3. |
||
| 124 | atoms = [] |
||
| 125 | resi_set = set() |
||
| 126 | if way == "c1p": |
||
| 127 | way_atoms = ["C1'"] |
||
| 128 | elif way == 'pooo': |
||
| 129 | way_atoms = "P OP1 OP2 O5'".split() |
||
| 130 | elif way == 'alpha': |
||
| 131 | way_atoms = "P OP1 OP2 O5' C5'".split() |
||
| 132 | elif way == 'backbone': |
||
| 133 | way_atoms = "P OP1 OP2 O5' C5' C4' C3' O3'".split() |
||
| 134 | elif way == 'po': |
||
| 135 | way_atoms = "P OP1 OP2".split() |
||
| 136 | elif way == 'no-backbone': |
||
| 137 | way_atoms = "C5' C4' O4' C3' O3' C2' O2' C1' N9 C8 N7 C5 C6 O6 N1 C2 N2 N3 C4".split() |
||
| 138 | way_atoms += "N9 C8 N7 C5 C6 N6 N1 C2 N3 C4".split() |
||
| 139 | way_atoms += "N1 C2 O2 N3 C4 O4 C5 C6".split() |
||
| 140 | way_atoms += "N1 C2 O2 N3 C4 N4 C5 C6".split() |
||
| 141 | elif way == 'bases': |
||
| 142 | way_atoms = "N9 C8 N7 C5 C6 O6 N1 C2 N2 N3 C4".split() |
||
| 143 | way_atoms += "N9 C8 N7 C5 C6 N6 N1 C2 N3 C4".split() |
||
| 144 | way_atoms += "N1 C2 O2 N3 C4 O4 C5 C6".split() |
||
| 145 | way_atoms += "N1 C2 O2 N3 C4 N4 C5 C6".split() |
||
| 146 | elif way == 'backbone+sugar': |
||
| 147 | way_atoms = "P OP1 OP2 O5' C5' C4' O4' C3' O3' C2' O2' C1'".split() |
||
| 148 | elif way == 'sugar': |
||
| 149 | way_atoms = "C4' O4' C3' C2' O2' C1'".split() |
||
| 150 | elif way == 'all': |
||
| 151 | way_atoms = "P OP1 OP2 O5' C5' C4' O4' C3' O3' C2' O2' C1' N9 C8 N7 C5 C6 O6 N1 C2 N2 N3 C4".split() |
||
| 152 | way_atoms += "P OP1 OP2 O5' C5' C4' O4' C3' O3' C2' O2' C1' N9 C8 N7 C5 C6 N6 N1 C2 N3 C4".split() |
||
| 153 | way_atoms += "P OP1 OP2 O5' C5' C4' O4' C3' O3' C2' O2' C1' N1 C2 O2 N3 C4 O4 C5 C6".split() |
||
| 154 | way_atoms += "P OP1 OP2 O5' C5' C4' O4' C3' O3' C2' O2' C1' N1 C2 O2 N3 C4 N4 C5 C6".split() |
||
| 155 | |||
| 156 | with open(filename) as f: |
||
| 157 | lines = f.readlines() |
||
| 158 | for line in lines: |
||
| 159 | # hmm... |
||
| 160 | # of models: 490 |
||
| 161 | # Error: # of atoms is not equal target (1f27_rpr.pdb):641 vs model (struc/1f27_rnakbnm_decoy0001_amb_clx_rpr.pdb):408 |
||
| 162 | #if line.startswith("TER") or line.startswith("END"): |
||
| 163 | # break |
||
| 164 | if line.startswith("ATOM"): |
||
| 165 | curr_chain_id = line[21] |
||
| 166 | curr_resi = int(line[22:26]) |
||
| 167 | curr_atom_name = line[12:16].strip() |
||
| 168 | if selection: |
||
| 169 | if curr_chain_id in selection: |
||
| 170 | if curr_resi in selection[curr_chain_id]: |
||
| 171 | # ignore if to be ingored (!) |
||
| 172 | #try: |
||
| 173 | resi_set.add(curr_chain_id + ':' + str(curr_resi)) |
||
| 174 | x = line[30:38] |
||
| 175 | y = line[38:46] |
||
| 176 | z = line[46:54] |
||
| 177 | if ignore_selection: |
||
| 178 | if not is_in_selection(ignore_selection, curr_chain_id, curr_resi, curr_atom_name): |
||
| 179 | if curr_atom_name in way_atoms: |
||
|
|
|||
| 180 | V.append(np.asarray([x,y,z],dtype=float)) |
||
| 181 | else: |
||
| 182 | if curr_atom_name in way_atoms: |
||
| 183 | V.append(np.asarray([x,y,z],dtype=float)) |
||
| 184 | |||
| 185 | else: |
||
| 186 | x = line[30:38] |
||
| 187 | y = line[38:46] |
||
| 188 | z = line[46:54] |
||
| 189 | if curr_atom_name in way_atoms: |
||
| 190 | V.append(np.asarray([x,y,z],dtype=float)) |
||
| 191 | |||
| 192 | V = np.asarray(V) |
||
| 193 | #print filename, resi_set, len(resi_set) |
||
| 194 | return len(V), V |
||
| 195 |