File: align-utils.cc

package info (click to toggle)
coot 1.1.18%2Bdfsg-4
  • links: PTS, VCS
  • area: main
  • in suites: forky, sid
  • size: 220,004 kB
  • sloc: cpp: 495,934; python: 35,043; ansic: 26,143; lisp: 22,768; sh: 13,186; makefile: 2,746; awk: 441; xml: 245; csh: 14
file content (92 lines) | stat: -rw-r--r-- 2,603 bytes parent folder | download | duplicates (2)
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
/*
 * utils/align-utils.cc
 *
 * Copyright 2009 by University of Oxford
 * Author: Paul Emsley
 *
 * This program is free software; you can redistribute it and/or modify
 * it under the terms of the GNU Lesser General Public License as published
 * by the Free Software Foundation; either version 3 of the License, or (at
 * your option) any later version.
 *
 * This program is distributed in the hope that it will be useful, but
 * WITHOUT ANY WARRANTY; without even the implied warranty of
 * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the GNU
 * General Public License for more details.
 *
 * You should have received a copy of the GNU General Public License
 * along with this program; if not, write to the Free Software
 * Foundation, Inc., 51 Franklin Street, Fifth Floor, Boston, MA
 * 02110-1301, USA
 */


#include <iostream>
#include <vector>
#include <algorithm>
#include "align-utils.hh"
#ifdef HAVE_CXX11
#include <algorithm>
#endif

// strings with - in them
std::string
coot::alignment_matches(const std::string &aligned,
			const std::string &target) {

   unsigned int la = aligned.size();
   unsigned int lt = target.size();

   if (lt<la) la = lt;

   std::string matches(la, ' ');

   for (unsigned int i=0; i<lt; i++) {
      if (aligned[i] == target[i])
	 matches[i] = '|';
   }

#ifdef HAVE_CXX11
   std::vector<char> aromatics  = {'F', 'W', 'Y'}; // not H interestingly
   std::vector<char> aliphatics = {'A', 'G', 'L', 'V', 'I'};
   std::vector<char> hydroxyls  = {'T', 'Y', 'S', 'C', 'M'}; // and sulfhydryl
   std::vector<char> acidics    = {'D', 'L', 'H'};
   std::vector<char> basics     = {'R', 'E', 'N', 'Q'};
   // std::vector<char> cyclics    = {'P'}; won't make non-P matches

   std::vector<std::vector<char> > types(5);
   types[0] = aromatics;
   types[1] = aliphatics;
   types[2] = hydroxyls;
   types[3] = acidics;
   types[4] = basics;

   for (unsigned int i=0; i<lt; i++) {
      char ca = aligned[i];
      char ta = target[i];
      if (ca != ta) { // we would found it above if this were true
	 if (ca != '-') {
	    if (ta != '-') {
	       for (std::size_t j=0; j<types.size(); j++) {
		  const std::vector<char> &codes = types[j];
		  // are both ca and ta in codes?
		  std::vector<char>::const_iterator it_1;
		  std::vector<char>::const_iterator it_2;
		  it_1 = std::find(codes.begin(), codes.end(), ca);
		  it_2 = std::find(codes.begin(), codes.end(), ta);
		  if (it_1 != codes.end()) {
		     if (it_2 != codes.end()) {
			matches[i] = ':';
			break;
		     }
		  }
	       }
	    }
	 }
      }
   }

#endif

   return matches;
}