//  ==================================================================== //
//                                                                       //
//    File      : SQ_GroupData.cxx                                       //
//    Purpose   : Classes to store global information about sequences    //
//                                                                       //
//                                                                       //
//  Coded by Juergen Huber in July 2003 - February 2004                  //
//  Coded by Kai Bader (baderk@in.tum.de) in 2007 - 2008                 //
//  Copyright Department of Microbiology (Technical University Munich)   //
//                                                                       //
//  Visit our web site at: http://www.arb-home.de/                       //
//                                                                       //
//  ==================================================================== //


#include <cstdio>
#include <cctype>
#include "SQ_GroupData.h"

using namespace std;

SQ_GroupData::SQ_GroupData() {
    size = 0;
    avg_bases = 0;
    nr_sequences = 0;
    gc_prop = 0;
    initialized = false;
}

SQ_GroupData::~SQ_GroupData() {
}

consensus_result SQ_GroupData_RNA::SQ_calc_consensus(const char *sequence) const {
    consensus_result cr;
    cr.conformity = 0;
    cr.deviation = 0;

    for (int i = 0; i < size; i++) {
        int current[6] = { 0, 0, 0, 0, 0, 0 };

        // fill up current with decoded iupac values
        switch (sequence[i]) {
        case 'a':
        case 'A':
            current[0] = 100;
            break;
        case 't':
        case 'T':
            current[1] = 100;
            break;
        case 'c':
        case 'C':
            current[2] = 100;
            break;
        case 'g':
        case 'G':
            current[3] = 100;
            break;
        case 'u':
        case 'U':
            current[1] = 100;
            break;
        case 'r':
        case 'R':
            current[0] = 50;
            current[3] = 50;
            break;
        case 'y':
        case 'Y':
            current[2] = 50;
            current[1] = 50;
            break;
        case 'm':
        case 'M':
            current[0] = 50;
            current[2] = 50;
            break;
        case 'k':
        case 'K':
            current[3] = 50;
            current[1] = 50;
            break;
        case 'w':
        case 'W':
            current[0] = 50;
            current[1] = 50;
            break;
        case 's':
        case 'S':
            current[3] = 50;
            current[2] = 50;
            break;
        case 'b':
        case 'B':
            current[2] = 33;
            current[1] = 33;
            current[3] = 33;
            break;
        case 'd':
        case 'D':
            current[0] = 33;
            current[1] = 33;
            current[3] = 33;
            break;
        case 'h':
        case 'H':
            current[2] = 33;
            current[1] = 33;
            current[0] = 33;
            break;
        case 'v':
        case 'V':
            current[0] = 33;
            current[2] = 33;
            current[3] = 33;
            break;
        case 'n':
        case 'N':
        case 'x':
        case 'X':
            current[2] = 25;
            current[1] = 25;
            current[0] = 25;
            current[3] = 25;
            break;
        case '.':
            current[4] = 1;
            break;
        case '-':
            current[5] = 1;
            break;
        default:
            seq_assert(0);
            // unhandled character
            break;

        }

        int *cs = consensus[i].i;
        double sum = (double) (cs[0] + cs[1] + cs[2] + cs[3] + cs[4] + cs[5]);

        for (int j = 0; j < 6; j++) {
            int currentj = current[j];
            if (currentj > 0) {
                if (cs[j] > currentj) {
                    cr.conformity += (double) (cs[j] - currentj) / sum;
                }
                else {
                    cr.deviation += current[j];
                }
            }
        }
    }

    cr.conformity = cr.conformity / size; // set conformity in relation to sequencelength
    cr.deviation = cr.deviation / size; // set deviation in relation to sequencelength
    return cr;
}

void SQ_GroupData_RNA::SQ_add_sequence(const char *sequence) {
    for (int i = 0; i < size; i++) {
        int *cs = consensus[i].i;
        switch (sequence[i]) {
        case 'a':
        case 'A':
            cs[0] += 100;
            break;
        case 't':
        case 'T':
            cs[1] += 100;
            break;
        case 'c':
        case 'C':
            cs[2] += 100;
            break;
        case 'g':
        case 'G':
            cs[3] += 100;
            break;
        case 'u':
        case 'U':
            cs[1] += 100;
            break;
        case 'r':
        case 'R':
            cs[0] += 50;
            cs[3] += 50;
            break;
        case 'y':
        case 'Y':
            cs[2] += 50;
            cs[1] += 50;
            break;
        case 'm':
        case 'M':
            cs[0] += 50;
            cs[2] += 50;
            break;
        case 'k':
        case 'K':
            cs[3] += 50;
            cs[1] += 50;
            break;
        case 'w':
        case 'W':
            cs[0] += 50;
            cs[1] += 50;
            break;
        case 's':
        case 'S':
            cs[3] += 50;
            cs[2] += 50;
            break;
        case 'b':
        case 'B':
            cs[2] += 33;
            cs[1] += 33;
            cs[3] += 33;
            break;
        case 'd':
        case 'D':
            cs[0] += 33;
            cs[1] += 33;
            cs[3] += 33;
            break;
        case 'h':
        case 'H':
            cs[2] += 33;
            cs[1] += 33;
            cs[0] += 33;
            break;
        case 'v':
        case 'V':
            cs[0] += 33;
            cs[2] += 33;
            cs[3] += 33;
            break;
        case 'n':
        case 'x':
        case 'N':
        case 'X':
            cs[2] += 25;
            cs[1] += 25;
            cs[0] += 25;
            cs[3] += 25;
            break;
        case '.':
            cs[4] += 1;
            break;
        case '-':
            cs[5] += 1;
            break;
        default:
            fprintf(stderr, "Illegal character '%c'", sequence[i]);
            // seq_assert(0);
            // unhandled character
            break;
        }
    }
}

