// path: root/kmer_utils.h
// blob: a9d9a1de5b524ca3554e558a2bc2a82d803af243
#include <cstddef>
#include <cstdio>
#include <unordered_map>
using namespace std;

// Kmer functions
// (Declarations only; the definitions are not part of this header.)

// Takes a mutable character buffer `str` and a `length`, and returns nothing,
// so any result must be delivered through `str` itself or other state.
// NOTE(review): the name suggests the characters are rewritten in place as
// numeric codes — confirm against the definition.
void convert_kmer_to_num(char *str, const unsigned long length);

// Returns an unsigned long index computed from the read-only buffer `str`
// for a k-mer size of `kmer`. `current_position` is a non-const pointer, so
// the callee is able to write through it.
// NOTE(review): the roles of `error_pos` and `current_position` are not
// visible here — verify against the definition. Also note the return type is
// `unsigned long`, while index_to_kmer() takes `unsigned long long`; the two
// widths differ on platforms where `long` is 32 bits.
unsigned long num_to_index(const char *str, const int kmer, const long error_pos, long long *current_position);

// Returns a `char *` for the given `index` and k-mer size `kmer`.
// NOTE(review): presumably the inverse of num_to_index(); ownership of the
// returned buffer (who frees it, and how) cannot be told from this
// declaration — confirm before use.
char *index_to_kmer(unsigned long long index, long kmer);

// Utility functions
// (Declarations only; the definitions are not part of this header.)

// Takes a mutable buffer `s`, a character value `c` and a byte count `len`,
// and returns a size_t.
// NOTE(review): presumably strips occurrences of `c` from the first `len`
// bytes of `s` and returns the resulting length — confirm.
size_t strnstrip(char *s, int c, size_t len);

// Maps an unsigned 64-bit `x` to an unsigned 64-bit result.
// NOTE(review): presumably computes 4 raised to the power `x` — confirm,
// including how large values of `x` are handled.
unsigned long long pow_four(unsigned long long x);

// Types and global variables
// Identity hash functor: returns the key unchanged instead of scrambling it.
// Supplied as the hasher of kmer_map, whose keys are already size_t values.
//
// Declared as a named struct rather than `typedef struct { ... } name;`:
// an unnamed class that only has a typedef name for linkage purposes may not
// declare member functions (ill-formed since C++20, diagnosed by clang as
// -Wnon-c-typedef-for-linkage). The type name and behavior are unchanged.
struct kmer_noHash_hash {
	// @param k  key to hash
	// @return   k itself
	size_t operator() (const size_t &k) const {
		return k;
	}
};

// Key-equality functor: two keys match exactly when they compare equal
// with ==. Supplied as the key-equality predicate of kmer_map.
//
// Declared as a named struct rather than `typedef struct { ... } name;`:
// an unnamed class that only has a typedef name for linkage purposes may not
// declare member functions (ill-formed since C++20, diagnosed by clang as
// -Wnon-c-typedef-for-linkage). The type name and behavior are unchanged.
struct kmer_eq {
	// @param x  first key
	// @param y  second key
	// @return   true when x == y
	bool operator() (const size_t &x, const size_t &y) const {
		return x == y;
	}
};

typedef unordered_map<size_t,unsigned long long, kmer_noHash_hash, kmer_eq> kmer_map;

// 256-entry byte table at namespace scope. It has no initializer here, so it
// starts out zero-filled; whatever populates it lives outside this header.
// NOTE(review): presumably a per-character lookup table indexed by an
// unsigned char value — confirm against the code that fills it.
// NOTE(review): this is a definition, not an `extern` declaration, so every
// translation unit that includes this header defines its own `alpha`;
// including it from more than one .cpp file is expected to fail at link time
// with a multiple-definition error. Consider `extern` here plus a single
// definition in one source file.
unsigned char alpha[256]; 
// file loading functions
// (Declarations only; the definitions are not part of this header.)

// Sparse loaders: both return a pointer to a kmer_map, one taking a file
// name and the other an already-open FILE handle, plus a k-mer size `kmer`.
// NOTE(review): ownership of the returned map and the value returned on
// failure are not visible here — confirm before use. The k-mer size is
// `const unsigned int` in the filename variant but plain `int` in the FILE
// variant.
kmer_map *get_sparse_kmer_counts_from_filename(const char *fn, const unsigned int kmer);
kmer_map *get_sparse_kmer_counts_from_file(FILE *fh, int kmer);

// Dense loaders: both return a pointer to unsigned long long, one taking an
// already-open FILE handle and the other a file name, plus a k-mer size.
// NOTE(review): presumably the pointer addresses an array of counts indexed
// by k-mer index; its length and who frees it are not visible here — confirm.
unsigned long long *get_dense_kmer_counts_from_file(FILE *fh, const unsigned int kmer);
unsigned long long *get_dense_kmer_counts_from_filename(const char *fn, const unsigned int kmer);

// Takes a file name, a k-mer size, a `width` and a caller-supplied size_t
// array `arr`, and returns a size_t.
// NOTE(review): presumably fills `arr` with entries read from the file and
// returns how many were stored; the meaning of `width` and the required
// capacity of `arr` are not visible here — confirm. Unlike the loaders above,
// `fn` is a non-const `char *`.
size_t load_specific_mers_from_file(char *fn, unsigned int kmer, size_t width, size_t *arr);
// print functions
// (Declarations only; the definitions are not part of this header.)
//
// Two overloads of print_kmer: the first takes counts as a raw
// unsigned long long array, the second as a kmer_map. Both take the same
// `label` and `nonzero` flags and a k-mer size `kmer`, and return nothing.
// NOTE(review): presumably `label` toggles printing the k-mer text beside
// each count and `nonzero` restricts output to non-zero counts; the output
// destination and format are not visible here — confirm.
void print_kmer(unsigned long long *counts, bool label, bool nonzero, unsigned int kmer);
void print_kmer(kmer_map *counts, bool label, bool nonzero, unsigned int kmer);