poacns.h 59 KB

12345678910111213141516171819202122232425262728293031323334353637383940414243444546474849505152535455565758596061626364656667686970717273747576777879808182838485868788899091929394959697989910010110210310410510610710810911011111211311411511611711811912012112212312412512612712812913013113213313413513613713813914014114214314414514614714814915015115215315415515615715815916016116216316416516616716816917017117217317417517617717817918018118218318418518618718818919019119219319419519619719819920020120220320420520620720820921021121221321421521621721821922022122222322422522622722822923023123223323423523623723823924024124224324424524624724824925025125225325425525625725825926026126226326426526626726826927027127227327427527627727827928028128228328428528628728828929029129229329429529629729829930030130230330430530630730830931031131231331431531631731831932032132232332432532632732832933033133233333433533633733833934034134234334434534634734834935035135235335435535635735835936036136236336436536636736836937037137237337437537637737837938038138238338438538638738838939039139239339439539639739839940040140240340440540640740840941041141241341441541641741841942042142242342442542642742842943043143243343443543643743843944044144244344444544644744844945045145245345445545645745845946046146246346446546646746846947047147247347447547647747847948048148248348448548648748848949049149249349449549649749849950050150250350450550650750850951051151251351451551651751851952052152252352452552652752852953053153253353453553653753853954054154254354454554654754854955055155255355455555655755855956056156256356456556656756856957057157257357457557657757857958058158258358458558658758858959059159259359459559659759859960060160260360460560660760860961061161261361461561661761861962062162262362462562662762862963063163263363463563663763863964064164264364464564664764864965065165265365465565665765865966066166266366466566666766866967067167267367467567667767867968068168268368468568668768868969069169269369469569669769869970070170270370470570670770870971071171271371471571671771871972072172272372472572672772872973073173273373473573673773873974074174274374474574674774874975075175275375475575675775875976076176276376476576676776876977077177277377477577677777877978078178278378478578678778878979079179279379479579679779879980080180280380480580680780880981081181281381481581681781881982082182282382482582682782882983083183283383483583683783883984084184284384484584684784884985085185285385485585685785885986086186286386486586686786886987087187287387487587687787887988088188288388488588688788888989089189289389489589689789889990090190290390490590690790890991091191291391491591691791891992092192292392492592692792892993093193293393493593693793893994094194294394494594694794894995095195295395495595695795895996096196296396496596696796896997097197297397497597697797897998098198298398498598698798898999099199299399499599699799899910001001100210031004100510061007100810091010101110121013101410151016101710181019102010211022102310241025102610271028102910301031103210331034103510361037103810391040104110421043104410451046104710481049105010511052105310541055105610571058105910601061106210631064106510661067106810691070107110721073107410751076107710781079108010811082108310841085108610871088108910901091109210931094109510961097109810991100110111021103110411051106110711081109111011111112111311141115111611171118111911201121112211231124112511261127112811291130113111321133113411351136113711381139114011411142114311441145114611471148114911501151115211531154115511561157115811591160116111621163116411651166116711681169117011711172117311741175117611771178117911801181118211831184118511861187118811891190119111921193119411951196119711981199120012011202120312041205120612071208120912101211121212131214121512161217121812191220122112221223122412251226122712281229123012311232123312341235123612371238123912401241124212431244124512461247124812491250125112521253125412551256125712581259126012611262126312641265126612671268126912701271127212731274127512761277127812791280128112821283128412851286128712881289129012911292129312941295129612971298129913001301130213031304130513061307130813091310131113121313131413151316131713181319132013211322132313241325132613271328132913301331133213331334133513361337133813391340134113421343134413451346134713481349135013511352135313541355135613571358135913601361136213631364136513661367136813691370137113721373137413751376137713781379138013811382138313841385138613871388138913901391139213931394139513961397139813991400140114021403140414051406140714081409141014111412141314141415141614171418141914201421142214231424142514261427142814291430143114321433143414351436143714381439144014411442144314441445144614471448144914501451145214531454145514561457145814591460146114621463146414651466146714681469147014711472147314741475147614771478147914801481148214831484148514861487148814891490149114921493149414951496149714981499150015011502150315041505150615071508150915101511151215131514151515161517151815191520152115221523152415251526152715281529153015311532153315341535153615371538153915401541154215431544154515461547154815491550155115521553155415551556155715581559156015611562156315641565156615671568156915701571157215731574157515761577157815791580158115821583158415851586158715881589159015911592159315941595159615971598159916001601160216031604160516061607160816091610161116121613161416151616161716181619162016211622162316241625162616271628162916301631163216331634163516361637163816391640164116421643164416451646164716481649165016511652165316541655165616571658165916601661166216631664166516661667166816691670167116721673167416751676167716781679168016811682168316841685168616871688168916901691169216931694169516961697169816991700170117021703170417051706170717081709171017111712171317141715171617171718171917201721172217231724172517261727172817291730173117321733173417351736173717381739174017411742174317441745174617471748174917501751175217531754175517561757175817591760176117621763176417651766176717681769177017711772177317741775177617771778177917801781178217831784178517861787178817891790179117921793179417951796179717981799180018011802180318041805180618071808180918101811181218131814181518161817181818191820182118221823182418251826182718281829183018311832183318341835183618371838183918401841184218431844184518461847184818491850185118521853185418551856185718581859186018611862186318641865186618671868186918701871187218731874187518761877187818791880188118821883188418851886188718881889189018911892189318941895189618971898189919001901190219031904190519061907190819091910191119121913191419151916191719181919192019211922192319241925192619271928192919301931193219331934193519361937193819391940194119421943194419451946194719481949195019511952195319541955195619571958195919601961196219631964196519661967196819691970197119721973197419751976197719781979198019811982198319841985198619871988198919901991199219931994199519961997199819992000200120022003200420052006200720082009201020112012201320142015201620172018201920202021202220232024202520262027202820292030203120322033203420352036203720382039204020412042204320442045204620472048204920502051205220532054205520562057205820592060206120622063206420652066206720682069207020712072207320742075207620772078207920802081208220832084208520862087208820892090209120922093209420952096209720982099210021012102210321042105210621072108210921102111211221132114211521162117211821192120212121222123212421252126212721282129213021312132213321342135213621372138213921402141214221432144214521462147214821492150215121522153215421552156215721582159216021612162216321642165216621672168216921702171217221732174217521762177217821792180218121822183218421852186218721882189219021912192219321942195219621972198219922002201220222032204220522062207220822092210221122122213221422152216221722182219222022212222222322242225222622272228222922302231223222332234223522362237223822392240224122422243224422452246224722482249225022512252225322542255225622572258225922602261226222632264226522662267226822692270227122722273227422752276227722782279228022812282228322842285228622872288228922902291229222932294229522962297229822992300230123022303230423052306230723082309231023112312231323142315231623172318231923202321232223232324232523262327232823292330233123322333233423352336233723382339234023412342
  1. /*
  2. *
  3. * Copyright (c) 2018, Jue Ruan <ruanjue@gmail.com>
  4. *
  5. *
  6. * This program is free software: you can redistribute it and/or modify
  7. * it under the terms of the GNU General Public License as published by
  8. * the Free Software Foundation, either version 3 of the License, or
  9. * (at your option) any later version.
  10. *
  11. * This program is distributed in the hope that it will be useful,
  12. * but WITHOUT ANY WARRANTY; without even the implied warranty of
  13. * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
  14. * GNU General Public License for more details.
  15. *
  16. * You should have received a copy of the GNU General Public License
  17. * along with this program. If not, see <http://www.gnu.org/licenses/>.
  18. */
  19. #ifndef PO_MSA_CNS_RJ_H
  20. #define PO_MSA_CNS_RJ_H
  21. #include "bit2vec.h"
  22. #include "dna.h"
  23. #include "chararray.h"
  24. #include "list.h"
  25. #include "hashset.h"
  26. #include <emmintrin.h>
  27. #include <tmmintrin.h>
  28. #if __BYTE_ORDER == 1234
  29. //#pragma message(" ** " __FILE__ " has been tested in LITTLE_ENDIAN **\n")
  30. #else
  31. #pragma message(" ** " __FILE__ " hasn't been tested in BIG_ENDIAN **\n")
  32. #endif
  33. static int cns_debug = 0;
  34. #define POG_RDLEN_MAX 0x7FF8
  35. #define POG_RDCNT_MAX 0x3FFF
  36. #define POG_BASEWIDTH 3
  37. #define POG_BASEMAX 0x3F
  38. #define POG_HEAD_NODE 0
  39. #define POG_TAIL_NODE 1
  40. #define POG_DP_BT_M 0
  41. #define POG_DP_BT_I 1
  42. #define POG_DP_BT_D 2
  43. #define POG_ALNMODE_OVERLAP 0
  44. #define POG_ALNMODE_GLOBAL 1
  45. #define POG_VST_MAX MAX_U2
  46. #define POG_SCORE_MIN (-(MAX_B2 >> 1))
  47. typedef struct {
  48. u2i rid, pos, base;
  49. u2i rbeg, rend, rmax;
  50. u2i nin, vst;
  51. u4i edge, erev;
  52. u4i aligned;
  53. union {
  54. u4i aux;
  55. u4i bpos; // backbone pos
  56. };
  57. u4i coff;
  58. union {
  59. u8i flag;
  60. struct { u4i roff, voff; };
  61. };
  62. } pog_node_t;
  63. define_list(pognodev, pog_node_t);
  64. typedef struct {
  65. u4i node;
  66. u4i cov:31, is_aux:1;
  67. u4i next;
  68. } pog_edge_t;
  69. define_list(pogedgev, pog_edge_t);
  70. typedef struct {
  71. int cnsmode; // 0: gen_cns_pog, 1: dp_call_cns_pog
  72. int refmode;
  73. int alnmode;
  74. int tribase;
  75. int sse;
  76. int near_dialog;
  77. int W_score;
  78. int W, rW, cW; // 64, 16, 8
  79. int Wmax; // 1024
  80. float W_mat_rate; // 0.92
  81. int M, X, I, D, E;
  82. float H; // homopolymer merge
  83. int T; // bonus for end
  84. u4i msa_min_cnt;
  85. float msa_min_freq;
  86. } POGPar;
  87. static const POGPar DEFAULT_POG_PAR = (POGPar){0, 0, POG_ALNMODE_OVERLAP, 0, 1, 0, 0, 64, 16, 8, 1024, 0.92, 2, -5, -2, -4, -1, -3, 20, 3, 0.5};
  88. typedef struct {
  89. u4i coff:29, bt:3;
  90. float max;
  91. } pog_cns_t;
  92. typedef struct {
  93. SeqBank *seqs;
  94. u2v *sbegs, *sends; // suggested [beg, end) on ref(1st seq) in reference-based mode
  95. pognodev *nodes;
  96. pogedgev *edges;
  97. POGPar *par;
  98. b2v *qprof;
  99. b2v *rows;
  100. u4v *rowr;
  101. b2v *btds;
  102. u2v *btvs;
  103. u4v *btxs;
  104. u4v *stack;
  105. u2i backbone;
  106. u4i msa_len;
  107. u1v *msa;
  108. u2v *bcnts[7];
  109. u2v *hcovs;
  110. u1v *cbts;
  111. BaseBank *cns;
  112. u8i ncall;
  113. } POG;
  114. static inline POG* init_pog(POGPar par){
  115. POG *g;
  116. g = malloc(sizeof(POG));
  117. g->seqs = init_seqbank();
  118. g->sbegs = init_u2v(32);
  119. g->sends = init_u2v(32);
  120. g->nodes = init_pognodev(16 * 1024);
  121. g->edges = init_pogedgev(16 * 1024);
  122. g->par = malloc(sizeof(POGPar));
  123. memcpy(g->par, &par, sizeof(POGPar));
  124. g->qprof = init_b2v(4 * 1024);
  125. g->rows = init_b2v(16 * 1024);
  126. g->rowr = init_u4v(64);
  127. g->btds = init_b2v(16 * 1024);
  128. g->btvs = init_u2v(8 * 1024 * 1024);
  129. g->btxs = init_u4v(1024);
  130. g->stack = init_u4v(32);
  131. g->backbone = 0;
  132. g->msa_len = 0;
  133. g->msa = init_u1v(16 * 1024);
  134. g->bcnts[0] = init_u2v(4 * 1024);
  135. g->bcnts[1] = init_u2v(4 * 1024);
  136. g->bcnts[2] = init_u2v(4 * 1024);
  137. g->bcnts[3] = init_u2v(4 * 1024);
  138. g->bcnts[4] = init_u2v(4 * 1024);
  139. g->bcnts[5] = init_u2v(4 * 1024);
  140. g->bcnts[6] = init_u2v(4 * 1024);
  141. g->hcovs = init_u2v(4 * 1024);
  142. g->cbts = init_u1v(5 * 2 * 1024);
  143. g->cns = init_basebank();
  144. g->ncall = 0;
  145. return g;
  146. }
  147. static inline void renew_pog(POG *g){
  148. free_seqbank(g->seqs); g->seqs = init_seqbank();
  149. renew_u2v(g->sbegs, 32);
  150. renew_u2v(g->sends, 32);
  151. renew_pognodev(g->nodes, 16 * 1024);
  152. renew_pogedgev(g->edges, 16 * 1024);
  153. renew_b2v(g->qprof, 4 * 1024);
  154. renew_b2v(g->rows, 16 * 1024);
  155. renew_u4v(g->rowr, 64);
  156. renew_b2v(g->btds, 16 * 1024);
  157. renew_u2v(g->btvs, 8 * 1024 * 1024);
  158. renew_u4v(g->btxs, 16 * 1024);
  159. renew_u4v(g->stack, 32);
  160. renew_u1v(g->msa, 16 * 1024);
  161. renew_u2v(g->bcnts[0], 4 * 1024);
  162. renew_u2v(g->bcnts[1], 4 * 1024);
  163. renew_u2v(g->bcnts[2], 4 * 1024);
  164. renew_u2v(g->bcnts[3], 4 * 1024);
  165. renew_u2v(g->bcnts[4], 4 * 1024);
  166. renew_u2v(g->bcnts[5], 4 * 1024);
  167. renew_u2v(g->bcnts[6], 4 * 1024);
  168. renew_u2v(g->hcovs, 4 * 1024);
  169. renew_u1v(g->cbts, 5 * 2 * 1024);
  170. free_basebank(g->cns); g->cns = init_basebank();
  171. }
  172. static inline void free_pog(POG *g){
  173. free_seqbank(g->seqs);
  174. free_u2v(g->sbegs);
  175. free_u2v(g->sends);
  176. free_pognodev(g->nodes);
  177. free_pogedgev(g->edges);
  178. free_b2v(g->qprof);
  179. free_b2v(g->rows);
  180. free_u4v(g->rowr);
  181. free_b2v(g->btds);
  182. free_u2v(g->btvs);
  183. free_u4v(g->btxs);
  184. free_u4v(g->stack);
  185. free_u1v(g->msa);
  186. free_u2v(g->bcnts[0]);
  187. free_u2v(g->bcnts[1]);
  188. free_u2v(g->bcnts[2]);
  189. free_u2v(g->bcnts[3]);
  190. free_u2v(g->bcnts[4]);
  191. free_u2v(g->bcnts[5]);
  192. free_u2v(g->bcnts[6]);
  193. free_u2v(g->hcovs);
  194. free_u1v(g->cbts);
  195. free_basebank(g->cns);
  196. free(g->par);
  197. free(g);
  198. }
  199. static inline void push_pog_core(POG *g, char *seq, u4i len, u2i refbeg, u2i refend){
  200. if(g->seqs->nseq < POG_RDCNT_MAX){
  201. len = num_min(len, POG_RDLEN_MAX);
  202. push_seqbank(g->seqs, NULL, 0, seq, len);
  203. push_u2v(g->sbegs, refbeg);
  204. push_u2v(g->sends, refend);
  205. }
  206. }
  207. static inline void push_pog(POG *g, char *seq, u1i len){ push_pog_core(g, seq, len, 0, 0); }
  208. static inline void fwdbitpush_pog_core(POG *g, u8i *bits, u8i off, u4i len, u2i refbeg, u2i refend){
  209. if(g->seqs->nseq < POG_RDCNT_MAX){
  210. len = num_min(len, POG_RDLEN_MAX);
  211. fwdbitpush_seqbank(g->seqs, NULL, 0, bits, off, len);
  212. push_u2v(g->sbegs, refbeg);
  213. push_u2v(g->sends, refend);
  214. }
  215. }
  216. static inline void fwdbitpush_pog(POG *g, u8i *bits, u8i off, u4i len){ fwdbitpush_pog_core(g, bits, off, len, 0, 0); }
  217. static inline void revbitpush_pog_core(POG *g, u8i *bits, u8i off, u4i len, u2i refbeg, u2i refend){
  218. if(g->seqs->nseq < POG_RDCNT_MAX){
  219. len = num_min(len, POG_RDLEN_MAX);
  220. revbitpush_seqbank(g->seqs, NULL, 0, bits, off, len);
  221. push_u2v(g->sbegs, refbeg);
  222. push_u2v(g->sends, refend);
  223. }
  224. }
  225. static inline void revbitpush_pog(POG *g, u8i *bits, u8i off, u4i len){ revbitpush_pog_core(g, bits, off, len, 0, 0); }
  226. static inline void print_dot_pog(POG *g, FILE *out){
  227. pog_node_t *n;
  228. pog_edge_t *e;
  229. u4i nidx, eidx;
  230. fprintf(out, "digraph {\n");
  231. fprintf(out, "rankdir=LR\n");
  232. fprintf(out, "N0 [label=\"BEG\"]\n");
  233. fprintf(out, "N1 [label=\"END\"]\n");
  234. for(nidx=POG_TAIL_NODE+1;nidx<g->nodes->size;nidx++){
  235. n = ref_pognodev(g->nodes, nidx);
  236. fprintf(out, "N%u [label=R%u_%u_%c]\n", nidx, n->rid, n->pos, bit_base_table[(n->base) & 0x03]);
  237. }
  238. for(nidx=0;nidx<g->nodes->size;nidx++){
  239. n = ref_pognodev(g->nodes, nidx);
  240. if(n->aligned != nidx){
  241. fprintf(out, "N%u -> N%u [color=magenta style=dashed]\n", nidx, n->aligned);
  242. }
  243. eidx = n->edge;
  244. while(eidx){
  245. e = ref_pogedgev(g->edges, eidx);
  246. #if DEBUG
  247. if(e->next == eidx){
  248. fprintf(stderr, " -- something wrong in %s -- %s:%d --\n", __FUNCTION__, __FILE__, __LINE__); fflush(stderr);
  249. abort();
  250. }
  251. #endif
  252. eidx = e->next;
  253. if(e->is_aux) continue;
  254. fprintf(out, "N%u -> N%u [label=%u]\n", nidx, e->node, e->cov);
  255. }
  256. }
  257. fprintf(out, "}\n");
  258. }
  259. static inline void fprint_dot_pog(POG *g, char *prefix, char *suffix){
  260. FILE *out;
  261. out = open_file_for_write(prefix, suffix, 1);
  262. print_dot_pog(g, out);
  263. fclose(out);
  264. }
  265. static inline void print_vstdot_pog(POG *g, char *fname){
  266. FILE *out;
  267. pog_node_t *n;
  268. pog_edge_t *e;
  269. u4i nidx, eidx;
  270. out = open_file_for_write(fname, NULL, 1);
  271. fprintf(out, "digraph {\n");
  272. for(nidx=0;nidx<g->nodes->size;nidx++){
  273. n = ref_pognodev(g->nodes, nidx);
  274. if(nidx && n->vst == 0) continue;
  275. fprintf(out, "N%u [label=\"N%u:%u:%u:%d\"]\n", nidx, nidx, n->aux, n->nin, n->vst);
  276. eidx = n->edge;
  277. while(eidx){
  278. e = ref_pogedgev(g->edges, eidx);
  279. eidx = e->next;
  280. if(e->is_aux) continue;
  281. fprintf(out, "N%u -> N%u [label=%u]\n", nidx, e->node, e->cov);
  282. }
  283. }
  284. fprintf(out, "}\n");
  285. fclose(out);
  286. }
  287. static inline void print_seqs_pog(POG *g, char *prefix, char *suffix){
  288. FILE *out;
  289. u4i i;
  290. out = open_file_for_write(prefix, suffix, 1);
  291. for(i=0;i<g->seqs->nseq;i++){
  292. fprintf(out, ">S%u len=%u\n", i, g->seqs->rdlens->buffer[i]);
  293. println_fwdseq_basebank(g->seqs->rdseqs, g->seqs->rdoffs->buffer[i], g->seqs->rdlens->buffer[i], out);
  294. }
  295. fclose(out);
  296. }
  297. static inline void print_msa_pog(POG *g, FILE *out){
  298. char *str;
  299. u1i *cns;
  300. u4i i, j, b, e, c, n;
  301. str = malloc(g->msa_len + 1);
  302. fprintf(out, "[POS] ");
  303. for(i=j=0;i<g->msa_len;i++){
  304. if((i % 10) == 0){
  305. fprintf(out, "|%04u", i + 1);
  306. j += 5;
  307. } else if(i >= j){
  308. putc(' ', out);
  309. j ++;
  310. }
  311. }
  312. fputc('\n', out);
  313. for(i=0;i<g->seqs->nseq+1;i++){
  314. if(i == g->seqs->nseq){
  315. fprintf(out, "[CNS] ");
  316. } else {
  317. fprintf(out, "[%03u] ", i);
  318. }
  319. b = i * g->msa_len;
  320. e = b + g->msa_len;
  321. n = 0;
  322. for(j=b;j<e;j++){
  323. c = g->msa->buffer[j];
  324. if(c < 4) n ++;
  325. str[j-b] = "ACGT-acgt*"[c];
  326. //fputc("ACGT-"[c], out);
  327. }
  328. str[e-b] = 0;
  329. fputs(str, out);
  330. if(i == g->seqs->nseq){
  331. fprintf(out, "\t%u\t%u\n", (u4i)g->cns->size, n);
  332. } else {
  333. fprintf(out, "\t%u\t%u\n", g->seqs->rdlens->buffer[i], n);
  334. }
  335. }
  336. fprintf(out, "[POS] ");
  337. cns = ref_u1v(g->msa, g->msa_len * g->seqs->nseq);
  338. for(i=j=b=0;i<g->msa_len;i++){
  339. if(cns[i] < 4){
  340. j ++;
  341. if((j % 10) == 1){
  342. while(b < i){
  343. fputc(' ', out);
  344. b ++;
  345. }
  346. fprintf(out, "|%04u", j);
  347. b += 5;
  348. }
  349. }
  350. }
  351. fprintf(out, "\n");
  352. if(1){
  353. u4i divs[5];
  354. u2i *hcovs;
  355. hcovs = g->hcovs->buffer;
  356. divs[0] = 10000;
  357. divs[1] = 1000;
  358. divs[2] = 100;
  359. divs[3] = 10;
  360. divs[4] = 1;
  361. for(i=0;i<4;i++){
  362. for(j=0;j<g->msa_len;j++){
  363. if(hcovs[j] < divs[i + 1]){
  364. str[j] = ' ';
  365. } else {
  366. str[j] = '0' + ((hcovs[j] % divs[i]) / divs[i + 1]);
  367. }
  368. }
  369. str[j] = 0;
  370. fprintf(out, "[%c ] %s\n", "HCOV"[i], str);
  371. }
  372. }
  373. free(str);
  374. }
  375. static inline pog_node_t* add_node_pog(POG *g, u2i rid, u2i pos, u2i base){
  376. pog_node_t *u;
  377. u = next_ref_pognodev(g->nodes);
  378. ZEROS(u);
  379. u->rid = rid;
  380. u->pos = pos;
  381. u->base = base;
  382. u->aligned = offset_pognodev(g->nodes, u);
  383. return u;
  384. }
  385. static inline pog_edge_t* add_edge_pog(POG *g, pog_node_t *u, pog_node_t *v, int cov, int is_aux){
  386. pog_edge_t *e, *f, *p;
  387. u4i eidx;
  388. #if DEBUG
  389. if(u == v){
  390. fprintf(stderr, " -- something wrong in %s -- %s:%d --\n", __FUNCTION__, __FILE__, __LINE__); fflush(stderr);
  391. abort();
  392. }
  393. #endif
  394. if(u->edge == 0){
  395. e = next_ref_pogedgev(g->edges);
  396. u->edge = offset_pogedgev(g->edges, e);
  397. e->node = offset_pognodev(g->nodes, v);
  398. e->cov = cov;
  399. e->is_aux = is_aux;
  400. e->next = 0;
  401. v->nin ++;
  402. return e;
  403. } else {
  404. e = f = p = NULL;
  405. encap_pogedgev(g->edges, 1);
  406. eidx = u->edge;
  407. while(eidx){
  408. f = ref_pogedgev(g->edges, eidx);
  409. eidx = f->next;
  410. if(f->node == offset_pognodev(g->nodes, v)){
  411. e = f;
  412. break;
  413. }
  414. p = f;
  415. }
  416. if(e == NULL){
  417. e = next_ref_pogedgev(g->edges);
  418. e->node = offset_pognodev(g->nodes, v);
  419. e->cov = cov;
  420. e->is_aux = is_aux;
  421. e->next = 0;
  422. v->nin ++;
  423. } else {
  424. e->is_aux &= is_aux;
  425. e->cov += cov;
  426. if(cov == 0){
  427. return e;
  428. } else if(p == NULL){
  429. return e;
  430. }
  431. // detach e from u->edge
  432. p->next = e->next;
  433. e->next = 0;
  434. }
  435. f = ref_pogedgev(g->edges, u->edge);
  436. if(e->cov > f->cov){
  437. e->next = u->edge;
  438. u->edge = offset_pogedgev(g->edges, e);
  439. } else {
  440. while(f->next){
  441. if(ref_pogedgev(g->edges, f->next)->cov < e->cov){
  442. break;
  443. }
  444. f = ref_pogedgev(g->edges, f->next);
  445. }
  446. e->next = f->next;
  447. f->next = offset_pogedgev(g->edges, e);
  448. }
  449. return e;
  450. }
  451. }
  452. static inline pog_node_t* merge_node_pog(POG *g, pog_node_t *x, pog_node_t *u){
  453. pog_node_t *v, *w;
  454. pog_edge_t *e;
  455. u4i xidx, eidx;
  456. xidx = offset_pognodev(g->nodes, x);
  457. do {
  458. v = ref_pognodev(g->nodes, xidx);
  459. if(v->nin && v->base == u->base){
  460. eidx = u->edge;
  461. while(eidx){
  462. e = ref_pogedgev(g->edges, eidx);
  463. eidx = e->next;
  464. w = ref_pognodev(g->nodes, e->node);
  465. add_edge_pog(g, v, w, e->cov, e->is_aux);
  466. w->nin --; // will delete e
  467. }
  468. u->edge = 0;
  469. break;
  470. }
  471. v = NULL;
  472. } while(xidx != offset_pognodev(g->nodes, x));
  473. u->aligned = x->aligned;
  474. x->aligned = offset_pognodev(g->nodes, u);
  475. return v? v : u;
  476. }
  477. static inline void beg_pog_core(POG *g, BaseBank *cns, u8i off, u2i len, int clear_all){
  478. pog_node_t *head, *tail, *u, *v;
  479. pog_edge_t *e;
  480. u4i i, bb, bk;
  481. g->ncall ++;
  482. if((g->ncall % 16) == 0){
  483. renew_pog(g);
  484. }
  485. clear_and_encap_pognodev(g->nodes, 2 + len);
  486. clear_pogedgev(g->edges);
  487. ZEROS(next_ref_pogedgev(g->edges));
  488. head = next_ref_pognodev(g->nodes);
  489. ZEROS(head);
  490. if(g->par->tribase){
  491. head->base = POG_BASEMAX + 1;
  492. } else {
  493. head->base = 4;
  494. }
  495. head->aligned = POG_HEAD_NODE;
  496. tail = next_ref_pognodev(g->nodes);
  497. ZEROS(tail);
  498. if(g->par->tribase){
  499. tail->base = POG_BASEMAX + 1;
  500. } else {
  501. tail->base = 4;
  502. }
  503. tail->aligned = POG_TAIL_NODE;
  504. u = head;
  505. bk = 0;
  506. // add backbone nodes
  507. g->backbone = len;
  508. for(i=0;i<len;i++){
  509. bb = get_basebank(cns, off + i);
  510. if(g->par->tribase){
  511. bk = ((bk << 2) | bb) & POG_BASEMAX;
  512. } else {
  513. bk = bb;
  514. }
  515. v = add_node_pog(g, g->seqs->nseq, i, bk);
  516. v->bpos = i;
  517. e = add_edge_pog(g, u, v, 0, 1);
  518. u = v;
  519. }
  520. e = add_edge_pog(g, u, tail, 0, 1);
  521. if(clear_all){
  522. clear_seqbank(g->seqs);
  523. clear_u2v(g->sbegs);
  524. clear_u2v(g->sends);
  525. clear_basebank(g->cns);
  526. }
  527. }
  528. static inline void beg_pog(POG *g){
  529. beg_pog_core(g, NULL, 0, 0, 1);
  530. }
  531. static inline void prepare_rd_align_pog(POG *g, u2i rid){
  532. pog_node_t *u, *v;
  533. pog_edge_t *e;
  534. b2i *row, *btds;
  535. u8i rmax;
  536. u4i seqoff, seqlen, seqlex, slen, seqinc;
  537. u4i nidx, eidx, i, j, bb;
  538. seqoff = g->seqs->rdoffs->buffer[rid];
  539. seqlen = g->seqs->rdlens->buffer[rid];
  540. seqlex = roundup_times(seqlen, 8); // 128 = 8 * sizeof(b2i)
  541. slen = seqlex >> 3;
  542. seqinc = seqlex + 8; // seqlex, max_idx, beg, end, and paddings
  543. // init graph
  544. encap_pognodev(g->nodes, seqlen + 2);
  545. encap_pogedgev(g->edges, seqlen + 2);
  546. // estimate cap of g->rows
  547. for(i=0;i<g->nodes->size;i++){
  548. v = ref_pognodev(g->nodes, i);
  549. v->roff = 0;
  550. v->voff = 0;
  551. v->coff = 0;
  552. v->vst = 0;
  553. v->aux = 0;
  554. }
  555. clear_u4v(g->stack);
  556. push_u4v(g->stack, POG_HEAD_NODE);
  557. rmax = 0;
  558. bb = 1;
  559. while(pop_u4v(g->stack, &nidx)){
  560. u = ref_pognodev(g->nodes, nidx);
  561. eidx = u->edge;
  562. while(eidx){
  563. e = ref_pogedgev(g->edges, eidx);
  564. #if DEBUG
  565. if(eidx == e->next){
  566. fprintf(stderr, " -- something wrong in %s -- %s:%d --\n", __FUNCTION__, __FILE__, __LINE__); fflush(stderr);
  567. abort();
  568. }
  569. #endif
  570. eidx = e->next;
  571. v = ref_pognodev(g->nodes, e->node);
  572. if(v->vst == 0){
  573. bb ++;
  574. if(bb > rmax){
  575. rmax = bb;
  576. }
  577. }
  578. v->vst ++;
  579. if(v->vst == v->nin){
  580. push_u4v(g->stack, e->node);
  581. }
  582. }
  583. bb --;
  584. }
  585. #if DEBUG
  586. if(bb){
  587. fprintf(stderr, " -- something wrong in %s -- %s:%d --\n", __FUNCTION__, __FILE__, __LINE__); fflush(stderr);
  588. abort();
  589. }
  590. #endif
  591. rmax += 2;
  592. head_sl_b2v(g->rows, g->rows->n_head);
  593. clear_and_encap_b2v(g->rows, rmax * seqinc + 8);
  594. head_sr_b2v(g->rows, (16 - (((u8i)g->rows->buffer) & 0xF)) >> 1);
  595. head_sl_b2v(g->btds, g->btds->n_head);
  596. clear_and_encap_b2v(g->btds, rmax * seqinc + 8);
  597. head_sr_b2v(g->btds, (16 - (((u8i)g->btds->buffer) & 0xF)) >> 1);
  598. inc_b2v(g->rows, seqinc);
  599. inc_b2v(g->btds, seqinc);
  600. clear_u4v(g->rowr);
  601. bb = 0;
  602. for(i=0;i<g->nodes->size;i++){
  603. v = ref_pognodev(g->nodes, i);
  604. v->vst = 0;
  605. v->erev = bb;
  606. bb += v->nin;
  607. if(i < 2) bb ++; // in case of add mnode
  608. }
  609. clear_u2v(g->btvs);
  610. inc_u2v(g->btvs, 8);
  611. clear_and_inc_u4v(g->btxs, bb + 1);
  612. //g->btxs->buffer[0] = 0;
  613. memset(g->btxs->buffer, 0, (bb + 1) * sizeof(u4i));
  614. u = ref_pognodev(g->nodes, POG_HEAD_NODE);
  615. if(g->rowr->size){
  616. u->coff = u->roff = g->rowr->buffer[--g->rowr->size];
  617. } else {
  618. u->roff = g->rows->size;
  619. inc_b2v(g->rows, seqinc);
  620. u->coff = g->btds->size;
  621. inc_b2v(g->btds, seqinc);
  622. }
  623. row = ref_b2v(g->rows, u->roff);
  624. btds = ref_b2v(g->btds, u->coff);
  625. if(g->par->alnmode == POG_ALNMODE_OVERLAP){ // overlap alignment
  626. memset(row, 0, seqinc * sizeof(b2i));
  627. //row[0] = g->par->T;
  628. } else { // global
  629. __m128i MIN;
  630. MIN = _mm_set1_epi16(POG_SCORE_MIN);
  631. for(j=0;j<slen;j++){
  632. _mm_store_si128(((__m128i*)row) + j, MIN);
  633. }
  634. //row[0] = g->par->T;
  635. }
  636. memset(btds, 0, seqinc * sizeof(b2i));
  637. if(g->par->near_dialog && g->par->W_score <= 0){
  638. row[seqlex] = g->par->W;
  639. row[seqlex + 1] = 0;
  640. row[seqlex + 2] = num_min(Int(seqlex), 2 * g->par->W + 1);
  641. } else {
  642. row[seqlex] = 0;
  643. row[seqlex + 1] = 0;
  644. row[seqlex + 2] = seqlex;
  645. }
  646. }
  647. // SSE
  648. // BANDED, Auto fit the previous-row's max score in center
  649. // OVERLAP
  650. static inline void sse_band_row_rdaln_pog(POG *g, u4i nidx1, u4i nidx2, u4i seqlen, u2i vst, u4i coff1, u4i coff2, u4i roff1, u4i roff2, b2i *qp, int W, int center){
  651. __m128i I, D, H, E, F, S, MAX, MIN, CMP;
  652. __m128i BT, BT1, BT2, BT1_MASK, BT2_MASK, BTX_MASK;
  653. b2i *row1, *row2, *btds;
  654. u4i i, slen, seqlex, beg, end;
  655. int lsth, lstf, msk, mi;
  656. UNUSED(coff1);
  657. slen = (seqlen + 7) / 8;
  658. seqlex = slen * 8;
  659. I = _mm_set1_epi16(g->par->I);
  660. D = _mm_set1_epi16(g->par->D);
  661. MIN = _mm_set1_epi16(POG_SCORE_MIN);
  662. BT1_MASK = _mm_set1_epi16(0b10);
  663. BT2_MASK = _mm_set1_epi16(0b01);
  664. BTX_MASK = _mm_set1_epi16(vst << 2);
  665. row1 = ref_b2v(g->rows, roff1);
  666. row2 = ref_b2v(g->rows, roff2);
  667. btds = ref_b2v(g->btds, coff2);
  668. if(W){
  669. if(center < 0){
  670. if(row1[row1[seqlex]] >= g->par->W_score){
  671. if(g->par->near_dialog){
  672. if(row1[seqlex + 1] > 0 || row1[seqlex + 2] < Int(seqlex)){
  673. if(row1[seqlex] == (row1[seqlex + 1] + row1[seqlex + 2]) / 2){
  674. center = (row1[seqlex + 1] + row1[seqlex + 2]) / 2 + 1;
  675. } else if(row1[seqlex] > (row1[seqlex + 1] + row1[seqlex + 2]) / 2){
  676. center = (row1[seqlex + 1] + row1[seqlex + 2]) / 2 + 2;
  677. } else {
  678. center = (row1[seqlex + 1] + row1[seqlex + 2]) / 2;
  679. }
  680. } else { // first set center
  681. center = row1[seqlex];
  682. }
  683. } else {
  684. center = row1[seqlex];
  685. }
  686. beg = num_max(center - W, row1[seqlex + 1]);
  687. end = num_min(center + 1 + W, row1[seqlex + 2] + 1);
  688. if(end > seqlex) end = seqlex;
  689. } else {
  690. beg = row1[seqlex + 1];
  691. end = num_min(row1[seqlex + 2] + 1, Int(seqlex));
  692. }
  693. } else {
  694. beg = num_max(center - W, row1[seqlex + 1]);
  695. end = num_min(center + 1 + W, row1[seqlex + 2] + 1);
  696. if(end > seqlex) end = seqlex;
  697. }
  698. } else {
  699. beg = 0;
  700. end = seqlex;
  701. }
  702. if(beg & 0x7U) beg = beg & (~0x7U);
  703. if(end & 0x7U) end = (end + 8) & (~0x7U);
  704. beg = beg / 8;
  705. end = (end + 7) / 8;
  706. if(row1[seqlex + 1] >= row1[seqlex + 2]){ // happening in realign mode
  707. for(i=beg*8;i<end*8;i+=8){
  708. _mm_store_si128(((__m128i*)(row1 + i)), MIN);
  709. }
  710. } else {
  711. if(Int(beg * 8) < row1[seqlex + 1]){
  712. for(i=beg*8;Int(i)<row1[seqlex + 1];i+=8){
  713. _mm_store_si128(((__m128i*)(row1 + i)), MIN);
  714. }
  715. }
  716. if(Int(end * 8) > row1[seqlex + 2]){
  717. for(i=row1[seqlex+2];i<end*8;i+=8){
  718. _mm_store_si128(((__m128i*)(row1 + i)), MIN);
  719. }
  720. }
  721. }
  722. if(nidx2 == POG_TAIL_NODE){
  723. while(end * 8 < seqlex){
  724. _mm_store_si128(((__m128i*)(row1)) + end, MIN);
  725. end ++;
  726. }
  727. }
  728. MAX = _mm_set1_epi16(POG_SCORE_MIN);
  729. if(beg){
  730. lstf = lsth = POG_SCORE_MIN;
  731. } else {
  732. if(row1[seqlex + 1] >= row1[seqlex + 2]){
  733. lstf = POG_SCORE_MIN;
  734. lsth = 0; // auto global alignment
  735. } else {
  736. lstf = (g->par->alnmode == POG_ALNMODE_OVERLAP)? 0 : POG_SCORE_MIN;
  737. if(nidx1){
  738. lsth = (g->par->alnmode == POG_ALNMODE_OVERLAP)? 0 : POG_SCORE_MIN;;
  739. } else {
  740. lsth = g->par->T;
  741. }
  742. }
  743. }
  744. for(i=beg;i<end;i++){
  745. E = _mm_load_si128(((__m128i*)(row1)) + i);
  746. H = _mm_slli_si128(E, 2);
  747. H = _mm_insert_epi16(H, lsth, 0);
  748. H = _mm_adds_epi16(H, _mm_load_si128(((__m128i*)qp) + i));
  749. lsth = _mm_extract_epi16(E, 7);
  750. E = _mm_adds_epi16(E, D);
  751. S = _mm_max_epi16(H, E);
  752. BT1 = _mm_cmpgt_epi16(S, H);
  753. BT1 = _mm_and_si128(BT1, BT1_MASK);
  754. F = _mm_slli_si128(S, 2);
  755. F = _mm_insert_epi16(F, lstf, 0);
  756. F = _mm_adds_epi16(F, I);
  757. F = _mm_max_epi16(S, F);
  758. while(1){
  759. H = _mm_slli_si128(F, 2);
  760. H = _mm_insert_epi16(H, lstf, 0);
  761. H = _mm_adds_epi16(H, I);
  762. CMP = _mm_cmpgt_epi16(H, F);
  763. msk = _mm_movemask_epi8(CMP);
  764. if(msk == 0){
  765. break;
  766. } else {
  767. F = _mm_max_epi16(H, F);
  768. }
  769. }
  770. MAX = _mm_max_epi16(MAX, F);
  771. lstf = _mm_extract_epi16(F, 7);
  772. BT2 = _mm_cmpgt_epi16(F, S);
  773. BT2 = _mm_and_si128(BT2, BT2_MASK);
  774. BT = _mm_xor_si128(BT1, BT2); // (0, (1, 3), 2)
  775. BT = _mm_xor_si128(BT, BTX_MASK); // (0, (1, 3), 2) | (vst << 2)
  776. _mm_store_si128(((__m128i*)row2) + i, F);
  777. _mm_stream_si128(((__m128i*)btds) + i, BT);
  778. }
  779. if(1){
  780. b2i ary[8];
  781. u4i j, k;
  782. _mm_store_si128((__m128i*)ary, MAX);
  783. k = 0;
  784. for(j=1;j<8;j++){
  785. if(ary[j] > ary[k]){
  786. k = j;
  787. }
  788. }
  789. mi = beg * 8 + k;
  790. for(i=beg+1;i<end;i++){
  791. if(row2[i * 8 + k] > row2[mi]){
  792. mi = i * 8 + k;
  793. }
  794. }
  795. } else {
  796. mi = beg * 8;
  797. for(i=mi+1;i<end*8;i++){
  798. if(row2[i] > row2[mi]){
  799. mi = i;
  800. }
  801. }
  802. }
  803. row2[seqlex] = mi;
  804. row2[seqlex + 1] = beg * 8;
  805. row2[seqlex + 2] = end * 8;
  806. }
  807. static inline void merge_row_rdaln_pog(POG *g, u4i seqlen, u4i coff1, u4i coff2, u4i roff1, u4i roff2){
  808. b2i *row1, *row2, *btd1, *btd2;
  809. u4i i, seqlex, beg[3], end[3], sz, b;
  810. row1 = ref_b2v(g->rows, roff1);
  811. row2 = ref_b2v(g->rows, roff2);
  812. btd1 = ref_b2v(g->btds, coff1);
  813. btd2 = ref_b2v(g->btds, coff2);
  814. seqlex = roundup_times(seqlen, 8);
  815. beg[0] = (row1[seqlex + 1]);
  816. beg[1] = (row2[seqlex + 1]);
  817. end[0] = (row1[seqlex + 2]);
  818. end[1] = (row2[seqlex + 2]);
  819. beg[2] = num_max(beg[0], beg[1]);
  820. end[2] = num_min(end[0], end[1]);
  821. if(1){
  822. __m128i R1, R2, D1, D2, MK;
  823. for(i=beg[2];i&0x7;i++){
  824. if(row2[i] < row1[i]){
  825. row2[i] = row1[i];
  826. btd2[i] = btd1[i];
  827. }
  828. }
  829. for(;i+8<=end[2];i+=8){
  830. R1 = _mm_load_si128((__m128i*)(row1 + i));
  831. R2 = _mm_load_si128((__m128i*)(row2 + i));
  832. D1 = _mm_load_si128((__m128i*)(btd1 + i));
  833. D2 = _mm_load_si128((__m128i*)(btd2 + i));
  834. MK = _mm_cmpgt_epi16(R1, R2);
  835. R2 = _mm_max_epi16(R1, R2);
  836. _mm_store_si128((__m128i*)(row2 + i), R2);
  837. D2 = _mm_or_si128(_mm_and_si128(MK, D1), _mm_andnot_si128(MK, D2));
  838. _mm_store_si128((__m128i*)(btd2 + i), D2);
  839. }
  840. for(;i<end[2];i++){
  841. if(row2[i] < row1[i]){
  842. row2[i] = row1[i];
  843. btd2[i] = btd1[i];
  844. }
  845. }
  846. } else {
  847. for(i=beg[2];i<end[2];i++){
  848. if(row2[i] < row1[i]){
  849. row2[i] = row1[i];
  850. btd2[i] = btd1[i];
  851. }
  852. }
  853. }
  854. if(0){
  855. if(beg[0] < beg[2]){
  856. sz = num_min(beg[2], end[0]) - beg[0];
  857. memcpy(row2 + beg[0], row1 + beg[0], sz * sizeof(b2i));
  858. memcpy(btd2 + beg[0], btd1 + beg[0], sz * sizeof(b2i));
  859. }
  860. for(i=end[2];i<beg[2];i++){ // in case of two independent regions
  861. row2[i] = POG_SCORE_MIN;
  862. }
  863. if(end[0] > end[2]){
  864. sz = num_min(end[0], seqlex) - end[2];
  865. memcpy(row2 + end[2], row1 + end[2], sz * sizeof(b2i));
  866. memcpy(btd2 + end[2], btd1 + end[2], sz * sizeof(b2i));
  867. }
  868. } else {
  869. if(beg[0] < beg[1]){
  870. b = beg[0];
  871. if(end[0] >= beg[1]){
  872. sz = beg[1] - beg[0];
  873. memcpy(row2 + b, row1 + b, sz * sizeof(b2i));
  874. memcpy(btd2 + b, btd1 + b, sz * sizeof(b2i));
  875. } else {
  876. __m128i F;
  877. F = _mm_set1_epi16(POG_SCORE_MIN);
  878. sz = end[0] - beg[0];
  879. memcpy(row2 + b, row1 + b, sz * sizeof(b2i));
  880. memcpy(btd2 + b, btd1 + b, sz * sizeof(b2i));
  881. for(i=end[0];i<beg[1];i+=8){
  882. _mm_store_si128(((__m128i*)(row2 + i)), F);
  883. }
  884. }
  885. }
  886. if(end[0] > end[1]){
  887. if(beg[0] <= end[1]){
  888. b = end[1];
  889. sz = end[0] - b;
  890. memcpy(row2 + b, row1 + b, sz * sizeof(b2i));
  891. memcpy(btd2 + b, btd1 + b, sz * sizeof(b2i));
  892. } else {
  893. __m128i F;
  894. F = _mm_set1_epi16(POG_SCORE_MIN);
  895. b = beg[0];
  896. sz = end[0] - b;
  897. memcpy(row2 + b, row1 + b, sz * sizeof(b2i));
  898. memcpy(btd2 + b, btd1 + b, sz * sizeof(b2i));
  899. for(i=end[1];i<beg[0];i+=8){
  900. _mm_store_si128(((__m128i*)(row2 + i)), F);
  901. }
  902. }
  903. }
  904. }
  905. row2[seqlex + 1] = num_min(beg[0], beg[1]);
  906. row2[seqlex + 2] = num_max(end[0], end[1]);
  907. if(row1[(row1[seqlex])] > row2[(row2[seqlex])]){
  908. row2[seqlex] = row1[seqlex];
  909. }
  910. }
  911. static inline void set_rd_query_prof(POG *g, u4i rid){
  912. b2i *qp;
  913. u4i seqoff, seqlen, seqlex, slen, seqinc;
  914. u4i i, j, bb, bk;
  915. seqoff = g->seqs->rdoffs->buffer[rid];
  916. seqlen = g->seqs->rdlens->buffer[rid];
  917. seqlex = roundup_times(seqlen, 8);
  918. slen = seqlex >> 3;
  919. seqinc = seqlex + 8;
  920. head_sl_b2v(g->qprof, g->qprof->n_head);
  921. if(g->par->tribase){
  922. clear_and_encap_b2v(g->qprof, seqlex * (POG_BASEMAX + 2) + 8);
  923. head_sr_b2v(g->qprof, (16 - (((u8i)g->qprof->buffer) & 0xF)) >> 1);
  924. for(i=0;i<=POG_BASEMAX;i++){
  925. qp = g->qprof->buffer + i * seqlex;
  926. bk = 0;
  927. for(j=0;j<seqlen;j++){
  928. bb = get_basebank(g->seqs->rdseqs, seqoff + j);
  929. bk = ((bk << 2) | bb) & POG_BASEMAX;
  930. if(bb == (i & 0x03)){
  931. if(bk == i){
  932. qp[j] = g->par->M + g->par->tribase;
  933. } else {
  934. qp[j] = g->par->M;
  935. }
  936. } else {
  937. qp[j] = g->par->X;
  938. }
  939. }
  940. for(;j<seqlex;j++){
  941. qp[j] = POG_SCORE_MIN;
  942. }
  943. }
  944. } else {
  945. clear_and_encap_b2v(g->qprof, seqlex * (4 + 1) + 8);
  946. head_sr_b2v(g->qprof, (16 - (((u8i)g->qprof->buffer) & 0xF)) >> 1);
  947. for(i=0;i<4;i++){
  948. qp = g->qprof->buffer + i * seqlex;
  949. for(j=0;j<seqlen;j++){
  950. bb = get_basebank(g->seqs->rdseqs, seqoff + j);
  951. if(bb == (i & 0x03)){
  952. qp[j] = g->par->M;
  953. } else {
  954. qp[j] = g->par->X;
  955. }
  956. }
  957. for(;j<seqlex;j++){
  958. qp[j] = POG_SCORE_MIN;
  959. }
  960. }
  961. }
  962. {
  963. __m128i X;
  964. qp = g->qprof->buffer + i * seqlex;
  965. X = _mm_set1_epi16(g->par->X);
  966. for(j=0;j<slen;j++){
  967. _mm_stream_si128(((__m128i*)qp) + j, X);
  968. }
  969. }
  970. }
  971. static inline u2i get_rdbase_pog(POG *g, u4i rid, u4i pos){
  972. u4i seqoff;
  973. seqoff = g->seqs->rdoffs->buffer[rid];
  974. if(g->par->tribase == 0){
  975. return get_basebank(g->seqs->rdseqs, seqoff + pos);
  976. }
  977. if(pos >= POG_BASEWIDTH){
  978. return sub32seqbits(g->seqs->rdseqs->bits, seqoff + pos + 1 - POG_BASEWIDTH) >> (64 - (POG_BASEWIDTH << 1));
  979. } else {
  980. return (sub32seqbits(g->seqs->rdseqs->bits, seqoff)) >> (64 - ((pos + 1) << 1));
  981. }
  982. }
  983. static inline int _cal_matches_alignment_pog(POG *g, u4i rid, int *xb, int xe, int *badtail){
  984. pog_node_t *u, *v;
  985. u4i nidx, seqoff, btx, bt, vst;
  986. int x, seqlen, mat, score, x0, x1, flag;
  987. seqlen = g->seqs->rdlens->buffer[rid];
  988. seqoff = g->seqs->rdoffs->buffer[rid];
  989. x = xe;
  990. score = 0;
  991. x0 = x1 = x;
  992. flag = 0;
  993. nidx = POG_TAIL_NODE;
  994. v = ref_pognodev(g->nodes, nidx);
  995. btx = 1;
  996. mat = 0;
  997. while(x >= 0){
  998. u = ref_pognodev(g->nodes, nidx);
  999. bt = g->btvs->buffer[u->voff + x - u->rbeg];
  1000. vst = bt >> 2;
  1001. bt = bt & 0x03;
  1002. if(bt == POG_DP_BT_M){
  1003. if(flag) score += ((u->base & 0x03) == get_basebank(g->seqs->rdseqs, seqoff + x))? g->par->M : g->par->X;
  1004. else { flag = 1; x1 = x; }
  1005. mat ++;
  1006. x --;
  1007. } else if(bt & POG_DP_BT_I){
  1008. if(flag) score += g->par->I;
  1009. x --;
  1010. } else {
  1011. if(flag) score += g->par->D;
  1012. else { flag = 1; x1 = x; }
  1013. }
  1014. if(score == 10 * g->par->M){
  1015. x0 = x + 1;
  1016. }
  1017. if(bt & POG_DP_BT_I){
  1018. } else {
  1019. nidx = g->btxs->buffer[g->nodes->buffer[nidx].erev + vst];
  1020. }
  1021. if(x < 0){
  1022. break;
  1023. }
  1024. u = ref_pognodev(g->nodes, nidx);
  1025. if(x < u->rbeg || x >= u->rend){
  1026. break;
  1027. }
  1028. }
  1029. *xb = x;
  1030. *badtail = x1 > x0? x1 - x0 : 0;
  1031. return mat;
  1032. }
  1033. static inline int _alignment2graph_pog(POG *g, u4i rid, int xb, int xe){
  1034. pog_node_t *u, *v;
  1035. pog_edge_t *e;
  1036. u4i nidx, i, seqoff, btx, bt, vst;
  1037. int x, seqlen;
  1038. seqlen = g->seqs->rdlens->buffer[rid];
  1039. seqoff = g->seqs->rdoffs->buffer[rid];
  1040. x = xe;
  1041. nidx = POG_TAIL_NODE;
  1042. v = ref_pognodev(g->nodes, nidx);
  1043. int my_print = (cns_debug > 3);
  1044. if(x + 1 < (int)seqlen){
  1045. for(i=seqlen-1;(int)i>x;i--){
  1046. if(my_print){
  1047. fprintf(stderr, "BT[%u] y=N%u_R%u_%u_%c x=%d:%c z=%d\n", rid, nidx, v->rid, v->pos, bit_base_table[(v->base) & 0x03], i, bit_base_table[get_basebank(g->seqs->rdseqs, seqoff + i)], -1);
  1048. fflush(stderr);
  1049. }
  1050. u = add_node_pog(g, rid, i, get_rdbase_pog(g, rid, i));
  1051. add_edge_pog(g, u, v, 1, 0);
  1052. v = u;
  1053. }
  1054. v->coff = ref_pognodev(g->nodes, POG_TAIL_NODE)->coff;
  1055. }
  1056. btx = 1;
  1057. while(1){
  1058. if(x >= 0){
  1059. u = ref_pognodev(g->nodes, nidx);
  1060. bt = g->btvs->buffer[u->voff + x - u->rbeg];
  1061. } else {
  1062. bt = 0;
  1063. }
  1064. vst = bt >> 2;
  1065. bt = bt & 0x03;
  1066. if(my_print){
  1067. pog_node_t *w;
  1068. w = ref_pognodev(g->nodes, nidx);
  1069. fprintf(stderr, "BT[%u] y=N%u_R%u_%u_%c x=%d:%c z=%d\n", rid, nidx, w->rid, w->pos, bit_base_table[(w->base) & 0x03], x, x>=0? bit_base_table[get_basebank(g->seqs->rdseqs, seqoff + x)] : '*', bt);
  1070. fflush(stderr);
  1071. }
  1072. if(bt == POG_DP_BT_M){
  1073. if(btx){
  1074. u = add_node_pog(g, rid, x, get_rdbase_pog(g, rid, x));
  1075. e = add_edge_pog(g, u, v, 1, 0);
  1076. x --;
  1077. if(nidx > POG_TAIL_NODE){
  1078. u = merge_node_pog(g, ref_pognodev(g->nodes, nidx), u);
  1079. }
  1080. v = u;
  1081. } else {
  1082. xb = x;
  1083. if(nidx == POG_HEAD_NODE || nidx + 1 >= g->nodes->size || g->nodes->buffer[nidx].rid != g->nodes->buffer[nidx + 1].rid){
  1084. nidx = POG_HEAD_NODE;
  1085. } else {
  1086. nidx ++;
  1087. }
  1088. u = ref_pognodev(g->nodes, nidx);
  1089. e = add_edge_pog(g, u, v, 1, 0);
  1090. if(nidx != POG_HEAD_NODE){
  1091. v = u;
  1092. u = ref_pognodev(g->nodes, POG_HEAD_NODE);
  1093. //e = add_edge_pog(g, u, v, 1, 0);
  1094. e = add_edge_pog(g, u, v, 0, 1);
  1095. }
  1096. break;
  1097. }
  1098. } else if(bt & POG_DP_BT_I){
  1099. u = add_node_pog(g, rid, x, get_rdbase_pog(g, rid, x));
  1100. e = add_edge_pog(g, u, v, 1, 0);
  1101. x --;
  1102. v = u;
  1103. } else {
  1104. }
  1105. if(x < 0){ // && nidx
  1106. if(bt == POG_DP_BT_I){
  1107. } else {
  1108. nidx = 0;
  1109. }
  1110. btx = 0;
  1111. continue;
  1112. }
  1113. if(bt & POG_DP_BT_I){
  1114. } else {
  1115. nidx = g->btxs->buffer[g->nodes->buffer[nidx].erev + vst];
  1116. }
  1117. #if DEBUG
  1118. if(nidx >= g->nodes->size){
  1119. fprintf(stderr, " -- something wrong in %s -- %s:%d --\n", __FUNCTION__, __FILE__, __LINE__); fflush(stderr);
  1120. abort();
  1121. }
  1122. #endif
  1123. u = ref_pognodev(g->nodes, nidx);
  1124. if(x < u->rbeg || x >= u->rend){
  1125. xb = x;
  1126. while(x >= 0){
  1127. u = add_node_pog(g, rid, x, get_rdbase_pog(g, rid, x));
  1128. e = add_edge_pog(g, u, v, 1, 0);
  1129. x --;
  1130. v = u;
  1131. }
  1132. {
  1133. u = ref_pognodev(g->nodes, POG_HEAD_NODE);
  1134. e = add_edge_pog(g, u, v, 1, 0);
  1135. v = u;
  1136. }
  1137. break;
  1138. }
  1139. }
  1140. return xb;
  1141. }
  1142. static inline int align_rd_pog_core(POG *g, u2i rid, int W, int *xe){
  1143. pog_node_t *u, *v;
  1144. pog_edge_t *e;
  1145. u4i seqoff, seqlen, seqlex, slen, seqinc;
  1146. b4i score, x;
  1147. b2i *qp, *row;
  1148. __m128i SMASK;
  1149. u4i nidx, eidx, coff, roff, mnode;
  1150. u4i i, j;
  1151. seqoff = g->seqs->rdoffs->buffer[rid];
  1152. seqlen = g->seqs->rdlens->buffer[rid];
  1153. seqlex = roundup_times(seqlen, 8); // 128 = 8 * sizeof(b2i)
  1154. slen = seqlex >> 3;
  1155. seqinc = seqlex + 8; // seqlex, max_idx, beg, end, and paddings
  1156. #if __BYTE_ORDER == 1234
  1157. SMASK = _mm_setr_epi8(0, 2, 4, 6, 8, 10, 12, 14, 0x80, 0x80, 0x80, 0x80, 0x80, 0x80, 0x80, 0x80);
  1158. #else
  1159. // TODO: need to test in BIG_ENDIAN
  1160. SMASK = _mm_setr_epi8(1, 3, 5, 7, 9, 11, 13, 15, 0x80, 0x80, 0x80, 0x80, 0x80, 0x80, 0x80, 0x80);
  1161. #endif
  1162. // set query prof
  1163. // fit buffer to 16 bytes aligned
  1164. set_rd_query_prof(g, rid);
  1165. prepare_rd_align_pog(g, rid);
  1166. clear_u4v(g->stack);
  1167. push_u4v(g->stack, POG_HEAD_NODE);
  1168. score = POG_SCORE_MIN;
  1169. mnode = POG_TAIL_NODE; // point to POG_TAIL
  1170. x = seqlen - 1;
  1171. int my_print = (cns_debug > 3);
  1172. while(pop_u4v(g->stack, &nidx)){
  1173. u = ref_pognodev(g->nodes, nidx);
  1174. u->rmax = g->rows->buffer[u->roff + seqlex];
  1175. u->rbeg = g->rows->buffer[u->roff + seqlex + 1];
  1176. u->rend = g->rows->buffer[u->roff + seqlex + 2];
  1177. if(my_print){
  1178. fprintf(stderr, "NODEALN[%u:R%u:%u] %d-%d:%d:%d %d %d\n", nidx, u->rid, u->pos, u->rbeg, u->rend, u->rmax,
  1179. g->rows->buffer[u->roff + u->rmax], g->btds->buffer[u->coff + u->rmax] >> 2, g->btds->buffer[u->coff + u->rmax] & 0x03);
  1180. }
  1181. if(g->par->alnmode == POG_ALNMODE_OVERLAP){
  1182. if(u->rend >= seqlen && g->rows->buffer[u->roff + x] > score){ // overlap alignment
  1183. score = g->rows->buffer[u->roff + x];
  1184. mnode = nidx;
  1185. }
  1186. }
  1187. eidx = u->edge;
  1188. while(eidx){
  1189. e = ref_pogedgev(g->edges, eidx);
  1190. eidx = e->next;
  1191. v = ref_pognodev(g->nodes, e->node);
  1192. qp = g->qprof->buffer + v->base * seqlex;
  1193. if(g->rowr->size){
  1194. coff = roff = g->rowr->buffer[-- g->rowr->size];
  1195. } else {
  1196. #if 0
  1197. if(g->rows->size + seqinc + g->rows->n_head > g->rows->cap){
  1198. fprintf(stderr, " -- something wrong in %s -- %s:%d --\n", __FUNCTION__, __FILE__, __LINE__); fflush(stderr);
  1199. abort();
  1200. }
  1201. #endif
  1202. roff = g->rows->size;
  1203. inc_b2v(g->rows, seqinc);
  1204. coff = g->btds->size;
  1205. inc_b2v(g->btds, seqinc);
  1206. }
  1207. g->btxs->buffer[v->erev + v->vst] = nidx; // save backtrace nidx
  1208. sse_band_row_rdaln_pog(g, nidx, e->node, seqlen, v->vst, u->coff, coff, u->roff, roff, qp, W, -1);
  1209. if(v->vst){
  1210. merge_row_rdaln_pog(g, seqlen, coff, v->coff, roff, v->roff);
  1211. push_u4v(g->rowr, roff);
  1212. } else {
  1213. v->coff = coff;
  1214. v->roff = roff;
  1215. }
  1216. v->vst ++;
  1217. if(v->vst == v->nin){
  1218. push_u4v(g->stack, e->node);
  1219. #if DEBUG
  1220. } else if(v->vst > v->nin){
  1221. fprintf(stderr, " -- something wrong in %s -- %s:%d --\n", __FUNCTION__, __FILE__, __LINE__); fflush(stderr);
  1222. abort();
  1223. #endif
  1224. }
  1225. }
  1226. push_u4v(g->rowr, u->roff);
  1227. { // compress-copy btds into btvs
  1228. u->voff = g->btvs->size;
  1229. inc_u2v(g->btvs, u->rend - u->rbeg);
  1230. if(0){
  1231. for(i=u->rbeg;i<u->rend;i++){
  1232. g->btvs->buffer[u->voff + i - u->rbeg] = (u1i)g->btds->buffer[u->coff + i];
  1233. }
  1234. } else {
  1235. memcpy(g->btvs->buffer + u->voff, g->btds->buffer + u->coff + u->rbeg, (u->rend - u->rbeg) * sizeof(u2i));
  1236. }
  1237. }
  1238. }
  1239. v = ref_pognodev(g->nodes, POG_TAIL_NODE);
  1240. #if DEBUG
  1241. if(v->roff == 0){
  1242. fprintf(stderr, " -- something wrong in %s -- %s:%d --\n", __FUNCTION__, __FILE__, __LINE__); fflush(stderr);
  1243. abort();
  1244. }
  1245. if(v->voff == 0){
  1246. fprintf(stderr, " -- something wrong in %s -- %s:%d --\n", __FUNCTION__, __FILE__, __LINE__); fflush(stderr);
  1247. abort();
  1248. }
  1249. #endif
  1250. if(W == 0){
  1251. row = ref_b2v(g->rows, v->roff);
  1252. j = 0;
  1253. for(i=1;i<seqlen;i++){
  1254. if(row[i] > row[j]){
  1255. j = i;
  1256. }
  1257. }
  1258. v->rmax = row[seqlex] = j;
  1259. v->rbeg = row[seqlex + 1] = 0;
  1260. v->rend = row[seqlex + 2] = seqlex;
  1261. }
  1262. if(g->par->alnmode == POG_ALNMODE_OVERLAP){
  1263. if(g->rows->buffer[v->roff + v->rmax] + g->par->T > score){
  1264. score = g->rows->buffer[v->roff + (g->rows->buffer[v->roff + seqlex])];
  1265. mnode = POG_TAIL_NODE;
  1266. x = (g->rows->buffer[v->roff + seqlex]);
  1267. }
  1268. } else {
  1269. score = g->rows->buffer[v->roff + seqlen - 1];
  1270. mnode = POG_TAIL_NODE;
  1271. x = seqlen - 1;
  1272. }
  1273. if(x == Int(seqlen - 1) && mnode != POG_TAIL_NODE){
  1274. v = ref_pognodev(g->nodes, POG_TAIL_NODE);
  1275. g->btvs->buffer[v->voff + x - v->rbeg] = (2 | (v->vst << 2));
  1276. g->btxs->buffer[v->erev + v->vst] = mnode;
  1277. v->vst ++;
  1278. }
  1279. *xe = x;
  1280. return score;
  1281. }
  1282. static inline int align_rd_pog(POG *g, u2i rid){
  1283. int xb, xe, rlen, bad, xlen, score, W, mat;
  1284. rlen = g->seqs->rdlens->buffer[rid];
  1285. xlen = rlen / 8 * 8;
  1286. W = g->par->W? g->par->W : xlen;
  1287. xlen = num_min(xlen, g->par->Wmax);
  1288. mat = 0;
  1289. // try increase W when align score is low
  1290. while(1){
  1291. score = align_rd_pog_core(g, rid, W, &xe);
  1292. mat = _cal_matches_alignment_pog(g, rid, &xb, xe, &bad);
  1293. if(cns_debug > 1){
  1294. fprintf(stderr, "ALIGN[%03d] len=%u ref=%d,%d band=%d aligned=%d,%d tail=%d mat=%d,%0.3f score=%d\n", rid, g->seqs->rdlens->buffer[rid], g->sbegs->buffer[rid], g->sends->buffer[rid], W, xb + 1, xe + 1, bad, mat, 1.0 * mat / rlen, score);
  1295. }
  1296. if(rid == 0){
  1297. break;
  1298. }
  1299. if(mat >= rlen * g->par->W_mat_rate && bad < 50){
  1300. break;
  1301. }
  1302. if(W >= xlen) break;
  1303. W = num_min(W * 2, xlen);
  1304. }
  1305. xb = 0;
  1306. xb = _alignment2graph_pog(g, rid, xb, xe);
  1307. return score;
  1308. }
  1309. static inline u4i realign_msa_pog_core(POG *g, u4i ridx, int W){
  1310. u2i *bcnts[7], *hcovs, *bts, *bs, *bs1;
  1311. u1i *r, *s;
  1312. int wins[20], winl, winy, winx;
  1313. u4i i, *dps, f, h, e, *row1, *row2, max, bt;
  1314. int j, beg, end, off, x, y;
  1315. hcovs = g->hcovs->buffer;
  1316. for(i=0;i<7;i++){
  1317. clear_and_encap_u2v(g->bcnts[i], g->msa_len);
  1318. bcnts[i] = g->bcnts[i]->buffer;
  1319. memset(bcnts[i], 0, g->msa_len * sizeof(u2i));
  1320. }
  1321. for(i=0;i<g->seqs->nseq;i++){
  1322. if(i == ridx) continue;
  1323. r = ref_u1v(g->msa, g->msa_len * i);
  1324. for(j=0;j<(int)g->msa_len;j++){
  1325. bcnts[r[j]][j] ++;
  1326. }
  1327. }
  1328. for(i=0;i<g->msa_len;i++){
  1329. max = 0;
  1330. for(j=1;j<4;j++){
  1331. if(bcnts[j][i] > bcnts[max][i]){
  1332. max = j;
  1333. }
  1334. }
  1335. bcnts[5][i] = max;
  1336. bcnts[6][i] = bcnts[0][i] + bcnts[1][i] + bcnts[2][i] + bcnts[3][i];
  1337. }
  1338. s = ref_u1v(g->msa, g->msa_len * ridx);
  1339. winl = 20;
  1340. winx = 0;
  1341. winy = 0;
  1342. beg = -1;
  1343. memset(wins, 0, winl * sizeof(int));
  1344. if(0){
  1345. for(i=0;i<g->msa_len;i++){
  1346. max = bcnts[5][i];
  1347. winy -= wins[winx];
  1348. if(s[i] < 4 && ((hcovs[i] >= 4 && bcnts[s[i]][i] == 0))){
  1349. wins[winx] = 1;
  1350. } else {
  1351. wins[winx] = 0;
  1352. }
  1353. winy += wins[winx];
  1354. //fprintf(stderr, " -- hcovs = %d s[i] = %c:%d i = %u winy = %d in %s -- %s:%d --\n", hcovs[i], "ACGT-"[s[i]], bcnts[s[i]][i], i, winy, __FUNCTION__, __FILE__, __LINE__); fflush(stderr);
  1355. if(Int(i) > winl){
  1356. if(winy >= Int(0.9 * winl)){
  1357. if(beg < 0){
  1358. beg = i - winl;
  1359. }
  1360. } else {
  1361. if(beg >= 0){
  1362. end = i;
  1363. if(cns_debug > 1){
  1364. fprintf(stderr, " -- remove low quality fragment %d - %d: ", beg, end);
  1365. for(j=beg;j<end;j++){
  1366. fputc("ACGT-"[s[j]], stderr);
  1367. }
  1368. fputc('\n', stderr);
  1369. fflush(stderr);
  1370. }
  1371. for(j=beg;j<end;j++){
  1372. s[j] = 4;
  1373. }
  1374. }
  1375. beg = -1;
  1376. }
  1377. }
  1378. winx = (winx + 1) % winl;
  1379. }
  1380. }
  1381. clear_and_encap_b2v(g->btds, (g->msa_len + 1) * W * 2);
  1382. bts = (u2i*)g->btds->buffer;
  1383. clear_and_encap_u4v(g->btxs, (g->msa_len + 1) * W * 2);
  1384. dps = g->btxs->buffer;
  1385. memset(bts, 0, 2 * W * sizeof(u2i));
  1386. memset(dps, 0, 2 * W * sizeof(u4i));
  1387. bts += W * 2;
  1388. dps += W * 2;
  1389. for(i=0;i<g->msa_len;i++){
  1390. bs1 = bts + 2 * W * (Int(i) - 1);
  1391. bs = bts + 2 * W * i;
  1392. row1 = dps + 2 * W * (Int(i) - 1);
  1393. row2 = dps + 2 * W * i;
  1394. f = 0;
  1395. off = Int(i) - W;
  1396. if(Int(i) <= W){
  1397. beg = W - i;
  1398. } else {
  1399. beg = 0;
  1400. }
  1401. if(i + W - 1 >= g->msa_len){
  1402. end = W + g->msa_len - i;
  1403. } else {
  1404. end = W * 2 - 1;
  1405. }
  1406. if(s[i] == 4){
  1407. for(j=beg;j<end;j++){
  1408. e = row1[j + 1];
  1409. //h = row1[j] + 0 + 1;
  1410. h = row1[j];
  1411. if(h >= e){
  1412. bs[j] = 0;
  1413. } else {
  1414. h = e;
  1415. bs[j] = 1;
  1416. }
  1417. if(h >= f){
  1418. f = h;
  1419. } else {
  1420. h = f;
  1421. bs[j] = 2;
  1422. }
  1423. row2[j] = h;
  1424. }
  1425. } else {
  1426. for(j=beg;j<end;j++){
  1427. e = row1[j + 1];
  1428. //h = row1[j] + (s[i] == bcnts[5][off + j]? bcnts[s[i]][off + j] : 0);
  1429. if(Int(bcnts[s[i]][off + j] + 1) >= Int(bcnts[6][off + j] - bcnts[s[i]][off + j])){
  1430. h = row1[j] + 2 * bcnts[s[i]][off + j] - bcnts[6][off + j] + 1;
  1431. } else {
  1432. h = row1[j] + 1;
  1433. }
  1434. // bonus for putting homo together
  1435. if(i && bs1[j] == 0 && s[i] == s[i - 1]){
  1436. h += 1;
  1437. }
  1438. if(h >= e){
  1439. bs[j] = 0;
  1440. } else {
  1441. h = e;
  1442. bs[j] = 1;
  1443. }
  1444. if(h >= f){
  1445. f = h;
  1446. } else {
  1447. h = f;
  1448. bs[j] = 2;
  1449. }
  1450. row2[j] = h;
  1451. }
  1452. }
  1453. if(beg){
  1454. row2[beg - 1] = 0;
  1455. bs[beg - 1] = 0;
  1456. }
  1457. row2[end] = 0;
  1458. bs[end] = 0;
  1459. if(cns_debug > 3){
  1460. fprintf(stderr, "ROW[%u] '%c' %03d-%03d:", i, "ACGT-"[s[i]], beg, end);
  1461. for(j=beg;j<end;j++){
  1462. fprintf(stderr, " %5u[%d]", row2[j], bs[j]);
  1463. }
  1464. fprintf(stderr, "\n");
  1465. }
  1466. }
  1467. row2 = dps + 2 * W * (g->msa_len - 1);
  1468. max = row2[W];
  1469. r = ref_u1v(g->msa, g->msa_len * g->seqs->nseq);
  1470. x = y = g->msa_len - 1;
  1471. while(y >= 0 && x >= 0){
  1472. off = x - W;
  1473. bs = bts + 2 * W * x;
  1474. bt = bs[y - off];
  1475. switch(bt){
  1476. case 0: r[y] = s[x]; x --; y --; break;
  1477. case 1: x --; break;
  1478. case 2: r[y] = 4; y --; break;
  1479. }
  1480. if(cns_debug > 3 && bt){
  1481. fprintf(stderr, " -- x = %d y = %d bt = %d in %s -- %s:%d --\n", x, y, bt, __FUNCTION__, __FILE__, __LINE__); fflush(stderr);
  1482. }
  1483. }
  1484. if(cns_debug > 1){
  1485. fprintf(stderr, " -- max = %d x = %d y = %d in %s -- %s:%d --\n", max, x, y, __FUNCTION__, __FILE__, __LINE__); fflush(stderr);
  1486. }
  1487. while(y >= 0){
  1488. r[y] = 4;
  1489. y --;
  1490. }
  1491. return max;
  1492. }
  1493. static inline void realign_msa_pog(POG *g){
  1494. u4i ridx;
  1495. if(g->par->rW <= 0 || g->seqs->nseq < 3) return;
  1496. if(cns_debug > 1){
  1497. fprintf(stderr, "RAW MSA\n");
  1498. print_msa_pog(g, stderr);
  1499. }
  1500. for(ridx=0;ridx<g->seqs->nseq;ridx++){
  1501. if(cns_debug > 1){
  1502. fprintf(stderr, "REALIGN[%u]\n", ridx);
  1503. }
  1504. realign_msa_pog_core(g, ridx, g->par->rW);
  1505. if(cns_debug > 1){
  1506. print_msa_pog(g, stderr);
  1507. }
  1508. // update ridx alignment
  1509. memcpy(g->msa->buffer + g->msa_len * ridx, g->msa->buffer + g->msa_len * g->seqs->nseq, g->msa_len);
  1510. }
  1511. }
  1512. static const float homo_merging_cmp_norm[20] = {
  1513. 0.95, 0.90, 0.80, 0.75, 0.70,
  1514. 0.70, 0.65, 0.60, 0.60, 0.55,
  1515. 0.50, 0.45, 0.40, 0.30, 0.20,
  1516. 0.20, 0.20, 0.20, 0.20, 0.20
  1517. };
  1518. /*
  1519. static inline void dp_gen_cns_pog(POG *g){
  1520. pog_cns_t dps[2 * 5], *dp1, *dp2;
  1521. b2i *row1, *row2, *row3;
  1522. u1i *s, *r;
  1523. u4i mcnt;
  1524. int bcnts[5];
  1525. u2i *hcovs, *rexs;
  1526. u4i rid, beg, end, x, val, fidx, col, dep;
  1527. u4i mx, mi, i, j;
  1528. float DP_MIN, score0, score1;
  1529. DP_MIN = - (MAX_B4 >> 1);
  1530. mcnt = num_min(g->par->msa_min_cnt, g->seqs->nseq);
  1531. clear_and_encap_u1v(g->cbts, g->msa_len * 5);
  1532. // scan read end
  1533. clear_u4v(g->btxs);
  1534. clear_u2v(g->btvs); // whether read cov current column
  1535. hcovs = g->hcovs->buffer;
  1536. memset(hcovs, 0, g->msa_len * sizeof(u2i));
  1537. for(rid=0;rid<g->seqs->nseq;rid++){
  1538. push_u2v(g->btvs, MAX_U2);
  1539. r = ref_u1v(g->msa, g->msa_len * rid);
  1540. beg = 0;
  1541. while(beg < g->msa_len && r[beg] == 4) beg ++;
  1542. push_u4v(g->btxs, (0U << 31) | (rid << 16) | beg);
  1543. end = g->msa_len;
  1544. while(end > beg && r[end - 1] == 4) end --;
  1545. push_u4v(g->btxs, (1U << 31) | (rid << 16) | end);
  1546. for(i=beg;i<end;i++) hcovs[i] ++;
  1547. }
  1548. sort_array(g->btxs->buffer, g->btxs->size, u4i, num_cmpgt(a & 0xFFFF, b & 0xFFFF));
  1549. mx = 0;
  1550. rexs = g->btvs->buffer;
  1551. memset(dps, 0, 2 * 5 * sizeof(pog_cns_t));
  1552. fidx = 0;
  1553. clear_b2v(g->rows);
  1554. clear_u4v(g->rowr);
  1555. dp1 = dps;
  1556. inc_b2v(g->rows, g->par->cW * g->seqs->nseq);
  1557. for(i=0;i<5;i++){
  1558. dp1[i].coff = g->rows->size;
  1559. inc_b2v(g->rows, g->par->cW * g->seqs->nseq);
  1560. row1 = g->rows->buffer + dp1[i].coff;
  1561. memset(row1, 0, g->par->cW * g->seqs->nseq * sizeof(b2i));
  1562. }
  1563. dep = 0;
  1564. for(col=0;col<g->msa_len;col++){
  1565. fidx = !fidx;
  1566. dp1 = dps + fidx * 5;
  1567. dp2 = dps + (!fidx) * 5;
  1568. // collect read coverage
  1569. while(mx < g->btxs->size){
  1570. val = g->btxs->buffer[mx];
  1571. if((val & 0xFFFF) <= col){
  1572. rid = (val << 1) >> 17;
  1573. if(val & (1U << 31)){
  1574. #if DEBUG
  1575. if(rexs[rid] == MAX_U2){
  1576. fprintf(stderr, " -- something wrong in %s -- %s:%d --\n", __FUNCTION__, __FILE__, __LINE__); fflush(stderr);
  1577. abort();
  1578. }
  1579. #endif
  1580. rexs[rid] = MAX_U2;
  1581. dep --;
  1582. } else {
  1583. #if DEBUG
  1584. if(rexs[rid] < MAX_U2){
  1585. fprintf(stderr, " -- something wrong in %s -- %s:%d --\n", __FUNCTION__, __FILE__, __LINE__); fflush(stderr);
  1586. abort();
  1587. }
  1588. #endif
  1589. rexs[rid] = 0;
  1590. dep ++;
  1591. }
  1592. mx ++;
  1593. } else {
  1594. break;
  1595. }
  1596. }
  1597. for(i=0;i<5;i++){
  1598. dp2[i].max = DP_MIN;
  1599. dp2[i].bt = 4;
  1600. if(g->rowr->size){
  1601. dp2[i].coff = pop_u4v(g->rowr);
  1602. } else {
  1603. dp2.coff = g->rows->size;
  1604. inc_b2v(g->rows, g->par->cW * g->seqs->nseq);
  1605. }
  1606. }
  1607. row2 = g->rows->buffer; // temprary
  1608. if(dep < mcnt && !(g->par->refmode && rexs[0] != MAX_U2)){
  1609. //TODO: coding from here
  1610. mi = 4;
  1611. for(i=0;i<4;i++){
  1612. if(dp1[i] > dp1[mi]){
  1613. mi = i;
  1614. }
  1615. }
  1616. dp2[4] = dp1[mi];
  1617. bts[4] = mi;
  1618. } else {
  1619. for(i=0;i<=4;i++){
  1620. score0 = dp1[i];
  1621. for(j=0;j<=4;j++){
  1622. score1 = score0;
  1623. for(x=0;x<=4;x++){
  1624. if(j == 4){
  1625. if(x != 4){
  1626. score1 += bcnts[x] * g->par->I;
  1627. }
  1628. } else {
  1629. if(x == 4){
  1630. if(i == j){
  1631. score1 += bcnts[x] * g->par->H;
  1632. } else {
  1633. score1 += bcnts[x] * g->par->D;
  1634. }
  1635. } else if(x == j){
  1636. score1 += bcnts[x] * g->par->M;
  1637. } else {
  1638. score1 += bcnts[x] * g->par->X;
  1639. }
  1640. }
  1641. }
  1642. if(score1 > dp2[j]){
  1643. dp2[j] = score1;
  1644. bts[j] = i;
  1645. }
  1646. }
  1647. }
  1648. // Prior to the first read
  1649. for(rid=0;rid<g->seqs->nseq;rid++){
  1650. if(rexs[i] == 0){
  1651. continue;
  1652. }
  1653. r = ref_u1v(g->msa, g->msa_len * rid);
  1654. dp2[r[col]] += 0.1;
  1655. break;
  1656. }
  1657. }
  1658. for(i=0;i<=4;i++){
  1659. push_u1v(g->cbts, bts[i]);
  1660. }
  1661. if(cns_debug > 2){
  1662. fprintf(stderr, "[DPCNS%03u]\t[%2d, %2d, %2d, %2d, %2d]", col, bcnts[0], bcnts[1], bcnts[2], bcnts[3], bcnts[4]);
  1663. //fprintf(stderr, "\t[%0.1f, %0.1f, %0.1f, %0.1f, %0.1f]", dp1[0], dp1[1], dp1[2], dp1[3], dp1[4]);
  1664. fprintf(stderr, "\t[%0.1f:%d, %0.1f:%d, %0.1f:%d, %0.1f:%d, %0.1f:%d]\n", dp2[0], bts[0], dp2[1], bts[1], dp2[2], bts[2], dp2[3], bts[3], dp2[4], bts[4]);
  1665. }
  1666. }
  1667. // Backtrace consensus sequence
  1668. dp2 = dps + (!fidx) * 5;
  1669. mx = 4;
  1670. for(i=0;i<4;i++){
  1671. if(dp2[i] > dp2[mx]){
  1672. mx = i;
  1673. }
  1674. }
  1675. x = g->msa_len;
  1676. s = ref_u1v(g->msa, g->msa_len * g->seqs->nseq);
  1677. while(x){
  1678. x --;
  1679. s[x] = mx;
  1680. mx = g->cbts->buffer[x * 5 + mx];
  1681. }
  1682. for(i=0;i<g->msa_len;i++){
  1683. if(s[i] < 4){
  1684. bit2basebank(g->cns, s[i]);
  1685. }
  1686. }
  1687. }
  1688. */
  1689. static inline void dp_call_cns_pog(POG *g){
  1690. u1i *s, *r, bts[5];
  1691. u4i mcnt;
  1692. int bcnts[5];
  1693. u2i *hcovs, *rexs;
  1694. u4i rid, beg, end, x, val, fidx, col, dep;
  1695. u4i mx, mi, i, j;
  1696. float dps[2 * 5], *dp1, *dp2, DP_MIN, score0, score1;
  1697. DP_MIN = - (MAX_B4 >> 1);
  1698. mcnt = num_min(g->par->msa_min_cnt, g->seqs->nseq);
  1699. clear_and_encap_u1v(g->cbts, g->msa_len * 5);
  1700. // scan read end
  1701. clear_u4v(g->btxs);
  1702. clear_u2v(g->btvs); // whether read cov current column
  1703. hcovs = g->hcovs->buffer;
  1704. memset(hcovs, 0, g->msa_len * sizeof(u2i));
  1705. for(rid=0;rid<g->seqs->nseq;rid++){
  1706. push_u2v(g->btvs, 0);
  1707. r = ref_u1v(g->msa, g->msa_len * rid);
  1708. beg = 0;
  1709. while(beg < g->msa_len && r[beg] == 4) beg ++;
  1710. push_u4v(g->btxs, (0U << 31) | (rid << 16) | beg);
  1711. end = g->msa_len;
  1712. while(end > beg && r[end - 1] == 4) end --;
  1713. push_u4v(g->btxs, (1U << 31) | (rid << 16) | end);
  1714. for(i=beg;i<end;i++) hcovs[i] ++;
  1715. }
  1716. sort_array(g->btxs->buffer, g->btxs->size, u4i, num_cmpgt(a & 0xFFFF, b & 0xFFFF));
  1717. memset(dps, 0, 2 * 5 * sizeof(float));
  1718. fidx = 0;
  1719. dep = 0;
  1720. mx = 0;
  1721. rexs = g->btvs->buffer;
  1722. for(col=0;col<g->msa_len;col++){
  1723. fidx = !fidx;
  1724. dp1 = dps + fidx * 5;
  1725. dp2 = dps + (!fidx) * 5;
  1726. // collect read coverage
  1727. while(mx < g->btxs->size){
  1728. val = g->btxs->buffer[mx];
  1729. if((val & 0xFFFF) <= col){
  1730. rid = (val << 1) >> 17;
  1731. if(val & (1U << 31)){
  1732. #if DEBUG
  1733. if(rexs[rid] == 0){
  1734. fprintf(stderr, " -- something wrong in %s -- %s:%d --\n", __FUNCTION__, __FILE__, __LINE__); fflush(stderr);
  1735. abort();
  1736. }
  1737. #endif
  1738. rexs[rid] = 0;
  1739. dep --;
  1740. } else {
  1741. #if DEBUG
  1742. if(rexs[rid] == 1){
  1743. fprintf(stderr, " -- something wrong in %s -- %s:%d --\n", __FUNCTION__, __FILE__, __LINE__); fflush(stderr);
  1744. abort();
  1745. }
  1746. #endif
  1747. rexs[rid] = 1;
  1748. dep ++;
  1749. }
  1750. mx ++;
  1751. } else {
  1752. break;
  1753. }
  1754. }
  1755. bts[0] = bts[1] = bts[2] = bts[3] = bts[4] = 4;
  1756. dp2[0] = DP_MIN;
  1757. dp2[1] = DP_MIN;
  1758. dp2[2] = DP_MIN;
  1759. dp2[3] = DP_MIN;
  1760. dp2[4] = DP_MIN;
  1761. memset(bcnts, 0, sizeof(int) * 5);
  1762. for(rid=0;rid<g->seqs->nseq;rid++){
  1763. if(rexs[rid] == 0){
  1764. continue;
  1765. }
  1766. r = ref_u1v(g->msa, g->msa_len * rid);
  1767. bcnts[r[col]] ++;
  1768. }
  1769. if(dep < mcnt && !(g->par->refmode && rexs[0])){
  1770. mi = 4;
  1771. for(i=0;i<4;i++){
  1772. if(dp1[i] > dp1[mi]){
  1773. mi = i;
  1774. }
  1775. }
  1776. dp2[4] = dp1[mi];
  1777. bts[4] = mi;
  1778. } else {
  1779. for(i=0;i<=4;i++){
  1780. score0 = dp1[i];
  1781. for(j=0;j<=4;j++){
  1782. score1 = score0;
  1783. for(x=0;x<=4;x++){
  1784. if(j == 4){
  1785. if(x != 4){
  1786. score1 += bcnts[x] * g->par->I;
  1787. }
  1788. } else {
  1789. if(x == 4){
  1790. if(i == j){
  1791. score1 += bcnts[x] * g->par->H;
  1792. } else {
  1793. score1 += bcnts[x] * g->par->D;
  1794. }
  1795. } else if(x == j){
  1796. score1 += bcnts[x] * g->par->M;
  1797. } else {
  1798. score1 += bcnts[x] * g->par->X;
  1799. }
  1800. }
  1801. }
  1802. if(score1 > dp2[j]){
  1803. dp2[j] = score1;
  1804. bts[j] = i;
  1805. }
  1806. }
  1807. }
  1808. // Prior to the first read
  1809. for(rid=0;rid<g->seqs->nseq;rid++){
  1810. if(rexs[i] == 0){
  1811. continue;
  1812. }
  1813. r = ref_u1v(g->msa, g->msa_len * rid);
  1814. dp2[r[col]] += 0.1;
  1815. break;
  1816. }
  1817. }
  1818. for(i=0;i<=4;i++){
  1819. push_u1v(g->cbts, bts[i]);
  1820. }
  1821. if(cns_debug > 2){
  1822. fprintf(stderr, "[DPCNS%03u]\t[%2d, %2d, %2d, %2d, %2d]", col, bcnts[0], bcnts[1], bcnts[2], bcnts[3], bcnts[4]);
  1823. //fprintf(stderr, "\t[%0.1f, %0.1f, %0.1f, %0.1f, %0.1f]", dp1[0], dp1[1], dp1[2], dp1[3], dp1[4]);
  1824. fprintf(stderr, "\t[%0.1f:%d, %0.1f:%d, %0.1f:%d, %0.1f:%d, %0.1f:%d]\n", dp2[0], bts[0], dp2[1], bts[1], dp2[2], bts[2], dp2[3], bts[3], dp2[4], bts[4]);
  1825. }
  1826. }
  1827. // Backtrace consensus sequence
  1828. dp2 = dps + (!fidx) * 5;
  1829. mx = 4;
  1830. for(i=0;i<4;i++){
  1831. if(dp2[i] > dp2[mx]){
  1832. mx = i;
  1833. }
  1834. }
  1835. x = g->msa_len;
  1836. s = ref_u1v(g->msa, g->msa_len * g->seqs->nseq);
  1837. while(x){
  1838. x --;
  1839. s[x] = mx;
  1840. mx = g->cbts->buffer[x * 5 + mx];
  1841. }
  1842. for(i=0;i<g->msa_len;i++){
  1843. if(s[i] < 4){
  1844. bit2basebank(g->cns, s[i]);
  1845. }
  1846. }
  1847. }
  1848. static inline void gen_cns_pog(POG *g){
  1849. u1i *s, *r;
  1850. u4i idx, lst, lsv, lsx, rid, max, i, mcnt, min_cnt, max_cnt, runlen, cnl, beg, end, cbeg, cend;
  1851. u4i freqs[5][11], fmax1, fmax2, tot, cut, *hcnts;
  1852. u2i cnts[5], *bls, cl, bx, bl, bm, dl, dm, *hcovs, corr;
  1853. //u2i *vsts;
  1854. float fl, fx1, fx2, norm, flush;
  1855. mcnt = num_min(g->par->msa_min_cnt, g->seqs->nseq);
  1856. min_cnt = num_max(mcnt, UInt(g->par->msa_min_freq * g->seqs->nseq));
  1857. max_cnt = g->seqs->nseq - min_cnt;
  1858. s = ref_u1v(g->msa, g->msa_len * g->seqs->nseq);
  1859. memset(s, 4, g->msa_len);
  1860. clear_basebank(g->cns);
  1861. hcovs = g->hcovs->buffer;
  1862. bls = hcovs + 8 + g->msa_len; // bls is all zeros, see end_pog
  1863. if(g->par->rW){
  1864. memset(hcovs, 0, g->msa_len * sizeof(u2i));
  1865. for(rid=0;rid<g->seqs->nseq;rid++){
  1866. r = ref_u1v(g->msa, g->msa_len * rid);
  1867. beg = 0;
  1868. while(beg < g->msa_len && r[beg] == 4) beg ++;
  1869. end = g->msa_len;
  1870. while(end > beg && r[end - 1] == 4) end --;
  1871. for(i=beg;i<end;i++) hcovs[i] ++;
  1872. }
  1873. }
  1874. // revise mcnt
  1875. if(g->par->refmode){
  1876. } else if(0){
  1877. tot = 0;
  1878. clear_and_encap_u4v(g->btxs, mcnt + 1);
  1879. hcnts = g->btxs->buffer;
  1880. //hcnts = alloca((mcnt + 1) * sizeof(u4i));
  1881. memset(hcnts, 0, (mcnt + 1) * sizeof(u4i));
  1882. for(i=0;i<g->msa_len;i++){
  1883. tot += (hcovs[i] + 1) * (hcovs[i]) / 2;
  1884. hcnts[num_min(hcovs[i], mcnt)] += (hcovs[i] + 1) * (hcovs[i]) / 2;
  1885. }
  1886. cut = tot * 0.8;
  1887. tot = 0;
  1888. for(i=mcnt;i>1;i--){
  1889. tot += hcnts[i];
  1890. if(tot >= cut){
  1891. break;
  1892. }
  1893. }
  1894. if(i < mcnt){
  1895. if(cns_debug > 1){
  1896. fprintf(stderr, " Revise mcnt %u -> %u\n", mcnt, i); fflush(stderr);
  1897. }
  1898. mcnt = i;
  1899. min_cnt = i;
  1900. max_cnt = g->seqs->nseq - min_cnt;
  1901. }
  1902. }
  1903. // gen cns
  1904. cbeg = 0;
  1905. cend = g->msa_len;
  1906. if(g->par->refmode){
  1907. rid = 0;
  1908. {
  1909. r = ref_u1v(g->msa, g->msa_len * rid);
  1910. cbeg = 0;
  1911. while(cbeg < g->msa_len && r[cbeg] == 4){ hcovs[cbeg] = 0; cbeg ++; }
  1912. end = g->msa_len;
  1913. while(cend > cbeg && r[cend - 1] == 4){ cend --; hcovs[cend] = 0; }
  1914. }
  1915. } else {
  1916. cbeg = 0;
  1917. while(cbeg < g->msa_len && hcovs[cbeg] < min_cnt) cbeg ++;
  1918. cend = g->msa_len;
  1919. while(cend > cbeg && hcovs[cend - 1] < min_cnt) cend --;
  1920. }
  1921. fmax1 = 5;
  1922. fmax2 = 10;
  1923. if(cns_debug > 1){
  1924. for(i=0;i<fmax1;i++){
  1925. memset(freqs[i], 0, (fmax2 + 1) * sizeof(u4i));
  1926. }
  1927. }
  1928. lst = lsv = MAX_U4;
  1929. lsx = 0;
  1930. runlen = 0;
  1931. cl = 0;
  1932. cnl = 0;
  1933. end = 0;
  1934. flush = 0;
  1935. for(idx=cbeg;idx<=cend;idx++){
  1936. if(idx < cend){
  1937. flush = 0;
  1938. memset(cnts, 0, 5 * 2);
  1939. if(g->par->refmode){
  1940. if((max = g->msa->buffer[g->msa_len * 0 + idx]) == 4){
  1941. max = 0;
  1942. } else {
  1943. if(hcovs[idx] < min_cnt){
  1944. flush = 1;
  1945. }
  1946. }
  1947. } else {
  1948. max = 0;
  1949. }
  1950. for(rid=0;rid<g->seqs->nseq;rid++){
  1951. cnts[g->msa->buffer[g->msa_len * rid + idx]] ++;
  1952. }
  1953. for(i=0;i<4;i++){
  1954. if(cnts[i] > cnts[max]){
  1955. max = i;
  1956. }
  1957. }
  1958. if(flush){
  1959. s[idx] = max;
  1960. end = idx;
  1961. } else if(hcovs[idx] >= min_cnt && cnts[max] >= mcnt && cnts[4] - (g->seqs->nseq - hcovs[idx]) < (g->seqs->nseq - cnts[4])){
  1962. s[idx] = max;
  1963. end = idx;
  1964. flush = 1;
  1965. }
  1966. } else {
  1967. if(end + 1 == idx){
  1968. end = idx;
  1969. }
  1970. max = 4;
  1971. flush = 1;
  1972. }
  1973. if(flush){
  1974. if(lst == MAX_U4){ lst = idx; lsv = idx; }
  1975. if(idx == cend || s[lst] != max){
  1976. runlen = 0;
  1977. for(rid=0;rid<g->seqs->nseq;rid++){
  1978. r = ref_u1v(g->msa, g->msa_len * rid);
  1979. bl = 0;
  1980. for(i=lsv;i<end;i++){
  1981. if(r[i] == s[lst]) bl ++;
  1982. }
  1983. bls[rid] = bl;
  1984. runlen += bl;
  1985. }
  1986. sort_array(bls, g->seqs->nseq, u2i, num_cmpgt(b, a));
  1987. bx = 1;
  1988. bl = bls[0];
  1989. bm = 1;
  1990. dl = 0;
  1991. dm = 0;
  1992. for(rid=1;rid<=hcovs[lst];rid++){
  1993. if(rid < hcovs[lst] && bls[rid] == bls[rid - 1]){
  1994. bx ++;
  1995. } else {
  1996. if(cns_debug > 1 && cl <= fmax1 && bls[rid - 1] <= fmax2){
  1997. freqs[cl - 1][bls[rid - 1]] += bx;
  1998. }
  1999. if(bx > bm){
  2000. if(dm < bm){
  2001. dm = bm;
  2002. dl = bl;
  2003. }
  2004. bm = bx;
  2005. bl = bls[rid - 1];
  2006. } else if(bx > dm){
  2007. dm = bx;
  2008. dl = bls[rid - 1];
  2009. }
  2010. bx = 1;
  2011. }
  2012. }
  2013. fl = runlen * 1.0 / hcovs[lst];
  2014. if(cns_debug > 1){
  2015. fprintf(stderr, "HOMO[%3u] %4u\t%c\t%u\t%u:%u\t%u:%u\t%u\t%u\t%0.2f", lst, cnl, bit_base_table[s[lst]], cl, bl, bm, dl, dm, runlen, hcovs[lst], fl);
  2016. if(cl != bl){
  2017. fprintf(stderr, " *\n");
  2018. } else {
  2019. fprintf(stderr, "\n");
  2020. }
  2021. }
  2022. if(cl != bl){
  2023. if(bl > cl + 1 && bl > Int(fl) + 1) bl = Int(fl) + 1; // Don't correct too much
  2024. if(bl + 1 < cl && (float)bl < fl) bl = cl - 1;
  2025. if(bl < cl && cl == dl && dm >= Int(0.8 * bm)){ // prefer increase runlen
  2026. norm = 1.0 / homo_merging_cmp_norm[num_min(cl, 19)];
  2027. } else {
  2028. norm = homo_merging_cmp_norm[num_min(bl, 19)];
  2029. }
  2030. fx1 = num_abs(cl - fl);
  2031. fx2 = num_abs(bl - fl);
  2032. if(norm * fx2 <= fx1){
  2033. corr = bl;
  2034. if(cns_debug > 1){
  2035. fprintf(stderr, "CORR[%03u] %4u\t%c\t%u->%u\n", lst, cnl, bit_base_table[s[lst]], cl, bl);
  2036. }
  2037. } else {
  2038. corr = cl;
  2039. }
  2040. } else {
  2041. corr = cl;
  2042. }
  2043. cnl += cl;
  2044. for(i=0;i<corr;i++){
  2045. bit2basebank(g->cns, s[lst]);
  2046. if(i){
  2047. s[lst + i] = s[lst];
  2048. }
  2049. }
  2050. for(i+=lst;i<end;i++){
  2051. s[i] = 4;
  2052. }
  2053. runlen = 0;
  2054. lst = idx;
  2055. lsv = lsx;
  2056. lsx = idx;
  2057. cl = 1;
  2058. } else {
  2059. cl ++;
  2060. lsx = idx;
  2061. }
  2062. }
  2063. }
  2064. if(cns_debug > 1){
  2065. for(cl=0;cl<fmax1;cl++){
  2066. fprintf(stderr, "RUNLEN[%u]", cl + 1);
  2067. for(bl=0;bl<=fmax2;bl++){
  2068. fprintf(stderr, "%10u,", freqs[cl][bl]);
  2069. }
  2070. fprintf(stderr, "\n");
  2071. }
  2072. }
  2073. }
  2074. static inline void check_dup_edges_pog(POG *g){
  2075. pog_node_t *u;
  2076. pog_edge_t *e;
  2077. u32hash *hash;
  2078. u4i nidx, eidx, *t;
  2079. int exists;
  2080. hash = init_u32hash(13);
  2081. for(nidx=0;nidx<g->nodes->size;nidx++){
  2082. u = ref_pognodev(g->nodes, nidx);
  2083. clear_u32hash(hash);
  2084. eidx = u->edge;
  2085. while(eidx){
  2086. e = ref_pogedgev(g->edges, eidx);
  2087. eidx = e->next;
  2088. t = prepare_u32hash(hash, e->node, &exists);
  2089. if(exists){
  2090. fprintf(stderr, " -- something wrong in %s -- %s:%d --\n", __FUNCTION__, __FILE__, __LINE__); fflush(stderr);
  2091. abort();
  2092. } else {
  2093. *t = e->node;
  2094. }
  2095. }
  2096. }
  2097. free_u32hash(hash);
  2098. }
  2099. static inline void end_pog(POG *g){
  2100. pog_node_t *u, *v, *x;
  2101. pog_edge_t *e;
  2102. u1i *r;
  2103. u4i i, ridx, nidx, eidx, xidx, moff, ready, beg, end, reflen, margin;
  2104. int score;
  2105. clear_basebank(g->cns);
  2106. if(g->seqs->nseq == 0) return;
  2107. score = align_rd_pog(g, 0);
  2108. if(g->par->refmode){
  2109. // add edges to refbeg and refend, to make sure reads can be aligned quickly and correctly within small bandwidth
  2110. u = ref_pognodev(g->nodes, POG_HEAD_NODE);
  2111. reflen = g->seqs->rdlens->buffer[0];
  2112. margin = 5;
  2113. for(i=0;i<g->sbegs->size;i++){
  2114. if(g->sbegs->buffer[i] < margin || g->sbegs->buffer[i] + margin >= reflen) continue;
  2115. nidx = POG_TAIL_NODE + 1 + (reflen - 1 - g->sbegs->buffer[i]);
  2116. v = ref_pognodev(g->nodes, nidx);
  2117. e = add_edge_pog(g, u, v, 0, 1);
  2118. }
  2119. v = ref_pognodev(g->nodes, POG_TAIL_NODE);
  2120. for(i=0;i<g->sends->size;i++){
  2121. if(g->sends->buffer[i] < margin || g->sends->buffer[i] + margin >= reflen) continue;
  2122. nidx = POG_TAIL_NODE + 1 + (reflen - g->sends->buffer[i]);
  2123. u = ref_pognodev(g->nodes, nidx);
  2124. e = add_edge_pog(g, u, v, 0, 1);
  2125. }
  2126. }
  2127. for(ridx=1;ridx<g->seqs->nseq;ridx++){
  2128. score = align_rd_pog(g, ridx);
  2129. }
  2130. for(nidx=0;nidx<g->nodes->size;nidx++){
  2131. u = ref_pognodev(g->nodes, nidx);
  2132. u->vst = 0;
  2133. u->aux = 0;
  2134. u->coff = 0;
  2135. u->erev = 0;
  2136. }
  2137. // calcuate msa_len
  2138. clear_u4v(g->stack);
  2139. push_u4v(g->stack, POG_HEAD_NODE);
  2140. nidx = POG_HEAD_NODE;
  2141. while(pop_u4v(g->stack, &nidx)){
  2142. u = ref_pognodev(g->nodes, nidx);
  2143. eidx = u->edge;
  2144. while(eidx){
  2145. e = ref_pogedgev(g->edges, eidx);
  2146. eidx = e->next;
  2147. v = ref_pognodev(g->nodes, e->node);
  2148. if(u->coff + 1 > v->coff){
  2149. v->coff = u->coff + 1;
  2150. }
  2151. v->vst ++;
  2152. if(v->vst > v->nin){
  2153. print_vstdot_pog(g, "1.dot");
  2154. fprintf(stderr, " -- something wrong in %s -- %s:%d --\n", __FUNCTION__, __FILE__, __LINE__); fflush(stderr);
  2155. check_dup_edges_pog(g);
  2156. abort();
  2157. }
  2158. }
  2159. eidx = u->edge;
  2160. while(eidx){
  2161. e = ref_pogedgev(g->edges, eidx);
  2162. eidx = e->next;
  2163. v = ref_pognodev(g->nodes, e->node);
  2164. if(v->aux) continue; // already pushed
  2165. if(v->vst > v->nin){
  2166. print_vstdot_pog(g, "1.dot");
  2167. fprintf(stderr, " -- something wrong in %s -- %s:%d --\n", __FUNCTION__, __FILE__, __LINE__); fflush(stderr);
  2168. check_dup_edges_pog(g);
  2169. abort();
  2170. }
  2171. if(v->vst == v->nin){
  2172. ready = 1;
  2173. {
  2174. xidx = v->aligned;
  2175. moff = v->coff;
  2176. while(xidx != e->node){
  2177. x = ref_pognodev(g->nodes, xidx);
  2178. if(x->nin > x->vst){
  2179. ready = 0;
  2180. break;
  2181. }
  2182. if(x->coff > moff){
  2183. moff = x->coff;
  2184. }
  2185. xidx = x->aligned;
  2186. }
  2187. }
  2188. if(ready){
  2189. v->coff = moff;
  2190. v->aux = 1;
  2191. push_u4v(g->stack, e->node);
  2192. xidx = v->aligned;
  2193. while(xidx != e->node){
  2194. x = ref_pognodev(g->nodes, xidx);
  2195. x->coff = moff;
  2196. if(x->edge){
  2197. push_u4v(g->stack, xidx);
  2198. x->aux = 1;
  2199. }
  2200. xidx = x->aligned;
  2201. }
  2202. }
  2203. }
  2204. }
  2205. }
  2206. if(nidx != POG_TAIL_NODE){
  2207. fprint_dot_pog(g, "1.dot", NULL);
  2208. print_seqs_pog(g, "1.seqs.fa", NULL);
  2209. fprintf(stderr, " -- something wrong in %s -- %s:%d --\n", __FUNCTION__, __FILE__, __LINE__); fflush(stderr);
  2210. abort();
  2211. }
  2212. // generate MSA
  2213. u = ref_pognodev(g->nodes, POG_TAIL_NODE);
  2214. g->msa_len = u->coff;
  2215. for(nidx=0;nidx<g->nodes->size;nidx++){
  2216. u = ref_pognodev(g->nodes, nidx);
  2217. u->vst = 0;
  2218. }
  2219. clear_and_encap_u1v(g->msa, g->msa_len * (g->seqs->nseq + 2));
  2220. g->msa->size = g->msa_len * (g->seqs->nseq + 1);
  2221. memset(g->msa->buffer, 4, g->msa->size);
  2222. clear_u4v(g->stack);
  2223. push_u4v(g->stack, POG_HEAD_NODE);
  2224. while(pop_u4v(g->stack, &nidx)){
  2225. u = ref_pognodev(g->nodes, nidx);
  2226. eidx = u->edge;
  2227. while(eidx){
  2228. e = ref_pogedgev(g->edges, eidx);
  2229. eidx = e->next;
  2230. v = ref_pognodev(g->nodes, e->node);
  2231. v->vst ++;
  2232. if(v->vst >= v->nin){
  2233. ready = 1;
  2234. xidx = v->aligned;
  2235. while(xidx != e->node){
  2236. x = ref_pognodev(g->nodes, xidx);
  2237. if(x->nin > x->vst){
  2238. ready = 0;
  2239. break;
  2240. }
  2241. xidx = x->aligned;
  2242. }
  2243. if(ready){
  2244. xidx = e->node;
  2245. do {
  2246. x = ref_pognodev(g->nodes, xidx);
  2247. if(xidx != POG_TAIL_NODE){
  2248. set_u1v(g->msa, x->rid * g->msa_len + x->coff, (x->base) & 0x03);
  2249. }
  2250. if(x->edge){
  2251. push_u4v(g->stack, xidx);
  2252. }
  2253. xidx = x->aligned;
  2254. } while(xidx != e->node);
  2255. }
  2256. }
  2257. }
  2258. }
  2259. clear_and_encap_u2v(g->hcovs, g->msa_len + 8 + g->seqs->nseq);
  2260. memset(g->hcovs->buffer, 0, (g->msa_len + 8 + g->seqs->nseq) * sizeof(u2i));
  2261. for(ridx=0;ridx<g->seqs->nseq;ridx++){
  2262. r = ref_u1v(g->msa, g->msa_len * ridx);
  2263. beg = 0;
  2264. while(beg < g->msa_len && r[beg] == 4) beg ++;
  2265. end = g->msa_len;
  2266. while(end && r[end - 1] == 4) end --;
  2267. for(i=beg;i<end;i++) g->hcovs->buffer[i] ++;
  2268. }
  2269. // realignment
  2270. realign_msa_pog(g);
  2271. //// realignment again
  2272. //realign_msa_pog(g);
  2273. // gen consensus line
  2274. if(g->par->cnsmode == 1){
  2275. dp_call_cns_pog(g);
  2276. } else {
  2277. gen_cns_pog(g);
  2278. }
  2279. if(cns_debug > 1){
  2280. print_msa_pog(g, stderr);
  2281. }
  2282. if(0){
  2283. fprintf(stderr, " -- seqs\t%llu --\n", (u8i)g->seqs->rdseqs->cap); fflush(stderr);
  2284. fprintf(stderr, " -- nodes\t%llu --\n", (u8i)g->nodes->cap); fflush(stderr);
  2285. fprintf(stderr, " -- edges\t%llu --\n", (u8i)g->edges->cap); fflush(stderr);
  2286. fprintf(stderr, " -- rows\t%llu/%llu --\n", (u8i)g->rows->size, (u8i)g->rows->cap); fflush(stderr);
  2287. fprintf(stderr, " -- btds\t%llu/%llu --\n", (u8i)g->rows->size, (u8i)g->btds->cap); fflush(stderr);
  2288. fprintf(stderr, " -- btxs\t%llu/%llu --\n", (u8i)g->btxs->size, (u8i)g->btxs->cap); fflush(stderr);
  2289. fprintf(stderr, " -- cns\t%llu --\n", (u8i)g->cns->cap); fflush(stderr);
  2290. }
  2291. }
  2292. #endif