id sid tid token lemma pos 10_1101-2021_01_08_425967 1 1 Partition Partition NNP 10_1101-2021_01_08_425967 1 2 Quantitative Quantitative NNP 10_1101-2021_01_08_425967 1 3 Assessment Assessment NNP 10_1101-2021_01_08_425967 1 4 ( ( -LRB- 10_1101-2021_01_08_425967 1 5 PQA PQA NNP 10_1101-2021_01_08_425967 1 6 ) ) -RRB- 10_1101-2021_01_08_425967 1 7 : : : 10_1101-2021_01_08_425967 1 8 A a DT 10_1101-2021_01_08_425967 1 9 quantitative quantitative JJ 10_1101-2021_01_08_425967 1 10 methodology methodology NN 10_1101-2021_01_08_425967 1 11 to to TO 10_1101-2021_01_08_425967 1 12 assess assess VB 10_1101-2021_01_08_425967 1 13 the the DT 10_1101-2021_01_08_425967 1 14 embedded embed VBN 10_1101-2021_01_08_425967 1 15 noise noise NN 10_1101-2021_01_08_425967 1 16 in in IN 10_1101-2021_01_08_425967 1 17 clustered clustered JJ 10_1101-2021_01_08_425967 1 18 omics omic NNS 10_1101-2021_01_08_425967 1 19 and and CC 10_1101-2021_01_08_425967 1 20 systems system NNS 10_1101-2021_01_08_425967 1 21 biology biology NN 10_1101-2021_01_08_425967 1 22 data datum NNS 10_1101-2021_01_08_425967 1 23 Partition Partition NNP 10_1101-2021_01_08_425967 1 24 Quantitative Quantitative NNP 10_1101-2021_01_08_425967 1 25 Assessment Assessment NNP 10_1101-2021_01_08_425967 1 26 ( ( -LRB- 10_1101-2021_01_08_425967 1 27 PQA PQA NNP 10_1101-2021_01_08_425967 1 28 ) ) -RRB- 10_1101-2021_01_08_425967 1 29 : : : 10_1101-2021_01_08_425967 1 30 A a DT 10_1101-2021_01_08_425967 1 31 quantitative quantitative JJ 10_1101-2021_01_08_425967 1 32 methodology methodology NN 10_1101-2021_01_08_425967 1 33 to to TO 10_1101-2021_01_08_425967 1 34 assess assess VB 10_1101-2021_01_08_425967 1 35 the the DT 10_1101-2021_01_08_425967 1 36 embedded embed VBN 10_1101-2021_01_08_425967 1 37 noise noise NN 10_1101-2021_01_08_425967 1 38 in in IN 10_1101-2021_01_08_425967 1 39 clustered clustered JJ 10_1101-2021_01_08_425967 1 40 omics omic NNS 10_1101-2021_01_08_425967 1 41 and and CC 10_1101-2021_01_08_425967 1 42 systems system NNS 10_1101-2021_01_08_425967 1 43 biology biology NN 10_1101-2021_01_08_425967 1 44 data datum NNS 10_1101-2021_01_08_425967 1 45 Camacho Camacho NNP 10_1101-2021_01_08_425967 1 46 - - HYPH 10_1101-2021_01_08_425967 1 47 Hernández Hernández NNP 10_1101-2021_01_08_425967 1 48 , , , 10_1101-2021_01_08_425967 1 49 Diego Diego NNP 10_1101-2021_01_08_425967 1 50 A.1,2† A.1,2† NNP 10_1101-2021_01_08_425967 1 51 , , , 10_1101-2021_01_08_425967 1 52 Nieto Nieto NNP 10_1101-2021_01_08_425967 1 53 - - HYPH 10_1101-2021_01_08_425967 1 54 Caballero Caballero NNP 10_1101-2021_01_08_425967 1 55 , , , 10_1101-2021_01_08_425967 1 56 Victor Victor NNP 10_1101-2021_01_08_425967 1 57 E.1,2† E.1,2† NNP 10_1101-2021_01_08_425967 1 58 , , , 10_1101-2021_01_08_425967 1 59 León León NNP 10_1101-2021_01_08_425967 1 60 - - HYPH 10_1101-2021_01_08_425967 1 61 Burguete Burguete NNP 10_1101-2021_01_08_425967 1 62 , , , 10_1101-2021_01_08_425967 1 63 José José NNP 10_1101-2021_01_08_425967 1 64 E.1,2 E.1,2 NNP 10_1101-2021_01_08_425967 1 65 , , , 10_1101-2021_01_08_425967 1 66 and and CC 10_1101-2021_01_08_425967 1 67 Freyre Freyre NNP 10_1101-2021_01_08_425967 1 68 - - HYPH 10_1101-2021_01_08_425967 1 69 González González NNP 10_1101-2021_01_08_425967 1 70 , , , 10_1101-2021_01_08_425967 1 71 Julio Julio NNP 10_1101-2021_01_08_425967 1 72 A.1 A.1 NNP 10_1101-2021_01_08_425967 1 73 , , , 10_1101-2021_01_08_425967 1 74 * * NFP 10_1101-2021_01_08_425967 1 75 1 1 CD 10_1101-2021_01_08_425967 1 76 Regulatory Regulatory NNP 10_1101-2021_01_08_425967 1 77 Systems Systems NNPS 10_1101-2021_01_08_425967 1 78 Biology Biology NNP 10_1101-2021_01_08_425967 1 79 Research Research NNP 10_1101-2021_01_08_425967 1 80 Group Group NNP 10_1101-2021_01_08_425967 1 81 , , , 10_1101-2021_01_08_425967 1 82 Laboratory Laboratory NNP 10_1101-2021_01_08_425967 1 83 of of IN 10_1101-2021_01_08_425967 1 84 Systems Systems NNPS 10_1101-2021_01_08_425967 1 85 and and CC 10_1101-2021_01_08_425967 1 86 Synthetic Synthetic NNP 10_1101-2021_01_08_425967 1 87 Biology Biology NNP 10_1101-2021_01_08_425967 1 88 and and CC 10_1101-2021_01_08_425967 1 89 2 2 CD 10_1101-2021_01_08_425967 1 90 Undergraduate Undergraduate NNP 10_1101-2021_01_08_425967 1 91 Program Program NNP 10_1101-2021_01_08_425967 1 92 in in IN 10_1101-2021_01_08_425967 1 93 Genomic Genomic NNP 10_1101-2021_01_08_425967 1 94 Sciences Sciences NNPS 10_1101-2021_01_08_425967 1 95 , , , 10_1101-2021_01_08_425967 1 96 Center Center NNP 10_1101-2021_01_08_425967 1 97 for for IN 10_1101-2021_01_08_425967 1 98 Genomic Genomic NNP 10_1101-2021_01_08_425967 1 99 Sciences Sciences NNPS 10_1101-2021_01_08_425967 1 100 , , , 10_1101-2021_01_08_425967 1 101 Universidad Universidad NNP 10_1101-2021_01_08_425967 1 102 Nacional Nacional NNP 10_1101-2021_01_08_425967 1 103 Autónoma Autónoma NNP 10_1101-2021_01_08_425967 1 104 de de NNP 10_1101-2021_01_08_425967 1 105 México México NNP 10_1101-2021_01_08_425967 1 106 ( ( -LRB- 10_1101-2021_01_08_425967 1 107 UNAM UNAM NNP 10_1101-2021_01_08_425967 1 108 ) ) -RRB- 10_1101-2021_01_08_425967 1 109 , , , 10_1101-2021_01_08_425967 1 110 Morelos Morelos NNP 10_1101-2021_01_08_425967 1 111 , , , 10_1101-2021_01_08_425967 1 112 Mexico Mexico NNP 10_1101-2021_01_08_425967 1 113 . . . 10_1101-2021_01_08_425967 2 1 † † RB 10_1101-2021_01_08_425967 2 2 These these DT 10_1101-2021_01_08_425967 2 3 authors author NNS 10_1101-2021_01_08_425967 2 4 contributed contribute VBD 10_1101-2021_01_08_425967 2 5 equally equally RB 10_1101-2021_01_08_425967 2 6 to to IN 10_1101-2021_01_08_425967 2 7 this this DT 10_1101-2021_01_08_425967 2 8 work work NN 10_1101-2021_01_08_425967 2 9 . . . 10_1101-2021_01_08_425967 3 1 * * NFP 10_1101-2021_01_08_425967 3 2 Corresponding correspond VBG 10_1101-2021_01_08_425967 3 3 author author NN 10_1101-2021_01_08_425967 3 4 : : : 10_1101-2021_01_08_425967 3 5 jfreyre@ccg.unam.mx jfreyre@ccg.unam.mx NNP 10_1101-2021_01_08_425967 3 6 Abstract Abstract NNP 10_1101-2021_01_08_425967 3 7 : : : 10_1101-2021_01_08_425967 3 8 Identifying identify VBG 10_1101-2021_01_08_425967 3 9 groups group NNS 10_1101-2021_01_08_425967 3 10 that that WDT 10_1101-2021_01_08_425967 3 11 share share VBP 10_1101-2021_01_08_425967 3 12 common common JJ 10_1101-2021_01_08_425967 3 13 features feature NNS 10_1101-2021_01_08_425967 3 14 among among IN 10_1101-2021_01_08_425967 3 15 datasets dataset NNS 10_1101-2021_01_08_425967 3 16 through through IN 10_1101-2021_01_08_425967 3 17 clustering cluster VBG 10_1101-2021_01_08_425967 3 18 analysis analysis NN 10_1101-2021_01_08_425967 3 19 is be VBZ 10_1101-2021_01_08_425967 3 20 a a DT 10_1101-2021_01_08_425967 3 21 typical typical JJ 10_1101-2021_01_08_425967 3 22 problem problem NN 10_1101-2021_01_08_425967 3 23 in in IN 10_1101-2021_01_08_425967 3 24 many many JJ 10_1101-2021_01_08_425967 3 25 fields field NNS 10_1101-2021_01_08_425967 3 26 of of IN 10_1101-2021_01_08_425967 3 27 science science NN 10_1101-2021_01_08_425967 3 28 , , , 10_1101-2021_01_08_425967 3 29 particularly particularly RB 10_1101-2021_01_08_425967 3 30 in in IN 10_1101-2021_01_08_425967 3 31 post post NN 10_1101-2021_01_08_425967 3 32 - - NNS 10_1101-2021_01_08_425967 3 33 omics omic NNS 10_1101-2021_01_08_425967 3 34 and and CC 10_1101-2021_01_08_425967 3 35 systems system NNS 10_1101-2021_01_08_425967 3 36 biology biology NN 10_1101-2021_01_08_425967 3 37 research research NN 10_1101-2021_01_08_425967 3 38 . . . 10_1101-2021_01_08_425967 4 1 In in IN 10_1101-2021_01_08_425967 4 2 respect respect NN 10_1101-2021_01_08_425967 4 3 of of IN 10_1101-2021_01_08_425967 4 4 this this DT 10_1101-2021_01_08_425967 4 5 , , , 10_1101-2021_01_08_425967 4 6 quantifying quantify VBG 10_1101-2021_01_08_425967 4 7 how how WRB 10_1101-2021_01_08_425967 4 8 a a DT 10_1101-2021_01_08_425967 4 9 measure measure NN 10_1101-2021_01_08_425967 4 10 can can MD 10_1101-2021_01_08_425967 4 11 cluster cluster VB 10_1101-2021_01_08_425967 4 12 or or CC 10_1101-2021_01_08_425967 4 13 organize organize VB 10_1101-2021_01_08_425967 4 14 intrinsic intrinsic JJ 10_1101-2021_01_08_425967 4 15 groups group NNS 10_1101-2021_01_08_425967 4 16 is be VBZ 10_1101-2021_01_08_425967 4 17 important important JJ 10_1101-2021_01_08_425967 4 18 since since IN 10_1101-2021_01_08_425967 4 19 currently currently RB 10_1101-2021_01_08_425967 4 20 there there EX 10_1101-2021_01_08_425967 4 21 is be VBZ 10_1101-2021_01_08_425967 4 22 no no DT 10_1101-2021_01_08_425967 4 23 statistical statistical JJ 10_1101-2021_01_08_425967 4 24 evaluation evaluation NN 10_1101-2021_01_08_425967 4 25 of of IN 10_1101-2021_01_08_425967 4 26 how how WRB 10_1101-2021_01_08_425967 4 27 ordered order VBN 10_1101-2021_01_08_425967 4 28 is be VBZ 10_1101-2021_01_08_425967 4 29 , , , 10_1101-2021_01_08_425967 4 30 or or CC 10_1101-2021_01_08_425967 4 31 how how WRB 10_1101-2021_01_08_425967 4 32 much much JJ 10_1101-2021_01_08_425967 4 33 noise noise NN 10_1101-2021_01_08_425967 4 34 is be VBZ 10_1101-2021_01_08_425967 4 35 embedded embed VBN 10_1101-2021_01_08_425967 4 36 in in IN 10_1101-2021_01_08_425967 4 37 the the DT 10_1101-2021_01_08_425967 4 38 resulting result VBG 10_1101-2021_01_08_425967 4 39 clustered clustered JJ 10_1101-2021_01_08_425967 4 40 vector vector NN 10_1101-2021_01_08_425967 4 41 . . . 10_1101-2021_01_08_425967 5 1 Many many JJ 10_1101-2021_01_08_425967 5 2 of of IN 10_1101-2021_01_08_425967 5 3 the the DT 10_1101-2021_01_08_425967 5 4 literature literature NN 10_1101-2021_01_08_425967 5 5 focuses focus VBZ 10_1101-2021_01_08_425967 5 6 on on IN 10_1101-2021_01_08_425967 5 7 how how WRB 10_1101-2021_01_08_425967 5 8 well well RB 10_1101-2021_01_08_425967 5 9 the the DT 10_1101-2021_01_08_425967 5 10 clustering cluster VBG 10_1101-2021_01_08_425967 5 11 algorithm algorithm NN 10_1101-2021_01_08_425967 5 12 orders order VBZ 10_1101-2021_01_08_425967 5 13 the the DT 10_1101-2021_01_08_425967 5 14 data datum NNS 10_1101-2021_01_08_425967 5 15 , , , 10_1101-2021_01_08_425967 5 16 with with IN 10_1101-2021_01_08_425967 5 17 several several JJ 10_1101-2021_01_08_425967 5 18 measures measure NNS 10_1101-2021_01_08_425967 5 19 regarding regard VBG 10_1101-2021_01_08_425967 5 20 external external JJ 10_1101-2021_01_08_425967 5 21 and and CC 10_1101-2021_01_08_425967 5 22 internal internal JJ 10_1101-2021_01_08_425967 5 23 statistical statistical JJ 10_1101-2021_01_08_425967 5 24 measures measure NNS 10_1101-2021_01_08_425967 5 25 ; ; : 10_1101-2021_01_08_425967 5 26 but but CC 10_1101-2021_01_08_425967 5 27 none none NN 10_1101-2021_01_08_425967 5 28 measure measure NN 10_1101-2021_01_08_425967 5 29 has have VBZ 10_1101-2021_01_08_425967 5 30 been be VBN 10_1101-2021_01_08_425967 5 31 developed develop VBN 10_1101-2021_01_08_425967 5 32 to to TO 10_1101-2021_01_08_425967 5 33 statistically statistically RB 10_1101-2021_01_08_425967 5 34 quantify quantify VB 10_1101-2021_01_08_425967 5 35 the the DT 10_1101-2021_01_08_425967 5 36 noise noise NN 10_1101-2021_01_08_425967 5 37 in in IN 10_1101-2021_01_08_425967 5 38 an an DT 10_1101-2021_01_08_425967 5 39 arranged arrange VBN 10_1101-2021_01_08_425967 5 40 vector vector NN 10_1101-2021_01_08_425967 5 41 posterior posterior NN 10_1101-2021_01_08_425967 5 42 a a DT 10_1101-2021_01_08_425967 5 43 clustering cluster VBG 10_1101-2021_01_08_425967 5 44 algorithm algorithm NN 10_1101-2021_01_08_425967 5 45 , , , 10_1101-2021_01_08_425967 5 46 i.e. i.e. FW 10_1101-2021_01_08_425967 5 47 , , , 10_1101-2021_01_08_425967 5 48 how how WRB 10_1101-2021_01_08_425967 5 49 much much JJ 10_1101-2021_01_08_425967 5 50 of of IN 10_1101-2021_01_08_425967 5 51 the the DT 10_1101-2021_01_08_425967 5 52 clustering clustering NN 10_1101-2021_01_08_425967 5 53 is be VBZ 10_1101-2021_01_08_425967 5 54 due due JJ 10_1101-2021_01_08_425967 5 55 to to IN 10_1101-2021_01_08_425967 5 56 randomness randomness NN 10_1101-2021_01_08_425967 5 57 . . . 10_1101-2021_01_08_425967 6 1 Here here RB 10_1101-2021_01_08_425967 6 2 , , , 10_1101-2021_01_08_425967 6 3 we -PRON- PRP 10_1101-2021_01_08_425967 6 4 present present VBP 10_1101-2021_01_08_425967 6 5 a a DT 10_1101-2021_01_08_425967 6 6 quantitative quantitative JJ 10_1101-2021_01_08_425967 6 7 methodology methodology NN 10_1101-2021_01_08_425967 6 8 , , , 10_1101-2021_01_08_425967 6 9 based base VBN 10_1101-2021_01_08_425967 6 10 on on IN 10_1101-2021_01_08_425967 6 11 autocorrelation autocorrelation NN 10_1101-2021_01_08_425967 6 12 , , , 10_1101-2021_01_08_425967 6 13 to to TO 10_1101-2021_01_08_425967 6 14 assess assess VB 10_1101-2021_01_08_425967 6 15 this this DT 10_1101-2021_01_08_425967 6 16 problem problem NN 10_1101-2021_01_08_425967 6 17 . . . 10_1101-2021_01_08_425967 7 1 Keywords keyword NNS 10_1101-2021_01_08_425967 7 2 : : : 10_1101-2021_01_08_425967 7 3 omics omic NNS 10_1101-2021_01_08_425967 7 4 data datum NNS 10_1101-2021_01_08_425967 7 5 ; ; : 10_1101-2021_01_08_425967 7 6 hierarchical hierarchical JJ 10_1101-2021_01_08_425967 7 7 clustering clustering NN 10_1101-2021_01_08_425967 7 8 ; ; : 10_1101-2021_01_08_425967 7 9 noise noise NN 10_1101-2021_01_08_425967 7 10 quantification quantification NN 10_1101-2021_01_08_425967 7 11 . . . 10_1101-2021_01_08_425967 8 1 1 1 LS 10_1101-2021_01_08_425967 8 2 . . . 10_1101-2021_01_08_425967 9 1 Introduction introduction NN 10_1101-2021_01_08_425967 9 2 A a DT 10_1101-2021_01_08_425967 9 3 common common JJ 10_1101-2021_01_08_425967 9 4 task task NN 10_1101-2021_01_08_425967 9 5 in in IN 10_1101-2021_01_08_425967 9 6 today today NN 10_1101-2021_01_08_425967 9 7 ’s ’s POS 10_1101-2021_01_08_425967 9 8 research research NN 10_1101-2021_01_08_425967 9 9 is be VBZ 10_1101-2021_01_08_425967 9 10 the the DT 10_1101-2021_01_08_425967 9 11 identification identification NN 10_1101-2021_01_08_425967 9 12 of of IN 10_1101-2021_01_08_425967 9 13 specific specific JJ 10_1101-2021_01_08_425967 9 14 markers marker NNS 10_1101-2021_01_08_425967 9 15 , , , 10_1101-2021_01_08_425967 9 16 as as IN 10_1101-2021_01_08_425967 9 17 predictors predictor NNS 10_1101-2021_01_08_425967 9 18 of of IN 10_1101-2021_01_08_425967 9 19 a a DT 10_1101-2021_01_08_425967 9 20 classification classification NN 10_1101-2021_01_08_425967 9 21 yielded yield VBN 10_1101-2021_01_08_425967 9 22 in in IN 10_1101-2021_01_08_425967 9 23 clustering cluster VBG 10_1101-2021_01_08_425967 9 24 analysis analysis NN 10_1101-2021_01_08_425967 9 25 of of IN 10_1101-2021_01_08_425967 9 26 the the DT 10_1101-2021_01_08_425967 9 27 data datum NNS 10_1101-2021_01_08_425967 9 28 . . . 10_1101-2021_01_08_425967 10 1 For for IN 10_1101-2021_01_08_425967 10 2 instance instance NN 10_1101-2021_01_08_425967 10 3 , , , 10_1101-2021_01_08_425967 10 4 this this DT 10_1101-2021_01_08_425967 10 5 approach approach NN 10_1101-2021_01_08_425967 10 6 is be VBZ 10_1101-2021_01_08_425967 10 7 particularly particularly RB 10_1101-2021_01_08_425967 10 8 useful useful JJ 10_1101-2021_01_08_425967 10 9 after after IN 10_1101-2021_01_08_425967 10 10 high high JJ 10_1101-2021_01_08_425967 10 11 - - HYPH 10_1101-2021_01_08_425967 10 12 throughput throughput NN 10_1101-2021_01_08_425967 10 13 experiments experiment NNS 10_1101-2021_01_08_425967 10 14 to to TO 10_1101-2021_01_08_425967 10 15 compare compare VB 10_1101-2021_01_08_425967 10 16 gene gene NN 10_1101-2021_01_08_425967 10 17 expression expression NN 10_1101-2021_01_08_425967 10 18 or or CC 10_1101-2021_01_08_425967 10 19 methylation methylation NN 10_1101-2021_01_08_425967 10 20 profiles profile NNS 10_1101-2021_01_08_425967 10 21 among among IN 10_1101-2021_01_08_425967 10 22 different different JJ 10_1101-2021_01_08_425967 10 23 cell cell NN 10_1101-2021_01_08_425967 10 24 lines line NNS 10_1101-2021_01_08_425967 10 25 [ [ -LRB- 10_1101-2021_01_08_425967 10 26 1 1 CD 10_1101-2021_01_08_425967 10 27 ] ] -RRB- 10_1101-2021_01_08_425967 10 28 . . . 10_1101-2021_01_08_425967 11 1 This this DT 10_1101-2021_01_08_425967 11 2 task task NN 10_1101-2021_01_08_425967 11 3 is be VBZ 10_1101-2021_01_08_425967 11 4 coming come VBG 10_1101-2021_01_08_425967 11 5 handful handful NN 10_1101-2021_01_08_425967 11 6 in in IN 10_1101-2021_01_08_425967 11 7 the the DT 10_1101-2021_01_08_425967 11 8 nascent nascent JJ 10_1101-2021_01_08_425967 11 9 field field NN 10_1101-2021_01_08_425967 11 10 of of IN 10_1101-2021_01_08_425967 11 11 single single JJ 10_1101-2021_01_08_425967 11 12 - - HYPH 10_1101-2021_01_08_425967 11 13 cell cell NN 10_1101-2021_01_08_425967 11 14 sequencing sequencing NN 10_1101-2021_01_08_425967 11 15 , , , 10_1101-2021_01_08_425967 11 16 leading lead VBG 10_1101-2021_01_08_425967 11 17 the the DT 10_1101-2021_01_08_425967 11 18 important important JJ 10_1101-2021_01_08_425967 11 19 step step NN 10_1101-2021_01_08_425967 11 20 of of IN 10_1101-2021_01_08_425967 11 21 clustering cluster VBG 10_1101-2021_01_08_425967 11 22 cells cell NNS 10_1101-2021_01_08_425967 11 23 to to IN 10_1101-2021_01_08_425967 11 24 further further JJ 10_1101-2021_01_08_425967 11 25 classification classification NN 10_1101-2021_01_08_425967 11 26 or or CC 10_1101-2021_01_08_425967 11 27 as as IN 10_1101-2021_01_08_425967 11 28 a a DT 10_1101-2021_01_08_425967 11 29 qualifying qualifying NN 10_1101-2021_01_08_425967 11 30 metric metric JJ 10_1101-2021_01_08_425967 11 31 of of IN 10_1101-2021_01_08_425967 11 32 the the DT 10_1101-2021_01_08_425967 11 33 sequencing sequencing NN 10_1101-2021_01_08_425967 11 34 process process NN 10_1101-2021_01_08_425967 11 35 [ [ -LRB- 10_1101-2021_01_08_425967 11 36 2 2 CD 10_1101-2021_01_08_425967 11 37 ] ] -RRB- 10_1101-2021_01_08_425967 11 38 . . . 10_1101-2021_01_08_425967 12 1 Regarding regard VBG 10_1101-2021_01_08_425967 12 2 the the DT 10_1101-2021_01_08_425967 12 3 vastly vastly RB 10_1101-2021_01_08_425967 12 4 used use VBN 10_1101-2021_01_08_425967 12 5 gene gene NN 10_1101-2021_01_08_425967 12 6 expression expression NN 10_1101-2021_01_08_425967 12 7 assays assays RB 10_1101-2021_01_08_425967 12 8 , , , 10_1101-2021_01_08_425967 12 9 the the DT 10_1101-2021_01_08_425967 12 10 vector vector NN 10_1101-2021_01_08_425967 12 11 of of IN 10_1101-2021_01_08_425967 12 12 profiles profile NNS 10_1101-2021_01_08_425967 12 13 for for IN 10_1101-2021_01_08_425967 12 14 each each DT 10_1101-2021_01_08_425967 12 15 marker marker NN 10_1101-2021_01_08_425967 12 16 across across IN 10_1101-2021_01_08_425967 12 17 different different JJ 10_1101-2021_01_08_425967 12 18 cell cell NN 10_1101-2021_01_08_425967 12 19 lines line NNS 10_1101-2021_01_08_425967 12 20 is be VBZ 10_1101-2021_01_08_425967 12 21 recorded record VBN 10_1101-2021_01_08_425967 12 22 using use VBG 10_1101-2021_01_08_425967 12 23 hierarchical hierarchical JJ 10_1101-2021_01_08_425967 12 24 clustering clustering NN 10_1101-2021_01_08_425967 12 25 algorithms algorithm NNS 10_1101-2021_01_08_425967 12 26 . . . 10_1101-2021_01_08_425967 13 1 These these DT 10_1101-2021_01_08_425967 13 2 algorithms algorithm NNS 10_1101-2021_01_08_425967 13 3 yield yield VBP 10_1101-2021_01_08_425967 13 4 a a DT 10_1101-2021_01_08_425967 13 5 dendrogram dendrogram NN 10_1101-2021_01_08_425967 13 6 and and CC 10_1101-2021_01_08_425967 13 7 a a DT 10_1101-2021_01_08_425967 13 8 heat heat NN 10_1101-2021_01_08_425967 13 9 map map NN 10_1101-2021_01_08_425967 13 10 representing represent VBG 10_1101-2021_01_08_425967 13 11 the the DT 10_1101-2021_01_08_425967 13 12 vector vector NN 10_1101-2021_01_08_425967 13 13 of of IN 10_1101-2021_01_08_425967 13 14 marker marker NN 10_1101-2021_01_08_425967 13 15 profiles profile NNS 10_1101-2021_01_08_425967 13 16 , , , 10_1101-2021_01_08_425967 13 17 illustrating illustrate VBG 10_1101-2021_01_08_425967 13 18 the the DT 10_1101-2021_01_08_425967 13 19 arrangement arrangement NN 10_1101-2021_01_08_425967 13 20 of of IN 10_1101-2021_01_08_425967 13 21 the the DT 10_1101-2021_01_08_425967 13 22 clusters cluster NNS 10_1101-2021_01_08_425967 13 23 . . . 10_1101-2021_01_08_425967 14 1 To to TO 10_1101-2021_01_08_425967 14 2 assess assess VB 10_1101-2021_01_08_425967 14 3 how how WRB 10_1101-2021_01_08_425967 14 4 well well RB 10_1101-2021_01_08_425967 14 5 the the DT 10_1101-2021_01_08_425967 14 6 clustering clustering NN 10_1101-2021_01_08_425967 14 7 is be VBZ 10_1101-2021_01_08_425967 14 8 segregating segregate VBG 10_1101-2021_01_08_425967 14 9 different different JJ 10_1101-2021_01_08_425967 14 10 cell cell NN 10_1101-2021_01_08_425967 14 11 lines line NNS 10_1101-2021_01_08_425967 14 12 , , , 10_1101-2021_01_08_425967 14 13 a a DT 10_1101-2021_01_08_425967 14 14 class class NN 10_1101-2021_01_08_425967 14 15 stating state VBG 10_1101-2021_01_08_425967 14 16 the the DT 10_1101-2021_01_08_425967 14 17 desired desire VBN 10_1101-2021_01_08_425967 14 18 partitioning partitioning NN 10_1101-2021_01_08_425967 14 19 of of IN 10_1101-2021_01_08_425967 14 20 each each DT 10_1101-2021_01_08_425967 14 21 cell cell NN 10_1101-2021_01_08_425967 14 22 line line NN 10_1101-2021_01_08_425967 14 23 is be VBZ 10_1101-2021_01_08_425967 14 24 provided provide VBN 10_1101-2021_01_08_425967 14 25 a a DT 10_1101-2021_01_08_425967 14 26 posteriori posteriori NN 10_1101-2021_01_08_425967 14 27 . . . 10_1101-2021_01_08_425967 15 1 Then then RB 10_1101-2021_01_08_425967 15 2 , , , 10_1101-2021_01_08_425967 15 3 a a DT 10_1101-2021_01_08_425967 15 4 simple simple JJ 10_1101-2021_01_08_425967 15 5 visual visual JJ 10_1101-2021_01_08_425967 15 6 inspection inspection NN 10_1101-2021_01_08_425967 15 7 of of IN 10_1101-2021_01_08_425967 15 8 the the DT 10_1101-2021_01_08_425967 15 9 vector vector NN 10_1101-2021_01_08_425967 15 10 of of IN 10_1101-2021_01_08_425967 15 11 classes class NNS 10_1101-2021_01_08_425967 15 12 is be VBZ 10_1101-2021_01_08_425967 15 13 used use VBN 10_1101-2021_01_08_425967 15 14 to to TO 10_1101-2021_01_08_425967 15 15 estimate estimate VB 10_1101-2021_01_08_425967 15 16 whether whether IN 10_1101-2021_01_08_425967 15 17 the the DT 10_1101-2021_01_08_425967 15 18 clustering clustering NN 10_1101-2021_01_08_425967 15 19 is be VBZ 10_1101-2021_01_08_425967 15 20 providing provide VBG 10_1101-2021_01_08_425967 15 21 a a DT 10_1101-2021_01_08_425967 15 22 good good JJ 10_1101-2021_01_08_425967 15 23 partition partition NN 10_1101-2021_01_08_425967 15 24 . . . 10_1101-2021_01_08_425967 16 1 Such such JJ 10_1101-2021_01_08_425967 16 2 partition partition NN 10_1101-2021_01_08_425967 16 3 vector vector NN 10_1101-2021_01_08_425967 16 4 is be VBZ 10_1101-2021_01_08_425967 16 5 colored color VBN 10_1101-2021_01_08_425967 16 6 according accord VBG 10_1101-2021_01_08_425967 16 7 to to IN 10_1101-2021_01_08_425967 16 8 the the DT 10_1101-2021_01_08_425967 16 9 classification classification NN 10_1101-2021_01_08_425967 16 10 that that IN 10_1101-2021_01_08_425967 16 11 each each DT 10_1101-2021_01_08_425967 16 12 item item NN 10_1101-2021_01_08_425967 16 13 is be VBZ 10_1101-2021_01_08_425967 16 14 associated associate VBN 10_1101-2021_01_08_425967 16 15 with with IN 10_1101-2021_01_08_425967 16 16 , , , 10_1101-2021_01_08_425967 16 17 and and CC 10_1101-2021_01_08_425967 16 18 it -PRON- PRP 10_1101-2021_01_08_425967 16 19 is be VBZ 10_1101-2021_01_08_425967 16 20 expected expect VBN 10_1101-2021_01_08_425967 16 21 that that IN 10_1101-2021_01_08_425967 16 22 similar similar JJ 10_1101-2021_01_08_425967 16 23 items item NNS 10_1101-2021_01_08_425967 16 24 will will MD 10_1101-2021_01_08_425967 16 25 be be VB 10_1101-2021_01_08_425967 16 26 contiguous contiguous JJ 10_1101-2021_01_08_425967 16 27 , , , 10_1101-2021_01_08_425967 16 28 so so RB 10_1101-2021_01_08_425967 16 29 the the DT 10_1101-2021_01_08_425967 16 30 formed form VBN 10_1101-2021_01_08_425967 16 31 groups group NNS 10_1101-2021_01_08_425967 16 32 are be VBP 10_1101-2021_01_08_425967 16 33 assessed assess VBN 10_1101-2021_01_08_425967 16 34 qualitatively qualitatively RB 10_1101-2021_01_08_425967 16 35 on on IN 10_1101-2021_01_08_425967 16 36 the the DT 10_1101-2021_01_08_425967 16 37 biological biological JJ 10_1101-2021_01_08_425967 16 38 background background NN 10_1101-2021_01_08_425967 16 39 of of IN 10_1101-2021_01_08_425967 16 40 each each DT 10_1101-2021_01_08_425967 16 41 item item NN 10_1101-2021_01_08_425967 16 42 . . . 10_1101-2021_01_08_425967 17 1 This this DT 10_1101-2021_01_08_425967 17 2 procedure procedure NN 10_1101-2021_01_08_425967 17 3 should should MD 10_1101-2021_01_08_425967 17 4 not not RB 10_1101-2021_01_08_425967 17 5 be be VB 10_1101-2021_01_08_425967 17 6 confused confuse VBN 10_1101-2021_01_08_425967 17 7 with with IN 10_1101-2021_01_08_425967 17 8 “ " `` 10_1101-2021_01_08_425967 17 9 supervised supervised JJ 10_1101-2021_01_08_425967 17 10 clustering clustering NN 10_1101-2021_01_08_425967 17 11 ” " '' 10_1101-2021_01_08_425967 17 12 , , , 10_1101-2021_01_08_425967 17 13 which which WDT 10_1101-2021_01_08_425967 17 14 provides provide VBZ 10_1101-2021_01_08_425967 17 15 a a DT 10_1101-2021_01_08_425967 17 16 vector vector NN 10_1101-2021_01_08_425967 17 17 of of IN 10_1101-2021_01_08_425967 17 18 classes class NNS 10_1101-2021_01_08_425967 17 19 starting start VBG 10_1101-2021_01_08_425967 17 20 the the DT 10_1101-2021_01_08_425967 17 21 desired desire VBN 10_1101-2021_01_08_425967 17 22 partitioning partition VBG 10_1101-2021_01_08_425967 17 23 a a DT 10_1101-2021_01_08_425967 17 24 priori priori FW 10_1101-2021_01_08_425967 17 25 . . . 10_1101-2021_01_08_425967 18 1 This this DT 10_1101-2021_01_08_425967 18 2 is be VBZ 10_1101-2021_01_08_425967 18 3 then then RB 10_1101-2021_01_08_425967 18 4 used use VBN 10_1101-2021_01_08_425967 18 5 to to TO 10_1101-2021_01_08_425967 18 6 guide guide VB 10_1101-2021_01_08_425967 18 7 the the DT 10_1101-2021_01_08_425967 18 8 clustering cluster VBG 10_1101-2021_01_08_425967 18 9 algorithms algorithm NNS 10_1101-2021_01_08_425967 18 10 by by IN 10_1101-2021_01_08_425967 18 11 allowing allow VBG 10_1101-2021_01_08_425967 18 12 the the DT 10_1101-2021_01_08_425967 18 13 learning learning NN 10_1101-2021_01_08_425967 18 14 of of IN 10_1101-2021_01_08_425967 18 15 the the DT 10_1101-2021_01_08_425967 18 16 metric metric JJ 10_1101-2021_01_08_425967 18 17 distances distance NNS 10_1101-2021_01_08_425967 18 18 that that WDT 10_1101-2021_01_08_425967 18 19 optimizes optimize VBZ 10_1101-2021_01_08_425967 18 20 the the DT 10_1101-2021_01_08_425967 18 21 partitioning partitioning NN 10_1101-2021_01_08_425967 18 22 [ [ -LRB- 10_1101-2021_01_08_425967 18 23 3 3 CD 10_1101-2021_01_08_425967 18 24 ] ] -RRB- 10_1101-2021_01_08_425967 18 25 . . . 10_1101-2021_01_08_425967 19 1 Additionally additionally RB 10_1101-2021_01_08_425967 19 2 , , , 10_1101-2021_01_08_425967 19 3 it -PRON- PRP 10_1101-2021_01_08_425967 19 4 may may MD 10_1101-2021_01_08_425967 19 5 get get VB 10_1101-2021_01_08_425967 19 6 confused confused JJ 10_1101-2021_01_08_425967 19 7 with with IN 10_1101-2021_01_08_425967 19 8 the the DT 10_1101-2021_01_08_425967 19 9 metric metric JJ 10_1101-2021_01_08_425967 19 10 assessment assessment NN 10_1101-2021_01_08_425967 19 11 of of IN 10_1101-2021_01_08_425967 19 12 the the DT 10_1101-2021_01_08_425967 19 13 clustering cluster VBG 10_1101-2021_01_08_425967 19 14 algorithms algorithm NNS 10_1101-2021_01_08_425967 19 15 , , , 10_1101-2021_01_08_425967 19 16 especially especially RB 10_1101-2021_01_08_425967 19 17 with with IN 10_1101-2021_01_08_425967 19 18 the the DT 10_1101-2021_01_08_425967 19 19 external external JJ 10_1101-2021_01_08_425967 19 20 cluster cluster NN 10_1101-2021_01_08_425967 19 21 evaluation evaluation NN 10_1101-2021_01_08_425967 19 22 . . . 10_1101-2021_01_08_425967 20 1 For for IN 10_1101-2021_01_08_425967 20 2 this this DT 10_1101-2021_01_08_425967 20 3 , , , 10_1101-2021_01_08_425967 20 4 various various JJ 10_1101-2021_01_08_425967 20 5 metrics metric NNS 10_1101-2021_01_08_425967 20 6 have have VBP 10_1101-2021_01_08_425967 20 7 been be VBN 10_1101-2021_01_08_425967 20 8 developed develop VBN 10_1101-2021_01_08_425967 20 9 to to TO 10_1101-2021_01_08_425967 20 10 qualify qualify VB 10_1101-2021_01_08_425967 20 11 the the DT 10_1101-2021_01_08_425967 20 12 clustering cluster VBG 10_1101-2021_01_08_425967 20 13 algorithm algorithm NN 10_1101-2021_01_08_425967 20 14 itself -PRON- PRP 10_1101-2021_01_08_425967 20 15 , , , 10_1101-2021_01_08_425967 20 16 such such JJ 10_1101-2021_01_08_425967 20 17 as as IN 10_1101-2021_01_08_425967 20 18 intrinsic intrinsic JJ 10_1101-2021_01_08_425967 20 19 and and CC 10_1101-2021_01_08_425967 20 20 extrinsic extrinsic JJ 10_1101-2021_01_08_425967 20 21 measures measure NNS 10_1101-2021_01_08_425967 20 22 . . . 10_1101-2021_01_08_425967 21 1 These these DT 10_1101-2021_01_08_425967 21 2 metrics metric NNS 10_1101-2021_01_08_425967 21 3 are be VBP 10_1101-2021_01_08_425967 21 4 used use VBN 10_1101-2021_01_08_425967 21 5 for for IN 10_1101-2021_01_08_425967 21 6 clustering cluster VBG 10_1101-2021_01_08_425967 21 7 algorithm algorithm JJ 10_1101-2021_01_08_425967 21 8 validation validation NN 10_1101-2021_01_08_425967 21 9 . . . 10_1101-2021_01_08_425967 22 1 The the DT 10_1101-2021_01_08_425967 22 2 extrinsic extrinsic NN 10_1101-2021_01_08_425967 22 3 validation validation NN 10_1101-2021_01_08_425967 22 4 compares compare VBZ 10_1101-2021_01_08_425967 22 5 the the DT 10_1101-2021_01_08_425967 22 6 clustering clustering NN 10_1101-2021_01_08_425967 22 7 to to IN 10_1101-2021_01_08_425967 22 8 a a DT 10_1101-2021_01_08_425967 22 9 goal goal NN 10_1101-2021_01_08_425967 22 10 to to TO 10_1101-2021_01_08_425967 22 11 say say VB 10_1101-2021_01_08_425967 22 12 whether whether IN 10_1101-2021_01_08_425967 22 13 it -PRON- PRP 10_1101-2021_01_08_425967 22 14 is be VBZ 10_1101-2021_01_08_425967 22 15 a a DT 10_1101-2021_01_08_425967 22 16 good good JJ 10_1101-2021_01_08_425967 22 17 clustering clustering NN 10_1101-2021_01_08_425967 22 18 or or CC 10_1101-2021_01_08_425967 22 19 not not RB 10_1101-2021_01_08_425967 22 20 . . . 10_1101-2021_01_08_425967 23 1 The the DT 10_1101-2021_01_08_425967 23 2 internal internal JJ 10_1101-2021_01_08_425967 23 3 validation validation NN 10_1101-2021_01_08_425967 23 4 compares compare VBZ 10_1101-2021_01_08_425967 23 5 the the DT 10_1101-2021_01_08_425967 23 6 elements element NNS 10_1101-2021_01_08_425967 23 7 within within IN 10_1101-2021_01_08_425967 23 8 the the DT 10_1101-2021_01_08_425967 23 9 cluster cluster NN 10_1101-2021_01_08_425967 23 10 and and CC 10_1101-2021_01_08_425967 23 11 their -PRON- PRP$ 10_1101-2021_01_08_425967 23 12 differences difference NNS 10_1101-2021_01_08_425967 23 13 [ [ -LRB- 10_1101-2021_01_08_425967 23 14 4 4 CD 10_1101-2021_01_08_425967 23 15 ] ] -RRB- 10_1101-2021_01_08_425967 23 16 . . . 10_1101-2021_01_08_425967 24 1 PQA PQA NNP 10_1101-2021_01_08_425967 24 2 involves involve VBZ 10_1101-2021_01_08_425967 24 3 characteristics characteristic NNS 10_1101-2021_01_08_425967 24 4 of of IN 10_1101-2021_01_08_425967 24 5 both both DT 10_1101-2021_01_08_425967 24 6 kinds kind NNS 10_1101-2021_01_08_425967 24 7 of of IN 10_1101-2021_01_08_425967 24 8 validation validation NN 10_1101-2021_01_08_425967 24 9 , , , 10_1101-2021_01_08_425967 24 10 through through IN 10_1101-2021_01_08_425967 24 11 using use VBG 10_1101-2021_01_08_425967 24 12 both both CC 10_1101-2021_01_08_425967 24 13 the the DT 10_1101-2021_01_08_425967 24 14 .CC .CC NFP 10_1101-2021_01_08_425967 24 15 - - : 10_1101-2021_01_08_425967 24 16 BY by IN 10_1101-2021_01_08_425967 24 17 4.0 4.0 CD 10_1101-2021_01_08_425967 24 18 International international JJ 10_1101-2021_01_08_425967 24 19 licensemade licensemade NN 10_1101-2021_01_08_425967 24 20 available available JJ 10_1101-2021_01_08_425967 24 21 under under IN 10_1101-2021_01_08_425967 24 22 a a DT 10_1101-2021_01_08_425967 24 23 ( ( -LRB- 10_1101-2021_01_08_425967 24 24 which which WDT 10_1101-2021_01_08_425967 24 25 was be VBD 10_1101-2021_01_08_425967 24 26 not not RB 10_1101-2021_01_08_425967 24 27 certified certify VBN 10_1101-2021_01_08_425967 24 28 by by IN 10_1101-2021_01_08_425967 24 29 peer peer NN 10_1101-2021_01_08_425967 24 30 review review NN 10_1101-2021_01_08_425967 24 31 ) ) -RRB- 10_1101-2021_01_08_425967 24 32 is be VBZ 10_1101-2021_01_08_425967 24 33 the the DT 10_1101-2021_01_08_425967 24 34 author author NN 10_1101-2021_01_08_425967 24 35 / / SYM 10_1101-2021_01_08_425967 24 36 funder funder NN 10_1101-2021_01_08_425967 24 37 , , , 10_1101-2021_01_08_425967 24 38 who who WP 10_1101-2021_01_08_425967 24 39 has have VBZ 10_1101-2021_01_08_425967 24 40 granted grant VBN 10_1101-2021_01_08_425967 24 41 bioRxiv biorxiv IN 10_1101-2021_01_08_425967 24 42 a a DT 10_1101-2021_01_08_425967 24 43 license license NN 10_1101-2021_01_08_425967 24 44 to to TO 10_1101-2021_01_08_425967 24 45 display display VB 10_1101-2021_01_08_425967 24 46 the the DT 10_1101-2021_01_08_425967 24 47 preprint preprint NN 10_1101-2021_01_08_425967 24 48 in in IN 10_1101-2021_01_08_425967 24 49 perpetuity perpetuity NN 10_1101-2021_01_08_425967 24 50 . . . 10_1101-2021_01_08_425967 25 1 It -PRON- PRP 10_1101-2021_01_08_425967 25 2 is be VBZ 10_1101-2021_01_08_425967 25 3 The the DT 10_1101-2021_01_08_425967 25 4 copyright copyright NN 10_1101-2021_01_08_425967 25 5 holder holder NN 10_1101-2021_01_08_425967 25 6 for for IN 10_1101-2021_01_08_425967 25 7 this this DT 10_1101-2021_01_08_425967 25 8 preprintthis preprintthis NN 10_1101-2021_01_08_425967 25 9 version version NN 10_1101-2021_01_08_425967 25 10 posted post VBD 10_1101-2021_01_08_425967 25 11 January January NNP 10_1101-2021_01_08_425967 25 12 9 9 CD 10_1101-2021_01_08_425967 25 13 , , , 10_1101-2021_01_08_425967 25 14 2021 2021 CD 10_1101-2021_01_08_425967 25 15 . . . 10_1101-2021_01_08_425967 25 16 ; ; : 10_1101-2021_01_08_425967 25 17 https://doi.org/10.1101/2021.01.08.425967doi https://doi.org/10.1101/2021.01.08.425967doi ADD 10_1101-2021_01_08_425967 25 18 : : : 10_1101-2021_01_08_425967 25 19 bioRxiv biorxiv VB 10_1101-2021_01_08_425967 25 20 preprint preprint NN 10_1101-2021_01_08_425967 25 21 https://doi.org/10.1101/2021.01.08.425967 https://doi.org/10.1101/2021.01.08.425967 NNP 10_1101-2021_01_08_425967 25 22 http://creativecommons.org/licenses/by/4.0/ http://creativecommons.org/licenses/by/4.0/ ADD 10_1101-2021_01_08_425967 25 23 crafted craft VBN 10_1101-2021_01_08_425967 25 24 goal goal NN 10_1101-2021_01_08_425967 25 25 standard standard NN 10_1101-2021_01_08_425967 25 26 and and CC 10_1101-2021_01_08_425967 25 27 the the DT 10_1101-2021_01_08_425967 25 28 yielded yield VBN 10_1101-2021_01_08_425967 25 29 signal signal NN 10_1101-2021_01_08_425967 25 30 itself -PRON- PRP 10_1101-2021_01_08_425967 25 31 ( ( -LRB- 10_1101-2021_01_08_425967 25 32 clustered cluster VBN 10_1101-2021_01_08_425967 25 33 vector vector NN 10_1101-2021_01_08_425967 25 34 ) ) -RRB- 10_1101-2021_01_08_425967 25 35 . . . 10_1101-2021_01_08_425967 26 1 However however RB 10_1101-2021_01_08_425967 26 2 , , , 10_1101-2021_01_08_425967 26 3 PQA PQA NNP 10_1101-2021_01_08_425967 26 4 gathers gather VBZ 10_1101-2021_01_08_425967 26 5 these these DT 10_1101-2021_01_08_425967 26 6 elements element NNS 10_1101-2021_01_08_425967 26 7 not not RB 10_1101-2021_01_08_425967 26 8 qualifying qualify VBG 10_1101-2021_01_08_425967 26 9 the the DT 10_1101-2021_01_08_425967 26 10 clustering cluster VBG 10_1101-2021_01_08_425967 26 11 algorithm algorithm NN 10_1101-2021_01_08_425967 26 12 itself -PRON- PRP 10_1101-2021_01_08_425967 26 13 but but CC 10_1101-2021_01_08_425967 26 14 to to TO 10_1101-2021_01_08_425967 26 15 quantify quantify VB 10_1101-2021_01_08_425967 26 16 the the DT 10_1101-2021_01_08_425967 26 17 noise noise NN 10_1101-2021_01_08_425967 26 18 embedded embed VBN 10_1101-2021_01_08_425967 26 19 in in IN 10_1101-2021_01_08_425967 26 20 the the DT 10_1101-2021_01_08_425967 26 21 cluster cluster NN 10_1101-2021_01_08_425967 26 22 , , , 10_1101-2021_01_08_425967 26 23 this this DT 10_1101-2021_01_08_425967 26 24 noise noise NN 10_1101-2021_01_08_425967 26 25 may may MD 10_1101-2021_01_08_425967 26 26 be be VB 10_1101-2021_01_08_425967 26 27 due due IN 10_1101-2021_01_08_425967 26 28 to to IN 10_1101-2021_01_08_425967 26 29 the the DT 10_1101-2021_01_08_425967 26 30 intrinsic intrinsic JJ 10_1101-2021_01_08_425967 26 31 metric metric JJ 10_1101-2021_01_08_425967 26 32 or or CC 10_1101-2021_01_08_425967 26 33 marker marker NN 10_1101-2021_01_08_425967 26 34 used use VBN 10_1101-2021_01_08_425967 26 35 to to TO 10_1101-2021_01_08_425967 26 36 order order VB 10_1101-2021_01_08_425967 26 37 the the DT 10_1101-2021_01_08_425967 26 38 data data NN 10_1101-2021_01_08_425967 26 39 set set VBN 10_1101-2021_01_08_425967 26 40 . . . 10_1101-2021_01_08_425967 27 1 A a DT 10_1101-2021_01_08_425967 27 2 possible possible JJ 10_1101-2021_01_08_425967 27 3 caveat caveat NN 10_1101-2021_01_08_425967 27 4 of of IN 10_1101-2021_01_08_425967 27 5 the the DT 10_1101-2021_01_08_425967 27 6 qualitative qualitative JJ 10_1101-2021_01_08_425967 27 7 assessment assessment NN 10_1101-2021_01_08_425967 27 8 discussed discuss VBN 10_1101-2021_01_08_425967 27 9 above above RB 10_1101-2021_01_08_425967 27 10 is be VBZ 10_1101-2021_01_08_425967 27 11 that that IN 10_1101-2021_01_08_425967 27 12 humans human NNS 10_1101-2021_01_08_425967 27 13 tend tend VBP 10_1101-2021_01_08_425967 27 14 to to TO 10_1101-2021_01_08_425967 27 15 perceive perceive VB 10_1101-2021_01_08_425967 27 16 meaningful meaningful JJ 10_1101-2021_01_08_425967 27 17 patterns pattern NNS 10_1101-2021_01_08_425967 27 18 within within IN 10_1101-2021_01_08_425967 27 19 random random JJ 10_1101-2021_01_08_425967 27 20 data datum NNS 10_1101-2021_01_08_425967 27 21 leading lead VBG 10_1101-2021_01_08_425967 27 22 to to IN 10_1101-2021_01_08_425967 27 23 a a DT 10_1101-2021_01_08_425967 27 24 cognitive cognitive JJ 10_1101-2021_01_08_425967 27 25 bias bias NN 10_1101-2021_01_08_425967 27 26 known know VBN 10_1101-2021_01_08_425967 27 27 as as IN 10_1101-2021_01_08_425967 27 28 apophenia apophenia NNP 10_1101-2021_01_08_425967 27 29 [ [ -LRB- 10_1101-2021_01_08_425967 27 30 5 5 CD 10_1101-2021_01_08_425967 27 31 ] ] -RRB- 10_1101-2021_01_08_425967 27 32 . . . 10_1101-2021_01_08_425967 28 1 While while IN 10_1101-2021_01_08_425967 28 2 interpreting interpret VBG 10_1101-2021_01_08_425967 28 3 the the DT 10_1101-2021_01_08_425967 28 4 partitions partition NNS 10_1101-2021_01_08_425967 28 5 obtained obtain VBN 10_1101-2021_01_08_425967 28 6 from from IN 10_1101-2021_01_08_425967 28 7 unsupervised unsupervise VBN 10_1101-2021_01_08_425967 28 8 clustering cluster VBG 10_1101-2021_01_08_425967 28 9 analysis analysis NN 10_1101-2021_01_08_425967 28 10 , , , 10_1101-2021_01_08_425967 28 11 researchers researcher NNS 10_1101-2021_01_08_425967 28 12 attempt attempt VBP 10_1101-2021_01_08_425967 28 13 to to TO 10_1101-2021_01_08_425967 28 14 visually visually RB 10_1101-2021_01_08_425967 28 15 assess assess VB 10_1101-2021_01_08_425967 28 16 how how WRB 10_1101-2021_01_08_425967 28 17 close close JJ 10_1101-2021_01_08_425967 28 18 the the DT 10_1101-2021_01_08_425967 28 19 classifications classification NNS 10_1101-2021_01_08_425967 28 20 are be VBP 10_1101-2021_01_08_425967 28 21 to to IN 10_1101-2021_01_08_425967 28 22 each each DT 10_1101-2021_01_08_425967 28 23 other other JJ 10_1101-2021_01_08_425967 28 24 finding find VBG 10_1101-2021_01_08_425967 28 25 patterns pattern NNS 10_1101-2021_01_08_425967 28 26 that that WDT 10_1101-2021_01_08_425967 28 27 are be VBP 10_1101-2021_01_08_425967 28 28 not not RB 10_1101-2021_01_08_425967 28 29 well well RB 10_1101-2021_01_08_425967 28 30 supported support VBN 10_1101-2021_01_08_425967 28 31 by by IN 10_1101-2021_01_08_425967 28 32 the the DT 10_1101-2021_01_08_425967 28 33 data datum NNS 10_1101-2021_01_08_425967 28 34 . . . 10_1101-2021_01_08_425967 29 1 Such such PDT 10_1101-2021_01_08_425967 29 2 an an DT 10_1101-2021_01_08_425967 29 3 effect effect NN 10_1101-2021_01_08_425967 29 4 is be VBZ 10_1101-2021_01_08_425967 29 5 raised raise VBN 10_1101-2021_01_08_425967 29 6 because because IN 10_1101-2021_01_08_425967 29 7 the the DT 10_1101-2021_01_08_425967 29 8 adjacency adjacency NN 10_1101-2021_01_08_425967 29 9 between between IN 10_1101-2021_01_08_425967 29 10 items item NNS 10_1101-2021_01_08_425967 29 11 may may MD 10_1101-2021_01_08_425967 29 12 give give VB 10_1101-2021_01_08_425967 29 13 a a DT 10_1101-2021_01_08_425967 29 14 notion notion NN 10_1101-2021_01_08_425967 29 15 of of IN 10_1101-2021_01_08_425967 29 16 the the DT 10_1101-2021_01_08_425967 29 17 dissimilarity dissimilarity NN 10_1101-2021_01_08_425967 29 18 distance distance NN 10_1101-2021_01_08_425967 29 19 in in IN 10_1101-2021_01_08_425967 29 20 the the DT 10_1101-2021_01_08_425967 29 21 dendrogram dendrogram NNP 10_1101-2021_01_08_425967 29 22 leaves leave NNS 10_1101-2021_01_08_425967 29 23 . . . 10_1101-2021_01_08_425967 30 1 Unfortunately unfortunately RB 10_1101-2021_01_08_425967 30 2 , , , 10_1101-2021_01_08_425967 30 3 as as RB 10_1101-2021_01_08_425967 30 4 much much RB 10_1101-2021_01_08_425967 30 5 as as IN 10_1101-2021_01_08_425967 30 6 we -PRON- PRP 10_1101-2021_01_08_425967 30 7 know know VBP 10_1101-2021_01_08_425967 30 8 , , , 10_1101-2021_01_08_425967 30 9 there there EX 10_1101-2021_01_08_425967 30 10 is be VBZ 10_1101-2021_01_08_425967 30 11 no no DT 10_1101-2021_01_08_425967 30 12 method method NN 10_1101-2021_01_08_425967 30 13 to to TO 10_1101-2021_01_08_425967 30 14 quantitatively quantitatively RB 10_1101-2021_01_08_425967 30 15 assess assess VB 10_1101-2021_01_08_425967 30 16 the the DT 10_1101-2021_01_08_425967 30 17 quality quality NN 10_1101-2021_01_08_425967 30 18 of of IN 10_1101-2021_01_08_425967 30 19 the the DT 10_1101-2021_01_08_425967 30 20 groups group NNS 10_1101-2021_01_08_425967 30 21 of of IN 10_1101-2021_01_08_425967 30 22 classifications classification NNS 10_1101-2021_01_08_425967 30 23 from from IN 10_1101-2021_01_08_425967 30 24 the the DT 10_1101-2021_01_08_425967 30 25 clustering clustering NN 10_1101-2021_01_08_425967 30 26 or or CC 10_1101-2021_01_08_425967 30 27 , , , 10_1101-2021_01_08_425967 30 28 at at IN 10_1101-2021_01_08_425967 30 29 least least JJS 10_1101-2021_01_08_425967 30 30 , , , 10_1101-2021_01_08_425967 30 31 there there EX 10_1101-2021_01_08_425967 30 32 is be VBZ 10_1101-2021_01_08_425967 30 33 no no DT 10_1101-2021_01_08_425967 30 34 attempt attempt NN 10_1101-2021_01_08_425967 30 35 to to TO 10_1101-2021_01_08_425967 30 36 quantify quantify VB 10_1101-2021_01_08_425967 30 37 whether whether IN 10_1101-2021_01_08_425967 30 38 certain certain JJ 10_1101-2021_01_08_425967 30 39 configuration configuration NN 10_1101-2021_01_08_425967 30 40 or or CC 10_1101-2021_01_08_425967 30 41 order order NN 10_1101-2021_01_08_425967 30 42 of of IN 10_1101-2021_01_08_425967 30 43 the the DT 10_1101-2021_01_08_425967 30 44 items item NNS 10_1101-2021_01_08_425967 30 45 may may MD 10_1101-2021_01_08_425967 30 46 be be VB 10_1101-2021_01_08_425967 30 47 due due JJ 10_1101-2021_01_08_425967 30 48 to to IN 10_1101-2021_01_08_425967 30 49 randomness randomness NN 10_1101-2021_01_08_425967 30 50 . . . 10_1101-2021_01_08_425967 31 1 This this DT 10_1101-2021_01_08_425967 31 2 is be VBZ 10_1101-2021_01_08_425967 31 3 a a DT 10_1101-2021_01_08_425967 31 4 serious serious JJ 10_1101-2021_01_08_425967 31 5 caveat caveat NN 10_1101-2021_01_08_425967 31 6 , , , 10_1101-2021_01_08_425967 31 7 since since IN 10_1101-2021_01_08_425967 31 8 the the DT 10_1101-2021_01_08_425967 31 9 insertion insertion NN 10_1101-2021_01_08_425967 31 10 of of IN 10_1101-2021_01_08_425967 31 11 noise noise NN 10_1101-2021_01_08_425967 31 12 can can MD 10_1101-2021_01_08_425967 31 13 lead lead VB 10_1101-2021_01_08_425967 31 14 to to IN 10_1101-2021_01_08_425967 31 15 false false JJ 10_1101-2021_01_08_425967 31 16 conclusion conclusion NN 10_1101-2021_01_08_425967 31 17 or or CC 10_1101-2021_01_08_425967 31 18 misleading misleading JJ 10_1101-2021_01_08_425967 31 19 results result NNS 10_1101-2021_01_08_425967 31 20 . . . 10_1101-2021_01_08_425967 32 1 Furthermore furthermore RB 10_1101-2021_01_08_425967 32 2 , , , 10_1101-2021_01_08_425967 32 3 the the DT 10_1101-2021_01_08_425967 32 4 purging purging NN 10_1101-2021_01_08_425967 32 5 of of IN 10_1101-2021_01_08_425967 32 6 this this DT 10_1101-2021_01_08_425967 32 7 noise noise NN 10_1101-2021_01_08_425967 32 8 can can MD 10_1101-2021_01_08_425967 32 9 lead lead VB 10_1101-2021_01_08_425967 32 10 to to IN 10_1101-2021_01_08_425967 32 11 a a DT 10_1101-2021_01_08_425967 32 12 more more RBR 10_1101-2021_01_08_425967 32 13 efficient efficient JJ 10_1101-2021_01_08_425967 32 14 descriptions description NNS 10_1101-2021_01_08_425967 32 15 of of IN 10_1101-2021_01_08_425967 32 16 markers marker NNS 10_1101-2021_01_08_425967 32 17 and and CC 10_1101-2021_01_08_425967 32 18 its -PRON- PRP$ 10_1101-2021_01_08_425967 32 19 phenomena phenomenon NNS 10_1101-2021_01_08_425967 32 20 , , , 10_1101-2021_01_08_425967 32 21 accelerating accelerate VBG 10_1101-2021_01_08_425967 32 22 the the DT 10_1101-2021_01_08_425967 32 23 advance advance NN 10_1101-2021_01_08_425967 32 24 in in IN 10_1101-2021_01_08_425967 32 25 many many JJ 10_1101-2021_01_08_425967 32 26 fields field NNS 10_1101-2021_01_08_425967 32 27 . . . 10_1101-2021_01_08_425967 33 1 In in IN 10_1101-2021_01_08_425967 33 2 statistics statistic NNS 10_1101-2021_01_08_425967 33 3 , , , 10_1101-2021_01_08_425967 33 4 serial serial JJ 10_1101-2021_01_08_425967 33 5 correlation correlation NN 10_1101-2021_01_08_425967 33 6 ( ( -LRB- 10_1101-2021_01_08_425967 33 7 SC SC NNP 10_1101-2021_01_08_425967 33 8 ) ) -RRB- 10_1101-2021_01_08_425967 33 9 is be VBZ 10_1101-2021_01_08_425967 33 10 a a DT 10_1101-2021_01_08_425967 33 11 term term NN 10_1101-2021_01_08_425967 33 12 used use VBN 10_1101-2021_01_08_425967 33 13 to to TO 10_1101-2021_01_08_425967 33 14 describe describe VB 10_1101-2021_01_08_425967 33 15 the the DT 10_1101-2021_01_08_425967 33 16 relationship relationship NN 10_1101-2021_01_08_425967 33 17 between between IN 10_1101-2021_01_08_425967 33 18 observations observation NNS 10_1101-2021_01_08_425967 33 19 of of IN 10_1101-2021_01_08_425967 33 20 the the DT 10_1101-2021_01_08_425967 33 21 same same JJ 10_1101-2021_01_08_425967 33 22 variable variable NN 10_1101-2021_01_08_425967 33 23 over over IN 10_1101-2021_01_08_425967 33 24 specific specific JJ 10_1101-2021_01_08_425967 33 25 periods period NNS 10_1101-2021_01_08_425967 33 26 . . . 10_1101-2021_01_08_425967 34 1 It -PRON- PRP 10_1101-2021_01_08_425967 34 2 was be VBD 10_1101-2021_01_08_425967 34 3 originally originally RB 10_1101-2021_01_08_425967 34 4 used use VBN 10_1101-2021_01_08_425967 34 5 in in IN 10_1101-2021_01_08_425967 34 6 engineering engineering NN 10_1101-2021_01_08_425967 34 7 to to TO 10_1101-2021_01_08_425967 34 8 determine determine VB 10_1101-2021_01_08_425967 34 9 how how WRB 10_1101-2021_01_08_425967 34 10 a a DT 10_1101-2021_01_08_425967 34 11 signal signal NN 10_1101-2021_01_08_425967 34 12 , , , 10_1101-2021_01_08_425967 34 13 for for IN 10_1101-2021_01_08_425967 34 14 instance instance NN 10_1101-2021_01_08_425967 34 15 , , , 10_1101-2021_01_08_425967 34 16 a a DT 10_1101-2021_01_08_425967 34 17 radio radio NN 10_1101-2021_01_08_425967 34 18 wave wave NN 10_1101-2021_01_08_425967 34 19 , , , 10_1101-2021_01_08_425967 34 20 varies vary VBZ 10_1101-2021_01_08_425967 34 21 with with IN 10_1101-2021_01_08_425967 34 22 itself -PRON- PRP 10_1101-2021_01_08_425967 34 23 over over IN 10_1101-2021_01_08_425967 34 24 time time NN 10_1101-2021_01_08_425967 34 25 . . . 10_1101-2021_01_08_425967 35 1 Later later RB 10_1101-2021_01_08_425967 35 2 , , , 10_1101-2021_01_08_425967 35 3 SC SC NNP 10_1101-2021_01_08_425967 35 4 was be VBD 10_1101-2021_01_08_425967 35 5 adapted adapt VBN 10_1101-2021_01_08_425967 35 6 to to IN 10_1101-2021_01_08_425967 35 7 econometrics econometric NNS 10_1101-2021_01_08_425967 35 8 to to TO 10_1101-2021_01_08_425967 35 9 analyze analyze VB 10_1101-2021_01_08_425967 35 10 economic economic JJ 10_1101-2021_01_08_425967 35 11 data datum NNS 10_1101-2021_01_08_425967 35 12 over over IN 10_1101-2021_01_08_425967 35 13 time time NN 10_1101-2021_01_08_425967 35 14 principally principally RB 10_1101-2021_01_08_425967 35 15 to to TO 10_1101-2021_01_08_425967 35 16 predict predict VB 10_1101-2021_01_08_425967 35 17 stock stock NN 10_1101-2021_01_08_425967 35 18 prices price NNS 10_1101-2021_01_08_425967 35 19 and and CC 10_1101-2021_01_08_425967 35 20 , , , 10_1101-2021_01_08_425967 35 21 in in IN 10_1101-2021_01_08_425967 35 22 other other JJ 10_1101-2021_01_08_425967 35 23 fields field NNS 10_1101-2021_01_08_425967 35 24 , , , 10_1101-2021_01_08_425967 35 25 to to IN 10_1101-2021_01_08_425967 35 26 model model NN 10_1101-2021_01_08_425967 35 27 - - HYPH 10_1101-2021_01_08_425967 35 28 independent independent JJ 10_1101-2021_01_08_425967 35 29 random random JJ 10_1101-2021_01_08_425967 35 30 variables variable NNS 10_1101-2021_01_08_425967 35 31 [ [ -LRB- 10_1101-2021_01_08_425967 35 32 6 6 CD 10_1101-2021_01_08_425967 35 33 ] ] -RRB- 10_1101-2021_01_08_425967 35 34 . . . 10_1101-2021_01_08_425967 36 1 We -PRON- PRP 10_1101-2021_01_08_425967 36 2 applied apply VBD 10_1101-2021_01_08_425967 36 3 the the DT 10_1101-2021_01_08_425967 36 4 SC SC NNP 10_1101-2021_01_08_425967 36 5 to to TO 10_1101-2021_01_08_425967 36 6 propose propose VB 10_1101-2021_01_08_425967 36 7 a a DT 10_1101-2021_01_08_425967 36 8 manner manner NN 10_1101-2021_01_08_425967 36 9 to to TO 10_1101-2021_01_08_425967 36 10 quantify quantify VB 10_1101-2021_01_08_425967 36 11 how how WRB 10_1101-2021_01_08_425967 36 12 well well RB 10_1101-2021_01_08_425967 36 13 is be VBZ 10_1101-2021_01_08_425967 36 14 the the DT 10_1101-2021_01_08_425967 36 15 grouping grouping NN 10_1101-2021_01_08_425967 36 16 of of IN 10_1101-2021_01_08_425967 36 17 a a DT 10_1101-2021_01_08_425967 36 18 posterior posterior NN 10_1101-2021_01_08_425967 36 19 classification classification NN 10_1101-2021_01_08_425967 36 20 just just RB 10_1101-2021_01_08_425967 36 21 by by IN 10_1101-2021_01_08_425967 36 22 retrieving retrieve VBG 10_1101-2021_01_08_425967 36 23 the the DT 10_1101-2021_01_08_425967 36 24 results result NNS 10_1101-2021_01_08_425967 36 25 of of IN 10_1101-2021_01_08_425967 36 26 unsupervised unsupervised JJ 10_1101-2021_01_08_425967 36 27 clustering cluster VBG 10_1101-2021_01_08_425967 36 28 analysis analysis NN 10_1101-2021_01_08_425967 36 29 . . . 10_1101-2021_01_08_425967 37 1 Thus thus RB 10_1101-2021_01_08_425967 37 2 , , , 10_1101-2021_01_08_425967 37 3 we -PRON- PRP 10_1101-2021_01_08_425967 37 4 propose propose VBP 10_1101-2021_01_08_425967 37 5 a a DT 10_1101-2021_01_08_425967 37 6 novel novel JJ 10_1101-2021_01_08_425967 37 7 relative relative JJ 10_1101-2021_01_08_425967 37 8 score score NN 10_1101-2021_01_08_425967 37 9 , , , 10_1101-2021_01_08_425967 37 10 PQA PQA NNP 10_1101-2021_01_08_425967 37 11 , , , 10_1101-2021_01_08_425967 37 12 to to TO 10_1101-2021_01_08_425967 37 13 solve solve VB 10_1101-2021_01_08_425967 37 14 the the DT 10_1101-2021_01_08_425967 37 15 subjectivity subjectivity NN 10_1101-2021_01_08_425967 37 16 of of IN 10_1101-2021_01_08_425967 37 17 the the DT 10_1101-2021_01_08_425967 37 18 visual visual JJ 10_1101-2021_01_08_425967 37 19 inspection inspection NN 10_1101-2021_01_08_425967 37 20 and and CC 10_1101-2021_01_08_425967 37 21 to to TO 10_1101-2021_01_08_425967 37 22 statistically statistically RB 10_1101-2021_01_08_425967 37 23 quantify quantify VB 10_1101-2021_01_08_425967 37 24 how how WRB 10_1101-2021_01_08_425967 37 25 much much JJ 10_1101-2021_01_08_425967 37 26 noise noise NN 10_1101-2021_01_08_425967 37 27 is be VBZ 10_1101-2021_01_08_425967 37 28 embedded embed VBN 10_1101-2021_01_08_425967 37 29 in in IN 10_1101-2021_01_08_425967 37 30 the the DT 10_1101-2021_01_08_425967 37 31 results result NNS 10_1101-2021_01_08_425967 37 32 of of IN 10_1101-2021_01_08_425967 37 33 clustering cluster VBG 10_1101-2021_01_08_425967 37 34 analysis analysis NN 10_1101-2021_01_08_425967 37 35 . . . 10_1101-2021_01_08_425967 38 1 2 2 LS 10_1101-2021_01_08_425967 38 2 . . . 10_1101-2021_01_08_425967 39 1 Methodology methodology NN 10_1101-2021_01_08_425967 39 2 2.1 2.1 CD 10_1101-2021_01_08_425967 39 3 . . . 10_1101-2021_01_08_425967 40 1 Assigning assign VBG 10_1101-2021_01_08_425967 40 2 numeric numeric JJ 10_1101-2021_01_08_425967 40 3 labels label NNS 10_1101-2021_01_08_425967 40 4 to to IN 10_1101-2021_01_08_425967 40 5 classifications classification NNS 10_1101-2021_01_08_425967 40 6 A a DT 10_1101-2021_01_08_425967 40 7 vector vector NN 10_1101-2021_01_08_425967 40 8 denoting denote VBG 10_1101-2021_01_08_425967 40 9 the the DT 10_1101-2021_01_08_425967 40 10 putative putative JJ 10_1101-2021_01_08_425967 40 11 similarities similarity NNS 10_1101-2021_01_08_425967 40 12 among among IN 10_1101-2021_01_08_425967 40 13 the the DT 10_1101-2021_01_08_425967 40 14 variables variable NNS 10_1101-2021_01_08_425967 40 15 in in IN 10_1101-2021_01_08_425967 40 16 a a DT 10_1101-2021_01_08_425967 40 17 study study NN 10_1101-2021_01_08_425967 40 18 is be VBZ 10_1101-2021_01_08_425967 40 19 usually usually RB 10_1101-2021_01_08_425967 40 20 obtained obtain VBN 10_1101-2021_01_08_425967 40 21 after after IN 10_1101-2021_01_08_425967 40 22 a a DT 10_1101-2021_01_08_425967 40 23 clustering cluster VBG 10_1101-2021_01_08_425967 40 24 analysis analysis NN 10_1101-2021_01_08_425967 40 25 . . . 10_1101-2021_01_08_425967 41 1 Each each DT 10_1101-2021_01_08_425967 41 2 variable variable NN 10_1101-2021_01_08_425967 41 3 is be VBZ 10_1101-2021_01_08_425967 41 4 classified classify VBN 10_1101-2021_01_08_425967 41 5 to to TO 10_1101-2021_01_08_425967 41 6 generate generate VB 10_1101-2021_01_08_425967 41 7 a a DT 10_1101-2021_01_08_425967 41 8 vector vector NN 10_1101-2021_01_08_425967 41 9 of of IN 10_1101-2021_01_08_425967 41 10 profiles profile NNS 10_1101-2021_01_08_425967 41 11 ( ( -LRB- 10_1101-2021_01_08_425967 41 12 VP VP NNP 10_1101-2021_01_08_425967 41 13 ) ) -RRB- 10_1101-2021_01_08_425967 41 14 . . . 10_1101-2021_01_08_425967 42 1 Such such PDT 10_1101-2021_01_08_425967 42 2 a a DT 10_1101-2021_01_08_425967 42 3 vector vector NN 10_1101-2021_01_08_425967 42 4 of of IN 10_1101-2021_01_08_425967 42 5 classifications classification NNS 10_1101-2021_01_08_425967 42 6 is be VBZ 10_1101-2021_01_08_425967 42 7 usually usually RB 10_1101-2021_01_08_425967 42 8 translated translate VBN 10_1101-2021_01_08_425967 42 9 into into IN 10_1101-2021_01_08_425967 42 10 a a DT 10_1101-2021_01_08_425967 42 11 colors color NNS 10_1101-2021_01_08_425967 42 12 vector vector NN 10_1101-2021_01_08_425967 42 13 , , , 10_1101-2021_01_08_425967 42 14 in in IN 10_1101-2021_01_08_425967 42 15 which which WDT 10_1101-2021_01_08_425967 42 16 each each DT 10_1101-2021_01_08_425967 42 17 color color NN 10_1101-2021_01_08_425967 42 18 represents represent VBZ 10_1101-2021_01_08_425967 42 19 a a DT 10_1101-2021_01_08_425967 42 20 classification classification NN 10_1101-2021_01_08_425967 42 21 . . . 10_1101-2021_01_08_425967 43 1 It -PRON- PRP 10_1101-2021_01_08_425967 43 2 is be VBZ 10_1101-2021_01_08_425967 43 3 common common JJ 10_1101-2021_01_08_425967 43 4 to to TO 10_1101-2021_01_08_425967 43 5 inspect inspect VB 10_1101-2021_01_08_425967 43 6 this this DT 10_1101-2021_01_08_425967 43 7 vector vector NN 10_1101-2021_01_08_425967 43 8 to to TO 10_1101-2021_01_08_425967 43 9 find find VB 10_1101-2021_01_08_425967 43 10 groups group NNS 10_1101-2021_01_08_425967 43 11 that that WDT 10_1101-2021_01_08_425967 43 12 make make VBP 10_1101-2021_01_08_425967 43 13 sense sense NN 10_1101-2021_01_08_425967 43 14 according accord VBG 10_1101-2021_01_08_425967 43 15 to to IN 10_1101-2021_01_08_425967 43 16 the the DT 10_1101-2021_01_08_425967 43 17 analyzed analyze VBN 10_1101-2021_01_08_425967 43 18 data datum NNS 10_1101-2021_01_08_425967 43 19 . . . 10_1101-2021_01_08_425967 44 1 To to IN 10_1101-2021_01_08_425967 44 2 the the DT 10_1101-2021_01_08_425967 44 3 method method NN 10_1101-2021_01_08_425967 44 4 presented present VBN 10_1101-2021_01_08_425967 44 5 in in IN 10_1101-2021_01_08_425967 44 6 this this DT 10_1101-2021_01_08_425967 44 7 work work NN 10_1101-2021_01_08_425967 44 8 , , , 10_1101-2021_01_08_425967 44 9 the the DT 10_1101-2021_01_08_425967 44 10 VP VP NNP 10_1101-2021_01_08_425967 44 11 may may MD 10_1101-2021_01_08_425967 44 12 be be VB 10_1101-2021_01_08_425967 44 13 as as RB 10_1101-2021_01_08_425967 44 14 simple simple JJ 10_1101-2021_01_08_425967 44 15 as as IN 10_1101-2021_01_08_425967 44 16 a a DT 10_1101-2021_01_08_425967 44 17 vector vector NN 10_1101-2021_01_08_425967 44 18 of of IN 10_1101-2021_01_08_425967 44 19 strings string NNS 10_1101-2021_01_08_425967 44 20 or or CC 10_1101-2021_01_08_425967 44 21 numbers number NNS 10_1101-2021_01_08_425967 44 22 that that WDT 10_1101-2021_01_08_425967 44 23 represent represent VBP 10_1101-2021_01_08_425967 44 24 the the DT 10_1101-2021_01_08_425967 44 25 input input NN 10_1101-2021_01_08_425967 44 26 . . . 10_1101-2021_01_08_425967 45 1 .CC .CC NFP 10_1101-2021_01_08_425967 45 2 - - : 10_1101-2021_01_08_425967 45 3 BY by IN 10_1101-2021_01_08_425967 45 4 4.0 4.0 CD 10_1101-2021_01_08_425967 45 5 International international JJ 10_1101-2021_01_08_425967 45 6 licensemade licensemade NN 10_1101-2021_01_08_425967 45 7 available available JJ 10_1101-2021_01_08_425967 45 8 under under IN 10_1101-2021_01_08_425967 45 9 a a DT 10_1101-2021_01_08_425967 45 10 ( ( -LRB- 10_1101-2021_01_08_425967 45 11 which which WDT 10_1101-2021_01_08_425967 45 12 was be VBD 10_1101-2021_01_08_425967 45 13 not not RB 10_1101-2021_01_08_425967 45 14 certified certify VBN 10_1101-2021_01_08_425967 45 15 by by IN 10_1101-2021_01_08_425967 45 16 peer peer NN 10_1101-2021_01_08_425967 45 17 review review NN 10_1101-2021_01_08_425967 45 18 ) ) -RRB- 10_1101-2021_01_08_425967 45 19 is be VBZ 10_1101-2021_01_08_425967 45 20 the the DT 10_1101-2021_01_08_425967 45 21 author author NN 10_1101-2021_01_08_425967 45 22 / / SYM 10_1101-2021_01_08_425967 45 23 funder funder NN 10_1101-2021_01_08_425967 45 24 , , , 10_1101-2021_01_08_425967 45 25 who who WP 10_1101-2021_01_08_425967 45 26 has have VBZ 10_1101-2021_01_08_425967 45 27 granted grant VBN 10_1101-2021_01_08_425967 45 28 bioRxiv biorxiv IN 10_1101-2021_01_08_425967 45 29 a a DT 10_1101-2021_01_08_425967 45 30 license license NN 10_1101-2021_01_08_425967 45 31 to to TO 10_1101-2021_01_08_425967 45 32 display display VB 10_1101-2021_01_08_425967 45 33 the the DT 10_1101-2021_01_08_425967 45 34 preprint preprint NN 10_1101-2021_01_08_425967 45 35 in in IN 10_1101-2021_01_08_425967 45 36 perpetuity perpetuity NN 10_1101-2021_01_08_425967 45 37 . . . 10_1101-2021_01_08_425967 46 1 It -PRON- PRP 10_1101-2021_01_08_425967 46 2 is be VBZ 10_1101-2021_01_08_425967 46 3 The the DT 10_1101-2021_01_08_425967 46 4 copyright copyright NN 10_1101-2021_01_08_425967 46 5 holder holder NN 10_1101-2021_01_08_425967 46 6 for for IN 10_1101-2021_01_08_425967 46 7 this this DT 10_1101-2021_01_08_425967 46 8 preprintthis preprintthis NN 10_1101-2021_01_08_425967 46 9 version version NN 10_1101-2021_01_08_425967 46 10 posted post VBD 10_1101-2021_01_08_425967 46 11 January January NNP 10_1101-2021_01_08_425967 46 12 9 9 CD 10_1101-2021_01_08_425967 46 13 , , , 10_1101-2021_01_08_425967 46 14 2021 2021 CD 10_1101-2021_01_08_425967 46 15 . . . 10_1101-2021_01_08_425967 46 16 ; ; : 10_1101-2021_01_08_425967 46 17 https://doi.org/10.1101/2021.01.08.425967doi https://doi.org/10.1101/2021.01.08.425967doi ADD 10_1101-2021_01_08_425967 46 18 : : : 10_1101-2021_01_08_425967 46 19 bioRxiv biorxiv VB 10_1101-2021_01_08_425967 46 20 preprint preprint NN 10_1101-2021_01_08_425967 46 21 https://doi.org/10.1101/2021.01.08.425967 https://doi.org/10.1101/2021.01.08.425967 NNP 10_1101-2021_01_08_425967 46 22 http://creativecommons.org/licenses/by/4.0/ http://creativecommons.org/licenses/by/4.0/ -LRB- 10_1101-2021_01_08_425967 46 23 Figure Figure NNP 10_1101-2021_01_08_425967 46 24 1 1 CD 10_1101-2021_01_08_425967 46 25 . . . 10_1101-2021_01_08_425967 47 1 The the DT 10_1101-2021_01_08_425967 47 2 pipeline pipeline NN 10_1101-2021_01_08_425967 47 3 of of IN 10_1101-2021_01_08_425967 47 4 the the DT 10_1101-2021_01_08_425967 47 5 PQA PQA NNP 10_1101-2021_01_08_425967 47 6 methodology methodology NN 10_1101-2021_01_08_425967 47 7 . . . 10_1101-2021_01_08_425967 48 1 Whatever whatever WDT 10_1101-2021_01_08_425967 48 2 representation representation NN 10_1101-2021_01_08_425967 48 3 of of IN 10_1101-2021_01_08_425967 48 4 the the DT 10_1101-2021_01_08_425967 48 5 classifications classification NNS 10_1101-2021_01_08_425967 48 6 may may MD 10_1101-2021_01_08_425967 48 7 be be VB 10_1101-2021_01_08_425967 48 8 , , , 10_1101-2021_01_08_425967 48 9 it -PRON- PRP 10_1101-2021_01_08_425967 48 10 is be VBZ 10_1101-2021_01_08_425967 48 11 necessary necessary JJ 10_1101-2021_01_08_425967 48 12 to to TO 10_1101-2021_01_08_425967 48 13 transform transform VB 10_1101-2021_01_08_425967 48 14 the the DT 10_1101-2021_01_08_425967 48 15 classifications classification NNS 10_1101-2021_01_08_425967 48 16 to to IN 10_1101-2021_01_08_425967 48 17 a a DT 10_1101-2021_01_08_425967 48 18 vector vector NN 10_1101-2021_01_08_425967 48 19 of of IN 10_1101-2021_01_08_425967 48 20 numeric numeric JJ 10_1101-2021_01_08_425967 48 21 labels label NNS 10_1101-2021_01_08_425967 48 22 , , , 10_1101-2021_01_08_425967 48 23 in in IN 10_1101-2021_01_08_425967 48 24 which which WDT 10_1101-2021_01_08_425967 48 25 a a DT 10_1101-2021_01_08_425967 48 26 number number NN 10_1101-2021_01_08_425967 48 27 represents represent VBZ 10_1101-2021_01_08_425967 48 28 a a DT 10_1101-2021_01_08_425967 48 29 classification classification NN 10_1101-2021_01_08_425967 48 30 , , , 10_1101-2021_01_08_425967 48 31 to to TO 10_1101-2021_01_08_425967 48 32 be be VB 10_1101-2021_01_08_425967 48 33 able able JJ 10_1101-2021_01_08_425967 48 34 to to TO 10_1101-2021_01_08_425967 48 35 calculate calculate VB 10_1101-2021_01_08_425967 48 36 SC SC NNP 10_1101-2021_01_08_425967 48 37 . . . 10_1101-2021_01_08_425967 49 1 To to TO 10_1101-2021_01_08_425967 49 2 accomplish accomplish VB 10_1101-2021_01_08_425967 49 3 this this DT 10_1101-2021_01_08_425967 49 4 , , , 10_1101-2021_01_08_425967 49 5 we -PRON- PRP 10_1101-2021_01_08_425967 49 6 assign assign VBP 10_1101-2021_01_08_425967 49 7 the the DT 10_1101-2021_01_08_425967 49 8 first first JJ 10_1101-2021_01_08_425967 49 9 numeric numeric JJ 10_1101-2021_01_08_425967 49 10 label label NN 10_1101-2021_01_08_425967 49 11 ( ( -LRB- 10_1101-2021_01_08_425967 49 12 number number NN 10_1101-2021_01_08_425967 49 13 1 1 CD 10_1101-2021_01_08_425967 49 14 ) ) -RRB- 10_1101-2021_01_08_425967 49 15 to to IN 10_1101-2021_01_08_425967 49 16 the the DT 10_1101-2021_01_08_425967 49 17 first first JJ 10_1101-2021_01_08_425967 49 18 item item NN 10_1101-2021_01_08_425967 49 19 in in IN 10_1101-2021_01_08_425967 49 20 the the DT 10_1101-2021_01_08_425967 49 21 vector vector NN 10_1101-2021_01_08_425967 49 22 , , , 10_1101-2021_01_08_425967 49 23 which which WDT 10_1101-2021_01_08_425967 49 24 usually usually RB 10_1101-2021_01_08_425967 49 25 lays lay VBZ 10_1101-2021_01_08_425967 49 26 at at IN 10_1101-2021_01_08_425967 49 27 one one CD 10_1101-2021_01_08_425967 49 28 of of IN 10_1101-2021_01_08_425967 49 29 the the DT 10_1101-2021_01_08_425967 49 30 vector vector NN 10_1101-2021_01_08_425967 49 31 ’s ’s POS 10_1101-2021_01_08_425967 49 32 extremes extreme NNS 10_1101-2021_01_08_425967 49 33 . . . 10_1101-2021_01_08_425967 50 1 Then then RB 10_1101-2021_01_08_425967 50 2 , , , 10_1101-2021_01_08_425967 50 3 if if IN 10_1101-2021_01_08_425967 50 4 the the DT 10_1101-2021_01_08_425967 50 5 classification classification NN 10_1101-2021_01_08_425967 50 6 o o IN 10_1101-2021_01_08_425967 50 7 the the DT 10_1101-2021_01_08_425967 50 8 next next JJ 10_1101-2021_01_08_425967 50 9 item item NN 10_1101-2021_01_08_425967 50 10 is be VBZ 10_1101-2021_01_08_425967 50 11 different different JJ 10_1101-2021_01_08_425967 50 12 from from IN 10_1101-2021_01_08_425967 50 13 the the DT 10_1101-2021_01_08_425967 50 14 previous previous JJ 10_1101-2021_01_08_425967 50 15 one one NN 10_1101-2021_01_08_425967 50 16 , , , 10_1101-2021_01_08_425967 50 17 the the DT 10_1101-2021_01_08_425967 50 18 next next JJ 10_1101-2021_01_08_425967 50 19 number number NN 10_1101-2021_01_08_425967 50 20 in in IN 10_1101-2021_01_08_425967 50 21 the the DT 10_1101-2021_01_08_425967 50 22 sequence sequence NN 10_1101-2021_01_08_425967 50 23 is be VBZ 10_1101-2021_01_08_425967 50 24 assigned assign VBN 10_1101-2021_01_08_425967 50 25 , , , 10_1101-2021_01_08_425967 50 26 and and CC 10_1101-2021_01_08_425967 50 27 so so RB 10_1101-2021_01_08_425967 50 28 on on RB 10_1101-2021_01_08_425967 50 29 . . . 10_1101-2021_01_08_425967 51 1 This this DT 10_1101-2021_01_08_425967 51 2 way way NN 10_1101-2021_01_08_425967 51 3 of of IN 10_1101-2021_01_08_425967 51 4 labeling label VBG 10_1101-2021_01_08_425967 51 5 warrants warrant NNS 10_1101-2021_01_08_425967 51 6 that that IN 10_1101-2021_01_08_425967 51 7 the the DT 10_1101-2021_01_08_425967 51 8 changes change NNS 10_1101-2021_01_08_425967 51 9 in in IN 10_1101-2021_01_08_425967 51 10 the the DT 10_1101-2021_01_08_425967 51 11 SC SC NNP 10_1101-2021_01_08_425967 51 12 values value NNS 10_1101-2021_01_08_425967 51 13 are be VBP 10_1101-2021_01_08_425967 51 14 due due JJ 10_1101-2021_01_08_425967 51 15 to to IN 10_1101-2021_01_08_425967 51 16 the the DT 10_1101-2021_01_08_425967 51 17 order order NN 10_1101-2021_01_08_425967 51 18 of of IN 10_1101-2021_01_08_425967 51 19 numbers number NNS 10_1101-2021_01_08_425967 51 20 , , , 10_1101-2021_01_08_425967 51 21 that that DT 10_1101-2021_01_08_425967 51 22 is be VBZ 10_1101-2021_01_08_425967 51 23 to to TO 10_1101-2021_01_08_425967 51 24 say say VB 10_1101-2021_01_08_425967 51 25 , , , 10_1101-2021_01_08_425967 51 26 the the DT 10_1101-2021_01_08_425967 51 27 grouping grouping NN 10_1101-2021_01_08_425967 51 28 of of IN 10_1101-2021_01_08_425967 51 29 the the DT 10_1101-2021_01_08_425967 51 30 classifications classification NNS 10_1101-2021_01_08_425967 51 31 resulting result VBG 10_1101-2021_01_08_425967 51 32 from from IN 10_1101-2021_01_08_425967 51 33 the the DT 10_1101-2021_01_08_425967 51 34 clustering clustering NN 10_1101-2021_01_08_425967 51 35 , , , 10_1101-2021_01_08_425967 51 36 and and CC 10_1101-2021_01_08_425967 51 37 it -PRON- PRP 10_1101-2021_01_08_425967 51 38 is be VBZ 10_1101-2021_01_08_425967 51 39 not not RB 10_1101-2021_01_08_425967 51 40 an an DT 10_1101-2021_01_08_425967 51 41 artifact artifact NN 10_1101-2021_01_08_425967 51 42 of of IN 10_1101-2021_01_08_425967 51 43 the the DT 10_1101-2021_01_08_425967 51 44 labeling labeling NN 10_1101-2021_01_08_425967 51 45 itself -PRON- PRP 10_1101-2021_01_08_425967 51 46 ( ( -LRB- 10_1101-2021_01_08_425967 51 47 Figure figure NN 10_1101-2021_01_08_425967 51 48 1 1 CD 10_1101-2021_01_08_425967 51 49 ) ) -RRB- 10_1101-2021_01_08_425967 51 50 . . . 10_1101-2021_01_08_425967 52 1 2.2 2.2 CD 10_1101-2021_01_08_425967 52 2 . . . 10_1101-2021_01_08_425967 53 1 PQA PQA NNP 10_1101-2021_01_08_425967 53 2 score score NN 10_1101-2021_01_08_425967 53 3 Because because IN 10_1101-2021_01_08_425967 53 4 the the DT 10_1101-2021_01_08_425967 53 5 order order NN 10_1101-2021_01_08_425967 53 6 of of IN 10_1101-2021_01_08_425967 53 7 the the DT 10_1101-2021_01_08_425967 53 8 VP VP NNP 10_1101-2021_01_08_425967 53 9 could could MD 10_1101-2021_01_08_425967 53 10 be be VB 10_1101-2021_01_08_425967 53 11 interpreted interpret VBN 10_1101-2021_01_08_425967 53 12 as as IN 10_1101-2021_01_08_425967 53 13 the the DT 10_1101-2021_01_08_425967 53 14 grouping grouping NN 10_1101-2021_01_08_425967 53 15 of of IN 10_1101-2021_01_08_425967 53 16 the the DT 10_1101-2021_01_08_425967 53 17 classifications classification NNS 10_1101-2021_01_08_425967 53 18 , , , 10_1101-2021_01_08_425967 53 19 we -PRON- PRP 10_1101-2021_01_08_425967 53 20 measure measure VBP 10_1101-2021_01_08_425967 53 21 how how WRB 10_1101-2021_01_08_425967 53 22 well well RB 10_1101-2021_01_08_425967 53 23 the the DT 10_1101-2021_01_08_425967 53 24 same same JJ 10_1101-2021_01_08_425967 53 25 classifications classification NNS 10_1101-2021_01_08_425967 53 26 are be VBP 10_1101-2021_01_08_425967 53 27 held hold VBN 10_1101-2021_01_08_425967 53 28 together together RB 10_1101-2021_01_08_425967 53 29 in in IN 10_1101-2021_01_08_425967 53 30 the the DT 10_1101-2021_01_08_425967 53 31 VP vp NN 10_1101-2021_01_08_425967 53 32 through through IN 10_1101-2021_01_08_425967 53 33 an an DT 10_1101-2021_01_08_425967 53 34 SC SC NNP 10_1101-2021_01_08_425967 53 35 shifted shift VBD 10_1101-2021_01_08_425967 53 36 one one CD 10_1101-2021_01_08_425967 53 37 position position NN 10_1101-2021_01_08_425967 53 38 . . . 10_1101-2021_01_08_425967 54 1 Such such JJ 10_1101-2021_01_08_425967 54 2 sort sort NN 10_1101-2021_01_08_425967 54 3 of of IN 10_1101-2021_01_08_425967 54 4 correlation correlation NN 10_1101-2021_01_08_425967 54 5 is be VBZ 10_1101-2021_01_08_425967 54 6 defined define VBN 10_1101-2021_01_08_425967 54 7 as as IN 10_1101-2021_01_08_425967 54 8 the the DT 10_1101-2021_01_08_425967 54 9 Pearson Pearson NNP 10_1101-2021_01_08_425967 54 10 - - HYPH 10_1101-2021_01_08_425967 54 11 product product NN 10_1101-2021_01_08_425967 54 12 - - HYPH 10_1101-2021_01_08_425967 54 13 moment moment NN 10_1101-2021_01_08_425967 54 14 correlation correlation NN 10_1101-2021_01_08_425967 54 15 between between IN 10_1101-2021_01_08_425967 54 16 the the DT 10_1101-2021_01_08_425967 54 17 VP VP NNP 10_1101-2021_01_08_425967 54 18 discarding discard VBG 10_1101-2021_01_08_425967 54 19 the the DT 10_1101-2021_01_08_425967 54 20 first first JJ 10_1101-2021_01_08_425967 54 21 item item NN 10_1101-2021_01_08_425967 54 22 , , , 10_1101-2021_01_08_425967 54 23 and and CC 10_1101-2021_01_08_425967 54 24 the the DT 10_1101-2021_01_08_425967 54 25 VP VP NNP 10_1101-2021_01_08_425967 54 26 discarding discard VBG 10_1101-2021_01_08_425967 54 27 the the DT 10_1101-2021_01_08_425967 54 28 last last JJ 10_1101-2021_01_08_425967 54 29 ( ( -LRB- 10_1101-2021_01_08_425967 54 30 Equation equation NN 10_1101-2021_01_08_425967 54 31 1 1 CD 10_1101-2021_01_08_425967 54 32 , , , 10_1101-2021_01_08_425967 54 33 xi xi NNP 10_1101-2021_01_08_425967 54 34 ( ( -LRB- 10_1101-2021_01_08_425967 54 35 order order NN 10_1101-2021_01_08_425967 54 36 vector vector NNP 10_1101-2021_01_08_425967 54 37 i i NNP 10_1101-2021_01_08_425967 54 38 - - HYPH 10_1101-2021_01_08_425967 54 39 th th NNP 10_1101-2021_01_08_425967 54 40 position position NN 10_1101-2021_01_08_425967 54 41 ) ) -RRB- 10_1101-2021_01_08_425967 54 42 , , , 10_1101-2021_01_08_425967 54 43 n n CC 10_1101-2021_01_08_425967 54 44 ( ( -LRB- 10_1101-2021_01_08_425967 54 45 length length NN 10_1101-2021_01_08_425967 54 46 of of IN 10_1101-2021_01_08_425967 54 47 x x NN 10_1101-2021_01_08_425967 54 48 ) ) -RRB- 10_1101-2021_01_08_425967 54 49 , , , 10_1101-2021_01_08_425967 54 50 𝜌𝑖 𝜌𝑖 XX 10_1101-2021_01_08_425967 54 51 ( ( -LRB- 10_1101-2021_01_08_425967 54 52 resulting result VBG 10_1101-2021_01_08_425967 54 53 SC SC NNP 10_1101-2021_01_08_425967 54 54 ) ) -RRB- 10_1101-2021_01_08_425967 54 55 ) ) -RRB- 10_1101-2021_01_08_425967 54 56 . . . 10_1101-2021_01_08_425967 55 1 𝜌𝑖 𝜌𝑖 FW 10_1101-2021_01_08_425967 55 2 = = NFP 10_1101-2021_01_08_425967 55 3 ∑ ∑ . 10_1101-2021_01_08_425967 55 4 ( ( -LRB- 10_1101-2021_01_08_425967 55 5 𝑥𝑖− 𝑥𝑖− XX 10_1101-2021_01_08_425967 55 6 ∑ ∑ XX 10_1101-2021_01_08_425967 55 7 𝑥𝑖 𝑥𝑖 XX 10_1101-2021_01_08_425967 55 8 𝑛 𝑛 DT 10_1101-2021_01_08_425967 55 9 𝑗=2 𝑗=2 JJ 10_1101-2021_01_08_425967 55 10 𝑛−1 𝑛−1 NNP 10_1101-2021_01_08_425967 55 11 ) ) -RRB- 10_1101-2021_01_08_425967 55 12 ∑ ∑ . 10_1101-2021_01_08_425967 55 13 ( ( -LRB- 10_1101-2021_01_08_425967 55 14 𝑥𝑖− 𝑥𝑖− XX 10_1101-2021_01_08_425967 55 15 ∑ ∑ XX 10_1101-2021_01_08_425967 55 16 𝑥𝑖 𝑥𝑖 VB 10_1101-2021_01_08_425967 55 17 𝑛−1 𝑛−1 NNP 10_1101-2021_01_08_425967 55 18 𝑗=1 𝑗=1 JJ 10_1101-2021_01_08_425967 55 19 𝑛−1 𝑛−1 NNP 10_1101-2021_01_08_425967 55 20 ) ) -RRB- 10_1101-2021_01_08_425967 55 21 𝑛−1 𝑛−1 NNP 10_1101-2021_01_08_425967 55 22 𝑖=1 𝑖=1 NN 10_1101-2021_01_08_425967 55 23 𝑛 𝑛 NN 10_1101-2021_01_08_425967 55 24 𝑖=2 𝑖=2 NN 10_1101-2021_01_08_425967 55 25 √∑ √∑ NNP 10_1101-2021_01_08_425967 55 26 ( ( -LRB- 10_1101-2021_01_08_425967 55 27 𝑥𝑖− 𝑥𝑖− XX 10_1101-2021_01_08_425967 55 28 ∑ ∑ XX 10_1101-2021_01_08_425967 55 29 𝑥𝑖 𝑥𝑖 XX 10_1101-2021_01_08_425967 55 30 𝑛 𝑛 DT 10_1101-2021_01_08_425967 55 31 𝑗=2 𝑗=2 JJ 10_1101-2021_01_08_425967 55 32 𝑛−1 𝑛−1 NNP 10_1101-2021_01_08_425967 55 33 ) ) -RRB- 10_1101-2021_01_08_425967 55 34 2 2 CD 10_1101-2021_01_08_425967 55 35 𝑛 𝑛 NN 10_1101-2021_01_08_425967 55 36 𝑖=2 𝑖=2 CD 10_1101-2021_01_08_425967 55 37 √∑ √∑ NNP 10_1101-2021_01_08_425967 55 38 ( ( -LRB- 10_1101-2021_01_08_425967 55 39 𝑥𝑖 𝑥𝑖 VB 10_1101-2021_01_08_425967 55 40 − − NNP 10_1101-2021_01_08_425967 55 41 ∑ ∑ . 10_1101-2021_01_08_425967 55 42 𝑥𝑖 𝑥𝑖 VB 10_1101-2021_01_08_425967 55 43 𝑛−1 𝑛−1 NNP 10_1101-2021_01_08_425967 55 44 𝑗=1 𝑗=1 VBZ 10_1101-2021_01_08_425967 55 45 𝑛−1 𝑛−1 NNP 10_1101-2021_01_08_425967 55 46 ) ) -RRB- 10_1101-2021_01_08_425967 55 47 2 2 CD 10_1101-2021_01_08_425967 55 48 𝑛−1 𝑛−1 NNP 10_1101-2021_01_08_425967 55 49 𝑖=1 𝑖=1 NNS 10_1101-2021_01_08_425967 55 50 ( ( -LRB- 10_1101-2021_01_08_425967 55 51 1 1 CD 10_1101-2021_01_08_425967 55 52 ) ) -RRB- 10_1101-2021_01_08_425967 55 53 We -PRON- PRP 10_1101-2021_01_08_425967 55 54 then then RB 10_1101-2021_01_08_425967 55 55 define define VBP 10_1101-2021_01_08_425967 55 56 the the DT 10_1101-2021_01_08_425967 55 57 PQA PQA NNP 10_1101-2021_01_08_425967 55 58 as as IN 10_1101-2021_01_08_425967 55 59 the the DT 10_1101-2021_01_08_425967 55 60 SC SC NNP 10_1101-2021_01_08_425967 55 61 of of IN 10_1101-2021_01_08_425967 55 62 the the DT 10_1101-2021_01_08_425967 55 63 VP VP NNP 10_1101-2021_01_08_425967 55 64 after after IN 10_1101-2021_01_08_425967 55 65 removing remove VBG 10_1101-2021_01_08_425967 55 66 background background NN 10_1101-2021_01_08_425967 55 67 noise noise NN 10_1101-2021_01_08_425967 55 68 , , , 10_1101-2021_01_08_425967 55 69 normalized normalize VBD 10_1101-2021_01_08_425967 55 70 for for IN 10_1101-2021_01_08_425967 55 71 the the DT 10_1101-2021_01_08_425967 55 72 SC SC NNP 10_1101-2021_01_08_425967 55 73 of of IN 10_1101-2021_01_08_425967 55 74 the the DT 10_1101-2021_01_08_425967 55 75 percent percent NN 10_1101-2021_01_08_425967 55 76 grouping grouping NN 10_1101-2021_01_08_425967 55 77 partitions partition NNS 10_1101-2021_01_08_425967 55 78 ( ( -LRB- 10_1101-2021_01_08_425967 55 79 defined define VBN 10_1101-2021_01_08_425967 55 80 as as IN 10_1101-2021_01_08_425967 55 81 the the DT 10_1101-2021_01_08_425967 55 82 sorted sorted JJ 10_1101-2021_01_08_425967 55 83 vector vector NN 10_1101-2021_01_08_425967 55 84 in in IN 10_1101-2021_01_08_425967 55 85 ascending ascend VBG 10_1101-2021_01_08_425967 55 86 order order NN 10_1101-2021_01_08_425967 55 87 ) ) -RRB- 10_1101-2021_01_08_425967 55 88 . . . 10_1101-2021_01_08_425967 56 1 This this DT 10_1101-2021_01_08_425967 56 2 , , , 10_1101-2021_01_08_425967 56 3 the the DT 10_1101-2021_01_08_425967 56 4 more more RBR 10_1101-2021_01_08_425967 56 5 similar similar JJ 10_1101-2021_01_08_425967 56 6 VP vp NN 10_1101-2021_01_08_425967 56 7 is be VBZ 10_1101-2021_01_08_425967 56 8 to to IN 10_1101-2021_01_08_425967 56 9 its -PRON- PRP$ 10_1101-2021_01_08_425967 56 10 sorted sorted JJ 10_1101-2021_01_08_425967 56 11 vector vector NN 10_1101-2021_01_08_425967 56 12 , , , 10_1101-2021_01_08_425967 56 13 the the DT 10_1101-2021_01_08_425967 56 14 higher high JJR 10_1101-2021_01_08_425967 56 15 the the DT 10_1101-2021_01_08_425967 56 16 score score NN 10_1101-2021_01_08_425967 56 17 is be VBZ 10_1101-2021_01_08_425967 56 18 yielded yield VBN 10_1101-2021_01_08_425967 56 19 ( ( -LRB- 10_1101-2021_01_08_425967 56 20 Equation Equation NNP 10_1101-2021_01_08_425967 56 21 2 2 CD 10_1101-2021_01_08_425967 56 22 , , , 10_1101-2021_01_08_425967 56 23 𝝆𝒙 𝝆𝒙 NNP 10_1101-2021_01_08_425967 56 24 ( ( -LRB- 10_1101-2021_01_08_425967 56 25 SC SC NNP 10_1101-2021_01_08_425967 56 26 of of IN 10_1101-2021_01_08_425967 56 27 the the DT 10_1101-2021_01_08_425967 56 28 VP VP NNP 10_1101-2021_01_08_425967 56 29 ) ) -RRB- 10_1101-2021_01_08_425967 56 30 , , , 10_1101-2021_01_08_425967 56 31 𝝆𝑹𝒂𝒏𝒅𝒙̅̅ 𝝆𝑹𝒂𝒏𝒅𝒙̅̅ : 10_1101-2021_01_08_425967 56 32 ̅̅ ̅̅ NNP 10_1101-2021_01_08_425967 56 33 ̅̅ ̅̅ NNP 10_1101-2021_01_08_425967 56 34 ̅̅ ̅̅ NNP 10_1101-2021_01_08_425967 56 35 ̅ ̅ . 10_1101-2021_01_08_425967 56 36 ( ( -LRB- 10_1101-2021_01_08_425967 56 37 Mean Mean NNP 10_1101-2021_01_08_425967 56 38 of of IN 10_1101-2021_01_08_425967 56 39 the the DT 10_1101-2021_01_08_425967 56 40 SC SC NNP 10_1101-2021_01_08_425967 56 41 of of IN 10_1101-2021_01_08_425967 56 42 one one CD 10_1101-2021_01_08_425967 56 43 thousand thousand CD 10_1101-2021_01_08_425967 56 44 randomizations randomization NNS 10_1101-2021_01_08_425967 56 45 ) ) -RRB- 10_1101-2021_01_08_425967 56 46 , , , 10_1101-2021_01_08_425967 56 47 𝝆𝑷𝒆𝒓𝒇𝒆𝒄𝒕𝒙 𝝆𝑷𝒆𝒓𝒇𝒆𝒄𝒕𝒙 NNP 10_1101-2021_01_08_425967 56 48 SC SC NNP 10_1101-2021_01_08_425967 56 49 of of IN 10_1101-2021_01_08_425967 56 50 the the DT 10_1101-2021_01_08_425967 56 51 sorted sorted JJ 10_1101-2021_01_08_425967 56 52 vector vector NN 10_1101-2021_01_08_425967 56 53 in in IN 10_1101-2021_01_08_425967 56 54 ascending ascend VBG 10_1101-2021_01_08_425967 56 55 order order NN 10_1101-2021_01_08_425967 56 56 ) ) -RRB- 10_1101-2021_01_08_425967 56 57 ) ) -RRB- 10_1101-2021_01_08_425967 56 58 . . . 10_1101-2021_01_08_425967 57 1 𝑷𝑸𝑨𝒙 𝑷𝑸𝑨𝒙 NNS 10_1101-2021_01_08_425967 57 2 = = SYM 10_1101-2021_01_08_425967 57 3 𝝆𝒙−𝝆𝑹𝒂𝒏𝒅𝒙̅̅ 𝝆𝒙−𝝆𝑹𝒂𝒏𝒅𝒙̅̅ , 10_1101-2021_01_08_425967 57 4 ̅̅ ̅̅ NNP 10_1101-2021_01_08_425967 57 5 ̅̅ ̅̅ NNP 10_1101-2021_01_08_425967 57 6 ̅̅ ̅̅ NNP 10_1101-2021_01_08_425967 57 7 ̅̅ ̅̅ NNP 10_1101-2021_01_08_425967 57 8 ̅ ̅ NNP 10_1101-2021_01_08_425967 57 9 𝝆𝑷𝒆𝒓𝒇𝒆𝒄𝒕𝒙 𝝆𝑷𝒆𝒓𝒇𝒆𝒄𝒕𝒙 NNP 10_1101-2021_01_08_425967 57 10 ( ( -LRB- 10_1101-2021_01_08_425967 57 11 2 2 CD 10_1101-2021_01_08_425967 57 12 ) ) -RRB- 10_1101-2021_01_08_425967 57 13 2.3 2.3 CD 10_1101-2021_01_08_425967 57 14 . . . 10_1101-2021_01_08_425967 58 1 Background background NN 10_1101-2021_01_08_425967 58 2 - - HYPH 10_1101-2021_01_08_425967 58 3 noise noise NNP 10_1101-2021_01_08_425967 58 4 correlation correlation NN 10_1101-2021_01_08_425967 58 5 factor factor NN 10_1101-2021_01_08_425967 58 6 in in IN 10_1101-2021_01_08_425967 58 7 the the DT 10_1101-2021_01_08_425967 58 8 PQA PQA NNP 10_1101-2021_01_08_425967 58 9 score score NN 10_1101-2021_01_08_425967 58 10 .CC .CC NFP 10_1101-2021_01_08_425967 58 11 - - : 10_1101-2021_01_08_425967 58 12 BY by IN 10_1101-2021_01_08_425967 58 13 4.0 4.0 CD 10_1101-2021_01_08_425967 58 14 International international JJ 10_1101-2021_01_08_425967 58 15 licensemade licensemade NN 10_1101-2021_01_08_425967 58 16 available available JJ 10_1101-2021_01_08_425967 58 17 under under IN 10_1101-2021_01_08_425967 58 18 a a DT 10_1101-2021_01_08_425967 58 19 ( ( -LRB- 10_1101-2021_01_08_425967 58 20 which which WDT 10_1101-2021_01_08_425967 58 21 was be VBD 10_1101-2021_01_08_425967 58 22 not not RB 10_1101-2021_01_08_425967 58 23 certified certify VBN 10_1101-2021_01_08_425967 58 24 by by IN 10_1101-2021_01_08_425967 58 25 peer peer NN 10_1101-2021_01_08_425967 58 26 review review NN 10_1101-2021_01_08_425967 58 27 ) ) -RRB- 10_1101-2021_01_08_425967 58 28 is be VBZ 10_1101-2021_01_08_425967 58 29 the the DT 10_1101-2021_01_08_425967 58 30 author author NN 10_1101-2021_01_08_425967 58 31 / / SYM 10_1101-2021_01_08_425967 58 32 funder funder NN 10_1101-2021_01_08_425967 58 33 , , , 10_1101-2021_01_08_425967 58 34 who who WP 10_1101-2021_01_08_425967 58 35 has have VBZ 10_1101-2021_01_08_425967 58 36 granted grant VBN 10_1101-2021_01_08_425967 58 37 bioRxiv biorxiv IN 10_1101-2021_01_08_425967 58 38 a a DT 10_1101-2021_01_08_425967 58 39 license license NN 10_1101-2021_01_08_425967 58 40 to to TO 10_1101-2021_01_08_425967 58 41 display display VB 10_1101-2021_01_08_425967 58 42 the the DT 10_1101-2021_01_08_425967 58 43 preprint preprint NN 10_1101-2021_01_08_425967 58 44 in in IN 10_1101-2021_01_08_425967 58 45 perpetuity perpetuity NN 10_1101-2021_01_08_425967 58 46 . . . 10_1101-2021_01_08_425967 59 1 It -PRON- PRP 10_1101-2021_01_08_425967 59 2 is be VBZ 10_1101-2021_01_08_425967 59 3 The the DT 10_1101-2021_01_08_425967 59 4 copyright copyright NN 10_1101-2021_01_08_425967 59 5 holder holder NN 10_1101-2021_01_08_425967 59 6 for for IN 10_1101-2021_01_08_425967 59 7 this this DT 10_1101-2021_01_08_425967 59 8 preprintthis preprintthis NN 10_1101-2021_01_08_425967 59 9 version version NN 10_1101-2021_01_08_425967 59 10 posted post VBD 10_1101-2021_01_08_425967 59 11 January January NNP 10_1101-2021_01_08_425967 59 12 9 9 CD 10_1101-2021_01_08_425967 59 13 , , , 10_1101-2021_01_08_425967 59 14 2021 2021 CD 10_1101-2021_01_08_425967 59 15 . . . 10_1101-2021_01_08_425967 59 16 ; ; : 10_1101-2021_01_08_425967 59 17 https://doi.org/10.1101/2021.01.08.425967doi https://doi.org/10.1101/2021.01.08.425967doi ADD 10_1101-2021_01_08_425967 59 18 : : : 10_1101-2021_01_08_425967 59 19 bioRxiv biorxiv VB 10_1101-2021_01_08_425967 59 20 preprint preprint NN 10_1101-2021_01_08_425967 59 21 https://doi.org/10.1101/2021.01.08.425967 https://doi.org/10.1101/2021.01.08.425967 UH 10_1101-2021_01_08_425967 59 22 http://creativecommons.org/licenses/by/4.0/ http://creativecommons.org/licenses/by/4.0/ ADD 10_1101-2021_01_08_425967 59 23 To to TO 10_1101-2021_01_08_425967 59 24 compute compute VB 10_1101-2021_01_08_425967 59 25 the the DT 10_1101-2021_01_08_425967 59 26 background background NN 10_1101-2021_01_08_425967 59 27 - - HYPH 10_1101-2021_01_08_425967 59 28 noise noise NN 10_1101-2021_01_08_425967 59 29 correlation correlation NN 10_1101-2021_01_08_425967 59 30 factor factor NN 10_1101-2021_01_08_425967 59 31 in in IN 10_1101-2021_01_08_425967 59 32 the the DT 10_1101-2021_01_08_425967 59 33 PQA PQA NNP 10_1101-2021_01_08_425967 59 34 score score NN 10_1101-2021_01_08_425967 59 35 definition definition NN 10_1101-2021_01_08_425967 59 36 , , , 10_1101-2021_01_08_425967 59 37 we -PRON- PRP 10_1101-2021_01_08_425967 59 38 sample sample VBP 10_1101-2021_01_08_425967 59 39 the the DT 10_1101-2021_01_08_425967 59 40 indexes index NNS 10_1101-2021_01_08_425967 59 41 of of IN 10_1101-2021_01_08_425967 59 42 the the DT 10_1101-2021_01_08_425967 59 43 VP VP NNP 10_1101-2021_01_08_425967 59 44 and and CC 10_1101-2021_01_08_425967 59 45 the the DT 10_1101-2021_01_08_425967 59 46 swapping swap VBG 10_1101-2021_01_08_425967 59 47 the the DT 10_1101-2021_01_08_425967 59 48 corresponding correspond VBG 10_1101-2021_01_08_425967 59 49 items item NNS 10_1101-2021_01_08_425967 59 50 . . . 10_1101-2021_01_08_425967 60 1 This this DT 10_1101-2021_01_08_425967 60 2 background background NN 10_1101-2021_01_08_425967 60 3 correction correction NN 10_1101-2021_01_08_425967 60 4 is be VBZ 10_1101-2021_01_08_425967 60 5 aimed aim VBN 10_1101-2021_01_08_425967 60 6 to to TO 10_1101-2021_01_08_425967 60 7 remove remove VB 10_1101-2021_01_08_425967 60 8 inherent inherent JJ 10_1101-2021_01_08_425967 60 9 noise noise NN 10_1101-2021_01_08_425967 60 10 in in IN 10_1101-2021_01_08_425967 60 11 the the DT 10_1101-2021_01_08_425967 60 12 data datum NNS 10_1101-2021_01_08_425967 60 13 , , , 10_1101-2021_01_08_425967 60 14 even even RB 10_1101-2021_01_08_425967 60 15 though though IN 10_1101-2021_01_08_425967 60 16 the the DT 10_1101-2021_01_08_425967 60 17 score score NN 10_1101-2021_01_08_425967 60 18 may may MD 10_1101-2021_01_08_425967 60 19 still still RB 10_1101-2021_01_08_425967 60 20 be be VB 10_1101-2021_01_08_425967 60 21 subjected subject VBN 10_1101-2021_01_08_425967 60 22 to to TO 10_1101-2021_01_08_425967 60 23 noise noise NN 10_1101-2021_01_08_425967 60 24 from from IN 10_1101-2021_01_08_425967 60 25 the the DT 10_1101-2021_01_08_425967 60 26 chosen choose VBN 10_1101-2021_01_08_425967 60 27 clustering cluster VBG 10_1101-2021_01_08_425967 60 28 algorithm algorithm NN 10_1101-2021_01_08_425967 60 29 or or CC 10_1101-2021_01_08_425967 60 30 discrepancies discrepancy NNS 10_1101-2021_01_08_425967 60 31 in in IN 10_1101-2021_01_08_425967 60 32 the the DT 10_1101-2021_01_08_425967 60 33 posterior posterior NN 10_1101-2021_01_08_425967 60 34 classification classification NN 10_1101-2021_01_08_425967 60 35 . . . 10_1101-2021_01_08_425967 61 1 2.4 2.4 CD 10_1101-2021_01_08_425967 61 2 . . . 10_1101-2021_01_08_425967 62 1 Statistical statistical JJ 10_1101-2021_01_08_425967 62 2 significance significance NN 10_1101-2021_01_08_425967 62 3 of of IN 10_1101-2021_01_08_425967 62 4 the the DT 10_1101-2021_01_08_425967 62 5 PQA PQA NNP 10_1101-2021_01_08_425967 62 6 score score NN 10_1101-2021_01_08_425967 62 7 To to TO 10_1101-2021_01_08_425967 62 8 quantify quantify VB 10_1101-2021_01_08_425967 62 9 the the DT 10_1101-2021_01_08_425967 62 10 statistical statistical JJ 10_1101-2021_01_08_425967 62 11 significance significance NN 10_1101-2021_01_08_425967 62 12 of of IN 10_1101-2021_01_08_425967 62 13 the the DT 10_1101-2021_01_08_425967 62 14 PQA PQA NNP 10_1101-2021_01_08_425967 62 15 score score NN 10_1101-2021_01_08_425967 62 16 , , , 10_1101-2021_01_08_425967 62 17 we -PRON- PRP 10_1101-2021_01_08_425967 62 18 calculate calculate VBP 10_1101-2021_01_08_425967 62 19 a a DT 10_1101-2021_01_08_425967 62 20 Z z NN 10_1101-2021_01_08_425967 62 21 - - HYPH 10_1101-2021_01_08_425967 62 22 score score NN 10_1101-2021_01_08_425967 62 23 ( ( -LRB- 10_1101-2021_01_08_425967 62 24 Equation equation NN 10_1101-2021_01_08_425967 62 25 3 3 CD 10_1101-2021_01_08_425967 62 26 ) ) -RRB- 10_1101-2021_01_08_425967 62 27 , , , 10_1101-2021_01_08_425967 62 28 𝒛𝒙 𝒛𝒙 JJ 10_1101-2021_01_08_425967 62 29 = = SYM 10_1101-2021_01_08_425967 62 30 𝑷𝑸𝑨𝒙−𝑷𝑸𝑨𝑹𝒂𝒏𝒅̅̅ 𝑷𝑸𝑨𝒙−𝑷𝑸𝑨𝑹𝒂𝒏𝒅̅̅ FW 10_1101-2021_01_08_425967 62 31 ̅̅ ̅̅ NNP 10_1101-2021_01_08_425967 62 32 ̅̅ ̅̅ NNP 10_1101-2021_01_08_425967 62 33 ̅̅ ̅̅ NNP 10_1101-2021_01_08_425967 62 34 ̅̅ ̅̅ NNP 10_1101-2021_01_08_425967 62 35 ̅̅ ̅̅ NNP 10_1101-2021_01_08_425967 62 36 ̅ ̅ NNP 10_1101-2021_01_08_425967 62 37 𝑺𝑫𝑷𝑸𝑨𝑹𝒂𝒏𝒅 𝑺𝑫𝑷𝑸𝑨𝑹𝒂𝒏𝒅 JJ 10_1101-2021_01_08_425967 62 38 ( ( -LRB- 10_1101-2021_01_08_425967 62 39 3 3 CD 10_1101-2021_01_08_425967 62 40 ) ) -RRB- 10_1101-2021_01_08_425967 62 41 where where WRB 10_1101-2021_01_08_425967 62 42 𝑃𝑄𝐴𝑥 𝑃𝑄𝐴𝑥 NNS 10_1101-2021_01_08_425967 62 43 is be VBZ 10_1101-2021_01_08_425967 62 44 the the DT 10_1101-2021_01_08_425967 62 45 PQA PQA NNP 10_1101-2021_01_08_425967 62 46 score score NN 10_1101-2021_01_08_425967 62 47 of of IN 10_1101-2021_01_08_425967 62 48 the the DT 10_1101-2021_01_08_425967 62 49 VP VP NNP 10_1101-2021_01_08_425967 62 50 , , , 10_1101-2021_01_08_425967 62 51 𝑃𝑄𝐴𝑅𝑎𝑛𝑑̅̅ 𝑃𝑄𝐴𝑅𝑎𝑛𝑑̅̅ NNP 10_1101-2021_01_08_425967 62 52 ̅̅ ̅̅ NNP 10_1101-2021_01_08_425967 62 53 ̅̅ ̅̅ NNP 10_1101-2021_01_08_425967 62 54 ̅̅ ̅̅ NNP 10_1101-2021_01_08_425967 62 55 ̅̅ ̅̅ NNP 10_1101-2021_01_08_425967 62 56 ̅̅ ̅̅ NNP 10_1101-2021_01_08_425967 62 57 is be VBZ 10_1101-2021_01_08_425967 62 58 the the DT 10_1101-2021_01_08_425967 62 59 mean mean NN 10_1101-2021_01_08_425967 62 60 of of IN 10_1101-2021_01_08_425967 62 61 PQA PQA NNP 10_1101-2021_01_08_425967 62 62 scores score NNS 10_1101-2021_01_08_425967 62 63 of of IN 10_1101-2021_01_08_425967 62 64 one one CD 10_1101-2021_01_08_425967 62 65 thousand thousand CD 10_1101-2021_01_08_425967 62 66 randomizations randomization NNS 10_1101-2021_01_08_425967 62 67 of of IN 10_1101-2021_01_08_425967 62 68 the the DT 10_1101-2021_01_08_425967 62 69 VP vp NN 10_1101-2021_01_08_425967 62 70 . . . 10_1101-2021_01_08_425967 63 1 These these DT 10_1101-2021_01_08_425967 63 2 randomizations randomization NNS 10_1101-2021_01_08_425967 63 3 have have VBP 10_1101-2021_01_08_425967 63 4 the the DT 10_1101-2021_01_08_425967 63 5 purpose purpose NN 10_1101-2021_01_08_425967 63 6 of of IN 10_1101-2021_01_08_425967 63 7 generating generate VBG 10_1101-2021_01_08_425967 63 8 a a DT 10_1101-2021_01_08_425967 63 9 solid solid JJ 10_1101-2021_01_08_425967 63 10 random random JJ 10_1101-2021_01_08_425967 63 11 background background NN 10_1101-2021_01_08_425967 63 12 to to TO 10_1101-2021_01_08_425967 63 13 compare compare VB 10_1101-2021_01_08_425967 63 14 it -PRON- PRP 10_1101-2021_01_08_425967 63 15 to to IN 10_1101-2021_01_08_425967 63 16 the the DT 10_1101-2021_01_08_425967 63 17 real real JJ 10_1101-2021_01_08_425967 63 18 signal signal NN 10_1101-2021_01_08_425967 63 19 . . . 10_1101-2021_01_08_425967 64 1 The the DT 10_1101-2021_01_08_425967 64 2 number number NN 10_1101-2021_01_08_425967 64 3 of of IN 10_1101-2021_01_08_425967 64 4 randomizations randomization NNS 10_1101-2021_01_08_425967 64 5 does do VBZ 10_1101-2021_01_08_425967 64 6 not not RB 10_1101-2021_01_08_425967 64 7 depend depend VB 10_1101-2021_01_08_425967 64 8 on on IN 10_1101-2021_01_08_425967 64 9 the the DT 10_1101-2021_01_08_425967 64 10 size size NN 10_1101-2021_01_08_425967 64 11 of of IN 10_1101-2021_01_08_425967 64 12 the the DT 10_1101-2021_01_08_425967 64 13 VP VP NNP 10_1101-2021_01_08_425967 64 14 . . . 10_1101-2021_01_08_425967 65 1 It -PRON- PRP 10_1101-2021_01_08_425967 65 2 is be VBZ 10_1101-2021_01_08_425967 65 3 worth worth JJ 10_1101-2021_01_08_425967 65 4 to to TO 10_1101-2021_01_08_425967 65 5 notice notice VB 10_1101-2021_01_08_425967 65 6 that that IN 10_1101-2021_01_08_425967 65 7 there there EX 10_1101-2021_01_08_425967 65 8 are be VBP 10_1101-2021_01_08_425967 65 9 two two CD 10_1101-2021_01_08_425967 65 10 randomization randomization NN 10_1101-2021_01_08_425967 65 11 processes process NNS 10_1101-2021_01_08_425967 65 12 , , , 10_1101-2021_01_08_425967 65 13 one one CD 10_1101-2021_01_08_425967 65 14 is be VBZ 10_1101-2021_01_08_425967 65 15 meant mean VBN 10_1101-2021_01_08_425967 65 16 to to TO 10_1101-2021_01_08_425967 65 17 generate generate VB 10_1101-2021_01_08_425967 65 18 the the DT 10_1101-2021_01_08_425967 65 19 input input NN 10_1101-2021_01_08_425967 65 20 population population NN 10_1101-2021_01_08_425967 65 21 of of IN 10_1101-2021_01_08_425967 65 22 random random JJ 10_1101-2021_01_08_425967 65 23 vectors vector NNS 10_1101-2021_01_08_425967 65 24 to to TO 10_1101-2021_01_08_425967 65 25 calculate calculate VB 10_1101-2021_01_08_425967 65 26 the the DT 10_1101-2021_01_08_425967 65 27 PQA PQA NNP 10_1101-2021_01_08_425967 65 28 score score NN 10_1101-2021_01_08_425967 65 29 to to TO 10_1101-2021_01_08_425967 65 30 further further RB 10_1101-2021_01_08_425967 65 31 calculate calculate VB 10_1101-2021_01_08_425967 65 32 a a DT 10_1101-2021_01_08_425967 65 33 Z- z- NN 10_1101-2021_01_08_425967 65 34 score score NN 10_1101-2021_01_08_425967 65 35 and and CC 10_1101-2021_01_08_425967 65 36 the the DT 10_1101-2021_01_08_425967 65 37 other other JJ 10_1101-2021_01_08_425967 65 38 is be VBZ 10_1101-2021_01_08_425967 65 39 representing represent VBG 10_1101-2021_01_08_425967 65 40 the the DT 10_1101-2021_01_08_425967 65 41 noise noise NN 10_1101-2021_01_08_425967 65 42 in in IN 10_1101-2021_01_08_425967 65 43 Equation Equation NNP 10_1101-2021_01_08_425967 65 44 2 2 CD 10_1101-2021_01_08_425967 65 45 . . . 10_1101-2021_01_08_425967 66 1 2.5 2.5 CD 10_1101-2021_01_08_425967 66 2 . . . 10_1101-2021_01_08_425967 67 1 Defining define VBG 10_1101-2021_01_08_425967 67 2 noise noise NN 10_1101-2021_01_08_425967 67 3 proportions proportion NNS 10_1101-2021_01_08_425967 67 4 To to TO 10_1101-2021_01_08_425967 67 5 provide provide VB 10_1101-2021_01_08_425967 67 6 a a DT 10_1101-2021_01_08_425967 67 7 quantification quantification NN 10_1101-2021_01_08_425967 67 8 of of IN 10_1101-2021_01_08_425967 67 9 the the DT 10_1101-2021_01_08_425967 67 10 embedded embed VBN 10_1101-2021_01_08_425967 67 11 noise noise NN 10_1101-2021_01_08_425967 67 12 in in IN 10_1101-2021_01_08_425967 67 13 the the DT 10_1101-2021_01_08_425967 67 14 VP VP NNP 10_1101-2021_01_08_425967 67 15 , , , 10_1101-2021_01_08_425967 67 16 we -PRON- PRP 10_1101-2021_01_08_425967 67 17 calculate calculate VBP 10_1101-2021_01_08_425967 67 18 the the DT 10_1101-2021_01_08_425967 67 19 Z z NN 10_1101-2021_01_08_425967 67 20 - - HYPH 10_1101-2021_01_08_425967 67 21 scores score NNS 10_1101-2021_01_08_425967 67 22 from from IN 10_1101-2021_01_08_425967 67 23 the the DT 10_1101-2021_01_08_425967 67 24 distribution distribution NN 10_1101-2021_01_08_425967 67 25 of of IN 10_1101-2021_01_08_425967 67 26 PQA PQA NNP 10_1101-2021_01_08_425967 67 27 values value NNS 10_1101-2021_01_08_425967 67 28 of of IN 10_1101-2021_01_08_425967 67 29 the the DT 10_1101-2021_01_08_425967 67 30 randomized randomized JJ 10_1101-2021_01_08_425967 67 31 vectors vector NNS 10_1101-2021_01_08_425967 67 32 . . . 10_1101-2021_01_08_425967 68 1 This this DT 10_1101-2021_01_08_425967 68 2 shuffling shuffling NN 10_1101-2021_01_08_425967 68 3 is be VBZ 10_1101-2021_01_08_425967 68 4 yielded yield VBN 10_1101-2021_01_08_425967 68 5 by by IN 10_1101-2021_01_08_425967 68 6 scrambling scramble VBG 10_1101-2021_01_08_425967 68 7 the the DT 10_1101-2021_01_08_425967 68 8 vector vector NN 10_1101-2021_01_08_425967 68 9 . . . 10_1101-2021_01_08_425967 69 1 Then then RB 10_1101-2021_01_08_425967 69 2 this this DT 10_1101-2021_01_08_425967 69 3 Z z NN 10_1101-2021_01_08_425967 69 4 - - HYPH 10_1101-2021_01_08_425967 69 5 score score NN 10_1101-2021_01_08_425967 69 6 is be VBZ 10_1101-2021_01_08_425967 69 7 interpolated interpolate VBN 10_1101-2021_01_08_425967 69 8 to to TO 10_1101-2021_01_08_425967 69 9 retrieve retrieve VB 10_1101-2021_01_08_425967 69 10 the the DT 10_1101-2021_01_08_425967 69 11 estimated estimate VBN 10_1101-2021_01_08_425967 69 12 noise noise NN 10_1101-2021_01_08_425967 69 13 in in IN 10_1101-2021_01_08_425967 69 14 the the DT 10_1101-2021_01_08_425967 69 15 VP VP NNP 10_1101-2021_01_08_425967 69 16 cluster cluster NN 10_1101-2021_01_08_425967 69 17 . . . 10_1101-2021_01_08_425967 70 1 2.6 2.6 CD 10_1101-2021_01_08_425967 70 2 . . . 10_1101-2021_01_08_425967 71 1 Effect effect NN 10_1101-2021_01_08_425967 71 2 of of IN 10_1101-2021_01_08_425967 71 3 the the DT 10_1101-2021_01_08_425967 71 4 length length NN 10_1101-2021_01_08_425967 71 5 and and CC 10_1101-2021_01_08_425967 71 6 number number NN 10_1101-2021_01_08_425967 71 7 of of IN 10_1101-2021_01_08_425967 71 8 partitions partition NNS 10_1101-2021_01_08_425967 71 9 of of IN 10_1101-2021_01_08_425967 71 10 the the DT 10_1101-2021_01_08_425967 71 11 vector vector NN 10_1101-2021_01_08_425967 71 12 in in IN 10_1101-2021_01_08_425967 71 13 the the DT 10_1101-2021_01_08_425967 71 14 Z z JJ 10_1101-2021_01_08_425967 71 15 - - HYPH 10_1101-2021_01_08_425967 71 16 score score NN 10_1101-2021_01_08_425967 71 17 distributions distribution NNS 10_1101-2021_01_08_425967 71 18 . . . 10_1101-2021_01_08_425967 72 1 Since since IN 10_1101-2021_01_08_425967 72 2 we -PRON- PRP 10_1101-2021_01_08_425967 72 3 want want VBP 10_1101-2021_01_08_425967 72 4 to to TO 10_1101-2021_01_08_425967 72 5 compare compare VB 10_1101-2021_01_08_425967 72 6 the the DT 10_1101-2021_01_08_425967 72 7 PQA PQA NNP 10_1101-2021_01_08_425967 72 8 with with IN 10_1101-2021_01_08_425967 72 9 the the DT 10_1101-2021_01_08_425967 72 10 noise noise NN 10_1101-2021_01_08_425967 72 11 , , , 10_1101-2021_01_08_425967 72 12 we -PRON- PRP 10_1101-2021_01_08_425967 72 13 randomized randomize VBD 10_1101-2021_01_08_425967 72 14 1000 1000 CD 10_1101-2021_01_08_425967 72 15 times time NNS 10_1101-2021_01_08_425967 72 16 the the DT 10_1101-2021_01_08_425967 72 17 VP VP NNP 10_1101-2021_01_08_425967 72 18 . . . 10_1101-2021_01_08_425967 73 1 We -PRON- PRP 10_1101-2021_01_08_425967 73 2 opted opt VBD 10_1101-2021_01_08_425967 73 3 to to TO 10_1101-2021_01_08_425967 73 4 describe describe VB 10_1101-2021_01_08_425967 73 5 the the DT 10_1101-2021_01_08_425967 73 6 dynamic dynamic NN 10_1101-2021_01_08_425967 73 7 of of IN 10_1101-2021_01_08_425967 73 8 the the DT 10_1101-2021_01_08_425967 73 9 Z z NN 10_1101-2021_01_08_425967 73 10 - - HYPH 10_1101-2021_01_08_425967 73 11 score score NN 10_1101-2021_01_08_425967 73 12 given give VBN 10_1101-2021_01_08_425967 73 13 the the DT 10_1101-2021_01_08_425967 73 14 different different JJ 10_1101-2021_01_08_425967 73 15 percentage percentage NN 10_1101-2021_01_08_425967 73 16 of of IN 10_1101-2021_01_08_425967 73 17 noise noise NN 10_1101-2021_01_08_425967 73 18 and and CC 10_1101-2021_01_08_425967 73 19 the the DT 10_1101-2021_01_08_425967 73 20 number number NN 10_1101-2021_01_08_425967 73 21 of of IN 10_1101-2021_01_08_425967 73 22 partitions partition NNS 10_1101-2021_01_08_425967 73 23 . . . 10_1101-2021_01_08_425967 74 1 For for IN 10_1101-2021_01_08_425967 74 2 this this DT 10_1101-2021_01_08_425967 74 3 , , , 10_1101-2021_01_08_425967 74 4 we -PRON- PRP 10_1101-2021_01_08_425967 74 5 synthetically synthetically RB 10_1101-2021_01_08_425967 74 6 crafted craft VBD 10_1101-2021_01_08_425967 74 7 vector vector NN 10_1101-2021_01_08_425967 74 8 of of IN 10_1101-2021_01_08_425967 74 9 both both DT 10_1101-2021_01_08_425967 74 10 ranging range VBG 10_1101-2021_01_08_425967 74 11 from from IN 10_1101-2021_01_08_425967 74 12 0 0 CD 10_1101-2021_01_08_425967 74 13 to to IN 10_1101-2021_01_08_425967 74 14 100 100 CD 10_1101-2021_01_08_425967 74 15 elements element NNS 10_1101-2021_01_08_425967 74 16 and and CC 10_1101-2021_01_08_425967 74 17 number number NN 10_1101-2021_01_08_425967 74 18 of of IN 10_1101-2021_01_08_425967 74 19 classifications classification NNS 10_1101-2021_01_08_425967 74 20 . . . 10_1101-2021_01_08_425967 75 1 The the DT 10_1101-2021_01_08_425967 75 2 Z z NN 10_1101-2021_01_08_425967 75 3 - - HYPH 10_1101-2021_01_08_425967 75 4 scores score NNS 10_1101-2021_01_08_425967 75 5 were be VBD 10_1101-2021_01_08_425967 75 6 retrieved retrieve VBN 10_1101-2021_01_08_425967 75 7 from from IN 10_1101-2021_01_08_425967 75 8 the the DT 10_1101-2021_01_08_425967 75 9 crafted crafted JJ 10_1101-2021_01_08_425967 75 10 vectors vector NNS 10_1101-2021_01_08_425967 75 11 using use VBG 10_1101-2021_01_08_425967 75 12 the the DT 10_1101-2021_01_08_425967 75 13 formulas formula NNS 10_1101-2021_01_08_425967 75 14 described describe VBN 10_1101-2021_01_08_425967 75 15 above above RB 10_1101-2021_01_08_425967 75 16 . . . 10_1101-2021_01_08_425967 76 1 3 3 LS 10_1101-2021_01_08_425967 76 2 . . . 10_1101-2021_01_08_425967 77 1 Results result NNS 10_1101-2021_01_08_425967 77 2 and and CC 10_1101-2021_01_08_425967 77 3 Discussion Discussion NNP 10_1101-2021_01_08_425967 77 4 3.1 3.1 CD 10_1101-2021_01_08_425967 77 5 . . . 10_1101-2021_01_08_425967 78 1 Effects effect NNS 10_1101-2021_01_08_425967 78 2 of of IN 10_1101-2021_01_08_425967 78 3 permuted permute VBN 10_1101-2021_01_08_425967 78 4 numeric numeric JJ 10_1101-2021_01_08_425967 78 5 labels label NNS 10_1101-2021_01_08_425967 78 6 on on IN 10_1101-2021_01_08_425967 78 7 the the DT 10_1101-2021_01_08_425967 78 8 partition partition NN 10_1101-2021_01_08_425967 78 9 We -PRON- PRP 10_1101-2021_01_08_425967 78 10 wondered wonder VBD 10_1101-2021_01_08_425967 78 11 whether whether IN 10_1101-2021_01_08_425967 78 12 the the DT 10_1101-2021_01_08_425967 78 13 correct correct JJ 10_1101-2021_01_08_425967 78 14 assigning assigning NN 10_1101-2021_01_08_425967 78 15 of of IN 10_1101-2021_01_08_425967 78 16 numeric numeric JJ 10_1101-2021_01_08_425967 78 17 labels label NNS 10_1101-2021_01_08_425967 78 18 to to TO 10_1101-2021_01_08_425967 78 19 alter alter VB 10_1101-2021_01_08_425967 78 20 the the DT 10_1101-2021_01_08_425967 78 21 less less RBR 10_1101-2021_01_08_425967 78 22 possible possible JJ 10_1101-2021_01_08_425967 78 23 the the DT 10_1101-2021_01_08_425967 78 24 SC SC NNP 10_1101-2021_01_08_425967 78 25 calculations calculation NNS 10_1101-2021_01_08_425967 78 26 , , , 10_1101-2021_01_08_425967 78 27 so so RB 10_1101-2021_01_08_425967 78 28 we -PRON- PRP 10_1101-2021_01_08_425967 78 29 analyzed analyze VBD 10_1101-2021_01_08_425967 78 30 how how WRB 10_1101-2021_01_08_425967 78 31 the the DT 10_1101-2021_01_08_425967 78 32 SC SC NNP 10_1101-2021_01_08_425967 78 33 changes change VBZ 10_1101-2021_01_08_425967 78 34 over over IN 10_1101-2021_01_08_425967 78 35 the the DT 10_1101-2021_01_08_425967 78 36 synthetic synthetic JJ 10_1101-2021_01_08_425967 78 37 partitions partition NNS 10_1101-2021_01_08_425967 78 38 with with IN 10_1101-2021_01_08_425967 78 39 permuted permute VBN 10_1101-2021_01_08_425967 78 40 labels label NNS 10_1101-2021_01_08_425967 78 41 . . . 10_1101-2021_01_08_425967 79 1 We -PRON- PRP 10_1101-2021_01_08_425967 79 2 began begin VBD 10_1101-2021_01_08_425967 79 3 generating generate VBG 10_1101-2021_01_08_425967 79 4 synthetic synthetic JJ 10_1101-2021_01_08_425967 79 5 partitions partition NNS 10_1101-2021_01_08_425967 79 6 in in IN 10_1101-2021_01_08_425967 79 7 ascending ascend VBG 10_1101-2021_01_08_425967 79 8 and and CC 10_1101-2021_01_08_425967 79 9 descending descend VBG 10_1101-2021_01_08_425967 79 10 order order NN 10_1101-2021_01_08_425967 79 11 , , , 10_1101-2021_01_08_425967 79 12 increasing increase VBG 10_1101-2021_01_08_425967 79 13 both both CC 10_1101-2021_01_08_425967 79 14 the the DT 10_1101-2021_01_08_425967 79 15 number number NN 10_1101-2021_01_08_425967 79 16 of of IN 10_1101-2021_01_08_425967 79 17 classifications classification NNS 10_1101-2021_01_08_425967 79 18 and and CC 10_1101-2021_01_08_425967 79 19 the the DT 10_1101-2021_01_08_425967 79 20 number number NN 10_1101-2021_01_08_425967 79 21 of of IN 10_1101-2021_01_08_425967 79 22 items item NNS 10_1101-2021_01_08_425967 79 23 , , , 10_1101-2021_01_08_425967 79 24 up up RB 10_1101-2021_01_08_425967 79 25 to to TO 10_1101-2021_01_08_425967 79 26 100 100 CD 10_1101-2021_01_08_425967 79 27 . . . 10_1101-2021_01_08_425967 80 1 It -PRON- PRP 10_1101-2021_01_08_425967 80 2 is be VBZ 10_1101-2021_01_08_425967 80 3 important important JJ 10_1101-2021_01_08_425967 80 4 to to TO 10_1101-2021_01_08_425967 80 5 highlight highlight VB 10_1101-2021_01_08_425967 80 6 that that IN 10_1101-2021_01_08_425967 80 7 the the DT 10_1101-2021_01_08_425967 80 8 number number NN 10_1101-2021_01_08_425967 80 9 of of IN 10_1101-2021_01_08_425967 80 10 items item NNS 10_1101-2021_01_08_425967 80 11 belonging belong VBG 10_1101-2021_01_08_425967 80 12 to to IN 10_1101-2021_01_08_425967 80 13 each each DT 10_1101-2021_01_08_425967 80 14 classification classification NN 10_1101-2021_01_08_425967 80 15 was be VBD 10_1101-2021_01_08_425967 80 16 kept keep VBN 10_1101-2021_01_08_425967 80 17 constant constant JJ 10_1101-2021_01_08_425967 80 18 . . . 10_1101-2021_01_08_425967 81 1 Because because IN 10_1101-2021_01_08_425967 81 2 trying try VBG 10_1101-2021_01_08_425967 81 3 all all PDT 10_1101-2021_01_08_425967 81 4 the the DT 10_1101-2021_01_08_425967 81 5 possible possible JJ 10_1101-2021_01_08_425967 81 6 permutations permutation NNS 10_1101-2021_01_08_425967 81 7 for for IN 10_1101-2021_01_08_425967 81 8 each each DT 10_1101-2021_01_08_425967 81 9 vector vector NN 10_1101-2021_01_08_425967 81 10 would would MD 10_1101-2021_01_08_425967 81 11 be be VB 10_1101-2021_01_08_425967 81 12 implausible implausible JJ 10_1101-2021_01_08_425967 81 13 , , , 10_1101-2021_01_08_425967 81 14 we -PRON- PRP 10_1101-2021_01_08_425967 81 15 created create VBD 10_1101-2021_01_08_425967 81 16 a a DT 10_1101-2021_01_08_425967 81 17 subset subset NN 10_1101-2021_01_08_425967 81 18 of of IN 10_1101-2021_01_08_425967 81 19 1000 1000 CD 10_1101-2021_01_08_425967 81 20 permutations permutation NNS 10_1101-2021_01_08_425967 81 21 of of IN 10_1101-2021_01_08_425967 81 22 each each DT 10_1101-2021_01_08_425967 81 23 vector vector NN 10_1101-2021_01_08_425967 81 24 , , , 10_1101-2021_01_08_425967 81 25 then then RB 10_1101-2021_01_08_425967 81 26 we -PRON- PRP 10_1101-2021_01_08_425967 81 27 calculated calculate VBD 10_1101-2021_01_08_425967 81 28 the the DT 10_1101-2021_01_08_425967 81 29 mean mean JJ 10_1101-2021_01_08_425967 81 30 SC SC NNP 10_1101-2021_01_08_425967 81 31 ( ( -LRB- 10_1101-2021_01_08_425967 81 32 Figure Figure NNP 10_1101-2021_01_08_425967 81 33 1 1 CD 10_1101-2021_01_08_425967 81 34 , , , 10_1101-2021_01_08_425967 81 35 see see VB 10_1101-2021_01_08_425967 81 36 Methodology Methodology NNP 10_1101-2021_01_08_425967 81 37 ) ) -RRB- 10_1101-2021_01_08_425967 81 38 . . . 10_1101-2021_01_08_425967 82 1 We -PRON- PRP 10_1101-2021_01_08_425967 82 2 observed observe VBD 10_1101-2021_01_08_425967 82 3 that that IN 10_1101-2021_01_08_425967 82 4 the the DT 10_1101-2021_01_08_425967 82 5 mean mean JJ 10_1101-2021_01_08_425967 82 6 SC SC NNP 10_1101-2021_01_08_425967 82 7 got get VBD 10_1101-2021_01_08_425967 82 8 high high JJ 10_1101-2021_01_08_425967 82 9 when when WRB 10_1101-2021_01_08_425967 82 10 the the DT 10_1101-2021_01_08_425967 82 11 number number NN 10_1101-2021_01_08_425967 82 12 of of IN 10_1101-2021_01_08_425967 82 13 items item NNS 10_1101-2021_01_08_425967 82 14 in in IN 10_1101-2021_01_08_425967 82 15 the the DT 10_1101-2021_01_08_425967 82 16 VP VP NNP 10_1101-2021_01_08_425967 82 17 was be VBD 10_1101-2021_01_08_425967 82 18 greater great JJR 10_1101-2021_01_08_425967 82 19 or or CC 10_1101-2021_01_08_425967 82 20 equal equal JJ 10_1101-2021_01_08_425967 82 21 to to IN 10_1101-2021_01_08_425967 82 22 2 2 CD 10_1101-2021_01_08_425967 82 23 times time NNS 10_1101-2021_01_08_425967 82 24 the the DT 10_1101-2021_01_08_425967 82 25 number number NN 10_1101-2021_01_08_425967 82 26 of of IN 10_1101-2021_01_08_425967 82 27 classifications classification NNS 10_1101-2021_01_08_425967 82 28 , , , 10_1101-2021_01_08_425967 82 29 nevertheless nevertheless RB 10_1101-2021_01_08_425967 82 30 , , , 10_1101-2021_01_08_425967 82 31 we -PRON- PRP 10_1101-2021_01_08_425967 82 32 got get VBD 10_1101-2021_01_08_425967 82 33 the the DT 10_1101-2021_01_08_425967 82 34 highest high JJS 10_1101-2021_01_08_425967 82 35 SC SC NNP 10_1101-2021_01_08_425967 82 36 when when WRB 10_1101-2021_01_08_425967 82 37 the the DT 10_1101-2021_01_08_425967 82 38 numeric numeric JJ 10_1101-2021_01_08_425967 82 39 labels label NNS 10_1101-2021_01_08_425967 82 40 we -PRON- PRP 10_1101-2021_01_08_425967 82 41 assigned assign VBN 10_1101-2021_01_08_425967 82 42 by by IN 10_1101-2021_01_08_425967 82 43 sequential sequential JJ 10_1101-2021_01_08_425967 82 44 order order NN 10_1101-2021_01_08_425967 82 45 , , , 10_1101-2021_01_08_425967 82 46 either either CC 10_1101-2021_01_08_425967 82 47 ascending ascend VBG 10_1101-2021_01_08_425967 82 48 or or CC 10_1101-2021_01_08_425967 82 49 descending descend VBG 10_1101-2021_01_08_425967 82 50 ( ( -LRB- 10_1101-2021_01_08_425967 82 51 Figure Figure NNP 10_1101-2021_01_08_425967 82 52 2 2 CD 10_1101-2021_01_08_425967 82 53 ) ) -RRB- 10_1101-2021_01_08_425967 82 54 . . . 10_1101-2021_01_08_425967 83 1 .CC .CC NFP 10_1101-2021_01_08_425967 83 2 - - : 10_1101-2021_01_08_425967 83 3 BY by IN 10_1101-2021_01_08_425967 83 4 4.0 4.0 CD 10_1101-2021_01_08_425967 83 5 International international JJ 10_1101-2021_01_08_425967 83 6 licensemade licensemade NN 10_1101-2021_01_08_425967 83 7 available available JJ 10_1101-2021_01_08_425967 83 8 under under IN 10_1101-2021_01_08_425967 83 9 a a DT 10_1101-2021_01_08_425967 83 10 ( ( -LRB- 10_1101-2021_01_08_425967 83 11 which which WDT 10_1101-2021_01_08_425967 83 12 was be VBD 10_1101-2021_01_08_425967 83 13 not not RB 10_1101-2021_01_08_425967 83 14 certified certify VBN 10_1101-2021_01_08_425967 83 15 by by IN 10_1101-2021_01_08_425967 83 16 peer peer NN 10_1101-2021_01_08_425967 83 17 review review NN 10_1101-2021_01_08_425967 83 18 ) ) -RRB- 10_1101-2021_01_08_425967 83 19 is be VBZ 10_1101-2021_01_08_425967 83 20 the the DT 10_1101-2021_01_08_425967 83 21 author author NN 10_1101-2021_01_08_425967 83 22 / / SYM 10_1101-2021_01_08_425967 83 23 funder funder NN 10_1101-2021_01_08_425967 83 24 , , , 10_1101-2021_01_08_425967 83 25 who who WP 10_1101-2021_01_08_425967 83 26 has have VBZ 10_1101-2021_01_08_425967 83 27 granted grant VBN 10_1101-2021_01_08_425967 83 28 bioRxiv biorxiv IN 10_1101-2021_01_08_425967 83 29 a a DT 10_1101-2021_01_08_425967 83 30 license license NN 10_1101-2021_01_08_425967 83 31 to to TO 10_1101-2021_01_08_425967 83 32 display display VB 10_1101-2021_01_08_425967 83 33 the the DT 10_1101-2021_01_08_425967 83 34 preprint preprint NN 10_1101-2021_01_08_425967 83 35 in in IN 10_1101-2021_01_08_425967 83 36 perpetuity perpetuity NN 10_1101-2021_01_08_425967 83 37 . . . 10_1101-2021_01_08_425967 84 1 It -PRON- PRP 10_1101-2021_01_08_425967 84 2 is be VBZ 10_1101-2021_01_08_425967 84 3 The the DT 10_1101-2021_01_08_425967 84 4 copyright copyright NN 10_1101-2021_01_08_425967 84 5 holder holder NN 10_1101-2021_01_08_425967 84 6 for for IN 10_1101-2021_01_08_425967 84 7 this this DT 10_1101-2021_01_08_425967 84 8 preprintthis preprintthis NN 10_1101-2021_01_08_425967 84 9 version version NN 10_1101-2021_01_08_425967 84 10 posted post VBD 10_1101-2021_01_08_425967 84 11 January January NNP 10_1101-2021_01_08_425967 84 12 9 9 CD 10_1101-2021_01_08_425967 84 13 , , , 10_1101-2021_01_08_425967 84 14 2021 2021 CD 10_1101-2021_01_08_425967 84 15 . . . 10_1101-2021_01_08_425967 84 16 ; ; : 10_1101-2021_01_08_425967 84 17 https://doi.org/10.1101/2021.01.08.425967doi https://doi.org/10.1101/2021.01.08.425967doi ADD 10_1101-2021_01_08_425967 84 18 : : : 10_1101-2021_01_08_425967 84 19 bioRxiv biorxiv VB 10_1101-2021_01_08_425967 84 20 preprint preprint NN 10_1101-2021_01_08_425967 84 21 https://doi.org/10.1101/2021.01.08.425967 https://doi.org/10.1101/2021.01.08.425967 NNP 10_1101-2021_01_08_425967 84 22 http://creativecommons.org/licenses/by/4.0/ http://creativecommons.org/licenses/by/4.0/ -LRB- 10_1101-2021_01_08_425967 84 23 Figure Figure NNP 10_1101-2021_01_08_425967 84 24 2 2 CD 10_1101-2021_01_08_425967 84 25 . . . 10_1101-2021_01_08_425967 85 1 Z z NN 10_1101-2021_01_08_425967 85 2 - - HYPH 10_1101-2021_01_08_425967 85 3 scores score NNS 10_1101-2021_01_08_425967 85 4 of of IN 10_1101-2021_01_08_425967 85 5 the the DT 10_1101-2021_01_08_425967 85 6 PQA PQA NNP 10_1101-2021_01_08_425967 85 7 scores score NNS 10_1101-2021_01_08_425967 85 8 from from IN 10_1101-2021_01_08_425967 85 9 partitions partition NNS 10_1101-2021_01_08_425967 85 10 varying vary VBG 10_1101-2021_01_08_425967 85 11 in in IN 10_1101-2021_01_08_425967 85 12 the the DT 10_1101-2021_01_08_425967 85 13 number number NN 10_1101-2021_01_08_425967 85 14 of of IN 10_1101-2021_01_08_425967 85 15 classifications classification NNS 10_1101-2021_01_08_425967 85 16 and and CC 10_1101-2021_01_08_425967 85 17 the the DT 10_1101-2021_01_08_425967 85 18 length length NN 10_1101-2021_01_08_425967 85 19 of of IN 10_1101-2021_01_08_425967 85 20 the the DT 10_1101-2021_01_08_425967 85 21 partition partition NN 10_1101-2021_01_08_425967 85 22 . . . 10_1101-2021_01_08_425967 86 1 3.2 3.2 CD 10_1101-2021_01_08_425967 86 2 . . . 10_1101-2021_01_08_425967 87 1 Length length NN 10_1101-2021_01_08_425967 87 2 of of IN 10_1101-2021_01_08_425967 87 3 partitions partition NNS 10_1101-2021_01_08_425967 87 4 as as IN 10_1101-2021_01_08_425967 87 5 a a DT 10_1101-2021_01_08_425967 87 6 proxy proxy NN 10_1101-2021_01_08_425967 87 7 of of IN 10_1101-2021_01_08_425967 87 8 the the DT 10_1101-2021_01_08_425967 87 9 number number NN 10_1101-2021_01_08_425967 87 10 of of IN 10_1101-2021_01_08_425967 87 11 classifications classification NNS 10_1101-2021_01_08_425967 87 12 We -PRON- PRP 10_1101-2021_01_08_425967 87 13 wonder wonder VBP 10_1101-2021_01_08_425967 87 14 whether whether IN 10_1101-2021_01_08_425967 87 15 the the DT 10_1101-2021_01_08_425967 87 16 number number NN 10_1101-2021_01_08_425967 87 17 of of IN 10_1101-2021_01_08_425967 87 18 classifications classification NNS 10_1101-2021_01_08_425967 87 19 and and CC 10_1101-2021_01_08_425967 87 20 the the DT 10_1101-2021_01_08_425967 87 21 length length NN 10_1101-2021_01_08_425967 87 22 of of IN 10_1101-2021_01_08_425967 87 23 the the DT 10_1101-2021_01_08_425967 87 24 VP VP NNP 10_1101-2021_01_08_425967 87 25 may may MD 10_1101-2021_01_08_425967 87 26 change change VB 10_1101-2021_01_08_425967 87 27 the the DT 10_1101-2021_01_08_425967 87 28 statistical statistical JJ 10_1101-2021_01_08_425967 87 29 significance significance NN 10_1101-2021_01_08_425967 87 30 of of IN 10_1101-2021_01_08_425967 87 31 the the DT 10_1101-2021_01_08_425967 87 32 PQA PQA NNP 10_1101-2021_01_08_425967 87 33 score score NN 10_1101-2021_01_08_425967 87 34 because because IN 10_1101-2021_01_08_425967 87 35 of of IN 10_1101-2021_01_08_425967 87 36 the the DT 10_1101-2021_01_08_425967 87 37 less less JJR 10_1101-2021_01_08_425967 87 38 the the DT 10_1101-2021_01_08_425967 87 39 number number NN 10_1101-2021_01_08_425967 87 40 of of IN 10_1101-2021_01_08_425967 87 41 items item NNS 10_1101-2021_01_08_425967 87 42 in in IN 10_1101-2021_01_08_425967 87 43 the the DT 10_1101-2021_01_08_425967 87 44 VP VP NNP 10_1101-2021_01_08_425967 87 45 , , , 10_1101-2021_01_08_425967 87 46 the the DT 10_1101-2021_01_08_425967 87 47 greater great JJR 10_1101-2021_01_08_425967 87 48 the the DT 10_1101-2021_01_08_425967 87 49 chance chance NN 10_1101-2021_01_08_425967 87 50 to to TO 10_1101-2021_01_08_425967 87 51 group group VB 10_1101-2021_01_08_425967 87 52 each each DT 10_1101-2021_01_08_425967 87 53 item item NN 10_1101-2021_01_08_425967 87 54 with with IN 10_1101-2021_01_08_425967 87 55 any any DT 10_1101-2021_01_08_425967 87 56 order order NN 10_1101-2021_01_08_425967 87 57 . . . 10_1101-2021_01_08_425967 88 1 We -PRON- PRP 10_1101-2021_01_08_425967 88 2 then then RB 10_1101-2021_01_08_425967 88 3 tested test VBD 10_1101-2021_01_08_425967 88 4 such such JJ 10_1101-2021_01_08_425967 88 5 effect effect NN 10_1101-2021_01_08_425967 88 6 by by IN 10_1101-2021_01_08_425967 88 7 calculating calculate VBG 10_1101-2021_01_08_425967 88 8 a a DT 10_1101-2021_01_08_425967 88 9 Z z NN 10_1101-2021_01_08_425967 88 10 - - HYPH 10_1101-2021_01_08_425967 88 11 score score NN 10_1101-2021_01_08_425967 88 12 from from IN 10_1101-2021_01_08_425967 88 13 ordered order VBN 10_1101-2021_01_08_425967 88 14 synthetic synthetic JJ 10_1101-2021_01_08_425967 88 15 partitions partition NNS 10_1101-2021_01_08_425967 88 16 increasing increase VBG 10_1101-2021_01_08_425967 88 17 both both CC 10_1101-2021_01_08_425967 88 18 the the DT 10_1101-2021_01_08_425967 88 19 number number NN 10_1101-2021_01_08_425967 88 20 of of IN 10_1101-2021_01_08_425967 88 21 classifications classification NNS 10_1101-2021_01_08_425967 88 22 and and CC 10_1101-2021_01_08_425967 88 23 the the DT 10_1101-2021_01_08_425967 88 24 number number NN 10_1101-2021_01_08_425967 88 25 of of IN 10_1101-2021_01_08_425967 88 26 items item NNS 10_1101-2021_01_08_425967 88 27 up up IN 10_1101-2021_01_08_425967 88 28 to to IN 10_1101-2021_01_08_425967 88 29 100 100 CD 10_1101-2021_01_08_425967 88 30 . . . 10_1101-2021_01_08_425967 89 1 We -PRON- PRP 10_1101-2021_01_08_425967 89 2 also also RB 10_1101-2021_01_08_425967 89 3 kept keep VBD 10_1101-2021_01_08_425967 89 4 constant constant JJ 10_1101-2021_01_08_425967 89 5 the the DT 10_1101-2021_01_08_425967 89 6 number number NN 10_1101-2021_01_08_425967 89 7 of of IN 10_1101-2021_01_08_425967 89 8 classifications classification NNS 10_1101-2021_01_08_425967 89 9 for for IN 10_1101-2021_01_08_425967 89 10 the the DT 10_1101-2021_01_08_425967 89 11 sake sake NN 10_1101-2021_01_08_425967 89 12 of of IN 10_1101-2021_01_08_425967 89 13 this this DT 10_1101-2021_01_08_425967 89 14 analysis analysis NN 10_1101-2021_01_08_425967 89 15 . . . 10_1101-2021_01_08_425967 90 1 We -PRON- PRP 10_1101-2021_01_08_425967 90 2 noticed notice VBD 10_1101-2021_01_08_425967 90 3 that that IN 10_1101-2021_01_08_425967 90 4 only only RB 10_1101-2021_01_08_425967 90 5 the the DT 10_1101-2021_01_08_425967 90 6 length length NN 10_1101-2021_01_08_425967 90 7 of of IN 10_1101-2021_01_08_425967 90 8 the the DT 10_1101-2021_01_08_425967 90 9 partition partition NN 10_1101-2021_01_08_425967 90 10 has have VBZ 10_1101-2021_01_08_425967 90 11 a a DT 10_1101-2021_01_08_425967 90 12 true true JJ 10_1101-2021_01_08_425967 90 13 effect effect NN 10_1101-2021_01_08_425967 90 14 on on IN 10_1101-2021_01_08_425967 90 15 the the DT 10_1101-2021_01_08_425967 90 16 Z z NN 10_1101-2021_01_08_425967 90 17 - - HYPH 10_1101-2021_01_08_425967 90 18 score score NN 10_1101-2021_01_08_425967 90 19 , , , 10_1101-2021_01_08_425967 90 20 but but CC 10_1101-2021_01_08_425967 90 21 that that DT 10_1101-2021_01_08_425967 90 22 is be VBZ 10_1101-2021_01_08_425967 90 23 not not RB 10_1101-2021_01_08_425967 90 24 the the DT 10_1101-2021_01_08_425967 90 25 case case NN 10_1101-2021_01_08_425967 90 26 for for IN 10_1101-2021_01_08_425967 90 27 the the DT 10_1101-2021_01_08_425967 90 28 number number NN 10_1101-2021_01_08_425967 90 29 of of IN 10_1101-2021_01_08_425967 90 30 classifications classification NNS 10_1101-2021_01_08_425967 90 31 . . . 10_1101-2021_01_08_425967 91 1 We -PRON- PRP 10_1101-2021_01_08_425967 91 2 observed observe VBD 10_1101-2021_01_08_425967 91 3 that that IN 10_1101-2021_01_08_425967 91 4 every every DT 10_1101-2021_01_08_425967 91 5 partition partition NN 10_1101-2021_01_08_425967 91 6 minor minor JJ 10_1101-2021_01_08_425967 91 7 than than IN 10_1101-2021_01_08_425967 91 8 13 13 CD 10_1101-2021_01_08_425967 91 9 could could MD 10_1101-2021_01_08_425967 91 10 be be VB 10_1101-2021_01_08_425967 91 11 considered consider VBN 10_1101-2021_01_08_425967 91 12 as as IN 10_1101-2021_01_08_425967 91 13 pure pure JJ 10_1101-2021_01_08_425967 91 14 noise noise NN 10_1101-2021_01_08_425967 91 15 , , , 10_1101-2021_01_08_425967 91 16 however however RB 10_1101-2021_01_08_425967 91 17 , , , 10_1101-2021_01_08_425967 91 18 we -PRON- PRP 10_1101-2021_01_08_425967 91 19 consider consider VBP 10_1101-2021_01_08_425967 91 20 a a DT 10_1101-2021_01_08_425967 91 21 Z z NN 10_1101-2021_01_08_425967 91 22 - - HYPH 10_1101-2021_01_08_425967 91 23 score score NN 10_1101-2021_01_08_425967 91 24 cutoff cutoff NN 10_1101-2021_01_08_425967 91 25 of of IN 10_1101-2021_01_08_425967 91 26 greater great JJR 10_1101-2021_01_08_425967 91 27 than than IN 10_1101-2021_01_08_425967 91 28 3 3 CD 10_1101-2021_01_08_425967 91 29 ( ( -LRB- 10_1101-2021_01_08_425967 91 30 p p NN 10_1101-2021_01_08_425967 91 31 - - HYPH 10_1101-2021_01_08_425967 91 32 value value NN 10_1101-2021_01_08_425967 91 33 of of IN 10_1101-2021_01_08_425967 91 34 0.002 0.002 CD 10_1101-2021_01_08_425967 91 35 ) ) -RRB- 10_1101-2021_01_08_425967 91 36 . . . 10_1101-2021_01_08_425967 92 1 We -PRON- PRP 10_1101-2021_01_08_425967 92 2 also also RB 10_1101-2021_01_08_425967 92 3 observed observe VBD 10_1101-2021_01_08_425967 92 4 Z z NN 10_1101-2021_01_08_425967 92 5 - - HYPH 10_1101-2021_01_08_425967 92 6 score score NN 10_1101-2021_01_08_425967 92 7 values value NNS 10_1101-2021_01_08_425967 92 8 still still RB 10_1101-2021_01_08_425967 92 9 greater great JJR 10_1101-2021_01_08_425967 92 10 than than IN 10_1101-2021_01_08_425967 92 11 2 2 CD 10_1101-2021_01_08_425967 92 12 with with IN 10_1101-2021_01_08_425967 92 13 a a DT 10_1101-2021_01_08_425967 92 14 length length NN 10_1101-2021_01_08_425967 92 15 of of IN 10_1101-2021_01_08_425967 92 16 12 12 CD 10_1101-2021_01_08_425967 92 17 , , , 10_1101-2021_01_08_425967 92 18 11 11 CD 10_1101-2021_01_08_425967 92 19 , , , 10_1101-2021_01_08_425967 92 20 and and CC 10_1101-2021_01_08_425967 92 21 10 10 CD 10_1101-2021_01_08_425967 92 22 , , , 10_1101-2021_01_08_425967 92 23 but but CC 10_1101-2021_01_08_425967 92 24 lesser less JJR 10_1101-2021_01_08_425967 92 25 than than IN 10_1101-2021_01_08_425967 92 26 with with IN 10_1101-2021_01_08_425967 92 27 lengths length NNS 10_1101-2021_01_08_425967 92 28 between between IN 10_1101-2021_01_08_425967 92 29 2 2 CD 10_1101-2021_01_08_425967 92 30 and and CC 10_1101-2021_01_08_425967 92 31 9 9 CD 10_1101-2021_01_08_425967 92 32 ( ( -LRB- 10_1101-2021_01_08_425967 92 33 Figure figure NN 10_1101-2021_01_08_425967 92 34 2 2 CD 10_1101-2021_01_08_425967 92 35 ) ) -RRB- 10_1101-2021_01_08_425967 92 36 . . . 10_1101-2021_01_08_425967 93 1 If if IN 10_1101-2021_01_08_425967 93 2 we -PRON- PRP 10_1101-2021_01_08_425967 93 3 were be VBD 10_1101-2021_01_08_425967 93 4 more more RBR 10_1101-2021_01_08_425967 93 5 flexible flexible JJ 10_1101-2021_01_08_425967 93 6 , , , 10_1101-2021_01_08_425967 93 7 we -PRON- PRP 10_1101-2021_01_08_425967 93 8 could could MD 10_1101-2021_01_08_425967 93 9 have have VB 10_1101-2021_01_08_425967 93 10 laid lay VBN 10_1101-2021_01_08_425967 93 11 out out RP 10_1101-2021_01_08_425967 93 12 a a DT 10_1101-2021_01_08_425967 93 13 length length NN 10_1101-2021_01_08_425967 93 14 cutoff cutoff NN 10_1101-2021_01_08_425967 93 15 on on IN 10_1101-2021_01_08_425967 93 16 those those DT 10_1101-2021_01_08_425967 93 17 values value NNS 10_1101-2021_01_08_425967 93 18 without without IN 10_1101-2021_01_08_425967 93 19 losing lose VBG 10_1101-2021_01_08_425967 93 20 statistical statistical JJ 10_1101-2021_01_08_425967 93 21 significance significance NN 10_1101-2021_01_08_425967 93 22 , , , 10_1101-2021_01_08_425967 93 23 since since IN 10_1101-2021_01_08_425967 93 24 a a DT 10_1101-2021_01_08_425967 93 25 Z z NN 10_1101-2021_01_08_425967 93 26 - - HYPH 10_1101-2021_01_08_425967 93 27 score score NN 10_1101-2021_01_08_425967 93 28 of of IN 10_1101-2021_01_08_425967 93 29 2 2 CD 10_1101-2021_01_08_425967 93 30 corresponds correspond NNS 10_1101-2021_01_08_425967 93 31 roughly roughly RB 10_1101-2021_01_08_425967 93 32 to to IN 10_1101-2021_01_08_425967 93 33 a a DT 10_1101-2021_01_08_425967 93 34 p p NN 10_1101-2021_01_08_425967 93 35 - - HYPH 10_1101-2021_01_08_425967 93 36 value value NN 10_1101-2021_01_08_425967 93 37 of of IN 10_1101-2021_01_08_425967 93 38 0.05 0.05 CD 10_1101-2021_01_08_425967 93 39 . . . 10_1101-2021_01_08_425967 94 1 The the DT 10_1101-2021_01_08_425967 94 2 results result NNS 10_1101-2021_01_08_425967 94 3 of of IN 10_1101-2021_01_08_425967 94 4 this this DT 10_1101-2021_01_08_425967 94 5 analysis analysis NN 10_1101-2021_01_08_425967 94 6 were be VBD 10_1101-2021_01_08_425967 94 7 expected expect VBN 10_1101-2021_01_08_425967 94 8 by by IN 10_1101-2021_01_08_425967 94 9 intuition intuition NN 10_1101-2021_01_08_425967 94 10 because because IN 10_1101-2021_01_08_425967 94 11 the the DT 10_1101-2021_01_08_425967 94 12 probability probability NN 10_1101-2021_01_08_425967 94 13 of of IN 10_1101-2021_01_08_425967 94 14 an an DT 10_1101-2021_01_08_425967 94 15 item item NN 10_1101-2021_01_08_425967 94 16 to to TO 10_1101-2021_01_08_425967 94 17 occupy occupy VB 10_1101-2021_01_08_425967 94 18 a a DT 10_1101-2021_01_08_425967 94 19 position position NN 10_1101-2021_01_08_425967 94 20 in in IN 10_1101-2021_01_08_425967 94 21 the the DT 10_1101-2021_01_08_425967 94 22 VP VP NNP 10_1101-2021_01_08_425967 94 23 increases increase VBZ 10_1101-2021_01_08_425967 94 24 the the DT 10_1101-2021_01_08_425967 94 25 number number NN 10_1101-2021_01_08_425967 94 26 of of IN 10_1101-2021_01_08_425967 94 27 items item NNS 10_1101-2021_01_08_425967 94 28 does do VBZ 10_1101-2021_01_08_425967 94 29 the the DT 10_1101-2021_01_08_425967 94 30 same same JJ 10_1101-2021_01_08_425967 94 31 . . . 10_1101-2021_01_08_425967 95 1 3.3 3.3 CD 10_1101-2021_01_08_425967 95 2 . . . 10_1101-2021_01_08_425967 96 1 Proof proof NN 10_1101-2021_01_08_425967 96 2 of of IN 10_1101-2021_01_08_425967 96 3 concept concept NN 10_1101-2021_01_08_425967 96 4 : : : 10_1101-2021_01_08_425967 96 5 Quantifying quantify VBG 10_1101-2021_01_08_425967 96 6 real real JJ 10_1101-2021_01_08_425967 96 7 noise noise NN 10_1101-2021_01_08_425967 96 8 After after IN 10_1101-2021_01_08_425967 96 9 a a DT 10_1101-2021_01_08_425967 96 10 literature literature NN 10_1101-2021_01_08_425967 96 11 revision revision NN 10_1101-2021_01_08_425967 96 12 , , , 10_1101-2021_01_08_425967 96 13 we -PRON- PRP 10_1101-2021_01_08_425967 96 14 noticed notice VBD 10_1101-2021_01_08_425967 96 15 that that IN 10_1101-2021_01_08_425967 96 16 some some DT 10_1101-2021_01_08_425967 96 17 datasets dataset NNS 10_1101-2021_01_08_425967 96 18 were be VBD 10_1101-2021_01_08_425967 96 19 subject subject JJ 10_1101-2021_01_08_425967 96 20 to to IN 10_1101-2021_01_08_425967 96 21 visual visual JJ 10_1101-2021_01_08_425967 96 22 inspection inspection NN 10_1101-2021_01_08_425967 96 23 in in IN 10_1101-2021_01_08_425967 96 24 their -PRON- PRP$ 10_1101-2021_01_08_425967 96 25 respective respective JJ 10_1101-2021_01_08_425967 96 26 papers paper NNS 10_1101-2021_01_08_425967 96 27 , , , 10_1101-2021_01_08_425967 96 28 so so RB 10_1101-2021_01_08_425967 96 29 we -PRON- PRP 10_1101-2021_01_08_425967 96 30 applied apply VBD 10_1101-2021_01_08_425967 96 31 our -PRON- PRP$ 10_1101-2021_01_08_425967 96 32 method method NN 10_1101-2021_01_08_425967 96 33 to to TO 10_1101-2021_01_08_425967 96 34 quantify quantify VB 10_1101-2021_01_08_425967 96 35 the the DT 10_1101-2021_01_08_425967 96 36 proportion proportion NN 10_1101-2021_01_08_425967 96 37 of of IN 10_1101-2021_01_08_425967 96 38 noise noise NN 10_1101-2021_01_08_425967 96 39 embedded embed VBN 10_1101-2021_01_08_425967 96 40 in in IN 10_1101-2021_01_08_425967 96 41 those those DT 10_1101-2021_01_08_425967 96 42 datasets dataset NNS 10_1101-2021_01_08_425967 96 43 and and CC 10_1101-2021_01_08_425967 96 44 to to TO 10_1101-2021_01_08_425967 96 45 test test VB 10_1101-2021_01_08_425967 96 46 whether whether IN 10_1101-2021_01_08_425967 96 47 they -PRON- PRP 10_1101-2021_01_08_425967 96 48 may may MD 10_1101-2021_01_08_425967 96 49 lead lead VB 10_1101-2021_01_08_425967 96 50 to to IN 10_1101-2021_01_08_425967 96 51 apophenia apophenia NNP 10_1101-2021_01_08_425967 96 52 . . . 10_1101-2021_01_08_425967 97 1 We -PRON- PRP 10_1101-2021_01_08_425967 97 2 choose choose VBP 10_1101-2021_01_08_425967 97 3 two two CD 10_1101-2021_01_08_425967 97 4 datasets dataset NNS 10_1101-2021_01_08_425967 97 5 from from IN 10_1101-2021_01_08_425967 97 6 literature literature NN 10_1101-2021_01_08_425967 97 7 because because IN 10_1101-2021_01_08_425967 97 8 of of IN 10_1101-2021_01_08_425967 97 9 two two CD 10_1101-2021_01_08_425967 97 10 main main JJ 10_1101-2021_01_08_425967 97 11 reasons reason NNS 10_1101-2021_01_08_425967 97 12 , , , 10_1101-2021_01_08_425967 97 13 first first RB 10_1101-2021_01_08_425967 97 14 , , , 10_1101-2021_01_08_425967 97 15 the the DT 10_1101-2021_01_08_425967 97 16 data datum NNS 10_1101-2021_01_08_425967 97 17 should should MD 10_1101-2021_01_08_425967 97 18 have have VB 10_1101-2021_01_08_425967 97 19 a a DT 10_1101-2021_01_08_425967 97 20 high high JJ 10_1101-2021_01_08_425967 97 21 number number NN 10_1101-2021_01_08_425967 97 22 of of IN 10_1101-2021_01_08_425967 97 23 items item NNS 10_1101-2021_01_08_425967 97 24 that that WDT 10_1101-2021_01_08_425967 97 25 are be VBP 10_1101-2021_01_08_425967 97 26 way way NN 10_1101-2021_01_08_425967 97 27 above above IN 10_1101-2021_01_08_425967 97 28 our -PRON- PRP$ 10_1101-2021_01_08_425967 97 29 Z z JJ 10_1101-2021_01_08_425967 97 30 - - HYPH 10_1101-2021_01_08_425967 97 31 score score NN 10_1101-2021_01_08_425967 97 32 significance significance NN 10_1101-2021_01_08_425967 97 33 threshold threshold NN 10_1101-2021_01_08_425967 97 34 ( ( -LRB- 10_1101-2021_01_08_425967 97 35 > > NNP 10_1101-2021_01_08_425967 97 36 13 13 CD 10_1101-2021_01_08_425967 97 37 ) ) -RRB- 10_1101-2021_01_08_425967 97 38 and and CC 10_1101-2021_01_08_425967 97 39 , , , 10_1101-2021_01_08_425967 97 40 second second JJ 10_1101-2021_01_08_425967 97 41 , , , 10_1101-2021_01_08_425967 97 42 we -PRON- PRP 10_1101-2021_01_08_425967 97 43 wanted want VBD 10_1101-2021_01_08_425967 97 44 contrasting contrast VBG 10_1101-2021_01_08_425967 97 45 orderings ordering NNS 10_1101-2021_01_08_425967 97 46 of of IN 10_1101-2021_01_08_425967 97 47 the the DT 10_1101-2021_01_08_425967 97 48 partitions partition NNS 10_1101-2021_01_08_425967 97 49 so so IN 10_1101-2021_01_08_425967 97 50 to to TO 10_1101-2021_01_08_425967 97 51 have have VB 10_1101-2021_01_08_425967 97 52 one one CD 10_1101-2021_01_08_425967 97 53 dataset dataset NN 10_1101-2021_01_08_425967 97 54 that that WDT 10_1101-2021_01_08_425967 97 55 looks look VBZ 10_1101-2021_01_08_425967 97 56 very very RB 10_1101-2021_01_08_425967 97 57 disordered disorder VBN 10_1101-2021_01_08_425967 97 58 and and CC 10_1101-2021_01_08_425967 97 59 another another DT 10_1101-2021_01_08_425967 97 60 that that WDT 10_1101-2021_01_08_425967 97 61 looks look VBZ 10_1101-2021_01_08_425967 97 62 somewhat somewhat RB 10_1101-2021_01_08_425967 97 63 ordered order VBN 10_1101-2021_01_08_425967 97 64 to to TO 10_1101-2021_01_08_425967 97 65 compare compare VB 10_1101-2021_01_08_425967 97 66 the the DT 10_1101-2021_01_08_425967 97 67 noise noise NN 10_1101-2021_01_08_425967 97 68 proportions proportion NNS 10_1101-2021_01_08_425967 97 69 . . . 10_1101-2021_01_08_425967 98 1 Lastly lastly RB 10_1101-2021_01_08_425967 98 2 , , , 10_1101-2021_01_08_425967 98 3 we -PRON- PRP 10_1101-2021_01_08_425967 98 4 assessed assess VBD 10_1101-2021_01_08_425967 98 5 the the DT 10_1101-2021_01_08_425967 98 6 behavior behavior NN 10_1101-2021_01_08_425967 98 7 of of IN 10_1101-2021_01_08_425967 98 8 the the DT 10_1101-2021_01_08_425967 98 9 metric metric JJ 10_1101-2021_01_08_425967 98 10 in in IN 10_1101-2021_01_08_425967 98 11 highly highly RB 10_1101-2021_01_08_425967 98 12 ordered order VBN 10_1101-2021_01_08_425967 98 13 data datum NNS 10_1101-2021_01_08_425967 98 14 . . . 10_1101-2021_01_08_425967 99 1 This this DT 10_1101-2021_01_08_425967 99 2 also also RB 10_1101-2021_01_08_425967 99 3 matches match VBZ 10_1101-2021_01_08_425967 99 4 our -PRON- PRP$ 10_1101-2021_01_08_425967 99 5 threshold threshold NN 10_1101-2021_01_08_425967 99 6 mentioned mention VBN 10_1101-2021_01_08_425967 99 7 above above RB 10_1101-2021_01_08_425967 99 8 . . . 10_1101-2021_01_08_425967 100 1 3.3.1 3.3.1 CD 10_1101-2021_01_08_425967 100 2 . . . 10_1101-2021_01_08_425967 101 1 Cancer cancer NN 10_1101-2021_01_08_425967 101 2 methylation methylation NN 10_1101-2021_01_08_425967 101 3 signatures signature VBZ 10_1101-2021_01_08_425967 101 4 The the DT 10_1101-2021_01_08_425967 101 5 first first JJ 10_1101-2021_01_08_425967 101 6 dataset dataset NN 10_1101-2021_01_08_425967 101 7 consists consist VBZ 10_1101-2021_01_08_425967 101 8 of of IN 10_1101-2021_01_08_425967 101 9 methylation methylation NN 10_1101-2021_01_08_425967 101 10 profiles profile NNS 10_1101-2021_01_08_425967 101 11 of of IN 10_1101-2021_01_08_425967 101 12 242 242 CD 10_1101-2021_01_08_425967 101 13 different different JJ 10_1101-2021_01_08_425967 101 14 cancerous cancerous JJ 10_1101-2021_01_08_425967 101 15 and and CC 10_1101-2021_01_08_425967 101 16 non non JJ 10_1101-2021_01_08_425967 101 17 - - JJ 10_1101-2021_01_08_425967 101 18 cancerous cancerous JJ 10_1101-2021_01_08_425967 101 19 samples sample NNS 10_1101-2021_01_08_425967 101 20 [ [ -LRB- 10_1101-2021_01_08_425967 101 21 7 7 CD 10_1101-2021_01_08_425967 101 22 ] ] -RRB- 10_1101-2021_01_08_425967 101 23 ( ( -LRB- 10_1101-2021_01_08_425967 101 24 Figure figure NN 10_1101-2021_01_08_425967 101 25 3 3 CD 10_1101-2021_01_08_425967 101 26 ) ) -RRB- 10_1101-2021_01_08_425967 101 27 . . . 10_1101-2021_01_08_425967 102 1 Though though IN 10_1101-2021_01_08_425967 102 2 the the DT 10_1101-2021_01_08_425967 102 3 classifications classification NNS 10_1101-2021_01_08_425967 102 4 look look VBP 10_1101-2021_01_08_425967 102 5 very very RB 10_1101-2021_01_08_425967 102 6 sparse sparse RB 10_1101-2021_01_08_425967 102 7 and and CC 10_1101-2021_01_08_425967 102 8 the the DT 10_1101-2021_01_08_425967 102 9 groups group NNS 10_1101-2021_01_08_425967 102 10 are be VBP 10_1101-2021_01_08_425967 102 11 torn tear VBN 10_1101-2021_01_08_425967 102 12 apart apart RB 10_1101-2021_01_08_425967 102 13 in in IN 10_1101-2021_01_08_425967 102 14 many many JJ 10_1101-2021_01_08_425967 102 15 subgroups subgroup NNS 10_1101-2021_01_08_425967 102 16 distributed distribute VBN 10_1101-2021_01_08_425967 102 17 along along RB 10_1101-2021_01_08_425967 102 18 with with IN 10_1101-2021_01_08_425967 102 19 the the DT 10_1101-2021_01_08_425967 102 20 data datum NNS 10_1101-2021_01_08_425967 102 21 ’s ’s POS 10_1101-2021_01_08_425967 102 22 VP VP NNP 10_1101-2021_01_08_425967 102 23 . . . 10_1101-2021_01_08_425967 103 1 We -PRON- PRP 10_1101-2021_01_08_425967 103 2 detected detect VBD 10_1101-2021_01_08_425967 103 3 25.1 25.1 CD 10_1101-2021_01_08_425967 103 4 % % NN 10_1101-2021_01_08_425967 103 5 of of IN 10_1101-2021_01_08_425967 103 6 noise noise NN 10_1101-2021_01_08_425967 103 7 and and CC 10_1101-2021_01_08_425967 103 8 a a DT 10_1101-2021_01_08_425967 103 9 PQA PQA NNP 10_1101-2021_01_08_425967 103 10 score score NN 10_1101-2021_01_08_425967 103 11 .CC .CC NFP 10_1101-2021_01_08_425967 103 12 - - : 10_1101-2021_01_08_425967 103 13 BY by IN 10_1101-2021_01_08_425967 103 14 4.0 4.0 CD 10_1101-2021_01_08_425967 103 15 International international JJ 10_1101-2021_01_08_425967 103 16 licensemade licensemade NN 10_1101-2021_01_08_425967 103 17 available available JJ 10_1101-2021_01_08_425967 103 18 under under IN 10_1101-2021_01_08_425967 103 19 a a DT 10_1101-2021_01_08_425967 103 20 ( ( -LRB- 10_1101-2021_01_08_425967 103 21 which which WDT 10_1101-2021_01_08_425967 103 22 was be VBD 10_1101-2021_01_08_425967 103 23 not not RB 10_1101-2021_01_08_425967 103 24 certified certify VBN 10_1101-2021_01_08_425967 103 25 by by IN 10_1101-2021_01_08_425967 103 26 peer peer NN 10_1101-2021_01_08_425967 103 27 review review NN 10_1101-2021_01_08_425967 103 28 ) ) -RRB- 10_1101-2021_01_08_425967 103 29 is be VBZ 10_1101-2021_01_08_425967 103 30 the the DT 10_1101-2021_01_08_425967 103 31 author author NN 10_1101-2021_01_08_425967 103 32 / / SYM 10_1101-2021_01_08_425967 103 33 funder funder NN 10_1101-2021_01_08_425967 103 34 , , , 10_1101-2021_01_08_425967 103 35 who who WP 10_1101-2021_01_08_425967 103 36 has have VBZ 10_1101-2021_01_08_425967 103 37 granted grant VBN 10_1101-2021_01_08_425967 103 38 bioRxiv biorxiv IN 10_1101-2021_01_08_425967 103 39 a a DT 10_1101-2021_01_08_425967 103 40 license license NN 10_1101-2021_01_08_425967 103 41 to to TO 10_1101-2021_01_08_425967 103 42 display display VB 10_1101-2021_01_08_425967 103 43 the the DT 10_1101-2021_01_08_425967 103 44 preprint preprint NN 10_1101-2021_01_08_425967 103 45 in in IN 10_1101-2021_01_08_425967 103 46 perpetuity perpetuity NN 10_1101-2021_01_08_425967 103 47 . . . 10_1101-2021_01_08_425967 104 1 It -PRON- PRP 10_1101-2021_01_08_425967 104 2 is be VBZ 10_1101-2021_01_08_425967 104 3 The the DT 10_1101-2021_01_08_425967 104 4 copyright copyright NN 10_1101-2021_01_08_425967 104 5 holder holder NN 10_1101-2021_01_08_425967 104 6 for for IN 10_1101-2021_01_08_425967 104 7 this this DT 10_1101-2021_01_08_425967 104 8 preprintthis preprintthis NN 10_1101-2021_01_08_425967 104 9 version version NN 10_1101-2021_01_08_425967 104 10 posted post VBD 10_1101-2021_01_08_425967 104 11 January January NNP 10_1101-2021_01_08_425967 104 12 9 9 CD 10_1101-2021_01_08_425967 104 13 , , , 10_1101-2021_01_08_425967 104 14 2021 2021 CD 10_1101-2021_01_08_425967 104 15 . . . 10_1101-2021_01_08_425967 104 16 ; ; : 10_1101-2021_01_08_425967 104 17 https://doi.org/10.1101/2021.01.08.425967doi https://doi.org/10.1101/2021.01.08.425967doi ADD 10_1101-2021_01_08_425967 104 18 : : : 10_1101-2021_01_08_425967 104 19 bioRxiv biorxiv VB 10_1101-2021_01_08_425967 104 20 preprint preprint NN 10_1101-2021_01_08_425967 104 21 https://doi.org/10.1101/2021.01.08.425967 https://doi.org/10.1101/2021.01.08.425967 NNP 10_1101-2021_01_08_425967 104 22 http://creativecommons.org/licenses/by/4.0/ http://creativecommons.org/licenses/by/4.0/ NNS 10_1101-2021_01_08_425967 104 23 of of IN 10_1101-2021_01_08_425967 104 24 0.53 0.53 CD 10_1101-2021_01_08_425967 104 25 ( ( -LRB- 10_1101-2021_01_08_425967 104 26 Figure figure NN 10_1101-2021_01_08_425967 104 27 4 4 CD 10_1101-2021_01_08_425967 104 28 , , , 10_1101-2021_01_08_425967 104 29 with with IN 10_1101-2021_01_08_425967 104 30 a a DT 10_1101-2021_01_08_425967 104 31 Z z NN 10_1101-2021_01_08_425967 104 32 - - HYPH 10_1101-2021_01_08_425967 104 33 score score NN 10_1101-2021_01_08_425967 104 34 of of IN 10_1101-2021_01_08_425967 104 35 8.2 8.2 CD 10_1101-2021_01_08_425967 104 36 and and CC 10_1101-2021_01_08_425967 104 37 a a DT 10_1101-2021_01_08_425967 104 38 p p NN 10_1101-2021_01_08_425967 104 39 - - HYPH 10_1101-2021_01_08_425967 104 40 value value NN 10_1101-2021_01_08_425967 104 41 of of IN 10_1101-2021_01_08_425967 104 42 9.6x10 9.6x10 CD 10_1101-2021_01_08_425967 104 43 - - SYM 10_1101-2021_01_08_425967 104 44 17 17 CD 10_1101-2021_01_08_425967 104 45 ) ) -RRB- 10_1101-2021_01_08_425967 104 46 , , , 10_1101-2021_01_08_425967 104 47 both both DT 10_1101-2021_01_08_425967 104 48 numbers number NNS 10_1101-2021_01_08_425967 104 49 imply imply VBP 10_1101-2021_01_08_425967 104 50 that that IN 10_1101-2021_01_08_425967 104 51 even even RB 10_1101-2021_01_08_425967 104 52 though though IN 10_1101-2021_01_08_425967 104 53 there there EX 10_1101-2021_01_08_425967 104 54 may may MD 10_1101-2021_01_08_425967 104 55 be be VB 10_1101-2021_01_08_425967 104 56 disordered disorder VBN 10_1101-2021_01_08_425967 104 57 in in IN 10_1101-2021_01_08_425967 104 58 the the DT 10_1101-2021_01_08_425967 104 59 VP VP NNP 10_1101-2021_01_08_425967 104 60 , , , 10_1101-2021_01_08_425967 104 61 there there EX 10_1101-2021_01_08_425967 104 62 is be VBZ 10_1101-2021_01_08_425967 104 63 not not RB 10_1101-2021_01_08_425967 104 64 a a DT 10_1101-2021_01_08_425967 104 65 very very RB 10_1101-2021_01_08_425967 104 66 high high JJ 10_1101-2021_01_08_425967 104 67 noise noise NN 10_1101-2021_01_08_425967 104 68 proportion proportion NN 10_1101-2021_01_08_425967 104 69 nor nor CC 10_1101-2021_01_08_425967 104 70 a a DT 10_1101-2021_01_08_425967 104 71 high high JJ 10_1101-2021_01_08_425967 104 72 PQA PQA NNP 10_1101-2021_01_08_425967 104 73 score score NN 10_1101-2021_01_08_425967 104 74 . . . 10_1101-2021_01_08_425967 105 1 These these DT 10_1101-2021_01_08_425967 105 2 results result NNS 10_1101-2021_01_08_425967 105 3 suggest suggest VBP 10_1101-2021_01_08_425967 105 4 that that IN 10_1101-2021_01_08_425967 105 5 , , , 10_1101-2021_01_08_425967 105 6 like like IN 10_1101-2021_01_08_425967 105 7 any any DT 10_1101-2021_01_08_425967 105 8 other other JJ 10_1101-2021_01_08_425967 105 9 statistical statistical JJ 10_1101-2021_01_08_425967 105 10 test test NN 10_1101-2021_01_08_425967 105 11 , , , 10_1101-2021_01_08_425967 105 12 the the DT 10_1101-2021_01_08_425967 105 13 longer long JJR 10_1101-2021_01_08_425967 105 14 the the DT 10_1101-2021_01_08_425967 105 15 number number NN 10_1101-2021_01_08_425967 105 16 of of IN 10_1101-2021_01_08_425967 105 17 items item NNS 10_1101-2021_01_08_425967 105 18 in in IN 10_1101-2021_01_08_425967 105 19 the the DT 10_1101-2021_01_08_425967 105 20 partition partition NN 10_1101-2021_01_08_425967 105 21 the the DT 10_1101-2021_01_08_425967 105 22 more more RBR 10_1101-2021_01_08_425967 105 23 diluted diluted JJ 10_1101-2021_01_08_425967 105 24 is be VBZ 10_1101-2021_01_08_425967 105 25 the the DT 10_1101-2021_01_08_425967 105 26 effect effect NN 10_1101-2021_01_08_425967 105 27 of of IN 10_1101-2021_01_08_425967 105 28 disorder disorder NN 10_1101-2021_01_08_425967 105 29 in in IN 10_1101-2021_01_08_425967 105 30 the the DT 10_1101-2021_01_08_425967 105 31 VP VP NNP 10_1101-2021_01_08_425967 105 32 , , , 10_1101-2021_01_08_425967 105 33 and and CC 10_1101-2021_01_08_425967 105 34 the the DT 10_1101-2021_01_08_425967 105 35 results result NNS 10_1101-2021_01_08_425967 105 36 also also RB 10_1101-2021_01_08_425967 105 37 lead lead VBP 10_1101-2021_01_08_425967 105 38 to to IN 10_1101-2021_01_08_425967 105 39 a a DT 10_1101-2021_01_08_425967 105 40 greater great JJR 10_1101-2021_01_08_425967 105 41 statistical statistical JJ 10_1101-2021_01_08_425967 105 42 significance significance NN 10_1101-2021_01_08_425967 105 43 as as IN 10_1101-2021_01_08_425967 105 44 shown show VBN 10_1101-2021_01_08_425967 105 45 in in IN 10_1101-2021_01_08_425967 105 46 the the DT 10_1101-2021_01_08_425967 105 47 analysis analysis NN 10_1101-2021_01_08_425967 105 48 of of IN 10_1101-2021_01_08_425967 105 49 the the DT 10_1101-2021_01_08_425967 105 50 number number NN 10_1101-2021_01_08_425967 105 51 of of IN 10_1101-2021_01_08_425967 105 52 items item NNS 10_1101-2021_01_08_425967 105 53 and and CC 10_1101-2021_01_08_425967 105 54 classifications classification NNS 10_1101-2021_01_08_425967 105 55 . . . 10_1101-2021_01_08_425967 106 1 Besides besides IN 10_1101-2021_01_08_425967 106 2 the the DT 10_1101-2021_01_08_425967 106 3 authors author NNS 10_1101-2021_01_08_425967 106 4 concluded conclude VBD 10_1101-2021_01_08_425967 106 5 that that IN 10_1101-2021_01_08_425967 106 6 their -PRON- PRP$ 10_1101-2021_01_08_425967 106 7 clustering cluster VBG 10_1101-2021_01_08_425967 106 8 analysis analysis NN 10_1101-2021_01_08_425967 106 9 results result NNS 10_1101-2021_01_08_425967 106 10 made make VBD 10_1101-2021_01_08_425967 106 11 sense sense NN 10_1101-2021_01_08_425967 106 12 from from IN 10_1101-2021_01_08_425967 106 13 their -PRON- PRP$ 10_1101-2021_01_08_425967 106 14 molecular molecular JJ 10_1101-2021_01_08_425967 106 15 and and CC 10_1101-2021_01_08_425967 106 16 biological biological JJ 10_1101-2021_01_08_425967 106 17 background background NN 10_1101-2021_01_08_425967 106 18 , , , 10_1101-2021_01_08_425967 106 19 as as RB 10_1101-2021_01_08_425967 106 20 well well RB 10_1101-2021_01_08_425967 106 21 as as IN 10_1101-2021_01_08_425967 106 22 the the DT 10_1101-2021_01_08_425967 106 23 perspectives perspective NNS 10_1101-2021_01_08_425967 106 24 about about IN 10_1101-2021_01_08_425967 106 25 the the DT 10_1101-2021_01_08_425967 106 26 analyzed analyze VBN 10_1101-2021_01_08_425967 106 27 profiles profile NNS 10_1101-2021_01_08_425967 106 28 , , , 10_1101-2021_01_08_425967 106 29 they -PRON- PRP 10_1101-2021_01_08_425967 106 30 only only RB 10_1101-2021_01_08_425967 106 31 assessed assess VBD 10_1101-2021_01_08_425967 106 32 grouping group VBG 10_1101-2021_01_08_425967 106 33 just just RB 10_1101-2021_01_08_425967 106 34 by by IN 10_1101-2021_01_08_425967 106 35 visual visual JJ 10_1101-2021_01_08_425967 106 36 inspection inspection NN 10_1101-2021_01_08_425967 106 37 and and CC 10_1101-2021_01_08_425967 106 38 concluded conclude VBD 10_1101-2021_01_08_425967 106 39 the the DT 10_1101-2021_01_08_425967 106 40 grouping grouping NN 10_1101-2021_01_08_425967 106 41 was be VBD 10_1101-2021_01_08_425967 106 42 well well RB 10_1101-2021_01_08_425967 106 43 done do VBN 10_1101-2021_01_08_425967 106 44 . . . 10_1101-2021_01_08_425967 107 1 However however RB 10_1101-2021_01_08_425967 107 2 , , , 10_1101-2021_01_08_425967 107 3 understanding understand VBG 10_1101-2021_01_08_425967 107 4 the the DT 10_1101-2021_01_08_425967 107 5 noise noise NN 10_1101-2021_01_08_425967 107 6 in in IN 10_1101-2021_01_08_425967 107 7 the the DT 10_1101-2021_01_08_425967 107 8 cluster cluster NN 10_1101-2021_01_08_425967 107 9 can can MD 10_1101-2021_01_08_425967 107 10 help help VB 10_1101-2021_01_08_425967 107 11 to to TO 10_1101-2021_01_08_425967 107 12 pursue pursue VB 10_1101-2021_01_08_425967 107 13 better well JJR 10_1101-2021_01_08_425967 107 14 markers marker NNS 10_1101-2021_01_08_425967 107 15 since since IN 10_1101-2021_01_08_425967 107 16 it -PRON- PRP 10_1101-2021_01_08_425967 107 17 could could MD 10_1101-2021_01_08_425967 107 18 help help VB 10_1101-2021_01_08_425967 107 19 to to TO 10_1101-2021_01_08_425967 107 20 narrow narrow VB 10_1101-2021_01_08_425967 107 21 the the DT 10_1101-2021_01_08_425967 107 22 search search NN 10_1101-2021_01_08_425967 107 23 space space NN 10_1101-2021_01_08_425967 107 24 in in IN 10_1101-2021_01_08_425967 107 25 these these DT 10_1101-2021_01_08_425967 107 26 kinds kind NNS 10_1101-2021_01_08_425967 107 27 of of IN 10_1101-2021_01_08_425967 107 28 studies study NNS 10_1101-2021_01_08_425967 107 29 . . . 10_1101-2021_01_08_425967 108 1 ( ( -LRB- 10_1101-2021_01_08_425967 108 2 a a LS 10_1101-2021_01_08_425967 108 3 ) ) -RRB- 10_1101-2021_01_08_425967 108 4 ( ( -LRB- 10_1101-2021_01_08_425967 108 5 b b NN 10_1101-2021_01_08_425967 108 6 ) ) -RRB- 10_1101-2021_01_08_425967 108 7 Figure Figure NNP 10_1101-2021_01_08_425967 108 8 3 3 CD 10_1101-2021_01_08_425967 108 9 . . . 10_1101-2021_01_08_425967 109 1 Visual visual JJ 10_1101-2021_01_08_425967 109 2 representation representation NN 10_1101-2021_01_08_425967 109 3 of of IN 10_1101-2021_01_08_425967 109 4 clustered cluster VBN 10_1101-2021_01_08_425967 109 5 data datum NNS 10_1101-2021_01_08_425967 109 6 used use VBN 10_1101-2021_01_08_425967 109 7 to to TO 10_1101-2021_01_08_425967 109 8 assess assess VB 10_1101-2021_01_08_425967 109 9 the the DT 10_1101-2021_01_08_425967 109 10 method method NN 10_1101-2021_01_08_425967 109 11 . . . 10_1101-2021_01_08_425967 110 1 ( ( -LRB- 10_1101-2021_01_08_425967 110 2 a a LS 10_1101-2021_01_08_425967 110 3 ) ) -RRB- 10_1101-2021_01_08_425967 110 4 Dataset dataset NN 10_1101-2021_01_08_425967 110 5 from from IN 10_1101-2021_01_08_425967 110 6 Jie Jie NNP 10_1101-2021_01_08_425967 110 7 Shen Shen NNP 10_1101-2021_01_08_425967 110 8 et et NNP 10_1101-2021_01_08_425967 110 9 . . . 10_1101-2021_01_08_425967 111 1 al al NNP 10_1101-2021_01_08_425967 111 2 . . . 10_1101-2021_01_08_425967 112 1 ( ( -LRB- 10_1101-2021_01_08_425967 112 2 b b LS 10_1101-2021_01_08_425967 112 3 ) ) -RRB- 10_1101-2021_01_08_425967 112 4 Dataset dataset NN 10_1101-2021_01_08_425967 112 5 from from IN 10_1101-2021_01_08_425967 112 6 Tooyoka Tooyoka NNP 10_1101-2021_01_08_425967 112 7 et et NNP 10_1101-2021_01_08_425967 112 8 . . . 10_1101-2021_01_08_425967 113 1 al al NNP 10_1101-2021_01_08_425967 113 2 . . . 10_1101-2021_01_08_425967 114 1 3.3.2 3.3.2 CD 10_1101-2021_01_08_425967 114 2 . . . 10_1101-2021_01_08_425967 115 1 Distribution distribution NN 10_1101-2021_01_08_425967 115 2 of of IN 10_1101-2021_01_08_425967 115 3 microRNAs micrornas NN 10_1101-2021_01_08_425967 115 4 in in IN 10_1101-2021_01_08_425967 115 5 cancer cancer NN 10_1101-2021_01_08_425967 115 6 The the DT 10_1101-2021_01_08_425967 115 7 second second JJ 10_1101-2021_01_08_425967 115 8 dataset dataset NN 10_1101-2021_01_08_425967 115 9 consists consist VBZ 10_1101-2021_01_08_425967 115 10 of of IN 10_1101-2021_01_08_425967 115 11 103 103 CD 10_1101-2021_01_08_425967 115 12 expression expression NN 10_1101-2021_01_08_425967 115 13 profiles profile NNS 10_1101-2021_01_08_425967 115 14 of of IN 10_1101-2021_01_08_425967 115 15 microRNAs microRNAs NNP 10_1101-2021_01_08_425967 115 16 from from IN 10_1101-2021_01_08_425967 115 17 three three CD 10_1101-2021_01_08_425967 115 18 classes class NNS 10_1101-2021_01_08_425967 115 19 of of IN 10_1101-2021_01_08_425967 115 20 samples sample NNS 10_1101-2021_01_08_425967 115 21 : : : 10_1101-2021_01_08_425967 115 22 invasive invasive JJ 10_1101-2021_01_08_425967 115 23 breast breast NN 10_1101-2021_01_08_425967 115 24 cancer cancer NN 10_1101-2021_01_08_425967 115 25 , , , 10_1101-2021_01_08_425967 115 26 those those DT 10_1101-2021_01_08_425967 115 27 with with IN 10_1101-2021_01_08_425967 115 28 ductal ductal JJ 10_1101-2021_01_08_425967 115 29 carcinoma carcinoma NN 10_1101-2021_01_08_425967 115 30 in in IN 10_1101-2021_01_08_425967 115 31 situ situ NN 10_1101-2021_01_08_425967 115 32 ( ( -LRB- 10_1101-2021_01_08_425967 115 33 DCIS DCIS NNP 10_1101-2021_01_08_425967 115 34 ) ) -RRB- 10_1101-2021_01_08_425967 115 35 , , , 10_1101-2021_01_08_425967 115 36 and and CC 10_1101-2021_01_08_425967 115 37 health health NN 10_1101-2021_01_08_425967 115 38 ( ( -LRB- 10_1101-2021_01_08_425967 115 39 Figure figure NN 10_1101-2021_01_08_425967 115 40 3 3 CD 10_1101-2021_01_08_425967 115 41 ) ) -RRB- 10_1101-2021_01_08_425967 115 42 [ [ -LRB- 10_1101-2021_01_08_425967 115 43 8 8 CD 10_1101-2021_01_08_425967 115 44 ] ] -RRB- 10_1101-2021_01_08_425967 115 45 . . . 10_1101-2021_01_08_425967 116 1 The the DT 10_1101-2021_01_08_425967 116 2 authors author NNS 10_1101-2021_01_08_425967 116 3 visually visually RB 10_1101-2021_01_08_425967 116 4 identified identify VBD 10_1101-2021_01_08_425967 116 5 three three CD 10_1101-2021_01_08_425967 116 6 clusters cluster NNS 10_1101-2021_01_08_425967 116 7 , , , 10_1101-2021_01_08_425967 116 8 though though IN 10_1101-2021_01_08_425967 116 9 selecting select VBG 10_1101-2021_01_08_425967 116 10 the the DT 10_1101-2021_01_08_425967 116 11 right right JJ 10_1101-2021_01_08_425967 116 12 cutting cutting NN 10_1101-2021_01_08_425967 116 13 height height NN 10_1101-2021_01_08_425967 116 14 threshold threshold NN 10_1101-2021_01_08_425967 116 15 is be VBZ 10_1101-2021_01_08_425967 116 16 difficult difficult JJ 10_1101-2021_01_08_425967 116 17 . . . 10_1101-2021_01_08_425967 117 1 Besides besides RB 10_1101-2021_01_08_425967 117 2 , , , 10_1101-2021_01_08_425967 117 3 one one CD 10_1101-2021_01_08_425967 117 4 of of IN 10_1101-2021_01_08_425967 117 5 the the DT 10_1101-2021_01_08_425967 117 6 clusters cluster NNS 10_1101-2021_01_08_425967 117 7 is be VBZ 10_1101-2021_01_08_425967 117 8 a a DT 10_1101-2021_01_08_425967 117 9 mix mix NN 10_1101-2021_01_08_425967 117 10 of of IN 10_1101-2021_01_08_425967 117 11 classes class NNS 10_1101-2021_01_08_425967 117 12 in in IN 10_1101-2021_01_08_425967 117 13 different different JJ 10_1101-2021_01_08_425967 117 14 proportions proportion NNS 10_1101-2021_01_08_425967 117 15 , , , 10_1101-2021_01_08_425967 117 16 leading lead VBG 10_1101-2021_01_08_425967 117 17 the the DT 10_1101-2021_01_08_425967 117 18 authors author NNS 10_1101-2021_01_08_425967 117 19 to to TO 10_1101-2021_01_08_425967 117 20 arguably arguably RB 10_1101-2021_01_08_425967 117 21 conclude conclude VB 10_1101-2021_01_08_425967 117 22 that that IN 10_1101-2021_01_08_425967 117 23 the the DT 10_1101-2021_01_08_425967 117 24 DCIS DCIS NNP 10_1101-2021_01_08_425967 117 25 and and CC 10_1101-2021_01_08_425967 117 26 control control NN 10_1101-2021_01_08_425967 117 27 sample sample NN 10_1101-2021_01_08_425967 117 28 profiles profile NNS 10_1101-2021_01_08_425967 117 29 are be VBP 10_1101-2021_01_08_425967 117 30 not not RB 10_1101-2021_01_08_425967 117 31 different different JJ 10_1101-2021_01_08_425967 117 32 . . . 10_1101-2021_01_08_425967 118 1 On on IN 10_1101-2021_01_08_425967 118 2 this this DT 10_1101-2021_01_08_425967 118 3 matter matter NN 10_1101-2021_01_08_425967 118 4 , , , 10_1101-2021_01_08_425967 118 5 the the DT 10_1101-2021_01_08_425967 118 6 PQA PQA NNP 10_1101-2021_01_08_425967 118 7 score score NN 10_1101-2021_01_08_425967 118 8 and and CC 10_1101-2021_01_08_425967 118 9 the the DT 10_1101-2021_01_08_425967 118 10 proportion proportion NN 10_1101-2021_01_08_425967 118 11 of of IN 10_1101-2021_01_08_425967 118 12 noise noise NN 10_1101-2021_01_08_425967 118 13 are be VBP 10_1101-2021_01_08_425967 118 14 0.62 0.62 CD 10_1101-2021_01_08_425967 118 15 and and CC 10_1101-2021_01_08_425967 118 16 30.2 30.2 CD 10_1101-2021_01_08_425967 118 17 % % NN 10_1101-2021_01_08_425967 118 18 , , , 10_1101-2021_01_08_425967 118 19 respectively respectively RB 10_1101-2021_01_08_425967 118 20 ( ( -LRB- 10_1101-2021_01_08_425967 118 21 Figure figure NN 10_1101-2021_01_08_425967 118 22 4 4 CD 10_1101-2021_01_08_425967 118 23 , , , 10_1101-2021_01_08_425967 118 24 with with IN 10_1101-2021_01_08_425967 118 25 Z z NN 10_1101-2021_01_08_425967 118 26 - - HYPH 10_1101-2021_01_08_425967 118 27 score score NN 10_1101-2021_01_08_425967 118 28 of of IN 10_1101-2021_01_08_425967 118 29 6.2 6.2 CD 10_1101-2021_01_08_425967 118 30 and and CC 10_1101-2021_01_08_425967 118 31 a a DT 10_1101-2021_01_08_425967 118 32 p p NN 10_1101-2021_01_08_425967 118 33 - - HYPH 10_1101-2021_01_08_425967 118 34 value value NN 10_1101-2021_01_08_425967 118 35 of of IN 10_1101-2021_01_08_425967 118 36 3.9x10 3.9x10 CD 10_1101-2021_01_08_425967 118 37 - - SYM 10_1101-2021_01_08_425967 118 38 10 10 CD 10_1101-2021_01_08_425967 118 39 ) ) -RRB- 10_1101-2021_01_08_425967 118 40 providing provide VBG 10_1101-2021_01_08_425967 118 41 a a DT 10_1101-2021_01_08_425967 118 42 quantitative quantitative JJ 10_1101-2021_01_08_425967 118 43 assay assay NN 10_1101-2021_01_08_425967 118 44 to to TO 10_1101-2021_01_08_425967 118 45 support support VB 10_1101-2021_01_08_425967 118 46 the the DT 10_1101-2021_01_08_425967 118 47 grouping grouping NN 10_1101-2021_01_08_425967 118 48 that that IN 10_1101-2021_01_08_425967 118 49 the the DT 10_1101-2021_01_08_425967 118 50 authors author NNS 10_1101-2021_01_08_425967 118 51 claimed claim VBD 10_1101-2021_01_08_425967 118 52 . . . 10_1101-2021_01_08_425967 119 1 Furthermore furthermore RB 10_1101-2021_01_08_425967 119 2 , , , 10_1101-2021_01_08_425967 119 3 in in IN 10_1101-2021_01_08_425967 119 4 comparison comparison NN 10_1101-2021_01_08_425967 119 5 with with IN 10_1101-2021_01_08_425967 119 6 the the DT 10_1101-2021_01_08_425967 119 7 methylation methylation NN 10_1101-2021_01_08_425967 119 8 profiles profile NNS 10_1101-2021_01_08_425967 119 9 discussed discuss VBN 10_1101-2021_01_08_425967 119 10 above above RB 10_1101-2021_01_08_425967 119 11 , , , 10_1101-2021_01_08_425967 119 12 we -PRON- PRP 10_1101-2021_01_08_425967 119 13 can can MD 10_1101-2021_01_08_425967 119 14 appreciate appreciate VB 10_1101-2021_01_08_425967 119 15 that that IN 10_1101-2021_01_08_425967 119 16 a a DT 10_1101-2021_01_08_425967 119 17 partition partition NN 10_1101-2021_01_08_425967 119 18 which which WDT 10_1101-2021_01_08_425967 119 19 appear appear VBP 10_1101-2021_01_08_425967 119 20 even even RB 10_1101-2021_01_08_425967 119 21 less less RBR 10_1101-2021_01_08_425967 119 22 fuzzy fuzzy JJ 10_1101-2021_01_08_425967 119 23 has have VBZ 10_1101-2021_01_08_425967 119 24 even even RB 10_1101-2021_01_08_425967 119 25 a a DT 10_1101-2021_01_08_425967 119 26 higher high JJR 10_1101-2021_01_08_425967 119 27 noise noise NN 10_1101-2021_01_08_425967 119 28 ratio ratio NN 10_1101-2021_01_08_425967 119 29 , , , 10_1101-2021_01_08_425967 119 30 supporting support VBG 10_1101-2021_01_08_425967 119 31 the the DT 10_1101-2021_01_08_425967 119 32 idea idea NN 10_1101-2021_01_08_425967 119 33 of of IN 10_1101-2021_01_08_425967 119 34 how how WRB 10_1101-2021_01_08_425967 119 35 visual visual JJ 10_1101-2021_01_08_425967 119 36 inspection inspection NN 10_1101-2021_01_08_425967 119 37 could could MD 10_1101-2021_01_08_425967 119 38 lead lead VB 10_1101-2021_01_08_425967 119 39 to to IN 10_1101-2021_01_08_425967 119 40 misleading misleading JJ 10_1101-2021_01_08_425967 119 41 results result NNS 10_1101-2021_01_08_425967 119 42 . . . 10_1101-2021_01_08_425967 120 1 ( ( -LRB- 10_1101-2021_01_08_425967 120 2 a a LS 10_1101-2021_01_08_425967 120 3 ) ) -RRB- 10_1101-2021_01_08_425967 120 4 ( ( -LRB- 10_1101-2021_01_08_425967 120 5 b b NN 10_1101-2021_01_08_425967 120 6 ) ) -RRB- 10_1101-2021_01_08_425967 120 7 Figure Figure NNP 10_1101-2021_01_08_425967 120 8 4 4 CD 10_1101-2021_01_08_425967 120 9 . . . 10_1101-2021_01_08_425967 121 1 Z z JJ 10_1101-2021_01_08_425967 121 2 - - HYPH 10_1101-2021_01_08_425967 121 3 score score NN 10_1101-2021_01_08_425967 121 4 distribution distribution NN 10_1101-2021_01_08_425967 121 5 by by IN 10_1101-2021_01_08_425967 121 6 percentage percentage NN 10_1101-2021_01_08_425967 121 7 of of IN 10_1101-2021_01_08_425967 121 8 randomized randomized JJ 10_1101-2021_01_08_425967 121 9 items item NNS 10_1101-2021_01_08_425967 121 10 . . . 10_1101-2021_01_08_425967 122 1 ( ( -LRB- 10_1101-2021_01_08_425967 122 2 a a LS 10_1101-2021_01_08_425967 122 3 ) ) -RRB- 10_1101-2021_01_08_425967 122 4 Dataset dataset NN 10_1101-2021_01_08_425967 122 5 from from IN 10_1101-2021_01_08_425967 122 6 Jie Jie NNP 10_1101-2021_01_08_425967 122 7 Shen Shen NNP 10_1101-2021_01_08_425967 122 8 et et NNP 10_1101-2021_01_08_425967 122 9 . . . 10_1101-2021_01_08_425967 123 1 al al NNP 10_1101-2021_01_08_425967 123 2 . . . 10_1101-2021_01_08_425967 124 1 ( ( -LRB- 10_1101-2021_01_08_425967 124 2 b b LS 10_1101-2021_01_08_425967 124 3 ) ) -RRB- 10_1101-2021_01_08_425967 124 4 Dataset dataset NN 10_1101-2021_01_08_425967 124 5 from from IN 10_1101-2021_01_08_425967 124 6 Tooyoka Tooyoka NNP 10_1101-2021_01_08_425967 124 7 et et NNP 10_1101-2021_01_08_425967 124 8 . . . 10_1101-2021_01_08_425967 125 1 al al NNP 10_1101-2021_01_08_425967 125 2 . . . 10_1101-2021_01_08_425967 126 1 The the DT 10_1101-2021_01_08_425967 126 2 red red JJ 10_1101-2021_01_08_425967 126 3 dots dot NNS 10_1101-2021_01_08_425967 126 4 represent represent VBP 10_1101-2021_01_08_425967 126 5 the the DT 10_1101-2021_01_08_425967 126 6 Z z NN 10_1101-2021_01_08_425967 126 7 - - HYPH 10_1101-2021_01_08_425967 126 8 score score NN 10_1101-2021_01_08_425967 126 9 interpolation interpolation NN 10_1101-2021_01_08_425967 126 10 of of IN 10_1101-2021_01_08_425967 126 11 the the DT 10_1101-2021_01_08_425967 126 12 corresponding corresponding JJ 10_1101-2021_01_08_425967 126 13 data data NN 10_1101-2021_01_08_425967 126 14 sets set NNS 10_1101-2021_01_08_425967 126 15 . . . 10_1101-2021_01_08_425967 127 1 .CC .CC NFP 10_1101-2021_01_08_425967 127 2 - - : 10_1101-2021_01_08_425967 127 3 BY by IN 10_1101-2021_01_08_425967 127 4 4.0 4.0 CD 10_1101-2021_01_08_425967 127 5 International international JJ 10_1101-2021_01_08_425967 127 6 licensemade licensemade NN 10_1101-2021_01_08_425967 127 7 available available JJ 10_1101-2021_01_08_425967 127 8 under under IN 10_1101-2021_01_08_425967 127 9 a a DT 10_1101-2021_01_08_425967 127 10 ( ( -LRB- 10_1101-2021_01_08_425967 127 11 which which WDT 10_1101-2021_01_08_425967 127 12 was be VBD 10_1101-2021_01_08_425967 127 13 not not RB 10_1101-2021_01_08_425967 127 14 certified certify VBN 10_1101-2021_01_08_425967 127 15 by by IN 10_1101-2021_01_08_425967 127 16 peer peer NN 10_1101-2021_01_08_425967 127 17 review review NN 10_1101-2021_01_08_425967 127 18 ) ) -RRB- 10_1101-2021_01_08_425967 127 19 is be VBZ 10_1101-2021_01_08_425967 127 20 the the DT 10_1101-2021_01_08_425967 127 21 author author NN 10_1101-2021_01_08_425967 127 22 / / SYM 10_1101-2021_01_08_425967 127 23 funder funder NN 10_1101-2021_01_08_425967 127 24 , , , 10_1101-2021_01_08_425967 127 25 who who WP 10_1101-2021_01_08_425967 127 26 has have VBZ 10_1101-2021_01_08_425967 127 27 granted grant VBN 10_1101-2021_01_08_425967 127 28 bioRxiv biorxiv IN 10_1101-2021_01_08_425967 127 29 a a DT 10_1101-2021_01_08_425967 127 30 license license NN 10_1101-2021_01_08_425967 127 31 to to TO 10_1101-2021_01_08_425967 127 32 display display VB 10_1101-2021_01_08_425967 127 33 the the DT 10_1101-2021_01_08_425967 127 34 preprint preprint NN 10_1101-2021_01_08_425967 127 35 in in IN 10_1101-2021_01_08_425967 127 36 perpetuity perpetuity NN 10_1101-2021_01_08_425967 127 37 . . . 10_1101-2021_01_08_425967 128 1 It -PRON- PRP 10_1101-2021_01_08_425967 128 2 is be VBZ 10_1101-2021_01_08_425967 128 3 The the DT 10_1101-2021_01_08_425967 128 4 copyright copyright NN 10_1101-2021_01_08_425967 128 5 holder holder NN 10_1101-2021_01_08_425967 128 6 for for IN 10_1101-2021_01_08_425967 128 7 this this DT 10_1101-2021_01_08_425967 128 8 preprintthis preprintthis NN 10_1101-2021_01_08_425967 128 9 version version NN 10_1101-2021_01_08_425967 128 10 posted post VBD 10_1101-2021_01_08_425967 128 11 January January NNP 10_1101-2021_01_08_425967 128 12 9 9 CD 10_1101-2021_01_08_425967 128 13 , , , 10_1101-2021_01_08_425967 128 14 2021 2021 CD 10_1101-2021_01_08_425967 128 15 . . . 10_1101-2021_01_08_425967 128 16 ; ; : 10_1101-2021_01_08_425967 128 17 https://doi.org/10.1101/2021.01.08.425967doi https://doi.org/10.1101/2021.01.08.425967doi ADD 10_1101-2021_01_08_425967 128 18 : : : 10_1101-2021_01_08_425967 128 19 bioRxiv biorxiv VB 10_1101-2021_01_08_425967 128 20 preprint preprint NN 10_1101-2021_01_08_425967 128 21 https://doi.org/10.1101/2021.01.08.425967 https://doi.org/10.1101/2021.01.08.425967 NNP 10_1101-2021_01_08_425967 128 22 http://creativecommons.org/licenses/by/4.0/ http://creativecommons.org/licenses/by/4.0/ ADD 10_1101-2021_01_08_425967 128 23 3.3.3 3.3.3 CD 10_1101-2021_01_08_425967 128 24 . . . 10_1101-2021_01_08_425967 129 1 Comparison comparison NN 10_1101-2021_01_08_425967 129 2 of of IN 10_1101-2021_01_08_425967 129 3 genetic genetic JJ 10_1101-2021_01_08_425967 129 4 regulatory regulatory JJ 10_1101-2021_01_08_425967 129 5 networks network NNS 10_1101-2021_01_08_425967 129 6 with with IN 10_1101-2021_01_08_425967 129 7 theoretical theoretical JJ 10_1101-2021_01_08_425967 129 8 models model NNS 10_1101-2021_01_08_425967 129 9 Finally finally RB 10_1101-2021_01_08_425967 129 10 , , , 10_1101-2021_01_08_425967 129 11 to to TO 10_1101-2021_01_08_425967 129 12 assess assess VB 10_1101-2021_01_08_425967 129 13 the the DT 10_1101-2021_01_08_425967 129 14 PQA PQA NNP 10_1101-2021_01_08_425967 129 15 methodology methodology NN 10_1101-2021_01_08_425967 129 16 using use VBG 10_1101-2021_01_08_425967 129 17 systems system NNS 10_1101-2021_01_08_425967 129 18 biology biology NN 10_1101-2021_01_08_425967 129 19 data datum NNS 10_1101-2021_01_08_425967 129 20 we -PRON- PRP 10_1101-2021_01_08_425967 129 21 clustered cluster VBD 10_1101-2021_01_08_425967 129 22 210 210 CD 10_1101-2021_01_08_425967 129 23 networks network NNS 10_1101-2021_01_08_425967 129 24 according accord VBG 10_1101-2021_01_08_425967 129 25 to to IN 10_1101-2021_01_08_425967 129 26 their -PRON- PRP$ 10_1101-2021_01_08_425967 129 27 pairwise pairwise NN 10_1101-2021_01_08_425967 129 28 dissimilarity dissimilarity NN 10_1101-2021_01_08_425967 129 29 [ [ -LRB- 10_1101-2021_01_08_425967 129 30 9 9 CD 10_1101-2021_01_08_425967 129 31 ] ] -RRB- 10_1101-2021_01_08_425967 129 32 . . . 10_1101-2021_01_08_425967 130 1 First first RB 10_1101-2021_01_08_425967 130 2 , , , 10_1101-2021_01_08_425967 130 3 42 42 CD 10_1101-2021_01_08_425967 130 4 curated curate VBN 10_1101-2021_01_08_425967 130 5 biological biological JJ 10_1101-2021_01_08_425967 130 6 networks network NNS 10_1101-2021_01_08_425967 130 7 were be VBD 10_1101-2021_01_08_425967 130 8 retrieved retrieve VBN 10_1101-2021_01_08_425967 130 9 from from IN 10_1101-2021_01_08_425967 130 10 Abasy Abasy NNP 10_1101-2021_01_08_425967 130 11 Atlas Atlas NNP 10_1101-2021_01_08_425967 130 12 ( ( -LRB- 10_1101-2021_01_08_425967 130 13 v2.2 v2.2 NN 10_1101-2021_01_08_425967 130 14 ) ) -RRB- 10_1101-2021_01_08_425967 130 15 [ [ -LRB- 10_1101-2021_01_08_425967 130 16 10 10 CD 10_1101-2021_01_08_425967 130 17 ] ] -RRB- 10_1101-2021_01_08_425967 130 18 . . . 10_1101-2021_01_08_425967 131 1 For for IN 10_1101-2021_01_08_425967 131 2 each each DT 10_1101-2021_01_08_425967 131 3 biological biological JJ 10_1101-2021_01_08_425967 131 4 network network NN 10_1101-2021_01_08_425967 131 5 , , , 10_1101-2021_01_08_425967 131 6 we -PRON- PRP 10_1101-2021_01_08_425967 131 7 then then RB 10_1101-2021_01_08_425967 131 8 constructed construct VBD 10_1101-2021_01_08_425967 131 9 four four CD 10_1101-2021_01_08_425967 131 10 networks network NNS 10_1101-2021_01_08_425967 131 11 each each DT 10_1101-2021_01_08_425967 131 12 according accord VBG 10_1101-2021_01_08_425967 131 13 to to IN 10_1101-2021_01_08_425967 131 14 a a DT 10_1101-2021_01_08_425967 131 15 theoretical theoretical JJ 10_1101-2021_01_08_425967 131 16 model model NN 10_1101-2021_01_08_425967 131 17 ( ( -LRB- 10_1101-2021_01_08_425967 131 18 Barabasi Barabasi NNP 10_1101-2021_01_08_425967 131 19 - - HYPH 10_1101-2021_01_08_425967 131 20 Alberts Alberts NNP 10_1101-2021_01_08_425967 131 21 , , , 10_1101-2021_01_08_425967 131 22 Erdos Erdos NNP 10_1101-2021_01_08_425967 131 23 - - HYPH 10_1101-2021_01_08_425967 131 24 Renyi Renyi NNP 10_1101-2021_01_08_425967 131 25 , , , 10_1101-2021_01_08_425967 131 26 Scale scale NN 10_1101-2021_01_08_425967 131 27 - - HYPH 10_1101-2021_01_08_425967 131 28 free free JJ 10_1101-2021_01_08_425967 131 29 , , , 10_1101-2021_01_08_425967 131 30 and and CC 10_1101-2021_01_08_425967 131 31 Hierarchical- Hierarchical- NNP 10_1101-2021_01_08_425967 131 32 modular modular JJ 10_1101-2021_01_08_425967 131 33 ) ) -RRB- 10_1101-2021_01_08_425967 131 34 . . . 10_1101-2021_01_08_425967 132 1 We -PRON- PRP 10_1101-2021_01_08_425967 132 2 estimated estimate VBD 10_1101-2021_01_08_425967 132 3 the the DT 10_1101-2021_01_08_425967 132 4 parameters parameter NNS 10_1101-2021_01_08_425967 132 5 of of IN 10_1101-2021_01_08_425967 132 6 each each DT 10_1101-2021_01_08_425967 132 7 theoretical theoretical JJ 10_1101-2021_01_08_425967 132 8 model model NN 10_1101-2021_01_08_425967 132 9 from from IN 10_1101-2021_01_08_425967 132 10 the the DT 10_1101-2021_01_08_425967 132 11 properties property NNS 10_1101-2021_01_08_425967 132 12 of of IN 10_1101-2021_01_08_425967 132 13 the the DT 10_1101-2021_01_08_425967 132 14 corresponding correspond VBG 10_1101-2021_01_08_425967 132 15 biological biological JJ 10_1101-2021_01_08_425967 132 16 network network NN 10_1101-2021_01_08_425967 132 17 . . . 10_1101-2021_01_08_425967 133 1 The the DT 10_1101-2021_01_08_425967 133 2 models model NNS 10_1101-2021_01_08_425967 133 3 used use VBD 10_1101-2021_01_08_425967 133 4 reproduce reproduce VBP 10_1101-2021_01_08_425967 133 5 one one CD 10_1101-2021_01_08_425967 133 6 or or CC 10_1101-2021_01_08_425967 133 7 more more JJR 10_1101-2021_01_08_425967 133 8 intrinsic intrinsic JJ 10_1101-2021_01_08_425967 133 9 characteristics characteristic NNS 10_1101-2021_01_08_425967 133 10 of of IN 10_1101-2021_01_08_425967 133 11 the the DT 10_1101-2021_01_08_425967 133 12 biological biological JJ 10_1101-2021_01_08_425967 133 13 networks network NNS 10_1101-2021_01_08_425967 133 14 , , , 10_1101-2021_01_08_425967 133 15 such such JJ 10_1101-2021_01_08_425967 133 16 as as IN 10_1101-2021_01_08_425967 133 17 power power NN 10_1101-2021_01_08_425967 133 18 - - HYPH 10_1101-2021_01_08_425967 133 19 law law NN 10_1101-2021_01_08_425967 133 20 distribution distribution NN 10_1101-2021_01_08_425967 133 21 , , , 10_1101-2021_01_08_425967 133 22 hubs hub NNS 10_1101-2021_01_08_425967 133 23 , , , 10_1101-2021_01_08_425967 133 24 and and CC 10_1101-2021_01_08_425967 133 25 scale scale NN 10_1101-2021_01_08_425967 133 26 - - HYPH 10_1101-2021_01_08_425967 133 27 free free JJ 10_1101-2021_01_08_425967 133 28 degrees degree NNS 10_1101-2021_01_08_425967 133 29 , , , 10_1101-2021_01_08_425967 133 30 and and CC 10_1101-2021_01_08_425967 133 31 hierarchical hierarchical JJ 10_1101-2021_01_08_425967 133 32 modular modular JJ 10_1101-2021_01_08_425967 133 33 structure structure NN 10_1101-2021_01_08_425967 133 34 [ [ -LRB- 10_1101-2021_01_08_425967 133 35 11 11 CD 10_1101-2021_01_08_425967 133 36 ] ] -RRB- 10_1101-2021_01_08_425967 133 37 . . . 10_1101-2021_01_08_425967 134 1 Visual visual JJ 10_1101-2021_01_08_425967 134 2 inspection inspection NN 10_1101-2021_01_08_425967 134 3 suggested suggest VBD 10_1101-2021_01_08_425967 134 4 that that IN 10_1101-2021_01_08_425967 134 5 the the DT 10_1101-2021_01_08_425967 134 6 classification classification NN 10_1101-2021_01_08_425967 134 7 yielded yield VBD 10_1101-2021_01_08_425967 134 8 a a DT 10_1101-2021_01_08_425967 134 9 highly highly RB 10_1101-2021_01_08_425967 134 10 ordered order VBN 10_1101-2021_01_08_425967 134 11 PV PV NNP 10_1101-2021_01_08_425967 134 12 , , , 10_1101-2021_01_08_425967 134 13 distinguishing distinguish VBG 10_1101-2021_01_08_425967 134 14 according accord VBG 10_1101-2021_01_08_425967 134 15 to to IN 10_1101-2021_01_08_425967 134 16 the the DT 10_1101-2021_01_08_425967 134 17 nature nature NN 10_1101-2021_01_08_425967 134 18 of of IN 10_1101-2021_01_08_425967 134 19 each each DT 10_1101-2021_01_08_425967 134 20 network network NN 10_1101-2021_01_08_425967 134 21 ( ( -LRB- 10_1101-2021_01_08_425967 134 22 Figure Figure NNP 10_1101-2021_01_08_425967 134 23 5 5 CD 10_1101-2021_01_08_425967 134 24 ) ) -RRB- 10_1101-2021_01_08_425967 134 25 . . . 10_1101-2021_01_08_425967 135 1 The the DT 10_1101-2021_01_08_425967 135 2 PQA PQA NNP 10_1101-2021_01_08_425967 135 3 score score NN 10_1101-2021_01_08_425967 135 4 for for IN 10_1101-2021_01_08_425967 135 5 this this DT 10_1101-2021_01_08_425967 135 6 VP VP NNP 10_1101-2021_01_08_425967 135 7 is be VBZ 10_1101-2021_01_08_425967 135 8 0.92 0.92 CD 10_1101-2021_01_08_425967 135 9 ( ( -LRB- 10_1101-2021_01_08_425967 135 10 p p NN 10_1101-2021_01_08_425967 135 11 - - HYPH 10_1101-2021_01_08_425967 135 12 value value NN 10_1101-2021_01_08_425967 135 13 = = SYM 10_1101-2021_01_08_425967 135 14 2.5x10 2.5x10 CD 10_1101-2021_01_08_425967 135 15 - - SYM 10_1101-2021_01_08_425967 135 16 40 40 CD 10_1101-2021_01_08_425967 135 17 , , , 10_1101-2021_01_08_425967 135 18 Z z NN 10_1101-2021_01_08_425967 135 19 - - HYPH 10_1101-2021_01_08_425967 135 20 score score NN 10_1101-2021_01_08_425967 135 21 = = SYM 10_1101-2021_01_08_425967 135 22 13.2 13.2 CD 10_1101-2021_01_08_425967 135 23 ) ) -RRB- 10_1101-2021_01_08_425967 135 24 and and CC 10_1101-2021_01_08_425967 135 25 the the DT 10_1101-2021_01_08_425967 135 26 proportion proportion NN 10_1101-2021_01_08_425967 135 27 of of IN 10_1101-2021_01_08_425967 135 28 noise noise NN 10_1101-2021_01_08_425967 135 29 was be VBD 10_1101-2021_01_08_425967 135 30 5.8 5.8 CD 10_1101-2021_01_08_425967 135 31 % % NN 10_1101-2021_01_08_425967 135 32 ( ( -LRB- 10_1101-2021_01_08_425967 135 33 Figure Figure NNP 10_1101-2021_01_08_425967 135 34 6 6 CD 10_1101-2021_01_08_425967 135 35 ) ) -RRB- 10_1101-2021_01_08_425967 135 36 . . . 10_1101-2021_01_08_425967 136 1 In in IN 10_1101-2021_01_08_425967 136 2 contrast contrast NN 10_1101-2021_01_08_425967 136 3 to to IN 10_1101-2021_01_08_425967 136 4 the the DT 10_1101-2021_01_08_425967 136 5 previous previous JJ 10_1101-2021_01_08_425967 136 6 examples example NNS 10_1101-2021_01_08_425967 136 7 , , , 10_1101-2021_01_08_425967 136 8 here here RB 10_1101-2021_01_08_425967 136 9 we -PRON- PRP 10_1101-2021_01_08_425967 136 10 obtained obtain VBD 10_1101-2021_01_08_425967 136 11 a a DT 10_1101-2021_01_08_425967 136 12 highly highly RB 10_1101-2021_01_08_425967 136 13 ordered order VBN 10_1101-2021_01_08_425967 136 14 clustering clustering NN 10_1101-2021_01_08_425967 136 15 and and CC 10_1101-2021_01_08_425967 136 16 a a DT 10_1101-2021_01_08_425967 136 17 very very RB 10_1101-2021_01_08_425967 136 18 low low JJ 10_1101-2021_01_08_425967 136 19 proportion proportion NN 10_1101-2021_01_08_425967 136 20 of of IN 10_1101-2021_01_08_425967 136 21 noise noise NN 10_1101-2021_01_08_425967 136 22 , , , 10_1101-2021_01_08_425967 136 23 which which WDT 10_1101-2021_01_08_425967 136 24 suggests suggest VBZ 10_1101-2021_01_08_425967 136 25 that that IN 10_1101-2021_01_08_425967 136 26 although although IN 10_1101-2021_01_08_425967 136 27 the the DT 10_1101-2021_01_08_425967 136 28 models model NNS 10_1101-2021_01_08_425967 136 29 recapitulate recapitulate VBP 10_1101-2021_01_08_425967 136 30 some some DT 10_1101-2021_01_08_425967 136 31 of of IN 10_1101-2021_01_08_425967 136 32 the the DT 10_1101-2021_01_08_425967 136 33 properties property NNS 10_1101-2021_01_08_425967 136 34 of of IN 10_1101-2021_01_08_425967 136 35 genetic genetic JJ 10_1101-2021_01_08_425967 136 36 regulatory regulatory JJ 10_1101-2021_01_08_425967 136 37 networks network NNS 10_1101-2021_01_08_425967 136 38 , , , 10_1101-2021_01_08_425967 136 39 each each DT 10_1101-2021_01_08_425967 136 40 of of IN 10_1101-2021_01_08_425967 136 41 them -PRON- PRP 10_1101-2021_01_08_425967 136 42 is be VBZ 10_1101-2021_01_08_425967 136 43 not not RB 10_1101-2021_01_08_425967 136 44 sufficient sufficient JJ 10_1101-2021_01_08_425967 136 45 to to TO 10_1101-2021_01_08_425967 136 46 capture capture VB 10_1101-2021_01_08_425967 136 47 their -PRON- PRP$ 10_1101-2021_01_08_425967 136 48 structural structural JJ 10_1101-2021_01_08_425967 136 49 properties property NNS 10_1101-2021_01_08_425967 136 50 . . . 10_1101-2021_01_08_425967 137 1 Figure figure NN 10_1101-2021_01_08_425967 137 2 5 5 CD 10_1101-2021_01_08_425967 137 3 . . . 10_1101-2021_01_08_425967 138 1 Cluster cluster JJ 10_1101-2021_01_08_425967 138 2 analysis analysis NN 10_1101-2021_01_08_425967 138 3 of of IN 10_1101-2021_01_08_425967 138 4 distance distance NN 10_1101-2021_01_08_425967 138 5 among among IN 10_1101-2021_01_08_425967 138 6 gene gene NN 10_1101-2021_01_08_425967 138 7 regulatory regulatory JJ 10_1101-2021_01_08_425967 138 8 networks network NNS 10_1101-2021_01_08_425967 138 9 and and CC 10_1101-2021_01_08_425967 138 10 theoretical theoretical JJ 10_1101-2021_01_08_425967 138 11 network network NN 10_1101-2021_01_08_425967 138 12 models model NNS 10_1101-2021_01_08_425967 138 13 . . . 10_1101-2021_01_08_425967 139 1 The the DT 10_1101-2021_01_08_425967 139 2 abbreviations abbreviation NNS 10_1101-2021_01_08_425967 139 3 and and CC 10_1101-2021_01_08_425967 139 4 colors color NNS 10_1101-2021_01_08_425967 139 5 used use VBN 10_1101-2021_01_08_425967 139 6 in in IN 10_1101-2021_01_08_425967 139 7 the the DT 10_1101-2021_01_08_425967 139 8 posterior posterior NN 10_1101-2021_01_08_425967 139 9 classification classification NN 10_1101-2021_01_08_425967 139 10 are be VBP 10_1101-2021_01_08_425967 139 11 as as IN 10_1101-2021_01_08_425967 139 12 follows follow VBZ 10_1101-2021_01_08_425967 139 13 : : : 10_1101-2021_01_08_425967 139 14 Barabasi- Barabasi- NNP 10_1101-2021_01_08_425967 139 15 Alberts Alberts NNPS 10_1101-2021_01_08_425967 139 16 ( ( -LRB- 10_1101-2021_01_08_425967 139 17 BA BA NNP 10_1101-2021_01_08_425967 139 18 , , , 10_1101-2021_01_08_425967 139 19 red red NN 10_1101-2021_01_08_425967 139 20 ) ) -RRB- 10_1101-2021_01_08_425967 139 21 , , , 10_1101-2021_01_08_425967 139 22 Erdos Erdos NNP 10_1101-2021_01_08_425967 139 23 - - HYPH 10_1101-2021_01_08_425967 139 24 Renyi Renyi NNP 10_1101-2021_01_08_425967 139 25 ( ( -LRB- 10_1101-2021_01_08_425967 139 26 ER ER NNP 10_1101-2021_01_08_425967 139 27 , , , 10_1101-2021_01_08_425967 139 28 blue blue JJ 10_1101-2021_01_08_425967 139 29 ) ) -RRB- 10_1101-2021_01_08_425967 139 30 , , , 10_1101-2021_01_08_425967 139 31 Scale scale NN 10_1101-2021_01_08_425967 139 32 - - HYPH 10_1101-2021_01_08_425967 139 33 free free JJ 10_1101-2021_01_08_425967 139 34 ( ( -LRB- 10_1101-2021_01_08_425967 139 35 SF SF NNP 10_1101-2021_01_08_425967 139 36 , , , 10_1101-2021_01_08_425967 139 37 green green JJ 10_1101-2021_01_08_425967 139 38 ) ) -RRB- 10_1101-2021_01_08_425967 139 39 , , , 10_1101-2021_01_08_425967 139 40 Hierarchical hierarchical JJ 10_1101-2021_01_08_425967 139 41 modularity modularity NN 10_1101-2021_01_08_425967 139 42 ( ( -LRB- 10_1101-2021_01_08_425967 139 43 HM HM NNP 10_1101-2021_01_08_425967 139 44 , , , 10_1101-2021_01_08_425967 139 45 purple purple NNP 10_1101-2021_01_08_425967 139 46 ) ) -RRB- 10_1101-2021_01_08_425967 139 47 , , , 10_1101-2021_01_08_425967 139 48 and and CC 10_1101-2021_01_08_425967 139 49 biological biological JJ 10_1101-2021_01_08_425967 139 50 networks network NNS 10_1101-2021_01_08_425967 139 51 ( ( -LRB- 10_1101-2021_01_08_425967 139 52 Bi Bi NNP 10_1101-2021_01_08_425967 139 53 , , , 10_1101-2021_01_08_425967 139 54 orange orange NNP 10_1101-2021_01_08_425967 139 55 ) ) -RRB- 10_1101-2021_01_08_425967 139 56 . . . 10_1101-2021_01_08_425967 140 1 .CC .CC NFP 10_1101-2021_01_08_425967 140 2 - - : 10_1101-2021_01_08_425967 140 3 BY by IN 10_1101-2021_01_08_425967 140 4 4.0 4.0 CD 10_1101-2021_01_08_425967 140 5 International international JJ 10_1101-2021_01_08_425967 140 6 licensemade licensemade NN 10_1101-2021_01_08_425967 140 7 available available JJ 10_1101-2021_01_08_425967 140 8 under under IN 10_1101-2021_01_08_425967 140 9 a a DT 10_1101-2021_01_08_425967 140 10 ( ( -LRB- 10_1101-2021_01_08_425967 140 11 which which WDT 10_1101-2021_01_08_425967 140 12 was be VBD 10_1101-2021_01_08_425967 140 13 not not RB 10_1101-2021_01_08_425967 140 14 certified certify VBN 10_1101-2021_01_08_425967 140 15 by by IN 10_1101-2021_01_08_425967 140 16 peer peer NN 10_1101-2021_01_08_425967 140 17 review review NN 10_1101-2021_01_08_425967 140 18 ) ) -RRB- 10_1101-2021_01_08_425967 140 19 is be VBZ 10_1101-2021_01_08_425967 140 20 the the DT 10_1101-2021_01_08_425967 140 21 author author NN 10_1101-2021_01_08_425967 140 22 / / SYM 10_1101-2021_01_08_425967 140 23 funder funder NN 10_1101-2021_01_08_425967 140 24 , , , 10_1101-2021_01_08_425967 140 25 who who WP 10_1101-2021_01_08_425967 140 26 has have VBZ 10_1101-2021_01_08_425967 140 27 granted grant VBN 10_1101-2021_01_08_425967 140 28 bioRxiv biorxiv IN 10_1101-2021_01_08_425967 140 29 a a DT 10_1101-2021_01_08_425967 140 30 license license NN 10_1101-2021_01_08_425967 140 31 to to TO 10_1101-2021_01_08_425967 140 32 display display VB 10_1101-2021_01_08_425967 140 33 the the DT 10_1101-2021_01_08_425967 140 34 preprint preprint NN 10_1101-2021_01_08_425967 140 35 in in IN 10_1101-2021_01_08_425967 140 36 perpetuity perpetuity NN 10_1101-2021_01_08_425967 140 37 . . . 10_1101-2021_01_08_425967 141 1 It -PRON- PRP 10_1101-2021_01_08_425967 141 2 is be VBZ 10_1101-2021_01_08_425967 141 3 The the DT 10_1101-2021_01_08_425967 141 4 copyright copyright NN 10_1101-2021_01_08_425967 141 5 holder holder NN 10_1101-2021_01_08_425967 141 6 for for IN 10_1101-2021_01_08_425967 141 7 this this DT 10_1101-2021_01_08_425967 141 8 preprintthis preprintthis NN 10_1101-2021_01_08_425967 141 9 version version NN 10_1101-2021_01_08_425967 141 10 posted post VBD 10_1101-2021_01_08_425967 141 11 January January NNP 10_1101-2021_01_08_425967 141 12 9 9 CD 10_1101-2021_01_08_425967 141 13 , , , 10_1101-2021_01_08_425967 141 14 2021 2021 CD 10_1101-2021_01_08_425967 141 15 . . . 10_1101-2021_01_08_425967 141 16 ; ; : 10_1101-2021_01_08_425967 141 17 https://doi.org/10.1101/2021.01.08.425967doi https://doi.org/10.1101/2021.01.08.425967doi ADD 10_1101-2021_01_08_425967 141 18 : : : 10_1101-2021_01_08_425967 141 19 bioRxiv biorxiv VB 10_1101-2021_01_08_425967 141 20 preprint preprint NN 10_1101-2021_01_08_425967 141 21 https://doi.org/10.1101/2021.01.08.425967 https://doi.org/10.1101/2021.01.08.425967 NNP 10_1101-2021_01_08_425967 141 22 http://creativecommons.org/licenses/by/4.0/ http://creativecommons.org/licenses/by/4.0/ -LRB- 10_1101-2021_01_08_425967 141 23 Figure Figure NNP 10_1101-2021_01_08_425967 141 24 6 6 CD 10_1101-2021_01_08_425967 141 25 . . . 10_1101-2021_01_08_425967 142 1 Z z JJ 10_1101-2021_01_08_425967 142 2 - - HYPH 10_1101-2021_01_08_425967 142 3 score score NN 10_1101-2021_01_08_425967 142 4 distribution distribution NN 10_1101-2021_01_08_425967 142 5 by by IN 10_1101-2021_01_08_425967 142 6 percentage percentage NN 10_1101-2021_01_08_425967 142 7 of of IN 10_1101-2021_01_08_425967 142 8 randomized randomized JJ 10_1101-2021_01_08_425967 142 9 items item NNS 10_1101-2021_01_08_425967 142 10 of of IN 10_1101-2021_01_08_425967 142 11 VP VP NNP 10_1101-2021_01_08_425967 142 12 from from IN 10_1101-2021_01_08_425967 142 13 genetic genetic JJ 10_1101-2021_01_08_425967 142 14 regulatory regulatory JJ 10_1101-2021_01_08_425967 142 15 networks network NNS 10_1101-2021_01_08_425967 142 16 . . . 10_1101-2021_01_08_425967 143 1 The the DT 10_1101-2021_01_08_425967 143 2 red red JJ 10_1101-2021_01_08_425967 143 3 dot dot NN 10_1101-2021_01_08_425967 143 4 represents represent VBZ 10_1101-2021_01_08_425967 143 5 the the DT 10_1101-2021_01_08_425967 143 6 Z z NN 10_1101-2021_01_08_425967 143 7 - - HYPH 10_1101-2021_01_08_425967 143 8 score score NN 10_1101-2021_01_08_425967 143 9 interpolation interpolation NN 10_1101-2021_01_08_425967 143 10 of of IN 10_1101-2021_01_08_425967 143 11 the the DT 10_1101-2021_01_08_425967 143 12 actual actual JJ 10_1101-2021_01_08_425967 143 13 data data NN 10_1101-2021_01_08_425967 143 14 set set NN 10_1101-2021_01_08_425967 143 15 . . . 10_1101-2021_01_08_425967 144 1 4 4 LS 10_1101-2021_01_08_425967 144 2 . . . 10_1101-2021_01_08_425967 145 1 Conclusions conclusion NNS 10_1101-2021_01_08_425967 145 2 In in IN 10_1101-2021_01_08_425967 145 3 this this DT 10_1101-2021_01_08_425967 145 4 work work NN 10_1101-2021_01_08_425967 145 5 , , , 10_1101-2021_01_08_425967 145 6 we -PRON- PRP 10_1101-2021_01_08_425967 145 7 presented present VBD 10_1101-2021_01_08_425967 145 8 a a DT 10_1101-2021_01_08_425967 145 9 novel novel JJ 10_1101-2021_01_08_425967 145 10 method method NN 10_1101-2021_01_08_425967 145 11 to to TO 10_1101-2021_01_08_425967 145 12 quantify quantify VB 10_1101-2021_01_08_425967 145 13 the the DT 10_1101-2021_01_08_425967 145 14 proportion proportion NN 10_1101-2021_01_08_425967 145 15 of of IN 10_1101-2021_01_08_425967 145 16 noise noise NN 10_1101-2021_01_08_425967 145 17 embedded embed VBN 10_1101-2021_01_08_425967 145 18 in in IN 10_1101-2021_01_08_425967 145 19 the the DT 10_1101-2021_01_08_425967 145 20 grouping grouping NN 10_1101-2021_01_08_425967 145 21 of of IN 10_1101-2021_01_08_425967 145 22 associated associate VBN 10_1101-2021_01_08_425967 145 23 classes class NNS 10_1101-2021_01_08_425967 145 24 of of IN 10_1101-2021_01_08_425967 145 25 the the DT 10_1101-2021_01_08_425967 145 26 elements element NNS 10_1101-2021_01_08_425967 145 27 in in IN 10_1101-2021_01_08_425967 145 28 hierarchical hierarchical JJ 10_1101-2021_01_08_425967 145 29 clustering clustering NN 10_1101-2021_01_08_425967 145 30 . . . 10_1101-2021_01_08_425967 146 1 We -PRON- PRP 10_1101-2021_01_08_425967 146 2 proposed propose VBD 10_1101-2021_01_08_425967 146 3 a a DT 10_1101-2021_01_08_425967 146 4 relative relative JJ 10_1101-2021_01_08_425967 146 5 score score NN 10_1101-2021_01_08_425967 146 6 derived derive VBN 10_1101-2021_01_08_425967 146 7 from from IN 10_1101-2021_01_08_425967 146 8 an an DT 10_1101-2021_01_08_425967 146 9 SC SC NNP 10_1101-2021_01_08_425967 146 10 of of IN 10_1101-2021_01_08_425967 146 11 the the DT 10_1101-2021_01_08_425967 146 12 VP vp NN 10_1101-2021_01_08_425967 146 13 from from IN 10_1101-2021_01_08_425967 146 14 the the DT 10_1101-2021_01_08_425967 146 15 dendrogram dendrogram NN 10_1101-2021_01_08_425967 146 16 of of IN 10_1101-2021_01_08_425967 146 17 any any DT 10_1101-2021_01_08_425967 146 18 clustering cluster VBG 10_1101-2021_01_08_425967 146 19 analysis analysis NN 10_1101-2021_01_08_425967 146 20 and and CC 10_1101-2021_01_08_425967 146 21 calculated calculate VBD 10_1101-2021_01_08_425967 146 22 Z- Z- NNP 10_1101-2021_01_08_425967 146 23 statistics statistic NNS 10_1101-2021_01_08_425967 146 24 as as RB 10_1101-2021_01_08_425967 146 25 well well RB 10_1101-2021_01_08_425967 146 26 as as IN 10_1101-2021_01_08_425967 146 27 an an DT 10_1101-2021_01_08_425967 146 28 extrapolation extrapolation NN 10_1101-2021_01_08_425967 146 29 to to TO 10_1101-2021_01_08_425967 146 30 deliver deliver VB 10_1101-2021_01_08_425967 146 31 an an DT 10_1101-2021_01_08_425967 146 32 estimation estimation NN 10_1101-2021_01_08_425967 146 33 of of IN 10_1101-2021_01_08_425967 146 34 noise noise NN 10_1101-2021_01_08_425967 146 35 in in IN 10_1101-2021_01_08_425967 146 36 the the DT 10_1101-2021_01_08_425967 146 37 VP vp NN 10_1101-2021_01_08_425967 146 38 . . . 10_1101-2021_01_08_425967 147 1 We -PRON- PRP 10_1101-2021_01_08_425967 147 2 explain explain VBP 10_1101-2021_01_08_425967 147 3 how how WRB 10_1101-2021_01_08_425967 147 4 the the DT 10_1101-2021_01_08_425967 147 5 method method NN 10_1101-2021_01_08_425967 147 6 is be VBZ 10_1101-2021_01_08_425967 147 7 formulated formulate VBN 10_1101-2021_01_08_425967 147 8 and and CC 10_1101-2021_01_08_425967 147 9 show show VB 10_1101-2021_01_08_425967 147 10 the the DT 10_1101-2021_01_08_425967 147 11 tests test NNS 10_1101-2021_01_08_425967 147 12 we -PRON- PRP 10_1101-2021_01_08_425967 147 13 made make VBD 10_1101-2021_01_08_425967 147 14 to to TO 10_1101-2021_01_08_425967 147 15 systematically systematically RB 10_1101-2021_01_08_425967 147 16 refine refine VB 10_1101-2021_01_08_425967 147 17 it -PRON- PRP 10_1101-2021_01_08_425967 147 18 . . . 10_1101-2021_01_08_425967 148 1 We -PRON- PRP 10_1101-2021_01_08_425967 148 2 additionally additionally RB 10_1101-2021_01_08_425967 148 3 made make VBD 10_1101-2021_01_08_425967 148 4 a a DT 10_1101-2021_01_08_425967 148 5 proof proof NN 10_1101-2021_01_08_425967 148 6 of of IN 10_1101-2021_01_08_425967 148 7 concept concept NN 10_1101-2021_01_08_425967 148 8 by by IN 10_1101-2021_01_08_425967 148 9 using use VBG 10_1101-2021_01_08_425967 148 10 clustering cluster VBG 10_1101-2021_01_08_425967 148 11 data datum NNS 10_1101-2021_01_08_425967 148 12 from from IN 10_1101-2021_01_08_425967 148 13 two two CD 10_1101-2021_01_08_425967 148 14 works work NNS 10_1101-2021_01_08_425967 148 15 that that WDT 10_1101-2021_01_08_425967 148 16 we -PRON- PRP 10_1101-2021_01_08_425967 148 17 think think VBP 10_1101-2021_01_08_425967 148 18 perfectly perfectly RB 10_1101-2021_01_08_425967 148 19 represent represent VBP 10_1101-2021_01_08_425967 148 20 overfitting overfitting NN 10_1101-2021_01_08_425967 148 21 by by IN 10_1101-2021_01_08_425967 148 22 apophenia apophenia NNP 10_1101-2021_01_08_425967 148 23 . . . 10_1101-2021_01_08_425967 149 1 Additionally additionally RB 10_1101-2021_01_08_425967 149 2 , , , 10_1101-2021_01_08_425967 149 3 we -PRON- PRP 10_1101-2021_01_08_425967 149 4 added add VBD 10_1101-2021_01_08_425967 149 5 an an DT 10_1101-2021_01_08_425967 149 6 example example NN 10_1101-2021_01_08_425967 149 7 from from IN 10_1101-2021_01_08_425967 149 8 network network NN 10_1101-2021_01_08_425967 149 9 biology biology NN 10_1101-2021_01_08_425967 149 10 where where WRB 10_1101-2021_01_08_425967 149 11 clustered clustered JJ 10_1101-2021_01_08_425967 149 12 networks network NNS 10_1101-2021_01_08_425967 149 13 are be VBP 10_1101-2021_01_08_425967 149 14 separated separate VBN 10_1101-2021_01_08_425967 149 15 by by IN 10_1101-2021_01_08_425967 149 16 intrinsic intrinsic JJ 10_1101-2021_01_08_425967 149 17 characteristics characteristic NNS 10_1101-2021_01_08_425967 149 18 . . . 10_1101-2021_01_08_425967 150 1 Although although IN 10_1101-2021_01_08_425967 150 2 in in IN 10_1101-2021_01_08_425967 150 3 this this DT 10_1101-2021_01_08_425967 150 4 work work NN 10_1101-2021_01_08_425967 150 5 we -PRON- PRP 10_1101-2021_01_08_425967 150 6 focused focus VBD 10_1101-2021_01_08_425967 150 7 on on IN 10_1101-2021_01_08_425967 150 8 examples example NNS 10_1101-2021_01_08_425967 150 9 where where WRB 10_1101-2021_01_08_425967 150 10 hierarchical hierarchical JJ 10_1101-2021_01_08_425967 150 11 clustering clustering NN 10_1101-2021_01_08_425967 150 12 is be VBZ 10_1101-2021_01_08_425967 150 13 performed perform VBN 10_1101-2021_01_08_425967 150 14 , , , 10_1101-2021_01_08_425967 150 15 this this DT 10_1101-2021_01_08_425967 150 16 framework framework NN 10_1101-2021_01_08_425967 150 17 can can MD 10_1101-2021_01_08_425967 150 18 apply apply VB 10_1101-2021_01_08_425967 150 19 to to IN 10_1101-2021_01_08_425967 150 20 any any DT 10_1101-2021_01_08_425967 150 21 partition partition NN 10_1101-2021_01_08_425967 150 22 algorithm algorithm VB 10_1101-2021_01_08_425967 150 23 in in IN 10_1101-2021_01_08_425967 150 24 which which WDT 10_1101-2021_01_08_425967 150 25 the the DT 10_1101-2021_01_08_425967 150 26 elements element NNS 10_1101-2021_01_08_425967 150 27 are be VBP 10_1101-2021_01_08_425967 150 28 identified identify VBN 10_1101-2021_01_08_425967 150 29 and and CC 10_1101-2021_01_08_425967 150 30 a a DT 10_1101-2021_01_08_425967 150 31 vector vector NN 10_1101-2021_01_08_425967 150 32 of of IN 10_1101-2021_01_08_425967 150 33 the the DT 10_1101-2021_01_08_425967 150 34 order order NN 10_1101-2021_01_08_425967 150 35 can can MD 10_1101-2021_01_08_425967 150 36 be be VB 10_1101-2021_01_08_425967 150 37 acquired acquire VBN 10_1101-2021_01_08_425967 150 38 . . . 10_1101-2021_01_08_425967 151 1 We -PRON- PRP 10_1101-2021_01_08_425967 151 2 concluded conclude VBD 10_1101-2021_01_08_425967 151 3 that that IN 10_1101-2021_01_08_425967 151 4 the the DT 10_1101-2021_01_08_425967 151 5 clustered clustered JJ 10_1101-2021_01_08_425967 151 6 sets set NNS 10_1101-2021_01_08_425967 151 7 of of IN 10_1101-2021_01_08_425967 151 8 biologic biologic JJ 10_1101-2021_01_08_425967 151 9 data datum NNS 10_1101-2021_01_08_425967 151 10 have have VBP 10_1101-2021_01_08_425967 151 11 a a DT 10_1101-2021_01_08_425967 151 12 high high JJ 10_1101-2021_01_08_425967 151 13 measure measure NN 10_1101-2021_01_08_425967 151 14 of of IN 10_1101-2021_01_08_425967 151 15 noise noise NN 10_1101-2021_01_08_425967 151 16 , , , 10_1101-2021_01_08_425967 151 17 despite despite IN 10_1101-2021_01_08_425967 151 18 looking look VBG 10_1101-2021_01_08_425967 151 19 well well RB 10_1101-2021_01_08_425967 151 20 grouped group VBN 10_1101-2021_01_08_425967 151 21 . . . 10_1101-2021_01_08_425967 152 1 We -PRON- PRP 10_1101-2021_01_08_425967 152 2 proved prove VBD 10_1101-2021_01_08_425967 152 3 what what WP 10_1101-2021_01_08_425967 152 4 a a DT 10_1101-2021_01_08_425967 152 5 minimum minimum JJ 10_1101-2021_01_08_425967 152 6 number number NN 10_1101-2021_01_08_425967 152 7 of of IN 10_1101-2021_01_08_425967 152 8 classifications classification NNS 10_1101-2021_01_08_425967 152 9 should should MD 10_1101-2021_01_08_425967 152 10 be be VB 10_1101-2021_01_08_425967 152 11 considered consider VBN 10_1101-2021_01_08_425967 152 12 in in IN 10_1101-2021_01_08_425967 152 13 this this DT 10_1101-2021_01_08_425967 152 14 sort sort NN 10_1101-2021_01_08_425967 152 15 of of IN 10_1101-2021_01_08_425967 152 16 clustering cluster VBG 10_1101-2021_01_08_425967 152 17 analysis analysis NN 10_1101-2021_01_08_425967 152 18 to to TO 10_1101-2021_01_08_425967 152 19 have have VB 10_1101-2021_01_08_425967 152 20 a a DT 10_1101-2021_01_08_425967 152 21 significant significant JJ 10_1101-2021_01_08_425967 152 22 reduction reduction NN 10_1101-2021_01_08_425967 152 23 of of IN 10_1101-2021_01_08_425967 152 24 noise noise NN 10_1101-2021_01_08_425967 152 25 . . . 10_1101-2021_01_08_425967 153 1 On on IN 10_1101-2021_01_08_425967 153 2 the the DT 10_1101-2021_01_08_425967 153 3 other other JJ 10_1101-2021_01_08_425967 153 4 hand hand NN 10_1101-2021_01_08_425967 153 5 , , , 10_1101-2021_01_08_425967 153 6 we -PRON- PRP 10_1101-2021_01_08_425967 153 7 permuted permute VBD 10_1101-2021_01_08_425967 153 8 the the DT 10_1101-2021_01_08_425967 153 9 labels label NNS 10_1101-2021_01_08_425967 153 10 of of IN 10_1101-2021_01_08_425967 153 11 the the DT 10_1101-2021_01_08_425967 153 12 associated associate VBN 10_1101-2021_01_08_425967 153 13 classes class NNS 10_1101-2021_01_08_425967 153 14 and and CC 10_1101-2021_01_08_425967 153 15 concluded conclude VBD 10_1101-2021_01_08_425967 153 16 that that IN 10_1101-2021_01_08_425967 153 17 the the DT 10_1101-2021_01_08_425967 153 18 effect effect NN 10_1101-2021_01_08_425967 153 19 is be VBZ 10_1101-2021_01_08_425967 153 20 negligible negligible JJ 10_1101-2021_01_08_425967 153 21 . . . 10_1101-2021_01_08_425967 154 1 We -PRON- PRP 10_1101-2021_01_08_425967 154 2 proved prove VBD 10_1101-2021_01_08_425967 154 3 that that IN 10_1101-2021_01_08_425967 154 4 randomness randomness NN 10_1101-2021_01_08_425967 154 5 still still RB 10_1101-2021_01_08_425967 154 6 plays play VBZ 10_1101-2021_01_08_425967 154 7 an an DT 10_1101-2021_01_08_425967 154 8 important important JJ 10_1101-2021_01_08_425967 154 9 role role NN 10_1101-2021_01_08_425967 154 10 by by IN 10_1101-2021_01_08_425967 154 11 biasing bias VBG 10_1101-2021_01_08_425967 154 12 the the DT 10_1101-2021_01_08_425967 154 13 results result NNS 10_1101-2021_01_08_425967 154 14 , , , 10_1101-2021_01_08_425967 154 15 though though IN 10_1101-2021_01_08_425967 154 16 it -PRON- PRP 10_1101-2021_01_08_425967 154 17 may may MD 10_1101-2021_01_08_425967 154 18 not not RB 10_1101-2021_01_08_425967 154 19 be be VB 10_1101-2021_01_08_425967 154 20 evident evident JJ 10_1101-2021_01_08_425967 154 21 through through IN 10_1101-2021_01_08_425967 154 22 visual visual JJ 10_1101-2021_01_08_425967 154 23 inspection inspection NN 10_1101-2021_01_08_425967 154 24 . . . 10_1101-2021_01_08_425967 155 1 The the DT 10_1101-2021_01_08_425967 155 2 PQA PQA NNP 10_1101-2021_01_08_425967 155 3 could could MD 10_1101-2021_01_08_425967 155 4 be be VB 10_1101-2021_01_08_425967 155 5 used use VBN 10_1101-2021_01_08_425967 155 6 as as IN 10_1101-2021_01_08_425967 155 7 a a DT 10_1101-2021_01_08_425967 155 8 benchmark benchmark NN 10_1101-2021_01_08_425967 155 9 to to TO 10_1101-2021_01_08_425967 155 10 test test VB 10_1101-2021_01_08_425967 155 11 what what WP 10_1101-2021_01_08_425967 155 12 clustering cluster VBG 10_1101-2021_01_08_425967 155 13 algorithm algorithm NNP 10_1101-2021_01_08_425967 155 14 should should MD 10_1101-2021_01_08_425967 155 15 be be VB 10_1101-2021_01_08_425967 155 16 appropriate appropriate JJ 10_1101-2021_01_08_425967 155 17 for for IN 10_1101-2021_01_08_425967 155 18 the the DT 10_1101-2021_01_08_425967 155 19 analyzed analyze VBN 10_1101-2021_01_08_425967 155 20 dataset dataset NN 10_1101-2021_01_08_425967 155 21 by by IN 10_1101-2021_01_08_425967 155 22 minimizing minimize VBG 10_1101-2021_01_08_425967 155 23 the the DT 10_1101-2021_01_08_425967 155 24 noise noise NN 10_1101-2021_01_08_425967 155 25 proportion proportion NN 10_1101-2021_01_08_425967 155 26 and and CC 10_1101-2021_01_08_425967 155 27 to to TO 10_1101-2021_01_08_425967 155 28 guide guide VB 10_1101-2021_01_08_425967 155 29 omics omic NNS 10_1101-2021_01_08_425967 155 30 experimental experimental JJ 10_1101-2021_01_08_425967 155 31 designs design NNS 10_1101-2021_01_08_425967 155 32 . . . 10_1101-2021_01_08_425967 156 1 Nevertheless nevertheless RB 10_1101-2021_01_08_425967 156 2 , , , 10_1101-2021_01_08_425967 156 3 a a DT 10_1101-2021_01_08_425967 156 4 word word NN 10_1101-2021_01_08_425967 156 5 of of IN 10_1101-2021_01_08_425967 156 6 caution caution NN 10_1101-2021_01_08_425967 156 7 , , , 10_1101-2021_01_08_425967 156 8 the the DT 10_1101-2021_01_08_425967 156 9 PQA PQA NNP 10_1101-2021_01_08_425967 156 10 score score NN 10_1101-2021_01_08_425967 156 11 alone alone RB 10_1101-2021_01_08_425967 156 12 can can MD 10_1101-2021_01_08_425967 156 13 be be VB 10_1101-2021_01_08_425967 156 14 subject subject JJ 10_1101-2021_01_08_425967 156 15 to to IN 10_1101-2021_01_08_425967 156 16 subjectivity subjectivity NN 10_1101-2021_01_08_425967 156 17 if if IN 10_1101-2021_01_08_425967 156 18 not not RB 10_1101-2021_01_08_425967 156 19 used use VBN 10_1101-2021_01_08_425967 156 20 properly properly RB 10_1101-2021_01_08_425967 156 21 since since IN 10_1101-2021_01_08_425967 156 22 it -PRON- PRP 10_1101-2021_01_08_425967 156 23 depended depend VBD 10_1101-2021_01_08_425967 156 24 on on IN 10_1101-2021_01_08_425967 156 25 the the DT 10_1101-2021_01_08_425967 156 26 characteristics characteristic NNS 10_1101-2021_01_08_425967 156 27 of of IN 10_1101-2021_01_08_425967 156 28 the the DT 10_1101-2021_01_08_425967 156 29 analyzed analyze VBN 10_1101-2021_01_08_425967 156 30 data datum NNS 10_1101-2021_01_08_425967 156 31 . . . 10_1101-2021_01_08_425967 157 1 Thus thus RB 10_1101-2021_01_08_425967 157 2 , , , 10_1101-2021_01_08_425967 157 3 the the DT 10_1101-2021_01_08_425967 157 4 PQA PQA NNP 10_1101-2021_01_08_425967 157 5 score score NN 10_1101-2021_01_08_425967 157 6 is be VBZ 10_1101-2021_01_08_425967 157 7 thought think VBN 10_1101-2021_01_08_425967 157 8 to to TO 10_1101-2021_01_08_425967 157 9 be be VB 10_1101-2021_01_08_425967 157 10 considered consider VBN 10_1101-2021_01_08_425967 157 11 as as IN 10_1101-2021_01_08_425967 157 12 a a DT 10_1101-2021_01_08_425967 157 13 quantification quantification NN 10_1101-2021_01_08_425967 157 14 of of IN 10_1101-2021_01_08_425967 157 15 noise noise NN 10_1101-2021_01_08_425967 157 16 in in IN 10_1101-2021_01_08_425967 157 17 clustered cluster VBN 10_1101-2021_01_08_425967 157 18 data datum NNS 10_1101-2021_01_08_425967 157 19 and and CC 10_1101-2021_01_08_425967 157 20 should should MD 10_1101-2021_01_08_425967 157 21 be be VB 10_1101-2021_01_08_425967 157 22 used use VBN 10_1101-2021_01_08_425967 157 23 with with IN 10_1101-2021_01_08_425967 157 24 discretion discretion NN 10_1101-2021_01_08_425967 157 25 . . . 10_1101-2021_01_08_425967 158 1 Author author NN 10_1101-2021_01_08_425967 158 2 Contributions Contributions NNP 10_1101-2021_01_08_425967 158 3 : : : 10_1101-2021_01_08_425967 158 4 Conceptualization Conceptualization NNP 10_1101-2021_01_08_425967 158 5 , , , 10_1101-2021_01_08_425967 158 6 J.A.F.G. J.A.F.G. NNP 10_1101-2021_01_08_425967 159 1 ; ; : 10_1101-2021_01_08_425967 159 2 methodology methodology NN 10_1101-2021_01_08_425967 159 3 , , , 10_1101-2021_01_08_425967 159 4 J.A.F.G. J.A.F.G. NNP 10_1101-2021_01_08_425967 160 1 ; ; : 10_1101-2021_01_08_425967 160 2 software software NN 10_1101-2021_01_08_425967 160 3 , , , 10_1101-2021_01_08_425967 160 4 D.A.C.H. D.A.C.H. NNP 10_1101-2021_01_08_425967 160 5 , , , 10_1101-2021_01_08_425967 160 6 V.E.N.C. V.E.N.C. NNP 10_1101-2021_01_08_425967 160 7 , , , 10_1101-2021_01_08_425967 160 8 and and CC 10_1101-2021_01_08_425967 160 9 J.A.F.G. J.A.F.G. NNP 10_1101-2021_01_08_425967 161 1 ; ; : 10_1101-2021_01_08_425967 161 2 validation validation NN 10_1101-2021_01_08_425967 161 3 , , , 10_1101-2021_01_08_425967 161 4 D.A.C.H. D.A.C.H. NNP 10_1101-2021_01_08_425967 161 5 , , , 10_1101-2021_01_08_425967 161 6 V.E.N.C. V.E.N.C. NNP 10_1101-2021_01_08_425967 161 7 , , , 10_1101-2021_01_08_425967 161 8 and and CC 10_1101-2021_01_08_425967 161 9 J.A.F.G. J.A.F.G. NNP 10_1101-2021_01_08_425967 162 1 ; ; : 10_1101-2021_01_08_425967 162 2 formal formal JJ 10_1101-2021_01_08_425967 162 3 analysis analysis NN 10_1101-2021_01_08_425967 162 4 , , , 10_1101-2021_01_08_425967 162 5 D.A.C.H. D.A.C.H. NNP 10_1101-2021_01_08_425967 162 6 , , , 10_1101-2021_01_08_425967 162 7 V.E.N.C. V.E.N.C. NNP 10_1101-2021_01_08_425967 162 8 , , , 10_1101-2021_01_08_425967 162 9 and and CC 10_1101-2021_01_08_425967 162 10 J.A.F.G. J.A.F.G. NNP 10_1101-2021_01_08_425967 163 1 ; ; : 10_1101-2021_01_08_425967 163 2 investigation investigation NN 10_1101-2021_01_08_425967 163 3 , , , 10_1101-2021_01_08_425967 163 4 D.A.C.H. D.A.C.H. NNP 10_1101-2021_01_08_425967 163 5 , , , 10_1101-2021_01_08_425967 163 6 V.E.N.C. V.E.N.C. NNP 10_1101-2021_01_08_425967 163 7 , , , 10_1101-2021_01_08_425967 163 8 J.R.L.B. J.R.L.B. NNP 10_1101-2021_01_08_425967 163 9 , , , 10_1101-2021_01_08_425967 163 10 and and CC 10_1101-2021_01_08_425967 163 11 J.A.F.G. J.A.F.G. NNP 10_1101-2021_01_08_425967 164 1 ; ; : 10_1101-2021_01_08_425967 164 2 resources resource NNS 10_1101-2021_01_08_425967 164 3 , , , 10_1101-2021_01_08_425967 164 4 J.A.F.G. J.A.F.G. NNP 10_1101-2021_01_08_425967 165 1 ; ; : 10_1101-2021_01_08_425967 165 2 data datum NNS 10_1101-2021_01_08_425967 165 3 curation curation NN 10_1101-2021_01_08_425967 165 4 , , , 10_1101-2021_01_08_425967 165 5 D.A.C.H. D.A.C.H. NNP 10_1101-2021_01_08_425967 165 6 , , , 10_1101-2021_01_08_425967 165 7 V.E.N.C. V.E.N.C. NNP 10_1101-2021_01_08_425967 165 8 , , , 10_1101-2021_01_08_425967 165 9 and and CC 10_1101-2021_01_08_425967 165 10 J.E.L.B. J.E.L.B. NNP 10_1101-2021_01_08_425967 166 1 ; ; : 10_1101-2021_01_08_425967 166 2 writing writing NN 10_1101-2021_01_08_425967 166 3 — — : 10_1101-2021_01_08_425967 166 4 original original JJ 10_1101-2021_01_08_425967 166 5 draft draft NN 10_1101-2021_01_08_425967 166 6 preparation preparation NN 10_1101-2021_01_08_425967 166 7 , , , 10_1101-2021_01_08_425967 166 8 D.A.C.H. D.A.C.H. NNP 10_1101-2021_01_08_425967 166 9 , , , 10_1101-2021_01_08_425967 166 10 V.E.N.C. V.E.N.C. NNP 10_1101-2021_01_08_425967 166 11 , , , 10_1101-2021_01_08_425967 166 12 J.E.L.B. J.E.L.B. NNP 10_1101-2021_01_08_425967 166 13 , , , 10_1101-2021_01_08_425967 166 14 and and CC 10_1101-2021_01_08_425967 166 15 J.A.F.G. J.A.F.G. NNP 10_1101-2021_01_08_425967 167 1 ; ; : 10_1101-2021_01_08_425967 167 2 writing writing NN 10_1101-2021_01_08_425967 167 3 — — : 10_1101-2021_01_08_425967 167 4 review review NN 10_1101-2021_01_08_425967 167 5 and and CC 10_1101-2021_01_08_425967 167 6 editing editing NN 10_1101-2021_01_08_425967 167 7 , , , 10_1101-2021_01_08_425967 167 8 D.A.C.H. D.A.C.H. NNP 10_1101-2021_01_08_425967 167 9 , , , 10_1101-2021_01_08_425967 167 10 V.E.N.C. V.E.N.C. NNP 10_1101-2021_01_08_425967 167 11 , , , 10_1101-2021_01_08_425967 167 12 and and CC 10_1101-2021_01_08_425967 167 13 J.A.F.G. J.A.F.G. NNP 10_1101-2021_01_08_425967 168 1 ; ; : 10_1101-2021_01_08_425967 168 2 visualization visualization NN 10_1101-2021_01_08_425967 168 3 , , , 10_1101-2021_01_08_425967 168 4 D.A.C.H. D.A.C.H. NNP 10_1101-2021_01_08_425967 168 5 , , , 10_1101-2021_01_08_425967 168 6 V.E.N.C. V.E.N.C. NNP 10_1101-2021_01_08_425967 168 7 , , , 10_1101-2021_01_08_425967 168 8 J.E.L.B. J.E.L.B. NNP 10_1101-2021_01_08_425967 168 9 , , , 10_1101-2021_01_08_425967 168 10 and and CC 10_1101-2021_01_08_425967 168 11 J.A.F.G. J.A.F.G. NNP 10_1101-2021_01_08_425967 169 1 ; ; : 10_1101-2021_01_08_425967 169 2 supervision supervision NN 10_1101-2021_01_08_425967 169 3 , , , 10_1101-2021_01_08_425967 169 4 J.A.F.G. J.A.F.G. NNP 10_1101-2021_01_08_425967 170 1 ; ; : 10_1101-2021_01_08_425967 170 2 project project NN 10_1101-2021_01_08_425967 170 3 administration administration NNP 10_1101-2021_01_08_425967 170 4 , , , 10_1101-2021_01_08_425967 170 5 J.A.F.G. J.A.F.G. NNP 10_1101-2021_01_08_425967 171 1 ; ; : 10_1101-2021_01_08_425967 171 2 funding funding NN 10_1101-2021_01_08_425967 171 3 acquisition acquisition NN 10_1101-2021_01_08_425967 171 4 , , , 10_1101-2021_01_08_425967 171 5 J.A.F.G. J.A.F.G. NNP 10_1101-2021_01_08_425967 172 1 All all DT 10_1101-2021_01_08_425967 172 2 authors author NNS 10_1101-2021_01_08_425967 172 3 have have VBP 10_1101-2021_01_08_425967 172 4 read read VBN 10_1101-2021_01_08_425967 172 5 and and CC 10_1101-2021_01_08_425967 172 6 agreed agree VBD 10_1101-2021_01_08_425967 172 7 to to IN 10_1101-2021_01_08_425967 172 8 the the DT 10_1101-2021_01_08_425967 172 9 published publish VBN 10_1101-2021_01_08_425967 172 10 version version NN 10_1101-2021_01_08_425967 172 11 of of IN 10_1101-2021_01_08_425967 172 12 the the DT 10_1101-2021_01_08_425967 172 13 manuscript manuscript NN 10_1101-2021_01_08_425967 172 14 . . . 10_1101-2021_01_08_425967 173 1 .CC .CC NFP 10_1101-2021_01_08_425967 173 2 - - : 10_1101-2021_01_08_425967 173 3 BY by IN 10_1101-2021_01_08_425967 173 4 4.0 4.0 CD 10_1101-2021_01_08_425967 173 5 International international JJ 10_1101-2021_01_08_425967 173 6 licensemade licensemade NN 10_1101-2021_01_08_425967 173 7 available available JJ 10_1101-2021_01_08_425967 173 8 under under IN 10_1101-2021_01_08_425967 173 9 a a DT 10_1101-2021_01_08_425967 173 10 ( ( -LRB- 10_1101-2021_01_08_425967 173 11 which which WDT 10_1101-2021_01_08_425967 173 12 was be VBD 10_1101-2021_01_08_425967 173 13 not not RB 10_1101-2021_01_08_425967 173 14 certified certify VBN 10_1101-2021_01_08_425967 173 15 by by IN 10_1101-2021_01_08_425967 173 16 peer peer NN 10_1101-2021_01_08_425967 173 17 review review NN 10_1101-2021_01_08_425967 173 18 ) ) -RRB- 10_1101-2021_01_08_425967 173 19 is be VBZ 10_1101-2021_01_08_425967 173 20 the the DT 10_1101-2021_01_08_425967 173 21 author author NN 10_1101-2021_01_08_425967 173 22 / / SYM 10_1101-2021_01_08_425967 173 23 funder funder NN 10_1101-2021_01_08_425967 173 24 , , , 10_1101-2021_01_08_425967 173 25 who who WP 10_1101-2021_01_08_425967 173 26 has have VBZ 10_1101-2021_01_08_425967 173 27 granted grant VBN 10_1101-2021_01_08_425967 173 28 bioRxiv biorxiv IN 10_1101-2021_01_08_425967 173 29 a a DT 10_1101-2021_01_08_425967 173 30 license license NN 10_1101-2021_01_08_425967 173 31 to to TO 10_1101-2021_01_08_425967 173 32 display display VB 10_1101-2021_01_08_425967 173 33 the the DT 10_1101-2021_01_08_425967 173 34 preprint preprint NN 10_1101-2021_01_08_425967 173 35 in in IN 10_1101-2021_01_08_425967 173 36 perpetuity perpetuity NN 10_1101-2021_01_08_425967 173 37 . . . 10_1101-2021_01_08_425967 174 1 It -PRON- PRP 10_1101-2021_01_08_425967 174 2 is be VBZ 10_1101-2021_01_08_425967 174 3 The the DT 10_1101-2021_01_08_425967 174 4 copyright copyright NN 10_1101-2021_01_08_425967 174 5 holder holder NN 10_1101-2021_01_08_425967 174 6 for for IN 10_1101-2021_01_08_425967 174 7 this this DT 10_1101-2021_01_08_425967 174 8 preprintthis preprintthis NN 10_1101-2021_01_08_425967 174 9 version version NN 10_1101-2021_01_08_425967 174 10 posted post VBD 10_1101-2021_01_08_425967 174 11 January January NNP 10_1101-2021_01_08_425967 174 12 9 9 CD 10_1101-2021_01_08_425967 174 13 , , , 10_1101-2021_01_08_425967 174 14 2021 2021 CD 10_1101-2021_01_08_425967 174 15 . . . 10_1101-2021_01_08_425967 174 16 ; ; : 10_1101-2021_01_08_425967 174 17 https://doi.org/10.1101/2021.01.08.425967doi https://doi.org/10.1101/2021.01.08.425967doi ADD 10_1101-2021_01_08_425967 174 18 : : : 10_1101-2021_01_08_425967 174 19 bioRxiv biorxiv VB 10_1101-2021_01_08_425967 174 20 preprint preprint NN 10_1101-2021_01_08_425967 174 21 https://doi.org/10.1101/2021.01.08.425967 https://doi.org/10.1101/2021.01.08.425967 NN 10_1101-2021_01_08_425967 174 22 http://creativecommons.org/licenses/by/4.0/ http://creativecommons.org/licenses/by/4.0/ ADD 10_1101-2021_01_08_425967 174 23 Funding funding NN 10_1101-2021_01_08_425967 174 24 : : : 10_1101-2021_01_08_425967 174 25 This this DT 10_1101-2021_01_08_425967 174 26 work work NN 10_1101-2021_01_08_425967 174 27 was be VBD 10_1101-2021_01_08_425967 174 28 supported support VBN 10_1101-2021_01_08_425967 174 29 by by IN 10_1101-2021_01_08_425967 174 30 the the DT 10_1101-2021_01_08_425967 174 31 Programa Programa NNP 10_1101-2021_01_08_425967 174 32 de de IN 10_1101-2021_01_08_425967 174 33 Apoyo Apoyo NNP 10_1101-2021_01_08_425967 174 34 a a DT 10_1101-2021_01_08_425967 174 35 Proyectos Proyectos NNP 10_1101-2021_01_08_425967 174 36 de de IN 10_1101-2021_01_08_425967 174 37 Investigación investigación NN 10_1101-2021_01_08_425967 174 38 e e NN 10_1101-2021_01_08_425967 174 39 Innovación Innovación NNP 10_1101-2021_01_08_425967 174 40 Tecnológica Tecnológica NNP 10_1101-2021_01_08_425967 174 41 ( ( -LRB- 10_1101-2021_01_08_425967 174 42 PAPIIT PAPIIT NNP 10_1101-2021_01_08_425967 174 43 - - HYPH 10_1101-2021_01_08_425967 174 44 UNAM UNAM NNP 10_1101-2021_01_08_425967 174 45 ) ) -RRB- 10_1101-2021_01_08_425967 174 46 [ [ -LRB- 10_1101-2021_01_08_425967 174 47 IN205918 in205918 NN 10_1101-2021_01_08_425967 174 48 to to IN 10_1101-2021_01_08_425967 174 49 J.A.F.G. J.A.F.G. NNP 10_1101-2021_01_08_425967 174 50 ] ] -RRB- 10_1101-2021_01_08_425967 174 51 . . . 10_1101-2021_01_08_425967 175 1 Conflicts conflict NNS 10_1101-2021_01_08_425967 175 2 of of IN 10_1101-2021_01_08_425967 175 3 Interest interest NN 10_1101-2021_01_08_425967 175 4 : : : 10_1101-2021_01_08_425967 175 5 The the DT 10_1101-2021_01_08_425967 175 6 authors author NNS 10_1101-2021_01_08_425967 175 7 declare declare VBP 10_1101-2021_01_08_425967 175 8 no no DT 10_1101-2021_01_08_425967 175 9 conflict conflict NN 10_1101-2021_01_08_425967 175 10 of of IN 10_1101-2021_01_08_425967 175 11 interest interest NN 10_1101-2021_01_08_425967 175 12 . . . 10_1101-2021_01_08_425967 176 1 References reference NNS 10_1101-2021_01_08_425967 176 2 1 1 CD 10_1101-2021_01_08_425967 176 3 . . . 10_1101-2021_01_08_425967 177 1 Kang Kang NNP 10_1101-2021_01_08_425967 177 2 , , , 10_1101-2021_01_08_425967 177 3 S. S. NNP 10_1101-2021_01_08_425967 177 4 , , , 10_1101-2021_01_08_425967 177 5 Kim Kim NNP 10_1101-2021_01_08_425967 177 6 , , , 10_1101-2021_01_08_425967 177 7 B. B. NNP 10_1101-2021_01_08_425967 177 8 , , , 10_1101-2021_01_08_425967 177 9 Park Park NNP 10_1101-2021_01_08_425967 177 10 , , , 10_1101-2021_01_08_425967 177 11 S.-B. S.-B. NNP 10_1101-2021_01_08_425967 177 12 , , , 10_1101-2021_01_08_425967 177 13 et et NNP 10_1101-2021_01_08_425967 177 14 al al NNP 10_1101-2021_01_08_425967 177 15 . . . 10_1101-2021_01_08_425967 178 1 2013 2013 CD 10_1101-2021_01_08_425967 178 2 . . . 10_1101-2021_01_08_425967 179 1 Stage stage NN 10_1101-2021_01_08_425967 179 2 - - HYPH 10_1101-2021_01_08_425967 179 3 specific specific JJ 10_1101-2021_01_08_425967 179 4 methylome methylome JJ 10_1101-2021_01_08_425967 179 5 screen screen NN 10_1101-2021_01_08_425967 179 6 identifies identifie NNS 10_1101-2021_01_08_425967 179 7 that that WDT 10_1101-2021_01_08_425967 179 8 NEFL NEFL NNP 10_1101-2021_01_08_425967 179 9 is be VBZ 10_1101-2021_01_08_425967 179 10 downregulated downregulate VBN 10_1101-2021_01_08_425967 179 11 by by IN 10_1101-2021_01_08_425967 179 12 promoter promoter NN 10_1101-2021_01_08_425967 179 13 hypermethylation hypermethylation NN 10_1101-2021_01_08_425967 179 14 in in IN 10_1101-2021_01_08_425967 179 15 breast breast NN 10_1101-2021_01_08_425967 179 16 cancer cancer NN 10_1101-2021_01_08_425967 179 17 . . . 10_1101-2021_01_08_425967 180 1 International International NNP 10_1101-2021_01_08_425967 180 2 Journal Journal NNP 10_1101-2021_01_08_425967 180 3 of of IN 10_1101-2021_01_08_425967 180 4 Oncology Oncology NNP 10_1101-2021_01_08_425967 180 5 43(5 43(5 CD 10_1101-2021_01_08_425967 180 6 ) ) -RRB- 10_1101-2021_01_08_425967 180 7 , , , 10_1101-2021_01_08_425967 180 8 pp pp NNP 10_1101-2021_01_08_425967 180 9 . . . 10_1101-2021_01_08_425967 181 1 1659–1665 1659–1665 CD 10_1101-2021_01_08_425967 181 2 , , , 10_1101-2021_01_08_425967 181 3 doi:10.3892 doi:10.3892 NNP 10_1101-2021_01_08_425967 181 4 / / SYM 10_1101-2021_01_08_425967 181 5 ijo.2013.2094 ijo.2013.2094 NNP 10_1101-2021_01_08_425967 181 6 . . . 10_1101-2021_01_08_425967 182 1 2 2 LS 10_1101-2021_01_08_425967 182 2 . . . 10_1101-2021_01_08_425967 183 1 Kiselev Kiselev NNP 10_1101-2021_01_08_425967 183 2 , , , 10_1101-2021_01_08_425967 183 3 V. V. NNP 10_1101-2021_01_08_425967 183 4 Y. Y. NNP 10_1101-2021_01_08_425967 183 5 , , , 10_1101-2021_01_08_425967 183 6 Andrews Andrews NNP 10_1101-2021_01_08_425967 183 7 , , , 10_1101-2021_01_08_425967 183 8 T. T. NNP 10_1101-2021_01_08_425967 183 9 S. S. NNP 10_1101-2021_01_08_425967 183 10 , , , 10_1101-2021_01_08_425967 183 11 & & CC 10_1101-2021_01_08_425967 183 12 Hemberg Hemberg NNP 10_1101-2021_01_08_425967 183 13 , , , 10_1101-2021_01_08_425967 183 14 M. M. NNP 10_1101-2021_01_08_425967 183 15 ( ( -LRB- 10_1101-2021_01_08_425967 183 16 2019 2019 CD 10_1101-2021_01_08_425967 183 17 ) ) -RRB- 10_1101-2021_01_08_425967 183 18 . . . 10_1101-2021_01_08_425967 184 1 Challenges challenge NNS 10_1101-2021_01_08_425967 184 2 in in IN 10_1101-2021_01_08_425967 184 3 unsupervised unsupervise VBN 10_1101-2021_01_08_425967 184 4 clustering clustering NN 10_1101-2021_01_08_425967 184 5 of of IN 10_1101-2021_01_08_425967 184 6 single single JJ 10_1101-2021_01_08_425967 184 7 - - HYPH 10_1101-2021_01_08_425967 184 8 cell cell NN 10_1101-2021_01_08_425967 184 9 RNA RNA NNP 10_1101-2021_01_08_425967 184 10 - - HYPH 10_1101-2021_01_08_425967 184 11 seq seq NN 10_1101-2021_01_08_425967 184 12 data datum NNS 10_1101-2021_01_08_425967 184 13 . . . 10_1101-2021_01_08_425967 185 1 Nature Nature NNP 10_1101-2021_01_08_425967 185 2 Reviews Reviews NNPS 10_1101-2021_01_08_425967 185 3 Genetics Genetics NNP 10_1101-2021_01_08_425967 185 4 , , , 10_1101-2021_01_08_425967 185 5 20(5 20(5 CD 10_1101-2021_01_08_425967 185 6 ) ) -RRB- 10_1101-2021_01_08_425967 185 7 , , , 10_1101-2021_01_08_425967 185 8 273 273 CD 10_1101-2021_01_08_425967 185 9 - - SYM 10_1101-2021_01_08_425967 185 10 282 282 CD 10_1101-2021_01_08_425967 185 11 , , , 10_1101-2021_01_08_425967 185 12 doi:10.1038 doi:10.1038 NNP 10_1101-2021_01_08_425967 185 13 / / SYM 10_1101-2021_01_08_425967 185 14 s41576 s41576 NNP 10_1101-2021_01_08_425967 185 15 - - HYPH 10_1101-2021_01_08_425967 185 16 018 018 CD 10_1101-2021_01_08_425967 185 17 - - HYPH 10_1101-2021_01_08_425967 185 18 0088 0088 CD 10_1101-2021_01_08_425967 185 19 - - SYM 10_1101-2021_01_08_425967 185 20 9 9 CD 10_1101-2021_01_08_425967 185 21 . . . 10_1101-2021_01_08_425967 186 1 3 3 LS 10_1101-2021_01_08_425967 186 2 . . . 10_1101-2021_01_08_425967 187 1 Al Al NNP 10_1101-2021_01_08_425967 187 2 - - HYPH 10_1101-2021_01_08_425967 187 3 Harbi Harbi NNP 10_1101-2021_01_08_425967 187 4 , , , 10_1101-2021_01_08_425967 187 5 S.H. S.H. NNP 10_1101-2021_01_08_425967 188 1 and and CC 10_1101-2021_01_08_425967 188 2 Rayward Rayward NNP 10_1101-2021_01_08_425967 188 3 - - HYPH 10_1101-2021_01_08_425967 188 4 Smith Smith NNP 10_1101-2021_01_08_425967 188 5 , , , 10_1101-2021_01_08_425967 188 6 V.J. V.J. NNP 10_1101-2021_01_08_425967 189 1 2006 2006 CD 10_1101-2021_01_08_425967 189 2 . . . 10_1101-2021_01_08_425967 190 1 Adapting adapt VBG 10_1101-2021_01_08_425967 190 2 k k NNP 10_1101-2021_01_08_425967 190 3 - - HYPH 10_1101-2021_01_08_425967 190 4 means mean NNS 10_1101-2021_01_08_425967 190 5 for for IN 10_1101-2021_01_08_425967 190 6 supervised supervise VBN 10_1101-2021_01_08_425967 190 7 clustering clustering NN 10_1101-2021_01_08_425967 190 8 . . . 10_1101-2021_01_08_425967 191 1 Applied Applied NNP 10_1101-2021_01_08_425967 191 2 Intelligence Intelligence NNP 10_1101-2021_01_08_425967 191 3 24(3 24(3 CD 10_1101-2021_01_08_425967 191 4 ) ) -RRB- 10_1101-2021_01_08_425967 191 5 , , , 10_1101-2021_01_08_425967 191 6 pp pp NNP 10_1101-2021_01_08_425967 191 7 . . . 10_1101-2021_01_08_425967 192 1 219–226 219–226 CD 10_1101-2021_01_08_425967 192 2 , , , 10_1101-2021_01_08_425967 192 3 doi:10.1007 doi:10.1007 NN 10_1101-2021_01_08_425967 192 4 / / SYM 10_1101-2021_01_08_425967 192 5 s10489 s10489 JJ 10_1101-2021_01_08_425967 192 6 - - HYPH 10_1101-2021_01_08_425967 192 7 006 006 CD 10_1101-2021_01_08_425967 192 8 - - HYPH 10_1101-2021_01_08_425967 192 9 8513 8513 CD 10_1101-2021_01_08_425967 192 10 - - SYM 10_1101-2021_01_08_425967 192 11 8 8 CD 10_1101-2021_01_08_425967 192 12 . . . 10_1101-2021_01_08_425967 193 1 4 4 LS 10_1101-2021_01_08_425967 193 2 . . . 10_1101-2021_01_08_425967 194 1 Hassani Hassani NNP 10_1101-2021_01_08_425967 194 2 , , , 10_1101-2021_01_08_425967 194 3 M. M. NNP 10_1101-2021_01_08_425967 194 4 , , , 10_1101-2021_01_08_425967 194 5 & & CC 10_1101-2021_01_08_425967 194 6 Seidl Seidl NNP 10_1101-2021_01_08_425967 194 7 , , , 10_1101-2021_01_08_425967 194 8 T. t. NN 10_1101-2021_01_08_425967 194 9 ( ( -LRB- 10_1101-2021_01_08_425967 194 10 2017 2017 CD 10_1101-2021_01_08_425967 194 11 ) ) -RRB- 10_1101-2021_01_08_425967 194 12 . . . 10_1101-2021_01_08_425967 195 1 Using use VBG 10_1101-2021_01_08_425967 195 2 internal internal JJ 10_1101-2021_01_08_425967 195 3 evaluation evaluation NN 10_1101-2021_01_08_425967 195 4 measures measure NNS 10_1101-2021_01_08_425967 195 5 to to TO 10_1101-2021_01_08_425967 195 6 validate validate VB 10_1101-2021_01_08_425967 195 7 the the DT 10_1101-2021_01_08_425967 195 8 quality quality NN 10_1101-2021_01_08_425967 195 9 of of IN 10_1101-2021_01_08_425967 195 10 diverse diverse JJ 10_1101-2021_01_08_425967 195 11 stream stream NN 10_1101-2021_01_08_425967 195 12 clustering cluster VBG 10_1101-2021_01_08_425967 195 13 algorithms algorithm NNS 10_1101-2021_01_08_425967 195 14 . . . 10_1101-2021_01_08_425967 196 1 Vietnam Vietnam NNP 10_1101-2021_01_08_425967 196 2 Journal Journal NNP 10_1101-2021_01_08_425967 196 3 of of IN 10_1101-2021_01_08_425967 196 4 Computer Computer NNP 10_1101-2021_01_08_425967 196 5 Science Science NNP 10_1101-2021_01_08_425967 196 6 , , , 10_1101-2021_01_08_425967 196 7 4(3 4(3 NNP 10_1101-2021_01_08_425967 196 8 ) ) -RRB- 10_1101-2021_01_08_425967 196 9 , , , 10_1101-2021_01_08_425967 196 10 171 171 CD 10_1101-2021_01_08_425967 196 11 - - SYM 10_1101-2021_01_08_425967 196 12 183 183 CD 10_1101-2021_01_08_425967 196 13 , , , 10_1101-2021_01_08_425967 196 14 doi:10.1007 doi:10.1007 NNP 10_1101-2021_01_08_425967 196 15 / / SYM 10_1101-2021_01_08_425967 196 16 s40595 s40595 NNP 10_1101-2021_01_08_425967 196 17 - - HYPH 10_1101-2021_01_08_425967 196 18 016 016 CD 10_1101-2021_01_08_425967 196 19 - - HYPH 10_1101-2021_01_08_425967 196 20 0086 0086 CD 10_1101-2021_01_08_425967 196 21 - - SYM 10_1101-2021_01_08_425967 196 22 9 9 CD 10_1101-2021_01_08_425967 196 23 . . . 10_1101-2021_01_08_425967 197 1 5 5 CD 10_1101-2021_01_08_425967 197 2 . . . 10_1101-2021_01_08_425967 198 1 Fyfe Fyfe NNP 10_1101-2021_01_08_425967 198 2 , , , 10_1101-2021_01_08_425967 198 3 S. S. NNP 10_1101-2021_01_08_425967 198 4 , , , 10_1101-2021_01_08_425967 198 5 Williams Williams NNP 10_1101-2021_01_08_425967 198 6 , , , 10_1101-2021_01_08_425967 198 7 C. C. NNP 10_1101-2021_01_08_425967 198 8 , , , 10_1101-2021_01_08_425967 198 9 Mason Mason NNP 10_1101-2021_01_08_425967 198 10 , , , 10_1101-2021_01_08_425967 198 11 O.J. O.J. NNP 10_1101-2021_01_08_425967 199 1 and and CC 10_1101-2021_01_08_425967 199 2 Pickup Pickup NNP 10_1101-2021_01_08_425967 199 3 , , , 10_1101-2021_01_08_425967 199 4 G.J. G.J. NNP 10_1101-2021_01_08_425967 200 1 2008 2008 CD 10_1101-2021_01_08_425967 200 2 . . . 10_1101-2021_01_08_425967 201 1 Apophenia Apophenia NNP 10_1101-2021_01_08_425967 201 2 , , , 10_1101-2021_01_08_425967 201 3 theory theory NN 10_1101-2021_01_08_425967 201 4 of of IN 10_1101-2021_01_08_425967 201 5 mind mind NN 10_1101-2021_01_08_425967 201 6 and and CC 10_1101-2021_01_08_425967 201 7 schizotypy schizotypy NN 10_1101-2021_01_08_425967 201 8 : : : 10_1101-2021_01_08_425967 201 9 perceiving perceive VBG 10_1101-2021_01_08_425967 201 10 meaning meaning NN 10_1101-2021_01_08_425967 201 11 and and CC 10_1101-2021_01_08_425967 201 12 intentionality intentionality NN 10_1101-2021_01_08_425967 201 13 in in IN 10_1101-2021_01_08_425967 201 14 randomness randomness NN 10_1101-2021_01_08_425967 201 15 . . . 10_1101-2021_01_08_425967 202 1 Cortex Cortex NNP 10_1101-2021_01_08_425967 202 2 44(10 44(10 CD 10_1101-2021_01_08_425967 202 3 ) ) -RRB- 10_1101-2021_01_08_425967 202 4 , , , 10_1101-2021_01_08_425967 202 5 pp pp NNP 10_1101-2021_01_08_425967 202 6 . . . 10_1101-2021_01_08_425967 203 1 1316–1325 1316–1325 CD 10_1101-2021_01_08_425967 203 2 , , , 10_1101-2021_01_08_425967 203 3 doi:10.1016 doi:10.1016 JJ 10_1101-2021_01_08_425967 203 4 / / SYM 10_1101-2021_01_08_425967 203 5 j.cortex.2007.07.009 j.cortex.2007.07.009 CD 10_1101-2021_01_08_425967 203 6 . . . 10_1101-2021_01_08_425967 204 1 6 6 CD 10_1101-2021_01_08_425967 204 2 . . . 10_1101-2021_01_08_425967 205 1 Getmansky Getmansky NNP 10_1101-2021_01_08_425967 205 2 , , , 10_1101-2021_01_08_425967 205 3 M. M. NNP 10_1101-2021_01_08_425967 205 4 , , , 10_1101-2021_01_08_425967 205 5 Lo Lo NNP 10_1101-2021_01_08_425967 205 6 , , , 10_1101-2021_01_08_425967 205 7 A.W. A.W. NNP 10_1101-2021_01_08_425967 206 1 and and CC 10_1101-2021_01_08_425967 206 2 Makarov Makarov NNP 10_1101-2021_01_08_425967 206 3 , , , 10_1101-2021_01_08_425967 206 4 I. I. NNP 10_1101-2021_01_08_425967 207 1 2004 2004 CD 10_1101-2021_01_08_425967 207 2 . . . 10_1101-2021_01_08_425967 208 1 An an DT 10_1101-2021_01_08_425967 208 2 econometric econometric JJ 10_1101-2021_01_08_425967 208 3 model model NN 10_1101-2021_01_08_425967 208 4 of of IN 10_1101-2021_01_08_425967 208 5 serial serial JJ 10_1101-2021_01_08_425967 208 6 correlation correlation NN 10_1101-2021_01_08_425967 208 7 and and CC 10_1101-2021_01_08_425967 208 8 illiquidity illiquidity NN 10_1101-2021_01_08_425967 208 9 in in IN 10_1101-2021_01_08_425967 208 10 hedge hedge NN 10_1101-2021_01_08_425967 208 11 fund fund NN 10_1101-2021_01_08_425967 208 12 returns return NNS 10_1101-2021_01_08_425967 208 13 . . . 10_1101-2021_01_08_425967 209 1 Journal Journal NNP 10_1101-2021_01_08_425967 209 2 of of IN 10_1101-2021_01_08_425967 209 3 financial financial JJ 10_1101-2021_01_08_425967 209 4 economics economics NNP 10_1101-2021_01_08_425967 209 5 74(3 74(3 NNP 10_1101-2021_01_08_425967 209 6 ) ) -RRB- 10_1101-2021_01_08_425967 209 7 , , , 10_1101-2021_01_08_425967 209 8 pp pp NNP 10_1101-2021_01_08_425967 209 9 . . . 10_1101-2021_01_08_425967 210 1 529–609 529–609 CD 10_1101-2021_01_08_425967 210 2 , , , 10_1101-2021_01_08_425967 210 3 doi:10.1016 doi:10.1016 JJ 10_1101-2021_01_08_425967 210 4 / / SYM 10_1101-2021_01_08_425967 210 5 j.jfineco.2004.04.001 j.jfineco.2004.04.001 NN 10_1101-2021_01_08_425967 210 6 . . . 10_1101-2021_01_08_425967 211 1 7 7 LS 10_1101-2021_01_08_425967 211 2 . . . 10_1101-2021_01_08_425967 212 1 Shen Shen NNP 10_1101-2021_01_08_425967 212 2 , , , 10_1101-2021_01_08_425967 212 3 J. J. NNP 10_1101-2021_01_08_425967 212 4 , , , 10_1101-2021_01_08_425967 212 5 Hu Hu NNP 10_1101-2021_01_08_425967 212 6 , , , 10_1101-2021_01_08_425967 212 7 Q. Q. NNP 10_1101-2021_01_08_425967 212 8 , , , 10_1101-2021_01_08_425967 212 9 Schrauder Schrauder NNP 10_1101-2021_01_08_425967 212 10 , , , 10_1101-2021_01_08_425967 212 11 M. M. NNP 10_1101-2021_01_08_425967 212 12 , , , 10_1101-2021_01_08_425967 212 13 et et NNP 10_1101-2021_01_08_425967 212 14 al al NNP 10_1101-2021_01_08_425967 212 15 . . . 10_1101-2021_01_08_425967 213 1 2014 2014 CD 10_1101-2021_01_08_425967 213 2 . . . 10_1101-2021_01_08_425967 214 1 Circulating circulate VBG 10_1101-2021_01_08_425967 214 2 miR-148b miR-148b NNS 10_1101-2021_01_08_425967 214 3 and and CC 10_1101-2021_01_08_425967 214 4 miR-133a miR-133a NNS 10_1101-2021_01_08_425967 214 5 as as IN 10_1101-2021_01_08_425967 214 6 biomarkers biomarker NNS 10_1101-2021_01_08_425967 214 7 for for IN 10_1101-2021_01_08_425967 214 8 breast breast NN 10_1101-2021_01_08_425967 214 9 cancer cancer NN 10_1101-2021_01_08_425967 214 10 detection detection NN 10_1101-2021_01_08_425967 214 11 . . . 10_1101-2021_01_08_425967 215 1 Oncotarget Oncotarget NNP 10_1101-2021_01_08_425967 215 2 5(14 5(14 NNP 10_1101-2021_01_08_425967 215 3 ) ) -RRB- 10_1101-2021_01_08_425967 215 4 , , , 10_1101-2021_01_08_425967 215 5 pp pp NNP 10_1101-2021_01_08_425967 215 6 . . . 10_1101-2021_01_08_425967 216 1 5284–5294 5284–5294 CD 10_1101-2021_01_08_425967 216 2 , , , 10_1101-2021_01_08_425967 216 3 doi:10.18632 doi:10.18632 NNP 10_1101-2021_01_08_425967 216 4 / / SYM 10_1101-2021_01_08_425967 216 5 oncotarget.2014 oncotarget.2014 NN 10_1101-2021_01_08_425967 216 6 . . . 10_1101-2021_01_08_425967 217 1 8 8 LS 10_1101-2021_01_08_425967 217 2 . . . 10_1101-2021_01_08_425967 218 1 Toyooka Toyooka NNP 10_1101-2021_01_08_425967 218 2 , , , 10_1101-2021_01_08_425967 218 3 S. S. NNP 10_1101-2021_01_08_425967 218 4 , , , 10_1101-2021_01_08_425967 218 5 Toyooka Toyooka NNP 10_1101-2021_01_08_425967 218 6 , , , 10_1101-2021_01_08_425967 218 7 K. K. NNP 10_1101-2021_01_08_425967 218 8 O. O. NNP 10_1101-2021_01_08_425967 218 9 , , , 10_1101-2021_01_08_425967 218 10 Maruyama Maruyama NNP 10_1101-2021_01_08_425967 218 11 , , , 10_1101-2021_01_08_425967 218 12 R. R. NNP 10_1101-2021_01_08_425967 218 13 , , , 10_1101-2021_01_08_425967 218 14 Virmani Virmani NNP 10_1101-2021_01_08_425967 218 15 , , , 10_1101-2021_01_08_425967 218 16 A. A. NNP 10_1101-2021_01_08_425967 218 17 K. K. NNP 10_1101-2021_01_08_425967 218 18 , , , 10_1101-2021_01_08_425967 218 19 Girard Girard NNP 10_1101-2021_01_08_425967 218 20 , , , 10_1101-2021_01_08_425967 218 21 L. L. NNP 10_1101-2021_01_08_425967 218 22 , , , 10_1101-2021_01_08_425967 218 23 Miyajima Miyajima NNP 10_1101-2021_01_08_425967 218 24 , , , 10_1101-2021_01_08_425967 218 25 K. K. NNP 10_1101-2021_01_08_425967 218 26 , , , 10_1101-2021_01_08_425967 218 27 ... ... . 10_1101-2021_01_08_425967 218 28 & & CC 10_1101-2021_01_08_425967 218 29 Brambilla Brambilla NNP 10_1101-2021_01_08_425967 218 30 , , , 10_1101-2021_01_08_425967 218 31 E. E. NNP 10_1101-2021_01_08_425967 218 32 ( ( -LRB- 10_1101-2021_01_08_425967 218 33 2001 2001 CD 10_1101-2021_01_08_425967 218 34 ) ) -RRB- 10_1101-2021_01_08_425967 218 35 . . . 10_1101-2021_01_08_425967 219 1 DNA DNA NNP 10_1101-2021_01_08_425967 219 2 Methylation Methylation NNP 10_1101-2021_01_08_425967 219 3 Profiles Profiles NNPS 10_1101-2021_01_08_425967 219 4 of of IN 10_1101-2021_01_08_425967 219 5 Lung Lung NNP 10_1101-2021_01_08_425967 219 6 Tumors Tumors NNP 10_1101-2021_01_08_425967 219 7 . . . 10_1101-2021_01_08_425967 220 1 Molecular molecular JJ 10_1101-2021_01_08_425967 220 2 cancer cancer NN 10_1101-2021_01_08_425967 220 3 therapeutics therapeutic NNS 10_1101-2021_01_08_425967 220 4 , , , 10_1101-2021_01_08_425967 220 5 1(1 1(1 NNP 10_1101-2021_01_08_425967 220 6 ) ) -RRB- 10_1101-2021_01_08_425967 220 7 , , , 10_1101-2021_01_08_425967 220 8 61 61 CD 10_1101-2021_01_08_425967 220 9 - - SYM 10_1101-2021_01_08_425967 220 10 67 67 CD 10_1101-2021_01_08_425967 220 11 . . . 10_1101-2021_01_08_425967 221 1 9 9 CD 10_1101-2021_01_08_425967 221 2 . . . 10_1101-2021_01_08_425967 222 1 Schieber Schieber NNP 10_1101-2021_01_08_425967 222 2 , , , 10_1101-2021_01_08_425967 222 3 T. t. NN 10_1101-2021_01_08_425967 222 4 A. a. NN 10_1101-2021_01_08_425967 222 5 , , , 10_1101-2021_01_08_425967 222 6 Carpi Carpi NNP 10_1101-2021_01_08_425967 222 7 , , , 10_1101-2021_01_08_425967 222 8 L. L. NNP 10_1101-2021_01_08_425967 222 9 , , , 10_1101-2021_01_08_425967 222 10 Díaz Díaz NNP 10_1101-2021_01_08_425967 222 11 - - HYPH 10_1101-2021_01_08_425967 222 12 Guilera Guilera NNP 10_1101-2021_01_08_425967 222 13 , , , 10_1101-2021_01_08_425967 222 14 A. a. NN 10_1101-2021_01_08_425967 222 15 , , , 10_1101-2021_01_08_425967 222 16 Pardalos Pardalos NNP 10_1101-2021_01_08_425967 222 17 , , , 10_1101-2021_01_08_425967 222 18 P. P. NNP 10_1101-2021_01_08_425967 222 19 M. M. NNP 10_1101-2021_01_08_425967 222 20 , , , 10_1101-2021_01_08_425967 222 21 Masoller Masoller NNP 10_1101-2021_01_08_425967 222 22 , , , 10_1101-2021_01_08_425967 222 23 C. C. NNP 10_1101-2021_01_08_425967 222 24 , , , 10_1101-2021_01_08_425967 222 25 & & CC 10_1101-2021_01_08_425967 222 26 Ravetti Ravetti NNP 10_1101-2021_01_08_425967 222 27 , , , 10_1101-2021_01_08_425967 222 28 M. M. NNP 10_1101-2021_01_08_425967 222 29 G. G. NNP 10_1101-2021_01_08_425967 222 30 ( ( -LRB- 10_1101-2021_01_08_425967 222 31 2017 2017 CD 10_1101-2021_01_08_425967 222 32 ) ) -RRB- 10_1101-2021_01_08_425967 222 33 . . . 10_1101-2021_01_08_425967 223 1 Quantification quantification NN 10_1101-2021_01_08_425967 223 2 of of IN 10_1101-2021_01_08_425967 223 3 network network NN 10_1101-2021_01_08_425967 223 4 structural structural JJ 10_1101-2021_01_08_425967 223 5 dissimilarities dissimilarity NNS 10_1101-2021_01_08_425967 223 6 . . . 10_1101-2021_01_08_425967 224 1 Nature nature NN 10_1101-2021_01_08_425967 224 2 communications communication NNS 10_1101-2021_01_08_425967 224 3 , , , 10_1101-2021_01_08_425967 224 4 8(1 8(1 NNP 10_1101-2021_01_08_425967 224 5 ) ) -RRB- 10_1101-2021_01_08_425967 224 6 , , , 10_1101-2021_01_08_425967 224 7 1 1 CD 10_1101-2021_01_08_425967 224 8 - - SYM 10_1101-2021_01_08_425967 224 9 10 10 CD 10_1101-2021_01_08_425967 224 10 . . . 10_1101-2021_01_08_425967 225 1 10 10 CD 10_1101-2021_01_08_425967 225 2 . . . 10_1101-2021_01_08_425967 226 1 Escorcia Escorcia NNP 10_1101-2021_01_08_425967 226 2 - - HYPH 10_1101-2021_01_08_425967 226 3 Rodríguez Rodríguez NNP 10_1101-2021_01_08_425967 226 4 , , , 10_1101-2021_01_08_425967 226 5 J. J. NNP 10_1101-2021_01_08_425967 226 6 M. M. NNP 10_1101-2021_01_08_425967 226 7 , , , 10_1101-2021_01_08_425967 226 8 Tauch Tauch NNP 10_1101-2021_01_08_425967 226 9 , , , 10_1101-2021_01_08_425967 226 10 A. a. NN 10_1101-2021_01_08_425967 226 11 , , , 10_1101-2021_01_08_425967 226 12 & & CC 10_1101-2021_01_08_425967 226 13 Freyre Freyre NNP 10_1101-2021_01_08_425967 226 14 - - HYPH 10_1101-2021_01_08_425967 226 15 González González NNP 10_1101-2021_01_08_425967 226 16 , , , 10_1101-2021_01_08_425967 226 17 J. J. NNP 10_1101-2021_01_08_425967 227 1 A. A. NNP 10_1101-2021_01_08_425967 228 1 ( ( -LRB- 10_1101-2021_01_08_425967 228 2 2020 2020 CD 10_1101-2021_01_08_425967 228 3 ) ) -RRB- 10_1101-2021_01_08_425967 228 4 . . . 10_1101-2021_01_08_425967 229 1 Abasy Abasy NNP 10_1101-2021_01_08_425967 229 2 Atlas Atlas NNP 10_1101-2021_01_08_425967 229 3 v2 v2 NN 10_1101-2021_01_08_425967 229 4 . . . 10_1101-2021_01_08_425967 230 1 2 2 LS 10_1101-2021_01_08_425967 230 2 : : : 10_1101-2021_01_08_425967 230 3 The the DT 10_1101-2021_01_08_425967 230 4 most most RBS 10_1101-2021_01_08_425967 230 5 comprehensive comprehensive JJ 10_1101-2021_01_08_425967 230 6 and and CC 10_1101-2021_01_08_425967 230 7 up up RB 10_1101-2021_01_08_425967 230 8 - - HYPH 10_1101-2021_01_08_425967 230 9 to to IN 10_1101-2021_01_08_425967 230 10 - - HYPH 10_1101-2021_01_08_425967 230 11 date date NN 10_1101-2021_01_08_425967 230 12 inventory inventory NN 10_1101-2021_01_08_425967 230 13 of of IN 10_1101-2021_01_08_425967 230 14 meta meta RB 10_1101-2021_01_08_425967 230 15 - - HYPH 10_1101-2021_01_08_425967 230 16 curated curate VBN 10_1101-2021_01_08_425967 230 17 , , , 10_1101-2021_01_08_425967 230 18 historical historical JJ 10_1101-2021_01_08_425967 230 19 , , , 10_1101-2021_01_08_425967 230 20 bacterial bacterial JJ 10_1101-2021_01_08_425967 230 21 regulatory regulatory JJ 10_1101-2021_01_08_425967 230 22 networks network NNS 10_1101-2021_01_08_425967 230 23 , , , 10_1101-2021_01_08_425967 230 24 their -PRON- PRP$ 10_1101-2021_01_08_425967 230 25 completeness completeness NN 10_1101-2021_01_08_425967 230 26 and and CC 10_1101-2021_01_08_425967 230 27 system system NN 10_1101-2021_01_08_425967 230 28 - - HYPH 10_1101-2021_01_08_425967 230 29 level level NN 10_1101-2021_01_08_425967 230 30 characterization characterization NN 10_1101-2021_01_08_425967 230 31 . . . 10_1101-2021_01_08_425967 231 1 Computational computational JJ 10_1101-2021_01_08_425967 231 2 and and CC 10_1101-2021_01_08_425967 231 3 Structural Structural NNP 10_1101-2021_01_08_425967 231 4 Biotechnology Biotechnology NNP 10_1101-2021_01_08_425967 231 5 Journal Journal NNP 10_1101-2021_01_08_425967 231 6 , , , 10_1101-2021_01_08_425967 231 7 doi:10.1016 doi:10.1016 JJ 10_1101-2021_01_08_425967 231 8 / / SYM 10_1101-2021_01_08_425967 231 9 j.csbj.2020.05.015 j.csbj.2020.05.015 NNS 10_1101-2021_01_08_425967 231 10 . . . 10_1101-2021_01_08_425967 232 1 11 11 CD 10_1101-2021_01_08_425967 232 2 . . . 10_1101-2021_01_08_425967 233 1 Barabasi Barabasi NNP 10_1101-2021_01_08_425967 233 2 , , , 10_1101-2021_01_08_425967 233 3 A. A. NNP 10_1101-2021_01_08_425967 233 4 L. L. NNP 10_1101-2021_01_08_425967 233 5 , , , 10_1101-2021_01_08_425967 233 6 & & CC 10_1101-2021_01_08_425967 233 7 Oltvai Oltvai NNP 10_1101-2021_01_08_425967 233 8 , , , 10_1101-2021_01_08_425967 233 9 Z. Z. NNP 10_1101-2021_01_08_425967 233 10 N. N. NNP 10_1101-2021_01_08_425967 233 11 ( ( -LRB- 10_1101-2021_01_08_425967 233 12 2004 2004 CD 10_1101-2021_01_08_425967 233 13 ) ) -RRB- 10_1101-2021_01_08_425967 233 14 . . . 10_1101-2021_01_08_425967 234 1 Network network NN 10_1101-2021_01_08_425967 234 2 biology biology NN 10_1101-2021_01_08_425967 234 3 : : : 10_1101-2021_01_08_425967 234 4 understanding understand VBG 10_1101-2021_01_08_425967 234 5 the the DT 10_1101-2021_01_08_425967 234 6 cell cell NN 10_1101-2021_01_08_425967 234 7 's 's POS 10_1101-2021_01_08_425967 234 8 functional functional JJ 10_1101-2021_01_08_425967 234 9 organization organization NN 10_1101-2021_01_08_425967 234 10 . . . 10_1101-2021_01_08_425967 235 1 Nature nature NN 10_1101-2021_01_08_425967 235 2 reviews review NNS 10_1101-2021_01_08_425967 235 3 genetics genetic NNS 10_1101-2021_01_08_425967 235 4 , , , 10_1101-2021_01_08_425967 235 5 5(2 5(2 NNP 10_1101-2021_01_08_425967 235 6 ) ) -RRB- 10_1101-2021_01_08_425967 235 7 , , , 10_1101-2021_01_08_425967 235 8 101 101 CD 10_1101-2021_01_08_425967 235 9 - - SYM 10_1101-2021_01_08_425967 235 10 113 113 CD 10_1101-2021_01_08_425967 235 11 , , , 10_1101-2021_01_08_425967 235 12 doi:10.1038 doi:10.1038 NNP 10_1101-2021_01_08_425967 235 13 / / SYM 10_1101-2021_01_08_425967 235 14 nrg1272 nrg1272 NN 10_1101-2021_01_08_425967 235 15 . . . 10_1101-2021_01_08_425967 236 1 .CC .CC NFP 10_1101-2021_01_08_425967 236 2 - - : 10_1101-2021_01_08_425967 236 3 BY by IN 10_1101-2021_01_08_425967 236 4 4.0 4.0 CD 10_1101-2021_01_08_425967 236 5 International international JJ 10_1101-2021_01_08_425967 236 6 licensemade licensemade NN 10_1101-2021_01_08_425967 236 7 available available JJ 10_1101-2021_01_08_425967 236 8 under under IN 10_1101-2021_01_08_425967 236 9 a a DT 10_1101-2021_01_08_425967 236 10 ( ( -LRB- 10_1101-2021_01_08_425967 236 11 which which WDT 10_1101-2021_01_08_425967 236 12 was be VBD 10_1101-2021_01_08_425967 236 13 not not RB 10_1101-2021_01_08_425967 236 14 certified certify VBN 10_1101-2021_01_08_425967 236 15 by by IN 10_1101-2021_01_08_425967 236 16 peer peer NN 10_1101-2021_01_08_425967 236 17 review review NN 10_1101-2021_01_08_425967 236 18 ) ) -RRB- 10_1101-2021_01_08_425967 236 19 is be VBZ 10_1101-2021_01_08_425967 236 20 the the DT 10_1101-2021_01_08_425967 236 21 author author NN 10_1101-2021_01_08_425967 236 22 / / SYM 10_1101-2021_01_08_425967 236 23 funder funder NN 10_1101-2021_01_08_425967 236 24 , , , 10_1101-2021_01_08_425967 236 25 who who WP 10_1101-2021_01_08_425967 236 26 has have VBZ 10_1101-2021_01_08_425967 236 27 granted grant VBN 10_1101-2021_01_08_425967 236 28 bioRxiv biorxiv IN 10_1101-2021_01_08_425967 236 29 a a DT 10_1101-2021_01_08_425967 236 30 license license NN 10_1101-2021_01_08_425967 236 31 to to TO 10_1101-2021_01_08_425967 236 32 display display VB 10_1101-2021_01_08_425967 236 33 the the DT 10_1101-2021_01_08_425967 236 34 preprint preprint NN 10_1101-2021_01_08_425967 236 35 in in IN 10_1101-2021_01_08_425967 236 36 perpetuity perpetuity NN 10_1101-2021_01_08_425967 236 37 . . . 10_1101-2021_01_08_425967 237 1 It -PRON- PRP 10_1101-2021_01_08_425967 237 2 is be VBZ 10_1101-2021_01_08_425967 237 3 The the DT 10_1101-2021_01_08_425967 237 4 copyright copyright NN 10_1101-2021_01_08_425967 237 5 holder holder NN 10_1101-2021_01_08_425967 237 6 for for IN 10_1101-2021_01_08_425967 237 7 this this DT 10_1101-2021_01_08_425967 237 8 preprintthis preprintthis NN 10_1101-2021_01_08_425967 237 9 version version NN 10_1101-2021_01_08_425967 237 10 posted post VBD 10_1101-2021_01_08_425967 237 11 January January NNP 10_1101-2021_01_08_425967 237 12 9 9 CD 10_1101-2021_01_08_425967 237 13 , , , 10_1101-2021_01_08_425967 237 14 2021 2021 CD 10_1101-2021_01_08_425967 237 15 . . . 10_1101-2021_01_08_425967 237 16 ; ; : 10_1101-2021_01_08_425967 237 17 https://doi.org/10.1101/2021.01.08.425967doi https://doi.org/10.1101/2021.01.08.425967doi ADD 10_1101-2021_01_08_425967 237 18 : : : 10_1101-2021_01_08_425967 237 19 bioRxiv biorxiv VB 10_1101-2021_01_08_425967 237 20 preprint preprint NN 10_1101-2021_01_08_425967 237 21 http://f1000.com/work/bibliography/3408741 http://f1000.com/work/bibliography/3408741 VBZ 10_1101-2021_01_08_425967 237 22 http://f1000.com/work/bibliography/3408741 http://f1000.com/work/bibliography/3408741 VBZ 10_1101-2021_01_08_425967 237 23 http://f1000.com/work/bibliography/3408741 http://f1000.com/work/bibliography/3408741 NNP 10_1101-2021_01_08_425967 237 24 http://f1000.com/work/bibliography/3408741 http://f1000.com/work/bibliography/3408741 NNP 10_1101-2021_01_08_425967 237 25 http://f1000.com/work/bibliography/2985013 http://f1000.com/work/bibliography/2985013 NNP 10_1101-2021_01_08_425967 237 26 http://f1000.com/work/bibliography/2985013 http://f1000.com/work/bibliography/2985013 NNP 10_1101-2021_01_08_425967 237 27 http://f1000.com/work/bibliography/2985013 http://f1000.com/work/bibliography/2985013 NNP 10_1101-2021_01_08_425967 237 28 http://f1000.com/work/bibliography/2985013 http://f1000.com/work/bibliography/2985013 NNP 10_1101-2021_01_08_425967 237 29 http://f1000.com/work/bibliography/2985013 http://f1000.com/work/bibliography/2985013 NNP 10_1101-2021_01_08_425967 237 30 http://f1000.com/work/bibliography/8693887 http://f1000.com/work/bibliography/8693887 NNP 10_1101-2021_01_08_425967 237 31 http://f1000.com/work/bibliography/8693887 http://f1000.com/work/bibliography/8693887 NNP 10_1101-2021_01_08_425967 237 32 http://f1000.com/work/bibliography/8693887 http://f1000.com/work/bibliography/8693887 NNP 10_1101-2021_01_08_425967 237 33 http://f1000.com/work/bibliography/8693887 http://f1000.com/work/bibliography/8693887 NNP 10_1101-2021_01_08_425967 237 34 http://f1000.com/work/bibliography/8561657 http://f1000.com/work/bibliography/8561657 NNP 10_1101-2021_01_08_425967 237 35 http://f1000.com/work/bibliography/8561657 http://f1000.com/work/bibliography/8561657 NNP 10_1101-2021_01_08_425967 237 36 http://f1000.com/work/bibliography/8561657 http://f1000.com/work/bibliography/8561657 NNP 10_1101-2021_01_08_425967 237 37 http://f1000.com/work/bibliography/8561657 http://f1000.com/work/bibliography/8561657 NNP 10_1101-2021_01_08_425967 237 38 https://doi.org/10.1101/2021.01.08.425967 https://doi.org/10.1101/2021.01.08.425967 NNP 10_1101-2021_01_08_425967 237 39 http://creativecommons.org/licenses/by/4.0/ http://creativecommons.org/licenses/by/4.0/ ADD