From e2293f36edc2dd8117ad7647f76d8195c975d3ee Mon Sep 17 00:00:00 2001 From: Julia Klugherz Date: Tue, 12 Nov 2024 10:30:36 -0500 Subject: [PATCH] handle wes/wgs inheritance edge case (#4440) * almost working * updates * or_missing * fix sample tracking logic * f string * another pass * minor things * less code * reuse as much code from _annotate_families_inheritance * rstructure passes inheritance field * fix _family_has_valid_inheritance * fix up test cases * oop * typo * typo 2 * PR comments * comments * extra lines --- .../families/WGS/F000002_2.ht/.README.txt.crc | Bin 12 -> 12 bytes .../families/WGS/F000002_2.ht/README.txt | 2 +- .../.index.crc | Bin .../.metadata.json.gz.crc | Bin .../index | Bin .../metadata.json.gz | Bin .../F000002_2.ht/rows/.metadata.json.gz.crc | Bin 16 -> 16 bytes .../WGS/F000002_2.ht/rows/metadata.json.gz | Bin 627 -> 628 bytes ...0-5efaaf66-a01a-4640-a3e4-aef656269368.crc | Bin 12 -> 0 bytes ...0-d68dd2a3-0a18-42d9-9d62-d4fc646610ac.crc | Bin 0 -> 12 bytes ...art-0-5efaaf66-a01a-4640-a3e4-aef656269368 | Bin 206 -> 0 bytes ...art-0-d68dd2a3-0a18-42d9-9d62-d4fc646610ac | Bin 0 -> 207 bytes hail_search/queries/base.py | 58 ++++++----- hail_search/queries/mito.py | 77 +++++++++++---- hail_search/test_search.py | 40 ++++---- hail_search/test_utils.py | 93 +++++++++++++++--- 16 files changed, 193 insertions(+), 77 deletions(-) rename hail_search/fixtures/GRCh38/SNV_INDEL/families/WGS/F000002_2.ht/index/{part-0-5efaaf66-a01a-4640-a3e4-aef656269368.idx => part-0-d68dd2a3-0a18-42d9-9d62-d4fc646610ac.idx}/.index.crc (100%) rename hail_search/fixtures/GRCh38/SNV_INDEL/families/WGS/F000002_2.ht/index/{part-0-5efaaf66-a01a-4640-a3e4-aef656269368.idx => part-0-d68dd2a3-0a18-42d9-9d62-d4fc646610ac.idx}/.metadata.json.gz.crc (100%) rename hail_search/fixtures/GRCh38/SNV_INDEL/families/WGS/F000002_2.ht/index/{part-0-5efaaf66-a01a-4640-a3e4-aef656269368.idx => part-0-d68dd2a3-0a18-42d9-9d62-d4fc646610ac.idx}/index (100%) rename hail_search/fixtures/GRCh38/SNV_INDEL/families/WGS/F000002_2.ht/index/{part-0-5efaaf66-a01a-4640-a3e4-aef656269368.idx => part-0-d68dd2a3-0a18-42d9-9d62-d4fc646610ac.idx}/metadata.json.gz (100%) delete mode 100644 hail_search/fixtures/GRCh38/SNV_INDEL/families/WGS/F000002_2.ht/rows/parts/.part-0-5efaaf66-a01a-4640-a3e4-aef656269368.crc create mode 100644 hail_search/fixtures/GRCh38/SNV_INDEL/families/WGS/F000002_2.ht/rows/parts/.part-0-d68dd2a3-0a18-42d9-9d62-d4fc646610ac.crc delete mode 100644 hail_search/fixtures/GRCh38/SNV_INDEL/families/WGS/F000002_2.ht/rows/parts/part-0-5efaaf66-a01a-4640-a3e4-aef656269368 create mode 100644 hail_search/fixtures/GRCh38/SNV_INDEL/families/WGS/F000002_2.ht/rows/parts/part-0-d68dd2a3-0a18-42d9-9d62-d4fc646610ac diff --git a/hail_search/fixtures/GRCh38/SNV_INDEL/families/WGS/F000002_2.ht/.README.txt.crc b/hail_search/fixtures/GRCh38/SNV_INDEL/families/WGS/F000002_2.ht/.README.txt.crc index f7799b94778f02019a04657be1cc91ebeb101949..3b6f654d6c82ab84756a952e252b70193d3aaff9 100644 GIT binary patch literal 12 TcmYc;N@ieSU}AVIzG@->6E*{I literal 12 TcmYc;N@ieSU}6yY%H|FL5ds2{ diff --git a/hail_search/fixtures/GRCh38/SNV_INDEL/families/WGS/F000002_2.ht/README.txt b/hail_search/fixtures/GRCh38/SNV_INDEL/families/WGS/F000002_2.ht/README.txt index 3fea5d0da1..6eb9cb83f0 100644 --- a/hail_search/fixtures/GRCh38/SNV_INDEL/families/WGS/F000002_2.ht/README.txt +++ b/hail_search/fixtures/GRCh38/SNV_INDEL/families/WGS/F000002_2.ht/README.txt @@ -1,3 +1,3 @@ This folder comprises a Hail (www.hail.is) native Table or MatrixTable. Written with version 0.2.130-bea04d9c79b5 - Created at 2024/10/02 14:46:35 \ No newline at end of file + Created at 2024/11/04 13:45:23 \ No newline at end of file diff --git a/hail_search/fixtures/GRCh38/SNV_INDEL/families/WGS/F000002_2.ht/index/part-0-5efaaf66-a01a-4640-a3e4-aef656269368.idx/.index.crc b/hail_search/fixtures/GRCh38/SNV_INDEL/families/WGS/F000002_2.ht/index/part-0-d68dd2a3-0a18-42d9-9d62-d4fc646610ac.idx/.index.crc similarity index 100% rename from hail_search/fixtures/GRCh38/SNV_INDEL/families/WGS/F000002_2.ht/index/part-0-5efaaf66-a01a-4640-a3e4-aef656269368.idx/.index.crc rename to hail_search/fixtures/GRCh38/SNV_INDEL/families/WGS/F000002_2.ht/index/part-0-d68dd2a3-0a18-42d9-9d62-d4fc646610ac.idx/.index.crc diff --git a/hail_search/fixtures/GRCh38/SNV_INDEL/families/WGS/F000002_2.ht/index/part-0-5efaaf66-a01a-4640-a3e4-aef656269368.idx/.metadata.json.gz.crc b/hail_search/fixtures/GRCh38/SNV_INDEL/families/WGS/F000002_2.ht/index/part-0-d68dd2a3-0a18-42d9-9d62-d4fc646610ac.idx/.metadata.json.gz.crc similarity index 100% rename from hail_search/fixtures/GRCh38/SNV_INDEL/families/WGS/F000002_2.ht/index/part-0-5efaaf66-a01a-4640-a3e4-aef656269368.idx/.metadata.json.gz.crc rename to hail_search/fixtures/GRCh38/SNV_INDEL/families/WGS/F000002_2.ht/index/part-0-d68dd2a3-0a18-42d9-9d62-d4fc646610ac.idx/.metadata.json.gz.crc diff --git a/hail_search/fixtures/GRCh38/SNV_INDEL/families/WGS/F000002_2.ht/index/part-0-5efaaf66-a01a-4640-a3e4-aef656269368.idx/index b/hail_search/fixtures/GRCh38/SNV_INDEL/families/WGS/F000002_2.ht/index/part-0-d68dd2a3-0a18-42d9-9d62-d4fc646610ac.idx/index similarity index 100% rename from hail_search/fixtures/GRCh38/SNV_INDEL/families/WGS/F000002_2.ht/index/part-0-5efaaf66-a01a-4640-a3e4-aef656269368.idx/index rename to hail_search/fixtures/GRCh38/SNV_INDEL/families/WGS/F000002_2.ht/index/part-0-d68dd2a3-0a18-42d9-9d62-d4fc646610ac.idx/index diff --git a/hail_search/fixtures/GRCh38/SNV_INDEL/families/WGS/F000002_2.ht/index/part-0-5efaaf66-a01a-4640-a3e4-aef656269368.idx/metadata.json.gz b/hail_search/fixtures/GRCh38/SNV_INDEL/families/WGS/F000002_2.ht/index/part-0-d68dd2a3-0a18-42d9-9d62-d4fc646610ac.idx/metadata.json.gz similarity index 100% rename from hail_search/fixtures/GRCh38/SNV_INDEL/families/WGS/F000002_2.ht/index/part-0-5efaaf66-a01a-4640-a3e4-aef656269368.idx/metadata.json.gz rename to hail_search/fixtures/GRCh38/SNV_INDEL/families/WGS/F000002_2.ht/index/part-0-d68dd2a3-0a18-42d9-9d62-d4fc646610ac.idx/metadata.json.gz diff --git a/hail_search/fixtures/GRCh38/SNV_INDEL/families/WGS/F000002_2.ht/rows/.metadata.json.gz.crc b/hail_search/fixtures/GRCh38/SNV_INDEL/families/WGS/F000002_2.ht/rows/.metadata.json.gz.crc index caf4248bc39fd6678d852baffee083d06b11a820..6a1017e8ebf299656da8b2b4dee4cd373e563000 100644 GIT binary patch literal 16 XcmYc;N@ieSU}8A2OZP$7&J9}uDVPRw literal 16 XcmYc;N@ieSU}E_3?py2Xq+2ZjFBJy| diff --git a/hail_search/fixtures/GRCh38/SNV_INDEL/families/WGS/F000002_2.ht/rows/metadata.json.gz b/hail_search/fixtures/GRCh38/SNV_INDEL/families/WGS/F000002_2.ht/rows/metadata.json.gz index c18fceb46be2b260ee2b9874e13c6452c7f4e278..eeeb78776570901cc864e22a18bd0d1ed5646f88 100644 GIT binary patch delta 616 zcmV-u0+;>s1oQ-u7k@4Z5J7H0DMG4N-GcV86+*5(0dG?WIc8NB<-d2F?*vvVm3k=$ zl)M?wyf=Q4eI$}T1M$gRa(DrL|Lc0O1LhKote@aO{09<7Y#-x04MPYaCMyiFhyyc; z#6K1lmWLhiNg2Q_Fc3z*O~*8bg;sl}k7+r-0kKGGu`!sCRDT_;T@(u~B8kXc>aLqu zd2a+pO3}kZk-D-15o%Dee-Z$xm4Gr(?>GDDXN9fN*q`2n5!GJLy1pyW*)o4hR*BK^ zH`mcnaBKd*%*r)1_dx)vHT&D? z*l`ErDr6D16@MYGrHqmG6EbKdJsNN!{$YaG?{~e^Wxr$1)1?=#Lt#Ll+ba|ELlMHb zt)*dJV5#{Ogm+YL5x=_no~9c#1RA6kdz0_#dmacC>$Tu7nW=ETXzzxhs$7itAL!Y{ zih>{pT{59kMw;fUYdwP7Jr*hVnF;bB@KU|Z{BC9w4VZb z-a@Hk*ZBRzy0zJ-M$C{8H(l070gDtrPwGM+mJ?`r?^JnPcU$%4PCX~(KSDmEd2wj( zJdx5FRMTlzNr)-Fqe|ZhbI{}2Z(i(<&AkEVF74VK>J03j%ZK)md#=rU0rPsE=X5Ab z?*)JEsbSo}IND2Y)*nf%v4Rnn-6HTI^DuU0Tjd~~!o$ROI=${NsV*AWe>B025y34d zAo&~X44uB?cmuClYKb|sw33i4+;cQ{N)5F`iA_xtgCs@`)moWeN%9JAp*YYd2><}3 CHzjxg delta 615 zcmV-t0+{{u1oH%t7k`!zupl==DMG4NT|j%-3L!U{fVZiG9J4Bm^4~kocLJ44rC!Pb zC2z(v?~Pw%ABkYkKpZj?KD>ZG|9!LAf!8GlSwF#nI1eO@ynT%CEDRxpn5;15MLu{s zkvPYq!t$^Ke_RGI3p9k09}}0wuuyXEsbgBsX+T~i6yIo!3x6gL#x9Dv;*mgPCY0Sx zjJ!7jBPrS8p-5dB0S^_(*f|M+P?AF#sP~)xae88`O@I$h>Z$tux0 z{^dFv3hwm(x9NPmwFlozf>|?6)WDGb#zy_>^?USU)H8xDNu5t=ZpA zT&p{9tB^swEq@RFT8fLbpO8T#=~06V{vQ))zi-piWq)Gjr%Nwfhr)n8w^t_mha$Lk zTT8>Nz*6%`2=AHNB7Svsou+Fv1Qw(gdzbI(dmeBZt2OsuGE?Dv(cTS1Rk;{(KGCy@ z5d}dEs${~1h!o3L*Lo!9{Z~n;32E3#3%Jy*C94xoEq^v&#DMr=3KsrE-+ataX+H_# zyoFN7uJQYab!)RvjhG>yZn~_E1TT{Qc~Tepu$(}{d#B3Vy4$KRcj`GQZwUE{=Eb3X z@I*>yP)(;5*J>$_tD%bHPj9zHqlKql4vzdDXDuU$tx--88asd008!1 BAaVcz diff --git a/hail_search/fixtures/GRCh38/SNV_INDEL/families/WGS/F000002_2.ht/rows/parts/.part-0-5efaaf66-a01a-4640-a3e4-aef656269368.crc b/hail_search/fixtures/GRCh38/SNV_INDEL/families/WGS/F000002_2.ht/rows/parts/.part-0-5efaaf66-a01a-4640-a3e4-aef656269368.crc deleted file mode 100644 index d4dcde073f96bc3f5e9908e425b67b6ab38d26da..0000000000000000000000000000000000000000 GIT binary patch literal 0 HcmV?d00001 literal 12 TcmYc;N@ieSU}E^a_mM3C6{G|b diff --git a/hail_search/fixtures/GRCh38/SNV_INDEL/families/WGS/F000002_2.ht/rows/parts/.part-0-d68dd2a3-0a18-42d9-9d62-d4fc646610ac.crc b/hail_search/fixtures/GRCh38/SNV_INDEL/families/WGS/F000002_2.ht/rows/parts/.part-0-d68dd2a3-0a18-42d9-9d62-d4fc646610ac.crc new file mode 100644 index 0000000000000000000000000000000000000000..4155311e5a4dac9c8a79c47c1560d5917061165e GIT binary patch literal 12 TcmYc;N@ieSU}88fdg&Yh6HNoR literal 0 HcmV?d00001 diff --git a/hail_search/fixtures/GRCh38/SNV_INDEL/families/WGS/F000002_2.ht/rows/parts/part-0-5efaaf66-a01a-4640-a3e4-aef656269368 b/hail_search/fixtures/GRCh38/SNV_INDEL/families/WGS/F000002_2.ht/rows/parts/part-0-5efaaf66-a01a-4640-a3e4-aef656269368 deleted file mode 100644 index e113fa74e796762da26b63b59a9957b9f99af9dd..0000000000000000000000000000000000000000 GIT binary patch literal 0 HcmV?d00001 literal 206 zcmdnVz`*bWh&8tA|5f;r%F0l}!N|apoKa+WJdlaW(V5Yafti6pgu#Y|A(=sf=Yc&J z&*5Xcg_sya7~M4#pV%vWuvZaj{CGi|iP1e-f8pMiZ$h{1rFj^VYp?MxJCT0ZUX|s8 zy++&ii`tCRVS&LxAw`LK$r-7^egT%2dX}ao`Gy7tdIko}x-1M5EDTmPQi(g43m&tV z