PyPI - gwaslab - Versions diffs - 3.4.49__py3-none-any.whl → 3.5.1__py3-none-any.whl - Mend

gwaslab 3.4.49__py3-none-any.whl → 3.5.1__py3-none-any.whl

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Potentially problematic release.

This version of gwaslab might be problematic. Click here for more details.

Files changed (21)

gwaslab/bd_get_hapmap3.py +3 -1
gwaslab/g_Sumstats.py +22 -10
gwaslab/g_version.py +2 -2
gwaslab/io_process_args.py +23 -0
gwaslab/qc_fix_sumstats.py +9 -5
gwaslab/util_in_get_sig.py +18 -2
gwaslab/vis_plot_credible sets.py +0 -0
gwaslab/viz_aux_annotate_plot.py +83 -242
gwaslab/viz_aux_property.py +2 -0
gwaslab/viz_aux_quickfix.py +9 -2
gwaslab/viz_aux_save_figure.py +2 -1
gwaslab/viz_plot_compare_effect.py +870 -523
gwaslab/viz_plot_mqqplot.py +74 -21
gwaslab/viz_plot_phe_heatmap.py +260 -0
gwaslab/viz_plot_stackedregional.py +1 -1
{gwaslab-3.4.49.dist-info → gwaslab-3.5.1.dist-info}/METADATA +3 -3
{gwaslab-3.4.49.dist-info → gwaslab-3.5.1.dist-info}/RECORD +21 -17
{gwaslab-3.4.49.dist-info → gwaslab-3.5.1.dist-info}/WHEEL +1 -1
{gwaslab-3.4.49.dist-info → gwaslab-3.5.1.dist-info}/LICENSE +0 -0
{gwaslab-3.4.49.dist-info → gwaslab-3.5.1.dist-info}/LICENSE_before_v3.4.39 +0 -0
{gwaslab-3.4.49.dist-info → gwaslab-3.5.1.dist-info}/top_level.txt +0 -0

gwaslab/bd_get_hapmap3.py CHANGED Viewed

@@ -47,8 +47,10 @@ def gethapmap3(sumstats,rsid="rsID",chrom="CHR", pos="POS", ea="EA", nea="NEA",b
     #rsid    A1      A2      #CHROM  POS
     #rs3094315       G       A       1       752566
-    if rsid in sumstats.columns and how=="inner":
+    if rsid in sumstats.columns:
+        log.write(" -rsID will be used for matching...", verbose=verbose)
         output = sumstats.loc[sumstats[rsid].isin(hapmap3_ref["rsid"].values),:].copy()
+        log.write(" -Raw input contains "+str(len(output))+" Hapmap3 variants based on rsID...", verbose=verbose)
         return output
     elif chrom in sumstats.columns and pos in sumstats.columns:

gwaslab/g_Sumstats.py CHANGED Viewed

@@ -81,6 +81,7 @@ from gwaslab.bd_get_hapmap3 import gethapmap3
 from gwaslab.util_abf_finemapping import abf_finemapping
 from gwaslab.util_abf_finemapping import make_cs
 import gc
+from gwaslab.viz_plot_phe_heatmap import _gwheatmap
 #20220309
 class Sumstats():
@@ -602,6 +603,11 @@ class Sumstats():
     def plot_daf(self, **kwargs):
         fig,outliers = plotdaf(self.data, **kwargs)
         return fig, outliers
+    def plot_gwheatmap(self, **kwargs):
+        fig = _gwheatmap(self.data, **kwargs)
+        return fig
     def plot_mqq(self, build=None, **kwargs):
         chrom="CHR"
@@ -705,7 +711,7 @@ class Sumstats():
         # return sumstats object
         return output
-    def check_cis(self, **kwargs):
+    def check_cis(self, gls=False, **kwargs):
         if "SNPID" in self.data.columns:
             id_to_use = "SNPID"
         else:
@@ -717,7 +723,13 @@ class Sumstats():
                            p="P",
                            log=self.log,
                            **kwargs)
-        # return sumstats object
+        # return sumstats object
+        if gls == True:
+            new_Sumstats_object = copy.deepcopy(self)
+            new_Sumstats_object.data = output
+            gc.collect()
+            return new_Sumstats_object
         return output
     def check_novel_set(self, **kwargs):
@@ -778,28 +790,28 @@ class Sumstats():
 ## LDSC ##############################################################################################
-    def estimate_h2_by_ldsc(self, build=None, verbose=True, match_allele=True, **kwargs):
+    def estimate_h2_by_ldsc(self, build=None, verbose=True, match_allele=True, how="right", **kwargs):
         if build is None:
             build = self.meta["gwaslab"]["genome_build"]
-        insumstats = gethapmap3(self.data.copy(), build=build, verbose=verbose , match_allele=True, how="right" )
+        insumstats = gethapmap3(self.data.copy(), build=build, verbose=verbose , match_allele=match_allele, how=how )
         self.ldsc_h2, self.ldsc_h2_results = _estimate_h2_by_ldsc(insumstats=insumstats, log=self.log, verbose=verbose, **kwargs)
-    def estimate_rg_by_ldsc(self, build=None, verbose=True, match_allele=True, **kwargs):
+    def estimate_rg_by_ldsc(self, build=None, verbose=True, match_allele=True, how="right",**kwargs):
         if build is None:
             build = self.meta["gwaslab"]["genome_build"]
-        insumstats = gethapmap3(self.data.copy(), build=build, verbose=verbose , match_allele=True, how="right" )
+        insumstats = gethapmap3(self.data.copy(), build=build, verbose=verbose , match_allele=match_allele, how=how )
         self.ldsc_rg = _estimate_rg_by_ldsc(insumstats=insumstats, log=self.log, verbose=verbose, **kwargs)
-    def estimate_h2_cts_by_ldsc(self, build=None, verbose=True, match_allele=True, **kwargs):
+    def estimate_h2_cts_by_ldsc(self, build=None, verbose=True, match_allele=True, how="right",**kwargs):
         if build is None:
             build = self.meta["gwaslab"]["genome_build"]
-        insumstats = gethapmap3(self.data.copy(), build=build, verbose=verbose , match_allele=True, how="right" )
+        insumstats = gethapmap3(self.data.copy(), build=build, verbose=verbose , match_allele=match_allele, how=how )
         self.ldsc_h2_cts  = _estimate_h2_cts_by_ldsc(insumstats=insumstats, log=self.log, verbose=verbose, **kwargs)
-    def estimate_partitioned_h2_by_ldsc(self, build=None, verbose=True, match_allele=True, **kwargs):
+    def estimate_partitioned_h2_by_ldsc(self, build=None, verbose=True, match_allele=True, how="right",**kwargs):
         if build is None:
             build = self.meta["gwaslab"]["genome_build"]
-        insumstats = gethapmap3(self.data.copy(), build=build, verbose=verbose , match_allele=True, how="right" )
+        insumstats = gethapmap3(self.data.copy(), build=build, verbose=verbose , match_allele=match_allele, how=how )
         self.ldsc_partitioned_h2_summary, self.ldsc_partitioned_h2_results  = _estimate_partitioned_h2_by_ldsc(insumstats=insumstats, log=self.log, verbose=verbose, **kwargs)
 # external ################################################################################################

gwaslab/g_version.py CHANGED Viewed

@@ -15,8 +15,8 @@ def _get_version():
 def gwaslab_info():
     # version meta information
     dic={
-   "version":"3.4.49",
-   "release_date":"20241019"
+   "version":"3.5.1",
+   "release_date":"20241120"
     }
     return dic

gwaslab/io_process_args.py ADDED Viewed

@@ -0,0 +1,23 @@
+import copy
+def _merge_and_sync_dic(list_of_dics:list, default:dict) -> dict:
+    temp = copy.copy(default)
+    for dic in list_of_dics:
+        if isinstance(dic, dict):
+            temp.update(dic)
+    return temp
+def _list_func_args(func):
+    return func.__code__.co_varnames
+def _extract_kwargs(prefix:str, default:dict, kwargs:dict) -> dict:
+    extracted = []
+    for key,value in kwargs.items():
+        if key=="kwargs" or key=="args":
+            for key_nested,value_nested in kwargs[key].items():
+                if prefix in key_nested and "arg" in key_nested:
+                    extracted.append(value_nested)
+        else:
+            if prefix in key and "arg" in key:
+                extracted.append(value)
+    merged_arg = _merge_and_sync_dic(extracted, default)
+    return merged_arg

gwaslab/qc_fix_sumstats.py CHANGED Viewed

@@ -1579,14 +1579,14 @@ def liftover_variant(sumstats,
     try:
         if chain is None:
-            converter = get_lifter(from_build,to_build,one_based=True)
+            converter = get_lifter("hg{}".format(from_build),"hg{}".format(to_build),one_based=True)
         else:
-            converter = ChainFile(chain, one_based=True)
+            converter = ChainFile(chain,target="",query="", one_based=True)
     except:
         if chain is None:
-            converter = get_lifter(from_build,to_build)
+            converter = get_lifter("hg{}".format(from_build),"hg{}".format(to_build))
         else:
-            converter = ChainFile(chain)
+            converter = ChainFile(chain, target="",query="")
     dic= get_number_to_chr(in_chr=False,xymt=["X","Y","M"])
     dic2= get_chr_to_number(out_chr=False)
@@ -1627,11 +1627,15 @@ def parallelizeliftovervariant(sumstats,n_cores=1,chrom="CHR", pos="POS", from_b
     else:
         try:
             chain = get_chain(from_build=from_build, to_build=to_build)
-            log.write(" -Creating converter using ChainFile: {}".format(chain), verbose=verbose)
+            if chain is None or chain==False:
+                raise ValueError("")
+            log.write(" -Creating converter using provided ChainFile: {}".format(chain), verbose=verbose)
         except:
             chain = None
             lifter_from_build=from_build
             lifter_to_build=to_build
+            log.write(" -Try creating converter using liftover package", verbose=verbose)
     log.write(" -Creating converter : {} -> {}".format(lifter_from_build, lifter_to_build), verbose=verbose)
     # valid chr and pos
     pattern = r"\w\w\w0\w\w\w"

gwaslab/util_in_get_sig.py CHANGED Viewed

@@ -619,8 +619,10 @@ def _check_cis(insumstats,
     except:
         pass
-    allsig["CIS/TRANS"] = allsig.apply(lambda x: determine_if_cis(x, group_key,windowsizekb, reference_dict), axis=1)
+    #allsig["CIS/TRANS"] = allsig.apply(lambda x: determine_if_cis(x, group_key,windowsizekb, reference_dict), axis=1)
+    cis_tuples = allsig.apply(lambda x: determine_if_cis2(x, group_key,windowsizekb, reference_dict), axis=1)
+    allsig[["CIS/TRANS","REF_CHR","REF_START","REF_END"]] = pd.DataFrame(cis_tuples.tolist(), index=allsig.index)
     try:
         allsig = allsig.where(~pd.isna(allsig), pd.NA)
     except:
@@ -689,6 +691,20 @@ def determine_if_cis(x, group_key,windowsizekb, reference_dict):
     else:
         return "NoReference"
+def determine_if_cis2(x, group_key,windowsizekb, reference_dict):
+    if x[group_key] in reference_dict.keys():
+        is_same_chr = str(reference_dict[x[group_key]][0]) == str(x["CHR"])
+        is_large_than_start = int(reference_dict[x[group_key]][1]) - windowsizekb*1000 <= x["POS"]
+        is_smaller_than_end = int(reference_dict[x[group_key]][2]) + windowsizekb*1000 >= x["POS"]
+        if  is_same_chr and is_large_than_start  and is_smaller_than_end:
+            return "Cis", int(reference_dict[x[group_key]][0]), int(reference_dict[x[group_key]][1]), int(reference_dict[x[group_key]][2])
+        else:
+            return "Trans", int(reference_dict[x[group_key]][0]), int(reference_dict[x[group_key]][1]), int(reference_dict[x[group_key]][2])
+    else:
+        return "NoReference", pd.NA, pd.NA, pd.NA
 def determine_distance(allsig, knownsig):
     if len(allsig)==0:
         return allsig

gwaslab/vis_plot_credible sets.py ADDED Viewed

File without changes

gwaslab 3.4.49__py3-none-any.whl → 3.5.1__py3-none-any.whl

Potentially problematic release.

gwaslab 3.4.49__py3-none-any.whl → 3.5.1__py3-none-any.whl