Add JWAS tests to HSmice test.

author: Arun Isaac 2025-11-13 02:23:34 +0000
committer: Arun Isaac 2025-11-13 02:23:34 +0000
commit: 2bd7b74814ca208a30382c6ad847e169addc542d (patch)
tree: 89d51b7a3aeffe759474e52ae104ed9f1b74646e /e2e-tests/hsmice
parent: f0076f0a413ad3706e3b012b07e4a14c61c79b6e (diff)
download: pyhegp-2bd7b74814ca208a30382c6ad847e169addc542d.tar.gz
pyhegp-2bd7b74814ca208a30382c6ad847e169addc542d.tar.lz
pyhegp-2bd7b74814ca208a30382c6ad847e169addc542d.zip
2 files changed, 59 insertions, 0 deletions
diff --git a/e2e-tests/hsmice/jwas-gwas.jl b/e2e-tests/hsmice/jwas-gwas.jl
new file mode 100644
index 0000000..193b8ed
--- /dev/null
+++ b/e2e-tests/hsmice/jwas-gwas.jl
@@ -0,0 +1,46 @@
+using CSV, DataFrames, JWAS
+using Pipe: @pipe
+
+if length(ARGS) != 3
+    print(stderr, "Usage: julia jwas-gwas.jl GENOTYPE-FILE PHENOTYPE-FILE OUTPUT-GWAS-FILE\n")
+    exit(1)
+end
+genotype_file, phenotype_file, output_gwas_file = ARGS
+
+genotype = CSV.read(genotype_file, DataFrame; drop=[:reference])
+phenotype = @pipe(CSV.read(phenotype_file, DataFrame)
+                  |> select(_,
+                            "sample-id" => :sample_id,
+                            "Biochem.ALP.resid" => :alp))
+
+genotypes = get_genotypes(@pipe(
+    hcat(DataFrame(snp_id=string.(genotype.chromosome, ":", genotype.position)),
+         @pipe(genotype
+               |> select(_, Not([:chromosome, :position]))))
+    |> permutedims(_, :snp_id)
+    |> rename(_, :snp_id => :sample_id)),
+                          1.8e-5,
+                          G_is_marker_variance=true,
+                          quality_control=false,
+                          center=false,
+                          Pi=0.999,
+                          estimateScale=true)
+
+model = build_model("alp = intercept + genotypes")
+out = runMCMC(model,
+              phenotype,
+              Pi=0.99,
+              estimateScale=true,
+              chain_length=50000,
+              burnin=5000,
+              output_heritability=true,
+              output_samples_frequency=100,
+              # fix seed for reproducibility
+              seed=1)
+
+gwas = GWAS("results/MCMC_samples_marker_effects_genotypes_alp.txt")
+CSV.write(output_gwas_file,
+          transform(gwas,
+                    :marker_ID => ByRow(x -> split(x, ":")[1]) => :chromosome,
+                    :marker_ID => ByRow(x -> parse(Int, split(x, ":")[2])) => :position);
+          delim="\t")
diff --git a/e2e-tests/hsmice/jwas-manhattan.r b/e2e-tests/hsmice/jwas-manhattan.r
new file mode 100644
index 0000000..a437a8c
--- /dev/null
+++ b/e2e-tests/hsmice/jwas-manhattan.r
@@ -0,0 +1,13 @@
+library(dplyr)
+library(qqman)
+library(readr)
+
+args = commandArgs(trailingOnly=TRUE)
+if (length(args) != 1) {
+    write("Usage: Rscript jwas-manhattan.r GWAS-FILE", stderr())
+    quit(status=1)
+}
+gwas_file = args[1]
+
+gwas = mutate(read_tsv(gwas_file), antilog=10^(-modelfrequency))
+manhattan(gwas, chr="chromosome", bp="position", snp="marker_ID", p="antilog")
author	Arun Isaac	2025-11-13 02:23:34 +0000
committer	Arun Isaac	2025-11-13 02:23:34 +0000
commit	2bd7b74814ca208a30382c6ad847e169addc542d (patch)
tree	89d51b7a3aeffe759474e52ae104ed9f1b74646e /e2e-tests/hsmice
parent	f0076f0a413ad3706e3b012b07e4a14c61c79b6e (diff)
download	pyhegp-2bd7b74814ca208a30382c6ad847e169addc542d.tar.gz pyhegp-2bd7b74814ca208a30382c6ad847e169addc542d.tar.lz pyhegp-2bd7b74814ca208a30382c6ad847e169addc542d.zip