diff --git a/.gitignore b/.gitignore
index 8ad720caa..777fd2adc 100644
--- a/.gitignore
+++ b/.gitignore
@@ -1,5 +1,6 @@
# Cache with transcript/protein pickle files
.gpsea_cache
+dev/
# Byte-compiled / optimized / DLL files
__pycache__/
diff --git a/README.md b/README.md
index 2a498eb42..c4b00093d 100644
--- a/README.md
+++ b/README.md
@@ -3,7 +3,8 @@
![PyPi downloads](https://img.shields.io/pypi/dm/gpsea.svg?label=Pypi%20downloads)
![PyPI - Python Version](https://img.shields.io/pypi/pyversions/gpsea)
-GPSEA is a Python library for discovery of genotype-phenotype associations.
+GPSEA (Genotypes and Phenotypes - Statistical Evaluation of Associations, pronounced "G"-"P"-"C") is a Python package designed to support genotype-phenotype correlation analysis.
+
See the [Tutorial](https://monarch-initiative.github.io/gpsea/stable/tutorial.html)
and a comprehensive [User guide](https://monarch-initiative.github.io/gpsea/stable/user-guide/index.html)
diff --git a/docs/conf.py b/docs/conf.py
index 6233764c3..c311c2f80 100644
--- a/docs/conf.py
+++ b/docs/conf.py
@@ -60,9 +60,9 @@
# built documents.
#
# The short X.Y version.
-version = u'0.3'
+version = u'0.4'
# The full version, including alpha/beta/rc tags.
-release = u'0.3.0'
+release = u'0.4.0'
# The language for content autogenerated by Sphinx. Refer to documentation
# for a list of supported languages.
diff --git a/docs/index.rst b/docs/index.rst
index f9478fa29..5bcadd386 100644
--- a/docs/index.rst
+++ b/docs/index.rst
@@ -10,8 +10,8 @@ A key question in biology and human genetics concerns the relationships between
genetics, the focus is generally placed on the study of whether specific disease-causing alleles are associated with specific phenotypic
manifestations of the disease.
-`GPSEA` (genotypes and phenotypes - study and evaluation of associations) is a Python package designed to support genotype-phenotype correlation analysis.
-We pronounce GPSEA as "G"-"P"-"C". The input to `GPSEA` is a collection of `Global Alliance for Genomics and Health (GA4GH) Phenopackets
Variant key | +Variant (cDNA) | +Variant (protein) | +Effects | +Count | +
---|---|---|---|---|
12_114385521_114385521_C_T | +c.710G>A | +p.Arg237Gln | +missense | +22 | +
12_114401830_114401830_C_T | +c.238G>A | +p.Gly80Arg | +missense | +20 | +
12_114385563_114385563_G_A | +c.668C>T | +p.Thr223Met | +missense | +8 | +
12_114398675_114398675_G_T | +c.408C>A | +p.Tyr136Ter | +stop gained | +6 | +
12_114399514_114399514_A_C | +c.361T>G | +p.Trp121Gly | +missense, splice region | +5 | +
12_114403792_114403792_C_CG | +c.106_107insC | +p.Ser36ThrfsTer25 | +frameshift | +5 | +
12_114398682_114398682_C_CG | +c.400dup | +p.Arg134ProfsTer49 | +frameshift | +5 | +
12_114385474_114385474_A_G | +c.755+2T>C | +None | +splice donor | +4 | +
12_114398656_114398656_C_CG | +c.426dup | +p.Ala143ArgfsTer40 | +frameshift | +4 | +
12_114366360_114366360_C_T | +c.787G>A | +p.Val263Met | +missense | +4 | +
12_114385522_114385522_G_A | +c.709C>T | +p.Arg237Trp | +missense | +4 | +
12_114403798_114403798_G_GC | +c.100dup | +p.Ala34GlyfsTer27 | +frameshift | +4 | +
12_114399613_114399613_T_A | +c.262A>T | +p.Lys88Ter | +stop gained | +3 | +
12_114401827_114401827_T_A | +c.241A>T | +p.Arg81Trp | +missense, splice region | +3 | +
12_114366312_114366312_G_A | +c.835C>T | +p.Arg279Ter | +stop gained | +3 | +
12_114366366_114366366_T_A | +c.781A>T | +p.Ser261Cys | +missense | +3 | +
12_114403798_114403799_GC_G | +c.100del | +p.Ala34ProfsTer32 | +frameshift | +3 | +
12_114385475_114385475_C_T | +c.755+1G>A | +None | +splice donor | +3 | +
12_114401853_114401853_G_T | +c.215C>A | +p.Thr72Lys | +missense | +3 | +
12_114385521_114385521_C_G | +c.710G>C | +p.Arg237Pro | +missense | +2 | +
12_114398568_114398568_C_A | +c.510+5G>T | +None | +splice donor 5th base, intronic | +2 | +
12_114366207_114366208_GC_G | +c.939del | +p.Gln315ArgfsTer79 | +frameshift | +2 | +
12_114366274_114366274_G_T | +c.873C>A | +p.Tyr291Ter | +stop gained | +2 | +
12_114366267_114366267_C_A | +c.880G>T | +p.Glu294Ter | +stop gained | +2 | +
12_114398578_114398579_CA_C | +c.504del | +p.Phe168LeufsTer6 | +frameshift | +2 | +
12_114394762_114394763_CA_C | +c.641del | +p.Val214GlyfsTer12 | +frameshift | +2 | +
12_114398666_114398667_TG_T | +c.416del | +p.Pro139GlnfsTer11 | +frameshift | +2 | +
12_114403754_114403754_G_T | +c.145C>A | +p.Gln49Lys | +missense, splice region | +2 | +
12_114385550_114385550_A_AATTATTCTCAG | +c.680_681insCTGAGAATAAT | +p.Ile227_Glu228insTer | +inframe insertion, stop retainined | +2 | +
12_114366348_114366349_CT_C | +c.798del | +p.Val267TrpfsTer127 | +frameshift | +1 | +
12_114399559_114399559_T_C | +c.316A>G | +p.Ile106Val | +missense | +1 | +
12_114356064_114356065_TA_T | +c.1024del | +p.Tyr342ThrfsTer52 | +frameshift | +1 | +
12_114355755_114355756_TG_T | +c.1333del | +p.His445MetfsTer137 | +frameshift | +1 | +
12_114398632_114398632_G_A | +c.451C>T | +p.Gln151Ter | +stop gained | +1 | +
12_114401907_114401907_A_G | +c.161T>C | +p.Ile54Thr | +missense | +1 | +
12_114355723_114355723_G_A | +c.1366C>T | +p.Gln456Ter | +stop gained | +1 | +
12_114398602_114398602_T_G | +c.481A>C | +p.Thr161Pro | +missense | +1 | +
12_114398708_114398709_GC_G | +c.374del | +p.Gly125AlafsTer25 | +frameshift | +1 | +
12_114385553_114385553_C_A | +c.678G>T | +p.Lys226Asn | +missense | +1 | +
12_114399633_114399633_C_G | +c.243-1G>C | +None | +splice acceptor | +1 | +
12_114401873_114401874_TA_T | +c.194del | +p.Leu65GlnfsTer10 | +frameshift | +1 | +
12_114399594_114399594_A_C | +c.281T>G | +p.Leu94Arg | +missense | +1 | +
12_114399622_114399622_G_T | +c.253C>A | +p.Pro85Thr | +missense | +1 | +
12_114394743_114394746_TGTG_T | +c.658_660del | +p.His220del | +inframe deletion | +1 | +
12_114394820_114394820_C_G | +c.584G>C | +p.Gly195Ala | +missense | +1 | +
12_114401846_114401846_C_G | +c.222G>C | +p.Met74Ile | +missense | +1 | +
12_114366241_114366242_CT_C | +c.905del | +p.Gln302ArgfsTer92 | +frameshift | +1 | +
12_114355784_114355785_CA_C | +c.1304del | +p.Leu435ArgfsTer147 | +frameshift | +1 | +
12_114398626_114398627_CG_C | +c.456del | +p.Val153SerfsTer21 | +frameshift | +1 | +
12_114403859_114403859_G_T | +c.40C>A | +p.Pro14Thr | +missense | +1 | +
12_114399625_114399629_ACATC_A | +c.246_249del | +p.Met83PhefsTer6 | +frameshift | +1 | +
12_114394817_114394817_G_C | +c.587C>G | +p.Ser196Ter | +stop gained | +1 | +
12_114401921_114401921_C_G | +c.148-1G>C | +None | +splice acceptor | +1 | +
Phenotype MTC filter: HPO MTC filter
Multiple testing correction: fdr_bh
-Performed statistical tests for 17 out of the total of 260 HPO terms.
+Performed statistical tests for 16 out of the total of 260 HPO terms.
Code | @@ -59,80 +59,45 @@|||||
---|---|---|---|---|---|
TODO | +HMF01 | Skipping term with maximum frequency that was less than threshold 0.2 | 51 | ||
TODO | -Skipping general term | -44 | -|||
TODO | -Skipping term because all genotypes have same HPO observed proportions | -41 | -|||
TODO | -Skipping term with only 2 observations (not powered for 2x2) | -26 | -|||
TODO | -Skipping term with only 1 observations (not powered for 2x2) | -24 | -|||
TODO | -Skipping term with only 3 observations (not powered for 2x2) | -22 | +HMF02 | +Skipping term because no genotype has more than one observed HPO count | +3 |
TODO | -Skipping term with only 4 observations (not powered for 2x2) | -14 | +HMF03 | +Skipping term because of a child term with the same individual counts | +1 |
TODO | -Skipping term with only 6 observations (not powered for 2x2) | -12 | +HMF04 | +Skipping term because all genotypes have same HPO observed proportions | +41 |
TODO | -Skipping term with only 5 observations (not powered for 2x2) | -4 | +HMF05 | +Skipping term because one genotype had zero observations | +2 |
TODO | -Skipping term because no genotype has more than one observed HPO count | -3 | +HMF06 | +Skipping term with less than 7 observations (not powered for 2x2) | +102 |
TODO | -Skipping term because one genotype had zero observations | -2 | +HMF08 | +Skipping general term | +44 |
Code | @@ -59,80 +59,45 @@|||||
---|---|---|---|---|---|
TODO | -Skipping term with only 2 observations (not powered for 2x2) | -51 | -|||
TODO | -Skipping term because all genotypes have same HPO observed proportions | -50 | -|||
TODO | -Skipping general term | -44 | -|||
TODO | -Skipping term with only 3 observations (not powered for 2x2) | -27 | -|||
TODO | -Skipping term with only 6 observations (not powered for 2x2) | -19 | +HMF01 | +Skipping term with maximum frequency that was less than threshold 0.2 | +10 |
TODO | -Skipping term with only 4 observations (not powered for 2x2) | -16 | +HMF02 | +Skipping term because no genotype has more than one observed HPO count | +4 |
TODO | -Skipping term with only 5 observations (not powered for 2x2) | -10 | +HMF03 | +Skipping term because of a child term with the same individual counts | +1 |
TODO | -Skipping term with maximum frequency that was less than threshold 0.2 | -10 | +HMF04 | +Skipping term because all genotypes have same HPO observed proportions | +50 |
TODO | -Skipping term with only 1 observations (not powered for 2x2) | -7 | +HMF05 | +Skipping term because one genotype had zero observations | +5 |
TODO | -Skipping term because one genotype had zero observations | -5 | +HMF06 | +Skipping term with less than 7 observations (not powered for 2x2) | +130 |
TODO | -Skipping term because no genotype has more than one observed HPO count | -4 | +HMF08 | +Skipping general term | +44 |
Variant key | +Variant (cDNA) | +Variant (protein) | +Effects | +Count | +
---|---|---|---|---|
{{ vdata.variant_key }} | +{{ vdata.variant_name }} | +{{ vdata.protein_name }} | +{{ vdata.variant_effects }} | +{{ vdata.count }} | +