Contents

1 Introduction

This R package provides methods for genetic finemapping in inbred mice by taking advantage of their very high homozygosity rate (>95%).

Method fetch allows to download homozygous genotypes of 37 inbred mouse strains for a given genetic region.

2 Installation

if(!requireNamespace("BiocManager", quietly = TRUE))
    install.packages("BiocManager")
BiocManager::install("MouseFM")

3 Loading package

library(MouseFM)
#> 
#>   ---------
#>   
#>   For example usage please run: vignette('MouseFM')
#>   
#>   Github Repo: https://github.com/matmu/MouseFM
#>   MouseFM Backend: https://github.com/matmu/MouseFM-Backend  
#> 
#>   Citation appreciated:
#>   Munz M, Khodaygani M, Aherrahrou Z, Busch H, Wohlers I (2021) In silico candidate variant and gene identification using inbred mouse strains. PeerJ. doi:10.7717/peerj.11017
#>                         
#>   ---------

4 Example function calls

Fetch genotypes for region chr1:5000000-6000000.

df = fetch("chr1", start=5000000, end=6000000)
#> Query chr1:5,000,000-6,000,000

df[1:10,]
#>    chr     pos        rsid ref alt most_severe_consequence
#> 1    1 5000016  rs47088541   A   T          intron_variant
#> 2    1 5000029  rs48827827   G   A          intron_variant
#> 3    1 5000057  rs48099867   C   T          intron_variant
#> 4    1 5000062 rs246021564   G   C          intron_variant
#> 5    1 5000067 rs265132353   C   T          intron_variant
#> 6    1 5000068  rs51419610   A   G          intron_variant
#> 7    1 5000101 rs253320650   C   G          intron_variant
#> 8    1 5000156        <NA>   C   T          intron_variant
#> 9    1 5000157 rs216747169   G   A          intron_variant
#> 10   1 5000240        <NA>   T   G          intron_variant
#>                                                           consequences C57BL_6J
#> 1  non_coding_transcript_variant,intron_variant,NMD_transcript_variant        0
#> 2  non_coding_transcript_variant,intron_variant,NMD_transcript_variant        0
#> 3  non_coding_transcript_variant,intron_variant,NMD_transcript_variant        0
#> 4  non_coding_transcript_variant,intron_variant,NMD_transcript_variant        0
#> 5  non_coding_transcript_variant,intron_variant,NMD_transcript_variant        0
#> 6  non_coding_transcript_variant,intron_variant,NMD_transcript_variant        0
#> 7  non_coding_transcript_variant,intron_variant,NMD_transcript_variant        0
#> 8  non_coding_transcript_variant,intron_variant,NMD_transcript_variant        0
#> 9  non_coding_transcript_variant,intron_variant,NMD_transcript_variant        0
#> 10 non_coding_transcript_variant,intron_variant,NMD_transcript_variant        0
#>    129P2_OlaHsd 129S1_SvImJ 129S5SvEvBrd AKR_J A_J BALB_cJ BTBR BUB_BnJ C3H_HeH
#> 1             0           0            0     0   0       0    0       0       1
#> 2             0           0            0     0   0       0    0       0       1
#> 3             0           0            0     0   0       0    0       0       1
#> 4             0           0            0     0   0       0    0       0       1
#> 5             0           0            0     0   0       0    0       0       1
#> 6             0           0            0     0   0       0    0       0       1
#> 7             0           0            0     0   0       0    0       0       1
#> 8             0           0            0     0   0       0    0       0       0
#> 9             0           0            0     0   0       0    0       0       1
#> 10            0           0            0     0   0       0    0       0       0
#>    C3H_HeJ C57BL_10J C57BL_6NJ C57BR_cdJ C57L_J C58_J CAST_EiJ CBA_J DBA_1J
#> 1        1         0         0         0      0     0        1     1      1
#> 2        1         0         0         0      0     0        0     1      1
#> 3        1         0         0         0      0     0        0     1      1
#> 4        1         0         0         0      0     0        0     1      1
#> 5        1         0         0         0      0     0        0     1      1
#> 6        1         0         0         0      0     0        0     1      1
#> 7        1         0         0         0      0     0        0     1      1
#> 8        0         0         0         0      0     0        0     0      0
#> 9        1         0         0         0      0     0        0     1      0
#> 10       0         0         0         0      0     0        0     0      0
#>    DBA_2J FVB_NJ I_LnJ KK_HiJ LEWES_EiJ LP_J MOLF_EiJ NOD_ShiLtJ NZB_B1NJ
#> 1       1      0     0      0         1    0        0          0        1
#> 2       1      0     0      0         1    0        0          0        0
#> 3       1      0     0      0         1    0        0          0        0
#> 4       1      0     0      0         1    0        0          0        0
#> 5       1      0     0      0         1    0        0          0        0
#> 6       1      0     0      0         1    0        0          0        0
#> 7       1      0     0      0         1    0        0          0        0
#> 8       0      0     0      0         0    0        0          0        1
#> 9       0      0     0      0         1    0        0          0        0
#> 10      0      0     0      0         0    0        0          0        1
#>    NZO_HlLtJ NZW_LacJ PWK_PhJ RF_J SEA_GnJ SPRET_EiJ ST_bJ WSB_EiJ ZALENDE_EiJ
#> 1          0        0       1    1       0         1     0       1           1
#> 2          0        0       1    1       0         1     0       1           1
#> 3          0        0       1    1       0         1     0       1           1
#> 4          0        0       1    1       0         1     0       1           1
#> 5          0        0       1    1       0         0     0       1           1
#> 6          0        0       1    1       0         1     0       1           1
#> 7          0        0       1    1       0         1     0       1           1
#> 8          0        0       0    0       0         0     0       0           0
#> 9          0        0       0    1       0         0     0       1           1
#> 10         0        0       0    0       0         0     0       0           0

View meta information

comment(df)
#> [1] "#Alleles of strain C57BL_6J represent the reference (ref) alleles"
#> [2] "#reference_version=GRCm38"

5 Output of Session Info

The output of sessionInfo() on the system on which this document was compiled:

sessionInfo()
#> R version 4.4.0 beta (2024-04-15 r86425)
#> Platform: x86_64-pc-linux-gnu
#> Running under: Ubuntu 22.04.4 LTS
#> 
#> Matrix products: default
#> BLAS:   /home/biocbuild/bbs-3.19-bioc/R/lib/libRblas.so 
#> LAPACK: /usr/lib/x86_64-linux-gnu/lapack/liblapack.so.3.10.0
#> 
#> locale:
#>  [1] LC_CTYPE=en_US.UTF-8       LC_NUMERIC=C              
#>  [3] LC_TIME=en_GB              LC_COLLATE=C              
#>  [5] LC_MONETARY=en_US.UTF-8    LC_MESSAGES=en_US.UTF-8   
#>  [7] LC_PAPER=en_US.UTF-8       LC_NAME=C                 
#>  [9] LC_ADDRESS=C               LC_TELEPHONE=C            
#> [11] LC_MEASUREMENT=en_US.UTF-8 LC_IDENTIFICATION=C       
#> 
#> time zone: America/New_York
#> tzcode source: system (glibc)
#> 
#> attached base packages:
#> [1] stats     graphics  grDevices utils     datasets  methods   base     
#> 
#> other attached packages:
#> [1] MouseFM_1.13.0   BiocStyle_2.31.0
#> 
#> loaded via a namespace (and not attached):
#>  [1] KEGGREST_1.43.0         gtable_0.3.4            ggplot2_3.5.0          
#>  [4] xfun_0.43               bslib_0.7.0             httr2_1.0.1            
#>  [7] rlist_0.4.6.2           Biobase_2.63.1          vctrs_0.6.5            
#> [10] tools_4.4.0             generics_0.1.3          curl_5.2.1             
#> [13] stats4_4.4.0            tibble_3.2.1            fansi_1.0.6            
#> [16] AnnotationDbi_1.65.2    RSQLite_2.3.6           blob_1.2.4             
#> [19] pkgconfig_2.0.3         data.table_1.15.4       dbplyr_2.5.0           
#> [22] S4Vectors_0.41.6        lifecycle_1.0.4         GenomeInfoDbData_1.2.12
#> [25] compiler_4.4.0          stringr_1.5.1           Biostrings_2.71.5      
#> [28] progress_1.2.3          munsell_0.5.1           GenomeInfoDb_1.39.14   
#> [31] htmltools_0.5.8.1       sass_0.4.9              yaml_2.3.8             
#> [34] tidyr_1.3.1             pillar_1.9.0            crayon_1.5.2           
#> [37] jquerylib_0.1.4         cachem_1.0.8            gtools_3.9.5           
#> [40] tidyselect_1.2.1        digest_0.6.35           stringi_1.8.3          
#> [43] purrr_1.0.2             reshape2_1.4.4          dplyr_1.1.4            
#> [46] bookdown_0.39           grid_4.4.0              biomaRt_2.59.1         
#> [49] fastmap_1.1.1           colorspace_2.1-0        cli_3.6.2              
#> [52] magrittr_2.0.3          utf8_1.2.4              scales_1.3.0           
#> [55] filelock_1.0.3          prettyunits_1.2.0       UCSC.utils_0.99.7      
#> [58] rappdirs_0.3.3          bit64_4.0.5             rmarkdown_2.26         
#> [61] XVector_0.43.1          httr_1.4.7              bit_4.0.5              
#> [64] png_0.1-8               hms_1.1.3               memoise_2.0.1          
#> [67] evaluate_0.23           knitr_1.46              GenomicRanges_1.55.4   
#> [70] IRanges_2.37.1          BiocFileCache_2.11.2    rlang_1.1.3            
#> [73] Rcpp_1.0.12             glue_1.7.0              DBI_1.2.2              
#> [76] xml2_1.3.6              BiocManager_1.30.22     BiocGenerics_0.49.1    
#> [79] jsonlite_1.8.8          plyr_1.8.9              R6_2.5.1               
#> [82] zlibbioc_1.49.3