Title: | Genotype Simulations for Rare or Common Variants Using Haplotypes from 1000 Genomes |
---|---|
Description: | Generates realistic simulated genetic data in families or unrelated individuals. |
Authors: | Apostolos Dimitromanolakis <[email protected]>, Jingxiong Xu <[email protected]>, Agnieszka Krol <[email protected]>, Laurent Briollais <[email protected]> |
Maintainer: | Apostolos Dimitromanolakis <[email protected]> |
License: | GPL (>= 2) |
Version: | 1.40 |
Built: | 2025-01-09 07:11:54 UTC |
Source: | CRAN |
Documentation and examples can be found at the package directory folder inst / doc or at our github url: https://adimitromanolakis.github.io/sim1000G/ inst/doc/SimulatingFamilyData.html
See also our github repository page at: https://github.com/adimitromanolakis/sim1000G
Computes pairwise IBD1 for a specific pair of individuals. See function computePairIBD12 for description.
computePairIBD1(i, j)
computePairIBD1(i, j)
i |
Index of first individual |
j |
Index of second individual |
Mean IBD1 as computed from shared haplotypes
library("sim1000G") examples_dir = system.file("examples", package = "sim1000G") vcf_file = file.path(examples_dir, "region.vcf.gz") vcf = readVCF( vcf_file, maxNumberOfVariants = 100 , min_maf = 0.12 ,max_maf = NA) # For realistic data use the function downloadGeneticMap generateUniformGeneticMap() startSimulation(vcf, totalNumberOfIndividuals = 200) ped1 = newNuclearFamily(1) v = computePairIBD1(1, 3) cat("IBD1 of pair = ", v, "\n");
library("sim1000G") examples_dir = system.file("examples", package = "sim1000G") vcf_file = file.path(examples_dir, "region.vcf.gz") vcf = readVCF( vcf_file, maxNumberOfVariants = 100 , min_maf = 0.12 ,max_maf = NA) # For realistic data use the function downloadGeneticMap generateUniformGeneticMap() startSimulation(vcf, totalNumberOfIndividuals = 200) ped1 = newNuclearFamily(1) v = computePairIBD1(1, 3) cat("IBD1 of pair = ", v, "\n");
Computes pairwise IBD1/2 for a specific pair of individuals
computePairIBD12(i, j)
computePairIBD12(i, j)
i |
Index of first individual |
j |
Index of second individual |
Mean IBD1 and IBD2 as computed from shared haplotypes
library("sim1000G") examples_dir = system.file("examples", package = "sim1000G") vcf_file = file.path(examples_dir, "region.vcf.gz") vcf = readVCF( vcf_file, maxNumberOfVariants = 100 , min_maf = 0.12 ,max_maf = NA) generateUniformGeneticMap() startSimulation(vcf, totalNumberOfIndividuals = 200) ped1 = newNuclearFamily(1) v = computePairIBD12(1, 3) cat("IBD1 of pair = ", v[1], "\n"); cat("IBD2 of pair = ", v[2], "\n");
library("sim1000G") examples_dir = system.file("examples", package = "sim1000G") vcf_file = file.path(examples_dir, "region.vcf.gz") vcf = readVCF( vcf_file, maxNumberOfVariants = 100 , min_maf = 0.12 ,max_maf = NA) generateUniformGeneticMap() startSimulation(vcf, totalNumberOfIndividuals = 200) ped1 = newNuclearFamily(1) v = computePairIBD12(1, 3) cat("IBD1 of pair = ", v[1], "\n"); cat("IBD2 of pair = ", v[2], "\n");
Computes pairwise IBD2 for a specific pair of individuals
computePairIBD2(i, j)
computePairIBD2(i, j)
i |
Index of first individual |
j |
Index of second individual |
Mean IBD2 as computed from shared haplotypes
library("sim1000G") examples_dir = system.file("examples", package = "sim1000G") vcf_file = file.path(examples_dir, "region.vcf.gz") vcf = readVCF( vcf_file, maxNumberOfVariants = 100 , min_maf = 0.12 ,max_maf = NA) # For realistic data use the function downloadGeneticMap generateUniformGeneticMap() startSimulation(vcf, totalNumberOfIndividuals = 200) ped1 = newNuclearFamily(1) v = computePairIBD2(1, 3) cat("IBD2 of pair = ", v, "\n");
library("sim1000G") examples_dir = system.file("examples", package = "sim1000G") vcf_file = file.path(examples_dir, "region.vcf.gz") vcf = readVCF( vcf_file, maxNumberOfVariants = 100 , min_maf = 0.12 ,max_maf = NA) # For realistic data use the function downloadGeneticMap generateUniformGeneticMap() startSimulation(vcf, totalNumberOfIndividuals = 200) ped1 = newNuclearFamily(1) v = computePairIBD2(1, 3) cat("IBD2 of pair = ", v, "\n");
Creates a regional vcf file using bcftools to extract a region from 1000 genomes vcf files
createVCF()
createVCF()
none
This vector contains the density between two recombination events, as a cumulative density function.
crossoverCDFvector
crossoverCDFvector
An object of class logical
of length 1.
Downloads a genetic map for a particular chromosome under GRCh37 coordinates for use with sim1000G.
downloadGeneticMap(chromosome, dir = NA)
downloadGeneticMap(chromosome, dir = NA)
chromosome |
Chromosome number to download recombination distances from. |
dir |
Directory to save the genetic map to (default: temporary directory) |
downloadGeneticMap(22, dir=tempdir() )
downloadGeneticMap(22, dir=tempdir() )
Generates a recombination vector arising from one meiotic event. The origin of segments is coded as (0 - haplotype1 , 1 - haplotype2 )
generateChromosomeRecombinationPositions(chromosomeLength = 500)
generateChromosomeRecombinationPositions(chromosomeLength = 500)
chromosomeLength |
The length of the region in cm. |
library("sim1000G") # generate a recombination events for chromosome 4 readGeneticMap(4) generateChromosomeRecombinationPositions(500)
library("sim1000G") # generate a recombination events for chromosome 4 readGeneticMap(4) generateChromosomeRecombinationPositions(500)
Generates a fake genetic map that spans the whole genome.
generateFakeWholeGenomeGeneticMap(vcf)
generateFakeWholeGenomeGeneticMap(vcf)
vcf |
A vcf file read by function readVCF. |
library("sim1000G") examples_dir = system.file("examples", package = "sim1000G") vcf_file = sprintf("%s/region.vcf.gz", examples_dir) vcf = readVCF( vcf_file, maxNumberOfVariants = 100 , min_maf = 0.12 ,max_maf = NA) # For realistic data use the function # downloadGeneticMap generateFakeWholeGenomeGeneticMap(vcf) pdf(file=tempfile()) plotRegionalGeneticMap(seq(1e6,100e6,by=1e6/2)) dev.off()
library("sim1000G") examples_dir = system.file("examples", package = "sim1000G") vcf_file = sprintf("%s/region.vcf.gz", examples_dir) vcf = readVCF( vcf_file, maxNumberOfVariants = 100 , min_maf = 0.12 ,max_maf = NA) # For realistic data use the function # downloadGeneticMap generateFakeWholeGenomeGeneticMap(vcf) pdf(file=tempfile()) plotRegionalGeneticMap(seq(1e6,100e6,by=1e6/2)) dev.off()
Generate inter-recombination distances using a chi-square model. Note this are the distances between two succesive recombination events and not the absolute positions of the events. To generate the locations of the recombination events see the example below.
generateRecombinationDistances(n)
generateRecombinationDistances(n)
n |
Number of distances to generate |
vector of distances between two recombination events.
library("sim1000G") distances = generateRecombinationDistances(20) positions_of_recombination = cumsum(distances) if(0) hist(generateRecombinationDistances(20000),n=100)
library("sim1000G") distances = generateRecombinationDistances(20) positions_of_recombination = cumsum(distances) if(0) hist(generateRecombinationDistances(20000),n=100)
Generate recombination distances using a no-interference model.
generateRecombinationDistances_noInterference(n)
generateRecombinationDistances_noInterference(n)
n |
Number of distances to generate |
recombination distances in centimorgan
library("sim1000G") mean ( generateRecombinationDistances_noInterference ( 200 ) )
library("sim1000G") mean ( generateRecombinationDistances_noInterference ( 200 ) )
Genetates a recombination vector arising from one meiotic event. The origin of segments is coded as (0 - haplotype1 , 1 - haplotype2 )
generateSingleRecombinationVector(cm)
generateSingleRecombinationVector(cm)
cm |
The length of the region that we want to generate recombination distances. |
library("sim1000G") examples_dir = system.file("examples", package = "sim1000G") vcf_file = file.path(examples_dir, "region.vcf.gz") vcf = readVCF( vcf_file, maxNumberOfVariants = 100 , min_maf = 0.12 ,max_maf = NA) # For realistic data use the function downloadGeneticMap generateUniformGeneticMap() generateSingleRecombinationVector( 1:100 )
library("sim1000G") examples_dir = system.file("examples", package = "sim1000G") vcf_file = file.path(examples_dir, "region.vcf.gz") vcf = readVCF( vcf_file, maxNumberOfVariants = 100 , min_maf = 0.12 ,max_maf = NA) # For realistic data use the function downloadGeneticMap generateUniformGeneticMap() generateSingleRecombinationVector( 1:100 )
Generates a uniform genetic map by approximating 1 cm / Mbp. Only used for examples.
generateUniformGeneticMap()
generateUniformGeneticMap()
library("sim1000G") examples_dir = system.file("examples", package = "sim1000G") vcf_file = sprintf("%s/region.vcf.gz", examples_dir) vcf = readVCF( vcf_file, maxNumberOfVariants = 100 , min_maf = 0.12 ,max_maf = NA) # For realistic data use the function readGeneticMap generateUniformGeneticMap() pdf(file=tempfile()) plotRegionalGeneticMap(seq(1e6,100e6,by=1e6/2)) dev.off()
library("sim1000G") examples_dir = system.file("examples", package = "sim1000G") vcf_file = sprintf("%s/region.vcf.gz", examples_dir) vcf = readVCF( vcf_file, maxNumberOfVariants = 100 , min_maf = 0.12 ,max_maf = NA) # For realistic data use the function readGeneticMap generateUniformGeneticMap() pdf(file=tempfile()) plotRegionalGeneticMap(seq(1e6,100e6,by=1e6/2)) dev.off()
Holds the genetic map information that is used for simulations.
geneticMap
geneticMap
An object of class environment
of length 0.
Converts centimorgan position to base-pair. Return a list of centimorgan positions that correspond to the bp vector (in basepairs).
getCMfromBP(bp)
getCMfromBP(bp)
bp |
vector of base-pair positions |
library("sim1000G") examples_dir = system.file("examples", package = "sim1000G") vcf_file = sprintf("%s/region.vcf.gz", examples_dir) vcf = readVCF( vcf_file, maxNumberOfVariants = 100, min_maf = 0.12) # For realistic data use the function downloadGeneticMap generateUniformGeneticMap() getCMfromBP(seq(1e6,100e6,by=1e6))
library("sim1000G") examples_dir = system.file("examples", package = "sim1000G") vcf_file = sprintf("%s/region.vcf.gz", examples_dir) vcf = readVCF( vcf_file, maxNumberOfVariants = 100, min_maf = 0.12) # For realistic data use the function downloadGeneticMap generateUniformGeneticMap() getCMfromBP(seq(1e6,100e6,by=1e6))
Load some previously saved simulation data by function saveSimulation
loadSimulation(id)
loadSimulation(id)
id |
Name the simulation to load which was previously saved by saveSimulation |
examples_dir = system.file("examples", package = "sim1000G") vcf_file = file.path(examples_dir, "region.vcf.gz") vcf = readVCF( vcf_file, maxNumberOfVariants = 100 , min_maf = 0.12 ,max_maf = NA) # For a realistic genetic map # use the function readGeneticMap generateUniformGeneticMap() startSimulation(vcf, totalNumberOfIndividuals = 200) ped1 = newNuclearFamily(1) saveSimulation("sim1") vcf = readVCF( vcf_file, maxNumberOfVariants = 100 , min_maf = 0.02 ,max_maf = 0.5) startSimulation(vcf, totalNumberOfIndividuals = 200) saveSimulation("sim2") loadSimulation("sim1")
examples_dir = system.file("examples", package = "sim1000G") vcf_file = file.path(examples_dir, "region.vcf.gz") vcf = readVCF( vcf_file, maxNumberOfVariants = 100 , min_maf = 0.12 ,max_maf = NA) # For a realistic genetic map # use the function readGeneticMap generateUniformGeneticMap() startSimulation(vcf, totalNumberOfIndividuals = 200) ped1 = newNuclearFamily(1) saveSimulation("sim1") vcf = readVCF( vcf_file, maxNumberOfVariants = 100 , min_maf = 0.02 ,max_maf = 0.5) startSimulation(vcf, totalNumberOfIndividuals = 200) saveSimulation("sim2") loadSimulation("sim1")
Generates genotype data for a family of 3 generations
newFamily3generations(familyid, noffspring2 = 2, noffspring3 = c(1, 1))
newFamily3generations(familyid, noffspring2 = 2, noffspring3 = c(1, 1))
familyid |
What will be the family_id (for example: 100) |
noffspring2 |
Number of offspring in generation 2 |
noffspring3 |
Number of offspring in generation 3 (vector of length noffspring2) |
family structure object
library("sim1000G") examples_dir = system.file("examples", package = "sim1000G") vcf_file = file.path(examples_dir, "region.vcf.gz") vcf = readVCF( vcf_file, maxNumberOfVariants = 100 , min_maf = 0.12 ,max_maf = NA) generateUniformGeneticMap() startSimulation(vcf, totalNumberOfIndividuals = 200) ped_line = newFamily3generations(12, 3, c(3,3,2) )
library("sim1000G") examples_dir = system.file("examples", package = "sim1000G") vcf_file = file.path(examples_dir, "region.vcf.gz") vcf = readVCF( vcf_file, maxNumberOfVariants = 100 , min_maf = 0.12 ,max_maf = NA) generateUniformGeneticMap() startSimulation(vcf, totalNumberOfIndividuals = 200) ped_line = newFamily3generations(12, 3, c(3,3,2) )
Simulates genotypes for 1 family with n offspring
newFamilyWithOffspring(family_id, noffspring = 2)
newFamilyWithOffspring(family_id, noffspring = 2)
family_id |
What will be the family_id (for example: 100) |
noffspring |
Number of offsprings that this family will have |
family structure object
ped_line = newFamilyWithOffspring(10,3)
ped_line = newFamilyWithOffspring(10,3)
Simulates genotypes for 1 family with 1 offspring
newNuclearFamily(family_id)
newNuclearFamily(family_id)
family_id |
What will be the family_id (for example: 100) |
family structure object
library("sim1000G") examples_dir = system.file("examples", package = "sim1000G") vcf_file = file.path(examples_dir, "region.vcf.gz") vcf = readVCF( vcf_file, maxNumberOfVariants = 100 , min_maf = 0.12 ,max_maf = NA) genetic_map_of_region = system.file("examples", "chr4-geneticmap.txt", package = "sim1000G") readGeneticMapFromFile(genetic_map_of_region) startSimulation(vcf, totalNumberOfIndividuals = 1200) fam1 = newNuclearFamily(1) fam2 = newNuclearFamily(2) # See also the documentation on our github page
library("sim1000G") examples_dir = system.file("examples", package = "sim1000G") vcf_file = file.path(examples_dir, "region.vcf.gz") vcf = readVCF( vcf_file, maxNumberOfVariants = 100 , min_maf = 0.12 ,max_maf = NA) genetic_map_of_region = system.file("examples", "chr4-geneticmap.txt", package = "sim1000G") readGeneticMapFromFile(genetic_map_of_region) startSimulation(vcf, totalNumberOfIndividuals = 1200) fam1 = newNuclearFamily(1) fam2 = newNuclearFamily(2) # See also the documentation on our github page
Holds general package options
pkg.opts
pkg.opts
An object of class environment
of length 1.
The plot shows the centimorgan vs base-pair positions. The position of markers that have been read is also depicted as vertical lines
plotRegionalGeneticMap(bp)
plotRegionalGeneticMap(bp)
bp |
Vector of base-pair positions to generate a plot for library("sim1000G") examples_dir = system.file("examples", package = "sim1000G") vcf_file = sprintf(" vcf = readVCF( vcf_file, maxNumberOfVariants = 100, min_maf = 0.12) # For realistic data use the function readGeneticMap generateUniformGeneticMap() pdf(file=tempfile()) plotRegionalGeneticMap(seq(1e6,100e6,by=1e6/2)) dev.off() |
Utility function that prints a matrix. Useful for IBD12 matrices.
printMatrix(m)
printMatrix(m)
m |
Matrix to be printed |
printMatrix ( matrix(runif(16), nrow=4) )
printMatrix ( matrix(runif(16), nrow=4) )
The map must contains a complete chromosome or enough markers to cover the area that will be simulated.
readGeneticMap(chromosome, filename = NA, dir = NA)
readGeneticMap(chromosome, filename = NA, dir = NA)
chromosome |
Chromosome number to download a genetic map for , or |
filename |
A filename of an existing genetic map to read from (default NA). |
dir |
Directory the map file will be saved (only if chromosome is specified). |
readGeneticMap(chromosome = 22)
readGeneticMap(chromosome = 22)
The file must be contain the following columns in the same order: chromosome, basepaire, rate(not used), centimorgan
readGeneticMapFromFile(filelocation)
readGeneticMapFromFile(filelocation)
filelocation |
Filename containing the genetic map |
## Not run: fname = downloadGeneticMap(10) cat("genetic map downloaded at :", fname, "\n") readGeneticMapFromFile(fname) ## End(Not run)
## Not run: fname = downloadGeneticMap(10) cat("genetic map downloaded at :", fname, "\n") readGeneticMapFromFile(fname) ## End(Not run)
Read a vcf file, with options to filter out low or high frequency markers.
readVCF(filename = "data.vcf", thin = NA, maxNumberOfVariants = 400, min_maf = 0.02, max_maf = NA, region_start = NA, region_end = NA)
readVCF(filename = "data.vcf", thin = NA, maxNumberOfVariants = 400, min_maf = 0.02, max_maf = NA, region_start = NA, region_end = NA)
filename |
Input VCF file |
thin |
How much to thin markers |
maxNumberOfVariants |
Maximum number of variants to keep from region |
min_maf |
Minimum allele frequency of markers to keep. If NA skip min_maf filtering. |
max_maf |
Maximum allele frequency of markers to keep. If NA skip max_maf filtering. |
region_start |
Extract a region from a vcf files with this starting basepair position |
region_end |
Extract a region from a vcf files with this ending basepair position |
VCF object to be used by startSimulation function.
examples_dir = system.file("examples", package = "sim1000G") vcf_file = file.path(examples_dir, "region-chr4-93-TMEM156.vcf.gz") vcf = readVCF( vcf_file, maxNumberOfVariants = 500 , min_maf = 0.02 ,max_maf = NA) str(as.list(vcf))
examples_dir = system.file("examples", package = "sim1000G") vcf_file = file.path(examples_dir, "region-chr4-93-TMEM156.vcf.gz") vcf = readVCF( vcf_file, maxNumberOfVariants = 500 , min_maf = 0.02 ,max_maf = NA) str(as.list(vcf))
Removes all individuals that have been simulated and resets the simulator.
resetSimulation()
resetSimulation()
nothing
resetSimulation()
resetSimulation()
Retrieve a matrix of simulated genotypes for a specific set of individual IDs
retrieveGenotypes(ids)
retrieveGenotypes(ids)
ids |
Vector of ids of individuals to retrieve. |
library("sim1000G") examples_dir = system.file("examples", package = "sim1000G") vcf_file = file.path(examples_dir, "region.vcf.gz") vcf = readVCF( vcf_file, maxNumberOfVariants = 100 , min_maf = 0.12 ,max_maf = NA) # For realistic data use the function downloadGeneticMap generateUniformGeneticMap() startSimulation(vcf, totalNumberOfIndividuals = 200) ped1 = newNuclearFamily(1) retrieveGenotypes(ped1$gtindex)
library("sim1000G") examples_dir = system.file("examples", package = "sim1000G") vcf_file = file.path(examples_dir, "region.vcf.gz") vcf = readVCF( vcf_file, maxNumberOfVariants = 100 , min_maf = 0.12 ,max_maf = NA) # For realistic data use the function downloadGeneticMap generateUniformGeneticMap() startSimulation(vcf, totalNumberOfIndividuals = 200) ped1 = newNuclearFamily(1) retrieveGenotypes(ped1$gtindex)
Save the data for a simulation for later use. When simulating multiple populations it allows saving and restoring of simulation data for each population.
saveSimulation(id)
saveSimulation(id)
id |
Name the simulation will be saved as. |
examples_dir = system.file("examples", package = "sim1000G") vcf_file = file.path(examples_dir, "region.vcf.gz") vcf = readVCF( vcf_file, maxNumberOfVariants = 100 , min_maf = 0.12 ,max_maf = NA) # For realistic data use the functions downloadGeneticMap generateUniformGeneticMap() startSimulation(vcf, totalNumberOfIndividuals = 200) ped1 = newNuclearFamily(1) saveSimulation("sim1")
examples_dir = system.file("examples", package = "sim1000G") vcf_file = file.path(examples_dir, "region.vcf.gz") vcf = readVCF( vcf_file, maxNumberOfVariants = 100 , min_maf = 0.12 ,max_maf = NA) # For realistic data use the functions downloadGeneticMap generateUniformGeneticMap() startSimulation(vcf, totalNumberOfIndividuals = 200) ped1 = newNuclearFamily(1) saveSimulation("sim1")
Set recombination model to either poisson (no interference) or chi-square.
setRecombinationModel(model)
setRecombinationModel(model)
model |
Either "poisson" or "chisq" |
generateUniformGeneticMap() do_plots = 0 setRecombinationModel("chisq") if(do_plots == 1) hist(generateRecombinationDistances(100000),n=200) setRecombinationModel("poisson") if(do_plots == 1) hist(generateRecombinationDistances(100000),n=200)
generateUniformGeneticMap() do_plots = 0 setRecombinationModel("chisq") if(do_plots == 1) hist(generateRecombinationDistances(100000),n=200) setRecombinationModel("poisson") if(do_plots == 1) hist(generateRecombinationDistances(100000),n=200)
Holds data necessary for a simulation.
SIM
SIM
An object of class environment
of length 7.
Starts and initializes the data structures required for a simulation. A VCF file should be read beforehand with the function readVCF.
startSimulation(vcf, totalNumberOfIndividuals = 2000, subset = NA, randomdata = 0, typeOfGeneticMap = "download")
startSimulation(vcf, totalNumberOfIndividuals = 2000, subset = NA, randomdata = 0, typeOfGeneticMap = "download")
vcf |
Input vcf file of a region (can be .gz). Must contain phased data. |
totalNumberOfIndividuals |
Maximum Number of individuals to allocate memory for. Set it above the number of individuals you want to simulate. |
subset |
A subset of individual IDs to use for simulation |
randomdata |
If 1, disregards the genotypes in the vcf file and generates independent markers that are not in LD. |
typeOfGeneticMap |
Specify whether to download a genetic map for this chromosome |
library("sim1000G") library(gplots) examples_dir = system.file("examples", package = "sim1000G") vcf_file = file.path(examples_dir, "region.vcf.gz") vcf = readVCF( vcf_file, maxNumberOfVariants = 100) genetic_map_of_region = system.file( "examples", "chr4-geneticmap.txt", package = "sim1000G" ) readGeneticMapFromFile(genetic_map_of_region) pdf(file=tempfile()) plotRegionalGeneticMap(vcf$vcf[,2]+1) dev.off() startSimulation(vcf, totalNumberOfIndividuals = 200)
library("sim1000G") library(gplots) examples_dir = system.file("examples", package = "sim1000G") vcf_file = file.path(examples_dir, "region.vcf.gz") vcf = readVCF( vcf_file, maxNumberOfVariants = 100) genetic_map_of_region = system.file( "examples", "chr4-geneticmap.txt", package = "sim1000G" ) readGeneticMapFromFile(genetic_map_of_region) pdf(file=tempfile()) plotRegionalGeneticMap(vcf$vcf[,2]+1) dev.off() startSimulation(vcf, totalNumberOfIndividuals = 200)
Generate a market subset of a vcf file
subsetVCF(vcf, var_index = NA, var_id = NA, individual_id = NA)
subsetVCF(vcf, var_index = NA, var_id = NA, individual_id = NA)
vcf |
VCF data as created by function readVCF |
var_index |
index of number to subset. Should be in the range 1..length(vcf$varid) |
var_id |
id of markers to subset. Should be a selection from vcf$varid. NA if no filtering on id to be performed. |
individual_id |
IDs of individuals to subset. Should be a selection from vcf$individual_id |
VCF object to be used by startSimulation function.
examples_dir = system.file("examples", package = "sim1000G") vcf_file = file.path(examples_dir, "region-chr4-93-TMEM156.vcf.gz") vcf = readVCF( vcf_file, maxNumberOfVariants = 500 , min_maf = 0.02 ,max_maf = NA) vcf2 = subsetVCF(vcf, var_index = 1:50)
examples_dir = system.file("examples", package = "sim1000G") vcf_file = file.path(examples_dir, "region-chr4-93-TMEM156.vcf.gz") vcf = readVCF( vcf_file, maxNumberOfVariants = 500 , min_maf = 0.02 ,max_maf = NA) vcf2 = subsetVCF(vcf, var_index = 1:50)
Writes a plink compatible PED/MAP file from the simulated genotypes
writePED(vcf, fam, filename = "out")
writePED(vcf, fam, filename = "out")
vcf |
vcf object used in simulation |
fam |
Individuals / families to be written |
filename |
Basename of output files (.ped/.map will be added automatically) |