本文整理汇总了Java中htsjdk.variant.vcf.VCFCodec类的典型用法代码示例。如果您正苦于以下问题:Java VCFCodec类的具体用法?Java VCFCodec怎么用?Java VCFCodec使用的例子?那么, 这里精选的类代码示例或许可以为您提供帮助。
VCFCodec类属于htsjdk.variant.vcf包,在下文中一共展示了VCFCodec类的15个代码示例,这些例子默认根据受欢迎程度排序。您可以为喜欢或者感觉有用的代码点赞,您的评价将有助于系统推荐出更棒的Java代码示例。
示例1: RODContentProvider
import htsjdk.variant.vcf.VCFCodec; //导入依赖的package包/类
public RODContentProvider(String name, VcfRecordPartition partition, GenomeLocParser genomeLocParser) {
this.name = name;
VCFCodec codec = new VCFCodec();
VCFHeaderLineIterable headerLineIterable = new VCFHeaderLineIterable(partition.vcfHeader());
vcfFileHeader = (VCFHeader) codec.readActualHeader(headerLineIterable);
ArrayList<VariantContext> vcfRecords = new ArrayList<>();
CollectionConverter.asJavaList(partition.records())
.forEach(record -> vcfRecords.add(codec.decode(record.toString())));
//为vcfRecord进行排序
Collections.sort(vcfRecords,
(record1, record2) -> record1.getStart() - record2.getStart());
vcfRecords.forEach(context ->
features.add(new GATKFeature.TribbleGATKFeature(genomeLocParser, context, name)));
}
示例2: getStaticDataInstance
import htsjdk.variant.vcf.VCFCodec; //导入依赖的package包/类
public static StaticData getStaticDataInstance(RefContigInfo refContigInfo,
boolean useGVCF,
SamHeaderInfo samHeaderInfo,
VcfHeaderInfo vcfHeaderInfo) {
StaticData data = new StaticData();
SAMSequenceDictionary samSequenceDictionary = SAMSequenceDictTransfer.transfer(refContigInfo);
data.genomeLocParser = new GenomeLocParser(samSequenceDictionary);
samHeaderInfo.addReadGroupInfo(ReadGroupInfo.apply("rg1", "sample1"));
SAMFileHeader header = SAMHeaderTransfer.transfer(samHeaderInfo);
List<SAMReadGroupRecord> readGroupInfos = header.getReadGroups();
List<String> samples = new ArrayList<>();
for (SAMReadGroupRecord readGroup : readGroupInfos) {
samples.add(readGroup.getSample());
}
data.haplotypeCaller = new HaplotypeCaller(data.genomeLocParser, samples, useGVCF);
data.basic2SAMRecordTransfer = new Basic2SAMRecordTransfer(header);
VCFCodec codec = new VCFCodec();
VCFHeaderLineIterable headerLineIterable = new VCFHeaderLineIterable(vcfHeaderInfo);
data.vcfFileHeader = (VCFHeader) codec.readActualHeader(headerLineIterable);
data.codec = codec;
return data;
}
示例3: toActiveRegionMapData
import htsjdk.variant.vcf.VCFCodec; //导入依赖的package包/类
public ActiveRegionMapData toActiveRegionMapData(GenomeLocParser parser,
Basic2SAMRecordTransfer samTransfer,
VCFHeader vcfFileHeader,
VCFCodec codec) {
List<GATKSAMRecord> gatksamRecords = new ArrayList<>(reads.size());
for (BasicSamRecord record : reads) {
gatksamRecords.add(new GATKSAMRecord(samTransfer.transfer(record)));
}
this.activeRegion.setReads(gatksamRecords);
this.activeRegion.setGenomeLocParser(parser);
List<VariantContext> vcs = new ArrayList<>(rods.size());
for (VcfRecord vcfRecord : rods) {
vcs.add(codec.decode(vcfRecord.toString()));
}
RODContentProvider dbsnpProvider = new RODContentProvider(RODNames.DBSNP, vcfFileHeader, vcs, parser);
RODTraverser traverser = new RODTraverser(dbsnpProvider);
final List<RODRecordList> bindings = new ArrayList<>(1);
bindings.add(traverser.getOverlap(activeRegion.getExtendedLoc()));
RefMetaDataTracker tracker = new RefMetaDataTracker(bindings);
return new ActiveRegionMapData(activeRegion, tracker, fullReferenceWithPadding, refBases);
}
示例4: readVariations
import htsjdk.variant.vcf.VCFCodec; //导入依赖的package包/类
/**
* Reads the variations data from the VCF file and loads it into a track
* @param vcfFile data source
* @param track for loading data
* @param chromosome reference sequence
* @param sampleIndex determines fro which sample from the file variations are loaded
* @param loadInfo if true data from the INFO fields from VCF file will be loaded into the track,
* otherwise it will be ignored
* @return {@code Track} filled with variations from a specified {@code VcfFile}
* @throws VcfReadingException
*/
@Override
public Track<Variation> readVariations(VcfFile vcfFile, final Track<Variation> track, Chromosome chromosome,
final Integer sampleIndex, final boolean loadInfo, final boolean collapse)
throws VcfReadingException {
try (FeatureReader<VariantContext> reader = AbstractFeatureReader.getFeatureReader(vcfFile.getPath(),
vcfFile.getIndex().getPath(), new VCFCodec(), true)) {
if (checkBounds(vcfFile, track, chromosome, loadInfo)) {
return track;
}
try (CloseableIterator<VariantContext> iterator = Utils.query(reader, chromosome.getName(), track
.getStartIndex(), track.getEndIndex())) {
VCFHeader header = (VCFHeader) reader.getHeader();
track.setBlocks(doReadVariations(iterator, track, header, vcfFile, sampleIndex, loadInfo, collapse));
}
} catch (IOException e) {
throw new VcfReadingException(vcfFile, e);
}
return track;
}
示例5: makeVcfReader
import htsjdk.variant.vcf.VCFCodec; //导入依赖的package包/类
/**
* Create a VCFFile reader for given reference and fileName in application's file system, optionally uses index.
*
* @param vcfFile {@code VcfFile} a VcfFile object, representing a file in the system with set id, name and
* compressed options.
* @return {@code VCFFileReader} a reader to work with VCF file
*/
public FeatureReader<VariantContext> makeVcfReader(VcfFile vcfFile) {
File file = new File(vcfFile.getPath());
Assert.isTrue(file.exists(), getMessage(MessagesConstants.ERROR_FILE_NOT_FOUND, vcfFile.getPath()));
FeatureReader<VariantContext> reader;
double time1;
double time2;
if (vcfFile.getIndex() != null && StringUtils.isNotBlank(vcfFile.getIndex().getPath())) {
Assert.notNull(vcfFile.getIndex(), "VCF file should have an index");
File indexFile = new File(vcfFile.getIndex().getPath());
Assert.isTrue(indexFile.exists(), getMessage(MessagesConstants.ERROR_FILE_NOT_FOUND,
vcfFile.getIndex().getPath()));
time1 = Utils.getSystemTimeMilliseconds();
reader = AbstractFeatureReader.getFeatureReader(vcfFile.getPath(), vcfFile.getIndex().getPath(),
new VCFCodec(), true);
time2 = Utils.getSystemTimeMilliseconds();
} else {
time1 = Utils.getSystemTimeMilliseconds();
reader = AbstractFeatureReader.getFeatureReader(vcfFile.getPath(), new VCFCodec(), false);
time2 = Utils.getSystemTimeMilliseconds();
}
LOGGER.debug(getMessage(MessagesConstants.DEBUG_FILE_OPENING, vcfFile.getPath(), time2 - time1));
return reader;
}
示例6: readSingleHeader
import htsjdk.variant.vcf.VCFCodec; //导入依赖的package包/类
public void readSingleHeader(Path vcfPath, Configuration conf) throws IOException {
FileSystem fs = vcfPath.getFileSystem(conf);
if(!fs.exists(vcfPath))
throw new RuntimeException(vcfPath.toString() + " don't exists.");
if(!fs.isFile(vcfPath)) {
throw new RuntimeException(vcfPath.toString() + " is not a file. GaeaSingleVcfHeader parser only support one vcf file.");
}
FSDataInputStream in = fs.open(vcfPath);
AsciiLineReaderIterator it = new AsciiLineReaderIterator(new AsciiLineReader(in));
VCFCodec codec = new VCFCodec();
Object header = codec.readHeader(it);
vcfHeader = (VCFHeader)(((FeatureCodecHeader)header).getHeaderValue());
sampleNames.addAll(vcfHeader.getGenotypeSamples());
buildHeaderInfo();
it.close();
}
示例7: processSV
import htsjdk.variant.vcf.VCFCodec; //导入依赖的package包/类
private static Collection<EligibilityReport> processSV(final String patient, final File vcf, final BachelorEligibility eligibility) {
LOGGER.info("process sv: {}", vcf.getPath());
final StructuralVariantFactory factory = new StructuralVariantFactory();
try {
try (final AbstractFeatureReader<VariantContext, LineIterator> reader = AbstractFeatureReader.getFeatureReader(vcf.getPath(),
new VCFCodec(), false)) {
reader.iterator().forEach(factory::addVariantContext);
}
} catch (IOException e) {
LOGGER.error("error with SV file {}: {}", vcf.getPath(), e.getMessage());
return Collections.emptyList();
}
return eligibility.processStructuralVariants(patient, factory.results());
}
示例8: fromVCFFile
import htsjdk.variant.vcf.VCFCodec; //导入依赖的package包/类
@NotNull
public List<SomaticVariant> fromVCFFile(@NotNull final String sample, @NotNull final String vcfFile) throws IOException {
final List<SomaticVariant> variants = Lists.newArrayList();
try (final AbstractFeatureReader<VariantContext, LineIterator> reader = getFeatureReader(vcfFile, new VCFCodec(), false)) {
final VCFHeader header = (VCFHeader) reader.getHeader();
if (!sampleInFile(sample, header)) {
throw new IllegalArgumentException("Sample " + sample + " not found in vcf file " + vcfFile);
}
if (!header.hasFormatLine("AD")) {
throw new IllegalArgumentException("Allelic depths is a required format field in vcf file " + vcfFile);
}
for (final VariantContext context : reader.iterator()) {
createVariant(sample, context).ifPresent(variants::add);
}
}
return variants;
}
示例9: addLineToIndex
import htsjdk.variant.vcf.VCFCodec; //导入依赖的package包/类
/** Set vcfHeader and vcfCodec to null if reading non-vcf line.
* */
private void addLineToIndex(String line, TabixIndexCreator indexCreator, long filePosition, TabixFormat fmt, VCFHeader vcfHeader, VCFCodec vcfCodec) throws InvalidRecordException {
if(fmt.equals(TabixFormat.BED)){
BedLineCodec bedCodec= new BedLineCodec();
BedLine bed = bedCodec.decode(line);
indexCreator.addFeature(bed, filePosition);
} else if(fmt.equals(TabixFormat.GFF)){
GtfLine gtf= new GtfLine(line.split("\t"));
indexCreator.addFeature(gtf, filePosition);
} else if(fmt.equals(TabixFormat.VCF)) {
VariantContext vcf = vcfCodec.decode(line);
indexCreator.addFeature(vcf, filePosition);
} else {
System.err.println("Unexpected TabixFormat: " + fmt.sequenceColumn + " " + fmt.startPositionColumn);
throw new InvalidRecordException();
}
}
示例10: IntervalFeature
import htsjdk.variant.vcf.VCFCodec; //导入依赖的package包/类
/**
* Create an IntervalFeature from a String. Typically this is a line read from file.
* vcfHeader can be null if trackformat is not VCF.
*/
public IntervalFeature(String line, TrackFormat format, VCFCodec vcfCodec) throws InvalidGenomicCoordsException{
if(format.equals(TrackFormat.BED) || format.equals(TrackFormat.BEDGRAPH) || format.equals(TrackFormat.BIGBED)){
this.intervalFeatureFromBedLine(line);
this.trackFormat= TrackFormat.BED;
} else if(format.equals(TrackFormat.GFF) || format.equals(TrackFormat.GTF)){
this.intervalFeatureFromGtfLine(line);
this.trackFormat= TrackFormat.GFF;
} else if(format.equals(TrackFormat.VCF)) {
this.variantContext= vcfCodec.decode(line);
this.setRaw(line);
this.trackFormat= TrackFormat.VCF;
this.chrom= this.variantContext.getContig();
this.from= this.setFromForVCF();
this.to= this.setToForVCF();
this.name= this.variantContext.getID();
} else {
System.err.println("Format " + format + " not supported");
throw new RuntimeException();
}
}
示例11: canFormatVCFLineStructVar
import htsjdk.variant.vcf.VCFCodec; //导入依赖的package包/类
@Test
public void canFormatVCFLineStructVar() throws InvalidGenomicCoordsException, InvalidColourException, IOException, InvalidConfigException{
List<Double> rulerMap= new ArrayList<Double>();
for(int i= 1; i < 100; i++){
rulerMap.add((double)i);
}
// Prepare header
VCFFileReader reader = new VCFFileReader(new File("test_data/ALL.wgs.mergedSV.v8.20130502.svs.genotypes.vcf.gz"));
VCFHeader vcfHeader= reader.getFileHeader();
reader.close();
VCFCodec vcfCodec= new VCFCodec();
vcfCodec.setVCFHeader(vcfHeader, Utils.getVCFHeaderVersion(vcfHeader));
String vcfLine= "1 668630 DUP_delly_DUP20532 G <CN2> . PASS AC=64;AF=0.0127795;AFR_AF=0.0015;AMR_AF=0;AN=5008;CIEND=-150,150;CIPOS=-150,150;CS=DUP_delly;EAS_AF=0.0595;END=850204;EUR_AF=0.001;IMPRECISE;NS=2504;SAS_AF=0.001;SITEPOST=1;SVTYPE=DUP GT 0|0 0|0 0|0".replaceAll(" ", "\t");
IntervalFeature ift= new IntervalFeature(vcfLine, TrackFormat.VCF, vcfCodec);
ift.mapToScreen(rulerMap);
assertEquals(850204, ift.getTo());
assertEquals("|", ift.getIdeogram(true, true).get(0).format(true));
}
示例12: reindexVcfFile
import htsjdk.variant.vcf.VCFCodec; //导入依赖的package包/类
/**
* Creates a feature index for {@link VcfFile}. If an index already exists, it will be deleted and created
* from scratch
* @param vcfFileId an ID of VCF file to reindex.
* @throws FeatureIndexException if an error occurred while writing index
*/
public VcfFile reindexVcfFile(long vcfFileId) throws FeatureIndexException {
VcfFile vcfFile = vcfFileManager.loadVcfFile(vcfFileId);
Reference reference = referenceGenomeManager.loadReferenceGenome(vcfFile.getReferenceId());
Map<String, Chromosome> chromosomeMap = reference.getChromosomes().stream().collect(
Collectors.toMap(BaseEntity::getName, chromosome -> chromosome));
List<GeneFile> geneFiles = reference.getGeneFile() != null ?
Collections.singletonList(reference.getGeneFile()) :
Collections.emptyList();
try {
fileManager.deleteFileFeatureIndex(vcfFile);
try (FeatureReader<VariantContext> reader = AbstractFeatureReader.getFeatureReader(vcfFile.getPath(),
new VCFCodec(), false)) {
VcfFilterInfo info = getFiltersInfo(reader);
featureIndexManager.makeIndexForVcfReader(vcfFile, reader, geneFiles, chromosomeMap, info);
}
} catch (IOException e) {
throw new FeatureIndexException(vcfFile, e);
}
return vcfFile;
}
示例13: createVcfFromUrl
import htsjdk.variant.vcf.VCFCodec; //导入依赖的package包/类
private VcfFile createVcfFromUrl(final IndexedFileRegistrationRequest request,
final Map<String, Chromosome> chromosomeMap, Reference reference) {
final VcfFile vcfFile;
try (FeatureReader<VariantContext> reader = AbstractFeatureReader.getFeatureReader(request.getPath(),
request.getIndexPath(), new VCFCodec(), true)) {
vcfFile = createVcfFile(request, reader);
boolean hasVariations = false;
for (Map.Entry<String, Chromosome> chrEntry : chromosomeMap.entrySet()) {
CloseableIterator<VariantContext> iterator = Utils.query(reader, chrEntry.getKey(), 1,
chrEntry.getValue().getSize());
if (iterator.hasNext()) {
hasVariations = true;
break;
}
}
Assert.isTrue(hasVariations, getMessage(MessagesConstants.ERROR_FILE_CORRUPTED_OR_EMPTY, request.getPath(),
reference.getName()));
} catch (IOException e) {
throw new RegistrationException(getMessage(ERROR_REGISTER_FILE, request.getName()), e);
}
biologicalDataItemManager.createBiologicalDataItem(vcfFile.getIndex());
vcfFileManager.createVcfFile(vcfFile);
return vcfFile;
}
示例14: serialisationTest
import htsjdk.variant.vcf.VCFCodec; //导入依赖的package包/类
@Test
public void serialisationTest() throws IOException, ClassNotFoundException {
Resource resource = context.getResource("classpath:templates/samples.vcf");
List<VcfIndexEntry> writtenEntries = new ArrayList<>();
List<VcfIndexEntry> diskBasedList = new DiskBasedList<VcfIndexEntry>(MAX_IN_MEMORY_ITEMS_COUNT).adaptToList();
try (FeatureReader<VariantContext> reader = AbstractFeatureReader
.getFeatureReader(resource.getFile().getAbsolutePath(), new VCFCodec(), false)
) {
for (VariantContext variantContext : reader.iterator()) {
VcfIndexEntry vcfIndexEntry = createTestEntry(variantContext);
writtenEntries.add(vcfIndexEntry);
diskBasedList.add(vcfIndexEntry);
}
}
for (int i = 0; i < 3; i++) {
assertLists(writtenEntries, diskBasedList);
}
}
示例15: testVariantAdapter
import htsjdk.variant.vcf.VCFCodec; //导入依赖的package包/类
@Test(dataProvider = "VariantDataProvider")
public void testVariantAdapter(final List<Variant> expectedVariantList) {
// The test suite for reading in VCF files is FeatureDataSourceUnitTest.
try (FeatureDataSource<VariantContext> featureSource = new FeatureDataSource<>(QUERY_TEST_VCF, new VCFCodec())) {
List<Variant> variantList = new ArrayList<>();
for (VariantContext feature : featureSource) {
VariantContextVariantAdapter va = new VariantContextVariantAdapter(feature);
variantList.add(va);
}
// Now, test to see that every variant is in in the expected set.
Assert.assertEquals(variantList.size(), expectedVariantList.size());
for (Variant v : variantList) {
boolean matchFound = false;
for (Variant vv : expectedVariantList) {
if (VariantUtils.variantsAreEqual(v, vv)) {
matchFound = true;
}
}
Assert.assertTrue(matchFound, v.toString());
}
}
}