|
13 | 13 |
|
14 | 14 | # Set any default paths and constants
|
15 | 15 | my ( $tumor_id, $normal_id ) = ( "TUMOR", "NORMAL" );
|
16 |
| -my ( $vep_path, $vep_data, $vep_forks, $buffer_size, $any_allele, $inhibit_vep, $online ) = ( "$ENV{HOME}/vep", "$ENV{HOME}/.vep", 4, 5000, 0, 0, 0 ); |
17 |
| -my ( $ref_fasta, $filter_vcf ) = ( "$ENV{HOME}/.vep/homo_sapiens/95_GRCh37/Homo_sapiens.GRCh37.75.dna.primary_assembly.fa.gz", "$ENV{HOME}/.vep/ExAC_nonTCGA.r0.3.1.sites.vep.vcf.gz" ); |
| 16 | +my ( $vep_path, $vep_data, $vep_forks, $buffer_size, $any_allele, $inhibit_vep, $online ) = ( "$ENV{HOME}/miniconda3/bin", "$ENV{HOME}/.vep", 4, 5000, 0, 0, 0 ); |
| 17 | +my ( $ref_fasta, $filter_vcf ) = ( "$ENV{HOME}/.vep/homo_sapiens/101_GRCh37/Homo_sapiens.GRCh37.dna.toplevel.fa.gz", "" ); |
18 | 18 | my ( $species, $ncbi_build, $cache_version, $maf_center, $retain_info, $retain_fmt, $min_hom_vaf, $max_filter_ac ) = ( "homo_sapiens", "GRCh37", "", ".", "", "", 0.7, 10 );
|
19 | 19 | my $perl_bin = $Config{perlpath};
|
20 | 20 |
|
@@ -392,8 +392,7 @@ sub GetBiotypePriority {
|
392 | 392 | # ::NOTE:: If input had no variants, don't break here, so we can continue to create an empty MAF
|
393 | 393 | ( !@regions_split or %flanking_bps ) or die "ERROR: You're either using an outdated samtools, or --ref-fasta is not the same genome build as your --input-vcf.";
|
394 | 394 |
|
395 |
| -# Skip filtering if not handling GRCh37, and filter-vcf is pointing to the default GRCh37 ExAC VCF |
396 |
| -if(( $species eq "homo_sapiens" and $ncbi_build eq "GRCh37" and $filter_vcf ) or ( $filter_vcf and $filter_vcf ne "$ENV{HOME}/.vep/ExAC_nonTCGA.r0.3.1.sites.vep.vcf.gz" )) { |
| 395 | +if( $filter_vcf ) { |
397 | 396 | ( -s $filter_vcf ) or die "ERROR: Provided --filter-vcf is missing or empty: $filter_vcf\n";
|
398 | 397 | # Query each variant locus on the filter VCF, using tabix, just like we used samtools earlier
|
399 | 398 | ( $lines, @regions_split ) = ( "", ());
|
@@ -436,7 +435,7 @@ sub GetBiotypePriority {
|
436 | 435 | warn "STATUS: Running VEP and writing to: $output_vcf\n";
|
437 | 436 | # Make sure we can find the VEP script
|
438 | 437 | my $vep_script = ( -s "$vep_path/vep" ? "$vep_path/vep" : "$vep_path/variant_effect_predictor.pl" );
|
439 |
| - ( -s $vep_script ) or die "ERROR: Cannot find VEP script in path: $vep_path\n"; |
| 438 | + ( -s $vep_script ) or die "ERROR: Cannot find VEP script under: $vep_path\n"; |
440 | 439 |
|
441 | 440 | # Contruct VEP command using some default options and run it
|
442 | 441 | my $vep_cmd = "$perl_bin $vep_script --species $species --assembly $ncbi_build --no_progress --no_stats --buffer_size $buffer_size --sift b --ccds --uniprot --hgvs --symbol --numbers --domains --gene_phenotype --canonical --protein --biotype --uniprot --tsl --variant_class --shift_hgvs 1 --check_existing --total_length --allele_number --no_escape --xref_refseq --failed 1 --vcf --flag_pick_allele --pick_order canonical,tsl,biotype,rank,ccds,length --dir $vep_data --fasta $ref_fasta --format vcf --input_file $input_vcf --output_file $output_vcf";
|
@@ -1136,12 +1135,12 @@ =head1 OPTIONS
|
1136 | 1135 | --any-allele When reporting co-located variants, allow mismatched variant alleles too
|
1137 | 1136 | --inhibit-vep Skip running VEP, but extract VEP annotation in VCF if found
|
1138 | 1137 | --online Use useastdb.ensembl.org instead of local cache (supports only GRCh38 VCFs listing <100 events)
|
1139 |
| - --ref-fasta Reference FASTA file [~/.vep/homo_sapiens/95_GRCh37/Homo_sapiens.GRCh37.75.dna.primary_assembly.fa.gz] |
1140 |
| - --filter-vcf A VCF for FILTER tag common_variant. Set to 0 to disable [~/.vep/ExAC_nonTCGA.r0.3.1.sites.vep.vcf.gz] |
| 1138 | + --ref-fasta Reference FASTA file [~/.vep/homo_sapiens/101_GRCh37/Homo_sapiens.GRCh37.dna.toplevel.fa.gz] |
| 1139 | + --filter-vcf A VCF for FILTER tag common_variant; Disabled by default [] |
1141 | 1140 | --max-filter-ac Use tag common_variant if the filter-vcf reports a subpopulation AC higher than this [10]
|
1142 | 1141 | --species Ensembl-friendly name of species (e.g. mus_musculus for mouse) [homo_sapiens]
|
1143 | 1142 | --ncbi-build NCBI reference assembly of variants MAF (e.g. GRCm38 for mouse) [GRCh37]
|
1144 |
| - --cache-version Version of offline cache to use with VEP (e.g. 75, 84, 91) [Default: Installed version] |
| 1143 | + --cache-version Version of offline cache to use with VEP (e.g. 75, 91, 101) [Default: Installed version] |
1145 | 1144 | --maf-center Variant calling center to report in MAF [.]
|
1146 | 1145 | --retain-info Comma-delimited names of INFO fields to retain as extra columns in MAF []
|
1147 | 1146 | --retain-fmt Comma-delimited names of FORMAT fields to retain as extra columns in MAF []
|
|
0 commit comments