Skip to content

The Structure of a Search Strategies File

Karolis Ramanauskas edited this page Aug 14, 2023 · 8 revisions
[T2-RNases]
# nucleus, plastid, mitochondrion
# Note: use nucleus for non-eukaryotes.
organelle = nucleus

# Length in Amino Acids
min_query_length = 175
max_query_length = 350

max_query_identity = 0.80

# Length in Nucleotides
min_target_orf_length = 500
max_target_orf_length = 1200

# BLAST assemblies
evalue = 1e-20
max_hsps = 4
qcov_hsp_perc = 70
best_hit_overhang = 0.15
best_hit_score_edge = 0.15
max_target_seqs = 500

# Pfam families
pfam_families =

# NCBI protein accessions
ncbi_accessions_aa =

# NCBI Entrez search queries
entrez_search_queries = ("Ribonuclease T2"[Title] OR "RNase T2"[Title] OR "S-RNase"[Title]) AND (200[SLEN]:350[SLEN]) AND Eudicots[Organism] NOT (partial OR putative OR predicted OR "binding protein" OR thioredoxin)

# FASTA files (Amino Acid)
fasta_files_aa = input/T2-RNases.fasta

# -----------------------------------------------------------------------------

[F-boxes]
# nucleus, plastid, mitochondrion
# Note: use nucleus for non-eukaryotes.
organelle = nucleus

# Length in Amino Acids
min_query_length = 340
max_query_length = 450

max_query_identity = 0.99

# Length in Nucleotides
min_target_orf_length = 800
max_target_orf_length = 1500

# BLAST assemblies
evalue = 1e-20
max_hsps = 4
qcov_hsp_perc = 85
best_hit_overhang = 0.2
best_hit_score_edge = 0.1
max_target_seqs = 500

# Pfam families
pfam_families =

# NCBI protein accessions
ncbi_accessions_aa =

# NCBI Entrez search queries
entrez_search_queries = ("S-locus F-box" OR "S locus F-box" OR "S-haplotype-specific" OR "SLF" OR "SLFL" OR "SFB" OR "SFBB") AND (340[SLEN]:450[SLEN]) AND eudicotyledons[Organism] NOT (predicted[Title] OR partial OR putative OR hypothetical OR "non-S")

# FASTA files (Amino Acid)
fasta_files_aa = input/F-boxes.fasta

# -----------------------------------------------------------------------------

[RubisCO-SSU]
# nucleus, plastid, mitochondrion
# Note: use nucleus for non-eukaryotes.
organelle = nucleus

# Length in Amino Acids
min_query_length = 150
max_query_length = 200

max_query_identity = 0.80

# Length in Nucleotides
min_target_orf_length = 500
max_target_orf_length = 600

# BLAST assemblies
evalue = 1e-20
max_hsps = 4
qcov_hsp_perc = 70
best_hit_overhang = 0.15
best_hit_score_edge = 0.15
max_target_seqs = 500

# Pfam families
pfam_families =

# NCBI protein accessions
ncbi_accessions_aa =

# NCBI Entrez search queries
entrez_search_queries =

# FASTA files (Amino Acid)
fasta_files_aa = input/rubisco_ssu.fasta

# -----------------------------------------------------------------------------

[Elong-factor-1-alpha]
# nucleus, plastid, mitochondrion
# Note: use nucleus for non-eukaryotes.
organelle = nucleus

# Length in Amino Acids
min_query_length = 430
max_query_length = 460

max_query_identity = 0.80

# Length in Nucleotides
min_target_orf_length = 1250
max_target_orf_length = 1400

# BLAST assemblies
evalue = 1e-20
max_hsps = 4
qcov_hsp_perc = 70
best_hit_overhang = 0.15
best_hit_score_edge = 0.15
max_target_seqs = 500

# Pfam families
pfam_families =

# NCBI protein accessions
ncbi_accessions_aa =

# NCBI Entrez search queries
entrez_search_queries =

# FASTA files (Amino Acid)
fasta_files_aa = input/elong_factor_1_alpha.fasta

# -----------------------------------------------------------------------------

[Alpha-tubulin]
# nucleus, plastid, mitochondrion
# Note: use nucleus for non-eukaryotes.
organelle = nucleus

# Length in Amino Acids
min_query_length = 430
max_query_length = 460

max_query_identity = 0.80

# Length in Nucleotides
min_target_orf_length = 1250
max_target_orf_length = 1400

# BLAST assemblies
evalue = 1e-20
max_hsps = 4
qcov_hsp_perc = 70
best_hit_overhang = 0.15
best_hit_score_edge = 0.15
max_target_seqs = 500

# Pfam families
pfam_families =

# NCBI protein accessions
ncbi_accessions_aa =

# NCBI Entrez search queries
entrez_search_queries =

# FASTA files (Amino Acid)
fasta_files_aa = input/alpha_tubulin.fasta

# -----------------------------------------------------------------------------

[Actin]
# nucleus, plastid, mitochondrion
# Note: use nucleus for non-eukaryotes.
organelle = nucleus

# Length in Amino Acids
min_query_length = 350
max_query_length = 390

max_query_identity = 0.80

# Length in Nucleotides
min_target_orf_length = 1050
max_target_orf_length = 1200

# BLAST assemblies
evalue = 1e-20
max_hsps = 4
qcov_hsp_perc = 70
best_hit_overhang = 0.15
best_hit_score_edge = 0.15
max_target_seqs = 500

# Pfam families
pfam_families =

# NCBI protein accessions
ncbi_accessions_aa =

# NCBI Entrez search queries
entrez_search_queries =

# FASTA files (Amino Acid)
fasta_files_aa = input/actin.fasta

# -----------------------------------------------------------------------------

[GLO]
# nucleus, plastid, mitochondrion
# Note: use nucleus for non-eukaryotes.
organelle = nucleus

# Length in Amino Acids
min_query_length = 180
max_query_length = 220

max_query_identity = 0.95

# Length in Nucleotides
min_target_orf_length = 500
max_target_orf_length = 900

# BLAST assemblies
evalue = 1e-20
max_hsps = 4
qcov_hsp_perc = 80
best_hit_overhang = 0.2
best_hit_score_edge = 0.1
max_target_seqs = 500

# Pfam families
pfam_families =

# NCBI protein accessions
ncbi_accessions_aa =

# NCBI Entrez search queries
entrez_search_queries =

# FASTA files (Amino Acid)
fasta_files_aa = input/GLO.fasta

# -----------------------------------------------------------------------------

[CYP]
# nucleus, plastid, mitochondrion
# Note: use nucleus for non-eukaryotes.
organelle = nucleus

# Length in Amino Acids
min_query_length = 340
max_query_length = 600

max_query_identity = 0.95

# Length in Nucleotides
min_target_orf_length = 1000
max_target_orf_length = 2000

# BLAST assemblies
evalue = 1e-20
max_hsps = 4
qcov_hsp_perc = 80
best_hit_overhang = 0.2
best_hit_score_edge = 0.1
max_target_seqs = 500

# Pfam families
pfam_families =

# NCBI protein accessions
ncbi_accessions_aa =

# NCBI Entrez search queries
entrez_search_queries =

# FASTA files (Amino Acid)
fasta_files_aa = input/CYP.fasta
Clone this wiki locally