Skip to content

Commit

Permalink
Truncated main workflow (#638)
Browse files Browse the repository at this point in the history
* Add options to truncate sequences from main workflow

* Update gitignore

* Fill missing lineage/clade values before DB push
  • Loading branch information
atc3 authored Jan 17, 2024
1 parent c389d1e commit 2b208d3
Show file tree
Hide file tree
Showing 16 changed files with 440 additions and 4 deletions.
7 changes: 5 additions & 2 deletions .gitignore
Original file line number Diff line number Diff line change
Expand Up @@ -98,6 +98,8 @@ data_flu/**
data_gisaid_flu/**
data_gisaid_rsv/**
data_genbank_rsv/**
data_6month
data_6month/**

# Ignore server passwords
server/htpasswd
Expand All @@ -108,7 +110,8 @@ daily_update.sh
daily_update_new.sh
daily_update_rsv.sh
daily_update_sars2_genbank.sh
daily_update_sars2_gisaid.sh
daily_update_sars2_gisaid_full.sh
daily_update_sars2_gisaid_6month.sh
update_gisaid.sh
update_genbank.sh
filter_list.txt
Expand Down Expand Up @@ -143,4 +146,4 @@ data_flu_small/**
workflow_main/notebooks/**

# SnapGene - temp files
static_data/flu/alignments/.sglock/**
static_data/flu/alignments/.sglock/**
14 changes: 14 additions & 0 deletions config/config_flu_genbank.yaml
Original file line number Diff line number Diff line change
Expand Up @@ -36,6 +36,20 @@ chunk_size: 10000
# ANALYSIS
# --------------------

# Don't process sequences prior to this date
# Leave empty to ignore
start_date_cutoff:
# Don't process sequences after this date
# Leave empty to ignore
end_date_cutoff:

# Don't process sequences prior to X days ago
# Leave empty to ignore
start_date_cutoff_days_ago:
# Don't process sequences after X days ago
# Leave empty to ignore
end_date_cutoff_days_ago:

segments: ["1", "2", "3", "4", "5", "6", "7", "8"]

# Insertions or deletions with more than this difference in bases between the
Expand Down
14 changes: 14 additions & 0 deletions config/config_flu_gisaid.yaml
Original file line number Diff line number Diff line change
Expand Up @@ -32,6 +32,20 @@ chunk_size: 10000
# ANALYSIS
# --------------------

# Don't process sequences prior to this date
# Leave empty to ignore
start_date_cutoff:
# Don't process sequences after this date
# Leave empty to ignore
end_date_cutoff:

# Don't process sequences prior to X days ago
# Leave empty to ignore
start_date_cutoff_days_ago:
# Don't process sequences after X days ago
# Leave empty to ignore
end_date_cutoff_days_ago:

segments: ["1", "2", "3", "4", "5", "6", "7", "8"]

# Insertions or deletions with more than this difference in bases between the
Expand Down
14 changes: 14 additions & 0 deletions config/config_flu_gisaid_dev.yaml
Original file line number Diff line number Diff line change
Expand Up @@ -32,6 +32,20 @@ chunk_size: 10000
# ANALYSIS
# --------------------

# Don't process sequences prior to this date
# Leave empty to ignore
start_date_cutoff:
# Don't process sequences after this date
# Leave empty to ignore
end_date_cutoff:

# Don't process sequences prior to X days ago
# Leave empty to ignore
start_date_cutoff_days_ago:
# Don't process sequences after X days ago
# Leave empty to ignore
end_date_cutoff_days_ago:

segments: ["1", "2", "3", "4", "5", "6", "7", "8"]

# Insertions or deletions with more than this difference in bases between the
Expand Down
14 changes: 14 additions & 0 deletions config/config_rsv_custom.yaml
Original file line number Diff line number Diff line change
Expand Up @@ -31,6 +31,20 @@ chunk_size: 100000
# ANALYSIS
# --------------------

# Don't process sequences prior to this date
# Leave empty to ignore
start_date_cutoff:
# Don't process sequences after this date
# Leave empty to ignore
end_date_cutoff:

# Don't process sequences prior to X days ago
# Leave empty to ignore
start_date_cutoff_days_ago:
# Don't process sequences after X days ago
# Leave empty to ignore
end_date_cutoff_days_ago:

segments: ["1"]

# Insertions or deletions with more than this difference in bases between the
Expand Down
14 changes: 14 additions & 0 deletions config/config_rsv_genbank.yaml
Original file line number Diff line number Diff line change
Expand Up @@ -36,6 +36,20 @@ chunk_size: 100000
# ANALYSIS
# --------------------

# Don't process sequences prior to this date
# Leave empty to ignore
start_date_cutoff:
# Don't process sequences after this date
# Leave empty to ignore
end_date_cutoff:

# Don't process sequences prior to X days ago
# Leave empty to ignore
start_date_cutoff_days_ago:
# Don't process sequences after X days ago
# Leave empty to ignore
end_date_cutoff_days_ago:

segments: ["1"]

# Insertions or deletions with more than this difference in bases between the
Expand Down
14 changes: 14 additions & 0 deletions config/config_sars2_alpha.yaml
Original file line number Diff line number Diff line change
Expand Up @@ -31,6 +31,20 @@ chunk_size: 100000
# ANALYSIS
# --------------------

# Don't process sequences prior to this date
# Leave empty to ignore
start_date_cutoff:
# Don't process sequences after this date
# Leave empty to ignore
end_date_cutoff:

# Don't process sequences prior to X days ago
# Leave empty to ignore
start_date_cutoff_days_ago:
# Don't process sequences after X days ago
# Leave empty to ignore
end_date_cutoff_days_ago:

segments: ["1"]

# Insertions or deletions with more than this difference in bases between the
Expand Down
14 changes: 14 additions & 0 deletions config/config_sars2_custom.yaml
Original file line number Diff line number Diff line change
Expand Up @@ -31,6 +31,20 @@ chunk_size: 100000
# ANALYSIS
# --------------------

# Don't process sequences prior to this date
# Leave empty to ignore
start_date_cutoff:
# Don't process sequences after this date
# Leave empty to ignore
end_date_cutoff:

# Don't process sequences prior to X days ago
# Leave empty to ignore
start_date_cutoff_days_ago:
# Don't process sequences after X days ago
# Leave empty to ignore
end_date_cutoff_days_ago:

segments: ["1"]

# Insertions or deletions with more than this difference in bases between the
Expand Down
14 changes: 14 additions & 0 deletions config/config_sars2_genbank.yaml
Original file line number Diff line number Diff line change
Expand Up @@ -35,6 +35,20 @@ chunk_size: 100000
# ANALYSIS
# --------------------

# Don't process sequences prior to this date
# Leave empty to ignore
start_date_cutoff:
# Don't process sequences after this date
# Leave empty to ignore
end_date_cutoff:

# Don't process sequences prior to X days ago
# Leave empty to ignore
start_date_cutoff_days_ago:
# Don't process sequences after X days ago
# Leave empty to ignore
end_date_cutoff_days_ago:

segments: ["1"]

# Insertions or deletions with more than this difference in bases between the
Expand Down
14 changes: 14 additions & 0 deletions config/config_sars2_genbank_dev.yaml
Original file line number Diff line number Diff line change
Expand Up @@ -36,6 +36,20 @@ chunk_size: 100000
# ANALYSIS
# --------------------

# Don't process sequences prior to this date
# Leave empty to ignore
start_date_cutoff:
# Don't process sequences after this date
# Leave empty to ignore
end_date_cutoff:

# Don't process sequences prior to X days ago
# Leave empty to ignore
start_date_cutoff_days_ago:
# Don't process sequences after X days ago
# Leave empty to ignore
end_date_cutoff_days_ago:

segments: ["1"]

# Insertions or deletions with more than this difference in bases between the
Expand Down
14 changes: 14 additions & 0 deletions config/config_sars2_gisaid.yaml
Original file line number Diff line number Diff line change
Expand Up @@ -31,6 +31,20 @@ chunk_size: 100000
# ANALYSIS
# --------------------

# Don't process sequences prior to this date
# Leave empty to ignore
start_date_cutoff:
# Don't process sequences after this date
# Leave empty to ignore
end_date_cutoff:

# Don't process sequences prior to X days ago
# Leave empty to ignore
start_date_cutoff_days_ago:
# Don't process sequences after X days ago
# Leave empty to ignore
end_date_cutoff_days_ago:

segments: ["1"]

# Insertions or deletions with more than this difference in bases between the
Expand Down
Loading

0 comments on commit 2b208d3

Please sign in to comment.