-
Notifications
You must be signed in to change notification settings - Fork 3
Commit
This commit does not belong to any branch on this repository, and may belong to a fork outside of the repository.
changing model directories for testing
- Loading branch information
Borbála Farkas
authored and
Borbála Farkas
committed
Oct 28, 2024
1 parent
b6821a3
commit 7fdf35d
Showing
41 changed files
with
165 additions
and
1,577 deletions.
There are no files selected for viewing
This file contains bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters
Original file line number | Diff line number | Diff line change |
---|---|---|
@@ -0,0 +1,41 @@ | ||
from viewser import Queryset, Column | ||
|
||
def generate(): | ||
""" | ||
Contains the configuration for the input data in the form of a viewser queryset. That is the data from viewser that is used to train the model. | ||
This configuration is "behavioral" so modifying it will affect the model's runtime behavior and integration into the deployment system. | ||
There is no guarantee that the model will work if the input data configuration is changed here without changing the model settings and algorithm accordingly. | ||
Returns: | ||
- queryset_base (Queryset): A queryset containing the base data for the model training. | ||
""" | ||
|
||
# VIEWSER 6, Example configuration. Modify as needed. | ||
|
||
queryset_base = (Queryset("caring_fish", "priogrid_month") | ||
# Create a new column 'ln_sb_best' using data from 'priogrid_month' and 'ged_sb_best_count_nokgi' column | ||
# Apply logarithmic transformation, handle missing values by replacing them with NA | ||
.with_column(Column("ln_sb_best", from_loa="priogrid_month", from_column="ged_sb_best_count_nokgi") | ||
.transform.ops.ln().transform.missing.replace_na()) | ||
|
||
# Create a new column 'ln_ns_best' using data from 'priogrid_month' and 'ged_ns_best_count_nokgi' column | ||
# Apply logarithmic transformation, handle missing values by replacing them with NA | ||
.with_column(Column("ln_ns_best", from_loa="priogrid_month", from_column="ged_ns_best_count_nokgi") | ||
.transform.ops.ln().transform.missing.replace_na()) | ||
|
||
# Create a new column 'ln_os_best' using data from 'priogrid_month' and 'ged_os_best_count_nokgi' column | ||
# Apply logarithmic transformation, handle missing values by replacing them with NA | ||
.with_column(Column("ln_os_best", from_loa="priogrid_month", from_column="ged_os_best_count_nokgi") | ||
.transform.ops.ln().transform.missing.replace_na()) | ||
|
||
# Create columns for month and year_id | ||
.with_column(Column("month", from_loa="month", from_column="month")) | ||
.with_column(Column("year_id", from_loa="country_year", from_column="year_id")) | ||
|
||
# Create columns for country_id, col, and row | ||
.with_column(Column("c_id", from_loa="country_year", from_column="country_id")) | ||
.with_column(Column("col", from_loa="priogrid", from_column="col")) | ||
.with_column(Column("row", from_loa="priogrid", from_column="row")) | ||
) | ||
|
||
return queryset_base |
This file contains bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters
Original file line number | Diff line number | Diff line change |
---|---|---|
@@ -0,0 +1,3 @@ | ||
# Model README | ||
## Model name: caring_fish | ||
## Created on: 2024-10-28 16:45:11.931747 |
This file contains bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters
Original file line number | Diff line number | Diff line change |
---|---|---|
@@ -0,0 +1,20 @@ | ||
""" | ||
Deployment Configuration Script | ||
This script defines the deployment configuration settings for the application. | ||
It includes the deployment status and any additional settings specified. | ||
Deployment Status: | ||
- shadow: The deployment is shadowed and not yet active. | ||
- deployed: The deployment is active and in use. | ||
- baseline: The deployment is in a baseline state, for reference or comparison. | ||
- deprecated: The deployment is deprecated and no longer supported. | ||
Additional settings can be included in the configuration dictionary as needed. | ||
""" | ||
|
||
def get_deployment_config(): | ||
# Deployment settings | ||
deployment_config = {'deployment_status': 'shadow'} | ||
return deployment_config |
This file contains bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters
Original file line number | Diff line number | Diff line change |
---|---|---|
@@ -0,0 +1,14 @@ | ||
def get_hp_config(): | ||
""" | ||
Contains the hyperparameter configurations for model training. | ||
This configuration is "operational" so modifying these settings will impact the model's behavior during the training. | ||
Returns: | ||
- hyperparameters (dict): A dictionary containing hyperparameters for training the model, which determine the model's behavior during the training phase. | ||
""" | ||
|
||
hyperparameters = { | ||
'model': 'LightBGM', # The model algorithm used. Eg. "LSTM", "CNN", "Transformer" | ||
# Add more hyperparameters as needed | ||
} | ||
return hyperparameters |
This file contains bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters
Original file line number | Diff line number | Diff line change |
---|---|---|
@@ -0,0 +1,19 @@ | ||
def get_meta_config(): | ||
""" | ||
Contains the meta data for the model (model algorithm, name, target variable, and level of analysis). | ||
This config is for documentation purposes only, and modifying it will not affect the model, the training, or the evaluation. | ||
Returns: | ||
- meta_config (dict): A dictionary containing model meta configuration. | ||
""" | ||
|
||
meta_config = { | ||
"name": "caring_fish", # Eg. happy_kitten | ||
"algorithm": "LightBGM", # Eg. "LSTM", "CNN", "Transformer" | ||
# Uncomment and modify the following lines as needed for additional metadata: | ||
# "target(S)": ["ln_sb_best", "ln_ns_best", "ln_os_best", "ln_sb_best_binarized", "ln_ns_best_binarized", "ln_os_best_binarized"], | ||
"queryset": "escwa001_cflong", | ||
# "level": "pgm", | ||
# "creator": "Your name here" | ||
} | ||
return meta_config |
This file contains bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters
Original file line number | Diff line number | Diff line change |
---|---|---|
@@ -0,0 +1,29 @@ | ||
def get_sweep_config(): | ||
""" | ||
Contains the configuration for hyperparameter sweeps using WandB. | ||
This configuration is "operational" so modifying it will change the search strategy, parameter ranges, and other settings for hyperparameter tuning aimed at optimizing model performance. | ||
Returns: | ||
- sweep_config (dict): A dictionary containing the configuration for hyperparameter sweeps, defining the methods and parameter ranges used to search for optimal hyperparameters. | ||
""" | ||
|
||
sweep_config = { | ||
'method': 'grid', | ||
} | ||
|
||
# Example metric setup: | ||
metric = { | ||
'name': 'MSE', | ||
'goal': 'minimize' | ||
} | ||
sweep_config['metric'] = metric | ||
|
||
# Example parameters setup: | ||
parameters_dict = { | ||
'model': { | ||
'value': 'LightBGM' # Eg. "LSTM", "CNN", "Transformer" | ||
}, | ||
} | ||
sweep_config['parameters'] = parameters_dict | ||
|
||
return sweep_config |
This file contains bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters
Original file line number | Diff line number | Diff line change |
---|---|---|
@@ -0,0 +1,39 @@ | ||
import time | ||
import wandb | ||
import sys | ||
import logging | ||
logging.basicConfig(filename='run.log', encoding='utf-8', level=logging.INFO, | ||
format='%(asctime)s - %(levelname)s - %(message)s') | ||
logger = logging.getLogger(__name__) | ||
from pathlib import Path | ||
# Set up the path to include common_utils module | ||
PATH = Path(__file__) | ||
sys.path.insert(0, str(Path( | ||
*[i for i in PATH.parts[:PATH.parts.index("views_pipeline") + 1]]) / "common_utils")) # PATH_COMMON_UTILS | ||
# Import necessary functions for project setup and model execution | ||
from set_path import setup_project_paths | ||
setup_project_paths(PATH) | ||
from utils_cli_parser import parse_args, validate_arguments | ||
from execute_model_runs import execute_sweep_run, execute_single_run | ||
|
||
if __name__ == "__main__": | ||
# Parse command-line arguments | ||
args = parse_args() | ||
|
||
# Validate the arguments to ensure they are correct | ||
validate_arguments(args) | ||
# Log in to Weights & Biases (wandb) | ||
wandb.login() | ||
# Record the start time | ||
start_t = time.time() | ||
# Execute the model run based on the sweep flag | ||
if args.sweep: | ||
execute_sweep_run(args) # Execute sweep run | ||
else: | ||
execute_single_run(args) # Execute single run | ||
# Record the end time | ||
end_t = time.time() | ||
|
||
# Calculate and print the runtime in minutes | ||
minutes = (end_t - start_t) / 60 | ||
logger.info(f'Done. Runtime: {minutes:.3f} minutes') |
File renamed without changes.
Binary file not shown.
This file was deleted.
Oops, something went wrong.
Empty file.
This file was deleted.
Oops, something went wrong.
This file was deleted.
Oops, something went wrong.
Oops, something went wrong.