Skip to content
New issue

Have a question about this project? Sign up for a free GitHub account to open an issue and contact its maintainers and the community.

By clicking “Sign up for GitHub”, you agree to our terms of service and privacy statement. We’ll occasionally send you account related emails.

Already on GitHub? Sign in to your account

Add configurations for target setting for workload variants #706

Closed
wants to merge 46 commits into from
Closed
Show file tree
Hide file tree
Changes from all commits
Commits
Show all changes
46 commits
Select commit Hold shift + click to select a range
f9892b1
add tuning points for criteo variants
priyakasimbeg Feb 10, 2024
bcb80ca
fastmri tuning search
priyakasimbeg Feb 10, 2024
f45bd2f
fastmri tuning search
priyakasimbeg Feb 10, 2024
8b49604
add targetsetting hparams for fastmri, resnet, vit, conformer variants
priyakasimbeg Feb 14, 2024
f592f31
Merge branch 'dev' into variants_target_setting
priyakasimbeg Feb 14, 2024
01a320f
add deepspeech variant targets
priyakasimbeg Feb 14, 2024
7337063
add tuning hparams for target setting for ogbg and wmt variants
priyakasimbeg Feb 14, 2024
281f8ad
add tuning hparams for deepspeech variants
priyakasimbeg Feb 14, 2024
e8b662d
add dataset and steps defaults for workloads
priyakasimbeg Feb 14, 2024
ec148f7
add tuning search space for deepspeech variant target setting
priyakasimbeg Feb 14, 2024
3f16434
config for target setting
priyakasimbeg Feb 15, 2024
a7b0d81
modify target setting config
priyakasimbeg Feb 15, 2024
f379c43
add deepspeech target setting configs
priyakasimbeg Feb 15, 2024
2ae0c2a
modify configs for target setting
priyakasimbeg Feb 15, 2024
81d8278
modify run_workloads.py
priyakasimbeg Feb 15, 2024
f9c1542
fix logic with runs
priyakasimbeg Feb 15, 2024
66a7917
relax docker version
priyakasimbeg Feb 15, 2024
1f65c08
remove dependencies
priyakasimbeg Feb 15, 2024
aa18a68
fixes
priyakasimbeg Feb 15, 2024
10b128c
fix
priyakasimbeg Feb 15, 2024
3000318
fixes in variant workload names
priyakasimbeg Feb 15, 2024
31b7252
merge
priyakasimbeg Mar 5, 2024
add2aaf
add configs for failed variants
priyakasimbeg Mar 5, 2024
a9a601e
fix config
priyakasimbeg Mar 5, 2024
5775b21
Merge branch 'dev' into variants_target_setting
priyakasimbeg Mar 5, 2024
99c5863
Merge branch 'dev' into variants_target_setting
priyakasimbeg Mar 7, 2024
0fa2a39
add flag to run_workloads scoring script
priyakasimbeg Mar 7, 2024
a3ae86d
fix
priyakasimbeg Mar 7, 2024
99da6ba
modify experiments
priyakasimbeg Mar 12, 2024
745fcba
fix config
priyakasimbeg Mar 12, 2024
dfda021
fix
priyakasimbeg Mar 12, 2024
0666662
temp fix
priyakasimbeg Mar 13, 2024
dacc4b8
fix imagenet variant targets
priyakasimbeg Mar 15, 2024
1ca2709
Merge branch 'imagenet_variant_target_fixes' into variants_target_setting
priyakasimbeg Mar 15, 2024
1cbb893
modify configs for variants
priyakasimbeg Mar 15, 2024
19ecfe4
fixes
priyakasimbeg Mar 15, 2024
7deedfc
lint fix
priyakasimbeg Mar 18, 2024
695684c
formatting
priyakasimbeg Mar 18, 2024
89913c9
fix typo
priyakasimbeg Mar 18, 2024
0906471
debugging
priyakasimbeg Mar 18, 2024
80f30bb
fix
priyakasimbeg Mar 19, 2024
e19220c
formatting
priyakasimbeg Mar 19, 2024
9b6e1f7
Merge branch 'dev' into variants_target_setting
priyakasimbeg Mar 20, 2024
5a881d8
Merge branch 'dev' into variants_target_setting
priyakasimbeg Mar 20, 2024
3a9b0a3
fix typos
priyakasimbeg Mar 20, 2024
1cc5107
add logs for debugging
priyakasimbeg Mar 22, 2024
File filter

Filter by extension

Filter by extension

Conversations
Failed to load comments.
Loading
Jump to
Jump to file
Failed to load files.
Loading
Diff view
Diff view
Original file line number Diff line number Diff line change
Expand Up @@ -272,11 +272,11 @@ def use_silu(self) -> bool:

@property
def validation_target_value(self) -> float:
return 0.22009
return 1 - 0.22009

@property
def test_target_value(self) -> float:
return 0.3426
return 1 - 0.3426


class ImagenetResNetGELUWorkload(ImagenetResNetWorkload):
Expand All @@ -287,11 +287,11 @@ def use_gelu(self) -> bool:

@property
def validation_target_value(self) -> float:
return 0.22077
return 1 - 0.22077

@property
def test_target_value(self) -> float:
return 0.3402
return 1 - 0.3402


class ImagenetResNetLargeBNScaleWorkload(ImagenetResNetWorkload):
Expand All @@ -302,8 +302,8 @@ def bn_init_scale(self) -> float:

@property
def validation_target_value(self) -> float:
return 0.23474
return 1 - 0.23474

@property
def test_target_value(self) -> float:
return 0.3577
return 1 - 0.3577
Original file line number Diff line number Diff line change
Expand Up @@ -326,11 +326,11 @@ def use_silu(self) -> bool:

@property
def validation_target_value(self) -> float:
return 0.22009
return 1 - 0.22009

@property
def test_target_value(self) -> float:
return 0.342
return 1 - 0.342


class ImagenetResNetGELUWorkload(ImagenetResNetWorkload):
Expand All @@ -341,11 +341,11 @@ def use_gelu(self) -> bool:

@property
def validation_target_value(self) -> float:
return 0.22077
return 1 - 0.22077

@property
def test_target_value(self) -> float:
return 0.3402
return 1 - 0.3402


class ImagenetResNetLargeBNScaleWorkload(ImagenetResNetWorkload):
Expand All @@ -356,8 +356,8 @@ def bn_init_scale(self) -> float:

@property
def validation_target_value(self) -> float:
return 0.23474
return 1 - 0.23474

@property
def test_target_value(self) -> float:
return 0.3577
return 1 - 0.3577
Original file line number Diff line number Diff line change
Expand Up @@ -99,11 +99,11 @@ def use_glu(self) -> bool:

@property
def validation_target_value(self) -> float:
return 0.2233
return 1 - 0.2233

@property
def test_target_value(self) -> float:
return 0.3455
return 1 - 0.3455


class ImagenetVitPostLNWorkload(ImagenetVitWorkload):
Expand All @@ -114,11 +114,11 @@ def use_post_layer_norm(self) -> bool:

@property
def validation_target_value(self) -> float:
return 0.24688
return 1 - 0.24688

@property
def test_target_value(self) -> float:
return 0.3714
return 1 - 0.3714


class ImagenetVitMapWorkload(ImagenetVitWorkload):
Expand All @@ -129,8 +129,8 @@ def use_map(self) -> bool:

@property
def validation_target_value(self) -> float:
return 0.22886
return 1 - 0.22886

@property
def test_target_value(self) -> float:
return 0.3477
return 1 - 0.3477
Original file line number Diff line number Diff line change
Expand Up @@ -90,11 +90,11 @@ def use_glu(self) -> bool:

@property
def validation_target_value(self) -> float:
return 0.2233
return 1 - 0.2233

@property
def test_target_value(self) -> float:
return 0.3455
return 1 - 0.3455


class ImagenetVitPostLNWorkload(ImagenetVitWorkload):
Expand All @@ -105,11 +105,11 @@ def use_post_layer_norm(self) -> bool:

@property
def validation_target_value(self) -> float:
return 0.24688
return 1 - 0.24688

@property
def test_target_value(self) -> float:
return 0.3714
return 1 - 0.3714


class ImagenetVitMapWorkload(ImagenetVitWorkload):
Expand All @@ -120,8 +120,8 @@ def use_map(self) -> bool:

@property
def validation_target_value(self) -> float:
return 0.22886
return 1 - 0.22886

@property
def test_target_value(self) -> float:
return 0.3477
return 1 - 0.3477
Original file line number Diff line number Diff line change
Expand Up @@ -107,13 +107,29 @@ class LibriSpeechDeepSpeechTanhWorkload(LibriSpeechDeepSpeechWorkload):
def use_tanh(self) -> bool:
return True

@property
def validation_target_value(self) -> float:
return 0.133449

@property
def test_target_value(self) -> float:
return 0.079810


class LibriSpeechDeepSpeechNoResNetWorkload(LibriSpeechDeepSpeechWorkload):
  """LibriSpeech DeepSpeech variant that reports residual connections as off.

  Overrides three read-only properties of the base workload: the residual
  connection switch and the validation/test target values.
  """

  @property
  def enable_residual_connections(self) -> bool:
    """Return False: this variant opts out of residual connections."""
    return False

  @property
  def validation_target_value(self) -> float:
    """Return the validation target for this variant.

    NOTE(review): presumably an error-rate threshold; confirm the metric
    against the base workload.
    """
    return 0.105042

  @property
  def test_target_value(self) -> float:
    """Return the test target for this variant.

    NOTE(review): presumably the same metric as the validation target;
    confirm against the base workload.
    """
    return 0.060388


class LibriSpeechDeepSpeechNormAndSpecAugWorkload(LibriSpeechDeepSpeechWorkload
):
Expand All @@ -137,3 +153,11 @@ def freq_mask_count(self) -> int:
@property
def time_mask_count(self) -> int:
return 15

@property
def validation_target_value(self) -> float:
return 0.131553

@property
def test_target_value(self) -> float:
return 0.082442
2 changes: 1 addition & 1 deletion algorithmic_efficiency/workloads/workloads.py
Original file line number Diff line number Diff line change
Expand Up @@ -78,7 +78,7 @@
},
'imagenet_vit_map': {
'workload_path': 'imagenet_vit/imagenet',
'workload_class_name': 'ImagenetVitMapLNWorkload',
'workload_class_name': 'ImagenetVitMapWorkload',
},
'librispeech_conformer': {
'workload_path': 'librispeech_conformer/librispeech',
Expand Down
Original file line number Diff line number Diff line change
@@ -0,0 +1,28 @@
{
"learning_rate": {
"feasible_points": [
0.002517072211464665
]
},
"beta1": {
"feasible_points": [
0.9908351643533544
]
},
"beta2": {
"feasible_points": [
0.9859568907533993
]
},
"warmup_steps": {
"feasible_points": [
799
]
},
"weight_decay": {
"feasible_points": [
0.12274552870237089
]
}
}

Original file line number Diff line number Diff line change
@@ -0,0 +1,28 @@
{
"learning_rate": {
"feasible_points": [
0.05493199486120455
]
},
"beta1": {
"feasible_points": [
0.954922991734919
]
},
"beta2": {
"feasible_points": [
0.9986188074995163
]
},
"warmup_steps": {
"feasible_points": [
799
]
},
"weight_decay": {
"feasible_points": [
0.00011065469792077193
]
}
}

Original file line number Diff line number Diff line change
@@ -0,0 +1,28 @@
{
"learning_rate": {
"feasible_points": [
0.001493629901423942
]
},
"beta1": {
"feasible_points": [
0.9592129978682067
]
},
"beta2": {
"feasible_points": [
0.9824918272399145
]
},
"warmup_steps": {
"feasible_points": [
399
]
},
"weight_decay": {
"feasible_points": [
0.00038587516415285595
]
}
}

Original file line number Diff line number Diff line change
@@ -0,0 +1,27 @@
{
"learning_rate": {
"feasible_points": [
0.008334676559764446
]
},
"beta1": {
"feasible_points": [
0.8294338711079317
]
},
"beta2": {
"feasible_points": [
0.8551723332825868
]
},
"warmup_steps": {
"feasible_points": [
2714
]
},
"weight_decay": {
"feasible_points": [
0.01371235755699044
]
}
}
Original file line number Diff line number Diff line change
@@ -0,0 +1,27 @@
{
"learning_rate": {
"feasible_points": [
0.006173154695175443
]
},
"beta1": {
"feasible_points": [
0.8496694604806512
]
},
"beta2": {
"feasible_points": [
0.4639437428687345
]
},
"warmup_steps": {
"feasible_points": [
1357
]
},
"weight_decay": {
"feasible_points": [
0.1679001017957879
]
}
}
Original file line number Diff line number Diff line change
@@ -0,0 +1,27 @@
{
"learning_rate": {
"feasible_points": [
0.04037951750205473
]
},
"beta1": {
"feasible_points": [
0.9932215932637941
]
},
"beta2": {
"feasible_points": [
0.9425306939334134
]
},
"warmup_steps": {
"feasible_points": [
542
]
},
"weight_decay": {
"feasible_points": [
0.14877061239151607
]
}
}
Loading
Loading