-
Notifications
You must be signed in to change notification settings - Fork 1
Expand file tree
/
Copy pathconfig.py
More file actions
45 lines (31 loc) · 1.09 KB
/
config.py
File metadata and controls
45 lines (31 loc) · 1.09 KB
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
import os
import torch
# Paths
# Every location below can be overridden by setting an environment variable
# with the same name as the constant; when the variable is unset, the relative
# default given as the second argument is used.

# Working directories.
PATH_LOGS = os.getenv("PATH_LOGS", "./runs")
PATH_BASE_MODELS = os.getenv("PATH_BASE_MODELS", "./base_models")
PATH_CACHE_DATASETS = os.getenv("PATH_CACHE_DATASETS", "./data/cache")
PATH_CHECKPOINT_MODELS = os.getenv("PATH_CHECKPOINT_MODELS", "./models")

# Save targets for the individual NL components. Their defaults are fixed
# strings: overriding PATH_CHECKPOINT_MODELS does not move them.
PATH_SAVE_NL_ENCODER = os.getenv(
    "PATH_SAVE_NL_ENCODER", "./models/codecg-nl-encoder"
)
PATH_SAVE_NL_DECODER = os.getenv(
    "PATH_SAVE_NL_DECODER", "./models/codecg-nl-decoder"
)
PATH_SAVE_NL_LM = os.getenv("PATH_SAVE_NL_LM", "./models/code-cg-nl-lm/lm.pt")
# Hyperparams
# Plain module-level constants; nothing here is read from the environment.

# Reproducibility.
GLOBAL_SEED = 42

# Dataset selection.
DATASET_NAME = "code_x_glue_ct_code_to_text"
PL = "python"

# Tokenizer and base-model identifiers.
# NOTE(review): these look like Hugging Face hub names -- confirm against the
# code that loads them.
TOKENIZER_MODEL = "Salesforce/codet5-base"
NL_ENCODER_BASE_MODEL = "roberta-base"
NL_DECODER_BASE_MODEL = "gpt2"
PL_ENCODER_BASE_MODEL = ""  # left empty in this config

# Tokenization settings.
# NOTE(review): VOCAB_SIZE presumably has to agree with TOKENIZER_MODEL --
# verify before changing either one.
VOCAB_SIZE = 32100
MAX_SEQUENCE_LENGTH = 128
PADDING = "max_length"

# Optimisation settings.
MAX_EPOCHS = 20
BATCH_SIZE = 32
LEARNING_RATE = 3e-5
WEIGHT_DECAY = 1e-4
DROPOUT_RATE = 1e-3
# Hardware
# Half of the available CPUs (rounded down), capped at 4.
# os.cpu_count() returns None when the CPU count cannot be determined; fall
# back to 1 in that case so that importing this module does not raise a
# TypeError. For every integer CPU count the result is the same as before.
NUM_WORKERS = min(4, (os.cpu_count() or 1) // 2)
# At most one GPU is used; 0 when torch reports no CUDA devices.
AVAIL_GPUS = min(1, torch.cuda.device_count())
# Project
PROJECT_NAME = "CodeCG"