{"SEQ_LEN": 64, "BATCH_SIZE": 8, "EPOCHS": 4, "EMBED_DIM": 128, "NUM_HEADS": 4, "NUM_LAYERS": 2, "LR": 0.0003, "TOKENIZER_NAME": "gpt2", "DEVICE": "cuda"} |
{"SEQ_LEN": 64, "BATCH_SIZE": 8, "EPOCHS": 4, "EMBED_DIM": 128, "NUM_HEADS": 4, "NUM_LAYERS": 2, "LR": 0.0003, "TOKENIZER_NAME": "gpt2", "DEVICE": "cuda"} |