Seq2Seq Minimal Start
Generic Encoder-Decoder minimal start
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
import logging
import pandas as pd
from simpletransformers.seq2seq import Seq2SeqModel, Seq2SeqArgs
logging.basicConfig(level=logging.INFO)
transformers_logger = logging.getLogger("transformers")
transformers_logger.setLevel(logging.WARNING)
train_data = [
[
"Perseus “Percy” Jackson is the main protagonist and the narrator of the Percy Jackson and the Olympians series.",
"Percy is the protagonist of Percy Jackson and the Olympians",
],
[
"Annabeth Chase is one of the main protagonists in Percy Jackson and the Olympians.",
"Annabeth is a protagonist in Percy Jackson and the Olympians.",
],
]
train_df = pd.DataFrame(train_data, columns=["input_text", "target_text"])
eval_data = [
[
"Grover Underwood is a satyr and the Lord of the Wild. He is the satyr who found the demigods Thalia Grace, Nico and Bianca di Angelo, Percy Jackson, Annabeth Chase, and Luke Castellan.",
"Grover is a satyr who found many important demigods.",
],
[
"Thalia Grace is the daughter of Zeus, sister of Jason Grace. After several years as a pine tree on Half-Blood Hill, she got a new job leading the Hunters of Artemis.",
"Thalia is the daughter of Zeus and leader of the Hunters of Artemis.",
],
]
eval_df = pd.DataFrame(eval_data, columns=["input_text", "target_text"])
# Configure the model
model_args = Seq2SeqArgs()
model_args.num_train_epochs = 200
model_args.evaluate_generated_text = True
model_args.evaluate_during_training = True
model_args.evaluate_during_training_verbose = True
model = Seq2SeqModel(
"roberta",
"roberta-base",
"bert-base-cased",
args=model_args,
)
# Train the model
model.train_model(train_df, eval_data=eval_df)
# Evaluate the model
result = model.eval_model(eval_df)
# Use the model for prediction
print(
model.predict(
[
"Tyson is a Cyclops, a son of Poseidon, and Percy Jackson’s half brother. He is the current general of the Cyclopes army."
]
)
)
# Loading a saved model
model_reloaded = Seq2SeqModel(
"roberta",
encoder_decoder_name="outputs",
args=model_args,
)
# Use the model for prediction
print(
model_reloaded.predict(
[
"Tyson is a Cyclops, a son of Poseidon, and Percy Jackson’s half brother. He is the current general of the Cyclopes army."
]
)
)
BART Model
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
import logging
import pandas as pd
from simpletransformers.seq2seq import Seq2SeqModel, Seq2SeqArgs
logging.basicConfig(level=logging.INFO)
transformers_logger = logging.getLogger("transformers")
transformers_logger.setLevel(logging.WARNING)
train_data = [
[
"Perseus “Percy” Jackson is the main protagonist and the narrator of the Percy Jackson and the Olympians series.",
"Percy is the protagonist of Percy Jackson and the Olympians",
],
[
"Annabeth Chase is one of the main protagonists in Percy Jackson and the Olympians.",
"Annabeth is a protagonist in Percy Jackson and the Olympians.",
],
]
train_df = pd.DataFrame(train_data, columns=["input_text", "target_text"])
eval_data = [
[
"Grover Underwood is a satyr and the Lord of the Wild. He is the satyr who found the demigods Thalia Grace, Nico and Bianca di Angelo, Percy Jackson, Annabeth Chase, and Luke Castellan.",
"Grover is a satyr who found many important demigods.",
],
[
"Thalia Grace is the daughter of Zeus, sister of Jason Grace. After several years as a pine tree on Half-Blood Hill, she got a new job leading the Hunters of Artemis.",
"Thalia is the daughter of Zeus and leader of the Hunters of Artemis.",
],
]
eval_df = pd.DataFrame(eval_data, columns=["input_text", "target_text"])
# Configure the model
model_args = Seq2SeqArgs()
model_args.num_train_epochs = 200
model_args.evaluate_generated_text = True
model_args.evaluate_during_training = True
model_args.evaluate_during_training_verbose = True
model = Seq2SeqModel(
encoder_decoder_type="bart",
encoder_decoder_name="facebook/bart-large",
args=model_args,
)
# Train the model
model.train_model(train_df, eval_data=eval_df)
# Evaluate the model
result = model.eval_model(eval_df)
# Use the model for prediction
print(
model.predict(
[
"Tyson is a Cyclops, a son of Poseidon, and Percy Jackson’s half brother. He is the current general of the Cyclopes army."
]
)
)
# Loading a saved model
model_reloaded = Seq2SeqModel(
encoder_decoder_type="bart",
encoder_decoder_name="outputs",
args=model_args,
)
# Use the model for prediction
print(
model_reloaded.predict(
[
"Tyson is a Cyclops, a son of Poseidon, and Percy Jackson’s half brother. He is the current general of the Cyclopes army."
]
)
)
MarianMT Model
Note: MarianMT models are not intended to be trained/fine-tuned. There are thousands of ready-to-use translation models available. See here.
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
import logging
import pandas as pd
from simpletransformers.seq2seq import Seq2SeqModel, Seq2SeqArgs
logging.basicConfig(level=logging.INFO)
transformers_logger = logging.getLogger("transformers")
transformers_logger.setLevel(logging.WARNING)
model_args = Seq2SeqArgs()
model_args.num_beams = 10
model = Seq2SeqModel(
encoder_decoder_type="marian",
encoder_decoder_name="Helsinki-NLP/opus-mt-en-de",
args=model_args,
)
src = [
"Perseus “Percy” Jackson is the main protagonist and the narrator of the Percy Jackson and the Olympians series.",
"Annabeth Chase is one of the main protagonists in Percy Jackson and the Olympians.",
"Thalia Grace is the daughter of Zeus, sister of Jason Grace. After several years as a pine tree on Half-Blood Hill, she got a new job leading the Hunters of Artemis.",
]
predictions = model.predict(src)
for en, de in zip(src, predictions):
print("-------------")
print(en)
print(de)
print()