-
Notifications
You must be signed in to change notification settings - Fork 443
/
wmtm16_en_de.py
113 lines (93 loc) · 3.62 KB
/
wmtm16_en_de.py
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
# Copyright 2018 The TensorFlow Authors. All Rights Reserved.
#
# Licensed under the Apache License, Version 2.0 (the "License");
# you may not use this file except in compliance with the License.
# You may obtain a copy of the License at
#
# http://www.apache.org/licenses/LICENSE-2.0
#
# Unless required by applicable law or agreed to in writing, software
# distributed under the License is distributed on an "AS IS" BASIS,
# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
# See the License for the specific language governing permissions and
# limitations under the License.
# ==============================================================================
"""Train NMT Models on WMT'16 MMT English-German machine translation task."""
import os
from lingvo import model_registry
from lingvo.core import base_model_params
from lingvo.tasks.mt import base_config
from lingvo.tasks.mt import input_generator
from lingvo.tasks.mt import model
@model_registry.RegisterSingleTaskModel
class WmtCaptionEnDeTransformer(base_model_params.SingleTaskModelParams):
  """Params for WMT'16 En->De Captions (ignoring the images)."""

  # Generated using scripts in lingvo/mt/tools.
  DATADIR = '/tmp/wmtm16/wpm/'
  VOCAB_SIZE = 2000
  VOCAB_FILE = 'wpm-ende-2k.voc'

  def _CommonInputParams(self, is_eval):
    """Input generator params for WMT'16 En->De.

    Args:
      is_eval: If True, configure a deterministic single-reader pipeline
        (fixed seed, tiny buffer) for dev/test; otherwise a shuffled
        training pipeline whose buffer covers the whole 29k-sentence set.

    Returns:
      An `input_generator.NmtInput.Params()` with bucketing and the shared
      WPM tokenizer vocab configured.
    """
    p = input_generator.NmtInput.Params()
    if is_eval:
      # Fixed seed + single reader => every eval pass sees the same order.
      p.file_random_seed = 27182818
      p.file_parallelism = 1
      p.file_buffer_size = 1
      p.bucket_upper_bound = [10, 14, 19, 26, 36, 50, 70, 98, 137, 200]
      p.bucket_batch_limit = [16] * 8 + [4] * 2
    else:
      # Seed 0 => non-deterministic shuffling for training.
      p.file_random_seed = 0
      p.file_parallelism = 1
      p.file_buffer_size = 29000
      p.bucket_upper_bound = [14, 17, 20, 24, 29, 35, 45, 75]
      p.bucket_batch_limit = [292, 240, 204, 170, 141, 117, 91, 54]
    p.tokenizer.vocab_size = self.VOCAB_SIZE
    p.tokenizer.token_vocab_filepath = os.path.join(self.DATADIR,
                                                    self.VOCAB_FILE)
    return p

  def Train(self):
    """Input params for the training set (29k sentence pairs)."""
    p = self._CommonInputParams(is_eval=False)
    p.file_pattern = 'tfrecord:' + os.path.join(self.DATADIR, 'train.tfrecords')
    p.num_samples = 29000
    return p

  def Dev(self):
    """Input params for the validation set (1014 sentence pairs)."""
    # Bug fix: previously built a bare NmtInput.Params(), which skipped the
    # tokenizer vocab and deterministic eval bucket/seed settings entirely.
    p = self._CommonInputParams(is_eval=True)
    p.file_pattern = 'tfrecord:' + os.path.join(self.DATADIR, 'val.tfrecords')
    p.num_samples = 1014
    return p

  def Test(self):
    """Input params for the test set (1000 sentence pairs)."""
    # Bug fix: same as Dev() — route through _CommonInputParams so eval
    # inputs get the tokenizer vocab and eval bucketing.
    p = self._CommonInputParams(is_eval=True)
    p.file_pattern = 'tfrecord:' + os.path.join(self.DATADIR, 'test.tfrecords')
    p.num_samples = 1000
    return p

  def Task(self):
    """Returns a small (2-layer, 2-head) Transformer task for this dataset."""
    p = base_config.SetupTransformerParams(
        model.TransformerModel.Params(),
        # NOTE(review): the name says 'wmt14' but this file targets the
        # WMT'16 MMT task — kept as-is because the name string may be baked
        # into existing checkpoint/log directory paths.
        name='wmt14_en_de_transformer_base',
        vocab_size=self.VOCAB_SIZE,
        model_dim=256,
        hidden_dim=512,
        num_heads=2,
        num_layers=2,
        residual_dropout_prob=0.2,
        input_dropout_prob=0.2,
        learning_rate=1.0,
        warmup_steps=1000)
    p.eval.samples_per_summary = 7500
    p.train.save_interval_seconds = 60  # Checkpoint every minute.
    p.train.max_steps = 12000
    return p
@model_registry.RegisterSingleTaskModel
class WmtCaptionEnDeTransformerCloudTpu(WmtCaptionEnDeTransformer):
  """Params for WMT'16 En->De Captions (ignoring the images) on TPU."""

  def _CommonInputParams(self, is_eval):
    """TPU-friendly inputs: fixed-length sequences, uniform batch sizes."""
    params = super()._CommonInputParams(is_eval)
    # TPUs need static shapes, so pad every example to the largest bucket.
    params.pad_to_max_seq_length = True
    params.source_max_length = params.bucket_upper_bound[-1]
    # Flatten the per-bucket batch limits to a single uniform size.
    params.bucket_batch_limit = [16] * len(params.bucket_batch_limit)
    return params

  def Task(self):
    """Same Transformer task, with unsharded embedding tables for TPU."""
    params = super().Task()
    for token_emb in (params.encoder.token_emb, params.decoder.token_emb):
      token_emb.max_num_shards = 1
    return params