# Source blob: cf3b09b84617ec32bc04175c4fa4db2afbdbd5b8
[paths]
# Absolute, machine-specific corpus locations. They are consumed below via
# ${paths.train} and ${paths.dev} in the [corpora.*] sections.
train = "/vol/netapp/daza/datasets/TIGER_conll/data_splits/train/Tiger.ALL.Orth.train.spacy"
# NOTE(review): this file lives under the test/ split and is the "NewOrth"
# variant, whereas train is "ALL.Orth". It is used as the dev corpus during
# training (evaluation and patience-based stopping) - confirm this is intended.
dev = "/vol/netapp/daza/datasets/TIGER_conll/data_splits/test/Tiger.NewOrth.test.spacy"
vectors = null
init_tok2vec = null

[system]
# Both values are re-used by [training] through ${system.seed} and
# ${system.gpu_allocator}.
seed = 0
gpu_allocator = "pytorch"

[nlp]
lang = "de"
# Component order: the transformer comes first, then the tagger, whose tok2vec
# layer is configured as a transformer listener in [components.tagger.model.tok2vec].
pipeline = ["transformer", "tagger"]
disabled = []
tokenizer = {"@tokenizers": "spacy.Tokenizer.v1"}
# No creation callbacks are registered.
before_creation = null
after_creation = null
after_pipeline_creation = null

[components]

[components.tagger]
factory = "tagger"

[components.tagger.model]
@architectures = "spacy.Tagger.v1"
# Output width is left unset here.
nO = null

[components.tagger.model.tok2vec]
# Listener architecture from spacy-transformers; the matching producer is
# configured in [components.transformer].
@architectures = "spacy-transformers.TransformerListener.v1"
pooling = {"@layers": "reduce_mean.v1"}
grad_factor = 1.0

[components.transformer]
factory = "transformer"
set_extra_annotations = {"@annotation_setters": "spacy-transformers.null_annotation_setter.v1"}
max_batch_items = 4096

[components.transformer.model]
@architectures = "spacy-transformers.TransformerModel.v1"
name = "bert-base-german-cased"

[components.transformer.model.tokenizer_config]
use_fast = true

[components.transformer.model.get_spans]
@span_getters = "spacy-transformers.strided_spans.v1"
# stride is smaller than window, so consecutive spans overlap.
stride = 96
window = 128

[corpora]

# Training corpus: same reader as dev, but with max_length set to 500.
[corpora.train]
@readers = "spacy.Corpus.v1"
path = ${paths.train}
gold_preproc = false
max_length = 500
limit = 0
augmenter = null

# Development corpus, referenced by training.dev_corpus.
[corpora.dev]
@readers = "spacy.Corpus.v1"
path = ${paths.dev}
gold_preproc = false
max_length = 0
limit = 0
augmenter = null

[training]
# Dotted names of the corpus sections defined under [corpora].
train_corpus = "corpora.train"
dev_corpus = "corpora.dev"
# Taken from [system] so the two sections cannot disagree.
seed = ${system.seed}
gpu_allocator = ${system.gpu_allocator}
dropout = 0.1
accumulate_gradient = 3
# Stopping criteria and evaluation cadence.
max_epochs = 0
max_steps = 20000
patience = 1600
eval_frequency = 200
frozen_components = []
before_to_disk = null

[training.batcher]
@batchers = "spacy.batch_by_padded.v1"
size = 2000
buffer = 256
discard_oversize = true
# No custom length function is supplied.
get_length = null

[training.logger]
# Console logging with the progress bar switched off.
@loggers = "spacy.ConsoleLogger.v1"
progress_bar = false

[training.optimizer]
@optimizers = "Adam.v1"
beta1 = 0.9
beta2 = 0.999
eps = 1e-8
grad_clip = 1.0
# L2 is flagged as weight decay via L2_is_weight_decay.
L2 = 0.01
L2_is_weight_decay = true
use_averages = false

[training.optimizer.learn_rate]
@schedules = "warmup_linear.v1"
warmup_steps = 250
# Interpolated from training.max_steps (20000 in this file) so that overriding
# the step budget cannot leave the schedule out of sync with it.
total_steps = ${training.max_steps}
initial_rate = 0.00005

[training.score_weights]
# tag_acc is the only score listed, with weight 1.0.
tag_acc = 1.0

# Empty section: no pretraining settings are defined in this file.
[pretraining]

[initialize]
# Both resources are routed through [paths] so they can be overridden in one
# place; with the values in this file each resolves to null.
vectors = ${paths.vectors}
init_tok2vec = ${paths.init_tok2vec}
vocab_data = null
lookups = null

[initialize.components]
122
123[initialize.tokenizer]