Skip to content

Instantly share code, notes, and snippets.

@Hironsan
Created November 9, 2022 12:56
Show Gist options
  • Star 0 You must be signed in to star a gist
  • Fork 0 You must be signed in to fork a gist
  • Save Hironsan/86d9461d66f1065fe0e3dc23b27b34bb to your computer and use it in GitHub Desktop.
Save Hironsan/86d9461d66f1065fe0e3dc23b27b34bb to your computer and use it in GitHub Desktop.
[paths]
train = "./train.spacy"
dev = "./dev.spacy"
init_tok2vec = null
vectors = null
[corpora]
[corpora.train]
@readers = "spacy.Corpus.v1"
path = ${paths.train}
[corpora.dev]
@readers = "spacy.Corpus.v1"
path = ${paths.dev}
[system]
gpu_allocator = null
seed = 0
[nlp]
lang = "en"
pipeline = ["partial_ner"]
tokenizer = {"@tokenizers": "character_tokenizer.v1"}
disabled = []
before_creation = null
after_creation = null
after_pipeline_creation = null
batch_size = 15
[nlp.tokenizer]
[components]
[components.partial_ner]
factory = "partial_ner"
[components.partial_ner.loss]
@losses = "spacy-partial-tagger.ExpectedEntityRatioLoss.v1"
padding_index = -1
unknown_index = -100
outside_index = 0
[components.partial_ner.label_indexer]
@label_indexers = "spacy-partial-tagger.TransformerLabelIndexer.v1"
padding_index = ${components.partial_ner.loss.padding_index}
unknown_index= ${components.partial_ner.loss.unknown_index}
[components.partial_ner.model]
@architectures = "spacy-partial-tagger.PartialTagger.v1"
[components.partial_ner.model.misaligned_tok2vec]
@architectures = "spacy-partial-tagger.MisalignedTok2VecTransformer.v1"
model_name = "roberta-base"
[components.partial_ner.model.encoder]
@architectures = "spacy-partial-tagger.LinearCRFEncoder.v1"
nI = 768
nO = null
dropout = 0.2
[components.partial_ner.model.decoder]
@architectures = "spacy-partial-tagger.ConstrainedViterbiDecoder.v1"
padding_index = ${components.partial_ner.loss.padding_index}
[training]
dev_corpus = "corpora.dev"
train_corpus = "corpora.train"
seed = ${system.seed}
gpu_allocator = ${system.gpu_allocator}
accumulate_gradient = 1
max_steps = 20000
patience = 10000
eval_frequency = 1000
frozen_components = []
before_to_disk = null
[training.batcher]
@batchers = "spacy.batch_by_sequence.v1"
size = 15
get_length = null
[training.logger]
@loggers = "spacy.ConsoleLogger.v1"
progress_bar = false
[training.optimizer]
@optimizers = "Adam.v1"
beta1 = 0.9
beta2 = 0.999
L2_is_weight_decay = false
use_averages = false
grad_clip = 5.0
[training.optimizer.learn_rate]
@schedules = "slanted_triangular.v1"
max_rate = 0.00002
num_steps = ${training.max_steps}
cut_frac = 0.1
ratio = 16
t = -1
[training.score_weights]
ents_per_type = null
ents_f = 1.0
ents_p = 0.0
ents_r = 0.0
[pretraining]
[initialize]
[initialize.components]
[initialize.tokenizer]
Sign up for free to join this conversation on GitHub. Already have an account? Sign in to comment