-
Notifications
You must be signed in to change notification settings - Fork 6
Open
Description
Microbert's allennlp version seems to suffer from the issue allenai/allennlp#5666, which, per the comments on that issue, is fixed by running
pip install cached-path==1.1.2
immediately after the `pip install -r requirements.txt` step in the installation instructions.
However, I think being tied to that allennlp version may also be causing me to hit allenai/allennlp#4317 or something similar: while trying to pretrain a BERT model on Coptic with `python main.py bert train`, I'm getting
2023-02-10 20:54:36,408 - INFO - allennlp.common.params - dataset_reader.readers.mlm.token_indexers.tokens.token_min_padding_length = 0
2023-02-10 20:54:36,408 - INFO - allennlp.common.params - dataset_reader.readers.mlm.token_indexers.tokens.model_name = berts/coptic/mlm-xpos-parser_layers-3_heads-5_hidden-100
2023-02-10 20:54:36,408 - INFO - allennlp.common.params - dataset_reader.readers.mlm.token_indexers.tokens.namespace = tags
2023-02-10 20:54:36,408 - INFO - allennlp.common.params - dataset_reader.readers.mlm.token_indexers.tokens.max_length = None
2023-02-10 20:54:36,408 - INFO - allennlp.common.params - dataset_reader.readers.mlm.token_indexers.tokens.tokenizer_kwargs = None
2023-02-10 20:54:36,413 - CRITICAL - root - Uncaught exception
Traceback (most recent call last):
File "/storage/condaenvs/thisenv/lib/python3.9/site-packages/allennlp/data/tokenizers/pretrained_transformer_tokenizer.py", line 83, in __init__
self._reverse_engineer_special_tokens("a", "b", model_name, tokenizer_kwargs)
File "/storage/condaenvs/thisenv/lib/python3.9/site-packages/allennlp/data/tokenizers/pretrained_transformer_tokenizer.py", line 136, in _reverse_engineer_special_tokens
assert dummy_a != dummy_b
AssertionError
During handling of the above exception, another exception occurred:
Traceback (most recent call last):
File "/tmp/pycharm_project_494/main.py", line 131, in <module>
top()
File "/storage/condaenvs/thisenv/lib/python3.9/site-packages/click/core.py", line 1130, in __call__
return self.main(*args, **kwargs)
File "/storage/condaenvs/thisenv/lib/python3.9/site-packages/click/core.py", line 1055, in main
rv = self.invoke(ctx)
File "/storage/condaenvs/thisenv/lib/python3.9/site-packages/click/core.py", line 1657, in invoke
return _process_result(sub_ctx.command.invoke(sub_ctx))
File "/storage/condaenvs/thisenv/lib/python3.9/site-packages/click/core.py", line 1657, in invoke
return _process_result(sub_ctx.command.invoke(sub_ctx))
File "/storage/condaenvs/thisenv/lib/python3.9/site-packages/click/core.py", line 1404, in invoke
return ctx.invoke(self.callback, **ctx.params)
File "/storage/condaenvs/thisenv/lib/python3.9/site-packages/click/core.py", line 760, in invoke
return __callback(*args, **kwargs)
File "/storage/condaenvs/thisenv/lib/python3.9/site-packages/click/decorators.py", line 26, in new_func
return f(get_current_context(), *args, **kwargs)
File "/tmp/pycharm_project_494/embur/commands/bert.py", line 147, in train
model = train_model_from_file(config.pretrain_jsonnet, config.experiment_dir, overrides=overrides)
File "/storage/condaenvs/thisenv/lib/python3.9/site-packages/allennlp/commands/train.py", line 177, in train_model_from_file
return train_model(
File "/storage/condaenvs/thisenv/lib/python3.9/site-packages/allennlp/commands/train.py", line 258, in train_model
model = _train_worker(
File "/storage/condaenvs/thisenv/lib/python3.9/site-packages/allennlp/commands/train.py", line 494, in _train_worker
train_loop = TrainModel.from_params(
File "/storage/condaenvs/thisenv/lib/python3.9/site-packages/allennlp/common/from_params.py", line 604, in from_params
return retyped_subclass.from_params(
File "/storage/condaenvs/thisenv/lib/python3.9/site-packages/allennlp/common/from_params.py", line 636, in from_params
kwargs = create_kwargs(constructor_to_inspect, cls, params, **extras)
File "/storage/condaenvs/thisenv/lib/python3.9/site-packages/allennlp/common/from_params.py", line 206, in create_kwargs
constructed_arg = pop_and_construct_arg(
File "/storage/condaenvs/thisenv/lib/python3.9/site-packages/allennlp/common/from_params.py", line 314, in pop_and_construct_arg
return construct_arg(class_name, name, popped_params, annotation, default, **extras)
File "/storage/condaenvs/thisenv/lib/python3.9/site-packages/allennlp/common/from_params.py", line 348, in construct_arg
result = annotation.from_params(params=popped_params, **subextras)
File "/storage/condaenvs/thisenv/lib/python3.9/site-packages/allennlp/common/from_params.py", line 604, in from_params
return retyped_subclass.from_params(
File "/storage/condaenvs/thisenv/lib/python3.9/site-packages/allennlp/common/from_params.py", line 636, in from_params
kwargs = create_kwargs(constructor_to_inspect, cls, params, **extras)
File "/storage/condaenvs/thisenv/lib/python3.9/site-packages/allennlp/common/from_params.py", line 206, in create_kwargs
constructed_arg = pop_and_construct_arg(
File "/storage/condaenvs/thisenv/lib/python3.9/site-packages/allennlp/common/from_params.py", line 314, in pop_and_construct_arg
return construct_arg(class_name, name, popped_params, annotation, default, **extras)
File "/storage/condaenvs/thisenv/lib/python3.9/site-packages/allennlp/common/from_params.py", line 394, in construct_arg
value_dict[key] = construct_arg(
File "/storage/condaenvs/thisenv/lib/python3.9/site-packages/allennlp/common/from_params.py", line 348, in construct_arg
result = annotation.from_params(params=popped_params, **subextras)
File "/storage/condaenvs/thisenv/lib/python3.9/site-packages/allennlp/common/from_params.py", line 604, in from_params
return retyped_subclass.from_params(
File "/storage/condaenvs/thisenv/lib/python3.9/site-packages/allennlp/common/from_params.py", line 636, in from_params
kwargs = create_kwargs(constructor_to_inspect, cls, params, **extras)
File "/storage/condaenvs/thisenv/lib/python3.9/site-packages/allennlp/common/from_params.py", line 206, in create_kwargs
constructed_arg = pop_and_construct_arg(
File "/storage/condaenvs/thisenv/lib/python3.9/site-packages/allennlp/common/from_params.py", line 314, in pop_and_construct_arg
return construct_arg(class_name, name, popped_params, annotation, default, **extras)
File "/storage/condaenvs/thisenv/lib/python3.9/site-packages/allennlp/common/from_params.py", line 394, in construct_arg
value_dict[key] = construct_arg(
File "/storage/condaenvs/thisenv/lib/python3.9/site-packages/allennlp/common/from_params.py", line 348, in construct_arg
result = annotation.from_params(params=popped_params, **subextras)
File "/storage/condaenvs/thisenv/lib/python3.9/site-packages/allennlp/common/from_params.py", line 604, in from_params
return retyped_subclass.from_params(
File "/storage/condaenvs/thisenv/lib/python3.9/site-packages/allennlp/common/from_params.py", line 638, in from_params
return constructor_to_call(**kwargs) # type: ignore
File "/storage/condaenvs/thisenv/lib/python3.9/site-packages/allennlp/data/token_indexers/pretrained_transformer_mismatched_indexer.py", line 58, in __init__
self._matched_indexer = PretrainedTransformerIndexer(
File "/storage/condaenvs/thisenv/lib/python3.9/site-packages/allennlp/data/token_indexers/pretrained_transformer_indexer.py", line 56, in __init__
self._allennlp_tokenizer = PretrainedTransformerTokenizer(
File "/storage/condaenvs/thisenv/lib/python3.9/site-packages/allennlp/data/tokenizers/pretrained_transformer_tokenizer.py", line 87, in __init__
self._reverse_engineer_special_tokens("1", "2", model_name, tokenizer_kwargs)
File "/storage/condaenvs/thisenv/lib/python3.9/site-packages/allennlp/data/tokenizers/pretrained_transformer_tokenizer.py", line 136, in _reverse_engineer_special_tokens
assert dummy_a != dummy_b
AssertionError
Process finished with exit code 1
Reactions are currently unavailable
Metadata
Metadata
Assignees
Labels
No labels