diff options
author | Aarni Koskela <akx@iki.fi> | 2023-12-30 22:20:30 +0000 |
---|---|---|
committer | Aarni Koskela <akx@iki.fi> | 2023-12-31 11:22:43 +0000 |
commit | 5768afc776a66bb94e77a9c1daebeea58fa731d5 (patch) | |
tree | 06c015a95076b2de579a72750aa7862a9615ed09 /modules/xlmr.py | |
parent | a84e842189f5599fd354147f72d1a9b9ed0716c8 (diff) | |
download | stable-diffusion-webui-gfx803-5768afc776a66bb94e77a9c1daebeea58fa731d5.tar.gz stable-diffusion-webui-gfx803-5768afc776a66bb94e77a9c1daebeea58fa731d5.tar.bz2 stable-diffusion-webui-gfx803-5768afc776a66bb94e77a9c1daebeea58fa731d5.zip |
Add utility to inspect a model's parameters (to get dtype/device)
Diffstat (limited to 'modules/xlmr.py')
-rw-r--r-- | modules/xlmr.py | 5 |
1 file changed, 4 insertions, 1 deletion
diff --git a/modules/xlmr.py b/modules/xlmr.py
index a407a3ca..6e000a56 100644
--- a/modules/xlmr.py
+++ b/modules/xlmr.py
@@ -5,6 +5,9 @@ from transformers.models.xlm_roberta.configuration_xlm_roberta import XLMRoberta
 from transformers import XLMRobertaModel,XLMRobertaTokenizer
 from typing import Optional
 
+from modules.torch_utils import get_param
+
+
 class BertSeriesConfig(BertConfig):
     def __init__(self, vocab_size=30522, hidden_size=768, num_hidden_layers=12, num_attention_heads=12, intermediate_size=3072, hidden_act="gelu", hidden_dropout_prob=0.1, attention_probs_dropout_prob=0.1, max_position_embeddings=512, type_vocab_size=2, initializer_range=0.02, layer_norm_eps=1e-12, pad_token_id=0, position_embedding_type="absolute", use_cache=True, classifier_dropout=None,project_dim=512, pooler_fn="average",learn_encoder=False,model_type='bert',**kwargs):
 
@@ -62,7 +65,7 @@ class BertSeriesModelWithTransformation(BertPreTrainedModel):
         self.post_init()
 
     def encode(self,c):
-        device = next(self.parameters()).device
+        device = get_param(self).device
         text = self.tokenizer(c,
                         truncation=True,
                         max_length=77,