Source code for gnes.encoder.text.bert

from typing import List

import numpy as np

from ..base import CompositionalTrainableBase, BaseTextEncoder
from ...helper import batching


[docs]class BertEncoder(BaseTextEncoder): store_args_kwargs = True is_trained = True def __init__(self, *args, **kwargs): super().__init__(*args, **kwargs) self._bc_encoder_args = args self._bc_encoder_kwargs = kwargs
[docs] def post_init(self): from bert_serving.client import BertClient self.bc_encoder = BertClient(*self._bc_encoder_args, **self._bc_encoder_kwargs)
[docs] @batching def encode(self, text: List[str], *args, **kwargs) -> np.ndarray: return self.bc_encoder.encode(text, *args, **kwargs) # type: np.ndarray
[docs] def close(self): self.bc_encoder.close()
[docs]class BertEncoderWithServer(CompositionalTrainableBase):
[docs] def encode(self, text: List[str], *args, **kwargs) -> np.ndarray: return self.components['bert_client'].encode(text, *args, **kwargs)
[docs]class BertEncoderServer(BaseTextEncoder): store_args_kwargs = True is_trained = True def __init__(self, *args, **kwargs): super().__init__(*args, **kwargs) bert_args = ['-%s' % v for v in args] for k, v in kwargs.items(): bert_args.append('-%s' % k) bert_args.append(str(v)) self._bert_args = bert_args
[docs] def post_init(self): from bert_serving.server import BertServer from bert_serving.server import get_args_parser self.bert_server = BertServer(get_args_parser().parse_args(self._bert_args)) self.bert_server.start() self.bert_server.is_ready.wait()
[docs] def close(self): self.bert_server.close()