tokenization_convbert.py 1.1 KB

123456789101112131415161718192021222324252627282930
  1. # Copyright The HuggingFace Inc. team. All rights reserved.
  2. #
  3. # Licensed under the Apache License, Version 2.0 (the "License");
  4. # you may not use this file except in compliance with the License.
  5. # You may obtain a copy of the License at
  6. #
  7. # http://www.apache.org/licenses/LICENSE-2.0
  8. #
  9. # Unless required by applicable law or agreed to in writing, software
  10. # distributed under the License is distributed on an "AS IS" BASIS,
  11. # WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
  12. # See the License for the specific language governing permissions and
  13. # limitations under the License.
  14. """Tokenization classes for ConvBERT."""
  15. from ...models.bert.tokenization_bert import BertTokenizer
  16. class ConvBertTokenizer(BertTokenizer):
  17. r"""
  18. Construct a ConvBERT tokenizer (backed by HuggingFace's tokenizers library). Based on WordPiece.
  19. This tokenizer inherits from [`BertTokenizer`] which contains most of the main methods. Users should
  20. refer to this superclass for more information regarding those methods.
  21. """
  22. pass
  23. __all__ = ["ConvBertTokenizer"]