Update README.md
Browse files
README.md
CHANGED
|
@@ -53,14 +53,19 @@ SpanExtractor and text_normalize are implemented in [`code`](https://github.com/
|
|
| 53 |
import logging
|
| 54 |
from typing import Optional, Tuple
|
| 55 |
import re
|
| 56 |
-
from transformers import AutoModel, PhobertTokenizerFast
|
|
|
|
| 57 |
|
| 58 |
from utils.span_extractor import SpanExtractor
|
| 59 |
from utils.process_data import text_normalize
|
| 60 |
import torch
|
| 61 |
|
| 62 |
-
model = AutoModel.from_pretrained(
|
| 63 |
-
|
|
|
|
|
|
|
|
|
|
|
|
|
| 64 |
|
| 65 |
span_ex =SpanExtractor(tokenizer)
|
| 66 |
|
|
|
|
| 53 |
import logging
|
| 54 |
from typing import Optional, Tuple
|
| 55 |
import re
|
| 56 |
+
from transformers import AutoModel, PhobertTokenizerFast,AutoTokenizer
|
| 57 |
+
import torch.nn.functional as F
|
| 58 |
|
| 59 |
from utils.span_extractor import SpanExtractor
|
| 60 |
from utils.process_data import text_normalize
|
| 61 |
import torch
|
| 62 |
|
| 63 |
+
model = AutoModel.from_pretrained(
|
| 64 |
+
"tkhangg0910/viconbert-base",
|
| 65 |
+
trust_remote_code=True,
|
| 66 |
+
ignore_mismatched_sizes=True
|
| 67 |
+
)
|
| 68 |
+
tokenizer = AutoTokenizer.from_pretrained("tkhangg0910/viconbert-base", use_fast=True)
|
| 69 |
|
| 70 |
span_ex =SpanExtractor(tokenizer)
|
| 71 |
|