Commit
·
3c74d65
1
Parent(s):
916a2d5
Update README.md
Browse files
README.md
CHANGED
@@ -21,6 +21,8 @@ BERTikal [1] is a cased BERT-base model for the Brazilian legal language and was
|
|
21 |
|
22 |
## Usage
|
23 |
|
|
|
|
|
24 |
```python
|
25 |
from transformers import AutoTokenizer # Or BertTokenizer
|
26 |
from transformers import AutoModelForPreTraining # Or BertForPreTraining for loading pretraining heads
|
@@ -30,7 +32,6 @@ model = AutoModelForPreTraining.from_pretrained('felipemaiapolo/legalnlp-bert')
|
|
30 |
tokenizer = AutoTokenizer.from_pretrained('felipemaiapolo/legalnlp-bert', do_lower_case=False)
|
31 |
```
|
32 |
|
33 |
-
|
34 |
### Ex. BERT embeddings
|
35 |
|
36 |
```python
|
@@ -40,12 +41,12 @@ pipe = pipeline("feature-extraction", model='felipemaiapolo/legalnlp-bert')
|
|
40 |
encoded_sentence = pipe('Juíz negou o recurso.')
|
41 |
```
|
42 |
|
43 |
-
### Masked language modeling prediction
|
44 |
|
45 |
```python
|
46 |
from transformers import pipeline
|
47 |
|
48 |
-
pipe = pipeline('fill-mask', model=
|
49 |
|
50 |
pipe('Juíz negou o [MASK].')
|
51 |
# [{'score': 0.6387444734573364,
|
|
|
21 |
|
22 |
## Usage
|
23 |
|
24 |
+
### Ex. Loading model for general use
|
25 |
+
|
26 |
```python
|
27 |
from transformers import AutoTokenizer # Or BertTokenizer
|
28 |
from transformers import AutoModelForPreTraining # Or BertForPreTraining for loading pretraining heads
|
|
|
32 |
tokenizer = AutoTokenizer.from_pretrained('felipemaiapolo/legalnlp-bert', do_lower_case=False)
|
33 |
```
|
34 |
|
|
|
35 |
### Ex. BERT embeddings
|
36 |
|
37 |
```python
|
|
|
41 |
encoded_sentence = pipe('Juíz negou o recurso.')
|
42 |
```
|
43 |
|
44 |
+
### Ex. Masked language modeling prediction
|
45 |
|
46 |
```python
|
47 |
from transformers import pipeline
|
48 |
|
49 |
+
pipe = pipeline('fill-mask', model='felipemaiapolo/legalnlp-bert')
|
50 |
|
51 |
pipe('Juíz negou o [MASK].')
|
52 |
# [{'score': 0.6387444734573364,
|