Update README.md
Browse files
README.md
CHANGED
@@ -6,6 +6,10 @@ tags:
|
|
6 |
- DNA
|
7 |
- biology
|
8 |
- genomics
|
|
|
|
|
|
|
|
|
9 |
---
|
10 |
# Plant foundation DNA large language models
|
11 |
|
@@ -38,7 +42,7 @@ Here is a simple code for inference:
|
|
38 |
```python
|
39 |
from transformers import AutoModelForSequenceClassification, AutoTokenizer, pipeline
|
40 |
|
41 |
-
model_name = 'plant-dnabert-lncRNAs'
|
42 |
# load model and tokenizer
|
43 |
model = AutoModelForSequenceClassification.from_pretrained(f'zhangtaolab/{model_name}', trust_remote_code=True)
|
44 |
tokenizer = AutoTokenizer.from_pretrained(f'zhangtaolab/{model_name}', trust_remote_code=True)
|
@@ -60,4 +64,4 @@ Detailed training procedure can be found in our manuscript.
|
|
60 |
|
61 |
|
62 |
#### Hardware
|
63 |
-
Model was trained on a NVIDIA GTX1080Ti GPU (11 GB).
|
|
|
6 |
- DNA
|
7 |
- biology
|
8 |
- genomics
|
9 |
+
datasets:
|
10 |
+
- zhangtaolab/plant-multi-species-lncRNAs
|
11 |
+
base_model:
|
12 |
+
- zhangtaolab/plant-dnabert-BPE
|
13 |
---
|
14 |
# Plant foundation DNA large language models
|
15 |
|
|
|
42 |
```python
|
43 |
from transformers import AutoModelForSequenceClassification, AutoTokenizer, pipeline
|
44 |
|
45 |
+
model_name = 'plant-dnabert-BPE-lncRNAs'
|
46 |
# load model and tokenizer
|
47 |
model = AutoModelForSequenceClassification.from_pretrained(f'zhangtaolab/{model_name}', trust_remote_code=True)
|
48 |
tokenizer = AutoTokenizer.from_pretrained(f'zhangtaolab/{model_name}', trust_remote_code=True)
|
|
|
64 |
|
65 |
|
66 |
#### Hardware
|
67 |
+
Model was trained on an NVIDIA GTX1080Ti GPU (11 GB).
|