Update README.md
Browse files
README.md
CHANGED
@@ -2,9 +2,9 @@
|
|
2 |
license: apache-2.0
|
3 |
---
|
4 |
|
5 |
-
# LucaGPLM
|
6 |
|
7 |
-
LucaGPLM - The LUCA
|
8 |
|
9 |
## Installation
|
10 |
|
@@ -20,14 +20,17 @@ pip install lucagplm
|
|
20 |
from lucagplm import LucaGPLMModel, LucaGPLMTokenizer
|
21 |
|
22 |
# Load model
|
23 |
-
model = LucaGPLMModel.from_pretrained("
|
24 |
-
tokenizer = LucaGPLMTokenizer.from_pretrained("
|
25 |
|
26 |
# Example usage
|
27 |
seq = "ATCG"
|
|
|
28 |
inputs = tokenizer(seq, seq_type="gene",return_tensors="pt")
|
29 |
outputs = model(**inputs)
|
30 |
|
|
|
|
|
31 |
seq = "NSQTA"
|
32 |
inputs = tokenizer(seq, seq_type="prot",return_tensors="pt")
|
33 |
outputs = model(**inputs)
|
|
|
2 |
license: apache-2.0
|
3 |
---
|
4 |
|
5 |
+
# LucaOne/LucaGPLM (old checkpoint)
|
6 |
|
7 |
+
LucaOne/LucaGPLM - The LUCA Gene-Protein language model.
|
8 |
|
9 |
## Installation
|
10 |
|
|
|
20 |
from lucagplm import LucaGPLMModel, LucaGPLMTokenizer
|
21 |
|
22 |
# Load model
|
23 |
+
model = LucaGPLMModel.from_pretrained("LucaGroup/LucaOne-default-step5.6M")
|
24 |
+
tokenizer = LucaGPLMTokenizer.from_pretrained("LucaGroup/LucaOne-default-step5.6M")
|
25 |
|
26 |
# Example usage
|
27 |
seq = "ATCG"
|
28 |
+
# seq_type="gene" covers nucleotide sequences (DNA or RNA)
|
29 |
inputs = tokenizer(seq, seq_type="gene",return_tensors="pt")
|
30 |
outputs = model(**inputs)
|
31 |
|
32 |
+
print(outputs.last_hidden_state.shape)
|
33 |
+
|
34 |
seq = "NSQTA"
|
35 |
inputs = tokenizer(seq, seq_type="prot",return_tensors="pt")
|
36 |
outputs = model(**inputs)
|