Update README.md
Browse files
README.md
CHANGED
@@ -6,28 +6,24 @@ tags:
|
|
6 |
- Text Generation
|
7 |
- research abstract
|
8 |
datasets: pt-sk/research_papers_short
|
|
|
9 |
---
|
10 |
-
```
|
11 |
-
from huggingface_hub import login
|
12 |
-
login()
|
13 |
|
14 |
-
|
15 |
-
|
16 |
-
|
17 |
-
path_or_fileobj="/content/drive/MyDrive/mamba_research_test",
|
18 |
-
path_in_repo="mamba_research_test",
|
19 |
-
repo_id="pt-sk/mamba_scratch",
|
20 |
-
repo_type="model",
|
21 |
-
commit_message="uploaded model file"
|
22 |
-
)
|
23 |
|
24 |
-
from huggingface_hub import HfApi
|
25 |
-
api = HfApi()
|
26 |
|
27 |
-
|
28 |
-
|
29 |
-
|
30 |
-
|
|
|
|
|
|
|
|
|
|
|
31 |
|
32 |
-
|
33 |
-
```
|
|
|
|
6 |
- Text Generation
|
7 |
- research abstract
|
8 |
datasets: pt-sk/research_papers_short
|
9 |
+
metrics: CrossEntropyLoss
|
10 |
---
|
|
|
|
|
|
|
11 |
|
12 |
+
Optimizer: AdamW
|
13 |
+
Learning Rate: 0.001
|
14 |
+
|
|
|
|
|
|
|
|
|
|
|
|
|
15 |
|
|
|
|
|
16 |
|
17 |
+
Import the scripts from the code folder
|
18 |
+
```
|
19 |
+
from model import Mamba, ModelArgs
|
20 |
+
```
|
21 |
+
|
22 |
+
Loading Model
|
23 |
+
```
|
24 |
+
mamba_model = Mamba.from_pretrained("pt-sk/mamba").to("cuda")
|
25 |
+
```
|
26 |
|
27 |
+
Loading Tokenizer
|
28 |
+
```
|
29 |
+
tokenizer = AutoTokenizer.from_pretrained('pt-sk/mamba')
|