Locutusque
committed on
Commit
•
5e5c79d
1
Parent(s):
af28e3c
Update README.md
Browse files
README.md
CHANGED
@@ -21,8 +21,8 @@ This is a fine-tuned version of gpt2 on Locutusque/InstructMix.
|
|
21 |
This model performs significantly better than Locutusque/gpt2-conversational-or-qa. Here are the training results:
|
22 |
|
23 |
|
24 |
-
- BLEU -
|
25 |
-
- Perplexity -
|
26 |
### Model Description
|
27 |
|
28 |
<!-- Provide a longer summary of what this model is. -->
|
@@ -87,8 +87,8 @@ Use the code below to get started with the model.
|
|
87 |
import torch
|
88 |
from transformers import GPT2Tokenizer, GPT2LMHeadModel
|
89 |
|
90 |
-
tokenizer = GPT2Tokenizer.from_pretrained('gpt2-conversational-retrain')
|
91 |
-
model = GPT2LMHeadModel.from_pretrained('gpt2-conversational-retrain')
|
92 |
device = torch.device("cuda" if torch.cuda.is_available() else "cpu")
|
93 |
model.to(device)
|
94 |
def generate_text(model, tokenizer, prompt, max_length=1024):
|
|
|
21 |
This model performs significantly better than Locutusque/gpt2-conversational-or-qa. Here are the training results:
|
22 |
|
23 |
|
24 |
+
- BLEU - 30
|
25 |
+
- Perplexity - 5
|
26 |
### Model Description
|
27 |
|
28 |
<!-- Provide a longer summary of what this model is. -->
|
|
|
87 |
import torch
|
88 |
from transformers import GPT2Tokenizer, GPT2LMHeadModel
|
89 |
|
90 |
+
tokenizer = GPT2Tokenizer.from_pretrained('gpt2-large-conversational-retrain')
|
91 |
+
model = GPT2LMHeadModel.from_pretrained('gpt2-large-conversational-retrain')
|
92 |
device = torch.device("cuda" if torch.cuda.is_available() else "cpu")
|
93 |
model.to(device)
|
94 |
def generate_text(model, tokenizer, prompt, max_length=1024):
|