Update README.md
README.md (CHANGED)
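This commit reorders the two imports in the usage snippet and removes the zero-shot translation example (the prompt template, the `generate` function, and the sample call):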
````diff
@@ -329,10 +329,9 @@ pip install accelerate
 
 
 ```python
-from transformers import AutoTokenizer, AutoModelForCausalLM
 import torch
+from transformers import AutoTokenizer, AutoModelForCausalLM
 
-# First, we will have to import the tokenizer and the language model
 tokenizer = AutoTokenizer.from_pretrained("norallm/normistral-7b-warm")
 
 # This setup needs about 8gb VRAM
@@ -344,26 +343,4 @@ model = AutoModelForCausalLM.from_pretrained(
     load_in_8bit=True,
     torch_dtype=torch.bfloat16
 )
-
-
-
-# Now we will define the zero-shot prompt template
-prompt = """Engelsk: {0}
-Bokmål:"""
-
-# A function that will take care of generating the output
-@torch.no_grad()
-def generate(text):
-    text = prompt.format(text)
-    input_ids = tokenizer(text, return_tensors='pt').input_ids.cuda()
-    prediction = model.generate(
-        input_ids,
-        max_new_tokens=64,
-        do_sample=False,
-        eos_token_id=tokenizer('\n').input_ids
-    )
-    return tokenizer.decode(prediction[0, input_ids.size(1):]).strip()
-
-# Now you can simply call the generate function with an English text you want to translate:
-generate("I'm super excited about this Norwegian NORA model! Can it translate these sentences?")
 ```
````
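For readers who still want the deleted example, here is a self-contained sketch reassembled from the removed lines above. The prompt template, generation arguments, and sample call are taken verbatim from the diff; the model id and `device_map="auto"` in the `from_pretrained` call are assumptions on my part (the hunk shows only the last two arguments of that call), and `.to(model.device)` stands in for the original `.cuda()` so the sketch also works when `accelerate` places the weights.

```python
import torch
from transformers import AutoTokenizer, AutoModelForCausalLM

tokenizer = AutoTokenizer.from_pretrained("norallm/normistral-7b-warm")

# This setup needs about 8 GB of VRAM (8-bit weights).
# NOTE: the diff only shows the last two arguments of this call;
# the model id and device_map="auto" here are assumptions.
model = AutoModelForCausalLM.from_pretrained(
    "norallm/normistral-7b-warm",
    device_map="auto",
    load_in_8bit=True,
    torch_dtype=torch.bfloat16,
)

# Zero-shot English -> Bokmål prompt template from the removed example
prompt = """Engelsk: {0}
Bokmål:"""

@torch.no_grad()
def generate(text):
    """Translate `text` to Bokmål greedily, stopping at the first newline."""
    text = prompt.format(text)
    input_ids = tokenizer(text, return_tensors="pt").input_ids.to(model.device)
    prediction = model.generate(
        input_ids,
        max_new_tokens=64,
        do_sample=False,
        # Stop token(s) taken from the removed code; depending on the
        # tokenizer configuration, this list may also contain special tokens.
        eos_token_id=tokenizer("\n").input_ids,
    )
    # Decode only the newly generated tokens, not the prompt
    return tokenizer.decode(prediction[0, input_ids.size(1):]).strip()

print(generate("I'm super excited about this Norwegian NORA model! Can it translate these sentences?"))
```

Greedy decoding (`do_sample=False`) with a newline stop token limits each call to a single deterministic output line, which suits sentence-level translation.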