Update README.md
Browse files
README.md
CHANGED
|
@@ -7,7 +7,9 @@ My model is a state-of-the-art language processing AI designed to understand and
|
|
# How to use?
from transformers import AutoModelForCausalLM, AutoTokenizer
from transformers.generation import GenerationConfig
import torch

# Load the model in bfloat16 with flash-attention-2 and automatic device placement.
# trust_remote_code is required because the repo ships custom modeling code.
model = AutoModelForCausalLM.from_pretrained(
    'TwT-6/open_llm_leaderboard_demo',
    attn_implementation="flash_attention_2",
    trust_remote_code=True, torch_dtype=torch.bfloat16, device_map="auto").eval()
tokenizer = AutoTokenizer.from_pretrained('TwT-6/open_llm_leaderboard_demo', trust_remote_code=True)

# Wrap the user message in the model's chat template and tokenize onto the GPU.
prompt = '你好'
prompt = f'<|omni_start|>### User:\n{prompt}\n\n### Assistant:\n'
model_inputs = tokenizer(prompt, return_tensors="pt").to('cuda')

# Generate, then keep only the newly produced tokens by slicing off the prompt.
generated_ids = model.generate(**model_inputs)[0].cpu()
completion = tokenizer.decode(generated_ids[model_inputs.input_ids.shape[-1]:])

print(completion)
# How to use?
from transformers import AutoModelForCausalLM, AutoTokenizer
from transformers.generation import GenerationConfig
import torch

# Instantiate the model in eval mode: bfloat16 weights, flash-attention-2 kernels,
# and device_map="auto" to spread layers across available accelerators.
model = AutoModelForCausalLM.from_pretrained(
    'TwT-6/open_llm_leaderboard_demo',
    attn_implementation="flash_attention_2",
    trust_remote_code=True, torch_dtype=torch.bfloat16, device_map="auto").eval()
tokenizer = AutoTokenizer.from_pretrained('TwT-6/open_llm_leaderboard_demo', trust_remote_code=True)

# Format the user turn with the model's chat markers, then move tensors to CUDA.
user_text = '你好'
chat_prompt = f'<|omni_start|>### User:\n{user_text}\n\n### Assistant:\n'
encoded = tokenizer(chat_prompt, return_tensors="pt").to('cuda')

# Run generation; drop the prompt tokens so only the assistant reply is decoded.
output_ids = model.generate(**encoded)[0].cpu()
reply = tokenizer.decode(output_ids[encoded.input_ids.shape[-1]:])

print(reply)
|