-
-
Notifications
You must be signed in to change notification settings - Fork 5.4k
Commit
This commit does not belong to any branch on this repository, and may belong to a fork outside of the repository.
--------- Co-authored-by: cal066 <[email protected]> Co-authored-by: oobabooga <[email protected]> Co-authored-by: randoentity <[email protected]>
- Loading branch information
1 parent
8dbaa20
commit 7a4fcee
Showing
9 changed files
with
188 additions
and
43 deletions.
There are no files selected for viewing
This file contains bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters
This file contains bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters
Original file line number | Diff line number | Diff line change |
---|---|---|
@@ -0,0 +1,76 @@ | ||
from ctransformers import AutoConfig, AutoModelForCausalLM | ||
|
||
from modules import shared | ||
from modules.callbacks import Iteratorize | ||
from modules.logging_colors import logger | ||
|
||
|
||
class CtransformersModel:
    """Thin wrapper around a ctransformers causal language model.

    The wrapper exposes ``encode``/``decode`` (delegating to the model's
    ``tokenize``/``detokenize``) together with blocking and streaming text
    generation, so a single object can serve both roles.
    """

    def __init__(self):
        # Filled in by from_pretrained(). Declared per instance so that two
        # loaded wrappers never share a model through a class attribute.
        self.model = None

    @classmethod
    def from_pretrained(cls, path):
        """Load the model found at *path* and wrap it.

        Args:
            path: Location of the model; it must support ``str()`` and, when
                the model type is auto-detected, ``is_file()`` / ``parent``.

        Returns:
            A 2-tuple containing the same wrapper twice.
            NOTE(review): presumably unpacked by the caller as
            ``(model, tokenizer)`` -- confirm against the loader.
        """
        result = cls()
        auto_type = result.model_type_is_auto()

        # ctransformers uses -1 for random seed
        seed = shared.args.llama_cpp_seed
        config = AutoConfig.from_pretrained(
            str(path),
            threads=shared.args.threads,
            gpu_layers=shared.args.n_gpu_layers,
            batch_size=shared.args.n_batch,
            stream=True,
            seed=(-1 if seed == 0 else seed)
        )

        # Store the model on the instance being returned, not on the class:
        # inside a classmethod the first argument is the class itself, so
        # assigning through it would leak the model to every other instance.
        result.model = AutoModelForCausalLM.from_pretrained(
            str(result.model_dir(path) if auto_type else path),
            model_type=(None if auto_type else shared.args.model_type),
            config=config
        )

        logger.info(f'Using ctransformers model_type: {result.model.model_type} for {result.model.model_path}')
        return result, result

    def model_type_is_auto(self):
        """Return True when the configured model type is "Auto" or "None"."""
        return shared.args.model_type in ("Auto", "None")

    def model_dir(self, path):
        """Return the parent of *path* if it is a file, otherwise *path* itself."""
        if path.is_file():
            return path.parent

        return path

    def encode(self, string, **kwargs):
        """Tokenize *string* with the wrapped model; extra kwargs are ignored."""
        return self.model.tokenize(string)

    def decode(self, ids):
        """Convert token *ids* back to text with the wrapped model."""
        return self.model.detokenize(ids)

    def generate(self, prompt, state, callback=None):
        """Generate text for *prompt* and return the complete output string.

        Args:
            prompt: The prompt as ``str``; any other object is converted by
                calling its ``decode()`` method (e.g. ``bytes``).
            state: Mapping providing ``max_new_tokens``, ``temperature``,
                ``top_p``, ``top_k`` and ``repetition_penalty``.
            callback: Optional callable invoked with every generated token
                as soon as it is produced.

        Returns:
            The concatenation of all generated tokens.
        """
        # isinstance also accepts str subclasses, which have no decode().
        if not isinstance(prompt, str):
            prompt = prompt.decode()

        generator = self.model._stream(
            prompt=prompt,
            max_new_tokens=state['max_new_tokens'],
            temperature=state['temperature'],
            top_p=state['top_p'],
            top_k=state['top_k'],
            repetition_penalty=state['repetition_penalty'],
            threads=shared.args.threads
        )

        pieces = []
        for token in generator:
            if callback:
                callback(token)

            pieces.append(token)

        return "".join(pieces)

    def generate_with_streaming(self, *args, **kwargs):
        """Yield the cumulative reply after each newly generated token.

        Positional and keyword arguments are forwarded to ``generate``
        through ``Iteratorize``.
        """
        with Iteratorize(self.generate, args, kwargs, callback=None) as generator:
            reply = ''
            for token in generator:
                reply += token
                yield reply
This file contains bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters
This file contains bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters
This file contains bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters
This file contains bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters
This file contains bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters
This file contains bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters
This file contains bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters