|
@@ -50,7 +50,9 @@ async def create_item(request: Request):
|
|
|
|
|
|
|
|
|
if __name__ == '__main__':
|
|
|
- model_file = "chatglm-6b"
|
|
|
+ #model_file = "chatglm-6b"
|
|
|
+ #model_file = "THUDM/chatglm-6b-int4-qe"
|
|
|
+ model_file = "chatglm-6b-int4-qe"
|
|
|
tokenizer = AutoTokenizer.from_pretrained(model_file, trust_remote_code=True)
|
|
|
#quantization_config= BitsAndBytesConfig(load_in_8bit=True)
|
|
|
|