Jaamie committed on
Commit
2e238f3
·
verified ·
1 Parent(s): 69dd81f

Upload 2 files

Browse files

Using a quantised version of Gemma-2-9B (neuralmagic/gemma-2-9b-it-quantized.w4a16)

Files changed (2) hide show
  1. app.py +2 -2
  2. requirements.txt +2 -0
app.py CHANGED
@@ -161,8 +161,8 @@ device = torch.device("cuda" if torch.cuda.is_available() else "cpu")
161
  # #model = AutoModelForCausalLM.from_pretrained(READER_MODEL_NAME)
162
  # model = AutoModelForCausalLM.from_pretrained(READER_MODEL_NAME).to(device)
163
 
164
- #model_id = "neuralmagic/gemma-2-9b-it-quantized.w4a16"
165
- model_id = "TheBloke/Gemma-2-7B-IT-GGUF"
166
  tokenizer = AutoTokenizer.from_pretrained(model_id)
167
  model = AutoModelForCausalLM.from_pretrained(
168
  model_id,
 
161
  # #model = AutoModelForCausalLM.from_pretrained(READER_MODEL_NAME)
162
  # model = AutoModelForCausalLM.from_pretrained(READER_MODEL_NAME).to(device)
163
 
164
+ model_id = "neuralmagic/gemma-2-9b-it-quantized.w4a16"
165
+ #model_id = "TheBloke/Gemma-2-7B-IT-GGUF"
166
  tokenizer = AutoTokenizer.from_pretrained(model_id)
167
  model = AutoModelForCausalLM.from_pretrained(
168
  model_id,
requirements.txt CHANGED
@@ -13,4 +13,6 @@ openai-whisper
13
  uuid
14
  textwrap3
15
  python-dotenv
 
 
16
 
 
13
  uuid
14
  textwrap3
15
  python-dotenv
16
+ pyngrok
17
+ compressed-tensors
18