Spaces:

AFischer1985
/

BERUFENET.AI

Running

App Files Files Community

AFischer1985 committed on Oct 15, 2024

Commit

66cb21c

verified ·

1 Parent(s): a2398ee

Update to Jina-embeddings

Browse files

Files changed (1) hide show

run.py +57 -37

run.py CHANGED Viewed

@@ -2,10 +2,9 @@
 # Title:  BERUFENET.AI
 # Author: Andreas Fischer
 # Date:   January 4th, 2024
-# Last update: February 8th, 2024
 #############################################################################
-import os
 dbPath="/home/af/Schreibtisch/Code/gradio/BERUFENET/db"
 if(os.path.exists(dbPath)==False): dbPath="/home/user/app/db"
@@ -15,42 +14,52 @@ print(dbPath)
 #-----------
 import chromadb
-#client = chromadb.Client()
 path=dbPath
 client = chromadb.PersistentClient(path=path)
 print(client.heartbeat())
 print(client.get_version())
 print(client.list_collections())
 from chromadb.utils import embedding_functions
-default_ef = embedding_functions.DefaultEmbeddingFunction()
-sentence_transformer_ef = embedding_functions.SentenceTransformerEmbeddingFunction(model_name="T-Systems-onsite/cross-en-de-roberta-sentence-transformer")
 #instructor_ef = embedding_functions.InstructorEmbeddingFunction(model_name="hkunlp/instructor-large", device="cuda")
 print(str(client.list_collections()))
 global collection
-if("name=BerufenetDB1" in str(client.list_collections())): #(False):
   print("BerufenetDB1 found!")
-  collection = client.get_collection(name="BerufenetDB1", embedding_function=sentence_transformer_ef)
 print("Database ready!")
 print(collection.count())
-# Model
-#-------
-from huggingface_hub import InferenceClient
-import gradio as gr
-client = InferenceClient("mistralai/Mixtral-8x7B-Instruct-v0.1")
 # Gradio-GUI
 #------------
 import gradio as gr
 import json
 def format_prompt(message, history):
   prompt = "" #"<s>"
   #for user_prompt, bot_response in history:
@@ -59,26 +68,17 @@ def format_prompt(message, history):
   prompt += f"[INST] {message} [/INST]"
   return prompt
-def response(
-    prompt, history, temperature=0.9, max_new_tokens=500, top_p=0.95, repetition_penalty=1.0,
-):
-    temperature = float(temperature)
-    if temperature < 1e-2: temperature = 1e-2
-    top_p = float(top_p)
-    generate_kwargs = dict(
-        temperature=temperature,
-        max_new_tokens=max_new_tokens,
-        top_p=top_p,
-        repetition_penalty=repetition_penalty,
-        do_sample=True,
-        seed=42,
-    )
     addon=""
     results=collection.query(
       query_texts=[prompt],
-      n_results=5,
-      #where={"source": "google-docs"}
-      #where_document={"$contains":"search_string"}
     )
     dists=["<br><small>(relevance: "+str(round((1-d)*100)/100)+";" for d in results['distances'][0]]
     sources=["source: "+s["source"]+")</small>" for s in results['metadatas'][0]]
@@ -89,14 +89,34 @@ def response(
     if(len(results)>1):
       addon=" Bitte berücksichtige bei deiner Antwort ggf. folgende Auszüge aus unserer Datenbank, sofern sie für die Antwort erforderlich sind. Beantworte die Frage knapp und präzise. Ignoriere unpassende Datenbank-Auszüge OHNE sie zu kommentieren, zu erwähnen oder aufzulisten:\n"+"\n".join(results)
     system="Du bist ein deutschsprachiges KI-basiertes Assistenzsystem, das zu jedem Anliegen möglichst geeignete Berufe empfiehlt."+addon+"\n\nUser-Anliegen:"
-    formatted_prompt = format_prompt(system+"\n"+prompt, history)
-    stream = client.text_generation(formatted_prompt, **generate_kwargs, stream=True, details=True, return_full_text=False)
     output = ""
-    for response in stream:
         output += response.token.text
         yield output
     output=output+"\n\n<br><details open><summary><strong>Sources</strong></summary><br><ul>"+ "".join(["<li>" + s + "</li>" for s in combination])+"</ul></details>"
     yield output
-gr.ChatInterface(response, chatbot=gr.Chatbot(value=[[None,"Herzlich willkommen! Ich bin ein KI-basiertes Assistenzsystem, das für jede Anfrage die am besten passenden Berufe empfiehlt.<br>Erzähle mir, was du gerne tust!"]],render_markdown=True),title="German BERUFENET-RAG-Interface to the Hugging Face Hub").queue().launch(share=True) #False, server_name="0.0.0.0", server_port=7864)
 print("Interface up and running!")

 # Title:  BERUFENET.AI
 # Author: Andreas Fischer
 # Date:   January 4th, 2024
+# Last update: October 15th, 2024
 #############################################################################
 dbPath="/home/af/Schreibtisch/Code/gradio/BERUFENET/db"
 if(os.path.exists(dbPath)==False): dbPath="/home/user/app/db"
 #-----------
 import chromadb
+from chromadb import Documents, EmbeddingFunction, Embeddings
+import torch # chromaDB
+from transformers import AutoTokenizer, AutoModel # chromaDB
+jina = AutoModel.from_pretrained('jinaai/jina-embeddings-v2-base-de', trust_remote_code=True, torch_dtype=torch.bfloat16)
+#jina.save_pretrained("jinaai_jina-embeddings-v2-base-de")
+device='cuda:0' if torch.cuda.is_available() else 'cpu'
+jina.to(device) #cuda:0
+print(device)
+class JinaEmbeddingFunction(EmbeddingFunction):
+  def __call__(self, input: Documents) -> Embeddings:
+    embeddings = jina.encode(input) #max_length=2048
+    return(embeddings.tolist())
 path=dbPath
 client = chromadb.PersistentClient(path=path)
 print(client.heartbeat())
 print(client.get_version())
 print(client.list_collections())
 from chromadb.utils import embedding_functions
+#default_ef = embedding_functions.DefaultEmbeddingFunction()
+#sentence_transformer_ef = embedding_functions.SentenceTransformerEmbeddingFunction(model_name="T-Systems-onsite/cross-en-de-roberta-sentence-transformer")
 #instructor_ef = embedding_functions.InstructorEmbeddingFunction(model_name="hkunlp/instructor-large", device="cuda")
+jina_ef=JinaEmbeddingFunction()
+embeddingFunction=jina_ef
 print(str(client.list_collections()))
 global collection
+if("name=BerufenetDB1" in str(client.list_collections())):
   print("BerufenetDB1 found!")
+  collection = client.get_collection(name="BerufenetDB1", embedding_function=embeddingFunction)
 print("Database ready!")
 print(collection.count())
 # Gradio-GUI
 #------------
+from huggingface_hub import InferenceClient
 import gradio as gr
 import json
+myModel="mistralai/Mixtral-8x7B-Instruct-v0.1"
 def format_prompt(message, history):
   prompt = "" #"<s>"
   #for user_prompt, bot_response in history:
   prompt += f"[INST] {message} [/INST]"
   return prompt
+def response(prompt, history, hfToken):
+    inferenceClient=""
+    if(hfToken.startswith("hf_")): # use HF-hub with custom token if token is provided
+      inferenceClient = InferenceClient(model=myModel, token=hfToken)
+    else:
+      inferenceClient = InferenceClient(myModel)
+    generate_kwargs = dict(temperature=float(0.9), max_new_tokens=500, top_p=0.95, repetition_penalty=1.0, do_sample=True, seed=42)
     addon=""
     results=collection.query(
       query_texts=[prompt],
+      n_results=5
     )
     dists=["<br><small>(relevance: "+str(round((1-d)*100)/100)+";" for d in results['distances'][0]]
     sources=["source: "+s["source"]+")</small>" for s in results['metadatas'][0]]
     if(len(results)>1):
       addon=" Bitte berücksichtige bei deiner Antwort ggf. folgende Auszüge aus unserer Datenbank, sofern sie für die Antwort erforderlich sind. Beantworte die Frage knapp und präzise. Ignoriere unpassende Datenbank-Auszüge OHNE sie zu kommentieren, zu erwähnen oder aufzulisten:\n"+"\n".join(results)
     system="Du bist ein deutschsprachiges KI-basiertes Assistenzsystem, das zu jedem Anliegen möglichst geeignete Berufe empfiehlt."+addon+"\n\nUser-Anliegen:"
+    formatted_prompt = format_prompt(system+"\n"+prompt, history)
     output = ""
+    print(""+str(inferenceClient))
+    try:
+      stream = inferenceClient.text_generation(formatted_prompt, **generate_kwargs, stream=True, details=True, return_full_text=False)
+      for response in stream:
         output += response.token.text
         yield output
+    except Exception as e:
+      output = "Für weitere Antworten von der KI gebe bitte einen gültigen HuggingFace-Token an."
+      if(len(combination)>0):
+        output += "\nBis dahin helfen dir hoffentlich die folgenden Quellen weiter:"
+      yield output
+      print(str(e))
     output=output+"\n\n<br><details open><summary><strong>Sources</strong></summary><br><ul>"+ "".join(["<li>" + s + "</li>" for s in combination])+"</ul></details>"
     yield output
+gr.ChatInterface(
+  response,
+  chatbot=gr.Chatbot(value=[[None,"Herzlich willkommen! Ich bin ein KI-basiertes Assistenzsystem, das für jede Anfrage die am besten passenden Berufe empfiehlt.<br>Erzähle mir, was du gerne tust!"]],render_markdown=True),
+  title="BERUFENET.AI (Jina-Embeddings)",
+  additional_inputs=[
+    gr.Textbox(
+      value="",
+      label="HF_token"),
+  ]
+  ).queue().launch(share=True) #False, server_name="0.0.0.0", server_port=7864)
 print("Interface up and running!")