Final_Assignment_Template

Running

Coool2 committed 7 days ago

Commit

95f4977

verified ·

1 Parent(s): 2281e58

Update agent.py

Files changed (1) hide show

agent.py CHANGED Viewed

@@ -99,12 +99,13 @@ code_llm = HuggingFaceLLM(
 embed_model = HuggingFaceEmbedding(
     model_name="llamaindex/vdr-2b-multi-v1",
-    device="cpu",  # "mps" for mac, "cuda" for nvidia GPUs
     trust_remote_code=True,
     model_kwargs={
-        "torch_dtype": torch.float16,
-        "device_map": "auto"  # Optional: for better GPU memory management
-    })
 Settings.llm = proj_llm
 Settings.embed_model = embed_model
@@ -266,8 +267,8 @@ class DynamicQueryEngineManager:
                     top_n=3,
                     device="cpu",
                     model_kwargs={
-                        "torch_dtype": torch.float16,
-                        "device_map": "auto"
                     }
                 )
             def postprocess_nodes(self, nodes, query_bundle):

 embed_model = HuggingFaceEmbedding(
     model_name="llamaindex/vdr-2b-multi-v1",
+    device="cpu",
     trust_remote_code=True,
     model_kwargs={
+        "torch_dtype": torch.float32,  # Use float32 for CPU
+        "low_cpu_mem_usage": True,     # Still get memory optimization
+    }
+)
 Settings.llm = proj_llm
 Settings.embed_model = embed_model
                     top_n=3,
                     device="cpu",
                     model_kwargs={
+                        "torch_dtype": torch.float32,  # Use float32 for CPU
+                        "low_cpu_mem_usage": True,     # Still get memory optimization
                     }
                 )
             def postprocess_nodes(self, nodes, query_bundle):