Spaces:

achraf2203
/

RAG-Chatbot

Sleeping

mohamedachraf committed on Aug 4

Commit

831dfea

1 Parent(s): f27624c

modify the pipeline

Files changed (1) hide show

app.py CHANGED Viewed

@@ -31,11 +31,11 @@ import tempfile
 # Prompt template
 template = """Context: {context}
-Question: {question}
-Answer: Based on the provided context, """
-QA_PROMPT = PromptTemplate(template=template, input_variables=["question", "context"])
 # Load Phi-2 model from hugging face hub
 model_id = "microsoft/phi-2"
@@ -148,18 +148,16 @@ def generate(question, answer, text_file, max_new_tokens):
         )
         phi2_pipeline = pipeline(
             "text-generation",
-            tokenizer=tokenizer,
             model=model,
             max_new_tokens=max_new_tokens,
             pad_token_id=tokenizer.eos_token_id,
             eos_token_id=tokenizer.eos_token_id,
-            do_sample=True,
-            temperature=0.7,
-            top_p=0.9,
-            repetition_penalty=1.1,
             streamer=streamer,
         )
         hf_model = HuggingFacePipeline(pipeline=phi2_pipeline)
         qa_chain, vectorstore = get_retrieval_qa_chain(text_file, hf_model)

 # Prompt template
 template = """Context: {context}
+Question: {query}
+Answer:"""
+QA_PROMPT = PromptTemplate(template=template, input_variables=["query", "context"])
 # Load Phi-2 model from hugging face hub
 model_id = "microsoft/phi-2"
         )
         phi2_pipeline = pipeline(
             "text-generation",
             model=model,
+            tokenizer=tokenizer,
             max_new_tokens=max_new_tokens,
+            do_sample=False,               # ← greedy
             pad_token_id=tokenizer.eos_token_id,
             eos_token_id=tokenizer.eos_token_id,
             streamer=streamer,
         )
         hf_model = HuggingFacePipeline(pipeline=phi2_pipeline)
         qa_chain, vectorstore = get_retrieval_qa_chain(text_file, hf_model)