-
Notifications
You must be signed in to change notification settings - Fork 0
Expand file tree
/
Copy pathrag.py
More file actions
executable file
·694 lines (580 loc) · 32.4 KB
/
rag.py
File metadata and controls
executable file
·694 lines (580 loc) · 32.4 KB
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
129
130
131
132
133
134
135
136
137
138
139
140
141
142
143
144
145
146
147
148
149
150
151
152
153
154
155
156
157
158
159
160
161
162
163
164
165
166
167
168
169
170
171
172
173
174
175
176
177
178
179
180
181
182
183
184
185
186
187
188
189
190
191
192
193
194
195
196
197
198
199
200
201
202
203
204
205
206
207
208
209
210
211
212
213
214
215
216
217
218
219
220
221
222
223
224
225
226
227
228
229
230
231
232
233
234
235
236
237
238
239
240
241
242
243
244
245
246
247
248
249
250
251
252
253
254
255
256
257
258
259
260
261
262
263
264
265
266
267
268
269
270
271
272
273
274
275
276
277
278
279
280
281
282
283
284
285
286
287
288
289
290
291
292
293
294
295
296
297
298
299
300
301
302
303
304
305
306
307
308
309
310
311
312
313
314
315
316
317
318
319
320
321
322
323
324
325
326
327
328
329
330
331
332
333
334
335
336
337
338
339
340
341
342
343
344
345
346
347
348
349
350
351
352
353
354
355
356
357
358
359
360
361
362
363
364
365
366
367
368
369
370
371
372
373
374
375
376
377
378
379
380
381
382
383
384
385
386
387
388
389
390
391
392
393
394
395
396
397
398
399
400
401
402
403
404
405
406
407
408
409
410
411
412
413
414
415
416
417
418
419
420
421
422
423
424
425
426
427
428
429
430
431
432
433
434
435
436
437
438
439
440
441
442
443
444
445
446
447
448
449
450
451
452
453
454
455
456
457
458
459
460
461
462
463
464
465
466
467
468
469
470
471
472
473
474
475
476
477
478
479
480
481
482
483
484
485
486
487
488
489
490
491
492
493
494
495
496
497
498
499
500
501
502
503
504
505
506
507
508
509
510
511
512
513
514
515
516
517
518
519
520
521
522
523
524
525
526
527
528
529
530
531
532
533
534
535
536
537
538
539
540
541
542
543
544
545
546
547
548
549
550
551
552
553
554
555
556
557
558
559
560
561
562
563
564
565
566
567
568
569
570
571
572
573
574
575
576
577
578
579
580
581
582
583
584
585
586
587
588
589
590
591
592
593
594
595
596
597
598
599
600
601
602
603
604
605
606
607
608
609
610
611
612
613
614
615
616
617
618
619
620
621
622
623
624
625
626
627
628
629
630
631
632
633
634
635
636
637
638
639
640
641
642
643
644
645
646
647
648
649
650
651
652
653
654
655
656
657
658
659
660
661
662
663
664
665
666
667
668
669
670
671
672
673
674
675
676
677
678
679
680
681
682
683
684
685
686
687
688
689
690
691
692
693
694
# Streamlit app with all the functionalities: "Grantly", a grant/fellowship
# RAG chat assistant (Pinecone retrieval + DSPy chain-of-thought generation).
import os
import sys
import types
from pathlib import Path
import streamlit as st
from langchain_community.document_loaders import PyPDFLoader, UnstructuredWordDocumentLoader
from langchain.text_splitter import RecursiveCharacterTextSplitter
from langchain_openai import OpenAIEmbeddings, ChatOpenAI
from langchain_community.vectorstores import FAISS
from langchain_community.retrievers import BM25Retriever
import dspy # type: ignore
from dspy import Prediction # type: ignore
import base64
from io import BytesIO
import requests
import json
import openai
from openai import OpenAI
from mistralai import Mistral # type: ignore
from streamlit_pdf_viewer import pdf_viewer # type: ignore
from langchain_pinecone import PineconeVectorStore
import hashlib
from vendor_dsparse import parse_and_chunk_text

# --- Pinecone setup: connect and create the serverless index on first run ---
pinecone_api_key = st.secrets["PINECONE_API_KEY"]
pinecone_env = st.secrets.get("PINECONE_ENVIRONMENT", "us-east-1")
index_name = "grant-rag"
from pinecone import Pinecone, ServerlessSpec
pc = Pinecone(api_key=pinecone_api_key)
if index_name not in pc.list_indexes().names():
    # dimension=1536 matches the text-embedding-3-small model configured below.
    pc.create_index(
        name=index_name,
        dimension=1536,
        metric="cosine",
        spec=ServerlessSpec(cloud="aws", region=pinecone_env)
    )

# Pre-optimized DSPy CoT module; its compiled prompts live in the JSON file.
from grant_cot_module import GrantCoTModule
optimized_cot = GrantCoTModule()
optimized_cot.load("optimized_grant_cot.json")

# --- LiteLLM Patch ---
# HACK: stub out a litellm submodule before dspy's backend imports it —
# presumably works around a litellm/openai version mismatch; TODO confirm
# whether this is still needed with current litellm.
os.environ["LITELLM_USE_CACHE"] = "False"
os.environ["LITELLM_LOGGING"] = "False"
dummy_module = types.SimpleNamespace()
dummy_module.TranscriptionCreateParams = types.SimpleNamespace()
dummy_module.TranscriptionCreateParams.__annotations__ = {}
sys.modules["litellm.litellm_core_utils.openai_types"] = dummy_module

# --- API Key ---
OPENAI_API_KEY = st.secrets["OPENAI_API_KEY"]
MISTRAL_API_KEY = st.secrets["MISTRAL_API_KEY"]

# --- DSPy Init ---
lm = dspy.LM("openai/gpt-4o", api_key=OPENAI_API_KEY)
try:
    dspy.configure(lm=lm)
except RuntimeError:
    # dspy can refuse to reconfigure on Streamlit reruns; keep the first config.
    pass
# Fetch a web-grounded answer from the Perplexity chat-completions API.
def fetch_with_perplexity(query, api_key):
    """Send *query* to Perplexity ("sonar-pro") and return the reply text.

    Any failure — network error, non-2xx status, unexpected payload shape —
    is reported as a human-readable error string instead of raising, so
    callers can render it directly in the UI.
    """
    endpoint = "https://api.perplexity.ai/chat/completions"
    request_headers = {
        "Authorization": f"Bearer {api_key}",
        "Content-Type": "application/json"
    }
    body = {
        "model": "sonar-pro",
        "messages": [{"role": "user", "content": query}],
        "search": True
    }
    try:
        resp = requests.post(endpoint, headers=request_headers, json=body, timeout=30)
        resp.raise_for_status()
        reply = resp.json()
        return reply["choices"][0]["message"]["content"]
    except Exception as e:
        return f"🌐 Perplexity API error: {e}"
# Refine a previously generated answer. Every piece of prior context is passed
# in so the model has everything it needs to edit faithfully.
def refine_answer_with_instruction(system_prompt, context, original_question, optimized_question, previous_answer, user_instruction):
    """Ask GPT-4o to revise *previous_answer* per *user_instruction*.

    Returns the refined answer text (stripped of surrounding whitespace).
    """
    refine_prompt = f"""
{system_prompt}
Below is the context and the original exchange. The user now wants to refine the answer with additional instructions.
Context:
{context}
Original Question: {original_question}
Optimized Question: {optimized_question}
Previous Answer:
{previous_answer}
User Instruction:
{user_instruction}
Refined Answer:
"""
    openai_client = OpenAI(api_key=OPENAI_API_KEY)
    completion = openai_client.chat.completions.create(
        model="gpt-4o",
        messages=[{"role": "user", "content": refine_prompt}],
        temperature=0.3
    )
    return completion.choices[0].message.content.strip()
# OCR a PDF uploaded through the viewer using Mistral's OCR endpoint.
def extract_text_with_mistral_ocr(uploaded_pdf):
    """Return the OCR'd text of *uploaded_pdf* as one markdown string.

    The file is sent inline as a base64 data URL; per-page markdown results
    are joined with blank lines.
    """
    # Read the upload and encode it for the data-URL transport.
    raw_bytes = uploaded_pdf.read()
    encoded_pdf = base64.b64encode(raw_bytes).decode('utf-8')
    # Initialize Mistral client.
    client = Mistral(api_key=MISTRAL_API_KEY)
    # Run OCR over the whole document.
    ocr_response = client.ocr.process(
        model="mistral-ocr-latest",
        document={
            "type": "document_url",
            "document_url": f"data:application/pdf;base64,{encoded_pdf}"
        },
        include_image_base64=False  # Set to True if you want images included
    )
    # Concatenate markdown content from all pages.
    pages_markdown = [page.markdown for page in ocr_response.pages]
    return "\n\n".join(pages_markdown)
# Function to extract questions from the uploaded document using GPT-4o.
def extract_questions_with_gpt4o(document_text, api_key):
    """Use GPT-4o to pull every application question out of a grant document.

    Parameters:
        document_text: raw text of the grant/fellowship document.
        api_key: OpenAI API key.

    Returns:
        A list of question strings; empty list when the reply is unparseable.
    """
    prompt = f"""
Extract all questions from the following grant or fellowship document text. Return ONLY the questions as a JSON list.
Text:
\"\"\"
{document_text}
\"\"\"
Questions:
"""
    client = OpenAI(api_key=api_key)
    response = client.chat.completions.create(
        model="gpt-4o",
        messages=[{"role": "user", "content": prompt}],
        temperature=0
    )
    content = response.choices[0].message.content
    return _parse_question_list(content)


def _parse_question_list(content):
    """Best-effort parse of a model reply into a list of question strings."""
    import re
    # GPT-4o frequently wraps JSON in markdown fences (```json ... ```);
    # strip them before the strict parse.
    cleaned = re.sub(r"^```(?:json)?\s*|\s*```$", "", content.strip())
    try:
        parsed = json.loads(cleaned)
    except Exception:
        # Fall back to the first bracketed span anywhere in the reply.
        match = re.search(r"\[.*\]", content, re.DOTALL)
        if match:
            try:
                parsed = json.loads(match.group(0))
            except Exception:
                # Bug fix: the original let this second json.loads raise.
                parsed = []
        else:
            parsed = []
    # Bug fix: the model sometimes returns {"questions": [...]} — the
    # original returned that dict verbatim, breaking downstream iteration.
    if isinstance(parsed, dict):
        parsed = parsed.get("questions", [])
    if not isinstance(parsed, list):
        return []
    return [str(q) for q in parsed]
# --- Streamlit Setup ---
st.set_page_config(page_title="Grant & Fellowship Chat Assistant", layout="wide")
# Five equal-width columns; placing the title in the middle one centers it.
# (The previous comment claimed the center column was 2x wider — it is not.)
col1, col2, col3, col4, col5 = st.columns([1, 1, 1, 1, 1])
with col3:
    st.markdown(
        """
<link href="https://fonts.googleapis.com/css?family=Pacifico&display=swap" rel="stylesheet">
<h1 style='font-family: Pacifico, cursive; text-align: center;'>
Grantly
</h1>
""",
        # Bug fix: the CSS fallback was "cursiv" — an invalid generic family
        # name, so browsers ignored it if the Pacifico font failed to load.
        unsafe_allow_html=True
    )
# --- Optional Sidebar Context ---
with st.sidebar:
    st.markdown("### 📥 Upload Grant/Reference Documents")
    # Documents dropped here are saved into the Grants folder and embedded
    # into the Pinecone vectorstore (handled further down in the script).
    new_grant_file = st.file_uploader(
        "Upload a new PDF or DOCX to be added to the Grants folder and vectorstore:",
        type=["pdf", "docx"],
        key="grant_uploader"
    )
    st.markdown("---")
    # 🆕 Combined Grant URL and Grant Name Input
    st.markdown("#### 🌐 Grant Website or Name")
    # Free-form text; passed verbatim to Perplexity to fetch grant details.
    grant_combined_input = st.text_area(
        "Paste the grant/fellowship website link and/or name:",
        help="Example:\nhttps://gatesfoundation.org/grants\nGates Foundation Grand Challenges 2025"
    )
    st.markdown("---")
    # File uploader (sidebar): the grant application PDF to preview, OCR,
    # and mine for questions.
    uploaded_pdf = st.file_uploader(
        "📂 Upload a Grant PDF",
        type=["pdf"],
        label_visibility="visible"
    )
# Preview the uploaded PDF, OCR it with Mistral, and surface any application
# questions found in it as clickable buttons.
pdf_text = ""
if uploaded_pdf:
    file_ext = Path(uploaded_pdf.name).suffix.lower()
    # 👀 Preview first
    if file_ext == ".pdf":
        pdf_bytes = uploaded_pdf.read()
        pdf_viewer(input=pdf_bytes, width=700, height=900, annotations=[])
        uploaded_pdf.seek(0)  # rewind so the OCR step below can re-read the stream
    else:
        st.error("Unsupported format.")
        st.stop()
    # 🔍 Send PDF or Docx directly to Mistral OCR afterwards
    with st.spinner("🔍 Extracting text via Mistral OCR..."):
        api_key = st.secrets["MISTRAL_API_KEY"]
        client = Mistral(api_key=api_key)
        base64_file = base64.b64encode(uploaded_pdf.read()).decode("utf-8")
        ocr_response = client.ocr.process(
            model="mistral-ocr-latest",
            document={"type": "document_url", "document_url": f"data:application/{file_ext[1:]};base64,{base64_file}"},
            include_image_base64=False,
            image_limit=0
        )
        pdf_text = "\n\n".join(page.markdown for page in ocr_response.pages)

# --- Question Extraction with GPT-4o ---
# Only run once per session; the result is cached in session state.
if pdf_text and "extracted_questions" not in st.session_state:
    with st.spinner("🔍 Extracting questions from document..."):
        questions = extract_questions_with_gpt4o(
            pdf_text, OPENAI_API_KEY
        )
        st.session_state.extracted_questions = questions

if st.session_state.get("extracted_questions"):
    st.markdown("### 📋 Extracted Questions")
    for i, q in enumerate(st.session_state.extracted_questions):
        btn_label = q[:75] + "..." if len(q) > 75 else q
        if st.button(btn_label, key=f"q_{i}"):
            st.session_state.raw_query = q
            # Bug fix: this flag must be set BEFORE st.rerun() — st.rerun()
            # raises RerunException, so any statement after it never executes
            # and the clicked question was silently dropped.
            st.session_state.input_triggered_by_click = True
            st.rerun()
# --- Fetch Grant Information from Perplexity ---
# If the user supplied a grant URL/name, ask Perplexity for a structured
# summary; the result is appended to the system prompt later on.
webpage_text = ""
if grant_combined_input.strip():
    with st.spinner("🌐 Fetching Grant Info via Perplexity..."):
        try:
            browse_query = f"""
You are a researcher. Please extract all important information from the provided URL (if present) and the grant name.
Input:
{grant_combined_input}
Return a clean detailed structured text.
"""
            webpage_text = fetch_with_perplexity(browse_query, st.secrets["PERPLEXITY_API_KEY"])
        except Exception as e:
            # Best effort: a failed fetch should not block the chat flow.
            st.warning(f"🌐 Could not fetch grant data: {e}")
# if webpage_text.strip():
#     st.markdown("### 🌐 Grant/Fellowship Information Retrieved from the Web")
#     st.info(webpage_text)
# Right-aligned "Clear Chat" button: wipes all session state and reruns.
col1, col2, col3 = st.columns([5, 1, 1])
with col3:
    if st.button("🧹 Clear Chat"):
        st.session_state.clear()
        st.rerun()
# Handle clear chat logic
# NOTE(review): nothing in this file ever sets "clear_chat", so this branch
# looks like dead code — confirm before removing.
if st.session_state.get("clear_chat"):
    st.session_state.clear()
    st.rerun()
# --- Defaults ---
# Seed session state on first run (and after a Clear Chat wipe).
if "chat_history" not in st.session_state:
    st.session_state.chat_history = []
if "latest_system_prompt" not in st.session_state:
    st.session_state.latest_system_prompt = ""
if "latest_context" not in st.session_state:
    st.session_state.latest_context = ""
if "selected_template" not in st.session_state:
    st.session_state.selected_template = "Personal Fellowships"
# --- Config ---
# Bug fix: embedding_model was assigned twice with the same value; the
# duplicate has been removed.
embedding_model = "text-embedding-3-small"  # OpenAI embedding model (1536 dims)
doc_dir = "Grants"             # local folder holding grant documents
persist_dir = "./vectorstore"  # NOTE(review): appears unused since the Pinecone switch — confirm
chunk_size = 1000              # characters per chunk when splitting documents
chunk_overlap = 200            # overlap between consecutive chunks
top_k_vector = 15              # pool size for the vector-similarity stage
top_k_bm25 = 3                 # docs kept by the BM25 stage
top_k_final = 5                # docs kept after LLM reranking
embeddings = OpenAIEmbeddings(model=embedding_model, openai_api_key=OPENAI_API_KEY)
# --- Document Loader ---
# (Bulk loader kept for reference: the app now reads from an existing
#  Pinecone index instead of re-embedding the Grants folder on startup.)
# @st.cache_resource
# def load_all_documents():
#     all_chunks = []
#     for path in Path(doc_dir).rglob("*"):
#         if path.suffix not in [".pdf", ".docx"]:
#             continue
#         loader = PyPDFLoader(str(path)) if path.suffix == ".pdf" else UnstructuredWordDocumentLoader(str(path))
#         try:
#             docs = loader.load()
#             for doc in docs: # For each raw doc
#                 agentic_chunks = parse_and_chunk_text(doc.page_content, chunk_size=chunk_size, overlap=chunk_overlap)
#                 for i, chunk in enumerate(agentic_chunks):
#                     chunk.metadata["filename"] = str(path.relative_to(doc_dir)).replace("\\", "/")
#                     chunk.metadata["chunk_id"] = i
#                     all_chunks.append(chunk)
#         except Exception as e:
#             st.warning(f"❌ Error loading {path}: {e}")
#     return all_chunks
# chunks = load_all_documents()

# Shared handles used by retrieval and by the upload-ingestion path below.
index = pc.Index(index_name)
vectorstore = PineconeVectorStore(index=index, embedding=embeddings)
# --- Vectorstore ---
def create_and_populate_vectorstore(chunks):
    """Build and return a PineconeVectorStore handle for the shared index.

    NOTE: despite the name, the bulk add_documents call is commented out,
    so *chunks* is currently unused and nothing is written to the index.
    """
    embed_fn = OpenAIEmbeddings(model=embedding_model, openai_api_key=OPENAI_API_KEY)
    pinecone_client = Pinecone(api_key=pinecone_api_key)
    pinecone_index = pinecone_client.Index(index_name)
    store = PineconeVectorStore(index=pinecone_index, embedding=embed_fn)
    # store.add_documents(chunks) (for bulk upload)
    return store
def get_file_hash(file_path):
    """Return the first 10 hex characters of the file's SHA-256 digest.

    The file is streamed in 64 KiB chunks so arbitrarily large documents
    can be hashed without loading them fully into memory.
    """
    chunk_bytes = 65536
    digest = hashlib.sha256()
    with open(file_path, 'rb') as fh:
        # iter() with a sentinel yields chunks until read() returns b"".
        for block in iter(lambda: fh.read(chunk_bytes), b''):
            digest.update(block)
    return digest.hexdigest()[:10]
# Ingest a newly uploaded grant document: save it locally, chunk it, and
# upsert the chunks into the Pinecone vectorstore.
if new_grant_file:
    # Persist the upload into the local Grants folder first.
    file_path = Path("Grants") / new_grant_file.name
    with open(file_path, "wb") as f:
        f.write(new_grant_file.read())
    st.success(f"✅ Saved `{new_grant_file.name}` to Grants/")
    loader = PyPDFLoader(str(file_path)) if file_path.suffix == ".pdf" else UnstructuredWordDocumentLoader(str(file_path))
    try:
        docs = loader.load()
        new_chunks = []
        for doc in docs:
            # Corrected variable name:
            agentic_chunks = parse_and_chunk_text(doc.page_content, chunk_size=chunk_size, overlap=chunk_overlap)
            new_chunks.extend(agentic_chunks)
        # Content-based hash keys the vectors, so re-uploading the same file
        # overwrites its existing vectors instead of duplicating them.
        doc_hash = get_file_hash(file_path)
        ids = []
        for i, chunk in enumerate(new_chunks):
            chunk.metadata["filename"] = str(file_path.relative_to("Grants")).replace("\\", "/")
            chunk.metadata["chunk_id"] = i
            ids.append(f"{doc_hash}#{i}")
        vectorstore.add_documents(new_chunks, ids=ids)
        st.success("✅ Document successfully embedded and added to Pinecone vectorstore!")
    except Exception as e:
        st.error(f"❌ Failed to process document: {e}")
# --- DSPy Modules ---
class QueryOptimizationModule(dspy.Module):
    """Rewrites a raw user question into a clearer, retrieval-friendly query.

    Note: the rewrite is done with a direct ChatOpenAI call, not a DSPy
    predictor — the unused `dspy.Predict("query -> optimized_query")`
    attribute from the original has been removed as dead state.
    """

    def __init__(self):
        super().__init__()

    def forward(self, query):
        """Return the LLM-optimized rewrite of *query* as a plain string."""
        llm = ChatOpenAI(openai_api_key=OPENAI_API_KEY, temperature=0)
        prompt = (
            "Rewrite the following grant application question to be as clear, specific, and context-rich as possible for searching a knowledge base. "
            "Do not add unrelated information. Only return the improved query.\n\n"
            f"Original question: {query}\n\nOptimized query:"
        )
        return llm.invoke(prompt).content.strip()
class HybridRetrievalModule(dspy.Module):
    """Hybrid retrieval first vector then BM25 on that pool of documents."""

    def __init__(self, vectorstore):
        super().__init__()
        self.vectorstore = vectorstore

    def forward(self, optimized_query, top_k_vector=50, top_k_bm25=5):
        """Return a de-duplicated candidate pool for *optimized_query*."""
        # Stage 1: dense similarity search builds a broad candidate pool.
        pool = self.vectorstore.similarity_search(optimized_query, k=top_k_vector)
        # Stage 2: lexical (BM25) scoring over that same pool.
        lexical = BM25Retriever.from_documents(pool).invoke(optimized_query)[:top_k_bm25]
        # Stage 3: merge both lists, deduplicating on (filename, chunk_id).
        unique = {}
        for document in pool + lexical:
            dedup_key = (document.metadata['filename'], document.metadata['chunk_id'])
            unique[dedup_key] = document
        return list(unique.values())
class RerankModule(dspy.Module):
    """LLM-based pointwise reranker: scores each chunk 0-10 for relevance."""

    def __init__(self):
        super().__init__()
        self.rerank = dspy.Predict("question, docs -> top_docs")

    def forward(self, question, docs, top_n=5):
        """Return the *top_n* documents ranked by LLM relevance score.

        A chunk whose score cannot be obtained or parsed gets 0.0, so a
        single malformed reply never aborts the whole rerank.
        """
        llm = ChatOpenAI(openai_api_key=OPENAI_API_KEY, temperature=0)
        scored = []
        for doc in docs:
            prompt = f"""You are a helpful assistant. Score how relevant this chunk is to answering the user's question.
Chunk:
\"\"\"{doc.page_content}\"\"\"
Question: {question}
Score (0 to 10):"""
            try:
                # Fix: use invoke() (predict() is deprecated in langchain and
                # this matches QueryOptimizationModule's usage).
                score = float(llm.invoke(prompt).content.strip())
            except Exception:
                # Bug fix: the bare `except:` also swallowed
                # KeyboardInterrupt/SystemExit; Exception is the right scope.
                score = 0.0
            scored.append((score, doc))
        return [doc for score, doc in sorted(scored, reverse=True, key=lambda x: x[0])[:top_n]]
class GrantRAG(dspy.Module):
    """DSPy answer generator conditioned on prompt, context, and history."""

    def __init__(self):
        super().__init__()
        self.generate = dspy.Predict("system_prompt, context, question, history -> answer")

    def forward(self, system_prompt, context, question, history):
        """Run the predictor and return its Prediction (with `.answer`)."""
        prediction = self.generate(
            system_prompt=system_prompt,
            context=context,
            question=question,
            history=history,
        )
        return prediction
# --- Template Buttons ---
# The selected template decides which system prompt is used downstream.
st.markdown("📋 **Choose Grant Type Template**")
col1, col2, col3 = st.columns(3)
if col1.button("🎓 Personal Fellowships"):
    st.session_state.selected_template = "Personal Fellowships"
if col2.button("💼 Industry Grants"):
    st.session_state.selected_template = "Industry Grants"
if col3.button("🔬 Academic Research Grants"):
    st.session_state.selected_template = "Academic Research Grants"
st.markdown(f"📌 **Selected Template:** `{st.session_state.selected_template}`")
# --- Query Input ---
query = st.chat_input("Ask something about your grant/fellowship...")
# A question clicked in the sidebar arrives through session state rather
# than the chat box; consume it once and clear the flag.
if st.session_state.get("input_triggered_by_click") and not query:
    query = st.session_state.raw_query
    st.session_state.input_triggered_by_click = False # Reset
# Optimize the incoming query, then pause for user review before retrieval.
if query:
    with st.spinner("🔍 Optimizing Query..."):
        query_optimizer = QueryOptimizationModule()
        optimized_query = query_optimizer(query)
        st.session_state.optimized_query = optimized_query
        st.session_state.raw_query = query
        # Retrieval only starts after the user confirms the optimized query.
        st.session_state.proceed_triggered = False
if "optimized_query" in st.session_state and not st.session_state.get("proceed_triggered", False):
    st.markdown("### ✍️ Optimized Query")
    edited_query = st.text_area("Modify the optimized query below if needed:", st.session_state.optimized_query)
    if st.button("✅ Proceed with this optimized query"):
        st.session_state.optimized_query = edited_query.strip()
        st.session_state.proceed_triggered = True
        st.rerun()
# --- Retrieval + Answer ---
# Main pipeline: hybrid retrieval -> LLM rerank -> prompt assembly -> CoT
# answer; optionally augmented with a Perplexity web answer. Runs once per
# confirmed query (proceed_triggered is reset at the end).
if st.session_state.get("proceed_triggered", False):
    with st.spinner("🔍 Retrieving + Generating Answer..."):
        retriever = HybridRetrievalModule(vectorstore)
        initial_docs = retriever(st.session_state.optimized_query, top_k_vector=top_k_vector, top_k_bm25=top_k_bm25)
        reranker = RerankModule()
        top_docs = reranker(st.session_state.optimized_query, initial_docs, top_n=top_k_final)
        # Build the context string with [Chunk N] anchor markers plus a
        # marker -> (chunk_id, filename, content) map for the sources panel.
        context, inline_map = "", {}
        for doc in top_docs:
            cid = doc.metadata["chunk_id"]
            marker = f"[Chunk {cid}](#chunk-{cid})"
            context += f"{marker}\n{doc.page_content}\n\n---\n\n"
            inline_map[marker] = (cid, doc.metadata["filename"], doc.page_content)
        # Flatten prior turns into a plain-text transcript.
        full_history = ""
        for turn in st.session_state.chat_history:
            full_history += f"User: {turn['question']}\nAssistant: {turn['answer']}\n\n"
        # --- System Prompt ---
        # One long template per grant type; selected via the template buttons.
        if st.session_state.selected_template == "Personal Fellowships":
            system_prompt = f"""You are a helpful assistant for personal fellowship applications. You will be given:
- The original question asked by the user,
- An optimized version of that question for improved clarity,
- A set of retrieved document chunks related to past applications.
Your job is to generate an accurate, helpful, and clear answer using only the information from the retrieved chunks. Do not invent information. If the documents are unable to provide information relevant to the query, say so.
Most fellowships have a specific call for applications and they have a focus on finding and selecting certain types of individuals with particular kinds of experiences. You must identify the key requirements of the call for fellows and develop an understanding of what the priorities for the fellowship are as stated in the call for applications in the current cycle
You must also search for past fellows and review their profiles and work experience including any projects they pitched for the fellowship so that you understand what kinds of fellows were previously selected including what they had in common
In preparing your set of answers for the fellowship, you must review the background and work history of the individual applying for the project in order to identify specific experiences they may have had that are relevant to mention in response to the fellowship call
Some fellowships are research focused while others are industry focused. Each has a preference for the kind of impact they want to see: gauge the priorities from the call for applicants or from the organizational background and position your answers accordingly
Fellowships usually require precise answers that include quantitative, high-impact outcomes so you must identify the outcomes that the applicant has delivered in the past.
But remember to ensure the outcomes are aligned with the focus area of the fellowship. Do not pick random outcomes that may not fall within the scope of the call for proposals. Prioritize recent achievements and organize them by the skill that they highlight so that when you mention multiple achievements they do not feel discordant.
When presenting different aspects of an applicant’s profile, pick ones that relate to a particular theme that you are expressing in each answer, responding specifically to the question that is provided with an understanding of the recent developments in the field
Your answers must feel coherent, human-written, and impressive without using flowery language that sounds like a language model created it
Remember that you must be realistic in your answers and try to provide evidence of the current gaps and how your proposed solution or project may bridge these gaps
Fellowships want ambitious individuals. When you are writing your answers, be bold and be ambitious. But always remember to make claims that the applicant has demonstrably made past progress on. Making arbitrary claims hurts the applicant rather than helping them. Be bold but be pragmatic in presenting your answers.
Cite chunks inline using this format: [Chunk X].
Original Question: {st.session_state.raw_query}
"""
        elif st.session_state.selected_template == "Industry Grants":
            system_prompt = f"""
You are a helpful assistant for writing industry-focused grant proposals. You will be given:
- The original question asked by the user,
- An optimized version of that question for improved clarity,
- A set of retrieved document chunks related to successful past grant proposals, industry standards, and background information about the applicant and their venture.
Your job is to generate an accurate, clear, and compelling answer using only the information from the retrieved chunks. Do not invent information. If the documents do not provide information relevant to the query, state this clearly.
When writing industry-based grant proposals, you must:
- Identify and address the specific requirements, priorities, and evaluation criteria of the grant call, referencing the current cycle’s guidelines and any relevant industry trends.
- Clearly define the problem or industry gap being addressed, using quantitative data, statistics, and real-world examples, especially those relevant to the applicant’s operational geographies.
- Articulate the innovation or solution, describing its technical and practical merits, how it advances the state of the art, and how it compares to existing alternatives. Highlight unique features, scalability, and competitive advantages.
- Demonstrate the impact and relevance of the project for the industry, community, or society, using concrete examples and anticipated outcomes. Address economic, social, and policy implications where relevant.
- Provide a detailed methodology or plan of work, outlining the approach, timeline, milestones, and risk mitigation strategies. Ensure the plan is feasible and aligns with industry best practices.
- Present a well-justified budget, linking requested funds to specific activities and outcomes. Include any co-funding, partnerships, or sustainability plans for post-grant continuation.
- Highlight the qualifications and diversity of the team, referencing specific expertise, roles, and past achievements. Where possible, include brief bios of key personnel and their relevant experience, especially as it relates to the proposal’s focus area.
- Situate the proposal within the broader competitive and regulatory landscape, referencing direct and indirect competitors, relevant standards, or compliance requirements.
- Reference past successes, partnerships, and recognition (e.g., awards, accelerator participation, impact metrics) to demonstrate credibility and track record.
- If asked about limitations or risks, answer candidly, referencing any known gaps or challenges and the strategies in place to address them.
Your answers must:
- Be structured according to industry grant writing best practices, including clear sections such as Executive Summary, Problem Statement, Solution/Innovation, Methodology, Impact, Team, Budget, Evaluation, and Sustainability.
- Be specific, actionable, and tailored to the question, avoiding generic statements.
- Use evidence and examples from the retrieved chunks to support all claims.
- Clearly articulate what differentiates the applicant’s approach or solution from others in the field.
- Maintain a professional yet accessible tone, suitable for reviewers from both technical and non-technical backgrounds.
- When discussing scale, sustainability, or vision, connect the proposal to broader industry trends and long-term goals.
- If the retrieved documents do not provide sufficient information to answer the query, say so clearly.
Cite chunks inline using this format: [Chunk X].
Original Question: {st.session_state.raw_query}
"""
        else:
            system_prompt = f"""You are an expert assistant for preparing a **Research Grant Application Section or Literature Review**.
Your role is to:
- Provide a tailored, coherent, and insightful write-up.
- Support your narrative with **citations from retrieved documents** in the form [Chunk X].
This will help the applicant:
- Clearly state their **research question**, **hypotheses** (if provided), and **research context**.
- Provide a **critical review of related literature**, identifying key contributors, gaps in knowledge, and how this proposal will advance understanding.
To do this effectively, consider:
➥ The **original question**, which guides the proposal's main inquiry.
➥ Hypotheses or sub-questions, if provided, to structure your narrative.
➥ Names of key researchers, keywords, focus areas, or time periods the applicant highlights (this can help you filter and emphasize relevant context).
➥ The **research design constraints** (if any), to align your content with what's feasible.
➥ Whether the applicant wants a:
- Literature Review Section (critical review, related work, gaps).
- Research Section (aims, hypotheses, significance, methods).
Your answer should:
- Be coherent, clear, and tailored to the applicant's context.
- Provide a strong **rationale and significance**, demonstrating knowledge of the field and how this proposal adds to it.
- Be backed by **citations to retrieved documents**.
---
Original Question: {st.session_state.raw_query}
"""
        # Added context from uploaded documents
        if pdf_text.strip():
            system_prompt += "\n\n---\n📄 Uploaded Grant PDF Content:\n" + pdf_text.strip()
        # Added context from website
        if webpage_text.strip():
            system_prompt += "\n\n---\n🌐 Retrieved Grant/Fellowship Info from Website:\n" + webpage_text.strip()
        # Store for use in Edit Answer later
        st.session_state.latest_system_prompt = system_prompt
        st.session_state.latest_context = context
        # NOTE(review): the answer is produced by the pre-optimized CoT module
        # from the optimized query alone — system_prompt, context, and
        # full_history are stored but not passed to it; confirm intentional.
        cot_result = optimized_cot(question=st.session_state.optimized_query)
        answer = cot_result.answer
        reasoning = cot_result.reasoning
        # --- Internet (Perplexity) Fetch and Answer Generation ---
        # Academic template only: add a second, web-grounded answer.
        pplx_answer = None
        pplx_generated_answer = None
        if st.session_state.selected_template == "Academic Research Grants":
            with st.spinner("🌐 Fetching Internet Context via Perplexity..."):
                pplx_answer = fetch_with_perplexity(st.session_state.raw_query, st.secrets["PERPLEXITY_API_KEY"])
            if pplx_answer:
                web_prompt = f"""
You are an academic research assistant. Based ONLY on the following Internet information, answer the user's question clearly and accurately.
--- Internet Context ---
{pplx_answer}
------------------------
User's Question: {st.session_state.raw_query}
Answer:
"""
                web_llm = ChatOpenAI(openai_api_key=OPENAI_API_KEY, temperature=0.3)
                pplx_generated_answer = web_llm.invoke(web_prompt).content.strip()
        # --- Store everything in session ---
        history_item = {
            "question": st.session_state.raw_query,
            "optimized_query": st.session_state.optimized_query,
            "reasoning": reasoning,
            "answer": answer,
            "sources": inline_map,
            "system_prompt": system_prompt,
            "context": context
        }
        if pplx_answer:
            history_item["pplx_answer"] = pplx_answer # raw web search
        if pplx_generated_answer:
            history_item["pplx_generated_answer"] = pplx_generated_answer # full generated answer from web
        st.session_state.chat_history.append(history_item)
        # Reset so the next rerun does not re-run retrieval.
        st.session_state.proceed_triggered = False
# --- Chat History ---
# Render every stored turn: question, answer, edit panel, optional web
# answer/context, reasoning, and the cited source chunks.
if st.session_state.get("chat_history"):
    for turn in st.session_state.chat_history:
        st.chat_message("user").markdown(turn["question"])
        st.chat_message("assistant").markdown(turn.get("answer", ""))
        with st.expander("✏️ Edit Answer"):
            # Widget keys are derived from hash(question) to stay unique per
            # turn within this server process.
            edit_instruction = st.text_area(
                f"Provide edits or additions for this answer:",
                key=f"instruction_{hash(turn['question'])}"
            )
            if st.button("🔄 Apply Instruction", key=f"apply_{hash(turn['question'])}"):
                with st.spinner("✍️ Refining answer..."):
                    refined = refine_answer_with_instruction(
                        system_prompt=st.session_state.get("latest_system_prompt", ""),
                        context=st.session_state.get("latest_context", ""),
                        original_question=turn['question'],
                        optimized_question=turn['optimized_query'],
                        previous_answer=turn['answer'],
                        user_instruction=edit_instruction
                    )
                    # Overwrite the stored answer in place, then redraw.
                    turn['answer'] = refined
                    st.rerun()
        # Show separate Perplexity Internet-generated Assistant answer
        if "pplx_generated_answer" in turn:
            st.chat_message("assistant").markdown("🌐 **Answer based on Internet Search (Perplexity):**")
            st.chat_message("assistant").markdown(turn["pplx_generated_answer"])
        # Optional: show raw Internet context separately
        if "pplx_answer" in turn:
            with st.expander("🌐 Internet Context Summary (Perplexity)"):
                st.markdown(turn["pplx_answer"])
        if "reasoning" in turn:
            st.markdown(f"**🧠 Reasoning:** {turn['reasoning']}")
        st.markdown(f"**Optimized Query Used:** {turn.get('optimized_query', '')}")
        with st.expander("📄 Source Chunks"):
            # HTML anchors line up with the [Chunk N](#chunk-N) markers in answers.
            for marker, (cid, fname, content) in turn["sources"].items():
                anchor = f"chunk-{cid}"
                st.markdown(f"<a name='{anchor}'></a>", unsafe_allow_html=True)
                st.markdown(f"**{marker}** — *{fname}*")
                st.code(content.strip())