File size: 4,322 Bytes
7e9684b
 
4c66227
7e9684b
 
 
 
4c66227
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
7e9684b
 
 
 
4c66227
 
 
7e9684b
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
import json
from langchain.schema import SystemMessage, HumanMessage
                  
def get_optimized_search_messages(query):
    messages = [
        SystemMessage(
            content="""
                You are a serach query optimizer specialist.
                Provide a better search query for web search engine to answer the given question, end the queries with ’**’
                Tips:
                    Identify the key concepts in the question
                    Remove filler words like "how to", "what is", "I want to"
                    Removed style such as "in the style of", "engaging", "short", "long"
                    Remove lenght instruction (example: essay, article, letter, blog, post, blogpost, etc)
                    Keep it short, around 3-7 words total
                    Put the most important keywords first
                    Remove formatting instructions
                    Remove style instructions (exmaple: in the style of, engaging, short, long)
                    Remove lenght instruction (example: essay, article, letter, etc)
                Example:
                    Question: How do I bake chocolate chip cookies from scratch?
                    Search query: chocolate chip cookies recipe from scratch**
                Example:
                    Question: I would like you to show me a time line of Marie Curie life. Show results as a markdown table
                    Search query: Marie Curie timeline**
                Example:
                    Question: I would like you to write a long article on nato vs russia. Use know geopolical frameworks.
                    Search query: geopolitics nato russia**
                Example:
                    Question: Write a engaging linkedin post about Andrew Ng
                    Search query: Andrew Ng**
                Example:
                    Question: Write a short artible about the solar system in the style of Carl Sagan
                    Search query: solar system**
                Example:
                    Question: Should I use Kubernetes? Answer in the style of Gilfoyde from the TV show Silicon Valley
                    Search query: Kubernetes decision**
                Example:
                    Question: biography of napoleon. include a table with the major events.
                    Search query: napoleon biography events**
                """
        ),
        HumanMessage(
            content=f"""
                Provide a better search query for web search engine to answer the given question, provide only one search query and nothing else, end the queries with ’**’.              
                Question: {query}
                Search query: 
            """
        ),
    ]
    return messages

def get_query_with_sources_messages(query, relevant_docs):
    messages = [
        SystemMessage(
            content="""
    You are an expert research assistant.
    You are provided with a Context in JSON format and a Question.

    Use RAG to answer the Question, providing references and links to the Context material you retrieve and use in your answer:
    When generating your answer, follow these steps:
    - Retrieve the most relevant context material from your knowledge base to help answer the question
    - Cite the references you use by including the title, author, publication, and a link to each source
    - Synthesize the retrieved information into a clear, informative answer to the question
    - Format your answer in Markdown, using heading levels 2-3 as needed
    - Include a "References" section at the end with the full citations and link for each source you used


    Example of Context JSON entry:
    {
        "page_content": "This provides access to material related to ...",
        "metadata": {
            "title": "Introduction - Marie Curie: Topics in Chronicling America",
            "link": "https://guides.loc.gov/chronicling-america-marie-curie"
        }
    }

    """
        ),
        HumanMessage(
            content= f"""
        Context information is below.
        Context: 
        ---------------------
        {json.dumps(relevant_docs, indent=2, ensure_ascii=False)}
        ---------------------
        Question: {query}
        Answer:
    """
        ),
    ]
    return messages