forked from llmware-ai/llmware
-
Notifications
You must be signed in to change notification settings - Fork 0
/
Copy pathgetting_started_with_rag.py
81 lines (57 loc) · 3.56 KB
/
getting_started_with_rag.py
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
"""This example demonstrates Retrieval Augmented Retrieval (RAG) """
import os
from llmware.library import Library
from llmware.retrieval import Query
from llmware.prompts import Prompt
from llmware.setup import Setup
# A self-contained end-to-end example of RAG
def end_to_end_rag(model_name, vector_db="faiss"):
# Create a library called "Agreements", and load it with llmware sample files
print (f"\n > Creating library 'Agreements'...")
library = Library().create_new_library("Agreements")
sample_files_path = Setup().load_sample_files()
library.add_files(os.path.join(sample_files_path,"Agreements"))
# Create vector embeddings for the library using the "industry-bert-contracts" model and store them in Milvus
print (f"\n > Generating vector embeddings using embedding model: 'industry-bert-contracts'...")
library.install_new_embedding(embedding_model_name="industry-bert-contracts", vector_db=vector_db)
# Perform a semantic search against our library. This will gather evidence to be used in the LLM prompt
print (f"\n > Performing a semantic query...")
os.environ["TOKENIZERS_PARALLELISM"] = "false" # Avoid a HuggingFace tokenizer warning
query_results = Query(library).semantic_query("Termination", result_count=20)
# Create a new prompter and add the query_results captured above
prompt_text = "Summarize the termination provisions"
print (f"\n > Prompting LLM with '{prompt_text}'")
prompter = Prompt().load_model(model_name)
sources = prompter.add_source_query_results(query_results)
# Prompt the LLM with the sources and a query string
responses = prompter.prompt_with_source(prompt_text, prompt_name="summarize_with_bullets")
for response in responses:
print ("\n > LLM response\n" + response["llm_response"])
# Finally, generate a CSV report that can be shared
print (f"\n > Generating CSV report...")
report_data = prompter.send_to_human_for_review()
print ("File: " + report_data["report_fp"] + "\n")
return 0
if __name__ == "__main__":
model_name = "llmware/bling-1b-0.1"
# To use an API key based model,
# (1) update the model name, e.g., model_name = "gpt-4"
# (2) set API key in environment variable, e.g., os.environ["USER_MANAGED_OPENAI_API_KEY"] = "<your-key>"
# to update the vector_db, please change the name below, and review the Embedding examples for configuration, if required
end_to_end_rag(model_name, vector_db="faiss")
# **********************************************************************************************************
# ************************************** SAMPLE OUTPUT *****************************************************
# **********************************************************************************************************
'''
> Creating library 'Agreements'...
> Generating vector embeddings using embedding model: 'industry-bert-contracts'...
> Performing a semantic query...
> Prompting LLM with 'Summarize the termination provisions'
> LLM response
- Employment period ends on the first occurrence of either the 6th anniversary of the effective date or a company sale.
- Early termination possible as outlined in sections 3.1 through 3.4.
- Employer can terminate executive's employment under section 3.1 anytime without cause, with at least 30 days' prior written notice.
- If notice is given, the executive is allowed to seek other employment during the notice period.
> Generating CSV report...
File: /Users/.../llmware_data/prompt_history/interaction_report_Fri Dec 8 10:13:51 2023.csv
'''