-
Notifications
You must be signed in to change notification settings - Fork 10
Commit
This commit does not belong to any branch on this repository, and may belong to a fork outside of the repository.
Capturing vectorstore deployment url (#80)
* update vectorstore deployment url Signed-off-by: sachintendulkar576123 <[email protected]>
- Loading branch information
1 parent
1495544
commit b17c2d1
Showing
10 changed files
with
963 additions
and
5 deletions.
There are no files selected for viewing
This file contains bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters
This file contains bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters
This file contains bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters
This file contains bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters
This file contains bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters
This file contains bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters
This file contains bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters
Original file line number | Diff line number | Diff line change |
---|---|---|
@@ -0,0 +1,218 @@ | ||
import os | ||
from datasets import load_dataset | ||
from haystack import Document, Pipeline | ||
from haystack.components.builders import PromptBuilder | ||
from haystack.components.embedders import ( | ||
SentenceTransformersDocumentEmbedder, | ||
SentenceTransformersTextEmbedder, | ||
) | ||
from haystack.components.generators import OpenAIGenerator | ||
from haystack_integrations.components.retrievers.opensearch import OpenSearchEmbeddingRetriever | ||
from haystack_integrations.document_stores.opensearch import OpenSearchDocumentStore | ||
|
||
from haystack.document_stores.types import DuplicatePolicy | ||
from haystack.utils import Secret | ||
from opentelemetry.sdk.trace.export import BatchSpanProcessor, ConsoleSpanExporter | ||
from monocle_apptrace.instrumentor import setup_monocle_telemetry | ||
from monocle_apptrace.wrap_common import llm_wrapper, task_wrapper | ||
from monocle_apptrace.wrapper import WrapperMethod | ||
|
||
def _require_env(name):
    """Return the value of environment variable *name*; raise if unset or empty."""
    value = os.getenv(name)
    if not value:
        raise RuntimeError(f"Required environment variable {name} is not set")
    return value


def haystack_app():
    """Run a Haystack RAG pipeline over OpenSearch with Monocle tracing enabled.

    The function indexes the "bilgeyucel/seven-wonders" dataset into an
    OpenSearch document store, builds an embed -> retrieve -> prompt -> LLM
    pipeline, and runs one fixed question through it. Spans are exported to
    the console through ``ConsoleSpanExporter``.

    Configuration is read from the environment so that no credentials live
    in source control:

    * ``OPENAI_API_KEY`` -- required, key for the OpenAI generator.
    * ``OPENSEARCH_USERNAME`` / ``OPENSEARCH_PASSWORD`` -- required, HTTP
      basic-auth credentials for the OpenSearch cluster.
    * ``OPENSEARCH_HOST`` -- optional, URL of the OpenSearch endpoint.

    Returns:
        The dictionary returned by ``Pipeline.run`` for the sample question.

    Raises:
        RuntimeError: If a required environment variable is missing or empty.
    """
    # Validate configuration first so a missing secret fails fast, before
    # telemetry is installed or any model/dataset download starts.
    api_key = _require_env("OPENAI_API_KEY")
    http_auth = (
        _require_env("OPENSEARCH_USERNAME"),
        _require_env("OPENSEARCH_PASSWORD"),
    )
    opensearch_host = os.getenv(
        "OPENSEARCH_HOST",
        "https://search-sachin-opensearch-cvvd5pdeyrme2l2y26xmcpkm2a.us-east-1.es.amazonaws.com",
    )

    setup_monocle_telemetry(
        workflow_name="haystack_app_1",
        span_processors=[BatchSpanProcessor(ConsoleSpanExporter())],
        wrapper_methods=[],
    )

    # initialize
    generator = OpenAIGenerator(
        api_key=Secret.from_token(api_key), model="gpt-3.5-turbo"
    )
    document_store = OpenSearchDocumentStore(
        hosts=opensearch_host,
        use_ssl=True,
        verify_certs=True,
        http_auth=http_auth,
    )
    # One model name shared by the document and query embedders: both sides
    # must embed into the same vector space for retrieval to be meaningful.
    model = "sentence-transformers/all-mpnet-base-v2"

    dataset = load_dataset("bilgeyucel/seven-wonders", split="train")
    documents = [Document(content=doc["content"], meta=doc["meta"]) for doc in dataset]
    document_embedder = SentenceTransformersDocumentEmbedder(model=model)
    document_embedder.warm_up()
    documents_with_embeddings = document_embedder.run(documents)

    # SKIP keeps re-runs of this script from failing on already-indexed documents.
    document_store.write_documents(
        documents_with_embeddings.get("documents"), policy=DuplicatePolicy.SKIP
    )

    # embedder to embed user query
    text_embedder = SentenceTransformersTextEmbedder(model=model)

    # get relevant documents from embedded query
    retriever = OpenSearchEmbeddingRetriever(document_store=document_store)

    # use documents to build the prompt
    template = """
    Given the following information, answer the question.

    Context:
    {% for document in documents %}
        {{ document.content }}
    {% endfor %}

    Question: {{question}}
    Answer:
    """

    prompt_builder = PromptBuilder(template=template)

    basic_rag_pipeline = Pipeline()
    # Add components to your pipeline
    basic_rag_pipeline.add_component("text_embedder", text_embedder)
    basic_rag_pipeline.add_component("retriever", retriever)
    basic_rag_pipeline.add_component("prompt_builder", prompt_builder)
    basic_rag_pipeline.add_component("llm", generator)

    # Now, connect the components to each other
    basic_rag_pipeline.connect("text_embedder.embedding", "retriever.query_embedding")
    basic_rag_pipeline.connect("retriever", "prompt_builder.documents")
    basic_rag_pipeline.connect("prompt_builder", "llm")

    question = "What does Rhodes Statue look like?"

    response = basic_rag_pipeline.run(
        {"text_embedder": {"text": question}, "prompt_builder": {"question": question}}
    )

    return response
|
||
|
||
haystack_app() | ||
|
||
# { | ||
# "name": "haystack.retriever", | ||
# "context": { | ||
# "trace_id": "0xa599cf84e013b83c58e3afaf8a7058f8", | ||
# "span_id": "0x90b01a17810b9b38", | ||
# "trace_state": "[]" | ||
# }, | ||
# "kind": "SpanKind.INTERNAL", | ||
# "parent_id": "0x557fc857283d8651", | ||
# "start_time": "2024-11-26T09:52:00.845732Z", | ||
# "end_time": "2024-11-26T09:52:01.742785Z", | ||
# "status": { | ||
# "status_code": "UNSET" | ||
# }, | ||
# "attributes": { | ||
# "span.type": "retrieval", | ||
# "entity.count": 2, | ||
# "entity.1.name": "OpenSearchDocumentStore", | ||
# "entity.1.type": "vectorstore.OpenSearchDocumentStore", | ||
# "entity.1.deployment": "https://search-sachin-opensearch-cvvd5pdeyrme2l2y26xmcpkm2a.us-east-1.es.amazonaws.com:443", | ||
# "entity.2.name": "sentence-transformers/all-mpnet-base-v2", | ||
# "entity.2.type": "model.embedding.sentence-transformers/all-mpnet-base-v2" | ||
# }, | ||
# "events": [], | ||
# "links": [], | ||
# "resource": { | ||
# "attributes": { | ||
# "service.name": "haystack_app_1" | ||
# }, | ||
# "schema_url": "" | ||
# } | ||
# } | ||
# { | ||
# "name": "haystack.components.generators.openai.OpenAIGenerator", | ||
# "context": { | ||
# "trace_id": "0xa599cf84e013b83c58e3afaf8a7058f8", | ||
# "span_id": "0x1de03fa69ab19977", | ||
# "trace_state": "[]" | ||
# }, | ||
# "kind": "SpanKind.INTERNAL", | ||
# "parent_id": "0x557fc857283d8651", | ||
# "start_time": "2024-11-26T09:52:01.742785Z", | ||
# "end_time": "2024-11-26T09:52:03.804858Z", | ||
# "status": { | ||
# "status_code": "UNSET" | ||
# }, | ||
# "attributes": { | ||
# "span.type": "inference", | ||
# "entity.count": 2, | ||
# "entity.1.type": "inference.azure_oai", | ||
# "entity.1.inference_endpoint": "https://api.openai.com/v1/", | ||
# "entity.2.name": "gpt-3.5-turbo", | ||
# "entity.2.type": "model.llm.gpt-3.5-turbo" | ||
# }, | ||
# "events": [ | ||
# { | ||
# "name": "metadata", | ||
# "timestamp": "2024-11-26T09:52:03.804858Z", | ||
# "attributes": { | ||
# "completion_tokens": 126, | ||
# "prompt_tokens": 2433, | ||
# "total_tokens": 2559 | ||
# } | ||
# } | ||
# ], | ||
# "links": [], | ||
# "resource": { | ||
# "attributes": { | ||
# "service.name": "haystack_app_1" | ||
# }, | ||
# "schema_url": "" | ||
# } | ||
# } | ||
# { | ||
# "name": "haystack.core.pipeline.pipeline.Pipeline", | ||
# "context": { | ||
# "trace_id": "0xa599cf84e013b83c58e3afaf8a7058f8", | ||
# "span_id": "0x557fc857283d8651", | ||
# "trace_state": "[]" | ||
# }, | ||
# "kind": "SpanKind.INTERNAL", | ||
# "parent_id": null, | ||
# "start_time": "2024-11-26T09:52:00.681588Z", | ||
# "end_time": "2024-11-26T09:52:03.805858Z", | ||
# "status": { | ||
# "status_code": "UNSET" | ||
# }, | ||
# "attributes": { | ||
# "monocle_apptrace.version": "0.3.0", | ||
# "span.type": "workflow", | ||
# "entity.1.name": "haystack_app_1", | ||
# "entity.1.type": "workflow.haystack" | ||
# }, | ||
# "events": [ | ||
# { | ||
# "name": "data.input", | ||
# "timestamp": "2024-11-26T09:52:00.684591Z", | ||
# "attributes": { | ||
# "question": "What does Rhodes Statue look like?" | ||
# } | ||
# }, | ||
# { | ||
# "name": "data.output", | ||
# "timestamp": "2024-11-26T09:52:03.805858Z", | ||
# "attributes": { | ||
# "response": [ | ||
# "The Rhodes Statue was a colossal statue of the Greek sun-god Helios, standing approximately 33 meters (108 feet) high. It featured a standard rendering of a head with curly hair and spikes of bronze or silver flame radiating from it. The statue was constructed with iron tie bars and brass plates to form the skin, and filled with stone blocks during construction. The statue collapsed at the knees during an earthquake in 226 BC and remained on the ground for over 800 years. It was ultimately destroyed and the remains were sold. The exact appearance of the statue, aside from its size and head details, is unknown." | ||
# ] | ||
# } | ||
# } | ||
# ], | ||
# "links": [], | ||
# "resource": { | ||
# "attributes": { | ||
# "service.name": "haystack_app_1" | ||
# }, | ||
# "schema_url": "" | ||
# } | ||
# } |
Oops, something went wrong.