Changed the langChain dir name to langchain

Omar Abdelwahab 2025-08-21 19:51:33 -07:00
parent 84c960e9b5
commit 0da0732b07
2 changed files with 521 additions and 0 deletions

@@ -0,0 +1,288 @@
import html
import os
import re
import tempfile
from typing import Any, List, Optional

import requests
from bs4 import BeautifulSoup
from langchain.chains import LLMChain
from langchain_community.document_loaders import PyPDFLoader, TextLoader
from langchain_core.language_models.llms import LLM
from langchain_core.prompts import PromptTemplate
from llama_stack_client import LlamaStackClient
from markdownify import markdownify
from readability import Document as ReadabilityDocument
from rich.pretty import pprint
# Global variables
client = None
llm = None
summary_chain = None
facts_chain = None
qa_chain = None
processed_docs = {}
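# The client, LLM wrapper, and chains are created once in main() and shared
# through these globals so the helper functions below can reach them.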
# Prompt Templates (defined globally)
summary_template = PromptTemplate(
    input_variables=["document"],
    template="""Create a concise summary of this document in 5-10 sentences:
{document}
SUMMARY:""",
)
facts_template = PromptTemplate(
    input_variables=["document"],
    template="""Extract the most important facts from this document. List them as bullet points:
{document}
KEY FACTS:
-""",
)
qa_template = PromptTemplate(
    input_variables=["document", "question"],
    template="""Based on the following document, answer the question. If the answer isn't in the document, say so.
DOCUMENT:
{document}
QUESTION: {question}
ANSWER:""",
)
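# Rendering sketch (illustrative document text, not from a real source): each
# template substitutes its placeholders before the prompt is sent to the model:
#   qa_template.format(document="Llamas are camelids.", question="What are llamas?")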
class LlamaStackLLM(LLM):
    """Simple LangChain wrapper for Llama Stack"""

    # Pydantic model fields
    client: Any = None
    model_id: str = "llama3:70b-instruct"

    def __init__(self, client, model_id: str = "llama3:70b-instruct"):
        # Initialize with field values
        super().__init__(client=client, model_id=model_id)

    def _call(self, prompt: str, stop: Optional[List[str]] = None, **kwargs) -> str:
        """Make inference call to Llama Stack"""
        response = self.client.inference.chat_completion(
            model_id=self.model_id,
            messages=[{"role": "user", "content": prompt}],
        )
        return response.completion_message.content

    @property
    def _llm_type(self) -> str:
        return "llama_stack"
def load_document(source: str) -> str:
    is_url = source.startswith(("http://", "https://"))
    is_pdf = source.lower().endswith(".pdf")
    if is_pdf:
        return load_pdf(source, is_url=is_url)
    elif is_url:
        return load_from_url(source)
    else:
        raise ValueError("Unsupported format. Use URLs or PDF files.")
def load_pdf(source: str, is_url: bool = False) -> str:
    if is_url:
        response = requests.get(source)
        response.raise_for_status()
        with tempfile.NamedTemporaryFile(delete=False, suffix=".pdf") as temp_file:
            temp_file.write(response.content)
            file_path = temp_file.name
    else:
        file_path = source
    try:
        loader = PyPDFLoader(file_path)
        docs = loader.load()
        return "\n\n".join(doc.page_content for doc in docs)
    finally:
        # Clean up the temp file only if we downloaded one
        if is_url:
            os.remove(file_path)
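# Example calls (hypothetical paths/URLs): remote PDFs are downloaded to a
# temp file first, local ones are read in place:
#   text = load_pdf("report.pdf")
#   text = load_pdf("https://example.com/report.pdf", is_url=True)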
def load_from_url(url: str) -> str:
    headers = {"User-Agent": "Mozilla/5.0 (compatible; DocumentLoader/1.0)"}
    response = requests.get(url, headers=headers, timeout=15)
    response.raise_for_status()
    doc = ReadabilityDocument(response.text)
    html_main = doc.summary(html_partial=True)
    soup = BeautifulSoup(html_main, "html.parser")
    for tag in soup(["script", "style", "noscript", "header", "footer", "nav", "aside"]):
        tag.decompose()
    md_text = markdownify(str(soup), heading_style="ATX")
    md_text = html.unescape(md_text)
    md_text = re.sub(r"\n{3,}", "\n\n", md_text).strip()
    return md_text
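# Example (hypothetical URL): returns the readable article body as Markdown
# with navigation, script, and style tags stripped:
#   md = load_from_url("https://example.com/blog/post")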
def process_document(source: str):
    global summary_chain, facts_chain, processed_docs
    print(f"📄 Loading document from: {source}")
    document = load_document(source)
    print(f"✅ Loaded {len(document):,} characters")
    print("\n📝 Generating summary...")
    summary = summary_chain.invoke({"document": document})["text"]
    print("Summary generated")
    print("🔍 Extracting key facts...")
    facts = facts_chain.invoke({"document": document})["text"]
    processed_docs[source] = {
        "document": document,
        "summary": summary,
        "facts": facts,
    }
    print("\n✅ Processing complete!")
    print(f"📊 Document: {len(document):,} chars")
    print(f"📝 Summary: {summary[:100]}...")
    print(f"🔍 Facts: {facts[:1000]}...")
    return processed_docs[source]
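# Example (hypothetical source): the returned dict caches the full text,
# summary, and facts for follow-up questions:
#   result = process_document("https://example.com/article")
#   print(result["summary"])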
def ask_question(question: str, source: Optional[str] = None):
    """Answer questions about processed documents"""
    global qa_chain, processed_docs
    if not processed_docs:
        return "No documents processed yet. Use process_document() first."
    if source and source in processed_docs:
        doc_data = processed_docs[source]
    else:
        # Use the most recent document
        doc_data = list(processed_docs.values())[-1]
    answer = qa_chain.invoke({
        "document": doc_data["document"],
        "question": question,
    })["text"]
    return answer
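# Example (assumes process_document() ran at least once): pass source= to
# target a specific document; otherwise the most recent one is used:
#   ask_question("What problem does the document address?")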
def interactive_demo():
    print("\n🎯 Interactive Document Processing Demo")
    print("Commands:")
    print(" load <url_or_path> - Process a document")
    print(" ask <question> - Ask about the document")
    print(" summary - Show document summary")
    print(" facts - Show extracted facts")
    print(" help - Show commands")
    print(" quit - Exit demo")
    while True:
        try:
            command = input("\n> ").strip()
            if command.lower() in ['quit', 'exit']:
                print("👋 Thanks for exploring LangChain chains!")
                break
            elif command.lower() == 'help':
                print("\nCommands:")
                print(" load <url_or_path> - Process a document")
                print(" ask <question> - Ask about the document")
                print(" summary - Show document summary")
                print(" facts - Show extracted facts")
            elif command.startswith('load '):
                source = command[5:].strip()
                if source:
                    try:
                        process_document(source)
                    except Exception as e:
                        print(f"❌ Error processing document: {e}")
                else:
                    print("❓ Please provide a URL or file path")
            elif command.startswith('ask '):
                question = command[4:].strip()
                if question:
                    try:
                        answer = ask_question(question)
                        print(f"\n💬 Q: {question}")
                        print(f"📝 A: {answer}")
                    except Exception as e:
                        print(f"❌ Error: {e}")
                else:
                    print("❓ Please provide a question")
            elif command.lower() == 'summary':
                if processed_docs:
                    latest_doc = list(processed_docs.values())[-1]
                    print(f"\n📝 Summary:\n{latest_doc['summary']}")
                else:
                    print("❓ No documents processed yet")
            elif command.lower() == 'facts':
                if processed_docs:
                    latest_doc = list(processed_docs.values())[-1]
                    print(f"\n🔍 Key Facts:\n{latest_doc['facts']}")
                else:
                    print("❓ No documents processed yet")
            else:
                print("❓ Unknown command. Type 'help' for options")
        except (EOFError, KeyboardInterrupt):
            print("\n👋 Goodbye!")
            break
def main():
    global client, llm, summary_chain, facts_chain, qa_chain, processed_docs
    print("🚀 Starting LangChain + Llama Stack Document Processing Demo")
    client = LlamaStackClient(
        base_url="http://localhost:8321/",
    )
    # Initialize the LangChain-compatible LLM
    llm = LlamaStackLLM(client)
    # Test the wrapper
    test_response = llm.invoke("Can you help me with the document processing?")
    print("✅ LangChain wrapper working!")
    print(f"Response: {test_response[:100]}...")
    print("Available models:")
    for m in client.models.list():
        print(f"- {m.identifier}")
    print("----")
    print("Available shields (safety models):")
    for s in client.shields.list():
        print(s.identifier)
    print("----")
    # model_id = "llama3.2:3b"
    model_id = "ollama/llama3:70b-instruct"
    response = client.inference.chat_completion(
        model_id=model_id,
        messages=[
            {"role": "system", "content": "You are a friendly assistant."},
            {"role": "user", "content": "Write a two-sentence poem about llama."},
        ],
    )
    print(response.completion_message.content)
    # Create chains by combining our LLM with prompt templates
    summary_chain = LLMChain(llm=llm, prompt=summary_template)
    facts_chain = LLMChain(llm=llm, prompt=facts_template)
    qa_chain = LLMChain(llm=llm, prompt=qa_template)
    # Initialize storage for processed documents
    processed_docs = {}
    print("✅ Created 3 chains:")
    print(" • Summary: Condenses documents into key points")
    print(" • Facts: Extracts important information as bullets")
    print(" • Q&A: Answers questions based on document content")
    # Test template formatting
    test_prompt = summary_template.format(document="This is a sample document about AI...")
    print(f"\n📝 Example prompt: {len(test_prompt)} characters")
    # Start the interactive demo
    interactive_demo()
if __name__ == "__main__":
    main()
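# To try the demo end to end (assumes a Llama Stack server on
# http://localhost:8321 serving the model ids referenced above, e.g. via an
# Ollama-backed distribution): run this script and use the `load` and `ask`
# commands at the prompt.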