|
| 1 | +""" |
| 2 | +Example: Streaming Conversation Search |
| 3 | +
|
| 4 | +This script demonstrates how to use streaming conversation search with Typesense. |
| 5 | +It requires: |
| 6 | +1. A running Typesense server (default: localhost:8108) |
| 7 | +2. An OpenAI API key set in OPEN_AI_KEY (in .env file or environment) |
| 8 | +
|
| 9 | +Usage: |
| 10 | + python examples/streaming_conversation_search.py |
| 11 | +""" |
| 12 | + |
import os
import sys

from dotenv import load_dotenv

# Load environment variables (e.g. OPEN_AI_KEY) from a .env file, if present.
load_dotenv()

# Make the local ``src`` package importable when running from a source checkout,
# so the example uses the in-repo client rather than an installed one.
curr_dir = os.path.dirname(os.path.realpath(__file__))
sys.path.insert(1, os.path.abspath(os.path.join(curr_dir, os.pardir, "src")))

import typesense
from typesense.types.document import MessageChunk, StreamConfig
| 25 | + |
# Configuration
# Connection settings are read from the environment, with local-dev defaults.
API_KEY = os.environ.get("TYPESENSE_API_KEY", "xyz")
HOST = os.environ.get("TYPESENSE_HOST", "localhost")
PORT = os.environ.get("TYPESENSE_PORT", "8108")
# OpenAI key used both for the embedding field and the conversation model below.
OPENAI_KEY = os.environ.get("OPEN_AI_KEY", "")

# Fail fast: everything below depends on a usable OpenAI key.
if not OPENAI_KEY:
    print("Error: OPEN_AI_KEY environment variable is required")
    print("Set it in a .env file or pass it directly")
    sys.exit(1)

# Create client (use longer timeout for streaming)
client = typesense.Client({
    "api_key": API_KEY,
    "nodes": [{"host": HOST, "port": PORT, "protocol": "http"}],
    "connection_timeout_seconds": 120,
})

# Names of the resources this example creates (and deletes during cleanup).
COLLECTION_NAME = "streaming-example-essays"
CONVERSATION_STORE_NAME = "streaming-example-conversation-store"
MODEL_NAME = "streaming-example-model"
| 47 | + |
# Collection schema with embedding
collection_schema = {
    "name": COLLECTION_NAME,
    "fields": [
        {"name": "title", "type": "string"},
        {"name": "content", "type": "string"},
        {
            # Auto-embedding field: Typesense generates the vector from
            # `content` at index time using the configured OpenAI model.
            "name": "embedding",
            "type": "float[]",
            "embed": {
                "from": ["content"],
                "model_config": {
                    "model_name": "openai/text-embedding-3-small",
                    "api_key": OPENAI_KEY,
                },
            },
        },
    ],
}
| 67 | + |
# Conversation history collection schema (required for conversation models)
conversation_store_schema = {
    "name": CONVERSATION_STORE_NAME,
    "fields": [
        {"name": "conversation_id", "type": "string"},
        {"name": "model_id", "type": "string"},
        {"name": "timestamp", "type": "int32"},
        # role/message are stored for history but never searched directly,
        # hence "index": False.
        {"name": "role", "type": "string", "index": False},
        {"name": "message", "type": "string", "index": False},
    ],
}
| 79 | + |
# Conversation model schema
conversation_model_schema = {
    "id": MODEL_NAME,
    "model_name": "openai/gpt-4o-mini",
    "api_key": OPENAI_KEY,
    # Past turns are persisted in this collection between requests.
    "history_collection": CONVERSATION_STORE_NAME,
    "system_prompt": "You are a helpful assistant. Answer questions based on the provided context.",
    # NOTE(review): per Typesense conversation-model docs this caps the bytes
    # of context sent to the LLM — confirm against the server version in use.
    "max_bytes": 16384,
}
| 89 | + |
# Sample documents
# Two short essay excerpts used as the searchable corpus; indexing them
# triggers embedding generation via the collection schema above.
documents = [
    {
        "title": "The Maker's Schedule",
        "content": """
        One reason programmers dislike meetings so much is that they're on a different
        type of schedule from other people. Meetings cost them more. There are two types
        of schedule, which I'll call the manager's schedule and the maker's schedule.
        The manager's schedule is for bosses. It's embodied in the traditional appointment
        book, with each day cut into one hour intervals. You can block off several hours
        for a single task if you need to, but by default you change what you're doing
        every hour. When you use time that way, it's merely a practical problem to meet
        with someone. The maker's schedule is different. Writers, programmers, and artists
        typically work in longer time units.
        """,
    },
    {
        "title": "How to Do What You Love",
        "content": """
        To do something well you have to like it. That idea is not exactly novel.
        We've got it down to four words: "Do what you love." But it's not enough just
        to tell people that. Doing what you love is complicated. The very idea is
        foreign to most people. It's not as easy as it sounds. You have to find work
        that you enjoy, and that's harder than most people think.
        """,
    },
]
| 117 | + |
| 118 | + |
def setup():
    """Create the example's collections and conversation model from scratch.

    Leftovers from a previous run are deleted first so the script is
    re-runnable; errors during that best-effort teardown are ignored.
    """
    # Best-effort removal of anything a previous run may have left behind.
    for remove in (
        lambda: client.conversations_models[MODEL_NAME].delete(),
        lambda: client.collections[COLLECTION_NAME].delete(),
        lambda: client.collections[CONVERSATION_STORE_NAME].delete(),
    ):
        try:
            remove()
        except Exception:
            pass

    # The conversation model references the history collection, so it must
    # exist before the model is created.
    print(f"Creating conversation store '{CONVERSATION_STORE_NAME}'...")
    client.collections.create(conversation_store_schema)

    print(f"Creating collection '{COLLECTION_NAME}'...")
    client.collections.create(collection_schema)

    # Indexing triggers embedding generation for each document's content.
    print("Indexing documents...")
    for doc in documents:
        client.collections[COLLECTION_NAME].documents.create(doc)

    print(f"Creating conversation model '{MODEL_NAME}'...")
    client.conversations_models.create(conversation_model_schema)

    print("Setup complete!\n")
| 155 | + |
| 156 | + |
def cleanup():
    """Delete every resource created by setup(), ignoring any failures."""
    for remove in (
        lambda: client.conversations_models[MODEL_NAME].delete(),
        lambda: client.collections[COLLECTION_NAME].delete(),
        lambda: client.collections[CONVERSATION_STORE_NAME].delete(),
    ):
        try:
            remove()
        except Exception:
            pass
| 173 | + |
| 174 | + |
def streaming_search_example():
    """Run one streaming conversation search, printing chunks as they arrive.

    Returns the final search response object produced by the client.
    """
    banner = "=" * 60
    print(banner)
    print("Streaming Conversation Search Example")
    print(banner)

    # Streamed fragments are accumulated here so the full reply can be
    # inspected after the search completes.
    chunks: list[str] = []

    def on_chunk(chunk: MessageChunk) -> None:
        """Handle one streamed fragment of the model's reply."""
        text = chunk["message"]
        chunks.append(text)
        # Emit immediately without a trailing newline for a live-typing effect.
        print(text, end="", flush=True)

    def on_complete(response: dict) -> None:
        """Handle the final response once streaming has finished."""
        print("\n")  # Newline after streaming
        print("-" * 40)
        print(f"Streaming complete! Found {response.get('found', 0)} documents")

    def on_error(error: BaseException) -> None:
        """Report a streaming failure."""
        print(f"\nError: {error}")

    stream_config: StreamConfig = {
        "on_chunk": on_chunk,
        "on_complete": on_complete,
        "on_error": on_error,
    }

    query = "What is the maker's schedule and why do programmers prefer it?"
    print(f"\nQuery: {query}\n")
    print("Streaming response:")
    print("-" * 40)

    # The search call blocks until streaming finishes; the callbacks above
    # fire along the way.
    search_params = {
        "q": query,
        "query_by": "embedding",
        "conversation": True,
        "conversation_stream": True,
        "conversation_model_id": MODEL_NAME,
        "stream_config": stream_config,
    }
    response = client.collections[COLLECTION_NAME].documents.search(search_params)

    # Reassemble the full message from the streamed chunks.
    full_message = "".join(chunks)
    print(f"\nFull streamed message length: {len(full_message)} characters")

    return response
| 226 | + |
| 227 | + |
def main():
    """Run the full example: set up resources, stream one search, clean up."""
    try:
        setup()
        streaming_search_example()
    finally:
        # Always tear down the demo collections/model, even on failure.
        print("\nCleaning up...")
        cleanup()
        print("Done!")


if __name__ == "__main__":
    main()