
Merge remote-tracking branch 'upstream/main' into docs-faq
MacOS committed Jun 2, 2024
2 parents 87990e6 + 92d495f commit 609f361
Showing 16 changed files with 2,389 additions and 405 deletions.
8 changes: 8 additions & 0 deletions README.md
@@ -804,6 +804,14 @@ Questions and discussions are welcome in our [github discussions](https://github

See also [additional deployment/install release notes in wheel_archives](https://github.com/llmware-ai/llmware/tree/main/wheel_archives)

**Wednesday, May 29 - v0.3.0-WIP**
- Added support for the new Milvus Lite embedded 'no-install' database - see the [example](https://github.com/llmware-ai/llmware/tree/main/examples/Embedding/using_milvus_lite.py) and the configuration sketch below
- Added two new SLIM models to the catalog and agent processes - ['q-gen'](https://github.com/llmware-ai/llmware/tree/main/examples/SLIM-Agents/using-slim-q-gen.py) and ['qa-gen'](https://github.com/llmware-ai/llmware/tree/main/examples/SLIM-Agents/using-slim-qa-gen.py)
- Updated model class instantiation for greater extensibility, so that new classes can be added in different modules
- Planning to remove torch and transformers from the pip install package
- If cloning the repo, please see the new welcome_to_llmware.sh and welcome_to_llmware_windows.sh fast-install scripts
- Changes are merged into the main branch and will be released on PyPI, targeting the end of the week
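For Milvus Lite, the key configuration is a single flag. A minimal sketch, using the same calls that the new example itself makes (nothing here beyond what using_milvus_lite.py does):

```python
from llmware.configs import LLMWareConfig, MilvusConfig

# switch on the 'no-install', file-based Milvus Lite (Mac/Linux only, requires pymilvus>=2.4.2)
MilvusConfig().set_config("lite", True)
LLMWareConfig().set_vector_db("milvus")
```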

**Wednesday, May 22 - v0.2.15**
- Improvements in Model class handling of PyTorch and Transformers dependencies (just-in-time loading, if needed) - see the sketch after this list
- Expanding API endpoint options and inference server functionality - see new [client access options](https://github.com/llmware-ai/llmware/tree/main/examples/Use_Cases/llmware_inference_api_client.py) and [server_launch](https://github.com/llmware-ai/llmware/tree/main/examples/Use_Cases/llmware_inference_server.py)
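The just-in-time idea is a guarded import that defers heavy dependencies until a model actually needs them - the same pattern the new Milvus Lite example uses for pymilvus. A minimal sketch of the pattern only; `require_torch` is an illustrative helper, not an llmware API:

```python
from importlib import util

def require_torch():
    """ Hypothetical helper: import torch only at the moment a model needs it. """
    if not util.find_spec("torch"):
        raise ImportError("this model requires torch - pip3 install torch")
    import torch
    return torch
```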
83 changes: 83 additions & 0 deletions docker-compose_mongo_milvus.yaml
@@ -0,0 +1,83 @@
version: "3.5"

services:
mongodb:
container_name: mongodb
image: mongo:5.0.10
# To secure MongoDB, uncomment and set the following values
# environment:
# - MONGO_INITDB_DATABASE=admin
# - MONGO_INITDB_ROOT_USERNAME=admin
# - MONGO_INITDB_ROOT_PASSWORD=changeme
volumes:
- llmware-mongodb:/data/db
ports:
- '27017:27017'

etcd:
container_name: milvus-etcd
image: quay.io/coreos/etcd:v3.5.5
environment:
- ETCD_AUTO_COMPACTION_MODE=revision
- ETCD_AUTO_COMPACTION_RETENTION=1000
- ETCD_QUOTA_BACKEND_BYTES=4294967296
- ETCD_SNAPSHOT_COUNT=50000
volumes:
- llmware-etcd:/etcd
command: etcd -advertise-client-urls=http://127.0.0.1:2379 -listen-client-urls http://0.0.0.0:2379 --data-dir /etcd
healthcheck:
test: ["CMD", "etcdctl", "endpoint", "health"]
interval: 30s
timeout: 20s
retries: 3

minio:
container_name: milvus-minio
image: minio/minio:RELEASE.2023-03-20T20-16-18Z
environment:
MINIO_ACCESS_KEY: minioadmin
MINIO_SECRET_KEY: minioadmin
ports:
- "9001:9001"
- "9000:9000"
volumes:
- llmware-minio:/minio_data
command: minio server /minio_data --console-address ":9001"
healthcheck:
test: ["CMD", "curl", "-f", "http://localhost:9000/minio/health/live"]
interval: 30s
timeout: 20s
retries: 3

milvus:
container_name: milvus
image: milvusdb/milvus:v2.3.0
command: ["milvus", "run", "standalone"]
environment:
ETCD_ENDPOINTS: etcd:2379
MINIO_ADDRESS: minio:9000
volumes:
- llmware-milvus:/var/lib/milvus
healthcheck:
test: ["CMD", "curl", "-f", "http://localhost:9091/healthz"]
interval: 30s
start_period: 90s
timeout: 20s
retries: 3
ports:
- "19530:19530"
- "9091:9091"
depends_on:
- "etcd"
- "minio"

volumes:
llmware-mongodb:
driver: local
llmware-etcd:
driver: local
llmware-minio:
driver: local
llmware-milvus:
driver: local

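Once the containers are up (`docker compose -f docker-compose_mongo_milvus.yaml up -d`), llmware can be pointed at this stack. A hedged sketch, assuming "mongo" is the active-db identifier llmware expects and the default ports above:

```python
from llmware.configs import LLMWareConfig, MilvusConfig

LLMWareConfig().set_active_db("mongo")      # text collections -> MongoDB on localhost:27017
MilvusConfig().set_config("lite", False)    # server mode (the default), not Milvus Lite
LLMWareConfig().set_vector_db("milvus")     # vector embeddings -> Milvus on localhost:19530
```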
1 change: 1 addition & 0 deletions docs/Gemfile
@@ -6,6 +6,7 @@ source 'https://rubygems.org'
#
gem "jekyll", "~> 4.3.2" # installed by `gem jekyll`
gem "just-the-docs", "0.7.0" # pinned to the current release
gem "rexml", "3.2.8" # pinned to that version to fix security alert

#
# Gems that are only loaded if they are configured correctly.
5 changes: 4 additions & 1 deletion docs/Gemfile.lock
@@ -75,7 +75,8 @@ GEM
    rb-fsevent (0.11.2)
    rb-inotify (0.10.1)
      ffi (~> 1.0)
-   rexml (3.2.6)
+   rexml (3.2.8)
+     strscan (>= 3.0.9)
    rouge (4.1.3)
    ruby2_keywords (0.0.5)
    safe_yaml (1.0.5)
@@ -87,6 +88,7 @@ GEM
    sawyer (0.9.2)
      addressable (>= 2.3.5)
      faraday (>= 0.17.3, < 3)
+   strscan (3.1.0)
    terminal-table (3.0.2)
      unicode-display_width (>= 1.1.1, < 3)
    unicode-display_width (2.4.2)
@@ -103,6 +105,7 @@ DEPENDENCIES
  jekyll-include-cache
  jekyll-seo-tag
  just-the-docs (= 0.7.0)
+ rexml (= 3.2.8)

BUNDLED WITH
   2.5.6
145 changes: 145 additions & 0 deletions examples/Embedding/using_milvus_lite.py
@@ -0,0 +1,145 @@

""" This example is a fast start with Milvus Lite, which is a 'no-install' file-based version of Milvus, intended
for rapid prototyping. A couple of key points to note:
-- Platform - per Milvus docs, Milvus Lite is designed for Mac and Linux (not on Windows currently)
-- PyMilvus - need to `pip install pymilvus>=2.4.2`
-- within LLMWare: set MilvusConfig().set_config("lite", True)
"""

import os
from llmware.library import Library
from llmware.retrieval import Query
from llmware.setup import Setup
from llmware.status import Status
from llmware.models import ModelCatalog
from llmware.configs import LLMWareConfig, MilvusConfig

from importlib import util

if not util.find_spec("pymilvus"):
print("\nto run this example with pymilvus, you need to install pymilvus: pip3 install pymilvus>=2.4.2")


def setup_library(library_name):

    """ Note: this setup_library method is provided to enable a self-contained example that creates a test library """

    # Step 1 - Create library, which is the main 'organizing construct' in llmware
    print("\nupdate: Creating library: {}".format(library_name))

    library = Library().create_new_library(library_name)

    # check the embedding status 'before' installing the embedding
    embedding_record = library.get_embedding_status()
    print("embedding record - before embedding ", embedding_record)

    # Step 2 - Pull down the sample files from S3 through the .load_sample_files() command
    # --note: if you need to refresh the sample files, set 'over_write=True'
    print("update: Downloading Sample Files")

    sample_files_path = Setup().load_sample_files(over_write=False)

    # Step 3 - point the ".add_files" method to the folder of documents that was just created
    # this method parses the documents, chunks the text, and captures the chunks in the database

    print("update: Parsing and Text Indexing Files")

    library.add_files(input_folder_path=os.path.join(sample_files_path, "Agreements"),
                      chunk_size=400, max_chunk_size=600, smart_chunking=1)

    return library


def install_vector_embeddings(library, embedding_model_name):

    """ This method is the core example of installing an embedding on a library.
        -- two inputs - (1) a pre-created library object and (2) the name of an embedding model """

    library_name = library.library_name
    vector_db = LLMWareConfig().get_vector_db()

    print(f"\nupdate: Starting the Embedding: "
          f"library - {library_name} - "
          f"vector_db - {vector_db} - "
          f"model - {embedding_model_name}")

    # *** this is the one key line of code to create the embedding ***
    library.install_new_embedding(embedding_model_name=embedding_model_name, vector_db=vector_db, batch_size=100)

    # note: when using llmware as part of a larger application, you can check the real-time status by polling Status()
    # --both the EmbeddingHandler and Parsers write to Status() at intervals while processing
    update = Status().get_embedding_status(library_name, embedding_model_name)
    print("update: Embeddings Complete - Status() check at end of embedding - ", update)

    # Start using the new vector embeddings with Query
    sample_query = "incentive compensation"
    print("\n\nupdate: Run a sample semantic/vector query: {}".format(sample_query))

    # queries are constructed by creating a Query object, and passing a library as input
    query_results = Query(library).semantic_query(sample_query, result_count=20)

    for i, entries in enumerate(query_results):

        # each query result is a dictionary with many useful keys

        text = entries["text"]
        document_source = entries["file_source"]
        page_num = entries["page_num"]
        vector_distance = entries["distance"]

        # to see all of the dictionary keys returned, uncomment the line below
        # print("update: query_results - all - ", i, entries)

        # for display purposes only, show just the first 125 characters of the text
        if len(text) > 125:
            text = text[0:125] + " ... "

        print("\nupdate: query results - {} - document - {} - page num - {} - distance - {} "
              .format(i, document_source, page_num, vector_distance))

        print("update: text sample - ", text)

    # check the library embedding status again at the end to confirm the embeddings were created
    embedding_record = library.get_embedding_status()

    print("\nupdate: embedding record - ", embedding_record)

    return 0


if __name__ == "__main__":

# Fast Start configuration - will use no-install embedded sqlite
# -- if you have installed Mongo or Postgres, then change the .set_active_db accordingly

LLMWareConfig().set_active_db("sqlite")

# set the "lite" flag in MilvusConfig to True -> to use server version, set to False (which is default)
MilvusConfig().set_config("lite", True)
LLMWareConfig().set_vector_db("milvus")

# Step 1 - create library
library = setup_library("ex2_milvus_lite")

# Step 2 - Select any embedding model in the LLMWare catalog

# to see a list of the embedding models supported, uncomment the line below and print the list
embedding_models = ModelCatalog().list_embedding_models()

# for i, models in enumerate(embedding_models):
# print("embedding models: ", i, models)

# for this first embedding, we will use a very popular and fast sentence transformer
embedding_model = "mini-lm-sbert"

# note: if you want to swap out "mini-lm-sbert" for Open AI 'text-embedding-ada-002', uncomment these lines:
# embedding_model = "text-embedding-ada-002"
# os.environ["USER_MANAGED_OPENAI_API_KEY"] = "<insert-your-openai-api-key>"

# run the core script
install_vector_embeddings(library, embedding_model)





