Merge branch 'main' into add-speech-recognition

huggingface · Jan 8, 2025 · 9de7304 · 9de7304
2 parents d2193ba + 952da0d
commit 9de7304
Show file tree

Hide file tree

Showing 117 changed files with 4,009 additions and 2,049 deletions.
diff --git a/.env b/.env
@@ -1,99 +1,32 @@
 # Use .env.local to change these variables
 # DO NOT EDIT THIS FILE WITH SENSITIVE DATA
 
-MONGODB_URL=#your mongodb URL here
+### MongoDB ###
+MONGODB_URL=#your mongodb URL here, use chat-ui-db image if you don't want to set this
 MONGODB_DB_NAME=chat-ui
 MONGODB_DIRECT_CONNECTION=false
 
-COOKIE_NAME=hf-chat
-COOKIE_SAMESITE=
-COOKIE_SECURE=
-TRUSTED_EMAIL_HEADER= # only set this if you understand the implications
 
-HF_TOKEN=#hf_<token> from https://huggingface.co/settings/token
+### Endpoints config ###
 HF_API_ROOT=https://api-inference.huggingface.co/models
-
+# HF_TOKEN is used for a lot of things, not only for inference but also fetching tokenizers, etc.
+# We recommend using an HF_TOKEN even if you use a local endpoint.
+HF_TOKEN= #get it from https://huggingface.co/settings/token
+# API Keys for providers, you will need to specify models in the MODELS section but these keys can be kept secret
 OPENAI_API_KEY=#your openai api key here
 ANTHROPIC_API_KEY=#your anthropic api key here
 CLOUDFLARE_ACCOUNT_ID=#your cloudflare account id here
 CLOUDFLARE_API_TOKEN=#your cloudflare api token here
 COHERE_API_TOKEN=#your cohere api token here
 GOOGLE_GENAI_API_KEY=#your google genai api token here
 
-HF_ACCESS_TOKEN=#LEGACY! Use HF_TOKEN instead
-
-# used to activate search with web functionality. disabled if none are defined. choose one of the following:
-YDC_API_KEY=#your docs.you.com api key here
-SERPER_API_KEY=#your serper.dev api key here
-SERPAPI_KEY=#your serpapi key here
-SERPSTACK_API_KEY=#your serpstack api key here
-SEARCHAPI_KEY=#your searchapi api key here
-USE_LOCAL_WEBSEARCH=#set to true to parse google results yourself, overrides other API keys
-SEARXNG_QUERY_URL=# where '<query>' will be replaced with query keywords see https://docs.searxng.org/dev/search_api.html eg https://searxng.yourdomain.com/search?q=<query>&engines=duckduckgo,google&format=json
-BING_SUBSCRIPTION_KEY=#your key
-PLAYWRIGHT_ADBLOCKER=true
 
-WEBSEARCH_ALLOWLIST=`[]` # if it's defined, allow websites from only this list.
-WEBSEARCH_BLOCKLIST=`[]` # if it's defined, block websites from this list.
-WEBSEARCH_JAVASCRIPT=true # CPU usage reduces by 60% on average by disabling javascript. Enable to improve website compatibility
-WEBSEARCH_TIMEOUT = 3500 # in milliseconds, determines how long to wait to load a page before timing out
-
-# Parameters to enable open id login
-OPENID_CONFIG=`{
-  "PROVIDER_URL": "",
-  "CLIENT_ID": "",
-  "CLIENT_SECRET": "",
-  "SCOPES": "",
-  "NAME_CLAIM": ""
-}`
-
-# /!\ legacy openid settings, prefer the config above
-OPENID_CLIENT_ID=
-OPENID_CLIENT_SECRET=
-OPENID_SCOPES="openid profile" # Add "email" for some providers like Google that do not provide preferred_username
-OPENID_NAME_CLAIM="name" # Change to "username" for some providers that do not provide name
-OPENID_PROVIDER_URL=https://huggingface.co # for Google, use https://accounts.google.com
-OPENID_TOLERANCE=
-OPENID_RESOURCE=
-
-# Parameters to enable a global mTLS context for client fetch requests
-USE_CLIENT_CERTIFICATE=false
-CERT_PATH=#
-KEY_PATH=#
-CA_PATH=#
-CLIENT_KEY_PASSWORD=#
-REJECT_UNAUTHORIZED=true
-
-TEXT_EMBEDDING_MODELS = `[
-  {
-    "name": "Xenova/gte-small",
-    "displayName": "Xenova/gte-small",
-    "description": "Local embedding model running on the server.",
-    "chunkCharLength": 512,
-    "endpoints": [
-      { "type": "transformersjs" }
-    ]
-  }
-]`
-
-# 'name', 'userMessageToken', 'assistantMessageToken' are required
+### Models ###
+## Models can support many different endpoints, check the documentation for more details
 MODELS=`[
     {
-      "name": "mistralai/Mistral-7B-Instruct-v0.1",
-      "displayName": "mistralai/Mistral-7B-Instruct-v0.1",
-      "description": "Mistral 7B is a new Apache 2.0 model, released by Mistral AI that outperforms Llama2 13B in benchmarks.",
-      "websiteUrl": "https://mistral.ai/news/announcing-mistral-7b/",
-      "preprompt": "",
-      "chatPromptTemplate" : "<s>{{#each messages}}{{#ifUser}}[INST] {{#if @first}}{{#if @root.preprompt}}{{@root.preprompt}}\n{{/if}}{{/if}}{{content}} [/INST]{{/ifUser}}{{#ifAssistant}}{{content}}</s>{{/ifAssistant}}{{/each}}",
-      "parameters": {
-        "temperature": 0.1,
-        "top_p": 0.95,
-        "repetition_penalty": 1.2,
-        "top_k": 50,
-        "truncate": 3072,
-        "max_new_tokens": 1024,
-        "stop": ["</s>"]
-      },
+      "name": "NousResearch/Hermes-3-Llama-3.1-8B",
+      "description": "Nous Research's latest Hermes 3 release in 8B size.",
       "promptExamples": [
         {
           "title": "Write an email from bullet list",
@@ -108,78 +41,160 @@ MODELS=`[
       ]
     }
 ]`
-
-OLD_MODELS=`[]`# any removed models, `{ name: string, displayName?: string, id?: string }`
-TASK_MODEL= # name of the model used for tasks such as summarizing title, creating query, etc.
-
-PUBLIC_ORIGIN=#https://huggingface.co
-PUBLIC_SHARE_PREFIX=#https://hf.co/chat
-PUBLIC_GOOGLE_ANALYTICS_ID=#G-XXXXXXXX / Leave empty to disable
-PUBLIC_PLAUSIBLE_SCRIPT_URL=#/js/script.js / Leave empty to disable
-PUBLIC_ANNOUNCEMENT_BANNERS=`[
-    {
-    "title": "Code Llama 70B is available! 🦙",
-    "linkTitle": "try it",
-    "linkHref": "https://huggingface.co/chat?model=codellama/CodeLlama-70b-Instruct-hf"
+## Text Embedding Models used for websearch
+# Default is a model that runs locally on CPU.
+TEXT_EMBEDDING_MODELS = `[
+  {
+    "name": "Xenova/gte-small",
+    "displayName": "Xenova/gte-small",
+    "description": "Local embedding model running on the server.",
+    "chunkCharLength": 512,
+    "endpoints": [
+      { "type": "transformersjs" }
+    ]
   }
 ]`
 
-PUBLIC_APPLE_APP_ID=#1234567890 / Leave empty to disable
+## Removed models, useful for migrating conversations
+# { name: string, displayName?: string, id?: string, transferTo?: string }`
+OLD_MODELS=`[]`
 
-PARQUET_EXPORT_DATASET=
-PARQUET_EXPORT_HF_TOKEN=
-ADMIN_API_SECRET=# secret to admin API calls, like computing usage stats or exporting parquet data
+## Task model
+# name of the model used for tasks such as summarizing title, creating query, etc.
+# if not set, the first model in MODELS will be used
+TASK_MODEL=
 
-PARQUET_EXPORT_SECRET=#DEPRECATED, use ADMIN_API_SECRET instead
 
-RATE_LIMIT= # /!\ Legacy definition of messages per minute. Use USAGE_LIMITS.messagesPerMinute instead
+### Authentication ###
+# Parameters to enable open id login
+OPENID_CONFIG=
 MESSAGES_BEFORE_LOGIN=# how many messages a user can send in a conversation before having to login. set to 0 to force login right away
-PUBLIC_APP_GUEST_MESSAGE=# a message to the guest user. If not set, a default message will be used
+# if it's defined, only these emails will be allowed to use login
+ALLOWED_USER_EMAILS=`[]` 
+# valid alternative redirect URLs for OAuth, used for HuggingChat apps
+ALTERNATIVE_REDIRECT_URLS=`[]` 
+### Cookies
+# name of the cookie used to store the session
+COOKIE_NAME=hf-chat
+# specify secure behaviour for cookies 
+COOKIE_SAMESITE=# can be "lax", "strict", "none" or left empty
+COOKIE_SECURE=# set to true to only allow cookies over https
 
-APP_BASE="" # base path of the app, e.g. /chat, left blank as default
+
+### Websearch ###
+## API Keys used to activate search with web functionality. websearch is disabled if none are defined. choose one of the following:
+YDC_API_KEY=#your docs.you.com api key here
+SERPER_API_KEY=#your serper.dev api key here
+SERPAPI_KEY=#your serpapi key here
+SERPSTACK_API_KEY=#your serpstack api key here
+SEARCHAPI_KEY=#your searchapi api key here
+USE_LOCAL_WEBSEARCH=#set to true to parse google results yourself, overrides other API keys
+SEARXNG_QUERY_URL=# where '<query>' will be replaced with query keywords see https://docs.searxng.org/dev/search_api.html eg https://searxng.yourdomain.com/search?q=<query>&engines=duckduckgo,google&format=json
+BING_SUBSCRIPTION_KEY=#your key
+## Websearch configuration
+PLAYWRIGHT_ADBLOCKER=true
+WEBSEARCH_ALLOWLIST=`[]` # if it's defined, allow websites from only this list.
+WEBSEARCH_BLOCKLIST=`[]` # if it's defined, block websites from this list.
+WEBSEARCH_JAVASCRIPT=true # CPU usage reduces by 60% on average by disabling javascript. Enable to improve website compatibility
+WEBSEARCH_TIMEOUT = 3500 # in milliseconds, determines how long to wait to load a page before timing out
+ENABLE_LOCAL_FETCH=false #set to true to allow fetches on the local network. /!\ Only enable this if you have the proper firewall rules to prevent SSRF attacks and understand the implications.
+
+
+## Public app configuration ##
+PUBLIC_APP_GUEST_MESSAGE=# a message to the guest user. If not set, no message will be shown. Only used if you have authentication enabled.
 PUBLIC_APP_NAME=ChatUI # name used as title throughout the app
 PUBLIC_APP_ASSETS=chatui # used to find logos & favicons in static/$PUBLIC_APP_ASSETS
-PUBLIC_APP_COLOR=blue # can be any of tailwind colors: https://tailwindcss.com/docs/customizing-colors#default-color-palette
-PUBLIC_APP_DESCRIPTION=# description used throughout the app (if not set, a default one will be used)
-PUBLIC_APP_DATA_SHARING=#set to 1 to enable options & text regarding data sharing
-PUBLIC_APP_DISCLAIMER=#set to 1 to show a disclaimer on login page
-PUBLIC_APP_DISCLAIMER_MESSAGE="Disclaimer: AI is an area of active research with known problems such as biased generation and misinformation. Do not use this application for high-stakes decisions or advice. Do not insert your personal data, especially sensitive, like health data."
-LLM_SUMMARIZATION=true
+PUBLIC_APP_DESCRIPTION=# description used throughout the app
+PUBLIC_APP_DATA_SHARING=# Set to 1 to enable an option in the user settings to share conversations with model authors
+PUBLIC_APP_DISCLAIMER=# Set to 1 to show a disclaimer on login page
+PUBLIC_APP_DISCLAIMER_MESSAGE=# Message to show on the login page
+PUBLIC_ANNOUNCEMENT_BANNERS=`[
+    {
+    "title": "chat-ui is now open source!",
+    "linkTitle": "check it out",
+    "linkHref": "https://github.com/huggingface/chat-ui"
+  }
+]`
+PUBLIC_SMOOTH_UPDATES=false # set to true to enable smoothing of messages client-side, can be CPU intensive
+PUBLIC_ORIGIN=#https://huggingface.co
+PUBLIC_SHARE_PREFIX=#https://hf.co/chat
+
+# mostly huggingchat specific
+PUBLIC_GOOGLE_ANALYTICS_ID=#G-XXXXXXXX / Leave empty to disable
+PUBLIC_PLAUSIBLE_SCRIPT_URL=#/js/script.js / Leave empty to disable
+PUBLIC_APPLE_APP_ID=#1234567890 / Leave empty to disable
 
-EXPOSE_API=true
-USE_HF_TOKEN_IN_API=false
-# PUBLIC_APP_NAME=HuggingChat
-# PUBLIC_APP_ASSETS=huggingchat
-# PUBLIC_APP_COLOR=yellow
-# PUBLIC_APP_DESCRIPTION="Making the community's best AI chat models available to everyone."
-# PUBLIC_APP_DATA_SHARING=1
-# PUBLIC_APP_DISCLAIMER=1
 
+### Feature Flags ###
+LLM_SUMMARIZATION=true # generate conversation titles with LLMs
 ENABLE_ASSISTANTS=false #set to true to enable assistants feature
 ENABLE_ASSISTANTS_RAG=false # /!\ This will let users specify arbitrary URLs that the server will then request. Make sure you have the proper firewall rules in place. 
-REQUIRE_FEATURED_ASSISTANTS=false
-ENABLE_LOCAL_FETCH=false #set to true to disable the blocklist for local fetches. Only enable this if you have the proper firewall rules to prevent SSRF attacks and understand the implications.
-ALTERNATIVE_REDIRECT_URLS=`[]` #valide alternative redirect URL for OAuth
-WEBHOOK_URL_REPORT_ASSISTANT=#provide webhook url to get notified when an assistant gets reported
+REQUIRE_FEATURED_ASSISTANTS=false # require featured assistants to show in the list
+COMMUNITY_TOOLS=false # set to true to enable community tools
+EXPOSE_API=true # make the /api routes available
+ALLOW_IFRAME=true # Allow the app to be embedded in an iframe
 
-ALLOWED_USER_EMAILS=`[]` # if it's defined, only these emails will be allowed to use the app
 
+### Tools ###
+# Check out public config in `chart/env/prod.yaml` for more details
+TOOLS=`[]` 
+
+### Rate limits ### 
+# See `src/lib/server/usageLimits.ts`
+# {
+#   conversations: number, # how many conversations
+#   messages: number, # how many messages in a conversation
+#   assistants: number, # how many assistants
+#   messageLength: number, # how long can a message be before we cut it off
+#   messagesPerMinute: number, # how many messages per minute
+#   tools: number # how many tools
+# }
 USAGE_LIMITS=`{}`
 
-ALLOW_IFRAME=true
-ALLOW_INSECURE_COOKIES=false # recommended to keep this to false but set to true if you need to run over http without tls
+
+### HuggingFace specific ###
+# Let user authenticate with their HF token in the /api routes. This is only useful if you have OAuth configured with huggingface.
+USE_HF_TOKEN_IN_API=false
+## Feature flag & admin settings
+# Used for setting early access & admin flags to users
+HF_ORG_ADMIN=
+HF_ORG_EARLY_ACCESS=
+WEBHOOK_URL_REPORT_ASSISTANT=#provide slack webhook url to get notified for reports/feature requests
+
+
+
+### Metrics ###
 METRICS_ENABLED=false
 METRICS_PORT=5565
 LOG_LEVEL=info
 
 
-TOOLS=`[]` 
-BODY_SIZE_LIMIT=15728640
+### Parquet export ###
+# Not in use anymore but useful to export conversations to a parquet file as a HuggingFace dataset
+PARQUET_EXPORT_DATASET=
+PARQUET_EXPORT_HF_TOKEN=
+ADMIN_API_SECRET=# secret to admin API calls, like computing usage stats or exporting parquet data
 
-HF_ORG_ADMIN=
-HF_ORG_EARLY_ACCESS=
 
-PUBLIC_SMOOTH_UPDATES=false
-COMMUNITY_TOOLS=false
+### Docker build variables ### 
+# These values cannot be updated at runtime
+# They need to be passed when building the docker image
+# See https://github.com/huggingface/chat-ui/main/.github/workflows/deploy-prod.yml#L44-L47
+APP_BASE="" # base path of the app, e.g. /chat, left blank as default
+PUBLIC_APP_COLOR=blue # can be any of tailwind colors: https://tailwindcss.com/docs/customizing-colors#default-color-palette
+### Body size limit for SvelteKit https://svelte.dev/docs/kit/adapter-node#Environment-variables-BODY_SIZE_LIMIT
+BODY_SIZE_LIMIT=15728640
+PUBLIC_COMMIT_SHA=
 
-PUBLIC_COMMIT_SHA=
+### LEGACY parameters
+HF_ACCESS_TOKEN=#LEGACY! Use HF_TOKEN instead
+ALLOW_INSECURE_COOKIES=false # LEGACY! Use COOKIE_SECURE and COOKIE_SAMESITE instead
+PARQUET_EXPORT_SECRET=#DEPRECATED, use ADMIN_API_SECRET instead
+RATE_LIMIT= # /!\ DEPRECATED definition of messages per minute. Use USAGE_LIMITS.messagesPerMinute instead
+OPENID_CLIENT_ID=
+OPENID_CLIENT_SECRET=
+OPENID_SCOPES="openid profile" # Add "email" for some providers like Google that do not provide preferred_username
+OPENID_NAME_CLAIM="name" # Change to "username" for some providers that do not provide name
+OPENID_PROVIDER_URL=https://huggingface.co # for Google, use https://accounts.google.com
+OPENID_TOLERANCE=
+OPENID_RESOURCE=
diff --git a/.github/workflows/build-image.yml b/.github/workflows/build-image.yml
@@ -61,6 +61,9 @@ jobs:
           username: ${{ github.repository_owner }}
           password: ${{ secrets.GITHUB_TOKEN }}
 
+      - name: Inject slug/short variables
+        uses: rlespinasse/[email protected]
+
       - name: Build and Publish Docker Image with DB
         uses: docker/build-push-action@v5
         with:
@@ -70,8 +73,11 @@ jobs:
           tags: ${{ steps.meta.outputs.tags }}
           labels: ${{ steps.meta.outputs.labels }}
           platforms: linux/amd64,linux/arm64
+          cache-from: type=gha
+          cache-to: type=gha,mode=max
           build-args: |
             INCLUDE_DB=true
+            PUBLIC_COMMIT_SHA=${{ env.GITHUB_SHA_SHORT }}
   build-and-publish-image-nodb:
     runs-on: ubuntu-latest
     steps:
@@ -115,6 +121,9 @@ jobs:
           username: ${{ github.repository_owner }}
           password: ${{ secrets.GITHUB_TOKEN }}
 
+      - name: Inject slug/short variables
+        uses: rlespinasse/[email protected]
+
       - name: Build and Publish Docker Image without DB
         uses: docker/build-push-action@v5
         with:
@@ -124,5 +133,8 @@ jobs:
           tags: ${{ steps.meta.outputs.tags }}
           labels: ${{ steps.meta.outputs.labels }}
           platforms: linux/amd64,linux/arm64
+          cache-from: type=gha
+          cache-to: type=gha,mode=max
           build-args: |
             INCLUDE_DB=false
+            PUBLIC_COMMIT_SHA=${{ env.GITHUB_SHA_SHORT }}
diff --git a/.github/workflows/deploy-prod.yml b/.github/workflows/deploy-prod.yml
@@ -29,6 +29,9 @@ jobs:
       - name: Set up Docker Buildx
         uses: docker/setup-buildx-action@v3
 
+      - name: Inject slug/short variables
+        uses: rlespinasse/[email protected]
+
       - name: Build and Publish HuggingChat image
         uses: docker/build-push-action@v5
         with:
@@ -45,6 +48,7 @@ jobs:
             INCLUDE_DB=false
             APP_BASE=/chat
             PUBLIC_APP_COLOR=yellow
+            PUBLIC_COMMIT_SHA=${{ env.GITHUB_SHA_SHORT }}
   deploy:
     name: Deploy on prod
     runs-on: ubuntu-latest