From 03f00c9e6f98583dd0e9b68a122e735c0c716ddc Mon Sep 17 00:00:00 2001
From: Zhichang Yu <yuzhichang@gmail.com>
Date: Tue, 10 Dec 2024 16:32:58 +0800
Subject: [PATCH 1/2] Rename page_num_list, top_list, position_list (#3940)

### What problem does this PR solve?

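Rename the chunk fields page_num_list, top_list and position_list to
page_num_int, top_int and position_int. Their values are now passed as
Python lists instead of JSON-encoded strings; the Infinity connector
serializes them to '_'-joined hex strings on insert/update and decodes
them back into lists when reading fields.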

### Type of change

- [x] Refactoring
---
 Dockerfile                 | 16 +++++++++++---
 api/apps/chunk_app.py      |  2 +-
 api/apps/sdk/doc.py        |  2 +-
 conf/infinity_mapping.json |  6 ++---
 graphrag/search.py         |  2 +-
 rag/app/presentation.py    | 14 +++++-------
 rag/nlp/__init__.py        | 19 ++++++++--------
 rag/nlp/search.py          |  9 ++++----
 rag/svr/task_executor.py   |  6 ++---
 rag/utils/es_conn.py       | 10 +++++++--
 rag/utils/infinity_conn.py | 45 +++++++++++++++++++++++++++++++++-----
 11 files changed, 89 insertions(+), 42 deletions(-)

diff --git a/Dockerfile b/Dockerfile
index 3e316e87a1..c8f3e7f01a 100644
--- a/Dockerfile
+++ b/Dockerfile
@@ -34,9 +34,15 @@ RUN --mount=type=bind,from=infiniflow/ragflow_deps:latest,source=/,target=/deps
     cp /deps/cl100k_base.tiktoken /ragflow/9b5ad71b2ce5302211f9c61530b329a4922fc6a4
 
 ENV TIKA_SERVER_JAR="file:///ragflow/tika-server-standard-3.0.0.jar"
+ENV DEBIAN_FRONTEND=noninteractive
 
 # Setup apt
-# cv2 requires libGL.so.1
+# Python package and implicit dependencies:
+# opencv-python: libglib2.0-0 libglx-mesa0 libgl1
+# aspose-slides: pkg-config libicu-dev libgdiplus         libssl1.1_1.1.1f-1ubuntu2_amd64.deb
+# python-pptx:   default-jdk                              tika-server-standard-3.0.0.jar
+# selenium:      libatk-bridge2.0-0                       chrome-linux64-121-0-6167-85
+# Building C extensions: libpython3-dev libgtk-4-1 libnss3 xdg-utils libgbm-dev
 RUN --mount=type=cache,id=ragflow_apt,target=/var/cache/apt,sharing=locked \
     if [ "$NEED_MIRROR" == "1" ]; then \
         sed -i 's|http://archive.ubuntu.com|https://mirrors.tuna.tsinghua.edu.cn|g' /etc/apt/sources.list; \
@@ -47,8 +53,12 @@ RUN --mount=type=cache,id=ragflow_apt,target=/var/cache/apt,sharing=locked \
     apt update && \
     apt --no-install-recommends install -y ca-certificates && \
     apt update && \
-    DEBIAN_FRONTEND=noninteractive apt install -y curl libpython3-dev nginx libglib2.0-0 libglx-mesa0 pkg-config libicu-dev libgdiplus default-jdk python3-pip pipx \
-    libatk-bridge2.0-0 libgtk-4-1 libnss3 xdg-utils unzip libgbm-dev wget git nginx libgl1 vim less
+    apt install -y libglib2.0-0 libglx-mesa0 libgl1 && \
+    apt install -y pkg-config libicu-dev libgdiplus && \
+    apt install -y default-jdk && \
+    apt install -y libatk-bridge2.0-0 && \
+    apt install -y libpython3-dev libgtk-4-1 libnss3 xdg-utils libgbm-dev && \
+    apt install -y python3-pip pipx nginx unzip curl wget git vim less
 
 RUN if [ "$NEED_MIRROR" == "1" ]; then \
         pip3 config set global.index-url https://pypi.tuna.tsinghua.edu.cn/simple && \
diff --git a/api/apps/chunk_app.py b/api/apps/chunk_app.py
index d60483ad44..6dc1f9b646 100644
--- a/api/apps/chunk_app.py
+++ b/api/apps/chunk_app.py
@@ -71,7 +71,7 @@ def list_chunk():
                 "question_kwd": sres.field[id].get("question_kwd", []),
                 "image_id": sres.field[id].get("img_id", ""),
                 "available_int": int(sres.field[id].get("available_int", 1)),
-                "positions": json.loads(sres.field[id].get("position_list", "[]")),
+                "positions": sres.field[id].get("position_int", []),
             }
             assert isinstance(d["positions"], list)
             assert len(d["positions"]) == 0 or (isinstance(d["positions"][0], list) and len(d["positions"][0]) == 5)
diff --git a/api/apps/sdk/doc.py b/api/apps/sdk/doc.py
index 6bcbe58e72..7fa6458461 100644
--- a/api/apps/sdk/doc.py
+++ b/api/apps/sdk/doc.py
@@ -846,7 +846,7 @@ def list_chunks(tenant_id, dataset_id, document_id):
                 "question_kwd": sres.field[id].get("question_kwd", []),
                 "img_id": sres.field[id].get("img_id", ""),
                 "available_int": sres.field[id].get("available_int", 1),
-                "positions": sres.field[id].get("position_int", "").split("\t"),
+                "positions": sres.field[id].get("position_int", []),
             }
             if len(d["positions"]) % 5 == 0:
                 poss = []
diff --git a/conf/infinity_mapping.json b/conf/infinity_mapping.json
index a9d1d4f0ee..118f205f99 100644
--- a/conf/infinity_mapping.json
+++ b/conf/infinity_mapping.json
@@ -16,9 +16,9 @@
 	"content_with_weight": {"type": "varchar", "default": ""},
 	"content_ltks": {"type": "varchar", "default": ""},
 	"content_sm_ltks": {"type": "varchar", "default": ""},
-	"page_num_list": {"type": "varchar", "default": ""},
-	"top_list": {"type": "varchar", "default": ""},
-	"position_list": {"type": "varchar", "default": ""},
+	"page_num_int": {"type": "varchar", "default": ""},
+	"top_int": {"type": "varchar", "default": ""},
+	"position_int": {"type": "varchar", "default": ""},
 	"weight_int": {"type": "integer", "default": 0},
 	"weight_flt": {"type": "float", "default": 0.0},
 	"rank_int": {"type": "integer", "default": 0},
diff --git a/graphrag/search.py b/graphrag/search.py
index 4e9f444817..a803494bbc 100644
--- a/graphrag/search.py
+++ b/graphrag/search.py
@@ -58,7 +58,7 @@ def merge_into_first(sres, title="") -> dict[str, str]:
         matchDense = self.get_vector(qst, emb_mdl, 1024, req.get("similarity", 0.1))
         q_vec = matchDense.embedding_data
         src = req.get("fields", ["docnm_kwd", "content_ltks", "kb_id", "img_id", "title_tks", "important_kwd",
-                                 "doc_id", f"q_{len(q_vec)}_vec", "position_list", "name_kwd",
+                                 "doc_id", f"q_{len(q_vec)}_vec", "position_int", "name_kwd",
                                  "available_int", "content_with_weight",
                                  "weight_int", "weight_flt"
                                  ])
diff --git a/rag/app/presentation.py b/rag/app/presentation.py
index bebf64bff9..a3305bdc11 100644
--- a/rag/app/presentation.py
+++ b/rag/app/presentation.py
@@ -20,7 +20,6 @@
 from rag.nlp import rag_tokenizer
 from deepdoc.parser import PdfParser, PptParser, PlainParser
 from PyPDF2 import PdfReader as pdf2_read
-import json
 
 
 class Ppt(PptParser):
@@ -109,9 +108,9 @@ def chunk(filename, binary=None, from_page=0, to_page=100000,
             d = copy.deepcopy(doc)
             pn += from_page
             d["image"] = img
-            d["page_num_list"] = json.dumps([pn + 1])
-            d["top_list"] = json.dumps([0])
-            d["position_list"] = json.dumps([(pn + 1, 0, img.size[0], 0, img.size[1])])
+            d["page_num_int"] = [pn + 1]
+            d["top_int"] = [0]
+            d["position_int"] = [(pn + 1, 0, img.size[0], 0, img.size[1])]
             tokenize(d, txt, eng)
             res.append(d)
         return res
@@ -125,10 +124,9 @@ def chunk(filename, binary=None, from_page=0, to_page=100000,
             pn += from_page
             if img:
                 d["image"] = img
-            d["page_num_list"] = json.dumps([pn + 1])
-            d["top_list"] = json.dumps([0])
-            d["position_list"] = json.dumps([
-                (pn + 1, 0, img.size[0] if img else 0, 0, img.size[1] if img else 0)])
+            d["page_num_int"] = [pn + 1]
+            d["top_int"] = [0]
+            d["position_int"] = [(pn + 1, 0, img.size[0] if img else 0, 0, img.size[1] if img else 0)]
             tokenize(d, txt, eng)
             res.append(d)
         return res
diff --git a/rag/nlp/__init__.py b/rag/nlp/__init__.py
index 69573375a8..2aaf98aab0 100644
--- a/rag/nlp/__init__.py
+++ b/rag/nlp/__init__.py
@@ -22,7 +22,6 @@
 from . import rag_tokenizer
 import re
 import copy
-import json
 import roman_numbers as r
 from word2number import w2n
 from cn2an import cn2an
@@ -311,16 +310,16 @@ def tokenize_table(tbls, doc, eng, batch_size=10):
 def add_positions(d, poss):
     if not poss:
         return
-    page_num_list = []
-    position_list = []
-    top_list = []
+    page_num_int = []
+    position_int = []
+    top_int = []
     for pn, left, right, top, bottom in poss:
-        page_num_list.append(int(pn + 1))
-        top_list.append(int(top))
-        position_list.append((int(pn + 1), int(left), int(right), int(top), int(bottom)))
-    d["page_num_list"] = json.dumps(page_num_list)
-    d["position_list"] = json.dumps(position_list)
-    d["top_list"] = json.dumps(top_list)
+        page_num_int.append(int(pn + 1))
+        top_int.append(int(top))
+        position_int.append((int(pn + 1), int(left), int(right), int(top), int(bottom)))
+    d["page_num_int"] = page_num_int
+    d["position_int"] = position_int
+    d["top_int"] = top_int
 
 
 def remove_contents_table(sections, eng=False):
diff --git a/rag/nlp/search.py b/rag/nlp/search.py
index c8de4df056..9f877ef4fb 100644
--- a/rag/nlp/search.py
+++ b/rag/nlp/search.py
@@ -16,7 +16,6 @@
 
 import logging
 import re
-import json
 from dataclasses import dataclass
 
 from rag.utils import rmSpace
@@ -74,7 +73,7 @@ def search(self, req, idx_names: str | list[str], kb_ids: list[str], emb_mdl=Non
         offset, limit = pg * ps, (pg + 1) * ps
 
         src = req.get("fields", ["docnm_kwd", "content_ltks", "kb_id", "img_id", "title_tks", "important_kwd",
-                                 "doc_id", "position_list", "knowledge_graph_kwd", "question_kwd", "question_tks",
+                                 "doc_id", "page_num_int", "top_int", "create_timestamp_flt", "knowledge_graph_kwd", "question_kwd", "question_tks",
                                  "available_int", "content_with_weight", "pagerank_fea"])
         kwds = set([])
 
@@ -82,6 +81,8 @@ def search(self, req, idx_names: str | list[str], kb_ids: list[str], emb_mdl=Non
         q_vec = []
         if not qst:
             if req.get("sort"):
+                orderBy.asc("page_num_int")
+                orderBy.asc("top_int")
                 orderBy.desc("create_timestamp_flt")
             res = self.dataStore.search(src, [], filters, [], orderBy, offset, limit, idx_names, kb_ids)
             total=self.dataStore.getTotal(res)
@@ -340,7 +341,7 @@ def floor_sim(score):
             chunk = sres.field[id]
             dnm = chunk["docnm_kwd"]
             did = chunk["doc_id"]
-            position_list = chunk.get("position_list", "[]")
+            position_int = chunk.get("position_int", [])
             d = {
                 "chunk_id": id,
                 "content_ltks": chunk["content_ltks"],
@@ -354,7 +355,7 @@ def floor_sim(score):
                 "vector_similarity": vsim[i],
                 "term_similarity": tsim[i],
                 "vector": chunk.get(vector_column, zero_vector),
-                "positions": json.loads(position_list)
+                "positions": position_int,
             }
             if highlight and sres.highlight:
                 if id in sres.highlight:
diff --git a/rag/svr/task_executor.py b/rag/svr/task_executor.py
index 606bb07571..902c1e31ae 100644
--- a/rag/svr/task_executor.py
+++ b/rag/svr/task_executor.py
@@ -211,9 +211,9 @@ def build_chunks(task, progress_callback):
         if not d.get("image"):
             _ = d.pop("image", None)
             d["img_id"] = ""
-            d["page_num_list"] = json.dumps([])
-            d["position_list"] = json.dumps([])
-            d["top_list"] = json.dumps([])
+            d["page_num_int"] = []
+            d["position_int"] = []
+            d["top_int"] = []
             docs.append(d)
             continue
 
diff --git a/rag/utils/es_conn.py b/rag/utils/es_conn.py
index a473833f45..35d6428695 100644
--- a/rag/utils/es_conn.py
+++ b/rag/utils/es_conn.py
@@ -185,8 +185,14 @@ def search(self, selectFields: list[str], highlightFields: list[str], condition:
             orders = list()
             for field, order in orderBy.fields:
                 order = "asc" if order == 0 else "desc"
-                orders.append({field: {"order": order, "unmapped_type": "float",
-                                       "mode": "avg", "numeric_type": "double"}})
+                if field in ["page_num_int", "top_int"]:
+                    order_info = {"order": order, "unmapped_type": "float",
+                                "mode": "avg", "numeric_type": "double"}
+                elif field.endswith("_int") or field.endswith("_flt"):
+                    order_info = {"order": order, "unmapped_type": "float"}
+                else:
+                    order_info = {"order": order, "unmapped_type": "text"}
+                orders.append({field: order_info})
             s = s.sort(*orders)
 
         if limit > 0:
diff --git a/rag/utils/infinity_conn.py b/rag/utils/infinity_conn.py
index 5c0e2ef695..227c0bc6a4 100644
--- a/rag/utils/infinity_conn.py
+++ b/rag/utils/infinity_conn.py
@@ -297,7 +297,7 @@ def search(
                 df_list.append(kb_res)
         self.connPool.release_conn(inf_conn)
         res = concat_dataframes(df_list, selectFields)
-        logger.debug("INFINITY search tables: " + str(table_list))
+        logger.debug(f"INFINITY search tables: {str(table_list)}, result: {str(res)}")
         return res
 
     def get(
@@ -307,8 +307,10 @@ def get(
         db_instance = inf_conn.get_database(self.dbName)
         df_list = list()
         assert isinstance(knowledgebaseIds, list)
+        table_list = list()
         for knowledgebaseId in knowledgebaseIds:
             table_name = f"{indexName}_{knowledgebaseId}"
+            table_list.append(table_name)
             table_instance = db_instance.get_table(table_name)
             kb_res = table_instance.output(["*"]).filter(f"id = '{chunkId}'").to_pl()
             if len(kb_res) != 0 and kb_res.shape[0] > 0:
@@ -316,6 +318,7 @@ def get(
 
         self.connPool.release_conn(inf_conn)
         res = concat_dataframes(df_list, ["id"])
+        logger.debug(f"INFINITY get tables: {str(table_list)}, result: {str(res)}")
         res_fields = self.getFields(res, res.columns)
         return res_fields.get(chunkId, None)
 
@@ -349,15 +352,22 @@ def insert(
             for k, v in d.items():
                 if k.endswith("_kwd") and isinstance(v, list):
                     d[k] = " ".join(v)
-                if k == 'kb_id':
+                elif k == 'kb_id':
                     if isinstance(d[k], list):
                         d[k] = d[k][0] # since d[k] is a list, but we need a str
+                elif k == "position_int":
+                    assert isinstance(v, list)
+                    arr = [num for row in v for num in row]
+                    d[k] = "_".join(f"{num:08x}" for num in arr)
+                elif k in ["page_num_int", "top_int", "position_int"]:
+                    assert isinstance(v, list)
+                    d[k] = "_".join(f"{num:08x}" for num in v)
         ids = ["'{}'".format(d["id"]) for d in documents]
         str_ids = ", ".join(ids)
         str_filter = f"id IN ({str_ids})"
         table_instance.delete(str_filter)
         # for doc in documents:
-        #     logger.info(f"insert position_list: {doc['position_list']}")
+        #     logger.info(f"insert position_int: {doc['position_int']}")
         # logger.info(f"InfinityConnection.insert {json.dumps(documents)}")
         table_instance.insert(documents)
         self.connPool.release_conn(inf_conn)
@@ -367,8 +377,8 @@ def insert(
     def update(
             self, condition: dict, newValue: dict, indexName: str, knowledgebaseId: str
     ) -> bool:
-        # if 'position_list' in newValue:
-        #     logger.info(f"upsert position_list: {newValue['position_list']}")
+        # if 'position_int' in newValue:
+        #     logger.info(f"update position_int: {newValue['position_int']}")
         inf_conn = self.connPool.get_conn()
         db_instance = inf_conn.get_database(self.dbName)
         table_name = f"{indexName}_{knowledgebaseId}"
@@ -377,6 +387,16 @@ def update(
         for k, v in newValue.items():
             if k.endswith("_kwd") and isinstance(v, list):
                 newValue[k] = " ".join(v)
+            elif k == 'kb_id':
+                if isinstance(newValue[k], list):
+                    newValue[k] = newValue[k][0] # since d[k] is a list, but we need a str
+            elif k == "position_int":
+                assert isinstance(v, list)
+                arr = [num for row in v for num in row]
+                newValue[k] = "_".join(f"{num:08x}" for num in arr)
+            elif k in ["page_num_int", "top_int"]:
+                assert isinstance(v, list)
+                newValue[k] = "_".join(f"{num:08x}" for num in v)
         table_instance.update(filter, newValue)
         self.connPool.release_conn(inf_conn)
         return True
@@ -423,9 +443,22 @@ def getFields(self, res, fields: list[str]) -> list[str, dict]:
                 v = res[fieldnm][i]
                 if isinstance(v, Series):
                     v = list(v)
-                elif fieldnm == "important_kwd":
+                elif fieldnm.endswith("_kwd"):
                     assert isinstance(v, str)
                     v = v.split()
+                elif fieldnm == "position_int":
+                    assert isinstance(v, str)
+                    if v:
+                        arr = [int(hex_val, 16) for hex_val in v.split('_')]
+                        v = [arr[i:i + 4] for i in range(0, len(arr), 4)]
+                    else:
+                        v = []
+                elif fieldnm in ["page_num_int", "top_int"]:
+                    assert isinstance(v, str)
+                    if v:
+                        v = [int(hex_val, 16) for hex_val in v.split('_')]
+                    else:
+                        v = []
                 else:
                     if not isinstance(v, str):
                         v = str(v)

From fc4e644e5f174d0364eb3137fe31be0c78d91ee0 Mon Sep 17 00:00:00 2001
From: balibabu <cike8899@users.noreply.github.com>
Date: Tue, 10 Dec 2024 16:36:16 +0800
Subject: [PATCH 2/2] Feat: Modify the data structure of the chunk in the
 conversation #3909 (#3955)

### What problem does this PR solve?

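Feat: Modify the data structure of the chunk in the conversation (#3909).
Components that render conversation reference chunks (message item, PDF
drawer, PDF previewer) are now typed against `IReferenceChunk` from
`@/interfaces/database/chat`, either replacing `IChunk` or alongside it.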

### Type of change


- [x] New Feature (non-breaking change which adds functionality)
---
 .../api-service/chat-api-key-modal/index.tsx  |   2 +-
 .../chat-overview-modal/api-content.tsx       |  17 +--
 .../api-service/embed-modal/index.less        |   4 +
 .../api-service/embed-modal/index.tsx         |  35 +++++-
 web/src/components/api-service/hooks.ts       |  55 ++++++---
 web/src/components/message-item/index.tsx     |   5 +-
 web/src/components/pdf-drawer/hooks.ts        |   8 +-
 web/src/components/pdf-drawer/index.tsx       |   3 +-
 web/src/components/pdf-previewer/index.tsx    |   7 +-
 web/src/hooks/chat-hooks.ts                   |   8 +-
 web/src/hooks/document-hooks.ts               |   5 +-
 web/src/hooks/logic-hooks.ts                  |   2 +
 web/src/hooks/user-setting-hooks.tsx          |  24 +++-
 web/src/interfaces/database/chat.ts           |  19 +++-
 web/src/locales/config.ts                     |   2 +-
 web/src/locales/en.ts                         |   1 +
 web/src/locales/ja.ts                         |  33 +++---
 web/src/locales/zh-traditional.ts             |   1 +
 web/src/locales/zh.ts                         |   1 +
 web/src/pages/chat/index.tsx                  |  35 +++---
 web/src/pages/chat/markdown-content/index.tsx |  18 +--
 web/src/pages/chat/share/large.tsx            |  31 +++--
 web/src/pages/chat/shared-hooks.ts            | 107 ++++++------------
 web/src/pages/flow/header/index.tsx           |  47 ++++----
 web/src/pages/flow/hooks.tsx                  |  14 +++
 web/src/utils/authorization-util.ts           |   6 +-
 web/src/utils/document-util.ts                |  10 +-
 27 files changed, 301 insertions(+), 199 deletions(-)

diff --git a/web/src/components/api-service/chat-api-key-modal/index.tsx b/web/src/components/api-service/chat-api-key-modal/index.tsx
index e586d37273..2497f0fa26 100644
--- a/web/src/components/api-service/chat-api-key-modal/index.tsx
+++ b/web/src/components/api-service/chat-api-key-modal/index.tsx
@@ -63,7 +63,7 @@ const ChatApiKeyModal = ({
         <Button
           onClick={createToken}
           loading={creatingLoading}
-          disabled={tokenList.length > 0}
+          disabled={tokenList?.length > 0}
         >
           {t('createNewKey')}
         </Button>
diff --git a/web/src/components/api-service/chat-overview-modal/api-content.tsx b/web/src/components/api-service/chat-overview-modal/api-content.tsx
index 033e28e8f9..cd00e69fe8 100644
--- a/web/src/components/api-service/chat-overview-modal/api-content.tsx
+++ b/web/src/components/api-service/chat-overview-modal/api-content.tsx
@@ -3,8 +3,7 @@ import apiDoc from '@parent/docs/references/http_api_reference.md';
 import MarkdownPreview from '@uiw/react-markdown-preview';
 import { Button, Card, Flex, Space } from 'antd';
 import ChatApiKeyModal from '../chat-api-key-modal';
-import EmbedModal from '../embed-modal';
-import { usePreviewChat, useShowEmbedModal } from '../hooks';
+import { usePreviewChat } from '../hooks';
 import BackendServiceApi from './backend-service-api';
 
 const ApiContent = ({
@@ -22,10 +21,10 @@ const ApiContent = ({
     hideModal: hideApiKeyModal,
     showModal: showApiKeyModal,
   } = useSetModalState();
-  const { embedVisible, hideEmbedModal, showEmbedModal, embedToken } =
-    useShowEmbedModal(idKey, id);
+  // const { embedVisible, hideEmbedModal, showEmbedModal, embedToken } =
+  //   useShowEmbedModal(idKey);
 
-  const { handlePreview } = usePreviewChat(idKey, id);
+  const { handlePreview } = usePreviewChat(idKey);
 
   return (
     <div>
@@ -36,7 +35,9 @@ const ApiContent = ({
             <Flex gap={8} vertical>
               <Space size={'middle'}>
                 <Button onClick={handlePreview}>{t('preview')}</Button>
-                <Button onClick={showEmbedModal}>{t('embedded')}</Button>
+                {/* <Button onClick={() => showEmbedModal(id)}>
+                  {t('embedded')}
+                </Button> */}
               </Space>
             </Flex>
           </Card>
@@ -50,13 +51,13 @@ const ApiContent = ({
           idKey={idKey}
         ></ChatApiKeyModal>
       )}
-      {embedVisible && (
+      {/* {embedVisible && (
         <EmbedModal
           token={embedToken}
           visible={embedVisible}
           hideModal={hideEmbedModal}
         ></EmbedModal>
-      )}
+      )} */}
     </div>
   );
 };
diff --git a/web/src/components/api-service/embed-modal/index.less b/web/src/components/api-service/embed-modal/index.less
index b2c0cfbba8..cf39347008 100644
--- a/web/src/components/api-service/embed-modal/index.less
+++ b/web/src/components/api-service/embed-modal/index.less
@@ -6,3 +6,7 @@
   padding: 10px;
   background-color: #ffffff09;
 }
+
+.id {
+  .linkText();
+}
diff --git a/web/src/components/api-service/embed-modal/index.tsx b/web/src/components/api-service/embed-modal/index.tsx
index 7c142b7205..1caee0a644 100644
--- a/web/src/components/api-service/embed-modal/index.tsx
+++ b/web/src/components/api-service/embed-modal/index.tsx
@@ -1,21 +1,33 @@
 import CopyToClipboard from '@/components/copy-to-clipboard';
 import HightLightMarkdown from '@/components/highlight-markdown';
+import { SharedFrom } from '@/constants/chat';
 import { useTranslate } from '@/hooks/common-hooks';
 import { IModalProps } from '@/interfaces/common';
-import { Card, Modal, Tabs, TabsProps } from 'antd';
+import { Card, Modal, Tabs, TabsProps, Typography } from 'antd';
+
 import styles from './index.less';
 
+const { Paragraph, Link } = Typography;
+
 const EmbedModal = ({
   visible,
   hideModal,
   token = '',
-}: IModalProps<any> & { token: string }) => {
+  form,
+  beta = '',
+  isAgent,
+}: IModalProps<any> & {
+  token: string;
+  form: SharedFrom;
+  beta: string;
+  isAgent: boolean;
+}) => {
   const { t } = useTranslate('chat');
 
   const text = `
   ~~~ html
   <iframe
-  src="${location.origin}/chat/share?shared_id=${token}"
+  src="${location.origin}/chat/share?shared_id=${token}&from=${form}&auth=${beta}"
   style="width: 100%; height: 100%; min-height: 600px"
   frameborder="0"
 >
@@ -63,6 +75,23 @@ const EmbedModal = ({
       onCancel={hideModal}
     >
       <Tabs defaultActiveKey="1" items={items} onChange={onChange} />
+      <div className="text-base font-medium mt-4 mb-1">
+        {t(isAgent ? 'flow' : 'chat', { keyPrefix: 'header' })}
+        <span className="ml-1 inline-block">ID</span>
+      </div>
+      <Paragraph copyable={{ text: token }} className={styles.id}>
+        {token}
+      </Paragraph>
+      <Link
+        href={
+          isAgent
+            ? 'https://ragflow.io/docs/dev/http_api_reference#create-session-with-an-agent'
+            : 'https://ragflow.io/docs/dev/http_api_reference#create-session-with-chat-assistant'
+        }
+        target="_blank"
+      >
+        {t('howUseId')}
+      </Link>
     </Modal>
   );
 };
diff --git a/web/src/components/api-service/hooks.ts b/web/src/components/api-service/hooks.ts
index 006cbe43ef..16878d84d8 100644
--- a/web/src/components/api-service/hooks.ts
+++ b/web/src/components/api-service/hooks.ts
@@ -6,6 +6,7 @@ import {
 } from '@/hooks/common-hooks';
 import {
   useCreateSystemToken,
+  useFetchManualSystemTokenList,
   useFetchSystemTokenList,
   useRemoveSystemToken,
 } from '@/hooks/user-setting-hooks';
@@ -17,9 +18,7 @@ import { useCallback } from 'react';
 export const useOperateApiKey = (idKey: string, dialogId?: string) => {
   const { removeToken } = useRemoveSystemToken();
   const { createToken, loading: creatingLoading } = useCreateSystemToken();
-  const { data: tokenList, loading: listLoading } = useFetchSystemTokenList({
-    [idKey]: dialogId,
-  });
+  const { data: tokenList, loading: listLoading } = useFetchSystemTokenList();
 
   const showDeleteConfirm = useShowDeleteConfirm();
 
@@ -72,49 +71,68 @@ export const useShowTokenEmptyError = () => {
   return { showTokenEmptyError };
 };
 
+export const useShowBetaEmptyError = () => {
+  const { t } = useTranslate('chat');
+
+  const showBetaEmptyError = useCallback(() => {
+    message.error(t('betaError'));
+  }, [t]);
+  return { showBetaEmptyError };
+};
+
 const getUrlWithToken = (token: string, from: string = 'chat') => {
   const { protocol, host } = window.location;
   return `${protocol}//${host}/chat/share?shared_id=${token}&from=${from}`;
 };
 
-const useFetchTokenListBeforeOtherStep = (idKey: string, dialogId?: string) => {
+const useFetchTokenListBeforeOtherStep = () => {
   const { showTokenEmptyError } = useShowTokenEmptyError();
+  const { showBetaEmptyError } = useShowBetaEmptyError();
+
+  const { data: tokenList, fetchSystemTokenList } =
+    useFetchManualSystemTokenList();
 
-  const { data: tokenList, refetch } = useFetchSystemTokenList({
-    [idKey]: dialogId,
-  });
+  let token = '',
+    beta = '';
 
-  const token =
+  if (Array.isArray(tokenList) && tokenList.length > 0) {
+    token = tokenList[0].token;
+    beta = tokenList[0].beta;
+  }
+
+  token =
     Array.isArray(tokenList) && tokenList.length > 0 ? tokenList[0].token : '';
 
   const handleOperate = useCallback(async () => {
-    const ret = await refetch();
-    const list = ret.data;
+    const ret = await fetchSystemTokenList();
+    const list = ret;
     if (Array.isArray(list) && list.length > 0) {
+      if (!list[0].beta) {
+        showBetaEmptyError();
+        return false;
+      }
       return list[0]?.token;
     } else {
       showTokenEmptyError();
       return false;
     }
-  }, [showTokenEmptyError, refetch]);
+  }, [fetchSystemTokenList, showBetaEmptyError, showTokenEmptyError]);
 
   return {
     token,
+    beta,
     handleOperate,
   };
 };
 
-export const useShowEmbedModal = (idKey: string, dialogId?: string) => {
+export const useShowEmbedModal = () => {
   const {
     visible: embedVisible,
     hideModal: hideEmbedModal,
     showModal: showEmbedModal,
   } = useSetModalState();
 
-  const { handleOperate, token } = useFetchTokenListBeforeOtherStep(
-    idKey,
-    dialogId,
-  );
+  const { handleOperate, token, beta } = useFetchTokenListBeforeOtherStep();
 
   const handleShowEmbedModal = useCallback(async () => {
     const succeed = await handleOperate();
@@ -128,11 +146,12 @@ export const useShowEmbedModal = (idKey: string, dialogId?: string) => {
     hideEmbedModal,
     embedVisible,
     embedToken: token,
+    beta,
   };
 };
 
-export const usePreviewChat = (idKey: string, dialogId?: string) => {
-  const { handleOperate } = useFetchTokenListBeforeOtherStep(idKey, dialogId);
+export const usePreviewChat = (idKey: string) => {
+  const { handleOperate } = useFetchTokenListBeforeOtherStep();
 
   const open = useCallback(
     (t: string) => {
diff --git a/web/src/components/message-item/index.tsx b/web/src/components/message-item/index.tsx
index eab098056c..9e152c6072 100644
--- a/web/src/components/message-item/index.tsx
+++ b/web/src/components/message-item/index.tsx
@@ -1,8 +1,7 @@
 import { ReactComponent as AssistantIcon } from '@/assets/svg/assistant.svg';
 import { MessageType } from '@/constants/chat';
 import { useSetModalState } from '@/hooks/common-hooks';
-import { IReference } from '@/interfaces/database/chat';
-import { IChunk } from '@/interfaces/database/knowledge';
+import { IReference, IReferenceChunk } from '@/interfaces/database/chat';
 import classNames from 'classnames';
 import { memo, useCallback, useEffect, useMemo, useState } from 'react';
 
@@ -31,7 +30,7 @@ interface IProps extends Partial<IRemoveMessageById>, IRegenerateMessage {
   sendLoading?: boolean;
   nickname?: string;
   avatar?: string;
-  clickDocumentButton?: (documentId: string, chunk: IChunk) => void;
+  clickDocumentButton?: (documentId: string, chunk: IReferenceChunk) => void;
   index: number;
   showLikeButton?: boolean;
 }
diff --git a/web/src/components/pdf-drawer/hooks.ts b/web/src/components/pdf-drawer/hooks.ts
index 022b29f84d..fe65009aa0 100644
--- a/web/src/components/pdf-drawer/hooks.ts
+++ b/web/src/components/pdf-drawer/hooks.ts
@@ -1,14 +1,16 @@
 import { useSetModalState } from '@/hooks/common-hooks';
-import { IChunk } from '@/interfaces/database/knowledge';
+import { IReferenceChunk } from '@/interfaces/database/chat';
 import { useCallback, useState } from 'react';
 
 export const useClickDrawer = () => {
   const { visible, showModal, hideModal } = useSetModalState();
-  const [selectedChunk, setSelectedChunk] = useState<IChunk>({} as IChunk);
+  const [selectedChunk, setSelectedChunk] = useState<IReferenceChunk>(
+    {} as IReferenceChunk,
+  );
   const [documentId, setDocumentId] = useState<string>('');
 
   const clickDocumentButton = useCallback(
-    (documentId: string, chunk: IChunk) => {
+    (documentId: string, chunk: IReferenceChunk) => {
       showModal();
       setSelectedChunk(chunk);
       setDocumentId(documentId);
diff --git a/web/src/components/pdf-drawer/index.tsx b/web/src/components/pdf-drawer/index.tsx
index 77aa85358c..a584c2aa4d 100644
--- a/web/src/components/pdf-drawer/index.tsx
+++ b/web/src/components/pdf-drawer/index.tsx
@@ -1,11 +1,12 @@
 import { IModalProps } from '@/interfaces/common';
+import { IReferenceChunk } from '@/interfaces/database/chat';
 import { IChunk } from '@/interfaces/database/knowledge';
 import { Drawer } from 'antd';
 import DocumentPreviewer from '../pdf-previewer';
 
 interface IProps extends IModalProps<any> {
   documentId: string;
-  chunk: IChunk;
+  chunk: IChunk | IReferenceChunk;
 }
 
 export const PdfDrawer = ({
diff --git a/web/src/components/pdf-previewer/index.tsx b/web/src/components/pdf-previewer/index.tsx
index 6c470aad92..1bb44383e4 100644
--- a/web/src/components/pdf-previewer/index.tsx
+++ b/web/src/components/pdf-previewer/index.tsx
@@ -2,7 +2,9 @@ import {
   useGetChunkHighlights,
   useGetDocumentUrl,
 } from '@/hooks/document-hooks';
+import { IReferenceChunk } from '@/interfaces/database/chat';
 import { IChunk } from '@/interfaces/database/knowledge';
+import FileError from '@/pages/document-viewer/file-error';
 import { Skeleton } from 'antd';
 import { useEffect, useRef, useState } from 'react';
 import {
@@ -13,13 +15,12 @@ import {
   PdfLoader,
   Popup,
 } from 'react-pdf-highlighter';
-
-import FileError from '@/pages/document-viewer/file-error';
 import { useCatchDocumentError } from './hooks';
+
 import styles from './index.less';
 
 interface IProps {
-  chunk: IChunk;
+  chunk: IChunk | IReferenceChunk;
   documentId: string;
   visible: boolean;
 }
diff --git a/web/src/hooks/chat-hooks.ts b/web/src/hooks/chat-hooks.ts
index 7346c04753..2cb461e37b 100644
--- a/web/src/hooks/chat-hooks.ts
+++ b/web/src/hooks/chat-hooks.ts
@@ -504,11 +504,17 @@ export const useCreateNextSharedConversation = () => {
   return { data, loading, createSharedConversation: mutateAsync };
 };
 
-export const useFetchNextSharedConversation = (conversationId: string) => {
+/** @deprecated No longer used by the shared chat page or its hooks. */
+export const useFetchNextSharedConversation = (
+  conversationId?: string | null,
+) => {
   const { data, isPending: loading } = useQuery({
     queryKey: ['fetchSharedConversation'],
     enabled: !!conversationId,
     queryFn: async () => {
+      if (!conversationId) {
+        return {};
+      }
       const { data } = await chatService.getExternalConversation(
         null,
         conversationId,
diff --git a/web/src/hooks/document-hooks.ts b/web/src/hooks/document-hooks.ts
index 17995b93c7..215d9b1d75 100644
--- a/web/src/hooks/document-hooks.ts
+++ b/web/src/hooks/document-hooks.ts
@@ -1,3 +1,4 @@
+import { IReferenceChunk } from '@/interfaces/database/chat';
 import { IDocumentInfo } from '@/interfaces/database/document';
 import { IChunk } from '@/interfaces/database/knowledge';
 import { IChangeParserConfigRequestBody } from '@/interfaces/request/document';
@@ -32,7 +33,9 @@ export const useGetDocumentUrl = (documentId?: string) => {
   return getDocumentUrl;
 };
 
-export const useGetChunkHighlights = (selectedChunk: IChunk) => {
+export const useGetChunkHighlights = (
+  selectedChunk: IChunk | IReferenceChunk,
+) => {
   const [size, setSize] = useState({ width: 849, height: 1200 });
 
   const highlights: IHighlight[] = useMemo(() => {
diff --git a/web/src/hooks/logic-hooks.ts b/web/src/hooks/logic-hooks.ts
index 4208974929..5c8afebb1e 100644
--- a/web/src/hooks/logic-hooks.ts
+++ b/web/src/hooks/logic-hooks.ts
@@ -12,6 +12,7 @@ import { PaginationProps, message } from 'antd';
 import { FormInstance } from 'antd/lib';
 import axios from 'axios';
 import { EventSourceParserStream } from 'eventsource-parser/stream';
+import { omit } from 'lodash';
 import {
   ChangeEventHandler,
   useCallback,
@@ -336,6 +337,7 @@ export const useSelectDerivedMessages = () => {
           }),
           prompt: answer.prompt,
           audio_binary: answer.audio_binary,
+          ...omit(answer, 'reference'),
         },
       ];
     });
diff --git a/web/src/hooks/user-setting-hooks.tsx b/web/src/hooks/user-setting-hooks.tsx
index 6b14f3536f..2f19cb9c80 100644
--- a/web/src/hooks/user-setting-hooks.tsx
+++ b/web/src/hooks/user-setting-hooks.tsx
@@ -169,17 +169,34 @@ export const useFetchSystemStatus = () => {
   };
 };
 
-export const useFetchSystemTokenList = (params: Record<string, any>) => {
+/** Mutation-based token list fetch: nothing is requested until `fetchSystemTokenList` is called. */
+export const useFetchManualSystemTokenList = () => {
+  const tokenListMutation = useMutation({
+    mutationKey: ['fetchManualSystemTokenList'],
+    mutationFn: async () => {
+      const response = await userService.listToken();
+      // An absent payload is reported as an empty list.
+      return response.data?.data ?? [];
+    },
+  });
+  return {
+    data: tokenListMutation.data,
+    loading: tokenListMutation.isPending,
+    fetchSystemTokenList: tokenListMutation.mutateAsync,
+  };
+};
+
+export const useFetchSystemTokenList = () => {
   const {
     data,
     isFetching: loading,
     refetch,
   } = useQuery<IToken[]>({
-    queryKey: ['fetchSystemTokenList', params],
+    queryKey: ['fetchSystemTokenList'],
     initialData: [],
     gcTime: 0,
     queryFn: async () => {
-      const { data } = await userService.listToken(params);
+      const { data } = await userService.listToken();
 
       return data?.data ?? [];
     },
@@ -213,6 +230,7 @@ export const useRemoveSystemToken = () => {
 
 export const useCreateSystemToken = () => {
   const queryClient = useQueryClient();
+
   const {
     data,
     isPending: loading,
diff --git a/web/src/interfaces/database/chat.ts b/web/src/interfaces/database/chat.ts
index e00d4ed7ed..7b21510cc1 100644
--- a/web/src/interfaces/database/chat.ts
+++ b/web/src/interfaces/database/chat.ts
@@ -1,5 +1,4 @@
 import { MessageType } from '@/constants/chat';
-import { IChunk } from './knowledge';
 
 export interface PromptConfig {
   empty_response: string;
@@ -35,7 +34,7 @@ export interface IDialog {
   description: string;
   icon: string;
   id: string;
-  dialog_id?: string;
+  dialog_id: string;
   kb_ids: string[];
   kb_names: string[];
   language: string;
@@ -75,8 +74,21 @@ export interface Message {
   audio_binary?: string;
 }
 
+export interface IReferenceChunk { // one cited chunk, as listed in IReference.chunks
+  id: string; // used as the React key of the reference popover entry
+  content: string | null; // chunk text; consumers fall back to '' when it is null
+  document_id: string; // matched against `doc_aggs[].doc_id` to find the source document
+  document_name: string;
+  dataset_id: string;
+  image_id: string;
+  similarity: number;
+  vector_similarity: number;
+  term_similarity: number;
+  positions: number[]; // read by buildChunkHighlights when building PDF highlights
+}
+
 export interface IReference {
-  chunks: IChunk[];
+  chunks: IReferenceChunk[];
   doc_aggs: Docagg[];
   total: number;
 }
@@ -117,6 +129,7 @@ export interface IToken {
   token: string;
   update_date?: any;
   update_time?: any;
+  beta: string;
 }
 
 export interface IStats {
diff --git a/web/src/locales/config.ts b/web/src/locales/config.ts
index 0da80e594d..83f6ca42db 100644
--- a/web/src/locales/config.ts
+++ b/web/src/locales/config.ts
@@ -2,11 +2,11 @@ import i18n from 'i18next';
 import LanguageDetector from 'i18next-browser-languagedetector';
 import { initReactI18next } from 'react-i18next';
 
-import { createTranslationTable, flattenObject } from './until';
 import translation_en from './en';
 import translation_es from './es';
 import translation_id from './id';
 import translation_ja from './ja';
+import { createTranslationTable, flattenObject } from './until';
 import translation_vi from './vi';
 import translation_zh from './zh';
 import translation_zh_traditional from './zh-traditional';
diff --git a/web/src/locales/en.ts b/web/src/locales/en.ts
index 06ec1c56fd..cc9fb5bc95 100644
--- a/web/src/locales/en.ts
+++ b/web/src/locales/en.ts
@@ -432,6 +432,7 @@ The above is the content you need to summarize.`,
       partialTitle: 'Partial Embed',
       extensionTitle: 'Chrome Extension',
       tokenError: 'Please create API Token first!',
+      betaError: 'The beta field of the API Token cannot be empty!',
       searching: 'searching...',
       parsing: 'Parsing',
       uploading: 'Uploading',
diff --git a/web/src/locales/ja.ts b/web/src/locales/ja.ts
index 9f55d1d8c2..0a0f63e655 100644
--- a/web/src/locales/ja.ts
+++ b/web/src/locales/ja.ts
@@ -33,6 +33,7 @@ export default {
       pleaseSelect: '選択してください',
       pleaseInput: '入力してください',
       submit: '送信',
+      japanese: '日本語',
     },
     login: {
       login: 'ログイン',
@@ -85,8 +86,7 @@ export default {
       name: '名前',
       namePlaceholder: '名前を入力してください',
       doc: 'ドキュメント',
-      datasetDescription:
-        '😉 パースが成功すると、質問と回答が可能になります。',
+      datasetDescription: '😉 パースが成功すると、質問と回答が可能になります。',
       addFile: 'ファイルを追加',
       searchFiles: 'ファイルを検索',
       localFiles: 'ローカルファイル',
@@ -157,8 +157,7 @@ export default {
       topK: 'トップK',
       topKTip: `Kチャンクがリランキングモデルに供給されます。`,
       delimiter: `区切り文字`,
-      delimiterTip:
-        '複数文字の区切り文字をサポートしています。',
+      delimiterTip: '複数文字の区切り文字をサポートしています。',
       html4excel: 'ExcelをHTMLに変換',
       html4excelTip: `有効にすると、スプレッドシートはHTMLテーブルとして解析されます。それ以外の場合、キーと値のペアとして解析されます。`,
       autoKeywords: '自動キーワード',
@@ -182,7 +181,7 @@ export default {
       embeddingModelTip:
         'チャンクを埋め込みに変換するモデルです。一度チャンクが作成されると変更できません。',
       permissionsTip:
-        "「チーム」に設定すると、全てのチームメンバーがナレッジベースを管理できます。",
+        '「チーム」に設定すると、全てのチームメンバーがナレッジベースを管理できます。',
       chunkTokenNumberTip:
         'チャンクのトークンしきい値を設定します。このしきい値を下回る段落は、次の段落と結合され、しきい値を超えた時点でチャンクが作成されます。',
       chunkMethod: 'チャンク方法',
@@ -201,8 +200,7 @@ export default {
       methodExamplesDescription:
         '以下のスクリーンショットは明確な説明のために提供されています。',
       dialogueExamplesTitle: '会話の例',
-      methodEmpty:
-        'ナレッジベースカテゴリの視覚的説明がここに表示されます',
+      methodEmpty: 'ナレッジベースカテゴリの視覚的説明がここに表示されます',
       book: `<p>対応ファイル形式は<b>DOCX</b>, <b>PDF</b>, <b>TXT</b>です。</p><p>
       PDF形式の書籍では、解析時間を短縮するため、<i>ページ範囲</i>を設定してください。</p>`,
       laws: `<p>対応ファイル形式は<b>DOCX</b>, <b>PDF</b>, <b>TXT</b>です。</p><p>
@@ -305,7 +303,7 @@ export default {
       entityTypes: 'エンティティタイプ',
       pageRank: 'ページランク',
       pageRankTip: `これは関連性スコアを高めるために使用されます。すべての取得されたチャンクの関連性スコアにこの数値が加算されます。
-特定のナレッジベースを最初に検索したい場合は、他のものよりも高いページランクスコアを設定してください。`
+特定のナレッジベースを最初に検索したい場合は、他のものよりも高いページランクスコアを設定してください。`,
     },
     chunk: {
       chunk: 'チャンク',
@@ -360,8 +358,7 @@ export default {
       {knowledge}
       上記がナレッジベースです。`,
       systemMessage: '入力してください！',
-      systemTip:
-        'LLMが質問に答える際に従う指示を設定します。',
+      systemTip: 'LLMが質問に答える際に従う指示を設定します。',
       topN: 'トップN',
       topNTip: `類似度スコアがしきい値を超えるチャンクのうち、上位N件のみがLLMに供給されます。`,
       variable: '変数',
@@ -406,7 +403,8 @@ export default {
       quote: '引用を表示',
       quoteTip: '元のテキストの出典を表示しますか？',
       selfRag: 'Self-RAG',
-      selfRagTip: '詳細は次を参照してください：https://huggingface.co/papers/2310.11511',
+      selfRagTip:
+        '詳細は次を参照してください：https://huggingface.co/papers/2310.11511',
       overview: 'チャットID',
       pv: 'メッセージ数',
       uv: 'アクティブユーザー数',
@@ -486,7 +484,7 @@ export default {
       newPassword: '新しいパスワード',
       newPasswordMessage: 'パスワードを入力してください！',
       newPasswordDescription:
-        '新しいパスワードは8文字以上でなければなりません。',    
+        '新しいパスワードは8文字以上でなければなりません。',
       confirmPassword: '新しいパスワードの確認',
       confirmPasswordMessage: 'パスワードを確認してください！',
       confirmPasswordNonMatchMessage:
@@ -568,7 +566,7 @@ export default {
       SparkModelNameMessage: 'Sparkモデルを選択してください',
       addSparkAPIPassword: 'Spark APIパスワード',
       SparkAPIPasswordMessage: 'APIパスワードを入力してください',
-      addSparkAPPID: 'Spark APPID',          
+      addSparkAPPID: 'Spark APPID',
       SparkAPPIDMessage: 'APPIDを入力してください',
       addSparkAPISecret: 'Spark APIシークレット',
       SparkAPISecretMessage: 'APIシークレットを入力してください',
@@ -579,8 +577,7 @@ export default {
       yiyanAKMessage: 'APIキーを入力してください',
       addyiyanSK: 'yiyanシークレットキー',
       yiyanSKMessage: 'シークレットキーを入力してください',
-      FishAudioModelNameMessage:
-        '音声合成モデルに名前を付けてください',
+      FishAudioModelNameMessage: '音声合成モデルに名前を付けてください',
       addFishAudioAK: 'Fish Audio APIキー',
       addFishAudioAKMessage: 'APIキーを入力してください',
       addFishAudioRefID: 'FishAudio参照ID',
@@ -700,7 +697,7 @@ export default {
       relevantDescription: `LLMを使用して、上流の出力がユーザーの最新のクエリに関連しているかどうかを評価するコンポーネント。各判定結果に対して次のコンポーネントを指定してください。`,
       rewriteQuestionDescription: `ナレッジベースから関連情報を取得できなかった場合にユーザーのクエリを修正するコンポーネント。定義されたループの上限に達するまでこのプロセスを繰り返します。上流が「Relevant」、下流が「Retrieval」であることを確認してください。`,
       messageDescription:
-        "静的メッセージを送信するコンポーネント。複数のメッセージが提供されている場合は、その中からランダムに1つを選択して送信します。下流がインターフェースコンポーネント「Answer」であることを確認してください。",
+        '静的メッセージを送信するコンポーネント。複数のメッセージが提供されている場合は、その中からランダムに1つを選択して送信します。下流がインターフェースコンポーネント「Answer」であることを確認してください。',
       keywordDescription: `ユーザーの入力からトップNの検索結果を取得するコンポーネント。使用前にTopNの値が適切に設定されていることを確認してください。`,
       switchDescription: `前のコンポーネントの出力に基づいて条件を評価し、それに応じて実行の流れを指示するコンポーネント。ケースを定義し、各ケースのアクションまたは条件が満たされない場合のデフォルトアクションを指定することで、複雑な分岐ロジックを可能にします。`,
       wikipediaDescription: `wikipedia.orgから検索を行うコンポーネントで、TopNを使用して検索結果の数を指定します。既存のナレッジベースを補完します。`,
@@ -800,7 +797,7 @@ export default {
         news: 'ニュースと情報',
         law: '法律と規制',
         contract: '契約',
-      },      
+      },
       baiduSourceLangOptions: {
         auto: '自動検出',
         zh: '中国語',
@@ -1089,4 +1086,4 @@ export default {
       chat: 'チャット',
     },
   },
-};
\ No newline at end of file
+};
diff --git a/web/src/locales/zh-traditional.ts b/web/src/locales/zh-traditional.ts
index 8c1bcf904a..807ec96b9c 100644
--- a/web/src/locales/zh-traditional.ts
+++ b/web/src/locales/zh-traditional.ts
@@ -414,6 +414,7 @@ export default {
       partialTitle: '部分嵌入',
       extensionTitle: 'Chrome 插件',
       tokenError: '請先創建 API Token!',
+      betaError: 'API Token的beta欄位不可以為空！',
       searching: '搜索中',
       parsing: '解析中',
       uploading: '上傳中',
diff --git a/web/src/locales/zh.ts b/web/src/locales/zh.ts
index 7c05488bc9..fb8ed55a9e 100644
--- a/web/src/locales/zh.ts
+++ b/web/src/locales/zh.ts
@@ -431,6 +431,7 @@ export default {
       partialTitle: '部分嵌入',
       extensionTitle: 'Chrome 插件',
       tokenError: '请先创建 API Token!',
+      betaError: 'API Token的beta字段不可以为空！',
       searching: '搜索中',
       parsing: '解析中',
       uploading: '上传中',
diff --git a/web/src/pages/chat/index.tsx b/web/src/pages/chat/index.tsx
index 03b132ae52..ffc1461f1e 100644
--- a/web/src/pages/chat/index.tsx
+++ b/web/src/pages/chat/index.tsx
@@ -29,18 +29,20 @@ import {
   useSelectDerivedConversationList,
 } from './hooks';
 
+import EmbedModal from '@/components/api-service/embed-modal';
+import { useShowEmbedModal } from '@/components/api-service/hooks';
 import SvgIcon from '@/components/svg-icon';
 import { useTheme } from '@/components/theme-provider';
+import { SharedFrom } from '@/constants/chat';
 import {
   useClickConversationCard,
   useClickDialogCard,
   useFetchNextDialogList,
   useGetChatSearchParams,
 } from '@/hooks/chat-hooks';
-import { useSetModalState, useTranslate } from '@/hooks/common-hooks';
+import { useTranslate } from '@/hooks/common-hooks';
 import { useSetSelectedRecord } from '@/hooks/logic-hooks';
 import { IDialog } from '@/interfaces/database/chat';
-import ChatIdModal from './chat-id-modal';
 import styles from './index.less';
 
 const { Text } = Typography;
@@ -82,13 +84,10 @@ const Chat = () => {
     showDialogEditModal,
   } = useEditDialog();
   const { t } = useTranslate('chat');
-  const {
-    visible: overviewVisible,
-    hideModal: hideOverviewModal,
-    showModal: showOverviewModal,
-  } = useSetModalState();
   const { currentRecord, setRecord } = useSetSelectedRecord<IDialog>();
   const [controller, setController] = useState(new AbortController());
+  const { showEmbedModal, hideEmbedModal, embedVisible, beta } =
+    useShowEmbedModal();
 
   const handleAppCardEnter = (id: string) => () => {
     handleItemEnter(id);
@@ -120,7 +119,7 @@ const Chat = () => {
       info?.domEvent?.preventDefault();
       info?.domEvent?.stopPropagation();
       setRecord(dialog);
-      showOverviewModal();
+      showEmbedModal();
     };
 
   const handleRemoveConversation =
@@ -193,7 +192,7 @@ const Chat = () => {
         label: (
           <Space>
             <KeyOutlined />
-            {t('overview')}
+            {t('publish', { keyPrefix: 'flow' })}
           </Space>
         ),
       },
@@ -374,14 +373,16 @@ const Chat = () => {
         initialName={initialConversationName}
         loading={conversationRenameLoading}
       ></RenameModal>
-      {overviewVisible && (
-        <ChatIdModal
-          visible={overviewVisible}
-          hideModal={hideOverviewModal}
-          id={currentRecord.id}
-          name={currentRecord.name}
-          idKey="dialogId"
-        ></ChatIdModal>
+
+      {embedVisible && (
+        <EmbedModal
+          visible={embedVisible}
+          hideModal={hideEmbedModal}
+          token={currentRecord.id}
+          form={SharedFrom.Chat}
+          beta={beta}
+          isAgent={false}
+        ></EmbedModal>
       )}
     </Flex>
   );
diff --git a/web/src/pages/chat/markdown-content/index.tsx b/web/src/pages/chat/markdown-content/index.tsx
index bf2b5dc01e..5e0d30c209 100644
--- a/web/src/pages/chat/markdown-content/index.tsx
+++ b/web/src/pages/chat/markdown-content/index.tsx
@@ -1,7 +1,6 @@
 import Image from '@/components/image';
 import SvgIcon from '@/components/svg-icon';
-import { IReference } from '@/interfaces/database/chat';
-import { IChunk } from '@/interfaces/database/knowledge';
+import { IReference, IReferenceChunk } from '@/interfaces/database/chat';
 import { getExtension } from '@/utils/document-util';
 import { InfoCircleOutlined } from '@ant-design/icons';
 import { Button, Flex, Popover, Space } from 'antd';
@@ -11,6 +10,7 @@ import Markdown from 'react-markdown';
 import reactStringReplace from 'react-string-replace';
 import SyntaxHighlighter from 'react-syntax-highlighter';
 import rehypeKatex from 'rehype-katex';
+import rehypeRaw from 'rehype-raw';
 import remarkGfm from 'remark-gfm';
 import remarkMath from 'remark-math';
 import { visitParents } from 'unist-util-visit-parents';
@@ -36,7 +36,7 @@ const MarkdownContent = ({
   content: string;
   loading: boolean;
   reference: IReference;
-  clickDocumentButton?: (documentId: string, chunk: IChunk) => void;
+  clickDocumentButton?: (documentId: string, chunk: IReferenceChunk) => void;
 }) => {
   const { t } = useTranslation();
   const { setDocumentIds, data: fileThumbnails } =
@@ -54,7 +54,7 @@ const MarkdownContent = ({
   }, [reference, setDocumentIds]);
 
   const handleDocumentButtonClick = useCallback(
-    (documentId: string, chunk: IChunk, isPdf: boolean) => () => {
+    (documentId: string, chunk: IReferenceChunk, isPdf: boolean) => () => {
       if (!isPdf) {
         return;
       }
@@ -85,15 +85,15 @@ const MarkdownContent = ({
       const chunks = reference?.chunks ?? [];
       const chunkItem = chunks[chunkIndex];
       const document = reference?.doc_aggs?.find(
-        (x) => x?.doc_id === chunkItem?.doc_id,
+        (x) => x?.doc_id === chunkItem?.document_id,
       );
       const documentId = document?.doc_id;
       const fileThumbnail = documentId ? fileThumbnails[documentId] : '';
       const fileExtension = documentId ? getExtension(document?.doc_name) : '';
-      const imageId = chunkItem?.img_id;
+      const imageId = chunkItem?.image_id;
       return (
         <Flex
-          key={chunkItem?.chunk_id}
+          key={chunkItem?.id}
           gap={10}
           className={styles.referencePopoverWrapper}
         >
@@ -116,7 +116,7 @@ const MarkdownContent = ({
           <Space direction={'vertical'}>
             <div
               dangerouslySetInnerHTML={{
-                __html: DOMPurify.sanitize(chunkItem?.content_with_weight),
+                __html: DOMPurify.sanitize(chunkItem?.content ?? ''),
               }}
               className={styles.chunkContentText}
             ></div>
@@ -176,7 +176,7 @@ const MarkdownContent = ({
 
   return (
     <Markdown
-      rehypePlugins={[rehypeWrapReference, rehypeKatex]}
+      rehypePlugins={[rehypeWrapReference, rehypeKatex, rehypeRaw]}
       remarkPlugins={[remarkGfm, remarkMath]}
       components={
         {
diff --git a/web/src/pages/chat/share/large.tsx b/web/src/pages/chat/share/large.tsx
index d941b54565..d63b56e23b 100644
--- a/web/src/pages/chat/share/large.tsx
+++ b/web/src/pages/chat/share/large.tsx
@@ -1,21 +1,23 @@
 import MessageInput from '@/components/message-input';
 import MessageItem from '@/components/message-item';
+import { useClickDrawer } from '@/components/pdf-drawer/hooks';
 import { MessageType, SharedFrom } from '@/constants/chat';
-import { useFetchNextSharedConversation } from '@/hooks/chat-hooks';
 import { useSendButtonDisabled } from '@/pages/chat/hooks';
 import { Flex, Spin } from 'antd';
 import { forwardRef } from 'react';
 import {
-  useCreateSharedConversationOnMount,
   useGetSharedChatSearchParams,
   useSendSharedMessage,
 } from '../shared-hooks';
 import { buildMessageItemReference } from '../utils';
+
+import PdfDrawer from '@/components/pdf-drawer';
 import styles from './index.less';
 
 const ChatContainer = () => {
-  const { conversationId } = useCreateSharedConversationOnMount();
-  const { data } = useFetchNextSharedConversation(conversationId);
+  const { from, sharedId: conversationId } = useGetSharedChatSearchParams();
+  const { visible, hideModal, documentId, selectedChunk, clickDocumentButton } =
+    useClickDrawer();
 
   const {
     handlePressEnter,
@@ -25,9 +27,13 @@ const ChatContainer = () => {
     loading,
     ref,
     derivedMessages,
-  } = useSendSharedMessage(conversationId);
+    hasError,
+  } = useSendSharedMessage();
   const sendDisabled = useSendButtonDisabled(value);
-  const { from } = useGetSharedChatSearchParams();
+
+  if (!conversationId) {
+    return <div>empty</div>;
+  }
 
   return (
     <>
@@ -44,7 +50,7 @@ const ChatContainer = () => {
                     reference={buildMessageItemReference(
                       {
                         message: derivedMessages,
-                        reference: data?.data?.reference,
+                        reference: [],
                       },
                       message,
                     )}
@@ -54,6 +60,7 @@ const ChatContainer = () => {
                       derivedMessages?.length - 1 === i
                     }
                     index={i}
+                    clickDocumentButton={clickDocumentButton}
                   ></MessageItem>
                 );
               })}
@@ -65,7 +72,7 @@ const ChatContainer = () => {
         <MessageInput
           isShared
           value={value}
-          disabled={false}
+          disabled={hasError}
           sendDisabled={sendDisabled}
           conversationId={conversationId}
           onInputChange={handleInputChange}
@@ -75,6 +82,14 @@ const ChatContainer = () => {
           showUploadIcon={from === SharedFrom.Chat}
         ></MessageInput>
       </Flex>
+      {visible && (
+        <PdfDrawer
+          visible={visible}
+          hideModal={hideModal}
+          documentId={documentId}
+          chunk={selectedChunk}
+        ></PdfDrawer>
+      )}
     </>
   );
 };
diff --git a/web/src/pages/chat/shared-hooks.ts b/web/src/pages/chat/shared-hooks.ts
index 8508746e58..99bab686b2 100644
--- a/web/src/pages/chat/shared-hooks.ts
+++ b/web/src/pages/chat/shared-hooks.ts
@@ -1,83 +1,41 @@
 import { MessageType, SharedFrom } from '@/constants/chat';
-import {
-  useCreateNextSharedConversation,
-  useFetchNextSharedConversation,
-} from '@/hooks/chat-hooks';
+import { useCreateNextSharedConversation } from '@/hooks/chat-hooks';
 import {
   useSelectDerivedMessages,
   useSendMessageWithSse,
 } from '@/hooks/logic-hooks';
 import { Message } from '@/interfaces/database/chat';
-import api from '@/utils/api';
+import { message } from 'antd';
+import { get } from 'lodash';
 import trim from 'lodash/trim';
 import { useCallback, useEffect, useState } from 'react';
 import { useSearchParams } from 'umi';
 import { v4 as uuid } from 'uuid';
 import { useHandleMessageInputChange } from './hooks';
 
-export const useCreateSharedConversationOnMount = () => {
-  const [currentQueryParameters] = useSearchParams();
-  const [conversationId, setConversationId] = useState('');
-
-  const { createSharedConversation: createConversation } =
-    useCreateNextSharedConversation();
-  const sharedId = currentQueryParameters.get('shared_id');
-  const userId = currentQueryParameters.get('user_id');
-
-  const setConversation = useCallback(async () => {
-    if (sharedId) {
-      const data = await createConversation(userId ?? undefined);
-      const id = data.data?.id;
-      if (id) {
-        setConversationId(id);
-      }
-    }
-  }, [createConversation, sharedId, userId]);
-
-  useEffect(() => {
-    setConversation();
-  }, [setConversation]);
+const isCompletionError = (res: any) => // non-200 status, missing response, or non-zero code
+  res && (res?.response?.status !== 200 || res?.data?.code !== 0);
 
-  return { conversationId };
+export const useSendButtonDisabled = (value: string) => {
+  return trim(value) === '';
 };
 
-export const useSelectNextSharedMessages = (conversationId: string) => {
-  const { data, loading } = useFetchNextSharedConversation(conversationId);
-
-  const {
-    derivedMessages,
-    ref,
-    setDerivedMessages,
-    addNewestAnswer,
-    addNewestQuestion,
-    removeLatestMessage,
-  } = useSelectDerivedMessages();
-
-  useEffect(() => {
-    setDerivedMessages(data?.data?.message);
-  }, [setDerivedMessages, data]);
+export const useGetSharedChatSearchParams = () => {
+  const [searchParams] = useSearchParams();
 
   return {
-    derivedMessages,
-    addNewestAnswer,
-    addNewestQuestion,
-    removeLatestMessage,
-    loading,
-    ref,
-    setDerivedMessages,
+    from: searchParams.get('from') as SharedFrom,
+    sharedId: searchParams.get('shared_id'),
   };
 };
 
-export const useSendButtonDisabled = (value: string) => {
-  return trim(value) === '';
-};
-
-export const useSendSharedMessage = (conversationId: string) => {
+export const useSendSharedMessage = () => {
+  const { from, sharedId: conversationId } = useGetSharedChatSearchParams();
   const { createSharedConversation: setConversation } =
     useCreateNextSharedConversation();
   const { handleInputChange, value, setValue } = useHandleMessageInputChange();
   const { send, answer, done } = useSendMessageWithSse(
-    api.completeExternalConversation,
+    `/api/v1/${from === SharedFrom.Agent ? 'agentbots' : 'chatbots'}/${conversationId}/completions`,
   );
   const {
     derivedMessages,
@@ -85,24 +43,25 @@ export const useSendSharedMessage = (conversationId: string) => {
     removeLatestMessage,
     addNewestAnswer,
     addNewestQuestion,
-    loading,
-  } = useSelectNextSharedMessages(conversationId);
+  } = useSelectDerivedMessages();
+  const [hasError, setHasError] = useState(false);
 
   const sendMessage = useCallback(
     async (message: Message, id?: string) => {
       const res = await send({
         conversation_id: id ?? conversationId,
-        quote: false,
-        messages: [...(derivedMessages ?? []), message],
+        quote: true,
+        question: message.content,
+        session_id: get(derivedMessages, '0.session_id'),
       });
 
-      if (res && (res?.response.status !== 200 || res?.data?.code !== 0)) {
+      if (isCompletionError(res)) {
         // cancel loading
         setValue(message.content);
         removeLatestMessage();
       }
     },
-    [conversationId, derivedMessages, removeLatestMessage, setValue, send],
+    [send, conversationId, derivedMessages, setValue, removeLatestMessage],
   );
 
   const handleSendMessage = useCallback(
@@ -120,6 +79,18 @@ export const useSendSharedMessage = (conversationId: string) => {
     [conversationId, setConversation, sendMessage],
   );
 
+  const fetchSessionId = useCallback(async () => {
+    const ret = await send({ question: '' }); // presumably opens a session — confirm with the API
+    if (isCompletionError(ret)) {
+      message.error(ret?.data?.message); // `data` may be absent; must not throw before setHasError
+      setHasError(true);
+    }
+  }, [send]);
+
+  useEffect(() => {
+    fetchSessionId();
+  }, [fetchSessionId, send]);
+
   useEffect(() => {
     if (answer.answer) {
       addNewestAnswer(answer);
@@ -154,16 +125,8 @@ export const useSendSharedMessage = (conversationId: string) => {
     value,
     sendLoading: !done,
     ref,
-    loading,
+    loading: false,
     derivedMessages,
-  };
-};
-
-export const useGetSharedChatSearchParams = () => {
-  const [searchParams] = useSearchParams();
-
-  return {
-    from: searchParams.get('from') as SharedFrom,
-    sharedId: searchParams.get('shared_id'),
+    hasError,
   };
 };
diff --git a/web/src/pages/flow/header/index.tsx b/web/src/pages/flow/header/index.tsx
index 6bf5aa9e37..5b5d47574b 100644
--- a/web/src/pages/flow/header/index.tsx
+++ b/web/src/pages/flow/header/index.tsx
@@ -1,13 +1,15 @@
-import ChatOverviewModal from '@/components/api-service/chat-overview-modal';
-import { useSetModalState, useTranslate } from '@/hooks/common-hooks';
+import EmbedModal from '@/components/api-service/embed-modal';
+import { useShowEmbedModal } from '@/components/api-service/hooks';
+import { SharedFrom } from '@/constants/chat';
+import { useTranslate } from '@/hooks/common-hooks';
 import { useFetchFlow } from '@/hooks/flow-hooks';
 import { ArrowLeftOutlined } from '@ant-design/icons';
 import { Button, Flex, Space } from 'antd';
 import { useCallback } from 'react';
 import { Link, useParams } from 'umi';
-import FlowIdModal from '../flow-id-modal';
 import {
   useGetBeginNodeDataQuery,
+  useGetBeginNodeDataQueryIsEmpty,
   useSaveGraph,
   useSaveGraphBeforeOpeningDebugDrawer,
   useWatchAgentChange,
@@ -25,15 +27,16 @@ const FlowHeader = ({ showChatDrawer, chatDrawerVisible }: IProps) => {
   const { handleRun } = useSaveGraphBeforeOpeningDebugDrawer(showChatDrawer);
   const { data } = useFetchFlow();
   const { t } = useTranslate('flow');
-  const {
-    visible: overviewVisible,
-    hideModal: hideOverviewModal,
-    // showModal: showOverviewModal,
-  } = useSetModalState();
-  const { visible, hideModal, showModal } = useSetModalState();
   const { id } = useParams();
   const time = useWatchAgentChange(chatDrawerVisible);
   const getBeginNodeDataQuery = useGetBeginNodeDataQuery();
+  const { showEmbedModal, hideEmbedModal, embedVisible, beta } =
+    useShowEmbedModal();
+  const isBeginNodeDataQueryEmpty = useGetBeginNodeDataQueryIsEmpty();
+
+  const handleShowEmbedModal = useCallback(() => {
+    showEmbedModal();
+  }, [showEmbedModal]);
 
   const handleRunAgent = useCallback(() => {
     const query: BeginQuery[] = getBeginNodeDataQuery();
@@ -70,23 +73,25 @@ const FlowHeader = ({ showChatDrawer, chatDrawerVisible }: IProps) => {
           <Button type="primary" onClick={() => saveGraph()}>
             <b>{t('save')}</b>
           </Button>
-          {/* <Button type="primary" onClick={showOverviewModal} disabled>
+          <Button
+            type="primary"
+            onClick={handleShowEmbedModal}
+            disabled={!isBeginNodeDataQueryEmpty}
+          >
             <b>{t('publish')}</b>
-          </Button> */}
-          <Button type="primary" onClick={showModal}>
-            <b>Agent ID</b>
           </Button>
         </Space>
       </Flex>
-      {overviewVisible && (
-        <ChatOverviewModal
-          visible={overviewVisible}
-          hideModal={hideOverviewModal}
-          id={id!}
-          idKey="canvasId"
-        ></ChatOverviewModal>
+      {embedVisible && (
+        <EmbedModal
+          visible={embedVisible}
+          hideModal={hideEmbedModal}
+          token={id!}
+          form={SharedFrom.Agent}
+          beta={beta}
+          isAgent
+        ></EmbedModal>
       )}
-      {visible && <FlowIdModal hideModal={hideModal}></FlowIdModal>}
     </>
   );
 };
diff --git a/web/src/pages/flow/hooks.tsx b/web/src/pages/flow/hooks.tsx
index a8f7df5c2f..21a238483f 100644
--- a/web/src/pages/flow/hooks.tsx
+++ b/web/src/pages/flow/hooks.tsx
@@ -474,6 +474,20 @@ export const useGetBeginNodeDataQuery = () => {
   return getBeginNodeDataQuery;
 };
 
+// Reports whether the list returned by useGetBeginNodeDataQuery is empty; re-checked when nodes change.
+export const useGetBeginNodeDataQueryIsEmpty = () => {
+  const [isEmpty, setIsEmpty] = useState(false); // stays false until the first effect run
+  const readBeginQuery = useGetBeginNodeDataQuery();
+  const graphNodes = useGraphStore((state) => state.nodes);
+
+  useEffect(() => {
+    const beginQuery: BeginQuery[] = readBeginQuery();
+    setIsEmpty(beginQuery.length === 0);
+  }, [readBeginQuery, graphNodes]);
+
+  return isEmpty;
+};
+
 export const useSaveGraphBeforeOpeningDebugDrawer = (show: () => void) => {
   const { saveGraph, loading } = useSaveGraph();
   const { resetFlow } = useResetFlow();
diff --git a/web/src/utils/authorization-util.ts b/web/src/utils/authorization-util.ts
index 60a4ad77c8..f920944630 100644
--- a/web/src/utils/authorization-util.ts
+++ b/web/src/utils/authorization-util.ts
@@ -47,9 +47,9 @@ const storage = {
 };
 
 export const getAuthorization = () => {
-  const sharedId = getSearchValue('shared_id');
-  const authorization = sharedId
-    ? 'Bearer ' + sharedId
+  const auth = getSearchValue('auth');
+  const authorization = auth
+    ? 'Bearer ' + auth
     : storage.getAuthorization() || '';
 
   return authorization;
diff --git a/web/src/utils/document-util.ts b/web/src/utils/document-util.ts
index 3b3f310002..16cc5eaa9c 100644
--- a/web/src/utils/document-util.ts
+++ b/web/src/utils/document-util.ts
@@ -1,10 +1,12 @@
 import { Images, SupportedPreviewDocumentTypes } from '@/constants/common';
+import { IReferenceChunk } from '@/interfaces/database/chat';
 import { IChunk } from '@/interfaces/database/knowledge';
 import { UploadFile } from 'antd';
+import { get } from 'lodash';
 import { v4 as uuid } from 'uuid';
 
 export const buildChunkHighlights = (
-  selectedChunk: IChunk,
+  selectedChunk: IChunk | IReferenceChunk,
   size: { width: number; height: number },
 ) => {
   return Array.isArray(selectedChunk?.positions) &&
@@ -24,7 +26,11 @@ export const buildChunkHighlights = (
             text: '',
             emoji: '',
           },
-          content: { text: selectedChunk.content_with_weight },
+          content: {
+            text:
+              get(selectedChunk, 'content_with_weight') ||
+              get(selectedChunk, 'content', ''),
+          },
           position: {
             boundingRect: boundingRect,
             rects: [boundingRect],