Merge pull request #676 from GraphScope/0113

feat: Add Report component
GraphScope · Jan 20, 2025 · 3eef544 · 3eef544
2 parents 2947402 + 9f127d4
commit 3eef544
Show file tree

Hide file tree

Showing 14 changed files with 1,567 additions and 36 deletions.
diff --git a/packages/studio-explore/package.json b/packages/studio-explore/package.json
@@ -25,6 +25,7 @@
     "registry": "https://registry.npmjs.org/"
   },
   "dependencies": {
+    "react-markdown": "^9.0.3",
     "@antv/g2": "^5.2.8",
     "@graphscope/studio-components": "workspace:*",
     "@graphscope/studio-driver": "workspace:*",

diff --git a/packages/studio-explore/src/app.tsx b/packages/studio-explore/src/app.tsx
@@ -46,6 +46,7 @@ import {
   Copilot,
   RunAI,
   FloatToolbar,
+  Report,
 } from './components';
 import {
   BgColorsOutlined,
@@ -169,11 +170,12 @@ const Explore: React.FunctionComponent<ExploreProps> = props => {
                   key: 'CypherQuery',
                 },
                 {
-                  label: <Typography.Title level={3}>Copilot</Typography.Title>,
+                  label: <Typography.Title level={3}>Report</Typography.Title>,
                   icon: <OpenAIOutlined />,
-                  children: <Copilot />,
-                  key: 'Copilot',
+                  children: <Report />,
+                  key: 'Report',
                 },
+
                 {
                   label: <Typography.Title level={3}>Style Setting</Typography.Title>,
                   icon: <BgColorsOutlined />,

diff --git a/packages/studio-explore/src/components/Copilot/RunAI/index.tsx b/packages/studio-explore/src/components/Copilot/RunAI/index.tsx
@@ -10,7 +10,7 @@ const RunAI: React.FunctionComponent<INeighborQueryProps> = props => {
   const { selectNodes } = store;
 
+  // Click handler: pretty-prints the selected nodes as JSON inside a plain statement and
+  // passes that text to the global `window.runAI` hook. The task instruction that used to
+  // be hard-coded here is no longer part of the text.
+  // NOTE(review): `window.runAI` is not declared in this excerpt — presumably registered
+  // elsewhere; confirm it exists before this handler can fire.
   const handleClick = () => {
-    const scripts = `write a related work section about the given data, you should focus on challenges only : ${JSON.stringify(selectNodes, null, 2)}`;
+    const scripts = `I have selected those data: ${JSON.stringify(selectNodes, null, 2)}`;
     //@ts-ignore
     window.runAI(scripts);
   };

diff --git a/packages/studio-explore/src/components/Copilot/index.tsx b/packages/studio-explore/src/components/Copilot/index.tsx
@@ -1,7 +1,13 @@
 import React, { useEffect, useRef, useState } from 'react';
 import { Message } from './utils/message';
 
-import { getWelcomeMessage, defaultWelcome } from './utils/prompt';
+import {
+  getWelcomeMessage,
+  defaultWelcome,
+  TEMPLATE_QUERY_GENERATOR,
+  get_query_system_prompts,
+  get_report_system_prompts,
+} from './utils/prompt';
 import { Input, Button, Flex, Typography, Space, Skeleton, theme } from 'antd';
 import { useController } from './useController';
 import { useContext } from '@graphscope/studio-graph';
@@ -16,16 +22,15 @@ interface IGPTStatementsProps {}
 
 const { useToken } = theme;
 const GPTStatements: React.FunctionComponent<IGPTStatementsProps> = props => {
-  const [state, updateState] = useState<{ messages: Message[]; isLoading: boolean; OPENAI_KEY_FOR_GS: string | null }>({
+  const [state, updateState] = useState<{ messages: Message[]; isLoading: boolean }>({
     messages: [],
     isLoading: false,
-    OPENAI_KEY_FOR_GS: localStorage.getItem('OPENAI_KEY_FOR_GS'),
   });
-  const { messages, isLoading, OPENAI_KEY_FOR_GS } = state;
+  const { messages, isLoading } = state;
   const InputRef = useRef(null);
   const { token } = useToken();
   const { store } = useContext();
-  const { schema } = store;
+  const { schema, selectNodes } = store;
 
   const controller = useController();
   const { updateStore } = useContext();
@@ -46,15 +51,6 @@ const GPTStatements: React.FunctionComponent<IGPTStatementsProps> = props => {
     id: 'query.copilot.welcome',
   });
 
-  useEffect(() => {
-    updateState(pre => {
-      return {
-        ...pre,
-        messages: [...getWelcomeMessage(welcome)],
-      };
-    });
-  }, []);
-
   const handleSubmit = async (script?: string) => {
     if (InputRef.current) {
       //@ts-ignore
@@ -72,7 +68,7 @@ const GPTStatements: React.FunctionComponent<IGPTStatementsProps> = props => {
         };
       });
 
-      const response = await query([...messages, message], OPENAI_KEY_FOR_GS!, controller.signal);
+      const response = await query([...messages, message], controller.signal);
       if (!response) {
         updateState(preState => {
           return {
@@ -120,11 +116,68 @@ const GPTStatements: React.FunctionComponent<IGPTStatementsProps> = props => {
     });
   };
 
-  const handleSave = value => {
-    updateState(pre => {
+  // Placeholder with an empty body; nothing in this excerpt calls it.
+  const queryMindmap = () => {};
+  /**
+   * Resets the conversation to the opening messages for the selected role.
+   *
+   * - 'query': system prompt built by get_query_system_prompts from the schema,
+   *   followed by the `welcome` text as an assistant message.
+   * - 'analysis': system prompt built by get_report_system_prompts from the schema,
+   *   followed by an analysis-assistant greeting.
+   * - any other value (e.g. 'chat'): a generic Copilot greeting, no system prompt.
+   *
+   * Each role-specific branch returns early. State updaters are applied in the
+   * order they are queued, so falling through to the generic reset below would
+   * replace the role-specific messages (including the system prompt).
+   *
+   * @param task Role key chosen by the user.
+   */
+  const queryTask = task => {
+    if (task === 'query') {
+      updateState(preState => {
+        return {
+          ...preState,
+          messages: [
+            new Message({
+              role: 'system',
+              status: 'success',
+              timestamp: Date.now(),
+              reserved: true,
+              content: get_query_system_prompts(JSON.stringify(schema, null, 2)),
+            }),
+            new Message({
+              status: 'success',
+              role: 'assistant',
+              content: welcome,
+              timestamp: Date.now(),
+              reserved: true,
+            }),
+          ],
+        };
+      });
+      return;
+    }
+    if (task === 'analysis') {
+      updateState(preState => {
+        return {
+          ...preState,
+          messages: [
+            new Message({
+              role: 'system',
+              status: 'success',
+              timestamp: Date.now(),
+              reserved: true,
+              content: get_report_system_prompts(JSON.stringify(schema, null, 2)),
+            }),
+            new Message({
+              status: 'success',
+              role: 'assistant',
+              content: '您好！我是 GraphScope 分析助理，您可以先选中要分析的数据，方便我为你分析',
+              timestamp: Date.now(),
+              reserved: true,
+            }),
+          ],
+        };
+      });
+      return;
+    }
+    // Fallback for 'chat' and any unrecognized task.
+    updateState(preState => {
       return {
-        ...pre,
-        OPENAI_KEY_FOR_GS: value,
+        ...preState,
+        messages: [
+          new Message({
+            status: 'success',
+            role: 'assistant',
+            content: '您好！我是 GraphScope Copilot,有什么可以帮到你的',
+            timestamp: Date.now(),
+            reserved: true,
+          }),
+        ],
       };
     });
   };
@@ -136,9 +189,36 @@ const GPTStatements: React.FunctionComponent<IGPTStatementsProps> = props => {
           <Typography.Text type="secondary" italic>
             Think like a bot
           </Typography.Text>
-          <Setting onChange={handleSave} />
+          <Setting />
         </Flex>
         <Flex vertical gap={12} style={{ overflowY: 'scroll', height: 'calc(100vh - 170px)' }}>
+          <Typography.Text type="secondary" italic>
+            select role
+          </Typography.Text>
+          <Space>
+            <Button
+              onClick={() => {
+                queryTask('query');
+              }}
+            >
+              Query
+            </Button>
+            <Button
+              onClick={() => {
+                queryTask('analysis');
+              }}
+            >
+              Mindmap
+            </Button>
+            <Button
+              onClick={() => {
+                queryTask('chat');
+              }}
+            >
+              Analysis
+            </Button>
+          </Space>
+
           {messages
             .filter(m => m.role !== 'system')
             .map(item => {

diff --git a/packages/studio-explore/src/components/Copilot/query.tsx b/packages/studio-explore/src/components/Copilot/query.tsx
@@ -16,14 +16,14 @@ export const models = [
 
 export function query(
   messages: Message[],
-  apiKey: string,
   signal?: AbortSignal,
 ): Promise<{
   status: 'success' | 'cancel' | 'failed';
   message: any;
 }> {
   const model = localStorage.getItem('AI_MODEL_FOR_GS') || models[0].name;
   const { endpoint, name } = models.find(m => m.name === model) || models[0];
+  const apiKey = localStorage.getItem('OPENAI_KEY_FOR_GS');
   return fetch(endpoint, {
     signal,
     method: 'POST',

diff --git a/packages/studio-explore/src/components/Copilot/setting.tsx b/packages/studio-explore/src/components/Copilot/setting.tsx
@@ -5,12 +5,11 @@ import { FormattedMessage, useIntl } from 'react-intl';
 import { Utils } from '@graphscope/studio-components';
 import { models } from './query';
+/** Props of the Setting component; with `onChange` removed, only an optional inline style remains. */
 interface ISettingProps {
-  onChange: (value: string) => void;
   style?: React.CSSProperties;
 }
 
 const Setting: React.FunctionComponent<ISettingProps> = props => {
-  const { onChange, style } = props;
+  const { style } = props;
   const [isModalOpen, setIsModalOpen] = useState(() => {
     const match = Utils.getSearchParams('tab') === 'copilot';
     return !localStorage.getItem('OPENAI_KEY_FOR_GS') && match;
@@ -28,7 +27,6 @@ const Setting: React.FunctionComponent<ISettingProps> = props => {
       const { value } = InputRef.current.input;
       const val = String(value).trim();
       localStorage.setItem('OPENAI_KEY_FOR_GS', val);
-      onChange && onChange(val);
     }
     setIsModalOpen(false);
   };

diff --git a/packages/studio-explore/src/components/Copilot/utils/prompt.ts b/packages/studio-explore/src/components/Copilot/utils/prompt.ts
@@ -1,34 +1,106 @@
 import { Message } from './message';
 type GraphSchemaData = any;
 
+/**
+ * Builds the system prompt for the Cypher query assistant role.
+ *
+ * The prompt text (in Chinese) instructs the model to turn natural-language questions
+ * into Cypher using only fields that exist in the schema, to pick the single most
+ * accurate statement without showing its reasoning, to use "MATCH (a)-[b]-(c) RETURN a,b,c"
+ * instead of "MATCH p=()-[]-() RETURN p", and to answer in markdown cypher format.
+ * The two emphasis sentences each appear three times in the prompt text.
+ *
+ * @param graphSchema Schema text interpolated verbatim into the prompt.
+ * @returns The complete prompt string.
+ */
+export const get_query_system_prompts = graphSchema => `
+你的角色是一个 Cypher 查询助手，你可以根据用户的自然语言提问，再结合图数据库的 Schema 结构，给生成标准的 Cypher 查询语句。
+为了查询的准确性，请务必充分理解 Schema，并使用 Schema 中明确的字段，不要自己随意生成字段！
+为了查询的准确性，请务必充分理解 Schema，并使用 Schema 中明确的字段，不要自己随意生成字段！
+为了查询的准确性，请务必充分理解 Schema，并使用 Schema 中明确的字段，不要自己随意生成字段！
+
+你不要着急马上给出答案，你可以多生成几个语句，然后找出一个你觉得最准确的语句告诉我，推理的过程可以不用告诉我，我只需要最准确的那一个。
+你不要着急马上给出答案，你可以多生成几个语句，然后找出一个你觉得最准确的语句告诉我，推理的过程可以不用告诉我，我只需要最准确的那一个。
+你不要着急马上给出答案，你可以多生成几个语句，然后找出一个你觉得最准确的语句告诉我，推理的过程可以不用告诉我，我只需要最准确的那一个。
+
+其他注意事项:
+不支持 "MATCH p=()-[]-() RETURN p" 的写法，请都替换成 "MATCH (a)-[b]-(c) RETURN a,b,c"
+注意返回格式需要 markdown cypher 格式
+
+下面是数据库中的 Schema：
+${graphSchema}
+让我们开始吧～
+`;
+/**
+ * Builds the system prompt for the graph analysis report assistant role.
+ *
+ * The prompt text (in Chinese) embeds the graph data model, tells the model to ask the
+ * user for the full data of the current canvas, and to produce a mind map from that
+ * subgraph. Clustering results may be appended to node properties, and only key
+ * information needs to be returned because the caller merges the data locally.
+ *
+ * @param graphSchema Graph model text interpolated verbatim into the prompt.
+ * @returns The complete prompt string.
+ */
+export const get_report_system_prompts = graphSchema => `
+你的角色是一个图分析报告的生成助手，首先，你要理解用户的图数据模型，模型如下：
+${graphSchema}
+其次，你要提醒用户给你当前图画布的完整数据信息，根据这个子图数据，你需要生成一份思维导图，在生成思维导图的过程中，你可能需要对图上的数据做聚类，聚类的信息可以追加到原有节点的属性中，返回的数据，只用携带关键信息即可，我可以在本地merge数据
+让我们开始吧～
+`;
+
+// reference:https://github.com/GraphScope/portal/blob/llm_analysis/python/graphy/prompts/graph_analyze_prompts.py
+// Cypher writing guidance appended to the query-generation prompt:
+// (1) once a property is aliased with AS, later clauses (notably ORDER BY) must use the alias;
+// (2) every node label, edge label and edge direction in MATCH must exist in the schema.
 const CYPHER_QUERY_EXAMPLE = `
 
-Query Example:
-Positive Example:
+Here are some specific syntax requirements of cypher to keep in mind when writing Cypher queries:
+
+Requirement (1): In Cypher queries, if you rename a property (such as 'T.a') using the 'AS' keyword (e.g., 'T.a AS b'), you must use 'b' in all subsequent parts of the query instead of 'T.a'. Especially for the content following 'ORDER BY', such as 'ORDER BY T.a, T.b', if 'T.a' or 'T.b' have been renamed using the 'AS' keyword earlier in the query, you must use their new names no matter how DESC and ASC are used.
+
+Example of a correct query:
+
 MATCH (p:Paper)-[r:Paper_Has_Challenge]->(c:Challenge)
 OPTIONAL MATCH (p)-[:Paper_Has_Solution]->(s:Solution)
 RETURN p.title AS paper_title, c.name AS challenge_name, s.name AS solution_name, c.description AS challenge_description, s.description AS solution_description
-ORDER BY challenge_name ASC
+ORDER BY challenge_name ASC;
+In this example, 'c.name AS challenge_name' is correctly followed by 'ORDER BY challenge_name ASC'.
+
+Example of an incorrect query:
 
-Negatve Example:
 MATCH (p:Paper)-[r:Paper_Has_Challenge]->(c:Challenge)
 OPTIONAL MATCH (p)-[:Paper_Has_Solution]->(s:Solution)
 RETURN p.title AS paper_title, c.name AS challenge_name, s.name AS solution_name, c.description AS challenge_description, s.description AS solution_description
-ORDER BY c.name ASC
+ORDER BY c.name ASC;
+In this case, 'c.name AS challenge_name' should be followed by 'ORDER BY challenge_name ASC', but instead, it incorrectly uses 'ORDER BY c.name ASC'.
+
+Requirement (2): Ensure that every edge and vertex in the MATCH pattern adheres to the schema rules:
+
+For an edge like (x:xlabel)-[e:elabel]->(y:ylabel):
+
+It is valid if the schema contains an edge with:
+A label or type name matching 'elabel'.
+Source vertex label 'xlabel' and destination vertex label 'ylabel'.
+If these conditions are not met, the edge definition is invalid.
+For a node like (x:xlabel):
+
+It is valid if the schema includes a vertex with:
+A label or type name matching 'xlabel'.
+If this condition is not met, the node definition is invalid.
+
+Consider a schema with two node types: 'Person' and 'Message'. There is also an edge labeled 'Likes', where the edge starts from a 'Person' node (source) and ends at a 'Message' node (destination), then:
+Positive Example:
+MATCH (p:Person)-[l:Likes]->(m:Message)
+RETURN p.name;
+
+Negative Example 1:
+MATCH (p:Person)<-[l:Likes]-(m:Message)
+RETURN p.name;
+
+
+Negative Example 2 (as vertex with label 'Comment' is not defined in the schema):
+MATCH (p:Person)<-[l:Likes]-(c:Comment)
+RETURN p.name;
+
 
 `;
 
+/**
+ * Builds the system prompt for the query-generation assistant.
+ *
+ * The user's question is no longer part of this template, so it has to reach the
+ * model separately (presumably as a user message — confirm with callers). The
+ * query language is spelled out as Cypher: a `{language}` placeholder inside a
+ * template literal is never substituted and would be sent to the model verbatim.
+ *
+ * @param schema Schema text interpolated verbatim into the prompt.
+ * @returns The prompt string, ending with the shared CYPHER_QUERY_EXAMPLE guidance.
+ */
-const TEMPLATE_QUERY_GENERATOR = (user_query, schema) => `
+export const TEMPLATE_QUERY_GENERATOR = schema => `
-You are a highly skilled AI graph database expert. Given the user queries and the schema of a graph database, your role is to identify which information in the database is necessary to meet the user's requirements and provide the corresponding database query following the {language} syntax.
+You are a highly skilled AI graph database expert. Given the user queries and the schema of a graph database, your role is to identify which information in the database is necessary to meet the user's requirements and provide the corresponding database query following the Cypher syntax.
 The next step involves conducting specific analyses with the queried data, such as sorting, classifying, and describing the data. Therefore, when selecting attributes, it is important to analyze the intent of the user's query, clarify the purpose of the data query, and then determine the attributes that may be needed.
 Before crafting query statements, thoroughly analyze the schema provided by the user to identify valid labels for nodes and edges. Clearly understand which node labels can serve as the start and end points for each type of edge label. This ensures that you construct executable query statements.
 Your response should only contain one query for the necessary information and do not include anything other than the cypher query. Do not start with \`\`\`.
-
-User Query: ${user_query}
 Schema: ${schema}
 ${CYPHER_QUERY_EXAMPLE}
 `;
 
+/**
+ * Builds a prompt asking the model to group a set of papers into named, described
+ * categories, each keeping the IDs and titles of the papers assigned to it.
+ * The guidance in the prompt asks for distinct dimensions, one category per paper
+ * where possible, and generally 2-4 categories.
+ *
+ * Not exported, and no use of it is visible in this excerpt.
+ *
+ * @param user_query Text interpolated after "User Query:".
+ * @param paper_slot Text interpolated after "Papers:".
+ * @returns The complete prompt string.
+ */
+const TEMPLATE_MIND_MAP_GENERATOR = (user_query, paper_slot) => `
+You are a highly skilled academic AI assistant. Given a user query and a set of papers with their properties, your role is to categorize the given papers based on the user's goals and the provided data by selecting specific dimensions. Each category should have a name and a corresponding description. For each category, maintain a list of paper IDs and paper titles that belong to that category.
+
+User Query: ${user_query}
+Papers: ${paper_slot}
+
+Guidance:
+- When selecting dimensions for categorization, you should choose those that are as distinct and important as possible.
+- When categorizing, try not to have a single paper belong to more than one category.
+- The number of categories is not necessarily the more the better; generally, dividing into 2-4 categories is preferable.
+`;
+
+/** Default welcome text (in Chinese) introducing the GraphScope query assistant for Cypher questions. */
 export const defaultWelcome = `您好！我是 GraphScope 查询助理，您有任何关于 Cypher 查询的问题都可以随时问我`;
 /**
  * 转换图的数据信息为自然语言