-
Notifications
You must be signed in to change notification settings - Fork 24
Commit
This commit does not belong to any branch on this repository, and may belong to a fork outside of the repository.
- Loading branch information
Showing
1 changed file
with
194 additions
and
0 deletions.
There are no files selected for viewing
This file contains bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters
Original file line number | Diff line number | Diff line change |
---|---|---|
@@ -0,0 +1,194 @@ | ||
-- Resize the `hash` column of llamaindex_document_node.
-- CHAR columns are limited to 255 characters in MySQL-compatible engines, so the
-- 256-character width is declared as VARCHAR, the same type the chunk-node table
-- in this script uses for its own `hash` column.
ALTER TABLE llamaindex_document_node
    MODIFY COLUMN hash VARCHAR(256) NOT NULL;

-- Rebuild the default chunk-node table from scratch; any existing rows are discarded.
-- IF EXISTS keeps the script runnable on a database where the table was never created.
DROP TABLE IF EXISTS llamaindex_document_chunk_node_default;
CREATE TABLE llamaindex_document_chunk_node_default
(
    id          BINARY(16)   NOT NULL,
    hash        VARCHAR(256) NOT NULL,
    text        TEXT         NOT NULL,
    metadata    JSON         NOT NULL,
    -- 1536 matches the "dimensions" value of the default index's embedding config
    -- inserted by this script.
    -- NOTE(review): the column COMMENT presumably acts as a vector-index hint
    -- (HNSW, cosine distance) for the engine - confirm against the TiDB vector docs.
    embedding   VECTOR< FLOAT >(1536) NULL COMMENT 'hnsw(distance=cosine)',
    index_id    INT          NOT NULL,
    document_id INT          NOT NULL,
    PRIMARY KEY (id),
    KEY idx_ldcn_on_index_id_document_id (index_id, document_id),
    FOREIGN KEY fk_ldcn_on_index_id (index_id) REFERENCES `index` (id),
    FOREIGN KEY fk_ldcn_on_document_id (document_id) REFERENCES `document` (id)
);

--
-- Default Index Config
--

-- Remove any existing index row with id 1 so the INSERT that follows can recreate it.
DELETE
FROM `index`
WHERE id = 1;

-- Create the 'default' index (id 1) with its JSON configuration:
-- llamaindex provider, OpenAI LLM and embedding settings, text-splitter chunk size,
-- and HTML content-extraction selectors for URLs matching www.grab.com/**.
-- The doubled backslashes (\\") reach the JSON parser as \" after SQL string unescaping.
INSERT INTO `index` (id, name, config)
VALUES (1, 'default', '{
  "provider": "llamaindex",
  "llm": {
    "provider": "openai",
    "options": {
      "model": "gpt-4o"
    }
  },
  "embedding": {
    "provider": "openai",
    "options": {
      "model": "text-embedding-3-small",
      "vectorColumn": "embedding",
      "dimensions": 1536
    }
  },
  "metadata_extractors": [],
  "parser": {
    "textSplitter": {
      "chunkSize": 512
    }
  },
  "reader": {
    "rag.loader.html": {
      "contentExtraction": [
        {
          "selectors": [
            {
              "selector": "main"
            },
            {
              "selector": ".gr-g-wrapper"
            },
            {
              "selector": "[data-elementor-type=\\"wp-post\\"]"
            }
          ],
          "excludeSelectors": [
          ],
          "url": "www.grab.com/**"
        }
      ]
    }
  }
}');

--
-- Default Chat Engine Config
--

-- Seed the 'default' chat engine, flagged as the default one, with empty options.
-- The options are filled in by the UPDATE ... JSON_MERGE_PATCH statement in this script.
INSERT INTO chat_engine (name, engine, engine_options, is_default)
VALUES ('default', 'condense-question', '{}', TRUE);

-- Merge the default settings into the 'default' chat engine's options.
-- JSON_MERGE_PATCH overwrites the listed keys and leaves any other existing keys in place.
-- Inside the literal, \\n reaches the JSON parser as \n (a newline in the prompt text),
-- and '' is an escaped single quote.
UPDATE `chat_engine`
SET engine_options = JSON_MERGE_PATCH(engine_options, '{
  "index_id": 1,
  "llm": {
    "provider": "openai",
    "options": {
      "model": "gpt-3.5-turbo"
    }
  },
  "prompts": {
    "condenseQuestion": "Given a conversation (between Human and Assistant) and a follow up message from Human, rewrite the message to be a standalone question that captures all relevant context from the conversation.\\n\\n<Chat History>\\n{{chatHistory}}\\n\\n<Follow Up Message>\\n{{question}}\\n\\n<Standalone question>\\n",
    "refine": "The original query is as follows: {{query}}\\nWe have provided an existing answer: {{existingAnswer}}\\nWe have the opportunity to refine the existing answer (only if needed) with some more context below.\\n------------\\n{{context}}\\n------------\\nGiven the new context, refine the original answer to better answer the query. If the context isn''t useful, return the original answer.\\nRefined Answer:",
    "textQa": "Context information is below.\\n---------------------\\n{{context}}\\n---------------------\\nGiven the context information and not prior knowledge, answer the query.\\nQuery: {{query}}\\nAnswer:"
  },
  "reranker": {},
  "retriever": {
    "search_top_k": 25,
    "top_k": 7
  }
}')
WHERE name = 'default';

--
-- Default Website Settings
--

-- Website Setting: General
-- Each row's last value is a JSON-encoded string, hence the inner double quotes.
-- NOTE(review): this INSERT is positional (no column list), so it depends on the
-- column order of `option`, which is not visible here - presumably
-- (name, group, type, value); confirm and add an explicit column list.
INSERT INTO `option`
VALUES ('title', 'website', 'string', '"Grab"'),
       ('description', 'website', 'string', '"Hello Grab!"'),
       ('logo_in_dark_mode', 'website', 'string', '"https://tidb.ai/tidb-ai-light.svg"'),
       ('logo_in_light_mode', 'website', 'string', '"https://tidb.ai/tidb-ai.svg"'),
       ('language', 'website', 'string', '"en-US"');

-- Website Setting: Homepage
-- Seeds the homepage title, description, example questions, and footer links.
-- 'array' rows carry a JSON array; 'string' rows carry a JSON-encoded string.
-- NOTE(review): positional INSERT - depends on the column order of `option`,
-- which is not visible here; confirm and add an explicit column list.
INSERT INTO `option`
VALUES ('homepage.title', 'website', 'string', '"Ask anything about Grab"'),
       ('homepage.description', 'website', 'string',
        '"Including company intro, user cases, product intro and usage, FAQ, etc."'),
       ('homepage.example_questions', 'website', 'array', '[
  {
    "text": "What is Grab?"
  },
  {
    "text": "Who use Grab?"
  }
]'),
       ('homepage.footer_links', 'website', 'array', '[
  {
    "text": "Docs",
    "href": "/docs"
  },
  {
    "text": "Deploy your own within 5 minutes for free",
    "href": "/docs"
  },
  {
    "text": "How it works?",
    "href": "/docs"
  },
  {
    "text": "Powered by TiDB",
    "href": "https://tidb.cloud"
  },
  {
    "text": "© 2024 PingCAP",
    "href": "https://pingcap.com"
  }
]');

-- Custom JS Setting
-- Seeds the 'custom_js' option group: button label and images, example questions,
-- and the widget's title, input placeholder, and color mode.
-- NOTE(review): positional INSERT - depends on the column order of `option`,
-- which is not visible here; confirm and add an explicit column list.
INSERT INTO `option`
VALUES ('button_label', 'custom_js', 'string', '"Ask AI"'),
       ('button_img_src', 'custom_js', 'string', '"https://tidb.ai/tidb-ai.svg"'),
       ('logo_src', 'custom_js', 'string', '"https://tidb.ai/tidb-ai.svg"'),
       ('example_questions', 'custom_js', 'array', '[
  {
    "text": "What is Grab?"
  },
  {
    "text": "Who use Grab?"
  }
]'),
       ('widget_title', 'custom_js', 'string', '"Conversation Search Box"'),
       ('widget_input_placeholder', 'custom_js', 'string', '"Ask a question..."'),
       ('widget_color_mode', 'custom_js', 'string', '"system"');

-- Create the 'graph' index (id 3), backed by the knowledge-graph provider, with
-- HTML content-extraction selectors for its reader.
-- NOTE(review): the url pattern here is "tidb.net/blog/**" while the selectors are the
-- same ones the default index (id 1) applies to "www.grab.com/**" - confirm this
-- pattern is intended and not a copy-paste leftover.
-- NOTE(review): unlike index 1, no DELETE precedes this INSERT, so re-running the
-- script presumably fails on a duplicate id - verify against the `index` table's keys.
INSERT INTO `index` (id, name, config)
VALUES (3, 'graph', '{
  "provider": "knowledge-graph",
  "reader": {
    "rag.loader.html": {
      "contentExtraction": [
        {
          "excludeSelectors": [
          ],
          "selectors": [
            {
              "selector": "main"
            },
            {
              "selector": ".gr-g-wrapper"
            },
            {
              "selector": "[data-elementor-type=\\"wp-post\\"]"
            }
          ],
          "url": "tidb.net/blog/**"
        }
      ],
      "metadataExtraction": []
    }
  }
}');