From e89e830c555e594f8a5a5c2d50dfb6c38ea6ffcc Mon Sep 17 00:00:00 2001 From: =?UTF-8?q?=E5=88=98=20=E6=96=B9=E7=91=9E?= Date: Mon, 13 Nov 2023 15:22:42 +0800 Subject: [PATCH] Free knowledge base pod information update (#12813) We updated the MyScale free knowledge base, where you can try your RAG with 36 million paragraphs from Wikipedia and 2 million paragraphs from ArXiv. The pod has two tables: ```sql CREATE TABLE default.ChatArXiv ( `abstract` String, `id` String, `vector` Array(Float32), `metadata` Object('JSON'), `pubdate` DateTime, `title` String, `categories` Array(String), `authors` Array(String), `comment` String, `primary_category` String, VECTOR INDEX vec_idx vector TYPE MSTG('metric_type=Cosine'), CONSTRAINT vec_len CHECK length(vector) = 768) ENGINE = ReplacingMergeTree ORDER BY id; CREATE TABLE wiki.Wikipedia ( `id` String, `title` String, `text` String, `url` String, `wiki_id` UInt64, `views` Float32, `paragraph_id` UInt64, `langs` UInt32, `emb` Array(Float32), VECTOR INDEX emb_idx emb TYPE MSTG('metric_type=Cosine'), CONSTRAINT emb_len CHECK length(emb) = 768) ENGINE = ReplacingMergeTree ORDER BY id; ``` You can connect to these two tables using the credentials below (the same as the old ones): URL: `msc-4a9e710a.us-east-1.aws.staging.myscale.cloud` Port: `443` Username: `chatdata` Password: `myscale_rocks` It's FREE, and you can also use it with ChatData: https://github.com/myscale/ChatData Retrieval-QA-Benchmark: https://github.com/myscale/Retrieval-QA-Benchmark ... and also LangChain! Request for review @baskaryan