Files
DB-GPT/examples/gpt_index.py
2023-06-18 19:39:10 +03:00

20 lines
524 B
Python

#!/usr/bin/env python3
# -*- coding: utf-8 -*-
import logging
import sys
from llama_index import GPTVectorStoreIndex, SimpleDirectoryReader
# Route INFO-level log records to stdout so index construction is visible.
# basicConfig() already installs a stdout handler on the root logger; adding
# a second StreamHandler on top of it would print every record twice.
logging.basicConfig(stream=sys.stdout, level=logging.INFO)

# Load the files found under the local "data" directory as documents.
documents = SimpleDirectoryReader("data").load_data()

# Build the vector index via from_documents(): the bare constructor takes
# already-parsed nodes as its first argument, whereas from_documents() is the
# entry point that splits documents into chunks before embedding them.
# No chunk size is configured here, so the library default applies.
index = GPTVectorStoreIndex.from_documents(documents)

# Persist the index so it can be reloaded later without re-embedding.
# Older llama_index releases expose save_to_disk(); releases that dropped it
# persist through the index's storage context instead (which writes a
# directory of JSON files rather than a single file).
# NOTE(review): confirm which API the pinned llama_index version provides.
if hasattr(index, "save_to_disk"):
    index.save_to_disk("index.json")
else:
    index.storage_context.persist(persist_dir="storage")