Files
DB-GPT/examples/gpt_index.py
2023-05-24 18:43:04 +08:00

20 lines
526 B
Python

#!/usr/bin/env python3
# -*- coding: utf-8 -*-
import logging
import sys
from llama_index import GPTSimpleVectorIndex, SimpleDirectoryReader
# Route INFO-and-above log records to stdout. basicConfig() installs a stdout
# StreamHandler on the root logger when it has no handlers yet, so a second
# StreamHandler is deliberately NOT added: doing so would emit every log
# record twice (once formatted, once as a bare message).
logging.basicConfig(stream=sys.stdout, level=logging.INFO)

# Read the documents from the "data" directory (relative path).
documents = SimpleDirectoryReader("data").load_data()

# Build the vector index from the loaded documents.
# NOTE(review): chunk size and embedding settings are whatever the installed
# llama_index version uses by default -- confirm before relying on a
# specific token limit per chunk.
index = GPTSimpleVectorIndex(documents)

# Save the index to "index.json" (relative path) so it can be reloaded later.
index.save_to_disk("index.json")