-
Notifications
You must be signed in to change notification settings - Fork 2
/
Copy pathupdate_database.py
33 lines (29 loc) · 1.34 KB
/
update_database.py
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
"""
This script updates the database then stops.
"""
import lmntfy
import argparse
from pathlib import Path
def parse_args():
parser = argparse.ArgumentParser()
parser.add_argument("--docs_folder", default="./data/nersc_doc/docs", type=Path, help="path to the NERSC documentation folder")
parser.add_argument("--database_folder", default="./data/database", type=Path, help="path to the database saving folder")
parser.add_argument("--models_folder",default="../models",type=Path, help="path to the folder containing all the models")
args = parser.parse_args()
return args
def main():
print("Updating database...")
# process command line arguments
args = parse_args()
docs_folder = args.docs_folder
database_folder = args.database_folder
models_folder = args.models_folder
# load the database and updates it if needed
llm = lmntfy.models.llm.Default(models_folder,
# keep the model on CPU as we will not need to draw upon it
device='cpu', engineType=lmntfy.models.llm.engine.TransformerEngine)
search_engine = lmntfy.database.search.Default(models_folder, device='cpu')
database = lmntfy.database.Database(docs_folder, database_folder, search_engine, llm, update_database=True)
print("Done!")
if __name__ == "__main__":
main()