Zwea Htet committed on
Commit
9f10a81
•
1 Parent(s): d15a232

fixed import error

Browse files
data/{regItems.py → prepare.py} RENAMED
@@ -2,10 +2,10 @@
2
  import numpy as np
3
  import pandas as pd
4
 
5
- df = pd.read_json(r"../../Dataset/regItems.json")
6
  df = df.replace(to_replace="", value=np.nan).dropna(axis=0) # remove null values
7
  df['paragraphText'] = df['paragraphText'].str.replace("OLD SECTION.*", "", regex=True) # remove any dirty words
8
- df['paragraphText'] = df['paragraphText'].str.replace("[a-zA-z]\d\w+", ". ", regex=True)
9
  df['paragraphText'] = df['paragraphText'].str.lower()
10
 
11
  data = df['paragraphText'].tolist()
 
2
  import numpy as np
3
  import pandas as pd
4
 
5
+ df = pd.read_json(r"./regItems.json")
6
  df = df.replace(to_replace="", value=np.nan).dropna(axis=0) # remove null values
7
  df['paragraphText'] = df['paragraphText'].str.replace("OLD SECTION.*", "", regex=True) # remove any dirty words
8
+ # df['paragraphText'] = df['paragraphText'].str.replace("[a-zA-z]\d\w+", ". ", regex=True)
9
  df['paragraphText'] = df['paragraphText'].str.lower()
10
 
11
  data = df['paragraphText'].tolist()
data/regItems.json ADDED
The diff for this file is too large to render. See raw diff
 
models/bloom.py CHANGED
@@ -4,7 +4,7 @@ from dotenv import load_dotenv
4
  from llama_index import (Document, GPTSimpleVectorIndex, LLMPredictor,
5
  ServiceContext)
6
 
7
- from data.regItems import data
8
 
9
  from .customLLM import CustomLLM, prompt_helper
10
 
 
4
  from llama_index import (Document, GPTSimpleVectorIndex, LLMPredictor,
5
  ServiceContext)
6
 
7
+ from data.prepare import data
8
 
9
  from .customLLM import CustomLLM, prompt_helper
10