dsmueller committed on
Commit
f6c29be
1 Parent(s): 9b37590

Update .gitignore and Dockerfile, add fine-tune data files

Browse files
.gitignore CHANGED
@@ -1,3 +1,4 @@
1
  .venv/
2
  __pycache__/
3
- .env
 
 
1
  .venv/
2
  __pycache__/
3
+ .env
4
+ cache
Dockerfile CHANGED
@@ -4,8 +4,11 @@ FROM python:3.11.1
4
  # Set the working directory in the container
5
  WORKDIR /app
6
 
7
- # Install poetry
8
- # RUN pip3 install poetry==1.7.1
 
 
 
9
 
10
  # Copy the current directory contents into the container at /app
11
  COPY . .
 
4
  # Set the working directory in the container
5
  WORKDIR /app
6
 
7
+ # Run the container as root
8
+ # USER root
9
+
10
+ # Change permissions of the working directory
11
+ RUN chmod 777 /app # Gives all users read, write, and exec permissions in the app directory.
12
 
13
  # Copy the current directory contents into the container at /app
14
  COPY . .
fine_tune_data/train_data.csv ADDED
The diff for this file is too large to render. See raw diff
 
fine_tune_data/validation_data.csv ADDED
@@ -0,0 +1,2 @@
 
 
 
1
+ text
2
+ "### Human: What is the aerospace mechanisms symposia?### Assistant: An annual meeting of space mechanism experts. {'source': 'DM', 'page': 0}"
train_llm.py CHANGED
@@ -12,10 +12,10 @@ from tqdm.notebook import tqdm
12
 
13
  # Load dataset
14
  dataset_name = 'ai-aerospace/ams_data_train_generic_v0.1_100'
15
- dataset=load_dataset(dataset_name,cache_dir='.')
16
 
17
  # Write dataset files into data directory
18
- data_directory = '../fine_tune_data/'
19
 
20
  # Create the data directory if it doesn't exist
21
  os.makedirs(data_directory, exist_ok=True)
 
12
 
13
  # Load dataset
14
  dataset_name = 'ai-aerospace/ams_data_train_generic_v0.1_100'
15
+ dataset=load_dataset(dataset_name,cache_dir='./cache')
16
 
17
  # Write dataset files into data directory
18
+ data_directory = './fine_tune_data/'
19
 
20
  # Create the data directory if it doesn't exist
21
  os.makedirs(data_directory, exist_ok=True)