Spaces:
Runtime error
Runtime error
ffreemt
commited on
Commit
•
fa25318
1
Parent(s):
51ccc27
Update sync with github repo
Browse files- README.md +1 -1
- README1.md +51 -0
- pyproject.toml +16 -0
README.md
CHANGED
@@ -1,5 +1,5 @@
|
|
1 |
---
|
2 |
-
title:
|
3 |
emoji: 🦀
|
4 |
colorFrom: green
|
5 |
colorTo: red
|
|
|
1 |
---
|
2 |
+
title: multilingual-dokugpt
|
3 |
emoji: 🦀
|
4 |
colorFrom: green
|
5 |
colorTo: red
|
README1.md
ADDED
@@ -0,0 +1,51 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
# multilingual-dokugpt
|
2 |
+
Chat with multilingual documents in a language you prefer
|
3 |
+
|
4 |
+
`multilingual-dokugpt` is a quasi-localgpt that makes use of `langchain`, generates embeddings `locally` and save them in a Chroma vectorstore.
|
5 |
+
|
6 |
+
## Features
|
7 |
+
* Handle documents in multiple languages, multiple formats (.txt or plaintext in other suffixes, .docx, .pdf, .epub)
|
8 |
+
* Can use PawanOsman reverse proxy free api-key of the form `pk-....`. Refer to `.env.sample`
|
9 |
+
|
10 |
+
## Usage
|
11 |
+
* Clone this repo
|
12 |
+
```
|
13 |
+
git clone https://github.com/ffreemt/multilingual-dokugpt
|
14 |
+
cd multilingual-dokugpt
|
15 |
+
```
|
16 |
+
* [Optional] Create a even
|
17 |
+
e.g.
|
18 |
+
```
|
19 |
+
python -m venv .venv
|
20 |
+
call .venv\Scripts\activate # Windows
|
21 |
+
# source .venv/bin/activate # Linux/Mac
|
22 |
+
```
|
23 |
+
|
24 |
+
* Install packages
|
25 |
+
```
|
26 |
+
python -m pip install -r requirements.txt
|
27 |
+
```
|
28 |
+
|
29 |
+
* Setup OPENAI_API_KEY
|
30 |
+
e.g.
|
31 |
+
```
|
32 |
+
set OPENAI_API_KEY=sk... # Windows cmd
|
33 |
+
# export OPENAI_API_KEY=sk... # bash
|
34 |
+
|
35 |
+
or setup .env (refer to `.env.sample`)
|
36 |
+
```
|
37 |
+
|
38 |
+
* Start the program
|
39 |
+
```
|
40 |
+
python main.py
|
41 |
+
```
|
42 |
+
* Browse to
|
43 |
+
```
|
44 |
+
http://127.0.0.1:7860
|
45 |
+
```
|
46 |
+
|
47 |
+
## TODO
|
48 |
+
* Make it a true localgpt by replacing the remote querying with a local `llm`.
|
49 |
+
|
50 |
+
## License
|
51 |
+
`multilingual-dokugpt` is released under the MIT License. See the LICENSE file for more details.
|
pyproject.toml
ADDED
@@ -0,0 +1,16 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
[tool.poetry]
|
2 |
+
name = "multilingual-dokugpt"
|
3 |
+
version = "0.1.0"
|
4 |
+
description = "Talk to multilingual documents in a language you prefer"
|
5 |
+
authors = ["Your Name <you@example.com>"]
|
6 |
+
license = "MIT"
|
7 |
+
readme = "README1.md"
|
8 |
+
packages = [{include = "multilingual_dokugpt"}]
|
9 |
+
|
10 |
+
[tool.poetry.dependencies]
|
11 |
+
python = "^3.10"
|
12 |
+
|
13 |
+
|
14 |
+
[build-system]
|
15 |
+
requires = ["poetry-core"]
|
16 |
+
build-backend = "poetry.core.masonry.api"
|