vietexob committed
Commit a605fa2 · Parent: a179a95

Added Italian text

Files changed (4):
  1. CLAUDE.md +13 -2
  2. app.py +8 -3
  3. data/sample_it.txt +1 -0
  4. llm_graph.py +3 -2
CLAUDE.md CHANGED

@@ -40,7 +40,7 @@ AZURE_EMBEDDING_DEPLOYMENT=<embedding_deployment>
 AZURE_EMBEDDING_API_VERSION=<embedding_api_version>
 ```
 
-## Running the Application
+## Development Commands
 
 ```bash
 # Install dependencies
@@ -48,6 +48,9 @@ pip install -r requirements.txt
 
 # Run the Gradio app
 python app.py
+
+# Test model extraction directly
+python llm_graph.py
 ```
 
 ## Key Dependencies
@@ -76,4 +79,12 @@ The application expects JSON output with this schema:
   "nodes": [{"id": "entity", "type": "broad_type", "detailed_type": "specific_type"}],
   "edges": [{"from": "entity1", "to": "entity2", "label": "relationship"}]
 }
-```
+```
+
+## Testing and Development Notes
+
+- No formal test suite exists; manual testing through the Gradio interface
+- First example is automatically cached for performance on startup
+- Cache files stored in `cache/` directory as pickle files
+- Working directory `sample/` is cleared and recreated on each run
+- GraphML files generated by LightRAG for Azure OpenAI model backend
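For reference, a minimal sketch of what an extraction result matching the schema above looks like when loaded into networkx (the graph library imported in the llm_graph.py diff below); the entities here are invented for illustration:

```python
import json
import networkx as nx

# A hypothetical extraction result matching the documented schema.
raw = '''{
  "nodes": [
    {"id": "Lake Como", "type": "location", "detailed_type": "lake"},
    {"id": "Italy", "type": "location", "detailed_type": "country"}
  ],
  "edges": [
    {"from": "Lake Como", "to": "Italy", "label": "located in"}
  ]
}'''

data = json.loads(raw)

# Build a directed graph from the nodes/edges lists.
graph = nx.DiGraph()
for node in data["nodes"]:
    graph.add_node(node["id"], type=node["type"],
                   detailed_type=node["detailed_type"])
for edge in data["edges"]:
    graph.add_edge(edge["from"], edge["to"], label=edge["label"])

print(graph.number_of_nodes(), graph.number_of_edges())  # 2 1
```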
app.py CHANGED

@@ -59,6 +59,10 @@ text_es_file = "./data/sample_es.txt"
 with open(text_es_file, 'r', encoding='utf-8') as file:
     text_es = file.read()
 
+text_it_file = "./data/sample_it.txt"
+with open(text_it_file, 'r', encoding='utf-8') as file:
+    text_it = file.read()
+
 # Create cache directory if it doesn't exist
 os.makedirs(CACHE_DIR, exist_ok=True)
 os.makedirs(WORKING_DIR, exist_ok=True)
@@ -95,11 +99,11 @@ def extract_kg(text="", model_name=MODEL_LIST[0], model=None):
         raise gr.Error("⚠️ Both text and model must be provided!")
     if not model:
         raise gr.Error("⚠️ Model must be provided!")
-
+
     try:
         start_time = time.time()
         result = model.extract(text, model_name)
-
+
         end_time = time.time()
         duration = end_time - start_time
         logging.info(f"Response time: {duration:.4f} seconds")
@@ -342,7 +346,8 @@ EXAMPLES = [
     [handle_text(text_fr)],
     [handle_text(text2_en)],
     [handle_text(text_es)],
-    [handle_text(text3_en)]
+    [handle_text(text3_en)],
+    [handle_text(text_it)],
 ]
 
 def generate_first_example():
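CLAUDE.md's new notes say the first example is cached as a pickle file under `cache/`, and this diff shows `CACHE_DIR` being created at startup. A minimal sketch of that kind of pickle cache, assuming a simple key-to-filename scheme (the repo's actual keying may differ; `cached_extract` is a hypothetical helper):

```python
import os
import pickle

CACHE_DIR = "cache"  # matches the directory created in app.py

def cached_extract(key, compute):
    """Hypothetical sketch of the pickle-based caching described in
    CLAUDE.md; returns a cached result if present, else computes,
    stores, and returns it."""
    path = os.path.join(CACHE_DIR, f"{key}.pkl")
    if os.path.exists(path):
        with open(path, "rb") as f:
            return pickle.load(f)
    result = compute()
    os.makedirs(CACHE_DIR, exist_ok=True)
    with open(path, "wb") as f:
        pickle.dump(result, f)
    return result

# Illustrative usage; model.extract is the call shown in the diff above:
# result = cached_extract("first_example",
#                         lambda: model.extract(text, model_name))
```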
data/sample_it.txt ADDED

@@ -0,0 +1 @@
+Ieri sera, passeggiando lungo la riva del lago di Como, ho assistito a uno dei tramonti più suggestivi della mia vita. Il cielo, dipinto di sfumature che variavano dall'arancio acceso al viola intenso, si rifletteva sull'acqua calma come una tela perfetta. Le montagne circostanti, avvolte da una leggera foschia, sembravano fondersi con le nuvole, creando un paesaggio che sembrava uscito da un quadro impressionista. Alcune barche a vela, silenziose e lente, solcavano le acque lasciando dietro di sé una scia dorata, mentre il profumo di gelsomino e di terra bagnata si mescolava all'aria fresca della sera. Per un momento, il tempo sembrava essersi fermato, e anche il chiacchiericcio dei pochi turisti presenti si era attenuato, come se tutti fossero rapiti da quella magia effimera. È in istanti come questi che ci si rende conto di quanto la natura, con la sua semplicità, sappia regalarci emozioni che né la tecnologia né la frenesia quotidiana potranno mai eguagliare.
llm_graph.py CHANGED

@@ -1,5 +1,6 @@
 import os
 import time
+# import shutil
 
 import numpy as np
 import networkx as nx
@@ -136,7 +137,7 @@ class LLMGraph:
         """
         Extract knowledge graph in structured format from text.
         """
-
+
         if model_name == MODEL_LIST[0]:
             # Use Hugging Face Inference API with Phi-3-mini-128k-instruct-graph
             messages = self._get_messages(text)
@@ -146,7 +147,7 @@ class LLMGraph:
         else:
             # Use LightRAG with Azure OpenAI
             self.rag.insert(text)  # Insert the text into the RAG storage
-
+
             # Wait for GRAPHML_FILE to be created
             while not os.path.exists(GRAPHML_FILE):
                 time.sleep(0.1)  # Sleep for 0.1 seconds before checking again
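The unchanged context above shows extract() busy-waiting until LightRAG writes `GRAPHML_FILE`, which would spin forever if the insert fails. A defensive variant that bounds the wait, as a sketch rather than the repo's code (`wait_for_file` is a hypothetical helper):

```python
import os
import time

def wait_for_file(path, timeout=60.0, poll_interval=0.1):
    """Poll until `path` exists, raising instead of hanging forever."""
    deadline = time.monotonic() + timeout
    while not os.path.exists(path):
        if time.monotonic() >= deadline:
            raise TimeoutError(f"{path} was not created within {timeout:.0f}s")
        time.sleep(poll_interval)

# Usage in place of the bare while-loop, then load the generated graph
# with networkx (imported in this file):
# wait_for_file(GRAPHML_FILE)
# graph = nx.read_graphml(GRAPHML_FILE)
```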