grapplerulrich committed 59d5e33
Parent: a69d4fe

Create directory for cache if not exists

Files changed:
- app.py +4 -2
- beautiful_soup/beautiful_soup.py +4 -2
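The pattern this commit applies is the same in both files: derive the cache file path, then create its parent directory with makedirs(..., exist_ok=True) before checking for a cached copy. A minimal sketch of that guard, assuming the path always includes a directory component as the repo's paths do (the function name read_cached is illustrative, not from the repo):

from os import makedirs
from os.path import dirname, exists

def read_cached( file_path ):
    # Create the cache directory on first use; exist_ok=True makes the
    # call a no-op when the directory already exists. Assumes file_path
    # has a directory component, as all paths in this repo do.
    makedirs( dirname( file_path ), exist_ok=True )
    if exists( file_path ):
        with open( file_path, 'r' ) as cached:
            return cached.read()
    return None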
app.py
CHANGED
@@ -1,5 +1,5 @@
-from os import remove
-from os.path import exists
+from os import makedirs, remove
+from os.path import exists, dirname
 from functools import cache
 import json
 import streamlit as st
@@ -34,6 +34,7 @@ def search_results( query ):
     file_path = 'search-results/' + slugify( query ) + '.json'
 
     results = []
+    makedirs(dirname(file_path), exist_ok=True)
     if exists( file_path ):
         with open( file_path, 'r' ) as results_file:
             results = json.load( results_file )
@@ -51,6 +52,7 @@ def search_results( query ):
 
 def content_summary( url_id, content ):
     file_path = 'summaries/' + url_id + '.json'
+    makedirs(dirname(file_path), exist_ok=True)
     if exists( file_path ):
         with open( file_path, 'r' ) as file:
             summary = json.load( file )
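Note that makedirs(dirname(file_path), exist_ok=True) runs unconditionally before the exists() check, so the first request creates search-results/ and summaries/ up front instead of failing later when the function writes the file back to the cache (the write path sits outside the shown hunks).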
beautiful_soup/beautiful_soup.py
CHANGED
@@ -1,5 +1,6 @@
 import uuid
-from os
+from os import makedirs, remove
+from os.path import exists, dirname
 from bs4 import BeautifulSoup
 import requests
 
@@ -14,6 +15,7 @@ import requests
 
 def get_url_content( url ):
     file_path = 'page-content/' + uuid.uuid5( uuid.NAMESPACE_URL, url ).hex + '.txt'
+    makedirs(dirname(file_path), exist_ok=True)
     if exists( file_path ):
         with open( file_path, 'r' ) as file_content:
             content = file_content.read()
@@ -49,7 +51,7 @@ def extract_content( url ):
 # Make request and get html content.
 def get_soup( url ):
     file_path = 'web-pages/' + uuid.uuid5( uuid.NAMESPACE_URL, url ).hex + '.html'
-
+    makedirs(dirname(file_path), exist_ok=True)
     if exists( file_path ):
         with open( file_path, 'r' ) as web_page:
             html = web_page.read()
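The cache file names in this module come from uuid.uuid5, which hashes the URL deterministically, so the same URL always resolves to the same cache file. A short sketch of the path derivation together with the directory guard added in this commit (the example URL is illustrative):

import uuid
from os import makedirs
from os.path import dirname

url = 'https://example.com/'  # illustrative URL, not from the repo
# uuid5 is deterministic for a given namespace and name, so repeated
# runs map the same URL to the same cache file.
file_path = 'web-pages/' + uuid.uuid5( uuid.NAMESPACE_URL, url ).hex + '.html'
makedirs( dirname( file_path ), exist_ok=True )  # creates 'web-pages/' once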