Changed logs dataset target
- .gitignore +1 -1
- app.py +5 -3
- data/mini_vocab_v6.zip +3 -0
- interfaces/interface_datos.py +5 -3
- language/spanish.json +1 -1
- modules/module_connection.py +3 -4
- modules/module_logsManager.py +4 -2
.gitignore
CHANGED
@@ -1,3 +1,3 @@
 __pycache__/
 .env
-
+logs_edia_datos_spanish/
app.py
CHANGED
@@ -9,10 +9,12 @@ from interfaces.interface_datos import interface as interface_datos
 # --- Tool config ---
 # ToDo: Change the owner of the context dataset from nanom to vialibre
 CONTEXTS_DATASET = "nanom/splittedspanish3bwc"
-
-AVAILABLE_LOGS = True # [True | False]
+
 LANGUAGE = "spanish" # [spanish]
-VOCABULARY_SUBSET = "full" # [full]
+VOCABULARY_SUBSET = "full" # [full, mini]
+
+AVAILABLE_WORDCLOUD = False # [True | False]
+AVAILABLE_LOGS = True # [True | False]
 
 
 # --- Init classes ---
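After this commit, app.py exposes four config switches instead of two, with AVAILABLE_WORDCLOUD new and AVAILABLE_LOGS moved below the language settings. The sketch below shows how these values plausibly reach the data tab; only `available_logs` and `lang` appear as arguments in this commit's interface_datos.py hunks, so the bare call and anything else about `interface()` are assumptions for illustration.

```python
from interfaces.interface_datos import interface as interface_datos

# Values from the new side of this hunk
CONTEXTS_DATASET = "nanom/splittedspanish3bwc"
LANGUAGE = "spanish"            # [spanish]
VOCABULARY_SUBSET = "full"      # [full, mini]
AVAILABLE_WORDCLOUD = False     # [True | False]
AVAILABLE_LOGS = True           # [True | False]

# Assumed wiring: the real interface() likely takes more arguments (contexts
# dataset, vocabulary subset, wordcloud flag); only the two keywords below are
# grounded in this commit's interface_datos.py hunks.
demo = interface_datos(
    available_logs=AVAILABLE_LOGS,   # toggles the HuggingFaceDatasetSaver
    lang=LANGUAGE,                   # becomes the "logs_edia_datos_{lang}" suffix
)

if __name__ == "__main__":
    demo.launch()   # assumption: interface() returns a Gradio Blocks/Interface
```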
data/mini_vocab_v6.zip
ADDED
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:e1ac44f7478778f4c08bb57dc6aa79ededc89654b404320d0017586e578768a9
+size 93612
interfaces/interface_datos.py
CHANGED
@@ -15,7 +15,8 @@ def interface(
 
     # --- Init logs ---
    log_callback = HuggingFaceDatasetSaver(
-        available_logs=available_logs
+        available_logs=available_logs,
+        dataset_name=f"logs_edia_datos_{lang}"
    )
 
    # --- Init Class ---
@@ -67,7 +68,8 @@ def interface(
            value=labels["step3"]
        )
        subsets_choice = gr.CheckboxGroup(
-            label="",
+            label="Subset_choices",
+            show_label=False,
            interactive=True,
            visible=True
        )
@@ -148,7 +150,7 @@ def interface(
    save_field = [input_word, subsets_choice]
    log_callback.setup(
        components=save_field,
-        flagging_dir=
+        flagging_dir="logs"
    )
 
    btn_get_contexts.click(
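These three hunks change where logs land: the saver now targets a per-language dataset, `logs_edia_datos_{lang}`, the checkbox group gets a real label (hidden in the UI via `show_label=False`, presumably so logged rows carry a usable column header), and the flagging directory is fixed to "logs". Below is a minimal standalone sketch of the updated logging setup, assuming `lang` and `available_logs` arrive as arguments of `interface()`; component choices and everything outside these hunks are illustrative only.

```python
import gradio as gr
from modules.module_logsManager import HuggingFaceDatasetSaver

lang = "spanish"          # in the real file these come in as interface() parameters
available_logs = False    # assumption: False keeps the saver from touching the Hub

# --- Init logs ---
log_callback = HuggingFaceDatasetSaver(
    available_logs=available_logs,
    dataset_name=f"logs_edia_datos_{lang}",   # e.g. "logs_edia_datos_spanish"
)

with gr.Blocks() as demo:
    input_word = gr.Textbox(label="Word", placeholder="Ingresar aquí la palabra ...")
    subsets_choice = gr.CheckboxGroup(
        label="Subset_choices",   # labelled for the logs,
        show_label=False,         # but hidden in the rendered UI
        interactive=True,
        visible=True,
    )
    # The flagging callback is wired to the components whose values get logged.
    save_field = [input_word, subsets_choice]
    log_callback.setup(components=save_field, flagging_dir="logs")
```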
language/spanish.json
CHANGED
@@ -4,7 +4,7 @@
     "step2": "2. Seleccione cantidad máxima de contextos a recuperar",
     "step3": "3. Seleccione conjuntos de interés",
     "inputWord": {
-        "title": "",
+        "title": "Word",
         "placeholder": "Ingresar aquí la palabra ..."
     },
     "wordInfoButton": "Obtener información de palabra",
modules/module_connection.py
CHANGED
@@ -81,14 +81,13 @@ class Word2ContextExplorerConnector(Connector):
        return self.process_error(err), contexts, subsets_info, distribution_plot, word_cloud_plot, subsets_choice
 
    def get_word_context(
-        self,
-        word: str,
-        n_context: int,
+        self,
+        word: str,
+        n_context: int,
        subset_choice: List[str]
    ) -> Tuple:
 
        word = self.parse_word(word)
-        n_context = int(n_context)
        err = ""
        contexts = pd.DataFrame([], columns=[''])
 
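The substantive change in this hunk is dropping the `n_context = int(n_context)` cast (the re-listed parameter lines appear to be a whitespace-only touch-up); the method now trusts its `n_context: int` annotation. A tiny self-contained illustration of that contract, with the function name and body purely hypothetical:

```python
from typing import List, Tuple
import pandas as pd

def get_word_context_sketch(word: str, n_context: int, subset_choice: List[str]) -> Tuple:
    # Stand-in for the connector method: n_context is used as-is, without the
    # old defensive int() cast, so callers must pass an actual int.
    err = ""
    contexts = pd.DataFrame([], columns=[''])
    return err, contexts.head(n_context), subset_choice

print(get_word_context_sketch("palabra", 10, ["full"]))
```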
modules/module_logsManager.py
CHANGED
@@ -50,8 +50,8 @@ class HuggingFaceDatasetSaver(FlaggingCallback):
 
    def __init__(
        self,
+        dataset_name: str=None,
        hf_token: str=os.getenv('HF_TOKEN'),
-        dataset_name: str=os.getenv('DS_LOGS_NAME'),
        organization: Optional[str]=os.getenv('ORG_NAME'),
        private: bool=True,
        available_logs: bool=False
@@ -63,8 +63,10 @@ class HuggingFaceDatasetSaver(FlaggingCallback):
        organization: The organization to save the dataset under. The hf_token must provide write access to this organization. If not provided, saved under the name of the user corresponding to the hf_token.
        private: Whether the dataset should be private (defaults to False).
        """
-
+        assert(dataset_name is not None), "Error: Parameter 'dataset_name' cannot be empty!."
+
        self.dataset_name = dataset_name
+        self.hf_token = hf_token
        self.organization_name = organization
        self.dataset_private = private
        self.datetime = DateLogs()
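With this change the saver no longer falls back to the `DS_LOGS_NAME` environment variable: `dataset_name` must be passed explicitly (the new assert enforces it), and the token is now kept on the instance as `self.hf_token`. A minimal construction sketch under the new contract; that `available_logs=False` keeps setup() from writing to the Hub is an assumption, not shown in this diff.

```python
import os
from modules.module_logsManager import HuggingFaceDatasetSaver

# Omitting dataset_name now raises:
# AssertionError: Error: Parameter 'dataset_name' cannot be empty!.
saver = HuggingFaceDatasetSaver(
    dataset_name="logs_edia_datos_spanish",   # the value interface_datos.py builds for lang="spanish"
    hf_token=os.getenv("HF_TOKEN"),           # still defaults to the HF_TOKEN env var
    private=True,
    available_logs=False,                     # assumption: disabled logging keeps the saver inert
)
```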