HachiML committed on
Commit
cd283a7
1 Parent(s): 4a5f9eb

Upload processing_mists.py

Browse files
Files changed (1) hide show
  1. processing_mists.py +10 -3
processing_mists.py CHANGED
@@ -44,6 +44,7 @@ class MistsProcessor(ProcessorMixin):
44
  torch_dtype: Optional[Union[str, torch.dtype]] = torch.float,
45
  time_series_padding: Union[bool, str] = False,
46
  time_series_max_length: Union[int, None] = None,
 
47
  ) -> BatchFeature:
48
  if time_series is not None:
49
  time_series_values = self.feature_extractor(
@@ -55,9 +56,15 @@ class MistsProcessor(ProcessorMixin):
55
  )
56
  else:
57
  time_series_values = None
58
- text_inputs = self.tokenizer(
59
- text, return_tensors=return_tensors, padding=padding, truncation=truncation, max_length=max_length
60
- )
 
 
 
 
 
 
61
 
62
  return BatchFeature(data={**text_inputs, **time_series_values})
63
 
 
44
  torch_dtype: Optional[Union[str, torch.dtype]] = torch.float,
45
  time_series_padding: Union[bool, str] = False,
46
  time_series_max_length: Union[int, None] = None,
47
+ text_tokenize: bool = True,
48
  ) -> BatchFeature:
49
  if time_series is not None:
50
  time_series_values = self.feature_extractor(
 
56
  )
57
  else:
58
  time_series_values = None
59
+ if text is not None:
60
+ if text_tokenize:
61
+ text_inputs = self.tokenizer(
62
+ text, return_tensors=return_tensors, padding=padding, truncation=truncation, max_length=max_length
63
+ )
64
+ else:
65
+ text_inputs = {"text": text}
66
+ else:
67
+ text_inputs = None
68
 
69
  return BatchFeature(data={**text_inputs, **time_series_values})
70