Make the second stage model available on HF Space
app.py
CHANGED
@@ -8,12 +8,9 @@ from model import AppModel
 
 DESCRIPTION = '''# <a href="https://github.com/THUDM/CogView2">CogView2</a> (text2image)
 
-
-This application accepts English or Chinese as input.
+The model accepts English or Chinese as input.
 In general, Chinese input produces better results than English input.
-
-But the translation model may mistranslate and the results could be poor.
-So, it is also a good idea to input the translation results from other translation services.
+By checking the "Translate to Chinese" checkbox, the results of English to Chinese translation with this Space will be used as input. Since the translation model may mistranslate, you may want to use the translation results from other translation services.
 '''
 NOTES = '''
 - This app is adapted from <a href="https://github.com/hysts/CogView2_demo">https://github.com/hysts/CogView2_demo</a>. It would be recommended to use the repo if you want to run the app yourself.
@@ -29,7 +26,7 @@ def set_example_text(example: list) -> list[dict]:
 
 
 def main():
-    only_first_stage = True
+    only_first_stage = False
     max_inference_batch_size = 8
     model = AppModel(max_inference_batch_size, only_first_stage)
 
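Note on the app.py change: `only_first_stage` is the switch this commit is about. With `True`, the Space runs only the CogLM first stage and returns low-resolution images; with `False`, the CogView2 super-resolution stage runs as well. Below is a minimal sketch of the intended control flow, with hypothetical helper names; the real logic lives in model.py.

    # Sketch only: illustrates the effect of the flag, not the repo's actual code.
    def generate(model, text: str, only_first_stage: bool):
        tokens = model.first_stage_tokens(text)   # hypothetical: CogLM text-to-token stage
        if only_first_stage:
            return model.decode_low_res(tokens)   # hypothetical: return low-resolution images
        return model.super_resolve(tokens)        # hypothetical: dsr + itersr super-resolution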
model.py
CHANGED
@@ -54,7 +54,7 @@ if os.getenv('SYSTEM') == 'spaces':
     names = [
         'coglm.zip',
         'cogview2-dsr.zip',
-
+        'cogview2-itersr.zip',
     ]
     for name in names:
         download_and_extract_cogview2_models(name)
@@ -215,6 +215,8 @@ class Model:
         start = time.perf_counter()
 
         model, args = InferenceModel.from_pretrained(self.args, 'coglm')
+        if not self.args.only_first_stage:
+            model.transformer.cpu()
 
         elapsed = time.perf_counter() - start
         logger.info(f'--- done ({elapsed=:.3f}) ---')
@@ -278,8 +280,20 @@ class Model:
         seq, txt_len = self.preprocess_text(text)
         if seq is None:
             return None
+
         self.only_first_stage = only_first_stage
+        if not self.only_first_stage or self.srg is not None:
+            self.srg.dsr.model.cpu()
+            self.srg.itersr.model.cpu()
+            torch.cuda.empty_cache()
+            self.model.transformer.to(self.device)
         tokens = self.generate_tokens(seq, txt_len, num)
+
+        if not self.only_first_stage:
+            self.model.transformer.cpu()
+            torch.cuda.empty_cache()
+            self.srg.dsr.model.to(self.device)
+            self.srg.itersr.model.to(self.device)
         res = self.generate_images(seq, txt_len, tokens)
 
         elapsed = time.perf_counter() - start
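Note on the model.py change: the commit swaps the two stages between CPU and GPU around each generation step. The CogLM transformer sits on the GPU while tokens are generated, then it is moved to the CPU and the super-resolution modules (dsr and itersr) are moved in before the images are produced. The likely motivation, an assumption based on the code rather than anything stated in the commit, is that both stages do not fit in GPU memory at once on the Space hardware. A minimal, generic sketch of that pattern with plain torch modules (not the repo's classes):

    # Generic device-swapping sketch, assuming two stages that each fit on the GPU
    # only when the other one is parked on the CPU.
    import torch

    def swap_stages(to_cpu: torch.nn.Module, to_gpu: torch.nn.Module,
                    device: torch.device) -> None:
        to_cpu.cpu()                # evict the stage we are done with
        torch.cuda.empty_cache()    # release cached blocks so the next stage fits
        to_gpu.to(device)           # bring in the stage we need next

    # Usage sketch (names are illustrative):
    #   swap_stages(second_stage, first_stage, device)   # before generate_tokens
    #   tokens = first_stage(...)
    #   swap_stages(first_stage, second_stage, device)   # before generate_images
    #   images = second_stage(tokens, ...)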