Spaces:

Arijit-hazra
/

my-image-captioner

Runtime error

Arijit-hazra committed on Apr 27, 2023

Commit

e140fd2

1 Parent(s): 9091369

Update app.py: rename the transcribe functions again and invoke the model directly instead of through model.call

Files changed (1) hide show

app.py CHANGED Viewed

@@ -14,13 +14,13 @@ def custom_standardization(s):
 model = build()
-def single_transcribe(image, temperature=1):
     initial = model.word_to_index([['[START]']]) # (batch, sequence)
     img_features = model.feature_extractor(image[tf.newaxis, ...])
     tokens = initial # (batch, sequence)
     for n in range(50):
-        preds = model.call((img_features, tokens)).numpy()  # (batch, sequence, vocab)
         preds = preds[:,-1, :]  #(batch, vocab)
         if temperature==0:
             next = tf.argmax(preds, axis=-1)[:, tf.newaxis]  # (batch, 1)
@@ -35,13 +35,13 @@ def single_transcribe(image, temperature=1):
     result = tf.strings.reduce_join(words, axis=-1, separator=' ')
     return result.numpy().decode()
-def transcribes(image):
     result = []
     for t in [0,0.5,1]:
         result.append(single_transcribe(image, t))
     return result
-gr.interface(fn=transcribes,
              inputs=gr.Image(type="pil"),
              outputs=["text","text","text"]
             ).launch()

 model = build()
+def single_img_transcribe(image, temperature=1):
     initial = model.word_to_index([['[START]']]) # (batch, sequence)
     img_features = model.feature_extractor(image[tf.newaxis, ...])
     tokens = initial # (batch, sequence)
     for n in range(50):
+        preds = model((img_features, tokens)).numpy()  # (batch, sequence, vocab)
         preds = preds[:,-1, :]  #(batch, vocab)
         if temperature==0:
             next = tf.argmax(preds, axis=-1)[:, tf.newaxis]  # (batch, 1)
     result = tf.strings.reduce_join(words, axis=-1, separator=' ')
     return result.numpy().decode()
+def img_transcribes(image):
     result = []
     for t in [0,0.5,1]:
         result.append(single_transcribe(image, t))
     return result
+gr.interface(fn=img_transcribes,
              inputs=gr.Image(type="pil"),
              outputs=["text","text","text"]
             ).launch()