|
from transformers import pipeline |
|
from greenery import parse |
|
from greenery.parse import NoMatch |
|
from listener import Listener, ListenerOutput |
|
import time |
|
import json |
|
import torch |
|
|
|
class EndpointHandler: |
|
def __init__(self, path=""): |
|
self.listener = Listener(path, { |
|
"do_sample": True, |
|
"max_new_tokens": 128, |
|
"top_p": 0.9, |
|
"num_return_sequences": 500, |
|
"num_beams": 1 |
|
}, device="cuda" if torch.cuda.is_available() else "cpu") |
|
|
|
def __call__(self, data): |
|
|
|
inp = data.pop("inputs", None) |
|
spec = inp["spec"] |
|
true_program = inp["true_program"] |
|
|
|
start = time.time() |
|
outputs = self.listener.synthesize([[(s["string"], s["label"]) for s in spec]], return_scores=True) |
|
consistent_program_scores = [outputs.decoded_scores[0][i] for i in outputs.idx[0]] |
|
consistent_programs = [outputs.decoded[0][i] for i in outputs.idx[0]] |
|
sorted_programs = sorted(set(zip(consistent_program_scores, consistent_programs)), reverse=True, key=lambda x: x[0]) |
|
end = time.time() |
|
|
|
top_guess = None |
|
top_score = None |
|
top_success = False |
|
top_10_guesses = None |
|
top_10_scores = None |
|
top_10_success = False |
|
if len(sorted_programs) > 0: |
|
top_guess = sorted_programs[0][1] |
|
top_score = sorted_programs[0][0] |
|
top_success = parse(top_guess.replace('\\', '')).equivalent(parse(true_program).replace('\\', '')) |
|
top_10_guesses = [p for s, p in sorted_programs[:10]] |
|
top_10_scores = [s for s, p in sorted_programs[:10]] |
|
top_10_success = any([parse(p.replace('\\', '')).equivalent(parse(true_program.replace('\\', ''))) for p in top_10_guesses]) |
|
|
|
return { |
|
"guess": top_guess, |
|
"top_1_success": top_success, |
|
"top_1_score": top_score, |
|
"top_10_guesses": top_10_guesses, |
|
"top_10_scores": top_10_scores, |
|
"top_10_success": top_10_success, |
|
"time": end - start |
|
} |
|
|