Spaces:

ejschwartz
/

resym

Running on Zero

App Files Files Community

ejschwartz committed on Mar 21

Commit

0b155f0

1 Parent(s): 0adad70

fix again

Browse files

Files changed (1) hide show

app.py +23 -7

app.py CHANGED Viewed

@@ -76,11 +76,10 @@ def infer(code):
     # ejs: Yeah, this var_name thing is really bizarre. But look at https://github.com/lt-asset/resym/blob/main/training_src/fielddecoder_inf.py
     prompt = f"What are the original name and data types of variables {varstring}?\n```{code}\n```{var_name}"
-    prompt = code + var_name + ":"
-    print(prompt)
     input_ids = tokenizer.encode(prompt, return_tensors="pt").cuda()[:, : 8192 - 1024]
-    output = vardecoder_model.generate(
         input_ids=input_ids,
         max_new_tokens=1024,
         num_beams=4,
@@ -90,14 +89,30 @@ def infer(code):
         pad_token_id=0,
         eos_token_id=0,
     )[0]
-    output = tokenizer.decode(
-        output[input_ids.size(1) :],
         skip_special_tokens=True,
         clean_up_tokenization_spaces=True,
     )
-    output = var_name + ":" + output
-    return output, varstring
 demo = gr.Interface(
@@ -106,6 +121,7 @@ demo = gr.Interface(
         gr.Textbox(lines=10, value=example),
     ],
     outputs=[gr.Text(label="Var Decoder Output"),
              gr.Text(label="Generated Variable List")],
     description=description
 )

     # ejs: Yeah, this var_name thing is really bizarre. But look at https://github.com/lt-asset/resym/blob/main/training_src/fielddecoder_inf.py
     prompt = f"What are the original name and data types of variables {varstring}?\n```{code}\n```{var_name}"
+    print(f"Prompt:\n{prompt}")
     input_ids = tokenizer.encode(prompt, return_tensors="pt").cuda()[:, : 8192 - 1024]
+    var_output = vardecoder_model.generate(
         input_ids=input_ids,
         max_new_tokens=1024,
         num_beams=4,
         pad_token_id=0,
         eos_token_id=0,
     )[0]
+    var_output = tokenizer.decode(
+        var_output[input_ids.size(1) :],
+        skip_special_tokens=True,
+        clean_up_tokenization_spaces=True,
+    )
+    field_output = fielddecoder_model.generate(
+        input_ids=input_ids,
+        max_new_tokens=1024,
+        num_beams=4,
+        num_return_sequences=1,
+        do_sample=False,
+        early_stopping=False,
+        pad_token_id=0,
+        eos_token_id=0,
+    )[0]
+    field_output = tokenizer.decode(
+        field_output[input_ids.size(1) :],
         skip_special_tokens=True,
         clean_up_tokenization_spaces=True,
     )
+    var_output = var_name + ":" + var_output
+    field_output = var_name + ":" + field_output
+    return var_output, field_output, varstring
 demo = gr.Interface(
         gr.Textbox(lines=10, value=example),
     ],
     outputs=[gr.Text(label="Var Decoder Output"),
+             gr.Text(label="Field Decoder Output"),
              gr.Text(label="Generated Variable List")],
     description=description
 )