lihongze8 committed on
Commit
acddaf1
·
verified ·
1 Parent(s): ef93aaf

Update app.py

Browse files
Files changed (1) hide show
  1. app.py +6 -2
app.py CHANGED
@@ -61,10 +61,14 @@ def evaluate(problem, response):
61
  step_rewards = derive_step_rewards(rewards, reward_flags)
62
 
63
  # 确保返回的是有效的JSON字符串
64
- return json.dumps(step_rewards[0].tolist())
 
 
 
 
 
65
  except Exception as e:
66
  return json.dumps({"error": str(e)})
67
-
68
  # 创建Gradio界面
69
  iface = gr.Interface(
70
  fn=evaluate,
 
61
  step_rewards = derive_step_rewards(rewards, reward_flags)
62
 
63
  # 确保返回的是有效的JSON字符串
64
+ if isinstance(step_rewards[0], torch.Tensor):
65
+ return json.dumps(step_rewards[0].cpu().numpy().tolist())
66
+ elif isinstance(step_rewards[0], np.ndarray):
67
+ return json.dumps(step_rewards[0].tolist())
68
+ else:
69
+ return json.dumps(list(step_rewards[0])) # 转换为列表
70
  except Exception as e:
71
  return json.dumps({"error": str(e)})
 
72
  # 创建Gradio界面
73
  iface = gr.Interface(
74
  fn=evaluate,