| [ | |
| { | |
| "prompt": "22", | |
| "completion": [ | |
| "\u5236\u5b9a\u8be6\u7ec6\u7684\u5b66\u4e60\u8ba1\u5212\u5e76\u4e25\u683c\u6267\u884c", | |
| "\u91c7\u7528\u591a\u79cd\u5b66\u4e60\u65b9\u6cd5\uff0c\u5982\u9605\u8bfb\u3001\u505a\u7b14\u8bb0\u3001\u8ba8\u8bba\u7b49", | |
| "\u4fdd\u6301\u826f\u597d\u7684\u5b66\u4e60\u73af\u5883\uff0c\u51cf\u5c11\u5e72\u6270\u56e0\u7d20", | |
| "\u5b9a\u671f\u8fdb\u884c\u81ea\u6211\u6d4b\u8bd5\uff0c\u68c0\u67e5\u5b66\u4e60\u6548\u679c", | |
| "\u4fdd\u8bc1\u5145\u8db3\u7684\u7761\u7720\u548c\u9002\u5f53\u7684\u4f11\u606f" | |
| ], | |
| "reward": [ | |
| 5, | |
| 4, | |
| 2, | |
| 1, | |
| -5 | |
| ] | |
| }, | |
| { | |
| "prompt": "333", | |
| "completion": [ | |
| "\u5747\u8861\u996e\u98df\uff0c\u591a\u5403\u852c\u83dc\u6c34\u679c\uff0c\u5c11\u5403\u6cb9\u817b\u548c\u9ad8\u7cd6\u98df\u7269", | |
| "\u5b9a\u671f\u8fdb\u884c\u4f53\u80b2\u953b\u70bc\uff0c\u5982\u8dd1\u6b65\u3001\u6e38\u6cf3\u3001\u5065\u8eab\u7b49", | |
| "\u4fdd\u6301\u89c4\u5f8b\u7684\u4f5c\u606f\u65f6\u95f4\uff0c\u65e9\u7761\u65e9\u8d77", | |
| "\u4fdd\u6301\u826f\u597d\u7684\u5fc3\u6001\uff0c\u907f\u514d\u8fc7\u5ea6\u7126\u8651\u548c\u538b\u529b", | |
| "\u5b9a\u671f\u8fdb\u884c\u4f53\u68c0\uff0c\u53ca\u65f6\u53d1\u73b0\u548c\u9884\u9632\u75be\u75c5" | |
| ], | |
| "reward": [ | |
| -4, | |
| -3, | |
| -2, | |
| 2, | |
| 0 | |
| ] | |
| }, | |
| { | |
| "prompt": "4444", | |
| "completion": [ | |
| "\u5408\u7406\u5b89\u6392\u5de5\u4f5c\u4efb\u52a1\uff0c\u5236\u5b9a\u4f18\u5148\u7ea7", | |
| "\u907f\u514d\u591a\u4efb\u52a1\u5904\u7406\uff0c\u4e13\u6ce8\u5b8c\u6210\u4e00\u9879\u4efb\u52a1", | |
| "\u4f7f\u7528\u5de5\u5177\u548c\u8f6f\u4ef6\u63d0\u9ad8\u5de5\u4f5c\u81ea\u52a8\u5316\u7a0b\u5ea6", | |
| "\u5b9a\u671f\u4f11\u606f\uff0c\u907f\u514d\u957f\u65f6\u95f4\u8fde\u7eed\u5de5\u4f5c\u5bfc\u81f4\u75b2\u52b3", | |
| "\u4e0e\u540c\u4e8b\u6709\u6548\u6c9f\u901a\uff0c\u51cf\u5c11\u4e0d\u5fc5\u8981\u7684\u4f1a\u8bae\u548c\u5e72\u6270" | |
| ], | |
| "reward": [ | |
| 1, | |
| -2, | |
| 1, | |
| 4, | |
| 2 | |
| ] | |
| }, | |
| { | |
| "prompt": "55555", | |
| "completion": [ | |
| "\u5c0a\u91cd\u4ed6\u4eba\uff0c\u503e\u542c\u4ed6\u4eba\u7684\u610f\u89c1\u548c\u60f3\u6cd5", | |
| "\u79ef\u6781\u6c9f\u901a\uff0c\u8868\u8fbe\u81ea\u5df1\u7684\u611f\u53d7\u548c\u9700\u6c42", | |
| "\u4e50\u4e8e\u52a9\u4eba\uff0c\u5173\u5fc3\u4ed6\u4eba\u7684\u56f0\u96be\u548c\u95ee\u9898", | |
| "\u4fdd\u6301\u8bda\u4fe1\uff0c\u9075\u5b88\u627f\u8bfa\u548c\u7ea6\u5b9a", | |
| "\u53c2\u4e0e\u793e\u4ea4\u6d3b\u52a8\uff0c\u6269\u5927\u81ea\u5df1\u7684\u793e\u4ea4\u5708\u5b50" | |
| ], | |
| "reward": [ | |
| -4, | |
| 3, | |
| 5, | |
| 1, | |
| -1 | |
| ] | |
| }, | |
| { | |
| "prompt": "666666", | |
| "completion": [ | |
| "\u8fdb\u884c\u653e\u677e\u8bad\u7ec3\uff0c\u5982\u6df1\u547c\u5438\u3001\u51a5\u60f3\u7b49", | |
| "\u9002\u5f53\u8fdb\u884c\u4f53\u80b2\u953b\u70bc\uff0c\u91ca\u653e\u538b\u529b", | |
| "\u4e0e\u670b\u53cb\u6216\u5bb6\u4eba\u4ea4\u6d41\uff0c\u5bfb\u6c42\u652f\u6301\u548c\u5e2e\u52a9", | |
| "\u5408\u7406\u5b89\u6392\u65f6\u95f4\uff0c\u907f\u514d\u8fc7\u5ea6\u5de5\u4f5c\u548c\u5b66\u4e60", | |
| "\u57f9\u517b\u5174\u8da3\u7231\u597d\uff0c\u8f6c\u79fb\u6ce8\u610f\u529b" | |
| ], | |
| "reward": [ | |
| 0, | |
| 1, | |
| -5, | |
| 1, | |
| 0 | |
| ] | |
| }, | |
| { | |
| "prompt": "7777777", | |
| "completion": [ | |
| "\u5747\u8861\u996e\u98df\uff0c\u591a\u5403\u852c\u83dc\u6c34\u679c\uff0c\u5c11\u5403\u6cb9\u817b\u548c\u9ad8\u7cd6\u98df\u7269", | |
| "\u5b9a\u671f\u8fdb\u884c\u4f53\u80b2\u953b\u70bc\uff0c\u5982\u8dd1\u6b65\u3001\u6e38\u6cf3\u3001\u5065\u8eab\u7b49", | |
| "\u4fdd\u6301\u89c4\u5f8b\u7684\u4f5c\u606f\u65f6\u95f4\uff0c\u65e9\u7761\u65e9\u8d77", | |
| "\u4fdd\u6301\u826f\u597d\u7684\u5fc3\u6001\uff0c\u907f\u514d\u8fc7\u5ea6\u7126\u8651\u548c\u538b\u529b", | |
| "\u5b9a\u671f\u8fdb\u884c\u4f53\u68c0\uff0c\u53ca\u65f6\u53d1\u73b0\u548c\u9884\u9632\u75be\u75c5" | |
| ], | |
| "reward": [ | |
| 4, | |
| -4, | |
| 4, | |
| 4, | |
| -4 | |
| ] | |
| }, | |
| { | |
| "prompt": "88888888", | |
| "completion": [ | |
| "\u5408\u7406\u5b89\u6392\u5de5\u4f5c\u4efb\u52a1\uff0c\u5236\u5b9a\u4f18\u5148\u7ea7", | |
| "\u907f\u514d\u591a\u4efb\u52a1\u5904\u7406\uff0c\u4e13\u6ce8\u5b8c\u6210\u4e00\u9879\u4efb\u52a1", | |
| "\u4f7f\u7528\u5de5\u5177\u548c\u8f6f\u4ef6\u63d0\u9ad8\u5de5\u4f5c\u81ea\u52a8\u5316\u7a0b\u5ea6", | |
| "\u5b9a\u671f\u4f11\u606f\uff0c\u907f\u514d\u957f\u65f6\u95f4\u8fde\u7eed\u5de5\u4f5c\u5bfc\u81f4\u75b2\u52b3", | |
| "\u4e0e\u540c\u4e8b\u6709\u6548\u6c9f\u901a\uff0c\u51cf\u5c11\u4e0d\u5fc5\u8981\u7684\u4f1a\u8bae\u548c\u5e72\u6270" | |
| ], | |
| "reward": [ | |
| 1, | |
| -3, | |
| 1, | |
| -4, | |
| 4 | |
| ] | |
| }, | |
| { | |
| "prompt": "999999999", | |
| "completion": [ | |
| "\u5c0a\u91cd\u4ed6\u4eba\uff0c\u503e\u542c\u4ed6\u4eba\u7684\u610f\u89c1\u548c\u60f3\u6cd5", | |
| "\u79ef\u6781\u6c9f\u901a\uff0c\u8868\u8fbe\u81ea\u5df1\u7684\u611f\u53d7\u548c\u9700\u6c42", | |
| "\u4e50\u4e8e\u52a9\u4eba\uff0c\u5173\u5fc3\u4ed6\u4eba\u7684\u56f0\u96be\u548c\u95ee\u9898", | |
| "\u4fdd\u6301\u8bda\u4fe1\uff0c\u9075\u5b88\u627f\u8bfa\u548c\u7ea6\u5b9a", | |
| "\u53c2\u4e0e\u793e\u4ea4\u6d3b\u52a8\uff0c\u6269\u5927\u81ea\u5df1\u7684\u793e\u4ea4\u5708\u5b50" | |
| ], | |
| "reward": [ | |
| -2, | |
| -5, | |
| 1, | |
| 1, | |
| -2 | |
| ] | |
| }, | |
| { | |
| "prompt": "10101010101010101010", | |
| "completion": [ | |
| "\u8fdb\u884c\u653e\u677e\u8bad\u7ec3\uff0c\u5982\u6df1\u547c\u5438\u3001\u51a5\u60f3\u7b49", | |
| "\u9002\u5f53\u8fdb\u884c\u4f53\u80b2\u953b\u70bc\uff0c\u91ca\u653e\u538b\u529b", | |
| "\u4e0e\u670b\u53cb\u6216\u5bb6\u4eba\u4ea4\u6d41\uff0c\u5bfb\u6c42\u652f\u6301\u548c\u5e2e\u52a9", | |
| "\u5408\u7406\u5b89\u6392\u65f6\u95f4\uff0c\u907f\u514d\u8fc7\u5ea6\u5de5\u4f5c\u548c\u5b66\u4e60", | |
| "\u57f9\u517b\u5174\u8da3\u7231\u597d\uff0c\u8f6c\u79fb\u6ce8\u610f\u529b" | |
| ], | |
| "reward": [ | |
| 0, | |
| -5, | |
| -4, | |
| -3, | |
| -1 | |
| ] | |
| }, | |
| { | |
| "prompt": "1111111111111111111111", | |
| "completion": [ | |
| "\u5747\u8861\u996e\u98df\uff0c\u591a\u5403\u852c\u83dc\u6c34\u679c\uff0c\u5c11\u5403\u6cb9\u817b\u548c\u9ad8\u7cd6\u98df\u7269", | |
| "\u5b9a\u671f\u8fdb\u884c\u4f53\u80b2\u953b\u70bc\uff0c\u5982\u8dd1\u6b65\u3001\u6e38\u6cf3\u3001\u5065\u8eab\u7b49", | |
| "\u4fdd\u6301\u89c4\u5f8b\u7684\u4f5c\u606f\u65f6\u95f4\uff0c\u65e9\u7761\u65e9\u8d77", | |
| "\u4fdd\u6301\u826f\u597d\u7684\u5fc3\u6001\uff0c\u907f\u514d\u8fc7\u5ea6\u7126\u8651\u548c\u538b\u529b", | |
| "\u5b9a\u671f\u8fdb\u884c\u4f53\u68c0\uff0c\u53ca\u65f6\u53d1\u73b0\u548c\u9884\u9632\u75be\u75c5" | |
| ], | |
| "reward": [ | |
| -2, | |
| -3, | |
| -2, | |
| -5, | |
| -5 | |
| ] | |
| }, | |
| { | |
| "prompt": "121212121212121212121212", | |
| "completion": [ | |
| "\u5408\u7406\u5b89\u6392\u5de5\u4f5c\u4efb\u52a1\uff0c\u5236\u5b9a\u4f18\u5148\u7ea7", | |
| "\u907f\u514d\u591a\u4efb\u52a1\u5904\u7406\uff0c\u4e13\u6ce8\u5b8c\u6210\u4e00\u9879\u4efb\u52a1", | |
| "\u4f7f\u7528\u5de5\u5177\u548c\u8f6f\u4ef6\u63d0\u9ad8\u5de5\u4f5c\u81ea\u52a8\u5316\u7a0b\u5ea6", | |
| "\u5b9a\u671f\u4f11\u606f\uff0c\u907f\u514d\u957f\u65f6\u95f4\u8fde\u7eed\u5de5\u4f5c\u5bfc\u81f4\u75b2\u52b3", | |
| "\u4e0e\u540c\u4e8b\u6709\u6548\u6c9f\u901a\uff0c\u51cf\u5c11\u4e0d\u5fc5\u8981\u7684\u4f1a\u8bae\u548c\u5e72\u6270" | |
| ], | |
| "reward": [ | |
| 2, | |
| 5, | |
| -3, | |
| 0, | |
| 5 | |
| ] | |
| }, | |
| { | |
| "prompt": "13131313131313131313131313", | |
| "completion": [ | |
| "\u5c0a\u91cd\u4ed6\u4eba\uff0c\u503e\u542c\u4ed6\u4eba\u7684\u610f\u89c1\u548c\u60f3\u6cd5", | |
| "\u79ef\u6781\u6c9f\u901a\uff0c\u8868\u8fbe\u81ea\u5df1\u7684\u611f\u53d7\u548c\u9700\u6c42", | |
| "\u4e50\u4e8e\u52a9\u4eba\uff0c\u5173\u5fc3\u4ed6\u4eba\u7684\u56f0\u96be\u548c\u95ee\u9898", | |
| "\u4fdd\u6301\u8bda\u4fe1\uff0c\u9075\u5b88\u627f\u8bfa\u548c\u7ea6\u5b9a", | |
| "\u53c2\u4e0e\u793e\u4ea4\u6d3b\u52a8\uff0c\u6269\u5927\u81ea\u5df1\u7684\u793e\u4ea4\u5708\u5b50" | |
| ], | |
| "reward": [ | |
| -5, | |
| 2, | |
| -3, | |
| -1, | |
| 5 | |
| ] | |
| }, | |
| { | |
| "prompt": "1414141414141414141414141414", | |
| "completion": [ | |
| "\u8fdb\u884c\u653e\u677e\u8bad\u7ec3\uff0c\u5982\u6df1\u547c\u5438\u3001\u51a5\u60f3\u7b49", | |
| "\u9002\u5f53\u8fdb\u884c\u4f53\u80b2\u953b\u70bc\uff0c\u91ca\u653e\u538b\u529b", | |
| "\u4e0e\u670b\u53cb\u6216\u5bb6\u4eba\u4ea4\u6d41\uff0c\u5bfb\u6c42\u652f\u6301\u548c\u5e2e\u52a9", | |
| "\u5408\u7406\u5b89\u6392\u65f6\u95f4\uff0c\u907f\u514d\u8fc7\u5ea6\u5de5\u4f5c\u548c\u5b66\u4e60", | |
| "\u57f9\u517b\u5174\u8da3\u7231\u597d\uff0c\u8f6c\u79fb\u6ce8\u610f\u529b" | |
| ], | |
| "reward": [ | |
| 2, | |
| -3, | |
| -5, | |
| -2, | |
| -3 | |
| ] | |
| }, | |
| { | |
| "prompt": "151515151515151515151515151515", | |
| "completion": [ | |
| "\u5747\u8861\u996e\u98df\uff0c\u591a\u5403\u852c\u83dc\u6c34\u679c\uff0c\u5c11\u5403\u6cb9\u817b\u548c\u9ad8\u7cd6\u98df\u7269", | |
| "\u5b9a\u671f\u8fdb\u884c\u4f53\u80b2\u953b\u70bc\uff0c\u5982\u8dd1\u6b65\u3001\u6e38\u6cf3\u3001\u5065\u8eab\u7b49", | |
| "\u4fdd\u6301\u89c4\u5f8b\u7684\u4f5c\u606f\u65f6\u95f4\uff0c\u65e9\u7761\u65e9\u8d77", | |
| "\u4fdd\u6301\u826f\u597d\u7684\u5fc3\u6001\uff0c\u907f\u514d\u8fc7\u5ea6\u7126\u8651\u548c\u538b\u529b", | |
| "\u5b9a\u671f\u8fdb\u884c\u4f53\u68c0\uff0c\u53ca\u65f6\u53d1\u73b0\u548c\u9884\u9632\u75be\u75c5" | |
| ], | |
| "reward": [ | |
| 5, | |
| -1, | |
| -2, | |
| -3, | |
| 4 | |
| ] | |
| }, | |
| { | |
| "prompt": "16161616161616161616161616161616", | |
| "completion": [ | |
| "\u5408\u7406\u5b89\u6392\u5de5\u4f5c\u4efb\u52a1\uff0c\u5236\u5b9a\u4f18\u5148\u7ea7", | |
| "\u907f\u514d\u591a\u4efb\u52a1\u5904\u7406\uff0c\u4e13\u6ce8\u5b8c\u6210\u4e00\u9879\u4efb\u52a1", | |
| "\u4f7f\u7528\u5de5\u5177\u548c\u8f6f\u4ef6\u63d0\u9ad8\u5de5\u4f5c\u81ea\u52a8\u5316\u7a0b\u5ea6", | |
| "\u5b9a\u671f\u4f11\u606f\uff0c\u907f\u514d\u957f\u65f6\u95f4\u8fde\u7eed\u5de5\u4f5c\u5bfc\u81f4\u75b2\u52b3", | |
| "\u4e0e\u540c\u4e8b\u6709\u6548\u6c9f\u901a\uff0c\u51cf\u5c11\u4e0d\u5fc5\u8981\u7684\u4f1a\u8bae\u548c\u5e72\u6270" | |
| ], | |
| "reward": [ | |
| 4, | |
| 0, | |
| -1, | |
| -5, | |
| 1 | |
| ] | |
| }, | |
| { | |
| "prompt": "1717171717171717171717171717171717", | |
| "completion": [ | |
| "\u5c0a\u91cd\u4ed6\u4eba\uff0c\u503e\u542c\u4ed6\u4eba\u7684\u610f\u89c1\u548c\u60f3\u6cd5", | |
| "\u79ef\u6781\u6c9f\u901a\uff0c\u8868\u8fbe\u81ea\u5df1\u7684\u611f\u53d7\u548c\u9700\u6c42", | |
| "\u4e50\u4e8e\u52a9\u4eba\uff0c\u5173\u5fc3\u4ed6\u4eba\u7684\u56f0\u96be\u548c\u95ee\u9898", | |
| "\u4fdd\u6301\u8bda\u4fe1\uff0c\u9075\u5b88\u627f\u8bfa\u548c\u7ea6\u5b9a", | |
| "\u53c2\u4e0e\u793e\u4ea4\u6d3b\u52a8\uff0c\u6269\u5927\u81ea\u5df1\u7684\u793e\u4ea4\u5708\u5b50" | |
| ], | |
| "reward": [ | |
| 1, | |
| -5, | |
| -4, | |
| -3, | |
| 2 | |
| ] | |
| }, | |
| { | |
| "prompt": "181818181818181818181818181818181818", | |
| "completion": [ | |
| "\u8fdb\u884c\u653e\u677e\u8bad\u7ec3\uff0c\u5982\u6df1\u547c\u5438\u3001\u51a5\u60f3\u7b49", | |
| "\u9002\u5f53\u8fdb\u884c\u4f53\u80b2\u953b\u70bc\uff0c\u91ca\u653e\u538b\u529b", | |
| "\u4e0e\u670b\u53cb\u6216\u5bb6\u4eba\u4ea4\u6d41\uff0c\u5bfb\u6c42\u652f\u6301\u548c\u5e2e\u52a9", | |
| "\u5408\u7406\u5b89\u6392\u65f6\u95f4\uff0c\u907f\u514d\u8fc7\u5ea6\u5de5\u4f5c\u548c\u5b66\u4e60", | |
| "\u57f9\u517b\u5174\u8da3\u7231\u597d\uff0c\u8f6c\u79fb\u6ce8\u610f\u529b" | |
| ], | |
| "reward": [ | |
| -4, | |
| 5, | |
| -2, | |
| 5, | |
| -2 | |
| ] | |
| }, | |
| { | |
| "prompt": "19191919191919191919191919191919191919", | |
| "completion": [ | |
| "\u5747\u8861\u996e\u98df\uff0c\u591a\u5403\u852c\u83dc\u6c34\u679c\uff0c\u5c11\u5403\u6cb9\u817b\u548c\u9ad8\u7cd6\u98df\u7269", | |
| "\u5b9a\u671f\u8fdb\u884c\u4f53\u80b2\u953b\u70bc\uff0c\u5982\u8dd1\u6b65\u3001\u6e38\u6cf3\u3001\u5065\u8eab\u7b49", | |
| "\u4fdd\u6301\u89c4\u5f8b\u7684\u4f5c\u606f\u65f6\u95f4\uff0c\u65e9\u7761\u65e9\u8d77", | |
| "\u4fdd\u6301\u826f\u597d\u7684\u5fc3\u6001\uff0c\u907f\u514d\u8fc7\u5ea6\u7126\u8651\u548c\u538b\u529b", | |
| "\u5b9a\u671f\u8fdb\u884c\u4f53\u68c0\uff0c\u53ca\u65f6\u53d1\u73b0\u548c\u9884\u9632\u75be\u75c5" | |
| ], | |
| "reward": [ | |
| -2, | |
| 1, | |
| 0, | |
| -1, | |
| 0 | |
| ] | |
| }, | |
| { | |
| "prompt": "2020202020202020202020202020202020202020", | |
| "completion": [ | |
| "\u5408\u7406\u5b89\u6392\u5de5\u4f5c\u4efb\u52a1\uff0c\u5236\u5b9a\u4f18\u5148\u7ea7", | |
| "\u907f\u514d\u591a\u4efb\u52a1\u5904\u7406\uff0c\u4e13\u6ce8\u5b8c\u6210\u4e00\u9879\u4efb\u52a1", | |
| "\u4f7f\u7528\u5de5\u5177\u548c\u8f6f\u4ef6\u63d0\u9ad8\u5de5\u4f5c\u81ea\u52a8\u5316\u7a0b\u5ea6", | |
| "\u5b9a\u671f\u4f11\u606f\uff0c\u907f\u514d\u957f\u65f6\u95f4\u8fde\u7eed\u5de5\u4f5c\u5bfc\u81f4\u75b2\u52b3", | |
| "\u4e0e\u540c\u4e8b\u6709\u6548\u6c9f\u901a\uff0c\u51cf\u5c11\u4e0d\u5fc5\u8981\u7684\u4f1a\u8bae\u548c\u5e72\u6270" | |
| ], | |
| "reward": [ | |
| 4, | |
| 2, | |
| 4, | |
| -3, | |
| 1 | |
| ] | |
| }, | |
| { | |
| "prompt": "212121212121212121212121212121212121212121", | |
| "completion": [ | |
| "\u5c0a\u91cd\u4ed6\u4eba\uff0c\u503e\u542c\u4ed6\u4eba\u7684\u610f\u89c1\u548c\u60f3\u6cd5", | |
| "\u79ef\u6781\u6c9f\u901a\uff0c\u8868\u8fbe\u81ea\u5df1\u7684\u611f\u53d7\u548c\u9700\u6c42", | |
| "\u4e50\u4e8e\u52a9\u4eba\uff0c\u5173\u5fc3\u4ed6\u4eba\u7684\u56f0\u96be\u548c\u95ee\u9898", | |
| "\u4fdd\u6301\u8bda\u4fe1\uff0c\u9075\u5b88\u627f\u8bfa\u548c\u7ea6\u5b9a", | |
| "\u53c2\u4e0e\u793e\u4ea4\u6d3b\u52a8\uff0c\u6269\u5927\u81ea\u5df1\u7684\u793e\u4ea4\u5708\u5b50" | |
| ], | |
| "reward": [ | |
| 4, | |
| -5, | |
| 3, | |
| 2, | |
| 0 | |
| ] | |
| }, | |
| { | |
| "prompt": "22222222222222222222222222222222222222222222", | |
| "completion": [ | |
| "\u8fdb\u884c\u653e\u677e\u8bad\u7ec3\uff0c\u5982\u6df1\u547c\u5438\u3001\u51a5\u60f3\u7b49", | |
| "\u9002\u5f53\u8fdb\u884c\u4f53\u80b2\u953b\u70bc\uff0c\u91ca\u653e\u538b\u529b", | |
| "\u4e0e\u670b\u53cb\u6216\u5bb6\u4eba\u4ea4\u6d41\uff0c\u5bfb\u6c42\u652f\u6301\u548c\u5e2e\u52a9", | |
| "\u5408\u7406\u5b89\u6392\u65f6\u95f4\uff0c\u907f\u514d\u8fc7\u5ea6\u5de5\u4f5c\u548c\u5b66\u4e60", | |
| "\u57f9\u517b\u5174\u8da3\u7231\u597d\uff0c\u8f6c\u79fb\u6ce8\u610f\u529b" | |
| ], | |
| "reward": [ | |
| 4, | |
| 5, | |
| -4, | |
| -4, | |
| 0 | |
| ] | |
| }, | |
| { | |
| "prompt": "2323232323232323232323232323232323232323232323", | |
| "completion": [ | |
| "\u5747\u8861\u996e\u98df\uff0c\u591a\u5403\u852c\u83dc\u6c34\u679c\uff0c\u5c11\u5403\u6cb9\u817b\u548c\u9ad8\u7cd6\u98df\u7269", | |
| "\u5b9a\u671f\u8fdb\u884c\u4f53\u80b2\u953b\u70bc\uff0c\u5982\u8dd1\u6b65\u3001\u6e38\u6cf3\u3001\u5065\u8eab\u7b49", | |
| "\u4fdd\u6301\u89c4\u5f8b\u7684\u4f5c\u606f\u65f6\u95f4\uff0c\u65e9\u7761\u65e9\u8d77", | |
| "\u4fdd\u6301\u826f\u597d\u7684\u5fc3\u6001\uff0c\u907f\u514d\u8fc7\u5ea6\u7126\u8651\u548c\u538b\u529b", | |
| "\u5b9a\u671f\u8fdb\u884c\u4f53\u68c0\uff0c\u53ca\u65f6\u53d1\u73b0\u548c\u9884\u9632\u75be\u75c5" | |
| ], | |
| "reward": [ | |
| 4, | |
| 5, | |
| -5, | |
| 1, | |
| -4 | |
| ] | |
| }, | |
| { | |
| "prompt": "242424242424242424242424242424242424242424242424", | |
| "completion": [ | |
| "\u5408\u7406\u5b89\u6392\u5de5\u4f5c\u4efb\u52a1\uff0c\u5236\u5b9a\u4f18\u5148\u7ea7", | |
| "\u907f\u514d\u591a\u4efb\u52a1\u5904\u7406\uff0c\u4e13\u6ce8\u5b8c\u6210\u4e00\u9879\u4efb\u52a1", | |
| "\u4f7f\u7528\u5de5\u5177\u548c\u8f6f\u4ef6\u63d0\u9ad8\u5de5\u4f5c\u81ea\u52a8\u5316\u7a0b\u5ea6", | |
| "\u5b9a\u671f\u4f11\u606f\uff0c\u907f\u514d\u957f\u65f6\u95f4\u8fde\u7eed\u5de5\u4f5c\u5bfc\u81f4\u75b2\u52b3", | |
| "\u4e0e\u540c\u4e8b\u6709\u6548\u6c9f\u901a\uff0c\u51cf\u5c11\u4e0d\u5fc5\u8981\u7684\u4f1a\u8bae\u548c\u5e72\u6270" | |
| ], | |
| "reward": [ | |
| -3, | |
| -2, | |
| 5, | |
| 2, | |
| -5 | |
| ] | |
| }, | |
| { | |
| "prompt": "25252525252525252525252525252525252525252525252525", | |
| "completion": [ | |
| "\u5c0a\u91cd\u4ed6\u4eba\uff0c\u503e\u542c\u4ed6\u4eba\u7684\u610f\u89c1\u548c\u60f3\u6cd5", | |
| "\u79ef\u6781\u6c9f\u901a\uff0c\u8868\u8fbe\u81ea\u5df1\u7684\u611f\u53d7\u548c\u9700\u6c42", | |
| "\u4e50\u4e8e\u52a9\u4eba\uff0c\u5173\u5fc3\u4ed6\u4eba\u7684\u56f0\u96be\u548c\u95ee\u9898", | |
| "\u4fdd\u6301\u8bda\u4fe1\uff0c\u9075\u5b88\u627f\u8bfa\u548c\u7ea6\u5b9a", | |
| "\u53c2\u4e0e\u793e\u4ea4\u6d3b\u52a8\uff0c\u6269\u5927\u81ea\u5df1\u7684\u793e\u4ea4\u5708\u5b50" | |
| ], | |
| "reward": [ | |
| 5, | |
| 5, | |
| -2, | |
| -5, | |
| 1 | |
| ] | |
| }, | |
| { | |
| "prompt": "2626262626262626262626262626262626262626262626262626", | |
| "completion": [ | |
| "\u8fdb\u884c\u653e\u677e\u8bad\u7ec3\uff0c\u5982\u6df1\u547c\u5438\u3001\u51a5\u60f3\u7b49", | |
| "\u9002\u5f53\u8fdb\u884c\u4f53\u80b2\u953b\u70bc\uff0c\u91ca\u653e\u538b\u529b", | |
| "\u4e0e\u670b\u53cb\u6216\u5bb6\u4eba\u4ea4\u6d41\uff0c\u5bfb\u6c42\u652f\u6301\u548c\u5e2e\u52a9", | |
| "\u5408\u7406\u5b89\u6392\u65f6\u95f4\uff0c\u907f\u514d\u8fc7\u5ea6\u5de5\u4f5c\u548c\u5b66\u4e60", | |
| "\u57f9\u517b\u5174\u8da3\u7231\u597d\uff0c\u8f6c\u79fb\u6ce8\u610f\u529b" | |
| ], | |
| "reward": [ | |
| 5, | |
| -5, | |
| -5, | |
| -5, | |
| 4 | |
| ] | |
| }, | |
| { | |
| "prompt": "272727272727272727272727272727272727272727272727272727", | |
| "completion": [ | |
| "\u5747\u8861\u996e\u98df\uff0c\u591a\u5403\u852c\u83dc\u6c34\u679c\uff0c\u5c11\u5403\u6cb9\u817b\u548c\u9ad8\u7cd6\u98df\u7269", | |
| "\u5b9a\u671f\u8fdb\u884c\u4f53\u80b2\u953b\u70bc\uff0c\u5982\u8dd1\u6b65\u3001\u6e38\u6cf3\u3001\u5065\u8eab\u7b49", | |
| "\u4fdd\u6301\u89c4\u5f8b\u7684\u4f5c\u606f\u65f6\u95f4\uff0c\u65e9\u7761\u65e9\u8d77", | |
| "\u4fdd\u6301\u826f\u597d\u7684\u5fc3\u6001\uff0c\u907f\u514d\u8fc7\u5ea6\u7126\u8651\u548c\u538b\u529b", | |
| "\u5b9a\u671f\u8fdb\u884c\u4f53\u68c0\uff0c\u53ca\u65f6\u53d1\u73b0\u548c\u9884\u9632\u75be\u75c5" | |
| ], | |
| "reward": [ | |
| -4, | |
| 4, | |
| 5, | |
| -2, | |
| 2 | |
| ] | |
| }, | |
| { | |
| "prompt": "28282828282828282828282828282828282828282828282828282828", | |
| "completion": [ | |
| "\u5408\u7406\u5b89\u6392\u5de5\u4f5c\u4efb\u52a1\uff0c\u5236\u5b9a\u4f18\u5148\u7ea7", | |
| "\u907f\u514d\u591a\u4efb\u52a1\u5904\u7406\uff0c\u4e13\u6ce8\u5b8c\u6210\u4e00\u9879\u4efb\u52a1", | |
| "\u4f7f\u7528\u5de5\u5177\u548c\u8f6f\u4ef6\u63d0\u9ad8\u5de5\u4f5c\u81ea\u52a8\u5316\u7a0b\u5ea6", | |
| "\u5b9a\u671f\u4f11\u606f\uff0c\u907f\u514d\u957f\u65f6\u95f4\u8fde\u7eed\u5de5\u4f5c\u5bfc\u81f4\u75b2\u52b3", | |
| "\u4e0e\u540c\u4e8b\u6709\u6548\u6c9f\u901a\uff0c\u51cf\u5c11\u4e0d\u5fc5\u8981\u7684\u4f1a\u8bae\u548c\u5e72\u6270" | |
| ], | |
| "reward": [ | |
| -3, | |
| -3, | |
| -2, | |
| 5, | |
| 3 | |
| ] | |
| }, | |
| { | |
| "prompt": "2929292929292929292929292929292929292929292929292929292929", | |
| "completion": [ | |
| "\u5c0a\u91cd\u4ed6\u4eba\uff0c\u503e\u542c\u4ed6\u4eba\u7684\u610f\u89c1\u548c\u60f3\u6cd5", | |
| "\u79ef\u6781\u6c9f\u901a\uff0c\u8868\u8fbe\u81ea\u5df1\u7684\u611f\u53d7\u548c\u9700\u6c42", | |
| "\u4e50\u4e8e\u52a9\u4eba\uff0c\u5173\u5fc3\u4ed6\u4eba\u7684\u56f0\u96be\u548c\u95ee\u9898", | |
| "\u4fdd\u6301\u8bda\u4fe1\uff0c\u9075\u5b88\u627f\u8bfa\u548c\u7ea6\u5b9a", | |
| "\u53c2\u4e0e\u793e\u4ea4\u6d3b\u52a8\uff0c\u6269\u5927\u81ea\u5df1\u7684\u793e\u4ea4\u5708\u5b50" | |
| ], | |
| "reward": [ | |
| 4, | |
| 2, | |
| 3, | |
| 2, | |
| -2 | |
| ] | |
| }, | |
| { | |
| "prompt": "303030303030303030303030303030303030303030303030303030303030", | |
| "completion": [ | |
| "\u8fdb\u884c\u653e\u677e\u8bad\u7ec3\uff0c\u5982\u6df1\u547c\u5438\u3001\u51a5\u60f3\u7b49", | |
| "\u9002\u5f53\u8fdb\u884c\u4f53\u80b2\u953b\u70bc\uff0c\u91ca\u653e\u538b\u529b", | |
| "\u4e0e\u670b\u53cb\u6216\u5bb6\u4eba\u4ea4\u6d41\uff0c\u5bfb\u6c42\u652f\u6301\u548c\u5e2e\u52a9", | |
| "\u5408\u7406\u5b89\u6392\u65f6\u95f4\uff0c\u907f\u514d\u8fc7\u5ea6\u5de5\u4f5c\u548c\u5b66\u4e60", | |
| "\u57f9\u517b\u5174\u8da3\u7231\u597d\uff0c\u8f6c\u79fb\u6ce8\u610f\u529b" | |
| ], | |
| "reward": [ | |
| 4, | |
| -1, | |
| 0, | |
| 0, | |
| 0 | |
| ] | |
| }, | |
| { | |
| "prompt": "31313131313131313131313131313131313131313131313131313131313131", | |
| "completion": [ | |
| "\u5747\u8861\u996e\u98df\uff0c\u591a\u5403\u852c\u83dc\u6c34\u679c\uff0c\u5c11\u5403\u6cb9\u817b\u548c\u9ad8\u7cd6\u98df\u7269", | |
| "\u5b9a\u671f\u8fdb\u884c\u4f53\u80b2\u953b\u70bc\uff0c\u5982\u8dd1\u6b65\u3001\u6e38\u6cf3\u3001\u5065\u8eab\u7b49", | |
| "\u4fdd\u6301\u89c4\u5f8b\u7684\u4f5c\u606f\u65f6\u95f4\uff0c\u65e9\u7761\u65e9\u8d77", | |
| "\u4fdd\u6301\u826f\u597d\u7684\u5fc3\u6001\uff0c\u907f\u514d\u8fc7\u5ea6\u7126\u8651\u548c\u538b\u529b", | |
| "\u5b9a\u671f\u8fdb\u884c\u4f53\u68c0\uff0c\u53ca\u65f6\u53d1\u73b0\u548c\u9884\u9632\u75be\u75c5" | |
| ], | |
| "reward": [ | |
| -2, | |
| -4, | |
| 5, | |
| 2, | |
| 1 | |
| ] | |
| }, | |
| { | |
| "prompt": "3232323232323232323232323232323232323232323232323232323232323232", | |
| "completion": [ | |
| "\u5408\u7406\u5b89\u6392\u5de5\u4f5c\u4efb\u52a1\uff0c\u5236\u5b9a\u4f18\u5148\u7ea7", | |
| "\u907f\u514d\u591a\u4efb\u52a1\u5904\u7406\uff0c\u4e13\u6ce8\u5b8c\u6210\u4e00\u9879\u4efb\u52a1", | |
| "\u4f7f\u7528\u5de5\u5177\u548c\u8f6f\u4ef6\u63d0\u9ad8\u5de5\u4f5c\u81ea\u52a8\u5316\u7a0b\u5ea6", | |
| "\u5b9a\u671f\u4f11\u606f\uff0c\u907f\u514d\u957f\u65f6\u95f4\u8fde\u7eed\u5de5\u4f5c\u5bfc\u81f4\u75b2\u52b3", | |
| "\u4e0e\u540c\u4e8b\u6709\u6548\u6c9f\u901a\uff0c\u51cf\u5c11\u4e0d\u5fc5\u8981\u7684\u4f1a\u8bae\u548c\u5e72\u6270" | |
| ], | |
| "reward": [ | |
| 0, | |
| -5, | |
| -4, | |
| -3, | |
| 0 | |
| ] | |
| }, | |
| { | |
| "prompt": "333333333333333333333333333333333333333333333333333333333333333333", | |
| "completion": [ | |
| "\u5c0a\u91cd\u4ed6\u4eba\uff0c\u503e\u542c\u4ed6\u4eba\u7684\u610f\u89c1\u548c\u60f3\u6cd5", | |
| "\u79ef\u6781\u6c9f\u901a\uff0c\u8868\u8fbe\u81ea\u5df1\u7684\u611f\u53d7\u548c\u9700\u6c42", | |
| "\u4e50\u4e8e\u52a9\u4eba\uff0c\u5173\u5fc3\u4ed6\u4eba\u7684\u56f0\u96be\u548c\u95ee\u9898", | |
| "\u4fdd\u6301\u8bda\u4fe1\uff0c\u9075\u5b88\u627f\u8bfa\u548c\u7ea6\u5b9a", | |
| "\u53c2\u4e0e\u793e\u4ea4\u6d3b\u52a8\uff0c\u6269\u5927\u81ea\u5df1\u7684\u793e\u4ea4\u5708\u5b50" | |
| ], | |
| "reward": [ | |
| -4, | |
| -4, | |
| -3, | |
| -4, | |
| 2 | |
| ] | |
| }, | |
| { | |
| "prompt": "34343434343434343434343434343434343434343434343434343434343434343434", | |
| "completion": [ | |
| "\u8fdb\u884c\u653e\u677e\u8bad\u7ec3\uff0c\u5982\u6df1\u547c\u5438\u3001\u51a5\u60f3\u7b49", | |
| "\u9002\u5f53\u8fdb\u884c\u4f53\u80b2\u953b\u70bc\uff0c\u91ca\u653e\u538b\u529b", | |
| "\u4e0e\u670b\u53cb\u6216\u5bb6\u4eba\u4ea4\u6d41\uff0c\u5bfb\u6c42\u652f\u6301\u548c\u5e2e\u52a9", | |
| "\u5408\u7406\u5b89\u6392\u65f6\u95f4\uff0c\u907f\u514d\u8fc7\u5ea6\u5de5\u4f5c\u548c\u5b66\u4e60", | |
| "\u57f9\u517b\u5174\u8da3\u7231\u597d\uff0c\u8f6c\u79fb\u6ce8\u610f\u529b" | |
| ], | |
| "reward": [ | |
| 3, | |
| -4, | |
| 2, | |
| 1, | |
| -4 | |
| ] | |
| }, | |
| { | |
| "prompt": "3535353535353535353535353535353535353535353535353535353535353535353535", | |
| "completion": [ | |
| "\u5747\u8861\u996e\u98df\uff0c\u591a\u5403\u852c\u83dc\u6c34\u679c\uff0c\u5c11\u5403\u6cb9\u817b\u548c\u9ad8\u7cd6\u98df\u7269", | |
| "\u5b9a\u671f\u8fdb\u884c\u4f53\u80b2\u953b\u70bc\uff0c\u5982\u8dd1\u6b65\u3001\u6e38\u6cf3\u3001\u5065\u8eab\u7b49", | |
| "\u4fdd\u6301\u89c4\u5f8b\u7684\u4f5c\u606f\u65f6\u95f4\uff0c\u65e9\u7761\u65e9\u8d77", | |
| "\u4fdd\u6301\u826f\u597d\u7684\u5fc3\u6001\uff0c\u907f\u514d\u8fc7\u5ea6\u7126\u8651\u548c\u538b\u529b", | |
| "\u5b9a\u671f\u8fdb\u884c\u4f53\u68c0\uff0c\u53ca\u65f6\u53d1\u73b0\u548c\u9884\u9632\u75be\u75c5" | |
| ], | |
| "reward": [ | |
| -5, | |
| 1, | |
| -2, | |
| -5, | |
| 0 | |
| ] | |
| }, | |
| { | |
| "prompt": "363636363636363636363636363636363636363636363636363636363636363636363636", | |
| "completion": [ | |
| "\u5408\u7406\u5b89\u6392\u5de5\u4f5c\u4efb\u52a1\uff0c\u5236\u5b9a\u4f18\u5148\u7ea7", | |
| "\u907f\u514d\u591a\u4efb\u52a1\u5904\u7406\uff0c\u4e13\u6ce8\u5b8c\u6210\u4e00\u9879\u4efb\u52a1", | |
| "\u4f7f\u7528\u5de5\u5177\u548c\u8f6f\u4ef6\u63d0\u9ad8\u5de5\u4f5c\u81ea\u52a8\u5316\u7a0b\u5ea6", | |
| "\u5b9a\u671f\u4f11\u606f\uff0c\u907f\u514d\u957f\u65f6\u95f4\u8fde\u7eed\u5de5\u4f5c\u5bfc\u81f4\u75b2\u52b3", | |
| "\u4e0e\u540c\u4e8b\u6709\u6548\u6c9f\u901a\uff0c\u51cf\u5c11\u4e0d\u5fc5\u8981\u7684\u4f1a\u8bae\u548c\u5e72\u6270" | |
| ], | |
| "reward": [ | |
| -1, | |
| -1, | |
| 5, | |
| 5, | |
| -3 | |
| ] | |
| }, | |
| { | |
| "prompt": "37373737373737373737373737373737373737373737373737373737373737373737373737", | |
| "completion": [ | |
| "\u5c0a\u91cd\u4ed6\u4eba\uff0c\u503e\u542c\u4ed6\u4eba\u7684\u610f\u89c1\u548c\u60f3\u6cd5", | |
| "\u79ef\u6781\u6c9f\u901a\uff0c\u8868\u8fbe\u81ea\u5df1\u7684\u611f\u53d7\u548c\u9700\u6c42", | |
| "\u4e50\u4e8e\u52a9\u4eba\uff0c\u5173\u5fc3\u4ed6\u4eba\u7684\u56f0\u96be\u548c\u95ee\u9898", | |
| "\u4fdd\u6301\u8bda\u4fe1\uff0c\u9075\u5b88\u627f\u8bfa\u548c\u7ea6\u5b9a", | |
| "\u53c2\u4e0e\u793e\u4ea4\u6d3b\u52a8\uff0c\u6269\u5927\u81ea\u5df1\u7684\u793e\u4ea4\u5708\u5b50" | |
| ], | |
| "reward": [ | |
| -4, | |
| -2, | |
| 1, | |
| 1, | |
| -1 | |
| ] | |
| }, | |
| { | |
| "prompt": "3838383838383838383838383838383838383838383838383838383838383838383838383838", | |
| "completion": [ | |
| "\u8fdb\u884c\u653e\u677e\u8bad\u7ec3\uff0c\u5982\u6df1\u547c\u5438\u3001\u51a5\u60f3\u7b49", | |
| "\u9002\u5f53\u8fdb\u884c\u4f53\u80b2\u953b\u70bc\uff0c\u91ca\u653e\u538b\u529b", | |
| "\u4e0e\u670b\u53cb\u6216\u5bb6\u4eba\u4ea4\u6d41\uff0c\u5bfb\u6c42\u652f\u6301\u548c\u5e2e\u52a9", | |
| "\u5408\u7406\u5b89\u6392\u65f6\u95f4\uff0c\u907f\u514d\u8fc7\u5ea6\u5de5\u4f5c\u548c\u5b66\u4e60", | |
| "\u57f9\u517b\u5174\u8da3\u7231\u597d\uff0c\u8f6c\u79fb\u6ce8\u610f\u529b" | |
| ], | |
| "reward": [ | |
| 0, | |
| 1, | |
| -5, | |
| 5, | |
| -4 | |
| ] | |
| }, | |
| { | |
| "prompt": "393939393939393939393939393939393939393939393939393939393939393939393939393939", | |
| "completion": [ | |
| "\u5747\u8861\u996e\u98df\uff0c\u591a\u5403\u852c\u83dc\u6c34\u679c\uff0c\u5c11\u5403\u6cb9\u817b\u548c\u9ad8\u7cd6\u98df\u7269", | |
| "\u5b9a\u671f\u8fdb\u884c\u4f53\u80b2\u953b\u70bc\uff0c\u5982\u8dd1\u6b65\u3001\u6e38\u6cf3\u3001\u5065\u8eab\u7b49", | |
| "\u4fdd\u6301\u89c4\u5f8b\u7684\u4f5c\u606f\u65f6\u95f4\uff0c\u65e9\u7761\u65e9\u8d77", | |
| "\u4fdd\u6301\u826f\u597d\u7684\u5fc3\u6001\uff0c\u907f\u514d\u8fc7\u5ea6\u7126\u8651\u548c\u538b\u529b", | |
| "\u5b9a\u671f\u8fdb\u884c\u4f53\u68c0\uff0c\u53ca\u65f6\u53d1\u73b0\u548c\u9884\u9632\u75be\u75c5" | |
| ], | |
| "reward": [ | |
| 2, | |
| -4, | |
| 2, | |
| 2, | |
| -2 | |
| ] | |
| }, | |
| { | |
| "prompt": "40404040404040404040404040404040404040404040404040404040404040404040404040404040", | |
| "completion": [ | |
| "\u5408\u7406\u5b89\u6392\u5de5\u4f5c\u4efb\u52a1\uff0c\u5236\u5b9a\u4f18\u5148\u7ea7", | |
| "\u907f\u514d\u591a\u4efb\u52a1\u5904\u7406\uff0c\u4e13\u6ce8\u5b8c\u6210\u4e00\u9879\u4efb\u52a1", | |
| "\u4f7f\u7528\u5de5\u5177\u548c\u8f6f\u4ef6\u63d0\u9ad8\u5de5\u4f5c\u81ea\u52a8\u5316\u7a0b\u5ea6", | |
| "\u5b9a\u671f\u4f11\u606f\uff0c\u907f\u514d\u957f\u65f6\u95f4\u8fde\u7eed\u5de5\u4f5c\u5bfc\u81f4\u75b2\u52b3", | |
| "\u4e0e\u540c\u4e8b\u6709\u6548\u6c9f\u901a\uff0c\u51cf\u5c11\u4e0d\u5fc5\u8981\u7684\u4f1a\u8bae\u548c\u5e72\u6270" | |
| ], | |
| "reward": [ | |
| 1, | |
| -1, | |
| -3, | |
| 0, | |
| 3 | |
| ] | |
| }, | |
| { | |
| "prompt": "4141414141414141414141414141414141414141414141414141414141414141414141414141414141", | |
| "completion": [ | |
| "\u5c0a\u91cd\u4ed6\u4eba\uff0c\u503e\u542c\u4ed6\u4eba\u7684\u610f\u89c1\u548c\u60f3\u6cd5", | |
| "\u79ef\u6781\u6c9f\u901a\uff0c\u8868\u8fbe\u81ea\u5df1\u7684\u611f\u53d7\u548c\u9700\u6c42", | |
| "\u4e50\u4e8e\u52a9\u4eba\uff0c\u5173\u5fc3\u4ed6\u4eba\u7684\u56f0\u96be\u548c\u95ee\u9898", | |
| "\u4fdd\u6301\u8bda\u4fe1\uff0c\u9075\u5b88\u627f\u8bfa\u548c\u7ea6\u5b9a", | |
| "\u53c2\u4e0e\u793e\u4ea4\u6d3b\u52a8\uff0c\u6269\u5927\u81ea\u5df1\u7684\u793e\u4ea4\u5708\u5b50" | |
| ], | |
| "reward": [ | |
| -2, | |
| -3, | |
| 4, | |
| -1, | |
| 0 | |
| ] | |
| }, | |
| { | |
| "prompt": "424242424242424242424242424242424242424242424242424242424242424242424242424242424242", | |
| "completion": [ | |
| "\u8fdb\u884c\u653e\u677e\u8bad\u7ec3\uff0c\u5982\u6df1\u547c\u5438\u3001\u51a5\u60f3\u7b49", | |
| "\u9002\u5f53\u8fdb\u884c\u4f53\u80b2\u953b\u70bc\uff0c\u91ca\u653e\u538b\u529b", | |
| "\u4e0e\u670b\u53cb\u6216\u5bb6\u4eba\u4ea4\u6d41\uff0c\u5bfb\u6c42\u652f\u6301\u548c\u5e2e\u52a9", | |
| "\u5408\u7406\u5b89\u6392\u65f6\u95f4\uff0c\u907f\u514d\u8fc7\u5ea6\u5de5\u4f5c\u548c\u5b66\u4e60", | |
| "\u57f9\u517b\u5174\u8da3\u7231\u597d\uff0c\u8f6c\u79fb\u6ce8\u610f\u529b" | |
| ], | |
| "reward": [ | |
| 1, | |
| -3, | |
| 5, | |
| 4, | |
| -5 | |
| ] | |
| }, | |
| { | |
| "prompt": "43434343434343434343434343434343434343434343434343434343434343434343434343434343434343", | |
| "completion": [ | |
| "\u5747\u8861\u996e\u98df\uff0c\u591a\u5403\u852c\u83dc\u6c34\u679c\uff0c\u5c11\u5403\u6cb9\u817b\u548c\u9ad8\u7cd6\u98df\u7269", | |
| "\u5b9a\u671f\u8fdb\u884c\u4f53\u80b2\u953b\u70bc\uff0c\u5982\u8dd1\u6b65\u3001\u6e38\u6cf3\u3001\u5065\u8eab\u7b49", | |
| "\u4fdd\u6301\u89c4\u5f8b\u7684\u4f5c\u606f\u65f6\u95f4\uff0c\u65e9\u7761\u65e9\u8d77", | |
| "\u4fdd\u6301\u826f\u597d\u7684\u5fc3\u6001\uff0c\u907f\u514d\u8fc7\u5ea6\u7126\u8651\u548c\u538b\u529b", | |
| "\u5b9a\u671f\u8fdb\u884c\u4f53\u68c0\uff0c\u53ca\u65f6\u53d1\u73b0\u548c\u9884\u9632\u75be\u75c5" | |
| ], | |
| "reward": [ | |
| 0, | |
| -2, | |
| -1, | |
| 1, | |
| 4 | |
| ] | |
| }, | |
| { | |
| "prompt": "4444444444444444444444444444444444444444444444444444444444444444444444444444444444444444", | |
| "completion": [ | |
| "\u5408\u7406\u5b89\u6392\u5de5\u4f5c\u4efb\u52a1\uff0c\u5236\u5b9a\u4f18\u5148\u7ea7", | |
| "\u907f\u514d\u591a\u4efb\u52a1\u5904\u7406\uff0c\u4e13\u6ce8\u5b8c\u6210\u4e00\u9879\u4efb\u52a1", | |
| "\u4f7f\u7528\u5de5\u5177\u548c\u8f6f\u4ef6\u63d0\u9ad8\u5de5\u4f5c\u81ea\u52a8\u5316\u7a0b\u5ea6", | |
| "\u5b9a\u671f\u4f11\u606f\uff0c\u907f\u514d\u957f\u65f6\u95f4\u8fde\u7eed\u5de5\u4f5c\u5bfc\u81f4\u75b2\u52b3", | |
| "\u4e0e\u540c\u4e8b\u6709\u6548\u6c9f\u901a\uff0c\u51cf\u5c11\u4e0d\u5fc5\u8981\u7684\u4f1a\u8bae\u548c\u5e72\u6270" | |
| ], | |
| "reward": [ | |
| -5, | |
| 1, | |
| 1, | |
| -1, | |
| -2 | |
| ] | |
| }, | |
| { | |
| "prompt": "454545454545454545454545454545454545454545454545454545454545454545454545454545454545454545", | |
| "completion": [ | |
| "\u5c0a\u91cd\u4ed6\u4eba\uff0c\u503e\u542c\u4ed6\u4eba\u7684\u610f\u89c1\u548c\u60f3\u6cd5", | |
| "\u79ef\u6781\u6c9f\u901a\uff0c\u8868\u8fbe\u81ea\u5df1\u7684\u611f\u53d7\u548c\u9700\u6c42", | |
| "\u4e50\u4e8e\u52a9\u4eba\uff0c\u5173\u5fc3\u4ed6\u4eba\u7684\u56f0\u96be\u548c\u95ee\u9898", | |
| "\u4fdd\u6301\u8bda\u4fe1\uff0c\u9075\u5b88\u627f\u8bfa\u548c\u7ea6\u5b9a", | |
| "\u53c2\u4e0e\u793e\u4ea4\u6d3b\u52a8\uff0c\u6269\u5927\u81ea\u5df1\u7684\u793e\u4ea4\u5708\u5b50" | |
| ], | |
| "reward": [ | |
| -4, | |
| -1, | |
| 3, | |
| 1, | |
| -5 | |
| ] | |
| }, | |
| { | |
| "prompt": "46464646464646464646464646464646464646464646464646464646464646464646464646464646464646464646", | |
| "completion": [ | |
| "\u8fdb\u884c\u653e\u677e\u8bad\u7ec3\uff0c\u5982\u6df1\u547c\u5438\u3001\u51a5\u60f3\u7b49", | |
| "\u9002\u5f53\u8fdb\u884c\u4f53\u80b2\u953b\u70bc\uff0c\u91ca\u653e\u538b\u529b", | |
| "\u4e0e\u670b\u53cb\u6216\u5bb6\u4eba\u4ea4\u6d41\uff0c\u5bfb\u6c42\u652f\u6301\u548c\u5e2e\u52a9", | |
| "\u5408\u7406\u5b89\u6392\u65f6\u95f4\uff0c\u907f\u514d\u8fc7\u5ea6\u5de5\u4f5c\u548c\u5b66\u4e60", | |
| "\u57f9\u517b\u5174\u8da3\u7231\u597d\uff0c\u8f6c\u79fb\u6ce8\u610f\u529b" | |
| ], | |
| "reward": [ | |
| -3, | |
| -2, | |
| -4, | |
| 0, | |
| -3 | |
| ] | |
| }, | |
| { | |
| "prompt": "4747474747474747474747474747474747474747474747474747474747474747474747474747474747474747474747", | |
| "completion": [ | |
| "\u5747\u8861\u996e\u98df\uff0c\u591a\u5403\u852c\u83dc\u6c34\u679c\uff0c\u5c11\u5403\u6cb9\u817b\u548c\u9ad8\u7cd6\u98df\u7269", | |
| "\u5b9a\u671f\u8fdb\u884c\u4f53\u80b2\u953b\u70bc\uff0c\u5982\u8dd1\u6b65\u3001\u6e38\u6cf3\u3001\u5065\u8eab\u7b49", | |
| "\u4fdd\u6301\u89c4\u5f8b\u7684\u4f5c\u606f\u65f6\u95f4\uff0c\u65e9\u7761\u65e9\u8d77", | |
| "\u4fdd\u6301\u826f\u597d\u7684\u5fc3\u6001\uff0c\u907f\u514d\u8fc7\u5ea6\u7126\u8651\u548c\u538b\u529b", | |
| "\u5b9a\u671f\u8fdb\u884c\u4f53\u68c0\uff0c\u53ca\u65f6\u53d1\u73b0\u548c\u9884\u9632\u75be\u75c5" | |
| ], | |
| "reward": [ | |
| 1, | |
| 4, | |
| -1, | |
| -2, | |
| -5 | |
| ] | |
| }, | |
| { | |
| "prompt": "484848484848484848484848484848484848484848484848484848484848484848484848484848484848484848484848", | |
| "completion": [ | |
| "\u5408\u7406\u5b89\u6392\u5de5\u4f5c\u4efb\u52a1\uff0c\u5236\u5b9a\u4f18\u5148\u7ea7", | |
| "\u907f\u514d\u591a\u4efb\u52a1\u5904\u7406\uff0c\u4e13\u6ce8\u5b8c\u6210\u4e00\u9879\u4efb\u52a1", | |
| "\u4f7f\u7528\u5de5\u5177\u548c\u8f6f\u4ef6\u63d0\u9ad8\u5de5\u4f5c\u81ea\u52a8\u5316\u7a0b\u5ea6", | |
| "\u5b9a\u671f\u4f11\u606f\uff0c\u907f\u514d\u957f\u65f6\u95f4\u8fde\u7eed\u5de5\u4f5c\u5bfc\u81f4\u75b2\u52b3", | |
| "\u4e0e\u540c\u4e8b\u6709\u6548\u6c9f\u901a\uff0c\u51cf\u5c11\u4e0d\u5fc5\u8981\u7684\u4f1a\u8bae\u548c\u5e72\u6270" | |
| ], | |
| "reward": [ | |
| 4, | |
| 2, | |
| -1, | |
| -5, | |
| 3 | |
| ] | |
| }, | |
| { | |
| "prompt": "49494949494949494949494949494949494949494949494949494949494949494949494949494949494949494949494949", | |
| "completion": [ | |
| "\u5c0a\u91cd\u4ed6\u4eba\uff0c\u503e\u542c\u4ed6\u4eba\u7684\u610f\u89c1\u548c\u60f3\u6cd5", | |
| "\u79ef\u6781\u6c9f\u901a\uff0c\u8868\u8fbe\u81ea\u5df1\u7684\u611f\u53d7\u548c\u9700\u6c42", | |
| "\u4e50\u4e8e\u52a9\u4eba\uff0c\u5173\u5fc3\u4ed6\u4eba\u7684\u56f0\u96be\u548c\u95ee\u9898", | |
| "\u4fdd\u6301\u8bda\u4fe1\uff0c\u9075\u5b88\u627f\u8bfa\u548c\u7ea6\u5b9a", | |
| "\u53c2\u4e0e\u793e\u4ea4\u6d3b\u52a8\uff0c\u6269\u5927\u81ea\u5df1\u7684\u793e\u4ea4\u5708\u5b50" | |
| ], | |
| "reward": [ | |
| 3, | |
| 3, | |
| -5, | |
| 1, | |
| -2 | |
| ] | |
| }, | |
| { | |
| "prompt": "5050505050505050505050505050505050505050505050505050505050505050505050505050505050505050505050505050", | |
| "completion": [ | |
| "\u8fdb\u884c\u653e\u677e\u8bad\u7ec3\uff0c\u5982\u6df1\u547c\u5438\u3001\u51a5\u60f3\u7b49", | |
| "\u9002\u5f53\u8fdb\u884c\u4f53\u80b2\u953b\u70bc\uff0c\u91ca\u653e\u538b\u529b", | |
| "\u4e0e\u670b\u53cb\u6216\u5bb6\u4eba\u4ea4\u6d41\uff0c\u5bfb\u6c42\u652f\u6301\u548c\u5e2e\u52a9", | |
| "\u5408\u7406\u5b89\u6392\u65f6\u95f4\uff0c\u907f\u514d\u8fc7\u5ea6\u5de5\u4f5c\u548c\u5b66\u4e60", | |
| "\u57f9\u517b\u5174\u8da3\u7231\u597d\uff0c\u8f6c\u79fb\u6ce8\u610f\u529b" | |
| ], | |
| "reward": [ | |
| -1, | |
| 4, | |
| 1, | |
| -5, | |
| -5 | |
| ] | |
| }, | |
| { | |
| "prompt": "515151515151515151515151515151515151515151515151515151515151515151515151515151515151515151515151515151", | |
| "completion": [ | |
| "\u5747\u8861\u996e\u98df\uff0c\u591a\u5403\u852c\u83dc\u6c34\u679c\uff0c\u5c11\u5403\u6cb9\u817b\u548c\u9ad8\u7cd6\u98df\u7269", | |
| "\u5b9a\u671f\u8fdb\u884c\u4f53\u80b2\u953b\u70bc\uff0c\u5982\u8dd1\u6b65\u3001\u6e38\u6cf3\u3001\u5065\u8eab\u7b49", | |
| "\u4fdd\u6301\u89c4\u5f8b\u7684\u4f5c\u606f\u65f6\u95f4\uff0c\u65e9\u7761\u65e9\u8d77", | |
| "\u4fdd\u6301\u826f\u597d\u7684\u5fc3\u6001\uff0c\u907f\u514d\u8fc7\u5ea6\u7126\u8651\u548c\u538b\u529b", | |
| "\u5b9a\u671f\u8fdb\u884c\u4f53\u68c0\uff0c\u53ca\u65f6\u53d1\u73b0\u548c\u9884\u9632\u75be\u75c5" | |
| ], | |
| "reward": [ | |
| 5, | |
| 3, | |
| 5, | |
| 2, | |
| -2 | |
| ] | |
| }, | |
| { | |
| "prompt": "52525252525252525252525252525252525252525252525252525252525252525252525252525252525252525252525252525252", | |
| "completion": [ | |
| "\u5408\u7406\u5b89\u6392\u5de5\u4f5c\u4efb\u52a1\uff0c\u5236\u5b9a\u4f18\u5148\u7ea7", | |
| "\u907f\u514d\u591a\u4efb\u52a1\u5904\u7406\uff0c\u4e13\u6ce8\u5b8c\u6210\u4e00\u9879\u4efb\u52a1", | |
| "\u4f7f\u7528\u5de5\u5177\u548c\u8f6f\u4ef6\u63d0\u9ad8\u5de5\u4f5c\u81ea\u52a8\u5316\u7a0b\u5ea6", | |
| "\u5b9a\u671f\u4f11\u606f\uff0c\u907f\u514d\u957f\u65f6\u95f4\u8fde\u7eed\u5de5\u4f5c\u5bfc\u81f4\u75b2\u52b3", | |
| "\u4e0e\u540c\u4e8b\u6709\u6548\u6c9f\u901a\uff0c\u51cf\u5c11\u4e0d\u5fc5\u8981\u7684\u4f1a\u8bae\u548c\u5e72\u6270" | |
| ], | |
| "reward": [ | |
| 2, | |
| -5, | |
| -5, | |
| -1, | |
| 1 | |
| ] | |
| }, | |
| { | |
| "prompt": "5353535353535353535353535353535353535353535353535353535353535353535353535353535353535353535353535353535353", | |
| "completion": [ | |
| "\u5c0a\u91cd\u4ed6\u4eba\uff0c\u503e\u542c\u4ed6\u4eba\u7684\u610f\u89c1\u548c\u60f3\u6cd5", | |
| "\u79ef\u6781\u6c9f\u901a\uff0c\u8868\u8fbe\u81ea\u5df1\u7684\u611f\u53d7\u548c\u9700\u6c42", | |
| "\u4e50\u4e8e\u52a9\u4eba\uff0c\u5173\u5fc3\u4ed6\u4eba\u7684\u56f0\u96be\u548c\u95ee\u9898", | |
| "\u4fdd\u6301\u8bda\u4fe1\uff0c\u9075\u5b88\u627f\u8bfa\u548c\u7ea6\u5b9a", | |
| "\u53c2\u4e0e\u793e\u4ea4\u6d3b\u52a8\uff0c\u6269\u5927\u81ea\u5df1\u7684\u793e\u4ea4\u5708\u5b50" | |
| ], | |
| "reward": [ | |
| 1, | |
| -3, | |
| 3, | |
| 0, | |
| 3 | |
| ] | |
| }, | |
| { | |
| "prompt": "545454545454545454545454545454545454545454545454545454545454545454545454545454545454545454545454545454545454", | |
| "completion": [ | |
| "\u8fdb\u884c\u653e\u677e\u8bad\u7ec3\uff0c\u5982\u6df1\u547c\u5438\u3001\u51a5\u60f3\u7b49", | |
| "\u9002\u5f53\u8fdb\u884c\u4f53\u80b2\u953b\u70bc\uff0c\u91ca\u653e\u538b\u529b", | |
| "\u4e0e\u670b\u53cb\u6216\u5bb6\u4eba\u4ea4\u6d41\uff0c\u5bfb\u6c42\u652f\u6301\u548c\u5e2e\u52a9", | |
| "\u5408\u7406\u5b89\u6392\u65f6\u95f4\uff0c\u907f\u514d\u8fc7\u5ea6\u5de5\u4f5c\u548c\u5b66\u4e60", | |
| "\u57f9\u517b\u5174\u8da3\u7231\u597d\uff0c\u8f6c\u79fb\u6ce8\u610f\u529b" | |
| ], | |
| "reward": [ | |
| 0, | |
| -4, | |
| -4, | |
| -4, | |
| 1 | |
| ] | |
| }, | |
| { | |
| "prompt": "55555555555555555555555555555555555555555555555555555555555555555555555555555555555555555555555555555555555555", | |
| "completion": [ | |
| "\u5747\u8861\u996e\u98df\uff0c\u591a\u5403\u852c\u83dc\u6c34\u679c\uff0c\u5c11\u5403\u6cb9\u817b\u548c\u9ad8\u7cd6\u98df\u7269", | |
| "\u5b9a\u671f\u8fdb\u884c\u4f53\u80b2\u953b\u70bc\uff0c\u5982\u8dd1\u6b65\u3001\u6e38\u6cf3\u3001\u5065\u8eab\u7b49", | |
| "\u4fdd\u6301\u89c4\u5f8b\u7684\u4f5c\u606f\u65f6\u95f4\uff0c\u65e9\u7761\u65e9\u8d77", | |
| "\u4fdd\u6301\u826f\u597d\u7684\u5fc3\u6001\uff0c\u907f\u514d\u8fc7\u5ea6\u7126\u8651\u548c\u538b\u529b", | |
| "\u5b9a\u671f\u8fdb\u884c\u4f53\u68c0\uff0c\u53ca\u65f6\u53d1\u73b0\u548c\u9884\u9632\u75be\u75c5" | |
| ], | |
| "reward": [ | |
| 0, | |
| 3, | |
| 3, | |
| 2, | |
| -5 | |
| ] | |
| }, | |
| { | |
| "prompt": "5656565656565656565656565656565656565656565656565656565656565656565656565656565656565656565656565656565656565656", | |
| "completion": [ | |
| "\u5408\u7406\u5b89\u6392\u5de5\u4f5c\u4efb\u52a1\uff0c\u5236\u5b9a\u4f18\u5148\u7ea7", | |
| "\u907f\u514d\u591a\u4efb\u52a1\u5904\u7406\uff0c\u4e13\u6ce8\u5b8c\u6210\u4e00\u9879\u4efb\u52a1", | |
| "\u4f7f\u7528\u5de5\u5177\u548c\u8f6f\u4ef6\u63d0\u9ad8\u5de5\u4f5c\u81ea\u52a8\u5316\u7a0b\u5ea6", | |
| "\u5b9a\u671f\u4f11\u606f\uff0c\u907f\u514d\u957f\u65f6\u95f4\u8fde\u7eed\u5de5\u4f5c\u5bfc\u81f4\u75b2\u52b3", | |
| "\u4e0e\u540c\u4e8b\u6709\u6548\u6c9f\u901a\uff0c\u51cf\u5c11\u4e0d\u5fc5\u8981\u7684\u4f1a\u8bae\u548c\u5e72\u6270" | |
| ], | |
| "reward": [ | |
| -3, | |
| -5, | |
| -3, | |
| -3, | |
| 3 | |
| ] | |
| }, | |
| { | |
| "prompt": "575757575757575757575757575757575757575757575757575757575757575757575757575757575757575757575757575757575757575757", | |
| "completion": [ | |
| "\u5c0a\u91cd\u4ed6\u4eba\uff0c\u503e\u542c\u4ed6\u4eba\u7684\u610f\u89c1\u548c\u60f3\u6cd5", | |
| "\u79ef\u6781\u6c9f\u901a\uff0c\u8868\u8fbe\u81ea\u5df1\u7684\u611f\u53d7\u548c\u9700\u6c42", | |
| "\u4e50\u4e8e\u52a9\u4eba\uff0c\u5173\u5fc3\u4ed6\u4eba\u7684\u56f0\u96be\u548c\u95ee\u9898", | |
| "\u4fdd\u6301\u8bda\u4fe1\uff0c\u9075\u5b88\u627f\u8bfa\u548c\u7ea6\u5b9a", | |
| "\u53c2\u4e0e\u793e\u4ea4\u6d3b\u52a8\uff0c\u6269\u5927\u81ea\u5df1\u7684\u793e\u4ea4\u5708\u5b50" | |
| ], | |
| "reward": [ | |
| 1, | |
| -4, | |
| 5, | |
| 5, | |
| 4 | |
| ] | |
| }, | |
| { | |
| "prompt": "58585858585858585858585858585858585858585858585858585858585858585858585858585858585858585858585858585858585858585858", | |
| "completion": [ | |
| "\u8fdb\u884c\u653e\u677e\u8bad\u7ec3\uff0c\u5982\u6df1\u547c\u5438\u3001\u51a5\u60f3\u7b49", | |
| "\u9002\u5f53\u8fdb\u884c\u4f53\u80b2\u953b\u70bc\uff0c\u91ca\u653e\u538b\u529b", | |
| "\u4e0e\u670b\u53cb\u6216\u5bb6\u4eba\u4ea4\u6d41\uff0c\u5bfb\u6c42\u652f\u6301\u548c\u5e2e\u52a9", | |
| "\u5408\u7406\u5b89\u6392\u65f6\u95f4\uff0c\u907f\u514d\u8fc7\u5ea6\u5de5\u4f5c\u548c\u5b66\u4e60", | |
| "\u57f9\u517b\u5174\u8da3\u7231\u597d\uff0c\u8f6c\u79fb\u6ce8\u610f\u529b" | |
| ], | |
| "reward": [ | |
| -1, | |
| -2, | |
| -1, | |
| -1, | |
| -4 | |
| ] | |
| }, | |
| { | |
| "prompt": "5959595959595959595959595959595959595959595959595959595959595959595959595959595959595959595959595959595959595959595959", | |
| "completion": [ | |
| "\u5747\u8861\u996e\u98df\uff0c\u591a\u5403\u852c\u83dc\u6c34\u679c\uff0c\u5c11\u5403\u6cb9\u817b\u548c\u9ad8\u7cd6\u98df\u7269", | |
| "\u5b9a\u671f\u8fdb\u884c\u4f53\u80b2\u953b\u70bc\uff0c\u5982\u8dd1\u6b65\u3001\u6e38\u6cf3\u3001\u5065\u8eab\u7b49", | |
| "\u4fdd\u6301\u89c4\u5f8b\u7684\u4f5c\u606f\u65f6\u95f4\uff0c\u65e9\u7761\u65e9\u8d77", | |
| "\u4fdd\u6301\u826f\u597d\u7684\u5fc3\u6001\uff0c\u907f\u514d\u8fc7\u5ea6\u7126\u8651\u548c\u538b\u529b", | |
| "\u5b9a\u671f\u8fdb\u884c\u4f53\u68c0\uff0c\u53ca\u65f6\u53d1\u73b0\u548c\u9884\u9632\u75be\u75c5" | |
| ], | |
| "reward": [ | |
| 1, | |
| 4, | |
| 2, | |
| -5, | |
| -4 | |
| ] | |
| }, | |
| { | |
| "prompt": "606060606060606060606060606060606060606060606060606060606060606060606060606060606060606060606060606060606060606060606060", | |
| "completion": [ | |
| "\u5408\u7406\u5b89\u6392\u5de5\u4f5c\u4efb\u52a1\uff0c\u5236\u5b9a\u4f18\u5148\u7ea7", | |
| "\u907f\u514d\u591a\u4efb\u52a1\u5904\u7406\uff0c\u4e13\u6ce8\u5b8c\u6210\u4e00\u9879\u4efb\u52a1", | |
| "\u4f7f\u7528\u5de5\u5177\u548c\u8f6f\u4ef6\u63d0\u9ad8\u5de5\u4f5c\u81ea\u52a8\u5316\u7a0b\u5ea6", | |
| "\u5b9a\u671f\u4f11\u606f\uff0c\u907f\u514d\u957f\u65f6\u95f4\u8fde\u7eed\u5de5\u4f5c\u5bfc\u81f4\u75b2\u52b3", | |
| "\u4e0e\u540c\u4e8b\u6709\u6548\u6c9f\u901a\uff0c\u51cf\u5c11\u4e0d\u5fc5\u8981\u7684\u4f1a\u8bae\u548c\u5e72\u6270" | |
| ], | |
| "reward": [ | |
| -1, | |
| 3, | |
| -3, | |
| -5, | |
| 2 | |
| ] | |
| }, | |
| { | |
| "prompt": "61616161616161616161616161616161616161616161616161616161616161616161616161616161616161616161616161616161616161616161616161", | |
| "completion": [ | |
| "\u5c0a\u91cd\u4ed6\u4eba\uff0c\u503e\u542c\u4ed6\u4eba\u7684\u610f\u89c1\u548c\u60f3\u6cd5", | |
| "\u79ef\u6781\u6c9f\u901a\uff0c\u8868\u8fbe\u81ea\u5df1\u7684\u611f\u53d7\u548c\u9700\u6c42", | |
| "\u4e50\u4e8e\u52a9\u4eba\uff0c\u5173\u5fc3\u4ed6\u4eba\u7684\u56f0\u96be\u548c\u95ee\u9898", | |
| "\u4fdd\u6301\u8bda\u4fe1\uff0c\u9075\u5b88\u627f\u8bfa\u548c\u7ea6\u5b9a", | |
| "\u53c2\u4e0e\u793e\u4ea4\u6d3b\u52a8\uff0c\u6269\u5927\u81ea\u5df1\u7684\u793e\u4ea4\u5708\u5b50" | |
| ], | |
| "reward": [ | |
| 2, | |
| 2, | |
| 4, | |
| -4, | |
| 1 | |
| ] | |
| }, | |
| { | |
| "prompt": "6262626262626262626262626262626262626262626262626262626262626262626262626262626262626262626262626262626262626262626262626262", | |
| "completion": [ | |
| "\u8fdb\u884c\u653e\u677e\u8bad\u7ec3\uff0c\u5982\u6df1\u547c\u5438\u3001\u51a5\u60f3\u7b49", | |
| "\u9002\u5f53\u8fdb\u884c\u4f53\u80b2\u953b\u70bc\uff0c\u91ca\u653e\u538b\u529b", | |
| "\u4e0e\u670b\u53cb\u6216\u5bb6\u4eba\u4ea4\u6d41\uff0c\u5bfb\u6c42\u652f\u6301\u548c\u5e2e\u52a9", | |
| "\u5408\u7406\u5b89\u6392\u65f6\u95f4\uff0c\u907f\u514d\u8fc7\u5ea6\u5de5\u4f5c\u548c\u5b66\u4e60", | |
| "\u57f9\u517b\u5174\u8da3\u7231\u597d\uff0c\u8f6c\u79fb\u6ce8\u610f\u529b" | |
| ], | |
| "reward": [ | |
| -1, | |
| -3, | |
| -2, | |
| -1, | |
| 3 | |
| ] | |
| }, | |
| { | |
| "prompt": "636363636363636363636363636363636363636363636363636363636363636363636363636363636363636363636363636363636363636363636363636363", | |
| "completion": [ | |
| "\u5747\u8861\u996e\u98df\uff0c\u591a\u5403\u852c\u83dc\u6c34\u679c\uff0c\u5c11\u5403\u6cb9\u817b\u548c\u9ad8\u7cd6\u98df\u7269", | |
| "\u5b9a\u671f\u8fdb\u884c\u4f53\u80b2\u953b\u70bc\uff0c\u5982\u8dd1\u6b65\u3001\u6e38\u6cf3\u3001\u5065\u8eab\u7b49", | |
| "\u4fdd\u6301\u89c4\u5f8b\u7684\u4f5c\u606f\u65f6\u95f4\uff0c\u65e9\u7761\u65e9\u8d77", | |
| "\u4fdd\u6301\u826f\u597d\u7684\u5fc3\u6001\uff0c\u907f\u514d\u8fc7\u5ea6\u7126\u8651\u548c\u538b\u529b", | |
| "\u5b9a\u671f\u8fdb\u884c\u4f53\u68c0\uff0c\u53ca\u65f6\u53d1\u73b0\u548c\u9884\u9632\u75be\u75c5" | |
| ], | |
| "reward": [ | |
| -2, | |
| 1, | |
| -3, | |
| 1, | |
| -1 | |
| ] | |
| }, | |
| { | |
| "prompt": "64646464646464646464646464646464646464646464646464646464646464646464646464646464646464646464646464646464646464646464646464646464", | |
| "completion": [ | |
| "\u5408\u7406\u5b89\u6392\u5de5\u4f5c\u4efb\u52a1\uff0c\u5236\u5b9a\u4f18\u5148\u7ea7", | |
| "\u907f\u514d\u591a\u4efb\u52a1\u5904\u7406\uff0c\u4e13\u6ce8\u5b8c\u6210\u4e00\u9879\u4efb\u52a1", | |
| "\u4f7f\u7528\u5de5\u5177\u548c\u8f6f\u4ef6\u63d0\u9ad8\u5de5\u4f5c\u81ea\u52a8\u5316\u7a0b\u5ea6", | |
| "\u5b9a\u671f\u4f11\u606f\uff0c\u907f\u514d\u957f\u65f6\u95f4\u8fde\u7eed\u5de5\u4f5c\u5bfc\u81f4\u75b2\u52b3", | |
| "\u4e0e\u540c\u4e8b\u6709\u6548\u6c9f\u901a\uff0c\u51cf\u5c11\u4e0d\u5fc5\u8981\u7684\u4f1a\u8bae\u548c\u5e72\u6270" | |
| ], | |
| "reward": [ | |
| 2, | |
| -4, | |
| 4, | |
| -3, | |
| 2 | |
| ] | |
| }, | |
| { | |
| "prompt": "6565656565656565656565656565656565656565656565656565656565656565656565656565656565656565656565656565656565656565656565656565656565", | |
| "completion": [ | |
| "\u5c0a\u91cd\u4ed6\u4eba\uff0c\u503e\u542c\u4ed6\u4eba\u7684\u610f\u89c1\u548c\u60f3\u6cd5", | |
| "\u79ef\u6781\u6c9f\u901a\uff0c\u8868\u8fbe\u81ea\u5df1\u7684\u611f\u53d7\u548c\u9700\u6c42", | |
| "\u4e50\u4e8e\u52a9\u4eba\uff0c\u5173\u5fc3\u4ed6\u4eba\u7684\u56f0\u96be\u548c\u95ee\u9898", | |
| "\u4fdd\u6301\u8bda\u4fe1\uff0c\u9075\u5b88\u627f\u8bfa\u548c\u7ea6\u5b9a", | |
| "\u53c2\u4e0e\u793e\u4ea4\u6d3b\u52a8\uff0c\u6269\u5927\u81ea\u5df1\u7684\u793e\u4ea4\u5708\u5b50" | |
| ], | |
| "reward": [ | |
| -2, | |
| 2, | |
| -4, | |
| -5, | |
| -2 | |
| ] | |
| }, | |
| { | |
| "prompt": "666666666666666666666666666666666666666666666666666666666666666666666666666666666666666666666666666666666666666666666666666666666666", | |
| "completion": [ | |
| "\u8fdb\u884c\u653e\u677e\u8bad\u7ec3\uff0c\u5982\u6df1\u547c\u5438\u3001\u51a5\u60f3\u7b49", | |
| "\u9002\u5f53\u8fdb\u884c\u4f53\u80b2\u953b\u70bc\uff0c\u91ca\u653e\u538b\u529b", | |
| "\u4e0e\u670b\u53cb\u6216\u5bb6\u4eba\u4ea4\u6d41\uff0c\u5bfb\u6c42\u652f\u6301\u548c\u5e2e\u52a9", | |
| "\u5408\u7406\u5b89\u6392\u65f6\u95f4\uff0c\u907f\u514d\u8fc7\u5ea6\u5de5\u4f5c\u548c\u5b66\u4e60", | |
| "\u57f9\u517b\u5174\u8da3\u7231\u597d\uff0c\u8f6c\u79fb\u6ce8\u610f\u529b" | |
| ], | |
| "reward": [ | |
| 5, | |
| 0, | |
| -5, | |
| 1, | |
| -4 | |
| ] | |
| }, | |
| { | |
| "prompt": "67676767676767676767676767676767676767676767676767676767676767676767676767676767676767676767676767676767676767676767676767676767676767", | |
| "completion": [ | |
| "\u5747\u8861\u996e\u98df\uff0c\u591a\u5403\u852c\u83dc\u6c34\u679c\uff0c\u5c11\u5403\u6cb9\u817b\u548c\u9ad8\u7cd6\u98df\u7269", | |
| "\u5b9a\u671f\u8fdb\u884c\u4f53\u80b2\u953b\u70bc\uff0c\u5982\u8dd1\u6b65\u3001\u6e38\u6cf3\u3001\u5065\u8eab\u7b49", | |
| "\u4fdd\u6301\u89c4\u5f8b\u7684\u4f5c\u606f\u65f6\u95f4\uff0c\u65e9\u7761\u65e9\u8d77", | |
| "\u4fdd\u6301\u826f\u597d\u7684\u5fc3\u6001\uff0c\u907f\u514d\u8fc7\u5ea6\u7126\u8651\u548c\u538b\u529b", | |
| "\u5b9a\u671f\u8fdb\u884c\u4f53\u68c0\uff0c\u53ca\u65f6\u53d1\u73b0\u548c\u9884\u9632\u75be\u75c5" | |
| ], | |
| "reward": [ | |
| 2, | |
| 4, | |
| 2, | |
| -3, | |
| 4 | |
| ] | |
| }, | |
| { | |
| "prompt": "6868686868686868686868686868686868686868686868686868686868686868686868686868686868686868686868686868686868686868686868686868686868686868", | |
| "completion": [ | |
| "\u5408\u7406\u5b89\u6392\u5de5\u4f5c\u4efb\u52a1\uff0c\u5236\u5b9a\u4f18\u5148\u7ea7", | |
| "\u907f\u514d\u591a\u4efb\u52a1\u5904\u7406\uff0c\u4e13\u6ce8\u5b8c\u6210\u4e00\u9879\u4efb\u52a1", | |
| "\u4f7f\u7528\u5de5\u5177\u548c\u8f6f\u4ef6\u63d0\u9ad8\u5de5\u4f5c\u81ea\u52a8\u5316\u7a0b\u5ea6", | |
| "\u5b9a\u671f\u4f11\u606f\uff0c\u907f\u514d\u957f\u65f6\u95f4\u8fde\u7eed\u5de5\u4f5c\u5bfc\u81f4\u75b2\u52b3", | |
| "\u4e0e\u540c\u4e8b\u6709\u6548\u6c9f\u901a\uff0c\u51cf\u5c11\u4e0d\u5fc5\u8981\u7684\u4f1a\u8bae\u548c\u5e72\u6270" | |
| ], | |
| "reward": [ | |
| -2, | |
| -2, | |
| 4, | |
| 0, | |
| -3 | |
| ] | |
| }, | |
| { | |
| "prompt": "696969696969696969696969696969696969696969696969696969696969696969696969696969696969696969696969696969696969696969696969696969696969696969", | |
| "completion": [ | |
| "\u5c0a\u91cd\u4ed6\u4eba\uff0c\u503e\u542c\u4ed6\u4eba\u7684\u610f\u89c1\u548c\u60f3\u6cd5", | |
| "\u79ef\u6781\u6c9f\u901a\uff0c\u8868\u8fbe\u81ea\u5df1\u7684\u611f\u53d7\u548c\u9700\u6c42", | |
| "\u4e50\u4e8e\u52a9\u4eba\uff0c\u5173\u5fc3\u4ed6\u4eba\u7684\u56f0\u96be\u548c\u95ee\u9898", | |
| "\u4fdd\u6301\u8bda\u4fe1\uff0c\u9075\u5b88\u627f\u8bfa\u548c\u7ea6\u5b9a", | |
| "\u53c2\u4e0e\u793e\u4ea4\u6d3b\u52a8\uff0c\u6269\u5927\u81ea\u5df1\u7684\u793e\u4ea4\u5708\u5b50" | |
| ], | |
| "reward": [ | |
| 2, | |
| -2, | |
| 5, | |
| 0, | |
| 0 | |
| ] | |
| }, | |
| { | |
| "prompt": "70707070707070707070707070707070707070707070707070707070707070707070707070707070707070707070707070707070707070707070707070707070707070707070", | |
| "completion": [ | |
| "\u8fdb\u884c\u653e\u677e\u8bad\u7ec3\uff0c\u5982\u6df1\u547c\u5438\u3001\u51a5\u60f3\u7b49", | |
| "\u9002\u5f53\u8fdb\u884c\u4f53\u80b2\u953b\u70bc\uff0c\u91ca\u653e\u538b\u529b", | |
| "\u4e0e\u670b\u53cb\u6216\u5bb6\u4eba\u4ea4\u6d41\uff0c\u5bfb\u6c42\u652f\u6301\u548c\u5e2e\u52a9", | |
| "\u5408\u7406\u5b89\u6392\u65f6\u95f4\uff0c\u907f\u514d\u8fc7\u5ea6\u5de5\u4f5c\u548c\u5b66\u4e60", | |
| "\u57f9\u517b\u5174\u8da3\u7231\u597d\uff0c\u8f6c\u79fb\u6ce8\u610f\u529b" | |
| ], | |
| "reward": [ | |
| -3, | |
| 0, | |
| 1, | |
| 3, | |
| 1 | |
| ] | |
| }, | |
| { | |
| "prompt": "7171717171717171717171717171717171717171717171717171717171717171717171717171717171717171717171717171717171717171717171717171717171717171717171", | |
| "completion": [ | |
| "\u5747\u8861\u996e\u98df\uff0c\u591a\u5403\u852c\u83dc\u6c34\u679c\uff0c\u5c11\u5403\u6cb9\u817b\u548c\u9ad8\u7cd6\u98df\u7269", | |
| "\u5b9a\u671f\u8fdb\u884c\u4f53\u80b2\u953b\u70bc\uff0c\u5982\u8dd1\u6b65\u3001\u6e38\u6cf3\u3001\u5065\u8eab\u7b49", | |
| "\u4fdd\u6301\u89c4\u5f8b\u7684\u4f5c\u606f\u65f6\u95f4\uff0c\u65e9\u7761\u65e9\u8d77", | |
| "\u4fdd\u6301\u826f\u597d\u7684\u5fc3\u6001\uff0c\u907f\u514d\u8fc7\u5ea6\u7126\u8651\u548c\u538b\u529b", | |
| "\u5b9a\u671f\u8fdb\u884c\u4f53\u68c0\uff0c\u53ca\u65f6\u53d1\u73b0\u548c\u9884\u9632\u75be\u75c5" | |
| ], | |
| "reward": [ | |
| -5, | |
| 1, | |
| -2, | |
| -5, | |
| -3 | |
| ] | |
| }, | |
| { | |
| "prompt": "727272727272727272727272727272727272727272727272727272727272727272727272727272727272727272727272727272727272727272727272727272727272727272727272", | |
| "completion": [ | |
| "\u5408\u7406\u5b89\u6392\u5de5\u4f5c\u4efb\u52a1\uff0c\u5236\u5b9a\u4f18\u5148\u7ea7", | |
| "\u907f\u514d\u591a\u4efb\u52a1\u5904\u7406\uff0c\u4e13\u6ce8\u5b8c\u6210\u4e00\u9879\u4efb\u52a1", | |
| "\u4f7f\u7528\u5de5\u5177\u548c\u8f6f\u4ef6\u63d0\u9ad8\u5de5\u4f5c\u81ea\u52a8\u5316\u7a0b\u5ea6", | |
| "\u5b9a\u671f\u4f11\u606f\uff0c\u907f\u514d\u957f\u65f6\u95f4\u8fde\u7eed\u5de5\u4f5c\u5bfc\u81f4\u75b2\u52b3", | |
| "\u4e0e\u540c\u4e8b\u6709\u6548\u6c9f\u901a\uff0c\u51cf\u5c11\u4e0d\u5fc5\u8981\u7684\u4f1a\u8bae\u548c\u5e72\u6270" | |
| ], | |
| "reward": [ | |
| 3, | |
| 1, | |
| 0, | |
| 4, | |
| -2 | |
| ] | |
| }, | |
| { | |
| "prompt": "73737373737373737373737373737373737373737373737373737373737373737373737373737373737373737373737373737373737373737373737373737373737373737373737373", | |
| "completion": [ | |
| "\u5c0a\u91cd\u4ed6\u4eba\uff0c\u503e\u542c\u4ed6\u4eba\u7684\u610f\u89c1\u548c\u60f3\u6cd5", | |
| "\u79ef\u6781\u6c9f\u901a\uff0c\u8868\u8fbe\u81ea\u5df1\u7684\u611f\u53d7\u548c\u9700\u6c42", | |
| "\u4e50\u4e8e\u52a9\u4eba\uff0c\u5173\u5fc3\u4ed6\u4eba\u7684\u56f0\u96be\u548c\u95ee\u9898", | |
| "\u4fdd\u6301\u8bda\u4fe1\uff0c\u9075\u5b88\u627f\u8bfa\u548c\u7ea6\u5b9a", | |
| "\u53c2\u4e0e\u793e\u4ea4\u6d3b\u52a8\uff0c\u6269\u5927\u81ea\u5df1\u7684\u793e\u4ea4\u5708\u5b50" | |
| ], | |
| "reward": [ | |
| -3, | |
| 5, | |
| 4, | |
| 2, | |
| -4 | |
| ] | |
| }, | |
| { | |
| "prompt": "7474747474747474747474747474747474747474747474747474747474747474747474747474747474747474747474747474747474747474747474747474747474747474747474747474", | |
| "completion": [ | |
| "\u8fdb\u884c\u653e\u677e\u8bad\u7ec3\uff0c\u5982\u6df1\u547c\u5438\u3001\u51a5\u60f3\u7b49", | |
| "\u9002\u5f53\u8fdb\u884c\u4f53\u80b2\u953b\u70bc\uff0c\u91ca\u653e\u538b\u529b", | |
| "\u4e0e\u670b\u53cb\u6216\u5bb6\u4eba\u4ea4\u6d41\uff0c\u5bfb\u6c42\u652f\u6301\u548c\u5e2e\u52a9", | |
| "\u5408\u7406\u5b89\u6392\u65f6\u95f4\uff0c\u907f\u514d\u8fc7\u5ea6\u5de5\u4f5c\u548c\u5b66\u4e60", | |
| "\u57f9\u517b\u5174\u8da3\u7231\u597d\uff0c\u8f6c\u79fb\u6ce8\u610f\u529b" | |
| ], | |
| "reward": [ | |
| 0, | |
| -1, | |
| -3, | |
| 5, | |
| 0 | |
| ] | |
| }, | |
| { | |
| "prompt": "757575757575757575757575757575757575757575757575757575757575757575757575757575757575757575757575757575757575757575757575757575757575757575757575757575", | |
| "completion": [ | |
| "\u5747\u8861\u996e\u98df\uff0c\u591a\u5403\u852c\u83dc\u6c34\u679c\uff0c\u5c11\u5403\u6cb9\u817b\u548c\u9ad8\u7cd6\u98df\u7269", | |
| "\u5b9a\u671f\u8fdb\u884c\u4f53\u80b2\u953b\u70bc\uff0c\u5982\u8dd1\u6b65\u3001\u6e38\u6cf3\u3001\u5065\u8eab\u7b49", | |
| "\u4fdd\u6301\u89c4\u5f8b\u7684\u4f5c\u606f\u65f6\u95f4\uff0c\u65e9\u7761\u65e9\u8d77", | |
| "\u4fdd\u6301\u826f\u597d\u7684\u5fc3\u6001\uff0c\u907f\u514d\u8fc7\u5ea6\u7126\u8651\u548c\u538b\u529b", | |
| "\u5b9a\u671f\u8fdb\u884c\u4f53\u68c0\uff0c\u53ca\u65f6\u53d1\u73b0\u548c\u9884\u9632\u75be\u75c5" | |
| ], | |
| "reward": [ | |
| -5, | |
| -2, | |
| -3, | |
| -1, | |
| 5 | |
| ] | |
| }, | |
| { | |
| "prompt": "76767676767676767676767676767676767676767676767676767676767676767676767676767676767676767676767676767676767676767676767676767676767676767676767676767676", | |
| "completion": [ | |
| "\u5408\u7406\u5b89\u6392\u5de5\u4f5c\u4efb\u52a1\uff0c\u5236\u5b9a\u4f18\u5148\u7ea7", | |
| "\u907f\u514d\u591a\u4efb\u52a1\u5904\u7406\uff0c\u4e13\u6ce8\u5b8c\u6210\u4e00\u9879\u4efb\u52a1", | |
| "\u4f7f\u7528\u5de5\u5177\u548c\u8f6f\u4ef6\u63d0\u9ad8\u5de5\u4f5c\u81ea\u52a8\u5316\u7a0b\u5ea6", | |
| "\u5b9a\u671f\u4f11\u606f\uff0c\u907f\u514d\u957f\u65f6\u95f4\u8fde\u7eed\u5de5\u4f5c\u5bfc\u81f4\u75b2\u52b3", | |
| "\u4e0e\u540c\u4e8b\u6709\u6548\u6c9f\u901a\uff0c\u51cf\u5c11\u4e0d\u5fc5\u8981\u7684\u4f1a\u8bae\u548c\u5e72\u6270" | |
| ], | |
| "reward": [ | |
| 4, | |
| 2, | |
| -5, | |
| -1, | |
| -5 | |
| ] | |
| }, | |
| { | |
| "prompt": "7777777777777777777777777777777777777777777777777777777777777777777777777777777777777777777777777777777777777777777777777777777777777777777777777777777777", | |
| "completion": [ | |
| "\u5c0a\u91cd\u4ed6\u4eba\uff0c\u503e\u542c\u4ed6\u4eba\u7684\u610f\u89c1\u548c\u60f3\u6cd5", | |
| "\u79ef\u6781\u6c9f\u901a\uff0c\u8868\u8fbe\u81ea\u5df1\u7684\u611f\u53d7\u548c\u9700\u6c42", | |
| "\u4e50\u4e8e\u52a9\u4eba\uff0c\u5173\u5fc3\u4ed6\u4eba\u7684\u56f0\u96be\u548c\u95ee\u9898", | |
| "\u4fdd\u6301\u8bda\u4fe1\uff0c\u9075\u5b88\u627f\u8bfa\u548c\u7ea6\u5b9a", | |
| "\u53c2\u4e0e\u793e\u4ea4\u6d3b\u52a8\uff0c\u6269\u5927\u81ea\u5df1\u7684\u793e\u4ea4\u5708\u5b50" | |
| ], | |
| "reward": [ | |
| -3, | |
| -5, | |
| 5, | |
| -5, | |
| -3 | |
| ] | |
| }, | |
| { | |
| "prompt": "787878787878787878787878787878787878787878787878787878787878787878787878787878787878787878787878787878787878787878787878787878787878787878787878787878787878", | |
| "completion": [ | |
| "\u8fdb\u884c\u653e\u677e\u8bad\u7ec3\uff0c\u5982\u6df1\u547c\u5438\u3001\u51a5\u60f3\u7b49", | |
| "\u9002\u5f53\u8fdb\u884c\u4f53\u80b2\u953b\u70bc\uff0c\u91ca\u653e\u538b\u529b", | |
| "\u4e0e\u670b\u53cb\u6216\u5bb6\u4eba\u4ea4\u6d41\uff0c\u5bfb\u6c42\u652f\u6301\u548c\u5e2e\u52a9", | |
| "\u5408\u7406\u5b89\u6392\u65f6\u95f4\uff0c\u907f\u514d\u8fc7\u5ea6\u5de5\u4f5c\u548c\u5b66\u4e60", | |
| "\u57f9\u517b\u5174\u8da3\u7231\u597d\uff0c\u8f6c\u79fb\u6ce8\u610f\u529b" | |
| ], | |
| "reward": [ | |
| 1, | |
| 3, | |
| 0, | |
| -5, | |
| -3 | |
| ] | |
| }, | |
| { | |
| "prompt": "79797979797979797979797979797979797979797979797979797979797979797979797979797979797979797979797979797979797979797979797979797979797979797979797979797979797979", | |
| "completion": [ | |
| "\u5747\u8861\u996e\u98df\uff0c\u591a\u5403\u852c\u83dc\u6c34\u679c\uff0c\u5c11\u5403\u6cb9\u817b\u548c\u9ad8\u7cd6\u98df\u7269", | |
| "\u5b9a\u671f\u8fdb\u884c\u4f53\u80b2\u953b\u70bc\uff0c\u5982\u8dd1\u6b65\u3001\u6e38\u6cf3\u3001\u5065\u8eab\u7b49", | |
| "\u4fdd\u6301\u89c4\u5f8b\u7684\u4f5c\u606f\u65f6\u95f4\uff0c\u65e9\u7761\u65e9\u8d77", | |
| "\u4fdd\u6301\u826f\u597d\u7684\u5fc3\u6001\uff0c\u907f\u514d\u8fc7\u5ea6\u7126\u8651\u548c\u538b\u529b", | |
| "\u5b9a\u671f\u8fdb\u884c\u4f53\u68c0\uff0c\u53ca\u65f6\u53d1\u73b0\u548c\u9884\u9632\u75be\u75c5" | |
| ], | |
| "reward": [ | |
| -2, | |
| -3, | |
| -3, | |
| -1, | |
| -1 | |
| ] | |
| }, | |
| { | |
| "prompt": "8080808080808080808080808080808080808080808080808080808080808080808080808080808080808080808080808080808080808080808080808080808080808080808080808080808080808080", | |
| "completion": [ | |
| "\u5408\u7406\u5b89\u6392\u5de5\u4f5c\u4efb\u52a1\uff0c\u5236\u5b9a\u4f18\u5148\u7ea7", | |
| "\u907f\u514d\u591a\u4efb\u52a1\u5904\u7406\uff0c\u4e13\u6ce8\u5b8c\u6210\u4e00\u9879\u4efb\u52a1", | |
| "\u4f7f\u7528\u5de5\u5177\u548c\u8f6f\u4ef6\u63d0\u9ad8\u5de5\u4f5c\u81ea\u52a8\u5316\u7a0b\u5ea6", | |
| "\u5b9a\u671f\u4f11\u606f\uff0c\u907f\u514d\u957f\u65f6\u95f4\u8fde\u7eed\u5de5\u4f5c\u5bfc\u81f4\u75b2\u52b3", | |
| "\u4e0e\u540c\u4e8b\u6709\u6548\u6c9f\u901a\uff0c\u51cf\u5c11\u4e0d\u5fc5\u8981\u7684\u4f1a\u8bae\u548c\u5e72\u6270" | |
| ], | |
| "reward": [ | |
| -5, | |
| -5, | |
| 5, | |
| 0, | |
| 2 | |
| ] | |
| }, | |
| { | |
| "prompt": "818181818181818181818181818181818181818181818181818181818181818181818181818181818181818181818181818181818181818181818181818181818181818181818181818181818181818181", | |
| "completion": [ | |
| "\u5c0a\u91cd\u4ed6\u4eba\uff0c\u503e\u542c\u4ed6\u4eba\u7684\u610f\u89c1\u548c\u60f3\u6cd5", | |
| "\u79ef\u6781\u6c9f\u901a\uff0c\u8868\u8fbe\u81ea\u5df1\u7684\u611f\u53d7\u548c\u9700\u6c42", | |
| "\u4e50\u4e8e\u52a9\u4eba\uff0c\u5173\u5fc3\u4ed6\u4eba\u7684\u56f0\u96be\u548c\u95ee\u9898", | |
| "\u4fdd\u6301\u8bda\u4fe1\uff0c\u9075\u5b88\u627f\u8bfa\u548c\u7ea6\u5b9a", | |
| "\u53c2\u4e0e\u793e\u4ea4\u6d3b\u52a8\uff0c\u6269\u5927\u81ea\u5df1\u7684\u793e\u4ea4\u5708\u5b50" | |
| ], | |
| "reward": [ | |
| -5, | |
| -4, | |
| 0, | |
| 4, | |
| -5 | |
| ] | |
| }, | |
| { | |
| "prompt": "82828282828282828282828282828282828282828282828282828282828282828282828282828282828282828282828282828282828282828282828282828282828282828282828282828282828282828282", | |
| "completion": [ | |
| "\u8fdb\u884c\u653e\u677e\u8bad\u7ec3\uff0c\u5982\u6df1\u547c\u5438\u3001\u51a5\u60f3\u7b49", | |
| "\u9002\u5f53\u8fdb\u884c\u4f53\u80b2\u953b\u70bc\uff0c\u91ca\u653e\u538b\u529b", | |
| "\u4e0e\u670b\u53cb\u6216\u5bb6\u4eba\u4ea4\u6d41\uff0c\u5bfb\u6c42\u652f\u6301\u548c\u5e2e\u52a9", | |
| "\u5408\u7406\u5b89\u6392\u65f6\u95f4\uff0c\u907f\u514d\u8fc7\u5ea6\u5de5\u4f5c\u548c\u5b66\u4e60", | |
| "\u57f9\u517b\u5174\u8da3\u7231\u597d\uff0c\u8f6c\u79fb\u6ce8\u610f\u529b" | |
| ], | |
| "reward": [ | |
| 1, | |
| -5, | |
| 4, | |
| 1, | |
| 4 | |
| ] | |
| }, | |
| { | |
| "prompt": "8383838383838383838383838383838383838383838383838383838383838383838383838383838383838383838383838383838383838383838383838383838383838383838383838383838383838383838383", | |
| "completion": [ | |
| "\u5747\u8861\u996e\u98df\uff0c\u591a\u5403\u852c\u83dc\u6c34\u679c\uff0c\u5c11\u5403\u6cb9\u817b\u548c\u9ad8\u7cd6\u98df\u7269", | |
| "\u5b9a\u671f\u8fdb\u884c\u4f53\u80b2\u953b\u70bc\uff0c\u5982\u8dd1\u6b65\u3001\u6e38\u6cf3\u3001\u5065\u8eab\u7b49", | |
| "\u4fdd\u6301\u89c4\u5f8b\u7684\u4f5c\u606f\u65f6\u95f4\uff0c\u65e9\u7761\u65e9\u8d77", | |
| "\u4fdd\u6301\u826f\u597d\u7684\u5fc3\u6001\uff0c\u907f\u514d\u8fc7\u5ea6\u7126\u8651\u548c\u538b\u529b", | |
| "\u5b9a\u671f\u8fdb\u884c\u4f53\u68c0\uff0c\u53ca\u65f6\u53d1\u73b0\u548c\u9884\u9632\u75be\u75c5" | |
| ], | |
| "reward": [ | |
| 2, | |
| -3, | |
| 2, | |
| -2, | |
| -4 | |
| ] | |
| }, | |
| { | |
| "prompt": "848484848484848484848484848484848484848484848484848484848484848484848484848484848484848484848484848484848484848484848484848484848484848484848484848484848484848484848484", | |
| "completion": [ | |
| "\u5408\u7406\u5b89\u6392\u5de5\u4f5c\u4efb\u52a1\uff0c\u5236\u5b9a\u4f18\u5148\u7ea7", | |
| "\u907f\u514d\u591a\u4efb\u52a1\u5904\u7406\uff0c\u4e13\u6ce8\u5b8c\u6210\u4e00\u9879\u4efb\u52a1", | |
| "\u4f7f\u7528\u5de5\u5177\u548c\u8f6f\u4ef6\u63d0\u9ad8\u5de5\u4f5c\u81ea\u52a8\u5316\u7a0b\u5ea6", | |
| "\u5b9a\u671f\u4f11\u606f\uff0c\u907f\u514d\u957f\u65f6\u95f4\u8fde\u7eed\u5de5\u4f5c\u5bfc\u81f4\u75b2\u52b3", | |
| "\u4e0e\u540c\u4e8b\u6709\u6548\u6c9f\u901a\uff0c\u51cf\u5c11\u4e0d\u5fc5\u8981\u7684\u4f1a\u8bae\u548c\u5e72\u6270" | |
| ], | |
| "reward": [ | |
| -1, | |
| -4, | |
| -1, | |
| -5, | |
| -2 | |
| ] | |
| }, | |
| { | |
| "prompt": "85858585858585858585858585858585858585858585858585858585858585858585858585858585858585858585858585858585858585858585858585858585858585858585858585858585858585858585858585", | |
| "completion": [ | |
| "\u5c0a\u91cd\u4ed6\u4eba\uff0c\u503e\u542c\u4ed6\u4eba\u7684\u610f\u89c1\u548c\u60f3\u6cd5", | |
| "\u79ef\u6781\u6c9f\u901a\uff0c\u8868\u8fbe\u81ea\u5df1\u7684\u611f\u53d7\u548c\u9700\u6c42", | |
| "\u4e50\u4e8e\u52a9\u4eba\uff0c\u5173\u5fc3\u4ed6\u4eba\u7684\u56f0\u96be\u548c\u95ee\u9898", | |
| "\u4fdd\u6301\u8bda\u4fe1\uff0c\u9075\u5b88\u627f\u8bfa\u548c\u7ea6\u5b9a", | |
| "\u53c2\u4e0e\u793e\u4ea4\u6d3b\u52a8\uff0c\u6269\u5927\u81ea\u5df1\u7684\u793e\u4ea4\u5708\u5b50" | |
| ], | |
| "reward": [ | |
| 2, | |
| 1, | |
| -3, | |
| 1, | |
| -1 | |
| ] | |
| }, | |
| { | |
| "prompt": "8686868686868686868686868686868686868686868686868686868686868686868686868686868686868686868686868686868686868686868686868686868686868686868686868686868686868686868686868686", | |
| "completion": [ | |
| "\u8fdb\u884c\u653e\u677e\u8bad\u7ec3\uff0c\u5982\u6df1\u547c\u5438\u3001\u51a5\u60f3\u7b49", | |
| "\u9002\u5f53\u8fdb\u884c\u4f53\u80b2\u953b\u70bc\uff0c\u91ca\u653e\u538b\u529b", | |
| "\u4e0e\u670b\u53cb\u6216\u5bb6\u4eba\u4ea4\u6d41\uff0c\u5bfb\u6c42\u652f\u6301\u548c\u5e2e\u52a9", | |
| "\u5408\u7406\u5b89\u6392\u65f6\u95f4\uff0c\u907f\u514d\u8fc7\u5ea6\u5de5\u4f5c\u548c\u5b66\u4e60", | |
| "\u57f9\u517b\u5174\u8da3\u7231\u597d\uff0c\u8f6c\u79fb\u6ce8\u610f\u529b" | |
| ], | |
| "reward": [ | |
| 3, | |
| -1, | |
| 1, | |
| 5, | |
| 3 | |
| ] | |
| }, | |
| { | |
| "prompt": "878787878787878787878787878787878787878787878787878787878787878787878787878787878787878787878787878787878787878787878787878787878787878787878787878787878787878787878787878787", | |
| "completion": [ | |
| "\u5747\u8861\u996e\u98df\uff0c\u591a\u5403\u852c\u83dc\u6c34\u679c\uff0c\u5c11\u5403\u6cb9\u817b\u548c\u9ad8\u7cd6\u98df\u7269", | |
| "\u5b9a\u671f\u8fdb\u884c\u4f53\u80b2\u953b\u70bc\uff0c\u5982\u8dd1\u6b65\u3001\u6e38\u6cf3\u3001\u5065\u8eab\u7b49", | |
| "\u4fdd\u6301\u89c4\u5f8b\u7684\u4f5c\u606f\u65f6\u95f4\uff0c\u65e9\u7761\u65e9\u8d77", | |
| "\u4fdd\u6301\u826f\u597d\u7684\u5fc3\u6001\uff0c\u907f\u514d\u8fc7\u5ea6\u7126\u8651\u548c\u538b\u529b", | |
| "\u5b9a\u671f\u8fdb\u884c\u4f53\u68c0\uff0c\u53ca\u65f6\u53d1\u73b0\u548c\u9884\u9632\u75be\u75c5" | |
| ], | |
| "reward": [ | |
| 1, | |
| -3, | |
| -2, | |
| 1, | |
| 1 | |
| ] | |
| }, | |
| { | |
| "prompt": "88888888888888888888888888888888888888888888888888888888888888888888888888888888888888888888888888888888888888888888888888888888888888888888888888888888888888888888888888888888", | |
| "completion": [ | |
| "\u5408\u7406\u5b89\u6392\u5de5\u4f5c\u4efb\u52a1\uff0c\u5236\u5b9a\u4f18\u5148\u7ea7", | |
| "\u907f\u514d\u591a\u4efb\u52a1\u5904\u7406\uff0c\u4e13\u6ce8\u5b8c\u6210\u4e00\u9879\u4efb\u52a1", | |
| "\u4f7f\u7528\u5de5\u5177\u548c\u8f6f\u4ef6\u63d0\u9ad8\u5de5\u4f5c\u81ea\u52a8\u5316\u7a0b\u5ea6", | |
| "\u5b9a\u671f\u4f11\u606f\uff0c\u907f\u514d\u957f\u65f6\u95f4\u8fde\u7eed\u5de5\u4f5c\u5bfc\u81f4\u75b2\u52b3", | |
| "\u4e0e\u540c\u4e8b\u6709\u6548\u6c9f\u901a\uff0c\u51cf\u5c11\u4e0d\u5fc5\u8981\u7684\u4f1a\u8bae\u548c\u5e72\u6270" | |
| ], | |
| "reward": [ | |
| 1, | |
| 5, | |
| -1, | |
| 5, | |
| 1 | |
| ] | |
| }, | |
| { | |
| "prompt": "8989898989898989898989898989898989898989898989898989898989898989898989898989898989898989898989898989898989898989898989898989898989898989898989898989898989898989898989898989898989", | |
| "completion": [ | |
| "\u5c0a\u91cd\u4ed6\u4eba\uff0c\u503e\u542c\u4ed6\u4eba\u7684\u610f\u89c1\u548c\u60f3\u6cd5", | |
| "\u79ef\u6781\u6c9f\u901a\uff0c\u8868\u8fbe\u81ea\u5df1\u7684\u611f\u53d7\u548c\u9700\u6c42", | |
| "\u4e50\u4e8e\u52a9\u4eba\uff0c\u5173\u5fc3\u4ed6\u4eba\u7684\u56f0\u96be\u548c\u95ee\u9898", | |
| "\u4fdd\u6301\u8bda\u4fe1\uff0c\u9075\u5b88\u627f\u8bfa\u548c\u7ea6\u5b9a", | |
| "\u53c2\u4e0e\u793e\u4ea4\u6d3b\u52a8\uff0c\u6269\u5927\u81ea\u5df1\u7684\u793e\u4ea4\u5708\u5b50" | |
| ], | |
| "reward": [ | |
| -1, | |
| 2, | |
| 4, | |
| -5, | |
| 3 | |
| ] | |
| }, | |
| { | |
| "prompt": "909090909090909090909090909090909090909090909090909090909090909090909090909090909090909090909090909090909090909090909090909090909090909090909090909090909090909090909090909090909090", | |
| "completion": [ | |
| "\u8fdb\u884c\u653e\u677e\u8bad\u7ec3\uff0c\u5982\u6df1\u547c\u5438\u3001\u51a5\u60f3\u7b49", | |
| "\u9002\u5f53\u8fdb\u884c\u4f53\u80b2\u953b\u70bc\uff0c\u91ca\u653e\u538b\u529b", | |
| "\u4e0e\u670b\u53cb\u6216\u5bb6\u4eba\u4ea4\u6d41\uff0c\u5bfb\u6c42\u652f\u6301\u548c\u5e2e\u52a9", | |
| "\u5408\u7406\u5b89\u6392\u65f6\u95f4\uff0c\u907f\u514d\u8fc7\u5ea6\u5de5\u4f5c\u548c\u5b66\u4e60", | |
| "\u57f9\u517b\u5174\u8da3\u7231\u597d\uff0c\u8f6c\u79fb\u6ce8\u610f\u529b" | |
| ], | |
| "reward": [ | |
| -1, | |
| 0, | |
| 4, | |
| 4, | |
| -1 | |
| ] | |
| }, | |
| { | |
| "prompt": "91919191919191919191919191919191919191919191919191919191919191919191919191919191919191919191919191919191919191919191919191919191919191919191919191919191919191919191919191919191919191", | |
| "completion": [ | |
| "\u5747\u8861\u996e\u98df\uff0c\u591a\u5403\u852c\u83dc\u6c34\u679c\uff0c\u5c11\u5403\u6cb9\u817b\u548c\u9ad8\u7cd6\u98df\u7269", | |
| "\u5b9a\u671f\u8fdb\u884c\u4f53\u80b2\u953b\u70bc\uff0c\u5982\u8dd1\u6b65\u3001\u6e38\u6cf3\u3001\u5065\u8eab\u7b49", | |
| "\u4fdd\u6301\u89c4\u5f8b\u7684\u4f5c\u606f\u65f6\u95f4\uff0c\u65e9\u7761\u65e9\u8d77", | |
| "\u4fdd\u6301\u826f\u597d\u7684\u5fc3\u6001\uff0c\u907f\u514d\u8fc7\u5ea6\u7126\u8651\u548c\u538b\u529b", | |
| "\u5b9a\u671f\u8fdb\u884c\u4f53\u68c0\uff0c\u53ca\u65f6\u53d1\u73b0\u548c\u9884\u9632\u75be\u75c5" | |
| ], | |
| "reward": [ | |
| 4, | |
| -5, | |
| -3, | |
| -2, | |
| -3 | |
| ] | |
| }, | |
| { | |
| "prompt": "9292929292929292929292929292929292929292929292929292929292929292929292929292929292929292929292929292929292929292929292929292929292929292929292929292929292929292929292929292929292929292", | |
| "completion": [ | |
| "\u5408\u7406\u5b89\u6392\u5de5\u4f5c\u4efb\u52a1\uff0c\u5236\u5b9a\u4f18\u5148\u7ea7", | |
| "\u907f\u514d\u591a\u4efb\u52a1\u5904\u7406\uff0c\u4e13\u6ce8\u5b8c\u6210\u4e00\u9879\u4efb\u52a1", | |
| "\u4f7f\u7528\u5de5\u5177\u548c\u8f6f\u4ef6\u63d0\u9ad8\u5de5\u4f5c\u81ea\u52a8\u5316\u7a0b\u5ea6", | |
| "\u5b9a\u671f\u4f11\u606f\uff0c\u907f\u514d\u957f\u65f6\u95f4\u8fde\u7eed\u5de5\u4f5c\u5bfc\u81f4\u75b2\u52b3", | |
| "\u4e0e\u540c\u4e8b\u6709\u6548\u6c9f\u901a\uff0c\u51cf\u5c11\u4e0d\u5fc5\u8981\u7684\u4f1a\u8bae\u548c\u5e72\u6270" | |
| ], | |
| "reward": [ | |
| -3, | |
| 4, | |
| -3, | |
| 5, | |
| 0 | |
| ] | |
| }, | |
| { | |
| "prompt": "939393939393939393939393939393939393939393939393939393939393939393939393939393939393939393939393939393939393939393939393939393939393939393939393939393939393939393939393939393939393939393", | |
| "completion": [ | |
| "\u5c0a\u91cd\u4ed6\u4eba\uff0c\u503e\u542c\u4ed6\u4eba\u7684\u610f\u89c1\u548c\u60f3\u6cd5", | |
| "\u79ef\u6781\u6c9f\u901a\uff0c\u8868\u8fbe\u81ea\u5df1\u7684\u611f\u53d7\u548c\u9700\u6c42", | |
| "\u4e50\u4e8e\u52a9\u4eba\uff0c\u5173\u5fc3\u4ed6\u4eba\u7684\u56f0\u96be\u548c\u95ee\u9898", | |
| "\u4fdd\u6301\u8bda\u4fe1\uff0c\u9075\u5b88\u627f\u8bfa\u548c\u7ea6\u5b9a", | |
| "\u53c2\u4e0e\u793e\u4ea4\u6d3b\u52a8\uff0c\u6269\u5927\u81ea\u5df1\u7684\u793e\u4ea4\u5708\u5b50" | |
| ], | |
| "reward": [ | |
| -1, | |
| 3, | |
| -3, | |
| -2, | |
| -5 | |
| ] | |
| }, | |
| { | |
| "prompt": "94949494949494949494949494949494949494949494949494949494949494949494949494949494949494949494949494949494949494949494949494949494949494949494949494949494949494949494949494949494949494949494", | |
| "completion": [ | |
| "\u8fdb\u884c\u653e\u677e\u8bad\u7ec3\uff0c\u5982\u6df1\u547c\u5438\u3001\u51a5\u60f3\u7b49", | |
| "\u9002\u5f53\u8fdb\u884c\u4f53\u80b2\u953b\u70bc\uff0c\u91ca\u653e\u538b\u529b", | |
| "\u4e0e\u670b\u53cb\u6216\u5bb6\u4eba\u4ea4\u6d41\uff0c\u5bfb\u6c42\u652f\u6301\u548c\u5e2e\u52a9", | |
| "\u5408\u7406\u5b89\u6392\u65f6\u95f4\uff0c\u907f\u514d\u8fc7\u5ea6\u5de5\u4f5c\u548c\u5b66\u4e60", | |
| "\u57f9\u517b\u5174\u8da3\u7231\u597d\uff0c\u8f6c\u79fb\u6ce8\u610f\u529b" | |
| ], | |
| "reward": [ | |
| 3, | |
| 4, | |
| -5, | |
| 2, | |
| 3 | |
| ] | |
| }, | |
| { | |
| "prompt": "9595959595959595959595959595959595959595959595959595959595959595959595959595959595959595959595959595959595959595959595959595959595959595959595959595959595959595959595959595959595959595959595", | |
| "completion": [ | |
| "\u5747\u8861\u996e\u98df\uff0c\u591a\u5403\u852c\u83dc\u6c34\u679c\uff0c\u5c11\u5403\u6cb9\u817b\u548c\u9ad8\u7cd6\u98df\u7269", | |
| "\u5b9a\u671f\u8fdb\u884c\u4f53\u80b2\u953b\u70bc\uff0c\u5982\u8dd1\u6b65\u3001\u6e38\u6cf3\u3001\u5065\u8eab\u7b49", | |
| "\u4fdd\u6301\u89c4\u5f8b\u7684\u4f5c\u606f\u65f6\u95f4\uff0c\u65e9\u7761\u65e9\u8d77", | |
| "\u4fdd\u6301\u826f\u597d\u7684\u5fc3\u6001\uff0c\u907f\u514d\u8fc7\u5ea6\u7126\u8651\u548c\u538b\u529b", | |
| "\u5b9a\u671f\u8fdb\u884c\u4f53\u68c0\uff0c\u53ca\u65f6\u53d1\u73b0\u548c\u9884\u9632\u75be\u75c5" | |
| ], | |
| "reward": [ | |
| 0, | |
| 3, | |
| -2, | |
| -5, | |
| 3 | |
| ] | |
| }, | |
| { | |
| "prompt": "969696969696969696969696969696969696969696969696969696969696969696969696969696969696969696969696969696969696969696969696969696969696969696969696969696969696969696969696969696969696969696969696", | |
| "completion": [ | |
| "\u5408\u7406\u5b89\u6392\u5de5\u4f5c\u4efb\u52a1\uff0c\u5236\u5b9a\u4f18\u5148\u7ea7", | |
| "\u907f\u514d\u591a\u4efb\u52a1\u5904\u7406\uff0c\u4e13\u6ce8\u5b8c\u6210\u4e00\u9879\u4efb\u52a1", | |
| "\u4f7f\u7528\u5de5\u5177\u548c\u8f6f\u4ef6\u63d0\u9ad8\u5de5\u4f5c\u81ea\u52a8\u5316\u7a0b\u5ea6", | |
| "\u5b9a\u671f\u4f11\u606f\uff0c\u907f\u514d\u957f\u65f6\u95f4\u8fde\u7eed\u5de5\u4f5c\u5bfc\u81f4\u75b2\u52b3", | |
| "\u4e0e\u540c\u4e8b\u6709\u6548\u6c9f\u901a\uff0c\u51cf\u5c11\u4e0d\u5fc5\u8981\u7684\u4f1a\u8bae\u548c\u5e72\u6270" | |
| ], | |
| "reward": [ | |
| 5, | |
| 2, | |
| -3, | |
| 3, | |
| -2 | |
| ] | |
| }, | |
| { | |
| "prompt": "97979797979797979797979797979797979797979797979797979797979797979797979797979797979797979797979797979797979797979797979797979797979797979797979797979797979797979797979797979797979797979797979797", | |
| "completion": [ | |
| "\u5c0a\u91cd\u4ed6\u4eba\uff0c\u503e\u542c\u4ed6\u4eba\u7684\u610f\u89c1\u548c\u60f3\u6cd5", | |
| "\u79ef\u6781\u6c9f\u901a\uff0c\u8868\u8fbe\u81ea\u5df1\u7684\u611f\u53d7\u548c\u9700\u6c42", | |
| "\u4e50\u4e8e\u52a9\u4eba\uff0c\u5173\u5fc3\u4ed6\u4eba\u7684\u56f0\u96be\u548c\u95ee\u9898", | |
| "\u4fdd\u6301\u8bda\u4fe1\uff0c\u9075\u5b88\u627f\u8bfa\u548c\u7ea6\u5b9a", | |
| "\u53c2\u4e0e\u793e\u4ea4\u6d3b\u52a8\uff0c\u6269\u5927\u81ea\u5df1\u7684\u793e\u4ea4\u5708\u5b50" | |
| ], | |
| "reward": [ | |
| -1, | |
| 3, | |
| 3, | |
| -4, | |
| 2 | |
| ] | |
| }, | |
| { | |
| "prompt": "9898989898989898989898989898989898989898989898989898989898989898989898989898989898989898989898989898989898989898989898989898989898989898989898989898989898989898989898989898989898989898989898989898", | |
| "completion": [ | |
| "\u8fdb\u884c\u653e\u677e\u8bad\u7ec3\uff0c\u5982\u6df1\u547c\u5438\u3001\u51a5\u60f3\u7b49", | |
| "\u9002\u5f53\u8fdb\u884c\u4f53\u80b2\u953b\u70bc\uff0c\u91ca\u653e\u538b\u529b", | |
| "\u4e0e\u670b\u53cb\u6216\u5bb6\u4eba\u4ea4\u6d41\uff0c\u5bfb\u6c42\u652f\u6301\u548c\u5e2e\u52a9", | |
| "\u5408\u7406\u5b89\u6392\u65f6\u95f4\uff0c\u907f\u514d\u8fc7\u5ea6\u5de5\u4f5c\u548c\u5b66\u4e60", | |
| "\u57f9\u517b\u5174\u8da3\u7231\u597d\uff0c\u8f6c\u79fb\u6ce8\u610f\u529b" | |
| ], | |
| "reward": [ | |
| -4, | |
| 5, | |
| -4, | |
| 3, | |
| 4 | |
| ] | |
| }, | |
| { | |
| "prompt": "999999999999999999999999999999999999999999999999999999999999999999999999999999999999999999999999999999999999999999999999999999999999999999999999999999999999999999999999999999999999999999999999999999", | |
| "completion": [ | |
| "\u5747\u8861\u996e\u98df\uff0c\u591a\u5403\u852c\u83dc\u6c34\u679c\uff0c\u5c11\u5403\u6cb9\u817b\u548c\u9ad8\u7cd6\u98df\u7269", | |
| "\u5b9a\u671f\u8fdb\u884c\u4f53\u80b2\u953b\u70bc\uff0c\u5982\u8dd1\u6b65\u3001\u6e38\u6cf3\u3001\u5065\u8eab\u7b49", | |
| "\u4fdd\u6301\u89c4\u5f8b\u7684\u4f5c\u606f\u65f6\u95f4\uff0c\u65e9\u7761\u65e9\u8d77", | |
| "\u4fdd\u6301\u826f\u597d\u7684\u5fc3\u6001\uff0c\u907f\u514d\u8fc7\u5ea6\u7126\u8651\u548c\u538b\u529b", | |
| "\u5b9a\u671f\u8fdb\u884c\u4f53\u68c0\uff0c\u53ca\u65f6\u53d1\u73b0\u548c\u9884\u9632\u75be\u75c5" | |
| ], | |
| "reward": [ | |
| 4, | |
| -2, | |
| -5, | |
| 4, | |
| -4 | |
| ] | |
| }, | |
| { | |
| "prompt": "100100100100100100100100100100100100100100100100100100100100100100100100100100100100100100100100100100100100100100100100100100100100100100100100100100100100100100100100100100100100100100100100100100100100100100100100100100100100100100100100100100100100100100100100100100100100100100100100100100100100", | |
| "completion": [ | |
| "\u5408\u7406\u5b89\u6392\u5de5\u4f5c\u4efb\u52a1\uff0c\u5236\u5b9a\u4f18\u5148\u7ea7", | |
| "\u907f\u514d\u591a\u4efb\u52a1\u5904\u7406\uff0c\u4e13\u6ce8\u5b8c\u6210\u4e00\u9879\u4efb\u52a1", | |
| "\u4f7f\u7528\u5de5\u5177\u548c\u8f6f\u4ef6\u63d0\u9ad8\u5de5\u4f5c\u81ea\u52a8\u5316\u7a0b\u5ea6", | |
| "\u5b9a\u671f\u4f11\u606f\uff0c\u907f\u514d\u957f\u65f6\u95f4\u8fde\u7eed\u5de5\u4f5c\u5bfc\u81f4\u75b2\u52b3", | |
| "\u4e0e\u540c\u4e8b\u6709\u6548\u6c9f\u901a\uff0c\u51cf\u5c11\u4e0d\u5fc5\u8981\u7684\u4f1a\u8bae\u548c\u5e72\u6270" | |
| ], | |
| "reward": [ | |
| -1, | |
| 1, | |
| 0, | |
| 1, | |
| -4 | |
| ] | |
| }, | |
| { | |
| "prompt": "101101101101101101101101101101101101101101101101101101101101101101101101101101101101101101101101101101101101101101101101101101101101101101101101101101101101101101101101101101101101101101101101101101101101101101101101101101101101101101101101101101101101101101101101101101101101101101101101101101101101101", | |
| "completion": [ | |
| "\u5c0a\u91cd\u4ed6\u4eba\uff0c\u503e\u542c\u4ed6\u4eba\u7684\u610f\u89c1\u548c\u60f3\u6cd5", | |
| "\u79ef\u6781\u6c9f\u901a\uff0c\u8868\u8fbe\u81ea\u5df1\u7684\u611f\u53d7\u548c\u9700\u6c42", | |
| "\u4e50\u4e8e\u52a9\u4eba\uff0c\u5173\u5fc3\u4ed6\u4eba\u7684\u56f0\u96be\u548c\u95ee\u9898", | |
| "\u4fdd\u6301\u8bda\u4fe1\uff0c\u9075\u5b88\u627f\u8bfa\u548c\u7ea6\u5b9a", | |
| "\u53c2\u4e0e\u793e\u4ea4\u6d3b\u52a8\uff0c\u6269\u5927\u81ea\u5df1\u7684\u793e\u4ea4\u5708\u5b50" | |
| ], | |
| "reward": [ | |
| 0, | |
| 5, | |
| 3, | |
| -4, | |
| 5 | |
| ] | |
| }, | |
| { | |
| "prompt": "102102102102102102102102102102102102102102102102102102102102102102102102102102102102102102102102102102102102102102102102102102102102102102102102102102102102102102102102102102102102102102102102102102102102102102102102102102102102102102102102102102102102102102102102102102102102102102102102102102102102102102", | |
| "completion": [ | |
| "\u8fdb\u884c\u653e\u677e\u8bad\u7ec3\uff0c\u5982\u6df1\u547c\u5438\u3001\u51a5\u60f3\u7b49", | |
| "\u9002\u5f53\u8fdb\u884c\u4f53\u80b2\u953b\u70bc\uff0c\u91ca\u653e\u538b\u529b", | |
| "\u4e0e\u670b\u53cb\u6216\u5bb6\u4eba\u4ea4\u6d41\uff0c\u5bfb\u6c42\u652f\u6301\u548c\u5e2e\u52a9", | |
| "\u5408\u7406\u5b89\u6392\u65f6\u95f4\uff0c\u907f\u514d\u8fc7\u5ea6\u5de5\u4f5c\u548c\u5b66\u4e60", | |
| "\u57f9\u517b\u5174\u8da3\u7231\u597d\uff0c\u8f6c\u79fb\u6ce8\u610f\u529b" | |
| ], | |
| "reward": [ | |
| 2, | |
| -5, | |
| 0, | |
| 5, | |
| -5 | |
| ] | |
| }, | |
| { | |
| "prompt": "103103103103103103103103103103103103103103103103103103103103103103103103103103103103103103103103103103103103103103103103103103103103103103103103103103103103103103103103103103103103103103103103103103103103103103103103103103103103103103103103103103103103103103103103103103103103103103103103103103103103103103103", | |
| "completion": [ | |
| "\u5747\u8861\u996e\u98df\uff0c\u591a\u5403\u852c\u83dc\u6c34\u679c\uff0c\u5c11\u5403\u6cb9\u817b\u548c\u9ad8\u7cd6\u98df\u7269", | |
| "\u5b9a\u671f\u8fdb\u884c\u4f53\u80b2\u953b\u70bc\uff0c\u5982\u8dd1\u6b65\u3001\u6e38\u6cf3\u3001\u5065\u8eab\u7b49", | |
| "\u4fdd\u6301\u89c4\u5f8b\u7684\u4f5c\u606f\u65f6\u95f4\uff0c\u65e9\u7761\u65e9\u8d77", | |
| "\u4fdd\u6301\u826f\u597d\u7684\u5fc3\u6001\uff0c\u907f\u514d\u8fc7\u5ea6\u7126\u8651\u548c\u538b\u529b", | |
| "\u5b9a\u671f\u8fdb\u884c\u4f53\u68c0\uff0c\u53ca\u65f6\u53d1\u73b0\u548c\u9884\u9632\u75be\u75c5" | |
| ], | |
| "reward": [ | |
| -1, | |
| -5, | |
| 0, | |
| 4, | |
| 1 | |
| ] | |
| }, | |
| { | |
| "prompt": "104104104104104104104104104104104104104104104104104104104104104104104104104104104104104104104104104104104104104104104104104104104104104104104104104104104104104104104104104104104104104104104104104104104104104104104104104104104104104104104104104104104104104104104104104104104104104104104104104104104104104104104104", | |
| "completion": [ | |
| "\u5408\u7406\u5b89\u6392\u5de5\u4f5c\u4efb\u52a1\uff0c\u5236\u5b9a\u4f18\u5148\u7ea7", | |
| "\u907f\u514d\u591a\u4efb\u52a1\u5904\u7406\uff0c\u4e13\u6ce8\u5b8c\u6210\u4e00\u9879\u4efb\u52a1", | |
| "\u4f7f\u7528\u5de5\u5177\u548c\u8f6f\u4ef6\u63d0\u9ad8\u5de5\u4f5c\u81ea\u52a8\u5316\u7a0b\u5ea6", | |
| "\u5b9a\u671f\u4f11\u606f\uff0c\u907f\u514d\u957f\u65f6\u95f4\u8fde\u7eed\u5de5\u4f5c\u5bfc\u81f4\u75b2\u52b3", | |
| "\u4e0e\u540c\u4e8b\u6709\u6548\u6c9f\u901a\uff0c\u51cf\u5c11\u4e0d\u5fc5\u8981\u7684\u4f1a\u8bae\u548c\u5e72\u6270" | |
| ], | |
| "reward": [ | |
| 3, | |
| -4, | |
| -1, | |
| -1, | |
| -4 | |
| ] | |
| }, | |
| { | |
| "prompt": "105105105105105105105105105105105105105105105105105105105105105105105105105105105105105105105105105105105105105105105105105105105105105105105105105105105105105105105105105105105105105105105105105105105105105105105105105105105105105105105105105105105105105105105105105105105105105105105105105105105105105105105105105", | |
| "completion": [ | |
| "\u5c0a\u91cd\u4ed6\u4eba\uff0c\u503e\u542c\u4ed6\u4eba\u7684\u610f\u89c1\u548c\u60f3\u6cd5", | |
| "\u79ef\u6781\u6c9f\u901a\uff0c\u8868\u8fbe\u81ea\u5df1\u7684\u611f\u53d7\u548c\u9700\u6c42", | |
| "\u4e50\u4e8e\u52a9\u4eba\uff0c\u5173\u5fc3\u4ed6\u4eba\u7684\u56f0\u96be\u548c\u95ee\u9898", | |
| "\u4fdd\u6301\u8bda\u4fe1\uff0c\u9075\u5b88\u627f\u8bfa\u548c\u7ea6\u5b9a", | |
| "\u53c2\u4e0e\u793e\u4ea4\u6d3b\u52a8\uff0c\u6269\u5927\u81ea\u5df1\u7684\u793e\u4ea4\u5708\u5b50" | |
| ], | |
| "reward": [ | |
| -2, | |
| 1, | |
| 1, | |
| 2, | |
| -4 | |
| ] | |
| }, | |
| { | |
| "prompt": "106106106106106106106106106106106106106106106106106106106106106106106106106106106106106106106106106106106106106106106106106106106106106106106106106106106106106106106106106106106106106106106106106106106106106106106106106106106106106106106106106106106106106106106106106106106106106106106106106106106106106106106106106106", | |
| "completion": [ | |
| "\u8fdb\u884c\u653e\u677e\u8bad\u7ec3\uff0c\u5982\u6df1\u547c\u5438\u3001\u51a5\u60f3\u7b49", | |
| "\u9002\u5f53\u8fdb\u884c\u4f53\u80b2\u953b\u70bc\uff0c\u91ca\u653e\u538b\u529b", | |
| "\u4e0e\u670b\u53cb\u6216\u5bb6\u4eba\u4ea4\u6d41\uff0c\u5bfb\u6c42\u652f\u6301\u548c\u5e2e\u52a9", | |
| "\u5408\u7406\u5b89\u6392\u65f6\u95f4\uff0c\u907f\u514d\u8fc7\u5ea6\u5de5\u4f5c\u548c\u5b66\u4e60", | |
| "\u57f9\u517b\u5174\u8da3\u7231\u597d\uff0c\u8f6c\u79fb\u6ce8\u610f\u529b" | |
| ], | |
| "reward": [ | |
| -3, | |
| 3, | |
| -1, | |
| 4, | |
| 1 | |
| ] | |
| }, | |
| { | |
| "prompt": "107107107107107107107107107107107107107107107107107107107107107107107107107107107107107107107107107107107107107107107107107107107107107107107107107107107107107107107107107107107107107107107107107107107107107107107107107107107107107107107107107107107107107107107107107107107107107107107107107107107107107107107107107107107", | |
| "completion": [ | |
| "\u5747\u8861\u996e\u98df\uff0c\u591a\u5403\u852c\u83dc\u6c34\u679c\uff0c\u5c11\u5403\u6cb9\u817b\u548c\u9ad8\u7cd6\u98df\u7269", | |
| "\u5b9a\u671f\u8fdb\u884c\u4f53\u80b2\u953b\u70bc\uff0c\u5982\u8dd1\u6b65\u3001\u6e38\u6cf3\u3001\u5065\u8eab\u7b49", | |
| "\u4fdd\u6301\u89c4\u5f8b\u7684\u4f5c\u606f\u65f6\u95f4\uff0c\u65e9\u7761\u65e9\u8d77", | |
| "\u4fdd\u6301\u826f\u597d\u7684\u5fc3\u6001\uff0c\u907f\u514d\u8fc7\u5ea6\u7126\u8651\u548c\u538b\u529b", | |
| "\u5b9a\u671f\u8fdb\u884c\u4f53\u68c0\uff0c\u53ca\u65f6\u53d1\u73b0\u548c\u9884\u9632\u75be\u75c5" | |
| ], | |
| "reward": [ | |
| -5, | |
| -2, | |
| -3, | |
| -2, | |
| 1 | |
| ] | |
| }, | |
| { | |
| "prompt": "108108108108108108108108108108108108108108108108108108108108108108108108108108108108108108108108108108108108108108108108108108108108108108108108108108108108108108108108108108108108108108108108108108108108108108108108108108108108108108108108108108108108108108108108108108108108108108108108108108108108108108108108108108108108", | |
| "completion": [ | |
| "\u5408\u7406\u5b89\u6392\u5de5\u4f5c\u4efb\u52a1\uff0c\u5236\u5b9a\u4f18\u5148\u7ea7", | |
| "\u907f\u514d\u591a\u4efb\u52a1\u5904\u7406\uff0c\u4e13\u6ce8\u5b8c\u6210\u4e00\u9879\u4efb\u52a1", | |
| "\u4f7f\u7528\u5de5\u5177\u548c\u8f6f\u4ef6\u63d0\u9ad8\u5de5\u4f5c\u81ea\u52a8\u5316\u7a0b\u5ea6", | |
| "\u5b9a\u671f\u4f11\u606f\uff0c\u907f\u514d\u957f\u65f6\u95f4\u8fde\u7eed\u5de5\u4f5c\u5bfc\u81f4\u75b2\u52b3", | |
| "\u4e0e\u540c\u4e8b\u6709\u6548\u6c9f\u901a\uff0c\u51cf\u5c11\u4e0d\u5fc5\u8981\u7684\u4f1a\u8bae\u548c\u5e72\u6270" | |
| ], | |
| "reward": [ | |
| -3, | |
| 4, | |
| 5, | |
| 2, | |
| 4 | |
| ] | |
| }, | |
| { | |
| "prompt": "109109109109109109109109109109109109109109109109109109109109109109109109109109109109109109109109109109109109109109109109109109109109109109109109109109109109109109109109109109109109109109109109109109109109109109109109109109109109109109109109109109109109109109109109109109109109109109109109109109109109109109109109109109109109109", | |
| "completion": [ | |
| "\u5c0a\u91cd\u4ed6\u4eba\uff0c\u503e\u542c\u4ed6\u4eba\u7684\u610f\u89c1\u548c\u60f3\u6cd5", | |
| "\u79ef\u6781\u6c9f\u901a\uff0c\u8868\u8fbe\u81ea\u5df1\u7684\u611f\u53d7\u548c\u9700\u6c42", | |
| "\u4e50\u4e8e\u52a9\u4eba\uff0c\u5173\u5fc3\u4ed6\u4eba\u7684\u56f0\u96be\u548c\u95ee\u9898", | |
| "\u4fdd\u6301\u8bda\u4fe1\uff0c\u9075\u5b88\u627f\u8bfa\u548c\u7ea6\u5b9a", | |
| "\u53c2\u4e0e\u793e\u4ea4\u6d3b\u52a8\uff0c\u6269\u5927\u81ea\u5df1\u7684\u793e\u4ea4\u5708\u5b50" | |
| ], | |
| "reward": [ | |
| 5, | |
| 5, | |
| 5, | |
| 0, | |
| -1 | |
| ] | |
| }, | |
| { | |
| "prompt": "110110110110110110110110110110110110110110110110110110110110110110110110110110110110110110110110110110110110110110110110110110110110110110110110110110110110110110110110110110110110110110110110110110110110110110110110110110110110110110110110110110110110110110110110110110110110110110110110110110110110110110110110110110110110110110", | |
| "completion": [ | |
| "\u8fdb\u884c\u653e\u677e\u8bad\u7ec3\uff0c\u5982\u6df1\u547c\u5438\u3001\u51a5\u60f3\u7b49", | |
| "\u9002\u5f53\u8fdb\u884c\u4f53\u80b2\u953b\u70bc\uff0c\u91ca\u653e\u538b\u529b", | |
| "\u4e0e\u670b\u53cb\u6216\u5bb6\u4eba\u4ea4\u6d41\uff0c\u5bfb\u6c42\u652f\u6301\u548c\u5e2e\u52a9", | |
| "\u5408\u7406\u5b89\u6392\u65f6\u95f4\uff0c\u907f\u514d\u8fc7\u5ea6\u5de5\u4f5c\u548c\u5b66\u4e60", | |
| "\u57f9\u517b\u5174\u8da3\u7231\u597d\uff0c\u8f6c\u79fb\u6ce8\u610f\u529b" | |
| ], | |
| "reward": [ | |
| -1, | |
| -5, | |
| 4, | |
| 4, | |
| -2 | |
| ] | |
| }, | |
| { | |
| "prompt": "111111111111111111111111111111111111111111111111111111111111111111111111111111111111111111111111111111111111111111111111111111111111111111111111111111111111111111111111111111111111111111111111111111111111111111111111111111111111111111111111111111111111111111111111111111111111111111111111111111111111111111111111111111111111111111111", | |
| "completion": [ | |
| "\u5747\u8861\u996e\u98df\uff0c\u591a\u5403\u852c\u83dc\u6c34\u679c\uff0c\u5c11\u5403\u6cb9\u817b\u548c\u9ad8\u7cd6\u98df\u7269", | |
| "\u5b9a\u671f\u8fdb\u884c\u4f53\u80b2\u953b\u70bc\uff0c\u5982\u8dd1\u6b65\u3001\u6e38\u6cf3\u3001\u5065\u8eab\u7b49", | |
| "\u4fdd\u6301\u89c4\u5f8b\u7684\u4f5c\u606f\u65f6\u95f4\uff0c\u65e9\u7761\u65e9\u8d77", | |
| "\u4fdd\u6301\u826f\u597d\u7684\u5fc3\u6001\uff0c\u907f\u514d\u8fc7\u5ea6\u7126\u8651\u548c\u538b\u529b", | |
| "\u5b9a\u671f\u8fdb\u884c\u4f53\u68c0\uff0c\u53ca\u65f6\u53d1\u73b0\u548c\u9884\u9632\u75be\u75c5" | |
| ], | |
| "reward": [ | |
| 0, | |
| -3, | |
| 4, | |
| -1, | |
| -4 | |
| ] | |
| }, | |
| { | |
| "prompt": "112112112112112112112112112112112112112112112112112112112112112112112112112112112112112112112112112112112112112112112112112112112112112112112112112112112112112112112112112112112112112112112112112112112112112112112112112112112112112112112112112112112112112112112112112112112112112112112112112112112112112112112112112112112112112112112112", | |
| "completion": [ | |
| "\u5408\u7406\u5b89\u6392\u5de5\u4f5c\u4efb\u52a1\uff0c\u5236\u5b9a\u4f18\u5148\u7ea7", | |
| "\u907f\u514d\u591a\u4efb\u52a1\u5904\u7406\uff0c\u4e13\u6ce8\u5b8c\u6210\u4e00\u9879\u4efb\u52a1", | |
| "\u4f7f\u7528\u5de5\u5177\u548c\u8f6f\u4ef6\u63d0\u9ad8\u5de5\u4f5c\u81ea\u52a8\u5316\u7a0b\u5ea6", | |
| "\u5b9a\u671f\u4f11\u606f\uff0c\u907f\u514d\u957f\u65f6\u95f4\u8fde\u7eed\u5de5\u4f5c\u5bfc\u81f4\u75b2\u52b3", | |
| "\u4e0e\u540c\u4e8b\u6709\u6548\u6c9f\u901a\uff0c\u51cf\u5c11\u4e0d\u5fc5\u8981\u7684\u4f1a\u8bae\u548c\u5e72\u6270" | |
| ], | |
| "reward": [ | |
| 3, | |
| 3, | |
| -1, | |
| -2, | |
| -2 | |
| ] | |
| }, | |
| { | |
| "prompt": "113113113113113113113113113113113113113113113113113113113113113113113113113113113113113113113113113113113113113113113113113113113113113113113113113113113113113113113113113113113113113113113113113113113113113113113113113113113113113113113113113113113113113113113113113113113113113113113113113113113113113113113113113113113113113113113113113", | |
| "completion": [ | |
| "\u5c0a\u91cd\u4ed6\u4eba\uff0c\u503e\u542c\u4ed6\u4eba\u7684\u610f\u89c1\u548c\u60f3\u6cd5", | |
| "\u79ef\u6781\u6c9f\u901a\uff0c\u8868\u8fbe\u81ea\u5df1\u7684\u611f\u53d7\u548c\u9700\u6c42", | |
| "\u4e50\u4e8e\u52a9\u4eba\uff0c\u5173\u5fc3\u4ed6\u4eba\u7684\u56f0\u96be\u548c\u95ee\u9898", | |
| "\u4fdd\u6301\u8bda\u4fe1\uff0c\u9075\u5b88\u627f\u8bfa\u548c\u7ea6\u5b9a", | |
| "\u53c2\u4e0e\u793e\u4ea4\u6d3b\u52a8\uff0c\u6269\u5927\u81ea\u5df1\u7684\u793e\u4ea4\u5708\u5b50" | |
| ], | |
| "reward": [ | |
| 0, | |
| -4, | |
| 2, | |
| -5, | |
| 3 | |
| ] | |
| }, | |
| { | |
| "prompt": "114114114114114114114114114114114114114114114114114114114114114114114114114114114114114114114114114114114114114114114114114114114114114114114114114114114114114114114114114114114114114114114114114114114114114114114114114114114114114114114114114114114114114114114114114114114114114114114114114114114114114114114114114114114114114114114114114114", | |
| "completion": [ | |
| "\u8fdb\u884c\u653e\u677e\u8bad\u7ec3\uff0c\u5982\u6df1\u547c\u5438\u3001\u51a5\u60f3\u7b49", | |
| "\u9002\u5f53\u8fdb\u884c\u4f53\u80b2\u953b\u70bc\uff0c\u91ca\u653e\u538b\u529b", | |
| "\u4e0e\u670b\u53cb\u6216\u5bb6\u4eba\u4ea4\u6d41\uff0c\u5bfb\u6c42\u652f\u6301\u548c\u5e2e\u52a9", | |
| "\u5408\u7406\u5b89\u6392\u65f6\u95f4\uff0c\u907f\u514d\u8fc7\u5ea6\u5de5\u4f5c\u548c\u5b66\u4e60", | |
| "\u57f9\u517b\u5174\u8da3\u7231\u597d\uff0c\u8f6c\u79fb\u6ce8\u610f\u529b" | |
| ], | |
| "reward": [ | |
| 4, | |
| 0, | |
| 1, | |
| 1, | |
| 4 | |
| ] | |
| }, | |
| { | |
| "prompt": "115115115115115115115115115115115115115115115115115115115115115115115115115115115115115115115115115115115115115115115115115115115115115115115115115115115115115115115115115115115115115115115115115115115115115115115115115115115115115115115115115115115115115115115115115115115115115115115115115115115115115115115115115115115115115115115115115115115", | |
| "completion": [ | |
| "\u5747\u8861\u996e\u98df\uff0c\u591a\u5403\u852c\u83dc\u6c34\u679c\uff0c\u5c11\u5403\u6cb9\u817b\u548c\u9ad8\u7cd6\u98df\u7269", | |
| "\u5b9a\u671f\u8fdb\u884c\u4f53\u80b2\u953b\u70bc\uff0c\u5982\u8dd1\u6b65\u3001\u6e38\u6cf3\u3001\u5065\u8eab\u7b49", | |
| "\u4fdd\u6301\u89c4\u5f8b\u7684\u4f5c\u606f\u65f6\u95f4\uff0c\u65e9\u7761\u65e9\u8d77", | |
| "\u4fdd\u6301\u826f\u597d\u7684\u5fc3\u6001\uff0c\u907f\u514d\u8fc7\u5ea6\u7126\u8651\u548c\u538b\u529b", | |
| "\u5b9a\u671f\u8fdb\u884c\u4f53\u68c0\uff0c\u53ca\u65f6\u53d1\u73b0\u548c\u9884\u9632\u75be\u75c5" | |
| ], | |
| "reward": [ | |
| 5, | |
| 5, | |
| 1, | |
| -2, | |
| 1 | |
| ] | |
| }, | |
| { | |
| "prompt": "116116116116116116116116116116116116116116116116116116116116116116116116116116116116116116116116116116116116116116116116116116116116116116116116116116116116116116116116116116116116116116116116116116116116116116116116116116116116116116116116116116116116116116116116116116116116116116116116116116116116116116116116116116116116116116116116116116116116", | |
| "completion": [ | |
| "\u5408\u7406\u5b89\u6392\u5de5\u4f5c\u4efb\u52a1\uff0c\u5236\u5b9a\u4f18\u5148\u7ea7", | |
| "\u907f\u514d\u591a\u4efb\u52a1\u5904\u7406\uff0c\u4e13\u6ce8\u5b8c\u6210\u4e00\u9879\u4efb\u52a1", | |
| "\u4f7f\u7528\u5de5\u5177\u548c\u8f6f\u4ef6\u63d0\u9ad8\u5de5\u4f5c\u81ea\u52a8\u5316\u7a0b\u5ea6", | |
| "\u5b9a\u671f\u4f11\u606f\uff0c\u907f\u514d\u957f\u65f6\u95f4\u8fde\u7eed\u5de5\u4f5c\u5bfc\u81f4\u75b2\u52b3", | |
| "\u4e0e\u540c\u4e8b\u6709\u6548\u6c9f\u901a\uff0c\u51cf\u5c11\u4e0d\u5fc5\u8981\u7684\u4f1a\u8bae\u548c\u5e72\u6270" | |
| ], | |
| "reward": [ | |
| 1, | |
| 2, | |
| -3, | |
| -3, | |
| -5 | |
| ] | |
| }, | |
| { | |
| "prompt": "117117117117117117117117117117117117117117117117117117117117117117117117117117117117117117117117117117117117117117117117117117117117117117117117117117117117117117117117117117117117117117117117117117117117117117117117117117117117117117117117117117117117117117117117117117117117117117117117117117117117117117117117117117117117117117117117117117117117117", | |
| "completion": [ | |
| "\u5c0a\u91cd\u4ed6\u4eba\uff0c\u503e\u542c\u4ed6\u4eba\u7684\u610f\u89c1\u548c\u60f3\u6cd5", | |
| "\u79ef\u6781\u6c9f\u901a\uff0c\u8868\u8fbe\u81ea\u5df1\u7684\u611f\u53d7\u548c\u9700\u6c42", | |
| "\u4e50\u4e8e\u52a9\u4eba\uff0c\u5173\u5fc3\u4ed6\u4eba\u7684\u56f0\u96be\u548c\u95ee\u9898", | |
| "\u4fdd\u6301\u8bda\u4fe1\uff0c\u9075\u5b88\u627f\u8bfa\u548c\u7ea6\u5b9a", | |
| "\u53c2\u4e0e\u793e\u4ea4\u6d3b\u52a8\uff0c\u6269\u5927\u81ea\u5df1\u7684\u793e\u4ea4\u5708\u5b50" | |
| ], | |
| "reward": [ | |
| -2, | |
| -4, | |
| -4, | |
| 4, | |
| -5 | |
| ] | |
| }, | |
| { | |
| "prompt": "118118118118118118118118118118118118118118118118118118118118118118118118118118118118118118118118118118118118118118118118118118118118118118118118118118118118118118118118118118118118118118118118118118118118118118118118118118118118118118118118118118118118118118118118118118118118118118118118118118118118118118118118118118118118118118118118118118118118118118", | |
| "completion": [ | |
| "\u8fdb\u884c\u653e\u677e\u8bad\u7ec3\uff0c\u5982\u6df1\u547c\u5438\u3001\u51a5\u60f3\u7b49", | |
| "\u9002\u5f53\u8fdb\u884c\u4f53\u80b2\u953b\u70bc\uff0c\u91ca\u653e\u538b\u529b", | |
| "\u4e0e\u670b\u53cb\u6216\u5bb6\u4eba\u4ea4\u6d41\uff0c\u5bfb\u6c42\u652f\u6301\u548c\u5e2e\u52a9", | |
| "\u5408\u7406\u5b89\u6392\u65f6\u95f4\uff0c\u907f\u514d\u8fc7\u5ea6\u5de5\u4f5c\u548c\u5b66\u4e60", | |
| "\u57f9\u517b\u5174\u8da3\u7231\u597d\uff0c\u8f6c\u79fb\u6ce8\u610f\u529b" | |
| ], | |
| "reward": [ | |
| 3, | |
| 5, | |
| -4, | |
| 1, | |
| -5 | |
| ] | |
| }, | |
| { | |
| "prompt": "119119119119119119119119119119119119119119119119119119119119119119119119119119119119119119119119119119119119119119119119119119119119119119119119119119119119119119119119119119119119119119119119119119119119119119119119119119119119119119119119119119119119119119119119119119119119119119119119119119119119119119119119119119119119119119119119119119119119119119119", | |
| "completion": [ | |
| "\u5747\u8861\u996e\u98df\uff0c\u591a\u5403\u852c\u83dc\u6c34\u679c\uff0c\u5c11\u5403\u6cb9\u817b\u548c\u9ad8\u7cd6\u98df\u7269", | |
| "\u5b9a\u671f\u8fdb\u884c\u4f53\u80b2\u953b\u70bc\uff0c\u5982\u8dd1\u6b65\u3001\u6e38\u6cf3\u3001\u5065\u8eab\u7b49", | |
| "\u4fdd\u6301\u89c4\u5f8b\u7684\u4f5c\u606f\u65f6\u95f4\uff0c\u65e9\u7761\u65e9\u8d77", | |
| "\u4fdd\u6301\u826f\u597d\u7684\u5fc3\u6001\uff0c\u907f\u514d\u8fc7\u5ea6\u7126\u8651\u548c\u538b\u529b", | |
| "\u5b9a\u671f\u8fdb\u884c\u4f53\u68c0\uff0c\u53ca\u65f6\u53d1\u73b0\u548c\u9884\u9632\u75be\u75c5" | |
| ], | |
| "reward": [ | |
| 0, | |
| 5, | |
| -2, | |
| -5, | |
| 3 | |
| ] | |
| }, | |
| { | |
| "prompt": "120120120120120120120120120120120120120120120120120120120120120120120120120120120120120120120120120120120120120120120120120120120120120120120120120120120120120120120120120120120120120120120120120120120120120120120120120120120120120120120120120120120120120120120120120120120120120120120120120120120120120120120120120120120120120120120120120120120120120120120120", | |
| "completion": [ | |
| "\u5408\u7406\u5b89\u6392\u5de5\u4f5c\u4efb\u52a1\uff0c\u5236\u5b9a\u4f18\u5148\u7ea7", | |
| "\u907f\u514d\u591a\u4efb\u52a1\u5904\u7406\uff0c\u4e13\u6ce8\u5b8c\u6210\u4e00\u9879\u4efb\u52a1", | |
| "\u4f7f\u7528\u5de5\u5177\u548c\u8f6f\u4ef6\u63d0\u9ad8\u5de5\u4f5c\u81ea\u52a8\u5316\u7a0b\u5ea6", | |
| "\u5b9a\u671f\u4f11\u606f\uff0c\u907f\u514d\u957f\u65f6\u95f4\u8fde\u7eed\u5de5\u4f5c\u5bfc\u81f4\u75b2\u52b3", | |
| "\u4e0e\u540c\u4e8b\u6709\u6548\u6c9f\u901a\uff0c\u51cf\u5c11\u4e0d\u5fc5\u8981\u7684\u4f1a\u8bae\u548c\u5e72\u6270" | |
| ], | |
| "reward": [ | |
| 2, | |
| -3, | |
| 1, | |
| 5, | |
| 4 | |
| ] | |
| }, | |
| { | |
| "prompt": "121121121121121121121121121121121121121121121121121121121121121121121121121121121121121121121121121121121121121121121121121121121121121121121121121121121121121121121121121121121121121121121121121121121121121121121121121121121121121121121121121121121121121121121121121121121121121121121121121121121121121121121121121121121121121121121121121121121121121121121121121", | |
| "completion": [ | |
| "\u5c0a\u91cd\u4ed6\u4eba\uff0c\u503e\u542c\u4ed6\u4eba\u7684\u610f\u89c1\u548c\u60f3\u6cd5", | |
| "\u79ef\u6781\u6c9f\u901a\uff0c\u8868\u8fbe\u81ea\u5df1\u7684\u611f\u53d7\u548c\u9700\u6c42", | |
| "\u4e50\u4e8e\u52a9\u4eba\uff0c\u5173\u5fc3\u4ed6\u4eba\u7684\u56f0\u96be\u548c\u95ee\u9898", | |
| "\u4fdd\u6301\u8bda\u4fe1\uff0c\u9075\u5b88\u627f\u8bfa\u548c\u7ea6\u5b9a", | |
| "\u53c2\u4e0e\u793e\u4ea4\u6d3b\u52a8\uff0c\u6269\u5927\u81ea\u5df1\u7684\u793e\u4ea4\u5708\u5b50" | |
| ], | |
| "reward": [ | |
| 3, | |
| 5, | |
| -2, | |
| -2, | |
| 4 | |
| ] | |
| }, | |
| { | |
| "prompt": "122122122122122122122122122122122122122122122122122122122122122122122122122122122122122122122122122122122122122122122122122122122122122122122122122122122122122122122122122122122122122122122122122122122122122122122122122122122122122122122122122122122122122122122122122122122122122122122122122122122122122122122122122122122122122122122122122122122122122122122122122122", | |
| "completion": [ | |
| "\u8fdb\u884c\u653e\u677e\u8bad\u7ec3\uff0c\u5982\u6df1\u547c\u5438\u3001\u51a5\u60f3\u7b49", | |
| "\u9002\u5f53\u8fdb\u884c\u4f53\u80b2\u953b\u70bc\uff0c\u91ca\u653e\u538b\u529b", | |
| "\u4e0e\u670b\u53cb\u6216\u5bb6\u4eba\u4ea4\u6d41\uff0c\u5bfb\u6c42\u652f\u6301\u548c\u5e2e\u52a9", | |
| "\u5408\u7406\u5b89\u6392\u65f6\u95f4\uff0c\u907f\u514d\u8fc7\u5ea6\u5de5\u4f5c\u548c\u5b66\u4e60", | |
| "\u57f9\u517b\u5174\u8da3\u7231\u597d\uff0c\u8f6c\u79fb\u6ce8\u610f\u529b" | |
| ], | |
| "reward": [ | |
| -2, | |
| 1, | |
| 0, | |
| -3, | |
| 1 | |
| ] | |
| }, | |
| { | |
| "prompt": "123123123123123123123123123123123123123123123123123123123123123123123123123123123123123123123123123123123123123123123123123123123123123123123123123123123123123123123123123123123123123123123123123123123123123123123123123123123123123123123123123123123123123123123123123123123123123123123123123123123123123123123123123123123123123123123123123123123123123123123123123123123", | |
| "completion": [ | |
| "\u5747\u8861\u996e\u98df\uff0c\u591a\u5403\u852c\u83dc\u6c34\u679c\uff0c\u5c11\u5403\u6cb9\u817b\u548c\u9ad8\u7cd6\u98df\u7269", | |
| "\u5b9a\u671f\u8fdb\u884c\u4f53\u80b2\u953b\u70bc\uff0c\u5982\u8dd1\u6b65\u3001\u6e38\u6cf3\u3001\u5065\u8eab\u7b49", | |
| "\u4fdd\u6301\u89c4\u5f8b\u7684\u4f5c\u606f\u65f6\u95f4\uff0c\u65e9\u7761\u65e9\u8d77", | |
| "\u4fdd\u6301\u826f\u597d\u7684\u5fc3\u6001\uff0c\u907f\u514d\u8fc7\u5ea6\u7126\u8651\u548c\u538b\u529b", | |
| "\u5b9a\u671f\u8fdb\u884c\u4f53\u68c0\uff0c\u53ca\u65f6\u53d1\u73b0\u548c\u9884\u9632\u75be\u75c5" | |
| ], | |
| "reward": [ | |
| 3, | |
| 1, | |
| -1, | |
| -1, | |
| -1 | |
| ] | |
| }, | |
| { | |
| "prompt": "124124124124124124124124124124124124124124124124124124124124124124124124124124124124124124124124124124124124124124124124124124124124124124124124124124124124124124124124124124124124124124124124124124124124124124124124124124124124124124124124124124124124124124124124124124124124124124124124124124124124124124124124124124124124124124124124124124124124124124124124124124124124", | |
| "completion": [ | |
| "\u5408\u7406\u5b89\u6392\u5de5\u4f5c\u4efb\u52a1\uff0c\u5236\u5b9a\u4f18\u5148\u7ea7", | |
| "\u907f\u514d\u591a\u4efb\u52a1\u5904\u7406\uff0c\u4e13\u6ce8\u5b8c\u6210\u4e00\u9879\u4efb\u52a1", | |
| "\u4f7f\u7528\u5de5\u5177\u548c\u8f6f\u4ef6\u63d0\u9ad8\u5de5\u4f5c\u81ea\u52a8\u5316\u7a0b\u5ea6", | |
| "\u5b9a\u671f\u4f11\u606f\uff0c\u907f\u514d\u957f\u65f6\u95f4\u8fde\u7eed\u5de5\u4f5c\u5bfc\u81f4\u75b2\u52b3", | |
| "\u4e0e\u540c\u4e8b\u6709\u6548\u6c9f\u901a\uff0c\u51cf\u5c11\u4e0d\u5fc5\u8981\u7684\u4f1a\u8bae\u548c\u5e72\u6270" | |
| ], | |
| "reward": [ | |
| 0, | |
| -2, | |
| -5, | |
| 4, | |
| 3 | |
| ] | |
| }, | |
| { | |
| "prompt": "125125125125125125125125125125125125125125125125125125125125125125125125125125125125125125125125125125125125125125125125125125125125125125125125125125125125125125125125125125125125125125125125125125125125125125125125125125125125125125125125125125125125125125125125125125125125125125125125125125125125125125125125125125125125125125125125125125125125125125125125125125125125125", | |
| "completion": [ | |
| "\u5c0a\u91cd\u4ed6\u4eba\uff0c\u503e\u542c\u4ed6\u4eba\u7684\u610f\u89c1\u548c\u60f3\u6cd5", | |
| "\u79ef\u6781\u6c9f\u901a\uff0c\u8868\u8fbe\u81ea\u5df1\u7684\u611f\u53d7\u548c\u9700\u6c42", | |
| "\u4e50\u4e8e\u52a9\u4eba\uff0c\u5173\u5fc3\u4ed6\u4eba\u7684\u56f0\u96be\u548c\u95ee\u9898", | |
| "\u4fdd\u6301\u8bda\u4fe1\uff0c\u9075\u5b88\u627f\u8bfa\u548c\u7ea6\u5b9a", | |
| "\u53c2\u4e0e\u793e\u4ea4\u6d3b\u52a8\uff0c\u6269\u5927\u81ea\u5df1\u7684\u793e\u4ea4\u5708\u5b50" | |
| ], | |
| "reward": [ | |
| -3, | |
| -2, | |
| 1, | |
| 1, | |
| -2 | |
| ] | |
| }, | |
| { | |
| "prompt": "126126126126126126126126126126126126126126126126126126126126126126126126126126126126126126126126126126126126126126126126126126126126126126126126126126126126126126126126126126126126126126126126126126126126126126126126126126126126126126126126126126126126126126126126126126126126126126126126126126126126126126126126126126126126126126126126126126126126126126126126126126126126126126", | |
| "completion": [ | |
| "\u8fdb\u884c\u653e\u677e\u8bad\u7ec3\uff0c\u5982\u6df1\u547c\u5438\u3001\u51a5\u60f3\u7b49", | |
| "\u9002\u5f53\u8fdb\u884c\u4f53\u80b2\u953b\u70bc\uff0c\u91ca\u653e\u538b\u529b", | |
| "\u4e0e\u670b\u53cb\u6216\u5bb6\u4eba\u4ea4\u6d41\uff0c\u5bfb\u6c42\u652f\u6301\u548c\u5e2e\u52a9", | |
| "\u5408\u7406\u5b89\u6392\u65f6\u95f4\uff0c\u907f\u514d\u8fc7\u5ea6\u5de5\u4f5c\u548c\u5b66\u4e60", | |
| "\u57f9\u517b\u5174\u8da3\u7231\u597d\uff0c\u8f6c\u79fb\u6ce8\u610f\u529b" | |
| ], | |
| "reward": [ | |
| -4, | |
| 1, | |
| 2, | |
| 2, | |
| 2 | |
| ] | |
| }, | |
| { | |
| "prompt": "127127127127127127127127127127127127127127127127127127127127127127127127127127127127127127127127127127127127127127127127127127127127127127127127127127127127127127127127127127127127127127127127127127127127127127127127127127127127127127127127127127127127127127127127127127127127127127127127127127127127127127127127127127127127127127127127127127127127127127127127127127127127127127127", | |
| "completion": [ | |
| "\u5747\u8861\u996e\u98df\uff0c\u591a\u5403\u852c\u83dc\u6c34\u679c\uff0c\u5c11\u5403\u6cb9\u817b\u548c\u9ad8\u7cd6\u98df\u7269", | |
| "\u5b9a\u671f\u8fdb\u884c\u4f53\u80b2\u953b\u70bc\uff0c\u5982\u8dd1\u6b65\u3001\u6e38\u6cf3\u3001\u5065\u8eab\u7b49", | |
| "\u4fdd\u6301\u89c4\u5f8b\u7684\u4f5c\u606f\u65f6\u95f4\uff0c\u65e9\u7761\u65e9\u8d77", | |
| "\u4fdd\u6301\u826f\u597d\u7684\u5fc3\u6001\uff0c\u907f\u514d\u8fc7\u5ea6\u7126\u8651\u548c\u538b\u529b", | |
| "\u5b9a\u671f\u8fdb\u884c\u4f53\u68c0\uff0c\u53ca\u65f6\u53d1\u73b0\u548c\u9884\u9632\u75be\u75c5" | |
| ], | |
| "reward": [ | |
| -5, | |
| -3, | |
| -2, | |
| -5, | |
| -2 | |
| ] | |
| }, | |
| { | |
| "prompt": "128128128128128128128128128128128128128128128128128128128128128128128128128128128128128128128128128128128128128128128128128128128128128128128128128128128128128128128128128128128128128128128128128128128128128128128128128128128128128128128128128128128128128128128128128128128128128128128128128128128128128128128128128128128128128128128128128128128128128128128128128128128128128128128128", | |
| "completion": [ | |
| "\u5408\u7406\u5b89\u6392\u5de5\u4f5c\u4efb\u52a1\uff0c\u5236\u5b9a\u4f18\u5148\u7ea7", | |
| "\u907f\u514d\u591a\u4efb\u52a1\u5904\u7406\uff0c\u4e13\u6ce8\u5b8c\u6210\u4e00\u9879\u4efb\u52a1", | |
| "\u4f7f\u7528\u5de5\u5177\u548c\u8f6f\u4ef6\u63d0\u9ad8\u5de5\u4f5c\u81ea\u52a8\u5316\u7a0b\u5ea6", | |
| "\u5b9a\u671f\u4f11\u606f\uff0c\u907f\u514d\u957f\u65f6\u95f4\u8fde\u7eed\u5de5\u4f5c\u5bfc\u81f4\u75b2\u52b3", | |
| "\u4e0e\u540c\u4e8b\u6709\u6548\u6c9f\u901a\uff0c\u51cf\u5c11\u4e0d\u5fc5\u8981\u7684\u4f1a\u8bae\u548c\u5e72\u6270" | |
| ], | |
| "reward": [ | |
| -3, | |
| 5, | |
| 0, | |
| -3, | |
| 1 | |
| ] | |
| }, | |
| { | |
| "prompt": "129129129129129129129129129129129129129129129129129129129129129129129129129129129129129129129129129129129129129129129129129129129129129129129129129129129129129129129129129129129129129129129129129129129129129129129129129129129129129129129129129129129129129129129129129129129129129129129129129129129129129129129129129129129129129129129129129129129129129129129129129129129129129129129129129", | |
| "completion": [ | |
| "\u5c0a\u91cd\u4ed6\u4eba\uff0c\u503e\u542c\u4ed6\u4eba\u7684\u610f\u89c1\u548c\u60f3\u6cd5", | |
| "\u79ef\u6781\u6c9f\u901a\uff0c\u8868\u8fbe\u81ea\u5df1\u7684\u611f\u53d7\u548c\u9700\u6c42", | |
| "\u4e50\u4e8e\u52a9\u4eba\uff0c\u5173\u5fc3\u4ed6\u4eba\u7684\u56f0\u96be\u548c\u95ee\u9898", | |
| "\u4fdd\u6301\u8bda\u4fe1\uff0c\u9075\u5b88\u627f\u8bfa\u548c\u7ea6\u5b9a", | |
| "\u53c2\u4e0e\u793e\u4ea4\u6d3b\u52a8\uff0c\u6269\u5927\u81ea\u5df1\u7684\u793e\u4ea4\u5708\u5b50" | |
| ], | |
| "reward": [ | |
| -5, | |
| -5, | |
| -4, | |
| -2, | |
| 3 | |
| ] | |
| }, | |
| { | |
| "prompt": "130130130130130130130130130130130130130130130130130130130130130130130130130130130130130130130130130130130130130130130130130130130130130130130130130130130130130130130130130130130130130130130130130130130130130130130130130130130130130130130130130130130130130130130130130130130130130130130130130130130130130130130130130130130130130130130130130130130130130130130130130130130130130130130130130130", | |
| "completion": [ | |
| "\u8fdb\u884c\u653e\u677e\u8bad\u7ec3\uff0c\u5982\u6df1\u547c\u5438\u3001\u51a5\u60f3\u7b49", | |
| "\u9002\u5f53\u8fdb\u884c\u4f53\u80b2\u953b\u70bc\uff0c\u91ca\u653e\u538b\u529b", | |
| "\u4e0e\u670b\u53cb\u6216\u5bb6\u4eba\u4ea4\u6d41\uff0c\u5bfb\u6c42\u652f\u6301\u548c\u5e2e\u52a9", | |
| "\u5408\u7406\u5b89\u6392\u65f6\u95f4\uff0c\u907f\u514d\u8fc7\u5ea6\u5de5\u4f5c\u548c\u5b66\u4e60", | |
| "\u57f9\u517b\u5174\u8da3\u7231\u597d\uff0c\u8f6c\u79fb\u6ce8\u610f\u529b" | |
| ], | |
| "reward": [ | |
| 3, | |
| -5, | |
| 2, | |
| 1, | |
| 1 | |
| ] | |
| }, | |
| { | |
| "prompt": "131131131131131131131131131131131131131131131131131131131131131131131131131131131131131131131131131131131131131131131131131131131131131131131131131131131131131131131131131131131131131131131131131131131131131131131131131131131131131131131131131131131131131131131131131131131131131131131131131131131131131131131131131131131131131131131131131131131131131131131131131131131131131131131131131131131", | |
| "completion": [ | |
| "\u5747\u8861\u996e\u98df\uff0c\u591a\u5403\u852c\u83dc\u6c34\u679c\uff0c\u5c11\u5403\u6cb9\u817b\u548c\u9ad8\u7cd6\u98df\u7269", | |
| "\u5b9a\u671f\u8fdb\u884c\u4f53\u80b2\u953b\u70bc\uff0c\u5982\u8dd1\u6b65\u3001\u6e38\u6cf3\u3001\u5065\u8eab\u7b49", | |
| "\u4fdd\u6301\u89c4\u5f8b\u7684\u4f5c\u606f\u65f6\u95f4\uff0c\u65e9\u7761\u65e9\u8d77", | |
| "\u4fdd\u6301\u826f\u597d\u7684\u5fc3\u6001\uff0c\u907f\u514d\u8fc7\u5ea6\u7126\u8651\u548c\u538b\u529b", | |
| "\u5b9a\u671f\u8fdb\u884c\u4f53\u68c0\uff0c\u53ca\u65f6\u53d1\u73b0\u548c\u9884\u9632\u75be\u75c5" | |
| ], | |
| "reward": [ | |
| -1, | |
| 2, | |
| -4, | |
| -4, | |
| -3 | |
| ] | |
| }, | |
| { | |
| "prompt": "132132132132132132132132132132132132132132132132132132132132132132132132132132132132132132132132132132132132132132132132132132132132132132132132132132132132132132132132132132132132132132132132132132132132132132132132132132132132132132132132132132132132132132132132132132132132132132132132132132132132132132132132132132132132132132132132132132132132132132132132132132132132132132132132132132132132", | |
| "completion": [ | |
| "\u5408\u7406\u5b89\u6392\u5de5\u4f5c\u4efb\u52a1\uff0c\u5236\u5b9a\u4f18\u5148\u7ea7", | |
| "\u907f\u514d\u591a\u4efb\u52a1\u5904\u7406\uff0c\u4e13\u6ce8\u5b8c\u6210\u4e00\u9879\u4efb\u52a1", | |
| "\u4f7f\u7528\u5de5\u5177\u548c\u8f6f\u4ef6\u63d0\u9ad8\u5de5\u4f5c\u81ea\u52a8\u5316\u7a0b\u5ea6", | |
| "\u5b9a\u671f\u4f11\u606f\uff0c\u907f\u514d\u957f\u65f6\u95f4\u8fde\u7eed\u5de5\u4f5c\u5bfc\u81f4\u75b2\u52b3", | |
| "\u4e0e\u540c\u4e8b\u6709\u6548\u6c9f\u901a\uff0c\u51cf\u5c11\u4e0d\u5fc5\u8981\u7684\u4f1a\u8bae\u548c\u5e72\u6270" | |
| ], | |
| "reward": [ | |
| -1, | |
| -3, | |
| -2, | |
| 2, | |
| -3 | |
| ] | |
| }, | |
| { | |
| "prompt": "133133133133133133133133133133133133133133133133133133133133133133133133133133133133133133133133133133133133133133133133133133133133133133133133133133133133133133133133133133133133133133133133133133133133133133133133133133133133133133133133133133133133133133133133133133133133133133133133133133133133133133133133133133133133133133133133133133133133133133133133133133133133133133133133133133133133133", | |
| "completion": [ | |
| "\u5c0a\u91cd\u4ed6\u4eba\uff0c\u503e\u542c\u4ed6\u4eba\u7684\u610f\u89c1\u548c\u60f3\u6cd5", | |
| "\u79ef\u6781\u6c9f\u901a\uff0c\u8868\u8fbe\u81ea\u5df1\u7684\u611f\u53d7\u548c\u9700\u6c42", | |
| "\u4e50\u4e8e\u52a9\u4eba\uff0c\u5173\u5fc3\u4ed6\u4eba\u7684\u56f0\u96be\u548c\u95ee\u9898", | |
| "\u4fdd\u6301\u8bda\u4fe1\uff0c\u9075\u5b88\u627f\u8bfa\u548c\u7ea6\u5b9a", | |
| "\u53c2\u4e0e\u793e\u4ea4\u6d3b\u52a8\uff0c\u6269\u5927\u81ea\u5df1\u7684\u793e\u4ea4\u5708\u5b50" | |
| ], | |
| "reward": [ | |
| -3, | |
| 5, | |
| -2, | |
| -2, | |
| -3 | |
| ] | |
| }, | |
| { | |
| "prompt": "134134134134134134134134134134134134134134134134134134134134134134134134134134134134134134134134134134134134134134134134134134134134134134134134134134134134134134134134134134134134134134134134134134134134134134134134134134134134134134134134134134134134134134134134134134134134134134134134134134134134134134134134134134134134134134134134134134134134134134134134134134134134134134134134134134134134134134", | |
| "completion": [ | |
| "\u8fdb\u884c\u653e\u677e\u8bad\u7ec3\uff0c\u5982\u6df1\u547c\u5438\u3001\u51a5\u60f3\u7b49", | |
| "\u9002\u5f53\u8fdb\u884c\u4f53\u80b2\u953b\u70bc\uff0c\u91ca\u653e\u538b\u529b", | |
| "\u4e0e\u670b\u53cb\u6216\u5bb6\u4eba\u4ea4\u6d41\uff0c\u5bfb\u6c42\u652f\u6301\u548c\u5e2e\u52a9", | |
| "\u5408\u7406\u5b89\u6392\u65f6\u95f4\uff0c\u907f\u514d\u8fc7\u5ea6\u5de5\u4f5c\u548c\u5b66\u4e60", | |
| "\u57f9\u517b\u5174\u8da3\u7231\u597d\uff0c\u8f6c\u79fb\u6ce8\u610f\u529b" | |
| ], | |
| "reward": [ | |
| -1, | |
| -1, | |
| 1, | |
| 1, | |
| -2 | |
| ] | |
| }, | |
| { | |
| "prompt": "135135135135135135135135135135135135135135135135135135135135135135135135135135135135135135135135135135135135135135135135135135135135135135135135135135135135135135135135135135135135135135135135135135135135135135135135135135135135135135135135135135135135135135135135135135135135135135135135135135135135135135135135135135135135135135135135135135135135135135135135135135135135135135135135135135135135135135135", | |
| "completion": [ | |
| "\u5747\u8861\u996e\u98df\uff0c\u591a\u5403\u852c\u83dc\u6c34\u679c\uff0c\u5c11\u5403\u6cb9\u817b\u548c\u9ad8\u7cd6\u98df\u7269", | |
| "\u5b9a\u671f\u8fdb\u884c\u4f53\u80b2\u953b\u70bc\uff0c\u5982\u8dd1\u6b65\u3001\u6e38\u6cf3\u3001\u5065\u8eab\u7b49", | |
| "\u4fdd\u6301\u89c4\u5f8b\u7684\u4f5c\u606f\u65f6\u95f4\uff0c\u65e9\u7761\u65e9\u8d77", | |
| "\u4fdd\u6301\u826f\u597d\u7684\u5fc3\u6001\uff0c\u907f\u514d\u8fc7\u5ea6\u7126\u8651\u548c\u538b\u529b", | |
| "\u5b9a\u671f\u8fdb\u884c\u4f53\u68c0\uff0c\u53ca\u65f6\u53d1\u73b0\u548c\u9884\u9632\u75be\u75c5" | |
| ], | |
| "reward": [ | |
| 1, | |
| -3, | |
| -5, | |
| -1, | |
| -5 | |
| ] | |
| }, | |
| { | |
| "prompt": "136136136136136136136136136136136136136136136136136136136136136136136136136136136136136136136136136136136136136136136136136136136136136136136136136136136136136136136136136136136136136136136136136136136136136136136136136136136136136136136136136136136136136136136136136136136136136136136136136136136136136136136136136136136136136136136136136136136136136136136136136136136136136136136136136136136136136136136136", | |
| "completion": [ | |
| "\u5408\u7406\u5b89\u6392\u5de5\u4f5c\u4efb\u52a1\uff0c\u5236\u5b9a\u4f18\u5148\u7ea7", | |
| "\u907f\u514d\u591a\u4efb\u52a1\u5904\u7406\uff0c\u4e13\u6ce8\u5b8c\u6210\u4e00\u9879\u4efb\u52a1", | |
| "\u4f7f\u7528\u5de5\u5177\u548c\u8f6f\u4ef6\u63d0\u9ad8\u5de5\u4f5c\u81ea\u52a8\u5316\u7a0b\u5ea6", | |
| "\u5b9a\u671f\u4f11\u606f\uff0c\u907f\u514d\u957f\u65f6\u95f4\u8fde\u7eed\u5de5\u4f5c\u5bfc\u81f4\u75b2\u52b3", | |
| "\u4e0e\u540c\u4e8b\u6709\u6548\u6c9f\u901a\uff0c\u51cf\u5c11\u4e0d\u5fc5\u8981\u7684\u4f1a\u8bae\u548c\u5e72\u6270" | |
| ], | |
| "reward": [ | |
| 2, | |
| -3, | |
| -3, | |
| -1, | |
| 3 | |
| ] | |
| }, | |
| { | |
| "prompt": "137137137137137137137137137137137137137137137137137137137137137137137137137137137137137137137137137137137137137137137137137137137137137137137137137137137137137137137137137137137137137137137137137137137137137137137137137137137137137137137137137137137137137137137137137137137137137137137137137137137137137137137137137137137137137137137137137137137137137137137137137137137137137137137137137137137137137137137137137", | |
| "completion": [ | |
| "\u5c0a\u91cd\u4ed6\u4eba\uff0c\u503e\u542c\u4ed6\u4eba\u7684\u610f\u89c1\u548c\u60f3\u6cd5", | |
| "\u79ef\u6781\u6c9f\u901a\uff0c\u8868\u8fbe\u81ea\u5df1\u7684\u611f\u53d7\u548c\u9700\u6c42", | |
| "\u4e50\u4e8e\u52a9\u4eba\uff0c\u5173\u5fc3\u4ed6\u4eba\u7684\u56f0\u96be\u548c\u95ee\u9898", | |
| "\u4fdd\u6301\u8bda\u4fe1\uff0c\u9075\u5b88\u627f\u8bfa\u548c\u7ea6\u5b9a", | |
| "\u53c2\u4e0e\u793e\u4ea4\u6d3b\u52a8\uff0c\u6269\u5927\u81ea\u5df1\u7684\u793e\u4ea4\u5708\u5b50" | |
| ], | |
| "reward": [ | |
| 1, | |
| 0, | |
| 3, | |
| -3, | |
| -5 | |
| ] | |
| }, | |
| { | |
| "prompt": "138138138138138138138138138138138138138138138138138138138138138138138138138138138138138138138138138138138138138138138138138138138138138138138138138138138138138138138138138138138138138138138138138138138138138138138138138138138138138138138138138138138138138138138138138138138138138138138138138138138138138138138138138138138138138138138138138138138138138138138138138138138138138138138138138138138138138138138138138138", | |
| "completion": [ | |
| "\u8fdb\u884c\u653e\u677e\u8bad\u7ec3\uff0c\u5982\u6df1\u547c\u5438\u3001\u51a5\u60f3\u7b49", | |
| "\u9002\u5f53\u8fdb\u884c\u4f53\u80b2\u953b\u70bc\uff0c\u91ca\u653e\u538b\u529b", | |
| "\u4e0e\u670b\u53cb\u6216\u5bb6\u4eba\u4ea4\u6d41\uff0c\u5bfb\u6c42\u652f\u6301\u548c\u5e2e\u52a9", | |
| "\u5408\u7406\u5b89\u6392\u65f6\u95f4\uff0c\u907f\u514d\u8fc7\u5ea6\u5de5\u4f5c\u548c\u5b66\u4e60", | |
| "\u57f9\u517b\u5174\u8da3\u7231\u597d\uff0c\u8f6c\u79fb\u6ce8\u610f\u529b" | |
| ], | |
| "reward": [ | |
| 5, | |
| -4, | |
| 5, | |
| -2, | |
| -4 | |
| ] | |
| }, | |
| { | |
| "prompt": "139139139139139139139139139139139139139139139139139139139139139139139139139139139139139139139139139139139139139139139139139139139139139139139139139139139139139139139139139139139139139139139139139139139139139139139139139139139139139139139139139139139139139139139139139139139139139139139139139139139139139139139139139139139139139139139139139139139139139139139139139139139139139139139139139139139139139139139139139139139", | |
| "completion": [ | |
| "\u5747\u8861\u996e\u98df\uff0c\u591a\u5403\u852c\u83dc\u6c34\u679c\uff0c\u5c11\u5403\u6cb9\u817b\u548c\u9ad8\u7cd6\u98df\u7269", | |
| "\u5b9a\u671f\u8fdb\u884c\u4f53\u80b2\u953b\u70bc\uff0c\u5982\u8dd1\u6b65\u3001\u6e38\u6cf3\u3001\u5065\u8eab\u7b49", | |
| "\u4fdd\u6301\u89c4\u5f8b\u7684\u4f5c\u606f\u65f6\u95f4\uff0c\u65e9\u7761\u65e9\u8d77", | |
| "\u4fdd\u6301\u826f\u597d\u7684\u5fc3\u6001\uff0c\u907f\u514d\u8fc7\u5ea6\u7126\u8651\u548c\u538b\u529b", | |
| "\u5b9a\u671f\u8fdb\u884c\u4f53\u68c0\uff0c\u53ca\u65f6\u53d1\u73b0\u548c\u9884\u9632\u75be\u75c5" | |
| ], | |
| "reward": [ | |
| 5, | |
| 1, | |
| -1, | |
| -1, | |
| -4 | |
| ] | |
| }, | |
| { | |
| "prompt": "140140140140140140140140140140140140140140140140140140140140140140140140140140140140140140140140140140140140140140140140140140140140140140140140140140140140140140140140140140140140140140140140140140140140140140140140140140140140140140140140140140140140140140140140140140140140140140140140140140140140140140140140140140140140140140140140140140140140140140140140140140140140140140140140140140140140140140140140140140140140", | |
| "completion": [ | |
| "\u5408\u7406\u5b89\u6392\u5de5\u4f5c\u4efb\u52a1\uff0c\u5236\u5b9a\u4f18\u5148\u7ea7", | |
| "\u907f\u514d\u591a\u4efb\u52a1\u5904\u7406\uff0c\u4e13\u6ce8\u5b8c\u6210\u4e00\u9879\u4efb\u52a1", | |
| "\u4f7f\u7528\u5de5\u5177\u548c\u8f6f\u4ef6\u63d0\u9ad8\u5de5\u4f5c\u81ea\u52a8\u5316\u7a0b\u5ea6", | |
| "\u5b9a\u671f\u4f11\u606f\uff0c\u907f\u514d\u957f\u65f6\u95f4\u8fde\u7eed\u5de5\u4f5c\u5bfc\u81f4\u75b2\u52b3", | |
| "\u4e0e\u540c\u4e8b\u6709\u6548\u6c9f\u901a\uff0c\u51cf\u5c11\u4e0d\u5fc5\u8981\u7684\u4f1a\u8bae\u548c\u5e72\u6270" | |
| ], | |
| "reward": [ | |
| 1, | |
| -1, | |
| -3, | |
| -2, | |
| -5 | |
| ] | |
| }, | |
| { | |
| "prompt": "141141141141141141141141141141141141141141141141141141141141141141141141141141141141141141141141141141141141141141141141141141141141141141141141141141141141141141141141141141141141141141141141141141141141141141141141141141141141141141141141141141141141141141141141141141141141141141141141141141141141141141141141141141141141141141141141141141141141141141141141141141141141141141141141141141141141141141141141141141141141141", | |
| "completion": [ | |
| "\u5c0a\u91cd\u4ed6\u4eba\uff0c\u503e\u542c\u4ed6\u4eba\u7684\u610f\u89c1\u548c\u60f3\u6cd5", | |
| "\u79ef\u6781\u6c9f\u901a\uff0c\u8868\u8fbe\u81ea\u5df1\u7684\u611f\u53d7\u548c\u9700\u6c42", | |
| "\u4e50\u4e8e\u52a9\u4eba\uff0c\u5173\u5fc3\u4ed6\u4eba\u7684\u56f0\u96be\u548c\u95ee\u9898", | |
| "\u4fdd\u6301\u8bda\u4fe1\uff0c\u9075\u5b88\u627f\u8bfa\u548c\u7ea6\u5b9a", | |
| "\u53c2\u4e0e\u793e\u4ea4\u6d3b\u52a8\uff0c\u6269\u5927\u81ea\u5df1\u7684\u793e\u4ea4\u5708\u5b50" | |
| ], | |
| "reward": [ | |
| -3, | |
| -3, | |
| -5, | |
| 0, | |
| 3 | |
| ] | |
| }, | |
| { | |
| "prompt": "142142142142142142142142142142142142142142142142142142142142142142142142142142142142142142142142142142142142142142142142142142142142142142142142142142142142142142142142142142142142142142142142142142142142142142142142142142142142142142142142142142142142142142142142142142142142142142142142142142142142142142142142142142142142142142142142142142142142142142142142142142142142142142142142142142142142142142142142142142142142142142", | |
| "completion": [ | |
| "\u8fdb\u884c\u653e\u677e\u8bad\u7ec3\uff0c\u5982\u6df1\u547c\u5438\u3001\u51a5\u60f3\u7b49", | |
| "\u9002\u5f53\u8fdb\u884c\u4f53\u80b2\u953b\u70bc\uff0c\u91ca\u653e\u538b\u529b", | |
| "\u4e0e\u670b\u53cb\u6216\u5bb6\u4eba\u4ea4\u6d41\uff0c\u5bfb\u6c42\u652f\u6301\u548c\u5e2e\u52a9", | |
| "\u5408\u7406\u5b89\u6392\u65f6\u95f4\uff0c\u907f\u514d\u8fc7\u5ea6\u5de5\u4f5c\u548c\u5b66\u4e60", | |
| "\u57f9\u517b\u5174\u8da3\u7231\u597d\uff0c\u8f6c\u79fb\u6ce8\u610f\u529b" | |
| ], | |
| "reward": [ | |
| 2, | |
| -1, | |
| -1, | |
| -4, | |
| -5 | |
| ] | |
| }, | |
| { | |
| "prompt": "143143143143143143143143143143143143143143143143143143143143143143143143143143143143143143143143143143143143143143143143143143143143143143143143143143143143143143143143143143143143143143143143143143143143143143143143143143143143143143143143143143143143143143143143143143143143143143143143143143143143143143143143143143143143143143143143143143143143143143143143143143143143143143143143143143143143143143143143143143143143143143143", | |
| "completion": [ | |
| "\u5747\u8861\u996e\u98df\uff0c\u591a\u5403\u852c\u83dc\u6c34\u679c\uff0c\u5c11\u5403\u6cb9\u817b\u548c\u9ad8\u7cd6\u98df\u7269", | |
| "\u5b9a\u671f\u8fdb\u884c\u4f53\u80b2\u953b\u70bc\uff0c\u5982\u8dd1\u6b65\u3001\u6e38\u6cf3\u3001\u5065\u8eab\u7b49", | |
| "\u4fdd\u6301\u89c4\u5f8b\u7684\u4f5c\u606f\u65f6\u95f4\uff0c\u65e9\u7761\u65e9\u8d77", | |
| "\u4fdd\u6301\u826f\u597d\u7684\u5fc3\u6001\uff0c\u907f\u514d\u8fc7\u5ea6\u7126\u8651\u548c\u538b\u529b", | |
| "\u5b9a\u671f\u8fdb\u884c\u4f53\u68c0\uff0c\u53ca\u65f6\u53d1\u73b0\u548c\u9884\u9632\u75be\u75c5" | |
| ], | |
| "reward": [ | |
| 5, | |
| 4, | |
| 1, | |
| -3, | |
| -1 | |
| ] | |
| }, | |
| { | |
| "prompt": "144144144144144144144144144144144144144144144144144144144144144144144144144144144144144144144144144144144144144144144144144144144144144144144144144144144144144144144144144144144144144144144144144144144144144144144144144144144144144144144144144144144144144144144144144144144144144144144144144144144144144144144144144144144144144144144144144144144144144144144144144144144144144144144144144144144144144144144144144144144144144144144144", | |
| "completion": [ | |
| "\u5408\u7406\u5b89\u6392\u5de5\u4f5c\u4efb\u52a1\uff0c\u5236\u5b9a\u4f18\u5148\u7ea7", | |
| "\u907f\u514d\u591a\u4efb\u52a1\u5904\u7406\uff0c\u4e13\u6ce8\u5b8c\u6210\u4e00\u9879\u4efb\u52a1", | |
| "\u4f7f\u7528\u5de5\u5177\u548c\u8f6f\u4ef6\u63d0\u9ad8\u5de5\u4f5c\u81ea\u52a8\u5316\u7a0b\u5ea6", | |
| "\u5b9a\u671f\u4f11\u606f\uff0c\u907f\u514d\u957f\u65f6\u95f4\u8fde\u7eed\u5de5\u4f5c\u5bfc\u81f4\u75b2\u52b3", | |
| "\u4e0e\u540c\u4e8b\u6709\u6548\u6c9f\u901a\uff0c\u51cf\u5c11\u4e0d\u5fc5\u8981\u7684\u4f1a\u8bae\u548c\u5e72\u6270" | |
| ], | |
| "reward": [ | |
| 4, | |
| 2, | |
| 5, | |
| -5, | |
| -2 | |
| ] | |
| }, | |
| { | |
| "prompt": "145145145145145145145145145145145145145145145145145145145145145145145145145145145145145145145145145145145145145145145145145145145145145145145145145145145145145145145145145145145145145145145145145145145145145145145145145145145145145145145145145145145145145145145145145145145145145145145145145145145145145145145145145145145145145145145145145145145145145145145145145145145145145145145145145145145145145145145145145145145145145145145145145", | |
| "completion": [ | |
| "\u5c0a\u91cd\u4ed6\u4eba\uff0c\u503e\u542c\u4ed6\u4eba\u7684\u610f\u89c1\u548c\u60f3\u6cd5", | |
| "\u79ef\u6781\u6c9f\u901a\uff0c\u8868\u8fbe\u81ea\u5df1\u7684\u611f\u53d7\u548c\u9700\u6c42", | |
| "\u4e50\u4e8e\u52a9\u4eba\uff0c\u5173\u5fc3\u4ed6\u4eba\u7684\u56f0\u96be\u548c\u95ee\u9898", | |
| "\u4fdd\u6301\u8bda\u4fe1\uff0c\u9075\u5b88\u627f\u8bfa\u548c\u7ea6\u5b9a", | |
| "\u53c2\u4e0e\u793e\u4ea4\u6d3b\u52a8\uff0c\u6269\u5927\u81ea\u5df1\u7684\u793e\u4ea4\u5708\u5b50" | |
| ], | |
| "reward": [ | |
| -3, | |
| 0, | |
| 2, | |
| 0, | |
| -3 | |
| ] | |
| }, | |
| { | |
| "prompt": "146146146146146146146146146146146146146146146146146146146146146146146146146146146146146146146146146146146146146146146146146146146146146146146146146146146146146146146146146146146146146146146146146146146146146146146146146146146146146146146146146146146146146146146146146146146146146146146146146146146146146146146146146146146146146146146146146146146146146146146146146146146146146146146146146146146146146146146146146146146146146146146146146146", | |
| "completion": [ | |
| "\u8fdb\u884c\u653e\u677e\u8bad\u7ec3\uff0c\u5982\u6df1\u547c\u5438\u3001\u51a5\u60f3\u7b49", | |
| "\u9002\u5f53\u8fdb\u884c\u4f53\u80b2\u953b\u70bc\uff0c\u91ca\u653e\u538b\u529b", | |
| "\u4e0e\u670b\u53cb\u6216\u5bb6\u4eba\u4ea4\u6d41\uff0c\u5bfb\u6c42\u652f\u6301\u548c\u5e2e\u52a9", | |
| "\u5408\u7406\u5b89\u6392\u65f6\u95f4\uff0c\u907f\u514d\u8fc7\u5ea6\u5de5\u4f5c\u548c\u5b66\u4e60", | |
| "\u57f9\u517b\u5174\u8da3\u7231\u597d\uff0c\u8f6c\u79fb\u6ce8\u610f\u529b" | |
| ], | |
| "reward": [ | |
| 1, | |
| 1, | |
| 2, | |
| -4, | |
| -5 | |
| ] | |
| }, | |
| { | |
| "prompt": "147147147147147147147147147147147147147147147147147147147147147147147147147147147147147147147147147147147147147147147147147147147147147147147147147147147147147147147147147147147147147147147147147147147147147147147147147147147147147147147147147147147147147147147147147147147147147147147147147147147147147147147147147147147147147147147147147147147147147147147147147147147147147147147147147147147147147147147147147147147147147147147147147147147", | |
| "completion": [ | |
| "\u5747\u8861\u996e\u98df\uff0c\u591a\u5403\u852c\u83dc\u6c34\u679c\uff0c\u5c11\u5403\u6cb9\u817b\u548c\u9ad8\u7cd6\u98df\u7269", | |
| "\u5b9a\u671f\u8fdb\u884c\u4f53\u80b2\u953b\u70bc\uff0c\u5982\u8dd1\u6b65\u3001\u6e38\u6cf3\u3001\u5065\u8eab\u7b49", | |
| "\u4fdd\u6301\u89c4\u5f8b\u7684\u4f5c\u606f\u65f6\u95f4\uff0c\u65e9\u7761\u65e9\u8d77", | |
| "\u4fdd\u6301\u826f\u597d\u7684\u5fc3\u6001\uff0c\u907f\u514d\u8fc7\u5ea6\u7126\u8651\u548c\u538b\u529b", | |
| "\u5b9a\u671f\u8fdb\u884c\u4f53\u68c0\uff0c\u53ca\u65f6\u53d1\u73b0\u548c\u9884\u9632\u75be\u75c5" | |
| ], | |
| "reward": [ | |
| 2, | |
| 4, | |
| 5, | |
| -5, | |
| 3 | |
| ] | |
| }, | |
| { | |
| "prompt": "148148148148148148148148148148148148148148148148148148148148148148148148148148148148148148148148148148148148148148148148148148148148148148148148148148148148148148148148148148148148148148148148148148148148148148148148148148148148148148148148148148148148148148148148148148148148148148148148148148148148148148148148148148148148148148148148148148148148148148148148148148148148148148148148148148148148148148148148148148148148148148148148148148148148", | |
| "completion": [ | |
| "\u5408\u7406\u5b89\u6392\u5de5\u4f5c\u4efb\u52a1\uff0c\u5236\u5b9a\u4f18\u5148\u7ea7", | |
| "\u907f\u514d\u591a\u4efb\u52a1\u5904\u7406\uff0c\u4e13\u6ce8\u5b8c\u6210\u4e00\u9879\u4efb\u52a1", | |
| "\u4f7f\u7528\u5de5\u5177\u548c\u8f6f\u4ef6\u63d0\u9ad8\u5de5\u4f5c\u81ea\u52a8\u5316\u7a0b\u5ea6", | |
| "\u5b9a\u671f\u4f11\u606f\uff0c\u907f\u514d\u957f\u65f6\u95f4\u8fde\u7eed\u5de5\u4f5c\u5bfc\u81f4\u75b2\u52b3", | |
| "\u4e0e\u540c\u4e8b\u6709\u6548\u6c9f\u901a\uff0c\u51cf\u5c11\u4e0d\u5fc5\u8981\u7684\u4f1a\u8bae\u548c\u5e72\u6270" | |
| ], | |
| "reward": [ | |
| 1, | |
| -1, | |
| 0, | |
| -4, | |
| 0 | |
| ] | |
| }, | |
| { | |
| "prompt": "149149149149149149149149149149149149149149149149149149149149149149149149149149149149149149149149149149149149149149149149149149149149149149149149149149149149149149149149149149149149149149149149149149149149149149149149149149149149149149149149149149149149149149149149149149149149149149149149149149149149149149149149149149149149149149149149149149149149149149149149149149149149149149149149149149149149149149149149149149149149149149149149149149149149149", | |
| "completion": [ | |
| "\u5c0a\u91cd\u4ed6\u4eba\uff0c\u503e\u542c\u4ed6\u4eba\u7684\u610f\u89c1\u548c\u60f3\u6cd5", | |
| "\u79ef\u6781\u6c9f\u901a\uff0c\u8868\u8fbe\u81ea\u5df1\u7684\u611f\u53d7\u548c\u9700\u6c42", | |
| "\u4e50\u4e8e\u52a9\u4eba\uff0c\u5173\u5fc3\u4ed6\u4eba\u7684\u56f0\u96be\u548c\u95ee\u9898", | |
| "\u4fdd\u6301\u8bda\u4fe1\uff0c\u9075\u5b88\u627f\u8bfa\u548c\u7ea6\u5b9a", | |
| "\u53c2\u4e0e\u793e\u4ea4\u6d3b\u52a8\uff0c\u6269\u5927\u81ea\u5df1\u7684\u793e\u4ea4\u5708\u5b50" | |
| ], | |
| "reward": [ | |
| -3, | |
| -2, | |
| -1, | |
| -4, | |
| 4 | |
| ] | |
| }, | |
| { | |
| "prompt": "150150150150150150150150150150150150150150150150150150150150150150150150150150150150150150150150150150150150150150150150150150150150150150150150150150150150150150150150150150150150150150150150150150150150150150150150150150150150150150150150150150150150150150150150150150150150150150150150150150150150150150150150150150150150150150150150150150150150150150150150150150150150150150150150150150150150150150150150150150150150150150150150150150150150150150", | |
| "completion": [ | |
| "\u8fdb\u884c\u653e\u677e\u8bad\u7ec3\uff0c\u5982\u6df1\u547c\u5438\u3001\u51a5\u60f3\u7b49", | |
| "\u9002\u5f53\u8fdb\u884c\u4f53\u80b2\u953b\u70bc\uff0c\u91ca\u653e\u538b\u529b", | |
| "\u4e0e\u670b\u53cb\u6216\u5bb6\u4eba\u4ea4\u6d41\uff0c\u5bfb\u6c42\u652f\u6301\u548c\u5e2e\u52a9", | |
| "\u5408\u7406\u5b89\u6392\u65f6\u95f4\uff0c\u907f\u514d\u8fc7\u5ea6\u5de5\u4f5c\u548c\u5b66\u4e60", | |
| "\u57f9\u517b\u5174\u8da3\u7231\u597d\uff0c\u8f6c\u79fb\u6ce8\u610f\u529b" | |
| ], | |
| "reward": [ | |
| -1, | |
| -3, | |
| -2, | |
| 1, | |
| 2 | |
| ] | |
| }, | |
| { | |
| "prompt": "151151151151151151151151151151151151151151151151151151151151151151151151151151151151151151151151151151151151151151151151151151151151151151151151151151151151151151151151151151151151151151151151151151151151151151151151151151151151151151151151151151151151151151151151151151151151151151151151151151151151151151151151151151151151151151151151151151151151151151151151151151151151151151151151151151151151151151151151151151151151151151151151151151151151151151151", | |
| "completion": [ | |
| "\u5747\u8861\u996e\u98df\uff0c\u591a\u5403\u852c\u83dc\u6c34\u679c\uff0c\u5c11\u5403\u6cb9\u817b\u548c\u9ad8\u7cd6\u98df\u7269", | |
| "\u5b9a\u671f\u8fdb\u884c\u4f53\u80b2\u953b\u70bc\uff0c\u5982\u8dd1\u6b65\u3001\u6e38\u6cf3\u3001\u5065\u8eab\u7b49", | |
| "\u4fdd\u6301\u89c4\u5f8b\u7684\u4f5c\u606f\u65f6\u95f4\uff0c\u65e9\u7761\u65e9\u8d77", | |
| "\u4fdd\u6301\u826f\u597d\u7684\u5fc3\u6001\uff0c\u907f\u514d\u8fc7\u5ea6\u7126\u8651\u548c\u538b\u529b", | |
| "\u5b9a\u671f\u8fdb\u884c\u4f53\u68c0\uff0c\u53ca\u65f6\u53d1\u73b0\u548c\u9884\u9632\u75be\u75c5" | |
| ], | |
| "reward": [ | |
| 0, | |
| -4, | |
| -3, | |
| -5, | |
| 1 | |
| ] | |
| }, | |
| { | |
| "prompt": "152152152152152152152152152152152152152152152152152152152152152152152152152152152152152152152152152152152152152152152152152152152152152152152152152152152152152152152152152152152152152152152152152152152152152152152152152152152152152152152152152152152152152152152152152152152152152152152152152152152152152152152152152152152152152152152152152152152152152152152152152152152152152152152152152152152152152152152152152152152152152152152152152152152152152152152152", | |
| "completion": [ | |
| "\u5408\u7406\u5b89\u6392\u5de5\u4f5c\u4efb\u52a1\uff0c\u5236\u5b9a\u4f18\u5148\u7ea7", | |
| "\u907f\u514d\u591a\u4efb\u52a1\u5904\u7406\uff0c\u4e13\u6ce8\u5b8c\u6210\u4e00\u9879\u4efb\u52a1", | |
| "\u4f7f\u7528\u5de5\u5177\u548c\u8f6f\u4ef6\u63d0\u9ad8\u5de5\u4f5c\u81ea\u52a8\u5316\u7a0b\u5ea6", | |
| "\u5b9a\u671f\u4f11\u606f\uff0c\u907f\u514d\u957f\u65f6\u95f4\u8fde\u7eed\u5de5\u4f5c\u5bfc\u81f4\u75b2\u52b3", | |
| "\u4e0e\u540c\u4e8b\u6709\u6548\u6c9f\u901a\uff0c\u51cf\u5c11\u4e0d\u5fc5\u8981\u7684\u4f1a\u8bae\u548c\u5e72\u6270" | |
| ], | |
| "reward": [ | |
| 5, | |
| 2, | |
| -3, | |
| 3, | |
| 0 | |
| ] | |
| }, | |
| { | |
| "prompt": "153153153153153153153153153153153153153153153153153153153153153153153153153153153153153153153153153153153153153153153153153153153153153153153153153153153153153153153153153153153153153153153153153153153153153153153153153153153153153153153153153153153153153153153153153153153153153153153153153153153153153153153153153153153153153153153153153153153153153153153153153153153153153153153153153153153153153153153153153153153153153153153153153153153153153153153153153", | |
| "completion": [ | |
| "\u5c0a\u91cd\u4ed6\u4eba\uff0c\u503e\u542c\u4ed6\u4eba\u7684\u610f\u89c1\u548c\u60f3\u6cd5", | |
| "\u79ef\u6781\u6c9f\u901a\uff0c\u8868\u8fbe\u81ea\u5df1\u7684\u611f\u53d7\u548c\u9700\u6c42", | |
| "\u4e50\u4e8e\u52a9\u4eba\uff0c\u5173\u5fc3\u4ed6\u4eba\u7684\u56f0\u96be\u548c\u95ee\u9898", | |
| "\u4fdd\u6301\u8bda\u4fe1\uff0c\u9075\u5b88\u627f\u8bfa\u548c\u7ea6\u5b9a", | |
| "\u53c2\u4e0e\u793e\u4ea4\u6d3b\u52a8\uff0c\u6269\u5927\u81ea\u5df1\u7684\u793e\u4ea4\u5708\u5b50" | |
| ], | |
| "reward": [ | |
| 5, | |
| -3, | |
| 2, | |
| -1, | |
| 5 | |
| ] | |
| }, | |
| { | |
| "prompt": "154154154154154154154154154154154154154154154154154154154154154154154154154154154154154154154154154154154154154154154154154154154154154154154154154154154154154154154154154154154154154154154154154154154154154154154154154154154154154154154154154154154154154154154154154154154154154154154154154154154154154154154154154154154154154154154154154154154154154154154154154154154154154154154154154154154154154154154154154154154154154154154154154154154154154154154154154154", | |
| "completion": [ | |
| "\u8fdb\u884c\u653e\u677e\u8bad\u7ec3\uff0c\u5982\u6df1\u547c\u5438\u3001\u51a5\u60f3\u7b49", | |
| "\u9002\u5f53\u8fdb\u884c\u4f53\u80b2\u953b\u70bc\uff0c\u91ca\u653e\u538b\u529b", | |
| "\u4e0e\u670b\u53cb\u6216\u5bb6\u4eba\u4ea4\u6d41\uff0c\u5bfb\u6c42\u652f\u6301\u548c\u5e2e\u52a9", | |
| "\u5408\u7406\u5b89\u6392\u65f6\u95f4\uff0c\u907f\u514d\u8fc7\u5ea6\u5de5\u4f5c\u548c\u5b66\u4e60", | |
| "\u57f9\u517b\u5174\u8da3\u7231\u597d\uff0c\u8f6c\u79fb\u6ce8\u610f\u529b" | |
| ], | |
| "reward": [ | |
| 1, | |
| 0, | |
| -5, | |
| -5, | |
| 2 | |
| ] | |
| }, | |
| { | |
| "prompt": "155155155155155155155155155155155155155155155155155155155155155155155155155155155155155155155155155155155155155155155155155155155155155155155155155155155155155155155155155155155155155155155155155155155155155155155155155155155155155155155155155155155155155155155155155155155155155155155155155155155155155155155155155155155155155155155155155155155155155155155155155155155155155155155155155155155155155155155155155155155155155155155155155155155155155155155155155155155", | |
| "completion": [ | |
| "\u5747\u8861\u996e\u98df\uff0c\u591a\u5403\u852c\u83dc\u6c34\u679c\uff0c\u5c11\u5403\u6cb9\u817b\u548c\u9ad8\u7cd6\u98df\u7269", | |
| "\u5b9a\u671f\u8fdb\u884c\u4f53\u80b2\u953b\u70bc\uff0c\u5982\u8dd1\u6b65\u3001\u6e38\u6cf3\u3001\u5065\u8eab\u7b49", | |
| "\u4fdd\u6301\u89c4\u5f8b\u7684\u4f5c\u606f\u65f6\u95f4\uff0c\u65e9\u7761\u65e9\u8d77", | |
| "\u4fdd\u6301\u826f\u597d\u7684\u5fc3\u6001\uff0c\u907f\u514d\u8fc7\u5ea6\u7126\u8651\u548c\u538b\u529b", | |
| "\u5b9a\u671f\u8fdb\u884c\u4f53\u68c0\uff0c\u53ca\u65f6\u53d1\u73b0\u548c\u9884\u9632\u75be\u75c5" | |
| ], | |
| "reward": [ | |
| -4, | |
| -4, | |
| 3, | |
| 0, | |
| 5 | |
| ] | |
| }, | |
| { | |
| "prompt": "156156156156156156156156156156156156156156156156156156156156156156156156156156156156156156156156156156156156156156156156156156156156156156156156156156156156156156156156156156156156156156156156156156156156156156156156156156156156156156156156156156156156156156156156156156156156156156156156156156156156156156156156156156156156156156156156156156156156156156156156156156156156156156156156156156156156156156156156156156156156156156156156156156156156156156156156156156156156", | |
| "completion": [ | |
| "\u5408\u7406\u5b89\u6392\u5de5\u4f5c\u4efb\u52a1\uff0c\u5236\u5b9a\u4f18\u5148\u7ea7", | |
| "\u907f\u514d\u591a\u4efb\u52a1\u5904\u7406\uff0c\u4e13\u6ce8\u5b8c\u6210\u4e00\u9879\u4efb\u52a1", | |
| "\u4f7f\u7528\u5de5\u5177\u548c\u8f6f\u4ef6\u63d0\u9ad8\u5de5\u4f5c\u81ea\u52a8\u5316\u7a0b\u5ea6", | |
| "\u5b9a\u671f\u4f11\u606f\uff0c\u907f\u514d\u957f\u65f6\u95f4\u8fde\u7eed\u5de5\u4f5c\u5bfc\u81f4\u75b2\u52b3", | |
| "\u4e0e\u540c\u4e8b\u6709\u6548\u6c9f\u901a\uff0c\u51cf\u5c11\u4e0d\u5fc5\u8981\u7684\u4f1a\u8bae\u548c\u5e72\u6270" | |
| ], | |
| "reward": [ | |
| 4, | |
| -1, | |
| -5, | |
| -4, | |
| 5 | |
| ] | |
| }, | |
| { | |
| "prompt": "157157157157157157157157157157157157157157157157157157157157157157157157157157157157157157157157157157157157157157157157157157157157157157157157157157157157157157157157157157157157157157157157157157157157157157157157157157157157157157157157157157157157157157157157157157157157157157157157157157157157157157157157157157157157157157157157157157157157157157157157157157157157157157157157157157157157157157157157157157157157157157157157157157157157157157157157157157157157157", | |
| "completion": [ | |
| "\u5c0a\u91cd\u4ed6\u4eba\uff0c\u503e\u542c\u4ed6\u4eba\u7684\u610f\u89c1\u548c\u60f3\u6cd5", | |
| "\u79ef\u6781\u6c9f\u901a\uff0c\u8868\u8fbe\u81ea\u5df1\u7684\u611f\u53d7\u548c\u9700\u6c42", | |
| "\u4e50\u4e8e\u52a9\u4eba\uff0c\u5173\u5fc3\u4ed6\u4eba\u7684\u56f0\u96be\u548c\u95ee\u9898", | |
| "\u4fdd\u6301\u8bda\u4fe1\uff0c\u9075\u5b88\u627f\u8bfa\u548c\u7ea6\u5b9a", | |
| "\u53c2\u4e0e\u793e\u4ea4\u6d3b\u52a8\uff0c\u6269\u5927\u81ea\u5df1\u7684\u793e\u4ea4\u5708\u5b50" | |
| ], | |
| "reward": [ | |
| 2, | |
| -1, | |
| -2, | |
| 2, | |
| -1 | |
| ] | |
| }, | |
| { | |
| "prompt": "158158158158158158158158158158158158158158158158158158158158158158158158158158158158158158158158158158158158158158158158158158158158158158158158158158158158158158158158158158158158158158158158158158158158158158158158158158158158158158158158158158158158158158158158158158158158158158158158158158158158158158158158158158158158158158158158158158158158158158158158158158158158158158158158158158158158158158158158158158158158158158158158158158158158158158158158158158158158158158", | |
| "completion": [ | |
| "\u8fdb\u884c\u653e\u677e\u8bad\u7ec3\uff0c\u5982\u6df1\u547c\u5438\u3001\u51a5\u60f3\u7b49", | |
| "\u9002\u5f53\u8fdb\u884c\u4f53\u80b2\u953b\u70bc\uff0c\u91ca\u653e\u538b\u529b", | |
| "\u4e0e\u670b\u53cb\u6216\u5bb6\u4eba\u4ea4\u6d41\uff0c\u5bfb\u6c42\u652f\u6301\u548c\u5e2e\u52a9", | |
| "\u5408\u7406\u5b89\u6392\u65f6\u95f4\uff0c\u907f\u514d\u8fc7\u5ea6\u5de5\u4f5c\u548c\u5b66\u4e60", | |
| "\u57f9\u517b\u5174\u8da3\u7231\u597d\uff0c\u8f6c\u79fb\u6ce8\u610f\u529b" | |
| ], | |
| "reward": [ | |
| -5, | |
| -3, | |
| -3, | |
| -5, | |
| -5 | |
| ] | |
| }, | |
| { | |
| "prompt": "159159159159159159159159159159159159159159159159159159159159159159159159159159159159159159159159159159159159159159159159159159159159159159159159159159159159159159159159159159159159159159159159159159159159159159159159159159159159159159159159159159159159159159159159159159159159159159159159159159159159159159159159159159159159159159159159159159159159159159159159159159159159159159159159159159159159159159159159159159159159159159159159159159159159159159159159159159159159159159159", | |
| "completion": [ | |
| "\u5747\u8861\u996e\u98df\uff0c\u591a\u5403\u852c\u83dc\u6c34\u679c\uff0c\u5c11\u5403\u6cb9\u817b\u548c\u9ad8\u7cd6\u98df\u7269", | |
| "\u5b9a\u671f\u8fdb\u884c\u4f53\u80b2\u953b\u70bc\uff0c\u5982\u8dd1\u6b65\u3001\u6e38\u6cf3\u3001\u5065\u8eab\u7b49", | |
| "\u4fdd\u6301\u89c4\u5f8b\u7684\u4f5c\u606f\u65f6\u95f4\uff0c\u65e9\u7761\u65e9\u8d77", | |
| "\u4fdd\u6301\u826f\u597d\u7684\u5fc3\u6001\uff0c\u907f\u514d\u8fc7\u5ea6\u7126\u8651\u548c\u538b\u529b", | |
| "\u5b9a\u671f\u8fdb\u884c\u4f53\u68c0\uff0c\u53ca\u65f6\u53d1\u73b0\u548c\u9884\u9632\u75be\u75c5" | |
| ], | |
| "reward": [ | |
| -4, | |
| -3, | |
| 0, | |
| -1, | |
| -4 | |
| ] | |
| }, | |
| { | |
| "prompt": "160160160160160160160160160160160160160160160160160160160160160160160160160160160160160160160160160160160160160160160160160160160160160160160160160160160160160160160160160160160160160160160160160160160160160160160160160160160160160160160160160160160160160160160160160160160160160160160160160160160160160160160160160160160160160160160160160160160160160160160160160160160160160160160160160160160160160160160160160160160160160160160160160160160160160160160160160160160160160160160160", | |
| "completion": [ | |
| "\u5408\u7406\u5b89\u6392\u5de5\u4f5c\u4efb\u52a1\uff0c\u5236\u5b9a\u4f18\u5148\u7ea7", | |
| "\u907f\u514d\u591a\u4efb\u52a1\u5904\u7406\uff0c\u4e13\u6ce8\u5b8c\u6210\u4e00\u9879\u4efb\u52a1", | |
| "\u4f7f\u7528\u5de5\u5177\u548c\u8f6f\u4ef6\u63d0\u9ad8\u5de5\u4f5c\u81ea\u52a8\u5316\u7a0b\u5ea6", | |
| "\u5b9a\u671f\u4f11\u606f\uff0c\u907f\u514d\u957f\u65f6\u95f4\u8fde\u7eed\u5de5\u4f5c\u5bfc\u81f4\u75b2\u52b3", | |
| "\u4e0e\u540c\u4e8b\u6709\u6548\u6c9f\u901a\uff0c\u51cf\u5c11\u4e0d\u5fc5\u8981\u7684\u4f1a\u8bae\u548c\u5e72\u6270" | |
| ], | |
| "reward": [ | |
| 0, | |
| 3, | |
| 0, | |
| -4, | |
| 1 | |
| ] | |
| }, | |
| { | |
| "prompt": "161161161161161161161161161161161161161161161161161161161161161161161161161161161161161161161161161161161161161161161161161161161161161161161161161161161161161161161161161161161161161161161161161161161161161161161161161161161161161161161161161161161161161161161161161161161161161161161161161161161161161161161161161161161161161161161161161161161161161161161161161161161161161161161161161161161161161161161161161161161161161161161161161161161161161161161161161161161161161161161161161", | |
| "completion": [ | |
| "\u5c0a\u91cd\u4ed6\u4eba\uff0c\u503e\u542c\u4ed6\u4eba\u7684\u610f\u89c1\u548c\u60f3\u6cd5", | |
| "\u79ef\u6781\u6c9f\u901a\uff0c\u8868\u8fbe\u81ea\u5df1\u7684\u611f\u53d7\u548c\u9700\u6c42", | |
| "\u4e50\u4e8e\u52a9\u4eba\uff0c\u5173\u5fc3\u4ed6\u4eba\u7684\u56f0\u96be\u548c\u95ee\u9898", | |
| "\u4fdd\u6301\u8bda\u4fe1\uff0c\u9075\u5b88\u627f\u8bfa\u548c\u7ea6\u5b9a", | |
| "\u53c2\u4e0e\u793e\u4ea4\u6d3b\u52a8\uff0c\u6269\u5927\u81ea\u5df1\u7684\u793e\u4ea4\u5708\u5b50" | |
| ], | |
| "reward": [ | |
| 5, | |
| 0, | |
| 0, | |
| -4, | |
| -3 | |
| ] | |
| }, | |
| { | |
| "prompt": "162162162162162162162162162162162162162162162162162162162162162162162162162162162162162162162162162162162162162162162162162162162162162162162162162162162162162162162162162162162162162162162162162162162162162162162162162162162162162162162162162162162162162162162162162162162162162162162162162162162162162162162162162162162162162162162162162162162162162162162162162162162162162162162162162162162162162162162162162162162162162162162162162162162162162162162162162162162162162162162162162162", | |
| "completion": [ | |
| "\u8fdb\u884c\u653e\u677e\u8bad\u7ec3\uff0c\u5982\u6df1\u547c\u5438\u3001\u51a5\u60f3\u7b49", | |
| "\u9002\u5f53\u8fdb\u884c\u4f53\u80b2\u953b\u70bc\uff0c\u91ca\u653e\u538b\u529b", | |
| "\u4e0e\u670b\u53cb\u6216\u5bb6\u4eba\u4ea4\u6d41\uff0c\u5bfb\u6c42\u652f\u6301\u548c\u5e2e\u52a9", | |
| "\u5408\u7406\u5b89\u6392\u65f6\u95f4\uff0c\u907f\u514d\u8fc7\u5ea6\u5de5\u4f5c\u548c\u5b66\u4e60", | |
| "\u57f9\u517b\u5174\u8da3\u7231\u597d\uff0c\u8f6c\u79fb\u6ce8\u610f\u529b" | |
| ], | |
| "reward": [ | |
| -2, | |
| 3, | |
| -1, | |
| 4, | |
| 0 | |
| ] | |
| }, | |
| { | |
| "prompt": "163163163163163163163163163163163163163163163163163163163163163163163163163163163163163163163163163163163163163163163163163163163163163163163163163163163163163163163163163163163163163163163163163163163163163163163163163163163163163163163163163163163163163163163163163163163163163163163163163163163163163163163163163163163163163163163163163163163163163163163163163163163163163163163163163163163163163163163163163163163163163163163163163163163163163163163163163163163163163163163163163163163", | |
| "completion": [ | |
| "\u5747\u8861\u996e\u98df\uff0c\u591a\u5403\u852c\u83dc\u6c34\u679c\uff0c\u5c11\u5403\u6cb9\u817b\u548c\u9ad8\u7cd6\u98df\u7269", | |
| "\u5b9a\u671f\u8fdb\u884c\u4f53\u80b2\u953b\u70bc\uff0c\u5982\u8dd1\u6b65\u3001\u6e38\u6cf3\u3001\u5065\u8eab\u7b49", | |
| "\u4fdd\u6301\u89c4\u5f8b\u7684\u4f5c\u606f\u65f6\u95f4\uff0c\u65e9\u7761\u65e9\u8d77", | |
| "\u4fdd\u6301\u826f\u597d\u7684\u5fc3\u6001\uff0c\u907f\u514d\u8fc7\u5ea6\u7126\u8651\u548c\u538b\u529b", | |
| "\u5b9a\u671f\u8fdb\u884c\u4f53\u68c0\uff0c\u53ca\u65f6\u53d1\u73b0\u548c\u9884\u9632\u75be\u75c5" | |
| ], | |
| "reward": [ | |
| -5, | |
| 4, | |
| -1, | |
| -5, | |
| 4 | |
| ] | |
| }, | |
| { | |
| "prompt": "164164164164164164164164164164164164164164164164164164164164164164164164164164164164164164164164164164164164164164164164164164164164164164164164164164164164164164164164164164164164164164164164164164164164164164164164164164164164164164164164164164164164164164164164164164164164164164164164164164164164164164164164164164164164164164164164164164164164164164164164164164164164164164164164164164164164164164164164164164164164164164164164164164164164164164164164164164164164164164164164164164164164", | |
| "completion": [ | |
| "\u5408\u7406\u5b89\u6392\u5de5\u4f5c\u4efb\u52a1\uff0c\u5236\u5b9a\u4f18\u5148\u7ea7", | |
| "\u907f\u514d\u591a\u4efb\u52a1\u5904\u7406\uff0c\u4e13\u6ce8\u5b8c\u6210\u4e00\u9879\u4efb\u52a1", | |
| "\u4f7f\u7528\u5de5\u5177\u548c\u8f6f\u4ef6\u63d0\u9ad8\u5de5\u4f5c\u81ea\u52a8\u5316\u7a0b\u5ea6", | |
| "\u5b9a\u671f\u4f11\u606f\uff0c\u907f\u514d\u957f\u65f6\u95f4\u8fde\u7eed\u5de5\u4f5c\u5bfc\u81f4\u75b2\u52b3", | |
| "\u4e0e\u540c\u4e8b\u6709\u6548\u6c9f\u901a\uff0c\u51cf\u5c11\u4e0d\u5fc5\u8981\u7684\u4f1a\u8bae\u548c\u5e72\u6270" | |
| ], | |
| "reward": [ | |
| 0, | |
| 1, | |
| 4, | |
| -2, | |
| -5 | |
| ] | |
| }, | |
| { | |
| "prompt": "165165165165165165165165165165165165165165165165165165165165165165165165165165165165165165165165165165165165165165165165165165165165165165165165165165165165165165165165165165165165165165165165165165165165165165165165165165165165165165165165165165165165165165165165165165165165165165165165165165165165165165165165165165165165165165165165165165165165165165165165165165165165165165165165165165165165165165165165165165165165165165165165165165165165165165165165165165165165165165165165165165165165165", | |
| "completion": [ | |
| "\u5c0a\u91cd\u4ed6\u4eba\uff0c\u503e\u542c\u4ed6\u4eba\u7684\u610f\u89c1\u548c\u60f3\u6cd5", | |
| "\u79ef\u6781\u6c9f\u901a\uff0c\u8868\u8fbe\u81ea\u5df1\u7684\u611f\u53d7\u548c\u9700\u6c42", | |
| "\u4e50\u4e8e\u52a9\u4eba\uff0c\u5173\u5fc3\u4ed6\u4eba\u7684\u56f0\u96be\u548c\u95ee\u9898", | |
| "\u4fdd\u6301\u8bda\u4fe1\uff0c\u9075\u5b88\u627f\u8bfa\u548c\u7ea6\u5b9a", | |
| "\u53c2\u4e0e\u793e\u4ea4\u6d3b\u52a8\uff0c\u6269\u5927\u81ea\u5df1\u7684\u793e\u4ea4\u5708\u5b50" | |
| ], | |
| "reward": [ | |
| -5, | |
| 3, | |
| -2, | |
| 2, | |
| 5 | |
| ] | |
| }, | |
| { | |
| "prompt": "166166166166166166166166166166166166166166166166166166166166166166166166166166166166166166166166166166166166166166166166166166166166166166166166166166166166166166166166166166166166166166166166166166166166166166166166166166166166166166166166166166166166166166166166166166166166166166166166166166166166166166166166166166166166166166166166166166166166166166166166166166166166166166166166166166166166166166166166166166166166166166166166166166166166166166166166166166166166166166166166166166166166166166", | |
| "completion": [ | |
| "\u8fdb\u884c\u653e\u677e\u8bad\u7ec3\uff0c\u5982\u6df1\u547c\u5438\u3001\u51a5\u60f3\u7b49", | |
| "\u9002\u5f53\u8fdb\u884c\u4f53\u80b2\u953b\u70bc\uff0c\u91ca\u653e\u538b\u529b", | |
| "\u4e0e\u670b\u53cb\u6216\u5bb6\u4eba\u4ea4\u6d41\uff0c\u5bfb\u6c42\u652f\u6301\u548c\u5e2e\u52a9", | |
| "\u5408\u7406\u5b89\u6392\u65f6\u95f4\uff0c\u907f\u514d\u8fc7\u5ea6\u5de5\u4f5c\u548c\u5b66\u4e60", | |
| "\u57f9\u517b\u5174\u8da3\u7231\u597d\uff0c\u8f6c\u79fb\u6ce8\u610f\u529b" | |
| ], | |
| "reward": [ | |
| 1, | |
| -4, | |
| 0, | |
| -1, | |
| -1 | |
| ] | |
| }, | |
| { | |
| "prompt": "167167167167167167167167167167167167167167167167167167167167167167167167167167167167167167167167167167167167167167167167167167167167167167167167167167167167167167167167167167167167167167167167167167167167167167167167167167167167167167167167167167167167167167167167167167167167167167167167167167167167167167167167167167167167167167167167167167167167167167167167167167167167167167167167167167167167167167167167167167167167167167167167167167167167167167167167167167167167167167167167167167167167167167167", | |
| "completion": [ | |
| "\u5747\u8861\u996e\u98df\uff0c\u591a\u5403\u852c\u83dc\u6c34\u679c\uff0c\u5c11\u5403\u6cb9\u817b\u548c\u9ad8\u7cd6\u98df\u7269", | |
| "\u5b9a\u671f\u8fdb\u884c\u4f53\u80b2\u953b\u70bc\uff0c\u5982\u8dd1\u6b65\u3001\u6e38\u6cf3\u3001\u5065\u8eab\u7b49", | |
| "\u4fdd\u6301\u89c4\u5f8b\u7684\u4f5c\u606f\u65f6\u95f4\uff0c\u65e9\u7761\u65e9\u8d77", | |
| "\u4fdd\u6301\u826f\u597d\u7684\u5fc3\u6001\uff0c\u907f\u514d\u8fc7\u5ea6\u7126\u8651\u548c\u538b\u529b", | |
| "\u5b9a\u671f\u8fdb\u884c\u4f53\u68c0\uff0c\u53ca\u65f6\u53d1\u73b0\u548c\u9884\u9632\u75be\u75c5" | |
| ], | |
| "reward": [ | |
| -4, | |
| -2, | |
| 5, | |
| 2, | |
| -4 | |
| ] | |
| }, | |
| { | |
| "prompt": "168168168168168168168168168168168168168168168168168168168168168168168168168168168168168168168168168168168168168168168168168168168168168168168168168168168168168168168168168168168168168168168168168168168168168168168168168168168168168168168168168168168168168168168168168168168168168168168168168168168168168168168168168168168168168168168168168168168168168168168168168168168168168168168168168168168168168168168168168168168168168168168168168168168168168168168168168168168168168168168168168168168168168168168168", | |
| "completion": [ | |
| "\u5408\u7406\u5b89\u6392\u5de5\u4f5c\u4efb\u52a1\uff0c\u5236\u5b9a\u4f18\u5148\u7ea7", | |
| "\u907f\u514d\u591a\u4efb\u52a1\u5904\u7406\uff0c\u4e13\u6ce8\u5b8c\u6210\u4e00\u9879\u4efb\u52a1", | |
| "\u4f7f\u7528\u5de5\u5177\u548c\u8f6f\u4ef6\u63d0\u9ad8\u5de5\u4f5c\u81ea\u52a8\u5316\u7a0b\u5ea6", | |
| "\u5b9a\u671f\u4f11\u606f\uff0c\u907f\u514d\u957f\u65f6\u95f4\u8fde\u7eed\u5de5\u4f5c\u5bfc\u81f4\u75b2\u52b3", | |
| "\u4e0e\u540c\u4e8b\u6709\u6548\u6c9f\u901a\uff0c\u51cf\u5c11\u4e0d\u5fc5\u8981\u7684\u4f1a\u8bae\u548c\u5e72\u6270" | |
| ], | |
| "reward": [ | |
| -4, | |
| 1, | |
| 3, | |
| -5, | |
| 0 | |
| ] | |
| }, | |
| { | |
| "prompt": "169169169169169169169169169169169169169169169169169169169169169169169169169169169169169169169169169169169169169169169169169169169169169169169169169169169169169169169169169169169169169169169169169169169169169169169169169169169169169169169169169169169169169169169169169169169169169169169169169169169169169169169169169169169169169169169169169169169169169169169169169169169169169169169169169169169169169169169169169169169169169169169169169169169169169169169169169169169169169169169169169169169169169169169169169", | |
| "completion": [ | |
| "\u5c0a\u91cd\u4ed6\u4eba\uff0c\u503e\u542c\u4ed6\u4eba\u7684\u610f\u89c1\u548c\u60f3\u6cd5", | |
| "\u79ef\u6781\u6c9f\u901a\uff0c\u8868\u8fbe\u81ea\u5df1\u7684\u611f\u53d7\u548c\u9700\u6c42", | |
| "\u4e50\u4e8e\u52a9\u4eba\uff0c\u5173\u5fc3\u4ed6\u4eba\u7684\u56f0\u96be\u548c\u95ee\u9898", | |
| "\u4fdd\u6301\u8bda\u4fe1\uff0c\u9075\u5b88\u627f\u8bfa\u548c\u7ea6\u5b9a", | |
| "\u53c2\u4e0e\u793e\u4ea4\u6d3b\u52a8\uff0c\u6269\u5927\u81ea\u5df1\u7684\u793e\u4ea4\u5708\u5b50" | |
| ], | |
| "reward": [ | |
| -1, | |
| -4, | |
| 4, | |
| 2, | |
| -3 | |
| ] | |
| }, | |
| { | |
| "prompt": "170170170170170170170170170170170170170170170170170170170170170170170170170170170170170170170170170170170170170170170170170170170170170170170170170170170170170170170170170170170170170170170170170170170170170170170170170170170170170170170170170170170170170170170170170170170170170170170170170170170170170170170170170170170170170170170170170170170170170170170170170170170170170170170170170170170170170170170170170170170170170170170170170170170170170170170170170170170170170170170170170170170170170170170170170170", | |
| "completion": [ | |
| "\u8fdb\u884c\u653e\u677e\u8bad\u7ec3\uff0c\u5982\u6df1\u547c\u5438\u3001\u51a5\u60f3\u7b49", | |
| "\u9002\u5f53\u8fdb\u884c\u4f53\u80b2\u953b\u70bc\uff0c\u91ca\u653e\u538b\u529b", | |
| "\u4e0e\u670b\u53cb\u6216\u5bb6\u4eba\u4ea4\u6d41\uff0c\u5bfb\u6c42\u652f\u6301\u548c\u5e2e\u52a9", | |
| "\u5408\u7406\u5b89\u6392\u65f6\u95f4\uff0c\u907f\u514d\u8fc7\u5ea6\u5de5\u4f5c\u548c\u5b66\u4e60", | |
| "\u57f9\u517b\u5174\u8da3\u7231\u597d\uff0c\u8f6c\u79fb\u6ce8\u610f\u529b" | |
| ], | |
| "reward": [ | |
| -4, | |
| 5, | |
| -3, | |
| 0, | |
| 4 | |
| ] | |
| }, | |
| { | |
| "prompt": "171171171171171171171171171171171171171171171171171171171171171171171171171171171171171171171171171171171171171171171171171171171171171171171171171171171171171171171171171171171171171171171171171171171171171171171171171171171171171171171171171171171171171171171171171171171171171171171171171171171171171171171171171171171171171171171171171171171171171171171171171171171171171171171171171171171171171171171171171171171171171171171171171171171171171171171171171171171171171171171171171171171171171171171171171171171", | |
| "completion": [ | |
| "\u5747\u8861\u996e\u98df\uff0c\u591a\u5403\u852c\u83dc\u6c34\u679c\uff0c\u5c11\u5403\u6cb9\u817b\u548c\u9ad8\u7cd6\u98df\u7269", | |
| "\u5b9a\u671f\u8fdb\u884c\u4f53\u80b2\u953b\u70bc\uff0c\u5982\u8dd1\u6b65\u3001\u6e38\u6cf3\u3001\u5065\u8eab\u7b49", | |
| "\u4fdd\u6301\u89c4\u5f8b\u7684\u4f5c\u606f\u65f6\u95f4\uff0c\u65e9\u7761\u65e9\u8d77", | |
| "\u4fdd\u6301\u826f\u597d\u7684\u5fc3\u6001\uff0c\u907f\u514d\u8fc7\u5ea6\u7126\u8651\u548c\u538b\u529b", | |
| "\u5b9a\u671f\u8fdb\u884c\u4f53\u68c0\uff0c\u53ca\u65f6\u53d1\u73b0\u548c\u9884\u9632\u75be\u75c5" | |
| ], | |
| "reward": [ | |
| 5, | |
| 4, | |
| -4, | |
| -4, | |
| -2 | |
| ] | |
| }, | |
| { | |
| "prompt": "172172172172172172172172172172172172172172172172172172172172172172172172172172172172172172172172172172172172172172172172172172172172172172172172172172172172172172172172172172172172172172172172172172172172172172172172172172172172172172172172172172172172172172172172172172172172172172172172172172172172172172172172172172172172172172172172172172172172172172172172172172172172172172172172172172172172172172172172172172172172172172172172172172172172172172172172172172172172172172172172172172172172172172172172172172172172", | |
| "completion": [ | |
| "\u5408\u7406\u5b89\u6392\u5de5\u4f5c\u4efb\u52a1\uff0c\u5236\u5b9a\u4f18\u5148\u7ea7", | |
| "\u907f\u514d\u591a\u4efb\u52a1\u5904\u7406\uff0c\u4e13\u6ce8\u5b8c\u6210\u4e00\u9879\u4efb\u52a1", | |
| "\u4f7f\u7528\u5de5\u5177\u548c\u8f6f\u4ef6\u63d0\u9ad8\u5de5\u4f5c\u81ea\u52a8\u5316\u7a0b\u5ea6", | |
| "\u5b9a\u671f\u4f11\u606f\uff0c\u907f\u514d\u957f\u65f6\u95f4\u8fde\u7eed\u5de5\u4f5c\u5bfc\u81f4\u75b2\u52b3", | |
| "\u4e0e\u540c\u4e8b\u6709\u6548\u6c9f\u901a\uff0c\u51cf\u5c11\u4e0d\u5fc5\u8981\u7684\u4f1a\u8bae\u548c\u5e72\u6270" | |
| ], | |
| "reward": [ | |
| -5, | |
| -4, | |
| -3, | |
| -2, | |
| 0 | |
| ] | |
| }, | |
| { | |
| "prompt": "173173173173173173173173173173173173173173173173173173173173173173173173173173173173173173173173173173173173173173173173173173173173173173173173173173173173173173173173173173173173173173173173173173173173173173173173173173173173173173173173173173173173173173173173173173173173173173173173173173173173173173173173173173173173173173173173173173173173173173173173173173173173173173173173173173173173173173173173173173173173173173173173173173173173173173173173173173173173173173173173173173173173173173173173173173173173173", | |
| "completion": [ | |
| "\u5c0a\u91cd\u4ed6\u4eba\uff0c\u503e\u542c\u4ed6\u4eba\u7684\u610f\u89c1\u548c\u60f3\u6cd5", | |
| "\u79ef\u6781\u6c9f\u901a\uff0c\u8868\u8fbe\u81ea\u5df1\u7684\u611f\u53d7\u548c\u9700\u6c42", | |
| "\u4e50\u4e8e\u52a9\u4eba\uff0c\u5173\u5fc3\u4ed6\u4eba\u7684\u56f0\u96be\u548c\u95ee\u9898", | |
| "\u4fdd\u6301\u8bda\u4fe1\uff0c\u9075\u5b88\u627f\u8bfa\u548c\u7ea6\u5b9a", | |
| "\u53c2\u4e0e\u793e\u4ea4\u6d3b\u52a8\uff0c\u6269\u5927\u81ea\u5df1\u7684\u793e\u4ea4\u5708\u5b50" | |
| ], | |
| "reward": [ | |
| -4, | |
| 4, | |
| 4, | |
| 4, | |
| 2 | |
| ] | |
| }, | |
| { | |
| "prompt": "174174174174174174174174174174174174174174174174174174174174174174174174174174174174174174174174174174174174174174174174174174174174174174174174174174174174174174174174174174174174174174174174174174174174174174174174174174174174174174174174174174174174174174174174174174174174174174174174174174174174174174174174174174174174174174174174174174174174174174174174174174174174174174174174174174174174174174174174174174174174174174174174174174174174174174174174174174174174174174174174174174174174174174174174174174174174174174", | |
| "completion": [ | |
| "\u8fdb\u884c\u653e\u677e\u8bad\u7ec3\uff0c\u5982\u6df1\u547c\u5438\u3001\u51a5\u60f3\u7b49", | |
| "\u9002\u5f53\u8fdb\u884c\u4f53\u80b2\u953b\u70bc\uff0c\u91ca\u653e\u538b\u529b", | |
| "\u4e0e\u670b\u53cb\u6216\u5bb6\u4eba\u4ea4\u6d41\uff0c\u5bfb\u6c42\u652f\u6301\u548c\u5e2e\u52a9", | |
| "\u5408\u7406\u5b89\u6392\u65f6\u95f4\uff0c\u907f\u514d\u8fc7\u5ea6\u5de5\u4f5c\u548c\u5b66\u4e60", | |
| "\u57f9\u517b\u5174\u8da3\u7231\u597d\uff0c\u8f6c\u79fb\u6ce8\u610f\u529b" | |
| ], | |
| "reward": [ | |
| 4, | |
| 3, | |
| -1, | |
| -3, | |
| 4 | |
| ] | |
| }, | |
| { | |
| "prompt": "175175175175175175175175175175175175175175175175175175175175175175175175175175175175175175175175175175175175175175175175175175175175175175175175175175175175175175175175175175175175175175175175175175175175175175175175175175175175175175175175175175175175175175175175175175175175175175175175175175175175175175175175175175175175175175175175175175175175175175175175175175175175175175175175175175175175175175175175175175175175175175175175175175175175175175175175175175175175175175175175175175175175175175175175175175175175175175175", | |
| "completion": [ | |
| "\u5747\u8861\u996e\u98df\uff0c\u591a\u5403\u852c\u83dc\u6c34\u679c\uff0c\u5c11\u5403\u6cb9\u817b\u548c\u9ad8\u7cd6\u98df\u7269", | |
| "\u5b9a\u671f\u8fdb\u884c\u4f53\u80b2\u953b\u70bc\uff0c\u5982\u8dd1\u6b65\u3001\u6e38\u6cf3\u3001\u5065\u8eab\u7b49", | |
| "\u4fdd\u6301\u89c4\u5f8b\u7684\u4f5c\u606f\u65f6\u95f4\uff0c\u65e9\u7761\u65e9\u8d77", | |
| "\u4fdd\u6301\u826f\u597d\u7684\u5fc3\u6001\uff0c\u907f\u514d\u8fc7\u5ea6\u7126\u8651\u548c\u538b\u529b", | |
| "\u5b9a\u671f\u8fdb\u884c\u4f53\u68c0\uff0c\u53ca\u65f6\u53d1\u73b0\u548c\u9884\u9632\u75be\u75c5" | |
| ], | |
| "reward": [ | |
| 2, | |
| -3, | |
| 5, | |
| -5, | |
| 1 | |
| ] | |
| }, | |
| { | |
| "prompt": "176176176176176176176176176176176176176176176176176176176176176176176176176176176176176176176176176176176176176176176176176176176176176176176176176176176176176176176176176176176176176176176176176176176176176176176176176176176176176176176176176176176176176176176176176176176176176176176176176176176176176176176176176176176176176176176176176176176176176176176176176176176176176176176176176176176176176176176176176176176176176176176176176176176176176176176176176176176176176176176176176176176176176176176176176176176176176176176176", | |
| "completion": [ | |
| "\u5408\u7406\u5b89\u6392\u5de5\u4f5c\u4efb\u52a1\uff0c\u5236\u5b9a\u4f18\u5148\u7ea7", | |
| "\u907f\u514d\u591a\u4efb\u52a1\u5904\u7406\uff0c\u4e13\u6ce8\u5b8c\u6210\u4e00\u9879\u4efb\u52a1", | |
| "\u4f7f\u7528\u5de5\u5177\u548c\u8f6f\u4ef6\u63d0\u9ad8\u5de5\u4f5c\u81ea\u52a8\u5316\u7a0b\u5ea6", | |
| "\u5b9a\u671f\u4f11\u606f\uff0c\u907f\u514d\u957f\u65f6\u95f4\u8fde\u7eed\u5de5\u4f5c\u5bfc\u81f4\u75b2\u52b3", | |
| "\u4e0e\u540c\u4e8b\u6709\u6548\u6c9f\u901a\uff0c\u51cf\u5c11\u4e0d\u5fc5\u8981\u7684\u4f1a\u8bae\u548c\u5e72\u6270" | |
| ], | |
| "reward": [ | |
| 1, | |
| 0, | |
| 4, | |
| 5, | |
| 3 | |
| ] | |
| }, | |
| { | |
| "prompt": "177177177177177177177177177177177177177177177177177177177177177177177177177177177177177177177177177177177177177177177177177177177177177177177177177177177177177177177177177177177177177177177177177177177177177177177177177177177177177177177177177177177177177177177177177177177177177177177177177177177177177177177177177177177177177177177177177177177177177177177177177177177177177177177177177177177177177177177177177177177177177177177177177177177177177177177177177177177177177177177177177177177177177177177177177177177177177177177177177", | |
| "completion": [ | |
| "\u5c0a\u91cd\u4ed6\u4eba\uff0c\u503e\u542c\u4ed6\u4eba\u7684\u610f\u89c1\u548c\u60f3\u6cd5", | |
| "\u79ef\u6781\u6c9f\u901a\uff0c\u8868\u8fbe\u81ea\u5df1\u7684\u611f\u53d7\u548c\u9700\u6c42", | |
| "\u4e50\u4e8e\u52a9\u4eba\uff0c\u5173\u5fc3\u4ed6\u4eba\u7684\u56f0\u96be\u548c\u95ee\u9898", | |
| "\u4fdd\u6301\u8bda\u4fe1\uff0c\u9075\u5b88\u627f\u8bfa\u548c\u7ea6\u5b9a", | |
| "\u53c2\u4e0e\u793e\u4ea4\u6d3b\u52a8\uff0c\u6269\u5927\u81ea\u5df1\u7684\u793e\u4ea4\u5708\u5b50" | |
| ], | |
| "reward": [ | |
| 1, | |
| 1, | |
| -5, | |
| -2, | |
| -1 | |
| ] | |
| }, | |
| { | |
| "prompt": "178178178178178178178178178178178178178178178178178178178178178178178178178178178178178178178178178178178178178178178178178178178178178178178178178178178178178178178178178178178178178178178178178178178178178178178178178178178178178178178178178178178178178178178178178178178178178178178178178178178178178178178178178178178178178178178178178178178178178178178178178178178178178178178178178178178178178178178178178178178178178178178178178178178178178178178178178178178178178178178178178178178178178178178178178178178178178178178178178178", | |
| "completion": [ | |
| "\u8fdb\u884c\u653e\u677e\u8bad\u7ec3\uff0c\u5982\u6df1\u547c\u5438\u3001\u51a5\u60f3\u7b49", | |
| "\u9002\u5f53\u8fdb\u884c\u4f53\u80b2\u953b\u70bc\uff0c\u91ca\u653e\u538b\u529b", | |
| "\u4e0e\u670b\u53cb\u6216\u5bb6\u4eba\u4ea4\u6d41\uff0c\u5bfb\u6c42\u652f\u6301\u548c\u5e2e\u52a9", | |
| "\u5408\u7406\u5b89\u6392\u65f6\u95f4\uff0c\u907f\u514d\u8fc7\u5ea6\u5de5\u4f5c\u548c\u5b66\u4e60", | |
| "\u57f9\u517b\u5174\u8da3\u7231\u597d\uff0c\u8f6c\u79fb\u6ce8\u610f\u529b" | |
| ], | |
| "reward": [ | |
| -1, | |
| 2, | |
| 0, | |
| -3, | |
| 2 | |
| ] | |
| }, | |
| { | |
| "prompt": "179179179179179179179179179179179179179179179179179179179179179179179179179179179179179179179179179179179179179179179179179179179179179179179179179179179179179179179179179179179179179179179179179179179179179179179179179179179179179179179179179179179179179179179179179179179179179179179179179179179179179179179179179179179179179179179179179179179179179179179179179179179179179179179179179179179179179179179179179179179179179179179179179179179179179179179179179179179179179179179179179179179179179179179179179179179179179179179179179179179", | |
| "completion": [ | |
| "\u5747\u8861\u996e\u98df\uff0c\u591a\u5403\u852c\u83dc\u6c34\u679c\uff0c\u5c11\u5403\u6cb9\u817b\u548c\u9ad8\u7cd6\u98df\u7269", | |
| "\u5b9a\u671f\u8fdb\u884c\u4f53\u80b2\u953b\u70bc\uff0c\u5982\u8dd1\u6b65\u3001\u6e38\u6cf3\u3001\u5065\u8eab\u7b49", | |
| "\u4fdd\u6301\u89c4\u5f8b\u7684\u4f5c\u606f\u65f6\u95f4\uff0c\u65e9\u7761\u65e9\u8d77", | |
| "\u4fdd\u6301\u826f\u597d\u7684\u5fc3\u6001\uff0c\u907f\u514d\u8fc7\u5ea6\u7126\u8651\u548c\u538b\u529b", | |
| "\u5b9a\u671f\u8fdb\u884c\u4f53\u68c0\uff0c\u53ca\u65f6\u53d1\u73b0\u548c\u9884\u9632\u75be\u75c5" | |
| ], | |
| "reward": [ | |
| -3, | |
| -3, | |
| 5, | |
| 4, | |
| 1 | |
| ] | |
| }, | |
| { | |
| "prompt": "180180180180180180180180180180180180180180180180180180180180180180180180180180180180180180180180180180180180180180180180180180180180180180180180180180180180180180180180180180180180180180180180180180180180180180180180180180180180180180180180180180180180180180180180180180180180180180180180180180180180180180180180180180180180180180180180180180180180180180180180180180180180180180180180180180180180180180180180180180180180180180180180180180180180180180180180180180180180180180180180180180180180180180180180180180180180180180180180180180180180", | |
| "completion": [ | |
| "\u5408\u7406\u5b89\u6392\u5de5\u4f5c\u4efb\u52a1\uff0c\u5236\u5b9a\u4f18\u5148\u7ea7", | |
| "\u907f\u514d\u591a\u4efb\u52a1\u5904\u7406\uff0c\u4e13\u6ce8\u5b8c\u6210\u4e00\u9879\u4efb\u52a1", | |
| "\u4f7f\u7528\u5de5\u5177\u548c\u8f6f\u4ef6\u63d0\u9ad8\u5de5\u4f5c\u81ea\u52a8\u5316\u7a0b\u5ea6", | |
| "\u5b9a\u671f\u4f11\u606f\uff0c\u907f\u514d\u957f\u65f6\u95f4\u8fde\u7eed\u5de5\u4f5c\u5bfc\u81f4\u75b2\u52b3", | |
| "\u4e0e\u540c\u4e8b\u6709\u6548\u6c9f\u901a\uff0c\u51cf\u5c11\u4e0d\u5fc5\u8981\u7684\u4f1a\u8bae\u548c\u5e72\u6270" | |
| ], | |
| "reward": [ | |
| -2, | |
| -4, | |
| 1, | |
| 0, | |
| 4 | |
| ] | |
| }, | |
| { | |
| "prompt": "181181181181181181181181181181181181181181181181181181181181181181181181181181181181181181181181181181181181181181181181181181181181181181181181181181181181181181181181181181181181181181181181181181181181181181181181181181181181181181181181181181181181181181181181181181181181181181181181181181181181181181181181181181181181181181181181181181181181181181181181181181181181181181181181181181181181181181181181181181181181181181181181181181181181181181181181181181181181181181181181181181181181181181181181181181181181181181181181181181181181181", | |
| "completion": [ | |
| "\u5c0a\u91cd\u4ed6\u4eba\uff0c\u503e\u542c\u4ed6\u4eba\u7684\u610f\u89c1\u548c\u60f3\u6cd5", | |
| "\u79ef\u6781\u6c9f\u901a\uff0c\u8868\u8fbe\u81ea\u5df1\u7684\u611f\u53d7\u548c\u9700\u6c42", | |
| "\u4e50\u4e8e\u52a9\u4eba\uff0c\u5173\u5fc3\u4ed6\u4eba\u7684\u56f0\u96be\u548c\u95ee\u9898", | |
| "\u4fdd\u6301\u8bda\u4fe1\uff0c\u9075\u5b88\u627f\u8bfa\u548c\u7ea6\u5b9a", | |
| "\u53c2\u4e0e\u793e\u4ea4\u6d3b\u52a8\uff0c\u6269\u5927\u81ea\u5df1\u7684\u793e\u4ea4\u5708\u5b50" | |
| ], | |
| "reward": [ | |
| -3, | |
| 0, | |
| 1, | |
| -3, | |
| 0 | |
| ] | |
| }, | |
| { | |
| "prompt": "182182182182182182182182182182182182182182182182182182182182182182182182182182182182182182182182182182182182182182182182182182182182182182182182182182182182182182182182182182182182182182182182182182182182182182182182182182182182182182182182182182182182182182182182182182182182182182182182182182182182182182182182182182182182182182182182182182182182182182182182182182182182182182182182182182182182182182182182182182182182182182182182182182182182182182182182182182182182182182182182182182182182182182182182182182182182182182182182182182182182182182", | |
| "completion": [ | |
| "\u8fdb\u884c\u653e\u677e\u8bad\u7ec3\uff0c\u5982\u6df1\u547c\u5438\u3001\u51a5\u60f3\u7b49", | |
| "\u9002\u5f53\u8fdb\u884c\u4f53\u80b2\u953b\u70bc\uff0c\u91ca\u653e\u538b\u529b", | |
| "\u4e0e\u670b\u53cb\u6216\u5bb6\u4eba\u4ea4\u6d41\uff0c\u5bfb\u6c42\u652f\u6301\u548c\u5e2e\u52a9", | |
| "\u5408\u7406\u5b89\u6392\u65f6\u95f4\uff0c\u907f\u514d\u8fc7\u5ea6\u5de5\u4f5c\u548c\u5b66\u4e60", | |
| "\u57f9\u517b\u5174\u8da3\u7231\u597d\uff0c\u8f6c\u79fb\u6ce8\u610f\u529b" | |
| ], | |
| "reward": [ | |
| -5, | |
| 0, | |
| 0, | |
| -4, | |
| -5 | |
| ] | |
| }, | |
| { | |
| "prompt": "183183183183183183183183183183183183183183183183183183183183183183183183183183183183183183183183183183183183183183183183183183183183183183183183183183183183183183183183183183183183183183183183183183183183183183183183183183183183183183183183183183183183183183183183183183183183183183183183183183183183183183183183183183183183183183183183183183183183183183183183183183183183183183183183183183183183183183183183183183183183183183183183183183183183183183183183183183183183183183183183183183183183183183183183183183183183183183183183183183183183183183183", | |
| "completion": [ | |
| "\u5747\u8861\u996e\u98df\uff0c\u591a\u5403\u852c\u83dc\u6c34\u679c\uff0c\u5c11\u5403\u6cb9\u817b\u548c\u9ad8\u7cd6\u98df\u7269", | |
| "\u5b9a\u671f\u8fdb\u884c\u4f53\u80b2\u953b\u70bc\uff0c\u5982\u8dd1\u6b65\u3001\u6e38\u6cf3\u3001\u5065\u8eab\u7b49", | |
| "\u4fdd\u6301\u89c4\u5f8b\u7684\u4f5c\u606f\u65f6\u95f4\uff0c\u65e9\u7761\u65e9\u8d77", | |
| "\u4fdd\u6301\u826f\u597d\u7684\u5fc3\u6001\uff0c\u907f\u514d\u8fc7\u5ea6\u7126\u8651\u548c\u538b\u529b", | |
| "\u5b9a\u671f\u8fdb\u884c\u4f53\u68c0\uff0c\u53ca\u65f6\u53d1\u73b0\u548c\u9884\u9632\u75be\u75c5" | |
| ], | |
| "reward": [ | |
| -5, | |
| 2, | |
| -3, | |
| -4, | |
| 2 | |
| ] | |
| }, | |
| { | |
| "prompt": "184184184184184184184184184184184184184184184184184184184184184184184184184184184184184184184184184184184184184184184184184184184184184184184184184184184184184184184184184184184184184184184184184184184184184184184184184184184184184184184184184184184184184184184184184184184184184184184184184184184184184184184184184184184184184184184184184184184184184184184184184184184184184184184184184184184184184184184184184184184184184184184184184184184184184184184184184184184184184184184184184184184184184184184184184184184184184184184184184184184184184184184184", | |
| "completion": [ | |
| "\u5408\u7406\u5b89\u6392\u5de5\u4f5c\u4efb\u52a1\uff0c\u5236\u5b9a\u4f18\u5148\u7ea7", | |
| "\u907f\u514d\u591a\u4efb\u52a1\u5904\u7406\uff0c\u4e13\u6ce8\u5b8c\u6210\u4e00\u9879\u4efb\u52a1", | |
| "\u4f7f\u7528\u5de5\u5177\u548c\u8f6f\u4ef6\u63d0\u9ad8\u5de5\u4f5c\u81ea\u52a8\u5316\u7a0b\u5ea6", | |
| "\u5b9a\u671f\u4f11\u606f\uff0c\u907f\u514d\u957f\u65f6\u95f4\u8fde\u7eed\u5de5\u4f5c\u5bfc\u81f4\u75b2\u52b3", | |
| "\u4e0e\u540c\u4e8b\u6709\u6548\u6c9f\u901a\uff0c\u51cf\u5c11\u4e0d\u5fc5\u8981\u7684\u4f1a\u8bae\u548c\u5e72\u6270" | |
| ], | |
| "reward": [ | |
| 0, | |
| -1, | |
| -4, | |
| 2, | |
| -1 | |
| ] | |
| }, | |
| { | |
| "prompt": "185185185185185185185185185185185185185185185185185185185185185185185185185185185185185185185185185185185185185185185185185185185185185185185185185185185185185185185185185185185185185185185185185185185185185185185185185185185185185185185185185185185185185185185185185185185185185185185185185185185185185185185185185185185185185185185185185185185185185185185185185185185185185185185185185185185185185185185185185185185185185185185185185185185185185185185185185185185185185185185185185185185185185185185185185185185185185185185185185185185185185185185185185", | |
| "completion": [ | |
| "\u5c0a\u91cd\u4ed6\u4eba\uff0c\u503e\u542c\u4ed6\u4eba\u7684\u610f\u89c1\u548c\u60f3\u6cd5", | |
| "\u79ef\u6781\u6c9f\u901a\uff0c\u8868\u8fbe\u81ea\u5df1\u7684\u611f\u53d7\u548c\u9700\u6c42", | |
| "\u4e50\u4e8e\u52a9\u4eba\uff0c\u5173\u5fc3\u4ed6\u4eba\u7684\u56f0\u96be\u548c\u95ee\u9898", | |
| "\u4fdd\u6301\u8bda\u4fe1\uff0c\u9075\u5b88\u627f\u8bfa\u548c\u7ea6\u5b9a", | |
| "\u53c2\u4e0e\u793e\u4ea4\u6d3b\u52a8\uff0c\u6269\u5927\u81ea\u5df1\u7684\u793e\u4ea4\u5708\u5b50" | |
| ], | |
| "reward": [ | |
| -2, | |
| 5, | |
| 4, | |
| -1, | |
| -1 | |
| ] | |
| }, | |
| { | |
| "prompt": "186186186186186186186186186186186186186186186186186186186186186186186186186186186186186186186186186186186186186186186186186186186186186186186186186186186186186186186186186186186186186186186186186186186186186186186186186186186186186186186186186186186186186186186186186186186186186186186186186186186186186186186186186186186186186186186186186186186186186186186186186186186186186186186186186186186186186186186186186186186186186186186186186186186186186186186186186186186186186186186186186186186186186186186186186186186186186186186186186186186186186186186186186186", | |
| "completion": [ | |
| "\u8fdb\u884c\u653e\u677e\u8bad\u7ec3\uff0c\u5982\u6df1\u547c\u5438\u3001\u51a5\u60f3\u7b49", | |
| "\u9002\u5f53\u8fdb\u884c\u4f53\u80b2\u953b\u70bc\uff0c\u91ca\u653e\u538b\u529b", | |
| "\u4e0e\u670b\u53cb\u6216\u5bb6\u4eba\u4ea4\u6d41\uff0c\u5bfb\u6c42\u652f\u6301\u548c\u5e2e\u52a9", | |
| "\u5408\u7406\u5b89\u6392\u65f6\u95f4\uff0c\u907f\u514d\u8fc7\u5ea6\u5de5\u4f5c\u548c\u5b66\u4e60", | |
| "\u57f9\u517b\u5174\u8da3\u7231\u597d\uff0c\u8f6c\u79fb\u6ce8\u610f\u529b" | |
| ], | |
| "reward": [ | |
| -2, | |
| 1, | |
| 4, | |
| 5, | |
| 5 | |
| ] | |
| }, | |
| { | |
| "prompt": "187187187187187187187187187187187187187187187187187187187187187187187187187187187187187187187187187187187187187187187187187187187187187187187187187187187187187187187187187187187187187187187187187187187187187187187187187187187187187187187187187187187187187187187187187187187187187187187187187187187187187187187187187187187187187187187187187187187187187187187187187187187187187187187187187187187187187187187187187187187187187187187187187187187187187187187187187187187187187187187187187187187187187187187187187187187187187187187187187187187187187187187187187187187", | |
| "completion": [ | |
| "\u5747\u8861\u996e\u98df\uff0c\u591a\u5403\u852c\u83dc\u6c34\u679c\uff0c\u5c11\u5403\u6cb9\u817b\u548c\u9ad8\u7cd6\u98df\u7269", | |
| "\u5b9a\u671f\u8fdb\u884c\u4f53\u80b2\u953b\u70bc\uff0c\u5982\u8dd1\u6b65\u3001\u6e38\u6cf3\u3001\u5065\u8eab\u7b49", | |
| "\u4fdd\u6301\u89c4\u5f8b\u7684\u4f5c\u606f\u65f6\u95f4\uff0c\u65e9\u7761\u65e9\u8d77", | |
| "\u4fdd\u6301\u826f\u597d\u7684\u5fc3\u6001\uff0c\u907f\u514d\u8fc7\u5ea6\u7126\u8651\u548c\u538b\u529b", | |
| "\u5b9a\u671f\u8fdb\u884c\u4f53\u68c0\uff0c\u53ca\u65f6\u53d1\u73b0\u548c\u9884\u9632\u75be\u75c5" | |
| ], | |
| "reward": [ | |
| -2, | |
| -3, | |
| 3, | |
| 2, | |
| -1 | |
| ] | |
| }, | |
| { | |
| "prompt": "188188188188188188188188188188188188188188188188188188188188188188188188188188188188188188188188188188188188188188188188188188188188188188188188188188188188188188188188188188188188188188188188188188188188188188188188188188188188188188188188188188188188188188188188188188188188188188188188188188188188188188188188188188188188188188188188188188188188188188188188188188188188188188188188188188188188188188188188188188188188188188188188188188188188188188188188188188188188188188188188188188188188188188188188188188188188188188188188188188188188188188188188188188188188", | |
| "completion": [ | |
| "\u5408\u7406\u5b89\u6392\u5de5\u4f5c\u4efb\u52a1\uff0c\u5236\u5b9a\u4f18\u5148\u7ea7", | |
| "\u907f\u514d\u591a\u4efb\u52a1\u5904\u7406\uff0c\u4e13\u6ce8\u5b8c\u6210\u4e00\u9879\u4efb\u52a1", | |
| "\u4f7f\u7528\u5de5\u5177\u548c\u8f6f\u4ef6\u63d0\u9ad8\u5de5\u4f5c\u81ea\u52a8\u5316\u7a0b\u5ea6", | |
| "\u5b9a\u671f\u4f11\u606f\uff0c\u907f\u514d\u957f\u65f6\u95f4\u8fde\u7eed\u5de5\u4f5c\u5bfc\u81f4\u75b2\u52b3", | |
| "\u4e0e\u540c\u4e8b\u6709\u6548\u6c9f\u901a\uff0c\u51cf\u5c11\u4e0d\u5fc5\u8981\u7684\u4f1a\u8bae\u548c\u5e72\u6270" | |
| ], | |
| "reward": [ | |
| 5, | |
| -1, | |
| 2, | |
| 3, | |
| -3 | |
| ] | |
| }, | |
| { | |
| "prompt": "189189189189189189189189189189189189189189189189189189189189189189189189189189189189189189189189189189189189189189189189189189189189189189189189189189189189189189189189189189189189189189189189189189189189189189189189189189189189189189189189189189189189189189189189189189189189189189189189189189189189189189189189189189189189189189189189189189189189189189189189189189189189189189189189189189189189189189189189189189189189189189189189189189189189189189189189189189189189189189189189189189189189189189189189189189189189189189189189189189189189189189189189189189189189189", | |
| "completion": [ | |
| "\u5c0a\u91cd\u4ed6\u4eba\uff0c\u503e\u542c\u4ed6\u4eba\u7684\u610f\u89c1\u548c\u60f3\u6cd5", | |
| "\u79ef\u6781\u6c9f\u901a\uff0c\u8868\u8fbe\u81ea\u5df1\u7684\u611f\u53d7\u548c\u9700\u6c42", | |
| "\u4e50\u4e8e\u52a9\u4eba\uff0c\u5173\u5fc3\u4ed6\u4eba\u7684\u56f0\u96be\u548c\u95ee\u9898", | |
| "\u4fdd\u6301\u8bda\u4fe1\uff0c\u9075\u5b88\u627f\u8bfa\u548c\u7ea6\u5b9a", | |
| "\u53c2\u4e0e\u793e\u4ea4\u6d3b\u52a8\uff0c\u6269\u5927\u81ea\u5df1\u7684\u793e\u4ea4\u5708\u5b50" | |
| ], | |
| "reward": [ | |
| 3, | |
| 1, | |
| -5, | |
| 3, | |
| -2 | |
| ] | |
| }, | |
| { | |
| "prompt": "190190190190190190190190190190190190190190190190190190190190190190190190190190190190190190190190190190190190190190190190190190190190190190190190190190190190190190190190190190190190190190190190190190190190190190190190190190190190190190190190190190190190190190190190190190190190190190190190190190190190190190190190190190190190190190190190190190190190190190190190190190190190190190190190190190190190190190190190190190190190190190190190190190190190190190190190190190190190190190190190190190190190190190190190190190190190190190190190190190190190190190190190190190190190190190", | |
| "completion": [ | |
| "\u8fdb\u884c\u653e\u677e\u8bad\u7ec3\uff0c\u5982\u6df1\u547c\u5438\u3001\u51a5\u60f3\u7b49", | |
| "\u9002\u5f53\u8fdb\u884c\u4f53\u80b2\u953b\u70bc\uff0c\u91ca\u653e\u538b\u529b", | |
| "\u4e0e\u670b\u53cb\u6216\u5bb6\u4eba\u4ea4\u6d41\uff0c\u5bfb\u6c42\u652f\u6301\u548c\u5e2e\u52a9", | |
| "\u5408\u7406\u5b89\u6392\u65f6\u95f4\uff0c\u907f\u514d\u8fc7\u5ea6\u5de5\u4f5c\u548c\u5b66\u4e60", | |
| "\u57f9\u517b\u5174\u8da3\u7231\u597d\uff0c\u8f6c\u79fb\u6ce8\u610f\u529b" | |
| ], | |
| "reward": [ | |
| -2, | |
| -3, | |
| 5, | |
| -1, | |
| -3 | |
| ] | |
| }, | |
| { | |
| "prompt": "191191191191191191191191191191191191191191191191191191191191191191191191191191191191191191191191191191191191191191191191191191191191191191191191191191191191191191191191191191191191191191191191191191191191191191191191191191191191191191191191191191191191191191191191191191191191191191191191191191191191191191191191191191191191191191191191191191191191191191191191191191191191191191191191191191191191191191191191191191191191191191191191191191191191191191191191191191191191191191191191191191191191191191191191191191191191191191191191191191191191191191191191191191191191191191191", | |
| "completion": [ | |
| "\u5747\u8861\u996e\u98df\uff0c\u591a\u5403\u852c\u83dc\u6c34\u679c\uff0c\u5c11\u5403\u6cb9\u817b\u548c\u9ad8\u7cd6\u98df\u7269", | |
| "\u5b9a\u671f\u8fdb\u884c\u4f53\u80b2\u953b\u70bc\uff0c\u5982\u8dd1\u6b65\u3001\u6e38\u6cf3\u3001\u5065\u8eab\u7b49", | |
| "\u4fdd\u6301\u89c4\u5f8b\u7684\u4f5c\u606f\u65f6\u95f4\uff0c\u65e9\u7761\u65e9\u8d77", | |
| "\u4fdd\u6301\u826f\u597d\u7684\u5fc3\u6001\uff0c\u907f\u514d\u8fc7\u5ea6\u7126\u8651\u548c\u538b\u529b", | |
| "\u5b9a\u671f\u8fdb\u884c\u4f53\u68c0\uff0c\u53ca\u65f6\u53d1\u73b0\u548c\u9884\u9632\u75be\u75c5" | |
| ], | |
| "reward": [ | |
| 1, | |
| 2, | |
| -2, | |
| -2, | |
| -5 | |
| ] | |
| }, | |
| { | |
| "prompt": "192192192192192192192192192192192192192192192192192192192192192192192192192192192192192192192192192192192192192192192192192192192192192192192192192192192192192192192192192192192192192192192192192192192192192192192192192192192192192192192192192192192192192192192192192192192192192192192192192192192192192192192192192192192192192192192192192192192192192192192192192192192192192192192192192192192192192192192192192192192192192192192192192192192192192192192192192192192192192192192192192192192192192192192192192192192192192192192192192192192192192192192192192192192192192192192192", | |
| "completion": [ | |
| "\u5408\u7406\u5b89\u6392\u5de5\u4f5c\u4efb\u52a1\uff0c\u5236\u5b9a\u4f18\u5148\u7ea7", | |
| "\u907f\u514d\u591a\u4efb\u52a1\u5904\u7406\uff0c\u4e13\u6ce8\u5b8c\u6210\u4e00\u9879\u4efb\u52a1", | |
| "\u4f7f\u7528\u5de5\u5177\u548c\u8f6f\u4ef6\u63d0\u9ad8\u5de5\u4f5c\u81ea\u52a8\u5316\u7a0b\u5ea6", | |
| "\u5b9a\u671f\u4f11\u606f\uff0c\u907f\u514d\u957f\u65f6\u95f4\u8fde\u7eed\u5de5\u4f5c\u5bfc\u81f4\u75b2\u52b3", | |
| "\u4e0e\u540c\u4e8b\u6709\u6548\u6c9f\u901a\uff0c\u51cf\u5c11\u4e0d\u5fc5\u8981\u7684\u4f1a\u8bae\u548c\u5e72\u6270" | |
| ], | |
| "reward": [ | |
| -1, | |
| -2, | |
| -5, | |
| -5, | |
| -4 | |
| ] | |
| }, | |
| { | |
| "prompt": "193193193193193193193193193193193193193193193193193193193193193193193193193193193193193193193193193193193193193193193193193193193193193193193193193193193193193193193193193193193193193193193193193193193193193193193193193193193193193193193193193193193193193193193193193193193193193193193193193193193193193193193193193193193193193193193193193193193193193193193193193193193193193193193193193193193193193193193193193193193193193193193193193193193193193193193193193193193193193193193193193193193193193193193193193193193193193193193193193193193193193193193193193193193193193193193193193", | |
| "completion": [ | |
| "\u5c0a\u91cd\u4ed6\u4eba\uff0c\u503e\u542c\u4ed6\u4eba\u7684\u610f\u89c1\u548c\u60f3\u6cd5", | |
| "\u79ef\u6781\u6c9f\u901a\uff0c\u8868\u8fbe\u81ea\u5df1\u7684\u611f\u53d7\u548c\u9700\u6c42", | |
| "\u4e50\u4e8e\u52a9\u4eba\uff0c\u5173\u5fc3\u4ed6\u4eba\u7684\u56f0\u96be\u548c\u95ee\u9898", | |
| "\u4fdd\u6301\u8bda\u4fe1\uff0c\u9075\u5b88\u627f\u8bfa\u548c\u7ea6\u5b9a", | |
| "\u53c2\u4e0e\u793e\u4ea4\u6d3b\u52a8\uff0c\u6269\u5927\u81ea\u5df1\u7684\u793e\u4ea4\u5708\u5b50" | |
| ], | |
| "reward": [ | |
| 4, | |
| 2, | |
| 1, | |
| 5, | |
| -5 | |
| ] | |
| }, | |
| { | |
| "prompt": "194194194194194194194194194194194194194194194194194194194194194194194194194194194194194194194194194194194194194194194194194194194194194194194194194194194194194194194194194194194194194194194194194194194194194194194194194194194194194194194194194194194194194194194194194194194194194194194194194194194194194194194194194194194194194194194194194194194194194194194194194194194194194194194194194194194194194194194194194194194194194194194194194194194194194194194194194194194194194194194194194194194194194194194194194194194194194194194194194194194194194194194194194194194194194194194194194194", | |
| "completion": [ | |
| "\u8fdb\u884c\u653e\u677e\u8bad\u7ec3\uff0c\u5982\u6df1\u547c\u5438\u3001\u51a5\u60f3\u7b49", | |
| "\u9002\u5f53\u8fdb\u884c\u4f53\u80b2\u953b\u70bc\uff0c\u91ca\u653e\u538b\u529b", | |
| "\u4e0e\u670b\u53cb\u6216\u5bb6\u4eba\u4ea4\u6d41\uff0c\u5bfb\u6c42\u652f\u6301\u548c\u5e2e\u52a9", | |
| "\u5408\u7406\u5b89\u6392\u65f6\u95f4\uff0c\u907f\u514d\u8fc7\u5ea6\u5de5\u4f5c\u548c\u5b66\u4e60", | |
| "\u57f9\u517b\u5174\u8da3\u7231\u597d\uff0c\u8f6c\u79fb\u6ce8\u610f\u529b" | |
| ], | |
| "reward": [ | |
| -3, | |
| -2, | |
| -3, | |
| 2, | |
| 1 | |
| ] | |
| }, | |
| { | |
| "prompt": "195195195195195195195195195195195195195195195195195195195195195195195195195195195195195195195195195195195195195195195195195195195195195195195195195195195195195195195195195195195195195195195195195195195195195195195195195195195195195195195195195195195195195195195195195195195195195195195195195195195195195195195195195195195195195195195195195195195195195195195195195195195195195195195195195195195195195195195195195195195195195195195195195195195195195195195195195195195195195195195195195195195195195195195195195195195195195195195195195195195195195195195195195195195195195195195195195195195", | |
| "completion": [ | |
| "\u5747\u8861\u996e\u98df\uff0c\u591a\u5403\u852c\u83dc\u6c34\u679c\uff0c\u5c11\u5403\u6cb9\u817b\u548c\u9ad8\u7cd6\u98df\u7269", | |
| "\u5b9a\u671f\u8fdb\u884c\u4f53\u80b2\u953b\u70bc\uff0c\u5982\u8dd1\u6b65\u3001\u6e38\u6cf3\u3001\u5065\u8eab\u7b49", | |
| "\u4fdd\u6301\u89c4\u5f8b\u7684\u4f5c\u606f\u65f6\u95f4\uff0c\u65e9\u7761\u65e9\u8d77", | |
| "\u4fdd\u6301\u826f\u597d\u7684\u5fc3\u6001\uff0c\u907f\u514d\u8fc7\u5ea6\u7126\u8651\u548c\u538b\u529b", | |
| "\u5b9a\u671f\u8fdb\u884c\u4f53\u68c0\uff0c\u53ca\u65f6\u53d1\u73b0\u548c\u9884\u9632\u75be\u75c5" | |
| ], | |
| "reward": [ | |
| 3, | |
| 2, | |
| 4, | |
| 0, | |
| 5 | |
| ] | |
| }, | |
| { | |
| "prompt": "196196196196196196196196196196196196196196196196196196196196196196196196196196196196196196196196196196196196196196196196196196196196196196196196196196196196196196196196196196196196196196196196196196196196196196196196196196196196196196196196196196196196196196196196196196196196196196196196196196196196196196196196196196196196196196196196196196196196196196196196196196196196196196196196196196196196196196196196196196196196196196196196196196196196196196196196196196196196196196196196196196196196196196196196196196196196196196196196196196196196196196196196196196196196196196196196196196196196", | |
| "completion": [ | |
| "\u5408\u7406\u5b89\u6392\u5de5\u4f5c\u4efb\u52a1\uff0c\u5236\u5b9a\u4f18\u5148\u7ea7", | |
| "\u907f\u514d\u591a\u4efb\u52a1\u5904\u7406\uff0c\u4e13\u6ce8\u5b8c\u6210\u4e00\u9879\u4efb\u52a1", | |
| "\u4f7f\u7528\u5de5\u5177\u548c\u8f6f\u4ef6\u63d0\u9ad8\u5de5\u4f5c\u81ea\u52a8\u5316\u7a0b\u5ea6", | |
| "\u5b9a\u671f\u4f11\u606f\uff0c\u907f\u514d\u957f\u65f6\u95f4\u8fde\u7eed\u5de5\u4f5c\u5bfc\u81f4\u75b2\u52b3", | |
| "\u4e0e\u540c\u4e8b\u6709\u6548\u6c9f\u901a\uff0c\u51cf\u5c11\u4e0d\u5fc5\u8981\u7684\u4f1a\u8bae\u548c\u5e72\u6270" | |
| ], | |
| "reward": [ | |
| 2, | |
| -5, | |
| -2, | |
| -1, | |
| -1 | |
| ] | |
| }, | |
| { | |
| "prompt": "197197197197197197197197197197197197197197197197197197197197197197197197197197197197197197197197197197197197197197197197197197197197197197197197197197197197197197197197197197197197197197197197197197197197197197197197197197197197197197197197197197197197197197197197197197197197197197197197197197197197197197197197197197197197197197197197197197197197197197197197197197197197197197197197197197197197197197197197197197197197197197197197197197197197197197197197197197197197197197197197197197197197197197197197197197197197197197197197197197197197197197197197197197197197197197197197197197197197197", | |
| "completion": [ | |
| "\u5c0a\u91cd\u4ed6\u4eba\uff0c\u503e\u542c\u4ed6\u4eba\u7684\u610f\u89c1\u548c\u60f3\u6cd5", | |
| "\u79ef\u6781\u6c9f\u901a\uff0c\u8868\u8fbe\u81ea\u5df1\u7684\u611f\u53d7\u548c\u9700\u6c42", | |
| "\u4e50\u4e8e\u52a9\u4eba\uff0c\u5173\u5fc3\u4ed6\u4eba\u7684\u56f0\u96be\u548c\u95ee\u9898", | |
| "\u4fdd\u6301\u8bda\u4fe1\uff0c\u9075\u5b88\u627f\u8bfa\u548c\u7ea6\u5b9a", | |
| "\u53c2\u4e0e\u793e\u4ea4\u6d3b\u52a8\uff0c\u6269\u5927\u81ea\u5df1\u7684\u793e\u4ea4\u5708\u5b50" | |
| ], | |
| "reward": [ | |
| 2, | |
| -2, | |
| -1, | |
| -3, | |
| -4 | |
| ] | |
| }, | |
| { | |
| "prompt": "198198198198198198198198198198198198198198198198198198198198198198198198198198198198198198198198198198198198198198198198198198198198198198198198198198198198198198198198198198198198198198198198198198198198198198198198198198198198198198198198198198198198198198198198198198198198198198198198198198198198198198198198198198198198198198198198198198198198198198198198198198198198198198198198198198198198198198198198198198198198198198198198198198198198198198198198198198198198198198198198198198198198198198198198198198198198198198198198198198198198198198198198198198198198198198198198198198198198198198", | |
| "completion": [ | |
| "\u8fdb\u884c\u653e\u677e\u8bad\u7ec3\uff0c\u5982\u6df1\u547c\u5438\u3001\u51a5\u60f3\u7b49", | |
| "\u9002\u5f53\u8fdb\u884c\u4f53\u80b2\u953b\u70bc\uff0c\u91ca\u653e\u538b\u529b", | |
| "\u4e0e\u670b\u53cb\u6216\u5bb6\u4eba\u4ea4\u6d41\uff0c\u5bfb\u6c42\u652f\u6301\u548c\u5e2e\u52a9", | |
| "\u5408\u7406\u5b89\u6392\u65f6\u95f4\uff0c\u907f\u514d\u8fc7\u5ea6\u5de5\u4f5c\u548c\u5b66\u4e60", | |
| "\u57f9\u517b\u5174\u8da3\u7231\u597d\uff0c\u8f6c\u79fb\u6ce8\u610f\u529b" | |
| ], | |
| "reward": [ | |
| -4, | |
| 3, | |
| 0, | |
| 4, | |
| -3 | |
| ] | |
| }, | |
| { | |
| "prompt": "199199199199199199199199199199199199199199199199199199199199199199199199199199199199199199199199199199199199199199199199199199199199199199199199199199199199199199199199199199199199199199199199199199199199199199199199199199199199199199199199199199199199199199199199199199199199199199199199199199199199199199199199199199199199199199199199199199199199199199199199199199199199199199199199199199199199199199199199199199199199199199199199199199199199199199199199199199199199199199199199199199199199199199199199199199199199199199199199199199199199199199199199199199199199199199199199199199199199199199199", | |
| "completion": [ | |
| "\u5747\u8861\u996e\u98df\uff0c\u591a\u5403\u852c\u83dc\u6c34\u679c\uff0c\u5c11\u5403\u6cb9\u817b\u548c\u9ad8\u7cd6\u98df\u7269", | |
| "\u5b9a\u671f\u8fdb\u884c\u4f53\u80b2\u953b\u70bc\uff0c\u5982\u8dd1\u6b65\u3001\u6e38\u6cf3\u3001\u5065\u8eab\u7b49", | |
| "\u4fdd\u6301\u89c4\u5f8b\u7684\u4f5c\u606f\u65f6\u95f4\uff0c\u65e9\u7761\u65e9\u8d77", | |
| "\u4fdd\u6301\u826f\u597d\u7684\u5fc3\u6001\uff0c\u907f\u514d\u8fc7\u5ea6\u7126\u8651\u548c\u538b\u529b", | |
| "\u5b9a\u671f\u8fdb\u884c\u4f53\u68c0\uff0c\u53ca\u65f6\u53d1\u73b0\u548c\u9884\u9632\u75be\u75c5" | |
| ], | |
| "reward": [ | |
| 4, | |
| 4, | |
| 1, | |
| -3, | |
| -1 | |
| ] | |
| }, | |
| { | |
| "prompt": "200200200200200200200200200200200200200200200200200200200200200200200200200200200200200200200200200200200200200200200200200200200200200200200200200200200200200200200200200200200200200200200200200200200200200200200200200200200200200200200200200200200200200200200200200200200200200200200200200200200200200200200200200200200200200200200200200200200200200200200200200200200200200200200200200200200200200200200200200200200200200200200200200200200200200200200200200200200200200200200200200200200200200200200200200200200200200200200200200200200200200200200200200200200200200200200200200200200200200200200200", | |
| "completion": [ | |
| "\u5408\u7406\u5b89\u6392\u5de5\u4f5c\u4efb\u52a1\uff0c\u5236\u5b9a\u4f18\u5148\u7ea7", | |
| "\u907f\u514d\u591a\u4efb\u52a1\u5904\u7406\uff0c\u4e13\u6ce8\u5b8c\u6210\u4e00\u9879\u4efb\u52a1", | |
| "\u4f7f\u7528\u5de5\u5177\u548c\u8f6f\u4ef6\u63d0\u9ad8\u5de5\u4f5c\u81ea\u52a8\u5316\u7a0b\u5ea6", | |
| "\u5b9a\u671f\u4f11\u606f\uff0c\u907f\u514d\u957f\u65f6\u95f4\u8fde\u7eed\u5de5\u4f5c\u5bfc\u81f4\u75b2\u52b3", | |
| "\u4e0e\u540c\u4e8b\u6709\u6548\u6c9f\u901a\uff0c\u51cf\u5c11\u4e0d\u5fc5\u8981\u7684\u4f1a\u8bae\u548c\u5e72\u6270" | |
| ], | |
| "reward": [ | |
| 2, | |
| 2, | |
| -3, | |
| 4, | |
| 0 | |
| ] | |
| }, | |
| { | |
| "prompt": "201201201201201201201201201201201201201201201201201201201201201201201201201201201201201201201201201201201201201201201201201201201201201201201201201201201201201201201201201201201201201201201201201201201201201201201201201201201201201201201201201201201201201201201201201201201201201201201201201201201201201201201201201201201201201201201201201201201201201201201201201201201201201201201201201201201201201201201201201201201201201201201201201201201201201201201201201201201201201201201201201201201201201201201201201201201201201201201201201201201201201201201201201201201201201201201201201201201201201201201201201", | |
| "completion": [ | |
| "\u5c0a\u91cd\u4ed6\u4eba\uff0c\u503e\u542c\u4ed6\u4eba\u7684\u610f\u89c1\u548c\u60f3\u6cd5", | |
| "\u79ef\u6781\u6c9f\u901a\uff0c\u8868\u8fbe\u81ea\u5df1\u7684\u611f\u53d7\u548c\u9700\u6c42", | |
| "\u4e50\u4e8e\u52a9\u4eba\uff0c\u5173\u5fc3\u4ed6\u4eba\u7684\u56f0\u96be\u548c\u95ee\u9898", | |
| "\u4fdd\u6301\u8bda\u4fe1\uff0c\u9075\u5b88\u627f\u8bfa\u548c\u7ea6\u5b9a", | |
| "\u53c2\u4e0e\u793e\u4ea4\u6d3b\u52a8\uff0c\u6269\u5927\u81ea\u5df1\u7684\u793e\u4ea4\u5708\u5b50" | |
| ], | |
| "reward": [ | |
| 2, | |
| -2, | |
| 3, | |
| -3, | |
| 4 | |
| ] | |
| }, | |
| { | |
| "prompt": "202202202202202202202202202202202202202202202202202202202202202202202202202202202202202202202202202202202202202202202202202202202202202202202202202202202202202202202202202202202202202202202202202202202202202202202202202202202202202202202202202202202202202202202202202202202202202202202202202202202202202202202202202202202202202202202202202202202202202202202202202202202202202202202202202202202202202202202202202202202202202202202202202202202202202202202202202202202202202202202202202202202202202202202202202202202202202202202202202202202202202202202202202202202202202202202202202202202202202202202202202202", | |
| "completion": [ | |
| "\u8fdb\u884c\u653e\u677e\u8bad\u7ec3\uff0c\u5982\u6df1\u547c\u5438\u3001\u51a5\u60f3\u7b49", | |
| "\u9002\u5f53\u8fdb\u884c\u4f53\u80b2\u953b\u70bc\uff0c\u91ca\u653e\u538b\u529b", | |
| "\u4e0e\u670b\u53cb\u6216\u5bb6\u4eba\u4ea4\u6d41\uff0c\u5bfb\u6c42\u652f\u6301\u548c\u5e2e\u52a9", | |
| "\u5408\u7406\u5b89\u6392\u65f6\u95f4\uff0c\u907f\u514d\u8fc7\u5ea6\u5de5\u4f5c\u548c\u5b66\u4e60", | |
| "\u57f9\u517b\u5174\u8da3\u7231\u597d\uff0c\u8f6c\u79fb\u6ce8\u610f\u529b" | |
| ], | |
| "reward": [ | |
| 4, | |
| -1, | |
| 3, | |
| -4, | |
| -4 | |
| ] | |
| }, | |
| { | |
| "prompt": "203203203203203203203203203203203203203203203203203203203203203203203203203203203203203203203203203203203203203203203203203203203203203203203203203203203203203203203203203203203203203203203203203203203203203203203203203203203203203203203203203203203203203203203203203203203203203203203203203203203203203203203203203203203203203203203203203203203203203203203203203203203203203203203203203203203203203203203203203203203203203203203203203203203203203203203203203203203203203203203203203203203203203203203203203203203203203203203203203203203203203203203203203203203203203203203203203203203203203203203203203203203", | |
| "completion": [ | |
| "\u5747\u8861\u996e\u98df\uff0c\u591a\u5403\u852c\u83dc\u6c34\u679c\uff0c\u5c11\u5403\u6cb9\u817b\u548c\u9ad8\u7cd6\u98df\u7269", | |
| "\u5b9a\u671f\u8fdb\u884c\u4f53\u80b2\u953b\u70bc\uff0c\u5982\u8dd1\u6b65\u3001\u6e38\u6cf3\u3001\u5065\u8eab\u7b49", | |
| "\u4fdd\u6301\u89c4\u5f8b\u7684\u4f5c\u606f\u65f6\u95f4\uff0c\u65e9\u7761\u65e9\u8d77", | |
| "\u4fdd\u6301\u826f\u597d\u7684\u5fc3\u6001\uff0c\u907f\u514d\u8fc7\u5ea6\u7126\u8651\u548c\u538b\u529b", | |
| "\u5b9a\u671f\u8fdb\u884c\u4f53\u68c0\uff0c\u53ca\u65f6\u53d1\u73b0\u548c\u9884\u9632\u75be\u75c5" | |
| ], | |
| "reward": [ | |
| 2, | |
| -4, | |
| 2, | |
| -2, | |
| 0 | |
| ] | |
| }, | |
| { | |
| "prompt": "204204204204204204204204204204204204204204204204204204204204204204204204204204204204204204204204204204204204204204204204204204204204204204204204204204204204204204204204204204204204204204204204204204204204204204204204204204204204204204204204204204204204204204204204204204204204204204204204204204204204204204204204204204204204204204204204204204204204204204204204204204204204204204204204204204204204204204204204204204204204204204204204204204204204204204204204204204204204204204204204204204204204204204204204204204204204204204204204204204204204204204204204204204204204204204204204204204204204204204204204204204204204", | |
| "completion": [ | |
| "\u5408\u7406\u5b89\u6392\u5de5\u4f5c\u4efb\u52a1\uff0c\u5236\u5b9a\u4f18\u5148\u7ea7", | |
| "\u907f\u514d\u591a\u4efb\u52a1\u5904\u7406\uff0c\u4e13\u6ce8\u5b8c\u6210\u4e00\u9879\u4efb\u52a1", | |
| "\u4f7f\u7528\u5de5\u5177\u548c\u8f6f\u4ef6\u63d0\u9ad8\u5de5\u4f5c\u81ea\u52a8\u5316\u7a0b\u5ea6", | |
| "\u5b9a\u671f\u4f11\u606f\uff0c\u907f\u514d\u957f\u65f6\u95f4\u8fde\u7eed\u5de5\u4f5c\u5bfc\u81f4\u75b2\u52b3", | |
| "\u4e0e\u540c\u4e8b\u6709\u6548\u6c9f\u901a\uff0c\u51cf\u5c11\u4e0d\u5fc5\u8981\u7684\u4f1a\u8bae\u548c\u5e72\u6270" | |
| ], | |
| "reward": [ | |
| 2, | |
| -4, | |
| 5, | |
| -5, | |
| 5 | |
| ] | |
| }, | |
| { | |
| "prompt": "205205205205205205205205205205205205205205205205205205205205205205205205205205205205205205205205205205205205205205205205205205205205205205205205205205205205205205205205205205205205205205205205205205205205205205205205205205205205205205205205205205205205205205205205205205205205205205205205205205205205205205205205205205205205205205205205205205205205205205205205205205205205205205205205205205205205205205205205205205205205205205205205205205205205205205205205205205205205205205205205205205205205205205205205205205205205205205205205205205205205205205205205205205205205205205205205205205205205205205205205205205205205205", | |
| "completion": [ | |
| "\u5c0a\u91cd\u4ed6\u4eba\uff0c\u503e\u542c\u4ed6\u4eba\u7684\u610f\u89c1\u548c\u60f3\u6cd5", | |
| "\u79ef\u6781\u6c9f\u901a\uff0c\u8868\u8fbe\u81ea\u5df1\u7684\u611f\u53d7\u548c\u9700\u6c42", | |
| "\u4e50\u4e8e\u52a9\u4eba\uff0c\u5173\u5fc3\u4ed6\u4eba\u7684\u56f0\u96be\u548c\u95ee\u9898", | |
| "\u4fdd\u6301\u8bda\u4fe1\uff0c\u9075\u5b88\u627f\u8bfa\u548c\u7ea6\u5b9a", | |
| "\u53c2\u4e0e\u793e\u4ea4\u6d3b\u52a8\uff0c\u6269\u5927\u81ea\u5df1\u7684\u793e\u4ea4\u5708\u5b50" | |
| ], | |
| "reward": [ | |
| 2, | |
| 3, | |
| 4, | |
| 0, | |
| -3 | |
| ] | |
| }, | |
| { | |
| "prompt": "206206206206206206206206206206206206206206206206206206206206206206206206206206206206206206206206206206206206206206206206206206206206206206206206206206206206206206206206206206206206206206206206206206206206206206206206206206206206206206206206206206206206206206206206206206206206206206206206206206206206206206206206206206206206206206206206206206206206206206206206206206206206206206206206206206206206206206206206206206206206206206206206206206206206206206206206206206206206206206206206206206206206206206206206206206206206206206206206206206206206206206206206206206206206206206206206206206206206206206206206206206206206206206", | |
| "completion": [ | |
| "\u8fdb\u884c\u653e\u677e\u8bad\u7ec3\uff0c\u5982\u6df1\u547c\u5438\u3001\u51a5\u60f3\u7b49", | |
| "\u9002\u5f53\u8fdb\u884c\u4f53\u80b2\u953b\u70bc\uff0c\u91ca\u653e\u538b\u529b", | |
| "\u4e0e\u670b\u53cb\u6216\u5bb6\u4eba\u4ea4\u6d41\uff0c\u5bfb\u6c42\u652f\u6301\u548c\u5e2e\u52a9", | |
| "\u5408\u7406\u5b89\u6392\u65f6\u95f4\uff0c\u907f\u514d\u8fc7\u5ea6\u5de5\u4f5c\u548c\u5b66\u4e60", | |
| "\u57f9\u517b\u5174\u8da3\u7231\u597d\uff0c\u8f6c\u79fb\u6ce8\u610f\u529b" | |
| ], | |
| "reward": [ | |
| -5, | |
| -4, | |
| -3, | |
| -4, | |
| 4 | |
| ] | |
| }, | |
| { | |
| "prompt": "207207207207207207207207207207207207207207207207207207207207207207207207207207207207207207207207207207207207207207207207207207207207207207207207207207207207207207207207207207207207207207207207207207207207207207207207207207207207207207207207207207207207207207207207207207207207207207207207207207207207207207207207207207207207207207207207207207207207207207207207207207207207207207207207207207207207207207207207207207207207207207207207207207207207207207207207207207207207207207207207207207207207207207207207207207207207207207207207207207207207207207207207207207207207207207207207207207207207207207207207207207207207207207207", | |
| "completion": [ | |
| "\u5747\u8861\u996e\u98df\uff0c\u591a\u5403\u852c\u83dc\u6c34\u679c\uff0c\u5c11\u5403\u6cb9\u817b\u548c\u9ad8\u7cd6\u98df\u7269", | |
| "\u5b9a\u671f\u8fdb\u884c\u4f53\u80b2\u953b\u70bc\uff0c\u5982\u8dd1\u6b65\u3001\u6e38\u6cf3\u3001\u5065\u8eab\u7b49", | |
| "\u4fdd\u6301\u89c4\u5f8b\u7684\u4f5c\u606f\u65f6\u95f4\uff0c\u65e9\u7761\u65e9\u8d77", | |
| "\u4fdd\u6301\u826f\u597d\u7684\u5fc3\u6001\uff0c\u907f\u514d\u8fc7\u5ea6\u7126\u8651\u548c\u538b\u529b", | |
| "\u5b9a\u671f\u8fdb\u884c\u4f53\u68c0\uff0c\u53ca\u65f6\u53d1\u73b0\u548c\u9884\u9632\u75be\u75c5" | |
| ], | |
| "reward": [ | |
| 5, | |
| 1, | |
| 2, | |
| 1, | |
| 0 | |
| ] | |
| }, | |
| { | |
| "prompt": "208208208208208208208208208208208208208208208208208208208208208208208208208208208208208208208208208208208208208208208208208208208208208208208208208208208208208208208208208208208208208208208208208208208208208208208208208208208208208208208208208208208208208208208208208208208208208208208208208208208208208208208208208208208208208208208208208208208208208208208208208208208208208208208208208208208208208208208208208208208208208208208208208208208208208208208208208208208208208208208208208208208208208208208208208208208208208208208208208208208208208208208208208208208208208208208208208208208208208208208208208208208208208208208208", | |
| "completion": [ | |
| "\u5408\u7406\u5b89\u6392\u5de5\u4f5c\u4efb\u52a1\uff0c\u5236\u5b9a\u4f18\u5148\u7ea7", | |
| "\u907f\u514d\u591a\u4efb\u52a1\u5904\u7406\uff0c\u4e13\u6ce8\u5b8c\u6210\u4e00\u9879\u4efb\u52a1", | |
| "\u4f7f\u7528\u5de5\u5177\u548c\u8f6f\u4ef6\u63d0\u9ad8\u5de5\u4f5c\u81ea\u52a8\u5316\u7a0b\u5ea6", | |
| "\u5b9a\u671f\u4f11\u606f\uff0c\u907f\u514d\u957f\u65f6\u95f4\u8fde\u7eed\u5de5\u4f5c\u5bfc\u81f4\u75b2\u52b3", | |
| "\u4e0e\u540c\u4e8b\u6709\u6548\u6c9f\u901a\uff0c\u51cf\u5c11\u4e0d\u5fc5\u8981\u7684\u4f1a\u8bae\u548c\u5e72\u6270" | |
| ], | |
| "reward": [ | |
| 0, | |
| -5, | |
| -4, | |
| -4, | |
| 0 | |
| ] | |
| }, | |
| { | |
| "prompt": "209209209209209209209209209209209209209209209209209209209209209209209209209209209209209209209209209209209209209209209209209209209209209209209209209209209209209209209209209209209209209209209209209209209209209209209209209209209209209209209209209209209209209209209209209209209209209209209209209209209209209209209209209209209209209209209209209209209209209209209209209209209209209209209209209209209209209209209209209209209209209209209209209209209209209209209209209209209209209209209209209209209209209209209209209209209209209209209209209209209209209209209209209209209209209209209209209209209209209209209209209209209209209209209209209", | |
| "completion": [ | |
| "\u5c0a\u91cd\u4ed6\u4eba\uff0c\u503e\u542c\u4ed6\u4eba\u7684\u610f\u89c1\u548c\u60f3\u6cd5", | |
| "\u79ef\u6781\u6c9f\u901a\uff0c\u8868\u8fbe\u81ea\u5df1\u7684\u611f\u53d7\u548c\u9700\u6c42", | |
| "\u4e50\u4e8e\u52a9\u4eba\uff0c\u5173\u5fc3\u4ed6\u4eba\u7684\u56f0\u96be\u548c\u95ee\u9898", | |
| "\u4fdd\u6301\u8bda\u4fe1\uff0c\u9075\u5b88\u627f\u8bfa\u548c\u7ea6\u5b9a", | |
| "\u53c2\u4e0e\u793e\u4ea4\u6d3b\u52a8\uff0c\u6269\u5927\u81ea\u5df1\u7684\u793e\u4ea4\u5708\u5b50" | |
| ], | |
| "reward": [ | |
| -4, | |
| -4, | |
| -1, | |
| 1, | |
| 0 | |
| ] | |
| }, | |
| { | |
| "prompt": "210210210210210210210210210210210210210210210210210210210210210210210210210210210210210210210210210210210210210210210210210210210210210210210210210210210210210210210210210210210210210210210210210210210210210210210210210210210210210210210210210210210210210210210210210210210210210210210210210210210210210210210210210210210210210210210210210210210210210210210210210210210210210210210210210210210210210210210210210210210210210210210210210210210210210210210210210210210210210210210210210210210210210210210210210210210210210210210210210210210210210210210210210210210210210210210210210210210210210210210210210210210210210210210210210210", | |
| "completion": [ | |
| "\u8fdb\u884c\u653e\u677e\u8bad\u7ec3\uff0c\u5982\u6df1\u547c\u5438\u3001\u51a5\u60f3\u7b49", | |
| "\u9002\u5f53\u8fdb\u884c\u4f53\u80b2\u953b\u70bc\uff0c\u91ca\u653e\u538b\u529b", | |
| "\u4e0e\u670b\u53cb\u6216\u5bb6\u4eba\u4ea4\u6d41\uff0c\u5bfb\u6c42\u652f\u6301\u548c\u5e2e\u52a9", | |
| "\u5408\u7406\u5b89\u6392\u65f6\u95f4\uff0c\u907f\u514d\u8fc7\u5ea6\u5de5\u4f5c\u548c\u5b66\u4e60", | |
| "\u57f9\u517b\u5174\u8da3\u7231\u597d\uff0c\u8f6c\u79fb\u6ce8\u610f\u529b" | |
| ], | |
| "reward": [ | |
| -1, | |
| -3, | |
| 1, | |
| 1, | |
| -1 | |
| ] | |
| }, | |
| { | |
| "prompt": "211211211211211211211211211211211211211211211211211211211211211211211211211211211211211211211211211211211211211211211211211211211211211211211211211211211211211211211211211211211211211211211211211211211211211211211211211211211211211211211211211211211211211211211211211211211211211211211211211211211211211211211211211211211211211211211211211211211211211211211211211211211211211211211211211211211211211211211211211211211211211211211211211211211211211211211211211211211211211211211211211211211211211211211211211211211211211211211211211211211211211211211211211211211211211211211211211211211211211211211211211211211211211211211211211211211", | |
| "completion": [ | |
| "\u5747\u8861\u996e\u98df\uff0c\u591a\u5403\u852c\u83dc\u6c34\u679c\uff0c\u5c11\u5403\u6cb9\u817b\u548c\u9ad8\u7cd6\u98df\u7269", | |
| "\u5b9a\u671f\u8fdb\u884c\u4f53\u80b2\u953b\u70bc\uff0c\u5982\u8dd1\u6b65\u3001\u6e38\u6cf3\u3001\u5065\u8eab\u7b49", | |
| "\u4fdd\u6301\u89c4\u5f8b\u7684\u4f5c\u606f\u65f6\u95f4\uff0c\u65e9\u7761\u65e9\u8d77", | |
| "\u4fdd\u6301\u826f\u597d\u7684\u5fc3\u6001\uff0c\u907f\u514d\u8fc7\u5ea6\u7126\u8651\u548c\u538b\u529b", | |
| "\u5b9a\u671f\u8fdb\u884c\u4f53\u68c0\uff0c\u53ca\u65f6\u53d1\u73b0\u548c\u9884\u9632\u75be\u75c5" | |
| ], | |
| "reward": [ | |
| 1, | |
| -2, | |
| -3, | |
| 2, | |
| 3 | |
| ] | |
| }, | |
| { | |
| "prompt": "212212212212212212212212212212212212212212212212212212212212212212212212212212212212212212212212212212212212212212212212212212212212212212212212212212212212212212212212212212212212212212212212212212212212212212212212212212212212212212212212212212212212212212212212212212212212212212212212212212212212212212212212212212212212212212212212212212212212212212212212212212212212212212212212212212212212212212212212212212212212212212212212212212212212212212212212212212212212212212212212212212212212212212212212212212212212212212212212212212212212212212212212212212212212212212212212212212212212212212212212212212212212212212212212212212212212", | |
| "completion": [ | |
| "\u5408\u7406\u5b89\u6392\u5de5\u4f5c\u4efb\u52a1\uff0c\u5236\u5b9a\u4f18\u5148\u7ea7", | |
| "\u907f\u514d\u591a\u4efb\u52a1\u5904\u7406\uff0c\u4e13\u6ce8\u5b8c\u6210\u4e00\u9879\u4efb\u52a1", | |
| "\u4f7f\u7528\u5de5\u5177\u548c\u8f6f\u4ef6\u63d0\u9ad8\u5de5\u4f5c\u81ea\u52a8\u5316\u7a0b\u5ea6", | |
| "\u5b9a\u671f\u4f11\u606f\uff0c\u907f\u514d\u957f\u65f6\u95f4\u8fde\u7eed\u5de5\u4f5c\u5bfc\u81f4\u75b2\u52b3", | |
| "\u4e0e\u540c\u4e8b\u6709\u6548\u6c9f\u901a\uff0c\u51cf\u5c11\u4e0d\u5fc5\u8981\u7684\u4f1a\u8bae\u548c\u5e72\u6270" | |
| ], | |
| "reward": [ | |
| -2, | |
| 4, | |
| -2, | |
| 3, | |
| -4 | |
| ] | |
| }, | |
| { | |
| "prompt": "213213213213213213213213213213213213213213213213213213213213213213213213213213213213213213213213213213213213213213213213213213213213213213213213213213213213213213213213213213213213213213213213213213213213213213213213213213213213213213213213213213213213213213213213213213213213213213213213213213213213213213213213213213213213213213213213213213213213213213213213213213213213213213213213213213213213213213213213213213213213213213213213213213213213213213213213213213213213213213213213213213213213213213213213213213213213213213213213213213213213213213213213213213213213213213213213213213213213213213213213213213213213213213213213213213213213213", | |
| "completion": [ | |
| "\u5c0a\u91cd\u4ed6\u4eba\uff0c\u503e\u542c\u4ed6\u4eba\u7684\u610f\u89c1\u548c\u60f3\u6cd5", | |
| "\u79ef\u6781\u6c9f\u901a\uff0c\u8868\u8fbe\u81ea\u5df1\u7684\u611f\u53d7\u548c\u9700\u6c42", | |
| "\u4e50\u4e8e\u52a9\u4eba\uff0c\u5173\u5fc3\u4ed6\u4eba\u7684\u56f0\u96be\u548c\u95ee\u9898", | |
| "\u4fdd\u6301\u8bda\u4fe1\uff0c\u9075\u5b88\u627f\u8bfa\u548c\u7ea6\u5b9a", | |
| "\u53c2\u4e0e\u793e\u4ea4\u6d3b\u52a8\uff0c\u6269\u5927\u81ea\u5df1\u7684\u793e\u4ea4\u5708\u5b50" | |
| ], | |
| "reward": [ | |
| 5, | |
| 3, | |
| 5, | |
| 2, | |
| -4 | |
| ] | |
| }, | |
| { | |
| "prompt": "214214214214214214214214214214214214214214214214214214214214214214214214214214214214214214214214214214214214214214214214214214214214214214214214214214214214214214214214214214214214214214214214214214214214214214214214214214214214214214214214214214214214214214214214214214214214214214214214214214214214214214214214214214214214214214214214214214214214214214214214214214214214214214214214214214214214214214214214214214214214214214214214214214214214214214214214214214214214214214214214214214214214214214214214214214214214214214214214214214214214214214214214214214214214214214214214214214214214214214214214214214214214214214214214214214214214214214", | |
| "completion": [ | |
| "\u8fdb\u884c\u653e\u677e\u8bad\u7ec3\uff0c\u5982\u6df1\u547c\u5438\u3001\u51a5\u60f3\u7b49", | |
| "\u9002\u5f53\u8fdb\u884c\u4f53\u80b2\u953b\u70bc\uff0c\u91ca\u653e\u538b\u529b", | |
| "\u4e0e\u670b\u53cb\u6216\u5bb6\u4eba\u4ea4\u6d41\uff0c\u5bfb\u6c42\u652f\u6301\u548c\u5e2e\u52a9", | |
| "\u5408\u7406\u5b89\u6392\u65f6\u95f4\uff0c\u907f\u514d\u8fc7\u5ea6\u5de5\u4f5c\u548c\u5b66\u4e60", | |
| "\u57f9\u517b\u5174\u8da3\u7231\u597d\uff0c\u8f6c\u79fb\u6ce8\u610f\u529b" | |
| ], | |
| "reward": [ | |
| -2, | |
| -3, | |
| -1, | |
| -4, | |
| 2 | |
| ] | |
| }, | |
| { | |
| "prompt": "215215215215215215215215215215215215215215215215215215215215215215215215215215215215215215215215215215215215215215215215215215215215215215215215215215215215215215215215215215215215215215215215215215215215215215215215215215215215215215215215215215215215215215215215215215215215215215215215215215215215215215215215215215215215215215215215215215215215215215215215215215215215215215215215215215215215215215215215215215215215215215215215215215215215215215215215215215215215215215215215215215215215215215215215215215215215215215215215215215215215215215215215215215215215215215215215215215215215215215215215215215215215215215215215215215215215215215215", | |
| "completion": [ | |
| "\u5747\u8861\u996e\u98df\uff0c\u591a\u5403\u852c\u83dc\u6c34\u679c\uff0c\u5c11\u5403\u6cb9\u817b\u548c\u9ad8\u7cd6\u98df\u7269", | |
| "\u5b9a\u671f\u8fdb\u884c\u4f53\u80b2\u953b\u70bc\uff0c\u5982\u8dd1\u6b65\u3001\u6e38\u6cf3\u3001\u5065\u8eab\u7b49", | |
| "\u4fdd\u6301\u89c4\u5f8b\u7684\u4f5c\u606f\u65f6\u95f4\uff0c\u65e9\u7761\u65e9\u8d77", | |
| "\u4fdd\u6301\u826f\u597d\u7684\u5fc3\u6001\uff0c\u907f\u514d\u8fc7\u5ea6\u7126\u8651\u548c\u538b\u529b", | |
| "\u5b9a\u671f\u8fdb\u884c\u4f53\u68c0\uff0c\u53ca\u65f6\u53d1\u73b0\u548c\u9884\u9632\u75be\u75c5" | |
| ], | |
| "reward": [ | |
| -4, | |
| 5, | |
| -5, | |
| 3, | |
| 4 | |
| ] | |
| }, | |
| { | |
| "prompt": "216216216216216216216216216216216216216216216216216216216216216216216216216216216216216216216216216216216216216216216216216216216216216216216216216216216216216216216216216216216216216216216216216216216216216216216216216216216216216216216216216216216216216216216216216216216216216216216216216216216216216216216216216216216216216216216216216216216216216216216216216216216216216216216216216216216216216216216216216216216216216216216216216216216216216216216216216216216216216216216216216216216216216216216216216216216216216216216216216216216216216216216216216216216216216216216216216216216216216216216216216216216216216216216216216216216216216216216216", | |
| "completion": [ | |
| "\u5408\u7406\u5b89\u6392\u5de5\u4f5c\u4efb\u52a1\uff0c\u5236\u5b9a\u4f18\u5148\u7ea7", | |
| "\u907f\u514d\u591a\u4efb\u52a1\u5904\u7406\uff0c\u4e13\u6ce8\u5b8c\u6210\u4e00\u9879\u4efb\u52a1", | |
| "\u4f7f\u7528\u5de5\u5177\u548c\u8f6f\u4ef6\u63d0\u9ad8\u5de5\u4f5c\u81ea\u52a8\u5316\u7a0b\u5ea6", | |
| "\u5b9a\u671f\u4f11\u606f\uff0c\u907f\u514d\u957f\u65f6\u95f4\u8fde\u7eed\u5de5\u4f5c\u5bfc\u81f4\u75b2\u52b3", | |
| "\u4e0e\u540c\u4e8b\u6709\u6548\u6c9f\u901a\uff0c\u51cf\u5c11\u4e0d\u5fc5\u8981\u7684\u4f1a\u8bae\u548c\u5e72\u6270" | |
| ], | |
| "reward": [ | |
| 2, | |
| 3, | |
| 2, | |
| 2, | |
| 1 | |
| ] | |
| }, | |
| { | |
| "prompt": "217217217217217217217217217217217217217217217217217217217217217217217217217217217217217217217217217217217217217217217217217217217217217217217217217217217217217217217217217217217217217217217217217217217217217217217217217217217217217217217217217217217217217217217217217217217217217217217217217217217217217217217217217217217217217217217217217217217217217217217217217217217217217217217217217217217217217217217217217217217217217217217217217217217217217217217217217217217217217217217217217217217217217217217217217217217217217217217217217217217217217217217217217217217217217217217217217217217217217217217217217217217217217217217217217217217217217217217217217", | |
| "completion": [ | |
| "\u5c0a\u91cd\u4ed6\u4eba\uff0c\u503e\u542c\u4ed6\u4eba\u7684\u610f\u89c1\u548c\u60f3\u6cd5", | |
| "\u79ef\u6781\u6c9f\u901a\uff0c\u8868\u8fbe\u81ea\u5df1\u7684\u611f\u53d7\u548c\u9700\u6c42", | |
| "\u4e50\u4e8e\u52a9\u4eba\uff0c\u5173\u5fc3\u4ed6\u4eba\u7684\u56f0\u96be\u548c\u95ee\u9898", | |
| "\u4fdd\u6301\u8bda\u4fe1\uff0c\u9075\u5b88\u627f\u8bfa\u548c\u7ea6\u5b9a", | |
| "\u53c2\u4e0e\u793e\u4ea4\u6d3b\u52a8\uff0c\u6269\u5927\u81ea\u5df1\u7684\u793e\u4ea4\u5708\u5b50" | |
| ], | |
| "reward": [ | |
| 3, | |
| 4, | |
| -3, | |
| 1, | |
| 5 | |
| ] | |
| }, | |
| { | |
| "prompt": "218218218218218218218218218218218218218218218218218218218218218218218218218218218218218218218218218218218218218218218218218218218218218218218218218218218218218218218218218218218218218218218218218218218218218218218218218218218218218218218218218218218218218218218218218218218218218218218218218218218218218218218218218218218218218218218218218218218218218218218218218218218218218218218218218218218218218218218218218218218218218218218218218218218218218218218218218218218218218218218218218218218218218218218218218218218218218218218218218218218218218218218218218218218218218218218218218218218218218218218218218218218218218218218218218218218218218218218218218218", | |
| "completion": [ | |
| "\u8fdb\u884c\u653e\u677e\u8bad\u7ec3\uff0c\u5982\u6df1\u547c\u5438\u3001\u51a5\u60f3\u7b49", | |
| "\u9002\u5f53\u8fdb\u884c\u4f53\u80b2\u953b\u70bc\uff0c\u91ca\u653e\u538b\u529b", | |
| "\u4e0e\u670b\u53cb\u6216\u5bb6\u4eba\u4ea4\u6d41\uff0c\u5bfb\u6c42\u652f\u6301\u548c\u5e2e\u52a9", | |
| "\u5408\u7406\u5b89\u6392\u65f6\u95f4\uff0c\u907f\u514d\u8fc7\u5ea6\u5de5\u4f5c\u548c\u5b66\u4e60", | |
| "\u57f9\u517b\u5174\u8da3\u7231\u597d\uff0c\u8f6c\u79fb\u6ce8\u610f\u529b" | |
| ], | |
| "reward": [ | |
| 3, | |
| 5, | |
| 1, | |
| -3, | |
| 4 | |
| ] | |
| }, | |
| { | |
| "prompt": "219219219219219219219219219219219219219219219219219219219219219219219219219219219219219219219219219219219219219219219219219219219219219219219219219219219219219219219219219219219219219219219219219219219219219219219219219219219219219219219219219219219219219219219219219219219219219219219219219219219219219219219219219219219219219219219219219219219219219219219219219219219219219219219219219219219219219219219219219219219219219219219219219219219219219219219219219219219219219219219219219219219219219219219219219219219219219219219219219219219219219219219219219219219219219219219219219219219219219219219219219219219219219219219219219219219219219219219219219219219", | |
| "completion": [ | |
| "\u5747\u8861\u996e\u98df\uff0c\u591a\u5403\u852c\u83dc\u6c34\u679c\uff0c\u5c11\u5403\u6cb9\u817b\u548c\u9ad8\u7cd6\u98df\u7269", | |
| "\u5b9a\u671f\u8fdb\u884c\u4f53\u80b2\u953b\u70bc\uff0c\u5982\u8dd1\u6b65\u3001\u6e38\u6cf3\u3001\u5065\u8eab\u7b49", | |
| "\u4fdd\u6301\u89c4\u5f8b\u7684\u4f5c\u606f\u65f6\u95f4\uff0c\u65e9\u7761\u65e9\u8d77", | |
| "\u4fdd\u6301\u826f\u597d\u7684\u5fc3\u6001\uff0c\u907f\u514d\u8fc7\u5ea6\u7126\u8651\u548c\u538b\u529b", | |
| "\u5b9a\u671f\u8fdb\u884c\u4f53\u68c0\uff0c\u53ca\u65f6\u53d1\u73b0\u548c\u9884\u9632\u75be\u75c5" | |
| ], | |
| "reward": [ | |
| -4, | |
| 4, | |
| 4, | |
| 5, | |
| 2 | |
| ] | |
| }, | |
| { | |
| "prompt": "220220220220220220220220220220220220220220220220220220220220220220220220220220220220220220220220220220220220220220220220220220220220220220220220220220220220220220220220220220220220220220220220220220220220220220220220220220220220220220220220220220220220220220220220220220220220220220220220220220220220220220220220220220220220220220220220220220220220220220220220220220220220220220220220220220220220220220220220220220220220220220220220220220220220220220220220220220220220220220220220220220220220220220220220220220220220220220220220220220220220220220220220220220220220220220220220220220220220220220220220220220220220220220220220220220220220220220220220220220220220", | |
| "completion": [ | |
| "\u5408\u7406\u5b89\u6392\u5de5\u4f5c\u4efb\u52a1\uff0c\u5236\u5b9a\u4f18\u5148\u7ea7", | |
| "\u907f\u514d\u591a\u4efb\u52a1\u5904\u7406\uff0c\u4e13\u6ce8\u5b8c\u6210\u4e00\u9879\u4efb\u52a1", | |
| "\u4f7f\u7528\u5de5\u5177\u548c\u8f6f\u4ef6\u63d0\u9ad8\u5de5\u4f5c\u81ea\u52a8\u5316\u7a0b\u5ea6", | |
| "\u5b9a\u671f\u4f11\u606f\uff0c\u907f\u514d\u957f\u65f6\u95f4\u8fde\u7eed\u5de5\u4f5c\u5bfc\u81f4\u75b2\u52b3", | |
| "\u4e0e\u540c\u4e8b\u6709\u6548\u6c9f\u901a\uff0c\u51cf\u5c11\u4e0d\u5fc5\u8981\u7684\u4f1a\u8bae\u548c\u5e72\u6270" | |
| ], | |
| "reward": [ | |
| 2, | |
| 0, | |
| -4, | |
| 4, | |
| 3 | |
| ] | |
| }, | |
| { | |
| "prompt": "221221221221221221221221221221221221221221221221221221221221221221221221221221221221221221221221221221221221221221221221221221221221221221221221221221221221221221221221221221221221221221221221221221221221221221221221221221221221221221221221221221221221221221221221221221221221221221221221221221221221221221221221221221221221221221221221221221221221221221221221221221221221221221221221221221221221221221221221221221221221221221221221221221221221221221221221221221221221221221221221221221221221221221221221221221221221221221221221221221221221221221221221221221221221221221221221221221221221221221221221221221221221221221221221221221221221221221221221221221221221221", | |
| "completion": [ | |
| "\u5c0a\u91cd\u4ed6\u4eba\uff0c\u503e\u542c\u4ed6\u4eba\u7684\u610f\u89c1\u548c\u60f3\u6cd5", | |
| "\u79ef\u6781\u6c9f\u901a\uff0c\u8868\u8fbe\u81ea\u5df1\u7684\u611f\u53d7\u548c\u9700\u6c42", | |
| "\u4e50\u4e8e\u52a9\u4eba\uff0c\u5173\u5fc3\u4ed6\u4eba\u7684\u56f0\u96be\u548c\u95ee\u9898", | |
| "\u4fdd\u6301\u8bda\u4fe1\uff0c\u9075\u5b88\u627f\u8bfa\u548c\u7ea6\u5b9a", | |
| "\u53c2\u4e0e\u793e\u4ea4\u6d3b\u52a8\uff0c\u6269\u5927\u81ea\u5df1\u7684\u793e\u4ea4\u5708\u5b50" | |
| ], | |
| "reward": [ | |
| -3, | |
| 5, | |
| 4, | |
| 0, | |
| -1 | |
| ] | |
| }, | |
| { | |
| "prompt": "222222222222222222222222222222222222222222222222222222222222222222222222222222222222222222222222222222222222222222222222222222222222222222222222222222222222222222222222222222222222222222222222222222222222222222222222222222222222222222222222222222222222222222222222222222222222222222222222222222222222222222222222222222222222222222222222222222222222222222222222222222222222222222222222222222222222222222222222222222222222222222222222222222222222222222222222222222222222222222222222222222222222222222222222222222222222222222222222222222222222222222222222222222222222222222222222222222222222222222222222222222222222222222222222222222222222222222222222222222222222222222", | |
| "completion": [ | |
| "\u8fdb\u884c\u653e\u677e\u8bad\u7ec3\uff0c\u5982\u6df1\u547c\u5438\u3001\u51a5\u60f3\u7b49", | |
| "\u9002\u5f53\u8fdb\u884c\u4f53\u80b2\u953b\u70bc\uff0c\u91ca\u653e\u538b\u529b", | |
| "\u4e0e\u670b\u53cb\u6216\u5bb6\u4eba\u4ea4\u6d41\uff0c\u5bfb\u6c42\u652f\u6301\u548c\u5e2e\u52a9", | |
| "\u5408\u7406\u5b89\u6392\u65f6\u95f4\uff0c\u907f\u514d\u8fc7\u5ea6\u5de5\u4f5c\u548c\u5b66\u4e60", | |
| "\u57f9\u517b\u5174\u8da3\u7231\u597d\uff0c\u8f6c\u79fb\u6ce8\u610f\u529b" | |
| ], | |
| "reward": [ | |
| -1, | |
| -2, | |
| 5, | |
| -5, | |
| 1 | |
| ] | |
| }, | |
| { | |
| "prompt": "223223223223223223223223223223223223223223223223223223223223223223223223223223223223223223223223223223223223223223223223223223223223223223223223223223223223223223223223223223223223223223223223223223223223223223223223223223223223223223223223223223223223223223223223223223223223223223223223223223223223223223223223223223223223223223223223223223223223223223223223223223223223223223223223223223223223223223223223223223223223223223223223223223223223223223223223223223223223223223223223223223223223223223223223223223223223223223223223223223223223223223223223223223223223223223223223223223223223223223223223223223223223223223223223223223223223223223223223223223223223223223223", | |
| "completion": [ | |
| "\u5747\u8861\u996e\u98df\uff0c\u591a\u5403\u852c\u83dc\u6c34\u679c\uff0c\u5c11\u5403\u6cb9\u817b\u548c\u9ad8\u7cd6\u98df\u7269", | |
| "\u5b9a\u671f\u8fdb\u884c\u4f53\u80b2\u953b\u70bc\uff0c\u5982\u8dd1\u6b65\u3001\u6e38\u6cf3\u3001\u5065\u8eab\u7b49", | |
| "\u4fdd\u6301\u89c4\u5f8b\u7684\u4f5c\u606f\u65f6\u95f4\uff0c\u65e9\u7761\u65e9\u8d77", | |
| "\u4fdd\u6301\u826f\u597d\u7684\u5fc3\u6001\uff0c\u907f\u514d\u8fc7\u5ea6\u7126\u8651\u548c\u538b\u529b", | |
| "\u5b9a\u671f\u8fdb\u884c\u4f53\u68c0\uff0c\u53ca\u65f6\u53d1\u73b0\u548c\u9884\u9632\u75be\u75c5" | |
| ], | |
| "reward": [ | |
| 2, | |
| 0, | |
| 4, | |
| 2, | |
| 5 | |
| ] | |
| }, | |
| { | |
| "prompt": "224224224224224224224224224224224224224224224224224224224224224224224224224224224224224224224224224224224224224224224224224224224224224224224224224224224224224224224224224224224224224224224224224224224224224224224224224224224224224224224224224224224224224224224224224224224224224224224224224224224224224224224224224224224224224224224224224224224224224224224224224224224224224224224224224224224224224224224224224224224224224224224224224224224224224224224224224224224224224224224224224224224224224224224224224224224224224224224224224224224224224224224224224224224224224224224224224224224224224224224224224224224224224224224224224224224224224224224224224224224224224224224224", | |
| "completion": [ | |
| "\u5408\u7406\u5b89\u6392\u5de5\u4f5c\u4efb\u52a1\uff0c\u5236\u5b9a\u4f18\u5148\u7ea7", | |
| "\u907f\u514d\u591a\u4efb\u52a1\u5904\u7406\uff0c\u4e13\u6ce8\u5b8c\u6210\u4e00\u9879\u4efb\u52a1", | |
| "\u4f7f\u7528\u5de5\u5177\u548c\u8f6f\u4ef6\u63d0\u9ad8\u5de5\u4f5c\u81ea\u52a8\u5316\u7a0b\u5ea6", | |
| "\u5b9a\u671f\u4f11\u606f\uff0c\u907f\u514d\u957f\u65f6\u95f4\u8fde\u7eed\u5de5\u4f5c\u5bfc\u81f4\u75b2\u52b3", | |
| "\u4e0e\u540c\u4e8b\u6709\u6548\u6c9f\u901a\uff0c\u51cf\u5c11\u4e0d\u5fc5\u8981\u7684\u4f1a\u8bae\u548c\u5e72\u6270" | |
| ], | |
| "reward": [ | |
| 2, | |
| 1, | |
| -4, | |
| 2, | |
| -5 | |
| ] | |
| }, | |
| { | |
| "prompt": "225225225225225225225225225225225225225225225225225225225225225225225225225225225225225225225225225225225225225225225225225225225225225225225225225225225225225225225225225225225225225225225225225225225225225225225225225225225225225225225225225225225225225225225225225225225225225225225225225225225225225225225225225225225225225225225225225225225225225225225225225225225225225225225225225225225225225225225225225225225225225225225225225225225225225225225225225225225225225225225225225225225225225225225225225225225225225225225225225225225225225225225225225225225225225225225225225225225225225225225225225225225225225225225225225225225225225225225225225225225225225225225225225", | |
| "completion": [ | |
| "\u5c0a\u91cd\u4ed6\u4eba\uff0c\u503e\u542c\u4ed6\u4eba\u7684\u610f\u89c1\u548c\u60f3\u6cd5", | |
| "\u79ef\u6781\u6c9f\u901a\uff0c\u8868\u8fbe\u81ea\u5df1\u7684\u611f\u53d7\u548c\u9700\u6c42", | |
| "\u4e50\u4e8e\u52a9\u4eba\uff0c\u5173\u5fc3\u4ed6\u4eba\u7684\u56f0\u96be\u548c\u95ee\u9898", | |
| "\u4fdd\u6301\u8bda\u4fe1\uff0c\u9075\u5b88\u627f\u8bfa\u548c\u7ea6\u5b9a", | |
| "\u53c2\u4e0e\u793e\u4ea4\u6d3b\u52a8\uff0c\u6269\u5927\u81ea\u5df1\u7684\u793e\u4ea4\u5708\u5b50" | |
| ], | |
| "reward": [ | |
| -3, | |
| 4, | |
| 1, | |
| 4, | |
| -2 | |
| ] | |
| }, | |
| { | |
| "prompt": "226226226226226226226226226226226226226226226226226226226226226226226226226226226226226226226226226226226226226226226226226226226226226226226226226226226226226226226226226226226226226226226226226226226226226226226226226226226226226226226226226226226226226226226226226226226226226226226226226226226226226226226226226226226226226226226226226226226226226226226226226226226226226226226226226226226226226226226226226226226226226226226226226226226226226226226226226226226226226226226226226226226226226226226226226226226226226226226226226226226226226226226226226226226226226226226226226226226226226226226226226226226226226226226226226226226226226226226226226226226226226226226226226226", | |
| "completion": [ | |
| "\u8fdb\u884c\u653e\u677e\u8bad\u7ec3\uff0c\u5982\u6df1\u547c\u5438\u3001\u51a5\u60f3\u7b49", | |
| "\u9002\u5f53\u8fdb\u884c\u4f53\u80b2\u953b\u70bc\uff0c\u91ca\u653e\u538b\u529b", | |
| "\u4e0e\u670b\u53cb\u6216\u5bb6\u4eba\u4ea4\u6d41\uff0c\u5bfb\u6c42\u652f\u6301\u548c\u5e2e\u52a9", | |
| "\u5408\u7406\u5b89\u6392\u65f6\u95f4\uff0c\u907f\u514d\u8fc7\u5ea6\u5de5\u4f5c\u548c\u5b66\u4e60", | |
| "\u57f9\u517b\u5174\u8da3\u7231\u597d\uff0c\u8f6c\u79fb\u6ce8\u610f\u529b" | |
| ], | |
| "reward": [ | |
| -5, | |
| -2, | |
| -4, | |
| -1, | |
| -1 | |
| ] | |
| }, | |
| { | |
| "prompt": "227227227227227227227227227227227227227227227227227227227227227227227227227227227227227227227227227227227227227227227227227227227227227227227227227227227227227227227227227227227227227227227227227227227227227227227227227227227227227227227227227227227227227227227227227227227227227227227227227227227227227227227227227227227227227227227227227227227227227227227227227227227227227227227227227227227227227227227227227227227227227227227227227227227227227227227227227227227227227227227227227227227227227227227227227227227227227227227227227227227227227227227227227227227227227227227227227227227227227227227227227227227227227227227227227227227227227227227227227227227227227227227227227227227", | |
| "completion": [ | |
| "\u5747\u8861\u996e\u98df\uff0c\u591a\u5403\u852c\u83dc\u6c34\u679c\uff0c\u5c11\u5403\u6cb9\u817b\u548c\u9ad8\u7cd6\u98df\u7269", | |
| "\u5b9a\u671f\u8fdb\u884c\u4f53\u80b2\u953b\u70bc\uff0c\u5982\u8dd1\u6b65\u3001\u6e38\u6cf3\u3001\u5065\u8eab\u7b49", | |
| "\u4fdd\u6301\u89c4\u5f8b\u7684\u4f5c\u606f\u65f6\u95f4\uff0c\u65e9\u7761\u65e9\u8d77", | |
| "\u4fdd\u6301\u826f\u597d\u7684\u5fc3\u6001\uff0c\u907f\u514d\u8fc7\u5ea6\u7126\u8651\u548c\u538b\u529b", | |
| "\u5b9a\u671f\u8fdb\u884c\u4f53\u68c0\uff0c\u53ca\u65f6\u53d1\u73b0\u548c\u9884\u9632\u75be\u75c5" | |
| ], | |
| "reward": [ | |
| -4, | |
| 1, | |
| -1, | |
| 4, | |
| 2 | |
| ] | |
| }, | |
| { | |
| "prompt": "228228228228228228228228228228228228228228228228228228228228228228228228228228228228228228228228228228228228228228228228228228228228228228228228228228228228228228228228228228228228228228228228228228228228228228228228228228228228228228228228228228228228228228228228228228228228228228228228228228228228228228228228228228228228228228228228228228228228228228228228228228228228228228228228228228228228228228228228228228228228228228228228228228228228228228228228228228228228228228228228228228228228228228228228228228228228228228228228228228228228228228228228228228228228228228228228228228228228228228228228228228228228228228228228228228228228228228228228228228228228228228228228228228228228", | |
| "completion": [ | |
| "\u5408\u7406\u5b89\u6392\u5de5\u4f5c\u4efb\u52a1\uff0c\u5236\u5b9a\u4f18\u5148\u7ea7", | |
| "\u907f\u514d\u591a\u4efb\u52a1\u5904\u7406\uff0c\u4e13\u6ce8\u5b8c\u6210\u4e00\u9879\u4efb\u52a1", | |
| "\u4f7f\u7528\u5de5\u5177\u548c\u8f6f\u4ef6\u63d0\u9ad8\u5de5\u4f5c\u81ea\u52a8\u5316\u7a0b\u5ea6", | |
| "\u5b9a\u671f\u4f11\u606f\uff0c\u907f\u514d\u957f\u65f6\u95f4\u8fde\u7eed\u5de5\u4f5c\u5bfc\u81f4\u75b2\u52b3", | |
| "\u4e0e\u540c\u4e8b\u6709\u6548\u6c9f\u901a\uff0c\u51cf\u5c11\u4e0d\u5fc5\u8981\u7684\u4f1a\u8bae\u548c\u5e72\u6270" | |
| ], | |
| "reward": [ | |
| -2, | |
| -4, | |
| -5, | |
| -1, | |
| 1 | |
| ] | |
| }, | |
| { | |
| "prompt": "229229229229229229229229229229229229229229229229229229229229229229229229229229229229229229229229229229229229229229229229229229229229229229229229229229229229229229229229229229229229229229229229229229229229229229229229229229229229229229229229229229229229229229229229229229229229229229229229229229229229229229229229229229229229229229229229229229229229229229229229229229229229229229229229229229229229229229229229229229229229229229229229229229229229229229229229229229229229229229229229229229229229229229229229229229229229229229229229229229229229229229229229229229229229229229229229229229229229229229229229229229229229229229229229229229229229229229229229229229229229229229229229229229229229229", | |
| "completion": [ | |
| "\u5c0a\u91cd\u4ed6\u4eba\uff0c\u503e\u542c\u4ed6\u4eba\u7684\u610f\u89c1\u548c\u60f3\u6cd5", | |
| "\u79ef\u6781\u6c9f\u901a\uff0c\u8868\u8fbe\u81ea\u5df1\u7684\u611f\u53d7\u548c\u9700\u6c42", | |
| "\u4e50\u4e8e\u52a9\u4eba\uff0c\u5173\u5fc3\u4ed6\u4eba\u7684\u56f0\u96be\u548c\u95ee\u9898", | |
| "\u4fdd\u6301\u8bda\u4fe1\uff0c\u9075\u5b88\u627f\u8bfa\u548c\u7ea6\u5b9a", | |
| "\u53c2\u4e0e\u793e\u4ea4\u6d3b\u52a8\uff0c\u6269\u5927\u81ea\u5df1\u7684\u793e\u4ea4\u5708\u5b50" | |
| ], | |
| "reward": [ | |
| 0, | |
| -2, | |
| 1, | |
| 2, | |
| -1 | |
| ] | |
| }, | |
| { | |
| "prompt": "230230230230230230230230230230230230230230230230230230230230230230230230230230230230230230230230230230230230230230230230230230230230230230230230230230230230230230230230230230230230230230230230230230230230230230230230230230230230230230230230230230230230230230230230230230230230230230230230230230230230230230230230230230230230230230230230230230230230230230230230230230230230230230230230230230230230230230230230230230230230230230230230230230230230230230230230230230230230230230230230230230230230230230230230230230230230230230230230230230230230230230230230230230230230230230230230230230230230230230230230230230230230230230230230230230230230230230230230230230230230230230230230230230230230230230", | |
| "completion": [ | |
| "\u8fdb\u884c\u653e\u677e\u8bad\u7ec3\uff0c\u5982\u6df1\u547c\u5438\u3001\u51a5\u60f3\u7b49", | |
| "\u9002\u5f53\u8fdb\u884c\u4f53\u80b2\u953b\u70bc\uff0c\u91ca\u653e\u538b\u529b", | |
| "\u4e0e\u670b\u53cb\u6216\u5bb6\u4eba\u4ea4\u6d41\uff0c\u5bfb\u6c42\u652f\u6301\u548c\u5e2e\u52a9", | |
| "\u5408\u7406\u5b89\u6392\u65f6\u95f4\uff0c\u907f\u514d\u8fc7\u5ea6\u5de5\u4f5c\u548c\u5b66\u4e60", | |
| "\u57f9\u517b\u5174\u8da3\u7231\u597d\uff0c\u8f6c\u79fb\u6ce8\u610f\u529b" | |
| ], | |
| "reward": [ | |
| -3, | |
| -2, | |
| 1, | |
| 0, | |
| -1 | |
| ] | |
| }, | |
| { | |
| "prompt": "231231231231231231231231231231231231231231231231231231231231231231231231231231231231231231231231231231231231231231231231231231231231231231231231231231231231231231231231231231231231231231231231231231231231231231231231231231231231231231231231231231231231231231231231231231231231231231231231231231231231231231231231231231231231231231231231231231231231231231231231231231231231231231231231231231231231231231231231231231231231231231231231231231231231231231231231231231231231231231231231231231231231231231231231231231231231231231231231231231231231231231231231231231231231231231231231231231231231231231231231231231231231231231231231231231231231231231231231231231231231231231231231231231231231231231231", | |
| "completion": [ | |
| "\u5747\u8861\u996e\u98df\uff0c\u591a\u5403\u852c\u83dc\u6c34\u679c\uff0c\u5c11\u5403\u6cb9\u817b\u548c\u9ad8\u7cd6\u98df\u7269", | |
| "\u5b9a\u671f\u8fdb\u884c\u4f53\u80b2\u953b\u70bc\uff0c\u5982\u8dd1\u6b65\u3001\u6e38\u6cf3\u3001\u5065\u8eab\u7b49", | |
| "\u4fdd\u6301\u89c4\u5f8b\u7684\u4f5c\u606f\u65f6\u95f4\uff0c\u65e9\u7761\u65e9\u8d77", | |
| "\u4fdd\u6301\u826f\u597d\u7684\u5fc3\u6001\uff0c\u907f\u514d\u8fc7\u5ea6\u7126\u8651\u548c\u538b\u529b", | |
| "\u5b9a\u671f\u8fdb\u884c\u4f53\u68c0\uff0c\u53ca\u65f6\u53d1\u73b0\u548c\u9884\u9632\u75be\u75c5" | |
| ], | |
| "reward": [ | |
| 1, | |
| -2, | |
| 1, | |
| 4, | |
| 4 | |
| ] | |
| }, | |
| { | |
| "prompt": "232232232232232232232232232232232232232232232232232232232232232232232232232232232232232232232232232232232232232232232232232232232232232232232232232232232232232232232232232232232232232232232232232232232232232232232232232232232232232232232232232232232232232232232232232232232232232232232232232232232232232232232232232232232232232232232232232232232232232232232232232232232232232232232232232232232232232232232232232232232232232232232232232232232232232232232232232232232232232232232232232232232232232232232232232232232232232232232232232232232232232232232232232232232232232232232232232232232232232232232232232232232232232232232232232232232232232232232232232232232232232232232232232232232232232232232232", | |
| "completion": [ | |
| "\u5408\u7406\u5b89\u6392\u5de5\u4f5c\u4efb\u52a1\uff0c\u5236\u5b9a\u4f18\u5148\u7ea7", | |
| "\u907f\u514d\u591a\u4efb\u52a1\u5904\u7406\uff0c\u4e13\u6ce8\u5b8c\u6210\u4e00\u9879\u4efb\u52a1", | |
| "\u4f7f\u7528\u5de5\u5177\u548c\u8f6f\u4ef6\u63d0\u9ad8\u5de5\u4f5c\u81ea\u52a8\u5316\u7a0b\u5ea6", | |
| "\u5b9a\u671f\u4f11\u606f\uff0c\u907f\u514d\u957f\u65f6\u95f4\u8fde\u7eed\u5de5\u4f5c\u5bfc\u81f4\u75b2\u52b3", | |
| "\u4e0e\u540c\u4e8b\u6709\u6548\u6c9f\u901a\uff0c\u51cf\u5c11\u4e0d\u5fc5\u8981\u7684\u4f1a\u8bae\u548c\u5e72\u6270" | |
| ], | |
| "reward": [ | |
| 4, | |
| -4, | |
| -4, | |
| 2, | |
| 3 | |
| ] | |
| }, | |
| { | |
| "prompt": "233233233233233233233233233233233233233233233233233233233233233233233233233233233233233233233233233233233233233233233233233233233233233233233233233233233233233233233233233233233233233233233233233233233233233233233233233233233233233233233233233233233233233233233233233233233233233233233233233233233233233233233233233233233233233233233233233233233233233233233233233233233233233233233233233233233233233233233233233233233233233233233233233233233233233233233233233233233233233233233233233233233233233233233233233233233233233233233233233233233233233233233233233233233233233233233233233233233233233233233233233233233233233233233233233233233233233233233233233233233233233233233233233233233233233233233233233", | |
| "completion": [ | |
| "\u5c0a\u91cd\u4ed6\u4eba\uff0c\u503e\u542c\u4ed6\u4eba\u7684\u610f\u89c1\u548c\u60f3\u6cd5", | |
| "\u79ef\u6781\u6c9f\u901a\uff0c\u8868\u8fbe\u81ea\u5df1\u7684\u611f\u53d7\u548c\u9700\u6c42", | |
| "\u4e50\u4e8e\u52a9\u4eba\uff0c\u5173\u5fc3\u4ed6\u4eba\u7684\u56f0\u96be\u548c\u95ee\u9898", | |
| "\u4fdd\u6301\u8bda\u4fe1\uff0c\u9075\u5b88\u627f\u8bfa\u548c\u7ea6\u5b9a", | |
| "\u53c2\u4e0e\u793e\u4ea4\u6d3b\u52a8\uff0c\u6269\u5927\u81ea\u5df1\u7684\u793e\u4ea4\u5708\u5b50" | |
| ], | |
| "reward": [ | |
| 3, | |
| 1, | |
| -5, | |
| -2, | |
| 1 | |
| ] | |
| }, | |
| { | |
| "prompt": "234234234234234234234234234234234234234234234234234234234234234234234234234234234234234234234234234234234234234234234234234234234234234234234234234234234234234234234234234234234234234234234234234234234234234234234234234234234234234234234234234234234234234234234234234234234234234234234234234234234234234234234234234234234234234234234234234234234234234234234234234234234234234234234234234234234234234234234234234234234234234234234234234234234234234234234234234234234234234234234234234234234234234234234234234234234234234234234234234234234234234234234234234234234234234234234234234234234234234234234234234234234234234234234234234234234234234234234234234234234234234234234234234234234234234234234234234234", | |
| "completion": [ | |
| "\u8fdb\u884c\u653e\u677e\u8bad\u7ec3\uff0c\u5982\u6df1\u547c\u5438\u3001\u51a5\u60f3\u7b49", | |
| "\u9002\u5f53\u8fdb\u884c\u4f53\u80b2\u953b\u70bc\uff0c\u91ca\u653e\u538b\u529b", | |
| "\u4e0e\u670b\u53cb\u6216\u5bb6\u4eba\u4ea4\u6d41\uff0c\u5bfb\u6c42\u652f\u6301\u548c\u5e2e\u52a9", | |
| "\u5408\u7406\u5b89\u6392\u65f6\u95f4\uff0c\u907f\u514d\u8fc7\u5ea6\u5de5\u4f5c\u548c\u5b66\u4e60", | |
| "\u57f9\u517b\u5174\u8da3\u7231\u597d\uff0c\u8f6c\u79fb\u6ce8\u610f\u529b" | |
| ], | |
| "reward": [ | |
| 3, | |
| 3, | |
| -4, | |
| -3, | |
| -4 | |
| ] | |
| }, | |
| { | |
| "prompt": "235235235235235235235235235235235235235235235235235235235235235235235235235235235235235235235235235235235235235235235235235235235235235235235235235235235235235235235235235235235235235235235235235235235235235235235235235235235235235235235235235235235235235235235235235235235235235235235235235235235235235235235235235235235235235235235235235235235235235235235235235235235235235235235235235235235235235235235235235235235235235235235235235235235235235235235235235235235235235235235235235235235235235235235235235235235235235235235235235235235235235235235235235235235235235235235235235235235235235235235235235235235235235235235235235235235235235235235235235235235235235235235235235235235235235235235235235235235", | |
| "completion": [ | |
| "\u5747\u8861\u996e\u98df\uff0c\u591a\u5403\u852c\u83dc\u6c34\u679c\uff0c\u5c11\u5403\u6cb9\u817b\u548c\u9ad8\u7cd6\u98df\u7269", | |
| "\u5b9a\u671f\u8fdb\u884c\u4f53\u80b2\u953b\u70bc\uff0c\u5982\u8dd1\u6b65\u3001\u6e38\u6cf3\u3001\u5065\u8eab\u7b49", | |
| "\u4fdd\u6301\u89c4\u5f8b\u7684\u4f5c\u606f\u65f6\u95f4\uff0c\u65e9\u7761\u65e9\u8d77", | |
| "\u4fdd\u6301\u826f\u597d\u7684\u5fc3\u6001\uff0c\u907f\u514d\u8fc7\u5ea6\u7126\u8651\u548c\u538b\u529b", | |
| "\u5b9a\u671f\u8fdb\u884c\u4f53\u68c0\uff0c\u53ca\u65f6\u53d1\u73b0\u548c\u9884\u9632\u75be\u75c5" | |
| ], | |
| "reward": [ | |
| -3, | |
| 2, | |
| -3, | |
| 4, | |
| -2 | |
| ] | |
| }, | |
| { | |
| "prompt": "236236236236236236236236236236236236236236236236236236236236236236236236236236236236236236236236236236236236236236236236236236236236236236236236236236236236236236236236236236236236236236236236236236236236236236236236236236236236236236236236236236236236236236236236236236236236236236236236236236236236236236236236236236236236236236236236236236236236236236236236236236236236236236236236236236236236236236236236236236236236236236236236236236236236236236236236236236236236236236236236236236236236236236236236236236236236236236236236236236236236236236236236236236236236236236236236236236236236236236236236236236236236236236236236236236236236236236236236236236236236236236236236236236236236236236236236236236236236", | |
| "completion": [ | |
| "\u5408\u7406\u5b89\u6392\u5de5\u4f5c\u4efb\u52a1\uff0c\u5236\u5b9a\u4f18\u5148\u7ea7", | |
| "\u907f\u514d\u591a\u4efb\u52a1\u5904\u7406\uff0c\u4e13\u6ce8\u5b8c\u6210\u4e00\u9879\u4efb\u52a1", | |
| "\u4f7f\u7528\u5de5\u5177\u548c\u8f6f\u4ef6\u63d0\u9ad8\u5de5\u4f5c\u81ea\u52a8\u5316\u7a0b\u5ea6", | |
| "\u5b9a\u671f\u4f11\u606f\uff0c\u907f\u514d\u957f\u65f6\u95f4\u8fde\u7eed\u5de5\u4f5c\u5bfc\u81f4\u75b2\u52b3", | |
| "\u4e0e\u540c\u4e8b\u6709\u6548\u6c9f\u901a\uff0c\u51cf\u5c11\u4e0d\u5fc5\u8981\u7684\u4f1a\u8bae\u548c\u5e72\u6270" | |
| ], | |
| "reward": [ | |
| 3, | |
| -1, | |
| -4, | |
| 5, | |
| 2 | |
| ] | |
| }, | |
| { | |
| "prompt": "237237237237237237237237237237237237237237237237237237237237237237237237237237237237237237237237237237237237237237237237237237237237237237237237237237237237237237237237237237237237237237237237237237237237237237237237237237237237237237237237237237237237237237237237237237237237237237237237237237237237237237237237237237237237237237237237237237237237237237237237237237237237237237237237237237237237237237237237237237237237237237237237237237237237237237237237237237237237237237237237237237237237237237237237237237237237237237237237237237237237237237237237237237237237237237237237237237237237237237237237237237237237237237237237237237237237237237237237237237237237237237237237237237237237237237237237237237237237237", | |
| "completion": [ | |
| "\u5c0a\u91cd\u4ed6\u4eba\uff0c\u503e\u542c\u4ed6\u4eba\u7684\u610f\u89c1\u548c\u60f3\u6cd5", | |
| "\u79ef\u6781\u6c9f\u901a\uff0c\u8868\u8fbe\u81ea\u5df1\u7684\u611f\u53d7\u548c\u9700\u6c42", | |
| "\u4e50\u4e8e\u52a9\u4eba\uff0c\u5173\u5fc3\u4ed6\u4eba\u7684\u56f0\u96be\u548c\u95ee\u9898", | |
| "\u4fdd\u6301\u8bda\u4fe1\uff0c\u9075\u5b88\u627f\u8bfa\u548c\u7ea6\u5b9a", | |
| "\u53c2\u4e0e\u793e\u4ea4\u6d3b\u52a8\uff0c\u6269\u5927\u81ea\u5df1\u7684\u793e\u4ea4\u5708\u5b50" | |
| ], | |
| "reward": [ | |
| -3, | |
| -2, | |
| 1, | |
| -1, | |
| 1 | |
| ] | |
| }, | |
| { | |
| "prompt": "238238238238238238238238238238238238238238238238238238238238238238238238238238238238238238238238238238238238238238238238238238238238238238238238238238238238238238238238238238238238238238238238238238238238238238238238238238238238238238238238238238238238238238238238238238238238238238238238238238238238238238238238238238238238238238238238238238238238238238238238238238238238238238238238238238238238238238238238238238238238238238238238238238238238238238238238238238238238238238238238238238238238238238238238238238238238238238238238238238238238238238238238238238238238238238238238238238238238238238238238238238238238238238238238238238238238238238238238238238238238238238238238238238238238238238238238238238238238238238", | |
| "completion": [ | |
| "\u8fdb\u884c\u653e\u677e\u8bad\u7ec3\uff0c\u5982\u6df1\u547c\u5438\u3001\u51a5\u60f3\u7b49", | |
| "\u9002\u5f53\u8fdb\u884c\u4f53\u80b2\u953b\u70bc\uff0c\u91ca\u653e\u538b\u529b", | |
| "\u4e0e\u670b\u53cb\u6216\u5bb6\u4eba\u4ea4\u6d41\uff0c\u5bfb\u6c42\u652f\u6301\u548c\u5e2e\u52a9", | |
| "\u5408\u7406\u5b89\u6392\u65f6\u95f4\uff0c\u907f\u514d\u8fc7\u5ea6\u5de5\u4f5c\u548c\u5b66\u4e60", | |
| "\u57f9\u517b\u5174\u8da3\u7231\u597d\uff0c\u8f6c\u79fb\u6ce8\u610f\u529b" | |
| ], | |
| "reward": [ | |
| -1, | |
| 5, | |
| 5, | |
| -4, | |
| 3 | |
| ] | |
| }, | |
| { | |
| "prompt": "239239239239239239239239239239239239239239239239239239239239239239239239239239239239239239239239239239239239239239239239239239239239239239239239239239239239239239239239239239239239239239239239239239239239239239239239239239239239239239239239239239239239239239239239239239239239239239239239239239239239239239239239239239239239239239239239239239239239239239239239239239239239239239239239239239239239239239239239239239239239239239239239239239239239239239239239239239239239239239239239239239239239239239239239239239239239239239239239239239239239239239239239239239239239239239239239239239239239239239239239239239239239239239239239239239239239239239239239239239239239239239239239239239239239239239239239239239239239239239239", | |
| "completion": [ | |
| "\u5747\u8861\u996e\u98df\uff0c\u591a\u5403\u852c\u83dc\u6c34\u679c\uff0c\u5c11\u5403\u6cb9\u817b\u548c\u9ad8\u7cd6\u98df\u7269", | |
| "\u5b9a\u671f\u8fdb\u884c\u4f53\u80b2\u953b\u70bc\uff0c\u5982\u8dd1\u6b65\u3001\u6e38\u6cf3\u3001\u5065\u8eab\u7b49", | |
| "\u4fdd\u6301\u89c4\u5f8b\u7684\u4f5c\u606f\u65f6\u95f4\uff0c\u65e9\u7761\u65e9\u8d77", | |
| "\u4fdd\u6301\u826f\u597d\u7684\u5fc3\u6001\uff0c\u907f\u514d\u8fc7\u5ea6\u7126\u8651\u548c\u538b\u529b", | |
| "\u5b9a\u671f\u8fdb\u884c\u4f53\u68c0\uff0c\u53ca\u65f6\u53d1\u73b0\u548c\u9884\u9632\u75be\u75c5" | |
| ], | |
| "reward": [ | |
| -2, | |
| 1, | |
| -5, | |
| -4, | |
| 0 | |
| ] | |
| }, | |
| { | |
| "prompt": "240240240240240240240240240240240240240240240240240240240240240240240240240240240240240240240240240240240240240240240240240240240240240240240240240240240240240240240240240240240240240240240240240240240240240240240240240240240240240240240240240240240240240240240240240240240240240240240240240240240240240240240240240240240240240240240240240240240240240240240240240240240240240240240240240240240240240240240240240240240240240240240240240240240240240240240240240240240240240240240240240240240240240240240240240240240240240240240240240240240240240240240240240240240240240240240240240240240240240240240240240240240240240240240240240240240240240240240240240240240240240240240240240240240240240240240240240240240240240240240240", | |
| "completion": [ | |
| "\u5408\u7406\u5b89\u6392\u5de5\u4f5c\u4efb\u52a1\uff0c\u5236\u5b9a\u4f18\u5148\u7ea7", | |
| "\u907f\u514d\u591a\u4efb\u52a1\u5904\u7406\uff0c\u4e13\u6ce8\u5b8c\u6210\u4e00\u9879\u4efb\u52a1", | |
| "\u4f7f\u7528\u5de5\u5177\u548c\u8f6f\u4ef6\u63d0\u9ad8\u5de5\u4f5c\u81ea\u52a8\u5316\u7a0b\u5ea6", | |
| "\u5b9a\u671f\u4f11\u606f\uff0c\u907f\u514d\u957f\u65f6\u95f4\u8fde\u7eed\u5de5\u4f5c\u5bfc\u81f4\u75b2\u52b3", | |
| "\u4e0e\u540c\u4e8b\u6709\u6548\u6c9f\u901a\uff0c\u51cf\u5c11\u4e0d\u5fc5\u8981\u7684\u4f1a\u8bae\u548c\u5e72\u6270" | |
| ], | |
| "reward": [ | |
| -1, | |
| 0, | |
| -2, | |
| 2, | |
| 3 | |
| ] | |
| }, | |
| { | |
| "prompt": "241241241241241241241241241241241241241241241241241241241241241241241241241241241241241241241241241241241241241241241241241241241241241241241241241241241241241241241241241241241241241241241241241241241241241241241241241241241241241241241241241241241241241241241241241241241241241241241241241241241241241241241241241241241241241241241241241241241241241241241241241241241241241241241241241241241241241241241241241241241241241241241241241241241241241241241241241241241241241241241241241241241241241241241241241241241241241241241241241241241241241241241241241241241241241241241241241241241241241241241241241241241241241241241241241241241241241241241241241241241241241241241241241241241241241241241241241241241241241241241241241", | |
| "completion": [ | |
| "\u5c0a\u91cd\u4ed6\u4eba\uff0c\u503e\u542c\u4ed6\u4eba\u7684\u610f\u89c1\u548c\u60f3\u6cd5", | |
| "\u79ef\u6781\u6c9f\u901a\uff0c\u8868\u8fbe\u81ea\u5df1\u7684\u611f\u53d7\u548c\u9700\u6c42", | |
| "\u4e50\u4e8e\u52a9\u4eba\uff0c\u5173\u5fc3\u4ed6\u4eba\u7684\u56f0\u96be\u548c\u95ee\u9898", | |
| "\u4fdd\u6301\u8bda\u4fe1\uff0c\u9075\u5b88\u627f\u8bfa\u548c\u7ea6\u5b9a", | |
| "\u53c2\u4e0e\u793e\u4ea4\u6d3b\u52a8\uff0c\u6269\u5927\u81ea\u5df1\u7684\u793e\u4ea4\u5708\u5b50" | |
| ], | |
| "reward": [ | |
| -5, | |
| -1, | |
| 0, | |
| 3, | |
| -3 | |
| ] | |
| }, | |
| { | |
| "prompt": "242242242242242242242242242242242242242242242242242242242242242242242242242242242242242242242242242242242242242242242242242242242242242242242242242242242242242242242242242242242242242242242242242242242242242242242242242242242242242242242242242242242242242242242242242242242242242242242242242242242242242242242242242242242242242242242242242242242242242242242242242242242242242242242242242242242242242242242242242242242242242242242242242242242242242242242242242242242242242242242242242242242242242242242242242242242242242242242242242242242242242242242242242242242242242242242242242242242242242242242242242242242242242242242242242242242242242242242242242242242242242242242242242242242242242242242242242242242242242242242242242242", | |
| "completion": [ | |
| "\u8fdb\u884c\u653e\u677e\u8bad\u7ec3\uff0c\u5982\u6df1\u547c\u5438\u3001\u51a5\u60f3\u7b49", | |
| "\u9002\u5f53\u8fdb\u884c\u4f53\u80b2\u953b\u70bc\uff0c\u91ca\u653e\u538b\u529b", | |
| "\u4e0e\u670b\u53cb\u6216\u5bb6\u4eba\u4ea4\u6d41\uff0c\u5bfb\u6c42\u652f\u6301\u548c\u5e2e\u52a9", | |
| "\u5408\u7406\u5b89\u6392\u65f6\u95f4\uff0c\u907f\u514d\u8fc7\u5ea6\u5de5\u4f5c\u548c\u5b66\u4e60", | |
| "\u57f9\u517b\u5174\u8da3\u7231\u597d\uff0c\u8f6c\u79fb\u6ce8\u610f\u529b" | |
| ], | |
| "reward": [ | |
| 0, | |
| -1, | |
| 1, | |
| 3, | |
| -2 | |
| ] | |
| }, | |
| { | |
| "prompt": "243243243243243243243243243243243243243243243243243243243243243243243243243243243243243243243243243243243243243243243243243243243243243243243243243243243243243243243243243243243243243243243243243243243243243243243243243243243243243243243243243243243243243243243243243243243243243243243243243243243243243243243243243243243243243243243243243243243243243243243243243243243243243243243243243243243243243243243243243243243243243243243243243243243243243243243243243243243243243243243243243243243243243243243243243243243243243243243243243243243243243243243243243243243243243243243243243243243243243243243243243243243243243243243243243243243243243243243243243243243243243243243243243243243243243243243243243243243243243243243243243243243", | |
| "completion": [ | |
| "\u5747\u8861\u996e\u98df\uff0c\u591a\u5403\u852c\u83dc\u6c34\u679c\uff0c\u5c11\u5403\u6cb9\u817b\u548c\u9ad8\u7cd6\u98df\u7269", | |
| "\u5b9a\u671f\u8fdb\u884c\u4f53\u80b2\u953b\u70bc\uff0c\u5982\u8dd1\u6b65\u3001\u6e38\u6cf3\u3001\u5065\u8eab\u7b49", | |
| "\u4fdd\u6301\u89c4\u5f8b\u7684\u4f5c\u606f\u65f6\u95f4\uff0c\u65e9\u7761\u65e9\u8d77", | |
| "\u4fdd\u6301\u826f\u597d\u7684\u5fc3\u6001\uff0c\u907f\u514d\u8fc7\u5ea6\u7126\u8651\u548c\u538b\u529b", | |
| "\u5b9a\u671f\u8fdb\u884c\u4f53\u68c0\uff0c\u53ca\u65f6\u53d1\u73b0\u548c\u9884\u9632\u75be\u75c5" | |
| ], | |
| "reward": [ | |
| 3, | |
| 4, | |
| -3, | |
| -1, | |
| 4 | |
| ] | |
| }, | |
| { | |
| "prompt": "244244244244244244244244244244244244244244244244244244244244244244244244244244244244244244244244244244244244244244244244244244244244244244244244244244244244244244244244244244244244244244244244244244244244244244244244244244244244244244244244244244244244244244244244244244244244244244244244244244244244244244244244244244244244244244244244244244244244244244244244244244244244244244244244244244244244244244244244244244244244244244244244244244244244244244244244244244244244244244244244244244244244244244244244244244244244244244244244244244244244244244244244244244244244244244244244244244244244244244244244244244244244244244244244244244244244244244244244244244244244244244244244244244244244244244244244244244244244244244244244244244244244", | |
| "completion": [ | |
| "\u5408\u7406\u5b89\u6392\u5de5\u4f5c\u4efb\u52a1\uff0c\u5236\u5b9a\u4f18\u5148\u7ea7", | |
| "\u907f\u514d\u591a\u4efb\u52a1\u5904\u7406\uff0c\u4e13\u6ce8\u5b8c\u6210\u4e00\u9879\u4efb\u52a1", | |
| "\u4f7f\u7528\u5de5\u5177\u548c\u8f6f\u4ef6\u63d0\u9ad8\u5de5\u4f5c\u81ea\u52a8\u5316\u7a0b\u5ea6", | |
| "\u5b9a\u671f\u4f11\u606f\uff0c\u907f\u514d\u957f\u65f6\u95f4\u8fde\u7eed\u5de5\u4f5c\u5bfc\u81f4\u75b2\u52b3", | |
| "\u4e0e\u540c\u4e8b\u6709\u6548\u6c9f\u901a\uff0c\u51cf\u5c11\u4e0d\u5fc5\u8981\u7684\u4f1a\u8bae\u548c\u5e72\u6270" | |
| ], | |
| "reward": [ | |
| -2, | |
| 2, | |
| 3, | |
| -3, | |
| 4 | |
| ] | |
| }, | |
| { | |
| "prompt": "245245245245245245245245245245245245245245245245245245245245245245245245245245245245245245245245245245245245245245245245245245245245245245245245245245245245245245245245245245245245245245245245245245245245245245245245245245245245245245245245245245245245245245245245245245245245245245245245245245245245245245245245245245245245245245245245245245245245245245245245245245245245245245245245245245245245245245245245245245245245245245245245245245245245245245245245245245245245245245245245245245245245245245245245245245245245245245245245245245245245245245245245245245245245245245245245245245245245245245245245245245245245245245245245245245245245245245245245245245245245245245245245245245245245245245245245245245245245245245245245245245245245245", | |
| "completion": [ | |
| "\u5c0a\u91cd\u4ed6\u4eba\uff0c\u503e\u542c\u4ed6\u4eba\u7684\u610f\u89c1\u548c\u60f3\u6cd5", | |
| "\u79ef\u6781\u6c9f\u901a\uff0c\u8868\u8fbe\u81ea\u5df1\u7684\u611f\u53d7\u548c\u9700\u6c42", | |
| "\u4e50\u4e8e\u52a9\u4eba\uff0c\u5173\u5fc3\u4ed6\u4eba\u7684\u56f0\u96be\u548c\u95ee\u9898", | |
| "\u4fdd\u6301\u8bda\u4fe1\uff0c\u9075\u5b88\u627f\u8bfa\u548c\u7ea6\u5b9a", | |
| "\u53c2\u4e0e\u793e\u4ea4\u6d3b\u52a8\uff0c\u6269\u5927\u81ea\u5df1\u7684\u793e\u4ea4\u5708\u5b50" | |
| ], | |
| "reward": [ | |
| -4, | |
| 0, | |
| 1, | |
| -1, | |
| 3 | |
| ] | |
| }, | |
| { | |
| "prompt": "246246246246246246246246246246246246246246246246246246246246246246246246246246246246246246246246246246246246246246246246246246246246246246246246246246246246246246246246246246246246246246246246246246246246246246246246246246246246246246246246246246246246246246246246246246246246246246246246246246246246246246246246246246246246246246246246246246246246246246246246246246246246246246246246246246246246246246246246246246246246246246246246246246246246246246246246246246246246246246246246246246246246246246246246246246246246246246246246246246246246246246246246246246246246246246246246246246246246246246246246246246246246246246246246246246246246246246246246246246246246246246246246246246246246246246246246246246246246246246246246246246246246246246", | |
| "completion": [ | |
| "\u8fdb\u884c\u653e\u677e\u8bad\u7ec3\uff0c\u5982\u6df1\u547c\u5438\u3001\u51a5\u60f3\u7b49", | |
| "\u9002\u5f53\u8fdb\u884c\u4f53\u80b2\u953b\u70bc\uff0c\u91ca\u653e\u538b\u529b", | |
| "\u4e0e\u670b\u53cb\u6216\u5bb6\u4eba\u4ea4\u6d41\uff0c\u5bfb\u6c42\u652f\u6301\u548c\u5e2e\u52a9", | |
| "\u5408\u7406\u5b89\u6392\u65f6\u95f4\uff0c\u907f\u514d\u8fc7\u5ea6\u5de5\u4f5c\u548c\u5b66\u4e60", | |
| "\u57f9\u517b\u5174\u8da3\u7231\u597d\uff0c\u8f6c\u79fb\u6ce8\u610f\u529b" | |
| ], | |
| "reward": [ | |
| -5, | |
| -5, | |
| -1, | |
| -3, | |
| -4 | |
| ] | |
| } | |
| ] |