|
208 | 208 | "truncated_exp1_targets": ( |
209 | 209 | "<|endoftext|><|endoftext|><|endoftext|><|endoftext|><|endoftext|><|endoftext|><|endoftext|><|endoftext|>" |
210 | 210 | "<|endoftext|><|endoftext|><|endoftext|><|endoftext|><|endoftext|><|endoftext|><|endoftext|><|endoftext|>" |
211 | | - "<|im_start|>assistant\n<think>\n\n</think>\n\nexample one answer one<|im_end|>\n" |
| 211 | + + "<|endoftext|>" * 3 |
| 212 | + + "<think>\n\n</think>\n\nexample one answer one<|im_end|>\n" |
212 | 213 | + "<|endoftext|>" * 9 |
213 | | - + "<|im_start|>assistant\n<think>\n\n</think>\n\nexample one answer two<|endoftext|>" |
| 214 | + + "<|endoftext|>" * 3 |
| 215 | + + "<think>\n\n</think>\n\nexample one answer two<|endoftext|>" |
214 | 216 | ), |
215 | 217 | "truncated_exp1_targets_predictable": ( |
216 | 218 | "<|endoftext|><|endoftext|><|endoftext|><|endoftext|><|endoftext|><|endoftext|><|endoftext|><|endoftext|>" |
217 | 219 | "<|endoftext|><|endoftext|><|endoftext|><|endoftext|><|endoftext|><|endoftext|><|endoftext|><|endoftext|>" |
218 | | - "<|im_start|>assistant\n<think>\n\n</think>\n\nexample one answer one<|im_end|>\n" |
| 220 | + + "<|endoftext|>" * 3 |
| 221 | + + "<think>\n\n</think>\n\nexample one answer one<|im_end|>\n" |
219 | 222 | + "<|endoftext|>" * 9 |
220 | | - + "<|im_start|>assistant\n<think>\n\n</think>\n\nexample one answer two<|endoftext|>" |
| 223 | + + "<|endoftext|>" * 3 |
| 224 | + + "<think>\n\n</think>\n\nexample one answer two<|endoftext|>" |
221 | 225 | ), |
222 | 226 | "packed_exp2_inputs": ( |
223 | 227 | "<|im_start|>user\nquestion two<|im_end|>\n" |
|
227 | 231 | ), |
228 | 232 | "packed_exp2_targets": ( |
229 | 233 | "<|endoftext|><|endoftext|><|endoftext|><|endoftext|><|endoftext|><|endoftext|>" |
230 | | - "<|im_start|>assistant\n<think>\n\n</think>\n\nanswer two<|im_end|>\n" |
| 234 | + + "<|endoftext|>" * 3 |
| 235 | + + "<think>\n\n</think>\n\nanswer two<|im_end|>\n" |
231 | 236 | "<|endoftext|><|endoftext|><|endoftext|><|endoftext|><|endoftext|><|endoftext|><|endoftext|>" |
232 | | - "<|im_start|>assistant\n<think>\n\n</think>\n\nanswer three<|im_end|>\n" + "!" * 14 + "<|endoftext|>" |
| 237 | + + "<|endoftext|>" * 3 |
| 238 | + + "<think>\n\n</think>\n\nanswer three<|im_end|>\n" |
| 239 | + + "!" * 14 |
| 240 | + + "<|endoftext|>" |
233 | 241 | ), |
234 | 242 | "packed_exp2_targets_predictable": ( |
235 | 243 | "<|endoftext|><|endoftext|><|endoftext|><|endoftext|><|endoftext|><|endoftext|>" |
236 | | - "<|im_start|>assistant\n<think>\n\n</think>\n\nanswer two<|im_end|>\n" |
| 244 | + + "<|endoftext|>" * 3 |
| 245 | + + "<think>\n\n</think>\n\nanswer two<|im_end|>\n" |
237 | 246 | "<|endoftext|><|endoftext|><|endoftext|><|endoftext|><|endoftext|><|endoftext|><|endoftext|>" |
238 | | - "<|im_start|>assistant\n<think>\n\n</think>\n\nanswer three<|im_end|>\n" + "<|endoftext|>" * 15 |
| 247 | + + "<|endoftext|>" * 3 |
| 248 | + + "<think>\n\n</think>\n\nanswer three<|im_end|>\n" |
| 249 | + + "<|endoftext|>" * 15 |
239 | 250 | ), |
240 | 251 | }, |
241 | 252 | "prompt_completion": { |
|
248 | 259 | ), |
249 | 260 | "truncated_exp1_targets": ( |
250 | 261 | "<|endoftext|>" * 8 |
251 | | - + "<|im_start|>assistant\n<think>\n\n</think>\n\nexample one answer one<|im_end|>\n" |
| 262 | + + "<|endoftext|>" * 3 |
| 263 | + + "<think>\n\n</think>\n\nexample one answer one<|im_end|>\n" |
252 | 264 | + "<|endoftext|>" * 9 |
253 | | - + "<|im_start|>assistant\n<think>\n\n</think>\n\nexample one answer two<|im_end|>\n" |
| 265 | + + "<|endoftext|>" * 3 |
| 266 | + + "<think>\n\n</think>\n\nexample one answer two<|im_end|>\n" |
254 | 267 | + "<|endoftext|>" * 7 |
255 | 268 | ), |
256 | 269 | "truncated_exp1_targets_predictable": ( |
257 | 270 | "<|endoftext|>" * 8 |
258 | | - + "<|im_start|>assistant\n<think>\n\n</think>\n\nexample one answer one<|im_end|>\n" |
| 271 | + + "<|endoftext|>" * 3 |
| 272 | + + "<think>\n\n</think>\n\nexample one answer one<|im_end|>\n" |
259 | 273 | + "<|endoftext|>" * 9 |
260 | | - + "<|im_start|>assistant\n<think>\n\n</think>\n\nexample one answer two<|im_end|>\n" |
| 274 | + + "<|endoftext|>" * 3 |
| 275 | + + "<think>\n\n</think>\n\nexample one answer two<|im_end|>\n" |
261 | 276 | + "<|endoftext|>" * 7 |
262 | 277 | ), |
263 | 278 | "packed_exp2_inputs": ( |
|
268 | 283 | ), |
269 | 284 | "packed_exp2_targets": ( |
270 | 285 | "<|endoftext|><|endoftext|><|endoftext|><|endoftext|><|endoftext|><|endoftext|>" |
271 | | - "<|im_start|>assistant\n<think>\n\n</think>\n\nanswer two<|im_end|>\n" |
| 286 | + + "<|endoftext|>" * 3 |
| 287 | + + "<think>\n\n</think>\n\nanswer two<|im_end|>\n" |
272 | 288 | "<|endoftext|><|endoftext|><|endoftext|><|endoftext|><|endoftext|><|endoftext|><|endoftext|>" |
273 | | - "<|im_start|>assistant\n<think>\n\n</think>\n\nanswer three<|im_end|>\n" + "!" * 14 + "<|endoftext|>" |
| 289 | + + "<|endoftext|>" * 3 |
| 290 | + + "<think>\n\n</think>\n\nanswer three<|im_end|>\n" |
| 291 | + + "!" * 14 |
| 292 | + + "<|endoftext|>" |
274 | 293 | ), |
275 | 294 | "packed_exp2_targets_predictable": ( |
276 | 295 | "<|endoftext|><|endoftext|><|endoftext|><|endoftext|><|endoftext|><|endoftext|>" |
277 | | - "<|im_start|>assistant\n<think>\n\n</think>\n\nanswer two<|im_end|>\n" |
| 296 | + + "<|endoftext|>" * 3 |
| 297 | + + "<think>\n\n</think>\n\nanswer two<|im_end|>\n" |
278 | 298 | "<|endoftext|><|endoftext|><|endoftext|><|endoftext|><|endoftext|><|endoftext|><|endoftext|>" |
279 | | - "<|im_start|>assistant\n<think>\n\n</think>\n\nanswer three<|im_end|>\n" + "<|endoftext|>" * 15 |
| 299 | + + "<|endoftext|>" * 3 |
| 300 | + + "<think>\n\n</think>\n\nanswer three<|im_end|>\n" |
| 301 | + + "<|endoftext|>" * 15 |
280 | 302 | ), |
281 | 303 | }, |
282 | 304 | } |
|
0 commit comments