waterfall 0.2.0__tar.gz → 0.2.1__tar.gz

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
@@ -0,0 +1,5 @@
1
+ {
2
+ "python-envs.defaultEnvManager": "ms-python.python:conda",
3
+ "python-envs.defaultPackageManager": "ms-python.python:conda",
4
+ "python-envs.pythonProjects": []
5
+ }
@@ -1,6 +1,6 @@
1
1
  Metadata-Version: 2.4
2
2
  Name: waterfall
3
- Version: 0.2.0
3
+ Version: 0.2.1
4
4
  Summary: Scalable Framework for Robust Text Watermarking and Provenance for LLMs
5
5
  Project-URL: Homepage, https://github.com/aoi3142/Waterfall
6
6
  Project-URL: Issues, https://github.com/aoi3142/Waterfall/issues
@@ -4,7 +4,7 @@ build-backend = "hatchling.build"
4
4
 
5
5
  [project]
6
6
  name = "waterfall"
7
- version = "0.2.0"
7
+ version = "0.2.1"
8
8
  authors = [
9
9
  { name = "Xinyuan Niu", email="aperture@outlook.sg" }
10
10
  ]
@@ -0,0 +1,697 @@
1
+ {
2
+ "cells": [
3
+ {
4
+ "cell_type": "code",
5
+ "execution_count": 1,
6
+ "id": "df7c520a",
7
+ "metadata": {},
8
+ "outputs": [],
9
+ "source": [
10
+ "import os\n",
11
+ "# os.environ[\"VLLM_USE_V1\"] = \"0\"\n",
12
+ "os.environ[\"CUDA_VISIBLE_DEVICES\"] = \"4\""
13
+ ]
14
+ },
15
+ {
16
+ "cell_type": "code",
17
+ "execution_count": 2,
18
+ "id": "79d9fbdb",
19
+ "metadata": {},
20
+ "outputs": [],
21
+ "source": [
22
+ "from vllm import LLM, SamplingParams\n",
23
+ "from vllm.inputs import TokensPrompt\n",
24
+ "import torch\n",
25
+ "from transformers import AutoTokenizer, AutoModelForCausalLM\n",
26
+ "from transformers.generation.beam_search import *\n",
27
+ "from transformers.modeling_outputs import CausalLMOutputWithPast\n",
28
+ "from waterfall.WatermarkerBase import Watermarker\n",
29
+ "\n",
30
+ "import types\n",
31
+ "import inspect\n",
32
+ "from copy import deepcopy\n",
33
+ "from timeit import timeit"
34
+ ]
35
+ },
36
+ {
37
+ "cell_type": "code",
38
+ "execution_count": 3,
39
+ "id": "6ff6b383",
40
+ "metadata": {},
41
+ "outputs": [
42
+ {
43
+ "name": "stdout",
44
+ "output_type": "stream",
45
+ "text": [
46
+ "Cache size: 84538\n"
47
+ ]
48
+ }
49
+ ],
50
+ "source": [
51
+ "base_model = 'meta-llama/Meta-Llama-3.1-8B-Instruct'\n",
52
+ "tokenizer = AutoTokenizer.from_pretrained(base_model)\n",
53
+ "tokenizer.pad_token = tokenizer.eos_token\n",
54
+ "tokenizer.padding_side='left'\n",
55
+ "watermarker = Watermarker(tokenizer)\n",
56
+ "logits_processor = watermarker.logits_processor"
57
+ ]
58
+ },
59
+ {
60
+ "cell_type": "code",
61
+ "execution_count": 4,
62
+ "id": "b6e4d263",
63
+ "metadata": {},
64
+ "outputs": [],
65
+ "source": [
66
+ "max_tokens = max_new_tokens = 10"
67
+ ]
68
+ },
69
+ {
70
+ "cell_type": "code",
71
+ "execution_count": 5,
72
+ "id": "03c09dff",
73
+ "metadata": {},
74
+ "outputs": [
75
+ {
76
+ "name": "stdout",
77
+ "output_type": "stream",
78
+ "text": [
79
+ "INFO 08-15 11:03:46 __init__.py:207] Automatically detected platform cuda.\n",
80
+ "INFO 08-15 11:04:07 config.py:549] This model supports multiple tasks: {'reward', 'embed', 'classify', 'generate', 'score'}. Defaulting to 'generate'.\n",
81
+ "INFO 08-15 11:04:07 llm_engine.py:234] Initializing a V0 LLM engine (v0.7.3) with config: model='meta-llama/Meta-Llama-3.1-8B-Instruct', speculative_config=None, tokenizer='meta-llama/Meta-Llama-3.1-8B-Instruct', skip_tokenizer_init=False, tokenizer_mode=auto, revision=None, override_neuron_config=None, tokenizer_revision=None, trust_remote_code=False, dtype=torch.bfloat16, max_seq_len=60, download_dir=None, load_format=LoadFormat.AUTO, tensor_parallel_size=1, pipeline_parallel_size=1, disable_custom_all_reduce=False, quantization=None, enforce_eager=False, kv_cache_dtype=auto, device_config=cuda, decoding_config=DecodingConfig(guided_decoding_backend='xgrammar'), observability_config=ObservabilityConfig(otlp_traces_endpoint=None, collect_model_forward_time=False, collect_model_execute_time=False), seed=0, served_model_name=meta-llama/Meta-Llama-3.1-8B-Instruct, num_scheduler_steps=1, multi_step_stream_outputs=True, enable_prefix_caching=False, chunked_prefill_enabled=False, use_async_output_proc=True, disable_mm_preprocessor_cache=False, mm_processor_kwargs=None, pooler_config=None, compilation_config={\"splitting_ops\":[],\"compile_sizes\":[],\"cudagraph_capture_sizes\":[256,248,240,232,224,216,208,200,192,184,176,168,160,152,144,136,128,120,112,104,96,88,80,72,64,56,48,40,32,24,16,8,4,2,1],\"max_capture_size\":256}, use_cached_outputs=False, \n",
82
+ "INFO 08-15 11:04:12 cuda.py:229] Using Flash Attention backend.\n",
83
+ "INFO 08-15 11:04:20 model_runner.py:1110] Starting to load model meta-llama/Meta-Llama-3.1-8B-Instruct...\n",
84
+ "INFO 08-15 11:04:23 weight_utils.py:254] Using model weights format ['*.safetensors']\n"
85
+ ]
86
+ },
87
+ {
88
+ "data": {
89
+ "application/vnd.jupyter.widget-view+json": {
90
+ "model_id": "7f3d860bd5c24cbe8695345e9f2d9625",
91
+ "version_major": 2,
92
+ "version_minor": 0
93
+ },
94
+ "text/plain": [
95
+ "Loading safetensors checkpoint shards: 0% Completed | 0/4 [00:00<?, ?it/s]\n"
96
+ ]
97
+ },
98
+ "metadata": {},
99
+ "output_type": "display_data"
100
+ },
101
+ {
102
+ "name": "stdout",
103
+ "output_type": "stream",
104
+ "text": [
105
+ "INFO 08-15 11:04:28 model_runner.py:1115] Loading model weights took 14.9888 GB\n",
106
+ "INFO 08-15 11:04:29 worker.py:267] Memory profiling takes 0.44 seconds\n",
107
+ "INFO 08-15 11:04:29 worker.py:267] the current vLLM instance can use total_gpu_memory (79.10GiB) x gpu_memory_utilization (0.60) = 47.46GiB\n",
108
+ "INFO 08-15 11:04:29 worker.py:267] model weights take 14.99GiB; non_torch_memory takes 0.14GiB; PyTorch activation peak memory takes 0.24GiB; the rest of the memory reserved for KV Cache is 32.09GiB.\n",
109
+ "INFO 08-15 11:04:29 executor_base.py:111] # cuda blocks: 16429, # CPU blocks: 2048\n",
110
+ "INFO 08-15 11:04:29 executor_base.py:116] Maximum concurrency for 60 tokens per request: 4381.07x\n",
111
+ "INFO 08-15 11:04:32 model_runner.py:1434] Capturing cudagraphs for decoding. This may lead to unexpected consequences if the model is not static. To run the model in eager mode, set 'enforce_eager=True' or use '--enforce-eager' in the CLI. If out-of-memory error occurs during cudagraph capture, consider decreasing `gpu_memory_utilization` or switching to eager mode. You can also reduce the `max_num_seqs` as needed to decrease memory usage.\n"
112
+ ]
113
+ },
114
+ {
115
+ "name": "stderr",
116
+ "output_type": "stream",
117
+ "text": [
118
+ "Capturing CUDA graph shapes: 100%|██████████| 35/35 [00:23<00:00, 1.52it/s]"
119
+ ]
120
+ },
121
+ {
122
+ "name": "stdout",
123
+ "output_type": "stream",
124
+ "text": [
125
+ "INFO 08-15 11:04:55 model_runner.py:1562] Graph capturing finished in 23 secs, took 0.32 GiB\n",
126
+ "INFO 08-15 11:04:55 llm_engine.py:436] init engine (profile, create kv cache, warmup model) took 26.46 seconds\n"
127
+ ]
128
+ },
129
+ {
130
+ "name": "stderr",
131
+ "output_type": "stream",
132
+ "text": [
133
+ "\n"
134
+ ]
135
+ }
136
+ ],
137
+ "source": [
138
+ "vllm = LLM(base_model,\n",
139
+ " tokenizer=base_model, \n",
140
+ " gpu_memory_utilization=0.6, \n",
141
+ " max_model_len=50 + max_tokens,\n",
142
+ " )"
143
+ ]
144
+ },
145
+ {
146
+ "cell_type": "code",
147
+ "execution_count": 6,
148
+ "id": "18f02f1e",
149
+ "metadata": {},
150
+ "outputs": [
151
+ {
152
+ "data": {
153
+ "application/vnd.jupyter.widget-view+json": {
154
+ "model_id": "4f33376b6f9f40a09b52211aafdd89b8",
155
+ "version_major": 2,
156
+ "version_minor": 0
157
+ },
158
+ "text/plain": [
159
+ "Loading checkpoint shards: 0%| | 0/4 [00:00<?, ?it/s]"
160
+ ]
161
+ },
162
+ "metadata": {},
163
+ "output_type": "display_data"
164
+ }
165
+ ],
166
+ "source": [
167
+ "try:\n",
168
+ " del model\n",
169
+ " torch.cuda.empty_cache()\n",
170
+ "except:\n",
171
+ " pass\n",
172
+ "model = AutoModelForCausalLM.from_pretrained(base_model, torch_dtype=torch.bfloat16, device_map=\"auto\")\n",
173
+ "model.eval()\n",
174
+ "\n",
175
+ "# Save the original forward\n",
176
+ "model._original_forward = model.forward"
177
+ ]
178
+ },
179
+ {
180
+ "cell_type": "code",
181
+ "execution_count": 7,
182
+ "id": "fad72592",
183
+ "metadata": {},
184
+ "outputs": [
185
+ {
186
+ "data": {
187
+ "application/vnd.jupyter.widget-view+json": {
188
+ "model_id": "1df8f593be4445ef8144ea33f04ece48",
189
+ "version_major": 2,
190
+ "version_minor": 0
191
+ },
192
+ "text/plain": [
193
+ "Loading checkpoint shards: 0%| | 0/4 [00:00<?, ?it/s]"
194
+ ]
195
+ },
196
+ "metadata": {},
197
+ "output_type": "display_data"
198
+ }
199
+ ],
200
+ "source": [
201
+ "test = AutoModelForCausalLM.from_pretrained(base_model, torch_dtype=torch.bfloat16, device_map=\"meta\")"
202
+ ]
203
+ },
204
+ {
205
+ "cell_type": "code",
206
+ "execution_count": null,
207
+ "id": "ff23e4a2",
208
+ "metadata": {},
209
+ "outputs": [],
210
+ "source": [
211
+ "\n",
212
+ "# def forward(\n",
213
+ "# self,\n",
214
+ "# input_ids: Optional[torch.LongTensor] = None,\n",
215
+ "# attention_mask: Optional[torch.Tensor] = None,\n",
216
+ "# position_ids: Optional[torch.LongTensor] = None,\n",
217
+ "# past_key_values: Optional[Cache] = None,\n",
218
+ "# inputs_embeds: Optional[torch.FloatTensor] = None,\n",
219
+ "# labels: Optional[torch.LongTensor] = None,\n",
220
+ "# use_cache: Optional[bool] = None,\n",
221
+ "# cache_position: Optional[torch.LongTensor] = None,\n",
222
+ "# logits_to_keep: Union[int, torch.Tensor] = 0,\n",
223
+ "# **kwargs: Unpack[TransformersKwargs],\n",
224
+ "# ) -> CausalLMOutputWithPast:\n",
225
+ "# r\"\"\"\n",
226
+ "# Example:\n",
227
+ "\n",
228
+ "# ```python\n",
229
+ "# >>> from transformers import AutoTokenizer, LlamaForCausalLM\n",
230
+ "\n",
231
+ "# >>> model = LlamaForCausalLM.from_pretrained(\"meta-llama/Llama-2-7b-hf\")\n",
232
+ "# >>> tokenizer = AutoTokenizer.from_pretrained(\"meta-llama/Llama-2-7b-hf\")\n",
233
+ "\n",
234
+ "# >>> prompt = \"Hey, are you conscious? Can you talk to me?\"\n",
235
+ "# >>> inputs = tokenizer(prompt, return_tensors=\"pt\")\n",
236
+ "\n",
237
+ "# >>> # Generate\n",
238
+ "# >>> generate_ids = model.generate(inputs.input_ids, max_length=30)\n",
239
+ "# >>> tokenizer.batch_decode(generate_ids, skip_special_tokens=True, clean_up_tokenization_spaces=False)[0]\n",
240
+ "# \"Hey, are you conscious? Can you talk to me?\\nI'm not conscious, but I can talk to you.\"\n",
241
+ "# ```\"\"\"\n",
242
+ "# outputs: BaseModelOutputWithPast = self.model(\n",
243
+ "# input_ids=input_ids,\n",
244
+ "# attention_mask=attention_mask,\n",
245
+ "# position_ids=position_ids,\n",
246
+ "# past_key_values=past_key_values,\n",
247
+ "# inputs_embeds=inputs_embeds,\n",
248
+ "# use_cache=use_cache,\n",
249
+ "# cache_position=cache_position,\n",
250
+ "# **kwargs,\n",
251
+ "# )\n",
252
+ "\n",
253
+ "# hidden_states = outputs.last_hidden_state\n",
254
+ "# # Only compute necessary logits, and do not upcast them to float if we are not computing the loss\n",
255
+ "# slice_indices = slice(-logits_to_keep, None) if isinstance(logits_to_keep, int) else logits_to_keep\n",
256
+ "# logits = self.lm_head(hidden_states[:, slice_indices, :])\n",
257
+ "\n",
258
+ "# loss = None\n",
259
+ "# if labels is not None:\n",
260
+ "# loss = self.loss_function(logits=logits, labels=labels, vocab_size=self.config.vocab_size, **kwargs)\n",
261
+ "\n",
262
+ "# return CausalLMOutputWithPast(\n",
263
+ "# loss=loss,\n",
264
+ "# logits=logits,\n",
265
+ "# past_key_values=outputs.past_key_values,\n",
266
+ "# hidden_states=outputs.hidden_states,\n",
267
+ "# attentions=outputs.attentions,\n",
268
+ "# )"
269
+ ]
270
+ },
271
+ {
272
+ "cell_type": "code",
273
+ "execution_count": 8,
274
+ "id": "820f4c9c",
275
+ "metadata": {},
276
+ "outputs": [],
277
+ "source": [
278
+ "prompt_fn = lambda content: tokenizer.apply_chat_template([\n",
279
+ " {\"role\": \"user\", \"content\": content},\n",
280
+ "], tokenize = False, add_generation_prompt = True)"
281
+ ]
282
+ },
283
+ {
284
+ "cell_type": "code",
285
+ "execution_count": 9,
286
+ "id": "3813b71e",
287
+ "metadata": {},
288
+ "outputs": [],
289
+ "source": [
290
+ "inputs = [prompt_fn(\"What is the meaning of life?\"), prompt_fn(\"When was Obama born?\")]\n",
291
+ "tokd_input = tokenizer(inputs, return_tensors=\"pt\", add_special_tokens=False, padding=True).to(model.device)\n",
292
+ "num_beam_groups = 2\n",
293
+ "beams_per_group = 3"
294
+ ]
295
+ },
296
+ {
297
+ "cell_type": "code",
298
+ "execution_count": null,
299
+ "id": "cfd0c000",
300
+ "metadata": {},
301
+ "outputs": [
302
+ {
303
+ "data": {
304
+ "text/plain": [
305
+ "{'input_ids': tensor([[128000, 128006, 9125, 128007, 271, 38766, 1303, 33025, 2696,\n",
306
+ " 25, 6790, 220, 2366, 18, 198, 15724, 2696, 25,\n",
307
+ " 220, 1627, 10263, 220, 2366, 19, 271, 128009, 128006,\n",
308
+ " 882, 128007, 271, 3923, 374, 279, 7438, 315, 2324,\n",
309
+ " 30, 128009, 128006, 78191, 128007, 271],\n",
310
+ " [128009, 128009, 128000, 128006, 9125, 128007, 271, 38766, 1303,\n",
311
+ " 33025, 2696, 25, 6790, 220, 2366, 18, 198, 15724,\n",
312
+ " 2696, 25, 220, 1627, 10263, 220, 2366, 19, 271,\n",
313
+ " 128009, 128006, 882, 128007, 271, 4599, 574, 7250, 9405,\n",
314
+ " 30, 128009, 128006, 78191, 128007, 271]], device='cuda:0'), 'attention_mask': tensor([[1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1,\n",
315
+ " 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1],\n",
316
+ " [0, 0, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1,\n",
317
+ " 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1]],\n",
318
+ " device='cuda:0')}"
319
+ ]
320
+ },
321
+ "execution_count": 11,
322
+ "metadata": {},
323
+ "output_type": "execute_result"
324
+ }
325
+ ],
326
+ "source": [
327
+ "tokd_input"
328
+ ]
329
+ },
330
+ {
331
+ "cell_type": "code",
332
+ "execution_count": null,
333
+ "id": "57bfea89",
334
+ "metadata": {},
335
+ "outputs": [
336
+ {
337
+ "name": "stderr",
338
+ "output_type": "stream",
339
+ "text": [
340
+ "Group Beam Search is scheduled to be moved to a `custom_generate` repository in v4.55.0. To prevent loss of backward compatibility, add `trust_remote_code=True` to your `generate` call.\n"
341
+ ]
342
+ }
343
+ ],
344
+ "source": [
345
+ "out = model.generate(\n",
346
+ " **tokd_input,\n",
347
+ " max_new_tokens=1,\n",
348
+ " logits_processor=[logits_processor],\n",
349
+ " pad_token_id=tokenizer.eos_token_id,\n",
350
+ " do_sample = False, temperature=None, top_p=None,\n",
351
+ " num_beams = num_beam_groups * beams_per_group,\n",
352
+ " num_beam_groups = num_beam_groups,\n",
353
+ " num_return_sequences = num_beam_groups * beams_per_group,\n",
354
+ " diversity_penalty = 0.5, use_cache = False\n",
355
+ " )"
356
+ ]
357
+ },
358
+ {
359
+ "cell_type": "code",
360
+ "execution_count": 10,
361
+ "id": "0811859f",
362
+ "metadata": {},
363
+ "outputs": [],
364
+ "source": [
365
+ "N = test.lm_head.out_features\n",
366
+ "\n",
367
+ "beam_search_params = SamplingParams(logprobs=20,\n",
368
+ " max_tokens=1,\n",
369
+ " temperature=1.0,\n",
370
+ " detokenize=False)"
371
+ ]
372
+ },
373
+ {
374
+ "cell_type": "code",
375
+ "execution_count": 11,
376
+ "id": "d424a6a9",
377
+ "metadata": {},
378
+ "outputs": [],
379
+ "source": [
380
+ "input_ids = tokd_input[\"input_ids\"]\n",
381
+ "prompts_batch = [TokensPrompt(prompt_token_ids=i) for i in input_ids]\n",
382
+ "output = vllm.generate(prompts_batch,\n",
383
+ " sampling_params=beam_search_params,\n",
384
+ " use_tqdm=False)\n",
385
+ "logits = []\n",
386
+ "size = (N,)\n",
387
+ "for o in output:\n",
388
+ " o = o.outputs[0].logprobs[0]\n",
389
+ " tensor = torch.full(size, float('-inf'))\n",
390
+ "\n",
391
+ " # Set values from the dictionary\n",
392
+ " if o: # only if dictionary is not empty\n",
393
+ " indices = torch.tensor(list(o.keys()))\n",
394
+ " values = torch.tensor([i.logprob for i in o.values()])\n",
395
+ " tensor[indices] = values\n",
396
+ "\n",
397
+ " logits.append(tensor)\n",
398
+ "logits = torch.stack(logits).unsqueeze(1)\n",
399
+ "output_dict = CausalLMOutputWithPast(\n",
400
+ " loss=None,\n",
401
+ " logits=logits,\n",
402
+ " past_key_values=None,\n",
403
+ " hidden_states=None,\n",
404
+ " attentions=None,\n",
405
+ " )"
406
+ ]
407
+ },
408
+ {
409
+ "cell_type": "code",
410
+ "execution_count": null,
411
+ "id": "d2df69fb",
412
+ "metadata": {},
413
+ "outputs": [
414
+ {
415
+ "name": "stderr",
416
+ "output_type": "stream",
417
+ "text": [
418
+ "The attention mask is not set and cannot be inferred from input because pad token is same as eos token. As a consequence, you may observe unexpected behavior. Please pass your input's `attention_mask` to obtain reliable results.\n"
419
+ ]
420
+ },
421
+ {
422
+ "name": "stdout",
423
+ "output_type": "stream",
424
+ "text": [
425
+ "Using patched forward:\n",
426
+ "Patched forward signature: {'position_ids', 'past_key_values', 'kwargs', 'cache_position', 'attention_mask', 'use_cache', 'logits_to_keep', 'labels', 'inputs_embeds', 'input_ids'}\n",
427
+ "791 {791: Logprob(logprob=-0.020645949989557266, rank=1, decoded_token=None), 4054: Logprob(logprob=-4.645646095275879, rank=2, decoded_token=None), 32: Logprob(logprob=-5.020646095275879, rank=3, decoded_token=None), 3923: Logprob(logprob=-6.145646095275879, rank=4, decoded_token=None), 30690: Logprob(logprob=-6.770646095275879, rank=5, decoded_token=None), 20397: Logprob(logprob=-7.520646095275879, rank=6, decoded_token=None), 3947: Logprob(logprob=-9.395646095275879, rank=7, decoded_token=None), 8142: Logprob(logprob=-9.833146095275879, rank=8, decoded_token=None), 31140: Logprob(logprob=-9.895646095275879, rank=9, decoded_token=None), 16533: Logprob(logprob=-10.645646095275879, rank=10, decoded_token=None), 32576: Logprob(logprob=-10.833146095275879, rank=11, decoded_token=None), 2028: Logprob(logprob=-10.958146095275879, rank=12, decoded_token=None), 38356: Logprob(logprob=-11.583146095275879, rank=13, decoded_token=None), 578: Logprob(logprob=-11.708146095275879, rank=14, decoded_token=None), 10227: Logprob(logprob=-11.833146095275879, rank=15, decoded_token=None), 93748: Logprob(logprob=-12.083146095275879, rank=16, decoded_token=None), 31437: Logprob(logprob=-12.083146095275879, rank=17, decoded_token=None), 8607: Logprob(logprob=-12.083146095275879, rank=18, decoded_token=None), 46185: Logprob(logprob=-12.208146095275879, rank=19, decoded_token=None), 71251: Logprob(logprob=-12.270646095275879, rank=20, decoded_token=None)}\n",
428
+ "791 {791: Logprob(logprob=-0.020645949989557266, rank=1, decoded_token=None), 4054: Logprob(logprob=-4.645646095275879, rank=2, decoded_token=None), 32: Logprob(logprob=-5.020646095275879, rank=3, decoded_token=None), 3923: Logprob(logprob=-6.145646095275879, rank=4, decoded_token=None), 30690: Logprob(logprob=-6.770646095275879, rank=5, decoded_token=None), 20397: Logprob(logprob=-7.520646095275879, rank=6, decoded_token=None), 3947: Logprob(logprob=-9.395646095275879, rank=7, decoded_token=None), 8142: Logprob(logprob=-9.833146095275879, rank=8, decoded_token=None), 31140: Logprob(logprob=-9.895646095275879, rank=9, decoded_token=None), 16533: Logprob(logprob=-10.645646095275879, rank=10, decoded_token=None), 32576: Logprob(logprob=-10.833146095275879, rank=11, decoded_token=None), 2028: Logprob(logprob=-10.958146095275879, rank=12, decoded_token=None), 38356: Logprob(logprob=-11.583146095275879, rank=13, decoded_token=None), 578: Logprob(logprob=-11.708146095275879, rank=14, decoded_token=None), 10227: Logprob(logprob=-11.833146095275879, rank=15, decoded_token=None), 93748: Logprob(logprob=-12.083146095275879, rank=16, decoded_token=None), 31437: Logprob(logprob=-12.083146095275879, rank=17, decoded_token=None), 8607: Logprob(logprob=-12.083146095275879, rank=18, decoded_token=None), 46185: Logprob(logprob=-12.208146095275879, rank=19, decoded_token=None), 71251: Logprob(logprob=-12.270646095275879, rank=20, decoded_token=None)}\n",
429
+ "791 {791: Logprob(logprob=-0.020645949989557266, rank=1, decoded_token=None), 4054: Logprob(logprob=-4.645646095275879, rank=2, decoded_token=None), 32: Logprob(logprob=-5.020646095275879, rank=3, decoded_token=None), 3923: Logprob(logprob=-6.145646095275879, rank=4, decoded_token=None), 30690: Logprob(logprob=-6.770646095275879, rank=5, decoded_token=None), 20397: Logprob(logprob=-7.520646095275879, rank=6, decoded_token=None), 3947: Logprob(logprob=-9.395646095275879, rank=7, decoded_token=None), 8142: Logprob(logprob=-9.833146095275879, rank=8, decoded_token=None), 31140: Logprob(logprob=-9.895646095275879, rank=9, decoded_token=None), 16533: Logprob(logprob=-10.645646095275879, rank=10, decoded_token=None), 32576: Logprob(logprob=-10.833146095275879, rank=11, decoded_token=None), 2028: Logprob(logprob=-10.958146095275879, rank=12, decoded_token=None), 38356: Logprob(logprob=-11.583146095275879, rank=13, decoded_token=None), 578: Logprob(logprob=-11.708146095275879, rank=14, decoded_token=None), 10227: Logprob(logprob=-11.833146095275879, rank=15, decoded_token=None), 93748: Logprob(logprob=-12.083146095275879, rank=16, decoded_token=None), 31437: Logprob(logprob=-12.083146095275879, rank=17, decoded_token=None), 8607: Logprob(logprob=-12.083146095275879, rank=18, decoded_token=None), 46185: Logprob(logprob=-12.208146095275879, rank=19, decoded_token=None), 71251: Logprob(logprob=-12.270646095275879, rank=20, decoded_token=None)}\n",
430
+ "791 {791: Logprob(logprob=-0.020645949989557266, rank=1, decoded_token=None), 4054: Logprob(logprob=-4.645646095275879, rank=2, decoded_token=None), 32: Logprob(logprob=-5.020646095275879, rank=3, decoded_token=None), 3923: Logprob(logprob=-6.145646095275879, rank=4, decoded_token=None), 30690: Logprob(logprob=-6.770646095275879, rank=5, decoded_token=None), 20397: Logprob(logprob=-7.520646095275879, rank=6, decoded_token=None), 3947: Logprob(logprob=-9.395646095275879, rank=7, decoded_token=None), 8142: Logprob(logprob=-9.833146095275879, rank=8, decoded_token=None), 31140: Logprob(logprob=-9.895646095275879, rank=9, decoded_token=None), 16533: Logprob(logprob=-10.645646095275879, rank=10, decoded_token=None), 32576: Logprob(logprob=-10.833146095275879, rank=11, decoded_token=None), 2028: Logprob(logprob=-10.958146095275879, rank=12, decoded_token=None), 38356: Logprob(logprob=-11.583146095275879, rank=13, decoded_token=None), 578: Logprob(logprob=-11.708146095275879, rank=14, decoded_token=None), 10227: Logprob(logprob=-11.833146095275879, rank=15, decoded_token=None), 93748: Logprob(logprob=-12.083146095275879, rank=16, decoded_token=None), 31437: Logprob(logprob=-12.083146095275879, rank=17, decoded_token=None), 8607: Logprob(logprob=-12.083146095275879, rank=18, decoded_token=None), 46185: Logprob(logprob=-12.208146095275879, rank=19, decoded_token=None), 71251: Logprob(logprob=-12.270646095275879, rank=20, decoded_token=None)}\n",
431
+ "791 {791: Logprob(logprob=-0.020645949989557266, rank=1, decoded_token=None), 4054: Logprob(logprob=-4.645646095275879, rank=2, decoded_token=None), 32: Logprob(logprob=-5.020646095275879, rank=3, decoded_token=None), 3923: Logprob(logprob=-6.145646095275879, rank=4, decoded_token=None), 30690: Logprob(logprob=-6.770646095275879, rank=5, decoded_token=None), 20397: Logprob(logprob=-7.520646095275879, rank=6, decoded_token=None), 3947: Logprob(logprob=-9.395646095275879, rank=7, decoded_token=None), 8142: Logprob(logprob=-9.833146095275879, rank=8, decoded_token=None), 31140: Logprob(logprob=-9.895646095275879, rank=9, decoded_token=None), 16533: Logprob(logprob=-10.645646095275879, rank=10, decoded_token=None), 32576: Logprob(logprob=-10.833146095275879, rank=11, decoded_token=None), 2028: Logprob(logprob=-10.958146095275879, rank=12, decoded_token=None), 38356: Logprob(logprob=-11.583146095275879, rank=13, decoded_token=None), 578: Logprob(logprob=-11.708146095275879, rank=14, decoded_token=None), 10227: Logprob(logprob=-11.833146095275879, rank=15, decoded_token=None), 93748: Logprob(logprob=-12.083146095275879, rank=16, decoded_token=None), 31437: Logprob(logprob=-12.083146095275879, rank=17, decoded_token=None), 8607: Logprob(logprob=-12.083146095275879, rank=18, decoded_token=None), 46185: Logprob(logprob=-12.208146095275879, rank=19, decoded_token=None), 71251: Logprob(logprob=-12.270646095275879, rank=20, decoded_token=None)}\n",
432
+ "791 {791: Logprob(logprob=-0.020645949989557266, rank=1, decoded_token=None), 4054: Logprob(logprob=-4.645646095275879, rank=2, decoded_token=None), 32: Logprob(logprob=-5.020646095275879, rank=3, decoded_token=None), 3923: Logprob(logprob=-6.145646095275879, rank=4, decoded_token=None), 30690: Logprob(logprob=-6.770646095275879, rank=5, decoded_token=None), 20397: Logprob(logprob=-7.520646095275879, rank=6, decoded_token=None), 3947: Logprob(logprob=-9.395646095275879, rank=7, decoded_token=None), 8142: Logprob(logprob=-9.833146095275879, rank=8, decoded_token=None), 31140: Logprob(logprob=-9.895646095275879, rank=9, decoded_token=None), 16533: Logprob(logprob=-10.645646095275879, rank=10, decoded_token=None), 32576: Logprob(logprob=-10.833146095275879, rank=11, decoded_token=None), 2028: Logprob(logprob=-10.958146095275879, rank=12, decoded_token=None), 38356: Logprob(logprob=-11.583146095275879, rank=13, decoded_token=None), 578: Logprob(logprob=-11.708146095275879, rank=14, decoded_token=None), 10227: Logprob(logprob=-11.833146095275879, rank=15, decoded_token=None), 93748: Logprob(logprob=-12.083146095275879, rank=16, decoded_token=None), 31437: Logprob(logprob=-12.083146095275879, rank=17, decoded_token=None), 8607: Logprob(logprob=-12.083146095275879, rank=18, decoded_token=None), 46185: Logprob(logprob=-12.208146095275879, rank=19, decoded_token=None), 71251: Logprob(logprob=-12.270646095275879, rank=20, decoded_token=None)}\n",
433
+ "3511 {3511: Logprob(logprob=-0.023903636261820793, rank=1, decoded_token=None), 31945: Logprob(logprob=-3.8989036083221436, rank=2, decoded_token=None), 27229: Logprob(logprob=-6.523903846740723, rank=3, decoded_token=None), 791: Logprob(logprob=-7.648903846740723, rank=4, decoded_token=None), 24448: Logprob(logprob=-8.148903846740723, rank=5, decoded_token=None), 2078: Logprob(logprob=-8.523903846740723, rank=6, decoded_token=None), 1271: Logprob(logprob=-8.773903846740723, rank=7, decoded_token=None), 52: Logprob(logprob=-9.023903846740723, rank=8, decoded_token=None), 45437: Logprob(logprob=-9.148903846740723, rank=9, decoded_token=None), 1548: Logprob(logprob=-9.273903846740723, rank=10, decoded_token=None), 40: Logprob(logprob=-9.273903846740723, rank=11, decoded_token=None), 35627: Logprob(logprob=-10.023903846740723, rank=12, decoded_token=None), 23175: Logprob(logprob=-10.148903846740723, rank=13, decoded_token=None), 14704: Logprob(logprob=-10.398903846740723, rank=14, decoded_token=None), 32: Logprob(logprob=-10.648903846740723, rank=15, decoded_token=None), 2308: Logprob(logprob=-10.773903846740723, rank=16, decoded_token=None), 34165: Logprob(logprob=-10.898903846740723, rank=17, decoded_token=None), 644: Logprob(logprob=-10.898903846740723, rank=18, decoded_token=None), 1966: Logprob(logprob=-11.023903846740723, rank=19, decoded_token=None), 18735: Logprob(logprob=-11.273903846740723, rank=20, decoded_token=None)}\n",
434
+ "3511 {3511: Logprob(logprob=-0.023903636261820793, rank=1, decoded_token=None), 31945: Logprob(logprob=-3.8989036083221436, rank=2, decoded_token=None), 27229: Logprob(logprob=-6.523903846740723, rank=3, decoded_token=None), 791: Logprob(logprob=-7.648903846740723, rank=4, decoded_token=None), 24448: Logprob(logprob=-8.148903846740723, rank=5, decoded_token=None), 2078: Logprob(logprob=-8.523903846740723, rank=6, decoded_token=None), 1271: Logprob(logprob=-8.773903846740723, rank=7, decoded_token=None), 52: Logprob(logprob=-9.023903846740723, rank=8, decoded_token=None), 45437: Logprob(logprob=-9.148903846740723, rank=9, decoded_token=None), 1548: Logprob(logprob=-9.273903846740723, rank=10, decoded_token=None), 40: Logprob(logprob=-9.273903846740723, rank=11, decoded_token=None), 35627: Logprob(logprob=-10.023903846740723, rank=12, decoded_token=None), 23175: Logprob(logprob=-10.148903846740723, rank=13, decoded_token=None), 14704: Logprob(logprob=-10.398903846740723, rank=14, decoded_token=None), 32: Logprob(logprob=-10.648903846740723, rank=15, decoded_token=None), 2308: Logprob(logprob=-10.773903846740723, rank=16, decoded_token=None), 34165: Logprob(logprob=-10.898903846740723, rank=17, decoded_token=None), 644: Logprob(logprob=-10.898903846740723, rank=18, decoded_token=None), 1966: Logprob(logprob=-11.023903846740723, rank=19, decoded_token=None), 18735: Logprob(logprob=-11.273903846740723, rank=20, decoded_token=None)}\n",
435
+ "3511 {3511: Logprob(logprob=-0.023903636261820793, rank=1, decoded_token=None), 31945: Logprob(logprob=-3.8989036083221436, rank=2, decoded_token=None), 27229: Logprob(logprob=-6.523903846740723, rank=3, decoded_token=None), 791: Logprob(logprob=-7.648903846740723, rank=4, decoded_token=None), 24448: Logprob(logprob=-8.148903846740723, rank=5, decoded_token=None), 2078: Logprob(logprob=-8.523903846740723, rank=6, decoded_token=None), 1271: Logprob(logprob=-8.773903846740723, rank=7, decoded_token=None), 52: Logprob(logprob=-9.023903846740723, rank=8, decoded_token=None), 45437: Logprob(logprob=-9.148903846740723, rank=9, decoded_token=None), 1548: Logprob(logprob=-9.273903846740723, rank=10, decoded_token=None), 40: Logprob(logprob=-9.273903846740723, rank=11, decoded_token=None), 35627: Logprob(logprob=-10.023903846740723, rank=12, decoded_token=None), 23175: Logprob(logprob=-10.148903846740723, rank=13, decoded_token=None), 14704: Logprob(logprob=-10.398903846740723, rank=14, decoded_token=None), 32: Logprob(logprob=-10.648903846740723, rank=15, decoded_token=None), 2308: Logprob(logprob=-10.773903846740723, rank=16, decoded_token=None), 34165: Logprob(logprob=-10.898903846740723, rank=17, decoded_token=None), 644: Logprob(logprob=-10.898903846740723, rank=18, decoded_token=None), 1966: Logprob(logprob=-11.023903846740723, rank=19, decoded_token=None), 18735: Logprob(logprob=-11.273903846740723, rank=20, decoded_token=None)}\n",
436
+ "3511 {3511: Logprob(logprob=-0.023903636261820793, rank=1, decoded_token=None), 31945: Logprob(logprob=-3.8989036083221436, rank=2, decoded_token=None), 27229: Logprob(logprob=-6.523903846740723, rank=3, decoded_token=None), 791: Logprob(logprob=-7.648903846740723, rank=4, decoded_token=None), 24448: Logprob(logprob=-8.148903846740723, rank=5, decoded_token=None), 2078: Logprob(logprob=-8.523903846740723, rank=6, decoded_token=None), 1271: Logprob(logprob=-8.773903846740723, rank=7, decoded_token=None), 52: Logprob(logprob=-9.023903846740723, rank=8, decoded_token=None), 45437: Logprob(logprob=-9.148903846740723, rank=9, decoded_token=None), 1548: Logprob(logprob=-9.273903846740723, rank=10, decoded_token=None), 40: Logprob(logprob=-9.273903846740723, rank=11, decoded_token=None), 35627: Logprob(logprob=-10.023903846740723, rank=12, decoded_token=None), 23175: Logprob(logprob=-10.148903846740723, rank=13, decoded_token=None), 14704: Logprob(logprob=-10.398903846740723, rank=14, decoded_token=None), 32: Logprob(logprob=-10.648903846740723, rank=15, decoded_token=None), 2308: Logprob(logprob=-10.773903846740723, rank=16, decoded_token=None), 34165: Logprob(logprob=-10.898903846740723, rank=17, decoded_token=None), 644: Logprob(logprob=-10.898903846740723, rank=18, decoded_token=None), 1966: Logprob(logprob=-11.023903846740723, rank=19, decoded_token=None), 18735: Logprob(logprob=-11.273903846740723, rank=20, decoded_token=None)}\n",
437
+ "3511 {3511: Logprob(logprob=-0.023903636261820793, rank=1, decoded_token=None), 31945: Logprob(logprob=-3.8989036083221436, rank=2, decoded_token=None), 27229: Logprob(logprob=-6.523903846740723, rank=3, decoded_token=None), 791: Logprob(logprob=-7.648903846740723, rank=4, decoded_token=None), 24448: Logprob(logprob=-8.148903846740723, rank=5, decoded_token=None), 2078: Logprob(logprob=-8.523903846740723, rank=6, decoded_token=None), 1271: Logprob(logprob=-8.773903846740723, rank=7, decoded_token=None), 52: Logprob(logprob=-9.023903846740723, rank=8, decoded_token=None), 45437: Logprob(logprob=-9.148903846740723, rank=9, decoded_token=None), 1548: Logprob(logprob=-9.273903846740723, rank=10, decoded_token=None), 40: Logprob(logprob=-9.273903846740723, rank=11, decoded_token=None), 35627: Logprob(logprob=-10.023903846740723, rank=12, decoded_token=None), 23175: Logprob(logprob=-10.148903846740723, rank=13, decoded_token=None), 14704: Logprob(logprob=-10.398903846740723, rank=14, decoded_token=None), 32: Logprob(logprob=-10.648903846740723, rank=15, decoded_token=None), 2308: Logprob(logprob=-10.773903846740723, rank=16, decoded_token=None), 34165: Logprob(logprob=-10.898903846740723, rank=17, decoded_token=None), 644: Logprob(logprob=-10.898903846740723, rank=18, decoded_token=None), 1966: Logprob(logprob=-11.023903846740723, rank=19, decoded_token=None), 18735: Logprob(logprob=-11.273903846740723, rank=20, decoded_token=None)}\n",
438
+ "3511 {3511: Logprob(logprob=-0.023903636261820793, rank=1, decoded_token=None), 31945: Logprob(logprob=-3.8989036083221436, rank=2, decoded_token=None), 27229: Logprob(logprob=-6.523903846740723, rank=3, decoded_token=None), 791: Logprob(logprob=-7.648903846740723, rank=4, decoded_token=None), 24448: Logprob(logprob=-8.148903846740723, rank=5, decoded_token=None), 2078: Logprob(logprob=-8.523903846740723, rank=6, decoded_token=None), 1271: Logprob(logprob=-8.773903846740723, rank=7, decoded_token=None), 52: Logprob(logprob=-9.023903846740723, rank=8, decoded_token=None), 45437: Logprob(logprob=-9.148903846740723, rank=9, decoded_token=None), 1548: Logprob(logprob=-9.273903846740723, rank=10, decoded_token=None), 40: Logprob(logprob=-9.273903846740723, rank=11, decoded_token=None), 35627: Logprob(logprob=-10.023903846740723, rank=12, decoded_token=None), 23175: Logprob(logprob=-10.148903846740723, rank=13, decoded_token=None), 14704: Logprob(logprob=-10.398903846740723, rank=14, decoded_token=None), 32: Logprob(logprob=-10.648903846740723, rank=15, decoded_token=None), 2308: Logprob(logprob=-10.773903846740723, rank=16, decoded_token=None), 34165: Logprob(logprob=-10.898903846740723, rank=17, decoded_token=None), 644: Logprob(logprob=-10.898903846740723, rank=18, decoded_token=None), 1966: Logprob(logprob=-11.023903846740723, rank=19, decoded_token=None), 18735: Logprob(logprob=-11.273903846740723, rank=20, decoded_token=None)}\n",
439
+ "3488 {3488: Logprob(logprob=-0.2706400752067566, rank=1, decoded_token=None), 7438: Logprob(logprob=-1.5206401348114014, rank=2, decoded_token=None), 7434: Logprob(logprob=-4.520639896392822, rank=3, decoded_token=None), 4325: Logprob(logprob=-5.895639896392822, rank=4, decoded_token=None), 330: Logprob(logprob=-6.145639896392822, rank=5, decoded_token=None), 4320: Logprob(logprob=-7.020639896392822, rank=6, decoded_token=None), 17139: Logprob(logprob=-7.145639896392822, rank=7, decoded_token=None), 2271: Logprob(logprob=-8.02064037322998, rank=8, decoded_token=None), 364: Logprob(logprob=-8.39564037322998, rank=9, decoded_token=None), 2778: Logprob(logprob=-9.39564037322998, rank=10, decoded_token=None), 35825: Logprob(logprob=-9.70814037322998, rank=11, decoded_token=None), 14209: Logprob(logprob=-9.95814037322998, rank=12, decoded_token=None), 49203: Logprob(logprob=-10.20814037322998, rank=13, decoded_token=None), 23347: Logprob(logprob=-10.39564037322998, rank=14, decoded_token=None), 17571: Logprob(logprob=-10.58314037322998, rank=15, decoded_token=None), 4860: Logprob(logprob=-10.64564037322998, rank=16, decoded_token=None), 3319: Logprob(logprob=-10.83314037322998, rank=17, decoded_token=None), 4751: Logprob(logprob=-10.89564037322998, rank=18, decoded_token=None), 16225: Logprob(logprob=-10.89564037322998, rank=19, decoded_token=None), 7419: Logprob(logprob=-10.95814037322998, rank=20, decoded_token=None)}\n",
440
+ "315 {315: Logprob(logprob=-3.1709168979432434e-05, rank=1, decoded_token=None), 3488: Logprob(logprob=-10.375031471252441, rank=2, decoded_token=None), 220: Logprob(logprob=-15.750031471252441, rank=3, decoded_token=None), 279: Logprob(logprob=-16.062532424926758, rank=4, decoded_token=None), 5046: Logprob(logprob=-16.375032424926758, rank=5, decoded_token=None), 1073: Logprob(logprob=-16.937532424926758, rank=6, decoded_token=None), 596: Logprob(logprob=-16.937532424926758, rank=7, decoded_token=None), 35825: Logprob(logprob=-17.437532424926758, rank=8, decoded_token=None), 16225: Logprob(logprob=-17.812532424926758, rank=9, decoded_token=None), 4860: Logprob(logprob=-18.375032424926758, rank=10, decoded_token=None), 3659: Logprob(logprob=-18.437532424926758, rank=11, decoded_token=None), 832: Logprob(logprob=-18.687532424926758, rank=12, decoded_token=None), 1455: Logprob(logprob=-19.000032424926758, rank=13, decoded_token=None), 67739: Logprob(logprob=-19.062532424926758, rank=14, decoded_token=None), 3083: Logprob(logprob=-19.187532424926758, rank=15, decoded_token=None), 430: Logprob(logprob=-19.250032424926758, rank=16, decoded_token=None), 60835: Logprob(logprob=-19.375032424926758, rank=17, decoded_token=None), 43146: Logprob(logprob=-19.437532424926758, rank=18, decoded_token=None), 13189: Logprob(logprob=-19.562532424926758, rank=19, decoded_token=None), 311: Logprob(logprob=-19.625032424926758, rank=20, decoded_token=None)}\n",
441
+ "3488 {3488: Logprob(logprob=-0.0018615075387060642, rank=1, decoded_token=None), 28254: Logprob(logprob=-7.126861572265625, rank=2, decoded_token=None), 11670: Logprob(logprob=-8.001861572265625, rank=3, decoded_token=None), 58105: Logprob(logprob=-8.126861572265625, rank=4, decoded_token=None), 23490: Logprob(logprob=-9.439361572265625, rank=5, decoded_token=None), 41903: Logprob(logprob=-9.501861572265625, rank=6, decoded_token=None), 6485: Logprob(logprob=-9.689361572265625, rank=7, decoded_token=None), 16188: Logprob(logprob=-10.314361572265625, rank=8, decoded_token=None), 74718: Logprob(logprob=-10.626861572265625, rank=9, decoded_token=None), 16225: Logprob(logprob=-10.626861572265625, rank=10, decoded_token=None), 17693: Logprob(logprob=-11.314361572265625, rank=11, decoded_token=None), 4860: Logprob(logprob=-11.314361572265625, rank=12, decoded_token=None), 57697: Logprob(logprob=-11.751861572265625, rank=13, decoded_token=None), 4325: Logprob(logprob=-11.876861572265625, rank=14, decoded_token=None), 32846: Logprob(logprob=-11.939361572265625, rank=15, decoded_token=None), 66278: Logprob(logprob=-11.939361572265625, rank=16, decoded_token=None), 7998: Logprob(logprob=-12.064361572265625, rank=17, decoded_token=None), 8712: Logprob(logprob=-12.189361572265625, rank=18, decoded_token=None), 73835: Logprob(logprob=-12.376861572265625, rank=19, decoded_token=None), 2271: Logprob(logprob=-12.439361572265625, rank=20, decoded_token=None)}\n",
442
+ "3488 {3488: Logprob(logprob=-0.2706400752067566, rank=1, decoded_token=None), 7438: Logprob(logprob=-1.5206401348114014, rank=2, decoded_token=None), 7434: Logprob(logprob=-4.520639896392822, rank=3, decoded_token=None), 4325: Logprob(logprob=-5.895639896392822, rank=4, decoded_token=None), 330: Logprob(logprob=-6.145639896392822, rank=5, decoded_token=None), 4320: Logprob(logprob=-7.020639896392822, rank=6, decoded_token=None), 17139: Logprob(logprob=-7.145639896392822, rank=7, decoded_token=None), 2271: Logprob(logprob=-8.02064037322998, rank=8, decoded_token=None), 364: Logprob(logprob=-8.39564037322998, rank=9, decoded_token=None), 2778: Logprob(logprob=-9.39564037322998, rank=10, decoded_token=None), 35825: Logprob(logprob=-9.70814037322998, rank=11, decoded_token=None), 14209: Logprob(logprob=-9.95814037322998, rank=12, decoded_token=None), 49203: Logprob(logprob=-10.20814037322998, rank=13, decoded_token=None), 23347: Logprob(logprob=-10.39564037322998, rank=14, decoded_token=None), 17571: Logprob(logprob=-10.58314037322998, rank=15, decoded_token=None), 4860: Logprob(logprob=-10.64564037322998, rank=16, decoded_token=None), 3319: Logprob(logprob=-10.83314037322998, rank=17, decoded_token=None), 4751: Logprob(logprob=-10.89564037322998, rank=18, decoded_token=None), 16225: Logprob(logprob=-10.89564037322998, rank=19, decoded_token=None), 7419: Logprob(logprob=-10.95814037322998, rank=20, decoded_token=None)}\n",
443
+ "315 {315: Logprob(logprob=-3.1709168979432434e-05, rank=1, decoded_token=None), 3488: Logprob(logprob=-10.375031471252441, rank=2, decoded_token=None), 220: Logprob(logprob=-15.750031471252441, rank=3, decoded_token=None), 279: Logprob(logprob=-16.062532424926758, rank=4, decoded_token=None), 5046: Logprob(logprob=-16.375032424926758, rank=5, decoded_token=None), 1073: Logprob(logprob=-16.937532424926758, rank=6, decoded_token=None), 596: Logprob(logprob=-16.937532424926758, rank=7, decoded_token=None), 35825: Logprob(logprob=-17.437532424926758, rank=8, decoded_token=None), 16225: Logprob(logprob=-17.812532424926758, rank=9, decoded_token=None), 4860: Logprob(logprob=-18.375032424926758, rank=10, decoded_token=None), 3659: Logprob(logprob=-18.437532424926758, rank=11, decoded_token=None), 832: Logprob(logprob=-18.687532424926758, rank=12, decoded_token=None), 1455: Logprob(logprob=-19.000032424926758, rank=13, decoded_token=None), 67739: Logprob(logprob=-19.062532424926758, rank=14, decoded_token=None), 3083: Logprob(logprob=-19.187532424926758, rank=15, decoded_token=None), 430: Logprob(logprob=-19.250032424926758, rank=16, decoded_token=None), 60835: Logprob(logprob=-19.375032424926758, rank=17, decoded_token=None), 43146: Logprob(logprob=-19.437532424926758, rank=18, decoded_token=None), 13189: Logprob(logprob=-19.562532424926758, rank=19, decoded_token=None), 311: Logprob(logprob=-19.625032424926758, rank=20, decoded_token=None)}\n",
444
+ "3488 {3488: Logprob(logprob=-0.0018615075387060642, rank=1, decoded_token=None), 28254: Logprob(logprob=-7.126861572265625, rank=2, decoded_token=None), 11670: Logprob(logprob=-8.001861572265625, rank=3, decoded_token=None), 58105: Logprob(logprob=-8.126861572265625, rank=4, decoded_token=None), 23490: Logprob(logprob=-9.439361572265625, rank=5, decoded_token=None), 41903: Logprob(logprob=-9.501861572265625, rank=6, decoded_token=None), 6485: Logprob(logprob=-9.689361572265625, rank=7, decoded_token=None), 16188: Logprob(logprob=-10.314361572265625, rank=8, decoded_token=None), 74718: Logprob(logprob=-10.626861572265625, rank=9, decoded_token=None), 16225: Logprob(logprob=-10.626861572265625, rank=10, decoded_token=None), 17693: Logprob(logprob=-11.314361572265625, rank=11, decoded_token=None), 4860: Logprob(logprob=-11.314361572265625, rank=12, decoded_token=None), 57697: Logprob(logprob=-11.751861572265625, rank=13, decoded_token=None), 4325: Logprob(logprob=-11.876861572265625, rank=14, decoded_token=None), 32846: Logprob(logprob=-11.939361572265625, rank=15, decoded_token=None), 66278: Logprob(logprob=-11.939361572265625, rank=16, decoded_token=None), 7998: Logprob(logprob=-12.064361572265625, rank=17, decoded_token=None), 8712: Logprob(logprob=-12.189361572265625, rank=18, decoded_token=None), 73835: Logprob(logprob=-12.376861572265625, rank=19, decoded_token=None), 2271: Logprob(logprob=-12.439361572265625, rank=20, decoded_token=None)}\n",
445
+ "474 {474: Logprob(logprob=-0.0003861635341309011, rank=1, decoded_token=None), 587: Logprob(logprob=-7.8753862380981445, rank=2, decoded_token=None), 894: Logprob(logprob=-12.625386238098145, rank=3, decoded_token=None), 377: Logprob(logprob=-13.875386238098145, rank=4, decoded_token=None), 613: Logprob(logprob=-14.125386238098145, rank=5, decoded_token=None), 4122: Logprob(logprob=-15.000386238098145, rank=6, decoded_token=None), 13637: Logprob(logprob=-15.125386238098145, rank=7, decoded_token=None), 25062: Logprob(logprob=-15.625386238098145, rank=8, decoded_token=None), 582: Logprob(logprob=-15.750386238098145, rank=9, decoded_token=None), 5827: Logprob(logprob=-16.875385284423828, rank=10, decoded_token=None), 37406: Logprob(logprob=-17.000385284423828, rank=11, decoded_token=None), 7977: Logprob(logprob=-17.250385284423828, rank=12, decoded_token=None), 10956: Logprob(logprob=-17.375385284423828, rank=13, decoded_token=None), 81057: Logprob(logprob=-17.500385284423828, rank=14, decoded_token=None), 77527: Logprob(logprob=-17.625385284423828, rank=15, decoded_token=None), 56659: Logprob(logprob=-18.125385284423828, rank=16, decoded_token=None), 1412: Logprob(logprob=-18.125385284423828, rank=17, decoded_token=None), 263: Logprob(logprob=-18.437885284423828, rank=18, decoded_token=None), 566: Logprob(logprob=-18.562885284423828, rank=19, decoded_token=None), 3520: Logprob(logprob=-18.750385284423828, rank=20, decoded_token=None)}\n",
446
+ "549 {549: Logprob(logprob=-1.0475294589996338, rank=2, decoded_token=None), 2326: Logprob(logprob=-0.5475294589996338, rank=1, decoded_token=None), 4900: Logprob(logprob=-3.297529458999634, rank=3, decoded_token=None), 3723: Logprob(logprob=-3.422529458999634, rank=4, decoded_token=None), 4872: Logprob(logprob=-7.547529220581055, rank=5, decoded_token=None), 3778: Logprob(logprob=-8.297529220581055, rank=6, decoded_token=None), 7427: Logprob(logprob=-8.547529220581055, rank=7, decoded_token=None), 33440: Logprob(logprob=-9.047529220581055, rank=8, decoded_token=None), 220: Logprob(logprob=-9.547529220581055, rank=9, decoded_token=None), 35681: Logprob(logprob=-10.547529220581055, rank=10, decoded_token=None), 4073: Logprob(logprob=-12.047529220581055, rank=11, decoded_token=None), 86481: Logprob(logprob=-12.297529220581055, rank=12, decoded_token=None), 603: Logprob(logprob=-12.422529220581055, rank=13, decoded_token=None), 62602: Logprob(logprob=-12.672529220581055, rank=14, decoded_token=None), 2078: Logprob(logprob=-13.422529220581055, rank=15, decoded_token=None), 97038: Logprob(logprob=-13.797529220581055, rank=16, decoded_token=None), 29292: Logprob(logprob=-13.797529220581055, rank=17, decoded_token=None), 4203: Logprob(logprob=-13.922529220581055, rank=18, decoded_token=None), 85610: Logprob(logprob=-14.047529220581055, rank=19, decoded_token=None), 12: Logprob(logprob=-14.422529220581055, rank=20, decoded_token=None)}\n",
447
+ "24448 {24448: Logprob(logprob=-0.04389546066522598, rank=1, decoded_token=None), 7250: Logprob(logprob=-3.1688954830169678, rank=2, decoded_token=None), 4821: Logprob(logprob=-8.043895721435547, rank=3, decoded_token=None), 220: Logprob(logprob=-8.293895721435547, rank=4, decoded_token=None), 32817: Logprob(logprob=-8.418895721435547, rank=5, decoded_token=None), 315: Logprob(logprob=-9.668895721435547, rank=6, decoded_token=None), 3703: Logprob(logprob=-11.918895721435547, rank=7, decoded_token=None), 13142: Logprob(logprob=-12.043895721435547, rank=8, decoded_token=None), 38180: Logprob(logprob=-12.543895721435547, rank=9, decoded_token=None), 37081: Logprob(logprob=-12.543895721435547, rank=10, decoded_token=None), 92169: Logprob(logprob=-12.668895721435547, rank=11, decoded_token=None), 9641: Logprob(logprob=-12.793895721435547, rank=12, decoded_token=None), 45287: Logprob(logprob=-12.918895721435547, rank=13, decoded_token=None), 31858: Logprob(logprob=-13.168895721435547, rank=14, decoded_token=None), 94420: Logprob(logprob=-13.418895721435547, rank=15, decoded_token=None), 4761: Logprob(logprob=-13.668895721435547, rank=16, decoded_token=None), 16150: Logprob(logprob=-13.793895721435547, rank=17, decoded_token=None), 3511: Logprob(logprob=-13.918895721435547, rank=18, decoded_token=None), 45437: Logprob(logprob=-13.918895721435547, rank=19, decoded_token=None), 320: Logprob(logprob=-14.418895721435547, rank=20, decoded_token=None)}\n",
448
+ "474 {474: Logprob(logprob=-0.0003861635341309011, rank=1, decoded_token=None), 587: Logprob(logprob=-7.8753862380981445, rank=2, decoded_token=None), 894: Logprob(logprob=-12.625386238098145, rank=3, decoded_token=None), 377: Logprob(logprob=-13.875386238098145, rank=4, decoded_token=None), 613: Logprob(logprob=-14.125386238098145, rank=5, decoded_token=None), 4122: Logprob(logprob=-15.000386238098145, rank=6, decoded_token=None), 13637: Logprob(logprob=-15.125386238098145, rank=7, decoded_token=None), 25062: Logprob(logprob=-15.625386238098145, rank=8, decoded_token=None), 582: Logprob(logprob=-15.750386238098145, rank=9, decoded_token=None), 5827: Logprob(logprob=-16.875385284423828, rank=10, decoded_token=None), 37406: Logprob(logprob=-17.000385284423828, rank=11, decoded_token=None), 7977: Logprob(logprob=-17.250385284423828, rank=12, decoded_token=None), 10956: Logprob(logprob=-17.375385284423828, rank=13, decoded_token=None), 81057: Logprob(logprob=-17.500385284423828, rank=14, decoded_token=None), 77527: Logprob(logprob=-17.625385284423828, rank=15, decoded_token=None), 56659: Logprob(logprob=-18.125385284423828, rank=16, decoded_token=None), 1412: Logprob(logprob=-18.125385284423828, rank=17, decoded_token=None), 263: Logprob(logprob=-18.437885284423828, rank=18, decoded_token=None), 566: Logprob(logprob=-18.562885284423828, rank=19, decoded_token=None), 3520: Logprob(logprob=-18.750385284423828, rank=20, decoded_token=None)}\n",
449
+ "549 {549: Logprob(logprob=-1.0475294589996338, rank=2, decoded_token=None), 2326: Logprob(logprob=-0.5475294589996338, rank=1, decoded_token=None), 4900: Logprob(logprob=-3.297529458999634, rank=3, decoded_token=None), 3723: Logprob(logprob=-3.422529458999634, rank=4, decoded_token=None), 4872: Logprob(logprob=-7.547529220581055, rank=5, decoded_token=None), 3778: Logprob(logprob=-8.297529220581055, rank=6, decoded_token=None), 7427: Logprob(logprob=-8.547529220581055, rank=7, decoded_token=None), 33440: Logprob(logprob=-9.047529220581055, rank=8, decoded_token=None), 220: Logprob(logprob=-9.547529220581055, rank=9, decoded_token=None), 35681: Logprob(logprob=-10.547529220581055, rank=10, decoded_token=None), 4073: Logprob(logprob=-12.047529220581055, rank=11, decoded_token=None), 86481: Logprob(logprob=-12.297529220581055, rank=12, decoded_token=None), 603: Logprob(logprob=-12.422529220581055, rank=13, decoded_token=None), 62602: Logprob(logprob=-12.672529220581055, rank=14, decoded_token=None), 2078: Logprob(logprob=-13.422529220581055, rank=15, decoded_token=None), 97038: Logprob(logprob=-13.797529220581055, rank=16, decoded_token=None), 29292: Logprob(logprob=-13.797529220581055, rank=17, decoded_token=None), 4203: Logprob(logprob=-13.922529220581055, rank=18, decoded_token=None), 85610: Logprob(logprob=-14.047529220581055, rank=19, decoded_token=None), 12: Logprob(logprob=-14.422529220581055, rank=20, decoded_token=None)}\n",
450
+ "24448 {24448: Logprob(logprob=-0.04389546066522598, rank=1, decoded_token=None), 7250: Logprob(logprob=-3.1688954830169678, rank=2, decoded_token=None), 4821: Logprob(logprob=-8.043895721435547, rank=3, decoded_token=None), 220: Logprob(logprob=-8.293895721435547, rank=4, decoded_token=None), 32817: Logprob(logprob=-8.418895721435547, rank=5, decoded_token=None), 315: Logprob(logprob=-9.668895721435547, rank=6, decoded_token=None), 3703: Logprob(logprob=-11.918895721435547, rank=7, decoded_token=None), 13142: Logprob(logprob=-12.043895721435547, rank=8, decoded_token=None), 38180: Logprob(logprob=-12.543895721435547, rank=9, decoded_token=None), 37081: Logprob(logprob=-12.543895721435547, rank=10, decoded_token=None), 92169: Logprob(logprob=-12.668895721435547, rank=11, decoded_token=None), 9641: Logprob(logprob=-12.793895721435547, rank=12, decoded_token=None), 45287: Logprob(logprob=-12.918895721435547, rank=13, decoded_token=None), 31858: Logprob(logprob=-13.168895721435547, rank=14, decoded_token=None), 94420: Logprob(logprob=-13.418895721435547, rank=15, decoded_token=None), 4761: Logprob(logprob=-13.668895721435547, rank=16, decoded_token=None), 16150: Logprob(logprob=-13.793895721435547, rank=17, decoded_token=None), 3511: Logprob(logprob=-13.918895721435547, rank=18, decoded_token=None), 45437: Logprob(logprob=-13.918895721435547, rank=19, decoded_token=None), 320: Logprob(logprob=-14.418895721435547, rank=20, decoded_token=None)}\n"
451
+ ]
452
+ },
453
+ {
454
+ "name": "stderr",
455
+ "output_type": "stream",
456
+ "text": [
457
+ "/home/niuxy/maplecg_nfs/miniconda3/envs/vllm_waterfall/lib/python3.12/site-packages/transformers/generation/utils.py:2506: UserWarning: You are calling .generate() with the `input_ids` being on a device type different than your model's device. `input_ids` is on cuda, whereas the model is on meta. You may experience unexpected behaviors or slower generation. Please make sure that you have put `input_ids` to the correct device by calling for example input_ids = input_ids.to('meta') before running `.generate()`.\n",
458
+ " warnings.warn(\n"
459
+ ]
460
+ },
461
+ {
462
+ "name": "stdout",
463
+ "output_type": "stream",
464
+ "text": [
465
+ "315 {315: Logprob(logprob=-0.006171337328851223, rank=1, decoded_token=None), 330: Logprob(logprob=-5.131171226501465, rank=2, decoded_token=None), 364: Logprob(logprob=-8.631171226501465, rank=3, decoded_token=None), 430: Logprob(logprob=-10.131171226501465, rank=4, decoded_token=None), 922: Logprob(logprob=-11.506171226501465, rank=5, decoded_token=None), 11: Logprob(logprob=-12.131171226501465, rank=6, decoded_token=None), 499: Logprob(logprob=-12.631171226501465, rank=7, decoded_token=None), 1054: Logprob(logprob=-13.381171226501465, rank=8, decoded_token=None), 5196: Logprob(logprob=-13.881171226501465, rank=9, decoded_token=None), 374: Logprob(logprob=-14.568671226501465, rank=10, decoded_token=None), 389: Logprob(logprob=-14.943671226501465, rank=11, decoded_token=None), 14932: Logprob(logprob=-15.068671226501465, rank=12, decoded_token=None), 706: Logprob(logprob=-15.256171226501465, rank=13, decoded_token=None), 311: Logprob(logprob=-15.318671226501465, rank=14, decoded_token=None), 37260: Logprob(logprob=-15.568671226501465, rank=15, decoded_token=None), 3451: Logprob(logprob=-15.631171226501465, rank=16, decoded_token=None), 1073: Logprob(logprob=-16.13117218017578, rank=17, decoded_token=None), 9002: Logprob(logprob=-16.44367218017578, rank=18, decoded_token=None), 5084: Logprob(logprob=-16.50617218017578, rank=19, decoded_token=None), 520: Logprob(logprob=-16.56867218017578, rank=20, decoded_token=None)}\n",
466
+ "315 {315: Logprob(logprob=0.0, rank=1, decoded_token=None), 323: Logprob(logprob=-17.625, rank=2, decoded_token=None), 477: Logprob(logprob=-18.125, rank=3, decoded_token=None), 8838: Logprob(logprob=-18.125, rank=4, decoded_token=None), 5046: Logprob(logprob=-19.375, rank=5, decoded_token=None), 3659: Logprob(logprob=-20.75, rank=6, decoded_token=None), 11: Logprob(logprob=-20.875, rank=7, decoded_token=None), 2324: Logprob(logprob=-22.125, rank=8, decoded_token=None), 220: Logprob(logprob=-22.125, rank=9, decoded_token=None), 311: Logprob(logprob=-22.25, rank=10, decoded_token=None), 3083: Logprob(logprob=-22.25, rank=11, decoded_token=None), 297: Logprob(logprob=-22.25, rank=12, decoded_token=None), 1073: Logprob(logprob=-22.25, rank=13, decoded_token=None), 10440: Logprob(logprob=-22.625, rank=14, decoded_token=None), 33028: Logprob(logprob=-23.25, rank=15, decoded_token=None), 304: Logprob(logprob=-23.6875, rank=16, decoded_token=None), 60835: Logprob(logprob=-23.9375, rank=17, decoded_token=None), 44323: Logprob(logprob=-24.25, rank=18, decoded_token=None), 1161: Logprob(logprob=-24.3125, rank=19, decoded_token=None), 330: Logprob(logprob=-24.625, rank=20, decoded_token=None)}\n",
467
+ "315 {315: Logprob(logprob=-3.3854863431770355e-05, rank=1, decoded_token=None), 323: Logprob(logprob=-11.375033378601074, rank=2, decoded_token=None), 330: Logprob(logprob=-11.500033378601074, rank=3, decoded_token=None), 3967: Logprob(logprob=-12.000033378601074, rank=4, decoded_token=None), 364: Logprob(logprob=-12.500033378601074, rank=5, decoded_token=None), 430: Logprob(logprob=-14.125033378601074, rank=6, decoded_token=None), 499: Logprob(logprob=-14.375033378601074, rank=7, decoded_token=None), 220: Logprob(logprob=-14.875033378601074, rank=8, decoded_token=None), 374: Logprob(logprob=-15.625033378601074, rank=9, decoded_token=None), 11: Logprob(logprob=-15.750033378601074, rank=10, decoded_token=None), 14932: Logprob(logprob=-16.31253433227539, rank=11, decoded_token=None), 477: Logprob(logprob=-16.43753433227539, rank=12, decoded_token=None), 3629: Logprob(logprob=-16.56253433227539, rank=13, decoded_token=None), 584: Logprob(logprob=-17.12503433227539, rank=14, decoded_token=None), 2663: Logprob(logprob=-17.18753433227539, rank=15, decoded_token=None), 706: Logprob(logprob=-17.37503433227539, rank=16, decoded_token=None), 14183: Logprob(logprob=-18.00003433227539, rank=17, decoded_token=None), 1073: Logprob(logprob=-18.12503433227539, rank=18, decoded_token=None), 279: Logprob(logprob=-18.18753433227539, rank=19, decoded_token=None), 311: Logprob(logprob=-18.31253433227539, rank=20, decoded_token=None)}\n",
468
+ "315 {315: Logprob(logprob=-0.006171337328851223, rank=1, decoded_token=None), 330: Logprob(logprob=-5.131171226501465, rank=2, decoded_token=None), 364: Logprob(logprob=-8.631171226501465, rank=3, decoded_token=None), 430: Logprob(logprob=-10.131171226501465, rank=4, decoded_token=None), 922: Logprob(logprob=-11.506171226501465, rank=5, decoded_token=None), 11: Logprob(logprob=-12.131171226501465, rank=6, decoded_token=None), 499: Logprob(logprob=-12.631171226501465, rank=7, decoded_token=None), 1054: Logprob(logprob=-13.381171226501465, rank=8, decoded_token=None), 5196: Logprob(logprob=-13.881171226501465, rank=9, decoded_token=None), 374: Logprob(logprob=-14.568671226501465, rank=10, decoded_token=None), 389: Logprob(logprob=-14.943671226501465, rank=11, decoded_token=None), 14932: Logprob(logprob=-15.068671226501465, rank=12, decoded_token=None), 706: Logprob(logprob=-15.256171226501465, rank=13, decoded_token=None), 311: Logprob(logprob=-15.318671226501465, rank=14, decoded_token=None), 37260: Logprob(logprob=-15.568671226501465, rank=15, decoded_token=None), 3451: Logprob(logprob=-15.631171226501465, rank=16, decoded_token=None), 1073: Logprob(logprob=-16.13117218017578, rank=17, decoded_token=None), 9002: Logprob(logprob=-16.44367218017578, rank=18, decoded_token=None), 5084: Logprob(logprob=-16.50617218017578, rank=19, decoded_token=None), 520: Logprob(logprob=-16.56867218017578, rank=20, decoded_token=None)}\n",
469
+ "315 {315: Logprob(logprob=0.0, rank=1, decoded_token=None), 323: Logprob(logprob=-17.625, rank=2, decoded_token=None), 477: Logprob(logprob=-18.125, rank=3, decoded_token=None), 8838: Logprob(logprob=-18.125, rank=4, decoded_token=None), 5046: Logprob(logprob=-19.375, rank=5, decoded_token=None), 3659: Logprob(logprob=-20.75, rank=6, decoded_token=None), 11: Logprob(logprob=-20.875, rank=7, decoded_token=None), 2324: Logprob(logprob=-22.125, rank=8, decoded_token=None), 220: Logprob(logprob=-22.125, rank=9, decoded_token=None), 311: Logprob(logprob=-22.25, rank=10, decoded_token=None), 3083: Logprob(logprob=-22.25, rank=11, decoded_token=None), 297: Logprob(logprob=-22.25, rank=12, decoded_token=None), 1073: Logprob(logprob=-22.25, rank=13, decoded_token=None), 10440: Logprob(logprob=-22.625, rank=14, decoded_token=None), 33028: Logprob(logprob=-23.25, rank=15, decoded_token=None), 304: Logprob(logprob=-23.6875, rank=16, decoded_token=None), 60835: Logprob(logprob=-23.9375, rank=17, decoded_token=None), 44323: Logprob(logprob=-24.25, rank=18, decoded_token=None), 1161: Logprob(logprob=-24.3125, rank=19, decoded_token=None), 330: Logprob(logprob=-24.625, rank=20, decoded_token=None)}\n",
470
+ "279 {279: Logprob(logprob=-0.0002455409849062562, rank=1, decoded_token=None), 22706: Logprob(logprob=-8.875245094299316, rank=2, decoded_token=None), 19675: Logprob(logprob=-9.250245094299316, rank=3, decoded_token=None), 2324: Logprob(logprob=-12.250245094299316, rank=4, decoded_token=None), 3925: Logprob(logprob=-12.750245094299316, rank=5, decoded_token=None), 46969: Logprob(logprob=-14.250245094299316, rank=6, decoded_token=None), 8396: Logprob(logprob=-15.437745094299316, rank=7, decoded_token=None), 2854: Logprob(logprob=-15.562745094299316, rank=8, decoded_token=None), 94135: Logprob(logprob=-15.687745094299316, rank=9, decoded_token=None), 43384: Logprob(logprob=-16.062746047973633, rank=10, decoded_token=None), 11104: Logprob(logprob=-16.312746047973633, rank=11, decoded_token=None), 578: Logprob(logprob=-16.625246047973633, rank=12, decoded_token=None), 3432: Logprob(logprob=-16.687746047973633, rank=13, decoded_token=None), 1820: Logprob(logprob=-16.750246047973633, rank=14, decoded_token=None), 36017: Logprob(logprob=-17.187746047973633, rank=15, decoded_token=None), 3247: Logprob(logprob=-17.375246047973633, rank=16, decoded_token=None), 83695: Logprob(logprob=-17.437746047973633, rank=17, decoded_token=None), 11: Logprob(logprob=-17.500246047973633, rank=18, decoded_token=None), 1455: Logprob(logprob=-17.562746047973633, rank=19, decoded_token=None), 1057: Logprob(logprob=-17.625246047973633, rank=20, decoded_token=None)}\n",
471
+ "7250 {7250: Logprob(logprob=-0.002914468990638852, rank=1, decoded_token=None), 61628: Logprob(logprob=-5.8779144287109375, rank=2, decoded_token=None), 220: Logprob(logprob=-9.877914428710938, rank=3, decoded_token=None), 473: Logprob(logprob=-10.377914428710938, rank=4, decoded_token=None), 45437: Logprob(logprob=-10.752914428710938, rank=5, decoded_token=None), 80081: Logprob(logprob=-13.127914428710938, rank=6, decoded_token=None), 4761: Logprob(logprob=-13.752914428710938, rank=7, decoded_token=None), 24448: Logprob(logprob=-14.502914428710938, rank=8, decoded_token=None), 330: Logprob(logprob=-14.940414428710938, rank=9, decoded_token=None), 364: Logprob(logprob=-14.940414428710938, rank=10, decoded_token=None), 83342: Logprob(logprob=-15.377914428710938, rank=11, decoded_token=None), 4194: Logprob(logprob=-15.565414428710938, rank=12, decoded_token=None), 44273: Logprob(logprob=-15.690414428710938, rank=13, decoded_token=None), 28997: Logprob(logprob=-15.690414428710938, rank=14, decoded_token=None), 1536: Logprob(logprob=-15.877914428710938, rank=15, decoded_token=None), 256: Logprob(logprob=-16.065414428710938, rank=16, decoded_token=None), 11: Logprob(logprob=-16.190414428710938, rank=17, decoded_token=None), 507: Logprob(logprob=-16.315414428710938, rank=18, decoded_token=None), 80798: Logprob(logprob=-16.690414428710938, rank=19, decoded_token=None), 56875: Logprob(logprob=-16.815414428710938, rank=20, decoded_token=None)}\n",
472
+ "4900 {4900: Logprob(logprob=-0.0263874139636755, rank=1, decoded_token=None), 4872: Logprob(logprob=-3.6513874530792236, rank=2, decoded_token=None), 86481: Logprob(logprob=-10.401387214660645, rank=3, decoded_token=None), 220: Logprob(logprob=-11.151387214660645, rank=4, decoded_token=None), 67088: Logprob(logprob=-11.776387214660645, rank=5, decoded_token=None), 27229: Logprob(logprob=-11.776387214660645, rank=6, decoded_token=None), 4203: Logprob(logprob=-12.026387214660645, rank=7, decoded_token=None), 13: Logprob(logprob=-12.151387214660645, rank=8, decoded_token=None), 42855: Logprob(logprob=-12.401387214660645, rank=9, decoded_token=None), 79739: Logprob(logprob=-12.526387214660645, rank=10, decoded_token=None), 13621: Logprob(logprob=-12.901387214660645, rank=11, decoded_token=None), 79864: Logprob(logprob=-13.651387214660645, rank=12, decoded_token=None), 7808: Logprob(logprob=-14.151387214660645, rank=13, decoded_token=None), 47608: Logprob(logprob=-14.526387214660645, rank=14, decoded_token=None), 24544: Logprob(logprob=-14.526387214660645, rank=15, decoded_token=None), 52485: Logprob(logprob=-14.526387214660645, rank=16, decoded_token=None), 23072: Logprob(logprob=-15.276387214660645, rank=17, decoded_token=None), 11: Logprob(logprob=-15.401387214660645, rank=18, decoded_token=None), 1685: Logprob(logprob=-15.526387214660645, rank=19, decoded_token=None), 24145: Logprob(logprob=-15.838887214660645, rank=20, decoded_token=None)}\n",
473
+ "815 {815: Logprob(logprob=-0.0032160962000489235, rank=1, decoded_token=None), 13: Logprob(logprob=-6.00321626663208, rank=2, decoded_token=None), 328: Logprob(logprob=-7.37821626663208, rank=3, decoded_token=None), 6354: Logprob(logprob=-9.878215789794922, rank=4, decoded_token=None), 21861: Logprob(logprob=-10.628215789794922, rank=5, decoded_token=None), 516: Logprob(logprob=-10.878215789794922, rank=6, decoded_token=None), 662: Logprob(logprob=-12.378215789794922, rank=7, decoded_token=None), 220: Logprob(logprob=-12.503215789794922, rank=8, decoded_token=None), 497: Logprob(logprob=-13.065715789794922, rank=9, decoded_token=None), 4273: Logprob(logprob=-13.190715789794922, rank=10, decoded_token=None), 11: Logprob(logprob=-13.940715789794922, rank=11, decoded_token=None), 13575: Logprob(logprob=-13.940715789794922, rank=12, decoded_token=None), 1117: Logprob(logprob=-14.065715789794922, rank=13, decoded_token=None), 26922: Logprob(logprob=-14.253215789794922, rank=14, decoded_token=None), 12: Logprob(logprob=-14.628215789794922, rank=15, decoded_token=None), 5415: Logprob(logprob=-14.940715789794922, rank=16, decoded_token=None), 76469: Logprob(logprob=-15.128215789794922, rank=17, decoded_token=None), 24137: Logprob(logprob=-15.565715789794922, rank=18, decoded_token=None), 3238: Logprob(logprob=-15.628215789794922, rank=19, decoded_token=None), 790: Logprob(logprob=-15.628215789794922, rank=20, decoded_token=None)}\n",
474
+ "7250 {7250: Logprob(logprob=-0.002914468990638852, rank=1, decoded_token=None), 61628: Logprob(logprob=-5.8779144287109375, rank=2, decoded_token=None), 220: Logprob(logprob=-9.877914428710938, rank=3, decoded_token=None), 473: Logprob(logprob=-10.377914428710938, rank=4, decoded_token=None), 45437: Logprob(logprob=-10.752914428710938, rank=5, decoded_token=None), 80081: Logprob(logprob=-13.127914428710938, rank=6, decoded_token=None), 4761: Logprob(logprob=-13.752914428710938, rank=7, decoded_token=None), 24448: Logprob(logprob=-14.502914428710938, rank=8, decoded_token=None), 330: Logprob(logprob=-14.940414428710938, rank=9, decoded_token=None), 364: Logprob(logprob=-14.940414428710938, rank=10, decoded_token=None), 83342: Logprob(logprob=-15.377914428710938, rank=11, decoded_token=None), 4194: Logprob(logprob=-15.565414428710938, rank=12, decoded_token=None), 44273: Logprob(logprob=-15.690414428710938, rank=13, decoded_token=None), 28997: Logprob(logprob=-15.690414428710938, rank=14, decoded_token=None), 1536: Logprob(logprob=-15.877914428710938, rank=15, decoded_token=None), 256: Logprob(logprob=-16.065414428710938, rank=16, decoded_token=None), 11: Logprob(logprob=-16.190414428710938, rank=17, decoded_token=None), 507: Logprob(logprob=-16.315414428710938, rank=18, decoded_token=None), 80798: Logprob(logprob=-16.690414428710938, rank=19, decoded_token=None), 56875: Logprob(logprob=-16.815414428710938, rank=20, decoded_token=None)}\n",
475
+ "4900 {4900: Logprob(logprob=-0.0263874139636755, rank=1, decoded_token=None), 4872: Logprob(logprob=-3.6513874530792236, rank=2, decoded_token=None), 86481: Logprob(logprob=-10.401387214660645, rank=3, decoded_token=None), 220: Logprob(logprob=-11.151387214660645, rank=4, decoded_token=None), 67088: Logprob(logprob=-11.776387214660645, rank=5, decoded_token=None), 27229: Logprob(logprob=-11.776387214660645, rank=6, decoded_token=None), 4203: Logprob(logprob=-12.026387214660645, rank=7, decoded_token=None), 13: Logprob(logprob=-12.151387214660645, rank=8, decoded_token=None), 42855: Logprob(logprob=-12.401387214660645, rank=9, decoded_token=None), 79739: Logprob(logprob=-12.526387214660645, rank=10, decoded_token=None), 13621: Logprob(logprob=-12.901387214660645, rank=11, decoded_token=None), 79864: Logprob(logprob=-13.651387214660645, rank=12, decoded_token=None), 7808: Logprob(logprob=-14.151387214660645, rank=13, decoded_token=None), 47608: Logprob(logprob=-14.526387214660645, rank=14, decoded_token=None), 24544: Logprob(logprob=-14.526387214660645, rank=15, decoded_token=None), 52485: Logprob(logprob=-14.526387214660645, rank=16, decoded_token=None), 23072: Logprob(logprob=-15.276387214660645, rank=17, decoded_token=None), 11: Logprob(logprob=-15.401387214660645, rank=18, decoded_token=None), 1685: Logprob(logprob=-15.526387214660645, rank=19, decoded_token=None), 24145: Logprob(logprob=-15.838887214660645, rank=20, decoded_token=None)}\n",
476
+ "815 {815: Logprob(logprob=-0.0032160962000489235, rank=1, decoded_token=None), 13: Logprob(logprob=-6.00321626663208, rank=2, decoded_token=None), 328: Logprob(logprob=-7.37821626663208, rank=3, decoded_token=None), 6354: Logprob(logprob=-9.878215789794922, rank=4, decoded_token=None), 21861: Logprob(logprob=-10.628215789794922, rank=5, decoded_token=None), 516: Logprob(logprob=-10.878215789794922, rank=6, decoded_token=None), 662: Logprob(logprob=-12.378215789794922, rank=7, decoded_token=None), 220: Logprob(logprob=-12.503215789794922, rank=8, decoded_token=None), 497: Logprob(logprob=-13.065715789794922, rank=9, decoded_token=None), 4273: Logprob(logprob=-13.190715789794922, rank=10, decoded_token=None), 11: Logprob(logprob=-13.940715789794922, rank=11, decoded_token=None), 13575: Logprob(logprob=-13.940715789794922, rank=12, decoded_token=None), 1117: Logprob(logprob=-14.065715789794922, rank=13, decoded_token=None), 26922: Logprob(logprob=-14.253215789794922, rank=14, decoded_token=None), 12: Logprob(logprob=-14.628215789794922, rank=15, decoded_token=None), 5415: Logprob(logprob=-14.940715789794922, rank=16, decoded_token=None), 76469: Logprob(logprob=-15.128215789794922, rank=17, decoded_token=None), 24137: Logprob(logprob=-15.565715789794922, rank=18, decoded_token=None), 3238: Logprob(logprob=-15.628215789794922, rank=19, decoded_token=None), 790: Logprob(logprob=-15.628215789794922, rank=20, decoded_token=None)}\n",
477
+ "279 {279: Logprob(logprob=-0.009556027129292488, rank=1, decoded_token=None), 1148: Logprob(logprob=-4.884555816650391, rank=2, decoded_token=None), 330: Logprob(logprob=-6.259555816650391, rank=3, decoded_token=None), 364: Logprob(logprob=-10.75955581665039, rank=4, decoded_token=None), 3508: Logprob(logprob=-12.13455581665039, rank=5, decoded_token=None), 2324: Logprob(logprob=-12.13455581665039, rank=6, decoded_token=None), 7438: Logprob(logprob=-13.38455581665039, rank=7, decoded_token=None), 1054: Logprob(logprob=-14.38455581665039, rank=8, decoded_token=None), 14209: Logprob(logprob=-14.88455581665039, rank=9, decoded_token=None), 17139: Logprob(logprob=-15.00955581665039, rank=10, decoded_token=None), 9455: Logprob(logprob=-15.13455581665039, rank=11, decoded_token=None), 3249: Logprob(logprob=-15.50955581665039, rank=12, decoded_token=None), 3639: Logprob(logprob=-15.75955581665039, rank=13, decoded_token=None), 220: Logprob(logprob=-15.82205581665039, rank=14, decoded_token=None), 1268: Logprob(logprob=-15.94705581665039, rank=15, decoded_token=None), 1820: Logprob(logprob=-16.69705581665039, rank=16, decoded_token=None), 31437: Logprob(logprob=-17.19705581665039, rank=17, decoded_token=None), 578: Logprob(logprob=-17.50955581665039, rank=18, decoded_token=None), 3451: Logprob(logprob=-17.50955581665039, rank=19, decoded_token=None), 12840: Logprob(logprob=-17.50955581665039, rank=20, decoded_token=None)}\n",
478
+ "2324 {2324: Logprob(logprob=0.0, rank=1, decoded_token=None), 9601: Logprob(logprob=-17.25, rank=2, decoded_token=None), 14789: Logprob(logprob=-19.25, rank=3, decoded_token=None), 14209: Logprob(logprob=-19.75, rank=4, decoded_token=None), 330: Logprob(logprob=-21.125, rank=5, decoded_token=None), 26928: Logprob(logprob=-21.25, rank=6, decoded_token=None), 83900: Logprob(logprob=-21.75, rank=7, decoded_token=None), 364: Logprob(logprob=-21.75, rank=8, decoded_token=None), 220: Logprob(logprob=-22.25, rank=9, decoded_token=None), 3823: Logprob(logprob=-22.625, rank=10, decoded_token=None), 61094: Logprob(logprob=-22.75, rank=11, decoded_token=None), 10345: Logprob(logprob=-22.875, rank=12, decoded_token=None), 73591: Logprob(logprob=-23.625, rank=13, decoded_token=None), 3974: Logprob(logprob=-23.875, rank=14, decoded_token=None), 279: Logprob(logprob=-24.25, rank=15, decoded_token=None), 49785: Logprob(logprob=-24.625, rank=16, decoded_token=None), 26833: Logprob(logprob=-25.625, rank=17, decoded_token=None), 25994: Logprob(logprob=-25.75, rank=18, decoded_token=None), 107749: Logprob(logprob=-26.375, rank=19, decoded_token=None), 61961: Logprob(logprob=-26.625, rank=20, decoded_token=None)}\n",
479
+ "279 {279: Logprob(logprob=-0.01450834795832634, rank=1, decoded_token=None), 330: Logprob(logprob=-4.389508247375488, rank=2, decoded_token=None), 7438: Logprob(logprob=-7.514508247375488, rank=3, decoded_token=None), 2324: Logprob(logprob=-7.889508247375488, rank=4, decoded_token=None), 364: Logprob(logprob=-7.889508247375488, rank=5, decoded_token=None), 264: Logprob(logprob=-8.014508247375488, rank=6, decoded_token=None), 9455: Logprob(logprob=-8.014508247375488, rank=7, decoded_token=None), 1148: Logprob(logprob=-10.764508247375488, rank=8, decoded_token=None), 1054: Logprob(logprob=-12.389508247375488, rank=9, decoded_token=None), 459: Logprob(logprob=-12.889508247375488, rank=10, decoded_token=None), 26679: Logprob(logprob=-13.139508247375488, rank=11, decoded_token=None), 220: Logprob(logprob=-13.202008247375488, rank=12, decoded_token=None), 7580: Logprob(logprob=-13.264508247375488, rank=13, decoded_token=None), 14209: Logprob(logprob=-13.702008247375488, rank=14, decoded_token=None), 11125: Logprob(logprob=-14.139508247375488, rank=15, decoded_token=None), 27409: Logprob(logprob=-14.452008247375488, rank=16, decoded_token=None), 3451: Logprob(logprob=-14.639508247375488, rank=17, decoded_token=None), 323: Logprob(logprob=-14.639508247375488, rank=18, decoded_token=None), 15389: Logprob(logprob=-14.639508247375488, rank=19, decoded_token=None), 42687: Logprob(logprob=-14.764508247375488, rank=20, decoded_token=None)}\n",
480
+ "279 {279: Logprob(logprob=-0.009556027129292488, rank=1, decoded_token=None), 1148: Logprob(logprob=-4.884555816650391, rank=2, decoded_token=None), 330: Logprob(logprob=-6.259555816650391, rank=3, decoded_token=None), 364: Logprob(logprob=-10.75955581665039, rank=4, decoded_token=None), 3508: Logprob(logprob=-12.13455581665039, rank=5, decoded_token=None), 2324: Logprob(logprob=-12.13455581665039, rank=6, decoded_token=None), 7438: Logprob(logprob=-13.38455581665039, rank=7, decoded_token=None), 1054: Logprob(logprob=-14.38455581665039, rank=8, decoded_token=None), 14209: Logprob(logprob=-14.88455581665039, rank=9, decoded_token=None), 17139: Logprob(logprob=-15.00955581665039, rank=10, decoded_token=None), 9455: Logprob(logprob=-15.13455581665039, rank=11, decoded_token=None), 3249: Logprob(logprob=-15.50955581665039, rank=12, decoded_token=None), 3639: Logprob(logprob=-15.75955581665039, rank=13, decoded_token=None), 220: Logprob(logprob=-15.82205581665039, rank=14, decoded_token=None), 1268: Logprob(logprob=-15.94705581665039, rank=15, decoded_token=None), 1820: Logprob(logprob=-16.69705581665039, rank=16, decoded_token=None), 31437: Logprob(logprob=-17.19705581665039, rank=17, decoded_token=None), 578: Logprob(logprob=-17.50955581665039, rank=18, decoded_token=None), 3451: Logprob(logprob=-17.50955581665039, rank=19, decoded_token=None), 12840: Logprob(logprob=-17.50955581665039, rank=20, decoded_token=None)}\n",
481
+ "2324 {2324: Logprob(logprob=0.0, rank=1, decoded_token=None), 9601: Logprob(logprob=-17.25, rank=2, decoded_token=None), 14789: Logprob(logprob=-19.25, rank=3, decoded_token=None), 14209: Logprob(logprob=-19.75, rank=4, decoded_token=None), 330: Logprob(logprob=-21.125, rank=5, decoded_token=None), 26928: Logprob(logprob=-21.25, rank=6, decoded_token=None), 83900: Logprob(logprob=-21.75, rank=7, decoded_token=None), 364: Logprob(logprob=-21.75, rank=8, decoded_token=None), 220: Logprob(logprob=-22.25, rank=9, decoded_token=None), 3823: Logprob(logprob=-22.625, rank=10, decoded_token=None), 61094: Logprob(logprob=-22.75, rank=11, decoded_token=None), 10345: Logprob(logprob=-22.875, rank=12, decoded_token=None), 73591: Logprob(logprob=-23.625, rank=13, decoded_token=None), 3974: Logprob(logprob=-23.875, rank=14, decoded_token=None), 279: Logprob(logprob=-24.25, rank=15, decoded_token=None), 49785: Logprob(logprob=-24.625, rank=16, decoded_token=None), 26833: Logprob(logprob=-25.625, rank=17, decoded_token=None), 25994: Logprob(logprob=-25.75, rank=18, decoded_token=None), 107749: Logprob(logprob=-26.375, rank=19, decoded_token=None), 61961: Logprob(logprob=-26.625, rank=20, decoded_token=None)}\n",
482
+ "1455 {1455: Logprob(logprob=-0.009604200720787048, rank=1, decoded_token=None), 24417: Logprob(logprob=-5.009603977203369, rank=2, decoded_token=None), 8706: Logprob(logprob=-6.509603977203369, rank=3, decoded_token=None), 12474: Logprob(logprob=-6.759603977203369, rank=4, decoded_token=None), 1917: Logprob(logprob=-9.509604454040527, rank=5, decoded_token=None), 7928: Logprob(logprob=-10.509604454040527, rank=6, decoded_token=None), 51621: Logprob(logprob=-10.697104454040527, rank=7, decoded_token=None), 17139: Logprob(logprob=-10.884604454040527, rank=8, decoded_token=None), 22807: Logprob(logprob=-10.947104454040527, rank=9, decoded_token=None), 35825: Logprob(logprob=-11.259604454040527, rank=10, decoded_token=None), 3646: Logprob(logprob=-11.697104454040527, rank=11, decoded_token=None), 60406: Logprob(logprob=-11.759604454040527, rank=12, decoded_token=None), 15861: Logprob(logprob=-11.759604454040527, rank=13, decoded_token=None), 4325: Logprob(logprob=-12.072104454040527, rank=14, decoded_token=None), 2324: Logprob(logprob=-12.134604454040527, rank=15, decoded_token=None), 37554: Logprob(logprob=-12.572104454040527, rank=16, decoded_token=None), 7648: Logprob(logprob=-12.822104454040527, rank=17, decoded_token=None), 30758: Logprob(logprob=-12.884604454040527, rank=18, decoded_token=None), 67739: Logprob(logprob=-13.384604454040527, rank=19, decoded_token=None), 28254: Logprob(logprob=-13.822104454040527, rank=20, decoded_token=None)}\n",
483
+ "11 {11: Logprob(logprob=-0.2046964168548584, rank=1, decoded_token=None), 574: Logprob(logprob=-1.7046964168548584, rank=2, decoded_token=None), 279: Logprob(logprob=-6.3296966552734375, rank=3, decoded_token=None), 596: Logprob(logprob=-6.9546966552734375, rank=4, decoded_token=None), 16014: Logprob(logprob=-7.9546966552734375, rank=5, decoded_token=None), 320: Logprob(logprob=-9.704696655273438, rank=6, decoded_token=None), 220: Logprob(logprob=-9.954696655273438, rank=7, decoded_token=None), 374: Logprob(logprob=-10.329696655273438, rank=8, decoded_token=None), 8105: Logprob(logprob=-10.704696655273438, rank=9, decoded_token=None), 34688: Logprob(logprob=-11.954696655273438, rank=10, decoded_token=None), 1174: Logprob(logprob=-12.204696655273438, rank=11, decoded_token=None), 256: Logprob(logprob=-12.954696655273438, rank=12, decoded_token=None), 63738: Logprob(logprob=-13.079696655273438, rank=13, decoded_token=None), 9405: Logprob(logprob=-13.329696655273438, rank=14, decoded_token=None), 31870: Logprob(logprob=-13.454696655273438, rank=15, decoded_token=None), 13: Logprob(logprob=-13.704696655273438, rank=16, decoded_token=None), 482: Logprob(logprob=-14.142196655273438, rank=17, decoded_token=None), 14767: Logprob(logprob=-14.204696655273438, rank=18, decoded_token=None), 26: Logprob(logprob=-14.454696655273438, rank=19, decoded_token=None), 262: Logprob(logprob=-14.579696655273438, rank=20, decoded_token=None)}\n",
484
+ "24448 {24448: Logprob(logprob=-0.009981834329664707, rank=1, decoded_token=None), 7250: Logprob(logprob=-5.259981632232666, rank=2, decoded_token=None), 11: Logprob(logprob=-6.259981632232666, rank=3, decoded_token=None), 220: Logprob(logprob=-6.509981632232666, rank=4, decoded_token=None), 4821: Logprob(logprob=-7.134981632232666, rank=5, decoded_token=None), 32817: Logprob(logprob=-7.634981632232666, rank=6, decoded_token=None), 3703: Logprob(logprob=-11.134982109069824, rank=7, decoded_token=None), 31858: Logprob(logprob=-11.634982109069824, rank=8, decoded_token=None), 364: Logprob(logprob=-11.759982109069824, rank=9, decoded_token=None), 94420: Logprob(logprob=-12.009982109069824, rank=10, decoded_token=None), 45287: Logprob(logprob=-12.634982109069824, rank=11, decoded_token=None), 482: Logprob(logprob=-13.009982109069824, rank=12, decoded_token=None), 92169: Logprob(logprob=-13.259982109069824, rank=13, decoded_token=None), 256: Logprob(logprob=-13.259982109069824, rank=14, decoded_token=None), 3511: Logprob(logprob=-13.384982109069824, rank=15, decoded_token=None), 320: Logprob(logprob=-13.509982109069824, rank=16, decoded_token=None), 323: Logprob(logprob=-13.759982109069824, rank=17, decoded_token=None), 9641: Logprob(logprob=-14.009982109069824, rank=18, decoded_token=None), 16150: Logprob(logprob=-14.009982109069824, rank=19, decoded_token=None), 330: Logprob(logprob=-14.259982109069824, rank=20, decoded_token=None)}\n",
485
+ "13 {13: Logprob(logprob=-0.06436779350042343, rank=1, decoded_token=None), 4900: Logprob(logprob=-2.8143677711486816, rank=2, decoded_token=None), 4872: Logprob(logprob=-6.064367771148682, rank=3, decoded_token=None), 27229: Logprob(logprob=-11.31436824798584, rank=4, decoded_token=None), 79739: Logprob(logprob=-11.43936824798584, rank=5, decoded_token=None), 1087: Logprob(logprob=-11.43936824798584, rank=6, decoded_token=None), 86481: Logprob(logprob=-11.56436824798584, rank=7, decoded_token=None), 885: Logprob(logprob=-12.06436824798584, rank=8, decoded_token=None), 11: Logprob(logprob=-12.18936824798584, rank=9, decoded_token=None), 42855: Logprob(logprob=-12.68936824798584, rank=10, decoded_token=None), 220: Logprob(logprob=-12.93936824798584, rank=11, decoded_token=None), 47608: Logprob(logprob=-13.31436824798584, rank=12, decoded_token=None), 67088: Logprob(logprob=-13.31436824798584, rank=13, decoded_token=None), 2637: Logprob(logprob=-13.43936824798584, rank=14, decoded_token=None), 79864: Logprob(logprob=-13.56436824798584, rank=15, decoded_token=None), 4203: Logprob(logprob=-13.68936824798584, rank=16, decoded_token=None), 52485: Logprob(logprob=-13.75186824798584, rank=17, decoded_token=None), 13621: Logprob(logprob=-14.12686824798584, rank=18, decoded_token=None), 497: Logprob(logprob=-14.25186824798584, rank=19, decoded_token=None), 12898: Logprob(logprob=-15.06436824798584, rank=20, decoded_token=None)}\n",
486
+ "11 {11: Logprob(logprob=-0.2046964168548584, rank=1, decoded_token=None), 574: Logprob(logprob=-1.7046964168548584, rank=2, decoded_token=None), 279: Logprob(logprob=-6.3296966552734375, rank=3, decoded_token=None), 596: Logprob(logprob=-6.9546966552734375, rank=4, decoded_token=None), 16014: Logprob(logprob=-7.9546966552734375, rank=5, decoded_token=None), 320: Logprob(logprob=-9.704696655273438, rank=6, decoded_token=None), 220: Logprob(logprob=-9.954696655273438, rank=7, decoded_token=None), 374: Logprob(logprob=-10.329696655273438, rank=8, decoded_token=None), 8105: Logprob(logprob=-10.704696655273438, rank=9, decoded_token=None), 34688: Logprob(logprob=-11.954696655273438, rank=10, decoded_token=None), 1174: Logprob(logprob=-12.204696655273438, rank=11, decoded_token=None), 256: Logprob(logprob=-12.954696655273438, rank=12, decoded_token=None), 63738: Logprob(logprob=-13.079696655273438, rank=13, decoded_token=None), 9405: Logprob(logprob=-13.329696655273438, rank=14, decoded_token=None), 31870: Logprob(logprob=-13.454696655273438, rank=15, decoded_token=None), 13: Logprob(logprob=-13.704696655273438, rank=16, decoded_token=None), 482: Logprob(logprob=-14.142196655273438, rank=17, decoded_token=None), 14767: Logprob(logprob=-14.204696655273438, rank=18, decoded_token=None), 26: Logprob(logprob=-14.454696655273438, rank=19, decoded_token=None), 262: Logprob(logprob=-14.579696655273438, rank=20, decoded_token=None)}\n",
487
+ "24448 {24448: Logprob(logprob=-0.009981834329664707, rank=1, decoded_token=None), 7250: Logprob(logprob=-5.259981632232666, rank=2, decoded_token=None), 11: Logprob(logprob=-6.259981632232666, rank=3, decoded_token=None), 220: Logprob(logprob=-6.509981632232666, rank=4, decoded_token=None), 4821: Logprob(logprob=-7.134981632232666, rank=5, decoded_token=None), 32817: Logprob(logprob=-7.634981632232666, rank=6, decoded_token=None), 3703: Logprob(logprob=-11.134982109069824, rank=7, decoded_token=None), 31858: Logprob(logprob=-11.634982109069824, rank=8, decoded_token=None), 364: Logprob(logprob=-11.759982109069824, rank=9, decoded_token=None), 94420: Logprob(logprob=-12.009982109069824, rank=10, decoded_token=None), 45287: Logprob(logprob=-12.634982109069824, rank=11, decoded_token=None), 482: Logprob(logprob=-13.009982109069824, rank=12, decoded_token=None), 92169: Logprob(logprob=-13.259982109069824, rank=13, decoded_token=None), 256: Logprob(logprob=-13.259982109069824, rank=14, decoded_token=None), 3511: Logprob(logprob=-13.384982109069824, rank=15, decoded_token=None), 320: Logprob(logprob=-13.509982109069824, rank=16, decoded_token=None), 323: Logprob(logprob=-13.759982109069824, rank=17, decoded_token=None), 9641: Logprob(logprob=-14.009982109069824, rank=18, decoded_token=None), 16150: Logprob(logprob=-14.009982109069824, rank=19, decoded_token=None), 330: Logprob(logprob=-14.259982109069824, rank=20, decoded_token=None)}\n",
488
+ "13 {13: Logprob(logprob=-0.06436779350042343, rank=1, decoded_token=None), 4900: Logprob(logprob=-2.8143677711486816, rank=2, decoded_token=None), 4872: Logprob(logprob=-6.064367771148682, rank=3, decoded_token=None), 27229: Logprob(logprob=-11.31436824798584, rank=4, decoded_token=None), 79739: Logprob(logprob=-11.43936824798584, rank=5, decoded_token=None), 1087: Logprob(logprob=-11.43936824798584, rank=6, decoded_token=None), 86481: Logprob(logprob=-11.56436824798584, rank=7, decoded_token=None), 885: Logprob(logprob=-12.06436824798584, rank=8, decoded_token=None), 11: Logprob(logprob=-12.18936824798584, rank=9, decoded_token=None), 42855: Logprob(logprob=-12.68936824798584, rank=10, decoded_token=None), 220: Logprob(logprob=-12.93936824798584, rank=11, decoded_token=None), 47608: Logprob(logprob=-13.31436824798584, rank=12, decoded_token=None), 67088: Logprob(logprob=-13.31436824798584, rank=13, decoded_token=None), 2637: Logprob(logprob=-13.43936824798584, rank=14, decoded_token=None), 79864: Logprob(logprob=-13.56436824798584, rank=15, decoded_token=None), 4203: Logprob(logprob=-13.68936824798584, rank=16, decoded_token=None), 52485: Logprob(logprob=-13.75186824798584, rank=17, decoded_token=None), 13621: Logprob(logprob=-14.12686824798584, rank=18, decoded_token=None), 497: Logprob(logprob=-14.25186824798584, rank=19, decoded_token=None), 12898: Logprob(logprob=-15.06436824798584, rank=20, decoded_token=None)}\n",
489
+ "7438 {7438: Logprob(logprob=-0.00019298121333122253, rank=1, decoded_token=None), 330: Logprob(logprob=-8.750192642211914, rank=2, decoded_token=None), 17139: Logprob(logprob=-11.125192642211914, rank=3, decoded_token=None), 7138: Logprob(logprob=-11.250192642211914, rank=4, decoded_token=None), 57865: Logprob(logprob=-13.375192642211914, rank=5, decoded_token=None), 364: Logprob(logprob=-13.375192642211914, rank=6, decoded_token=None), 14209: Logprob(logprob=-13.500192642211914, rank=7, decoded_token=None), 3152: Logprob(logprob=-14.250192642211914, rank=8, decoded_token=None), 49203: Logprob(logprob=-14.375192642211914, rank=9, decoded_token=None), 50800: Logprob(logprob=-15.250192642211914, rank=10, decoded_token=None), 1054: Logprob(logprob=-15.375192642211914, rank=11, decoded_token=None), 6371: Logprob(logprob=-15.750192642211914, rank=12, decoded_token=None), 26431: Logprob(logprob=-16.000192642211914, rank=13, decoded_token=None), 4325: Logprob(logprob=-16.125192642211914, rank=14, decoded_token=None), 23222: Logprob(logprob=-16.125192642211914, rank=15, decoded_token=None), 17051: Logprob(logprob=-16.500192642211914, rank=16, decoded_token=None), 7580: Logprob(logprob=-16.625192642211914, rank=17, decoded_token=None), 84096: Logprob(logprob=-17.312692642211914, rank=18, decoded_token=None), 7419: Logprob(logprob=-17.750192642211914, rank=19, decoded_token=None), 38088: Logprob(logprob=-17.937692642211914, rank=20, decoded_token=None)}\n",
490
+ "374 {374: Logprob(logprob=-0.006966823246330023, rank=1, decoded_token=None), 706: Logprob(logprob=-5.006966590881348, rank=2, decoded_token=None), 11: Logprob(logprob=-9.006966590881348, rank=3, decoded_token=None), 649: Logprob(logprob=-9.506966590881348, rank=4, decoded_token=None), 0: Logprob(logprob=-10.506966590881348, rank=5, decoded_token=None), 13: Logprob(logprob=-12.006966590881348, rank=6, decoded_token=None), 220: Logprob(logprob=-12.131966590881348, rank=7, decoded_token=None), 8625: Logprob(logprob=-12.506966590881348, rank=8, decoded_token=None), 482: Logprob(logprob=-12.756966590881348, rank=9, decoded_token=None), 6: Logprob(logprob=-12.881966590881348, rank=10, decoded_token=None), 19813: Logprob(logprob=-13.881966590881348, rank=11, decoded_token=None), 320: Logprob(logprob=-14.006966590881348, rank=12, decoded_token=None), 574: Logprob(logprob=-14.381966590881348, rank=13, decoded_token=None), 35327: Logprob(logprob=-14.506966590881348, rank=14, decoded_token=None), 1389: Logprob(logprob=-14.569466590881348, rank=15, decoded_token=None), 1253: Logprob(logprob=-14.631966590881348, rank=16, decoded_token=None), 2643: Logprob(logprob=-15.006966590881348, rank=17, decoded_token=None), 3488: Logprob(logprob=-15.069466590881348, rank=18, decoded_token=None), 1: Logprob(logprob=-15.256966590881348, rank=19, decoded_token=None), 285: Logprob(logprob=-15.569466590881348, rank=20, decoded_token=None)}\n",
491
+ "330 {330: Logprob(logprob=-1.0593980550765991, rank=2, decoded_token=None), 7438: Logprob(logprob=-0.43439802527427673, rank=1, decoded_token=None), 364: Logprob(logprob=-5.184398174285889, rank=3, decoded_token=None), 1054: Logprob(logprob=-9.93439769744873, rank=4, decoded_token=None), 17139: Logprob(logprob=-12.05939769744873, rank=5, decoded_token=None), 3436: Logprob(logprob=-12.05939769744873, rank=6, decoded_token=None), 7580: Logprob(logprob=-12.30939769744873, rank=7, decoded_token=None), 3451: Logprob(logprob=-12.30939769744873, rank=8, decoded_token=None), 49203: Logprob(logprob=-13.05939769744873, rank=9, decoded_token=None), 57865: Logprob(logprob=-13.68439769744873, rank=10, decoded_token=None), 3152: Logprob(logprob=-13.68439769744873, rank=11, decoded_token=None), 23222: Logprob(logprob=-13.80939769744873, rank=12, decoded_token=None), 1595: Logprob(logprob=-13.80939769744873, rank=13, decoded_token=None), 2778: Logprob(logprob=-14.30939769744873, rank=14, decoded_token=None), 10103: Logprob(logprob=-14.55939769744873, rank=15, decoded_token=None), 7326: Logprob(logprob=-15.55939769744873, rank=16, decoded_token=None), 50800: Logprob(logprob=-15.68439769744873, rank=17, decoded_token=None), 7138: Logprob(logprob=-15.80939769744873, rank=18, decoded_token=None), 220: Logprob(logprob=-16.059398651123047, rank=19, decoded_token=None), 2846: Logprob(logprob=-16.434398651123047, rank=20, decoded_token=None)}\n",
492
+ "7438 {7438: Logprob(logprob=-0.00019298121333122253, rank=1, decoded_token=None), 330: Logprob(logprob=-8.750192642211914, rank=2, decoded_token=None), 17139: Logprob(logprob=-11.125192642211914, rank=3, decoded_token=None), 7138: Logprob(logprob=-11.250192642211914, rank=4, decoded_token=None), 57865: Logprob(logprob=-13.375192642211914, rank=5, decoded_token=None), 364: Logprob(logprob=-13.375192642211914, rank=6, decoded_token=None), 14209: Logprob(logprob=-13.500192642211914, rank=7, decoded_token=None), 3152: Logprob(logprob=-14.250192642211914, rank=8, decoded_token=None), 49203: Logprob(logprob=-14.375192642211914, rank=9, decoded_token=None), 50800: Logprob(logprob=-15.250192642211914, rank=10, decoded_token=None), 1054: Logprob(logprob=-15.375192642211914, rank=11, decoded_token=None), 6371: Logprob(logprob=-15.750192642211914, rank=12, decoded_token=None), 26431: Logprob(logprob=-16.000192642211914, rank=13, decoded_token=None), 4325: Logprob(logprob=-16.125192642211914, rank=14, decoded_token=None), 23222: Logprob(logprob=-16.125192642211914, rank=15, decoded_token=None), 17051: Logprob(logprob=-16.500192642211914, rank=16, decoded_token=None), 7580: Logprob(logprob=-16.625192642211914, rank=17, decoded_token=None), 84096: Logprob(logprob=-17.312692642211914, rank=18, decoded_token=None), 7419: Logprob(logprob=-17.750192642211914, rank=19, decoded_token=None), 38088: Logprob(logprob=-17.937692642211914, rank=20, decoded_token=None)}\n",
493
+ "374 {374: Logprob(logprob=-0.006966823246330023, rank=1, decoded_token=None), 706: Logprob(logprob=-5.006966590881348, rank=2, decoded_token=None), 11: Logprob(logprob=-9.006966590881348, rank=3, decoded_token=None), 649: Logprob(logprob=-9.506966590881348, rank=4, decoded_token=None), 0: Logprob(logprob=-10.506966590881348, rank=5, decoded_token=None), 13: Logprob(logprob=-12.006966590881348, rank=6, decoded_token=None), 220: Logprob(logprob=-12.131966590881348, rank=7, decoded_token=None), 8625: Logprob(logprob=-12.506966590881348, rank=8, decoded_token=None), 482: Logprob(logprob=-12.756966590881348, rank=9, decoded_token=None), 6: Logprob(logprob=-12.881966590881348, rank=10, decoded_token=None), 19813: Logprob(logprob=-13.881966590881348, rank=11, decoded_token=None), 320: Logprob(logprob=-14.006966590881348, rank=12, decoded_token=None), 574: Logprob(logprob=-14.381966590881348, rank=13, decoded_token=None), 35327: Logprob(logprob=-14.506966590881348, rank=14, decoded_token=None), 1389: Logprob(logprob=-14.569466590881348, rank=15, decoded_token=None), 1253: Logprob(logprob=-14.631966590881348, rank=16, decoded_token=None), 2643: Logprob(logprob=-15.006966590881348, rank=17, decoded_token=None), 3488: Logprob(logprob=-15.069466590881348, rank=18, decoded_token=None), 1: Logprob(logprob=-15.256966590881348, rank=19, decoded_token=None), 285: Logprob(logprob=-15.569466590881348, rank=20, decoded_token=None)}\n",
494
+ "28254 {28254: Logprob(logprob=-0.03447406738996506, rank=1, decoded_token=None), 52876: Logprob(logprob=-3.9094741344451904, rank=2, decoded_token=None), 6485: Logprob(logprob=-5.284473896026611, rank=3, decoded_token=None), 16188: Logprob(logprob=-5.284473896026611, rank=4, decoded_token=None), 66278: Logprob(logprob=-6.534473896026611, rank=5, decoded_token=None), 41765: Logprob(logprob=-7.409473896026611, rank=6, decoded_token=None), 59674: Logprob(logprob=-7.909473896026611, rank=7, decoded_token=None), 14154: Logprob(logprob=-8.34697437286377, rank=8, decoded_token=None), 67739: Logprob(logprob=-8.84697437286377, rank=9, decoded_token=None), 58105: Logprob(logprob=-8.84697437286377, rank=10, decoded_token=None), 41903: Logprob(logprob=-8.97197437286377, rank=11, decoded_token=None), 4691: Logprob(logprob=-9.15947437286377, rank=12, decoded_token=None), 5199: Logprob(logprob=-9.78447437286377, rank=13, decoded_token=None), 4325: Logprob(logprob=-9.97197437286377, rank=14, decoded_token=None), 48883: Logprob(logprob=-10.22197437286377, rank=15, decoded_token=None), 57697: Logprob(logprob=-10.34697437286377, rank=16, decoded_token=None), 74252: Logprob(logprob=-10.47197437286377, rank=17, decoded_token=None), 22872: Logprob(logprob=-10.53447437286377, rank=18, decoded_token=None), 66684: Logprob(logprob=-10.65947437286377, rank=19, decoded_token=None), 57216: Logprob(logprob=-10.72197437286377, rank=20, decoded_token=None)}\n",
495
+ "279 {279: Logprob(logprob=-0.0008725888328626752, rank=1, decoded_token=None), 220: Logprob(logprob=-7.125872611999512, rank=2, decoded_token=None), 4846: Logprob(logprob=-10.125872611999512, rank=3, decoded_token=None), 889: Logprob(logprob=-11.875872611999512, rank=4, decoded_token=None), 1101: Logprob(logprob=-12.375872611999512, rank=5, decoded_token=None), 578: Logprob(logprob=-12.625872611999512, rank=6, decoded_token=None), 264: Logprob(logprob=-13.000872611999512, rank=7, decoded_token=None), 574: Logprob(logprob=-13.125872611999512, rank=8, decoded_token=None), 256: Logprob(logprob=-13.125872611999512, rank=9, decoded_token=None), 5270: Logprob(logprob=-13.250872611999512, rank=10, decoded_token=None), 320: Logprob(logprob=-13.750872611999512, rank=11, decoded_token=None), 459: Logprob(logprob=-14.125872611999512, rank=12, decoded_token=None), 364: Logprob(logprob=-14.125872611999512, rank=13, decoded_token=None), 1694: Logprob(logprob=-14.750872611999512, rank=14, decoded_token=None), 9405: Logprob(logprob=-15.250872611999512, rank=15, decoded_token=None), 720: Logprob(logprob=-15.313372611999512, rank=16, decoded_token=None), 34833: Logprob(logprob=-15.438372611999512, rank=17, decoded_token=None), 3778: Logprob(logprob=-15.438372611999512, rank=18, decoded_token=None), 813: Logprob(logprob=-15.563372611999512, rank=19, decoded_token=None), 33600: Logprob(logprob=-15.625872611999512, rank=20, decoded_token=None)}\n",
496
+ "9405 {9405: Logprob(logprob=-6.890059739816934e-05, rank=1, decoded_token=None), 220: Logprob(logprob=-10.125068664550781, rank=2, decoded_token=None), 38916: Logprob(logprob=-11.375068664550781, rank=3, decoded_token=None), 13118: Logprob(logprob=-12.500068664550781, rank=4, decoded_token=None), 279: Logprob(logprob=-12.625068664550781, rank=5, decoded_token=None), 7342: Logprob(logprob=-13.125068664550781, rank=6, decoded_token=None), 18307: Logprob(logprob=-13.750068664550781, rank=7, decoded_token=None), 256: Logprob(logprob=-13.875068664550781, rank=8, decoded_token=None), 11: Logprob(logprob=-14.000068664550781, rank=9, decoded_token=None), 16381: Logprob(logprob=-14.125068664550781, rank=10, decoded_token=None), 264: Logprob(logprob=-14.250068664550781, rank=11, decoded_token=None), 459: Logprob(logprob=-14.375068664550781, rank=12, decoded_token=None), 3604: Logprob(logprob=-14.625068664550781, rank=13, decoded_token=None), 40260: Logprob(logprob=-14.625068664550781, rank=14, decoded_token=None), 19073: Logprob(logprob=-14.750068664550781, rank=15, decoded_token=None), 65162: Logprob(logprob=-15.187568664550781, rank=16, decoded_token=None), 18665: Logprob(logprob=-15.750068664550781, rank=17, decoded_token=None), 16689: Logprob(logprob=-16.00006866455078, rank=18, decoded_token=None), 539: Logprob(logprob=-16.18756866455078, rank=19, decoded_token=None), 4872: Logprob(logprob=-16.25006866455078, rank=20, decoded_token=None)}\n",
497
+ "7250 {7250: Logprob(logprob=-0.000730128725990653, rank=1, decoded_token=None), 61628: Logprob(logprob=-7.625730037689209, rank=2, decoded_token=None), 473: Logprob(logprob=-8.625730514526367, rank=3, decoded_token=None), 220: Logprob(logprob=-10.000730514526367, rank=4, decoded_token=None), 45437: Logprob(logprob=-11.500730514526367, rank=5, decoded_token=None), 4761: Logprob(logprob=-12.625730514526367, rank=6, decoded_token=None), 80081: Logprob(logprob=-13.625730514526367, rank=7, decoded_token=None), 44273: Logprob(logprob=-14.938230514526367, rank=8, decoded_token=None), 83342: Logprob(logprob=-15.063230514526367, rank=9, decoded_token=None), 364: Logprob(logprob=-15.063230514526367, rank=10, decoded_token=None), 24448: Logprob(logprob=-15.500730514526367, rank=11, decoded_token=None), 574: Logprob(logprob=-15.563230514526367, rank=12, decoded_token=None), 28997: Logprob(logprob=-15.563230514526367, rank=13, decoded_token=None), 507: Logprob(logprob=-15.563230514526367, rank=14, decoded_token=None), 330: Logprob(logprob=-15.625730514526367, rank=15, decoded_token=None), 1536: Logprob(logprob=-15.750730514526367, rank=16, decoded_token=None), 323: Logprob(logprob=-16.375730514526367, rank=17, decoded_token=None), 596: Logprob(logprob=-16.563230514526367, rank=18, decoded_token=None), 256: Logprob(logprob=-16.625730514526367, rank=19, decoded_token=None), 80798: Logprob(logprob=-16.813230514526367, rank=20, decoded_token=None)}\n",
498
+ "279 {279: Logprob(logprob=-0.0008725888328626752, rank=1, decoded_token=None), 220: Logprob(logprob=-7.125872611999512, rank=2, decoded_token=None), 4846: Logprob(logprob=-10.125872611999512, rank=3, decoded_token=None), 889: Logprob(logprob=-11.875872611999512, rank=4, decoded_token=None), 1101: Logprob(logprob=-12.375872611999512, rank=5, decoded_token=None), 578: Logprob(logprob=-12.625872611999512, rank=6, decoded_token=None), 264: Logprob(logprob=-13.000872611999512, rank=7, decoded_token=None), 574: Logprob(logprob=-13.125872611999512, rank=8, decoded_token=None), 256: Logprob(logprob=-13.125872611999512, rank=9, decoded_token=None), 5270: Logprob(logprob=-13.250872611999512, rank=10, decoded_token=None), 320: Logprob(logprob=-13.750872611999512, rank=11, decoded_token=None), 459: Logprob(logprob=-14.125872611999512, rank=12, decoded_token=None), 364: Logprob(logprob=-14.125872611999512, rank=13, decoded_token=None), 1694: Logprob(logprob=-14.750872611999512, rank=14, decoded_token=None), 9405: Logprob(logprob=-15.250872611999512, rank=15, decoded_token=None), 720: Logprob(logprob=-15.313372611999512, rank=16, decoded_token=None), 34833: Logprob(logprob=-15.438372611999512, rank=17, decoded_token=None), 3778: Logprob(logprob=-15.438372611999512, rank=18, decoded_token=None), 813: Logprob(logprob=-15.563372611999512, rank=19, decoded_token=None), 33600: Logprob(logprob=-15.625872611999512, rank=20, decoded_token=None)}\n",
499
+ "9405 {9405: Logprob(logprob=-6.890059739816934e-05, rank=1, decoded_token=None), 220: Logprob(logprob=-10.125068664550781, rank=2, decoded_token=None), 38916: Logprob(logprob=-11.375068664550781, rank=3, decoded_token=None), 13118: Logprob(logprob=-12.500068664550781, rank=4, decoded_token=None), 279: Logprob(logprob=-12.625068664550781, rank=5, decoded_token=None), 7342: Logprob(logprob=-13.125068664550781, rank=6, decoded_token=None), 18307: Logprob(logprob=-13.750068664550781, rank=7, decoded_token=None), 256: Logprob(logprob=-13.875068664550781, rank=8, decoded_token=None), 11: Logprob(logprob=-14.000068664550781, rank=9, decoded_token=None), 16381: Logprob(logprob=-14.125068664550781, rank=10, decoded_token=None), 264: Logprob(logprob=-14.250068664550781, rank=11, decoded_token=None), 459: Logprob(logprob=-14.375068664550781, rank=12, decoded_token=None), 3604: Logprob(logprob=-14.625068664550781, rank=13, decoded_token=None), 40260: Logprob(logprob=-14.625068664550781, rank=14, decoded_token=None), 19073: Logprob(logprob=-14.750068664550781, rank=15, decoded_token=None), 65162: Logprob(logprob=-15.187568664550781, rank=16, decoded_token=None), 18665: Logprob(logprob=-15.750068664550781, rank=17, decoded_token=None), 16689: Logprob(logprob=-16.00006866455078, rank=18, decoded_token=None), 539: Logprob(logprob=-16.18756866455078, rank=19, decoded_token=None), 4872: Logprob(logprob=-16.25006866455078, rank=20, decoded_token=None)}\n",
500
+ "7250 {7250: Logprob(logprob=-0.000730128725990653, rank=1, decoded_token=None), 61628: Logprob(logprob=-7.625730037689209, rank=2, decoded_token=None), 473: Logprob(logprob=-8.625730514526367, rank=3, decoded_token=None), 220: Logprob(logprob=-10.000730514526367, rank=4, decoded_token=None), 45437: Logprob(logprob=-11.500730514526367, rank=5, decoded_token=None), 4761: Logprob(logprob=-12.625730514526367, rank=6, decoded_token=None), 80081: Logprob(logprob=-13.625730514526367, rank=7, decoded_token=None), 44273: Logprob(logprob=-14.938230514526367, rank=8, decoded_token=None), 83342: Logprob(logprob=-15.063230514526367, rank=9, decoded_token=None), 364: Logprob(logprob=-15.063230514526367, rank=10, decoded_token=None), 24448: Logprob(logprob=-15.500730514526367, rank=11, decoded_token=None), 574: Logprob(logprob=-15.563230514526367, rank=12, decoded_token=None), 28997: Logprob(logprob=-15.563230514526367, rank=13, decoded_token=None), 507: Logprob(logprob=-15.563230514526367, rank=14, decoded_token=None), 330: Logprob(logprob=-15.625730514526367, rank=15, decoded_token=None), 1536: Logprob(logprob=-15.750730514526367, rank=16, decoded_token=None), 323: Logprob(logprob=-16.375730514526367, rank=17, decoded_token=None), 596: Logprob(logprob=-16.563230514526367, rank=18, decoded_token=None), 256: Logprob(logprob=-16.625730514526367, rank=19, decoded_token=None), 80798: Logprob(logprob=-16.813230514526367, rank=20, decoded_token=None)}\n",
501
+ "tensor([-0.0614, -0.3096, -0.9614, -0.9980, -1.0096, -1.0379, -0.0465, -0.3464,\n",
502
+ " -0.5465, -0.8464, -0.8967, -1.3967], device='cuda:0')\n",
503
+ "['The question of the meaning', 'The meaning of life is', 'The question of the meaning', 'The concept of the meaning', 'The meaning of life is', 'One of the most profound', 'Barack Obama, the', 'Barack Obama was born', 'Barack Obama, the', 'Barack Obama was born', 'Former US President Barack Obama', 'Former US President Barack Obama']\n"
504
+ ]
505
+ }
506
+ ],
507
+ "source": [
508
+ "# Define the replacement\n",
509
+ "\n",
510
+ "N = test.lm_head.out_features\n",
511
+ "\n",
512
+ "beam_search_params = SamplingParams(logprobs=20,\n",
513
+ " max_tokens=1,\n",
514
+ " temperature=1.0,\n",
515
+ " detokenize=False)\n",
516
+ "\n",
517
+ "def new_forward(self, prompts_batch, input_ids, *args, **kwargs):\n",
518
+ " prompts_batch = deepcopy(prompts_batch)\n",
519
+ " for i, j in zip(input_ids, prompts_batch):\n",
520
+ " j['prompt_token_ids'] += i[1:].tolist()\n",
521
+ " output = vllm.generate(prompts_batch,\n",
522
+ " sampling_params=beam_search_params,\n",
523
+ " use_tqdm=False)\n",
524
+ " logits = torch.full((len(output), N), float('-inf'))\n",
525
+ " for i, o in enumerate(output):\n",
526
+ " o = o.outputs[0].logprobs[0]\n",
527
+ " indices = torch.tensor(list(o.keys()))\n",
528
+ " values = torch.tensor([i.logprob for i in o.values()])\n",
529
+ " logits[i, indices] = values\n",
530
+ "\n",
531
+ " logits = logits.unsqueeze(1)\n",
532
+ " logits = logits.to(input_ids.device)\n",
533
+ " # print(logits[:, -1].topk(5, dim=-1))\n",
534
+ " # print(logits.shape)\n",
535
+ " output_dict = CausalLMOutputWithPast(\n",
536
+ " loss=None,\n",
537
+ " logits=logits,\n",
538
+ " past_key_values=None,\n",
539
+ " hidden_states=None,\n",
540
+ " attentions=None,\n",
541
+ " )\n",
542
+ " return output_dict\n",
543
+ "\n",
544
+ "# --- Usage ---\n",
545
+ "print(\"Using patched forward:\")\n",
546
+ "print(\"Patched forward signature:\", set(inspect.signature(model.forward).parameters))\n",
547
+ "token_prompts = [TokensPrompt(prompt_token_ids=tokenizer.encode(i, add_special_tokens=False)) for i in inputs]\n",
548
+ "token_prompts = [j for i in token_prompts for j in [deepcopy(i) for _ in range(num_beam_groups * beams_per_group)]]\n",
549
+ "test.forward = types.MethodType(new_forward, test)\n",
550
+ "out = test.generate(\n",
551
+ " input_ids = torch.full((len(inputs), 1), tokenizer.bos_token_id, dtype=torch.long, device=model.device),\n",
552
+ " # **tokd_input,\n",
553
+ " max_new_tokens=5,\n",
554
+ " # logits_processor=[logits_processor],\n",
555
+ " pad_token_id=tokenizer.eos_token_id,\n",
556
+ " do_sample = False, temperature=None, top_p=None,\n",
557
+ " num_beams = num_beam_groups * beams_per_group,\n",
558
+ " num_beam_groups = num_beam_groups,\n",
559
+ " num_return_sequences = num_beam_groups * beams_per_group,\n",
560
+ " diversity_penalty = 0.5, use_cache = False,\n",
561
+ " prompts_batch = token_prompts,\n",
562
+ " output_scores=True, return_dict_in_generate=True\n",
563
+ " )\n",
564
+ "print(out.sequences_scores)\n",
565
+ "print(tokenizer.batch_decode(out.sequences[:,1:]))"
566
+ ]
567
+ },
568
+ {
569
+ "cell_type": "code",
570
+ "execution_count": null,
571
+ "id": "d2bac595",
572
+ "metadata": {},
573
+ "outputs": [
574
+ {
575
+ "name": "stdout",
576
+ "output_type": "stream",
577
+ "text": [
578
+ "\n",
579
+ "Using original forward:\n",
580
+ "Restored forward signature: {'args', 'kwargs'}\n",
581
+ "tensor([-0.0608, -0.3091, -0.9608, -1.0058, -1.0091, -1.0627, -0.0466, -0.3464,\n",
582
+ " -0.5466, -0.8464, -0.8951, -1.3951], device='cuda:0')\n",
583
+ "['The question of the meaning', 'The meaning of life is', 'The question of the meaning', 'The concept of the meaning', 'The meaning of life is', 'One of the most profound', 'Barack Obama, the', 'Barack Obama was born', 'Barack Obama, the', 'Barack Obama was born', 'Former US President Barack Obama', 'Former US President Barack Obama']\n"
584
+ ]
585
+ }
586
+ ],
587
+ "source": [
588
+ "def print_forward(self, *args, **kwargs):\n",
589
+ " out = self.__class__.forward(self, *args, **kwargs)\n",
590
+ " out.logits = out.logits.float()\n",
591
+ " # logits = out.logits\n",
592
+ " # print(logits[:, -1].float().log_softmax(dim=-1).topk(5, dim=-1))\n",
593
+ " return out\n",
594
+ "\n",
595
+ "# Swap back to the original\n",
596
+ "# model.forward = model._original_forward\n",
597
+ "model.forward = types.MethodType(print_forward, model)\n",
598
+ "print(\"\\nUsing original forward:\")\n",
599
+ "print(\"Restored forward signature:\", set(inspect.signature(model.forward).parameters))\n",
600
+ "out = model.generate(\n",
601
+ " **tokd_input,\n",
602
+ " max_new_tokens=5,\n",
603
+ " # logits_processor=[logits_processor],\n",
604
+ " pad_token_id=tokenizer.eos_token_id,\n",
605
+ " do_sample = False, temperature=None, top_p=None,\n",
606
+ " num_beams = num_beam_groups * beams_per_group,\n",
607
+ " num_beam_groups = num_beam_groups,\n",
608
+ " num_return_sequences = num_beam_groups * beams_per_group,\n",
609
+ " diversity_penalty = 0.5, use_cache = False,\n",
610
+ " output_scores=True, return_dict_in_generate=True\n",
611
+ " )\n",
612
+ "print(out.sequences_scores)\n",
613
+ "print(tokenizer.batch_decode(out.sequences[:,tokd_input[\"input_ids\"].shape[1]:]))"
614
+ ]
615
+ },
616
+ {
617
+ "cell_type": "code",
618
+ "execution_count": null,
619
+ "id": "e146c195",
620
+ "metadata": {},
621
+ "outputs": [],
622
+ "source": [
623
+ "inputs_ = inputs[:1]\n",
624
+ "tokd_input_ = tokenizer(inputs_, return_tensors=\"pt\", add_special_tokens=False, padding=True).to(model.device)"
625
+ ]
626
+ },
627
+ {
628
+ "cell_type": "code",
629
+ "execution_count": null,
630
+ "id": "f3ecfb66",
631
+ "metadata": {},
632
+ "outputs": [],
633
+ "source": [
634
+ "# token_prompts = [TokensPrompt(prompt_token_ids=tokenizer.encode(i, add_special_tokens=False)) for i in inputs_ * 100]\n",
635
+ "# token_prompts = [j for i in token_prompts for j in [deepcopy(i) for _ in range(num_beam_groups * beams_per_group)]]\n",
636
+ "# model.forward = types.MethodType(new_forward, model)\n",
637
+ "# timeit(lambda: model.generate(\n",
638
+ "# input_ids = torch.full((len(inputs_), 1), tokenizer.bos_token_id, dtype=torch.long, device=model.device),\n",
639
+ "# # **tokd_input,\n",
640
+ "# max_new_tokens=10,\n",
641
+ "# # logits_processor=[logits_processor],\n",
642
+ "# pad_token_id=tokenizer.eos_token_id,\n",
643
+ "# do_sample = False, temperature=None, top_p=None,\n",
644
+ "# num_beams = num_beam_groups * beams_per_group,\n",
645
+ "# num_beam_groups = num_beam_groups,\n",
646
+ "# num_return_sequences = num_beam_groups * beams_per_group,\n",
647
+ "# diversity_penalty = 0.5, use_cache = False,\n",
648
+ "\n",
649
+ "# prompts_batch = token_prompts\n",
650
+ "# ), number=1)"
651
+ ]
652
+ },
653
+ {
654
+ "cell_type": "code",
655
+ "execution_count": null,
656
+ "id": "4337d343",
657
+ "metadata": {},
658
+ "outputs": [],
659
+ "source": [
660
+ "\n",
661
+ "# model.forward = model._original_forward\n",
662
+ "# timeit(lambda: model.generate(\n",
663
+ "# **tokd_input_,\n",
664
+ "# max_new_tokens=10,\n",
665
+ "# # logits_processor=[logits_processor],\n",
666
+ "# pad_token_id=tokenizer.eos_token_id,\n",
667
+ "# do_sample = False, temperature=None, top_p=None,\n",
668
+ "# num_beams = num_beam_groups * beams_per_group,\n",
669
+ "# num_beam_groups = num_beam_groups,\n",
670
+ "# num_return_sequences = num_beam_groups * beams_per_group,\n",
671
+ "# diversity_penalty = 0.5, use_cache = False\n",
672
+ "# ), number=100)"
673
+ ]
674
+ }
675
+ ],
676
+ "metadata": {
677
+ "kernelspec": {
678
+ "display_name": "vllm_waterfall",
679
+ "language": "python",
680
+ "name": "python3"
681
+ },
682
+ "language_info": {
683
+ "codemirror_mode": {
684
+ "name": "ipython",
685
+ "version": 3
686
+ },
687
+ "file_extension": ".py",
688
+ "mimetype": "text/x-python",
689
+ "name": "python",
690
+ "nbconvert_exporter": "python",
691
+ "pygments_lexer": "ipython3",
692
+ "version": "3.12.11"
693
+ }
694
+ },
695
+ "nbformat": 4,
696
+ "nbformat_minor": 5
697
+ }
@@ -22,6 +22,8 @@ from waterfall.permute import Permute
22
22
  from waterfall.WatermarkingFn import WatermarkingFn
23
23
  from waterfall.WatermarkingFnFourier import WatermarkingFnFourier
24
24
 
25
+ os.environ["TOKENIZERS_PARALLELISM"] = "false"
26
+
25
27
  class PerturbationProcessor(LogitsProcessor):
26
28
  def __init__(self,
27
29
  N : int = 32000, # Vocab size
@@ -15,8 +15,6 @@ from waterfall.WatermarkingFnFourier import WatermarkingFnFourier
15
15
  from waterfall.WatermarkingFnSquare import WatermarkingFnSquare
16
16
  from waterfall.WatermarkerBase import Watermarker
17
17
 
18
- os.environ["TOKENIZERS_PARALLELISM"] = "false"
19
-
20
18
  PROMPT = (
21
19
  "Paraphrase the user provided text while preserving semantic similarity. "
22
20
  "Do not include any other sentences in the response, such as explanations of the paraphrasing. "
Binary file
File without changes
File without changes
File without changes
File without changes
File without changes