Untitled

 avatar
unknown
plain_text
24 days ago
42 kB
8
Indexable
Answer: Segment
Chunk: 1/0, ppl: 9.312779426574707, time: 0.95s
Initial tokens: tensor([[[[ 5.5859e-01,  9.8438e-01,  1.0625e+00,  ...,  1.3281e+00,
           -9.1797e-02,  4.1602e-01],
          [ 5.5859e-01,  9.8438e-01,  1.0625e+00,  ...,  1.3281e+00,
           -9.1797e-02,  4.1602e-01],
          [ 4.6875e-01,  7.4707e-02,  4.0283e-02,  ...,  4.4189e-02,
           -1.1719e-01, -1.4941e-01],
          ...,
          [ 6.9375e+00,  3.4531e+00,  2.5469e+00,  ...,  6.4062e-01,
           -1.9141e+00, -1.8281e+00],
          [ 7.3438e+00,  3.2344e+00,  1.5156e+00,  ...,  1.3438e+00,
           -1.7109e+00, -1.5078e+00],
          [ 6.0625e+00,  3.3281e+00,  2.1094e+00,  ...,  1.6211e-01,
           -1.8906e+00, -1.5781e+00]],

         [[ 1.7822e-02, -7.5195e-02,  1.9653e-02,  ..., -1.1953e+00,
            8.2031e-01,  6.0303e-02],
          [ 1.7822e-02, -7.5195e-02,  1.9653e-02,  ..., -1.1953e+00,
            8.2031e-01,  6.0303e-02],
          [-5.2979e-02, -4.6631e-02,  6.4453e-02,  ...,  9.0332e-02,
           -7.4219e-02, -1.3281e-01],
          ...,
          [-1.8438e+00, -1.2578e+00,  1.1406e+00,  ...,  1.6797e+00,
           -1.7578e+00, -1.2812e+00],
          [-6.7578e-01, -1.6953e+00,  1.2422e+00,  ...,  1.5781e+00,
           -1.9297e+00, -1.6875e+00],
          [-1.4844e+00, -1.5625e+00,  1.4688e+00,  ...,  1.5547e+00,
           -2.2812e+00, -7.9688e-01]],

         [[ 6.6406e-02, -5.2979e-02, -3.8574e-02,  ...,  2.8906e-01,
            1.8984e+00, -9.9219e-01],
          [ 6.6406e-02, -5.2979e-02, -3.8574e-02,  ...,  2.8906e-01,
            1.8984e+00, -9.9219e-01],
          [ 2.1729e-02, -2.9785e-02, -2.4536e-02,  ..., -6.7871e-02,
           -1.3770e-01,  9.6191e-02],
          ...,
          [-3.5547e-01,  3.8477e-01,  3.2812e-01,  ...,  1.9141e+00,
           -1.9531e+00, -2.9297e-01],
          [ 4.5898e-02, -2.5781e-01,  3.3789e-01,  ..., -6.3281e-01,
           -2.4688e+00, -3.1445e-01],
          [-2.5391e-01, -1.0010e-01,  4.1602e-01,  ...,  1.2695e-01,
           -2.5156e+00,  8.6719e-01]],

         ...,

         [[-1.9727e-01, -1.3086e-01,  2.7771e-03,  ...,  1.4844e+00,
           -7.6562e-01,  7.6172e-01],
          [-1.9727e-01, -1.3086e-01,  2.7771e-03,  ...,  1.4844e+00,
           -7.6562e-01,  7.6172e-01],
          [-1.1084e-01,  9.4238e-02,  1.4526e-02,  ...,  2.5513e-02,
            3.1494e-02, -1.0693e-01],
          ...,
          [-1.2031e+00,  6.5234e-01, -2.4902e-02,  ..., -1.3516e+00,
            6.4062e-01, -1.6484e+00],
          [-1.7500e+00,  1.3672e+00,  2.8516e-01,  ..., -1.5703e+00,
            1.4688e+00, -1.4062e+00],
          [-1.4453e+00,  7.5781e-01,  1.6309e-01,  ..., -1.5078e+00,
            7.0312e-01, -8.4766e-01]],

         [[-4.9072e-02, -8.0078e-02,  4.7363e-02,  ...,  7.1094e-01,
           -4.9805e-01,  3.8477e-01],
          [-4.9072e-02, -8.0078e-02,  4.7363e-02,  ...,  7.1094e-01,
           -4.9805e-01,  3.8477e-01],
          [-1.6113e-01, -2.0410e-01,  2.3047e-01,  ..., -1.3672e-01,
            1.4551e-01, -8.8379e-02],
          ...,
          [-3.2188e+00, -2.9062e+00,  3.4688e+00,  ..., -6.4062e-01,
            1.5469e+00, -2.8125e+00],
          [-6.0312e+00, -5.6250e+00,  4.3125e+00,  ..., -1.2969e+00,
            2.7188e+00, -2.8750e+00],
          [-4.6250e+00, -4.5000e+00,  4.5938e+00,  ..., -5.0781e-01,
            2.0625e+00, -2.2812e+00]],

         [[-1.6724e-02, -1.0889e-01, -7.8735e-03,  ...,  2.4219e+00,
            1.7031e+00,  1.7812e+00],
          [-1.6724e-02, -1.0889e-01, -7.8735e-03,  ...,  2.4219e+00,
            1.7031e+00,  1.7812e+00],
          [-1.0010e-02, -1.2598e-01,  6.2500e-02,  ..., -3.2471e-02,
           -8.2031e-02,  4.5898e-02],
          ...,
          [ 7.6953e-01, -2.8281e+00,  7.2656e-01,  ..., -9.4141e-01,
           -1.3750e+00, -4.2383e-01],
          [ 8.5938e-01, -3.2344e+00,  9.2969e-01,  ..., -9.8828e-01,
           -1.2734e+00, -4.0625e-01],
          [ 5.8594e-01, -2.7656e+00,  5.4688e-01,  ..., -9.6484e-01,
           -1.4375e+00, -6.4844e-01]]]], device='cuda:0', dtype=torch.bfloat16)
Output 0: {'pred': ' B', 'chunk_ppl': [9.312779426574707], 'total_ppl': 9.312779426574707}
1it [00:54, 54.40s/it]Chunk: 1/0, ppl: 8.38564682006836, time: 2.39s
Initial tokens: tensor([[[[ 5.5859e-01,  9.8438e-01,  1.0625e+00,  ...,  1.3281e+00,
           -9.1797e-02,  4.1602e-01],
          [ 5.5859e-01,  9.8438e-01,  1.0625e+00,  ...,  1.3281e+00,
           -9.1797e-02,  4.1602e-01],
          [ 4.6875e-01,  7.4707e-02,  4.0283e-02,  ...,  4.4189e-02,
           -1.1719e-01, -1.4941e-01],
          ...,
          [ 6.9375e+00,  3.4531e+00,  2.5469e+00,  ...,  6.4062e-01,
           -1.9141e+00, -1.8281e+00],
          [ 7.3438e+00,  3.2344e+00,  1.5156e+00,  ...,  1.3438e+00,
           -1.7109e+00, -1.5078e+00],
          [ 6.0625e+00,  3.3281e+00,  2.1094e+00,  ...,  1.6211e-01,
           -1.8906e+00, -1.5781e+00]],

         [[ 1.7822e-02, -7.5195e-02,  1.9653e-02,  ..., -1.1953e+00,
            8.2031e-01,  6.0303e-02],
          [ 1.7822e-02, -7.5195e-02,  1.9653e-02,  ..., -1.1953e+00,
            8.2031e-01,  6.0303e-02],
          [-5.2979e-02, -4.6631e-02,  6.4453e-02,  ...,  9.0332e-02,
           -7.4219e-02, -1.3281e-01],
          ...,
          [-1.8438e+00, -1.2578e+00,  1.1406e+00,  ...,  1.6797e+00,
           -1.7578e+00, -1.2812e+00],
          [-6.7578e-01, -1.6953e+00,  1.2422e+00,  ...,  1.5781e+00,
           -1.9297e+00, -1.6875e+00],
          [-1.4844e+00, -1.5625e+00,  1.4688e+00,  ...,  1.5547e+00,
           -2.2812e+00, -7.9688e-01]],

         [[ 6.6406e-02, -5.2979e-02, -3.8574e-02,  ...,  2.8906e-01,
            1.8984e+00, -9.9219e-01],
          [ 6.6406e-02, -5.2979e-02, -3.8574e-02,  ...,  2.8906e-01,
            1.8984e+00, -9.9219e-01],
          [ 2.1729e-02, -2.9785e-02, -2.4536e-02,  ..., -6.7871e-02,
           -1.3770e-01,  9.6191e-02],
          ...,
          [-3.5547e-01,  3.8477e-01,  3.2812e-01,  ...,  1.9141e+00,
           -1.9531e+00, -2.9297e-01],
          [ 4.5898e-02, -2.5781e-01,  3.3789e-01,  ..., -6.3281e-01,
           -2.4688e+00, -3.1445e-01],
          [-2.5391e-01, -1.0010e-01,  4.1602e-01,  ...,  1.2695e-01,
           -2.5156e+00,  8.6719e-01]],

         ...,

         [[-1.9727e-01, -1.3086e-01,  2.7771e-03,  ...,  1.4844e+00,
           -7.6562e-01,  7.6172e-01],
          [-1.9727e-01, -1.3086e-01,  2.7771e-03,  ...,  1.4844e+00,
           -7.6562e-01,  7.6172e-01],
          [-1.1084e-01,  9.4238e-02,  1.4526e-02,  ...,  2.5513e-02,
            3.1494e-02, -1.0693e-01],
          ...,
          [-1.2031e+00,  6.5234e-01, -2.4902e-02,  ..., -1.3516e+00,
            6.4062e-01, -1.6484e+00],
          [-1.7500e+00,  1.3672e+00,  2.8516e-01,  ..., -1.5703e+00,
            1.4688e+00, -1.4062e+00],
          [-1.4453e+00,  7.5781e-01,  1.6309e-01,  ..., -1.5078e+00,
            7.0312e-01, -8.4766e-01]],

         [[-4.9072e-02, -8.0078e-02,  4.7363e-02,  ...,  7.1094e-01,
           -4.9805e-01,  3.8477e-01],
          [-4.9072e-02, -8.0078e-02,  4.7363e-02,  ...,  7.1094e-01,
           -4.9805e-01,  3.8477e-01],
          [-1.6113e-01, -2.0410e-01,  2.3047e-01,  ..., -1.3672e-01,
            1.4551e-01, -8.8379e-02],
          ...,
          [-3.2188e+00, -2.9062e+00,  3.4688e+00,  ..., -6.4062e-01,
            1.5469e+00, -2.8125e+00],
          [-6.0312e+00, -5.6250e+00,  4.3125e+00,  ..., -1.2969e+00,
            2.7188e+00, -2.8750e+00],
          [-4.6250e+00, -4.5000e+00,  4.5938e+00,  ..., -5.0781e-01,
            2.0625e+00, -2.2812e+00]],

         [[-1.6724e-02, -1.0889e-01, -7.8735e-03,  ...,  2.4219e+00,
            1.7031e+00,  1.7812e+00],
          [-1.6724e-02, -1.0889e-01, -7.8735e-03,  ...,  2.4219e+00,
            1.7031e+00,  1.7812e+00],
          [-1.0010e-02, -1.2598e-01,  6.2500e-02,  ..., -3.2471e-02,
           -8.2031e-02,  4.5898e-02],
          ...,
          [ 7.6953e-01, -2.8281e+00,  7.2656e-01,  ..., -9.4141e-01,
           -1.3750e+00, -4.2383e-01],
          [ 8.5938e-01, -3.2344e+00,  9.2969e-01,  ..., -9.8828e-01,
           -1.2734e+00, -4.0625e-01],
          [ 5.8594e-01, -2.7656e+00,  5.4688e-01,  ..., -9.6484e-01,
           -1.4375e+00, -6.4844e-01]]]], device='cuda:0', dtype=torch.bfloat16)
Output 1: {'pred': ' B', 'chunk_ppl': [8.38564682006836], 'total_ppl': 8.38564682006836}
2it [01:53, 56.93s/it]Chunk: 1/0, ppl: 12.36805534362793, time: 1.97s
Initial tokens: tensor([[[[ 5.5859e-01,  9.8438e-01,  1.0625e+00,  ...,  1.3281e+00,
           -9.1797e-02,  4.1602e-01],
          [ 5.5859e-01,  9.8438e-01,  1.0625e+00,  ...,  1.3281e+00,
           -9.1797e-02,  4.1602e-01],
          [ 4.6875e-01,  7.4707e-02,  4.0283e-02,  ...,  4.4189e-02,
           -1.1719e-01, -1.4941e-01],
          ...,
          [ 6.9375e+00,  3.4531e+00,  2.5469e+00,  ...,  6.4062e-01,
           -1.9141e+00, -1.8281e+00],
          [ 7.3438e+00,  3.2344e+00,  1.5156e+00,  ...,  1.3438e+00,
           -1.7109e+00, -1.5078e+00],
          [ 6.0625e+00,  3.3281e+00,  2.1094e+00,  ...,  1.6211e-01,
           -1.8906e+00, -1.5781e+00]],

         [[ 1.7822e-02, -7.5195e-02,  1.9653e-02,  ..., -1.1953e+00,
            8.2031e-01,  6.0303e-02],
          [ 1.7822e-02, -7.5195e-02,  1.9653e-02,  ..., -1.1953e+00,
            8.2031e-01,  6.0303e-02],
          [-5.2979e-02, -4.6631e-02,  6.4453e-02,  ...,  9.0332e-02,
           -7.4219e-02, -1.3281e-01],
          ...,
          [-1.8438e+00, -1.2578e+00,  1.1406e+00,  ...,  1.6797e+00,
           -1.7578e+00, -1.2812e+00],
          [-6.7578e-01, -1.6953e+00,  1.2422e+00,  ...,  1.5781e+00,
           -1.9297e+00, -1.6875e+00],
          [-1.4844e+00, -1.5625e+00,  1.4688e+00,  ...,  1.5547e+00,
           -2.2812e+00, -7.9688e-01]],

         [[ 6.6406e-02, -5.2979e-02, -3.8574e-02,  ...,  2.8906e-01,
            1.8984e+00, -9.9219e-01],
          [ 6.6406e-02, -5.2979e-02, -3.8574e-02,  ...,  2.8906e-01,
            1.8984e+00, -9.9219e-01],
          [ 2.1729e-02, -2.9785e-02, -2.4536e-02,  ..., -6.7871e-02,
           -1.3770e-01,  9.6191e-02],
          ...,
          [-3.5547e-01,  3.8477e-01,  3.2812e-01,  ...,  1.9141e+00,
           -1.9531e+00, -2.9297e-01],
          [ 4.5898e-02, -2.5781e-01,  3.3789e-01,  ..., -6.3281e-01,
           -2.4688e+00, -3.1445e-01],
          [-2.5391e-01, -1.0010e-01,  4.1602e-01,  ...,  1.2695e-01,
           -2.5156e+00,  8.6719e-01]],

         ...,

         [[-1.9727e-01, -1.3086e-01,  2.7771e-03,  ...,  1.4844e+00,
           -7.6562e-01,  7.6172e-01],
          [-1.9727e-01, -1.3086e-01,  2.7771e-03,  ...,  1.4844e+00,
           -7.6562e-01,  7.6172e-01],
          [-1.1084e-01,  9.4238e-02,  1.4526e-02,  ...,  2.5513e-02,
            3.1494e-02, -1.0693e-01],
          ...,
          [-1.2031e+00,  6.5234e-01, -2.4902e-02,  ..., -1.3516e+00,
            6.4062e-01, -1.6484e+00],
          [-1.7500e+00,  1.3672e+00,  2.8516e-01,  ..., -1.5703e+00,
            1.4688e+00, -1.4062e+00],
          [-1.4453e+00,  7.5781e-01,  1.6309e-01,  ..., -1.5078e+00,
            7.0312e-01, -8.4766e-01]],

         [[-4.9072e-02, -8.0078e-02,  4.7363e-02,  ...,  7.1094e-01,
           -4.9805e-01,  3.8477e-01],
          [-4.9072e-02, -8.0078e-02,  4.7363e-02,  ...,  7.1094e-01,
           -4.9805e-01,  3.8477e-01],
          [-1.6113e-01, -2.0410e-01,  2.3047e-01,  ..., -1.3672e-01,
            1.4551e-01, -8.8379e-02],
          ...,
          [-3.2188e+00, -2.9062e+00,  3.4688e+00,  ..., -6.4062e-01,
            1.5469e+00, -2.8125e+00],
          [-6.0312e+00, -5.6250e+00,  4.3125e+00,  ..., -1.2969e+00,
            2.7188e+00, -2.8750e+00],
          [-4.6250e+00, -4.5000e+00,  4.5938e+00,  ..., -5.0781e-01,
            2.0625e+00, -2.2812e+00]],

         [[-1.6724e-02, -1.0889e-01, -7.8735e-03,  ...,  2.4219e+00,
            1.7031e+00,  1.7812e+00],
          [-1.6724e-02, -1.0889e-01, -7.8735e-03,  ...,  2.4219e+00,
            1.7031e+00,  1.7812e+00],
          [-1.0010e-02, -1.2598e-01,  6.2500e-02,  ..., -3.2471e-02,
           -8.2031e-02,  4.5898e-02],
          ...,
          [ 7.6953e-01, -2.8281e+00,  7.2656e-01,  ..., -9.4141e-01,
           -1.3750e+00, -4.2383e-01],
          [ 8.5938e-01, -3.2344e+00,  9.2969e-01,  ..., -9.8828e-01,
           -1.2734e+00, -4.0625e-01],
          [ 5.8594e-01, -2.7656e+00,  5.4688e-01,  ..., -9.6484e-01,
           -1.4375e+00, -6.4844e-01]]]], device='cuda:0', dtype=torch.bfloat16)
Output 2: {'pred': ' B', 'chunk_ppl': [12.36805534362793], 'total_ppl': 12.36805534362793}
3it [02:50, 57.26s/it]Chunk: 1/0, ppl: 16.007787704467773, time: 2.4s
Initial tokens: tensor([[[[ 5.5859e-01,  9.8438e-01,  1.0625e+00,  ...,  1.3281e+00,
           -9.1797e-02,  4.1602e-01],
          [ 5.5859e-01,  9.8438e-01,  1.0625e+00,  ...,  1.3281e+00,
           -9.1797e-02,  4.1602e-01],
          [ 4.6875e-01,  7.4707e-02,  4.0283e-02,  ...,  4.4189e-02,
           -1.1719e-01, -1.4941e-01],
          ...,
          [ 6.9375e+00,  3.4531e+00,  2.5469e+00,  ...,  6.4062e-01,
           -1.9141e+00, -1.8281e+00],
          [ 7.3438e+00,  3.2344e+00,  1.5156e+00,  ...,  1.3438e+00,
           -1.7109e+00, -1.5078e+00],
          [ 6.0625e+00,  3.3281e+00,  2.1094e+00,  ...,  1.6211e-01,
           -1.8906e+00, -1.5781e+00]],

         [[ 1.7822e-02, -7.5195e-02,  1.9653e-02,  ..., -1.1953e+00,
            8.2031e-01,  6.0303e-02],
          [ 1.7822e-02, -7.5195e-02,  1.9653e-02,  ..., -1.1953e+00,
            8.2031e-01,  6.0303e-02],
          [-5.2979e-02, -4.6631e-02,  6.4453e-02,  ...,  9.0332e-02,
           -7.4219e-02, -1.3281e-01],
          ...,
          [-1.8438e+00, -1.2578e+00,  1.1406e+00,  ...,  1.6797e+00,
           -1.7578e+00, -1.2812e+00],
          [-6.7578e-01, -1.6953e+00,  1.2422e+00,  ...,  1.5781e+00,
           -1.9297e+00, -1.6875e+00],
          [-1.4844e+00, -1.5625e+00,  1.4688e+00,  ...,  1.5547e+00,
           -2.2812e+00, -7.9688e-01]],

         [[ 6.6406e-02, -5.2979e-02, -3.8574e-02,  ...,  2.8906e-01,
            1.8984e+00, -9.9219e-01],
          [ 6.6406e-02, -5.2979e-02, -3.8574e-02,  ...,  2.8906e-01,
            1.8984e+00, -9.9219e-01],
          [ 2.1729e-02, -2.9785e-02, -2.4536e-02,  ..., -6.7871e-02,
           -1.3770e-01,  9.6191e-02],
          ...,
          [-3.5547e-01,  3.8477e-01,  3.2812e-01,  ...,  1.9141e+00,
           -1.9531e+00, -2.9297e-01],
          [ 4.5898e-02, -2.5781e-01,  3.3789e-01,  ..., -6.3281e-01,
           -2.4688e+00, -3.1445e-01],
          [-2.5391e-01, -1.0010e-01,  4.1602e-01,  ...,  1.2695e-01,
           -2.5156e+00,  8.6719e-01]],

         ...,

         [[-1.9727e-01, -1.3086e-01,  2.7771e-03,  ...,  1.4844e+00,
           -7.6562e-01,  7.6172e-01],
          [-1.9727e-01, -1.3086e-01,  2.7771e-03,  ...,  1.4844e+00,
           -7.6562e-01,  7.6172e-01],
          [-1.1084e-01,  9.4238e-02,  1.4526e-02,  ...,  2.5513e-02,
            3.1494e-02, -1.0693e-01],
          ...,
          [-1.2031e+00,  6.5234e-01, -2.4902e-02,  ..., -1.3516e+00,
            6.4062e-01, -1.6484e+00],
          [-1.7500e+00,  1.3672e+00,  2.8516e-01,  ..., -1.5703e+00,
            1.4688e+00, -1.4062e+00],
          [-1.4453e+00,  7.5781e-01,  1.6309e-01,  ..., -1.5078e+00,
            7.0312e-01, -8.4766e-01]],

         [[-4.9072e-02, -8.0078e-02,  4.7363e-02,  ...,  7.1094e-01,
           -4.9805e-01,  3.8477e-01],
          [-4.9072e-02, -8.0078e-02,  4.7363e-02,  ...,  7.1094e-01,
           -4.9805e-01,  3.8477e-01],
          [-1.6113e-01, -2.0410e-01,  2.3047e-01,  ..., -1.3672e-01,
            1.4551e-01, -8.8379e-02],
          ...,
          [-3.2188e+00, -2.9062e+00,  3.4688e+00,  ..., -6.4062e-01,
            1.5469e+00, -2.8125e+00],
          [-6.0312e+00, -5.6250e+00,  4.3125e+00,  ..., -1.2969e+00,
            2.7188e+00, -2.8750e+00],
          [-4.6250e+00, -4.5000e+00,  4.5938e+00,  ..., -5.0781e-01,
            2.0625e+00, -2.2812e+00]],

         [[-1.6724e-02, -1.0889e-01, -7.8735e-03,  ...,  2.4219e+00,
            1.7031e+00,  1.7812e+00],
          [-1.6724e-02, -1.0889e-01, -7.8735e-03,  ...,  2.4219e+00,
            1.7031e+00,  1.7812e+00],
          [-1.0010e-02, -1.2598e-01,  6.2500e-02,  ..., -3.2471e-02,
           -8.2031e-02,  4.5898e-02],
          ...,
          [ 7.6953e-01, -2.8281e+00,  7.2656e-01,  ..., -9.4141e-01,
           -1.3750e+00, -4.2383e-01],
          [ 8.5938e-01, -3.2344e+00,  9.2969e-01,  ..., -9.8828e-01,
           -1.2734e+00, -4.0625e-01],
          [ 5.8594e-01, -2.7656e+00,  5.4688e-01,  ..., -9.6484e-01,
           -1.4375e+00, -6.4844e-01]]]], device='cuda:0', dtype=torch.bfloat16)
Output 3: {'pred': ' B', 'chunk_ppl': [16.007787704467773], 'total_ppl': 16.007787704467773}
4it [03:48, 57.65s/it]Chunk: 1/0, ppl: 11.50775146484375, time: 2.35s
Initial tokens: tensor([[[[ 5.5859e-01,  9.8438e-01,  1.0625e+00,  ...,  1.3281e+00,
           -9.1797e-02,  4.1602e-01],
          [ 5.5859e-01,  9.8438e-01,  1.0625e+00,  ...,  1.3281e+00,
           -9.1797e-02,  4.1602e-01],
          [ 4.6875e-01,  7.4707e-02,  4.0283e-02,  ...,  4.4189e-02,
           -1.1719e-01, -1.4941e-01],
          ...,
          [ 6.9375e+00,  3.4531e+00,  2.5469e+00,  ...,  6.4062e-01,
           -1.9141e+00, -1.8281e+00],
          [ 7.3438e+00,  3.2344e+00,  1.5156e+00,  ...,  1.3438e+00,
           -1.7109e+00, -1.5078e+00],
          [ 6.0625e+00,  3.3281e+00,  2.1094e+00,  ...,  1.6211e-01,
           -1.8906e+00, -1.5781e+00]],

         [[ 1.7822e-02, -7.5195e-02,  1.9653e-02,  ..., -1.1953e+00,
            8.2031e-01,  6.0303e-02],
          [ 1.7822e-02, -7.5195e-02,  1.9653e-02,  ..., -1.1953e+00,
            8.2031e-01,  6.0303e-02],
          [-5.2979e-02, -4.6631e-02,  6.4453e-02,  ...,  9.0332e-02,
           -7.4219e-02, -1.3281e-01],
          ...,
          [-1.8438e+00, -1.2578e+00,  1.1406e+00,  ...,  1.6797e+00,
           -1.7578e+00, -1.2812e+00],
          [-6.7578e-01, -1.6953e+00,  1.2422e+00,  ...,  1.5781e+00,
           -1.9297e+00, -1.6875e+00],
          [-1.4844e+00, -1.5625e+00,  1.4688e+00,  ...,  1.5547e+00,
           -2.2812e+00, -7.9688e-01]],

         [[ 6.6406e-02, -5.2979e-02, -3.8574e-02,  ...,  2.8906e-01,
            1.8984e+00, -9.9219e-01],
          [ 6.6406e-02, -5.2979e-02, -3.8574e-02,  ...,  2.8906e-01,
            1.8984e+00, -9.9219e-01],
          [ 2.1729e-02, -2.9785e-02, -2.4536e-02,  ..., -6.7871e-02,
           -1.3770e-01,  9.6191e-02],
          ...,
          [-3.5547e-01,  3.8477e-01,  3.2812e-01,  ...,  1.9141e+00,
           -1.9531e+00, -2.9297e-01],
          [ 4.5898e-02, -2.5781e-01,  3.3789e-01,  ..., -6.3281e-01,
           -2.4688e+00, -3.1445e-01],
          [-2.5391e-01, -1.0010e-01,  4.1602e-01,  ...,  1.2695e-01,
           -2.5156e+00,  8.6719e-01]],

         ...,

         [[-1.9727e-01, -1.3086e-01,  2.7771e-03,  ...,  1.4844e+00,
           -7.6562e-01,  7.6172e-01],
          [-1.9727e-01, -1.3086e-01,  2.7771e-03,  ...,  1.4844e+00,
           -7.6562e-01,  7.6172e-01],
          [-1.1084e-01,  9.4238e-02,  1.4526e-02,  ...,  2.5513e-02,
            3.1494e-02, -1.0693e-01],
          ...,
          [-1.2031e+00,  6.5234e-01, -2.4902e-02,  ..., -1.3516e+00,
            6.4062e-01, -1.6484e+00],
          [-1.7500e+00,  1.3672e+00,  2.8516e-01,  ..., -1.5703e+00,
            1.4688e+00, -1.4062e+00],
          [-1.4453e+00,  7.5781e-01,  1.6309e-01,  ..., -1.5078e+00,
            7.0312e-01, -8.4766e-01]],

         [[-4.9072e-02, -8.0078e-02,  4.7363e-02,  ...,  7.1094e-01,
           -4.9805e-01,  3.8477e-01],
          [-4.9072e-02, -8.0078e-02,  4.7363e-02,  ...,  7.1094e-01,
           -4.9805e-01,  3.8477e-01],
          [-1.6113e-01, -2.0410e-01,  2.3047e-01,  ..., -1.3672e-01,
            1.4551e-01, -8.8379e-02],
          ...,
          [-3.2188e+00, -2.9062e+00,  3.4688e+00,  ..., -6.4062e-01,
            1.5469e+00, -2.8125e+00],
          [-6.0312e+00, -5.6250e+00,  4.3125e+00,  ..., -1.2969e+00,
            2.7188e+00, -2.8750e+00],
          [-4.6250e+00, -4.5000e+00,  4.5938e+00,  ..., -5.0781e-01,
            2.0625e+00, -2.2812e+00]],

         [[-1.6724e-02, -1.0889e-01, -7.8735e-03,  ...,  2.4219e+00,
            1.7031e+00,  1.7812e+00],
          [-1.6724e-02, -1.0889e-01, -7.8735e-03,  ...,  2.4219e+00,
            1.7031e+00,  1.7812e+00],
          [-1.0010e-02, -1.2598e-01,  6.2500e-02,  ..., -3.2471e-02,
           -8.2031e-02,  4.5898e-02],
          ...,
          [ 7.6953e-01, -2.8281e+00,  7.2656e-01,  ..., -9.4141e-01,
           -1.3750e+00, -4.2383e-01],
          [ 8.5938e-01, -3.2344e+00,  9.2969e-01,  ..., -9.8828e-01,
           -1.2734e+00, -4.0625e-01],
          [ 5.8594e-01, -2.7656e+00,  5.4688e-01,  ..., -9.6484e-01,
           -1.4375e+00, -6.4844e-01]]]], device='cuda:0', dtype=torch.bfloat16)
Output 4: {'pred': ' A', 'chunk_ppl': [11.50775146484375], 'total_ppl': 11.50775146484375}
5it [04:44, 56.82s/it]Chunk: 1/0, ppl: 13.721500396728516, time: 2.46s
Initial tokens: tensor([[[[ 5.5859e-01,  9.8438e-01,  1.0625e+00,  ...,  1.3281e+00,
           -9.1797e-02,  4.1602e-01],
          [ 5.5859e-01,  9.8438e-01,  1.0625e+00,  ...,  1.3281e+00,
           -9.1797e-02,  4.1602e-01],
          [ 4.6875e-01,  7.4707e-02,  4.0283e-02,  ...,  4.4189e-02,
           -1.1719e-01, -1.4941e-01],
          ...,
          [ 6.9375e+00,  3.4531e+00,  2.5469e+00,  ...,  6.4062e-01,
           -1.9141e+00, -1.8281e+00],
          [ 7.3438e+00,  3.2344e+00,  1.5156e+00,  ...,  1.3438e+00,
           -1.7109e+00, -1.5078e+00],
          [ 6.0625e+00,  3.3281e+00,  2.1094e+00,  ...,  1.6211e-01,
           -1.8906e+00, -1.5781e+00]],

         [[ 1.7822e-02, -7.5195e-02,  1.9653e-02,  ..., -1.1953e+00,
            8.2031e-01,  6.0303e-02],
          [ 1.7822e-02, -7.5195e-02,  1.9653e-02,  ..., -1.1953e+00,
            8.2031e-01,  6.0303e-02],
          [-5.2979e-02, -4.6631e-02,  6.4453e-02,  ...,  9.0332e-02,
           -7.4219e-02, -1.3281e-01],
          ...,
          [-1.8438e+00, -1.2578e+00,  1.1406e+00,  ...,  1.6797e+00,
           -1.7578e+00, -1.2812e+00],
          [-6.7578e-01, -1.6953e+00,  1.2422e+00,  ...,  1.5781e+00,
           -1.9297e+00, -1.6875e+00],
          [-1.4844e+00, -1.5625e+00,  1.4688e+00,  ...,  1.5547e+00,
           -2.2812e+00, -7.9688e-01]],

         [[ 6.6406e-02, -5.2979e-02, -3.8574e-02,  ...,  2.8906e-01,
            1.8984e+00, -9.9219e-01],
          [ 6.6406e-02, -5.2979e-02, -3.8574e-02,  ...,  2.8906e-01,
            1.8984e+00, -9.9219e-01],
          [ 2.1729e-02, -2.9785e-02, -2.4536e-02,  ..., -6.7871e-02,
           -1.3770e-01,  9.6191e-02],
          ...,
          [-3.5547e-01,  3.8477e-01,  3.2812e-01,  ...,  1.9141e+00,
           -1.9531e+00, -2.9297e-01],
          [ 4.5898e-02, -2.5781e-01,  3.3789e-01,  ..., -6.3281e-01,
           -2.4688e+00, -3.1445e-01],
          [-2.5391e-01, -1.0010e-01,  4.1602e-01,  ...,  1.2695e-01,
           -2.5156e+00,  8.6719e-01]],

         ...,

         [[-1.9727e-01, -1.3086e-01,  2.7771e-03,  ...,  1.4844e+00,
           -7.6562e-01,  7.6172e-01],
          [-1.9727e-01, -1.3086e-01,  2.7771e-03,  ...,  1.4844e+00,
           -7.6562e-01,  7.6172e-01],
          [-1.1084e-01,  9.4238e-02,  1.4526e-02,  ...,  2.5513e-02,
            3.1494e-02, -1.0693e-01],
          ...,
          [-1.2031e+00,  6.5234e-01, -2.4902e-02,  ..., -1.3516e+00,
            6.4062e-01, -1.6484e+00],
          [-1.7500e+00,  1.3672e+00,  2.8516e-01,  ..., -1.5703e+00,
            1.4688e+00, -1.4062e+00],
          [-1.4453e+00,  7.5781e-01,  1.6309e-01,  ..., -1.5078e+00,
            7.0312e-01, -8.4766e-01]],

         [[-4.9072e-02, -8.0078e-02,  4.7363e-02,  ...,  7.1094e-01,
           -4.9805e-01,  3.8477e-01],
          [-4.9072e-02, -8.0078e-02,  4.7363e-02,  ...,  7.1094e-01,
           -4.9805e-01,  3.8477e-01],
          [-1.6113e-01, -2.0410e-01,  2.3047e-01,  ..., -1.3672e-01,
            1.4551e-01, -8.8379e-02],
          ...,
          [-3.2188e+00, -2.9062e+00,  3.4688e+00,  ..., -6.4062e-01,
            1.5469e+00, -2.8125e+00],
          [-6.0312e+00, -5.6250e+00,  4.3125e+00,  ..., -1.2969e+00,
            2.7188e+00, -2.8750e+00],
          [-4.6250e+00, -4.5000e+00,  4.5938e+00,  ..., -5.0781e-01,
            2.0625e+00, -2.2812e+00]],

         [[-1.6724e-02, -1.0889e-01, -7.8735e-03,  ...,  2.4219e+00,
            1.7031e+00,  1.7812e+00],
          [-1.6724e-02, -1.0889e-01, -7.8735e-03,  ...,  2.4219e+00,
            1.7031e+00,  1.7812e+00],
          [-1.0010e-02, -1.2598e-01,  6.2500e-02,  ..., -3.2471e-02,
           -8.2031e-02,  4.5898e-02],
          ...,
          [ 7.6953e-01, -2.8281e+00,  7.2656e-01,  ..., -9.4141e-01,
           -1.3750e+00, -4.2383e-01],
          [ 8.5938e-01, -3.2344e+00,  9.2969e-01,  ..., -9.8828e-01,
           -1.2734e+00, -4.0625e-01],
          [ 5.8594e-01, -2.7656e+00,  5.4688e-01,  ..., -9.6484e-01,
           -1.4375e+00, -6.4844e-01]]]], device='cuda:0', dtype=torch.bfloat16)
Output 5: {'pred': ' B', 'chunk_ppl': [13.721500396728516], 'total_ppl': 13.721500396728516}
6it [05:39, 56.40s/it]Chunk: 1/0, ppl: 11.084712982177734, time: 1.76s
Initial tokens: tensor([[[[ 5.5859e-01,  9.8438e-01,  1.0625e+00,  ...,  1.3281e+00,
           -9.1797e-02,  4.1602e-01],
          [ 5.5859e-01,  9.8438e-01,  1.0625e+00,  ...,  1.3281e+00,
           -9.1797e-02,  4.1602e-01],
          [ 4.6875e-01,  7.4707e-02,  4.0283e-02,  ...,  4.4189e-02,
           -1.1719e-01, -1.4941e-01],
          ...,
          [ 6.9375e+00,  3.4531e+00,  2.5469e+00,  ...,  6.4062e-01,
           -1.9141e+00, -1.8281e+00],
          [ 7.3438e+00,  3.2344e+00,  1.5156e+00,  ...,  1.3438e+00,
           -1.7109e+00, -1.5078e+00],
          [ 6.0625e+00,  3.3281e+00,  2.1094e+00,  ...,  1.6211e-01,
           -1.8906e+00, -1.5781e+00]],

         [[ 1.7822e-02, -7.5195e-02,  1.9653e-02,  ..., -1.1953e+00,
            8.2031e-01,  6.0303e-02],
          [ 1.7822e-02, -7.5195e-02,  1.9653e-02,  ..., -1.1953e+00,
            8.2031e-01,  6.0303e-02],
          [-5.2979e-02, -4.6631e-02,  6.4453e-02,  ...,  9.0332e-02,
           -7.4219e-02, -1.3281e-01],
          ...,
          [-1.8438e+00, -1.2578e+00,  1.1406e+00,  ...,  1.6797e+00,
           -1.7578e+00, -1.2812e+00],
          [-6.7578e-01, -1.6953e+00,  1.2422e+00,  ...,  1.5781e+00,
           -1.9297e+00, -1.6875e+00],
          [-1.4844e+00, -1.5625e+00,  1.4688e+00,  ...,  1.5547e+00,
           -2.2812e+00, -7.9688e-01]],

         [[ 6.6406e-02, -5.2979e-02, -3.8574e-02,  ...,  2.8906e-01,
            1.8984e+00, -9.9219e-01],
          [ 6.6406e-02, -5.2979e-02, -3.8574e-02,  ...,  2.8906e-01,
            1.8984e+00, -9.9219e-01],
          [ 2.1729e-02, -2.9785e-02, -2.4536e-02,  ..., -6.7871e-02,
           -1.3770e-01,  9.6191e-02],
          ...,
          [-3.5547e-01,  3.8477e-01,  3.2812e-01,  ...,  1.9141e+00,
           -1.9531e+00, -2.9297e-01],
          [ 4.5898e-02, -2.5781e-01,  3.3789e-01,  ..., -6.3281e-01,
           -2.4688e+00, -3.1445e-01],
          [-2.5391e-01, -1.0010e-01,  4.1602e-01,  ...,  1.2695e-01,
           -2.5156e+00,  8.6719e-01]],

         ...,

         [[-1.9727e-01, -1.3086e-01,  2.7771e-03,  ...,  1.4844e+00,
           -7.6562e-01,  7.6172e-01],
          [-1.9727e-01, -1.3086e-01,  2.7771e-03,  ...,  1.4844e+00,
           -7.6562e-01,  7.6172e-01],
          [-1.1084e-01,  9.4238e-02,  1.4526e-02,  ...,  2.5513e-02,
            3.1494e-02, -1.0693e-01],
          ...,
          [-1.2031e+00,  6.5234e-01, -2.4902e-02,  ..., -1.3516e+00,
            6.4062e-01, -1.6484e+00],
          [-1.7500e+00,  1.3672e+00,  2.8516e-01,  ..., -1.5703e+00,
            1.4688e+00, -1.4062e+00],
          [-1.4453e+00,  7.5781e-01,  1.6309e-01,  ..., -1.5078e+00,
            7.0312e-01, -8.4766e-01]],

         [[-4.9072e-02, -8.0078e-02,  4.7363e-02,  ...,  7.1094e-01,
           -4.9805e-01,  3.8477e-01],
          [-4.9072e-02, -8.0078e-02,  4.7363e-02,  ...,  7.1094e-01,
           -4.9805e-01,  3.8477e-01],
          [-1.6113e-01, -2.0410e-01,  2.3047e-01,  ..., -1.3672e-01,
            1.4551e-01, -8.8379e-02],
          ...,
          [-3.2188e+00, -2.9062e+00,  3.4688e+00,  ..., -6.4062e-01,
            1.5469e+00, -2.8125e+00],
          [-6.0312e+00, -5.6250e+00,  4.3125e+00,  ..., -1.2969e+00,
            2.7188e+00, -2.8750e+00],
          [-4.6250e+00, -4.5000e+00,  4.5938e+00,  ..., -5.0781e-01,
            2.0625e+00, -2.2812e+00]],

         [[-1.6724e-02, -1.0889e-01, -7.8735e-03,  ...,  2.4219e+00,
            1.7031e+00,  1.7812e+00],
          [-1.6724e-02, -1.0889e-01, -7.8735e-03,  ...,  2.4219e+00,
            1.7031e+00,  1.7812e+00],
          [-1.0010e-02, -1.2598e-01,  6.2500e-02,  ..., -3.2471e-02,
           -8.2031e-02,  4.5898e-02],
          ...,
          [ 7.6953e-01, -2.8281e+00,  7.2656e-01,  ..., -9.4141e-01,
           -1.3750e+00, -4.2383e-01],
          [ 8.5938e-01, -3.2344e+00,  9.2969e-01,  ..., -9.8828e-01,
           -1.2734e+00, -4.0625e-01],
          [ 5.8594e-01, -2.7656e+00,  5.4688e-01,  ..., -9.6484e-01,
           -1.4375e+00, -6.4844e-01]]]], device='cuda:0', dtype=torch.bfloat16)
Output 6: {'pred': ' A', 'chunk_ppl': [11.084712982177734], 'total_ppl': 11.084712982177734}
7it [06:34, 55.66s/it]Chunk: 1/0, ppl: 14.174595832824707, time: 2.55s
Initial tokens: tensor([[[[ 5.5859e-01,  9.8438e-01,  1.0625e+00,  ...,  1.3281e+00,
           -9.1797e-02,  4.1602e-01],
          [ 5.5859e-01,  9.8438e-01,  1.0625e+00,  ...,  1.3281e+00,
           -9.1797e-02,  4.1602e-01],
          [ 4.6875e-01,  7.4707e-02,  4.0283e-02,  ...,  4.4189e-02,
           -1.1719e-01, -1.4941e-01],
          ...,
          [ 6.9375e+00,  3.4531e+00,  2.5469e+00,  ...,  6.4062e-01,
           -1.9141e+00, -1.8281e+00],
          [ 7.3438e+00,  3.2344e+00,  1.5156e+00,  ...,  1.3438e+00,
           -1.7109e+00, -1.5078e+00],
          [ 6.0625e+00,  3.3281e+00,  2.1094e+00,  ...,  1.6211e-01,
           -1.8906e+00, -1.5781e+00]],

         [[ 1.7822e-02, -7.5195e-02,  1.9653e-02,  ..., -1.1953e+00,
            8.2031e-01,  6.0303e-02],
          [ 1.7822e-02, -7.5195e-02,  1.9653e-02,  ..., -1.1953e+00,
            8.2031e-01,  6.0303e-02],
          [-5.2979e-02, -4.6631e-02,  6.4453e-02,  ...,  9.0332e-02,
           -7.4219e-02, -1.3281e-01],
          ...,
          [-1.8438e+00, -1.2578e+00,  1.1406e+00,  ...,  1.6797e+00,
           -1.7578e+00, -1.2812e+00],
          [-6.7578e-01, -1.6953e+00,  1.2422e+00,  ...,  1.5781e+00,
           -1.9297e+00, -1.6875e+00],
          [-1.4844e+00, -1.5625e+00,  1.4688e+00,  ...,  1.5547e+00,
           -2.2812e+00, -7.9688e-01]],

         [[ 6.6406e-02, -5.2979e-02, -3.8574e-02,  ...,  2.8906e-01,
            1.8984e+00, -9.9219e-01],
          [ 6.6406e-02, -5.2979e-02, -3.8574e-02,  ...,  2.8906e-01,
            1.8984e+00, -9.9219e-01],
          [ 2.1729e-02, -2.9785e-02, -2.4536e-02,  ..., -6.7871e-02,
           -1.3770e-01,  9.6191e-02],
          ...,
          [-3.5547e-01,  3.8477e-01,  3.2812e-01,  ...,  1.9141e+00,
           -1.9531e+00, -2.9297e-01],
          [ 4.5898e-02, -2.5781e-01,  3.3789e-01,  ..., -6.3281e-01,
           -2.4688e+00, -3.1445e-01],
          [-2.5391e-01, -1.0010e-01,  4.1602e-01,  ...,  1.2695e-01,
           -2.5156e+00,  8.6719e-01]],

         ...,

         [[-1.9727e-01, -1.3086e-01,  2.7771e-03,  ...,  1.4844e+00,
           -7.6562e-01,  7.6172e-01],
          [-1.9727e-01, -1.3086e-01,  2.7771e-03,  ...,  1.4844e+00,
           -7.6562e-01,  7.6172e-01],
          [-1.1084e-01,  9.4238e-02,  1.4526e-02,  ...,  2.5513e-02,
            3.1494e-02, -1.0693e-01],
          ...,
          [-1.2031e+00,  6.5234e-01, -2.4902e-02,  ..., -1.3516e+00,
            6.4062e-01, -1.6484e+00],
          [-1.7500e+00,  1.3672e+00,  2.8516e-01,  ..., -1.5703e+00,
            1.4688e+00, -1.4062e+00],
          [-1.4453e+00,  7.5781e-01,  1.6309e-01,  ..., -1.5078e+00,
            7.0312e-01, -8.4766e-01]],

         [[-4.9072e-02, -8.0078e-02,  4.7363e-02,  ...,  7.1094e-01,
           -4.9805e-01,  3.8477e-01],
          [-4.9072e-02, -8.0078e-02,  4.7363e-02,  ...,  7.1094e-01,
           -4.9805e-01,  3.8477e-01],
          [-1.6113e-01, -2.0410e-01,  2.3047e-01,  ..., -1.3672e-01,
            1.4551e-01, -8.8379e-02],
          ...,
          [-3.2188e+00, -2.9062e+00,  3.4688e+00,  ..., -6.4062e-01,
            1.5469e+00, -2.8125e+00],
          [-6.0312e+00, -5.6250e+00,  4.3125e+00,  ..., -1.2969e+00,
            2.7188e+00, -2.8750e+00],
          [-4.6250e+00, -4.5000e+00,  4.5938e+00,  ..., -5.0781e-01,
            2.0625e+00, -2.2812e+00]],

         [[-1.6724e-02, -1.0889e-01, -7.8735e-03,  ...,  2.4219e+00,
            1.7031e+00,  1.7812e+00],
          [-1.6724e-02, -1.0889e-01, -7.8735e-03,  ...,  2.4219e+00,
            1.7031e+00,  1.7812e+00],
          [-1.0010e-02, -1.2598e-01,  6.2500e-02,  ..., -3.2471e-02,
           -8.2031e-02,  4.5898e-02],
          ...,
          [ 7.6953e-01, -2.8281e+00,  7.2656e-01,  ..., -9.4141e-01,
           -1.3750e+00, -4.2383e-01],
          [ 8.5938e-01, -3.2344e+00,  9.2969e-01,  ..., -9.8828e-01,
           -1.2734e+00, -4.0625e-01],
          [ 5.8594e-01, -2.7656e+00,  5.4688e-01,  ..., -9.6484e-01,
           -1.4375e+00, -6.4844e-01]]]], device='cuda:0', dtype=torch.bfloat16)
Output 7: {'pred': ' B', 'chunk_ppl': [14.174595832824707], 'total_ppl': 14.174595832824707}
8it [07:24, 54.05s/it]Chunk: 1/0, ppl: 14.266956329345703, time: 2.41s
Initial tokens: tensor([[[[ 5.5859e-01,  9.8438e-01,  1.0625e+00,  ...,  1.3281e+00,
           -9.1797e-02,  4.1602e-01],
          [ 5.5859e-01,  9.8438e-01,  1.0625e+00,  ...,  1.3281e+00,
           -9.1797e-02,  4.1602e-01],
          [ 4.6875e-01,  7.4707e-02,  4.0283e-02,  ...,  4.4189e-02,
           -1.1719e-01, -1.4941e-01],
          ...,
          [ 6.9375e+00,  3.4531e+00,  2.5469e+00,  ...,  6.4062e-01,
           -1.9141e+00, -1.8281e+00],
          [ 7.3438e+00,  3.2344e+00,  1.5156e+00,  ...,  1.3438e+00,
           -1.7109e+00, -1.5078e+00],
          [ 6.0625e+00,  3.3281e+00,  2.1094e+00,  ...,  1.6211e-01,
           -1.8906e+00, -1.5781e+00]],

         [[ 1.7822e-02, -7.5195e-02,  1.9653e-02,  ..., -1.1953e+00,
            8.2031e-01,  6.0303e-02],
          [ 1.7822e-02, -7.5195e-02,  1.9653e-02,  ..., -1.1953e+00,
            8.2031e-01,  6.0303e-02],
          [-5.2979e-02, -4.6631e-02,  6.4453e-02,  ...,  9.0332e-02,
           -7.4219e-02, -1.3281e-01],
          ...,
          [-1.8438e+00, -1.2578e+00,  1.1406e+00,  ...,  1.6797e+00,
           -1.7578e+00, -1.2812e+00],
          [-6.7578e-01, -1.6953e+00,  1.2422e+00,  ...,  1.5781e+00,
           -1.9297e+00, -1.6875e+00],
          [-1.4844e+00, -1.5625e+00,  1.4688e+00,  ...,  1.5547e+00,
           -2.2812e+00, -7.9688e-01]],

         [[ 6.6406e-02, -5.2979e-02, -3.8574e-02,  ...,  2.8906e-01,
            1.8984e+00, -9.9219e-01],
          [ 6.6406e-02, -5.2979e-02, -3.8574e-02,  ...,  2.8906e-01,
            1.8984e+00, -9.9219e-01],
          [ 2.1729e-02, -2.9785e-02, -2.4536e-02,  ..., -6.7871e-02,
           -1.3770e-01,  9.6191e-02],
          ...,
          [-3.5547e-01,  3.8477e-01,  3.2812e-01,  ...,  1.9141e+00,
           -1.9531e+00, -2.9297e-01],
          [ 4.5898e-02, -2.5781e-01,  3.3789e-01,  ..., -6.3281e-01,
           -2.4688e+00, -3.1445e-01],
          [-2.5391e-01, -1.0010e-01,  4.1602e-01,  ...,  1.2695e-01,
           -2.5156e+00,  8.6719e-01]],

         ...,

         [[-1.9727e-01, -1.3086e-01,  2.7771e-03,  ...,  1.4844e+00,
           -7.6562e-01,  7.6172e-01],
          [-1.9727e-01, -1.3086e-01,  2.7771e-03,  ...,  1.4844e+00,
           -7.6562e-01,  7.6172e-01],
          [-1.1084e-01,  9.4238e-02,  1.4526e-02,  ...,  2.5513e-02,
            3.1494e-02, -1.0693e-01],
          ...,
          [-1.2031e+00,  6.5234e-01, -2.4902e-02,  ..., -1.3516e+00,
            6.4062e-01, -1.6484e+00],
          [-1.7500e+00,  1.3672e+00,  2.8516e-01,  ..., -1.5703e+00,
            1.4688e+00, -1.4062e+00],
          [-1.4453e+00,  7.5781e-01,  1.6309e-01,  ..., -1.5078e+00,
            7.0312e-01, -8.4766e-01]],

         [[-4.9072e-02, -8.0078e-02,  4.7363e-02,  ...,  7.1094e-01,
           -4.9805e-01,  3.8477e-01],
          [-4.9072e-02, -8.0078e-02,  4.7363e-02,  ...,  7.1094e-01,
           -4.9805e-01,  3.8477e-01],
          [-1.6113e-01, -2.0410e-01,  2.3047e-01,  ..., -1.3672e-01,
            1.4551e-01, -8.8379e-02],
          ...,
          [-3.2188e+00, -2.9062e+00,  3.4688e+00,  ..., -6.4062e-01,
            1.5469e+00, -2.8125e+00],
          [-6.0312e+00, -5.6250e+00,  4.3125e+00,  ..., -1.2969e+00,
            2.7188e+00, -2.8750e+00],
          [-4.6250e+00, -4.5000e+00,  4.5938e+00,  ..., -5.0781e-01,
            2.0625e+00, -2.2812e+00]],

         [[-1.6724e-02, -1.0889e-01, -7.8735e-03,  ...,  2.4219e+00,
            1.7031e+00,  1.7812e+00],
          [-1.6724e-02, -1.0889e-01, -7.8735e-03,  ...,  2.4219e+00,
            1.7031e+00,  1.7812e+00],
          [-1.0010e-02, -1.2598e-01,  6.2500e-02,  ..., -3.2471e-02,
           -8.2031e-02,  4.5898e-02],
          ...,
          [ 7.6953e-01, -2.8281e+00,  7.2656e-01,  ..., -9.4141e-01,
           -1.3750e+00, -4.2383e-01],
          [ 8.5938e-01, -3.2344e+00,  9.2969e-01,  ..., -9.8828e-01,
           -1.2734e+00, -4.0625e-01],
          [ 5.8594e-01, -2.7656e+00,  5.4688e-01,  ..., -9.6484e-01,
           -1.4375e+00, -6.4844e-01]]]], device='cuda:0', dtype=torch.bfloat16)
Output 8: {'pred': ' B', 'chunk_ppl': [14.266956329345703], 'total_ppl': 14.266956329345703}
9it [08:19, 54.28s/it]Chunk: 1/0, ppl: 14.39731216430664, time: 2.46s
Initial tokens: tensor([[[[ 5.5859e-01,  9.8438e-01,  1.0625e+00,  ...,  1.3281e+00,
           -9.1797e-02,  4.1602e-01],
          [ 5.5859e-01,  9.8438e-01,  1.0625e+00,  ...,  1.3281e+00,
           -9.1797e-02,  4.1602e-01],
          [ 4.6875e-01,  7.4707e-02,  4.0283e-02,  ...,  4.4189e-02,
           -1.1719e-01, -1.4941e-01],
          ...,
          [ 6.9375e+00,  3.4531e+00,  2.5469e+00,  ...,  6.4062e-01,
           -1.9141e+00, -1.8281e+00],
          [ 7.3438e+00,  3.2344e+00,  1.5156e+00,  ...,  1.3438e+00,
           -1.7109e+00, -1.5078e+00],
          [ 6.0625e+00,  3.3281e+00,  2.1094e+00,  ...,  1.6211e-01,
           -1.8906e+00, -1.5781e+00]],

         [[ 1.7822e-02, -7.5195e-02,  1.9653e-02,  ..., -1.1953e+00,
            8.2031e-01,  6.0303e-02],
          [ 1.7822e-02, -7.5195e-02,  1.9653e-02,  ..., -1.1953e+00,
            8.2031e-01,  6.0303e-02],
          [-5.2979e-02, -4.6631e-02,  6.4453e-02,  ...,  9.0332e-02,
           -7.4219e-02, -1.3281e-01],
          ...,
          [-1.8438e+00, -1.2578e+00,  1.1406e+00,  ...,  1.6797e+00,
           -1.7578e+00, -1.2812e+00],
          [-6.7578e-01, -1.6953e+00,  1.2422e+00,  ...,  1.5781e+00,
           -1.9297e+00, -1.6875e+00],
          [-1.4844e+00, -1.5625e+00,  1.4688e+00,  ...,  1.5547e+00,
           -2.2812e+00, -7.9688e-01]],

         [[ 6.6406e-02, -5.2979e-02, -3.8574e-02,  ...,  2.8906e-01,
            1.8984e+00, -9.9219e-01],
          [ 6.6406e-02, -5.2979e-02, -3.8574e-02,  ...,  2.8906e-01,
            1.8984e+00, -9.9219e-01],
          [ 2.1729e-02, -2.9785e-02, -2.4536e-02,  ..., -6.7871e-02,
           -1.3770e-01,  9.6191e-02],
          ...,
          [-3.5547e-01,  3.8477e-01,  3.2812e-01,  ...,  1.9141e+00,
           -1.9531e+00, -2.9297e-01],
          [ 4.5898e-02, -2.5781e-01,  3.3789e-01,  ..., -6.3281e-01,
           -2.4688e+00, -3.1445e-01],
          [-2.5391e-01, -1.0010e-01,  4.1602e-01,  ...,  1.2695e-01,
           -2.5156e+00,  8.6719e-01]],

         ...,

         [[-1.9727e-01, -1.3086e-01,  2.7771e-03,  ...,  1.4844e+00,
           -7.6562e-01,  7.6172e-01],
          [-1.9727e-01, -1.3086e-01,  2.7771e-03,  ...,  1.4844e+00,
           -7.6562e-01,  7.6172e-01],
          [-1.1084e-01,  9.4238e-02,  1.4526e-02,  ...,  2.5513e-02,
            3.1494e-02, -1.0693e-01],
          ...,
          [-1.2031e+00,  6.5234e-01, -2.4902e-02,  ..., -1.3516e+00,
            6.4062e-01, -1.6484e+00],
          [-1.7500e+00,  1.3672e+00,  2.8516e-01,  ..., -1.5703e+00,
            1.4688e+00, -1.4062e+00],
          [-1.4453e+00,  7.5781e-01,  1.6309e-01,  ..., -1.5078e+00,
            7.0312e-01, -8.4766e-01]],

         [[-4.9072e-02, -8.0078e-02,  4.7363e-02,  ...,  7.1094e-01,
           -4.9805e-01,  3.8477e-01],
          [-4.9072e-02, -8.0078e-02,  4.7363e-02,  ...,  7.1094e-01,
           -4.9805e-01,  3.8477e-01],
          [-1.6113e-01, -2.0410e-01,  2.3047e-01,  ..., -1.3672e-01,
            1.4551e-01, -8.8379e-02],
          ...,
          [-3.2188e+00, -2.9062e+00,  3.4688e+00,  ..., -6.4062e-01,
            1.5469e+00, -2.8125e+00],
          [-6.0312e+00, -5.6250e+00,  4.3125e+00,  ..., -1.2969e+00,
            2.7188e+00, -2.8750e+00],
          [-4.6250e+00, -4.5000e+00,  4.5938e+00,  ..., -5.0781e-01,
            2.0625e+00, -2.2812e+00]],

         [[-1.6724e-02, -1.0889e-01, -7.8735e-03,  ...,  2.4219e+00,
            1.7031e+00,  1.7812e+00],
          [-1.6724e-02, -1.0889e-01, -7.8735e-03,  ...,  2.4219e+00,
            1.7031e+00,  1.7812e+00],
          [-1.0010e-02, -1.2598e-01,  6.2500e-02,  ..., -3.2471e-02,
           -8.2031e-02,  4.5898e-02],
          ...,
          [ 7.6953e-01, -2.8281e+00,  7.2656e-01,  ..., -9.4141e-01,
           -1.3750e+00, -4.2383e-01],
          [ 8.5938e-01, -3.2344e+00,  9.2969e-01,  ..., -9.8828e-01,
           -1.2734e+00, -4.0625e-01],
          [ 5.8594e-01, -2.7656e+00,  5.4688e-01,  ..., -9.6484e-01,
           -1.4375e+00, -6.4844e-01]]]], device='cuda:0', dtype=torch.bfloat16)
Output 9: {'pred': ' B', 'chunk_ppl': [14.39731216430664], 'total_ppl': 14.39731216430664}
10it [09:09, 54.96s/it]
Editor is loading...
Leave a Comment