Untitled
unknown
plain_text
24 days ago
42 kB
8
Indexable
Answer: Segment Chunk: 1/0, ppl: 9.312779426574707, time: 0.95s Initial tokens: tensor([[[[ 5.5859e-01, 9.8438e-01, 1.0625e+00, ..., 1.3281e+00, -9.1797e-02, 4.1602e-01], [ 5.5859e-01, 9.8438e-01, 1.0625e+00, ..., 1.3281e+00, -9.1797e-02, 4.1602e-01], [ 4.6875e-01, 7.4707e-02, 4.0283e-02, ..., 4.4189e-02, -1.1719e-01, -1.4941e-01], ..., [ 6.9375e+00, 3.4531e+00, 2.5469e+00, ..., 6.4062e-01, -1.9141e+00, -1.8281e+00], [ 7.3438e+00, 3.2344e+00, 1.5156e+00, ..., 1.3438e+00, -1.7109e+00, -1.5078e+00], [ 6.0625e+00, 3.3281e+00, 2.1094e+00, ..., 1.6211e-01, -1.8906e+00, -1.5781e+00]], [[ 1.7822e-02, -7.5195e-02, 1.9653e-02, ..., -1.1953e+00, 8.2031e-01, 6.0303e-02], [ 1.7822e-02, -7.5195e-02, 1.9653e-02, ..., -1.1953e+00, 8.2031e-01, 6.0303e-02], [-5.2979e-02, -4.6631e-02, 6.4453e-02, ..., 9.0332e-02, -7.4219e-02, -1.3281e-01], ..., [-1.8438e+00, -1.2578e+00, 1.1406e+00, ..., 1.6797e+00, -1.7578e+00, -1.2812e+00], [-6.7578e-01, -1.6953e+00, 1.2422e+00, ..., 1.5781e+00, -1.9297e+00, -1.6875e+00], [-1.4844e+00, -1.5625e+00, 1.4688e+00, ..., 1.5547e+00, -2.2812e+00, -7.9688e-01]], [[ 6.6406e-02, -5.2979e-02, -3.8574e-02, ..., 2.8906e-01, 1.8984e+00, -9.9219e-01], [ 6.6406e-02, -5.2979e-02, -3.8574e-02, ..., 2.8906e-01, 1.8984e+00, -9.9219e-01], [ 2.1729e-02, -2.9785e-02, -2.4536e-02, ..., -6.7871e-02, -1.3770e-01, 9.6191e-02], ..., [-3.5547e-01, 3.8477e-01, 3.2812e-01, ..., 1.9141e+00, -1.9531e+00, -2.9297e-01], [ 4.5898e-02, -2.5781e-01, 3.3789e-01, ..., -6.3281e-01, -2.4688e+00, -3.1445e-01], [-2.5391e-01, -1.0010e-01, 4.1602e-01, ..., 1.2695e-01, -2.5156e+00, 8.6719e-01]], ..., [[-1.9727e-01, -1.3086e-01, 2.7771e-03, ..., 1.4844e+00, -7.6562e-01, 7.6172e-01], [-1.9727e-01, -1.3086e-01, 2.7771e-03, ..., 1.4844e+00, -7.6562e-01, 7.6172e-01], [-1.1084e-01, 9.4238e-02, 1.4526e-02, ..., 2.5513e-02, 3.1494e-02, -1.0693e-01], ..., [-1.2031e+00, 6.5234e-01, -2.4902e-02, ..., -1.3516e+00, 6.4062e-01, -1.6484e+00], [-1.7500e+00, 1.3672e+00, 2.8516e-01, ..., -1.5703e+00, 1.4688e+00, -1.4062e+00], [-1.4453e+00, 7.5781e-01, 1.6309e-01, ..., -1.5078e+00, 7.0312e-01, -8.4766e-01]], [[-4.9072e-02, -8.0078e-02, 4.7363e-02, ..., 7.1094e-01, -4.9805e-01, 3.8477e-01], [-4.9072e-02, -8.0078e-02, 4.7363e-02, ..., 7.1094e-01, -4.9805e-01, 3.8477e-01], [-1.6113e-01, -2.0410e-01, 2.3047e-01, ..., -1.3672e-01, 1.4551e-01, -8.8379e-02], ..., [-3.2188e+00, -2.9062e+00, 3.4688e+00, ..., -6.4062e-01, 1.5469e+00, -2.8125e+00], [-6.0312e+00, -5.6250e+00, 4.3125e+00, ..., -1.2969e+00, 2.7188e+00, -2.8750e+00], [-4.6250e+00, -4.5000e+00, 4.5938e+00, ..., -5.0781e-01, 2.0625e+00, -2.2812e+00]], [[-1.6724e-02, -1.0889e-01, -7.8735e-03, ..., 2.4219e+00, 1.7031e+00, 1.7812e+00], [-1.6724e-02, -1.0889e-01, -7.8735e-03, ..., 2.4219e+00, 1.7031e+00, 1.7812e+00], [-1.0010e-02, -1.2598e-01, 6.2500e-02, ..., -3.2471e-02, -8.2031e-02, 4.5898e-02], ..., [ 7.6953e-01, -2.8281e+00, 7.2656e-01, ..., -9.4141e-01, -1.3750e+00, -4.2383e-01], [ 8.5938e-01, -3.2344e+00, 9.2969e-01, ..., -9.8828e-01, -1.2734e+00, -4.0625e-01], [ 5.8594e-01, -2.7656e+00, 5.4688e-01, ..., -9.6484e-01, -1.4375e+00, -6.4844e-01]]]], device='cuda:0', dtype=torch.bfloat16) Output 0: {'pred': ' B', 'chunk_ppl': [9.312779426574707], 'total_ppl': 9.312779426574707} 1it [00:54, 54.40s/it]Chunk: 1/0, ppl: 8.38564682006836, time: 2.39s Initial tokens: tensor([[[[ 5.5859e-01, 9.8438e-01, 1.0625e+00, ..., 1.3281e+00, -9.1797e-02, 4.1602e-01], [ 5.5859e-01, 9.8438e-01, 1.0625e+00, ..., 1.3281e+00, -9.1797e-02, 4.1602e-01], [ 4.6875e-01, 7.4707e-02, 4.0283e-02, ..., 4.4189e-02, -1.1719e-01, -1.4941e-01], ..., [ 6.9375e+00, 3.4531e+00, 2.5469e+00, ..., 6.4062e-01, -1.9141e+00, -1.8281e+00], [ 7.3438e+00, 3.2344e+00, 1.5156e+00, ..., 1.3438e+00, -1.7109e+00, -1.5078e+00], [ 6.0625e+00, 3.3281e+00, 2.1094e+00, ..., 1.6211e-01, -1.8906e+00, -1.5781e+00]], [[ 1.7822e-02, -7.5195e-02, 1.9653e-02, ..., -1.1953e+00, 8.2031e-01, 6.0303e-02], [ 1.7822e-02, -7.5195e-02, 1.9653e-02, ..., -1.1953e+00, 8.2031e-01, 6.0303e-02], [-5.2979e-02, -4.6631e-02, 6.4453e-02, ..., 9.0332e-02, -7.4219e-02, -1.3281e-01], ..., [-1.8438e+00, -1.2578e+00, 1.1406e+00, ..., 1.6797e+00, -1.7578e+00, -1.2812e+00], [-6.7578e-01, -1.6953e+00, 1.2422e+00, ..., 1.5781e+00, -1.9297e+00, -1.6875e+00], [-1.4844e+00, -1.5625e+00, 1.4688e+00, ..., 1.5547e+00, -2.2812e+00, -7.9688e-01]], [[ 6.6406e-02, -5.2979e-02, -3.8574e-02, ..., 2.8906e-01, 1.8984e+00, -9.9219e-01], [ 6.6406e-02, -5.2979e-02, -3.8574e-02, ..., 2.8906e-01, 1.8984e+00, -9.9219e-01], [ 2.1729e-02, -2.9785e-02, -2.4536e-02, ..., -6.7871e-02, -1.3770e-01, 9.6191e-02], ..., [-3.5547e-01, 3.8477e-01, 3.2812e-01, ..., 1.9141e+00, -1.9531e+00, -2.9297e-01], [ 4.5898e-02, -2.5781e-01, 3.3789e-01, ..., -6.3281e-01, -2.4688e+00, -3.1445e-01], [-2.5391e-01, -1.0010e-01, 4.1602e-01, ..., 1.2695e-01, -2.5156e+00, 8.6719e-01]], ..., [[-1.9727e-01, -1.3086e-01, 2.7771e-03, ..., 1.4844e+00, -7.6562e-01, 7.6172e-01], [-1.9727e-01, -1.3086e-01, 2.7771e-03, ..., 1.4844e+00, -7.6562e-01, 7.6172e-01], [-1.1084e-01, 9.4238e-02, 1.4526e-02, ..., 2.5513e-02, 3.1494e-02, -1.0693e-01], ..., [-1.2031e+00, 6.5234e-01, -2.4902e-02, ..., -1.3516e+00, 6.4062e-01, -1.6484e+00], [-1.7500e+00, 1.3672e+00, 2.8516e-01, ..., -1.5703e+00, 1.4688e+00, -1.4062e+00], [-1.4453e+00, 7.5781e-01, 1.6309e-01, ..., -1.5078e+00, 7.0312e-01, -8.4766e-01]], [[-4.9072e-02, -8.0078e-02, 4.7363e-02, ..., 7.1094e-01, -4.9805e-01, 3.8477e-01], [-4.9072e-02, -8.0078e-02, 4.7363e-02, ..., 7.1094e-01, -4.9805e-01, 3.8477e-01], [-1.6113e-01, -2.0410e-01, 2.3047e-01, ..., -1.3672e-01, 1.4551e-01, -8.8379e-02], ..., [-3.2188e+00, -2.9062e+00, 3.4688e+00, ..., -6.4062e-01, 1.5469e+00, -2.8125e+00], [-6.0312e+00, -5.6250e+00, 4.3125e+00, ..., -1.2969e+00, 2.7188e+00, -2.8750e+00], [-4.6250e+00, -4.5000e+00, 4.5938e+00, ..., -5.0781e-01, 2.0625e+00, -2.2812e+00]], [[-1.6724e-02, -1.0889e-01, -7.8735e-03, ..., 2.4219e+00, 1.7031e+00, 1.7812e+00], [-1.6724e-02, -1.0889e-01, -7.8735e-03, ..., 2.4219e+00, 1.7031e+00, 1.7812e+00], [-1.0010e-02, -1.2598e-01, 6.2500e-02, ..., -3.2471e-02, -8.2031e-02, 4.5898e-02], ..., [ 7.6953e-01, -2.8281e+00, 7.2656e-01, ..., -9.4141e-01, -1.3750e+00, -4.2383e-01], [ 8.5938e-01, -3.2344e+00, 9.2969e-01, ..., -9.8828e-01, -1.2734e+00, -4.0625e-01], [ 5.8594e-01, -2.7656e+00, 5.4688e-01, ..., -9.6484e-01, -1.4375e+00, -6.4844e-01]]]], device='cuda:0', dtype=torch.bfloat16) Output 1: {'pred': ' B', 'chunk_ppl': [8.38564682006836], 'total_ppl': 8.38564682006836} 2it [01:53, 56.93s/it]Chunk: 1/0, ppl: 12.36805534362793, time: 1.97s Initial tokens: tensor([[[[ 5.5859e-01, 9.8438e-01, 1.0625e+00, ..., 1.3281e+00, -9.1797e-02, 4.1602e-01], [ 5.5859e-01, 9.8438e-01, 1.0625e+00, ..., 1.3281e+00, -9.1797e-02, 4.1602e-01], [ 4.6875e-01, 7.4707e-02, 4.0283e-02, ..., 4.4189e-02, -1.1719e-01, -1.4941e-01], ..., [ 6.9375e+00, 3.4531e+00, 2.5469e+00, ..., 6.4062e-01, -1.9141e+00, -1.8281e+00], [ 7.3438e+00, 3.2344e+00, 1.5156e+00, ..., 1.3438e+00, -1.7109e+00, -1.5078e+00], [ 6.0625e+00, 3.3281e+00, 2.1094e+00, ..., 1.6211e-01, -1.8906e+00, -1.5781e+00]], [[ 1.7822e-02, -7.5195e-02, 1.9653e-02, ..., -1.1953e+00, 8.2031e-01, 6.0303e-02], [ 1.7822e-02, -7.5195e-02, 1.9653e-02, ..., -1.1953e+00, 8.2031e-01, 6.0303e-02], [-5.2979e-02, -4.6631e-02, 6.4453e-02, ..., 9.0332e-02, -7.4219e-02, -1.3281e-01], ..., [-1.8438e+00, -1.2578e+00, 1.1406e+00, ..., 1.6797e+00, -1.7578e+00, -1.2812e+00], [-6.7578e-01, -1.6953e+00, 1.2422e+00, ..., 1.5781e+00, -1.9297e+00, -1.6875e+00], [-1.4844e+00, -1.5625e+00, 1.4688e+00, ..., 1.5547e+00, -2.2812e+00, -7.9688e-01]], [[ 6.6406e-02, -5.2979e-02, -3.8574e-02, ..., 2.8906e-01, 1.8984e+00, -9.9219e-01], [ 6.6406e-02, -5.2979e-02, -3.8574e-02, ..., 2.8906e-01, 1.8984e+00, -9.9219e-01], [ 2.1729e-02, -2.9785e-02, -2.4536e-02, ..., -6.7871e-02, -1.3770e-01, 9.6191e-02], ..., [-3.5547e-01, 3.8477e-01, 3.2812e-01, ..., 1.9141e+00, -1.9531e+00, -2.9297e-01], [ 4.5898e-02, -2.5781e-01, 3.3789e-01, ..., -6.3281e-01, -2.4688e+00, -3.1445e-01], [-2.5391e-01, -1.0010e-01, 4.1602e-01, ..., 1.2695e-01, -2.5156e+00, 8.6719e-01]], ..., [[-1.9727e-01, -1.3086e-01, 2.7771e-03, ..., 1.4844e+00, -7.6562e-01, 7.6172e-01], [-1.9727e-01, -1.3086e-01, 2.7771e-03, ..., 1.4844e+00, -7.6562e-01, 7.6172e-01], [-1.1084e-01, 9.4238e-02, 1.4526e-02, ..., 2.5513e-02, 3.1494e-02, -1.0693e-01], ..., [-1.2031e+00, 6.5234e-01, -2.4902e-02, ..., -1.3516e+00, 6.4062e-01, -1.6484e+00], [-1.7500e+00, 1.3672e+00, 2.8516e-01, ..., -1.5703e+00, 1.4688e+00, -1.4062e+00], [-1.4453e+00, 7.5781e-01, 1.6309e-01, ..., -1.5078e+00, 7.0312e-01, -8.4766e-01]], [[-4.9072e-02, -8.0078e-02, 4.7363e-02, ..., 7.1094e-01, -4.9805e-01, 3.8477e-01], [-4.9072e-02, -8.0078e-02, 4.7363e-02, ..., 7.1094e-01, -4.9805e-01, 3.8477e-01], [-1.6113e-01, -2.0410e-01, 2.3047e-01, ..., -1.3672e-01, 1.4551e-01, -8.8379e-02], ..., [-3.2188e+00, -2.9062e+00, 3.4688e+00, ..., -6.4062e-01, 1.5469e+00, -2.8125e+00], [-6.0312e+00, -5.6250e+00, 4.3125e+00, ..., -1.2969e+00, 2.7188e+00, -2.8750e+00], [-4.6250e+00, -4.5000e+00, 4.5938e+00, ..., -5.0781e-01, 2.0625e+00, -2.2812e+00]], [[-1.6724e-02, -1.0889e-01, -7.8735e-03, ..., 2.4219e+00, 1.7031e+00, 1.7812e+00], [-1.6724e-02, -1.0889e-01, -7.8735e-03, ..., 2.4219e+00, 1.7031e+00, 1.7812e+00], [-1.0010e-02, -1.2598e-01, 6.2500e-02, ..., -3.2471e-02, -8.2031e-02, 4.5898e-02], ..., [ 7.6953e-01, -2.8281e+00, 7.2656e-01, ..., -9.4141e-01, -1.3750e+00, -4.2383e-01], [ 8.5938e-01, -3.2344e+00, 9.2969e-01, ..., -9.8828e-01, -1.2734e+00, -4.0625e-01], [ 5.8594e-01, -2.7656e+00, 5.4688e-01, ..., -9.6484e-01, -1.4375e+00, -6.4844e-01]]]], device='cuda:0', dtype=torch.bfloat16) Output 2: {'pred': ' B', 'chunk_ppl': [12.36805534362793], 'total_ppl': 12.36805534362793} 3it [02:50, 57.26s/it]Chunk: 1/0, ppl: 16.007787704467773, time: 2.4s Initial tokens: tensor([[[[ 5.5859e-01, 9.8438e-01, 1.0625e+00, ..., 1.3281e+00, -9.1797e-02, 4.1602e-01], [ 5.5859e-01, 9.8438e-01, 1.0625e+00, ..., 1.3281e+00, -9.1797e-02, 4.1602e-01], [ 4.6875e-01, 7.4707e-02, 4.0283e-02, ..., 4.4189e-02, -1.1719e-01, -1.4941e-01], ..., [ 6.9375e+00, 3.4531e+00, 2.5469e+00, ..., 6.4062e-01, -1.9141e+00, -1.8281e+00], [ 7.3438e+00, 3.2344e+00, 1.5156e+00, ..., 1.3438e+00, -1.7109e+00, -1.5078e+00], [ 6.0625e+00, 3.3281e+00, 2.1094e+00, ..., 1.6211e-01, -1.8906e+00, -1.5781e+00]], [[ 1.7822e-02, -7.5195e-02, 1.9653e-02, ..., -1.1953e+00, 8.2031e-01, 6.0303e-02], [ 1.7822e-02, -7.5195e-02, 1.9653e-02, ..., -1.1953e+00, 8.2031e-01, 6.0303e-02], [-5.2979e-02, -4.6631e-02, 6.4453e-02, ..., 9.0332e-02, -7.4219e-02, -1.3281e-01], ..., [-1.8438e+00, -1.2578e+00, 1.1406e+00, ..., 1.6797e+00, -1.7578e+00, -1.2812e+00], [-6.7578e-01, -1.6953e+00, 1.2422e+00, ..., 1.5781e+00, -1.9297e+00, -1.6875e+00], [-1.4844e+00, -1.5625e+00, 1.4688e+00, ..., 1.5547e+00, -2.2812e+00, -7.9688e-01]], [[ 6.6406e-02, -5.2979e-02, -3.8574e-02, ..., 2.8906e-01, 1.8984e+00, -9.9219e-01], [ 6.6406e-02, -5.2979e-02, -3.8574e-02, ..., 2.8906e-01, 1.8984e+00, -9.9219e-01], [ 2.1729e-02, -2.9785e-02, -2.4536e-02, ..., -6.7871e-02, -1.3770e-01, 9.6191e-02], ..., [-3.5547e-01, 3.8477e-01, 3.2812e-01, ..., 1.9141e+00, -1.9531e+00, -2.9297e-01], [ 4.5898e-02, -2.5781e-01, 3.3789e-01, ..., -6.3281e-01, -2.4688e+00, -3.1445e-01], [-2.5391e-01, -1.0010e-01, 4.1602e-01, ..., 1.2695e-01, -2.5156e+00, 8.6719e-01]], ..., [[-1.9727e-01, -1.3086e-01, 2.7771e-03, ..., 1.4844e+00, -7.6562e-01, 7.6172e-01], [-1.9727e-01, -1.3086e-01, 2.7771e-03, ..., 1.4844e+00, -7.6562e-01, 7.6172e-01], [-1.1084e-01, 9.4238e-02, 1.4526e-02, ..., 2.5513e-02, 3.1494e-02, -1.0693e-01], ..., [-1.2031e+00, 6.5234e-01, -2.4902e-02, ..., -1.3516e+00, 6.4062e-01, -1.6484e+00], [-1.7500e+00, 1.3672e+00, 2.8516e-01, ..., -1.5703e+00, 1.4688e+00, -1.4062e+00], [-1.4453e+00, 7.5781e-01, 1.6309e-01, ..., -1.5078e+00, 7.0312e-01, -8.4766e-01]], [[-4.9072e-02, -8.0078e-02, 4.7363e-02, ..., 7.1094e-01, -4.9805e-01, 3.8477e-01], [-4.9072e-02, -8.0078e-02, 4.7363e-02, ..., 7.1094e-01, -4.9805e-01, 3.8477e-01], [-1.6113e-01, -2.0410e-01, 2.3047e-01, ..., -1.3672e-01, 1.4551e-01, -8.8379e-02], ..., [-3.2188e+00, -2.9062e+00, 3.4688e+00, ..., -6.4062e-01, 1.5469e+00, -2.8125e+00], [-6.0312e+00, -5.6250e+00, 4.3125e+00, ..., -1.2969e+00, 2.7188e+00, -2.8750e+00], [-4.6250e+00, -4.5000e+00, 4.5938e+00, ..., -5.0781e-01, 2.0625e+00, -2.2812e+00]], [[-1.6724e-02, -1.0889e-01, -7.8735e-03, ..., 2.4219e+00, 1.7031e+00, 1.7812e+00], [-1.6724e-02, -1.0889e-01, -7.8735e-03, ..., 2.4219e+00, 1.7031e+00, 1.7812e+00], [-1.0010e-02, -1.2598e-01, 6.2500e-02, ..., -3.2471e-02, -8.2031e-02, 4.5898e-02], ..., [ 7.6953e-01, -2.8281e+00, 7.2656e-01, ..., -9.4141e-01, -1.3750e+00, -4.2383e-01], [ 8.5938e-01, -3.2344e+00, 9.2969e-01, ..., -9.8828e-01, -1.2734e+00, -4.0625e-01], [ 5.8594e-01, -2.7656e+00, 5.4688e-01, ..., -9.6484e-01, -1.4375e+00, -6.4844e-01]]]], device='cuda:0', dtype=torch.bfloat16) Output 3: {'pred': ' B', 'chunk_ppl': [16.007787704467773], 'total_ppl': 16.007787704467773} 4it [03:48, 57.65s/it]Chunk: 1/0, ppl: 11.50775146484375, time: 2.35s Initial tokens: tensor([[[[ 5.5859e-01, 9.8438e-01, 1.0625e+00, ..., 1.3281e+00, -9.1797e-02, 4.1602e-01], [ 5.5859e-01, 9.8438e-01, 1.0625e+00, ..., 1.3281e+00, -9.1797e-02, 4.1602e-01], [ 4.6875e-01, 7.4707e-02, 4.0283e-02, ..., 4.4189e-02, -1.1719e-01, -1.4941e-01], ..., [ 6.9375e+00, 3.4531e+00, 2.5469e+00, ..., 6.4062e-01, -1.9141e+00, -1.8281e+00], [ 7.3438e+00, 3.2344e+00, 1.5156e+00, ..., 1.3438e+00, -1.7109e+00, -1.5078e+00], [ 6.0625e+00, 3.3281e+00, 2.1094e+00, ..., 1.6211e-01, -1.8906e+00, -1.5781e+00]], [[ 1.7822e-02, -7.5195e-02, 1.9653e-02, ..., -1.1953e+00, 8.2031e-01, 6.0303e-02], [ 1.7822e-02, -7.5195e-02, 1.9653e-02, ..., -1.1953e+00, 8.2031e-01, 6.0303e-02], [-5.2979e-02, -4.6631e-02, 6.4453e-02, ..., 9.0332e-02, -7.4219e-02, -1.3281e-01], ..., [-1.8438e+00, -1.2578e+00, 1.1406e+00, ..., 1.6797e+00, -1.7578e+00, -1.2812e+00], [-6.7578e-01, -1.6953e+00, 1.2422e+00, ..., 1.5781e+00, -1.9297e+00, -1.6875e+00], [-1.4844e+00, -1.5625e+00, 1.4688e+00, ..., 1.5547e+00, -2.2812e+00, -7.9688e-01]], [[ 6.6406e-02, -5.2979e-02, -3.8574e-02, ..., 2.8906e-01, 1.8984e+00, -9.9219e-01], [ 6.6406e-02, -5.2979e-02, -3.8574e-02, ..., 2.8906e-01, 1.8984e+00, -9.9219e-01], [ 2.1729e-02, -2.9785e-02, -2.4536e-02, ..., -6.7871e-02, -1.3770e-01, 9.6191e-02], ..., [-3.5547e-01, 3.8477e-01, 3.2812e-01, ..., 1.9141e+00, -1.9531e+00, -2.9297e-01], [ 4.5898e-02, -2.5781e-01, 3.3789e-01, ..., -6.3281e-01, -2.4688e+00, -3.1445e-01], [-2.5391e-01, -1.0010e-01, 4.1602e-01, ..., 1.2695e-01, -2.5156e+00, 8.6719e-01]], ..., [[-1.9727e-01, -1.3086e-01, 2.7771e-03, ..., 1.4844e+00, -7.6562e-01, 7.6172e-01], [-1.9727e-01, -1.3086e-01, 2.7771e-03, ..., 1.4844e+00, -7.6562e-01, 7.6172e-01], [-1.1084e-01, 9.4238e-02, 1.4526e-02, ..., 2.5513e-02, 3.1494e-02, -1.0693e-01], ..., [-1.2031e+00, 6.5234e-01, -2.4902e-02, ..., -1.3516e+00, 6.4062e-01, -1.6484e+00], [-1.7500e+00, 1.3672e+00, 2.8516e-01, ..., -1.5703e+00, 1.4688e+00, -1.4062e+00], [-1.4453e+00, 7.5781e-01, 1.6309e-01, ..., -1.5078e+00, 7.0312e-01, -8.4766e-01]], [[-4.9072e-02, -8.0078e-02, 4.7363e-02, ..., 7.1094e-01, -4.9805e-01, 3.8477e-01], [-4.9072e-02, -8.0078e-02, 4.7363e-02, ..., 7.1094e-01, -4.9805e-01, 3.8477e-01], [-1.6113e-01, -2.0410e-01, 2.3047e-01, ..., -1.3672e-01, 1.4551e-01, -8.8379e-02], ..., [-3.2188e+00, -2.9062e+00, 3.4688e+00, ..., -6.4062e-01, 1.5469e+00, -2.8125e+00], [-6.0312e+00, -5.6250e+00, 4.3125e+00, ..., -1.2969e+00, 2.7188e+00, -2.8750e+00], [-4.6250e+00, -4.5000e+00, 4.5938e+00, ..., -5.0781e-01, 2.0625e+00, -2.2812e+00]], [[-1.6724e-02, -1.0889e-01, -7.8735e-03, ..., 2.4219e+00, 1.7031e+00, 1.7812e+00], [-1.6724e-02, -1.0889e-01, -7.8735e-03, ..., 2.4219e+00, 1.7031e+00, 1.7812e+00], [-1.0010e-02, -1.2598e-01, 6.2500e-02, ..., -3.2471e-02, -8.2031e-02, 4.5898e-02], ..., [ 7.6953e-01, -2.8281e+00, 7.2656e-01, ..., -9.4141e-01, -1.3750e+00, -4.2383e-01], [ 8.5938e-01, -3.2344e+00, 9.2969e-01, ..., -9.8828e-01, -1.2734e+00, -4.0625e-01], [ 5.8594e-01, -2.7656e+00, 5.4688e-01, ..., -9.6484e-01, -1.4375e+00, -6.4844e-01]]]], device='cuda:0', dtype=torch.bfloat16) Output 4: {'pred': ' A', 'chunk_ppl': [11.50775146484375], 'total_ppl': 11.50775146484375} 5it [04:44, 56.82s/it]Chunk: 1/0, ppl: 13.721500396728516, time: 2.46s Initial tokens: tensor([[[[ 5.5859e-01, 9.8438e-01, 1.0625e+00, ..., 1.3281e+00, -9.1797e-02, 4.1602e-01], [ 5.5859e-01, 9.8438e-01, 1.0625e+00, ..., 1.3281e+00, -9.1797e-02, 4.1602e-01], [ 4.6875e-01, 7.4707e-02, 4.0283e-02, ..., 4.4189e-02, -1.1719e-01, -1.4941e-01], ..., [ 6.9375e+00, 3.4531e+00, 2.5469e+00, ..., 6.4062e-01, -1.9141e+00, -1.8281e+00], [ 7.3438e+00, 3.2344e+00, 1.5156e+00, ..., 1.3438e+00, -1.7109e+00, -1.5078e+00], [ 6.0625e+00, 3.3281e+00, 2.1094e+00, ..., 1.6211e-01, -1.8906e+00, -1.5781e+00]], [[ 1.7822e-02, -7.5195e-02, 1.9653e-02, ..., -1.1953e+00, 8.2031e-01, 6.0303e-02], [ 1.7822e-02, -7.5195e-02, 1.9653e-02, ..., -1.1953e+00, 8.2031e-01, 6.0303e-02], [-5.2979e-02, -4.6631e-02, 6.4453e-02, ..., 9.0332e-02, -7.4219e-02, -1.3281e-01], ..., [-1.8438e+00, -1.2578e+00, 1.1406e+00, ..., 1.6797e+00, -1.7578e+00, -1.2812e+00], [-6.7578e-01, -1.6953e+00, 1.2422e+00, ..., 1.5781e+00, -1.9297e+00, -1.6875e+00], [-1.4844e+00, -1.5625e+00, 1.4688e+00, ..., 1.5547e+00, -2.2812e+00, -7.9688e-01]], [[ 6.6406e-02, -5.2979e-02, -3.8574e-02, ..., 2.8906e-01, 1.8984e+00, -9.9219e-01], [ 6.6406e-02, -5.2979e-02, -3.8574e-02, ..., 2.8906e-01, 1.8984e+00, -9.9219e-01], [ 2.1729e-02, -2.9785e-02, -2.4536e-02, ..., -6.7871e-02, -1.3770e-01, 9.6191e-02], ..., [-3.5547e-01, 3.8477e-01, 3.2812e-01, ..., 1.9141e+00, -1.9531e+00, -2.9297e-01], [ 4.5898e-02, -2.5781e-01, 3.3789e-01, ..., -6.3281e-01, -2.4688e+00, -3.1445e-01], [-2.5391e-01, -1.0010e-01, 4.1602e-01, ..., 1.2695e-01, -2.5156e+00, 8.6719e-01]], ..., [[-1.9727e-01, -1.3086e-01, 2.7771e-03, ..., 1.4844e+00, -7.6562e-01, 7.6172e-01], [-1.9727e-01, -1.3086e-01, 2.7771e-03, ..., 1.4844e+00, -7.6562e-01, 7.6172e-01], [-1.1084e-01, 9.4238e-02, 1.4526e-02, ..., 2.5513e-02, 3.1494e-02, -1.0693e-01], ..., [-1.2031e+00, 6.5234e-01, -2.4902e-02, ..., -1.3516e+00, 6.4062e-01, -1.6484e+00], [-1.7500e+00, 1.3672e+00, 2.8516e-01, ..., -1.5703e+00, 1.4688e+00, -1.4062e+00], [-1.4453e+00, 7.5781e-01, 1.6309e-01, ..., -1.5078e+00, 7.0312e-01, -8.4766e-01]], [[-4.9072e-02, -8.0078e-02, 4.7363e-02, ..., 7.1094e-01, -4.9805e-01, 3.8477e-01], [-4.9072e-02, -8.0078e-02, 4.7363e-02, ..., 7.1094e-01, -4.9805e-01, 3.8477e-01], [-1.6113e-01, -2.0410e-01, 2.3047e-01, ..., -1.3672e-01, 1.4551e-01, -8.8379e-02], ..., [-3.2188e+00, -2.9062e+00, 3.4688e+00, ..., -6.4062e-01, 1.5469e+00, -2.8125e+00], [-6.0312e+00, -5.6250e+00, 4.3125e+00, ..., -1.2969e+00, 2.7188e+00, -2.8750e+00], [-4.6250e+00, -4.5000e+00, 4.5938e+00, ..., -5.0781e-01, 2.0625e+00, -2.2812e+00]], [[-1.6724e-02, -1.0889e-01, -7.8735e-03, ..., 2.4219e+00, 1.7031e+00, 1.7812e+00], [-1.6724e-02, -1.0889e-01, -7.8735e-03, ..., 2.4219e+00, 1.7031e+00, 1.7812e+00], [-1.0010e-02, -1.2598e-01, 6.2500e-02, ..., -3.2471e-02, -8.2031e-02, 4.5898e-02], ..., [ 7.6953e-01, -2.8281e+00, 7.2656e-01, ..., -9.4141e-01, -1.3750e+00, -4.2383e-01], [ 8.5938e-01, -3.2344e+00, 9.2969e-01, ..., -9.8828e-01, -1.2734e+00, -4.0625e-01], [ 5.8594e-01, -2.7656e+00, 5.4688e-01, ..., -9.6484e-01, -1.4375e+00, -6.4844e-01]]]], device='cuda:0', dtype=torch.bfloat16) Output 5: {'pred': ' B', 'chunk_ppl': [13.721500396728516], 'total_ppl': 13.721500396728516} 6it [05:39, 56.40s/it]Chunk: 1/0, ppl: 11.084712982177734, time: 1.76s Initial tokens: tensor([[[[ 5.5859e-01, 9.8438e-01, 1.0625e+00, ..., 1.3281e+00, -9.1797e-02, 4.1602e-01], [ 5.5859e-01, 9.8438e-01, 1.0625e+00, ..., 1.3281e+00, -9.1797e-02, 4.1602e-01], [ 4.6875e-01, 7.4707e-02, 4.0283e-02, ..., 4.4189e-02, -1.1719e-01, -1.4941e-01], ..., [ 6.9375e+00, 3.4531e+00, 2.5469e+00, ..., 6.4062e-01, -1.9141e+00, -1.8281e+00], [ 7.3438e+00, 3.2344e+00, 1.5156e+00, ..., 1.3438e+00, -1.7109e+00, -1.5078e+00], [ 6.0625e+00, 3.3281e+00, 2.1094e+00, ..., 1.6211e-01, -1.8906e+00, -1.5781e+00]], [[ 1.7822e-02, -7.5195e-02, 1.9653e-02, ..., -1.1953e+00, 8.2031e-01, 6.0303e-02], [ 1.7822e-02, -7.5195e-02, 1.9653e-02, ..., -1.1953e+00, 8.2031e-01, 6.0303e-02], [-5.2979e-02, -4.6631e-02, 6.4453e-02, ..., 9.0332e-02, -7.4219e-02, -1.3281e-01], ..., [-1.8438e+00, -1.2578e+00, 1.1406e+00, ..., 1.6797e+00, -1.7578e+00, -1.2812e+00], [-6.7578e-01, -1.6953e+00, 1.2422e+00, ..., 1.5781e+00, -1.9297e+00, -1.6875e+00], [-1.4844e+00, -1.5625e+00, 1.4688e+00, ..., 1.5547e+00, -2.2812e+00, -7.9688e-01]], [[ 6.6406e-02, -5.2979e-02, -3.8574e-02, ..., 2.8906e-01, 1.8984e+00, -9.9219e-01], [ 6.6406e-02, -5.2979e-02, -3.8574e-02, ..., 2.8906e-01, 1.8984e+00, -9.9219e-01], [ 2.1729e-02, -2.9785e-02, -2.4536e-02, ..., -6.7871e-02, -1.3770e-01, 9.6191e-02], ..., [-3.5547e-01, 3.8477e-01, 3.2812e-01, ..., 1.9141e+00, -1.9531e+00, -2.9297e-01], [ 4.5898e-02, -2.5781e-01, 3.3789e-01, ..., -6.3281e-01, -2.4688e+00, -3.1445e-01], [-2.5391e-01, -1.0010e-01, 4.1602e-01, ..., 1.2695e-01, -2.5156e+00, 8.6719e-01]], ..., [[-1.9727e-01, -1.3086e-01, 2.7771e-03, ..., 1.4844e+00, -7.6562e-01, 7.6172e-01], [-1.9727e-01, -1.3086e-01, 2.7771e-03, ..., 1.4844e+00, -7.6562e-01, 7.6172e-01], [-1.1084e-01, 9.4238e-02, 1.4526e-02, ..., 2.5513e-02, 3.1494e-02, -1.0693e-01], ..., [-1.2031e+00, 6.5234e-01, -2.4902e-02, ..., -1.3516e+00, 6.4062e-01, -1.6484e+00], [-1.7500e+00, 1.3672e+00, 2.8516e-01, ..., -1.5703e+00, 1.4688e+00, -1.4062e+00], [-1.4453e+00, 7.5781e-01, 1.6309e-01, ..., -1.5078e+00, 7.0312e-01, -8.4766e-01]], [[-4.9072e-02, -8.0078e-02, 4.7363e-02, ..., 7.1094e-01, -4.9805e-01, 3.8477e-01], [-4.9072e-02, -8.0078e-02, 4.7363e-02, ..., 7.1094e-01, -4.9805e-01, 3.8477e-01], [-1.6113e-01, -2.0410e-01, 2.3047e-01, ..., -1.3672e-01, 1.4551e-01, -8.8379e-02], ..., [-3.2188e+00, -2.9062e+00, 3.4688e+00, ..., -6.4062e-01, 1.5469e+00, -2.8125e+00], [-6.0312e+00, -5.6250e+00, 4.3125e+00, ..., -1.2969e+00, 2.7188e+00, -2.8750e+00], [-4.6250e+00, -4.5000e+00, 4.5938e+00, ..., -5.0781e-01, 2.0625e+00, -2.2812e+00]], [[-1.6724e-02, -1.0889e-01, -7.8735e-03, ..., 2.4219e+00, 1.7031e+00, 1.7812e+00], [-1.6724e-02, -1.0889e-01, -7.8735e-03, ..., 2.4219e+00, 1.7031e+00, 1.7812e+00], [-1.0010e-02, -1.2598e-01, 6.2500e-02, ..., -3.2471e-02, -8.2031e-02, 4.5898e-02], ..., [ 7.6953e-01, -2.8281e+00, 7.2656e-01, ..., -9.4141e-01, -1.3750e+00, -4.2383e-01], [ 8.5938e-01, -3.2344e+00, 9.2969e-01, ..., -9.8828e-01, -1.2734e+00, -4.0625e-01], [ 5.8594e-01, -2.7656e+00, 5.4688e-01, ..., -9.6484e-01, -1.4375e+00, -6.4844e-01]]]], device='cuda:0', dtype=torch.bfloat16) Output 6: {'pred': ' A', 'chunk_ppl': [11.084712982177734], 'total_ppl': 11.084712982177734} 7it [06:34, 55.66s/it]Chunk: 1/0, ppl: 14.174595832824707, time: 2.55s Initial tokens: tensor([[[[ 5.5859e-01, 9.8438e-01, 1.0625e+00, ..., 1.3281e+00, -9.1797e-02, 4.1602e-01], [ 5.5859e-01, 9.8438e-01, 1.0625e+00, ..., 1.3281e+00, -9.1797e-02, 4.1602e-01], [ 4.6875e-01, 7.4707e-02, 4.0283e-02, ..., 4.4189e-02, -1.1719e-01, -1.4941e-01], ..., [ 6.9375e+00, 3.4531e+00, 2.5469e+00, ..., 6.4062e-01, -1.9141e+00, -1.8281e+00], [ 7.3438e+00, 3.2344e+00, 1.5156e+00, ..., 1.3438e+00, -1.7109e+00, -1.5078e+00], [ 6.0625e+00, 3.3281e+00, 2.1094e+00, ..., 1.6211e-01, -1.8906e+00, -1.5781e+00]], [[ 1.7822e-02, -7.5195e-02, 1.9653e-02, ..., -1.1953e+00, 8.2031e-01, 6.0303e-02], [ 1.7822e-02, -7.5195e-02, 1.9653e-02, ..., -1.1953e+00, 8.2031e-01, 6.0303e-02], [-5.2979e-02, -4.6631e-02, 6.4453e-02, ..., 9.0332e-02, -7.4219e-02, -1.3281e-01], ..., [-1.8438e+00, -1.2578e+00, 1.1406e+00, ..., 1.6797e+00, -1.7578e+00, -1.2812e+00], [-6.7578e-01, -1.6953e+00, 1.2422e+00, ..., 1.5781e+00, -1.9297e+00, -1.6875e+00], [-1.4844e+00, -1.5625e+00, 1.4688e+00, ..., 1.5547e+00, -2.2812e+00, -7.9688e-01]], [[ 6.6406e-02, -5.2979e-02, -3.8574e-02, ..., 2.8906e-01, 1.8984e+00, -9.9219e-01], [ 6.6406e-02, -5.2979e-02, -3.8574e-02, ..., 2.8906e-01, 1.8984e+00, -9.9219e-01], [ 2.1729e-02, -2.9785e-02, -2.4536e-02, ..., -6.7871e-02, -1.3770e-01, 9.6191e-02], ..., [-3.5547e-01, 3.8477e-01, 3.2812e-01, ..., 1.9141e+00, -1.9531e+00, -2.9297e-01], [ 4.5898e-02, -2.5781e-01, 3.3789e-01, ..., -6.3281e-01, -2.4688e+00, -3.1445e-01], [-2.5391e-01, -1.0010e-01, 4.1602e-01, ..., 1.2695e-01, -2.5156e+00, 8.6719e-01]], ..., [[-1.9727e-01, -1.3086e-01, 2.7771e-03, ..., 1.4844e+00, -7.6562e-01, 7.6172e-01], [-1.9727e-01, -1.3086e-01, 2.7771e-03, ..., 1.4844e+00, -7.6562e-01, 7.6172e-01], [-1.1084e-01, 9.4238e-02, 1.4526e-02, ..., 2.5513e-02, 3.1494e-02, -1.0693e-01], ..., [-1.2031e+00, 6.5234e-01, -2.4902e-02, ..., -1.3516e+00, 6.4062e-01, -1.6484e+00], [-1.7500e+00, 1.3672e+00, 2.8516e-01, ..., -1.5703e+00, 1.4688e+00, -1.4062e+00], [-1.4453e+00, 7.5781e-01, 1.6309e-01, ..., -1.5078e+00, 7.0312e-01, -8.4766e-01]], [[-4.9072e-02, -8.0078e-02, 4.7363e-02, ..., 7.1094e-01, -4.9805e-01, 3.8477e-01], [-4.9072e-02, -8.0078e-02, 4.7363e-02, ..., 7.1094e-01, -4.9805e-01, 3.8477e-01], [-1.6113e-01, -2.0410e-01, 2.3047e-01, ..., -1.3672e-01, 1.4551e-01, -8.8379e-02], ..., [-3.2188e+00, -2.9062e+00, 3.4688e+00, ..., -6.4062e-01, 1.5469e+00, -2.8125e+00], [-6.0312e+00, -5.6250e+00, 4.3125e+00, ..., -1.2969e+00, 2.7188e+00, -2.8750e+00], [-4.6250e+00, -4.5000e+00, 4.5938e+00, ..., -5.0781e-01, 2.0625e+00, -2.2812e+00]], [[-1.6724e-02, -1.0889e-01, -7.8735e-03, ..., 2.4219e+00, 1.7031e+00, 1.7812e+00], [-1.6724e-02, -1.0889e-01, -7.8735e-03, ..., 2.4219e+00, 1.7031e+00, 1.7812e+00], [-1.0010e-02, -1.2598e-01, 6.2500e-02, ..., -3.2471e-02, -8.2031e-02, 4.5898e-02], ..., [ 7.6953e-01, -2.8281e+00, 7.2656e-01, ..., -9.4141e-01, -1.3750e+00, -4.2383e-01], [ 8.5938e-01, -3.2344e+00, 9.2969e-01, ..., -9.8828e-01, -1.2734e+00, -4.0625e-01], [ 5.8594e-01, -2.7656e+00, 5.4688e-01, ..., -9.6484e-01, -1.4375e+00, -6.4844e-01]]]], device='cuda:0', dtype=torch.bfloat16) Output 7: {'pred': ' B', 'chunk_ppl': [14.174595832824707], 'total_ppl': 14.174595832824707} 8it [07:24, 54.05s/it]Chunk: 1/0, ppl: 14.266956329345703, time: 2.41s Initial tokens: tensor([[[[ 5.5859e-01, 9.8438e-01, 1.0625e+00, ..., 1.3281e+00, -9.1797e-02, 4.1602e-01], [ 5.5859e-01, 9.8438e-01, 1.0625e+00, ..., 1.3281e+00, -9.1797e-02, 4.1602e-01], [ 4.6875e-01, 7.4707e-02, 4.0283e-02, ..., 4.4189e-02, -1.1719e-01, -1.4941e-01], ..., [ 6.9375e+00, 3.4531e+00, 2.5469e+00, ..., 6.4062e-01, -1.9141e+00, -1.8281e+00], [ 7.3438e+00, 3.2344e+00, 1.5156e+00, ..., 1.3438e+00, -1.7109e+00, -1.5078e+00], [ 6.0625e+00, 3.3281e+00, 2.1094e+00, ..., 1.6211e-01, -1.8906e+00, -1.5781e+00]], [[ 1.7822e-02, -7.5195e-02, 1.9653e-02, ..., -1.1953e+00, 8.2031e-01, 6.0303e-02], [ 1.7822e-02, -7.5195e-02, 1.9653e-02, ..., -1.1953e+00, 8.2031e-01, 6.0303e-02], [-5.2979e-02, -4.6631e-02, 6.4453e-02, ..., 9.0332e-02, -7.4219e-02, -1.3281e-01], ..., [-1.8438e+00, -1.2578e+00, 1.1406e+00, ..., 1.6797e+00, -1.7578e+00, -1.2812e+00], [-6.7578e-01, -1.6953e+00, 1.2422e+00, ..., 1.5781e+00, -1.9297e+00, -1.6875e+00], [-1.4844e+00, -1.5625e+00, 1.4688e+00, ..., 1.5547e+00, -2.2812e+00, -7.9688e-01]], [[ 6.6406e-02, -5.2979e-02, -3.8574e-02, ..., 2.8906e-01, 1.8984e+00, -9.9219e-01], [ 6.6406e-02, -5.2979e-02, -3.8574e-02, ..., 2.8906e-01, 1.8984e+00, -9.9219e-01], [ 2.1729e-02, -2.9785e-02, -2.4536e-02, ..., -6.7871e-02, -1.3770e-01, 9.6191e-02], ..., [-3.5547e-01, 3.8477e-01, 3.2812e-01, ..., 1.9141e+00, -1.9531e+00, -2.9297e-01], [ 4.5898e-02, -2.5781e-01, 3.3789e-01, ..., -6.3281e-01, -2.4688e+00, -3.1445e-01], [-2.5391e-01, -1.0010e-01, 4.1602e-01, ..., 1.2695e-01, -2.5156e+00, 8.6719e-01]], ..., [[-1.9727e-01, -1.3086e-01, 2.7771e-03, ..., 1.4844e+00, -7.6562e-01, 7.6172e-01], [-1.9727e-01, -1.3086e-01, 2.7771e-03, ..., 1.4844e+00, -7.6562e-01, 7.6172e-01], [-1.1084e-01, 9.4238e-02, 1.4526e-02, ..., 2.5513e-02, 3.1494e-02, -1.0693e-01], ..., [-1.2031e+00, 6.5234e-01, -2.4902e-02, ..., -1.3516e+00, 6.4062e-01, -1.6484e+00], [-1.7500e+00, 1.3672e+00, 2.8516e-01, ..., -1.5703e+00, 1.4688e+00, -1.4062e+00], [-1.4453e+00, 7.5781e-01, 1.6309e-01, ..., -1.5078e+00, 7.0312e-01, -8.4766e-01]], [[-4.9072e-02, -8.0078e-02, 4.7363e-02, ..., 7.1094e-01, -4.9805e-01, 3.8477e-01], [-4.9072e-02, -8.0078e-02, 4.7363e-02, ..., 7.1094e-01, -4.9805e-01, 3.8477e-01], [-1.6113e-01, -2.0410e-01, 2.3047e-01, ..., -1.3672e-01, 1.4551e-01, -8.8379e-02], ..., [-3.2188e+00, -2.9062e+00, 3.4688e+00, ..., -6.4062e-01, 1.5469e+00, -2.8125e+00], [-6.0312e+00, -5.6250e+00, 4.3125e+00, ..., -1.2969e+00, 2.7188e+00, -2.8750e+00], [-4.6250e+00, -4.5000e+00, 4.5938e+00, ..., -5.0781e-01, 2.0625e+00, -2.2812e+00]], [[-1.6724e-02, -1.0889e-01, -7.8735e-03, ..., 2.4219e+00, 1.7031e+00, 1.7812e+00], [-1.6724e-02, -1.0889e-01, -7.8735e-03, ..., 2.4219e+00, 1.7031e+00, 1.7812e+00], [-1.0010e-02, -1.2598e-01, 6.2500e-02, ..., -3.2471e-02, -8.2031e-02, 4.5898e-02], ..., [ 7.6953e-01, -2.8281e+00, 7.2656e-01, ..., -9.4141e-01, -1.3750e+00, -4.2383e-01], [ 8.5938e-01, -3.2344e+00, 9.2969e-01, ..., -9.8828e-01, -1.2734e+00, -4.0625e-01], [ 5.8594e-01, -2.7656e+00, 5.4688e-01, ..., -9.6484e-01, -1.4375e+00, -6.4844e-01]]]], device='cuda:0', dtype=torch.bfloat16) Output 8: {'pred': ' B', 'chunk_ppl': [14.266956329345703], 'total_ppl': 14.266956329345703} 9it [08:19, 54.28s/it]Chunk: 1/0, ppl: 14.39731216430664, time: 2.46s Initial tokens: tensor([[[[ 5.5859e-01, 9.8438e-01, 1.0625e+00, ..., 1.3281e+00, -9.1797e-02, 4.1602e-01], [ 5.5859e-01, 9.8438e-01, 1.0625e+00, ..., 1.3281e+00, -9.1797e-02, 4.1602e-01], [ 4.6875e-01, 7.4707e-02, 4.0283e-02, ..., 4.4189e-02, -1.1719e-01, -1.4941e-01], ..., [ 6.9375e+00, 3.4531e+00, 2.5469e+00, ..., 6.4062e-01, -1.9141e+00, -1.8281e+00], [ 7.3438e+00, 3.2344e+00, 1.5156e+00, ..., 1.3438e+00, -1.7109e+00, -1.5078e+00], [ 6.0625e+00, 3.3281e+00, 2.1094e+00, ..., 1.6211e-01, -1.8906e+00, -1.5781e+00]], [[ 1.7822e-02, -7.5195e-02, 1.9653e-02, ..., -1.1953e+00, 8.2031e-01, 6.0303e-02], [ 1.7822e-02, -7.5195e-02, 1.9653e-02, ..., -1.1953e+00, 8.2031e-01, 6.0303e-02], [-5.2979e-02, -4.6631e-02, 6.4453e-02, ..., 9.0332e-02, -7.4219e-02, -1.3281e-01], ..., [-1.8438e+00, -1.2578e+00, 1.1406e+00, ..., 1.6797e+00, -1.7578e+00, -1.2812e+00], [-6.7578e-01, -1.6953e+00, 1.2422e+00, ..., 1.5781e+00, -1.9297e+00, -1.6875e+00], [-1.4844e+00, -1.5625e+00, 1.4688e+00, ..., 1.5547e+00, -2.2812e+00, -7.9688e-01]], [[ 6.6406e-02, -5.2979e-02, -3.8574e-02, ..., 2.8906e-01, 1.8984e+00, -9.9219e-01], [ 6.6406e-02, -5.2979e-02, -3.8574e-02, ..., 2.8906e-01, 1.8984e+00, -9.9219e-01], [ 2.1729e-02, -2.9785e-02, -2.4536e-02, ..., -6.7871e-02, -1.3770e-01, 9.6191e-02], ..., [-3.5547e-01, 3.8477e-01, 3.2812e-01, ..., 1.9141e+00, -1.9531e+00, -2.9297e-01], [ 4.5898e-02, -2.5781e-01, 3.3789e-01, ..., -6.3281e-01, -2.4688e+00, -3.1445e-01], [-2.5391e-01, -1.0010e-01, 4.1602e-01, ..., 1.2695e-01, -2.5156e+00, 8.6719e-01]], ..., [[-1.9727e-01, -1.3086e-01, 2.7771e-03, ..., 1.4844e+00, -7.6562e-01, 7.6172e-01], [-1.9727e-01, -1.3086e-01, 2.7771e-03, ..., 1.4844e+00, -7.6562e-01, 7.6172e-01], [-1.1084e-01, 9.4238e-02, 1.4526e-02, ..., 2.5513e-02, 3.1494e-02, -1.0693e-01], ..., [-1.2031e+00, 6.5234e-01, -2.4902e-02, ..., -1.3516e+00, 6.4062e-01, -1.6484e+00], [-1.7500e+00, 1.3672e+00, 2.8516e-01, ..., -1.5703e+00, 1.4688e+00, -1.4062e+00], [-1.4453e+00, 7.5781e-01, 1.6309e-01, ..., -1.5078e+00, 7.0312e-01, -8.4766e-01]], [[-4.9072e-02, -8.0078e-02, 4.7363e-02, ..., 7.1094e-01, -4.9805e-01, 3.8477e-01], [-4.9072e-02, -8.0078e-02, 4.7363e-02, ..., 7.1094e-01, -4.9805e-01, 3.8477e-01], [-1.6113e-01, -2.0410e-01, 2.3047e-01, ..., -1.3672e-01, 1.4551e-01, -8.8379e-02], ..., [-3.2188e+00, -2.9062e+00, 3.4688e+00, ..., -6.4062e-01, 1.5469e+00, -2.8125e+00], [-6.0312e+00, -5.6250e+00, 4.3125e+00, ..., -1.2969e+00, 2.7188e+00, -2.8750e+00], [-4.6250e+00, -4.5000e+00, 4.5938e+00, ..., -5.0781e-01, 2.0625e+00, -2.2812e+00]], [[-1.6724e-02, -1.0889e-01, -7.8735e-03, ..., 2.4219e+00, 1.7031e+00, 1.7812e+00], [-1.6724e-02, -1.0889e-01, -7.8735e-03, ..., 2.4219e+00, 1.7031e+00, 1.7812e+00], [-1.0010e-02, -1.2598e-01, 6.2500e-02, ..., -3.2471e-02, -8.2031e-02, 4.5898e-02], ..., [ 7.6953e-01, -2.8281e+00, 7.2656e-01, ..., -9.4141e-01, -1.3750e+00, -4.2383e-01], [ 8.5938e-01, -3.2344e+00, 9.2969e-01, ..., -9.8828e-01, -1.2734e+00, -4.0625e-01], [ 5.8594e-01, -2.7656e+00, 5.4688e-01, ..., -9.6484e-01, -1.4375e+00, -6.4844e-01]]]], device='cuda:0', dtype=torch.bfloat16) Output 9: {'pred': ' B', 'chunk_ppl': [14.39731216430664], 'total_ppl': 14.39731216430664} 10it [09:09, 54.96s/it]
Editor is loading...
Leave a Comment