-
Notifications
You must be signed in to change notification settings - Fork 82
/
output.py
115 lines (115 loc) · 9.26 KB
/
output.py
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
{'text': tensor([[15914, 19550, 2930, 231, 24726, 49657, 234, 2415, 97, 5233,
255, 18034, 3919, 95, 10034, 253, 11319, 12560, 33597, 7781,
1546, 8244, 11336, 27584, 5233, 255, 18034, 3582, 41908, 39823,
171, 120, 234, 20949, 3254, 249, 46204, 2215, 224, 9722,
5823, 1546, 5233, 255, 18034, 14245, 11336, 8225, 13486, 1543,
1231, 1543]], device='cuda:0', dtype=torch.int32), 'text_len': tensor([52], device='cuda:0', dtype=torch.int32), 'prompt_text': tensor([[17028, 13824, 16989, 6734, 30337, 2347, 113, 1546, 9042, 2930,
231, 45456, 23786, 15003, 6912, 5266, 233, 1369, 230, 1231,
1543]], device='cuda:0', dtype=torch.int32), 'prompt_text_len': tensor([21], device='cuda:0', dtype=torch.int32), 'llm_prompt_speech_token': tensor([[ 587, 523, 903, 357, 448, 137, 407, 257, 355, 231, 382, 382,
418, 2302, 418, 346, 619, 394, 302, 137, 2302, 153, 515, 506,
3052, 173, 52, 212, 143, 547, 23, 688, 2362, 457, 629, 79,
720, 533, 446, 110, 514, 755, 493, 38, 585, 160, 269, 27,
328, 499, 499, 247, 33, 160, 468, 2723, 244, 244, 318, 502,
3889, 197, 2645, 121, 170, 676, 328, 629, 690, 731, 423, 174,
415, 415, 310, 495, 889, 889, 889, 737, 723, 1401, 207, 2299,
612, 527, 100, 603, 275, 1593, 511, 356, 356, 714, 77, 535,
2989, 48, 48, 732, 74, 110, 449, 400, 422, 690, 1930, 1930,
1930, 674, 540, 167, 167, 1479, 6, 373, 658, 1849, 249, 249,
327, 327, 327, 249, 327, 327, 262, 249, 249, 3054, 3054, 505,
561, 675, 262, 675, 463, 463, 463, 262, 262, 262, 262, 262,
262, 463]], device='cuda:0', dtype=torch.int32), 'llm_prompt_speech_token_len': tensor([146], device='cuda:0', dtype=torch.int32), 'flow_prompt_speech_token': tensor([[ 587, 523, 903, 357, 448, 137, 407, 257, 355, 231, 382, 382,
418, 2302, 418, 346, 619, 394, 302, 137, 2302, 153, 515, 506,
3052, 173, 52, 212, 143, 547, 23, 688, 2362, 457, 629, 79,
720, 533, 446, 110, 514, 755, 493, 38, 585, 160, 269, 27,
328, 499, 499, 247, 33, 160, 468, 2723, 244, 244, 318, 502,
3889, 197, 2645, 121, 170, 676, 328, 629, 690, 731, 423, 174,
415, 415, 310, 495, 889, 889, 889, 737, 723, 1401, 207, 2299,
612, 527, 100, 603, 275, 1593, 511, 356, 356, 714, 77, 535,
2989, 48, 48, 732, 74, 110, 449, 400, 422, 690, 1930, 1930,
1930, 674, 540, 167, 167, 1479, 6, 373, 658, 1849, 249, 249,
327, 327, 327, 249, 327, 327, 262, 249, 249, 3054, 3054, 505,
561, 675, 262, 675, 463, 463, 463, 262, 262, 262, 262, 262,
262, 463]], device='cuda:0', dtype=torch.int32), 'flow_prompt_speech_token_len': tensor([146], device='cuda:0', dtype=torch.int32), 'prompt_speech_feat': tensor([[[ -3.2587, -2.3695, -1.7929, ..., -7.6328, -6.9032, -6.9614],
[ -3.7286, -2.4937, -1.5339, ..., -6.2465, -5.8583, -6.2916],
[ -3.9566, -2.7857, -2.1302, ..., -4.2144, -4.9193, -4.8670],
...,
[-11.5129, -11.5129, -11.5129, ..., -11.5129, -11.5129, -11.5129],
[-11.5129, -11.5129, -11.5129, ..., -11.5129, -11.5129, -11.5129],
[-11.5129, -11.5129, -11.5129, ..., -11.5129, -11.5129, -11.5129]]],
device='cuda:0'), 'prompt_speech_feat_len': tensor([251], device='cuda:0', dtype=torch.int32), 'llm_embedding': tensor([[-3.0198e-01, -4.0106e-01, 1.0665e+00, -5.9328e-01, -1.6207e+00,
1.2474e+00, 2.9737e-01, 9.2362e-01, 8.3976e-01, -1.8617e-01,
-5.6409e-01, 5.2133e-01, 6.4249e-01, 9.4127e-01, 3.0282e-01,
7.5725e-01, 2.0113e-01, -1.0122e+00, 3.8056e-01, -6.8912e-01,
6.7556e-01, -4.5324e-01, -1.0907e+00, -5.7660e-01, -3.9130e-01,
-5.0389e-01, -3.6155e-01, 9.4267e-01, -1.0804e+00, -9.0521e-01,
1.0079e-01, -2.6324e-01, -1.2481e-01, -4.8579e-01, -2.8096e-01,
-7.6473e-01, 4.0337e-01, 6.9027e-01, 1.4903e+00, 3.7894e-01,
-5.1400e-01, -1.2935e+00, -5.9837e-01, -6.0933e-03, -1.4599e-02,
-8.8079e-01, 1.3666e-01, -2.7457e-01, 4.0515e-01, -1.1806e+00,
-1.8888e-03, -5.0358e-01, 7.3387e-01, -1.4077e-01, -7.0481e-01,
-1.2797e+00, 1.4581e+00, -2.7251e-01, -1.1964e+00, 1.0890e+00,
-9.9699e-01, 2.7023e-01, 5.8540e-01, -1.3854e+00, -5.3380e-01,
-2.6040e-01, 9.3134e-01, 3.9033e-01, -5.6773e-01, -6.8802e-01,
-5.5673e-01, 4.4156e-01, 7.4834e-03, -2.9397e-02, 4.0503e-01,
4.5468e-01, -9.7241e-01, 1.0550e+00, 1.1600e-01, -2.7122e-01,
-1.1961e+00, -4.3957e-01, 8.5048e-01, -2.9302e-01, -1.5563e+00,
-7.2707e-01, 3.6826e-01, 5.5664e-01, -1.1723e+00, 8.5411e-01,
-3.6839e-01, 4.0099e-01, 1.6778e-01, -3.3961e-01, -9.8439e-01,
-1.8346e+00, -1.4010e-01, -6.1556e-01, -1.6202e-01, -5.3205e-01,
-3.8124e-01, -1.2870e+00, 3.0516e-01, 6.5046e-01, -1.8538e-01,
7.7958e-01, -8.7138e-01, 9.3351e-01, 1.2922e+00, -6.9212e-01,
3.2726e-01, -5.7905e-01, -4.7936e-01, -3.9326e-02, -1.0883e+00,
6.6536e-01, 1.6051e-01, -9.6558e-02, -7.4457e-02, -4.1459e-01,
-1.8770e-01, -1.7453e+00, -3.3950e-01, -8.1656e-01, -9.7103e-02,
-8.3305e-01, -1.5187e+00, 7.2177e-01, -1.9412e+00, 3.4085e-01,
-2.0548e+00, 4.9950e-02, -5.6675e-01, -5.7753e-02, -6.4366e-01,
-3.3841e-01, 1.8565e-01, -7.1072e-01, -1.8700e-01, -8.5996e-01,
1.6759e-01, 8.1523e-01, 3.5534e-01, 6.6682e-01, 6.7483e-01,
9.7217e-02, -4.5939e-01, -7.7941e-01, 8.5763e-01, -8.4580e-01,
2.0544e-01, -3.4525e-01, -8.4439e-01, 4.8215e-01, 7.5473e-01,
-2.0392e+00, 1.2164e-01, -8.6227e-01, -8.4100e-01, 4.1555e-01,
-1.6455e+00, -3.8724e-01, 8.8501e-01, -1.4800e+00, 4.4640e-01,
-6.8488e-01, 1.2484e+00, -1.0540e+00, -4.3345e-01, -1.8748e+00,
6.5114e-01, -7.7131e-01, -1.8773e+00, -6.3574e-01, 6.3260e-01,
6.3379e-01, -4.1154e-01, -1.0171e+00, 5.8416e-01, -8.1579e-01,
-9.1071e-01, -3.1034e-01, -3.0416e-01, -6.5502e-01, -4.1040e-01,
1.0924e+00, -9.7041e-01, 1.8744e+00, -1.9735e-01, -2.7804e-03,
-3.6434e-03, -1.9607e-01]], device='cuda:0'), 'flow_embedding': tensor([[-3.0198e-01, -4.0106e-01, 1.0665e+00, -5.9328e-01, -1.6207e+00,
1.2474e+00, 2.9737e-01, 9.2362e-01, 8.3976e-01, -1.8617e-01,
-5.6409e-01, 5.2133e-01, 6.4249e-01, 9.4127e-01, 3.0282e-01,
7.5725e-01, 2.0113e-01, -1.0122e+00, 3.8056e-01, -6.8912e-01,
6.7556e-01, -4.5324e-01, -1.0907e+00, -5.7660e-01, -3.9130e-01,
-5.0389e-01, -3.6155e-01, 9.4267e-01, -1.0804e+00, -9.0521e-01,
1.0079e-01, -2.6324e-01, -1.2481e-01, -4.8579e-01, -2.8096e-01,
-7.6473e-01, 4.0337e-01, 6.9027e-01, 1.4903e+00, 3.7894e-01,
-5.1400e-01, -1.2935e+00, -5.9837e-01, -6.0933e-03, -1.4599e-02,
-8.8079e-01, 1.3666e-01, -2.7457e-01, 4.0515e-01, -1.1806e+00,
-1.8888e-03, -5.0358e-01, 7.3387e-01, -1.4077e-01, -7.0481e-01,
-1.2797e+00, 1.4581e+00, -2.7251e-01, -1.1964e+00, 1.0890e+00,
-9.9699e-01, 2.7023e-01, 5.8540e-01, -1.3854e+00, -5.3380e-01,
-2.6040e-01, 9.3134e-01, 3.9033e-01, -5.6773e-01, -6.8802e-01,
-5.5673e-01, 4.4156e-01, 7.4834e-03, -2.9397e-02, 4.0503e-01,
4.5468e-01, -9.7241e-01, 1.0550e+00, 1.1600e-01, -2.7122e-01,
-1.1961e+00, -4.3957e-01, 8.5048e-01, -2.9302e-01, -1.5563e+00,
-7.2707e-01, 3.6826e-01, 5.5664e-01, -1.1723e+00, 8.5411e-01,
-3.6839e-01, 4.0099e-01, 1.6778e-01, -3.3961e-01, -9.8439e-01,
-1.8346e+00, -1.4010e-01, -6.1556e-01, -1.6202e-01, -5.3205e-01,
-3.8124e-01, -1.2870e+00, 3.0516e-01, 6.5046e-01, -1.8538e-01,
7.7958e-01, -8.7138e-01, 9.3351e-01, 1.2922e+00, -6.9212e-01,
3.2726e-01, -5.7905e-01, -4.7936e-01, -3.9326e-02, -1.0883e+00,
6.6536e-01, 1.6051e-01, -9.6558e-02, -7.4457e-02, -4.1459e-01,
-1.8770e-01, -1.7453e+00, -3.3950e-01, -8.1656e-01, -9.7103e-02,
-8.3305e-01, -1.5187e+00, 7.2177e-01, -1.9412e+00, 3.4085e-01,
-2.0548e+00, 4.9950e-02, -5.6675e-01, -5.7753e-02, -6.4366e-01,
-3.3841e-01, 1.8565e-01, -7.1072e-01, -1.8700e-01, -8.5996e-01,
1.6759e-01, 8.1523e-01, 3.5534e-01, 6.6682e-01, 6.7483e-01,
9.7217e-02, -4.5939e-01, -7.7941e-01, 8.5763e-01, -8.4580e-01,
2.0544e-01, -3.4525e-01, -8.4439e-01, 4.8215e-01, 7.5473e-01,
-2.0392e+00, 1.2164e-01, -8.6227e-01, -8.4100e-01, 4.1555e-01,
-1.6455e+00, -3.8724e-01, 8.8501e-01, -1.4800e+00, 4.4640e-01,
-6.8488e-01, 1.2484e+00, -1.0540e+00, -4.3345e-01, -1.8748e+00,
6.5114e-01, -7.7131e-01, -1.8773e+00, -6.3574e-01, 6.3260e-01,
6.3379e-01, -4.1154e-01, -1.0171e+00, 5.8416e-01, -8.1579e-01,
-9.1071e-01, -3.1034e-01, -3.0416e-01, -6.5502e-01, -4.1040e-01,
1.0924e+00, -9.7041e-01, 1.8744e+00, -1.9735e-01, -2.7804e-03,
-3.6434e-03, -1.9607e-01]], device='cuda:0')}