Last active
April 9, 2024 19:47
-
-
Save yifuwang/961b3a98aeba88e09a34a89f9702b8d7 to your computer and use it in GitHub Desktop.
This file contains bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters
[torch.Size([32000, 8192]), torch.Size([8192, 8192]), torch.Size([1024, 8192]), torch.Size([1024, 8192]), torch.Size([8192, 8192]), torch.Size([28672, 8192]), torch.Size([8192, 28672]), torch.Size([28672, 8192]), torch.Size([8192]), torch.Size([8192]), torch.Size([8192, 8192]), torch.Size([1024, 8192]), torch.Size([1024, 8192]), torch.Size([8192, 8192]), torch.Size([28672, 8192]), torch.Size([8192, 28672]), torch.Size([28672, 8192]), torch.Size([8192]), torch.Size([8192]), torch.Size([8192, 8192]), torch.Size([1024, 8192]), torch.Size([1024, 8192]), torch.Size([8192, 8192]), torch.Size([28672, 8192]), torch.Size([8192, 28672]), torch.Size([28672, 8192]), torch.Size([8192]), torch.Size([8192]), torch.Size([8192, 8192]), torch.Size([1024, 8192]), torch.Size([1024, 8192]), torch.Size([8192, 8192]), torch.Size([28672, 8192]), torch.Size([8192, 28672]), torch.Size([28672, 8192]), torch.Size([8192]), torch.Size([8192]), torch.Size([8192, 8192]), torch.Size([1024, 8192]), torch.Size([1024, 8192]), torch.Size([8192, 8192]), torch.Size([28672, 8192]), torch.Size([8192, 28672]), torch.Size([28672, 8192]), torch.Size([8192]), torch.Size([8192]), torch.Size([8192, 8192]), torch.Size([1024, 8192]), torch.Size([1024, 8192]), torch.Size([8192, 8192]), torch.Size([28672, 8192]), torch.Size([8192, 28672]), torch.Size([28672, 8192]), torch.Size([8192]), torch.Size([8192]), torch.Size([8192, 8192]), torch.Size([1024, 8192]), torch.Size([1024, 8192]), torch.Size([8192, 8192]), torch.Size([28672, 8192]), torch.Size([8192, 28672]), torch.Size([28672, 8192]), torch.Size([8192]), torch.Size([8192]), torch.Size([8192, 8192]), torch.Size([1024, 8192]), torch.Size([1024, 8192]), torch.Size([8192, 8192]), torch.Size([28672, 8192]), torch.Size([8192, 28672]), torch.Size([28672, 8192]), torch.Size([8192]), torch.Size([8192]), torch.Size([8192, 8192]), torch.Size([1024, 8192]), torch.Size([1024, 8192]), torch.Size([8192, 8192]), torch.Size([28672, 8192]), torch.Size([8192, 28672]), torch.Size([28672, 8192]), torch.Size([8192]), torch.Size([8192]), torch.Size([8192, 8192]), torch.Size([1024, 8192]), torch.Size([1024, 8192]), torch.Size([8192, 8192]), torch.Size([28672, 8192]), torch.Size([8192, 28672]), torch.Size([28672, 8192]), torch.Size([8192]), torch.Size([8192]), torch.Size([8192, 8192]), torch.Size([1024, 8192]), torch.Size([1024, 8192]), torch.Size([8192, 8192]), torch.Size([28672, 8192]), torch.Size([8192, 28672]), torch.Size([28672, 8192]), torch.Size([8192]), torch.Size([8192]), torch.Size([8192, 8192]), torch.Size([1024, 8192]), torch.Size([1024, 8192]), torch.Size([8192, 8192]), torch.Size([28672, 8192]), torch.Size([8192, 28672]), torch.Size([28672, 8192]), torch.Size([8192]), torch.Size([8192]), torch.Size([8192, 8192]), torch.Size([1024, 8192]), torch.Size([1024, 8192]), torch.Size([8192, 8192]), torch.Size([28672, 8192]), torch.Size([8192, 28672]), torch.Size([28672, 8192]), torch.Size([8192]), torch.Size([8192]), torch.Size([8192, 8192]), torch.Size([1024, 8192]), torch.Size([1024, 8192]), torch.Size([8192, 8192]), torch.Size([28672, 8192]), torch.Size([8192, 28672]), torch.Size([28672, 8192]), torch.Size([8192]), torch.Size([8192]), torch.Size([8192, 8192]), torch.Size([1024, 8192]), torch.Size([1024, 8192]), torch.Size([8192, 8192]), torch.Size([28672, 8192]), torch.Size([8192, 28672]), torch.Size([28672, 8192]), torch.Size([8192]), torch.Size([8192]), torch.Size([8192, 8192]), torch.Size([1024, 8192]), torch.Size([1024, 8192]), torch.Size([8192, 8192]), torch.Size([28672, 8192]), torch.Size([8192, 28672]), torch.Size([28672, 8192]), torch.Size([8192]), torch.Size([8192]), torch.Size([8192, 8192]), torch.Size([1024, 8192]), torch.Size([1024, 8192]), torch.Size([8192, 8192]), torch.Size([28672, 8192]), torch.Size([8192, 28672]), torch.Size([28672, 8192]), torch.Size([8192]), torch.Size([8192]), torch.Size([8192, 8192]), torch.Size([1024, 8192]), torch.Size([1024, 8192]), torch.Size([8192, 8192]), torch.Size([28672, 8192]), torch.Size([8192, 28672]), torch.Size([28672, 8192]), torch.Size([8192]), torch.Size([8192]), torch.Size([8192, 8192]), torch.Size([1024, 8192]), torch.Size([1024, 8192]), torch.Size([8192, 8192]), torch.Size([28672, 8192]), torch.Size([8192, 28672]), torch.Size([28672, 8192]), torch.Size([8192]), torch.Size([8192]), torch.Size([8192, 8192]), torch.Size([1024, 8192]), torch.Size([1024, 8192]), torch.Size([8192, 8192]), torch.Size([28672, 8192]), torch.Size([8192, 28672]), torch.Size([28672, 8192]), torch.Size([8192]), torch.Size([8192]), torch.Size([8192, 8192]), torch.Size([1024, 8192]), torch.Size([1024, 8192]), torch.Size([8192, 8192]), torch.Size([28672, 8192]), torch.Size([8192, 28672]), torch.Size([28672, 8192]), torch.Size([8192]), torch.Size([8192]), torch.Size([8192, 8192]), torch.Size([1024, 8192]), torch.Size([1024, 8192]), torch.Size([8192, 8192]), torch.Size([28672, 8192]), torch.Size([8192, 28672]), torch.Size([28672, 8192]), torch.Size([8192]), torch.Size([8192]), torch.Size([8192, 8192]), torch.Size([1024, 8192]), torch.Size([1024, 8192]), torch.Size([8192, 8192]), torch.Size([28672, 8192]), torch.Size([8192, 28672]), torch.Size([28672, 8192]), torch.Size([8192]), torch.Size([8192]), torch.Size([8192, 8192]), torch.Size([1024, 8192]), torch.Size([1024, 8192]), torch.Size([8192, 8192]), torch.Size([28672, 8192]), torch.Size([8192, 28672]), torch.Size([28672, 8192]), torch.Size([8192]), torch.Size([8192]), torch.Size([8192, 8192]), torch.Size([1024, 8192]), torch.Size([1024, 8192]), torch.Size([8192, 8192]), torch.Size([28672, 8192]), torch.Size([8192, 28672]), torch.Size([28672, 8192]), torch.Size([8192]), torch.Size([8192]), torch.Size([8192, 8192]), torch.Size([1024, 8192]), torch.Size([1024, 8192]), torch.Size([8192, 8192]), torch.Size([28672, 8192]), torch.Size([8192, 28672]), torch.Size([28672, 8192]), torch.Size([8192]), torch.Size([8192]), torch.Size([8192, 8192]), torch.Size([1024, 8192]), torch.Size([1024, 8192]), torch.Size([8192, 8192]), torch.Size([28672, 8192]), torch.Size([8192, 28672]), torch.Size([28672, 8192]), torch.Size([8192]), torch.Size([8192]), torch.Size([8192, 8192]), torch.Size([1024, 8192]), torch.Size([1024, 8192]), torch.Size([8192, 8192]), torch.Size([28672, 8192]), torch.Size([8192, 28672]), torch.Size([28672, 8192]), torch.Size([8192]), torch.Size([8192]), torch.Size([8192, 8192]), torch.Size([1024, 8192]), torch.Size([1024, 8192]), torch.Size([8192, 8192]), torch.Size([28672, 8192]), torch.Size([8192, 28672]), torch.Size([28672, 8192]), torch.Size([8192]), torch.Size([8192]), torch.Size([8192, 8192]), torch.Size([1024, 8192]), torch.Size([1024, 8192]), torch.Size([8192, 8192]), torch.Size([28672, 8192]), torch.Size([8192, 28672]), torch.Size([28672, 8192]), torch.Size([8192]), torch.Size([8192]), torch.Size([8192, 8192]), torch.Size([1024, 8192]), torch.Size([1024, 8192]), torch.Size([8192, 8192]), torch.Size([28672, 8192]), torch.Size([8192, 28672]), torch.Size([28672, 8192]), torch.Size([8192]), torch.Size([8192]), torch.Size([8192, 8192]), torch.Size([1024, 8192]), torch.Size([1024, 8192]), torch.Size([8192, 8192]), torch.Size([28672, 8192]), torch.Size([8192, 28672]), torch.Size([28672, 8192]), torch.Size([8192]), torch.Size([8192]), torch.Size([8192, 8192]), torch.Size([1024, 8192]), torch.Size([1024, 8192]), torch.Size([8192, 8192]), torch.Size([28672, 8192]), torch.Size([8192, 28672]), torch.Size([28672, 8192]), torch.Size([8192]), torch.Size([8192]), torch.Size([8192, 8192]), torch.Size([1024, 8192]), torch.Size([1024, 8192]), torch.Size([8192, 8192]), torch.Size([28672, 8192]), torch.Size([8192, 28672]), torch.Size([28672, 8192]), torch.Size([8192]), torch.Size([8192]), torch.Size([8192, 8192]), torch.Size([1024, 8192]), torch.Size([1024, 8192]), torch.Size([8192, 8192]), torch.Size([28672, 8192]), torch.Size([8192, 28672]), torch.Size([28672, 8192]), torch.Size([8192]), torch.Size([8192]), torch.Size([8192, 8192]), torch.Size([1024, 8192]), torch.Size([1024, 8192]), torch.Size([8192, 8192]), torch.Size([28672, 8192]), torch.Size([8192, 28672]), torch.Size([28672, 8192]), torch.Size([8192]), torch.Size([8192]), torch.Size([8192, 8192]), torch.Size([1024, 8192]), torch.Size([1024, 8192]), torch.Size([8192, 8192]), torch.Size([28672, 8192]), torch.Size([8192, 28672]), torch.Size([28672, 8192]), torch.Size([8192]), torch.Size([8192]), torch.Size([8192, 8192]), torch.Size([1024, 8192]), torch.Size([1024, 8192]), torch.Size([8192, 8192]), torch.Size([28672, 8192]), torch.Size([8192, 28672]), torch.Size([28672, 8192]), torch.Size([8192]), torch.Size([8192]), torch.Size([8192, 8192]), torch.Size([1024, 8192]), torch.Size([1024, 8192]), torch.Size([8192, 8192]), torch.Size([28672, 8192]), torch.Size([8192, 28672]), torch.Size([28672, 8192]), torch.Size([8192]), torch.Size([8192]), torch.Size([8192, 8192]), torch.Size([1024, 8192]), torch.Size([1024, 8192]), torch.Size([8192, 8192]), torch.Size([28672, 8192]), torch.Size([8192, 28672]), torch.Size([28672, 8192]), torch.Size([8192]), torch.Size([8192]), torch.Size([8192, 8192]), torch.Size([1024, 8192]), torch.Size([1024, 8192]), torch.Size([8192, 8192]), torch.Size([28672, 8192]), torch.Size([8192, 28672]), torch.Size([28672, 8192]), torch.Size([8192]), torch.Size([8192]), torch.Size([8192, 8192]), torch.Size([1024, 8192]), torch.Size([1024, 8192]), torch.Size([8192, 8192]), torch.Size([28672, 8192]), torch.Size([8192, 28672]), torch.Size([28672, 8192]), torch.Size([8192]), torch.Size([8192]), torch.Size([8192, 8192]), torch.Size([1024, 8192]), torch.Size([1024, 8192]), torch.Size([8192, 8192]), torch.Size([28672, 8192]), torch.Size([8192, 28672]), torch.Size([28672, 8192]), torch.Size([8192]), torch.Size([8192]), torch.Size([8192, 8192]), torch.Size([1024, 8192]), torch.Size([1024, 8192]), torch.Size([8192, 8192]), torch.Size([28672, 8192]), torch.Size([8192, 28672]), torch.Size([28672, 8192]), torch.Size([8192]), torch.Size([8192]), torch.Size([8192, 8192]), torch.Size([1024, 8192]), torch.Size([1024, 8192]), torch.Size([8192, 8192]), torch.Size([28672, 8192]), torch.Size([8192, 28672]), torch.Size([28672, 8192]), torch.Size([8192]), torch.Size([8192]), torch.Size([8192, 8192]), torch.Size([1024, 8192]), torch.Size([1024, 8192]), torch.Size([8192, 8192]), torch.Size([28672, 8192]), torch.Size([8192, 28672]), torch.Size([28672, 8192]), torch.Size([8192]), torch.Size([8192]), torch.Size([8192, 8192]), torch.Size([1024, 8192]), torch.Size([1024, 8192]), torch.Size([8192, 8192]), torch.Size([28672, 8192]), torch.Size([8192, 28672]), torch.Size([28672, 8192]), torch.Size([8192]), torch.Size([8192]), torch.Size([8192, 8192]), torch.Size([1024, 8192]), torch.Size([1024, 8192]), torch.Size([8192, 8192]), torch.Size([28672, 8192]), torch.Size([8192, 28672]), torch.Size([28672, 8192]), torch.Size([8192]), torch.Size([8192]), torch.Size([8192, 8192]), torch.Size([1024, 8192]), torch.Size([1024, 8192]), torch.Size([8192, 8192]), torch.Size([28672, 8192]), torch.Size([8192, 28672]), torch.Size([28672, 8192]), torch.Size([8192]), torch.Size([8192]), torch.Size([8192, 8192]), torch.Size([1024, 8192]), torch.Size([1024, 8192]), torch.Size([8192, 8192]), torch.Size([28672, 8192]), torch.Size([8192, 28672]), torch.Size([28672, 8192]), torch.Size([8192]), torch.Size([8192]), torch.Size([8192, 8192]), torch.Size([1024, 8192]), torch.Size([1024, 8192]), torch.Size([8192, 8192]), torch.Size([28672, 8192]), torch.Size([8192, 28672]), torch.Size([28672, 8192]), torch.Size([8192]), torch.Size([8192]), torch.Size([8192, 8192]), torch.Size([1024, 8192]), torch.Size([1024, 8192]), torch.Size([8192, 8192]), torch.Size([28672, 8192]), torch.Size([8192, 28672]), torch.Size([28672, 8192]), torch.Size([8192]), torch.Size([8192]), torch.Size([8192, 8192]), torch.Size([1024, 8192]), torch.Size([1024, 8192]), torch.Size([8192, 8192]), torch.Size([28672, 8192]), torch.Size([8192, 28672]), torch.Size([28672, 8192]), torch.Size([8192]), torch.Size([8192]), torch.Size([8192, 8192]), torch.Size([1024, 8192]), torch.Size([1024, 8192]), torch.Size([8192, 8192]), torch.Size([28672, 8192]), torch.Size([8192, 28672]), torch.Size([28672, 8192]), torch.Size([8192]), torch.Size([8192]), torch.Size([8192, 8192]), torch.Size([1024, 8192]), torch.Size([1024, 8192]), torch.Size([8192, 8192]), torch.Size([28672, 8192]), torch.Size([8192, 28672]), torch.Size([28672, 8192]), torch.Size([8192]), torch.Size([8192]), torch.Size([8192, 8192]), torch.Size([1024, 8192]), torch.Size([1024, 8192]), torch.Size([8192, 8192]), torch.Size([28672, 8192]), torch.Size([8192, 28672]), torch.Size([28672, 8192]), torch.Size([8192]), torch.Size([8192]), torch.Size([8192, 8192]), torch.Size([1024, 8192]), torch.Size([1024, 8192]), torch.Size([8192, 8192]), torch.Size([28672, 8192]), torch.Size([8192, 28672]), torch.Size([28672, 8192]), torch.Size([8192]), torch.Size([8192]), torch.Size([8192, 8192]), torch.Size([1024, 8192]), torch.Size([1024, 8192]), torch.Size([8192, 8192]), torch.Size([28672, 8192]), torch.Size([8192, 28672]), torch.Size([28672, 8192]), torch.Size([8192]), torch.Size([8192]), torch.Size([8192, 8192]), torch.Size([1024, 8192]), torch.Size([1024, 8192]), torch.Size([8192, 8192]), torch.Size([28672, 8192]), torch.Size([8192, 28672]), torch.Size([28672, 8192]), torch.Size([8192]), torch.Size([8192]), torch.Size([8192, 8192]), torch.Size([1024, 8192]), torch.Size([1024, 8192]), torch.Size([8192, 8192]), torch.Size([28672, 8192]), torch.Size([8192, 28672]), torch.Size([28672, 8192]), torch.Size([8192]), torch.Size([8192]), torch.Size([8192, 8192]), torch.Size([1024, 8192]), torch.Size([1024, 8192]), torch.Size([8192, 8192]), torch.Size([28672, 8192]), torch.Size([8192, 28672]), torch.Size([28672, 8192]), torch.Size([8192]), torch.Size([8192]), torch.Size([8192, 8192]), torch.Size([1024, 8192]), torch.Size([1024, 8192]), torch.Size([8192, 8192]), torch.Size([28672, 8192]), torch.Size([8192, 28672]), torch.Size([28672, 8192]), torch.Size([8192]), torch.Size([8192]), torch.Size([8192, 8192]), torch.Size([1024, 8192]), torch.Size([1024, 8192]), torch.Size([8192, 8192]), torch.Size([28672, 8192]), torch.Size([8192, 28672]), torch.Size([28672, 8192]), torch.Size([8192]), torch.Size([8192]), torch.Size([8192, 8192]), torch.Size([1024, 8192]), torch.Size([1024, 8192]), torch.Size([8192, 8192]), torch.Size([28672, 8192]), torch.Size([8192, 28672]), torch.Size([28672, 8192]), torch.Size([8192]), torch.Size([8192]), torch.Size([8192, 8192]), torch.Size([1024, 8192]), torch.Size([1024, 8192]), torch.Size([8192, 8192]), torch.Size([28672, 8192]), torch.Size([8192, 28672]), torch.Size([28672, 8192]), torch.Size([8192]), torch.Size([8192]), torch.Size([8192, 8192]), torch.Size([1024, 8192]), torch.Size([1024, 8192]), torch.Size([8192, 8192]), torch.Size([28672, 8192]), torch.Size([8192, 28672]), torch.Size([28672, 8192]), torch.Size([8192]), torch.Size([8192]), torch.Size([8192, 8192]), torch.Size([1024, 8192]), torch.Size([1024, 8192]), torch.Size([8192, 8192]), torch.Size([28672, 8192]), torch.Size([8192, 28672]), torch.Size([28672, 8192]), torch.Size([8192]), torch.Size([8192]), torch.Size([8192, 8192]), torch.Size([1024, 8192]), torch.Size([1024, 8192]), torch.Size([8192, 8192]), torch.Size([28672, 8192]), torch.Size([8192, 28672]), torch.Size([28672, 8192]), torch.Size([8192]), torch.Size([8192]), torch.Size([8192, 8192]), torch.Size([1024, 8192]), torch.Size([1024, 8192]), torch.Size([8192, 8192]), torch.Size([28672, 8192]), torch.Size([8192, 28672]), torch.Size([28672, 8192]), torch.Size([8192]), torch.Size([8192]), torch.Size([8192, 8192]), torch.Size([1024, 8192]), torch.Size([1024, 8192]), torch.Size([8192, 8192]), torch.Size([28672, 8192]), torch.Size([8192, 28672]), torch.Size([28672, 8192]), torch.Size([8192]), torch.Size([8192]), torch.Size([8192, 8192]), torch.Size([1024, 8192]), torch.Size([1024, 8192]), torch.Size([8192, 8192]), torch.Size([28672, 8192]), torch.Size([8192, 28672]), torch.Size([28672, 8192]), torch.Size([8192]), torch.Size([8192]), torch.Size([8192, 8192]), torch.Size([1024, 8192]), torch.Size([1024, 8192]), torch.Size([8192, 8192]), torch.Size([28672, 8192]), torch.Size([8192, 28672]), torch.Size([28672, 8192]), torch.Size([8192]), torch.Size([8192]), torch.Size([8192, 8192]), torch.Size([1024, 8192]), torch.Size([1024, 8192]), torch.Size([8192, 8192]), torch.Size([28672, 8192]), torch.Size([8192, 28672]), torch.Size([28672, 8192]), torch.Size([8192]), torch.Size([8192]), torch.Size([8192, 8192]), torch.Size([1024, 8192]), torch.Size([1024, 8192]), torch.Size([8192, 8192]), torch.Size([28672, 8192]), torch.Size([8192, 28672]), torch.Size([28672, 8192]), torch.Size([8192]), torch.Size([8192]), torch.Size([8192, 8192]), torch.Size([1024, 8192]), torch.Size([1024, 8192]), torch.Size([8192, 8192]), torch.Size([28672, 8192]), torch.Size([8192, 28672]), torch.Size([28672, 8192]), torch.Size([8192]), torch.Size([8192]), torch.Size([8192, 8192]), torch.Size([1024, 8192]), torch.Size([1024, 8192]), torch.Size([8192, 8192]), torch.Size([28672, 8192]), torch.Size([8192, 28672]), torch.Size([28672, 8192]), torch.Size([8192]), torch.Size([8192]), torch.Size([8192, 8192]), torch.Size([1024, 8192]), torch.Size([1024, 8192]), torch.Size([8192, 8192]), torch.Size([28672, 8192]), torch.Size([8192, 28672]), torch.Size([28672, 8192]), torch.Size([8192]), torch.Size([8192]), torch.Size([8192, 8192]), torch.Size([1024, 8192]), torch.Size([1024, 8192]), torch.Size([8192, 8192]), torch.Size([28672, 8192]), torch.Size([8192, 28672]), torch.Size([28672, 8192]), torch.Size([8192]), torch.Size([8192]), torch.Size([8192, 8192]), torch.Size([1024, 8192]), torch.Size([1024, 8192]), torch.Size([8192, 8192]), torch.Size([28672, 8192]), torch.Size([8192, 28672]), torch.Size([28672, 8192]), torch.Size([8192]), torch.Size([8192]), torch.Size([8192, 8192]), torch.Size([1024, 8192]), torch.Size([1024, 8192]), torch.Size([8192, 8192]), torch.Size([28672, 8192]), torch.Size([8192, 28672]), torch.Size([28672, 8192]), torch.Size([8192]), torch.Size([8192]), torch.Size([8192]), torch.Size([32000, 8192])] |
Sign up for free
to join this conversation on GitHub.
Already have an account?
Sign in to comment