0527
@@ -0,0 +1,21 @@
|
|||||||
|
MIT License
|
||||||
|
|
||||||
|
Copyright (c) 2024 Nishant Aklecha
|
||||||
|
|
||||||
|
Permission is hereby granted, free of charge, to any person obtaining a copy
|
||||||
|
of this software and associated documentation files (the "Software"), to deal
|
||||||
|
in the Software without restriction, including without limitation the rights
|
||||||
|
to use, copy, modify, merge, publish, distribute, sublicense, and/or sell
|
||||||
|
copies of the Software, and to permit persons to whom the Software is
|
||||||
|
furnished to do so, subject to the following conditions:
|
||||||
|
|
||||||
|
The above copyright notice and this permission notice shall be included in all
|
||||||
|
copies or substantial portions of the Software.
|
||||||
|
|
||||||
|
THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
|
||||||
|
IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
|
||||||
|
FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL THE
|
||||||
|
AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
|
||||||
|
LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM,
|
||||||
|
OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN THE
|
||||||
|
SOFTWARE.
|
||||||
|
After Width: | Height: | Size: 773 KiB |
|
After Width: | Height: | Size: 634 KiB |
|
After Width: | Height: | Size: 289 KiB |
|
After Width: | Height: | Size: 846 KiB |
|
After Width: | Height: | Size: 202 KiB |
|
After Width: | Height: | Size: 470 KiB |
|
After Width: | Height: | Size: 799 KiB |
|
After Width: | Height: | Size: 814 KiB |
|
After Width: | Height: | Size: 1.2 MiB |
|
After Width: | Height: | Size: 800 KiB |
|
After Width: | Height: | Size: 49 KiB |
|
After Width: | Height: | Size: 27 KiB |
|
After Width: | Height: | Size: 26 KiB |
|
After Width: | Height: | Size: 27 KiB |
|
After Width: | Height: | Size: 27 KiB |
|
After Width: | Height: | Size: 26 KiB |
|
After Width: | Height: | Size: 27 KiB |
|
After Width: | Height: | Size: 787 KiB |
|
After Width: | Height: | Size: 430 KiB |
|
After Width: | Height: | Size: 423 KiB |
|
After Width: | Height: | Size: 1004 KiB |
|
After Width: | Height: | Size: 472 KiB |
|
After Width: | Height: | Size: 659 KiB |
|
After Width: | Height: | Size: 309 KiB |
|
After Width: | Height: | Size: 297 KiB |
|
After Width: | Height: | Size: 484 KiB |
|
After Width: | Height: | Size: 189 KiB |
|
After Width: | Height: | Size: 497 KiB |
|
After Width: | Height: | Size: 551 KiB |
|
After Width: | Height: | Size: 341 KiB |
|
After Width: | Height: | Size: 516 KiB |
|
After Width: | Height: | Size: 401 KiB |
|
After Width: | Height: | Size: 191 KiB |
|
After Width: | Height: | Size: 384 KiB |
|
After Width: | Height: | Size: 605 KiB |
|
After Width: | Height: | Size: 488 KiB |
|
After Width: | Height: | Size: 188 KiB |
|
After Width: | Height: | Size: 200 KiB |
|
After Width: | Height: | Size: 380 KiB |
@@ -0,0 +1,11 @@
|
|||||||
|
{
|
||||||
|
"dim": 4096,
|
||||||
|
"n_layers": 32,
|
||||||
|
"n_heads": 32,
|
||||||
|
"n_kv_heads": 8,
|
||||||
|
"vocab_size": 128256,
|
||||||
|
"multiple_of": 1024,
|
||||||
|
"ffn_dim_multiplier": 1.3,
|
||||||
|
"norm_eps": 1e-05,
|
||||||
|
"rope_theta": 500000.0
|
||||||
|
}
|
||||||
@@ -0,0 +1,9 @@
|
|||||||
|
{'dim': 4096,
|
||||||
|
'n_layers': 32,
|
||||||
|
'n_heads': 32,
|
||||||
|
'n_kv_heads': 8,
|
||||||
|
'vocab_size': 128256,
|
||||||
|
'multiple_of': 1024,
|
||||||
|
'ffn_dim_multiplier': 1.3,
|
||||||
|
'norm_eps': 1e-05,
|
||||||
|
'rope_theta': 500000.0}
|
||||||
@@ -0,0 +1,5 @@
|
|||||||
|
sentencepiece
|
||||||
|
tiktoken
|
||||||
|
torch
|
||||||
|
blobfile
|
||||||
|
matplotlib
|
||||||