Skip to content

Commit

Permalink
version 2.5.5
Browse files (browse the repository at this point in the history)
  • Loading branch information
Goekdeniz-Guelmez committed Oct 4, 2024
1 parent 9ffd1a9 commit 00cf104
Show file tree
Hide file tree
Showing 7 changed files with 7 additions and 29 deletions.
7 changes: 4 additions & 3 deletions example-fineweb.ipynb
Original file line number Diff line number Diff line change
Expand Up @@ -31,8 +31,7 @@
"from model.args import MOEModelArgs\n",
"from model.KANaMoEv1 import KANaMoEv1\n",
"\n",
- "from utils import load_model, quick_inference\n",
- "from model.handler import save_pretrained\n",
+ "from model.handler import save_pretrained, quick_inference\n",
"\n",
"device = torch.device(\"cuda\" if torch.cuda.is_available() else \"cpu\")"
]
Expand Down Expand Up @@ -183,7 +182,9 @@
"id": "32cd9a68",
"metadata": {},
"outputs": [],
- "source": []
+ "source": [
+ "save_pretrained(path_to_save=\"fineweb/\", model=new_model)"
+ ]
}
],
"metadata": {
Expand Down
2 changes: 1 addition & 1 deletion example_fineweb.py
Original file line number Diff line number Diff line change
Expand Up @@ -10,7 +10,7 @@
from model.args import MOEModelArgs
from model.KANaMoEv1 import KANaMoEv1

- from utils import load_model, quick_inference
+ from model.handler import from_pretrained, quick_inference

# device = 'cuda' if torch.cuda.is_available() else 'mps' if ( torch.backends.mps.is_available() and torch.backends.mps.is_built() ) else 'cpu'

Expand Down
2 changes: 1 addition & 1 deletion example_tiny_shakspear.py
Original file line number Diff line number Diff line change
Expand Up @@ -9,7 +9,7 @@
from model.args import MOEModelArgs
from model.KANaMoEv1 import KANamav5

- from utils import load_model
+ from model.handler import from_pretrained


def lr_lambda(current_step: int, max_steps: int=50000, warmup_steps: int=40, lr_scheduler_type: str="cosine"):
Expand Down
2 changes: 1 addition & 1 deletion setup.py
Original file line number Diff line number Diff line change
Expand Up @@ -17,7 +17,7 @@
# Setup configuration
setup(
name="KANama",
- version="2.5.0",
+ version="2.5.5",
description="Fusing Kolmogorov–Arnold Networks with Meta's Llama model for next-level AI performance and versatility.",
long_description=open(root_dir / "README.md", encoding="utf-8").read(),
long_description_content_type="text/markdown",
Expand Down
23 changes: 0 additions & 23 deletions test/config.json

This file was deleted.

Binary file removed test/model.pth
Binary file not shown.
File renamed without changes.

0 comments on commit 00cf104

Please sign in to comment.