From 69d0075f264ff24c5dc6a525998b156e78331560 Mon Sep 17 00:00:00 2001 From: OlivierDehaene <23298448+OlivierDehaene@users.noreply.github.com> Date: Fri, 29 Nov 2024 17:43:30 +0100 Subject: [PATCH] feat: proof of concept --- .gitignore | 166 ++++++++++++++++++++++++++++++++++++++++++++ README.md | 16 +++++ kernels/__init__.py | 3 + kernels/utils.py | 31 +++++++++ pyproject.toml | 16 +++++ 5 files changed, 232 insertions(+) create mode 100644 .gitignore create mode 100644 kernels/__init__.py create mode 100644 kernels/utils.py create mode 100644 pyproject.toml diff --git a/.gitignore b/.gitignore new file mode 100644 index 0000000..9a43d99 --- /dev/null +++ b/.gitignore @@ -0,0 +1,166 @@ +# Byte-compiled / optimized / DLL files +__pycache__/ +text_generation_server/__pycache__/ +text_generation_server/pb/__pycache__/ +*.py[cod] +*$py.class + +# C extensions +*.so + +# Distribution / packaging +.Python +build/ +develop-eggs/ +dist/ +downloads/ +eggs/ +.eggs/ +lib/ +lib64/ +parts/ +sdist/ +var/ +wheels/ +share/python-wheels/ +*.egg-info/ +.installed.cfg +*.egg +MANIFEST + +# PyInstaller +# Usually these files are written by a python script from a template +# before PyInstaller builds the exe, so as to inject date/other infos into it. 
+*.manifest +*.spec + +# Installer logs +pip-log.txt +pip-delete-this-directory.txt + +# Unit test / coverage reports +htmlcov/ +.tox/ +.nox/ +.coverage +.coverage.* +.cache +nosetests.xml +coverage.xml +*.cover +*.py,cover +.hypothesis/ +.pytest_cache/ +cover/ + +# Translations +*.mo +*.pot + +# Django stuff: +*.log +local_settings.py +db.sqlite3 +db.sqlite3-journal + +# Flask stuff: +instance/ +.webassets-cache + +# Scrapy stuff: +.scrapy + +# Sphinx documentation +docs/_build/ + +# PyBuilder +.pybuilder/ +target/ + +# Jupyter Notebook +.ipynb_checkpoints + +# IPython +profile_default/ +ipython_config.py + +# pyenv +# For a library or package, you might want to ignore these files since the code is +# intended to run in multiple environments; otherwise, check them in: +# .python-version + +# pipenv +# According to pypa/pipenv#598, it is recommended to include Pipfile.lock in version control. +# However, in case of collaboration, if having platform-specific dependencies or dependencies +# having no cross-platform support, pipenv may install dependencies that don't work, or not +# install all needed dependencies. +#Pipfile.lock + +# poetry +# Similar to Pipfile.lock, it is generally recommended to include poetry.lock in version control. +# This is especially recommended for binary packages to ensure reproducibility, and is more +# commonly ignored for libraries. +# https://python-poetry.org/docs/basic-usage/#commit-your-poetrylock-file-to-version-control +#poetry.lock + +# pdm +# Similar to Pipfile.lock, it is generally recommended to include pdm.lock in version control. +#pdm.lock +# pdm stores project-wide configurations in .pdm.toml, but it is recommended to not include it +# in version control. +# https://pdm.fming.dev/#use-with-ide +.pdm.toml + +# PEP 582; used by e.g. 
def torch_version():
    """Return the installed PyTorch version as a parsed version object.

    The value is ``packaging.version.parse(torch.__version__)``; callers that
    need text (for example to build a directory name) format it with ``str()``.
    """
    return parse(torch.__version__)


def import_from_path(module_name, file_path):
    """Execute the Python source at *file_path* and register it as a module.

    Args:
        module_name: Key under which the module is stored in ``sys.modules``.
        file_path: Location of the source file to load.

    Returns:
        The module object produced by executing the file.

    Raises:
        ImportError: If no import spec (or no loader) can be created for
            *file_path*, e.g. because the file suffix is not importable.
    """
    # ``import importlib`` alone does not guarantee that the ``util``
    # submodule is bound as an attribute, so import it explicitly here.
    import importlib.util

    spec = importlib.util.spec_from_file_location(module_name, file_path)
    if spec is None or spec.loader is None:
        raise ImportError(
            f"Cannot create an import spec for {module_name!r} from {file_path!r}",
            name=module_name,
        )

    module = importlib.util.module_from_spec(spec)

    # The module must be visible in ``sys.modules`` while it executes, but a
    # failed execution must not leave a half-initialised entry behind.
    previous = sys.modules.get(module_name)
    sys.modules[module_name] = module
    try:
        spec.loader.exec_module(module)
    except BaseException:
        if previous is None:
            sys.modules.pop(module_name, None)
        else:
            sys.modules[module_name] = previous
        raise
    return module


def get_kernel(repo_id: str):
    """Download a kernel repository from the Hugging Face Hub and import it.

    The shared objects under ``build/<torch version>/`` are fetched with
    ``snapshot_download``, that directory is added to ``sys.path``, and the
    repository's ``api.py`` is then downloaded and executed.

    Args:
        repo_id: Hub repository identifier, e.g. ``"kernels-community/layer-norm"``.

    Returns:
        The module obtained by executing the repository's ``api.py``.

    Note:
        The module is always registered as ``"api"``, so each call replaces
        the previous ``sys.modules["api"]`` entry.
    """
    # Resolve the version once so the download pattern and the import path
    # are guaranteed to refer to the same build directory.
    version = torch_version()

    snapshot_dir = snapshot_download(
        repo_id,
        allow_patterns=f"build/{version}/*.so",
    )

    build_dir = str(Path(snapshot_dir) / "build" / str(version))
    # Repeated calls must not keep growing ``sys.path`` with duplicates.
    # NOTE(review): presumably ``api.py`` imports the compiled extension by
    # name from this directory - confirm against a kernel repository.
    if build_dir not in sys.path:
        sys.path.append(build_dir)

    api_path = hf_hub_download(repo_id, filename="api.py")
    return import_from_path("api", api_path)