aboutsummaryrefslogtreecommitdiff
diff options
context:
space:
mode:
-rw-r--r--.gitignore4
-rw-r--r--flake.lock43
-rw-r--r--flake.nix48
3 files changed, 95 insertions, 0 deletions
diff --git a/.gitignore b/.gitignore
index 5eb1ff1..3087b0e 100644
--- a/.gitignore
+++ b/.gitignore
@@ -18,6 +18,10 @@ models/*
/main
/quantize
+/result
arm_neon.h
compile_commands.json
+
+.envrc
+.direnv/
diff --git a/flake.lock b/flake.lock
new file mode 100644
index 0000000..343996d
--- /dev/null
+++ b/flake.lock
@@ -0,0 +1,43 @@
+{
+ "nodes": {
+ "flake-utils": {
+ "locked": {
+ "lastModified": 1676283394,
+ "narHash": "sha256-XX2f9c3iySLCw54rJ/CZs+ZK6IQy7GXNY4nSOyu2QG4=",
+ "owner": "numtide",
+ "repo": "flake-utils",
+ "rev": "3db36a8b464d0c4532ba1c7dda728f4576d6d073",
+ "type": "github"
+ },
+ "original": {
+ "owner": "numtide",
+ "repo": "flake-utils",
+ "type": "github"
+ }
+ },
+ "nixpkgs": {
+ "locked": {
+ "lastModified": 1678470307,
+ "narHash": "sha256-OEeMUr3ueLIXyW/OaFUX5jUdimyQwMg/7e+/Q0gC/QE=",
+ "owner": "NixOS",
+ "repo": "nixpkgs",
+ "rev": "0c4800d579af4ed98ecc47d464a5e7b0870c4b1f",
+ "type": "github"
+ },
+ "original": {
+ "owner": "NixOS",
+ "ref": "nixos-unstable",
+ "repo": "nixpkgs",
+ "type": "github"
+ }
+ },
+ "root": {
+ "inputs": {
+ "flake-utils": "flake-utils",
+ "nixpkgs": "nixpkgs"
+ }
+ }
+ },
+ "root": "root",
+ "version": 7
+}
diff --git a/flake.nix b/flake.nix
new file mode 100644
index 0000000..dae4ff6
--- /dev/null
+++ b/flake.nix
@@ -0,0 +1,48 @@
+{
+ inputs = {
+ nixpkgs.url = "github:NixOS/nixpkgs/nixos-unstable";
+ flake-utils.url = "github:numtide/flake-utils";
+ };
+ outputs = { self, nixpkgs, flake-utils }:
+ flake-utils.lib.eachDefaultSystem (system:
+ let
+ pkgs = import nixpkgs {
+ inherit system;
+ };
+ llama-python = pkgs.python310.withPackages (ps: with ps; [
+ torch
+ numpy
+ sentencepiece
+ ]);
+ in
+ {
+ packages.default = pkgs.stdenv.mkDerivation {
+ name = "llama.cpp";
+ src = ./.;
+ nativeBuildInputs = with pkgs; [ cmake ];
+ buildInputs = with pkgs; lib.optionals stdenv.isDarwin [
+ darwin.apple_sdk.frameworks.Accelerate
+ ];
+ cmakeFlags = with pkgs; lib.optionals (system == "aarch64-darwin") [
+ "-DCMAKE_C_FLAGS=-D__ARM_FEATURE_DOTPROD=1"
+ ];
+ installPhase = ''
+ mkdir -p $out/bin
+ mv llama $out/bin/llama
+ mv quantize $out/bin/quantize
+ echo "#!${llama-python}/bin/python" > $out/bin/convert-pth-to-ggml
+ cat ${./convert-pth-to-ggml.py} >> $out/bin/convert-pth-to-ggml
+ chmod +x $out/bin/convert-pth-to-ggml
+ '';
+ };
+ devShells.default = pkgs.mkShell {
+ packages = with pkgs; [
+ cmake
+ llama-python
+ ] ++ lib.optionals stdenv.isDarwin [
+ darwin.apple_sdk.frameworks.Accelerate
+ ];
+ };
+ }
+ );
+}