···
"${pkgs.ollama}/bin/ollama"
+
toEnvironmentCfg = vars: mapAttrsToList (k: v: "${k}=${escapeShellArg v}") vars;
+
OLLAMA_HOST = cfg.ollama.host;
+
OLLAMA_FLASH_ATTENTION = if cfg.ollama.flashAttention then "1" else "0";
+
OLLAMA_SCHED_SPREAD = if cfg.ollama.schedSpread then "1" else "0";
+
OLLAMA_INTEL_GPU = if cfg.ollama.intelGpu then "1" else "0";
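# A minimal sketch of what toEnvironmentCfg yields for the env attrset above,
# assuming flashAttention = true and schedSpread = intelGpu = false. Note that
# escapeShellArg single-quotes each value and mapAttrsToList visits attribute
# names in alphabetical order:
#
#   toEnvironmentCfg env
#   => [
#        "OLLAMA_FLASH_ATTENTION='1'"
#        "OLLAMA_HOST='http://0.0.0.0:11434'"
#        "OLLAMA_INTEL_GPU='0'"
#        "OLLAMA_SCHED_SPREAD='0'"
#      ]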
options.modules.apps.ollama = {
···
description = "Whether to enable Ollama.";
+
default = "http://0.0.0.0:11434";
+
description = "Determines the host and port to listen on";
+
flashAttention = mkOption {
+
Enables experimental flash att ention feature.
+
Effect: Activates an experimental optimization for attention mechanisms.
+
Scenario: Can potentially improve performance on compatible hardware but may introduce instability.
+
schedSpread = mkOption {
+
Allows scheduling models across all GPUs.
+
Effect: Enables multi-GPU usage for model inference.
+
Scenario: Beneficial in high-performance computing environments with multiple GPUs to maximize hardware utilization.
+
Enables experimental Intel GPU detection.
+
Effect: Allows usage of Intel GPUs for model inference.
+
Scenario: Useful for organizations leveraging Intel GPU hardware for AI workloads.
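# A hypothetical user-side sketch of these options (the host/port value and the
# surrounding configuration are assumptions, not part of this module):
#
#   modules.apps = {
#     enable = true;              # parent switch checked by the mkIf below
#     ollama = {
#       enable = true;
#       host = "http://127.0.0.1:11434";
#       flashAttention = true;    # experimental; may be unstable
#       schedSpread = false;
#       intelGpu = false;
#     };
#   };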
config = mkIf (cfg.enable && cfg.ollama.enable) (mkMerge [
···
Install.WantedBy = [ "default.target" ];

Environment = toEnvironmentCfg env;
ExecStart = escapeShellArgs ollamaArgs;
···
launchd.agents.ollama = {

EnvironmentVariables = env;
ProcessType = "Background";
ProgramArguments = ollamaArgs;
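# Why the two shapes differ: systemd Environment= entries are flat "KEY=value"
# strings, so the attrset is run through toEnvironmentCfg and the command line
# is shell-escaped into a single ExecStart string, while launchd's
# EnvironmentVariables key is already a dictionary and ProgramArguments a plain
# argv list, so env and ollamaArgs pass through untouched. A rough sketch of
# the rendered systemd side (store path and trailing arguments are assumptions,
# not taken from this module):
#
#   [Service]
#   Environment=OLLAMA_FLASH_ATTENTION='1'
#   Environment=OLLAMA_HOST='http://0.0.0.0:11434'
#   ...
#   ExecStart='/nix/store/...-ollama-.../bin/ollama' ...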