forked from DGNum/infrastructure
feat(krz01): move ollama to compute01 via a reverse proxy
krz01 has no public web IP.

Signed-off-by: Ryan Lahfa <ryan@dgnum.eu>
This commit is contained in:
parent
363f8d3c67
commit
a4de5f4d31
4 changed files with 38 additions and 26 deletions
|
@@ -21,6 +21,7 @@ lib.extra.mkConfig {
|
|||
"librenms"
|
||||
"mastodon"
|
||||
"nextcloud"
|
||||
"ollama-proxy"
|
||||
"outline"
|
||||
"plausible"
|
||||
"postgresql"
|
||||
|
|
27
machines/compute01/ollama-proxy.nix
Normal file
27
machines/compute01/ollama-proxy.nix
Normal file
|
@@ -0,0 +1,27 @@
|
|||
# NixOS module (machines/compute01/ollama-proxy.nix): nginx reverse proxy that
# serves ollama01.beta.dgnum.eu and forwards requests to the ollama instance
# configured on krz01.
#
# Module arguments used below:
#   pkgs  - provides writeText, used to generate the htpasswd file
#   nodes - used to read krz01's configured ollama port
#   meta  - used to read krz01's netbird IP
{
|
||||
pkgs,
|
||||
nodes,
|
||||
meta,
|
||||
...
|
||||
}:
|
||||
{
|
||||
# nginx front end for the ollama virtual host.
services.nginx = {
|
||||
enable = true;
|
||||
recommendedProxySettings = true;
|
||||
virtualHosts."ollama01.beta.dgnum.eu" = {
|
||||
# TLS: certificate obtained through ACME, HTTPS enforced for this host.
enableACME = true;
|
||||
forceSSL = true;
|
||||
locations."/" = {
|
||||
# Upstream is krz01's ollama: host is krz01's netbird IP, port is taken
# from krz01's own services.ollama configuration.
proxyPass = "http://${meta.network.krz01.netbirdIp}:${toString nodes.krz01.config.services.ollama.port}";
|
||||
# HTTP basic auth backed by a generated htpasswd file with a single entry
# (user name followed by a password hash).
# NOTE(review): pkgs.writeText output lives in the Nix store, so the hash is
# readable by anything that can read the store - confirm this is acceptable
# or move it to the repository's secret management.
basicAuthFile = pkgs.writeText "ollama-htpasswd" ''
|
||||
raito:$y$j9T$UDEHpLtM52hRGK0I4qT6M0$N75AhENLqgtJnTGaPzq51imhjZvuPr.ow81Co1ZTcX2
|
||||
'';
|
||||
};
|
||||
};
|
||||
};
|
||||
|
||||
# Open the HTTP and HTTPS ports on the host firewall.
# Presumably port 80 is kept for ACME challenges and the HTTP->HTTPS redirect -
# TODO confirm.
networking.firewall.allowedTCPPorts = [
|
||||
80
|
||||
443
|
||||
];
|
||||
}
|
|
@@ -2,6 +2,8 @@
|
|||
config,
|
||||
lib,
|
||||
pkgs,
|
||||
meta,
|
||||
name,
|
||||
...
|
||||
}:
|
||||
|
||||
|
@@ -59,22 +61,9 @@ lib.extra.mkConfig {
|
|||
];
|
||||
|
||||
services = {
|
||||
nginx = {
|
||||
enable = true;
|
||||
recommendedProxySettings = true;
|
||||
virtualHosts."ollama01.beta.dgnum.eu" = {
|
||||
enableACME = true;
|
||||
forceSSL = true;
|
||||
locations."/" = {
|
||||
proxyPass = "http://${config.services.ollama.host}:${toString config.services.ollama.port}";
|
||||
basicAuthFile = pkgs.writeText "ollama-htpasswd" ''
|
||||
raito:$y$j9T$UDEHpLtM52hRGK0I4qT6M0$N75AhENLqgtJnTGaPzq51imhjZvuPr.ow81Co1ZTcX2
|
||||
'';
|
||||
};
|
||||
};
|
||||
};
|
||||
ollama = {
|
||||
enable = true;
|
||||
host = meta.network.${name}.netbirdIp;
|
||||
package = pkgs.callPackage ./ollama.nix {
|
||||
cudaPackages = pkgs.cudaPackages_11;
|
||||
# We need to thread our nvidia x11 driver for CUDA.
|
||||
|
@@ -83,10 +72,7 @@ lib.extra.mkConfig {
|
|||
};
|
||||
};
|
||||
|
||||
networking.firewall.allowedTCPPorts = [
|
||||
80
|
||||
443
|
||||
];
|
||||
networking.firewall.interfaces.wt0.allowedTCPPorts = [ config.services.ollama.port ];
|
||||
};
|
||||
|
||||
root = ./.;
|
||||
|
|
14
meta/dns.nix
14
meta/dns.nix
|
@@ -68,6 +68,12 @@ let
|
|||
"support" # Zammad support
|
||||
"telegraf" # Telegraf
|
||||
|
||||
# Beta-grade machine learning API servers
|
||||
"ollama01.beta"
|
||||
"openui.beta"
|
||||
"whisper.beta"
|
||||
"stable-diffusion.beta"
|
||||
|
||||
# DGSI
|
||||
"dgsi"
|
||||
"profil"
|
||||
|
@@ -129,14 +135,6 @@ let
|
|||
"cas-eleves"
|
||||
"vote"
|
||||
];
|
||||
|
||||
krz01.dual = [
|
||||
# Beta-grade machine learning API servers
|
||||
"ollama01.beta"
|
||||
"openui.beta"
|
||||
"whisper.beta"
|
||||
"stable-diffusion.beta"
|
||||
];
|
||||
}
|
||||
)
|
||||
);
|
||||
|
|
Loading…
Reference in a new issue