Skip to content

Commit

Permalink
upgrade cog and use new format to specify target concurrency
Browse files Browse the repository at this point in the history
  • Loading branch information
technillogue committed May 17, 2024
1 parent 2f893d2 commit 3e555aa
Show file tree
Hide file tree
Showing 2 changed files with 5 additions and 3 deletions.
4 changes: 3 additions & 1 deletion cog.yaml
Original file line number Diff line number Diff line change
Expand Up @@ -2,4 +2,6 @@ build:
gpu: true
python_version: "3.10"
predict: "predict.py:Predictor"
- concurrency: 64
+ concurrency:
+   max: 64
+   default_target: 16
4 changes: 2 additions & 2 deletions default.nix
Original file line number Diff line number Diff line change
Expand Up @@ -12,7 +12,7 @@ in
imports = [ ./interface.nix ];
cog.build = {
python_version = "3.10";
- cog_version = "0.10.0-alpha5";
+ cog_version = "0.10.0-alpha7";
cuda = "12.1"; # todo: 12.2
gpu = true;
# inspiration: echo tensorrt_llm==0.8.0 | uv pip compile - --extra-index-url https://pypi.nvidia.com -p 3.10 --prerelease=allow --annotation-style=line
Expand Down Expand Up @@ -45,7 +45,7 @@ in
overrides = [
"tokenizers==0.19.0"
"transformers==4.40.0"
- "cog @ https://r2.drysys.workers.dev/tmp/cog-0.10.0a6-py3-none-any.whl"
+ "cog==0.10.0a7"
];
};
cognix.includeNix = true;
Expand Down

0 comments on commit 3e555aa

Please sign in to comment.