File tree Expand file tree Collapse file tree 5 files changed +49
-4
lines changed Expand file tree Collapse file tree 5 files changed +49
-4
lines changed Original file line number Diff line number Diff line change 4
4
.cache /
5
5
* .swp
6
6
.vscode /
7
+ .idea /
7
8
* .bat
8
9
* .bin
9
10
* .exe
10
11
* .gguf
11
12
output * .png
12
13
models *
13
- * .log
14
+ * .log
Original file line number Diff line number Diff line change @@ -137,7 +137,9 @@ This provides BLAS acceleration using the ROCm cores of your AMD GPU. Make sure
137
137
Windows users: refer to [docs/hipBLAS_on_Windows.md](docs%2FhipBLAS_on_Windows.md) for a comprehensive guide.
138
138
139
139
```
140
- cmake .. -G "Ninja" -DCMAKE_C_COMPILER=clang -DCMAKE_CXX_COMPILER=clang++ -DSD_HIPBLAS=ON -DCMAKE_BUILD_TYPE=Release -DAMDGPU_TARGETS=gfx1100 -DCMAKE_BUILD_WITH_INSTALL_RPATH=ON
140
+ export GFX_NAME=$(rocminfo | grep -m 1 -E "gfx[^0]{1}" | sed -e 's/ *Name: *//' | awk '{$1=$1; print}' || echo "rocminfo missing")
141
+ echo $GFX_NAME
142
+ cmake .. -G "Ninja" -DCMAKE_C_COMPILER=clang -DCMAKE_CXX_COMPILER=clang++ -DSD_HIPBLAS=ON -DCMAKE_BUILD_TYPE=Release -DGPU_TARGETS=$GFX_NAME -DCMAKE_BUILD_WITH_INSTALL_RPATH=ON
141
143
cmake --build . --config Release
142
144
```
143
145
Original file line number Diff line number Diff line change @@ -10,4 +10,30 @@ Here's a simple example:
10
10
./bin/sd -m ../models/v1-5-pruned-emaonly.safetensors -p "a lovely cat<lora:marblesh:1>" --lora-model-dir ../models
11
11
```
12
12
13
- ` ../models/marblesh.safetensors ` or ` ../models/marblesh.ckpt ` will be applied to the model
13
+ ` ../models/marblesh.safetensors ` or ` ../models/marblesh.ckpt ` will be applied to the model
14
+
15
+ # Support matrix
16
+
17
+ > ℹ️ CUDA ` get_rows ` support is defined here:
18
+ > [ggml-org/ggml/src/ggml-cuda/getrows.cu#L156](https://github.com/ggml-org/ggml/blob/7dee1d6a1e7611f238d09be96738388da97c88ed/src/ggml-cuda/getrows.cu#L156)
19
+ > Currently only the basic types + Q4/Q5/Q8 are implemented. K-quants are **not** supported.
20
+
21
+ NOTE: The other backends may have different support.
22
+
23
+ | Quant / Type | CUDA |
24
+ | --------------| ------|
25
+ | F32 | ✔️ |
26
+ | F16 | ✔️ |
27
+ | BF16 | ✔️ |
28
+ | I32 | ✔️ |
29
+ | Q4_0 | ✔️ |
30
+ | Q4_1 | ✔️ |
31
+ | Q5_0 | ✔️ |
32
+ | Q5_1 | ✔️ |
33
+ | Q8_0 | ✔️ |
34
+ | Q2_K | ❌ |
35
+ | Q3_K | ❌ |
36
+ | Q4_K | ❌ |
37
+ | Q5_K | ❌ |
38
+ | Q6_K | ❌ |
39
+ | Q8_K | ❌ |
Original file line number Diff line number Diff line change 1
1
#include < stdio.h>
2
2
#include < string.h>
3
3
#include < time.h>
4
+ #include < filesystem>
4
5
#include < functional>
5
6
#include < iostream>
6
7
#include < map>
@@ -1283,6 +1284,21 @@ int main(int argc, const char* argv[]) {
1283
1284
}
1284
1285
}
1285
1286
1287
+ // create directory if not exists
1288
+ {
1289
+ namespace fs = std::filesystem;
1290
+ const fs::path out_path = params.output_path ;
1291
+ if (const fs::path out_dir = out_path.parent_path (); !out_dir.empty ()) {
1292
+ std::error_code ec;
1293
+ fs::create_directories (out_dir, ec); // OK if already exists
1294
+ if (ec) {
1295
+ fprintf (stderr, " failed to create directory '%s': %s\n " ,
1296
+ out_dir.string ().c_str (), ec.message ().c_str ());
1297
+ return 1 ;
1298
+ }
1299
+ }
1300
+ }
1301
+
1286
1302
std::string base_path;
1287
1303
std::string file_ext;
1288
1304
std::string file_ext_lower;
Original file line number Diff line number Diff line change @@ -330,7 +330,7 @@ class StableDiffusionGGML {
330
330
if (sd_version_is_dit (version)) {
331
331
use_t5xxl = true ;
332
332
}
333
- if (!ggml_backend_is_cpu (backend) && use_t5xxl) {
333
+ if (!clip_on_cpu && ! ggml_backend_is_cpu (backend) && use_t5xxl) {
334
334
LOG_WARN (
335
335
" !!!It appears that you are using the T5 model. Some backends may encounter issues with it."
336
336
" If you notice that the generated images are completely black,"
You can’t perform that action at this time.
0 commit comments