summaryrefslogtreecommitdiff
path: root/cnn_v3/training
diff options
context:
space:
mode:
author skal <pascal.massimino@gmail.com> 2026-03-22 07:33:28 +0100
committer skal <pascal.massimino@gmail.com> 2026-03-22 07:33:28 +0100
commit fcd1ceb2168de76659091208f911d2c4d0c59ad7 (patch)
tree d4e44618122c1b7927cca25e5b62c0967f4d9e80 /cnn_v3/training
parent bf33fee131b1eee03bc5a765ba360299bbcead06 (diff)
feat(cnn_v3): gen_sample tool + 7 simple training samples
- pack_photo_sample.py: --target now required (no albedo fallback)
- gen_sample: bash wrapper with positional args (input target output_dir)
- input/photo7.jpg: copy of photo2 (second style target)
- target_1: photo2_1_out→photo2_out, photo2_2_out→photo7_out
- dataset/simple/sample_001..007: 7 packed photo/target pairs

handoff(Gemini): training data ready; next step is train_cnn_v3.py run
Diffstat (limited to 'cnn_v3/training')
-rw-r--r--cnn_v3/training/dataset/simple/sample_001/albedo.pngbin0 -> 22390911 bytes
-rw-r--r--cnn_v3/training/dataset/simple/sample_001/depth.pngbin0 -> 23365 bytes
-rw-r--r--cnn_v3/training/dataset/simple/sample_001/matid.pngbin0 -> 11724 bytes
-rw-r--r--cnn_v3/training/dataset/simple/sample_001/normal.pngbin0 -> 44260 bytes
-rw-r--r--cnn_v3/training/dataset/simple/sample_001/shadow.pngbin0 -> 20443 bytes
-rw-r--r--cnn_v3/training/dataset/simple/sample_001/target.pngbin0 -> 4363727 bytes
-rw-r--r--cnn_v3/training/dataset/simple/sample_001/transp.pngbin0 -> 11724 bytes
-rw-r--r--cnn_v3/training/dataset/simple/sample_002/albedo.pngbin0 -> 14366815 bytes
-rw-r--r--cnn_v3/training/dataset/simple/sample_002/depth.pngbin0 -> 23365 bytes
-rw-r--r--cnn_v3/training/dataset/simple/sample_002/matid.pngbin0 -> 11724 bytes
-rw-r--r--cnn_v3/training/dataset/simple/sample_002/normal.pngbin0 -> 44260 bytes
-rw-r--r--cnn_v3/training/dataset/simple/sample_002/shadow.pngbin0 -> 20443 bytes
-rw-r--r--cnn_v3/training/dataset/simple/sample_002/target.pngbin0 -> 3079705 bytes
-rw-r--r--cnn_v3/training/dataset/simple/sample_002/transp.pngbin0 -> 11724 bytes
-rw-r--r--cnn_v3/training/dataset/simple/sample_003/albedo.pngbin0 -> 7252297 bytes
-rw-r--r--cnn_v3/training/dataset/simple/sample_003/depth.pngbin0 -> 14234 bytes
-rw-r--r--cnn_v3/training/dataset/simple/sample_003/matid.pngbin0 -> 7151 bytes
-rw-r--r--cnn_v3/training/dataset/simple/sample_003/normal.pngbin0 -> 25739 bytes
-rw-r--r--cnn_v3/training/dataset/simple/sample_003/shadow.pngbin0 -> 11255 bytes
-rw-r--r--cnn_v3/training/dataset/simple/sample_003/target.pngbin0 -> 2436109 bytes
-rw-r--r--cnn_v3/training/dataset/simple/sample_003/transp.pngbin0 -> 7151 bytes
-rw-r--r--cnn_v3/training/dataset/simple/sample_004/albedo.pngbin0 -> 1245962 bytes
-rw-r--r--cnn_v3/training/dataset/simple/sample_004/depth.pngbin0 -> 7389 bytes
-rw-r--r--cnn_v3/training/dataset/simple/sample_004/matid.pngbin0 -> 3735 bytes
-rw-r--r--cnn_v3/training/dataset/simple/sample_004/normal.pngbin0 -> 15342 bytes
-rw-r--r--cnn_v3/training/dataset/simple/sample_004/shadow.pngbin0 -> 7738 bytes
-rw-r--r--cnn_v3/training/dataset/simple/sample_004/target.pngbin0 -> 731778 bytes
-rw-r--r--cnn_v3/training/dataset/simple/sample_004/transp.pngbin0 -> 3735 bytes
-rw-r--r--cnn_v3/training/dataset/simple/sample_005/albedo.pngbin0 -> 1187567 bytes
-rw-r--r--cnn_v3/training/dataset/simple/sample_005/depth.pngbin0 -> 1632 bytes
-rw-r--r--cnn_v3/training/dataset/simple/sample_005/matid.pngbin0 -> 857 bytes
-rw-r--r--cnn_v3/training/dataset/simple/sample_005/normal.pngbin0 -> 4590 bytes
-rw-r--r--cnn_v3/training/dataset/simple/sample_005/shadow.pngbin0 -> 3137 bytes
-rw-r--r--cnn_v3/training/dataset/simple/sample_005/target.pngbin0 -> 3140126 bytes
-rw-r--r--cnn_v3/training/dataset/simple/sample_005/transp.pngbin0 -> 857 bytes
-rw-r--r--cnn_v3/training/dataset/simple/sample_006/albedo.pngbin0 -> 2363392 bytes
-rw-r--r--cnn_v3/training/dataset/simple/sample_006/depth.pngbin0 -> 2988 bytes
-rw-r--r--cnn_v3/training/dataset/simple/sample_006/matid.pngbin0 -> 1534 bytes
-rw-r--r--cnn_v3/training/dataset/simple/sample_006/normal.pngbin0 -> 7774 bytes
-rw-r--r--cnn_v3/training/dataset/simple/sample_006/shadow.pngbin0 -> 4399 bytes
-rw-r--r--cnn_v3/training/dataset/simple/sample_006/target.pngbin0 -> 3153440 bytes
-rw-r--r--cnn_v3/training/dataset/simple/sample_006/transp.pngbin0 -> 1534 bytes
-rw-r--r--cnn_v3/training/dataset/simple/sample_007/albedo.pngbin0 -> 14366815 bytes
-rw-r--r--cnn_v3/training/dataset/simple/sample_007/depth.pngbin0 -> 23365 bytes
-rw-r--r--cnn_v3/training/dataset/simple/sample_007/matid.pngbin0 -> 11724 bytes
-rw-r--r--cnn_v3/training/dataset/simple/sample_007/normal.pngbin0 -> 44260 bytes
-rw-r--r--cnn_v3/training/dataset/simple/sample_007/shadow.pngbin0 -> 20443 bytes
-rw-r--r--cnn_v3/training/dataset/simple/sample_007/target.pngbin0 -> 3084795 bytes
-rw-r--r--cnn_v3/training/dataset/simple/sample_007/transp.pngbin0 -> 11724 bytes
-rwxr-xr-x cnn_v3/training/gen_sample 21
-rw-r--r--cnn_v3/training/input/photo7.jpgbin0 -> 3328126 bytes
-rw-r--r-- cnn_v3/training/pack_photo_sample.py 17
-rw-r--r--cnn_v3/training/target_1/photo2_out.png (renamed from cnn_v3/training/target_1/photo2_1_out.png)bin2875939 -> 2875939 bytes
-rw-r--r--cnn_v3/training/target_1/photo7_out.png (renamed from cnn_v3/training/target_1/photo2_2_out.png)bin2865857 -> 2865857 bytes
54 files changed, 31 insertions, 7 deletions
diff --git a/cnn_v3/training/dataset/simple/sample_001/albedo.png b/cnn_v3/training/dataset/simple/sample_001/albedo.png
new file mode 100644
index 0000000..68220b3
--- /dev/null
+++ b/cnn_v3/training/dataset/simple/sample_001/albedo.png
Binary files differ
diff --git a/cnn_v3/training/dataset/simple/sample_001/depth.png b/cnn_v3/training/dataset/simple/sample_001/depth.png
new file mode 100644
index 0000000..5708605
--- /dev/null
+++ b/cnn_v3/training/dataset/simple/sample_001/depth.png
Binary files differ
diff --git a/cnn_v3/training/dataset/simple/sample_001/matid.png b/cnn_v3/training/dataset/simple/sample_001/matid.png
new file mode 100644
index 0000000..2561108
--- /dev/null
+++ b/cnn_v3/training/dataset/simple/sample_001/matid.png
Binary files differ
diff --git a/cnn_v3/training/dataset/simple/sample_001/normal.png b/cnn_v3/training/dataset/simple/sample_001/normal.png
new file mode 100644
index 0000000..489f629
--- /dev/null
+++ b/cnn_v3/training/dataset/simple/sample_001/normal.png
Binary files differ
diff --git a/cnn_v3/training/dataset/simple/sample_001/shadow.png b/cnn_v3/training/dataset/simple/sample_001/shadow.png
new file mode 100644
index 0000000..f356fb2
--- /dev/null
+++ b/cnn_v3/training/dataset/simple/sample_001/shadow.png
Binary files differ
diff --git a/cnn_v3/training/dataset/simple/sample_001/target.png b/cnn_v3/training/dataset/simple/sample_001/target.png
new file mode 100644
index 0000000..268e167
--- /dev/null
+++ b/cnn_v3/training/dataset/simple/sample_001/target.png
Binary files differ
diff --git a/cnn_v3/training/dataset/simple/sample_001/transp.png b/cnn_v3/training/dataset/simple/sample_001/transp.png
new file mode 100644
index 0000000..2561108
--- /dev/null
+++ b/cnn_v3/training/dataset/simple/sample_001/transp.png
Binary files differ
diff --git a/cnn_v3/training/dataset/simple/sample_002/albedo.png b/cnn_v3/training/dataset/simple/sample_002/albedo.png
new file mode 100644
index 0000000..80f4f1c
--- /dev/null
+++ b/cnn_v3/training/dataset/simple/sample_002/albedo.png
Binary files differ
diff --git a/cnn_v3/training/dataset/simple/sample_002/depth.png b/cnn_v3/training/dataset/simple/sample_002/depth.png
new file mode 100644
index 0000000..5708605
--- /dev/null
+++ b/cnn_v3/training/dataset/simple/sample_002/depth.png
Binary files differ
diff --git a/cnn_v3/training/dataset/simple/sample_002/matid.png b/cnn_v3/training/dataset/simple/sample_002/matid.png
new file mode 100644
index 0000000..2561108
--- /dev/null
+++ b/cnn_v3/training/dataset/simple/sample_002/matid.png
Binary files differ
diff --git a/cnn_v3/training/dataset/simple/sample_002/normal.png b/cnn_v3/training/dataset/simple/sample_002/normal.png
new file mode 100644
index 0000000..489f629
--- /dev/null
+++ b/cnn_v3/training/dataset/simple/sample_002/normal.png
Binary files differ
diff --git a/cnn_v3/training/dataset/simple/sample_002/shadow.png b/cnn_v3/training/dataset/simple/sample_002/shadow.png
new file mode 100644
index 0000000..f356fb2
--- /dev/null
+++ b/cnn_v3/training/dataset/simple/sample_002/shadow.png
Binary files differ
diff --git a/cnn_v3/training/dataset/simple/sample_002/target.png b/cnn_v3/training/dataset/simple/sample_002/target.png
new file mode 100644
index 0000000..d1d7192
--- /dev/null
+++ b/cnn_v3/training/dataset/simple/sample_002/target.png
Binary files differ
diff --git a/cnn_v3/training/dataset/simple/sample_002/transp.png b/cnn_v3/training/dataset/simple/sample_002/transp.png
new file mode 100644
index 0000000..2561108
--- /dev/null
+++ b/cnn_v3/training/dataset/simple/sample_002/transp.png
Binary files differ
diff --git a/cnn_v3/training/dataset/simple/sample_003/albedo.png b/cnn_v3/training/dataset/simple/sample_003/albedo.png
new file mode 100644
index 0000000..fe714bc
--- /dev/null
+++ b/cnn_v3/training/dataset/simple/sample_003/albedo.png
Binary files differ
diff --git a/cnn_v3/training/dataset/simple/sample_003/depth.png b/cnn_v3/training/dataset/simple/sample_003/depth.png
new file mode 100644
index 0000000..eac97a6
--- /dev/null
+++ b/cnn_v3/training/dataset/simple/sample_003/depth.png
Binary files differ
diff --git a/cnn_v3/training/dataset/simple/sample_003/matid.png b/cnn_v3/training/dataset/simple/sample_003/matid.png
new file mode 100644
index 0000000..60a5b09
--- /dev/null
+++ b/cnn_v3/training/dataset/simple/sample_003/matid.png
Binary files differ
diff --git a/cnn_v3/training/dataset/simple/sample_003/normal.png b/cnn_v3/training/dataset/simple/sample_003/normal.png
new file mode 100644
index 0000000..36dd1fd
--- /dev/null
+++ b/cnn_v3/training/dataset/simple/sample_003/normal.png
Binary files differ
diff --git a/cnn_v3/training/dataset/simple/sample_003/shadow.png b/cnn_v3/training/dataset/simple/sample_003/shadow.png
new file mode 100644
index 0000000..c943f56
--- /dev/null
+++ b/cnn_v3/training/dataset/simple/sample_003/shadow.png
Binary files differ
diff --git a/cnn_v3/training/dataset/simple/sample_003/target.png b/cnn_v3/training/dataset/simple/sample_003/target.png
new file mode 100644
index 0000000..56205ca
--- /dev/null
+++ b/cnn_v3/training/dataset/simple/sample_003/target.png
Binary files differ
diff --git a/cnn_v3/training/dataset/simple/sample_003/transp.png b/cnn_v3/training/dataset/simple/sample_003/transp.png
new file mode 100644
index 0000000..60a5b09
--- /dev/null
+++ b/cnn_v3/training/dataset/simple/sample_003/transp.png
Binary files differ
diff --git a/cnn_v3/training/dataset/simple/sample_004/albedo.png b/cnn_v3/training/dataset/simple/sample_004/albedo.png
new file mode 100644
index 0000000..a1b817d
--- /dev/null
+++ b/cnn_v3/training/dataset/simple/sample_004/albedo.png
Binary files differ
diff --git a/cnn_v3/training/dataset/simple/sample_004/depth.png b/cnn_v3/training/dataset/simple/sample_004/depth.png
new file mode 100644
index 0000000..083c4a3
--- /dev/null
+++ b/cnn_v3/training/dataset/simple/sample_004/depth.png
Binary files differ
diff --git a/cnn_v3/training/dataset/simple/sample_004/matid.png b/cnn_v3/training/dataset/simple/sample_004/matid.png
new file mode 100644
index 0000000..f14721f
--- /dev/null
+++ b/cnn_v3/training/dataset/simple/sample_004/matid.png
Binary files differ
diff --git a/cnn_v3/training/dataset/simple/sample_004/normal.png b/cnn_v3/training/dataset/simple/sample_004/normal.png
new file mode 100644
index 0000000..0694ac1
--- /dev/null
+++ b/cnn_v3/training/dataset/simple/sample_004/normal.png
Binary files differ
diff --git a/cnn_v3/training/dataset/simple/sample_004/shadow.png b/cnn_v3/training/dataset/simple/sample_004/shadow.png
new file mode 100644
index 0000000..9b6a5e0
--- /dev/null
+++ b/cnn_v3/training/dataset/simple/sample_004/shadow.png
Binary files differ
diff --git a/cnn_v3/training/dataset/simple/sample_004/target.png b/cnn_v3/training/dataset/simple/sample_004/target.png
new file mode 100644
index 0000000..019d7a8
--- /dev/null
+++ b/cnn_v3/training/dataset/simple/sample_004/target.png
Binary files differ
diff --git a/cnn_v3/training/dataset/simple/sample_004/transp.png b/cnn_v3/training/dataset/simple/sample_004/transp.png
new file mode 100644
index 0000000..f14721f
--- /dev/null
+++ b/cnn_v3/training/dataset/simple/sample_004/transp.png
Binary files differ
diff --git a/cnn_v3/training/dataset/simple/sample_005/albedo.png b/cnn_v3/training/dataset/simple/sample_005/albedo.png
new file mode 100644
index 0000000..5dfada7
--- /dev/null
+++ b/cnn_v3/training/dataset/simple/sample_005/albedo.png
Binary files differ
diff --git a/cnn_v3/training/dataset/simple/sample_005/depth.png b/cnn_v3/training/dataset/simple/sample_005/depth.png
new file mode 100644
index 0000000..db65c11
--- /dev/null
+++ b/cnn_v3/training/dataset/simple/sample_005/depth.png
Binary files differ
diff --git a/cnn_v3/training/dataset/simple/sample_005/matid.png b/cnn_v3/training/dataset/simple/sample_005/matid.png
new file mode 100644
index 0000000..f098c4d
--- /dev/null
+++ b/cnn_v3/training/dataset/simple/sample_005/matid.png
Binary files differ
diff --git a/cnn_v3/training/dataset/simple/sample_005/normal.png b/cnn_v3/training/dataset/simple/sample_005/normal.png
new file mode 100644
index 0000000..40305ec
--- /dev/null
+++ b/cnn_v3/training/dataset/simple/sample_005/normal.png
Binary files differ
diff --git a/cnn_v3/training/dataset/simple/sample_005/shadow.png b/cnn_v3/training/dataset/simple/sample_005/shadow.png
new file mode 100644
index 0000000..8e270d3
--- /dev/null
+++ b/cnn_v3/training/dataset/simple/sample_005/shadow.png
Binary files differ
diff --git a/cnn_v3/training/dataset/simple/sample_005/target.png b/cnn_v3/training/dataset/simple/sample_005/target.png
new file mode 100644
index 0000000..41ead45
--- /dev/null
+++ b/cnn_v3/training/dataset/simple/sample_005/target.png
Binary files differ
diff --git a/cnn_v3/training/dataset/simple/sample_005/transp.png b/cnn_v3/training/dataset/simple/sample_005/transp.png
new file mode 100644
index 0000000..f098c4d
--- /dev/null
+++ b/cnn_v3/training/dataset/simple/sample_005/transp.png
Binary files differ
diff --git a/cnn_v3/training/dataset/simple/sample_006/albedo.png b/cnn_v3/training/dataset/simple/sample_006/albedo.png
new file mode 100644
index 0000000..6fd43d4
--- /dev/null
+++ b/cnn_v3/training/dataset/simple/sample_006/albedo.png
Binary files differ
diff --git a/cnn_v3/training/dataset/simple/sample_006/depth.png b/cnn_v3/training/dataset/simple/sample_006/depth.png
new file mode 100644
index 0000000..4ccb0bc
--- /dev/null
+++ b/cnn_v3/training/dataset/simple/sample_006/depth.png
Binary files differ
diff --git a/cnn_v3/training/dataset/simple/sample_006/matid.png b/cnn_v3/training/dataset/simple/sample_006/matid.png
new file mode 100644
index 0000000..32e1b1c
--- /dev/null
+++ b/cnn_v3/training/dataset/simple/sample_006/matid.png
Binary files differ
diff --git a/cnn_v3/training/dataset/simple/sample_006/normal.png b/cnn_v3/training/dataset/simple/sample_006/normal.png
new file mode 100644
index 0000000..e2623bd
--- /dev/null
+++ b/cnn_v3/training/dataset/simple/sample_006/normal.png
Binary files differ
diff --git a/cnn_v3/training/dataset/simple/sample_006/shadow.png b/cnn_v3/training/dataset/simple/sample_006/shadow.png
new file mode 100644
index 0000000..880ccf9
--- /dev/null
+++ b/cnn_v3/training/dataset/simple/sample_006/shadow.png
Binary files differ
diff --git a/cnn_v3/training/dataset/simple/sample_006/target.png b/cnn_v3/training/dataset/simple/sample_006/target.png
new file mode 100644
index 0000000..383e2d3
--- /dev/null
+++ b/cnn_v3/training/dataset/simple/sample_006/target.png
Binary files differ
diff --git a/cnn_v3/training/dataset/simple/sample_006/transp.png b/cnn_v3/training/dataset/simple/sample_006/transp.png
new file mode 100644
index 0000000..32e1b1c
--- /dev/null
+++ b/cnn_v3/training/dataset/simple/sample_006/transp.png
Binary files differ
diff --git a/cnn_v3/training/dataset/simple/sample_007/albedo.png b/cnn_v3/training/dataset/simple/sample_007/albedo.png
new file mode 100644
index 0000000..80f4f1c
--- /dev/null
+++ b/cnn_v3/training/dataset/simple/sample_007/albedo.png
Binary files differ
diff --git a/cnn_v3/training/dataset/simple/sample_007/depth.png b/cnn_v3/training/dataset/simple/sample_007/depth.png
new file mode 100644
index 0000000..5708605
--- /dev/null
+++ b/cnn_v3/training/dataset/simple/sample_007/depth.png
Binary files differ
diff --git a/cnn_v3/training/dataset/simple/sample_007/matid.png b/cnn_v3/training/dataset/simple/sample_007/matid.png
new file mode 100644
index 0000000..2561108
--- /dev/null
+++ b/cnn_v3/training/dataset/simple/sample_007/matid.png
Binary files differ
diff --git a/cnn_v3/training/dataset/simple/sample_007/normal.png b/cnn_v3/training/dataset/simple/sample_007/normal.png
new file mode 100644
index 0000000..489f629
--- /dev/null
+++ b/cnn_v3/training/dataset/simple/sample_007/normal.png
Binary files differ
diff --git a/cnn_v3/training/dataset/simple/sample_007/shadow.png b/cnn_v3/training/dataset/simple/sample_007/shadow.png
new file mode 100644
index 0000000..f356fb2
--- /dev/null
+++ b/cnn_v3/training/dataset/simple/sample_007/shadow.png
Binary files differ
diff --git a/cnn_v3/training/dataset/simple/sample_007/target.png b/cnn_v3/training/dataset/simple/sample_007/target.png
new file mode 100644
index 0000000..ea276e4
--- /dev/null
+++ b/cnn_v3/training/dataset/simple/sample_007/target.png
Binary files differ
diff --git a/cnn_v3/training/dataset/simple/sample_007/transp.png b/cnn_v3/training/dataset/simple/sample_007/transp.png
new file mode 100644
index 0000000..2561108
--- /dev/null
+++ b/cnn_v3/training/dataset/simple/sample_007/transp.png
Binary files differ
diff --git a/cnn_v3/training/gen_sample b/cnn_v3/training/gen_sample
new file mode 100755
index 0000000..21519f1
--- /dev/null
+++ b/cnn_v3/training/gen_sample
@@ -0,0 +1,21 @@
+#!/usr/bin/env bash
+# gen_sample — pack an input/target photo pair into a CNN v3 sample directory.
+#
+# Usage:
+# gen_sample <input> <target> <output_dir>
+#
+# Example:
+# gen_sample input/photo1.jpg target_1/photo1_out.png dataset/simple/sample_001
+
+set -euo pipefail
+
+if [ $# -ne 3 ]; then
+ echo "Usage: gen_sample <input> <target> <output_dir>" >&2
+ exit 1
+fi
+
+SCRIPT_DIR="$(cd "$(dirname "$0")" && pwd)"
+python3 "$SCRIPT_DIR/pack_photo_sample.py" \
+ --photo "$1" \
+ --target "$2" \
+ --output "$3"
diff --git a/cnn_v3/training/input/photo7.jpg b/cnn_v3/training/input/photo7.jpg
new file mode 100644
index 0000000..a662fa8
--- /dev/null
+++ b/cnn_v3/training/input/photo7.jpg
Binary files differ
diff --git a/cnn_v3/training/pack_photo_sample.py b/cnn_v3/training/pack_photo_sample.py
index b2943fb..ca80301 100644
--- a/cnn_v3/training/pack_photo_sample.py
+++ b/cnn_v3/training/pack_photo_sample.py
@@ -18,7 +18,8 @@ mip1 and mip2 are computed on-the-fly by the dataloader from albedo.
prev = zero during training (no temporal history).
Usage:
- python3 pack_photo_sample.py --photo photos/img_001.png \\
+ python3 pack_photo_sample.py --photo input/photo1.jpg \\
+ --target target_1/photo1_out.png \\
--output dataset/simple/sample_001/
Dependencies:
@@ -56,7 +57,7 @@ def pyrdown(img: np.ndarray) -> np.ndarray:
# ---- Main packing ----
-def pack_photo_sample(photo_path: str, output_dir: str) -> None:
+def pack_photo_sample(photo_path: str, target_path: str, output_dir: str) -> None:
os.makedirs(output_dir, exist_ok=True)
print(f"[pack_photo_sample] Loading {photo_path} …")
@@ -110,9 +111,10 @@ def pack_photo_sample(photo_path: str, output_dir: str) -> None:
os.path.join(output_dir, "transp.png")
)
- # ---- target — albedo (= photo; no GT styled target) ----
- # Store as RGBA (keep alpha for potential masking by the dataloader).
- target_u8 = (np.clip(img_np, 0, 1) * 255.0).astype(np.uint8)
+ # ---- target — styled ground truth ----
+ print(f" Loading target {target_path} …")
+ target_img = Image.open(target_path).convert("RGBA")
+ target_u8 = np.asarray(target_img, dtype=np.uint8)
Image.fromarray(target_u8, mode="RGBA").save(
os.path.join(output_dir, "target.png")
)
@@ -129,7 +131,6 @@ def pack_photo_sample(photo_path: str, output_dir: str) -> None:
print(" Files: albedo.png normal.png depth.png matid.png "
"shadow.png transp.png target.png")
print(" Note: normal/depth/matid are zeroed (no geometry data).")
- print(" Note: target = albedo (no ground-truth styled target).")
def main():
@@ -138,10 +139,12 @@ def main():
)
parser.add_argument("--photo", required=True,
help="Input photo file (RGB or RGBA PNG/JPG)")
+ parser.add_argument("--target", required=True,
+ help="Styled ground-truth image (PNG/JPG)")
parser.add_argument("--output", required=True,
help="Output directory for sample files")
args = parser.parse_args()
- pack_photo_sample(args.photo, args.output)
+ pack_photo_sample(args.photo, args.target, args.output)
if __name__ == "__main__":
diff --git a/cnn_v3/training/target_1/photo2_1_out.png b/cnn_v3/training/target_1/photo2_out.png
index 5398232..5398232 100644
--- a/cnn_v3/training/target_1/photo2_1_out.png
+++ b/cnn_v3/training/target_1/photo2_out.png
Binary files differ
diff --git a/cnn_v3/training/target_1/photo2_2_out.png b/cnn_v3/training/target_1/photo7_out.png
index b0a76bd..b0a76bd 100644
--- a/cnn_v3/training/target_1/photo2_2_out.png
+++ b/cnn_v3/training/target_1/photo7_out.png
Binary files differ