Tim77777767 committed
Commit c76cec1 · Parent: d21bb56

Added pthchecker to read out the checkpoint layer names, and adjusted the SegFormer head so that the missing layers are not created.

Files changed (2)
  1. preTrainedTest.py +22 -5
  2. pthchecker.py +56 -0
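
The SegFormer-head change described in the commit message is not visible in the two files below. As a rough illustration only, here is a minimal sketch (not the author's code) of the general technique: load the checkpoint, drop every entry whose name or shape does not exist in the current model, and load the rest with strict=False so missing head layers are simply left at their initial values. The model choice (transformers' SegformerForSemanticSegmentation built from "nvidia/mit-b5" with 19 Cityscapes classes) is an assumption and will not match the checkpoint's key naming without remapping.

import torch
from transformers import SegformerForSemanticSegmentation

# Assumed reference model (hypothetical): MiT-B5 encoder with a 19-class Cityscapes head
model = SegformerForSemanticSegmentation.from_pretrained("nvidia/mit-b5", num_labels=19)

# Checkpoint path as used in pthchecker.py below
checkpoint = torch.load("./segformer-b5-bsm_hq.pth", map_location="cpu")
state_dict = checkpoint.get("state_dict", checkpoint)

# Keep only entries whose name and shape match the current model, so weights for
# layers that do not exist in the model are skipped instead of raising an error
model_state = model.state_dict()
filtered = {k: v for k, v in state_dict.items()
            if k in model_state and v.shape == model_state[k].shape}

missing, unexpected = model.load_state_dict(filtered, strict=False)
print(f"Loaded {len(filtered)} of {len(state_dict)} checkpoint tensors; "
      f"{len(missing)} model parameters keep their initial values.")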
preTrainedTest.py CHANGED
@@ -23,24 +23,41 @@ model.to(device).eval()
 image_path = "segformer_plusplus/cityscape/berlin_000543_000019_leftImg8bit.png"
 image = Image.open(image_path).convert("RGB")
 
-# Preprocessing
+# --- Start of changes to match cityscape_benchmark ---
+# Define the target image size as in cityscape_benchmark's default
+# cityscape_benchmark uses (3, 1024, 1024), so the spatial size is 1024x1024
+target_image_height = 1024
+target_image_width = 1024
+
+# Calculate mean and std dynamically from the image, as done in cityscape_benchmark
+# Note: this is usually done over the entire training dataset for consistent normalization;
+# for a single image, this just normalizes it to its own mean/std.
+img_tensor_temp = T.ToTensor()(image)
+mean = img_tensor_temp.mean(dim=(1, 2)).tolist()
+std = img_tensor_temp.std(dim=(1, 2)).tolist()
+
+print(f"Calculated Mean (for this image): {mean}")
+print(f"Calculated Std (for this image): {std}")
+
+# Preprocessing - adjusted to match cityscape_benchmark's T.Resize and T.Normalize
 transform = T.Compose([
-    T.Resize((512, 512)),
+    T.Resize((target_image_height, target_image_width)),  # resize to 1024x1024
     T.ToTensor(),
-    T.Normalize(mean=[0.485, 0.456, 0.406],
-                std=[0.229, 0.224, 0.225])
+    T.Normalize(mean=mean, std=std)  # use the dynamically calculated mean/std
 ])
 input_tensor = transform(image).unsqueeze(0).to(device)
+# --- End of changes ---
 
 print("Model loaded, image loaded, preprocessing complete")
 
 # Inference
 with torch.no_grad():
     output = model(input_tensor)
+# This ensures we always get the raw logits, even if the model returns an output object
 logits = output.logits if hasattr(output, "logits") else output
 pred = torch.argmax(logits, dim=1).squeeze(0).cpu().numpy()
 
 # Save the result as a text file
 output_path = os.path.join("segformer_plusplus", "cityscapes_prediction_output_overHF.txt")
 np.savetxt(output_path, pred, fmt="%d")
-print(f"Prediction saved as {output_path}")
+print(f"Prediction saved as {output_path}")
pthchecker.py ADDED
@@ -0,0 +1,56 @@
+import torch
+import os
+
+# --- Configuration ---
+# Path to your original .pth file
+pth_checkpoint_path = "./segformer-b5-bsm_hq.pth"
+# Name of the output file for the keys
+output_filename = "original_pth_keys.txt"
+
+# --- Load the checkpoint and save its keys ---
+try:
+    # Load the checkpoint
+    # map_location='cpu' avoids problems when no GPU is available
+    checkpoint = torch.load(pth_checkpoint_path, map_location='cpu')
+
+    print(f"Successfully loaded: {pth_checkpoint_path}")
+    print(f"Type of the loaded object: {type(checkpoint)}")
+
+    # Extract the state_dict
+    if isinstance(checkpoint, dict) and 'state_dict' in checkpoint:
+        # The state_dict is often nested under a key such as 'state_dict' or 'model'
+        state_dict = checkpoint['state_dict']
+        print("\nCheckpoint is a dictionary and contains 'state_dict'.")
+    elif isinstance(checkpoint, dict):
+        # Sometimes the whole dictionary is the state_dict itself
+        state_dict = checkpoint
+        print("\nCheckpoint is a dictionary (probably the state_dict itself).")
+    else:
+        # The checkpoint may also be the state_dict directly (e.g. just an OrderedDict)
+        state_dict = checkpoint
+        print("\nCheckpoint is the state_dict directly.")
+
+    # Collect and sort the keys
+    state_dict_keys = list(state_dict.keys())
+    state_dict_keys.sort()  # sort the keys alphabetically for a clearer overview
+
+    # Write the keys to the text file
+    with open(output_filename, 'w') as f:
+        for key in state_dict_keys:
+            f.write(key + '\n')  # one key per line
+
+    print(f"\nAll {len(state_dict_keys)} keys were successfully written to '{output_filename}'.")
+
+    # Optional: also print information about an example layer to the console
+    if state_dict_keys:
+        example_key = state_dict_keys[0]  # take the first key in sorted order
+        print(f"\nExample layer: '{example_key}'")
+        print(f"Shape: {state_dict[example_key].shape}")
+        print(f"Dtype: {state_dict[example_key].dtype}")
+    else:
+        print("\nNo keys found in the state_dict.")
+
+except FileNotFoundError:
+    print(f"ERROR: The file '{pth_checkpoint_path}' was not found. Please check the path.")
+except Exception as e:
+    print(f"An unexpected error occurred: {e}")