
Commit 904c6ce

Merge pull request #20 from DaddyWesker/main
Readme added and some fixes

2 parents 61f2308 + 67ce03f

File tree

3 files changed (+40 / −29 lines)


vla/benchmarks/block_type_classification/README.md

Lines changed: 10 additions & 1 deletion
@@ -31,7 +31,16 @@ Implements the **training and evaluation pipeline**.
 - Accuracy for type classification
 - Provides helper function:
   - `extract_features_size(model, loader)` – determines the classifier input dimension dynamically.
-
+- For benchmarking, the module also provides a `benchmark` function.
+  - Required input parameters:
+    - **model** – the model used to extract features from the image tensor. It must expose an `encode` function that takes an image tensor as input and returns features.
+    - **preprocessor** – the preprocessing sequence applied to the input image. The sequence must include `T.ToTensor()` and may include resizing, normalization, etc.
+    - either **train_json** and **test_json**, or **random_seed**. In the first case the dataset is prepared in advance and saved to JSON files (see **dataset_index_creation_example.py**); with **random_seed**, the dataset is built at runtime, so no JSON files are needed.
+  - Optional input parameters:
+    - **label_type** – either `LabelType.DISTANCE` or `LabelType.TYPE_CLASSIFICATION` (from `config.py`). Depending on this parameter, a regression model or a classifier is created and trained.
+    - **use_precomputed_features** – if set to True, features for all input images are precomputed and cached so they are not recomputed during training and testing. This reduces benchmark runtime but can require a lot of disk space (depending on which features are used).
+    - **generalization_set_folder** – used to test the generalization capability of the trained model; this folder is only used to compute accuracy/MSE at the end of the training process.
+    - **config_path** – path to the JSON file with the parameters used to create and train the model, as well as the paths to the dataset folder and the folder for precomputed features. See `example.json`.
 
 ---
 
 ## 🟩 **model.py**
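The dynamic input-dimension trick behind `extract_features_size(model, loader)` can be sketched in a few lines: encode one batch and measure the width of a feature vector. `DummyEncoder` and the one-batch loader below are illustrative stand-ins, not the repository's classes.

```python
# Hypothetical sketch of extract_features_size-style dynamic sizing:
# run a single batch through the encoder and read off the feature width.
# DummyEncoder stands in for a real backbone with an `encode` function.

class DummyEncoder:
    def encode(self, images):
        # Pretend each image maps to a 512-dimensional feature vector.
        return [[0.0] * 512 for _ in images]

def extract_features_size(model, loader):
    # Peek at one (labels, images) batch; the classifier input dimension
    # is the length of a single encoded feature vector.
    _labels, images = next(iter(loader))
    feats = model.encode(images)
    return len(feats[0])

loader = [([0, 1], ["img_a", "img_b"])]  # one fake (labels, images) batch
print(extract_features_size(DummyEncoder(), loader))  # prints 512
```

This lets the benchmark build a classifier head for any backbone without hard-coding feature dimensions.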
Lines changed: 3 additions & 3 deletions
@@ -1,14 +1,14 @@
 from manager import DatasetManager
-from config import LabelType, PATH_TO_RAW_DATA
+from config import LabelType
 
 
 if __name__ == "__main__":
     manager = DatasetManager(
-        directory=PATH_TO_RAW_DATA,
+        directory="./2025_LOS/Day_clear/",
         label_type=LabelType.DISTANCE,
         dataset_size=200,
         train_split=0.25,
         num_bins=50
     )
 
-    train_file, test_file = manager.create("los_dataset")
+    train_file, test_file = manager.create("los_dataset")
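The script above drives a dataset-index builder. A minimal stdlib sketch of what a `create("los_dataset")` call plausibly produces, under the assumption that it writes a train/test split to two JSON index files, might look like this; `create_index` and the file layout are assumptions, not the repository's `DatasetManager`:

```python
# Assumption-only sketch (not the repo's DatasetManager): shuffle a sample
# index, split it by train_split, and write the two halves to JSON files.
import json
import os
import random
import tempfile

def create_index(samples, name, out_dir, train_split=0.25, seed=0):
    rng = random.Random(seed)
    shuffled = list(samples)
    rng.shuffle(shuffled)
    n_train = int(len(shuffled) * train_split)
    split = {"train": shuffled[:n_train], "test": shuffled[n_train:]}
    paths = {}
    for part, items in split.items():
        path = os.path.join(out_dir, f"{name}_{part}.json")
        with open(path, "w") as f:
            json.dump(items, f)  # persist the index so runs are reproducible
        paths[part] = path
    return paths["train"], paths["test"]

with tempfile.TemporaryDirectory() as tmp:
    samples = [f"frame_{i:04d}.png" for i in range(200)]
    train_file, test_file = create_index(samples, "los_dataset", tmp)
    with open(train_file) as f:
        print(len(json.load(f)))  # prints 50, i.e. 200 * 0.25
```

Persisting the split as JSON is what lets `benchmark` accept **train_json**/**test_json** instead of rebuilding the dataset every run.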

vla/benchmarks/block_type_classification/train.py

Lines changed: 27 additions & 25 deletions
@@ -77,31 +77,33 @@ def train_classifier(
         avg_train = total_loss / len(train_loader)
         print(f"[Epoch {epoch+1}] Train Loss: {avg_train:.4f}")
 
-        classifier.eval()
-        total_test = 0
-        with torch.no_grad():
-            for labels, images in test_loader:
-                images, labels = images.to(device), labels.to(device)
-                if train_loader.dataset.feature_store is None:
-                    feats = model.encode(images)
-                else:
-                    feats = images
-                feats = feats.to(torch.float32)
-                out = classifier(feats)
-                total_test += criterion(out, labels).item()
-
-        avg_test = total_test / len(test_loader)
-        print(f"[Epoch {epoch+1}] Test Loss: {avg_test:.4f}")
-
-        if avg_test < best_loss:
-            best_loss = avg_test
-            torch.save({
-                "epoch": epoch,
-                "model_state": classifier.state_dict(),
-                "optimizer_state": optimizer.state_dict(),
-                "test_loss": best_loss
-            }, best_path)
-            print(f"Saved BEST checkpoint at epoch {epoch+1}: {best_path}")
+        if epoch % 5 == 0:
+            print(f"Testing, epoch {epoch+1}")
+            classifier.eval()
+            total_test = 0
+            with torch.no_grad():
+                for labels, images in test_loader:
+                    images, labels = images.to(device), labels.to(device)
+                    if train_loader.dataset.feature_store is None:
+                        feats = model.encode(images)
+                    else:
+                        feats = images
+                    feats = feats.to(torch.float32)
+                    out = classifier(feats)
+                    total_test += criterion(out, labels).item()
+
+            avg_test = total_test / len(test_loader)
+            print(f"[Epoch {epoch+1}] Test Loss: {avg_test:.4f}")
+
+            if avg_test < best_loss:
+                best_loss = avg_test
+                torch.save({
+                    "epoch": epoch,
+                    "model_state": classifier.state_dict(),
+                    "optimizer_state": optimizer.state_dict(),
+                    "test_loss": best_loss
+                }, best_path)
+                print(f"Saved BEST checkpoint at epoch {epoch+1}: {best_path}")
 
     # Save last epoch (always)
     torch.save({
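The control-flow change in this hunk (evaluate only every fifth epoch, checkpoint on improvement) can be isolated in a torch-free sketch. Here `eval_fn` stands in for the full test loop and the `saved_epochs` list stands in for `torch.save`:

```python
# Torch-free sketch of the periodic-evaluation pattern introduced above:
# test only when epoch % 5 == 0, and record a "checkpoint" whenever the
# test loss improves on the best seen so far.

def train_loop(num_epochs, eval_fn):
    best_loss = float("inf")
    saved_epochs = []
    for epoch in range(num_epochs):
        # ... training step for this epoch would go here ...
        if epoch % 5 == 0:  # epochs 0, 5, 10, ... are evaluated
            avg_test = eval_fn(epoch)
            if avg_test < best_loss:
                best_loss = avg_test
                saved_epochs.append(epoch)  # stands in for torch.save(...)
    return best_loss, saved_epochs

# A monotonically decreasing fake loss: every evaluated epoch is a new best.
best, saved = train_loop(12, lambda e: 1.0 / (e + 1))
print(saved)  # prints [0, 5, 10]
```

Skipping four out of five evaluations is what buys the speedup here; the trade-off is that a best-loss epoch falling between evaluations is never checkpointed.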
