Skip to content

Commit 1c553f7

Browse files
committed
sync
1 parent 96ef82e commit 1c553f7

File tree

3 files changed

+50
-6
lines changed

3 files changed

+50
-6
lines changed

chebai/models/base.py

Lines changed: 4 additions & 1 deletion
Original file line numberDiff line numberDiff line change
@@ -270,7 +270,10 @@ def _execute(
270270
if self.pass_loss_kwargs:
271271
loss_kwargs = loss_kwargs_candidates
272272
#torch.save(loss_data,"loss_data.pt")
273-
loss_kwargs['weights'] = f.create_data_weights(batchsize=len(data['idents']),dim=data['labels'].size(dim=1),weights=data["loss_kwargs"],idents=data["idents"])
273+
if not f.class_weights:
274+
loss_kwargs['weights'] = f.create_data_weights(batchsize=len(data['idents']),dim=data['labels'].size(dim=1),weights=data["loss_kwargs"],idents=data["idents"])
275+
else:
276+
loss_kwargs['weights'] = f.create_weight_class_tensor(len(data['idents']))
274277
loss_kwargs["current_epoch"] = self.trainer.current_epoch
275278
loss = self.criterion(loss_data, loss_labels, **loss_kwargs)
276279
if isinstance(loss, tuple):

chebai/preprocessing/datasets/base.py

Lines changed: 4 additions & 2 deletions
Original file line numberDiff line numberDiff line change
@@ -1181,10 +1181,12 @@ def load_processed_data(
11811181
else:
11821182
data_df = self.dynamic_split_dfs[kind]
11831183
data = data_df.to_dict(orient="records")
1184-
if kind == "train":
1184+
if f.class_weights:
1185+
f.create_class_tensor("../../../weights/test.pt")
1186+
if kind == "train" and f.class_weights == False:
11851187
f.init_weights()
11861188
data = f.add_train_weights(data)
1187-
if kind == "validation":
1189+
if kind == "validation" and f.class_weights == False:
11881190
data = f.add_val_weights(data)
11891191
# torch.save(data,"gewicht.pt")
11901192

extras/weight_loader.py

Lines changed: 42 additions & 3 deletions
Original file line numberDiff line numberDiff line change
@@ -2,6 +2,7 @@
22
import torch
33
import os
44

5+
class_weights = True
56

67
#inint weights in a csv file
78
def init_weights(path="../weights/first_it.csv",path_to_split="../split/splits.csv"):
@@ -113,7 +114,45 @@ def check_weights(data):
113114
for i in data:
114115
print(f"({i["ident"]} , {i["weight"]}")
115116

116-
init_weights()
117-
mock_init_weights()
118-
# print(get_weights((233713,51990)))
119117

118+
def init_class_weights(class_path: str, weight_path: str, weight: float) -> None:
    """Create a per-class weight CSV from a class-list CSV.

    Reads every row of ``class_path`` and writes it to ``weight_path`` with
    ``weight`` appended as an extra column, under a ``class,weight`` header.

    :param class_path: path to the input CSV listing the classes (one row per class).
    :param weight_path: path of the output CSV to create (overwritten if present).
    :param weight: uniform weight value appended to every class row.
    """
    # newline='' is required by the csv module to avoid spurious blank
    # lines on platforms that translate line endings (see csv docs).
    with open(class_path, 'r', newline='') as classes, \
            open(weight_path, 'w', newline='') as weights:
        reader = csv.reader(classes)
        writer = csv.writer(weights)
        writer.writerow(["class", "weight"])
        for row in reader:
            writer.writerow(row + [weight])
127+
128+
def create_class_tensor(
    save_path: str,
    csv_path: str = "../../weights/class_first_it.csv",
    num_classes: int = 1528,
) -> torch.Tensor:
    """Build a ``(1, num_classes)`` weight tensor from a class-weight CSV and save it.

    Each CSV row is expected to carry the weight in its second column; a
    header row whose second column is the literal ``"weight"`` is skipped.

    :param save_path: where to ``torch.save`` the resulting tensor.
    :param csv_path: CSV produced by :func:`init_class_weights`
        (default preserves the original hard-coded path).
    :param num_classes: number of weight columns (default preserves the
        original hard-coded 1528).
    :return: the saved tensor of shape ``(1, num_classes)``.
    """
    # zeros (not empty) so positions without a CSV row are deterministic.
    t = torch.zeros(1, num_classes)
    with open(csv_path, 'r', newline='') as f:
        reader = csv.reader(f)
        index = 0
        for row in reader:
            if row[1] == "weight":  # header row
                continue
            t[0][index] = float(row[1])
            index += 1
    torch.save(t, save_path)
    # Bug fix: the original declared "-> torch.Tensor" but returned None.
    return t
140+
141+
def create_weight_class_tensor(
    batch_size: int,
    weight_path: str = "../../weights/test.pt",
) -> torch.Tensor:
    """Load a saved class-weight tensor and tile it once per batch element.

    :param batch_size: number of rows in the returned tensor; ``0`` yields
        an empty tensor (the original crashed on ``w.shape`` of ``None``).
    :param weight_path: file produced by :func:`create_class_tensor`
        (default preserves the original hard-coded path).
    :return: tensor of shape ``(batch_size, num_classes)``.
    """
    t = torch.load(weight_path)
    # Single repeat instead of the original O(n^2) torch.cat-in-a-loop.
    # Assumes t is (1, num_classes) as written by create_class_tensor.
    return t.repeat(batch_size, 1)
151+
152+
153+
154+
155+
156+
if __name__ == "__main__":
    # Guarded entry point: the original ran these calls at module top level,
    # so merely importing this module performed file I/O and could crash if
    # the hard-coded weight files were missing.
    # init_class_weights("../../data/chebi_v241/ChEBI50/processed/classes.txt","../../weights/class_first_it.csv",1)
    create_class_tensor("../../weights/test.pt")
    create_weight_class_tensor(32)

0 commit comments

Comments
 (0)