Snow0821
diff --git a/‎Experiments/binarization_of_ternary_neural_networks/CIFAR_100_btViT.py‎
Lines changed: 200 additions & 0 deletions b/‎Experiments/binarization_of_ternary_neural_networks/CIFAR_100_btViT.py‎
Lines changed: 200 additions & 0 deletions
diff --git a/‎plinear/btnn/linear.py‎
Lines changed: 10 additions & 14 deletions b/‎plinear/btnn/linear.py‎
Lines changed: 10 additions & 14 deletions
@@ -0,0 +1,200 @@
+from datasets import load_dataset
+from torch.utils.data import DataLoader
+from torchvision import transforms
+import torch
+import torch.nn as nn
+import torch.optim as optim
+from tqdm import tqdm
+import matplotlib.pyplot as plt
+import pandas as pd
+
+# Experiment identifiers: exp_path names the output directory and the hub
+# repository prefix; data_path is the dataset repository to load.
+exp_path = "CIFAR_100_btViT"
+data_path = "uoft-cs/cifar100"
+dataset = load_dataset(data_path, split="train", streaming=False)
+
+# Number of training samples, taken from the loaded split so that it always
+# matches the data that is actually iterated.
+total_samples = len(dataset)
+batch_size = 64
+
+# ToTensor is the only preprocessing step applied to each image.
+transform = transforms.Compose([
+    transforms.ToTensor()
+])
+
+def collate_fn(batch):
+    """Turn a list of dataset items into an (images, labels) tensor pair.
+
+    Each item is read through its ``"img"`` entry (passed to the module-level
+    ``transform``) and its ``"fine_label"`` entry. Items that raise while
+    being processed are reported and left out of the batch.
+
+    Args:
+        batch: Iterable of dataset items.
+
+    Returns:
+        Tuple ``(images, labels)``: the stacked transformed images and a
+        tensor holding the matching labels.
+
+    Raises:
+        RuntimeError: If no item in the batch could be processed.
+    """
+    images, labels = [], []
+    for item in batch:
+        try:
+            # Resolve both fields before appending either one, so a failure
+            # can never leave images and labels with different lengths.
+            image = transform(item["img"])
+            label = item["fine_label"]
+        except Exception as e:
+            # Best effort: report the bad sample and keep the rest.
+            print(f"Error processing image: {e}")
+        else:
+            images.append(image)
+            labels.append(label)
+    if not images:
+        # torch.stack rejects an empty list with an opaque message; fail with
+        # an explanation instead.
+        raise RuntimeError("collate_fn: every item in the batch failed to process")
+    return torch.stack(images), torch.tensor(labels)
+
+from plinear.models import btViT
+from torchinfo import summary
+
+# Shuffled training batches assembled by the custom collate function.
+train_loader = DataLoader(
+    dataset,
+    batch_size=batch_size,
+    shuffle=True,
+    collate_fn=collate_fn,
+)
+
+# Model hyper-parameters; dim and depth are reused in output file names.
+dim = 256
+depth = 6
+
+config = dict(
+    embed_dim=dim,
+    depth=depth,
+    mlp_dim=1024,
+    img_size=32,
+    patch_size=2,
+    channels=3,
+    num_classes=100,
+)
+
+model = btViT(**config)
+
+# Summarise the model for an input of shape (1, 3, 32, 32).
+summary(model, input_size=(1, 3, 32, 32))
+
+# Pick the accelerator in priority order: CUDA, then Apple MPS, then CPU.
+# A single if/elif chain guarantees a later check never overrides an
+# earlier match.
+if torch.cuda.is_available():
+    device = torch.device("cuda")
+elif torch.backends.mps.is_available():
+    device = torch.device("mps")
+else:
+    device = torch.device("cpu")
+print(device)
+model = model.to(device)
+
+import time
+
+# Loss function and optimizer
+criterion = nn.CrossEntropyLoss()
+# NOTE(review): lr = 1 is far above Adam's default of 1e-3 — confirm this is
+# intentional for this model.
+optimizer = optim.Adam(model.parameters(), lr = 1)
+
+# Per-epoch training metrics
+loss_history = []
+accuracy_history = []
+
+training_start_time = time.time()
+
+# Training loop
+num_epochs = 10
+
+for epoch in range(num_epochs):
+    model.train()
+    running_loss = 0.0  # sum of per-sample losses seen so far in this epoch
+    running_corrects = 0
+    running_samples = 0
+
+    # The bar length comes from the loader itself rather than a constant.
+    progress_bar = tqdm(train_loader, desc=f"Epoch {epoch+1}/{num_epochs}", total=len(train_loader))
+    for images, labels in progress_bar:
+        images, labels = images.to(device), labels.to(device)
+
+        optimizer.zero_grad()
+        outputs = model(images)
+        loss = criterion(outputs, labels)
+        loss.backward()
+        optimizer.step()
+
+        preds = torch.argmax(outputs, dim=1)
+        batch_count = labels.size(0)
+        running_samples += batch_count
+        # CrossEntropyLoss averages over the batch by default; weight it by
+        # the batch size so the running value is a true per-sample mean.
+        running_loss += loss.item() * batch_count
+        running_corrects += torch.sum(preds == labels).item()
+
+        progress_bar.set_postfix(loss=running_loss / running_samples, accuracy=running_corrects / running_samples)
+
+    model.push_to_hub(f'snowian/{exp_path}_{dim}_{depth}_{epoch + 1}')
+    # Normalise by the number of samples actually processed this epoch
+    # (guarded so an empty loader cannot divide by zero).
+    seen_samples = max(running_samples, 1)
+    epoch_loss = running_loss / seen_samples
+    epoch_accuracy = running_corrects / seen_samples
+    loss_history.append(epoch_loss)
+    accuracy_history.append(epoch_accuracy)
+    print(f"Epoch [{epoch+1}/{num_epochs}], Loss: {epoch_loss:.4f}, Accuracy: {epoch_accuracy:.4f}")
+
+training_end_time = time.time()  # training end time
+training_duration = training_end_time - training_start_time  # total training time
+print(f"Total Training Time: {training_duration:.2f} seconds")
+
+import os
+
+# Make sure the output directory exists before any file is written into it;
+# neither savefig nor to_csv creates missing parent directories.
+os.makedirs(exp_path, exist_ok=True)
+
+# Epoch-level metrics
+epochs = range(1, num_epochs + 1)
+
+plt.figure(figsize=(10, 5))
+plt.plot(epochs, loss_history, marker='o', label="Epoch Loss")
+plt.xlabel("Epoch")
+plt.ylabel("Loss")
+plt.title("Loss Over Epochs")
+plt.legend()
+plt.grid()
+plt.savefig(f"{exp_path}/{dim}-{depth} epoch_loss.png")
+
+plt.figure(figsize=(10, 5))
+plt.plot(epochs, accuracy_history, marker='o', label="Epoch Accuracy")
+plt.xlabel("Epoch")
+plt.ylabel("Accuracy")
+plt.title("Accuracy Over Epochs")
+plt.legend()
+plt.grid()
+plt.savefig(f"{exp_path}/{dim}-{depth} epoch_acc.png")
+
+# Save metrics to CSV
+metrics_data = {
+    "Epoch": list(epochs),
+    "Epoch Loss": loss_history,
+    "Epoch Accuracy": accuracy_history,
+}
+
+# Create DataFrame (columns: Epoch, Loss, Accuracy) and save to CSV
+epoch_df = pd.DataFrame({"Epoch": metrics_data["Epoch"],
+                          "Loss": metrics_data["Epoch Loss"],
+                          "Accuracy": metrics_data["Epoch Accuracy"]})
+
+epoch_df.to_csv(f"{exp_path}/{dim}-{depth} epoch_metrics.csv", index=False)
+
+print("Metrics saved to CSV files.")
+
+import pandas as pd
+
+def evaluate_model(model, dataloader, criterion, device, save_path=None):
+    """Compute the classification accuracy of ``model`` over ``dataloader``.
+
+    Args:
+        model: Module called as ``model(images)``; switched to eval mode here.
+        dataloader: Iterable yielding ``(images, labels)`` batches.
+        criterion: Unused; kept so existing callers keep working.
+        device: Device the batches are moved to before the forward pass.
+        save_path: Optional CSV path; when given, the accuracy is written
+            there as a single-row table with an ``Accuracy`` column.
+
+    Returns:
+        Fraction of samples whose arg-max prediction equals the label.
+
+    Raises:
+        ValueError: If ``dataloader`` yields no samples.
+    """
+    model.eval()
+    running_corrects = 0
+    seen_samples = 0
+
+    with torch.no_grad():
+        for images, labels in tqdm(dataloader, desc="Evaluating"):
+            images, labels = images.to(device), labels.to(device)
+            outputs = model(images)
+            preds = torch.argmax(outputs, dim=1)
+
+            running_corrects += torch.sum(preds == labels).item()
+            seen_samples += labels.size(0)
+
+    if seen_samples == 0:
+        # Accuracy is undefined without data; say so instead of dividing by zero.
+        raise ValueError("evaluate_model: dataloader yielded no samples")
+
+    accuracy = running_corrects / seen_samples
+    print(f"Test Accuracy: {accuracy:.4f}")
+
+    # Save the evaluation result
+    if save_path:
+        results = {"Accuracy": [accuracy]}
+        results_df = pd.DataFrame(results)
+        results_df.to_csv(save_path, index=False)
+        print(f"Test results saved to {save_path}")
+
+    return accuracy
+
+# # Evaluate on the validation data
+# validation_dataset = load_dataset(data_path, split="validation", streaming=False)
+# print(validation_dataset[:10])
+# validation_loader = DataLoader(validation_dataset, batch_size=batch_size, collate_fn=collate_fn)
+
+# val_start_time = time.time()
+
+# test_accuracy = evaluate_model(
+#     model, validation_loader, criterion, device, save_path=f"{exp_path}/{dim}-{depth} validation_results.csv"
+# )
+
+# val_end_time = time.time()  # validation end time
+# val_duration = val_end_time - val_start_time  # time spent on validation
+# print(f"Total Validation Time: {val_duration:.2f} seconds")
+
+
+# Load the test split and print its first ten entries.
+test_dataset = load_dataset(data_path, split="test", streaming=False)
+print(test_dataset[:10])
+test_loader = DataLoader(
+    test_dataset,
+    collate_fn=collate_fn,
+    batch_size=batch_size,
+)
+
+# Time the full evaluation pass; the accuracy is also written to a CSV file.
+test_results_path = f"{exp_path}/{dim}-{depth} test_results.csv"
+test_start_time = time.time()
+test_accuracy = evaluate_model(model, test_loader, criterion, device, save_path=test_results_path)
+test_end_time = time.time()
+
+test_duration = test_end_time - test_start_time
+print(f"Total Test Time: {test_duration:.2f} seconds")
@@ -7,27 +7,35 @@
 class Linear(nn.Module):
+    """Linear layer computing F.linear(x, q_pr) - F.linear(x, q_nr).
+
+    Two real-valued weight matrices are held in nn.Linear modules; forward
+    only reads their ``weight`` tensors, so their biases are never applied.
+
+    Args:
+        x: Number of input features.
+        y: Number of output features.
+    """
     def __init__(self, x, y):
         super(Linear, self).__init__()
-        self.real_pos = nn.Linear(x, y)
-        self.real_neg = nn.Linear(x, y)
+        self.pr = nn.Linear(x, y)
+        self.nr = nn.Linear(x, y)
 
-        torch.nn.init.uniform_(self.real_pos.weight, -1, 1)
-        torch.nn.init.uniform_(self.real_neg.weight, -1, 1)
+        # Start both weight matrices from a uniform distribution on [-1, 1].
+        torch.nn.init.uniform_(self.pr.weight, -1, 1)
+        torch.nn.init.uniform_(self.nr.weight, -1, 1)
 
     def forward(self, x):
-        w_pos = self.real_pos.weight
-        w_neg = self.real_neg.weight
-        tern_pos = posNet(w_pos)
-        tern_neg = posNet(w_neg)
+        pr = self.pr.weight
+        nr = self.nr.weight
+        qpr = posNet(pr)
+        qnr = posNet(nr)
 
         # Apply quantization using posNet with detach
-        tern_pos = tern_pos - w_pos.detach() + w_pos
-        tern_neg = tern_neg - w_neg.detach() + w_neg
+        # The value stays that of the quantized weight, while the added
+        # non-detached term lets gradients reach the real-valued weight.
+        qpr = qpr - pr.detach() + pr
+        qnr = qnr - nr.detach() + nr
 
         # Compute linear transformations
-        y_pos = F.linear(x, tern_pos)
-        y_neg = F.linear(x, tern_neg)
+        yr = F.linear(x, qpr) - F.linear(x, qnr)
 
-        # Combine positive and negative parts
-        y = y_pos - y_neg
-
-        return y
+        return yr