Spaces:

cycool29
/

SpiralSense

Runtime error

App Files Community

cycool29 committed on Sep 25, 2023

Commit

d49cf43

1 Parent(s): 5d3ea78

Update

Browse files

Files changed (7) hide show

handetect/__pycache__/models.cpython-310.pyc +0 -0
handetect/__pycache__/predict.cpython-310.pyc +0 -0
handetect/adjust_hyperparameter.py +2 -5
handetect/evaluation.py +1 -1
handetect/main.py +10 -12
handetect/models.py +6 -333
handetect/predict.py +1 -1

handetect/__pycache__/models.cpython-310.pyc CHANGED Viewed

Binary files a/handetect/__pycache__/models.cpython-310.pyc and b/handetect/__pycache__/models.cpython-310.pyc differ

handetect/__pycache__/predict.cpython-310.pyc CHANGED Viewed

Binary files a/handetect/__pycache__/predict.cpython-310.pyc and b/handetect/__pycache__/predict.cpython-310.pyc differ

handetect/adjust_hyperparameter.py CHANGED Viewed

@@ -24,9 +24,6 @@ AUG_DATA_DIR = r"data/train/augmented/Task " + str(TASK)
 NUM_CLASSES = len(os.listdir(ORIG_DATA_DIR))
 VAL_RESIZE_SIZE = 232
-# Load and preprocess the data
-data_dir = r"data/train/Task 1"
 def resize_for_validation(image):
     return transforms.Resize((VAL_RESIZE_SIZE, VAL_RESIZE_SIZE))(image)
@@ -84,7 +81,7 @@ valid_loader = DataLoader(
 )
 # Initialize model, criterion, optimizer, and scheduler
-model = vgg16(pretrained=False, num_classes=NUM_CLASSES)
 model = model.to(DEVICE)
 criterion = nn.CrossEntropyLoss()
 # Adam optimizer
@@ -112,7 +109,7 @@ def objective(trial):
     batch_size = trial.suggest_categorical("batch_size", [16, 32, 64])
     # Modify the model and optimizer using suggested hyperparameters
-    model = resnet18(pretrained=False, num_classes=NUM_CLASSES).to(DEVICE)
     optimizer = optim.Adam(model.parameters(), lr=learning_rate)
     for epoch in range(NUM_EPOCHS):

 NUM_CLASSES = len(os.listdir(ORIG_DATA_DIR))
 VAL_RESIZE_SIZE = 232
 def resize_for_validation(image):
     return transforms.Resize((VAL_RESIZE_SIZE, VAL_RESIZE_SIZE))(image)
 )
 # Initialize model, criterion, optimizer, and scheduler
+model = mobilenet_v2(pretrained=False, num_classes=NUM_CLASSES)
 model = model.to(DEVICE)
 criterion = nn.CrossEntropyLoss()
 # Adam optimizer
     batch_size = trial.suggest_categorical("batch_size", [16, 32, 64])
     # Modify the model and optimizer using suggested hyperparameters
+    model = mobilenet_v2(pretrained=False, num_classes=NUM_CLASSES).to(DEVICE)
     optimizer = optim.Adam(model.parameters(), lr=learning_rate)
     for epoch in range(NUM_EPOCHS):

handetect/evaluation.py CHANGED Viewed

@@ -23,7 +23,7 @@ print(images)
 true_classs = []
 predicted_labels = []
-model = vgg16(pretrained=False, num_classes=NUM_CLASSES)
 model.load_state_dict(torch.load(model_checkpoint_path, map_location=DEVICE))
 model.eval()
 model = model.to(DEVICE)

 true_classs = []
 predicted_labels = []
+model = mobilenet_v2(pretrained=False, num_classes=NUM_CLASSES)
 model.load_state_dict(torch.load(model_checkpoint_path, map_location=DEVICE))
 model.eval()
 model = model.to(DEVICE)

handetect/main.py CHANGED Viewed

@@ -11,15 +11,17 @@ from scipy.ndimage import gaussian_filter1d
 from torch.utils.tensorboard import SummaryWriter #print to tensorboard
 from torchvision.utils import make_grid
-torch.cuda.empty_cache()
-writer = SummaryWriter()
 # Constants
 RANDOM_SEED = 123
-BATCH_SIZE = 32
 NUM_EPOCHS = 100
-LEARNING_RATE = 0.001
 STEP_SIZE = 10
 GAMMA = 0.5
 DEVICE = torch.device("cuda:0" if torch.cuda.is_available() else "cpu")
@@ -54,8 +56,6 @@ print("Classes: ", original_dataset.classes)
 print("Length of original dataset: ", len(original_dataset))
 print("Length of augmented dataset: ", len(augmented_dataset))
 print("Length of total dataset: ", len(dataset))
-print("Classes: ", original_dataset.classes)
 # Custom dataset class
 class CustomDataset(Dataset):
@@ -84,15 +84,13 @@ valid_loader = DataLoader(
 )
 # Initialize model, criterion, optimizer, and scheduler
-model = vgg16(pretrained=False, num_classes=NUM_CLASSES)
 model = model.to(DEVICE)
 criterion = nn.CrossEntropyLoss()
 # Adam optimizer
 optimizer = optim.Adam(model.parameters(), lr=LEARNING_RATE)
-# ReduceLROnPlateau scheduler
-scheduler = optim.lr_scheduler.ReduceLROnPlateau(
-    optimizer, mode="min", factor=0.1, patience=10, verbose=True
-)
 # Lists to store training and validation loss history
 TRAIN_LOSS_HIST = []
@@ -145,7 +143,7 @@ for epoch in range(NUM_EPOCHS):
     # Learning rate scheduling
     lr_1 = optimizer.param_groups[0]["lr"]
     print("Learning Rate: {:.15f}".format(lr_1))
-    scheduler.step(avg_train_loss)
     # Validation loop
     model.eval()  # Set model to evaluation mode

 from torch.utils.tensorboard import SummaryWriter #print to tensorboard
 from torchvision.utils import make_grid
+# torch.cuda.empty_cache()
+# os.environ["PYTORCH_CUDA_ALLOC_CONF"] = "max_split_size_mb:1024"
+writer = SummaryWriter(log_dir='runs/Task1')
 # Constants
 RANDOM_SEED = 123
+BATCH_SIZE = 16
 NUM_EPOCHS = 100
+LEARNING_RATE = 0.030215994618918267
 STEP_SIZE = 10
 GAMMA = 0.5
 DEVICE = torch.device("cuda:0" if torch.cuda.is_available() else "cpu")
 print("Length of original dataset: ", len(original_dataset))
 print("Length of augmented dataset: ", len(augmented_dataset))
 print("Length of total dataset: ", len(dataset))
 # Custom dataset class
 class CustomDataset(Dataset):
 )
 # Initialize model, criterion, optimizer, and scheduler
+model = mobilenet_v3_small(num_classes=NUM_CLASSES)
 model = model.to(DEVICE)
 criterion = nn.CrossEntropyLoss()
 # Adam optimizer
 optimizer = optim.Adam(model.parameters(), lr=LEARNING_RATE)
+# StepLR scheduler
+scheduler = optim.lr_scheduler.StepLR(optimizer, step_size=STEP_SIZE, gamma=GAMMA)
 # Lists to store training and validation loss history
 TRAIN_LOSS_HIST = []
     # Learning rate scheduling
     lr_1 = optimizer.param_groups[0]["lr"]
     print("Learning Rate: {:.15f}".format(lr_1))
+    scheduler.step()
     # Validation loop
     model.eval()  # Set model to evaluation mode

handetect/models.py CHANGED Viewed

@@ -7,336 +7,9 @@ from torchvision.models import resnet50
 from torchvision.models import resnet18
 from torchvision.models import squeezenet1_0
 from torchvision.models import vgg16
-# resnet50
-class Bottleneck(torch.nn.Module):
-    expansion = 4
-    def __init__(self, in_channels, out_channels, i_downsample=None, stride=1):
-        super(Bottleneck, self).__init__()
-        # hmm,ex 1x1 convolution to reduce channels (intermediate channels)
-        self.conv1 = torch.nn.Conv2d(
-            in_channels, out_channels, kernel_size=1, stride=1, padding=0
-        )
-        self.batch_norm1 = torch.nn.BatchNorm2d(out_channels)
-        # 3x3 convolution with specified stride
-        self.conv2 = torch.nn.Conv2d(
-            out_channels, out_channels, kernel_size=3, stride=stride, padding=1
-        )
-        self.batch_norm2 = torch.nn.BatchNorm2d(out_channels)
-        # and then leh,1x1 expand back
-        self.conv3 = torch.nn.Conv2d(
-            out_channels,
-            out_channels * self.expansion,
-            kernel_size=1,
-            stride=1,
-            padding=0,
-        )
-        self.batch_norm3 = torch.nn.BatchNorm2d(out_channels * self.expansion)
-        self.i_downsample = i_downsample
-        self.stride = stride
-        self.relu = torch.nn.ReLU()
-    ##forward the input x through the network,haiyaa
-    def forward(self, x):
-        identity = x.clone()
-        x = self.relu(self.batch_norm1(self.conv1(x)))
-        x = self.relu(self.batch_norm2(self.conv2(x)))
-        x = self.conv3(x)
-        x = self.batch_norm3(x)
-        # downsample if needed
-        if self.i_downsample is not None:
-            identity = self.i_downsample(identity)
-        # add identity
-        x += identity
-        x = self.relu(x)
-        return x
-# we no use this first,but we can just copy this whole class and apply to resnet16 and etc
-class Block(torch.nn.Module):
-    expansion = 1
-    def __init__(self, in_channels, out_channels, i_downsample=None, stride=1):
-        super(Block, self).__init__()
-        self.conv1 = torch.nn.Conv2d(
-            in_channels,
-            out_channels,
-            kernel_size=3,
-            padding=1,
-            stride=stride,
-            bias=False,
-        )
-        self.batch_norm1 = torch.nn.BatchNorm2d(out_channels)
-        self.conv2 = torch.nn.Conv2d(
-            out_channels,
-            out_channels,
-            kernel_size=3,
-            padding=1,
-            stride=stride,
-            bias=False,
-        )
-        self.batch_norm2 = torch.nn.BatchNorm2d(out_channels)
-        self.i_downsample = i_downsample
-        self.stride = stride
-        self.relu = torch.nn.ReLU()
-    def forward(self, x):
-        identity = x.clone()
-        x = self.relu(self.batch_norm2(self.conv1(x)))
-        x = self.batch_norm2(self.conv2(x))
-        if self.i_downsample is not None:
-            identity = self.i_downsample(identity)
-        print(x.shape)
-        print(identity.shape)
-        x += identity
-        x = self.relu(x)
-        return x
-class ResNet(torch.nn.Module):
-    def __init__(self, ResBlock, layer_list, num_classes, num_channels=3):
-        super(ResNet, self).__init__()
-        self.in_channels = 64
-        # intial conv layaer
-        self.conv1 = torch.nn.Conv2d(
-            num_channels, 64, kernel_size=7, stride=2, padding=3, bias=False
-        )
-        self.batch_norm1 = torch.nn.BatchNorm2d(64)
-        self.relu = torch.nn.ReLU()
-        self.max_pool = torch.nn.MaxPool2d(kernel_size=3, stride=2, padding=1)
-        # residual block(layers),each block got three three layer,total 4 blocks
-        self.layer1 = self._make_layer(ResBlock, layer_list[0], planes=64)
-        self.layer2 = self._make_layer(ResBlock, layer_list[1], planes=128, stride=2)
-        self.layer3 = self._make_layer(ResBlock, layer_list[2], planes=256, stride=2)
-        self.layer4 = self._make_layer(ResBlock, layer_list[3], planes=512, stride=2)
-        self.avgpool = torch.nn.AdaptiveAvgPool2d((1, 1))
-        self.fc = torch.nn.Linear(512 * ResBlock.expansion, num_classes)
-    def forward(self, x):
-        x = self.relu(self.batch_norm1(self.conv1(x)))
-        x = self.max_pool(x)
-        x = self.layer1(x)
-        x = self.layer2(x)
-        x = self.layer3(x)
-        x = self.layer4(x)
-        x = self.avgpool(x)
-        x = x.reshape(x.shape[0], -1)
-        x = self.fc(x)
-        return x
-    def _make_layer(self, ResBlock, blocks, planes, stride=1):
-        # plane is the number of output channel
-        ii_downsample = None
-        layers = []
-        if stride != 1 or self.in_channels != planes * ResBlock.expansion:
-            ii_downsample = torch.nn.Sequential(
-                torch.nn.Conv2d(
-                    self.in_channels,
-                    planes * ResBlock.expansion,
-                    kernel_size=1,
-                    stride=stride,
-                ),
-                torch.nn.BatchNorm2d(planes * ResBlock.expansion),
-            )
-        layers.append(
-            ResBlock(
-                self.in_channels, planes, i_downsample=ii_downsample, stride=stride
-            )
-        )
-        self.in_channels = planes * ResBlock.expansion
-        for i in range(blocks - 1):
-            layers.append(ResBlock(self.in_channels, planes))
-        return torch.nn.Sequential(*layers)
-##list here leh is the number of residual block in each layer
-def ResNet50(num_classes, channels=3):
-    return ResNet(Bottleneck, [3, 4, 6, 3], num_classes, channels)
-# VGG16 model
-class VGG16(torch.nn.Module):
-    def __init__(self, num_classes):
-        super().__init__()
-        self.block_1 = torch.nn.Sequential(
-            torch.nn.Conv2d(
-                in_channels=3,
-                out_channels=64,
-                kernel_size=(3, 3),
-                stride=(1, 1),
-                padding=1,
-            ),
-            torch.nn.ReLU(),
-            torch.nn.Conv2d(
-                in_channels=64,
-                out_channels=64,
-                kernel_size=(3, 3),
-                stride=(1, 1),
-                padding=1,
-            ),
-            torch.nn.ReLU(),
-            torch.nn.MaxPool2d(kernel_size=(2, 2), stride=(2, 2)),
-        )
-        self.block_2 = torch.nn.Sequential(
-            torch.nn.Conv2d(
-                in_channels=64,
-                out_channels=128,
-                kernel_size=(3, 3),
-                stride=(1, 1),
-                padding=1,
-            ),
-            torch.nn.ReLU(),
-            torch.nn.Conv2d(
-                in_channels=128,
-                out_channels=128,
-                kernel_size=(3, 3),
-                stride=(1, 1),
-                padding=1,
-            ),
-            torch.nn.ReLU(),
-            torch.nn.MaxPool2d(kernel_size=(2, 2), stride=(2, 2)),
-        )
-        self.block_3 = torch.nn.Sequential(
-            torch.nn.Conv2d(
-                in_channels=128,
-                out_channels=256,
-                kernel_size=(3, 3),
-                stride=(1, 1),
-                padding=1,
-            ),
-            torch.nn.ReLU(),
-            torch.nn.Conv2d(
-                in_channels=256,
-                out_channels=256,
-                kernel_size=(3, 3),
-                stride=(1, 1),
-                padding=1,
-            ),
-            torch.nn.ReLU(),
-            torch.nn.Conv2d(
-                in_channels=256,
-                out_channels=256,
-                kernel_size=(3, 3),
-                stride=(1, 1),
-                padding=1,
-            ),
-            torch.nn.ReLU(),
-            torch.nn.MaxPool2d(kernel_size=(2, 2), stride=(2, 2)),
-        )
-        self.block_4 = torch.nn.Sequential(
-            torch.nn.Conv2d(
-                in_channels=256,
-                out_channels=512,
-                kernel_size=(3, 3),
-                stride=(1, 1),
-                padding=1,
-            ),
-            torch.nn.ReLU(),
-            torch.nn.Conv2d(
-                in_channels=512,
-                out_channels=512,
-                kernel_size=(3, 3),
-                stride=(1, 1),
-                padding=1,
-            ),
-            torch.nn.ReLU(),
-            torch.nn.Conv2d(
-                in_channels=512,
-                out_channels=512,
-                kernel_size=(3, 3),
-                stride=(1, 1),
-                padding=1,
-            ),
-            torch.nn.ReLU(),
-            torch.nn.MaxPool2d(kernel_size=(2, 2), stride=(2, 2)),
-        )
-        self.block_5 = torch.nn.Sequential(
-            torch.nn.Conv2d(
-                in_channels=512,
-                out_channels=512,
-                kernel_size=(3, 3),
-                stride=(1, 1),
-                padding=1,
-            ),
-            torch.nn.ReLU(),
-            torch.nn.Conv2d(
-                in_channels=512,
-                out_channels=512,
-                kernel_size=(3, 3),
-                stride=(1, 1),
-                padding=1,
-            ),
-            torch.nn.ReLU(),
-            torch.nn.Conv2d(
-                in_channels=512,
-                out_channels=512,
-                kernel_size=(3, 3),
-                stride=(1, 1),
-                padding=1,
-            ),
-            torch.nn.ReLU(),
-            torch.nn.MaxPool2d(kernel_size=(2, 2), stride=(2, 2)),
-        )
-        height, width = 3, 3
-        self.classifier = torch.nn.Sequential(
-            torch.nn.Linear(512 * height * width, 4096),
-            torch.nn.ReLU(True),
-            torch.nn.Dropout(p=0.5),
-            torch.nn.Linear(4096, 4096),
-            torch.nn.ReLU(True),
-            torch.nn.Dropout(p=0.5),
-            torch.nn.Linear(4096, num_classes),
-        )
-        for m in self.modules():
-            if isinstance(m, torch.torch.nn.Conv2d) or isinstance(
-                m, torch.torch.nn.Linear
-            ):
-                torch.nn.init.kaiming_uniform_(
-                    m.weight, mode="fan_in", nonlinearity="relu"
-                )
-                if m.bias is not None:
-                    m.bias.detach().zero_()
-        self.avgpool = torch.nn.AdaptiveAvgPool2d((height, width))
-    def forward(self, x):
-        x = self.block_1(x)
-        x = self.block_2(x)
-        x = self.block_3(x)
-        x = self.block_4(x)
-        x = self.block_5(x)
-        x = self.avgpool(x)
-        x = x.view(x.size(0), -1)  # flatten
-        logits = self.classifier(x)
-        # probas = F.softmax(logits, dim=1)
-        return logits
-# ResNet18 model

 from torchvision.models import resnet18
 from torchvision.models import squeezenet1_0
 from torchvision.models import vgg16
+from torchvision.models import alexnet
+from torchvision.models import densenet121
+from torchvision.models import googlenet
+from torchvision.models import inception_v3
+from torchvision.models import mobilenet_v2
+from torchvision.models import mobilenet_v3_small

handetect/predict.py CHANGED Viewed

@@ -25,7 +25,7 @@ preprocess = transforms.Compose(
 )
 # Load your model (change this according to your model definition)
-model = vgg16(pretrained=False, num_classes=NUM_CLASSES)
 model.load_state_dict(
     torch.load(model_checkpoint_path, map_location=DEVICE)
 )  # Load the model on the same device

 )
 # Load your model (change this according to your model definition)
+model = squeezenet1_0(pretrained=False, num_classes=NUM_CLASSES)
 model.load_state_dict(
     torch.load(model_checkpoint_path, map_location=DEVICE)
 )  # Load the model on the same device