# NOTE: contrastive pretraining only reaches ~50% accuracy here — about the same as plain supervised training.
import os
import torch
import torch.nn as nn
import torch.optim as optim
import torchvision.transforms as transforms
from torchvision.datasets import ImageFolder
from torch.utils.data import DataLoader, Dataset
from torchvision import models
from tqdm import tqdm
from torchvision.transforms import autoaugment
import numpy as np
# ----------------------
# 1. Data preparation
# ----------------------
# Expected dataset layout:
# food11/
# ├── train/   (unlabeled data for unsupervised pretraining)
# ├── labeled/ (partially labeled data for supervised fine-tuning)
# └── test/
# Data augmentation for contrastive learning
class ContrastiveTransformations:
    """Callable that maps one PIL image to two independently augmented views.

    Standard SimCLR augmentation stack: random crop, horizontal flip,
    color jitter, Gaussian blur, then tensor conversion and ImageNet
    normalisation. Each call draws the stochastic pipeline twice.
    """

    def __init__(self):
        self.transform = transforms.Compose([
            transforms.RandomResizedCrop(224, scale=(0.8, 1.0)),
            transforms.RandomHorizontalFlip(),
            transforms.ColorJitter(0.4, 0.4, 0.4, 0.1),
            transforms.GaussianBlur(kernel_size=23),
            transforms.ToTensor(),
            transforms.Normalize(mean=[0.485, 0.456, 0.406], std=[0.229, 0.224, 0.225]),
        ])

    def __call__(self, x):
        # Two independent draws of the stochastic pipeline -> two views.
        return [self.transform(x) for _ in range(2)]
# Dataset for unsupervised pretraining: yields two augmented views per image.
class UnlabeledDataset(Dataset):
    """Wraps an ImageFolder, discards the label, and returns (view1, view2)."""

    def __init__(self, root_dir):
        # ContrastiveTransformations produces a [view1, view2] list per image.
        self.dataset = ImageFolder(root=root_dir, transform=ContrastiveTransformations())

    def __getitem__(self, index):
        # ImageFolder yields (transformed_image, label); keep only the views.
        views, _ = self.dataset[index]
        return views[0], views[1]

    def __len__(self):
        return len(self.dataset)
HW = 224  # input side length (pixels) used by the supervised fine-tuning transforms
# Dataset for the supervised fine-tuning stage (images with class labels).
class LabeledDataset(Dataset):
    """ImageFolder wrapper applying light train-time augmentation + normalisation."""

    def __init__(self, root_dir):
        augmentation = transforms.Compose([
            transforms.RandomResizedCrop(HW),
            transforms.RandomHorizontalFlip(),
            #autoaugment.AutoAugment(),
            transforms.ToTensor(),
            transforms.Normalize(mean=[0.485, 0.456, 0.406], std=[0.229, 0.224, 0.225]),
        ])
        self.dataset = ImageFolder(root=root_dir, transform=augmentation)

    def __getitem__(self, index):
        # Delegates straight to ImageFolder: (image_tensor, class_index).
        return self.dataset[index]

    def __len__(self):
        return len(self.dataset)
# Build the datasets and DataLoaders (paths point at a local food-11 copy).
train_unlabeled = UnlabeledDataset(root_dir=r'D:\BaiduNetdiskDownload\第四五节_分类代码 (2)\food_classification\food-11\training\unlabeled')
train_labeled = LabeledDataset(root_dir=r'D:\BaiduNetdiskDownload\第四五节_分类代码 (2)\food_classification\food-11\training\labeled')
test_dataset = LabeledDataset(root_dir=r'D:\BaiduNetdiskDownload\第四五节_分类代码 (2)\food_classification\food-11\validation')
batch_size = 32
#num_workers = 4
# NOTE(review): no num_workers/pin_memory configured, so image decoding runs
# in the main process — likely an input-pipeline bottleneck; confirm on target machine.
train_unlabeled_loader = DataLoader(
    train_unlabeled, batch_size=batch_size, shuffle=True
)
train_labeled_loader = DataLoader(
    train_labeled, batch_size=batch_size, shuffle=True
)
test_loader = DataLoader(test_dataset, batch_size=batch_size)
# ----------------------
# 2. Model definitions
# ----------------------
# SimCLR model (unsupervised pretraining)
class Encoder(nn.Module):
    """Four-stage plain CNN encoder: each stage is Conv3x3 -> BN -> ReLU -> MaxPool(2).

    For a 224x224 input the spatial size halves five times
    (224 -> 112 -> 56 -> 28 -> 14 -> 7), so the flattened feature has
    512 * 7 * 7 = 25088 values — matching the Projection head's input_dim.

    The child module names (layer0..layer3, pool1, flatten) and the internal
    Sequential layout are kept identical to the original so previously saved
    state_dicts still load.
    """

    def __init__(self, base_encoder=None):
        # `base_encoder` is accepted for backward compatibility but was never
        # used; the original default (torchvision's models.resnet50) created a
        # dead dependency, so it is now None.
        super().__init__()
        self.layer0 = self._block(3, 64)      # 224 -> 112
        self.layer1 = self._block(64, 128)    # 112 -> 56
        self.layer2 = self._block(128, 256)   # 56 -> 28
        self.layer3 = self._block(256, 512)   # 28 -> 14
        self.pool1 = nn.MaxPool2d(2)          # 14 -> 7
        self.flatten = nn.Flatten()

    @staticmethod
    def _block(in_channels, out_channels):
        """One Conv3x3 (stride 1, pad 1) -> BatchNorm -> ReLU -> MaxPool(2) stage."""
        return nn.Sequential(
            nn.Conv2d(in_channels=in_channels, out_channels=out_channels,
                      kernel_size=3, stride=1, padding=1, bias=True),
            nn.BatchNorm2d(out_channels),
            nn.ReLU(inplace=True),
            nn.MaxPool2d(2),
        )

    def forward(self, x):
        """Encode a (B, 3, H, W) batch into a (B, 512 * H/32 * W/32) feature."""
        x = self.layer0(x)
        x = self.layer1(x)
        x = self.layer2(x)
        x = self.layer3(x)
        x = self.pool1(x)
        return self.flatten(x)
# Custom projection head
class Projection(nn.Module):
    """Two-layer MLP projection head; outputs are L2-normalised to unit length."""

    def __init__(self, input_dim=25088, hidden_dim=2048, output_dim=128):
        super().__init__()
        layers = [
            nn.Linear(input_dim, hidden_dim),
            nn.BatchNorm1d(hidden_dim),  # normalise the hidden activations
            nn.ReLU(inplace=True),
            nn.Linear(hidden_dim, output_dim),
        ]
        self.mlp = nn.Sequential(*layers)

    def forward(self, x):
        projected = self.mlp(x)
        # Unit-normalise so cosine similarity reduces to a plain dot product.
        return nn.functional.normalize(projected, dim=1)
# Full contrastive model: encoder + projection head
class CustomSimCLR(nn.Module):
    """SimCLR model = feature encoder followed by a projection head."""

    def __init__(self, encoder, projection_head):
        super().__init__()
        # Backbone that extracts features (e.g. the custom CNN Encoder).
        self.encoder = encoder
        # Head that maps features into the contrastive embedding space.
        self.projection_head = projection_head

    def forward(self, x):
        # Encode, then project into the (normalised) contrastive space.
        return self.projection_head(self.encoder(x))
# Instantiate the backbone and projection head used for SimCLR pretraining.
encoder = Encoder()
# 25088 = 512 channels * 7 * 7 spatial positions for a 224x224 input.
projection_head = Projection(input_dim=25088, hidden_dim=2048, output_dim=128)
# Classification model (supervised fine-tuning)
class FineTuneModel(nn.Module):
    """Classifier for supervised fine-tuning: pretrained encoder + 2-layer head.

    Attribute names (encoder, fc, relu1, fc2) are preserved so saved
    state_dicts remain loadable.
    """

    def __init__(self, pretrained_encoder, num_classes=11):
        super().__init__()
        # Reuse the backbone from the SimCLR model; its projection head is dropped.
        self.encoder = pretrained_encoder.encoder
        # Classification head: 25088-dim encoder feature -> 512 -> num_classes.
        self.fc = nn.Linear(25088, 512)
        self.relu1 = nn.ReLU(inplace=True)
        self.fc2 = nn.Linear(512, num_classes)

    def forward(self, x):
        features = self.encoder(x)
        hidden = self.relu1(self.fc(features))
        return self.fc2(hidden)
def nt_xent_loss(z1, z2, temperature=0.1):
    """NT-Xent (normalised temperature-scaled cross-entropy) loss from SimCLR.

    Args:
        z1, z2: (N, D) L2-normalised projections of two augmented views of the
            same N images; row i of z1 and row i of z2 form a positive pair.
        temperature: softmax temperature scaling the cosine logits.

    Returns:
        Scalar loss tensor.
    """
    n = z1.size(0)
    z = torch.cat([z1, z2], dim=0)                 # (2N, D)
    sim_matrix = torch.mm(z, z.t()) / temperature  # pairwise cosine logits
    # BUG FIX: the previous version "excluded" self-similarity by multiplying
    # with a 0/1 mask, which only zeroes the self logit; exp(0) = 1 still
    # entered every softmax denominator and biased the loss. Setting the
    # diagonal to -inf removes self-pairs from the softmax entirely.
    sim_matrix.fill_diagonal_(float('-inf'))
    # The positive of row i (i < n) is row i + n, and vice versa.
    # Target tensor is placed on z's device (the old code read a global
    # `device`, which crashed when the function was used outside __main__).
    targets = torch.cat([torch.arange(n) + n, torch.arange(n)], dim=0).to(z.device)
    return torch.nn.functional.cross_entropy(sim_matrix, targets)
# ----------------------
# 3. Unsupervised pretraining
# ----------------------
# ... (code above unchanged)
# Entry point: (previously run) SimCLR pretraining, then supervised fine-tuning.
if __name__ == '__main__':
    # ----------------------
    # 3. Unsupervised pretraining
    # ----------------------
    device = torch.device('cuda' if torch.cuda.is_available() else 'cpu')
    #model = CustomSimCLR(encoder, projection_head).to(device)
    #optimizer = torch.optim.AdamW(model.parameters(), lr=1e-4,weight_decay=1e-4)
    '''
    # 预训练循环
    num_epochs = 50
    model.train()
    for epoch in range(num_epochs):
        total_loss = 0.0
        for view1, view2 in tqdm(train_unlabeled_loader, desc=f'Epoch {epoch + 1}'):
            view1, view2 = view1.to(device), view2.to(device)
            optimizer.zero_grad()
            z1 = model(view1)
            z2 = model(view2)
            loss = nt_xent_loss(z1, z2)
            loss.backward()
            optimizer.step()
            total_loss += loss.item()
        avg_loss = total_loss / len(train_unlabeled_loader)
        print(f'Pretrain Epoch {epoch + 1}, Loss: {avg_loss:.4f}')
    # 保存预训练权重
    torch.save(model.state_dict(), 'simclr_pretrained.pth')
    '''
    # ----------------------
    # 4. Supervised fine-tuning
    # ----------------------
    # Load the pretrained SimCLR weights (file must exist from an earlier
    # pretraining run, otherwise torch.load raises FileNotFoundError).
    pretrained_model = CustomSimCLR(encoder, projection_head)
    pretrained_model.load_state_dict(torch.load('simclr_pretrained.pth'))
    finetune_model = FineTuneModel(pretrained_model).to(device)
    # Optionally freeze the encoder so only the classifier head trains:
    #for param in finetune_model.encoder.parameters():
    #param.requires_grad = False
    optimizer = torch.optim.AdamW(finetune_model.parameters(), lr=1e-4, weight_decay=1e-4)
    criterion = nn.CrossEntropyLoss()
    # Fine-tuning loop: track the best test accuracy and checkpoint on improvement.
    num_finetune_epochs = 20
    best_acc = 0.0
    for epoch in range(num_finetune_epochs):
        finetune_model.train()
        total_loss, total_correct = 0.0, 0
        for images, labels in tqdm(train_labeled_loader, desc=f'Finetune Epoch {epoch + 1}'):
            images, labels = images.to(device), labels.to(device)
            optimizer.zero_grad()
            outputs = finetune_model(images)
            loss = criterion(outputs, labels)
            loss.backward()
            optimizer.step()
            total_loss += loss.item()
            _, preds = torch.max(outputs, 1)
            total_correct += torch.sum(preds == labels.data).item()
        # Evaluation on the held-out set (no gradients, eval-mode BatchNorm).
        finetune_model.eval()
        test_correct = 0
        with torch.no_grad():
            for images, labels in test_loader:
                images, labels = images.to(device), labels.to(device)
                outputs = finetune_model(images)
                _, preds = torch.max(outputs, 1)
                test_correct += torch.sum(preds == labels.data).item()
        train_acc = total_correct / len(train_labeled.dataset)
        test_acc = test_correct / len(test_dataset)
        print(f'Epoch {epoch + 1}, Train Loss: {total_loss / len(train_labeled_loader):.4f}, '
              f'Train Acc: {train_acc:.4f}, Test Acc: {test_acc:.4f}')
        # Keep only the best checkpoint by test accuracy.
        if test_acc > best_acc:
            best_acc = test_acc
            torch.save(finetune_model.state_dict(), 'best_finetune_model.pth')
    print(f'Best Test Accuracy: {best_acc:.4f}')
# TODO(review): investigate how to raise accuracy further — SimCLR pretraining on food-11 is expected to reach ~70%, not 50%.