当前位置: 首页 > ai >正文

Python打卡训练营Day43

DAY 43 复习日

作业:

kaggle找到一个图像数据集,用cnn网络进行训练并且用grad-cam做可视化

数据集地址:Lung Nodule Malignancy 肺结核良恶性判断 

进阶:并拆分成多个文件

import os
import pandas as pd
import numpy as np
from sklearn.model_selection import train_test_split
from torch.utils.data import Dataset, DataLoader
from PIL import Image
import torch
from torchvision import transforms
import torch.nn as nn
import torch.optim as optim
import matplotlib.pyplot as plt# 1. 读标签并映射 0/1
df = pd.read_csv('archive/malignancy.csv')# 2. 按 patch_id 划 train/val
ids    = df['NoduleID'].values
labels = df['malignancy'].values
train_ids, val_ids = train_test_split(ids, test_size=0.2, random_state=42, stratify=labels
)
train_df = df[df['NoduleID'].isin(train_ids)].reset_index(drop=True)
val_df   = df[df['NoduleID'].isin(val_ids)].reset_index(drop=True)# 3. Dataset:多页 TIFF 按页读取
class LungTBDataset(Dataset):def __init__(self, tif_path, df, transform=None):self.tif_path = tif_pathself.df = dfself.transform = transformdef __len__(self):return len(self.df)def __getitem__(self, idx):row = self.df.iloc[idx]pid = int(row['NoduleID'])label = int(row['malignancy'])try:with Image.open(self.tif_path) as img:# 检查 pid 是否超出实际帧数total_pages = sum(1 for _ in ImageSequence.Iterator(img))if pid >= total_pages:pid = total_pages - 1  # 取最后一帧img.seek(pid)img = img.convert('RGB')except Exception as e:# 返回黑色占位图img = Image.new('RGB', (224, 224), (0, 0, 0))if self.transform:img = self.transform(img)return img, label# 4. 变换 & DataLoader
transform = transforms.Compose([transforms.Resize((224,224)),transforms.ToTensor(),transforms.Normalize(mean=[0.485,0.456,0.406],std =[0.229,0.224,0.225])
])
train_ds = LungTBDataset('archive/ct_tiles.tif', train_df, transform)
val_ds   = LungTBDataset('archive/ct_tiles.tif',   val_df, transform)
train_loader = DataLoader(train_ds, batch_size=16, shuffle=True,  num_workers=0, pin_memory=True)
val_loader   = DataLoader(val_ds,   batch_size=16, shuffle=False, num_workers=0, pin_memory=True)# 5. 定义简单 CNN(3层卷积 + 全连接)
class SimpleCNN(nn.Module):def __init__(self):super(SimpleCNN, self).__init__()# 卷积层self.conv1 = nn.Sequential(nn.Conv2d(3, 32, kernel_size=3, padding=1),nn.ReLU(inplace=True),nn.MaxPool2d(2)  # 224->112)self.conv2 = nn.Sequential(nn.Conv2d(32, 64, kernel_size=3, padding=1),nn.ReLU(inplace=True),nn.MaxPool2d(2)  # 112->56)# 最后一层卷积,用于 Grad-CAMself.conv3 = nn.Sequential(nn.Conv2d(64, 128, kernel_size=3, padding=1),nn.ReLU(inplace=True),nn.MaxPool2d(2)  # 56->28)# 全连接分类器self.fc = nn.Sequential(nn.Flatten(),nn.Linear(128 * 28 * 28, 256),nn.ReLU(inplace=True),nn.Linear(256, 2))def forward(self, x):x = self.conv1(x)x = self.conv2(x)x = self.conv3(x)      # 保留这一层的输出作 CAMx = self.fc(x)return xdevice = torch.device('cuda' if torch.cuda.is_available() else 'cpu')
model = SimpleCNN().to(device)criterion = nn.CrossEntropyLoss()
optimizer = optim.Adam(model.parameters(), lr=1e-4)# 6. 训练 + 验证循环
num_epochs = 5
for epoch in range(num_epochs):# 训练model.train()running_loss = 0for imgs, labs in train_loader:imgs, labs = imgs.to(device), labs.to(device)optimizer.zero_grad()outputs = model(imgs)loss    = criterion(outputs, labs)loss.backward()optimizer.step()running_loss += loss.item() * imgs.size(0)epoch_loss = running_loss / len(train_ds)# 验证model.eval()correct = 0with torch.no_grad():for imgs, labs in val_loader:imgs, labs = imgs.to(device), labs.to(device)preds = model(imgs).argmax(dim=1)correct += (preds == labs).sum().item()val_acc = correct / len(val_ds)print(f'Epoch {epoch+1}/{num_epochs}  Loss={epoch_loss:.4f}  ValAcc={val_acc:.4f}')# 7. 简易 Grad-CAM
class GradCAM:def __init__(self, model, target_conv):self.model = modelself.target_conv = target_convself.grad    = Noneself.activation = None# 注册 hooktarget_conv.register_forward_hook(self._forward)target_conv.register_backward_hook(self._backward)def _forward(self, module, inp, outp):self.activation = outp.detach()def _backward(self, module, grad_in, grad_out):self.grad = grad_out[0].detach()def __call__(self, x, class_idx=None):self.model.zero_grad()out = self.model(x)if class_idx is None:class_idx = out.argmax(dim=1).item()loss = out[0, class_idx]loss.backward()# 计算权重weights = self.grad.mean(dim=(2,3))  # (1,C)cam = (weights.view(-1,1,1) * self.activation[0]).sum(dim=0)cam = torch.relu(cam)cam -= cam.min()cam /= cam.max()return cam.cpu().numpy()# 8. 随机选一张验证图做可视化
model.eval()
imgs, labs = next(iter(val_loader))
img, lab = imgs[0:1].to(device), labs[0].item()# 以 conv3 的最后 Conv2d 为 target
# conv3 是 Sequential,取其中的第0层 Conv2d
target_layer = model.conv3[0]
gradcam = GradCAM(model, target_layer)
heatmap = gradcam(img)  # (28,28)# 上采样到 224×224
heatmap = np.uint8(255 * heatmap)
heatmap = Image.fromarray(heatmap).resize((224,224), resample=Image.BILINEAR)
heatmap = np.array(heatmap) / 255.0# 反归一化 & 可视化叠加
inv_norm = transforms.Normalize(mean=[-0.485/0.229, -0.456/0.224, -0.406/0.225],std =[1/0.229,       1/0.224,       1/0.225]
)
img_show = inv_norm(img[0]).permute(1,2,0).cpu().numpy()
img_show = np.clip(img_show, 0, 1)plt.figure(figsize=(8,4))
plt.subplot(1,2,1)
plt.imshow(img_show)
plt.title(f'Label={lab}')
plt.axis('off')plt.subplot(1,2,2)
plt.imshow(img_show, alpha=0.6)
plt.imshow(heatmap, cmap='jet', alpha=0.4)
plt.title('Grad-CAM')
plt.axis('off')
plt.tight_layout()
plt.show()

代码没问题但跑的很慢不知道啥原因。

浙大疏锦行-CSDN博客

http://www.xdnf.cn/news/10610.html

相关文章:

  • 《多状态DP:状态设计与状态转移方程速成指南》​
  • Leetcode 1136. 并行课程
  • MySQL语法练习 - 基础DDL/DML/DQL/DCL练习
  • 监督学习 vs 无监督学习:AI两大学习范式深度解析
  • Java内部类详细教程
  • 06.MySQL数据库操作详解
  • Retrievers检索器+RAG文档助手项目实战
  • 字符串加解密
  • 配置刷新技术
  • 【Python 进阶3】常见的 call 和 forward 区别
  • JavaSE 字符串:深入解析 String、StringBuilder与 StringBuffer
  • 第十章:Next的Seo实践
  • 力扣HOT100之多维动态规划:62. 不同路径
  • C. Basketball Exercise
  • Vue-6-前端框架Vue之基于Plotly.js绘制曲线
  • 3,信号与槽机制
  • BUUCTF[ACTF2020 新生赛]Include 1题解
  • NVM,Node.Js 管理工具
  • 【Delphi】接收windows文件夹中文件拖拽
  • (Python网络爬虫);抓取B站404页面小漫画
  • Python-matplotlib库之核心对象
  • 设计模式——备忘录设计模式(行为型)
  • Kotlin 中 companion object 扩展函数详解
  • Java连接Redis和基础操作命令
  • 【Linux】Ubuntu 20.04 英文系统显示中文字体异常
  • 什么是线程上下文切换?
  • 【SpringBoot】| 接口架构风格—RESTful
  • 概率统计:AI大模型的数学支柱
  • Linux--进程概念
  • 【redis实战篇】第七天