基于卷积神经网络的肺炎影像分类分割智能诊断系统

项目参考 AAAI Association for the Advancement of Artificial Intelligence

研究背景与意义：

肺炎是一种常见的呼吸系统感染疾病，其主要病因包括细菌、病毒和真菌等。肺炎的早期诊断对于患者的治疗和预后至关重要。传统的肺炎诊断方法主要依赖于医生的经验和肺部影像学的观察，这种方法存在主观性强、诊断效率低等问题。随着计算机科学和人工智能的快速发展，基于卷积神经网络的肺炎影像分类分割智能诊断系统逐渐成为研究的热点。

卷积神经网络（Convolutional Neural Network，CNN）是一种模仿人类视觉系统的深度学习算法，具有自动学习和特征提取的能力。通过对大量的肺部影像数据进行训练，CNN可以自动识别和提取肺部影像中的特征，从而实现对肺炎的自动诊断。

基于卷积神经网络的肺炎影像分类分割智能诊断系统具有以下几个方面的意义：

综上所述，基于卷积神经网络的肺炎影像分类分割智能诊断系统具有重要的研究意义和应用价值。通过提高肺炎诊断的准确性和效率，该系统可以为医生提供辅助决策的依据，促进医学研究和教育的发展，最终提高肺炎患者的治疗效果和生存质量。



class ImageClassifier:
    """Classify a single image with a model loaded through ``DetectMultiBackend``.

    The model, its class-name table and the target device are set up once in
    ``__init__``; ``classify`` then maps one image to ``(class_name, confidence)``.
    """

    def __init__(self, weights_path, data_path, img_size=(224, 224), device=''):
        """Load the model onto the selected device and warm it up.

        Args:
            weights_path: Passed to ``DetectMultiBackend`` as the weights to load.
            data_path: Passed to ``DetectMultiBackend`` as its ``data`` argument.
            img_size: ``(height, width)`` pair used to build the warm-up shape
                ``(1, 3, *img_size)`` and stored for callers.
            device: Device specifier handed to ``select_device``.
        """
        self.device = select_device(device)
        self.model = DetectMultiBackend(weights_path, device=self.device, data=data_path)
        self.names = self.model.names
        self.img_size = img_size
        self.model.warmup(imgsz=(1, 3, *img_size))

    def classify(self, image):
        """Return ``(class_name, confidence)`` for one image.

        Args:
            image: Array-like or tensor holding one image. A 3-D input gets a
                leading batch dimension added. A batch with more than one
                image is not supported: ``.item()`` raises on it.

        Returns:
            Tuple of ``self.names[index]`` for the highest-scoring class and
            its softmax probability as a Python ``float``.
        """
        image_tensor = torch.Tensor(image).to(self.device)
        image_tensor = image_tensor.float()
        if image_tensor.ndim == 3:
            image_tensor = image_tensor[None]  # add the batch dimension
        # Inference only: skip autograd bookkeeping so no graph is kept alive.
        with torch.no_grad():
            results = self.model(image_tensor)
            pred = F.softmax(results, dim=1)
        max_i = pred.argmax(dim=1).item()  # index of the highest-confidence class
        max_confidence = float(pred[0][max_i])  # probability of that class
        return self.names[max_i], max_confidence


def load_image(image_path, img_size):
    """Return element ``[1]`` of the first item yielded by ``LoadImages``.

    Args:
        image_path: Source path handed to ``LoadImages``.
        img_size: Size passed through as ``img_size``; its first entry is also
            given to ``classify_transforms``.
    """
    transforms = classify_transforms(img_size[0])
    loader = LoadImages(image_path, img_size=img_size, transforms=transforms)
    first_item = next(iter(loader))
    return first_item[1]

if __name__ == '__main__':
    # Demo run: build the classifier from the bundled weights and data config,
    # classify one test image and print the (class_name, confidence) pair.
    classifier = ImageClassifier('./best.pt', './data/coco128.yaml')
    image = load_image('./test/1.jpg', classifier.img_size)
    print(classifier.classify(image))

另外，还有一个辅助函数load_image(image_path, img_size)，用于加载图像并进行预处理。

在if __name__ == '__main__':部分，创建了一个ImageClassifier对象，加载图像并进行分类，最后打印结果。




def export_formats():
    """Return the table of YOLOv5 export formats as a pandas DataFrame.

    Each row holds the format name, its argument name, the file/directory
    suffix, and two booleans in the ``CPU`` and ``GPU`` columns.
    """
    columns = ['Format', 'Argument', 'Suffix', 'CPU', 'GPU']
    rows = [
        ('PyTorch', '-', '.pt', True, True),
        ('TorchScript', 'torchscript', '.torchscript', True, True),
        ('ONNX', 'onnx', '.onnx', True, True),
        ('OpenVINO', 'openvino', '_openvino_model', True, False),
        ('TensorRT', 'engine', '.engine', False, True),
        ('CoreML', 'coreml', '.mlmodel', True, False),
        ('TensorFlow SavedModel', 'saved_model', '_saved_model', True, True),
        ('TensorFlow GraphDef', 'pb', '.pb', True, True),
        ('TensorFlow Lite', 'tflite', '.tflite', True, False),
        ('TensorFlow Edge TPU', 'edgetpu', '_edgetpu.tflite', False, False),
        ('TensorFlow.js', 'tfjs', '_web_model', False, False),
        ('PaddlePaddle', 'paddle', '_paddle_model', True, True),
    ]
    return pd.DataFrame(rows, columns=columns)


def try_export(inner_func):
    """YOLOv5 export decorator, i.e. ``@try_export``.

    Wraps an export function that returns ``(f, model)`` so that it is timed
    with ``Profile``, its outcome is logged, and any exception is turned into
    a logged failure instead of propagating.

    Args:
        inner_func: Export function to wrap. It must declare a ``prefix``
            parameter with a default value; that default is used as the log
            prefix.

    Returns:
        A wrapper that returns ``inner_func``'s ``(f, model)`` on success and
        ``(None, None)`` if ``inner_func`` raised.
    """
    import functools  # local import: this file's import block is not visible here

    inner_args = get_default_args(inner_func)

    @functools.wraps(inner_func)  # keep the exporter's __name__/__doc__ on the wrapper
    def outer_func(*args, **kwargs):
        prefix = inner_args['prefix']
        try:
            with Profile() as dt:
                f, model = inner_func(*args, **kwargs)
            LOGGER.info(f'{prefix} export success ✅ {dt.t:.1f}s, saved as {f} ({file_size(f):.1f} MB)')
            return f, model
        except Exception as e:
            # Deliberate best-effort: one failed format must not abort the others.
            LOGGER.info(f'{prefix} export failure ❌ {dt.t:.1f}s: {e}')
            return None, None

    return outer_func


@try_export
def export_torchscript(model, im, file, optimize, prefix=colorstr('TorchScript:')):
    """Export ``model`` to TorchScript by tracing it with ``im``.

    Args:
        model: Model to trace; its ``stride`` and ``names`` are stored as metadata.
        im: Example input used for tracing; its shape is stored as metadata.
        file: Path-like object with ``with_suffix``; the output is written next
            to it with the ``.torchscript`` suffix.
        optimize: If truthy, run ``optimize_for_mobile`` and save for the lite
            interpreter; otherwise save the traced module directly.
        prefix: Log prefix; its default is also read by the ``try_export`` decorator.

    Returns:
        ``(f, None)`` where ``f`` is the output path. The ``try_export``
        wrapper returns ``(None, None)`` instead if the export raised.
    """
    # Leading newline separates this export's log output from the previous one.
    LOGGER.info(f'\n{prefix} starting export with torch {torch.__version__}...')
    f = file.with_suffix('.torchscript')

    ts = torch.jit.trace(model, im, strict=False)
    d = {'shape': im.shape, 'stride': int(max(model.stride)), 'names': model.names}
    extra_files = {'config.txt': json.dumps(d)}  # torch._C.ExtraFilesMap()
    if optimize:  # https://pytorch.org/tutorials/recipes/mobile_interpreter.html
        optimize_for_mobile(ts)._save_for_lite_interpreter(str(f), _extra_files=extra_files)
    else:
        ts.save(str(f), _extra_files=extra_files)
    return f, None


@try_export
def export_onnx(model, im, file, opset, dynamic, simplify, prefix=colorstr('ONNX:')):
    # YOLOv5 ONNX export
    check_requirements('onnx>=1.12.0')
    import onnx

    LOGGER.info(f'n{prefix} starting export with onnx {onnx.__version__}...')
    f = file.with_suffix('.onnx')

    output_names = ['output0', 'output1'] if isinstance(model, SegmentationModel) else ['output0']
    if dynamic:
        dynamic = {'images': {0: 'batch', 2: 'height', 3: 'width'}}  # shape(1,3,640,640)
        if isinstance(model, SegmentationModel):
            dynamic['output0'] = {0: 'batch', 1: 'anchors'}  # shape(1,25200,85)
            dynamic['output1'] = {0: 'batch', 2: 'mask_height', 3: 'mask_width'}  # shape(1,32,160,160)
        elif isinstance(model, DetectionModel):
            dynamic['output0'] = {0: 'batch', 1: 'anchors'}  # shape(1,25200,85)

    torch.onnx.export(
        model.cpu() if dynamic else model,  # --dynamic only compatible with cpu
        im.cpu() if dynamic else im,
        f,
        verbose=False,
        opset_version=opset,
        do_constant_folding=True,  # WARNING: DNN inference with torch>=1.12 may require do_constant_folding=False
        input_names=['images'],
        output_names=output_names,
        dynamic_axes=dynamic or None)

    # Checks
    model_onnx = onnx.load(f)  # load onnx model
    onnx.checker.check_model(model_onnx)  # check onnx model

    # Metadata
    d = {'stride': int(max(model.stride)), 'names': model.names}
    for k, v in d.items():
        meta = model_onnx.metadata_props.add()
        meta.key, meta.value = k, str(v)
    onnx.save(model_onnx, f)

    # Simplify
    if simplify:
        try:
            cuda = torch.cuda.is_available()
            check_requirements(('onnxruntime-gpu' if cuda else 'onnxruntime', 'onnx-simplifier>=0.4.1'))
            import onnxsim

            LOGGER.info(f'{prefix} simplifying with onnx-simplifier {onnxsim.__version__}...')
            model_onnx, check = onnxsim.simplify(model_onnx)
            ass



class ImageSegmentation:
    """Run a saved Keras model on a set of images and plot the predicted masks."""

    def __init__(self, image_path, model_path):
        """Store the glob pattern for input images and the path of the saved model."""
        self.model_path = model_path
        self.image_path = image_path

    def load_dataset(self):
        """Build a dataset of ``(path, path)`` pairs from the glob pattern.

        The same path list is used for both elements, so each image also
        stands in as its own annotation.
        """
        paths = glob.glob(self.image_path)
        pairs = tf.data.Dataset.from_tensor_slices((paths, paths))
        return pairs.take(len(paths))

    def read_jpg(self, path):
        """Read ``path`` and decode it with ``decode_jpeg`` using 3 channels."""
        return tf.image.decode_jpeg(tf.io.read_file(path), channels=3)

    def read_png(self, path):
        """Read ``path`` and decode it with ``decode_png`` using 1 channel."""
        return tf.image.decode_png(tf.io.read_file(path), channels=1)

    def normal_img(self, input_image, input_anno):
        """Scale the image by ``/ 127.5 - 1`` as float32 and subtract 1 from the annotation."""
        scaled_image = tf.cast(input_image, tf.float32) / 127.5 - 1
        input_anno -= 1
        return scaled_image, input_anno

    def load_images(self, input_images_path, input_anno_path):
        """Load one image/annotation pair, resize both to 224x224 and normalise."""
        target_size = (224, 224)
        resized_image = tf.image.resize(self.read_jpg(input_images_path), target_size)
        resized_anno = tf.image.resize(self.read_png(input_anno_path), target_size)
        return self.normal_img(resized_image, resized_anno)

    def set_config(self, data_train):
        """Map the loader over the dataset, then repeat, shuffle (buffer 100) and batch by 32."""
        batch_size = 32
        loaded = data_train.map(self.load_images, num_parallel_calls=tf.data.experimental.AUTOTUNE)
        return loaded.repeat().shuffle(100).batch(batch_size)

    def predict(self):
        """Predict on the first batch and show input, annotation and prediction side by side."""
        batches = self.set_config(self.load_dataset())
        new_model = tf.keras.models.load_model(self.model_path)
        to_img = tf.keras.preprocessing.image.array_to_img
        for image, mask in batches.take(1):
            raw_pred = new_model.predict(image)
            # Pick the highest-scoring index on the last axis, then restore that axis.
            pred_mask = tf.argmax(raw_pred, axis=-1)[..., tf.newaxis]

            print(np.unique(pred_mask[0].numpy()))
            plt.figure(figsize=(10, 10))
            panels = (image[0], mask[0], pred_mask[0])
            for slot, panel in enumerate(panels, start=1):
                plt.subplot(1, 3, slot)
                plt.imshow(to_img(panel))
            plt.show()



class ImageLoader:
    """Build paired image/annotation ``tf.data`` pipelines with an 80/20 train/test split."""

    def __init__(self, images_path, anno_path, batch_size):
        """Store the inputs; the datasets are only built by ``prepare_data``.

        Args:
            images_path: Glob pattern for the input images.
            anno_path: Glob pattern for the annotation images.
            batch_size: Batch size applied to both the train and test datasets.
        """
        self.images_path = images_path
        self.anno_path = anno_path
        self.batch_size = batch_size
        self.dataset = None
        self.train_count = None
        self.test_count = None
        self.data_train = None
        self.data_test = None

    def read_jpg(self, path):
        """Read ``path`` and decode it with ``decode_jpeg`` using 3 channels."""
        img = tf.io.read_file(path)
        img = tf.image.decode_jpeg(img, channels=3)
        return img

    def read_png(self, path):
        """Read ``path`` and decode it with ``decode_png`` using 1 channel."""
        img = tf.io.read_file(path)
        img = tf.image.decode_png(img, channels=1)
        return img

    def normal_img(self, input_image, input_anno):
        """Cast the image to float32 and scale it by ``/ 127.5 - 1``; the annotation is returned unchanged."""
        input_image = tf.cast(input_image, tf.float32)
        input_image = input_image / 127.5 - 1
        return input_image, input_anno

    def load_images(self, input_images_path, input_anno_path):
        """Load one image/annotation pair, resize both to 224x224 and normalise the image."""
        input_image = self.read_jpg(input_images_path)
        input_anno = self.read_png(input_anno_path)
        input_image = tf.image.resize(input_image, (224, 224))
        # NOTE(review): the annotation is resized with tf.image.resize's default
        # method; confirm that interpolated label values are acceptable here.
        input_anno = tf.image.resize(input_anno, (224, 224))
        return self.normal_img(input_image, input_anno)

    def prepare_data(self):
        """Glob, pair, shuffle and split the files, then build the train and test datasets.

        Raises:
            ValueError: If the two glob patterns match different numbers of files.
        """
        # glob returns matches in arbitrary order, so sort both listings before
        # pairing them by position. Assumes matching image/annotation files
        # sort into the same order -- TODO confirm against the dataset naming.
        images = sorted(glob.glob(self.images_path))
        anno = sorted(glob.glob(self.anno_path))
        if len(images) != len(anno):
            raise ValueError(
                f'Found {len(images)} images but {len(anno)} annotations; '
                'every image needs exactly one annotation.')
        np.random.seed(2019)  # fixed seed keeps the split reproducible
        index = np.random.permutation(len(images))
        images = np.array(images)[index]
        anno = np.array(anno)[index]
        dataset = tf.data.Dataset.from_tensor_slices((images, anno))
        test_count = int(len(images) * 0.2)
        train_count = len(images) - test_count
        # The first test_count pairs form the test set, the rest the train set.
        data_train = dataset.skip(test_count)
        data_test = dataset.take(test_count)
        data_train = data_train.map(self.load_images, num_parallel_calls=tf.data.experimental.AUTOTUNE)
        data_test = data_test.map(self.load_images, num_parallel_calls=tf.data.experimental.AUTOTUNE)
        data_train = data_train.repeat().shuffle(100).batch(self.batch_size)
        data_test = data_test.batch(self.batch_size)
        self.dataset = dataset
        self.train_count = train_count
        self.test_count = test_count
        self.data_train = data_train
        self.data_test = data_test
        ......



def load_dataset(image_path):
    """Build a dataset of ``(path, path)`` pairs from a glob pattern.

    The same path list fills both elements of each pair, so every image also
    stands in as its own annotation.
    """
    paths = glob.glob(image_path)
    pairs = tf.data.Dataset.from_tensor_slices((paths, paths))  # create the dataset
    return pairs.take(len(paths))

def read_jpg(path):
    """Read the file at ``path`` and decode it with ``decode_jpeg`` using 3 channels."""
    raw_bytes = tf.io.read_file(path)
    return tf.image.decode_jpeg(raw_bytes, channels=3)

def read_png(path):
    """Read the file at ``path`` and decode it with ``decode_png`` using 1 channel."""
    raw_bytes = tf.io.read_file(path)
    return tf.image.decode_png(raw_bytes, channels=1)

def normal_img(input_image, input_anno):
    """Normalise an image/annotation pair.

    The image is cast to float32 and scaled with ``x / 127.5 - 1``, which maps
    0..255 pixel values into [-1, 1]. The annotation has 1 subtracted from
    every value.
    """
    scaled_image = tf.cast(input_image, tf.float32) / 127.5 - 1
    input_anno -= 1  # shift the annotation values down by one
    return scaled_image, input_anno

def load_images(input_images_path, input_anno_path):
    """Load one image/annotation pair, resize both to 224x224 and normalise them."""
    target_size = (224, 224)  # every sample is brought to this common size
    resized_image = tf.image.resize(read_jpg(input_images_path), target_size)
    resized_anno = tf.image.resize(read_png(input_anno_path), target_size)
    return normal_img(resized_image, resized_anno)

def set_config(data_train):
    """Map ``load_images`` over the dataset, then repeat, shuffle and batch it."""
    batch_size = 32
    # AUTOTUNE lets tf.data choose the number of parallel map calls.
    loaded = data_train.map(load_images, num_parallel_calls=tf.data.experimental.AUTOTUNE)
    # Repeat indefinitely, shuffle with a buffer of 100, then batch.
    return loaded.repeat().shuffle(100).batch(batch_size)

def seg(info1):
    """Segment the images matched by ``info1`` and save the first predicted mask.

    Args:
        info1: Glob pattern of the images to predict on (note the ``*`` in it).

    Side effects:
        Resets the module-level ``area1`` to 0, prints the unique values of
        the first predicted mask, draws a 1x3 matplotlib figure (input,
        annotation, prediction) and writes the prediction to ``./seg.jpg``.
    """
    global area1, area2
    area1 = 0
    check_version()  # check the versions of the main environment packages
    batches = set_config(load_dataset(info1))  # load the dataset, then configure it
    new_model = tf.keras.models.load_model('./train/fei.h5')  # load the full saved model
    to_img = tf.keras.preprocessing.image.array_to_img
    # Everything below is plotting; only the first batch is used.
    for image, mask in batches.take(1):
        raw_pred = new_model.predict(image)
        pred_mask = tf.argmax(raw_pred, axis=-1)[..., tf.newaxis]

        print(np.unique(pred_mask[0].numpy()))
        plt.figure(figsize=(10, 10))
        panels = (image[0], mask[0], pred_mask[0])
        for slot, panel in enumerate(panels, start=1):
            plt.subplot(1, 3, slot)
            plt.imshow(to_img(panel))
        plt.imsave('./seg.jpg', to_img(pred_mask[0]))
        break



class Conv(nn.Module):
    """Standard convolution block: Conv2d (no bias) -> BatchNorm2d -> activation.

    Args are (ch_in, ch_out, kernel, stride, padding, groups, dilation, activation).
    """

    default_act = nn.SiLU()  # activation used when ``act`` is True

    def __init__(self, c1, c2, k=1, s=1, p=None, g=1, d=1, act=True):
        super().__init__()
        padding = autopad(k, p, d)
        self.conv = nn.Conv2d(c1, c2, k, s, padding, groups=g, dilation=d, bias=False)
        self.bn = nn.BatchNorm2d(c2)
        # act=True -> shared default; an nn.Module -> used as given; anything else -> identity.
        if act is True:
            self.act = self.default_act
        elif isinstance(act, nn.Module):
            self.act = act
        else:
            self.act = nn.Identity()

    def forward(self, x):
        """Apply convolution, batch norm and activation in that order."""
        y = self.conv(x)
        y = self.bn(y)
        return self.act(y)

    def forward_fuse(self, x):
        """Apply convolution and activation only, skipping the batch norm layer."""
        y = self.conv(x)
        return self.act(y)


class DWConv(Conv):
    """Depth-wise convolution: a ``Conv`` whose group count is ``gcd(ch_in, ch_out)``."""

    def __init__(self, c1, c2, k=1, s=1, d=1, act=True):  # ch_in, ch_out, kernel, stride, dilation, activation
        groups = math.gcd(c1, c2)
        super().__init__(c1, c2, k, s, g=groups, d=d, act=act)


class DWConvTranspose2d(nn.ConvTranspose2d):
    """Depth-wise transpose convolution: ``ConvTranspose2d`` with ``gcd(ch_in, ch_out)`` groups."""

    def __init__(self, c1, c2, k=1, s=1, p1=0, p2=0):  # ch_in, ch_out, kernel, stride, padding, padding_out
        groups = math.gcd(c1, c2)
        super().__init__(c1, c2, k, s, p1, p2, groups=groups)


class Focus(nn.Module):
    """Focus wh information into c-space.

    The last two axes are sampled at stride 2 with four different offsets, the
    four samples are concatenated along dim 1, and the result goes through a
    ``Conv`` expecting ``4 * c1`` input channels.
    """

    def __init__(self, c1, c2, k=1, s=1, p=None, g=1, act=True):  # ch_in, ch_out, kernel, stride, padding, groups
        super().__init__()
        self.conv = Conv(c1 * 4, c2, k, s, p, g, act=act)

    def forward(self, x):  # x(b,c,w,h) -> y(b,4c,w/2,h/2)
        even, odd = slice(None, None, 2), slice(1, None, 2)
        # Same patch order as the channel layout the conv was built for.
        patches = (
            x[..., even, even],
            x[..., odd, even],
            x[..., even, odd],
            x[..., odd, odd],
        )
        return self.conv(torch.cat(patches, 1))

class Bottleneck(nn.Module):
    # Standard bottleneck
    def __init__(self, c1, c2, shortcut=True, g=1, e=0.5):  # ch_in, ch_out, shortcut, groups, expansion
        super().__init__()
        c_ = int(c2 * e)  # hidden channels
        self.cv1 = Conv(c1, c_, 1, 1)
        self.cv2 = Conv(c_, c2, 3, 1, g=g)
        self.add = shortcut and c1 == c2

    def forward(self, x):
        return x + self.cv2(self.cv1

文件路径	功能
Classifier.py	实现图像分类功能
export.py	实现模型导出功能
predict.py	实现图像分割功能
train.py	实现模型训练功能
ui.py	实现用户界面功能
models/common.py	包含常用的模型类和函数
models/experimental.py	包含实验性的模型类和函数
models/tf.py	包含TensorFlow相关的模型类和函数
models/yolo.py	包含YOLOv5模型类和函数
models/__init__.py	模型模块的初始化文件
tools/check_img.py	图像检查工具
tools/check_seg.py	分割结果检查工具
tools/url_get.py	从URL获取图像的工具
utils/activations.py	激活函数相关的工具函数
utils/augmentations.py	数据增强相关的工具函数
utils/autoanchor.py	自动锚框生成的工具函数
utils/autobatch.py	自动批量大小调整的工具函数
utils/callbacks.py	回调函数相关的工具函数
utils/dataloaders.py	数据加载器相关的工具函数
utils/downloads.py	下载相关的工具函数
utils/general.py	通用的工具函数
utils/loss.py	损失函数相关的工具函数
utils/metrics.py	评估指标相关的工具函数
utils/plots.py	绘图相关的工具函数
utils/torch_utils.py	PyTorch相关的工具函数
utils/triton.py	Triton相关的工具函数
utils/__init__.py	工具模块的初始化文件
utils/aws/resume.py	AWS相关的工具函数
utils/aws/__init__.py	AWS模块的初始化文件
utils/flask_rest_api/example_request.py	Flask REST API示例请求的工具函数
utils/flask_rest_api/restapi.py	Flask REST API的工具函数
utils/loggers/__init__.py	日志记录器模块的初始化文件
utils/loggers/clearml/clearml_utils.py	ClearML日志记录器的工具函数
utils/loggers/clearml/hpo.py	ClearML日志记录器的超参数优化工具函数
utils/loggers/clearml/__init__.py	ClearML日志记录器模块的初始化文件
utils/loggers/comet/comet_utils.py	Comet日志记录器的工具函数
utils/loggers/comet/hpo.py	Comet日志记录器的超参数优化工具函数
utils/loggers/comet/__init__.py	Comet日志记录器模块的初始化文件
utils/loggers/wandb/wandb_utils.py	WandB日志记录器的工具函数
utils/loggers/wandb/__init__.py	WandB日志记录器模块的初始化文件
utils/segment/augmentations.py	分割数据增强相关的工具函数
utils/segment/dataloaders.py	分割数据加载器相关的工具函数
utils/segment/general.py	分割通用的工具函数
utils/segment/loss.py	分割损失函数相关的工具函数
utils/segment/metrics.py	分割评估指标相关的工具函数
utils/segment/plots.py	分割绘图相关的工具函数
utils/segment/__init__.py	分割模块的初始化文件