Upload folder using huggingface_hub

Browse files

Files changed (12) hide show

example_input_file/CBCT_01.h5 +3 -0
example_input_file/CBCT_02.h5 +3 -0
example_input_file/CBCT_03.h5 +3 -0
example_input_file/CBCT_04.h5 +3 -0
gradio_app.py +117 -0
model weights/rail_0_iter_7995_best.pth +3 -0
model weights/rail_1_iter_7995_best.pth +3 -0
model weights/rail_2_iter_7995_best.pth +3 -0
model weights/rail_3_iter_7995_best.pth +3 -0
model weights/roi_best_model.pth +3 -0
model.safetensors +1 -1
railnet_model.py +924 -0

example_input_file/CBCT_01.h5 ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:19680f9f0b220ee20b55731f386276d3c00496ae861ed3ecedc759d6ec2b8a42
+size 716802048

example_input_file/CBCT_02.h5 ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:ed421541ed92ab7c203aa8edbfde743d139fef000264a8279353a08087f5735f
+size 716802048

example_input_file/CBCT_03.h5 ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:4beb84cb31420c30aeb992345192b8bc8e798542f502b4d7d48c6b1060bda8ae
+size 716802048

example_input_file/CBCT_04.h5 ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:ecfd0c239381a72acecf48de3f309c4a79267f27cfbce00b4f126a8b35fc7a81
+size 839682048

gradio_app.py ADDED Viewed

	@@ -0,0 +1,117 @@

+import os
+import time
+import h5py
+import numpy as np
+import gradio as gr
+import plotly.graph_objects as go
+from railnet_model import RailNetSystem
+os.environ['KMP_DUPLICATE_LIB_OK'] = 'True'
+os.environ["CUDA_VISIBLE_DEVICES"] = "0"
+model = RailNetSystem.from_pretrained(".").cuda()
+model.load_weights(".")
+def wait_for_stable_file(file_path, timeout=5, check_interval=0.2):
+    start_time = time.time()
+    last_size = -1
+    while time.time() - start_time < timeout:
+        current_size = os.path.getsize(file_path)
+        if current_size == last_size:
+            return True
+        last_size = current_size
+        time.sleep(check_interval)
+    return False
+def process_cbct_file(h5_file, save_dir="./output"):
+    if not wait_for_stable_file(h5_file.name):
+        raise RuntimeError("File upload has not been completed or is unstable, please try again.")
+    try:
+        with h5py.File(h5_file.name, "r") as f:
+            if "image" not in f or "label" not in f:
+                raise KeyError("The file is missing ‘image’ or ‘label’ value")
+            image = f["image"][:]
+            label = f["label"][:]
+    except Exception as e:
+        raise RuntimeError(f"Failed to read the .h5 file: {str(e)}")
+    name = os.path.basename(h5_file.name).replace(".h5", "")
+    pred, dice, jc, hd, asd = model(image, label, save_dir, name)
+    return pred, f"Dice: {dice:.4f}, Jaccard: {jc:.4f}, 95HD: {hd:.2f}, ASD: {asd:.2f}"
+def render_plotly_volume(pred, x_eye=1.25, y_eye=1.25, z_eye=1.25):
+    downsample_factor = 2
+    pred_ds = pred[::downsample_factor, ::downsample_factor, ::downsample_factor]
+    fig = go.Figure(data=go.Volume(
+        x=np.repeat(np.arange(pred_ds.shape[0]), pred_ds.shape[1] * pred_ds.shape[2]),
+        y=np.tile(np.repeat(np.arange(pred_ds.shape[1]), pred_ds.shape[2]), pred_ds.shape[0]),
+        z=np.tile(np.arange(pred_ds.shape[2]), pred_ds.shape[0] * pred_ds.shape[1]),
+        value=pred_ds.flatten(),
+        isomin=0.5,
+        isomax=1.0,
+        opacity=0.1,
+        surface_count=1,
+        colorscale=[[0, 'rgb(255, 0, 0)'], [1, 'rgb(255, 0, 0)']],
+        showscale=False
+    ))
+    fig.update_layout(
+        scene=dict(
+            xaxis=dict(visible=False),
+            yaxis=dict(visible=False),
+            zaxis=dict(visible=False),
+            camera=dict(eye=dict(x=x_eye, y=y_eye, z=z_eye))
+        ),
+        margin=dict(l=0, r=0, b=0, t=0)
+    )
+    return fig
+def clear_all():
+    return None, "", None
+with gr.Blocks() as demo:
+    gr.Markdown("<div style='text-align: center; font-size: 28px; font-weight: bold;'>🦷 Demo of RailNet: A CBCT Tooth Segmentation System</div>")
+    gr.Markdown("<div style='text-align: center; font-size: 20px'>✅ Steps: Upload a CBCT example file (.h5)  →  Automatic inference and metrics display  →  View 3D segmentation result (Mouse drag and scroll wheel zooming)</div>")
+    gr.Markdown("<div style='height: 20px;'></div>")
+    gr.Markdown("<div style='font-size: 20px; font-weight: bold;'>📂 Step 1: Upload the .h5 example file containing both ‘image’ and ‘label’ values</div>")
+    file_input = gr.File()
+    with gr.Row():
+        clear_btn = gr.Button("清除", variant="secondary")
+        submit_btn = gr.Button("提交", variant="primary")
+    gr.Markdown("<div style='height: 20px;'></div>")
+    gr.Markdown("<div style='font-size: 20px; font-weight: bold;'>📊 Step 2: Metrics (Dice, Jaccard, 95HD, ASD)</div>")
+    result_text = gr.Textbox()
+    hidden_pred = gr.State(value=None)
+    gr.Markdown("<div style='height: 20px;'></div>")
+    gr.Markdown("<div style='font-size: 20px; font-weight: bold;'>👁️ Step 3: 3D Visualisation</div>")
+    plot_output = gr.Plot()
+    def handle_upload(h5_file):
+        pred, metrics = process_cbct_file(h5_file)
+        fig = render_plotly_volume(pred)
+        return metrics, pred, fig
+    submit_btn.click(
+        fn=handle_upload,
+        inputs=[file_input],
+        outputs=[result_text, hidden_pred, plot_output]
+    )
+    def update_view(pred, x_eye, y_eye, z_eye):
+        if pred is None:
+            return gr.update()
+        return render_plotly_volume(pred, x_eye, y_eye, z_eye)
+    clear_btn.click(
+        fn=clear_all,
+        inputs=[],
+        outputs=[file_input, result_text, plot_output]
+    )
+demo.launch()

model weights/rail_0_iter_7995_best.pth ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:9085f5b56d7598efa06a17c09fe4a922feca7039faea329f3b5d3dba4e7479d3
+size 37890229

model weights/rail_1_iter_7995_best.pth ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:66a4b9ba3314ff6421db1d2ddebdccc6aecd76477c599decbe2da82eeede2857
+size 37890229

model weights/rail_2_iter_7995_best.pth ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:ef122d5b0770a92f81c49597daf9205255698f947f11fb39d371cfb1b9fb4359
+size 101339695

model weights/rail_3_iter_7995_best.pth ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:01e9210704169266994ebb5f468b323b262c9cbce968b35dc9a74665ae0bf85d
+size 101339695

model weights/roi_best_model.pth ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:629e02002b680e44bffab99bc5d469502045a24d0347e561f471753738a3ae57
+size 37889184

model.safetensors CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:76d4d74def12d6df1e6e1a4ff1fc92818eba6485bd11129eed89f9f97e018c94
 size 37839024

 version https://git-lfs.github.com/spec/v1
+oid sha256:20c9bfd0d3bdbea2411f8c92139f7774f658e4a5d72d2277adac7e2ef368a38a
 size 37839024

railnet_model.py ADDED Viewed

	@@ -0,0 +1,924 @@

+import os
+os.environ['KMP_DUPLICATE_LIB_OK']='True'
+os.environ["CUDA_VISIBLE_DEVICES"] = "0"
+import torch
+import torch.nn as nn
+import torch.nn.functional as F
+from huggingface_hub import PyTorchModelHubMixin
+import numpy as np
+import nibabel as nib
+from skimage import morphology
+import math
+from scipy import ndimage
+from medpy import metric
+import h5py
+from tqdm import tqdm
+class ConvBlock(nn.Module):
+    def __init__(self, n_stages, n_filters_in, n_filters_out, normalization='none'):
+        super(ConvBlock, self).__init__()
+        ops = []
+        for i in range(n_stages):
+            if i == 0:
+                input_channel = n_filters_in
+            else:
+                input_channel = n_filters_out
+            ops.append(nn.Conv3d(input_channel, n_filters_out, 3, padding=1))
+            if normalization == 'batchnorm':
+                ops.append(nn.BatchNorm3d(n_filters_out))
+            elif normalization == 'groupnorm':
+                ops.append(nn.GroupNorm(num_groups=16, num_channels=n_filters_out))
+            elif normalization == 'instancenorm':
+                ops.append(nn.InstanceNorm3d(n_filters_out))
+            elif normalization != 'none':
+                assert False
+            ops.append(nn.ReLU(inplace=True))
+        self.conv = nn.Sequential(*ops)
+    def forward(self, x):
+        x = self.conv(x)
+        return x
+class DownsamplingConvBlock(nn.Module):
+    def __init__(self, n_filters_in, n_filters_out, stride=2, normalization='none'):
+        super(DownsamplingConvBlock, self).__init__()
+        ops = []
+        if normalization != 'none':
+            ops.append(nn.Conv3d(n_filters_in, n_filters_out, stride, padding=0, stride=stride))
+            if normalization == 'batchnorm':
+                ops.append(nn.BatchNorm3d(n_filters_out))
+            elif normalization == 'groupnorm':
+                ops.append(nn.GroupNorm(num_groups=16, num_channels=n_filters_out))
+            elif normalization == 'instancenorm':
+                ops.append(nn.InstanceNorm3d(n_filters_out))
+            else:
+                assert False
+        else:
+            ops.append(nn.Conv3d(n_filters_in, n_filters_out, stride, padding=0, stride=stride))
+        ops.append(nn.ReLU(inplace=True))
+        self.conv = nn.Sequential(*ops)
+    def forward(self, x):
+        x = self.conv(x)
+        return x
+class UpsamplingDeconvBlock(nn.Module):
+    def __init__(self, n_filters_in, n_filters_out, stride=2, normalization='none'):
+        super(UpsamplingDeconvBlock, self).__init__()
+        ops = []
+        if normalization != 'none':
+            ops.append(nn.ConvTranspose3d(n_filters_in, n_filters_out, stride, padding=0, stride=stride))
+            if normalization == 'batchnorm':
+                ops.append(nn.BatchNorm3d(n_filters_out))
+            elif normalization == 'groupnorm':
+                ops.append(nn.GroupNorm(num_groups=16, num_channels=n_filters_out))
+            elif normalization == 'instancenorm':
+                ops.append(nn.InstanceNorm3d(n_filters_out))
+            else:
+                assert False
+        else:
+            ops.append(nn.ConvTranspose3d(n_filters_in, n_filters_out, stride, padding=0, stride=stride))
+        ops.append(nn.ReLU(inplace=True))
+        self.conv = nn.Sequential(*ops)
+    def forward(self, x):
+        x = self.conv(x)
+        return x
+class Upsampling(nn.Module):
+    def __init__(self, n_filters_in, n_filters_out, stride=2, normalization='none'):
+        super(Upsampling, self).__init__()
+        ops = []
+        ops.append(nn.Upsample(scale_factor=stride, mode='trilinear', align_corners=False))
+        ops.append(nn.Conv3d(n_filters_in, n_filters_out, kernel_size=3, padding=1))
+        if normalization == 'batchnorm':
+            ops.append(nn.BatchNorm3d(n_filters_out))
+        elif normalization == 'groupnorm':
+            ops.append(nn.GroupNorm(num_groups=16, num_channels=n_filters_out))
+        elif normalization == 'instancenorm':
+            ops.append(nn.InstanceNorm3d(n_filters_out))
+        elif normalization != 'none':
+            assert False
+        ops.append(nn.ReLU(inplace=True))
+        self.conv = nn.Sequential(*ops)
+    def forward(self, x):
+        x = self.conv(x)
+        return x
+class ConnectNet(nn.Module):
+    def __init__(self, in_channels, out_channels, input_size):
+        super(ConnectNet, self).__init__()
+        self.encoder = nn.Sequential(
+            nn.Conv3d(in_channels, 128, kernel_size=3, stride=1, padding=1),
+            nn.ReLU(),
+            nn.MaxPool3d(kernel_size=2, stride=2),
+            nn.Conv3d(128, 64, kernel_size=3, stride=1, padding=1),
+            nn.ReLU(),
+            nn.MaxPool3d(kernel_size=2, stride=2)
+        )
+        self.decoder = nn.Sequential(
+            nn.ConvTranspose3d(64, 128, kernel_size=2, stride=2),
+            nn.ReLU(),
+            nn.ConvTranspose3d(128, out_channels, kernel_size=2, stride=2),
+            nn.Sigmoid()
+        )
+    def forward(self, x):
+        encoded = self.encoder(x)
+        decoded = self.decoder(encoded)
+        return decoded
+class VNet(nn.Module):
+    def __init__(self, n_channels=3, n_classes=2, n_filters=16, normalization='none', has_dropout=False):
+        super(VNet, self).__init__()
+        self.has_dropout = has_dropout
+        self.block_one = ConvBlock(1, n_channels, n_filters, normalization=normalization)
+        self.block_one_dw = DownsamplingConvBlock(n_filters, 2 * n_filters, normalization=normalization)
+        self.block_two = ConvBlock(2, n_filters * 2, n_filters * 2, normalization=normalization)
+        self.block_two_dw = DownsamplingConvBlock(n_filters * 2, n_filters * 4, normalization=normalization)
+        self.block_three = ConvBlock(3, n_filters * 4, n_filters * 4, normalization=normalization)
+        self.block_three_dw = DownsamplingConvBlock(n_filters * 4, n_filters * 8, normalization=normalization)
+        self.block_four = ConvBlock(3, n_filters * 8, n_filters * 8, normalization=normalization)
+        self.block_four_dw = DownsamplingConvBlock(n_filters * 8, n_filters * 16, normalization=normalization)
+        self.block_five = ConvBlock(3, n_filters * 16, n_filters * 16, normalization=normalization)
+        self.block_five_up = UpsamplingDeconvBlock(n_filters * 16, n_filters * 8, normalization=normalization)
+        self.block_six = ConvBlock(3, n_filters * 8, n_filters * 8, normalization=normalization)
+        self.block_six_up = UpsamplingDeconvBlock(n_filters * 8, n_filters * 4, normalization=normalization)
+        self.block_seven = ConvBlock(3, n_filters * 4, n_filters * 4, normalization=normalization)
+        self.block_seven_up = UpsamplingDeconvBlock(n_filters * 4, n_filters * 2, normalization=normalization)
+        self.block_eight = ConvBlock(2, n_filters * 2, n_filters * 2, normalization=normalization)
+        self.block_eight_up = UpsamplingDeconvBlock(n_filters * 2, n_filters, normalization=normalization)
+        self.block_nine = ConvBlock(1, n_filters, n_filters, normalization=normalization)
+        self.out_conv = nn.Conv3d(n_filters, n_classes, 1, padding=0)
+        self.dropout = nn.Dropout3d(p=0.5, inplace=False)
+        self.__init_weight()
+    def encoder(self, input):
+        x1 = self.block_one(input)
+        x1_dw = self.block_one_dw(x1)
+        x2 = self.block_two(x1_dw)
+        x2_dw = self.block_two_dw(x2)
+        x3 = self.block_three(x2_dw)
+        x3_dw = self.block_three_dw(x3)
+        x4 = self.block_four(x3_dw)
+        x4_dw = self.block_four_dw(x4)
+        x5 = self.block_five(x4_dw)
+        if self.has_dropout:
+            x5 = self.dropout(x5)
+        res = [x1, x2, x3, x4, x5]
+        return res
+    def decoder(self, features):
+        x1 = features[0]
+        x2 = features[1]
+        x3 = features[2]
+        x4 = features[3]
+        x5 = features[4]
+        x5_up = self.block_five_up(x5)
+        x5_up = x5_up + x4
+        x6 = self.block_six(x5_up)
+        x6_up = self.block_six_up(x6)
+        x6_up = x6_up + x3
+        x7 = self.block_seven(x6_up)
+        x7_up = self.block_seven_up(x7)
+        x7_up = x7_up + x2
+        x8 = self.block_eight(x7_up)
+        x8_up = self.block_eight_up(x8)
+        x8_up = x8_up + x1
+        x9 = self.block_nine(x8_up)
+        if self.has_dropout:
+            x9 = self.dropout(x9)
+        out = self.out_conv(x9)
+        return out
+    def forward(self, input, turnoff_drop=False):
+        if turnoff_drop:
+            has_dropout = self.has_dropout
+            self.has_dropout = False
+        features = self.encoder(input)
+        out = self.decoder(features)
+        if turnoff_drop:
+            self.has_dropout = has_dropout
+        return out
+    def __init_weight(self):
+        for m in self.modules():
+            if isinstance(m, nn.Conv3d) or isinstance(m, nn.ConvTranspose3d):
+                torch.nn.init.kaiming_normal_(m.weight)
+            elif isinstance(m, nn.BatchNorm3d):
+                m.weight.data.fill_(1)
+                m.bias.data.zero_()
+class VNet_roi(nn.Module):
+    def __init__(self, n_channels=3, n_classes=2, n_filters=16, normalization='none', has_dropout=False):
+        super(VNet_roi, self).__init__()
+        self.has_dropout = has_dropout
+        self.block_one = ConvBlock(1, n_channels, n_filters, normalization=normalization)
+        self.block_one_dw = DownsamplingConvBlock(n_filters, 2 * n_filters, normalization=normalization)
+        self.block_two = ConvBlock(2, n_filters * 2, n_filters * 2, normalization=normalization)
+        self.block_two_dw = DownsamplingConvBlock(n_filters * 2, n_filters * 4, normalization=normalization)
+        self.block_three = ConvBlock(3, n_filters * 4, n_filters * 4, normalization=normalization)
+        self.block_three_dw = DownsamplingConvBlock(n_filters * 4, n_filters * 8, normalization=normalization)
+        self.block_four = ConvBlock(3, n_filters * 8, n_filters * 8, normalization=normalization)
+        self.block_four_dw = DownsamplingConvBlock(n_filters * 8, n_filters * 16, normalization=normalization)
+        self.block_five = ConvBlock(3, n_filters * 16, n_filters * 16, normalization=normalization)
+        self.block_five_up = UpsamplingDeconvBlock(n_filters * 16, n_filters * 8, normalization=normalization)
+        self.block_six = ConvBlock(3, n_filters * 8, n_filters * 8, normalization=normalization)
+        self.block_six_up = UpsamplingDeconvBlock(n_filters * 8, n_filters * 4, normalization=normalization)
+        self.block_seven = ConvBlock(3, n_filters * 4, n_filters * 4, normalization=normalization)
+        self.block_seven_up = UpsamplingDeconvBlock(n_filters * 4, n_filters * 2, normalization=normalization)
+        self.block_eight = ConvBlock(2, n_filters * 2, n_filters * 2, normalization=normalization)
+        self.block_eight_up = UpsamplingDeconvBlock(n_filters * 2, n_filters, normalization=normalization)
+        self.block_nine = ConvBlock(1, n_filters, n_filters, normalization=normalization)
+        self.out_conv = nn.Conv3d(n_filters, n_classes, 1, padding=0)
+        self.dropout = nn.Dropout3d(p=0.5, inplace=False)
+        # self.__init_weight()
+    def encoder(self, input):
+        x1 = self.block_one(input)
+        x1_dw = self.block_one_dw(x1)
+        x2 = self.block_two(x1_dw)
+        x2_dw = self.block_two_dw(x2)
+        x3 = self.block_three(x2_dw)
+        x3_dw = self.block_three_dw(x3)
+        x4 = self.block_four(x3_dw)
+        x4_dw = self.block_four_dw(x4)
+        x5 = self.block_five(x4_dw)
+        # x5 = F.dropout3d(x5, p=0.5, training=True)
+        if self.has_dropout:
+            x5 = self.dropout(x5)
+        res = [x1, x2, x3, x4, x5]
+        return res
+    def decoder(self, features):
+        x1 = features[0]
+        x2 = features[1]
+        x3 = features[2]
+        x4 = features[3]
+        x5 = features[4]
+        x5_up = self.block_five_up(x5)
+        x5_up = x5_up + x4
+        x6 = self.block_six(x5_up)
+        x6_up = self.block_six_up(x6)
+        x6_up = x6_up + x3
+        x7 = self.block_seven(x6_up)
+        x7_up = self.block_seven_up(x7)
+        x7_up = x7_up + x2
+        x8 = self.block_eight(x7_up)
+        x8_up = self.block_eight_up(x8)
+        x8_up = x8_up + x1
+        x9 = self.block_nine(x8_up)
+        # x9 = F.dropout3d(x9, p=0.5, training=True)
+        if self.has_dropout:
+            x9 = self.dropout(x9)
+        out = self.out_conv(x9)
+        return out
+    def forward(self, input, turnoff_drop=False):
+        if turnoff_drop:
+            has_dropout = self.has_dropout
+            self.has_dropout = False
+        features = self.encoder(input)
+        out = self.decoder(features)
+        if turnoff_drop:
+            self.has_dropout = has_dropout
+        return out
+class ResVNet(nn.Module):
+    def __init__(self, n_channels=1, n_classes=2, n_filters=16, normalization='instancenorm', has_dropout=False):
+        super(ResVNet, self).__init__()
+        self.resencoder = resnet34()
+        self.has_dropout = has_dropout
+        self.block_one = ConvBlock(1, n_channels, n_filters, normalization=normalization)
+        self.block_one_dw = DownsamplingConvBlock(n_filters, 2 * n_filters, normalization=normalization)
+        self.block_two = ConvBlock(2, n_filters * 2, n_filters * 2, normalization=normalization)
+        self.block_two_dw = DownsamplingConvBlock(n_filters * 2, n_filters * 4, normalization=normalization)
+        self.block_three = ConvBlock(3, n_filters * 4, n_filters * 4, normalization=normalization)
+        self.block_three_dw = DownsamplingConvBlock(n_filters * 4, n_filters * 8, normalization=normalization)
+        self.block_four = ConvBlock(3, n_filters * 8, n_filters * 8, normalization=normalization)
+        self.block_four_dw = DownsamplingConvBlock(n_filters * 8, n_filters * 16, normalization=normalization)
+        self.block_five = ConvBlock(3, n_filters * 16, n_filters * 16, normalization=normalization)
+        self.block_five_up = UpsamplingDeconvBlock(n_filters * 16, n_filters * 8, normalization=normalization)
+        self.block_six = ConvBlock(3, n_filters * 8, n_filters * 8, normalization=normalization)
+        self.block_six_up = UpsamplingDeconvBlock(n_filters * 8, n_filters * 4, normalization=normalization)
+        self.block_seven = ConvBlock(3, n_filters * 4, n_filters * 4, normalization=normalization)
+        self.block_seven_up = UpsamplingDeconvBlock(n_filters * 4, n_filters * 2, normalization=normalization)
+        self.block_eight = ConvBlock(2, n_filters * 2, n_filters * 2, normalization=normalization)
+        self.block_eight_up = UpsamplingDeconvBlock(n_filters * 2, n_filters, normalization=normalization)
+        self.block_nine = ConvBlock(1, n_filters, n_filters, normalization=normalization)
+        self.out_conv = nn.Conv3d(n_filters, n_classes, 1, padding=0)
+        if has_dropout:
+            self.dropout = nn.Dropout3d(p=0.5)
+        self.branchs = nn.ModuleList()
+        for i in range(1):
+            if has_dropout:
+                seq = nn.Sequential(
+                    ConvBlock(1, n_filters, n_filters, normalization=normalization),
+                    nn.Dropout3d(p=0.5),
+                    nn.Conv3d(n_filters, n_classes, 1, padding=0)
+                )
+            else:
+                seq = nn.Sequential(
+                    ConvBlock(1, n_filters, n_filters, normalization=normalization),
+                    nn.Conv3d(n_filters, n_classes, 1, padding=0)
+                )
+            self.branchs.append(seq)
+    def encoder(self, input):
+        x1 = self.block_one(input)
+        x1_dw = self.block_one_dw(x1)
+        x2 = self.block_two(x1_dw)
+        x2_dw = self.block_two_dw(x2)
+        x3 = self.block_three(x2_dw)
+        x3_dw = self.block_three_dw(x3)
+        x4 = self.block_four(x3_dw)
+        x4_dw = self.block_four_dw(x4)
+        x5 = self.block_five(x4_dw)
+        if self.has_dropout:
+            x5 = self.dropout(x5)
+        res = [x1, x2, x3, x4, x5]
+        return res
+    def decoder(self, features):
+        x1 = features[0]
+        x2 = features[1]
+        x3 = features[2]
+        x4 = features[3]
+        x5 = features[4]
+        x5_up = self.block_five_up(x5)
+        x5_up = x5_up + x4
+        x6 = self.block_six(x5_up)
+        x6_up = self.block_six_up(x6)
+        x6_up = x6_up + x3
+        x7 = self.block_seven(x6_up)
+        x7_up = self.block_seven_up(x7)
+        x7_up = x7_up + x2
+        x8 = self.block_eight(x7_up)
+        x8_up = self.block_eight_up(x8)
+        x8_up = x8_up + x1
+        x9 = self.block_nine(x8_up)
+        out = self.out_conv(x9)
+        return out
+    def forward(self, input, turnoff_drop=False):
+        if turnoff_drop:
+            has_dropout = self.has_dropout
+            self.has_dropout = False
+        features = self.resencoder(input)
+        out = self.decoder(features)
+        if turnoff_drop:
+            self.has_dropout = has_dropout
+        return out
+__all__ = ['ResNet',  'resnet34']
+def conv3x3(in_planes, out_planes, stride=1):
+    """3x3 convolution with padding"""
+    return nn.Conv3d(in_planes, out_planes, kernel_size=3, stride=stride, padding=1, bias=False)
+def conv3x3_bn_relu(in_planes, out_planes, stride=1):
+    return nn.Sequential(
+        conv3x3(in_planes, out_planes, stride),
+        nn.InstanceNorm3d(out_planes),
+        nn.ReLU()
+    )
+class BasicBlock(nn.Module):
+    expansion = 1
+    def __init__(self, inplanes, planes, stride=1, downsample=None,
+                 groups=1, base_width=64, dilation=-1):
+        super(BasicBlock, self).__init__()
+        if groups != 1 or base_width != 64:
+            raise ValueError('BasicBlock only supports groups=1 and base_width=64')
+        self.conv1 = conv3x3(inplanes, planes, stride)
+        self.bn1 = nn.InstanceNorm3d(planes)
+        self.relu = nn.ReLU(inplace=True)
+        self.conv2 = conv3x3(planes, planes)
+        self.bn2 = nn.InstanceNorm3d(planes)
+        self.downsample = downsample
+        self.stride = stride
+    def forward(self, x):
+        residual = x
+        out = self.conv1(x)
+        out = self.bn1(out)
+        out = self.relu(out)
+        out = self.conv2(out)
+        out = self.bn2(out)
+        if self.downsample is not None:
+            residual = self.downsample(x)
+        out += residual
+        out = self.relu(out)
+        return out
+class Bottleneck(nn.Module):
+    expansion = 4
+    def __init__(self, inplanes, planes, stride=1, downsample=None,
+                 groups=1, base_width=64, dilation=1):
+        super(Bottleneck, self).__init__()
+        width = int(planes * (base_width / 64.)) * groups
+        self.conv1 = nn.Conv3d(inplanes, width, kernel_size=1, bias=False)
+        self.bn1 = nn.InstanceNorm3d(width)
+        self.conv2 = nn.Conv3d(width, width, kernel_size=3, stride=stride, dilation=dilation,
+                               padding=dilation, groups=groups, bias=False)
+        self.bn2 = nn.InstanceNorm3d(width)
+        self.conv3 = nn.Conv3d(width, planes * self.expansion, kernel_size=1, bias=False)
+        self.bn3 = nn.InstanceNorm3d(planes * self.expansion)
+        self.relu = nn.ReLU(inplace=True)
+        self.downsample = downsample
+        self.stride = stride
+    def forward(self, x):
+        residual = x
+        out = self.conv1(x)
+        out = self.bn1(out)
+        out = self.relu(out)
+        out = self.conv2(out)
+        out = self.bn2(out)
+        out = self.relu(out)
+        out = self.conv3(out)
+        out = self.bn3(out)
+        if self.downsample is not None:
+            residual = self.downsample(x)
+        out += residual
+        out = self.relu(out)
+        return out
+class ResNet(nn.Module):
+    def __init__(self, block, layers, in_channel=1, width=1,
+                 groups=1, width_per_group=64,
+                 mid_dim=1024, low_dim=128,
+                 avg_down=False, deep_stem=False,
+                 head_type='mlp_head', layer4_dilation=1):
+        super(ResNet, self).__init__()
+        self.avg_down = avg_down
+        self.inplanes = 16 * width
+        self.base = int(16 * width)
+        self.groups = groups
+        self.base_width = width_per_group
+        mid_dim = self.base * 8 * block.expansion
+        if deep_stem:
+            self.conv1 = nn.Sequential(
+                conv3x3_bn_relu(in_channel, 32, stride=2),
+                conv3x3_bn_relu(32, 32, stride=1),
+                conv3x3(32, 64, stride=1)
+            )
+        else:
+            self.conv1 = nn.Conv3d(in_channel, self.inplanes, kernel_size=7, stride=1, padding=3, bias=False)
+        self.bn1 = nn.InstanceNorm3d(self.inplanes)
+        self.relu = nn.ReLU(inplace=True)
+        self.maxpool = nn.MaxPool3d(kernel_size=3, stride=2, padding=1)
+        self.layer1 = self._make_layer(block, self.base*2, layers[0],stride=2)
+        self.layer2 = self._make_layer(block, self.base * 4, layers[1], stride=2)
+        self.layer3 = self._make_layer(block, self.base * 8, layers[2], stride=2)
+        if layer4_dilation == 1:
+            self.layer4 = self._make_layer(block, self.base * 16, layers[3], stride=2)
+        elif layer4_dilation == 2:
+            self.layer4 = self._make_layer(block, self.base * 16, layers[3], stride=1, dilation=2)
+        else:
+            raise NotImplementedError
+        self.avgpool = nn.AvgPool3d(7, stride=1)
+    def _make_layer(self, block, planes, blocks, stride=1, dilation=1):
+        downsample = None
+        if stride != 1 or self.inplanes != planes * block.expansion:
+            if self.avg_down:
+                downsample = nn.Sequential(
+                    nn.AvgPool3d(kernel_size=stride, stride=stride),
+                    nn.Conv3d(self.inplanes, planes * block.expansion,
+                              kernel_size=1, stride=1, bias=False),
+                    nn.InstanceNorm3d(planes * block.expansion),
+                )
+            else:
+                downsample = nn.Sequential(
+                    nn.Conv3d(self.inplanes, planes * block.expansion,
+                              kernel_size=1, stride=stride, bias=False),
+                    nn.InstanceNorm3d(planes * block.expansion),
+                )
+        layers = [block(self.inplanes, planes, stride, downsample, self.groups, self.base_width, dilation)]
+        self.inplanes = planes * block.expansion
+        for _ in range(1, blocks):
+            layers.append(block(self.inplanes, planes, groups=self.groups, base_width=self.base_width, dilation=dilation))
+        return nn.Sequential(*layers)
+    def forward(self, x):
+        x = self.conv1(x)
+        x = self.bn1(x)
+        x = self.relu(x)
+        #c2 = self.maxpool(x)
+        c2 = self.layer1(x)
+        c3 = self.layer2(c2)
+        c4 = self.layer3(c3)
+        c5 = self.layer4(c4)
+        return [x,c2,c3,c4,c5]
+def resnet34(**kwargs):
+    return ResNet(BasicBlock, [3, 4, 6, 3], **kwargs)
+def label_rescale(image_label, w_ori, h_ori, z_ori, flag):
+    w_ori, h_ori, z_ori = int(w_ori), int(h_ori), int(z_ori)
+    # resize label map (int)
+    if flag == 'trilinear':
+        teeth_ids = np.unique(image_label)
+        image_label_ori = np.zeros((w_ori, h_ori, z_ori))
+        image_label = torch.from_numpy(image_label).cuda(0)
+        for label_id in range(len(teeth_ids)):
+            image_label_bn = (image_label == teeth_ids[label_id]).float()
+            image_label_bn = image_label_bn[None, None, :, :, :]
+            image_label_bn = torch.nn.functional.interpolate(image_label_bn, size=(w_ori, h_ori, z_ori),
+                                                             mode='trilinear', align_corners=False)
+            image_label_bn = image_label_bn[0, 0, :, :, :]
+            image_label_bn = image_label_bn.cpu().data.numpy()
+            image_label_ori[image_label_bn > 0.5] = teeth_ids[label_id]
+        image_label = image_label_ori
+    if flag == 'nearest':
+        image_label = torch.from_numpy(image_label).cuda(0)
+        image_label = image_label[None, None, :, :, :].float()
+        image_label = torch.nn.functional.interpolate(image_label, size=(w_ori, h_ori, z_ori), mode='nearest')
+        image_label = image_label[0, 0, :, :, :].cpu().data.numpy()
+    return image_label
+def img_crop(image_bbox):
+    if image_bbox.sum() > 0:
+        x_min = np.nonzero(image_bbox)[0].min() - 8
+        x_max = np.nonzero(image_bbox)[0].max() + 8
+        y_min = np.nonzero(image_bbox)[1].min() - 16
+        y_max = np.nonzero(image_bbox)[1].max() + 16
+        z_min = np.nonzero(image_bbox)[2].min() - 16
+        z_max = np.nonzero(image_bbox)[2].max() + 16
+        if x_min < 0:
+            x_min = 0
+        if y_min < 0:
+            y_min = 0
+        if z_min < 0:
+            z_min = 0
+        if x_max > image_bbox.shape[0]:
+            x_max = image_bbox.shape[0]
+        if y_max > image_bbox.shape[1]:
+            y_max = image_bbox.shape[1]
+        if z_max > image_bbox.shape[2]:
+            z_max = image_bbox.shape[2]
+        if (x_max - x_min) % 16 != 0:
+            x_max -= (x_max - x_min) % 16
+        if (y_max - y_min) % 16 != 0:
+            y_max -= (y_max - y_min) % 16
+        if (z_max - z_min) % 16 != 0:
+            z_max -= (z_max - z_min) % 16
+    if image_bbox.sum() == 0:
+        x_min, x_max, y_min, y_max, z_min, z_max = -1, image_bbox.shape[0], 0, image_bbox.shape[1], 0, image_bbox.shape[
+            2]
+    return x_min, x_max, y_min, y_max, z_min, z_max
+def roi_extraction(image, net_roi, ids):
+    w, h, d = image.shape
+    # roi binary segmentation parameters, the input spacing is 0.4 mm
+    print('---run the roi binary segmentation.')
+    stride_xy = 32
+    stride_z = 16
+    patch_size_roi_stage = (112, 112, 80)
+    label_roi = roi_detection(net_roi, image[0:w:2, 0:h:2, 0:d:2], stride_xy, stride_z,
+                              patch_size_roi_stage)  # (400,400,200)
+    print(label_roi.shape, np.max(label_roi))
+    label_roi = label_rescale(label_roi, w, h, d, 'trilinear')  # (800,800,400)
+    label_roi = morphology.remove_small_objects(label_roi.astype(bool), 5000, connectivity=3).astype(float)
+    label_roi = ndimage.grey_dilation(label_roi, size=(5, 5, 5))
+    label_roi = morphology.remove_small_objects(label_roi.astype(bool), 400000, connectivity=3).astype(
+        float)
+    label_roi = ndimage.grey_erosion(label_roi, size=(5, 5, 5))
+    # crop image
+    x_min, x_max, y_min, y_max, z_min, z_max = img_crop(label_roi)
+    if x_min == -1:  # non-foreground label
+        whole_label = np.zeros((w, h, d))
+        return whole_label
+    image = image[x_min:x_max, y_min:y_max, z_min:z_max]
+    print("image shape(after roi): ", image.shape)
+    return image, x_min, x_max, y_min, y_max, z_min, z_max
+def roi_detection(net, image, stride_xy, stride_z, patch_size):
+    w, h, d = image.shape  # (400,400,200)
+    # if the size of image is less than patch_size, then padding it
+    add_pad = False
+    if w < patch_size[0]:
+        w_pad = patch_size[0] - w
+        add_pad = True
+    else:
+        w_pad = 0
+    if h < patch_size[1]:
+        h_pad = patch_size[1] - h
+        add_pad = True
+    else:
+        h_pad = 0
+    if d < patch_size[2]:
+        d_pad = patch_size[2] - d
+        add_pad = True
+    else:
+        d_pad = 0
+    wl_pad, wr_pad = w_pad // 2, w_pad - w_pad // 2
+    hl_pad, hr_pad = h_pad // 2, h_pad - h_pad // 2
+    dl_pad, dr_pad = d_pad // 2, d_pad - d_pad // 2
+    if add_pad:
+        image = np.pad(image, [(wl_pad, wr_pad), (hl_pad, hr_pad), (dl_pad, dr_pad)], mode='constant',
+                       constant_values=0)
+    ww, hh, dd = image.shape
+    sx = math.ceil((ww - patch_size[0]) / stride_xy) + 1  # 2
+    sy = math.ceil((hh - patch_size[1]) / stride_xy) + 1  # 2
+    sz = math.ceil((dd - patch_size[2]) / stride_z) + 1  # 2
+    score_map = np.zeros((2,) + image.shape).astype(np.float32)
+    cnt = np.zeros(image.shape).astype(np.float32)
+    count = 0
+    for x in range(0, sx):
+        xs = min(stride_xy * x, ww - patch_size[0])
+        for y in range(0, sy):
+            ys = min(stride_xy * y, hh - patch_size[1])
+            for z in range(0, sz):
+                zs = min(stride_z * z, dd - patch_size[2])
+                test_patch = image[xs:xs + patch_size[0], ys:ys + patch_size[1],
+                             zs:zs + patch_size[2]]
+                test_patch = np.expand_dims(np.expand_dims(test_patch, axis=0), axis=0).astype(
+                    np.float32)
+                test_patch = torch.from_numpy(test_patch).cuda(0)
+                with torch.no_grad():
+                    y1 = net(test_patch)  # （1,2,256,256,160）
+                y = F.softmax(y1, dim=1)  # （1,2,256,256,160）
+                y = y.cpu().data.numpy()
+                y = y[0, :, :, :, :]  # （2,256,256,160）
+                score_map[:, xs:xs + patch_size[0], ys:ys + patch_size[1], zs:zs + patch_size[2]] \
+                    = score_map[:, xs:xs + patch_size[0], ys:ys + patch_size[1],
+                      zs:zs + patch_size[2]] + y  # (2,400,400,200)
+                cnt[xs:xs + patch_size[0], ys:ys + patch_size[1], zs:zs + patch_size[2]] \
+                    = cnt[xs:xs + patch_size[0], ys:ys + patch_size[1], zs:zs + patch_size[2]] + 1  # (400,400,200)
+                count = count + 1
+    score_map = score_map / np.expand_dims(cnt, axis=0)
+    label_map = np.argmax(score_map, axis=0)  # (400,400,200),0/1
+    if add_pad:
+        label_map = label_map[wl_pad:wl_pad + w, hl_pad:hl_pad + h, dl_pad:dl_pad + d]
+        score_map = score_map[:, wl_pad:wl_pad + w, hl_pad:hl_pad + h, dl_pad:dl_pad + d]
+    return label_map
+def test_single_case_array(model_array, image=None, stride_xy=None, stride_z=None, patch_size=None, num_classes=1):
+    w, h, d = image.shape
+    # if the size of image is less than patch_size, then padding it
+    add_pad = False
+    if w < patch_size[0]:
+        w_pad = patch_size[0]-w
+        add_pad = True
+    else:
+        w_pad = 0
+    if h < patch_size[1]:
+        h_pad = patch_size[1]-h
+        add_pad = True
+    else:
+        h_pad = 0
+    if d < patch_size[2]:
+        d_pad = patch_size[2]-d
+        add_pad = True
+    else:
+        d_pad = 0
+    wl_pad, wr_pad = w_pad//2,w_pad-w_pad//2
+    hl_pad, hr_pad = h_pad//2,h_pad-h_pad//2
+    dl_pad, dr_pad = d_pad//2,d_pad-d_pad//2
+    if add_pad:
+        image = np.pad(image, [(wl_pad,wr_pad),(hl_pad,hr_pad), (dl_pad, dr_pad)], mode='constant', constant_values=0)
+    ww,hh,dd = image.shape
+    sx = math.ceil((ww - patch_size[0]) / stride_xy) + 1
+    sy = math.ceil((hh - patch_size[1]) / stride_xy) + 1
+    sz = math.ceil((dd - patch_size[2]) / stride_z) + 1
+    score_map = np.zeros((num_classes, ) + image.shape).astype(np.float32)
+    cnt = np.zeros(image.shape).astype(np.float32)
+    for x in range(0, sx):
+        xs = min(stride_xy*x, ww-patch_size[0])
+        for y in range(0, sy):
+            ys = min(stride_xy * y,hh-patch_size[1])
+            for z in range(0, sz):
+                zs = min(stride_z * z, dd-patch_size[2])
+                test_patch = image[xs:xs+patch_size[0], ys:ys+patch_size[1], zs:zs+patch_size[2]]
+                test_patch = np.expand_dims(np.expand_dims(test_patch,axis=0),axis=0).astype(np.float32)
+                test_patch = torch.from_numpy(test_patch).cuda()
+                for model in model_array:
+                    output = model(test_patch)
+                    y_temp = F.softmax(output, dim=1)
+                    y_temp = y_temp.cpu().data.numpy()
+                    y += y_temp[0,:,:,:,:]
+                y /= len(model_array)
+                score_map[:, xs:xs+patch_size[0], ys:ys+patch_size[1], zs:zs+patch_size[2]] \
+                  = score_map[:, xs:xs+patch_size[0], ys:ys+patch_size[1], zs:zs+patch_size[2]] + y
+                cnt[xs:xs+patch_size[0], ys:ys+patch_size[1], zs:zs+patch_size[2]] \
+                  = cnt[xs:xs+patch_size[0], ys:ys+patch_size[1], zs:zs+patch_size[2]] + 1
+    score_map = score_map/np.expand_dims(cnt,axis=0)
+    label_map = np.argmax(score_map, axis = 0)
+    if add_pad:
+        label_map = label_map[wl_pad:wl_pad+w,hl_pad:hl_pad+h,dl_pad:dl_pad+d]
+        score_map = score_map[:,wl_pad:wl_pad+w,hl_pad:hl_pad+h,dl_pad:dl_pad+d]
+    return label_map, score_map
+def calculate_metric_percase(pred, gt):
+    dice = metric.binary.dc(pred, gt)
+    jc = metric.binary.jc(pred, gt)
+    hd = metric.binary.hd95(pred, gt)
+    asd = metric.binary.asd(pred, gt)
+    return dice, jc, hd, asd
+class RailNetSystem(nn.Module, PyTorchModelHubMixin):
+    def __init__(self, n_channels: int, n_classes: int, normalization: str):
+        super().__init__()
+        self.num_classes = 2
+        self.net_roi = VNet_roi(n_channels = n_channels, n_classes = n_classes, normalization = normalization, has_dropout=False).cuda()
+        self.model_array = []
+        for i in range(4):
+            if i < 2:
+                model = VNet(n_channels = n_channels, n_classes = n_classes, normalization = normalization, has_dropout=True).cuda()
+            else:
+                model = ResVNet(n_channels = n_channels, n_classes = n_classes, normalization = normalization, has_dropout=True).cuda()
+            self.model_array.append(model)
+    def load_weights(self, weight_dir="."):
+        self.net_roi.load_state_dict(torch.load(os.path.join(weight_dir, "model weights", "roi_best_model.pth"), map_location="cuda", weights_only=True))
+        self.net_roi.eval()
+        model_files = [
+            "rail_0_iter_7995_best.pth",
+            "rail_1_iter_7995_best.pth",
+            "rail_2_iter_7995_best.pth",
+            "rail_3_iter_7995_best.pth",
+        ]
+        for i, file in enumerate(model_files):
+            self.model_array[i].load_state_dict(torch.load(os.path.join(weight_dir, "model weights", file), map_location="cuda", weights_only=True))
+            self.model_array[i].eval()
+    def forward(self, image, label, save_path="./output", name="case"):
+        if not os.path.exists(save_path):
+            os.makedirs(save_path)
+        nib.save(nib.Nifti1Image(image.astype(np.float32), np.eye(4)), os.path.join(save_path, f"{name}_img.nii.gz"))
+        w, h, d = image.shape
+        image, x_min, x_max, y_min, y_max, z_min, z_max = roi_extraction(image, self.net_roi, name)
+        prediction, _ = test_single_case_array(self.model_array, image, stride_xy=64, stride_z=32, patch_size=(112, 112, 80), num_classes=self.num_classes)
+        prediction = morphology.remove_small_objects(prediction.astype(bool), 3000, connectivity=3).astype(float)
+        new_prediction = np.zeros((w, h, d))
+        new_prediction[x_min:x_max, y_min:y_max, z_min:z_max] = prediction
+        dice, jc, hd, asd = calculate_metric_percase(new_prediction, label[:])
+        nib.save(nib.Nifti1Image(new_prediction.astype(np.float32), np.eye(4)), os.path.join(save_path, f"{name}_pred.nii.gz"))
+        return new_prediction, dice, jc, hd, asd