cellpose微调模型效果评估工具

为了对cellpose微调模型在测试数据集上的效果进行评估，在Grok的帮助下弄了一个小工具。
这个评估工具能够读取cellpose保存的npy文件，从中随机抽取指定数量的结构，把每个结构的mask叠加在原图上逐个展示给专家，由专家判断分割结果正确与否。所有结构评估完成后，工具会自动计算正确率。专家的评估结果会自动记录到csv表格文件中，而且这个工具还支持断点续评。具体使用效果如下：
完整代码如下：
1
import os
2
from glob import glob
3
import numpy as np
4
import tkinter as tk
5
from tkinter import messagebox, ttk, filedialog
6
import random
7
from PIL import Image, ImageTk
8
import csv
9
import json
10
from scipy.ndimage import center_of_mass
11

12

13
# Default parameters
DEFAULT_NUM_STRUCTURES = 200  # how many structures are reviewed by default
DEFAULT_CROP_SIZE = 200  # default side length of the crop window, in pixels
CONFIG_FILE = 'config.json'  # file name of the saved session configuration
17

18

19
class LabelingApp:
    """Tkinter GUI for expert review of Cellpose segmentation masks.

    The app collects every labelled structure found in the ``masks`` entry of
    the ``*.npy`` files in a directory, shows a random sample of them one at a
    time as a green overlay on the source image, and records a
    correct/incorrect verdict for each one. Verdicts are rewritten to
    ``labeling_results.csv`` in that directory after every click, and
    structures already listed in that CSV are never shown again, which is
    what makes an interrupted session resumable.
    """

    # Name of the CSV file (inside the data directory) holding the verdicts.
    RESULTS_FILE = 'labeling_results.csv'

    def __init__(self, root):
        """Initialise state and show either the labeling view or the setup form.

        Args:
            root: The ``tk.Tk`` root window hosting the application.
        """
        self.root = root
        self.root.title("Expert Checking")
        self.results = []
        self.num_structures = DEFAULT_NUM_STRUCTURES
        self.crop_size = DEFAULT_CROP_SIZE
        self.directory = None  # no default directory
        self.structures = []
        self.current_structure_idx = 0
        self.current_image = None
        self.current_mask = None
        self.current_label = None
        self.current_file = None

        # NOTE: the config is looked up in the current working directory,
        # whereas save_config() writes it into the data directory, so it is
        # only picked up when the script is started from the data directory.
        config_path = os.path.join(os.getcwd(), CONFIG_FILE)
        if not os.path.exists(config_path):
            self.show_setup_gui()
            return

        try:
            self.load_config(config_path)
            if not self.directory or not os.path.isdir(self.directory):
                raise ValueError("Invalid directory in config")
            if self.crop_size <= 0:
                raise ValueError("Crop size must be positive")
            if self.num_structures != -1 and self.num_structures < 1:
                raise ValueError("Number of structures must be positive or -1")
        except (OSError, LookupError, TypeError, ValueError) as e:
            # json.JSONDecodeError is a ValueError; LookupError covers missing
            # keys and too-short structure entries.
            messagebox.showerror("Error", f"Invalid config.json or directory: {str(e)}. Please select a directory.")
            self.show_setup_gui()
            return

        # Pick up the verdicts already stored for the configured directory.
        self.load_existing_results()
        self._build_label_frame()
        self.load_structures()

    def _build_label_frame(self):
        """Create and pack the canvas, progress text and verdict buttons."""
        self.label_frame = tk.Frame(self.root)
        self.canvas = tk.Canvas(self.label_frame, width=self.crop_size, height=self.crop_size)
        self.canvas.pack()
        self.label_var = tk.StringVar()
        self.label_var.set("Structure 0/0")
        tk.Label(self.label_frame, textvariable=self.label_var).pack()
        # Separate frame so the two buttons sit centred under the canvas.
        button_frame = tk.Frame(self.label_frame)
        button_frame.pack(pady=10)
        for caption, handler in (("Correct", self.label_correct), ("Incorrect", self.label_incorrect)):
            tk.Button(button_frame, text=caption, command=handler, width=10).pack(
                side=tk.LEFT, padx=10, fill=tk.X, expand=True)
        self.label_frame.pack()

    def _add_setup_entry(self, caption, default):
        """Add one captioned entry row to the setup form and return the entry."""
        row = tk.Frame(self.setup_frame)
        row.pack(fill=tk.X, pady=5)
        tk.Label(row, text=caption).pack(anchor=tk.W)
        entry = tk.Entry(row, width=50)
        entry.insert(0, str(default))
        entry.pack(fill=tk.X, padx=5)
        return entry

    def _close(self):
        """Destroy the root window so the application ends.

        ``destroy()`` is used rather than ``quit()`` because this can be
        reached from ``__init__`` before ``mainloop()`` has started, where
        ``quit()`` has no effect and an empty window would be left open.
        """
        self.root.destroy()

    def show_setup_gui(self):
        """Show the setup form: directory, sample size, crop size and Start."""
        self.setup_frame = tk.Frame(self.root)
        self.setup_frame.pack(pady=10)

        # Directory entry with a Browse button beside it.
        dir_frame = tk.Frame(self.setup_frame)
        dir_frame.pack(fill=tk.X, pady=5)
        tk.Label(dir_frame, text="Directory:").pack(anchor=tk.W)
        dir_inner_frame = tk.Frame(dir_frame)
        dir_inner_frame.pack(fill=tk.X)
        self.dir_entry = tk.Entry(dir_inner_frame, width=50)
        self.dir_entry.pack(side=tk.LEFT, fill=tk.X, expand=True, padx=(0, 5))
        tk.Button(dir_inner_frame, text="Browse", command=self.browse_directory).pack(side=tk.LEFT)

        self.num_entry = self._add_setup_entry("Number of Structures (-1 for all):", DEFAULT_NUM_STRUCTURES)
        self.crop_entry = self._add_setup_entry("Crop Size (pixels):", DEFAULT_CROP_SIZE)

        tk.Button(self.setup_frame, text="Start", command=self.start_labeling).pack(pady=10)

    def browse_directory(self):
        """Open a directory chooser and copy the selection into the entry."""
        directory = filedialog.askdirectory()
        if directory:
            self.dir_entry.delete(0, tk.END)
            self.dir_entry.insert(0, directory)

    def load_existing_results(self):
        """Replace ``self.results`` with the verdicts stored in the results CSV.

        Leaves ``self.results`` empty when no directory is set or the CSV does
        not exist yet.
        """
        self.results = []
        if not (self.directory and os.path.exists(self.directory)):
            return
        csv_path = os.path.join(self.directory, self.RESULTS_FILE)
        if not os.path.exists(csv_path):
            return
        with open(csv_path, 'r', newline='') as csvfile:
            for row in csv.DictReader(csvfile):
                self.results.append({
                    'file': row['file'],
                    'structure_id': int(row['structure_id']),
                    # Booleans are written by csv as the text 'True'/'False'.
                    'expert_label': row['expert_label'] == 'True',
                })

    def load_config(self, config_path):
        """Load directory, sample size, crop size and structures from JSON.

        Nothing on ``self`` is modified unless the whole file parses.

        Args:
            config_path: Path of the JSON file written by ``save_config``.

        Raises:
            OSError: The file cannot be read.
            ValueError: The file is not valid JSON or a number is malformed.
            LookupError: A required key or structure field is missing.
            TypeError: A value has an unexpected type.
        """
        with open(config_path, 'r') as f:
            config = json.load(f)
        directory = config['directory']
        num_structures = int(config['num_structures'])
        crop_size = int(config['crop_size'])
        # Masks are not stored in the config, hence the trailing None.
        structures = [(s[0], int(s[1]), s[2], None) for s in config['structures']]

        self.directory = directory
        self.num_structures = num_structures
        self.crop_size = crop_size
        self.structures = structures

    def save_config(self):
        """Write the current settings and sampled structures to the data directory."""
        config = {
            'directory': str(self.directory),
            'num_structures': int(self.num_structures),
            'crop_size': int(self.crop_size),
            # Convert numpy scalars to native types so json can serialise them.
            'structures': [(str(s[0]), int(s[1]), str(s[2])) for s in self.structures],
        }
        config_path = os.path.join(self.directory, CONFIG_FILE)
        with open(config_path, 'w') as f:
            json.dump(config, f, indent=2)

    def start_labeling(self):
        """Validate the setup form and switch to the labeling view.

        Invalid input is reported in an error dialog and the form stays open.
        """
        try:
            self.directory = self.dir_entry.get().strip()
            self.num_structures = int(self.num_entry.get())
            self.crop_size = int(self.crop_entry.get())
            if not self.directory:
                raise ValueError("Please select a directory")
            if self.crop_size <= 0:
                raise ValueError("Crop size must be positive")
            # Reject 0 and negatives other than -1 here: random.sample would
            # otherwise raise after the setup form has already been hidden.
            if self.num_structures != -1 and self.num_structures < 1:
                raise ValueError("Number of structures must be positive or -1")
            if not os.path.isdir(self.directory):
                raise ValueError("Invalid directory")
        except ValueError as e:
            messagebox.showerror("Error", str(e))
            return

        # Reload verdicts so they come from the newly chosen directory.
        self.load_existing_results()

        self.setup_frame.pack_forget()
        self._build_label_frame()
        self.load_structures()

    def load_structures(self):
        """Collect unlabelled structures, sample them and show the first one.

        Every ``*.npy`` file in the directory is expected to hold a pickled
        dict with a ``masks`` label array and a ``filename`` image path. Files
        that fail to load are reported in a warning and skipped. The
        application is closed when nothing is left to label.
        """
        fps = glob(os.path.join(self.directory, '*.npy'))
        if not fps:
            messagebox.showerror("Error", "No .npy files found in the specified directory")
            self._close()
            return

        self.structures = []

        all_structures = []
        for fp in fps:
            try:
                # SECURITY: allow_pickle=True unpickles arbitrary objects, so
                # only point this tool at .npy files from a trusted source.
                rec = np.load(fp, allow_pickle=True).item()
                masks = rec.get('masks')
                if masks is None:
                    continue  # file carries no masks
                image_path = rec.get('filename', '')
                # Label 0 is skipped as background.
                all_structures.extend(
                    (fp, label, image_path, masks)
                    for label in np.unique(masks) if label != 0
                )
            except Exception as e:
                # Best effort: one unreadable file must not abort the session.
                messagebox.showwarning("Warning", f"Error loading {fp}: {str(e)}")
                continue

        if not all_structures:
            messagebox.showerror("Error", "No valid structures found in .npy files")
            self._close()
            return

        # Drop structures that already have a verdict in the CSV.
        labeled_set = {(r['file'], r['structure_id']) for r in self.results}
        remaining_structures = [s for s in all_structures if (s[0], s[1]) not in labeled_set]

        if self.num_structures == -1 or self.num_structures >= len(remaining_structures):
            self.structures = remaining_structures
        else:
            self.structures = random.sample(remaining_structures, self.num_structures)
        random.shuffle(self.structures)

        self.save_config()

        if not self.structures:
            messagebox.showerror("Error", "No structures available to label after filtering.")
            self._close()
            return
        self.show_structure()

    @staticmethod
    def crop_centered(image, mask, center_y, center_x, size):
        """Cut a ``size`` x ``size`` window around a point, zero-padded at borders.

        The window spans ``size`` pixels starting at ``center - size // 2`` on
        each axis, so odd sizes work as well as even ones.

        Args:
            image: Array indexed ``[row, column, channel]`` with 3 channels.
            mask: 2-D array with the same height and width as ``image``.
            center_y: Row index of the window centre.
            center_x: Column index of the window centre.
            size: Side length of the window in pixels.

        Returns:
            Tuple ``(cropped_image, cropped_mask)`` of ``uint8`` arrays with
            shapes ``(size, size, 3)`` and ``(size, size)``.
        """
        half = size // 2
        y0, x0 = center_y - half, center_x - half
        h, w = mask.shape

        cropped_image = np.zeros((size, size, 3), dtype=np.uint8)
        cropped_mask = np.zeros((size, size), dtype=np.uint8)

        # Part of the window that lies inside the image.
        src_y0, src_y1 = max(0, y0), min(h, y0 + size)
        src_x0, src_x1 = max(0, x0), min(w, x0 + size)
        if src_y1 > src_y0 and src_x1 > src_x0:
            # Matching region in the output, derived from the source extent so
            # both slices always have the same shape.
            dst_y0, dst_x0 = src_y0 - y0, src_x0 - x0
            dst_y1 = dst_y0 + (src_y1 - src_y0)
            dst_x1 = dst_x0 + (src_x1 - src_x0)
            cropped_image[dst_y0:dst_y1, dst_x0:dst_x1] = image[src_y0:src_y1, src_x0:src_x1]
            cropped_mask[dst_y0:dst_y1, dst_x0:dst_x1] = mask[src_y0:src_y1, src_x0:src_x1]
        return cropped_image, cropped_mask

    def show_structure(self):
        """Display the current structure, or finish when none are left.

        Structures whose image cannot be opened are skipped with a warning.
        When the list is exhausted the results are saved, the accuracy is
        shown and the application closes.
        """
        # Iterate rather than recurse so a long run of unreadable images
        # cannot exhaust the recursion limit.
        while self.current_structure_idx < len(self.structures):
            self.current_file, self.current_label, img_path, self.current_mask = \
                self.structures[self.current_structure_idx]
            try:
                # Context manager closes the underlying file handle.
                with Image.open(img_path) as source:
                    self.current_image = np.array(source.convert('RGB'))
            except OSError:
                # Any read failure is skipped: letting it propagate would
                # leave the previous picture on screen while the current
                # file/label already point at this structure.
                messagebox.showwarning("Warning", f"Image file {img_path} could not be opened, skipping.")
                self.current_structure_idx += 1
                continue
            break
        else:
            self.save_results()
            messagebox.showinfo("Done", f"All structures processed. Results saved.\nAccuracy: {self.calculate_accuracy():.2%}")
            self._close()
            return

        self.label_var.set(f"Structure {self.current_structure_idx + 1}/{len(self.structures)}")

        # Binary mask of this structure only, centred on its centroid.
        mask = (self.current_mask == self.current_label).astype(np.uint8)
        centroid_y, centroid_x = (int(c) for c in center_of_mass(mask))
        cropped_image, cropped_mask = self.crop_centered(
            self.current_image, mask, centroid_y, centroid_x, self.crop_size)

        # Blend a green mask over the image at 10% opacity.
        mask_rgb = np.stack([cropped_mask * 0, cropped_mask * 255, cropped_mask * 0], axis=-1)
        overlay = np.clip(cropped_image * 0.9 + mask_rgb * 0.1, 0, 255).astype(np.uint8)
        # Keep a reference on self; Tk does not hold one for the image.
        self.photo = ImageTk.PhotoImage(Image.fromarray(overlay))
        self.canvas.delete("all")  # drop the previous image item
        self.canvas.create_image(0, 0, anchor=tk.NW, image=self.photo)

    def label_correct(self):
        """Record the current structure as correct and advance."""
        self.save_label(True)
        self.current_structure_idx += 1
        self.show_structure()

    def label_incorrect(self):
        """Record the current structure as incorrect and advance."""
        self.save_label(False)
        self.current_structure_idx += 1
        self.show_structure()

    def save_label(self, expert_label):
        """Append a verdict for the current structure and rewrite the CSV.

        Args:
            expert_label: ``True`` if the expert judged the mask correct.
        """
        self.results.append({
            'file': self.current_file,
            # Store a native int rather than a numpy scalar.
            'structure_id': int(self.current_label),
            'expert_label': expert_label,
        })
        # Saved after every verdict so an interrupted session loses nothing.
        self.save_results()

    def calculate_accuracy(self):
        """Return the fraction of recorded verdicts that are correct.

        Returns:
            A float in ``[0, 1]``; ``0.0`` when there are no results.
        """
        if not self.results:
            return 0.0
        correct = sum(1 for r in self.results if r['expert_label'])
        return correct / len(self.results)

    def save_results(self):
        """Rewrite the results CSV in the data directory from ``self.results``."""
        csv_path = os.path.join(self.directory, self.RESULTS_FILE)
        with open(csv_path, 'w', newline='') as csvfile:
            writer = csv.DictWriter(csvfile, fieldnames=['file', 'structure_id', 'expert_label'])
            writer.writeheader()
            writer.writerows(self.results)
360

361

362
# Script entry point
def main():
    """Create the Tk root window, attach the labeling app and run the event loop."""
    root = tk.Tk()
    app = LabelingApp(root)  # bound to a name so the app object stays referenced
    root.mainloop()


if __name__ == "__main__":
    main()
使用时需要注意运行它的Python环境：最好在安装了cellpose（目前支持的版本为4.0.1）的同一个Python环境中运行该程序，以避免读取cellpose保存的npy文件时出错。