OSTrack/app_osyo.py at main · Rtwotwo/OSTrack · GitHub

1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
129
130
131
132
133
134
135
136
137
138
139
140
141
142
143
144
145
146
147
148
149
150
151
152
153
154
155
156
157
158
159
160
161
162
163
164
165
166
167
168
169
170
171
172
173
174
175
176
177
178
179
180
181
182
183
184
185
186
187
188
189
190
191
192
193
194
195
196
197
198
199
200
201
202
203
204
205
206
207
208
209
210
211
212
213
214
215
216
217
218
219
220
221
222
223
224
225
226
227
228
229
230
231
232
233
234
235
236
237
238
239
240
241
242
243
244
245
246
247
248
249
250
251
252
253
254
255
256
257
258
259
260
261
262
263
264
265
266
267
268
269
270
271
272
273
274
275
276
277
278
279
280
281
282
283
"""
任务: 导入模型,创建GUI界面,实现对实时视频
      捕获或者视频导入的无人机定位
时间: 2025/03/13-Redal
"""
import pathlib
import sys

# Keep a handle on the real PosixPath class before it is (possibly) aliased.
temp = pathlib.PosixPath
# On Windows, alias PosixPath to WindowsPath.
# NOTE(review): presumably this lets checkpoints that were pickled on a POSIX
# machine (and therefore contain PosixPath objects) be loaded on Windows - confirm.
# The alias is applied on Windows only: on any other platform WindowsPath is not
# a usable path class, so rebinding PosixPath there would break pathlib for the
# rest of the process.
if sys.platform == "win32":
    pathlib.PosixPath = pathlib.WindowsPath

import os
import sys
import cv2
import threading
import argparse
import torch
import tkinter as tk
from tkinter import filedialog
from PIL import Image, ImageTk
from util import config
from util import ComputeHistogramImage
from util import CalculateSpectrogramImage
from torchvision.transforms import transforms
from yolov5.models.experimental import attempt_load
from yolo_model import parser
from yolo_model import load_yolo
from bbox import decoder

# Restrict the process to the first GPU. This has to happen before the first
# CUDA query below: the CUDA runtime reads CUDA_VISIBLE_DEVICES when it is
# initialised, so setting it after `torch.cuda.is_available()` is too late.
os.environ['CUDA_VISIBLE_DEVICES'] = '0'
device = torch.device("cuda" if torch.cuda.is_available() else "cpu")

# Directory that contains this file, made importable.
# NOTE(review): the project imports at the top of the file run before this
# append, so it only affects imports performed later.
current_path = os.path.dirname(os.path.abspath(__file__))
sys.path.append(current_path)

# Pre-processing pipelines: tensor conversion, resize to a fixed square size,
# then per-channel normalisation (the mean/std values are the ones commonly
# used with ImageNet-pretrained models).
template_transform = transforms.Compose([
    transforms.ToTensor(),
    transforms.Resize((192, 192)),
    transforms.Normalize(mean=[0.485, 0.456, 0.406], std=[0.229, 0.224, 0.225]),])
search_transform = transforms.Compose([
    transforms.ToTensor(),
    transforms.Resize((384, 384)),
    transforms.Normalize(mean=[0.485, 0.456, 0.406], std=[0.229, 0.224, 0.225]),])


########################  定义GUI界面类  #######################
class OSTrackGUI(tk.Frame):
    """设计OSTrack主界面,用于完成多功能的介绍
       以及相关功能的选择使用"""
    def __init__(self, root=None):
        """Initialise playback state, load the YOLO detector and build the widgets.

        Args:
            root: Tk window that hosts the widgets. When omitted, the master
                that tkinter resolves for this frame is used instead.
        """
        super().__init__(root)
        # Fall back to the master chosen by tkinter so the widgets always have
        # a window to attach to, even when no root was passed in.
        self.root = root if root is not None else self.master

        # Most recent frame shown in the GUI and detection bookkeeping.
        self.frame = None
        self.xyxy = None
        self.last_xyxy = None
        self.dx, self.dy = 0, 0
        self.lost_frame_num = 0

        # Playback state. The capture device is opened by the start handlers
        # only, so no camera is touched while the window is being created.
        self.is_running = False
        self.video_cap = None
        self.video_thread = None
        self.live_video_flag = False
        self.import_video_flag = False
        self.track_video_flag = False
        self.export_video_flag = False
        # cv2.VideoWriter used while export is enabled; created on demand.
        self.video_processed = None

        # Model setup. Only the YOLO detector is loaded; loading through
        # `config()` is currently disabled.
        self.template_transform = template_transform
        # NOTE: attribute name (including its spelling) kept as-is for compatibility.
        self.sreach_transform = search_transform
        self.args = parser()
        self.yolo_model = load_yolo(self.args).to(device)

        # Cached values describing the current video and the export target.
        self.img_cached = []
        self.fps = 0
        self.frame_width, self.frame_height = 0, 0
        self.fourcc = cv2.VideoWriter_fourcc('m', 'p', '4', 'v')
        self.video_processed_dir = './video'

        # Build the widgets last, once every attribute the callbacks rely on exists.
        self.__set_widgets()

    def __set_widgets(self):
        """Create and place every label and button of the main window.

        The splash image is read from "images/main_window_img.png" (relative to
        the working directory). If it cannot be read, the video label keeps its
        placeholder text and `self.main_window_img` is set to "" (tkinter's
        value for "no image"), so restoring the initial view still works.
        """
        self.root.title("OSTrack GUI-Redal")
        self.root.geometry("800x600")

        # Display areas and text panels.
        self.video_label = tk.Label(self.root, text="视频显示区域", width=500, height=400)
        self.video_label.place(x=0, y=0)
        self.title_label = tk.Label(self.root, text='无人机目标追踪', font=("仿宋", 15),
                                    fg="black", width=30, height=2)
        self.title_label.place(x=505, y=0)
        self.histogram_label = tk.Label(self.root, text="直方图显示区域", font=("仿宋", 10),
                                        fg="black", width=300, height=200)
        self.histogram_label.place(x=0, y=400)
        self.spectrogram_label = tk.Label(self.root, text='频谱图显示区域', font=("仿宋", 10),
                                          fg="black", width=200, height=200)
        self.spectrogram_label.place(x=300, y=400)
        self.message_title_label = tk.Label(self.root, text='主要功能信息提示', font=("仿宋", 15),
                                            fg="black", width=30, height=2)
        self.message_title_label.place(x=505, y=400)
        self.message_label = tk.Label(self.root, text="很感激您能使用我们的软件\n请选择您需要的功能......",
                                      font=("仿宋", 12), width=40, height=5,
                                      wraplength=300, justify="left")
        self.message_label.place(x=505, y=440)

        def add_button(text, command, x, y):
            """Create one fixed-size function button and place it at (x, y)."""
            button = tk.Button(self.root, text=text, height=1, width=10, command=command)
            button.place(x=x, y=y)
            return button

        # Main function buttons.
        self.live_video_button = add_button('实时视频', self.__start_live_video__, 550, 50)
        self.import_video_button = add_button('导入视频', self.__start_import_video__, 550, 80)
        self.exit_button = add_button('退出程序', self.root.quit, 550, 110)
        self.live_video_change_button = add_button('退出实时', self.__end_live_video__, 670, 50)
        self.import_video_change_button = add_button('退出导入', self.__end_import_video__, 670, 80)
        self.frame_shot_button = add_button('截取图像', self.__frame_shot__, 670, 110)

        # Initial image of the video area. cv2.imread returns None when the file
        # cannot be read, and it delivers BGR data while PIL expects RGB.
        splash = cv2.imread("images/main_window_img.png")
        if splash is None:
            self.main_window_img = ""
        else:
            splash = cv2.cvtColor(cv2.resize(splash, (500, 400)), cv2.COLOR_BGR2RGB)
            self.main_window_img = ImageTk.PhotoImage(image=Image.fromarray(splash))
            self.video_label.config(image=self.main_window_img)
        # Keep a reference on the widget so the image is not garbage-collected.
        self.video_label.image = self.main_window_img

        # Buttons that switch tracking and export on and off.
        self.track_model_button = add_button('视频跟踪', self.__track_model__, 550, 170)
        self.video_export_button = add_button('视频导出', self.__video_export__, 670, 170)

    def __start_live_video__(self):
        """Start capturing from the default camera and play it in the GUI.

        Any capture that is already open is released first. When the camera
        cannot be opened, the user is told so and no playback thread is started.
        """
        if self.video_cap is not None:
            self.video_cap.release()

        capture = cv2.VideoCapture(0)  # default camera of the computer
        if not capture.isOpened():
            # Nothing to play: leave the GUI in the idle state and report it.
            capture.release()
            self.is_running = False
            self.live_video_flag = False
            self.import_video_flag = False
            self.video_cap = None
            self.message_label.config(text="实时视频: 无法打开相机设备。\n请检查相机连接后重试。")
            return

        self.live_video_flag = True
        self.import_video_flag = False
        text = "实时视频: 调用电脑或外置设备相机\n进行实时视频捕捉,再进行视频跟踪。\n注意: 退出此模式,请双击'退出实时'\n实时视频捕获中......"
        self.message_label.config(text=text)

        # Live frames are resized to 500x400 for display, so the export size is
        # set to the same value; without this it would still be (0, 0) unless a
        # video had been imported before.
        self.frame_width, self.frame_height = 500, 400
        # Cameras may report 0 fps; fall back to a conventional rate in that case.
        self.fps = int(capture.get(cv2.CAP_PROP_FPS)) or 30

        self.video_cap = capture
        self.is_running = True
        self.video_thread = threading.Thread(target=self.__video_loop__)
        self.video_thread.daemon = True
        self.video_thread.start()

    def __end_live_video__(self):
        """功能: 退出实时视频捕获"""
        self.is_running = False
        if self.video_cap is not None:
            self.video_cap.release()
        self.live_video_flag = False
        self.export_video_flag = False
        self.video_cap = None
        self.video_thread = None
        # 恢复为初始状态
        self.video_label.config(image=self.main_window_img)
        self.video_label.image = self.main_window_img

    def __start_import_video__(self):
        """Let the user pick a video file and start playing it in the GUI.

        Does nothing when the dialog is cancelled. When the chosen file cannot
        be opened, the user is told so and no playback thread is started.
        """
        file_path = filedialog.askopenfilename(filetypes=[("视频文件", "*.mp4 *.avi *.mov")])
        if not file_path:
            return

        if self.video_cap is not None:
            self.video_cap.release()

        capture = cv2.VideoCapture(file_path)  # open the video file
        if not capture.isOpened():
            capture.release()
            self.is_running = False
            self.import_video_flag = False
            self.live_video_flag = False
            self.video_cap = None
            self.message_label.config(text="导入视频: 无法打开所选视频文件。\n请选择其他文件后重试。")
            return

        self.import_video_flag = True
        self.live_video_flag = False
        self.track_video_flag = False
        text = "导入视频: 导入用户自定义视频文件\n进行视频帧捕捉,再进行跟踪处理。\n注意: 退出此模式,请双击'退出导入'\n用户视频导入中......"
        self.message_label.config(text=text)

        # Everything the playback loop reads is prepared BEFORE the thread
        # starts, so the loop never resizes to a stale or zero frame size.
        self.img_cached = []  # the cache is cleared on every import
        self.fps = int(capture.get(cv2.CAP_PROP_FPS))
        self.frame_height = int(capture.get(cv2.CAP_PROP_FRAME_HEIGHT))
        self.frame_width = int(capture.get(cv2.CAP_PROP_FRAME_WIDTH))

        # Remember the export folder the first time through. Joining onto the
        # previous output *file* would otherwise nest the path deeper on every
        # import ("./video/processed_a.mp4/processed_b.mp4").
        if not hasattr(self, "_video_output_root"):
            self._video_output_root = self.video_processed_dir
        file_name = os.path.basename(file_path)
        self.video_processed_dir = os.path.join(self._video_output_root, f'processed_{file_name}')

        self.video_cap = capture
        self.is_running = True
        self.video_thread = threading.Thread(target=self.__video_loop__)
        self.video_thread.daemon = True
        self.video_thread.start()

    def __end_import_video__(self):
        """功能: 退出导入视频捕获"""
        self.is_running = False
        if self.video_cap is not None:
            self.video_cap.release()
        self.import_video_flag = False
        self.video_cap = None
        self.video_thread = None
        # 恢复为初始状态
        self.video_label.config(image=self.main_window_img)
        self.video_label.image = self.main_window_img

    def __frame_shot__(self):
        """功能: 截取当前视频帧"""
        frame_save_dir = 'frames'
        if not os.path.exists(frame_save_dir):
            os.makedirs(frame_save_dir)
        frame_number = len(os.listdir(frame_save_dir))
        img_rgb = cv2.cvtColor(self.frame, cv2.COLOR_BGR2RGB)
        cv2.imwrite(f"frames/shot_{frame_number}.jpg", img_rgb)
        text = "截取图像: 用户自定义截取主页面图像\n截取图像已存放在frames文件夹。\n图像截取中......"
        self.message_label.config(text=text)

    def __track_model__(self):
        """功能: 应用模型进行跟踪处理"""
        text = "视频跟踪: 对视频进行无人机跟踪\n并将无人机以边框的形势展示。\n无人机视频跟踪中......"
        self.message_label.config(text=text)
        self.track_video_flag = not self.track_video_flag

    def __video_export__(self):
        """功能: 导出当前处理好的用户自定义的视频"""
        text = "视频导出: 对用户导入视频跟踪处理\n处理视频存放在processed文件夹。\n无人机视频导出中......"
        self.message_label.config(text=text)
        self.export_video_flag = not self.export_video_flag
        if self.export_video_flag:
            # 如果开启导出,初始化视频类
            self.video_processed = cv2.VideoWriter(self.video_processed_dir, self.fourcc,
                                     self.fps, (self.frame_width, self.frame_height))
        if not self.export_video_flag:
            self.video_processed.release()


    def __video_loop__(self):
        """程序主界面播放视频"""
        while self.is_running and self.video_cap.isOpened():
            success, frame = self.video_cap.read()
            if success:
                # 实时调用电脑摄像头捕获
                if self.live_video_flag:
                    self.frame = cv2.flip(cv2.resize( cv2.cvtColor(frame,
                                cv2.COLOR_BGR2RGB), (500, 400)) ,1)
                    # 跟踪无人机
                    if self.track_video_flag:
                        self.frame, _ = decoder(self.yolo_model, self.frame)
                    # 导出无人机视频画面
                    if self.export_video_flag:
                        self.frame = cv2.resize( cv2.cvtColor(self.frame, cv2.COLOR_BGR2RGB),
                                                (self.frame_width, self.frame_height))
                        self.video_processed.write(self.frame)
                        text ="视频跟踪: 对视频进行无人机跟踪\n并将无人机以边框的形势展示。\n无人机视频跟踪中......\n视频导出中......"
                        self.message_label.config(text=text)

                # 调用用户自定义视频捕获
                elif self.import_video_flag:
                    self.frame = cv2.resize( cv2.cvtColor(frame, cv2.COLOR_BGR2RGB),
                                            (self.frame_width, self.frame_height))
                    # 跟踪无人机
                    if self.track_video_flag:
                        self.frame, self.xyxy = decoder(self.yolo_model, self.frame)
                        # if self.xyxy is not None:
                        #     self.lost_frame_num = 0
                        #     if self.last_xyxy is not None:
                        #         # 计算差值
                        #         self.dx = self.last_xyxy[0] - self.xyxy[0]
                        #         self.dy = self.last_xyxy[1] - self.xyxy[1]
                        #     self.last_xyxy = self.xyxy
                        # if self.xyxy is None:
                        #     self.lost_frame_num += 1
                        #     # 确保坐标为整数
                        #     pt1 = (int(self.last_xyxy[0] + self.dx*self.lost_frame_num), int(self.last_xyxy[1] + self.dy*self.lost_frame_num))
                        #     pt2 = (int(self.last_xyxy[2] + self.dx*self.lost_frame_num), int(self.last_xyxy[3] + self.dy*self.lost_frame_num))
                        #     cv2.rectangle(self.frame, pt1, pt2, (0, 255, 0), -1, cv2.LINE_AA)
                        #     # 动态计算tl的值
                        #     tl = round(0.002 * (self.frame.shape[0] + self.frame.shape[1]) / 2) + 1 if round(0.002 * (self.frame.shape[0] + self.frame.shape[1]) / 2) + 1 > 3 else 3
                        #     tf = max(tl - 1, 1)
                        #     cv2.putText(self.frame, f'drone: 0.9', (int(self.last_xyxy[0]), int(self.last_xyxy[1]) - 2), 0, tl / 3, [225, 255, 255], thickness=tf, lineType=cv2.LINE_AA)
                    # 导出无人机视频画面
                    if self.export_video_flag:
                        self.frame = cv2.resize( cv2.cvtColor(self.frame, cv2.COLOR_BGR2RGB),
                                                (self.frame_width, self.frame_height))
                        self.video_processed.write(self.frame)
                        text ="视频跟踪: 对视频进行无人机跟踪\n并将无人机以边框的形势展示。\n无人机视频跟踪中......\n视频导出中......"
                        self.message_label.config(text=text)

                # 计算直方图以及频谱图并显示
                hist_image = ComputeHistogramImage(cv2.cvtColor(self.frame, cv2.COLOR_BGR2RGB))
                spec_image = CalculateSpectrogramImage(self.frame)
                self.__show_frame__(hist_image=hist_image, spec_image=spec_image)
            else: break
            self.root.update_idletasks()

    def __show_frame__(self, hist_image=None, spec_image=None):
        """固定在self.video_label上显示视频"""
        img_fromarray  = Image.fromarray(self.frame)
        imgtk = ImageTk.PhotoImage(image=img_fromarray)
        self.video_label.config(image=imgtk)
        self.video_label.image = imgtk
        # 绘制直方图和频谱图
        if hist_image is not None:
            hist_image = ImageTk.PhotoImage(image=Image.fromarray(hist_image))
            self.histogram_label.config(image=hist_image)
            self.histogram_label.image = hist_image
        if spec_image is not None:
            spec_image = ImageTk.PhotoImage(image=Image.fromarray(spec_image))
            self.spectrogram_label.config(image=spec_image)
            self.spectrogram_label.image = spec_image
        self.root.after(20)


################################  Main entry point  #############################
if __name__ == "__main__":
    # Create the Tk window, attach the GUI to it and enter the event loop.
    root = tk.Tk()
    app = OSTrackGUI(root=root)
    app.mainloop()