Исправление бага с размерностью при обучении

обновил .gitignore
анализ логов nn_inference
10 changed files with 2057 additions and 12 deletions
--- a/.gitignore
+++ b/.gitignore
@ -188,4 +188,6 @@ runtime/
 /.venv-*/*
-/train_scripts/models
+/train_scripts/models
 logs/nn_results_*.csv
--- a/NN_server/Model.py
+++ b/NN_server/Model.py
@ -262,6 +262,7 @@ class Model(object):
            print('Инференс' + self._shablon)
            prediction, probability = self._inference_func(data=self._data, model=self._model, mapping=self._classes,
                                                           shablon=self._shablon)
            print('RESULT' + self._shablon + ': ' + str(prediction) + ' (probability=' + str(probability) + ')')
            Model._add_in_result_list(type_model=self._type_model, ind_inference=self.get_ind_inference(), list_to_add=[prediction, probability])
            self._post_data(prediction=prediction)
--- a/NN_server/Models/ensemble_1200_v44.py
+++ b/NN_server/Models/ensemble_1200_v44.py
@ -0,0 +1,197 @@
 from torchvision import models
 import torch.nn as nn
 import matplotlib
 import numpy as np
 import torch
 import cv2
 import gc
 import io
 def _render_plot(values, figsize=(16, 16), dpi=16):
    import matplotlib.pyplot as plt
    fig = plt.figure(figsize=figsize)
    plt.axes(ylim=(-1, 1))
    plt.plot(values, color="black")
    plt.gca().set_axis_off()
    plt.subplots_adjust(top=1, bottom=0, right=1, left=0, hspace=0, wspace=0)
    plt.margins(0, 0)
    buf = io.BytesIO()
    fig.savefig(buf, format="png", dpi=dpi)
    buf.seek(0)
    img_arr = np.frombuffer(buf.getvalue(), dtype=np.uint8)
    buf.close()
    img = cv2.imdecode(img_arr, 1)
    if img is None:
        raise RuntimeError("failed to decode plot image")
    plt.clf()
    plt.cla()
    plt.close()
    plt.close(fig)
    return np.asarray(cv2.split(img), dtype=np.float32)
 def pre_func_ensemble(data=None, src="", ind_inference=0):
    try:
        import matplotlib.pyplot as plt
        matplotlib.use("Agg")
        plt.ioff()
        real = np.asarray(data[0], dtype=np.float32)
        imag = np.asarray(data[1], dtype=np.float32)
        signal = real + 1j * imag
        img_real = _render_plot(signal.real)
        img_mag = _render_plot(np.abs(signal))
        cv2.destroyAllWindows()
        gc.collect()
        print("Подготовка данных завершена")
        print()
        return [img_real, img_mag]
    except Exception as exc:
        print(str(exc))
        return None
 def build_func_ensemble(file_model="", file_config="", num_classes=None):
    try:
        import matplotlib.pyplot as plt
        matplotlib.use("Agg")
        plt.ioff()
        torch.cuda.empty_cache()
        num_classes = 2
        model1 = models.resnet18(pretrained=False)
        model2 = models.resnet50(pretrained=False)
        model1.fc = nn.Linear(model1.fc.in_features, num_classes)
        model2.fc = nn.Linear(model2.fc.in_features, num_classes)
        class Ensemble(nn.Module):
            def __init__(self, model1, model2):
                super().__init__()
                self.model1 = model1
                self.model2 = model2
                self.fc = nn.Linear(2 * num_classes, num_classes)
            def forward(self, x):
                if isinstance(x, (list, tuple)):
                    x1 = x[0]
                    x2 = x[1] if len(x) > 1 else x[0]
                else:
                    x1 = x
                    x2 = x
                y1 = self.model1(x1)
                y2 = self.model2(x2)
                y = torch.cat((y1, y2), dim=1)
                return self.fc(y)
        model = Ensemble(model1, model2)
        device = "cuda" if torch.cuda.is_available() else "cpu"
        if device != "cpu":
            model = model.to(device)
        model.load_state_dict(torch.load(file_model, map_location=device))
        model.eval()
        cv2.destroyAllWindows()
        gc.collect()
        print("Инициализация модели завершена")
        print()
        return model
    except Exception as exc:
        print(str(exc))
        return None
 def inference_func_ensemble(data=None, model=None, mapping=None, shablon=""):
    try:
        cv2.destroyAllWindows()
        gc.collect()
        torch.cuda.empty_cache()
        device = "cuda" if torch.cuda.is_available() else "cpu"
        if isinstance(data, (list, tuple)) and len(data) >= 2:
            inputs = [
                torch.unsqueeze(torch.tensor(data[0]).cpu(), 0).to(device).float(),
                torch.unsqueeze(torch.tensor(data[1]).cpu(), 0).to(device).float(),
            ]
        else:
            tensor = torch.unsqueeze(torch.tensor(data).cpu(), 0).to(device).float()
            inputs = [tensor, tensor]
        with torch.no_grad():
            output = model(inputs)
            _, predict = torch.max(output.data, 1)
        prediction = mapping[int(np.asarray(predict.cpu())[0])]
        print("PREDICTION" + shablon + ": " + prediction)
        output = output.cpu()
        label = np.asarray(np.argmax(output, axis=1))[0]
        output = np.asarray(torch.squeeze(output, 0))
        expon = np.exp(output - np.max(output))
        probability = round((expon / expon.sum())[label], 2)
        cv2.destroyAllWindows()
        gc.collect()
        print("Уверенность" + shablon + " в предсказании: " + str(probability))
        print("Инференс завершен")
        print()
        return [prediction, probability]
    except Exception as exc:
        print(str(exc))
        return None
 def post_func_ensemble(src="", model_type="", prediction="", model_id=0, ind_inference=0, data=None):
    try:
        import matplotlib.pyplot as plt
        matplotlib.use("Agg")
        plt.ioff()
        if int(ind_inference) <= 100 and isinstance(data, (list, tuple)) and len(data) >= 2:
            fig, ax = plt.subplots()
            ax.imshow(np.moveaxis(data[0], 0, -1))
            plt.savefig(src + "_inference_" + str(ind_inference) + "_" + prediction + "_real_" + str(model_id) + "_" + model_type + ".png")
            plt.clf()
            plt.cla()
            plt.close(fig)
            cv2.destroyAllWindows()
            gc.collect()
            fig, ax = plt.subplots()
            ax.imshow(np.moveaxis(data[1], 0, -1))
            plt.savefig(src + "_inference_" + str(ind_inference) + "_" + prediction + "_mod_" + str(model_id) + "_" + model_type + ".png")
            plt.clf()
            plt.cla()
            plt.close(fig)
            cv2.destroyAllWindows()
            gc.collect()
        plt.clf()
        plt.cla()
        plt.close()
        cv2.destroyAllWindows()
        gc.collect()
        print("Постобработка завершена")
        print()
    except Exception as exc:
        print(str(exc))
        return None
--- a/NN_server/Models/ensemble_2400_v44.py
+++ b/NN_server/Models/ensemble_2400_v44.py
@ -0,0 +1,197 @@
 from torchvision import models
 import torch.nn as nn
 import matplotlib
 import numpy as np
 import torch
 import cv2
 import gc
 import io
 def _render_plot(values, figsize=(16, 16), dpi=16):
    import matplotlib.pyplot as plt
    fig = plt.figure(figsize=figsize)
    plt.axes(ylim=(-1, 1))
    plt.plot(values, color="black")
    plt.gca().set_axis_off()
    plt.subplots_adjust(top=1, bottom=0, right=1, left=0, hspace=0, wspace=0)
    plt.margins(0, 0)
    buf = io.BytesIO()
    fig.savefig(buf, format="png", dpi=dpi)
    buf.seek(0)
    img_arr = np.frombuffer(buf.getvalue(), dtype=np.uint8)
    buf.close()
    img = cv2.imdecode(img_arr, 1)
    if img is None:
        raise RuntimeError("failed to decode plot image")
    plt.clf()
    plt.cla()
    plt.close()
    plt.close(fig)
    return np.asarray(cv2.split(img), dtype=np.float32)
 def pre_func_ensemble(data=None, src="", ind_inference=0):
    try:
        import matplotlib.pyplot as plt
        matplotlib.use("Agg")
        plt.ioff()
        real = np.asarray(data[0], dtype=np.float32)
        imag = np.asarray(data[1], dtype=np.float32)
        signal = real + 1j * imag
        img_real = _render_plot(signal.real)
        img_mag = _render_plot(np.abs(signal))
        cv2.destroyAllWindows()
        gc.collect()
        print("Подготовка данных завершена")
        print()
        return [img_real, img_mag]
    except Exception as exc:
        print(str(exc))
        return None
 def build_func_ensemble(file_model="", file_config="", num_classes=None):
    try:
        import matplotlib.pyplot as plt
        matplotlib.use("Agg")
        plt.ioff()
        torch.cuda.empty_cache()
        num_classes = 2
        model1 = models.resnet18(pretrained=False)
        model2 = models.resnet50(pretrained=False)
        model1.fc = nn.Linear(model1.fc.in_features, num_classes)
        model2.fc = nn.Linear(model2.fc.in_features, num_classes)
        class Ensemble(nn.Module):
            def __init__(self, model1, model2):
                super().__init__()
                self.model1 = model1
                self.model2 = model2
                self.fc = nn.Linear(2 * num_classes, num_classes)
            def forward(self, x):
                if isinstance(x, (list, tuple)):
                    x1 = x[0]
                    x2 = x[1] if len(x) > 1 else x[0]
                else:
                    x1 = x
                    x2 = x
                y1 = self.model1(x1)
                y2 = self.model2(x2)
                y = torch.cat((y1, y2), dim=1)
                return self.fc(y)
        model = Ensemble(model1, model2)
        device = "cuda" if torch.cuda.is_available() else "cpu"
        if device != "cpu":
            model = model.to(device)
        model.load_state_dict(torch.load(file_model, map_location=device))
        model.eval()
        cv2.destroyAllWindows()
        gc.collect()
        print("Инициализация модели завершена")
        print()
        return model
    except Exception as exc:
        print(str(exc))
        return None
 def inference_func_ensemble(data=None, model=None, mapping=None, shablon=""):
    try:
        cv2.destroyAllWindows()
        gc.collect()
        torch.cuda.empty_cache()
        device = "cuda" if torch.cuda.is_available() else "cpu"
        if isinstance(data, (list, tuple)) and len(data) >= 2:
            inputs = [
                torch.unsqueeze(torch.tensor(data[0]).cpu(), 0).to(device).float(),
                torch.unsqueeze(torch.tensor(data[1]).cpu(), 0).to(device).float(),
            ]
        else:
            tensor = torch.unsqueeze(torch.tensor(data).cpu(), 0).to(device).float()
            inputs = [tensor, tensor]
        with torch.no_grad():
            output = model(inputs)
            _, predict = torch.max(output.data, 1)
        prediction = mapping[int(np.asarray(predict.cpu())[0])]
        print("PREDICTION" + shablon + ": " + prediction)
        output = output.cpu()
        label = np.asarray(np.argmax(output, axis=1))[0]
        output = np.asarray(torch.squeeze(output, 0))
        expon = np.exp(output - np.max(output))
        probability = round((expon / expon.sum())[label], 2)
        cv2.destroyAllWindows()
        gc.collect()
        print("Уверенность" + shablon + " в предсказании: " + str(probability))
        print("Инференс завершен")
        print()
        return [prediction, probability]
    except Exception as exc:
        print(str(exc))
        return None
 def post_func_ensemble(src="", model_type="", prediction="", model_id=0, ind_inference=0, data=None):
    try:
        import matplotlib.pyplot as plt
        matplotlib.use("Agg")
        plt.ioff()
        if int(ind_inference) <= 100 and isinstance(data, (list, tuple)) and len(data) >= 2:
            fig, ax = plt.subplots()
            ax.imshow(np.moveaxis(data[0], 0, -1))
            plt.savefig(src + "_inference_" + str(ind_inference) + "_" + prediction + "_real_" + str(model_id) + "_" + model_type + ".png")
            plt.clf()
            plt.cla()
            plt.close(fig)
            cv2.destroyAllWindows()
            gc.collect()
            fig, ax = plt.subplots()
            ax.imshow(np.moveaxis(data[1], 0, -1))
            plt.savefig(src + "_inference_" + str(ind_inference) + "_" + prediction + "_mod_" + str(model_id) + "_" + model_type + ".png")
            plt.clf()
            plt.cla()
            plt.close(fig)
            cv2.destroyAllWindows()
            gc.collect()
        plt.clf()
        plt.cla()
        plt.close()
        cv2.destroyAllWindows()
        gc.collect()
        print("Постобработка завершена")
        print()
    except Exception as exc:
        print(str(exc))
        return None
--- a/NN_server/server.py
+++ b/NN_server/server.py
@ -137,19 +137,29 @@ def receive_data():
                print()
                try:
                    result = 0
-                    if (int(freq) == 2400 and (prediction_list[0] in ['drone', 'drone_noise'] or (prediction_list[0] == 'wifi' and float(probability) >= 0.95))) or (int(freq) == 1200 and (prediction_list[0] in ['drone'] and float(probability) >= 0.95)):
+                    freq_int = int(freq)
-                        result += 0
+                    prediction = prediction_list[0]
-                    if int(freq) in [915]:
+                    prob = float(probability)
-                        result = 0
+
-                    if int(freq) in []:
+                    if freq_int == 2400:
                        if prediction in ["drone", "drone_noise"]:
                            result += 0
                        elif prediction == "wifi" and prob >= 0.95:
                            result += 0
                    elif freq_int == 1200:
                        if prediction == "drone" and prob >= 0.95:
                            result += 8
                    elif freq_int == 915:
                        result = 0
-                    data_to_send={
+
-                        'freq': str(freq),
+                    data_to_send = {
-                        'amplitude': result
+                        "freq": str(freq),
-                        #'triggered': False if result < 7 else True,
+                        "amplitude": result,
-                        #'light_len': result
+                    }
                        }
                    response = requests.post("http://{0}:{1}/process_data".format(gen_server_ip, gen_server_port), json=data_to_send)
                    if response.status_code == 200:
                        print("Данные успешно отправлены!")
--- a/deploy/docker/docker-compose.yml
+++ b/deploy/docker/docker-compose.yml
@ -20,6 +20,7 @@ services:
      - ../../runtime:/app/runtime
      - ../../src:/app/src
      - ../../common:/app/common
      - ../../train_scripts:/app/train_scripts:ro
    networks:
      - dronedetector-net
    extra_hosts:
@ -50,6 +51,7 @@ services:
      - ../../.env:/app/.env:ro
      - ../../NN_server:/app/NN_server
      - ../../common:/app/common
      - ../../train_scripts:/app/train_scripts:ro
    gpus: all
    networks:
      - dronedetector-net
--- a/logs/analysis.ipynb
+++ b/logs/analysis.ipynb
@ -0,0 +1,673 @@
 {
 "cells": [
  {
   "cell_type": "markdown",
   "id": "215a6c3a",
   "metadata": {},
   "source": [
    "# NN inference analysis\n",
    "\n",
    "Анализ CSV с результатами инференса: доля класса `drone`, частоты срабатываний, уверенность модели и интервалы между `drone`-классификациями."
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 30,
   "id": "4e8cff32",
   "metadata": {},
   "outputs": [
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "CSV path: /home/sibscience-4/from_ssh/DroneDetector/logs/nn_results_live_6gb.csv\n",
      "Rows: 27258\n",
      "Time range: 2026-05-04 17:35:21.019627763+07:00 -> 2026-05-05 12:17:19.369858371+07:00\n",
      "Missing freq rows: 0\n"
     ]
    },
    {
     "data": {
      "text/html": [
       "<div>\n",
       "<style scoped>\n",
       "    .dataframe tbody tr th:only-of-type {\n",
       "        vertical-align: middle;\n",
       "    }\n",
       "\n",
       "    .dataframe tbody tr th {\n",
       "        vertical-align: top;\n",
       "    }\n",
       "\n",
       "    .dataframe thead th {\n",
       "        text-align: right;\n",
       "    }\n",
       "</style>\n",
       "<table border=\"1\" class=\"dataframe\">\n",
       "  <thead>\n",
       "    <tr style=\"text-align: right;\">\n",
       "      <th></th>\n",
       "      <th>docker_timestamp</th>\n",
       "      <th>event_time_iso</th>\n",
       "      <th>event_time_epoch</th>\n",
       "      <th>freq</th>\n",
       "      <th>model_id</th>\n",
       "      <th>model_type</th>\n",
       "      <th>prediction</th>\n",
       "      <th>probability</th>\n",
       "      <th>ts</th>\n",
       "      <th>local_time</th>\n",
       "    </tr>\n",
       "  </thead>\n",
       "  <tbody>\n",
       "    <tr>\n",
       "      <th>0</th>\n",
       "      <td>2026-05-04T10:35:21.019627763Z</td>\n",
       "      <td>2026-05-04T17:35:21+07:00</td>\n",
       "      <td>1.777891e+09</td>\n",
       "      <td>2400</td>\n",
       "      <td>2</td>\n",
       "      <td>ensemble_2400_v44</td>\n",
       "      <td>drone</td>\n",
       "      <td>0.99</td>\n",
       "      <td>2026-05-04 10:35:21.019627763+00:00</td>\n",
       "      <td>2026-05-04 17:35:21.019627763+07:00</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>1</th>\n",
       "      <td>2026-05-04T10:35:21.019631281Z</td>\n",
       "      <td>2026-05-04T17:35:21+07:00</td>\n",
       "      <td>1.777891e+09</td>\n",
       "      <td>1200</td>\n",
       "      <td>1</td>\n",
       "      <td>ensemble_1200_v44</td>\n",
       "      <td>noise</td>\n",
       "      <td>1.00</td>\n",
       "      <td>2026-05-04 10:35:21.019631281+00:00</td>\n",
       "      <td>2026-05-04 17:35:21.019631281+07:00</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>2</th>\n",
       "      <td>2026-05-04T10:35:27.048188525Z</td>\n",
       "      <td>2026-05-04T17:35:27+07:00</td>\n",
       "      <td>1.777891e+09</td>\n",
       "      <td>2400</td>\n",
       "      <td>2</td>\n",
       "      <td>ensemble_2400_v44</td>\n",
       "      <td>drone</td>\n",
       "      <td>0.99</td>\n",
       "      <td>2026-05-04 10:35:27.048188525+00:00</td>\n",
       "      <td>2026-05-04 17:35:27.048188525+07:00</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>3</th>\n",
       "      <td>2026-05-04T10:35:29.238925690Z</td>\n",
       "      <td>2026-05-04T17:35:29+07:00</td>\n",
       "      <td>1.777891e+09</td>\n",
       "      <td>1200</td>\n",
       "      <td>1</td>\n",
       "      <td>ensemble_1200_v44</td>\n",
       "      <td>noise</td>\n",
       "      <td>1.00</td>\n",
       "      <td>2026-05-04 10:35:29.238925690+00:00</td>\n",
       "      <td>2026-05-04 17:35:29.238925690+07:00</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>4</th>\n",
       "      <td>2026-05-04T10:35:32.842234116Z</td>\n",
       "      <td>2026-05-04T17:35:32+07:00</td>\n",
       "      <td>1.777891e+09</td>\n",
       "      <td>2400</td>\n",
       "      <td>2</td>\n",
       "      <td>ensemble_2400_v44</td>\n",
       "      <td>drone</td>\n",
       "      <td>0.92</td>\n",
       "      <td>2026-05-04 10:35:32.842234116+00:00</td>\n",
       "      <td>2026-05-04 17:35:32.842234116+07:00</td>\n",
       "    </tr>\n",
       "  </tbody>\n",
       "</table>\n",
       "</div>"
      ],
      "text/plain": [
       "                 docker_timestamp             event_time_iso  \\\n",
       "0  2026-05-04T10:35:21.019627763Z  2026-05-04T17:35:21+07:00   \n",
       "1  2026-05-04T10:35:21.019631281Z  2026-05-04T17:35:21+07:00   \n",
       "2  2026-05-04T10:35:27.048188525Z  2026-05-04T17:35:27+07:00   \n",
       "3  2026-05-04T10:35:29.238925690Z  2026-05-04T17:35:29+07:00   \n",
       "4  2026-05-04T10:35:32.842234116Z  2026-05-04T17:35:32+07:00   \n",
       "\n",
       "   event_time_epoch  freq  model_id         model_type prediction  \\\n",
       "0      1.777891e+09  2400         2  ensemble_2400_v44      drone   \n",
       "1      1.777891e+09  1200         1  ensemble_1200_v44      noise   \n",
       "2      1.777891e+09  2400         2  ensemble_2400_v44      drone   \n",
       "3      1.777891e+09  1200         1  ensemble_1200_v44      noise   \n",
       "4      1.777891e+09  2400         2  ensemble_2400_v44      drone   \n",
       "\n",
       "   probability                                  ts  \\\n",
       "0         0.99 2026-05-04 10:35:21.019627763+00:00   \n",
       "1         1.00 2026-05-04 10:35:21.019631281+00:00   \n",
       "2         0.99 2026-05-04 10:35:27.048188525+00:00   \n",
       "3         1.00 2026-05-04 10:35:29.238925690+00:00   \n",
       "4         0.92 2026-05-04 10:35:32.842234116+00:00   \n",
       "\n",
       "                           local_time  \n",
       "0 2026-05-04 17:35:21.019627763+07:00  \n",
       "1 2026-05-04 17:35:21.019631281+07:00  \n",
       "2 2026-05-04 17:35:27.048188525+07:00  \n",
       "3 2026-05-04 17:35:29.238925690+07:00  \n",
       "4 2026-05-04 17:35:32.842234116+07:00  "
      ]
     },
     "metadata": {},
     "output_type": "display_data"
    }
   ],
   "source": [
    "from pathlib import Path\n",
    "import pandas as pd\n",
    "\n",
    "csv_path = Path('/home/sibscience-4/from_ssh/DroneDetector/logs/nn_results_live_6gb.csv')\n",
    "df = pd.read_csv(csv_path)\n",
    "\n",
    "df['ts'] = pd.to_datetime(df['docker_timestamp'], utc=True)\n",
    "df['local_time'] = df['ts'].dt.tz_convert('Asia/Novosibirsk')\n",
    "df['freq'] = pd.to_numeric(df['freq'], errors='coerce').astype('Int64')\n",
    "df['probability'] = pd.to_numeric(df['probability'], errors='coerce')\n",
    "df = df.sort_values('ts').reset_index(drop=True)\n",
    "\n",
    "print(f'CSV path: {csv_path}')\n",
    "print(f'Rows: {len(df)}')\n",
    "print(f'Time range: {df[\"local_time\"].min()} -> {df[\"local_time\"].max()}')\n",
    "print(f'Missing freq rows: {df[\"freq\"].isna().sum()}')\n",
    "display(df.head())"
   ]
  },
  {
   "cell_type": "markdown",
   "id": "0fcc6dd6",
   "metadata": {},
   "source": [
    "## Общая сводка по частотам и классам"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 31,
   "id": "7bf0fc3f",
   "metadata": {},
   "outputs": [
    {
     "data": {
      "text/html": [
       "<div>\n",
       "<style scoped>\n",
       "    .dataframe tbody tr th:only-of-type {\n",
       "        vertical-align: middle;\n",
       "    }\n",
       "\n",
       "    .dataframe tbody tr th {\n",
       "        vertical-align: top;\n",
       "    }\n",
       "\n",
       "    .dataframe thead th {\n",
       "        text-align: right;\n",
       "    }\n",
       "</style>\n",
       "<table border=\"1\" class=\"dataframe\">\n",
       "  <thead>\n",
       "    <tr style=\"text-align: right;\">\n",
       "      <th></th>\n",
       "      <th>freq</th>\n",
       "      <th>prediction</th>\n",
       "      <th>count</th>\n",
       "      <th>avg_probability</th>\n",
       "      <th>min_probability</th>\n",
       "      <th>max_probability</th>\n",
       "      <th>freq_total</th>\n",
       "      <th>class_rate</th>\n",
       "    </tr>\n",
       "  </thead>\n",
       "  <tbody>\n",
       "    <tr>\n",
       "      <th>0</th>\n",
       "      <td>1200</td>\n",
       "      <td>drone</td>\n",
       "      <td>3</td>\n",
       "      <td>0.840000</td>\n",
       "      <td>0.78</td>\n",
       "      <td>0.91</td>\n",
       "      <td>13632</td>\n",
       "      <td>0.000220</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>1</th>\n",
       "      <td>1200</td>\n",
       "      <td>noise</td>\n",
       "      <td>13629</td>\n",
       "      <td>0.997436</td>\n",
       "      <td>0.91</td>\n",
       "      <td>1.00</td>\n",
       "      <td>13632</td>\n",
       "      <td>0.999780</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>2</th>\n",
       "      <td>2400</td>\n",
       "      <td>drone</td>\n",
       "      <td>11921</td>\n",
       "      <td>0.868013</td>\n",
       "      <td>0.50</td>\n",
       "      <td>1.00</td>\n",
       "      <td>13626</td>\n",
       "      <td>0.874872</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>3</th>\n",
       "      <td>2400</td>\n",
       "      <td>noise</td>\n",
       "      <td>1705</td>\n",
       "      <td>0.649185</td>\n",
       "      <td>0.50</td>\n",
       "      <td>1.00</td>\n",
       "      <td>13626</td>\n",
       "      <td>0.125128</td>\n",
       "    </tr>\n",
       "  </tbody>\n",
       "</table>\n",
       "</div>"
      ],
      "text/plain": [
       "   freq prediction  count  avg_probability  min_probability  max_probability  \\\n",
       "0  1200      drone      3         0.840000             0.78             0.91   \n",
       "1  1200      noise  13629         0.997436             0.91             1.00   \n",
       "2  2400      drone  11921         0.868013             0.50             1.00   \n",
       "3  2400      noise   1705         0.649185             0.50             1.00   \n",
       "\n",
       "   freq_total  class_rate  \n",
       "0       13632    0.000220  \n",
       "1       13632    0.999780  \n",
       "2       13626    0.874872  \n",
       "3       13626    0.125128  "
      ]
     },
     "metadata": {},
     "output_type": "display_data"
    }
   ],
   "source": [
    "class_summary = (\n",
    "    df.groupby(['freq', 'prediction'], dropna=False)\n",
    "      .agg(\n",
    "          count=('prediction', 'size'),\n",
    "          avg_probability=('probability', 'mean'),\n",
    "          min_probability=('probability', 'min'),\n",
    "          max_probability=('probability', 'max'),\n",
    "      )\n",
    "      .reset_index()\n",
    ")\n",
    "\n",
    "freq_total = df.groupby('freq', dropna=False).size().rename('freq_total').reset_index()\n",
    "class_summary = class_summary.merge(freq_total, on='freq', how='left')\n",
    "class_summary['class_rate'] = class_summary['count'] / class_summary['freq_total']\n",
    "class_summary = class_summary.sort_values(['freq', 'prediction']).reset_index(drop=True)\n",
    "\n",
    "display(class_summary)"
   ]
  },
  {
   "cell_type": "markdown",
   "id": "039fcfa6",
   "metadata": {},
   "source": [
    "## Статистика по классу drone"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 32,
   "id": "c1ed2bc4",
   "metadata": {},
   "outputs": [
    {
     "data": {
      "text/html": [
       "<div>\n",
       "<style scoped>\n",
       "    .dataframe tbody tr th:only-of-type {\n",
       "        vertical-align: middle;\n",
       "    }\n",
       "\n",
       "    .dataframe tbody tr th {\n",
       "        vertical-align: top;\n",
       "    }\n",
       "\n",
       "    .dataframe thead th {\n",
       "        text-align: right;\n",
       "    }\n",
       "</style>\n",
       "<table border=\"1\" class=\"dataframe\">\n",
       "  <thead>\n",
       "    <tr style=\"text-align: right;\">\n",
       "      <th></th>\n",
       "      <th>freq</th>\n",
       "      <th>total_inferences</th>\n",
       "      <th>drone_count</th>\n",
       "      <th>avg_drone_probability</th>\n",
       "      <th>median_drone_probability</th>\n",
       "      <th>min_drone_probability</th>\n",
       "      <th>max_drone_probability</th>\n",
       "      <th>first_drone_time</th>\n",
       "      <th>last_drone_time</th>\n",
       "      <th>drone_rate</th>\n",
       "      <th>dataset_duration_min</th>\n",
       "      <th>drone_per_min</th>\n",
       "    </tr>\n",
       "  </thead>\n",
       "  <tbody>\n",
       "    <tr>\n",
       "      <th>0</th>\n",
       "      <td>1200</td>\n",
       "      <td>13632</td>\n",
       "      <td>3</td>\n",
       "      <td>0.840000</td>\n",
       "      <td>0.83</td>\n",
       "      <td>0.78</td>\n",
       "      <td>0.91</td>\n",
       "      <td>2026-05-05 03:18:55.374394280+07:00</td>\n",
       "      <td>2026-05-05 08:39:23.676669045+07:00</td>\n",
       "      <td>0.000220</td>\n",
       "      <td>1121.972504</td>\n",
       "      <td>0.002674</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>1</th>\n",
       "      <td>2400</td>\n",
       "      <td>13626</td>\n",
       "      <td>11921</td>\n",
       "      <td>0.868013</td>\n",
       "      <td>0.93</td>\n",
       "      <td>0.50</td>\n",
       "      <td>1.00</td>\n",
       "      <td>2026-05-04 17:35:21.019627763+07:00</td>\n",
       "      <td>2026-05-05 12:17:19.369858371+07:00</td>\n",
       "      <td>0.874872</td>\n",
       "      <td>1121.972504</td>\n",
       "      <td>10.625038</td>\n",
       "    </tr>\n",
       "  </tbody>\n",
       "</table>\n",
       "</div>"
      ],
      "text/plain": [
       "   freq  total_inferences  drone_count  avg_drone_probability  \\\n",
       "0  1200             13632            3               0.840000   \n",
       "1  2400             13626        11921               0.868013   \n",
       "\n",
       "   median_drone_probability  min_drone_probability  max_drone_probability  \\\n",
       "0                      0.83                   0.78                   0.91   \n",
       "1                      0.93                   0.50                   1.00   \n",
       "\n",
       "                     first_drone_time                     last_drone_time  \\\n",
       "0 2026-05-05 03:18:55.374394280+07:00 2026-05-05 08:39:23.676669045+07:00   \n",
       "1 2026-05-04 17:35:21.019627763+07:00 2026-05-05 12:17:19.369858371+07:00   \n",
       "\n",
       "   drone_rate  dataset_duration_min  drone_per_min  \n",
       "0    0.000220           1121.972504       0.002674  \n",
       "1    0.874872           1121.972504      10.625038  "
      ]
     },
     "metadata": {},
     "output_type": "display_data"
    }
   ],
   "source": [
    "drone = df[df['prediction'].eq('drone')].copy()\n",
    "\n",
    "total_by_freq = df.groupby('freq', dropna=False).size().rename('total_inferences')\n",
    "drone_by_freq = drone.groupby('freq', dropna=False).agg(\n",
    "    drone_count=('prediction', 'size'),\n",
    "    avg_drone_probability=('probability', 'mean'),\n",
    "    median_drone_probability=('probability', 'median'),\n",
    "    min_drone_probability=('probability', 'min'),\n",
    "    max_drone_probability=('probability', 'max'),\n",
    "    first_drone_time=('local_time', 'min'),\n",
    "    last_drone_time=('local_time', 'max'),\n",
    ")\n",
    "\n",
    "drone_stats = total_by_freq.to_frame().join(drone_by_freq, how='left').fillna({'drone_count': 0})\n",
    "drone_stats['drone_count'] = drone_stats['drone_count'].astype(int)\n",
    "drone_stats['drone_rate'] = drone_stats['drone_count'] / drone_stats['total_inferences']\n",
    "\n",
    "if len(df) > 1:\n",
    "    duration_min = (df['ts'].max() - df['ts'].min()).total_seconds() / 60\n",
    "else:\n",
    "    duration_min = 0\n",
    "\n",
    "drone_stats['dataset_duration_min'] = duration_min\n",
    "drone_stats['drone_per_min'] = drone_stats['drone_count'] / duration_min if duration_min > 0 else 0\n",
    "drone_stats = drone_stats.reset_index().sort_values('freq').reset_index(drop=True)\n",
    "\n",
    "display(drone_stats)"
   ]
  },
  {
   "cell_type": "markdown",
   "id": "56ae5e2b",
   "metadata": {},
   "source": [
    "## Интервалы между drone-классификациями"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 33,
   "id": "0c43eb07",
   "metadata": {},
   "outputs": [
    {
     "data": {
      "text/html": [
       "<div>\n",
       "<style scoped>\n",
       "    .dataframe tbody tr th:only-of-type {\n",
       "        vertical-align: middle;\n",
       "    }\n",
       "\n",
       "    .dataframe tbody tr th {\n",
       "        vertical-align: top;\n",
       "    }\n",
       "\n",
       "    .dataframe thead th {\n",
       "        text-align: right;\n",
       "    }\n",
       "</style>\n",
       "<table border=\"1\" class=\"dataframe\">\n",
       "  <thead>\n",
       "    <tr style=\"text-align: right;\">\n",
       "      <th></th>\n",
       "      <th>freq</th>\n",
       "      <th>interval_count</th>\n",
       "      <th>avg_interval_sec</th>\n",
       "      <th>median_interval_sec</th>\n",
       "      <th>min_interval_sec</th>\n",
       "      <th>max_interval_sec</th>\n",
       "      <th>p90_interval_sec</th>\n",
       "      <th>p95_interval_sec</th>\n",
       "    </tr>\n",
       "  </thead>\n",
       "  <tbody>\n",
       "    <tr>\n",
       "      <th>0</th>\n",
       "      <td>1200</td>\n",
       "      <td>2</td>\n",
       "      <td>9614.151137</td>\n",
       "      <td>9614.151137</td>\n",
       "      <td>619.196112</td>\n",
       "      <td>18609.106163</td>\n",
       "      <td>16810.115158</td>\n",
       "      <td>17709.610661</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>1</th>\n",
       "      <td>2400</td>\n",
       "      <td>11920</td>\n",
       "      <td>5.647513</td>\n",
       "      <td>4.974157</td>\n",
       "      <td>0.000000</td>\n",
       "      <td>1210.107950</td>\n",
       "      <td>9.203728</td>\n",
       "      <td>10.079097</td>\n",
       "    </tr>\n",
       "  </tbody>\n",
       "</table>\n",
       "</div>"
      ],
      "text/plain": [
       "   freq  interval_count  avg_interval_sec  median_interval_sec  \\\n",
       "0  1200               2       9614.151137          9614.151137   \n",
       "1  2400           11920          5.647513             4.974157   \n",
       "\n",
       "   min_interval_sec  max_interval_sec  p90_interval_sec  p95_interval_sec  \n",
       "0        619.196112      18609.106163      16810.115158      17709.610661  \n",
       "1          0.000000       1210.107950          9.203728         10.079097  "
      ]
     },
     "metadata": {},
     "output_type": "display_data"
    }
   ],
   "source": [
    "if drone.empty:\n",
    "    print('No drone predictions found')\n",
    "    drone_interval_stats = pd.DataFrame()\n",
    "else:\n",
    "    drone = drone.sort_values(['freq', 'ts']).copy()\n",
    "    drone['dt_drone_freq_sec'] = drone.groupby('freq')['ts'].diff().dt.total_seconds()\n",
    "    drone_interval_stats = (\n",
    "        drone.groupby('freq', dropna=False)['dt_drone_freq_sec']\n",
    "             .agg(\n",
    "                 interval_count='count',\n",
    "                 avg_interval_sec='mean',\n",
    "                 median_interval_sec='median',\n",
    "                 min_interval_sec='min',\n",
    "                 max_interval_sec='max',\n",
    "                 p90_interval_sec=lambda s: s.quantile(0.90),\n",
    "                 p95_interval_sec=lambda s: s.quantile(0.95),\n",
    "             )\n",
    "             .reset_index()\n",
    "    )\n",
    "    display(drone_interval_stats)"
   ]
  },
  {
   "cell_type": "markdown",
   "id": "2ecf96f0",
   "metadata": {},
   "source": [
    "## Drone-события"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "id": "ff14a339",
   "metadata": {},
   "outputs": [],
   "source": [
    "drone_events = drone[[\n",
    "    'local_time',\n",
    "    'docker_timestamp',\n",
    "    'freq',\n",
    "    'model_id',\n",
    "    'model_type',\n",
    "    'prediction',\n",
    "    'probability',\n",
    "]].sort_values('local_time').reset_index(drop=True)\n",
    "\n",
    "display(drone_events.head(50))\n",
    "display(drone_events.tail(50))"
   ]
  },
  {
   "cell_type": "markdown",
   "id": "376b84d0",
   "metadata": {},
   "source": [
    "## Частота drone-классификаций по минутам"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "id": "5f82f5c1",
   "metadata": {},
   "outputs": [],
   "source": [
    "if drone.empty:\n",
    "    print('No drone predictions found')\n",
    "else:\n",
    "    drone_per_minute = (\n",
    "        drone.set_index('local_time')\n",
    "             .groupby('freq')\n",
    "             .resample('1min')\n",
    "             .size()\n",
    "             .rename('drone_count')\n",
    "             .reset_index()\n",
    "    )\n",
    "    display(drone_per_minute.tail(100))\n",
    "\n",
    "    pivot = drone_per_minute.pivot_table(\n",
    "        index='local_time',\n",
    "        columns='freq',\n",
    "        values='drone_count',\n",
    "        fill_value=0,\n",
    "    )\n",
    "    display(pivot.tail(50))"
   ]
  },
  {
   "cell_type": "markdown",
   "id": "ad570d05",
   "metadata": {},
   "source": [
    "## Быстрые графики"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "id": "895550a1",
   "metadata": {},
   "outputs": [],
   "source": [
    "import matplotlib.pyplot as plt\n",
    "\n",
    "if not drone.empty:\n",
    "    ax = drone_stats.set_index('freq')['drone_rate'].plot(kind='bar', figsize=(8, 4), title='Drone rate by frequency')\n",
    "    ax.set_ylabel('drone_count / total_inferences')\n",
    "    plt.show()\n",
    "\n",
    "    ax = drone.boxplot(column='probability', by='freq', figsize=(8, 4))\n",
    "    ax.set_title('Drone probability by frequency')\n",
    "    ax.set_xlabel('freq')\n",
    "    ax.set_ylabel('probability')\n",
    "    plt.suptitle('')\n",
    "    plt.show()"
   ]
  }
 ],
 "metadata": {
  "kernelspec": {
   "display_name": "Python 3",
   "language": "python",
   "name": "python3"
  },
  "language_info": {
   "name": "python",
   "pygments_lexer": "ipython3"
  }
 },
 "nbformat": 4,
 "nbformat_minor": 5
 }
--- a/scripts/capture_nn_results.py
+++ b/scripts/capture_nn_results.py
@ -0,0 +1,223 @@
 #!/usr/bin/env python3
 import argparse
 import csv
 import json
 import os
 import re
 import subprocess
 import sys
 import time
 from datetime import datetime, timezone
 RESULT_RE = re.compile(
    r"^(?P<docker_ts>\S+)\s+RESULT Модель (?P<model_id>\d+) с типом (?P<model_type>.+?): "
    r"(?P<prediction>\S+) \(probability=(?P<probability>[-+]?\d+(?:\.\d+)?)\)\s*$"
 )
 FREQ_RE = re.compile(r"(\d{3,5})")
 def parse_args():
    parser = argparse.ArgumentParser(
        description="Capture NN inference RESULT logs into CSV or JSONL until time or size limit."
    )
    parser.add_argument(
        "--output",
        required=True,
        help="Output file path (.csv or .jsonl recommended).",
    )
    parser.add_argument(
        "--format",
        choices=("csv", "jsonl"),
        default="csv",
        help="Output format.",
    )
    parser.add_argument(
        "--minutes",
        type=float,
        default=0.0,
        help="Stop after this many minutes. 0 means no time limit.",
    )
    parser.add_argument(
        "--max-bytes",
        type=int,
        default=3 * 1024 * 1024 * 1024,
        help="Stop when output file reaches this size in bytes. Default: 3 GiB.",
    )
    parser.add_argument(
        "--since",
        default=None,
        help="Optional docker logs --since value, e.g. 20m, 2h, 2026-05-04T12:00:00.",
    )
    parser.add_argument(
        "--tail",
        type=int,
        default=0,
        help="How many previous log lines to include before following. Default: 0.",
    )
    parser.add_argument(
        "--compose-file",
        default="deploy/docker/docker-compose.yml",
        help="Path to docker compose file.",
    )
    parser.add_argument(
        "--service",
        default="dronedetector-nn-server",
        help="Docker compose service name.",
    )
    parser.add_argument(
        "--follow",
        action="store_true",
        help="Follow logs live. By default the script captures a finite history snapshot.",
    )
    return parser.parse_args()
 def extract_freq(model_type):
    matches = FREQ_RE.findall(model_type)
    if not matches:
        return ""
    known_freqs = {"433", "750", "868", "915", "1200", "1500", "2400", "3300", "4500", "5200", "5800"}
    for value in matches:
        if value in known_freqs:
            return value
    return matches[0]
 def parse_docker_timestamp(value):
    try:
        return datetime.fromisoformat(value.replace("Z", "+00:00"))
    except ValueError:
        return datetime.now(timezone.utc)
 def open_output(path, fmt):
    os.makedirs(os.path.dirname(os.path.abspath(path)), exist_ok=True)
    fh = open(path, "a", encoding="utf-8", newline="")
    writer = None
    if fmt == "csv":
        writer = csv.writer(fh)
        if fh.tell() == 0:
            writer.writerow(
                [
                    "docker_timestamp",
                    "event_time_iso",
                    "event_time_epoch",
                    "freq",
                    "model_id",
                    "model_type",
                    "prediction",
                    "probability",
                ]
            )
            fh.flush()
    return fh, writer
 def write_record(fh, writer, fmt, record):
    if fmt == "csv":
        writer.writerow(
            [
                record["docker_timestamp"],
                record["event_time_iso"],
                record["event_time_epoch"],
                record["freq"],
                record["model_id"],
                record["model_type"],
                record["prediction"],
                record["probability"],
            ]
        )
    else:
        fh.write(json.dumps(record, ensure_ascii=False) + "\n")
    fh.flush()
 def build_command(args):
    cmd = [
        "docker",
        "compose",
        "-f",
        args.compose_file,
        "logs",
        "--timestamps",
        "--no-log-prefix",
        args.service,
    ]
    if args.since:
        cmd[5:5] = ["--since", args.since]
    if int(args.tail) > 0:
        cmd[-1:-1] = ["--tail", str(args.tail)]
    if args.follow:
        cmd.insert(-1, "-f")
    return cmd
 def main():
    args = parse_args()
    deadline = time.time() + (args.minutes * 60.0) if args.minutes > 0 else None
    fh, writer = open_output(args.output, args.format)
    cmd = build_command(args)
    print("Running:", " ".join(cmd), file=sys.stderr)
    proc = subprocess.Popen(
        cmd,
        stdout=subprocess.PIPE,
        stderr=subprocess.STDOUT,
        text=True,
        encoding="utf-8",
        errors="replace",
        bufsize=1,
    )
    captured = 0
    try:
        assert proc.stdout is not None
        for line in proc.stdout:
            if deadline is not None and time.time() >= deadline:
                print("Stopping: time limit reached", file=sys.stderr)
                break
            match = RESULT_RE.match(line.rstrip("\n"))
            if not match:
                continue
            docker_dt = parse_docker_timestamp(match.group("docker_ts"))
            event_dt = docker_dt.astimezone()
            model_type = match.group("model_type")
            record = {
                "docker_timestamp": match.group("docker_ts"),
                "event_time_iso": event_dt.isoformat(timespec="seconds"),
                "event_time_epoch": round(docker_dt.timestamp(), 3),
                "freq": extract_freq(model_type),
                "model_id": int(match.group("model_id")),
                "model_type": model_type,
                "prediction": match.group("prediction"),
                "probability": float(match.group("probability")),
            }
            write_record(fh, writer, args.format, record)
            captured += 1
            if fh.tell() >= args.max_bytes:
                print("Stopping: file size limit reached", file=sys.stderr)
                break
    finally:
        try:
            proc.terminate()
        except Exception:
            pass
        try:
            proc.wait(timeout=5)
        except Exception:
            try:
                proc.kill()
            except Exception:
                pass
        fh.close()
    print(f"Captured {captured} inference results into {args.output}", file=sys.stderr)
 if __name__ == "__main__":
    main()
--- a/train_scripts/Training_models2pic_val_loss.ipynb
+++ b/train_scripts/Training_models2pic_val_loss.ipynb
@ -0,0 +1,523 @@
 {
 "cells": [
  {
   "cell_type": "code",
   "execution_count": 1,
   "id": "e1db882b",
   "metadata": {},
   "outputs": [
    {
     "name": "stderr",
     "output_type": "stream",
     "text": [
      "/home/sibscience-4/from_ssh/DroneDetector/.venv-train/lib/python3.12/site-packages/matplotlib/projections/__init__.py:63: UserWarning: Unable to import Axes3D. This may be due to multiple versions of Matplotlib being installed (e.g. as a system package and as a pip package). As a result, the 3D projection is not available.\n",
      "  warnings.warn(\"Unable to import Axes3D. This may be due to multiple versions of \"\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "cuda\n"
     ]
    },
    {
     "data": {
      "text/plain": [
       "220"
      ]
     },
     "execution_count": 1,
     "metadata": {},
     "output_type": "execute_result"
    }
   ],
   "source": [
    "from sklearn.model_selection import train_test_split\n",
    "from torch.utils.data import Dataset, DataLoader\n",
    "from torch import default_generator, randperm\n",
    "from torch.utils.data.dataset import Subset\n",
    "import torchvision.transforms as transforms\n",
    "from torchvision.io import read_image\n",
    "from importlib import import_module\n",
    "import matplotlib.pyplot as plt\n",
    "from torchvision import models\n",
    "import torch, torchvision\n",
    "from pathlib import Path\n",
    "from PIL import Image\n",
    "import torch.nn as nn\n",
    "from tqdm import tqdm\n",
    "import pandas as pd\n",
    "import numpy as np\n",
    "import matplotlib\n",
    "import os, shutil\n",
    "import mlconfig\n",
    "import random\n",
    "import shutil\n",
    "import timeit\n",
    "import copy\n",
    "import time\n",
    "import cv2\n",
    "import csv\n",
    "import sys\n",
    "import io\n",
    "import gc\n",
    "\n",
    "plt.rcParams[\"savefig.bbox\"] = 'tight'\n",
    "torch.manual_seed(1)\n",
    "#matplotlib.use('Agg')\n",
    "device = 'cuda' if torch.cuda.is_available() else 'cpu'\n",
    "print(device)\n",
    "torch.cuda.empty_cache()\n",
    "cv2.destroyAllWindows()\n",
    "gc.collect()"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 2,
   "id": "8e009995",
   "metadata": {},
   "outputs": [],
   "source": [
    "def prepare_and_learning_detection(num_classes, num_samples, path_dataset, model_name, config_name, model,selected_freq):\n",
    "    num_samples_per_class = num_samples // num_classes\n",
    "\n",
    "    #----------Создаём папку для сохранения результатов обучения--------------\n",
    "    os.makedirs(\"models\", exist_ok=True)\n",
    "    ind = 1\n",
    "    while True:\n",
    "        if os.path.exists(\"models/\" + model_name + str(ind)):\n",
    "            ind += 1\n",
    "        else:\n",
    "            os.mkdir(\"models/\" + model_name + str(ind))\n",
    "            path_res = \"models/\" + model_name + str(ind) + '/'\n",
    "            break\n",
    "    \n",
    "    #----------Создаём файл dataset.csv для обучения--------------\n",
    "    \n",
    "    pd_columns = ['file_name']\n",
    "    df = pd.DataFrame(columns=pd_columns)\n",
    "    \n",
    "    subdirs = os.listdir(path_dataset)\n",
    "    \n",
    "    for subdir in subdirs:\n",
    "        freq_dir = os.path.join(path_dataset, subdir, str(selected_freq)+\"_jpg\")\n",
    "        if not os.path.isdir(freq_dir):\n",
    "            print(\"Error1\")\n",
    "            continue\n",
    "        \n",
    "        files_k=[f for f in os.listdir(freq_dir)]\n",
    "        print(len(files_k))\n",
    "        \n",
    "        files = [\n",
    "                f for f in os.listdir(freq_dir)\n",
    "                if os.path.isfile(os.path.join(freq_dir, f)) and f.endswith('imag.png')\n",
    "            ]\n",
    "        num_samples_per_class = min(num_samples_per_class, len(files))\n",
    "        print(f\"num_samples per class {subdir} is {num_samples_per_class}\")\n",
    "\n",
    "    for subdir in subdirs:\n",
    "        freq_dir = os.path.join(path_dataset, subdir, str(selected_freq)+\"_jpg\")\n",
    "        if not os.path.isdir(freq_dir):\n",
    "            print(\"Error1\")\n",
    "            continue\n",
    "\n",
    "        files = [\n",
    "            f for f in os.listdir(freq_dir)\n",
    "            if os.path.isfile(os.path.join(freq_dir, f)) and f.endswith('imag.png')\n",
    "        ]\n",
    "        random.shuffle(files)\n",
    "        files_to_process = files[:num_samples_per_class]\n",
    "\n",
    "        for file in files_to_process:\n",
    "            row = pd.DataFrame({\n",
    "                pd_columns[0]: [str(os.path.join(freq_dir, file))]\n",
    "            })\n",
    "            df = pd.concat([df, row], ignore_index=True)\n",
    "\n",
    "    dataset_csv_path = os.path.join(path_res, 'dataset.csv')\n",
    "    df.to_csv(dataset_csv_path, index=False)\n",
    "\n",
    "    if not os.path.exists(dataset_csv_path):\n",
    "        raise RuntimeError(f'dataset.csv was not created: {dataset_csv_path}')\n",
    "    #----------Импортируем параметры для обучения--------------\n",
    "    \n",
    "    def load_function(attr):\n",
    "        module_, func = attr.rsplit('.', maxsplit=1)\n",
    "        return getattr(import_module(module_), func)\n",
    "    \n",
    "    config = mlconfig.load('config_' + config_name + '.yaml')\n",
    "    \n",
    "    #----------Создаём класс датасета--------------\n",
    "    \n",
    "    class MyDataset(Dataset):\n",
    "        def __init__(self, path_dataset, csv_file):\n",
    "            data=[]\n",
    "            with open(os.path.join(path_dataset, csv_file), newline='') as csvfile:\n",
    "                reader = csv.reader(csvfile, delimiter=' ', quotechar='|')\n",
    "                for row in list(reader)[1:]:\n",
    "                    row = str(row)\n",
    "                    data.append(row[2: len(row)-2])\n",
    "            self.path_dataset = path_dataset\n",
    "            self.target_shape = None\n",
    "            self.target_hw = None\n",
    "            self.sig_filenames = self._validate_files(data)\n",
    "\n",
    "        def _pair_paths(self, filename):\n",
    "            base = os.path.splitext(filename)[0]\n",
    "            if base.endswith(\"real\"):\n",
    "                return base + \".png\", base[:-4] + \"imag.png\"\n",
    "            if base.endswith(\"imag\"):\n",
    "                return base[:-4] + \"real.png\", base + \".png\"\n",
    "            return None, None\n",
    "\n",
    "        @staticmethod\n",
    "        def _read_shape(path):\n",
    "            img = cv2.imread(path)\n",
    "            if img is None:\n",
    "                return None\n",
    "            return img.shape\n",
    "\n",
    "        def _validate_files(self, filenames):\n",
    "            from collections import Counter\n",
    "\n",
    "            candidates = []\n",
    "            dropped = []\n",
    "            shape_counter = Counter()\n",
    "\n",
    "            for filename in filenames:\n",
    "                real_path, imag_path = self._pair_paths(filename)\n",
    "                if real_path is None or imag_path is None:\n",
    "                    dropped.append((filename, \"bad file suffix\"))\n",
    "                    continue\n",
    "\n",
    "                real_shape = self._read_shape(real_path)\n",
    "                imag_shape = self._read_shape(imag_path)\n",
    "                if real_shape is None or imag_shape is None:\n",
    "                    dropped.append((filename, f\"read failed real={real_shape} imag={imag_shape}\"))\n",
    "                    continue\n",
    "                if real_shape != imag_shape:\n",
    "                    dropped.append((filename, f\"pair shape mismatch real={real_shape} imag={imag_shape}\"))\n",
    "                    continue\n",
    "\n",
    "                shape_counter[real_shape] += 1\n",
    "                candidates.append((filename, real_shape))\n",
    "\n",
    "            if not candidates:\n",
    "                raise RuntimeError(\"No valid image pairs left after shape validation\")\n",
    "\n",
    "            preferred_shape = (1600, 1600, 3)\n",
    "            if shape_counter.get(preferred_shape, 0) > 0:\n",
    "                target_shape = preferred_shape\n",
    "            else:\n",
    "                target_shape = shape_counter.most_common(1)[0][0]\n",
    "\n",
    "            self.target_shape = target_shape\n",
    "            self.target_hw = target_shape[:2]\n",
    "            valid = [filename for filename, _shape in candidates]\n",
    "            resized_count = sum(1 for _filename, shape in candidates if shape != target_shape)\n",
    "\n",
    "            print(f\"[dataset-shape-filter] shape_distribution={dict(shape_counter)}\")\n",
    "            print(\n",
    "                f\"[dataset-shape-filter] target_shape={target_shape} \"\n",
    "                f\"kept={len(valid)} dropped={len(dropped)} will_resize={resized_count}\"\n",
    "            )\n",
    "            for filename, reason in dropped[:20]:\n",
    "                print(f\"[dataset-shape-filter] drop {filename}: {reason}\")\n",
    "            if len(dropped) > 20:\n",
    "                print(f\"[dataset-shape-filter] ... {len(dropped) - 20} more dropped\")\n",
    "\n",
    "            return valid\n",
    "\n",
    "        def __len__(self):\n",
    "            return len(self.sig_filenames)\n",
    "\n",
    "        def _read_image_chw(self, path):\n",
    "            img = cv2.imread(path)\n",
    "            if img is None:\n",
    "                raise RuntimeError(f\"failed to read image: {path}\")\n",
    "            if img.shape[:2] != self.target_hw:\n",
    "                img = cv2.resize(\n",
    "                    img,\n",
    "                    (self.target_hw[1], self.target_hw[0]),\n",
    "                    interpolation=cv2.INTER_AREA,\n",
    "                )\n",
    "            return np.asarray(cv2.split(img), dtype=np.float32)\n",
    "\n",
    "        def __getitem__(self, idx):\n",
    "            real_path, imag_path = self._pair_paths(self.sig_filenames[idx])\n",
    "            image_real = self._read_image_chw(real_path)\n",
    "            image_imag = self._read_image_chw(imag_path)\n",
    "\n",
    "            path_parts = set(self.sig_filenames[idx].split('/'))\n",
    "            if 'drone' in path_parts:\n",
    "                label = torch.tensor(0)\n",
    "            elif 'noise' in path_parts:\n",
    "                label = torch.tensor(1)\n",
    "            else:\n",
    "                raise RuntimeError(f\"cannot infer label from path: {self.sig_filenames[idx]}\")\n",
    "\n",
    "            return image_real, image_imag, label\n",
    "\n",
    "    #----------Создаём датасет--------------\n",
    "    \n",
    "    dataset = MyDataset(path_dataset=path_res, csv_file='dataset.csv')\n",
    "    train_set, valid_set = torch.utils.data.random_split(dataset, [0.7, 0.3], generator=torch.Generator().manual_seed(42))\n",
    "    batch_size = config.batch_size\n",
    "    train_dataloader = torch.utils.data.DataLoader(train_set, batch_size=batch_size, shuffle=True, drop_last=True)\n",
    "    valid_dataloader = torch.utils.data.DataLoader(valid_set, batch_size=batch_size, shuffle=False, drop_last=False)\n",
    "    \n",
    "    dataloaders = {}\n",
    "    dataloaders['train'] = train_dataloader\n",
    "    dataloaders['val'] = valid_dataloader\n",
    "    dataset_sizes = {}\n",
    "    dataset_sizes['train'] = len(train_set)\n",
    "    dataset_sizes['val'] = len(valid_set)\n",
    "\n",
    "    #----------Обучаем модель--------------\n",
    "\n",
    "    val_loss = []\n",
    "    val_acc = []\n",
    "    train_loss = []\n",
    "    train_acc = []\n",
    "    epochs = config.epoch\n",
    "    min_delta = 1e-4\n",
    "    \n",
    "    best_val_loss = float('inf')\n",
    "    best_model = copy.deepcopy(model.state_dict())\n",
    "    limit = config.limit\n",
    "    ind_limit = 0\n",
    "    epoch_limit = epochs\n",
    "    \n",
    "    start = timeit.default_timer()\n",
    "    for epoch in range(1, epochs+1):\n",
    "        print(f\"Epoch : {epoch}\\n\")\n",
    "        \n",
    "        for phase in ['train', 'val']:\n",
    "            if phase == 'train':\n",
    "                model.train()\n",
    "            else:\n",
    "                model.eval()\n",
    "\n",
    "            running_loss = 0.0\n",
    "            running_corrects = 0\n",
    "    \n",
    "            for (img1, img2, label) in tqdm(dataloaders[phase]):\n",
    "                img1, img2, label = img1.to(device), img2.to(device), label.to(device)\n",
    "                optimizer.zero_grad()\n",
    "    \n",
    "                with torch.set_grad_enabled(phase == 'train'):\n",
    "                    output = model([img1, img2])\n",
    "                    _, pred = torch.max(output.data, 1)\n",
    "                    loss = criterion(output, label)\n",
    "                    if phase == 'train':\n",
    "                        loss.backward()\n",
    "                        optimizer.step()\n",
    "                \n",
    "                running_loss += loss.item() * img1.size(0)\n",
    "                running_corrects += torch.sum(pred == label.data)\n",
    "    \n",
    "            epoch_loss = running_loss / dataset_sizes[phase]\n",
    "            epoch_acc = running_corrects.double() / dataset_sizes[phase]\n",
    "                \n",
    "            print('{} Loss: {:.4f} Acc: {:.4f}'.format(phase, epoch_loss, epoch_acc))\n",
    "                    \n",
    "            if phase == 'train':\n",
    "                train_loss.append(epoch_loss)\n",
    "                train_acc.append(epoch_acc)\n",
    "            else:\n",
    "                val_loss.append(epoch_loss)\n",
    "                val_acc.append(epoch_acc)\n",
    "                scheduler.step(epoch_loss)\n",
    "\n",
    "                current_lr = optimizer.param_groups[0]['lr']\n",
    "                print(f'val lr: {current_lr:.8f}')\n",
    "\n",
    "                if epoch_loss < (best_val_loss - min_delta):\n",
    "                    ind_limit = 0\n",
    "                    best_val_loss = epoch_loss\n",
    "                    best_model = copy.deepcopy(model.state_dict())\n",
    "                    torch.save(best_model, path_res + model_name + '.pth')\n",
    "                    print(f'saved best model with val_loss={best_val_loss:.4f}')\n",
    "                else:\n",
    "                    ind_limit += 1\n",
    "                    print(f'early stopping patience: {ind_limit}/{limit}')\n",
    "                    \n",
    "                if ind_limit >= limit:\n",
    "                    break\n",
    "                \n",
    "        if ind_limit >= limit:\n",
    "            epoch_limit = epoch\n",
    "            break\n",
    "            \n",
    "        print()\n",
    "    \n",
    "    end = timeit.default_timer()\n",
    "    print(f\"Total time elapsed = {end - start} seconds\")\n",
    "    epoch_limit += 1\n",
    "    \n",
    "    #----------Вывод графиков и сохранение результатов обучения--------------\n",
    "    \n",
    "    train_acc = np.asarray(list(map(lambda x: x.item(), train_acc)))\n",
    "    val_acc = np.asarray(list(map(lambda x: x.item(), val_acc)))\n",
    "    \n",
    "    np.save(path_res+'train_acc.npy', train_acc)\n",
    "    np.save(path_res+'val_acc.npy', val_acc)\n",
    "    np.save(path_res+'train_loss.npy', train_loss)\n",
    "    np.save(path_res+'val_loss.npy', val_loss)\n",
    "    \n",
    "    plt.figure()\n",
    "    plt.plot(range(1,epoch_limit), train_loss, color='blue')\n",
    "    plt.plot(range(1,epoch_limit), val_loss, color='red')\n",
    "    plt.xlabel('Epoch')\n",
    "    plt.ylabel('Loss')  \n",
    "             \n",
    "    plt.title('Loss Curve')\n",
    "    plt.legend(['Train Loss', 'Validation Loss'])\n",
    "    plt.show()\n",
    "    plt.clf()\n",
    "    plt.cla()\n",
    "    plt.close()\n",
    "    \n",
    "    plt.figure()\n",
    "    plt.plot(range(1,epoch_limit), train_acc, color='blue')\n",
    "    plt.plot(range(1,epoch_limit), val_acc, color='red')\n",
    "    plt.xlabel('Epoch')\n",
    "    plt.ylabel('Accuracy')\n",
    "    plt.title('Accuracy Curve')\n",
    "    plt.legend(['Train Accuracy', 'Validation Accuracy'])\n",
    "    plt.show()\n",
    "    \n",
    "    plt.clf()\n",
    "    plt.cla()\n",
    "    plt.close()\n",
    "    torch.cuda.empty_cache()\n",
    "    cv2.destroyAllWindows()\n",
    "    del model\n",
    "    gc.collect()\n",
    "\n",
    "    return path_res, model_name"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "id": "bbbe7fea",
   "metadata": {},
   "outputs": [
    {
     "name": "stderr",
     "output_type": "stream",
     "text": [
      "/home/sibscience-4/from_ssh/DroneDetector/.venv-train/lib/python3.12/site-packages/torchvision/models/_utils.py:208: UserWarning: The parameter 'pretrained' is deprecated since 0.13 and may be removed in the future, please use 'weights' instead.\n",
      "  warnings.warn(\n",
      "/home/sibscience-4/from_ssh/DroneDetector/.venv-train/lib/python3.12/site-packages/torchvision/models/_utils.py:223: UserWarning: Arguments other than a weight enum or `None` for 'weights' are deprecated since 0.13 and may be removed in the future. The current behavior is equivalent to passing `weights=None`.\n",
      "  warnings.warn(msg)\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "Error1\n",
      "Error1\n",
      "Error1\n",
      "Error1\n",
      "Error1\n",
      "Error1\n"
     ]
    },
    {
     "ename": "RuntimeError",
     "evalue": "No valid image pairs left after shape validation",
     "output_type": "error",
     "traceback": [
      "\u001b[31m---------------------------------------------------------------------------\u001b[39m",
      "\u001b[31mRuntimeError\u001b[39m                              Traceback (most recent call last)",
      "\u001b[36mCell\u001b[39m\u001b[36m \u001b[39m\u001b[32mIn[4]\u001b[39m\u001b[32m, line 45\u001b[39m\n\u001b[32m     41\u001b[39m     model = model.to(device)\n\u001b[32m     42\u001b[39m \n\u001b[32m     43\u001b[39m \u001b[38;5;66;03m#----------Создания датасета и обучение модели--------------\u001b[39;00m\n\u001b[32m     44\u001b[39m \n\u001b[32m---> \u001b[39m\u001b[32m45\u001b[39m path_res, model_name = prepare_and_learning_detection(num_classes = num_classes, num_samples = 10000, path_dataset = \"/mnt/data/Dataset_overlay\", \n\u001b[32m     46\u001b[39m                      selected_freq=\u001b[32m1200\u001b[39m,model_name = config_name+\u001b[33m\"1200_\"\u001b[39m, config_name = config_name, model=model)\n\u001b[32m     47\u001b[39m \n\u001b[32m     48\u001b[39m \n",
      "\u001b[36mCell\u001b[39m\u001b[36m \u001b[39m\u001b[32mIn[2]\u001b[39m\u001b[32m, line 183\u001b[39m, in \u001b[36mprepare_and_learning_detection\u001b[39m\u001b[34m(num_classes, num_samples, path_dataset, model_name, config_name, model, selected_freq)\u001b[39m\n\u001b[32m    179\u001b[39m             \u001b[38;5;28;01mreturn\u001b[39;00m image_real, image_imag, label\n\u001b[32m    180\u001b[39m \n\u001b[32m    181\u001b[39m     \u001b[38;5;66;03m#----------Создаём датасет--------------\u001b[39;00m\n\u001b[32m    182\u001b[39m \n\u001b[32m--> \u001b[39m\u001b[32m183\u001b[39m     dataset = MyDataset(path_dataset=path_res, csv_file=\u001b[33m'dataset.csv'\u001b[39m)\n\u001b[32m    184\u001b[39m     train_set, valid_set = torch.utils.data.random_split(dataset, [\u001b[32m0.7\u001b[39m, \u001b[32m0.3\u001b[39m], generator=torch.Generator().manual_seed(\u001b[32m42\u001b[39m))\n\u001b[32m    185\u001b[39m     batch_size = config.batch_size\n\u001b[32m    186\u001b[39m     train_dataloader = torch.utils.data.DataLoader(train_set, batch_size=batch_size, shuffle=\u001b[38;5;28;01mTrue\u001b[39;00m, drop_last=\u001b[38;5;28;01mTrue\u001b[39;00m)\n",
      "\u001b[36mCell\u001b[39m\u001b[36m \u001b[39m\u001b[32mIn[2]\u001b[39m\u001b[32m, line 83\u001b[39m, in \u001b[36mprepare_and_learning_detection.<locals>.MyDataset.__init__\u001b[39m\u001b[34m(self, path_dataset, csv_file)\u001b[39m\n\u001b[32m     79\u001b[39m                     data.append(row[\u001b[32m2\u001b[39m: len(row)-\u001b[32m2\u001b[39m])\n\u001b[32m     80\u001b[39m             self.path_dataset = path_dataset\n\u001b[32m     81\u001b[39m             self.target_shape = \u001b[38;5;28;01mNone\u001b[39;00m\n\u001b[32m     82\u001b[39m             self.target_hw = \u001b[38;5;28;01mNone\u001b[39;00m\n\u001b[32m---> \u001b[39m\u001b[32m83\u001b[39m             self.sig_filenames = self._validate_files(data)\n",
      "\u001b[36mCell\u001b[39m\u001b[36m \u001b[39m\u001b[32mIn[2]\u001b[39m\u001b[32m, line 126\u001b[39m, in \u001b[36mprepare_and_learning_detection.<locals>.MyDataset._validate_files\u001b[39m\u001b[34m(self, filenames)\u001b[39m\n\u001b[32m    122\u001b[39m                 shape_counter[real_shape] += \u001b[32m1\u001b[39m\n\u001b[32m    123\u001b[39m                 candidates.append((filename, real_shape))\n\u001b[32m    124\u001b[39m \n\u001b[32m    125\u001b[39m             \u001b[38;5;28;01mif\u001b[39;00m \u001b[38;5;28;01mnot\u001b[39;00m candidates:\n\u001b[32m--> \u001b[39m\u001b[32m126\u001b[39m                 \u001b[38;5;28;01mraise\u001b[39;00m RuntimeError(\u001b[33m\"No valid image pairs left after shape validation\"\u001b[39m)\n\u001b[32m    127\u001b[39m \n\u001b[32m    128\u001b[39m             preferred_shape = (\u001b[32m1600\u001b[39m, \u001b[32m1600\u001b[39m, \u001b[32m3\u001b[39m)\n\u001b[32m    129\u001b[39m             \u001b[38;5;28;01mif\u001b[39;00m shape_counter.get(preferred_shape, \u001b[32m0\u001b[39m) > \u001b[32m0\u001b[39m:\n",
      "\u001b[31mRuntimeError\u001b[39m: No valid image pairs left after shape validation"
     ]
    }
   ],
   "source": [
    "torch.cuda.empty_cache()\n",
    "cv2.destroyAllWindows()\n",
    "gc.collect()\n",
    "\n",
    "config_name = \"ensemble\"\n",
    "    \n",
    "def load_function(attr):\n",
    "    module_, func = attr.rsplit('.', maxsplit=1)\n",
    "    return getattr(import_module(module_), func)\n",
    "    \n",
    "config = mlconfig.load('config_' + config_name + '.yaml')\n",
    "\n",
    "model1 = models.resnet18(pretrained=False)\n",
    "model2 = models.resnet50(pretrained=False)\n",
    "\n",
    "num_classes = 2\n",
    "\n",
    "model1.fc = nn.Linear(model1.fc.in_features, num_classes)\n",
    "model2.fc = nn.Linear(model2.fc.in_features, num_classes)\n",
    "\n",
    "class Ensemble(nn.Module):\n",
    "    def __init__(self, model1, model2):\n",
    "        super(Ensemble, self).__init__()\n",
    "        self.model1 = model1\n",
    "        self.model2 = model2\n",
    "        self.fc = nn.Linear(2 * num_classes, num_classes)\n",
    "\n",
    "    def forward(self, x):\n",
    "        x1 = self.model1(x[0])\n",
    "        x2 = self.model2(x[1])\n",
    "        x = torch.cat((x1, x2), dim=1)\n",
    "        x = self.fc(x)\n",
    "        return x\n",
    "model = Ensemble(model1, model2)\n",
    "\n",
    "optimizer = load_function(config.optimizer.name)(model.parameters(), lr=config.optimizer.lr)\n",
    "criterion = load_function(config.loss_function.name)()\n",
    "scheduler = load_function(config.scheduler.name)(optimizer, step_size=config.scheduler.step_size, gamma=config.scheduler.gamma)\n",
    "\n",
    "if device != 'cpu':\n",
    "    model = model.to(device)\n",
    "\n",
    "#----------Создания датасета и обучение модели--------------\n",
    "\n",
    "path_res, model_name = prepare_and_learning_detection(num_classes = num_classes, num_samples = 10000, path_dataset = \"/mnt/data/Dataset_overlay\", \n",
    "                     selected_freq=2400,model_name = config_name+\"2400_\", config_name = config_name, model=model)\n",
    "\n",
    "\n",
    "torch.cuda.empty_cache()\n",
    "cv2.destroyAllWindows()\n",
    "del model\n",
    "gc.collect()"
   ]
  }
 ],
 "metadata": {
  "kernelspec": {
   "display_name": "usr",
   "language": "python",
   "name": "python3"
  },
  "language_info": {
   "codemirror_mode": {
    "name": "ipython",
    "version": 3
   },
   "file_extension": ".py",
   "mimetype": "text/x-python",
   "name": "python",
   "nbconvert_exporter": "python",
   "pygments_lexer": "ipython3",
   "version": "3.12.3"
  }
 },
 "nbformat": 4,
 "nbformat_minor": 5
 }
--- a/train_scripts/create_dataset_overlay.py
+++ b/train_scripts/create_dataset_overlay.py
@ -0,0 +1,217 @@
 #!/usr/bin/env python3
 import argparse
 import csv
 import os
 import random
 import shutil
 from pathlib import Path
 import cv2
 import matplotlib
 matplotlib.use("Agg")
 import matplotlib.pyplot as plt
 import numpy as np
 from tqdm import tqdm
 DEFAULT_FREQS = (1200, 2400)
 PNG_SUFFIXES = ("_real.png", "_imag.png", "_spec.png")
 def parse_args():
    parser = argparse.ArgumentParser(
        description=(
            "Build a two-class image dataset with drone signatures overlaid on noise images. "
            "The output is ready for Training_models2pic_val_loss.ipynb."
        )
    )
    parser.add_argument("--drone-root", default="/mnt/data/Dataset/drone")
    parser.add_argument("--noise-img-root", default="/mnt/data/Dataset_img/noise")
    parser.add_argument("--output-root", default="/mnt/data/Dataset_overlay")
    parser.add_argument("--freqs", default=",".join(str(v) for v in DEFAULT_FREQS))
    parser.add_argument("--alpha", type=float, default=1.0, help="Overlay strength: 1.0 keeps the darkest drone/noise pixels.")
    parser.add_argument("--limit-per-freq", type=int, default=0, help="0 means use all available noise images per frequency.")
    parser.add_argument("--seed", type=int, default=42)
    parser.add_argument("--copy-noise", action="store_true", help="Copy noise files instead of hardlinking them.")
    parser.add_argument("--overwrite", action="store_true")
    parser.add_argument("--dry-run", action="store_true")
    parser.add_argument("--no-progress", action="store_true", help="Disable tqdm progress bars.")
    return parser.parse_args()
 def parse_freqs(value):
    return [int(item.strip()) for item in value.split(",") if item.strip()]
 def collect_drone_npys(root, freq):
    root = Path(root)
    candidates = []
    candidates.extend((root / str(freq)).rglob("*.npy"))
    candidates.extend((root / f"{freq}_jpg").glob("*.npy"))
    return sorted({p for p in candidates if p.is_file()})
 def collect_noise_npys(root, freq):
    root = Path(root)
    candidates = []
    candidates.extend((root / f"{freq}_jpg").glob("*.npy"))
    candidates.extend((root / str(freq)).rglob("*.npy"))
    return sorted({p for p in candidates if p.is_file()})
 def load_image_tensor(path):
    arr = np.load(path)
    if arr.ndim == 2:
        arr = np.stack([arr, arr, arr], axis=0)
    if arr.ndim == 3 and arr.shape[-1] in (1, 3) and arr.shape[0] not in (1, 3):
        arr = np.moveaxis(arr, -1, 0)
    if arr.ndim != 3:
        raise ValueError(f"expected 3D image tensor, got shape={arr.shape} path={path}")
    if arr.shape[0] == 1:
        arr = np.repeat(arr, 3, axis=0)
    if arr.shape[0] < 3:
        raise ValueError(f"expected at least 3 channels, got shape={arr.shape} path={path}")
    return arr[:3].astype(np.float32, copy=False)
 def resize_like(arr, shape):
    if arr.shape == shape:
        return arr
    channels, height, width = shape
    resized = []
    for channel in arr[:channels]:
        resized.append(cv2.resize(channel, (width, height), interpolation=cv2.INTER_LINEAR))
    return np.asarray(resized, dtype=np.float32)
 def overlay_tensors(noise, drone, alpha):
    drone = resize_like(drone, noise.shape)
    bright_overlay = np.minimum(noise, drone)
    mixed = (1.0 - alpha) * noise + alpha * bright_overlay
    return np.clip(mixed, 0, 255).astype(np.float32)
 def to_uint8(channel):
    arr = np.asarray(channel, dtype=np.float32)
    finite = arr[np.isfinite(arr)]
    if finite.size == 0:
        return np.zeros(arr.shape, dtype=np.uint8)
    min_v = float(finite.min())
    max_v = float(finite.max())
    if min_v >= 0.0 and max_v <= 255.0:
        return np.clip(arr, 0, 255).astype(np.uint8)
    if max_v == min_v:
        return np.zeros(arr.shape, dtype=np.uint8)
    norm = (arr - min_v) / (max_v - min_v)
    return np.clip(norm * 255.0, 0, 255).astype(np.uint8)
 def save_notebook_style_png(path, channel):
    fig = plt.figure(figsize=(16, 16))
    plt.imshow(channel)
    plt.savefig(path)
    plt.clf()
    plt.cla()
    plt.close()
    plt.close(fig)
 def save_sample(base_path, tensor):
    np.save(str(base_path) + ".npy", tensor.astype(np.float32))
    for idx, suffix in enumerate(PNG_SUFFIXES):
        save_notebook_style_png(str(base_path) + suffix, tensor[idx])
 def link_or_copy(src, dst, copy_file):
    dst.parent.mkdir(parents=True, exist_ok=True)
    if dst.exists():
        return
    if copy_file:
        shutil.copy2(src, dst)
        return
    try:
        os.link(src, dst)
    except OSError:
        shutil.copy2(src, dst)
 def copy_noise_family(noise_npy, out_dir, copy_file):
    base_name = noise_npy.name[:-4] if noise_npy.name.endswith(".npy") else noise_npy.name
    link_or_copy(noise_npy, out_dir / noise_npy.name, copy_file)
    for suffix in PNG_SUFFIXES:
        sidecar = noise_npy.with_name(base_name + suffix)
        if sidecar.exists():
            link_or_copy(sidecar, out_dir / sidecar.name, copy_file)
 def main():
    args = parse_args()
    random.seed(args.seed)
    freqs = parse_freqs(args.freqs)
    output_root = Path(args.output_root)
    manifest_rows = []
    if args.overwrite and output_root.exists() and not args.dry_run:
        shutil.rmtree(output_root)
    for freq in freqs:
        drone_files = collect_drone_npys(args.drone_root, freq)
        noise_files = collect_noise_npys(args.noise_img_root, freq)
        if not drone_files:
            raise RuntimeError(f"no drone npy files found for freq={freq} under {args.drone_root}")
        if not noise_files:
            raise RuntimeError(f"no noise image npy files found for freq={freq} under {args.noise_img_root}")
        count = len(noise_files) if args.limit_per_freq <= 0 else min(args.limit_per_freq, len(noise_files))
        selected_noise = noise_files[:]
        random.shuffle(selected_noise)
        selected_noise = selected_noise[:count]
        out_drone_dir = output_root / "drone" / f"{freq}_jpg"
        out_noise_dir = output_root / "noise" / f"{freq}_jpg"
        print(f"freq={freq}: drone_source={len(drone_files)} noise_source={len(noise_files)} output_per_class={count}")
        if args.dry_run:
            continue
        out_drone_dir.mkdir(parents=True, exist_ok=True)
        out_noise_dir.mkdir(parents=True, exist_ok=True)
        iterator = tqdm(
            enumerate(selected_noise),
            total=count,
            desc=f"overlay freq={freq}",
            unit="sample",
            disable=args.no_progress,
        )
        for idx, noise_path in iterator:
            drone_path = drone_files[idx % len(drone_files)]
            noise_tensor = load_image_tensor(noise_path)
            drone_tensor = load_image_tensor(drone_path)
            mixed = overlay_tensors(noise_tensor, drone_tensor, args.alpha)
            out_base = out_drone_dir / f"overlay_{freq}_{idx:06d}"
            save_sample(out_base, mixed)
            copy_noise_family(noise_path, out_noise_dir, args.copy_noise)
            manifest_rows.append({
                "freq": freq,
                "output": str(out_base) + ".npy",
                "noise_source": str(noise_path),
                "drone_source": str(drone_path),
                "alpha": args.alpha,
            })
    if not args.dry_run:
        manifest_path = output_root / "overlay_manifest.csv"
        with manifest_path.open("w", newline="", encoding="utf-8") as fh:
            writer = csv.DictWriter(fh, fieldnames=["freq", "output", "noise_source", "drone_source", "alpha"])
            writer.writeheader()
            writer.writerows(manifest_rows)
        print(f"wrote {len(manifest_rows)} overlay samples")
        print(f"manifest: {manifest_path}")
        print(f"dataset: {output_root}")
 if __name__ == "__main__":
    main()
Author	SHA1	Message	Date
Sergey Revyakin	3bf93aab3f	Исправление бага с размерностью при обучении	2 days ago
Sergey Revyakin	7ad17bb4c4	обновил .gitignore	2 days ago
Sergey Revyakin	0b65c2980d	анализ логов nn_inference	2 days ago
Sergey Revyakin	c70a25cb8f	Новая версия ноутбука для обучения	2 days ago
Sergey Revyakin	94856d0fb8	скрипт для парсинга логов с nn_server	2 days ago
Sergey Revyakin	783fb40eb0	Скрипт сложения png	2 days ago
Sergey Revyakin	a1c99ebf9f	добавил модели inference на двух картинках	2 days ago
Sergey Revyakin	0fad5d6404	примонтировал train_scripts	2 days ago
Sergey Revyakin	c0ccecc270	поменял условие на более читабельное	2 days ago
Sergey Revyakin	6a492a036b	изменение формата логов	2 days ago