iot-logic/src/preprocessor/soundpreprocessor.py

#!/usr/bin/env python3
import requests
from urllib.parse import urljoin
from pyAudioAnalysis.audioTrainTest import load_model, load_model_knn, classifier_wrapper
from utils import config
from .abcpreprocessor import AbcPreProcessor
import tempfile
import os
import logging

from pyAudioAnalysis import audioBasicIO
from pyAudioAnalysis import MidTermFeatures
import numpy
import random

from birbnetes_iot_platform_raspberry import BirbnetesIoTPlatformStatusDriver

"""
Sound preprocessor: classifies sound samples with a model downloaded from the API
"""

# Module metadata: author handle, copyright notice, module name and version text.
__author__ = "@tormakris"
__copyright__ = "Copyright 2020, Birbnetes Team"
__module_name__ = "soundpreprocessor"
__version__text__ = "1"


class SoundPreProcessor(AbcPreProcessor):
    """
    SoundPreProcessor class, responsible for detecting birb chirps in sound sample.

    On construction the model description, the model file and its "MEANS"
    companion file are downloaded from ``config.API_URL`` into temporary files
    and loaded with pyAudioAnalysis. ``preprocesssignal`` then classifies a
    single sound file and reports whether it matches the model's target class.
    The temporary files are removed again when the instance is destroyed.
    """

    # (connect, read) timeouts in seconds for requests to the model service, so
    # that an unresponsive service cannot block construction forever.
    _REQUEST_TIMEOUT = (10, 60)

    # A target-class hit only counts when its probability exceeds this value.
    _PROBABILITY_THRESHOLD = 0.5

    def __init__(self):
        """
        Download and load the configured model.

        :raises requests.RequestException: if a download fails, times out or
            returns an HTTP error status.
        :raises ValueError: if the target class named in the model details is
            not among the classes of the loaded model.
        """
        # Set up front so that __del__ is safe even if construction fails early.
        self._temp_model_name = None
        self._temp_means_name = None
        self._fail_on_purpose = False

        logging.info("Downloading current model...")
        temp_model_handle, self._temp_model_name = tempfile.mkstemp()
        # Close the descriptor right away and write by name later; otherwise it
        # would leak whenever a request below fails before the file is written.
        os.close(temp_model_handle)
        # The loaders below only receive the model path, so they presumably
        # locate this companion file through the "MEANS" suffix -- keep the name.
        self._temp_means_name = self._temp_model_name + "MEANS"

        logging.debug("Fetching model info...")
        model_id_to_get = config.SVM_MODEL_ID if config.SVM_MODEL_ID else '$default'
        model_root_url = urljoin(config.API_URL, f"/model/svm/{model_id_to_get}")
        self._model_details = self._fetch(model_root_url).json()

        logging.debug("Downloading model...")
        model_url = urljoin(model_root_url, self._model_details['files']['model'])
        with open(self._temp_model_name, 'wb') as f:
            f.write(self._fetch(model_url).content)

        logging.debug("Downloading MEANS...")
        means_url = urljoin(model_root_url, self._model_details['files']['means'])
        with open(self._temp_means_name, 'wb') as f:
            f.write(self._fetch(means_url).content)

        logging.info("Loading current model...")

        # NOTE(review): to my knowledge the pyAudioAnalysis loaders unpickle these
        # files, which would execute whatever the model service returned --
        # confirm that config.API_URL is a trusted (ideally HTTPS) endpoint.
        #
        # Compare case-insensitively: preprocesssignal passes the lower-cased
        # type to classifier_wrapper, so the loader choice must agree with it.
        if self._model_details['type'].lower() == 'knn':
            loader = load_model_knn
        else:
            loader = load_model

        self._classifier, self._mean, self._std, self._classes, \
            self._mid_window, self._mid_step, self._short_window, \
            self._short_step, self._compute_beat = loader(self._temp_model_name)

        target_class_name = self._model_details['target_class_name']

        logging.info("The loaded model contains the following classes: " + ", ".join(self._classes))
        if target_class_name not in self._classes:
            raise ValueError(
                f"The specified target class {target_class_name} is not in the possible classes (Wrong model info?)"
            )

        self._target_id = self._classes.index(target_class_name)

    def _fetch(self, url: str):
        """
        Issue a GET request for ``url`` and return the successful response.

        :param url: Absolute URL to request.
        :return: The ``requests`` response object.
        :raises requests.RequestException: on timeout, connection failure or an
            HTTP error status.
        """
        # Presumably signals download progress on the device status indicator
        # (TODO confirm); the original code queued it before every request.
        BirbnetesIoTPlatformStatusDriver.enqueue_pattern('green', [1])
        response = requests.get(url, timeout=self._REQUEST_TIMEOUT)
        response.raise_for_status()
        return response

    def preprocesssignal(self, file_path: str) -> bool:
        """
        Classify a sound sample.

        :param file_path: Access path of the sound sample up for processing.
        :return: True if the sample is classified as the target class with a
            probability above 0.5, False otherwise.
        :raises AssertionError: if the file yields a zero sampling rate or the
            sample is not longer than the model's mid-term window.
        """
        logging.debug("Running extraction...")

        sampling_rate, signal = audioBasicIO.read_audio_file(file_path)
        signal = audioBasicIO.stereo_to_mono(signal)

        if sampling_rate == 0:
            raise AssertionError("Could not read the file properly: Sampling rate zero")

        # Duration in seconds must exceed the mid-term window of the model.
        if signal.shape[0] / float(sampling_rate) <= self._mid_window:
            raise AssertionError("Could not read the file properly: Signal shape is not good")

        # feature extraction (window and step sizes are converted to samples):
        mid_features, s, _ = \
            MidTermFeatures.mid_feature_extraction(signal, sampling_rate,
                                                   self._mid_window * sampling_rate,
                                                   self._mid_step * sampling_rate,
                                                   round(sampling_rate * self._short_window),
                                                   round(sampling_rate * self._short_step))

        # long term averaging of mid-term statistics
        mid_features = mid_features.mean(axis=1)
        if self._compute_beat:
            beat, beat_conf = MidTermFeatures.beat_extraction(s, self._short_step)
            mid_features = numpy.append(mid_features, beat)
            mid_features = numpy.append(mid_features, beat_conf)

        logging.debug("Running classification...")

        # Normalise with the mean/std values that were loaded with the model.
        feature_vector = (mid_features - self._mean) / self._std
        class_id, probability = classifier_wrapper(
            self._classifier, self._model_details['type'].lower(), feature_vector
        )
        class_id = int(class_id)  # the wrapper's class id is used as a list index below

        # Deliberate failure mode: a hit on the target class is replaced by a
        # randomly chosen other class.
        if self._fail_on_purpose and class_id == self._target_id:
            other_ids = [i for i in range(len(self._classes)) if i != self._target_id]
            # With a single-class model there is nothing to switch to; keep the
            # result instead of crashing in random.choice on an empty list.
            if other_ids:
                class_id = random.choice(other_ids)

        logging.debug(
            f"Sample {file_path} identified as {self._classes[class_id]} with the probablility of {probability[class_id]}"
        )

        return bool(
            (class_id == self._target_id)
            and (probability[class_id] > self._PROBABILITY_THRESHOLD)
        )

    def set_fail_on_purpose(self, val: bool):
        """
        Enable or disable the deliberate misclassification of target-class hits.

        :param val: True to make ``preprocesssignal`` swap target-class results
            for another class, False for normal operation.
        """
        self._fail_on_purpose = val

    def __del__(self):
        """Remove the temporary model and MEANS files, if they were created."""
        # getattr: the attributes are missing when __init__ never ran or failed
        # before assigning them.
        for path in (getattr(self, '_temp_model_name', None),
                     getattr(self, '_temp_means_name', None)):
            if not path:
                continue
            try:
                os.remove(path)
            except FileNotFoundError:
                pass
skeletons are back in the closet 2020-08-24 20:38:38 +02:00			`#!/usr/bin/env python3`
wire it all together 2020-08-25 01:40:09 +02:00			`import requests`
Updated model svc api 2020-10-02 03:49:37 +02:00			`from urllib.parse import urljoin`
Implemented AI stuff 2020-09-25 13:48:11 +02:00			`from pyAudioAnalysis.audioTrainTest import load_model, load_model_knn, classifier_wrapper`
wire it all together 2020-08-25 01:40:09 +02:00			`from utils import config`
skeletons are back in the closet 2020-08-24 20:38:38 +02:00			`from .abcpreprocessor import AbcPreProcessor`
Implemented AI stuff 2020-09-25 13:48:11 +02:00			`import tempfile`
			`import os`
			`import logging`

			`from pyAudioAnalysis import audioBasicIO`
			`from pyAudioAnalysis import MidTermFeatures`
			`import numpy`
Fixed some errors in probability calculations 2021-06-14 02:24:53 +02:00			`import random`
skeletons are back in the closet 2020-08-24 20:38:38 +02:00
Updated local Ai internals 2020-10-01 20:15:24 +02:00			`from birbnetes_iot_platform_raspberry import BirbnetesIoTPlatformStatusDriver`

skeletons are back in the closet 2020-08-24 20:38:38 +02:00			`"""`
			`Abstract base class for Sender`
			`"""`

			`__author__ = "@tormakris"`
			`__copyright__ = "Copyright 2020, Birbnetes Team"`
			`__module_name__ = "soundpreprocessor"`
			`__version__text__ = "1"`


			`class SoundPreProcessor(AbcPreProcessor):`
			`"""`
			`SoundPreProcessor class, responsible for detecting birb chirps in sound sample.`
			`"""`
wire it all together 2020-08-25 01:40:09 +02:00
Implemented AI stuff 2020-09-25 13:48:11 +02:00			`def __init__(self):`
			`logging.info("Downloading current model...")`
Updated local Ai internals 2020-10-01 20:15:24 +02:00			`temp_model_handle, self._temp_model_name = tempfile.mkstemp()`
Implemented AI stuff 2020-09-25 13:48:11 +02:00			`self._temp_means_name = self._temp_model_name + "MEANS"`

			`logging.debug("Fetching model info...")`
Updated local Ai internals 2020-10-01 20:15:24 +02:00			`BirbnetesIoTPlatformStatusDriver.enqueue_pattern('green', [1])`
Fixed some configurations 2020-09-30 06:01:38 +02:00			`if config.SVM_MODEL_ID:`
			`model_id_to_get = config.SVM_MODEL_ID`
			`else:`
			`model_id_to_get = '$default'`

Updated model svc api 2020-10-02 03:49:37 +02:00			`model_root_url = urljoin(config.API_URL, f"/model/svm/{model_id_to_get}")`

			`r = requests.get(model_root_url)`
Implemented AI stuff 2020-09-25 13:48:11 +02:00			`r.raise_for_status()`

			`self._model_details = r.json()`

			`logging.debug("Downloading model...")`
Updated local Ai internals 2020-10-01 20:15:24 +02:00			`BirbnetesIoTPlatformStatusDriver.enqueue_pattern('green', [1])`
Updated model svc api 2020-10-02 03:49:37 +02:00			`r = requests.get(urljoin(model_root_url, self._model_details['files']['model']))`
Implemented AI stuff 2020-09-25 13:48:11 +02:00			`r.raise_for_status()`

Updated local Ai internals 2020-10-01 20:15:24 +02:00			`with open(temp_model_handle, 'wb') as f: # bruhtastic`
Implemented AI stuff 2020-09-25 13:48:11 +02:00			`f.write(r.content)`

			`logging.debug("Downloading MEANS...")`
Updated local Ai internals 2020-10-01 20:15:24 +02:00			`BirbnetesIoTPlatformStatusDriver.enqueue_pattern('green', [1])`
Updated model svc api 2020-10-02 03:49:37 +02:00			`r = requests.get(urljoin(model_root_url, self._model_details['files']['means']))`
Implemented AI stuff 2020-09-25 13:48:11 +02:00			`r.raise_for_status()`

			`with open(self._temp_means_name, 'wb') as f:`
			`f.write(r.content)`

			`logging.info("Loading current model...")`

			`if self._model_details['type'] == 'knn':`
			`self._classifier, self._mean, self._std, self._classes, \`
			`self._mid_window, self._mid_step, self._short_window, \`
			`self._short_step, self._compute_beat = load_model_knn(self._temp_model_name)`

			`else:`
			`self._classifier, self._mean, self._std, self._classes, \`
			`self._mid_window, self._mid_step, self._short_window, \`
			`self._short_step, self._compute_beat = load_model(self._temp_model_name)`

Updated local Ai internals 2020-10-01 20:15:24 +02:00			`target_class_name = self._model_details['target_class_name']`

Fixed up logging 2020-09-30 06:12:36 +02:00			`logging.info("The loaded model contains the following classes: " + ", ".join(self._classes))`
Updated local Ai internals 2020-10-01 20:15:24 +02:00			`if target_class_name not in self._classes:`
Fixed memes 2020-10-03 14:33:00 +02:00			`raise ValueError(`
			`f"The specified target class {target_class_name} is not in the possible classes (Wrong model info?)"`
			`)`
Updated local Ai internals 2020-10-01 20:15:24 +02:00
			`self._target_id = self._classes.index(target_class_name)`
Fixed up logging 2020-09-30 06:12:36 +02:00
Fixed some errors in probability calculations 2021-06-14 02:24:53 +02:00			`self._fail_on_purpose = False`

Implemented AI stuff 2020-09-25 13:48:11 +02:00			`def preprocesssignal(self, file_path: str) -> bool:`
skeletons are back in the closet 2020-08-24 20:38:38 +02:00			`"""`
			`Classify a sound sample.`
Implemented AI stuff 2020-09-25 13:48:11 +02:00			`:param file_path: Access path of the sound sample up for processing.`
skeletons are back in the closet 2020-08-24 20:38:38 +02:00			`:return:`
			`"""`
Fixed up logging 2020-09-30 06:12:36 +02:00			`logging.debug("Running extraction...")`
wire it all together 2020-08-25 01:40:09 +02:00
Implemented AI stuff 2020-09-25 13:48:11 +02:00			`sampling_rate, signal = audioBasicIO.read_audio_file(file_path)`
			`signal = audioBasicIO.stereo_to_mono(signal)`
wire it all together 2020-08-25 01:40:09 +02:00
Implemented AI stuff 2020-09-25 13:48:11 +02:00			`if sampling_rate == 0:`
Fixed memes 2020-10-03 14:33:00 +02:00			`raise AssertionError("Could not read the file properly: Sampling rate zero")`
wire it all together 2020-08-25 01:40:09 +02:00
Implemented AI stuff 2020-09-25 13:48:11 +02:00			`if signal.shape[0] / float(sampling_rate) <= self._mid_window:`
Fixed memes 2020-10-03 14:33:00 +02:00			`raise AssertionError("Could not read the file properly: Signal shape is not good")`
Implemented AI stuff 2020-09-25 13:48:11 +02:00
			`# feature extraction:`
			`mid_features, s, _ = \`
			`MidTermFeatures.mid_feature_extraction(signal, sampling_rate,`
			`self._mid_window * sampling_rate,`
			`self._mid_step * sampling_rate,`
			`round(sampling_rate * self._short_window),`
			`round(sampling_rate * self._short_step))`

			`# long term averaging of mid-term statistics`
			`mid_features = mid_features.mean(axis=1)`
			`if self._compute_beat:`
			`beat, beat_conf = MidTermFeatures.beat_extraction(s, self._short_step)`
			`mid_features = numpy.append(mid_features, beat)`
			`mid_features = numpy.append(mid_features, beat_conf)`

Fixed up logging 2020-09-30 06:12:36 +02:00			`logging.debug("Running classification...")`
Implemented AI stuff 2020-09-25 13:48:11 +02:00
			`feature_vector = (mid_features - self._mean) / self._std`
Updated local Ai internals 2020-10-01 20:15:24 +02:00			`class_id, probability = classifier_wrapper(`
			`self._classifier, self._model_details['type'].lower(), feature_vector`
			`)`
Fixed some type errors 2020-09-30 06:19:53 +02:00			`class_id = int(class_id) # faszom`
Implemented AI stuff 2020-09-25 13:48:11 +02:00
Fixed some errors in probability calculations 2021-06-14 02:24:53 +02:00			`if self._fail_on_purpose: # titkos hozzávaló`
			`if class_id == self._target_id:`
			`class_id = random.choice(list(set(range(len(self._classes))) - {self._target_id}))`

Updated local Ai internals 2020-10-01 20:15:24 +02:00			`logging.debug(`
			`f"Sample {file_path} identified as {self._classes[class_id]} with the probablility of {probability[class_id]}"`
			`)`
Fixed up logging 2020-09-30 06:12:36 +02:00
Fixed the previous fix 2020-11-15 04:20:39 +01:00			`return bool((class_id == self._target_id) and (probability[class_id] > 0.5))`
wire it all together 2020-08-25 01:40:09 +02:00
Fixed some errors in probability calculations 2021-06-14 02:24:53 +02:00			`def set_fail_on_purpose(self, val: bool):`
			`self._fail_on_purpose = val`

Implemented AI stuff 2020-09-25 13:48:11 +02:00			`def __del__(self):`
			`try:`
			`os.remove(self._temp_model_name)`
			`except FileNotFoundError:`
			`pass`
wire it all together 2020-08-25 01:40:09 +02:00
Implemented AI stuff 2020-09-25 13:48:11 +02:00			`try:`
			`os.remove(self._temp_means_name)`
			`except FileNotFoundError:`
			`pass`