Audio in progress

3 years ago · 5cea74b940
parent f55bd55003
commit 5cea74b940
3 changed files with 512 additions and 1 deletions
--- a/Sources/pyOpenRPA/Robot/Audio.py
+++ b/Sources/pyOpenRPA/Robot/Audio.py
@ -0,0 +1,143 @@
 import pyaudio
 from pydub import AudioSegment
 import threading
 import wave
 def DeviceSystemSoundSearchIndex():
    """L-,W+: Find the device that can be used to capture the audio coming from applications, for example Zoom, WhatsApp or Telegram conference calls.
    Not implemented yet: the function performs no search and returns nothing.
    :return: None
    """
    return None
 def DeviceListGet():
    """L-,W+: Return the list of audio devices (inputs and outputs, microphones and speakers).
    Usage:
        from pyOpenRPA.Robot import Audio
        Audio.DeviceListGet()
    :return: [{"IndexInt":1, "NameStr": "",
            "HostApiInt": 0, "HostApiStr": "MME"|"Windows WASAPI"|"Windows WDM-KS",
            "MaxInputChannelsInt": 0, "MaxOutputChannelsInt": 0,
            "DefaultSampleRateFloat": 44100.0
        },...]
    :rtype: list
    """
    l_result = []
    p = pyaudio.PyAudio()
    try:
        for i in range(p.get_device_count()):
            l_info = p.get_device_info_by_index(i)
            l_result.append({
                "IndexInt": l_info["index"],
                "NameStr": l_info["name"],
                "MaxInputChannelsInt": l_info["maxInputChannels"],
                "MaxOutputChannelsInt": l_info["maxOutputChannels"],
                "HostApiInt": l_info["hostApi"],
                "DefaultSampleRateFloat": l_info["defaultSampleRate"],
                # Human readable host API name, e.g. "MME" | "Windows WASAPI" | "Windows WDM-KS"
                "HostApiStr": p.get_host_api_info_by_index(l_info["hostApi"])["name"],
            })
    finally:
        # Every PyAudio instance must be terminated, otherwise PortAudio resources leak on each call.
        p.terminate()
    return l_result
 class Recorder:
    """Record audio from a PyAudio input device on a background thread and export it to a file.
    Usage: create ``Recorder(inDeviceInt=<device index>)``, call ``CaptureStart()`` and later ``CaptureStop()``.
    ``CaptureStop()`` writes the recorded frames to ``<mFileNameStr>.<mFileFormatStr>`` through pydub.
    """
    mStatusStr = "0_READY"
    # PyAudio instance. Created per capture in CaptureStart and terminated when the capture thread ends,
    # so importing the module does not initialise PortAudio and recorders do not terminate each other.
    mAudio = None
    mCaptureThread = None
    mStream = None
    mDeviceInt = None
    mChannelCountInt = None
    mFramesInt = 512  # number of frames requested from the stream per read
    mRecordedFramesList = None  # per-instance list of raw byte chunks, created in __init__
    mUseLoopbackBool = True
    mSampleRateInt = None
    mSampleSizeInt = 2  # bytes per paInt16 sample; refreshed from PyAudio in CaptureStart
    mCaptureBool = True
    # "aux" is a reserved device name on Windows (also with an extension), so "aux.mp3" cannot be written there.
    mFileNameStr = "audio"
    mFileFormatStr = "mp3"
    def __init__(self, inDeviceInt=None):
        """Create a recorder bound to a device.
        :param inDeviceInt: PyAudio device index (see the "IndexInt" values of the device list)
        """
        self.mDeviceInt = inDeviceInt
        # A class-level list would be shared by every Recorder instance.
        self.mRecordedFramesList = []
    def CaptureStart(self):
        """Open the input stream on device ``mDeviceInt`` and start the background capture thread.
        Sample rate and channel count are taken from the device info reported by PyAudio.
        :raises RuntimeError: if a capture started by this recorder is still running
        """
        if self.mCaptureThread is not None and self.mCaptureThread.is_alive():
            raise RuntimeError("Capture is already running")
        self.mAudio = pyaudio.PyAudio()
        try:
            lDeviceInfoDict = self.mAudio.get_device_info_by_index(self.mDeviceInt)
            self.mSampleSizeInt = self.mAudio.get_sample_size(pyaudio.paInt16)
            self.mSampleRateInt = int(lDeviceInfoDict["defaultSampleRate"])
            # Use whichever channel count is larger (input or output side of the device).
            self.mChannelCountInt = max(lDeviceInfoDict["maxInputChannels"], lDeviceInfoDict["maxOutputChannels"])
            # NOTE(review): as_loopback is presumably provided only by a WASAPI-loopback build of PyAudio - confirm.
            self.mStream = self.mAudio.open(format = pyaudio.paInt16,
                            channels = self.mChannelCountInt,
                            rate = self.mSampleRateInt,
                            input = True,
                            frames_per_buffer = self.mFramesInt,
                            input_device_index = lDeviceInfoDict["index"],
                            as_loopback = self.mUseLoopbackBool)
        except Exception:
            # Do not leak the PortAudio handle when the device cannot be opened.
            self.mAudio.terminate()
            self.mAudio = None
            raise
        # Re-arm the loop flag: a previous CaptureStop leaves it False.
        self.mCaptureBool = True
        self.mCaptureThread = threading.Thread(target=self.__Capture__)
        self.mCaptureThread.start()
    def __Capture__(self):
        """Thread body: read chunks of ``mFramesInt`` frames until ``mCaptureBool`` is cleared, then release the stream and PyAudio."""
        try:
            while self.mCaptureBool:
                self.mRecordedFramesList.append(self.mStream.read(self.mFramesInt))
        finally:
            # Release the stream and PortAudio even when read() fails.
            try:
                self.mStream.stop_stream()
                self.mStream.close()
            finally:
                self.mAudio.terminate()
                self.mAudio = None
    def CaptureStop(self):
        """Stop the capture thread, wait for it to finish and export the recorded audio.
        Does nothing when no capture has been started.
        """
        if self.mCaptureThread is None:
            return
        self.mCaptureBool = False
        self.mCaptureThread.join()
        self.mCaptureThread = None
        self.CaptureChunk()
    def CaptureChunk(self):
        """Export the frames recorded so far to ``<mFileNameStr>.<mFileFormatStr>`` and clear the frame buffer."""
        lSound = AudioSegment(
            # raw audio data (bytes)
            data=b''.join(self.mRecordedFramesList),
            # bytes per sample (2 for 16 bit samples)
            sample_width=self.mSampleSizeInt,
            # frame rate reported by the device
            frame_rate=self.mSampleRateInt,
            # number of channels used when the stream was opened
            channels=self.mChannelCountInt
        )
        # export() hands back the file object it wrote to; close it so the handle is not leaked.
        lFile = lSound.export(f"{self.mFileNameStr}.{self.mFileFormatStr}", format=self.mFileFormatStr)
        lFile.close()
        self.mRecordedFramesList = []
    def FileListGet(self):
        """Not implemented yet."""
        pass
    def FileLastGet(self):
        """Not implemented yet."""
        pass
    def __Callback__(self, inDefList):
        """Not implemented yet."""
        pass
    def __CallbackIsSilent__(self):
        """Not implemented yet."""
        pass
    def __CallbackIsChunked__(self):
        """Not implemented yet."""
        pass
    def __CallbackIsStopped__(self):
        """Not implemented yet."""
        pass
    def __TriggerCenter__(self):
        """L-,W+: Control recording / stopping of the audio by the following criteria (not implemented yet):
        - Total duration,
        - Maximum duration of a chunk,
        - Maximum duration of silence (chunk),
        - Maximum duration of silence (stop),
        """
        pass
--- a/Tools/Jupyter-notebooks/Audio.ipynb
+++ b/Tools/Jupyter-notebooks/Audio.ipynb
@ -0,0 +1,367 @@
 {
 "cells": [
  {
   "cell_type": "code",
   "execution_count": 1,
   "metadata": {},
   "outputs": [],
   "source": [
    "import sys\n",
    "import os\n",
    "#sys.path.insert(0, os.path.abspath(\"..\\\\..\\\\Sources\")) # FOR WINDOWS\n",
    "sys.path.insert(0, os.path.abspath(\"../../Sources\")) # FOR LINUX\n",
    "import time"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 3,
   "metadata": {},
   "outputs": [
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "123\n"
     ]
    }
   ],
   "source": [
    "print(123)"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 1,
   "metadata": {},
   "outputs": [],
   "source": [
    "from pyOpenRPA.Robot import Audio\n",
    "lRec = Audio.Recorder(inDeviceInt=10)\n",
    "lRec.CaptureStart()"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "done\n",
      "done2\n",
      "CaptureChunk 1\n"
     ]
    }
   ],
   "source": [
    "lRec.CaptureStop()"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 10,
   "metadata": {},
   "outputs": [
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "Available devices:\n",
      "\n",
      "0\n",
      "0: \t Ïåðåíàçíà÷åíèå çâóêîâûõ óñòð. - Input \n",
      " \t MME \n",
      "\n",
      "0\n",
      "1: \t Ìèêðîôîí (Realtek High Definiti \n",
      " \t MME \n",
      "\n",
      "0\n",
      "2: \t Ìèêðîôîí (EpocCam Camera Audio) \n",
      " \t MME \n",
      "\n",
      "0\n",
      "3: \t Ìèêðîôîí (USB PnP Sound Device) \n",
      " \t MME \n",
      "\n",
      "0\n",
      "4: \t Ïåðåíàçíà÷åíèå çâóêîâûõ óñòð. - Output \n",
      " \t MME \n",
      "\n",
      "0\n",
      "5: \t Äèíàìèêè (USB PnP Sound Device) \n",
      " \t MME \n",
      "\n",
      "0\n",
      "6: \t 2 - NEC LCD1703M (AMD High Defi \n",
      " \t MME \n",
      "\n",
      "0\n",
      "7: \t Äèíàìèêè (Realtek High Definiti \n",
      " \t MME \n",
      "\n",
      "1\n",
      "8: \t 2 - NEC LCD1703M (AMD High Definition Audio Device) \n",
      " \t Windows WASAPI \n",
      "\n",
      "1\n",
      "9: \t Динамики (USB PnP Sound Device) \n",
      " \t Windows WASAPI \n",
      "\n",
      "1\n",
      "10: \t Динамики (Realtek High Definition Audio) \n",
      " \t Windows WASAPI \n",
      "\n",
      "1\n",
      "11: \t Микрофон (EpocCam Camera Audio) \n",
      " \t Windows WASAPI \n",
      "\n",
      "1\n",
      "12: \t Микрофон (Realtek High Definition Audio) \n",
      " \t Windows WASAPI \n",
      "\n",
      "1\n",
      "13: \t Микрофон (USB PnP Sound Device) \n",
      " \t Windows WASAPI \n",
      "\n",
      "2\n",
      "14: \t Стерео микшер (Realtek HD Audio Stereo input) \n",
      " \t Windows WDM-KS \n",
      "\n",
      "2\n",
      "15: \t Микрофон (Realtek HD Audio Mic input) \n",
      " \t Windows WDM-KS \n",
      "\n",
      "2\n",
      "16: \t Speakers (Realtek HD Audio output) \n",
      " \t Windows WDM-KS \n",
      "\n",
      "2\n",
      "17: \t Лин. вход (Realtek HD Audio Line input) \n",
      " \t Windows WDM-KS \n",
      "\n",
      "2\n",
      "18: \t Output (AMD HD Audio HDMI out #1) \n",
      " \t Windows WDM-KS \n",
      "\n",
      "2\n",
      "19: \t Динамики (USB PnP Sound Device) \n",
      " \t Windows WDM-KS \n",
      "\n",
      "2\n",
      "20: \t Микрофон (USB PnP Sound Device) \n",
      " \t Windows WDM-KS \n",
      "\n",
      "2\n",
      "21: \t MIDI (EpocCam Audio) \n",
      " \t Windows WDM-KS \n",
      "\n",
      "2\n",
      "22: \t Output (EpocCam Audio) \n",
      " \t Windows WDM-KS \n",
      "\n"
     ]
    }
   ],
   "source": [
    "print (textcolors.blue + \"Available devices:\\n\" + textcolors.end)\n",
    "for i in range(0, p.get_device_count()):\n",
    "    info = p.get_device_info_by_index(i)\n",
    "    print(info[\"hostApi\"])\n",
    "    print (textcolors.green + str(info[\"index\"]) + textcolors.end + \": \\t %s \\n \\t %s \\n\" % (info[\"name\"], p.get_host_api_info_by_index(info[\"hostApi\"])[\"name\"]))"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 7,
   "metadata": {},
   "outputs": [],
   "source": [
    "class textcolors:\n",
    "    if not os.name == 'nt':\n",
    "        blue = '\\033[94m'\n",
    "        green = '\\033[92m'\n",
    "        warning = '\\033[93m'\n",
    "        fail = '\\033[91m'\n",
    "        end = '\\033[0m'\n",
    "    else:\n",
    "        blue = ''\n",
    "        green = ''\n",
    "        warning = ''\n",
    "        fail = ''\n",
    "        end = ''"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 12,
   "metadata": {},
   "outputs": [
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "Starting...\n",
      "End.\n"
     ]
    },
    {
     "data": {
      "text/plain": [
       "<_io.BufferedRandom name='out.mp3'>"
      ]
     },
     "execution_count": 12,
     "metadata": {},
     "output_type": "execute_result"
    }
   ],
   "source": [
    "import pyaudio\n",
    "defaultframes = 512\n",
    "recorded_frames = []\n",
    "device_info = {}\n",
    "useloopback = True\n",
    "#Use module\n",
    "p = pyaudio.PyAudio()\n",
    "\n",
    "recordtime = 15\n",
    "device_id = 10\n",
    "device_info = p.get_device_info_by_index(device_id)\n",
    "#Open stream\n",
    "channelcount = device_info[\"maxInputChannels\"] if (device_info[\"maxOutputChannels\"] < device_info[\"maxInputChannels\"]) else device_info[\"maxOutputChannels\"]\n",
    "stream = p.open(format = pyaudio.paInt16,\n",
    "                channels = channelcount,\n",
    "                rate = int(device_info[\"defaultSampleRate\"]),\n",
    "                input = True,\n",
    "                frames_per_buffer = defaultframes,\n",
    "                input_device_index = device_info[\"index\"],\n",
    "                as_loopback = useloopback)\n",
    "\n",
    "#Start Recording\n",
    "print (\"Starting...\")\n",
    "\n",
    "for i in range(0, int(int(device_info[\"defaultSampleRate\"]) / defaultframes * recordtime)):\n",
    "    recorded_frames.append(stream.read(defaultframes))\n",
    "\n",
    "print (\"End.\")\n",
    "#Stop Recording\n",
    "\n",
    "stream.stop_stream()\n",
    "stream.close()\n",
    "\n",
    "#Close module\n",
    "p.terminate()\n",
    "\n",
    "filename = \"out.wav\"\n",
    "from pydub import AudioSegment\n",
    "# Advanced usage, if you have raw audio data:\n",
    "sound = AudioSegment(\n",
    "    # raw audio data (bytes)\n",
    "    data=b''.join(recorded_frames),\n",
    "    # 2 byte (16 bit) samples\n",
    "    sample_width=p.get_sample_size(pyaudio.paInt16),\n",
    "    # 44.1 kHz frame rate\n",
    "    frame_rate=int(device_info[\"defaultSampleRate\"]),\n",
    "    # stereo\n",
    "    channels=channelcount\n",
    ")\n",
    "sound.export(\"out.mp3\", format=\"mp3\")"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 9,
   "metadata": {},
   "outputs": [],
   "source": [
    "import difflib\n",
    "def similarity_no_case(s1, s2):\n",
    "  normalized1 = s1.lower()\n",
    "  normalized2 = s2.lower()\n",
    "  matcher = difflib.SequenceMatcher(None, normalized1, normalized2)\n",
    "  return matcher.ratio()"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 8,
   "metadata": {},
   "outputs": [
    {
     "data": {
      "text/plain": [
       "0.36363636363636365"
      ]
     },
     "execution_count": 8,
     "metadata": {},
     "output_type": "execute_result"
    }
   ],
   "source": [
    "similarity(\"sadsdasd\",\"sadfsdfd                 \")"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": []
  }
 ],
 "metadata": {
  "kernelspec": {
   "display_name": "Python 3",
   "language": "python",
   "name": "python3"
  },
  "language_info": {
   "codemirror_mode": {
    "name": "ipython",
    "version": 3
   },
   "file_extension": ".py",
   "mimetype": "text/x-python",
   "name": "python",
   "nbconvert_exporter": "python",
   "pygments_lexer": "ipython3",
   "version": "3.7.2"
  },
  "varInspector": {
   "cols": {
    "lenName": 16,
    "lenType": 16,
    "lenVar": 40
   },
   "kernels_config": {
    "python": {
     "delete_cmd_postfix": "",
     "delete_cmd_prefix": "del ",
     "library": "var_list.py",
     "varRefreshCmd": "print(var_dic_list())"
    },
    "r": {
     "delete_cmd_postfix": ") ",
     "delete_cmd_prefix": "rm(",
     "library": "var_list.r",
     "varRefreshCmd": "cat(var_dic_list()) "
    }
   },
   "types_to_exclude": [
    "module",
    "function",
    "builtin_function_or_method",
    "instance",
    "_Feature"
   ],
   "window_display": false
  }
 },
 "nbformat": 4,
 "nbformat_minor": 4
 }
--- a/changelog.md
+++ b/changelog.md
@ -19,6 +19,7 @@ AGT - AGENT
 - ОБЩЕЕ
 - - Jupyter: запуск из других дисков, отличных от C://
 - - Utils: Функции подготовки файлов / директорий
 - - Utils: String - similarity
 [1.3.0]
 - ПОРТИРОВАНО НА LINUX (Ubuntu, Debian, Astra), адаптация функций