ros-drivers · lucasw · Jul 16, 2016 · Jul 16, 2016 · Jul 19, 2016 · Jul 23, 2016
diff --git a/audio_capture/launch/capture.launch b/audio_capture/launch/capture.launch
@@ -1,16 +1,19 @@
 <launch>
   <!-- arecord -l will show available input devices, use the car number as
       the first number and the subdevice number as the second in a string
-      like hw:1,0 -->
+      like hw:1,0
+      run "pacmd list-sources" to list the input specs
+      (but not all possible ones?)
+      -->
   <arg name="dst" default="appsink"/>
   <arg name="device" default=""/>
-  <arg name="format" default="mp3"/>
+  <arg name="format" default="mp3" doc="can only be mp3 or wave"/>
   <arg name="bitrate" default="128"/>
   <arg name="channels" default="1"/>
   <arg name="depth" default="16"/>
   <arg name="sample_rate" default="16000"/>
   <arg name="sample_format" default="S16LE"/>
-  <arg name="ns" default="audio"/>
+  <arg name="ns" default="audio" doc="namespace to run node in"/>
   <arg name="audio_topic" default="audio"/>
 
   <group ns="$(arg ns)">

diff --git a/audio_capture/scripts/audio_capture.py b/audio_capture/scripts/audio_capture.py
@@ -0,0 +1,82 @@
+#!/usr/bin/env python
+"""Play an mp3 file through a GStreamer 1.0 pipeline.
+
+Pipeline: filesrc -> mad -> audioconvert -> equalizer-3bands -> autoaudiosink.
+The rospy hooks are still commented out. Based on:
+https://adnanalamkhan.wordpress.com/2015/03/01/using-gstreamer-1-0-with-python/
+"""
+import sys
+
+import gi
+# import rospy
+
+gi.require_version('Gst', '1.0')
+# gi.require_version('Gtk', '3.0')
+# from gi.repository import Gtk
+from gi.repository import GObject
+from gi.repository import Gst as gst
+
+GObject.threads_init()
+gst.init(None)
+# rospy.init_node('audio_capture')
+
+# Create the pipeline for our elements.
+pipeline = gst.Pipeline()
+# Create the elements for our project.
+
+audio_source = gst.ElementFactory.make('filesrc', 'audio_source')
+# audio_source = gst.ElementFactory.make('alsasrc', 'audio_source')
+decode = gst.ElementFactory.make('mad', 'decode')
+convert = gst.ElementFactory.make('audioconvert', 'convert')
+equalizer = gst.ElementFactory.make('equalizer-3bands', 'equalizer')
+audio_sink = gst.ElementFactory.make('autoaudiosink', 'audio_sink')
+
+# Ensure all elements were created successfully
+# (make() yields a falsy value when an element cannot be created).
+if (not pipeline or not audio_source or not decode or
+    not convert or not equalizer or not audio_sink):
+    print('Not all elements could be created.')
+    sys.exit(-1)
+
+# Configure our elements.
+filename = 'blah'  # 'Kevin_MacLeod_-_05_-_Impact_Allegretto.mp3'
+audio_source.set_property('location', filename)
+equalizer.set_property('band1', -24.0)
+equalizer.set_property('band2', -24.0)
+
+# Add our elements to the pipeline.
+chain = [audio_source, decode, convert, equalizer, audio_sink]
+for element in chain:
+    pipeline.add(element)
+
+# Link our elements together, in order; link() returns False on failure.
+for upstream, downstream in zip(chain, chain[1:]):
+    if not upstream.link(downstream):
+        print('Could not link %s to %s.' %
+              (upstream.get_name(), downstream.get_name()))
+        sys.exit(-1)
+
+# Set our pipelines state to Playing.
+# check the following documentation whenever you get
+# some AttributeError.
+# link: http://lazka.github.io/pgi-docs/#Gst-1.0/flags.html
+pipeline.set_state(gst.State.PLAYING)
+
+# Wait until error or EOS.
+bus = pipeline.get_bus()
+wait_for = gst.MessageType.ERROR | gst.MessageType.EOS
+
+while True:  # not rospy.is_shutdown():
+    # Poll with a one second timeout (instead of gst.CLOCK_TIME_NONE) so a
+    # shutdown check can be added to the loop condition later.
+    # The timeout is an integer number of nanoseconds, so use gst.SECOND
+    # rather than the float 1e9.
+    msg = bus.timed_pop_filtered(gst.SECOND, wait_for)
+    if msg is None:
+        # Timed out with no ERROR/EOS yet: keep playing.
+        continue
+    print(msg)
+    break
+
+# Free resources.
+pipeline.set_state(gst.State.NULL)
diff --git a/audio_capture/src/audio_capture.cpp b/audio_capture/src/audio_capture.cpp
@@ -127,6 +127,22 @@ namespace audio_transport
             gst_bin_add_many( GST_BIN(_pipeline), _source, _filter, _sink, NULL);
             link_ok = gst_element_link_many( _source, _filter, _sink, NULL);
           }
+#if 0
+          GstCaps *caps;
+          // caps = gst_caps_new_simple("audio/x-raw-int",
+          caps = gst_caps_new_simple("audio/x-raw",
+                                     "channels", G_TYPE_INT, _channels,
+                                     "width",    G_TYPE_INT, _depth,
+                                     "depth",    G_TYPE_INT, _depth,
+                                     "rate",     G_TYPE_INT, _sample_rate,
+                                     "signed",   G_TYPE_BOOLEAN, TRUE,
+                                     NULL);
+
+          g_object_set( G_OBJECT(_sink), "caps", caps, NULL);
+          gst_caps_unref(caps);
+          gst_bin_add_many( GST_BIN(_pipeline), _source, _sink, NULL);
+          link_ok = gst_element_link_many( _source, _sink, NULL);
+#endif
         } else {
           ROS_ERROR_STREAM("format must be \"wave\" or \"mp3\"");
           exitOnMainThread(1);

diff --git a/audio_play/src/audio_play.cpp b/audio_play/src/audio_play.cpp
@@ -140,7 +140,7 @@ namespace audio_transport
         gst_buffer_unref(buffer);
       }
 
-     static void cb_newpad (GstElement *decodebin, GstPad *pad, 
+     static void cb_newpad (GstElement *decodebin, GstPad *pad,
                              gpointer data)
       {
         RosGstPlay *client = reinterpret_cast<RosGstPlay*>(data);

diff --git a/audio_to_float/.gitignore b/audio_to_float/.gitignore
@@ -0,0 +1 @@
+build
diff --git a/audio_to_float/CHANGELOG.rst b/audio_to_float/CHANGELOG.rst
@@ -0,0 +1,88 @@
+^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^
+Changelog for package audio_to_float
+^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^
+
+Forthcoming
+-----------
+* Changed message level to warning
+* Fixed problem that CMake uses gstreamer-0.1 instead of gstreamer-1.0
+* Fixed underflow.
+  Before the sink buffer underflows the pipeline is paused. When data is received again the pipeline is set to playing again.
+* Added gstreamer 1.0 dependencies
+* Ported to gstreamer 1.0
+  package.xml dependencies still missing
+* Contributors: Benny
+
+0.2.11 (2016-02-16)
+-------------------
+* Add changelogs
+* Contributors: trainman419
+
+0.2.10 (2016-01-21)
+-------------------
+* Add changelogs
+* Contributors: trainman419
+
+0.2.9 (2015-12-02)
+------------------
+* Add changelogs
+* Contributors: trainman419
+
+0.2.8 (2015-10-02)
+------------------
+* Changed message level to warning
+* Fixed underflow.
+  Before the sink buffer underflows the pipeline is paused. When data is received again the pipeline is set to playing again.
+* Change audio sink to autoaudiosink
+* Update maintainer email
+* Contributors: Benny, Hans Gaiser, trainman419
+
+0.2.7 (2014-07-25)
+------------------
+
+0.2.6 (2014-02-26)
+------------------
+* audio_capture and play _require\_ gstreamer, it's not optional
+* Contributors: v4hn
+
+0.2.5 (2014-01-23)
+------------------
+* "0.2.5"
+* Contributors: trainman419
+
+0.2.4 (2013-09-10)
+------------------
+
+0.2.3 (2013-07-15)
+------------------
+* Fix dependencies and install rules.
+* Contributors: Austin Hendrix
+
+0.2.2 (2013-04-10)
+------------------
+
+0.2.1 (2013-04-08 13:59)
+------------------------
+
+0.2.0 (2013-04-08 13:49)
+------------------------
+* Finish catkinizing audio_common.
+* Catkinize audio_play.
+* Fix typo in package.xml
+* Versions and more URLs.
+* Convert manifests to package.xml
+* Ditch old makefiles.
+* Updates manifest
+* Updated manifests for rosdep2
+* oneiric build fixes, bump version to 0.1.6
+* Removed another duplicate thread::thread
+* Added a rosdep.yaml file
+* Fixed to use audio_common_msgs
+* Added ability to use different festival voices
+* Updated documentation
+* Update to audio_play
+* Fixed ignore files
+* Added hgignore files
+* Audio_capture and audio_play working
+* Making separate audio_capture and audio_play packages
+* Contributors: Austin Hendrix, Brian Gerkey, Nate Koenig, nkoenig
diff --git a/audio_to_float/CMakeLists.txt b/audio_to_float/CMakeLists.txt
@@ -0,0 +1,41 @@
+cmake_minimum_required(VERSION 2.8.3)
+
+project(audio_to_float)
+
+find_package(catkin REQUIRED COMPONENTS cv_bridge roscpp audio_common_msgs)
+
+# pkg_check_modules() below is provided by PkgConfig, so fail here with a
+# clear message if pkg-config is not available.
+find_package(PkgConfig REQUIRED)
+pkg_check_modules(GST1.0 gstreamer-1.0 REQUIRED)
+pkg_check_modules(GSTAPP1.0 gstreamer-app-1.0 REQUIRED)
+
+find_package(Boost REQUIRED COMPONENTS thread)
+
+include_directories(
+  ${catkin_INCLUDE_DIRS}
+  ${Boost_INCLUDE_DIRS}
+  ${GST1.0_INCLUDE_DIRS}
+  ${GSTAPP1.0_INCLUDE_DIRS}
+)
+
+catkin_package()
+
+add_executable(audio_to_float src/audio_to_float.cpp)
+target_link_libraries(audio_to_float
+  ${catkin_LIBRARIES}
+  ${GST1.0_LIBRARIES}
+  ${GSTAPP1.0_LIBRARIES}
+  ${Boost_LIBRARIES}
+)
+# Build the targets exported by the catkin dependencies before this one.
+add_dependencies(audio_to_float ${catkin_EXPORTED_TARGETS})
+
+install(TARGETS audio_to_float
+   DESTINATION ${CATKIN_PACKAGE_BIN_DESTINATION})
+
+# NOTE(review): the launch files start Python nodes (view.py, spectrogram.py)
+# from this package; confirm whether they also need an install(PROGRAMS ...)
+# rule.
+install(DIRECTORY launch
+   DESTINATION ${CATKIN_PACKAGE_SHARE_DESTINATION})
diff --git a/audio_to_float/launch/audio_to_float.launch b/audio_to_float/launch/audio_to_float.launch
@@ -0,0 +1,13 @@
+<?xml version="1.0"?>
+<launch>
+  <arg name="ns" default="audio"/>
+
+  <include file="$(find audio_capture)/launch/capture.launch">
+  </include>
+  <group ns="$(arg ns)">
+  <node name="audio_to_float" pkg="audio_to_float" type="audio_to_float"
+      output="screen">
+  </node>
+  <node name="view" pkg="audio_to_float" type="view.py" />
+  </group>
+</launch>
diff --git a/audio_to_float/launch/spectrogram.launch b/audio_to_float/launch/spectrogram.launch
@@ -0,0 +1,22 @@
+<?xml version="1.0"?>
+<launch>
+
+  <arg name="float_sample_rate" default="16000"/>
+  <node name="gen_float" pkg="float_to_audio" type="gen_float.py"
+      output="screen" >
+    <param name="sample_rate" value="$(arg float_sample_rate)"/>
+  </node>
+
+  <node name="spectrogram" pkg="audio_to_float" type="spectrogram.py"
+      output="screen" >
+    <param name="sample_rate" value="$(arg float_sample_rate)"/>
+  </node>
+
+  <node name="view_input" pkg="audio_to_float" type="view.py">
+    <remap from="decoded" to="samples"/>
+    <remap from="image" to="image"/>
+    <param name="fade1" value="0.5"/>
+    <param name="fade2" value="0.5"/>
+  </node>
+
+</launch>
diff --git a/audio_to_float/mainpage.dox b/audio_to_float/mainpage.dox
@@ -0,0 +1,22 @@
+/**
+\mainpage
+\htmlinclude manifest.html
+
+\b audio_to_float is a package that converts a stream of gstreamer AudioData messages to a stream of floating point arrays.
+
+
+\section codeapi Code API
+
+<!--
+Provide links to specific auto-generated API documentation within your
+package that is of particular interest to a reader. Doxygen will
+document pretty much every part of your code, so do your best here to
+point the reader to the actual API.
+
+If your codebase is fairly large or has different sets of APIs, you
+should use the doxygen 'group' tag to keep these APIs together. For
+example, the roscpp documentation has 'libros' group.
+-->
+
+
+*/
diff --git a/audio_to_float/package.xml b/audio_to_float/package.xml
@@ -0,0 +1,32 @@
+<package>
+   <name>audio_to_float</name>
+   <version>0.2.7</version>
+   <description>
+      Converts a stream of gstreamer AudioData messages to a stream of floating point arrays.
+   </description>
+   <maintainer email="[email protected]">Lucas Walter</maintainer>
+   <author>Lucas Walter</author>
+   <license>BSD</license>
+   <url type="website">http://ros.org/wiki/audio_play</url>
+   <url type="repository">https://github.com/ros-drivers/audio_common</url>
+   <url type="bugtracker">https://github.com/ros-drivers/audio_common/issues</url>
+
+   <buildtool_depend>catkin</buildtool_depend>
+
+   <build_depend>cv_bridge</build_depend>
+   <build_depend>roscpp</build_depend>
+   <build_depend>audio_common_msgs</build_depend>
+   <build_depend>libgstreamer1.0-dev</build_depend>
+   <build_depend>libgstreamer-plugins-base1.0-dev</build_depend>
+
+   <run_depend>cv_bridge</run_depend>
+   <run_depend>roscpp</run_depend>
+   <run_depend>audio_common_msgs</run_depend>
+   <run_depend>libgstreamer1.0-0</run_depend>
+   <run_depend>libgstreamer-plugins-base1.0-0</run_depend>
+   <run_depend>gstreamer1.0-plugins-ugly</run_depend>
+   <run_depend>gstreamer1.0-plugins-good</run_depend>
+
+</package>
+
+
diff --git a/audio_to_float/scripts/spectrogram.py b/audio_to_float/scripts/spectrogram.py
@@ -0,0 +1,73 @@
+#!/usr/bin/env python
+
+import collections
+import numpy as np
+import rospy
+
+# from audio_common_msgs.msg import AudioData
+from cv_bridge import CvBridge
+from scipy import signal
+from sensor_msgs.msg import ChannelFloat32, Image
+
+
+class View():
+    """Publish a spectrogram image of the most recent audio samples.
+
+    Samples arriving on the "samples" topic (ChannelFloat32) are kept in a
+    fixed-length buffer; a 0.2 s timer turns the buffer contents into a
+    mono8 image that is published on "image_spectrogram".
+
+    Parameters (private namespace):
+        ~buffer_len: number of samples kept in the buffer (default 2**16).
+        ~sample_rate: sample rate passed to the spectrogram (default 44100).
+    """
+
+    def __init__(self):
+        self.bridge = CvBridge()
+        self.buffer_len = rospy.get_param("~buffer_len", 2**16)
+        # A deque with maxlen drops the oldest sample once it is full.
+        self.buffer = collections.deque(maxlen=self.buffer_len)
+        self.sample_rate = rospy.get_param("~sample_rate", 44100)
+        # self.window = 256
+        self.im = None
+        self.pub = rospy.Publisher("image_spectrogram", Image, queue_size=1)
+        self.sub = rospy.Subscriber("samples", ChannelFloat32,
+                                    self.audio_callback, queue_size=1)
+        self.timer = rospy.Timer(rospy.Duration(0.2), self.update)
+
+    def audio_callback(self, msg):
+        """Append every value of the incoming message to the buffer."""
+        self.buffer.extend(msg.values)
+
+    def update(self, event):
+        """Timer callback: compute and publish the spectrogram image.
+
+        Does nothing until the buffer has been completely filled once.
+        """
+        if len(self.buffer) < self.buffer_len:
+            return
+        # NOTE(review): audio_callback may append while this copy is being
+        # made if rospy runs the two callbacks on different threads -
+        # confirm whether a lock is needed.
+        samples = np.asarray(self.buffer)
+        # TODO(lucasw) this is hugely inefficient if it is re-calculating
+        # for samples that were processed in previous update.
+        _, _, Sxx = signal.spectrogram(samples, self.sample_rate, nperseg=512)
+        # TODO(lucasw) is there a standard spectrogram conversion?
+        Sxx = np.log(1.0 + Sxx * 2**16)
+        mins = np.min(Sxx)
+        maxs = np.max(Sxx)
+        Sxx -= mins
+        print(Sxx.shape, mins, maxs)
+        # Saturate at 255 before the cast; a bare astype(np.uint8) wraps
+        # values above 255 around instead of clamping them.
+        self.im = np.clip(Sxx * 50, 0, 255).astype(np.uint8)
+        # self.im[y0:y1+1, i, :] = 255
+        self.pub.publish(self.bridge.cv2_to_imgmsg(self.im, "mono8"))
+        # rospy.signal_shutdown("")
+
+
+if __name__ == '__main__':
+    rospy.init_node('spectrogram')
+    view = View()
+    rospy.spin()