From 0f163b5443ddc07ef0f87fee22ebab22bdb0b19d Mon Sep 17 00:00:00 2001
From: yomguy <yomguy@parisson.com>
Date: Thu, 25 Nov 2010 22:27:23 +0000
Subject: [PATCH] add analyzer batch

---
 timeside/tools/analyze_batch_awdio.py | 113 ++++++++++++++++++++++++
 timeside/tools/cache.py               | 118 ++++++++++++++++++++++++++
 2 files changed, 231 insertions(+)
 create mode 100644 timeside/tools/analyze_batch_awdio.py
 create mode 100644 timeside/tools/cache.py

diff --git a/timeside/tools/analyze_batch_awdio.py b/timeside/tools/analyze_batch_awdio.py
new file mode 100644
index 0000000..454cd88
--- /dev/null
+++ b/timeside/tools/analyze_batch_awdio.py
@@ -0,0 +1,113 @@
+#!/usr/bin/python
+# -*- coding: utf-8 -*-
+#
+# Copyright (c) 2009-2010 Guillaume Pellerin <yomguy@parisson.com>
+
+# This file is part of TimeSide.
+
+# TimeSide is free software: you can redistribute it and/or modify
+# it under the terms of the GNU General Public License as published by
+# the Free Software Foundation, either version 2 of the License, or
+# (at your option) any later version.
+
+# TimeSide is distributed in the hope that it will be useful,
+# but WITHOUT ANY WARRANTY; without even the implied warranty of
+# MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the
+# GNU General Public License for more details.
+
+# You should have received a copy of the GNU General Public License
+# along with TimeSide.  If not, see <http://www.gnu.org/licenses/>.
+
+# Author: Guillaume Pellerin <yomguy@parisson.com>
+
+version = '0.3'  # version string of this script; not referenced elsewhere in this file
+
+import os
+import sys
+import time
+import datetime
+import timeside
+from logger import Logger
+import Queue
+from threading import Thread
+from cache import Cache
+
+
+class Media2Analyzer(object):
+    """Run all TimeSide analyzers on a media tree, caching results as XML."""
+
+    def __init__(self, media_dir, dest_dir,  log_file):
+        """Scan media_dir for inputs; XML goes to dest_dir, logs to log_file."""
+        self.root_dir = media_dir
+        self.dest_dir = dest_dir
+        self.threads = 1
+        self.logger = Logger(log_file)
+        self.counter = 0
+        self.force = 0
+        # The class imported from cache is Cache; TelemetaCache is undefined.
+        self.cache = Cache(self.dest_dir)
+        self.media_list = self.get_media_list()
+        if not os.path.exists(self.dest_dir):
+            os.makedirs(self.dest_dir)
+        self.path_dict = self.get_path_dict()
+
+    def get_media_list(self):
+        """Return the paths of all non-hidden files found below root_dir."""
+        return [os.path.join(root, name)
+                for root, dirs, files in os.walk(self.root_dir)
+                for name in files if not name.startswith('.')]
+
+    def get_path_dict(self):
+        """Map each media path to the XML file name that receives its results."""
+        path_dict = {}
+        for media in self.media_list:
+            name = os.path.splitext(os.path.basename(media))[0]
+            dest_file = name + '.xml'
+            # Look in dest_dir: a bare name would be tested against the CWD.
+            # Existing results are skipped unless self.force is set.
+            dest_path = os.path.join(self.dest_dir, dest_file)
+            if self.force or not os.path.exists(dest_path):
+                path_dict[media] = dest_file
+        return path_dict
+
+    def process(self):
+        """Analyze each pending media file and store its results in the cache."""
+        for media, file in self.path_dict.items():
+            self.analyzers = timeside.core.processors(timeside.api.IAnalyzer)
+            self.logger.write_info('Processing ' + media)
+            # force must also override the cache check, as in get_path_dict.
+            if self.cache.exists(file) and not self.force:
+                continue
+            pipe = timeside.decoder.FileDecoder(media)
+            analyzers_sub = []
+            for analyzer in self.analyzers:
+                subpipe = analyzer()
+                analyzers_sub.append(subpipe)
+                pipe = pipe | subpipe
+            pipe.run()
+            analyzers = []
+            for analyzer in analyzers_sub:
+                value = analyzer.result()
+                if analyzer.id() == 'duration':
+                    value = datetime.timedelta(0, value)
+                analyzers.append({'name': analyzer.name(),
+                                  'id': analyzer.id(),
+                                  'unit': analyzer.unit(),
+                                  'value': str(value)})
+            self.cache.write_analyzer_xml(analyzers, file)
+
+
+if __name__ == '__main__':
+    # Three arguments are needed: with only two, sys.argv[-3] would be the
+    # script path itself and every value would shift by one position.
+    if len(sys.argv) < 4:
+        print """
+        Usage : python analyze_batch_awdio.py /path/to/media_dir /path/to/dest_dir /path/to/log_file
+
+        Dependencies : timeside, python, python-numpy, python-gst0.10, gstreamer0.10-plugins-base
+        See http://code.google.com/p/timeside/ for more information.
+        """
+    else:
+        media_dir, dest_dir, log_file = sys.argv[-3:]
+        m = Media2Analyzer(media_dir, dest_dir, log_file)
+        m.process()
diff --git a/timeside/tools/cache.py b/timeside/tools/cache.py
new file mode 100644
index 0000000..8decc97
--- /dev/null
+++ b/timeside/tools/cache.py
@@ -0,0 +1,118 @@
+#!/usr/bin/python
+# -*- coding: utf-8 -*-
+#
+# Copyright (C) 2006-2010 Guillaume Pellerin
+
+# <yomguy@parisson.com>
+
+# This software is a computer program whose purpose is to stream audio
+# and video data through icecast2 servers.
+
+# This software is governed by the CeCILL license under French law and
+# abiding by the rules of distribution of free software. You can use,
+# modify and/ or redistribute the software under the terms of the CeCILL
+# license as circulated by CEA, CNRS and INRIA at the following URL
+# "http://www.cecill.info".
+
+# As a counterpart to the access to the source code and  rights to copy,
+# modify and redistribute granted by the license, users are provided only
+# with a limited warranty and the software's author, the holder of the
+# economic rights, and the successive licensors have only limited
+# liability.
+
+# In this respect, the user's attention is drawn to the risks associated
+# with loading, using,  modifying and/or developing or reproducing the
+# software by the user in light of its specific status of free software,
+# that may mean that it is complicated to manipulate, and that also
+# therefore means that it is reserved for developers and  experienced
+# professionals having in-depth computer knowledge. Users are therefore
+# encouraged to load and test the software's suitability as regards their
+# requirements in conditions enabling the security of their systems and/or
+# data to be ensured and, more generally, to use and operate it in the
+# same conditions as regards security.
+
+# The fact that you are presently reading this means that you have had
+# knowledge of the CeCILL license and that you accept its terms.
+
+# Author: Guillaume Pellerin <yomguy@parisson.com>
+
+import os
+import xml.dom.minidom
+
+
+class Cache(object):
+    """Flat file cache rooted at one directory, with XML analyzer helpers."""
+
+    def __init__(self, dir, params=None):
+        """Remember the cache directory and list the files already in it."""
+        self.dir = dir
+        self.params = params
+        self.files = self.get_files()
+
+    def get_files(self):
+        """Return the base names of every file found below the cache dir."""
+        names = []
+        for root, dirs, files in os.walk(self.dir):
+            names.extend(files)
+        return names
+
+    def exists(self, file):
+        """Rescan the cache and tell whether a file named `file` is in it."""
+        self.files = self.get_files()
+        return file in self.files
+
+    def write_bin(self, data, file):
+        """Write `data` to `file` inside the cache directory."""
+        # Binary mode keeps the bytes intact on platforms that translate '\n'.
+        with open(os.path.join(self.dir, file), 'wb') as f:
+            f.write(data)
+
+    def read_bin(self, file):
+        """Return the whole content of cached `file`."""
+        with open(os.path.join(self.dir, file), 'rb') as f:
+            return f.read()
+
+    def read_stream_bin(self, file):
+        """Yield the content of cached `file` in chunks of 0x1000 bytes."""
+        chunk_size = 0x1000
+        # `with` closes the file even if the consumer abandons the generator.
+        with open(os.path.join(self.dir, file), 'rb') as f:
+            while True:
+                _chunk = f.read(chunk_size)
+                if not _chunk:
+                    break
+                yield _chunk
+
+    def write_stream_bin(self, chunk, file_object):
+        """Write one chunk to an already opened file object."""
+        file_object.write(chunk)
+
+    def read_analyzer_xml(self, file):
+        """Parse cached XML `file` into a list of analyzer result dicts.
+
+        Each <data> element yields a dict with 'name', 'id', 'unit', 'value'.
+        """
+        doc = xml.dom.minidom.parse(os.path.join(self.dir, file))
+        results = []
+        for node in doc.documentElement.getElementsByTagName('data'):
+            results.append(dict((key, node.getAttribute(key))
+                                for key in ('name', 'id', 'unit', 'value')))
+        return results
+
+    def write_analyzer_xml(self, data_list, file):
+        """Write analyzer result dicts as <data> nodes under <telemeta>.
+
+        Each item of data_list needs 'name', 'id', 'unit' and 'value' keys.
+        """
+        doc = xml.dom.minidom.Document()
+        root = doc.createElement('telemeta')
+        doc.appendChild(root)
+        for data in data_list:
+            node = doc.createElement('data')
+            node.setAttribute('name', data['name'])
+            node.setAttribute('id', data['id'])
+            node.setAttribute('unit', data['unit'])
+            node.setAttribute('value', str(data['value']))
+            root.appendChild(node)
+        with open(os.path.join(self.dir, file), 'w') as f:
+            f.write(doc.toprettyxml())
-- 
2.47.3