moved to github

worldveil 2013-11-18 21:51:27 -05:00
commit 90a93bc47b
15 changed files with 962 additions and 0 deletions

7
.gitignore vendored Normal file

@@ -0,0 +1,7 @@
*.pyc
wav
mp3
*.wav
*.mp3
.DS_Store
*.cnf

BIN
README.md Normal file

Binary file not shown.

0
dejavu/__init__.py Normal file

106
dejavu/control.py Normal file

@@ -0,0 +1,106 @@
from dejavu.database import SQLDatabase
from dejavu.convert import Converter
from dejavu.fingerprint import Fingerprinter
from scipy.io import wavfile
from multiprocessing import Process
import wave, os
import random
class Dejavu():
def __init__(self, config):
self.config = config
# create components
self.converter = Converter()
self.fingerprinter = Fingerprinter(self.config)
self.fingerprinter.db.setup()
# get songs previously indexed
self.songs = self.fingerprinter.db.get_songs()
self.songnames_set = set() # to know which ones we've computed before
if self.songs:
for song in self.songs:
song_id = song[SQLDatabase.FIELD_SONG_ID]
song_name = song[SQLDatabase.FIELD_SONGNAME]
self.songnames_set.add(song_name)
print "Added: %s to the set of fingerprinted songs..." % song_name
def chunkify(self, lst, n):
"""
Splits a list into roughly n equal parts.
http://stackoverflow.com/questions/2130016/splitting-a-list-of-arbitrary-size-into-only-roughly-n-equal-parts
"""
return [lst[i::n] for i in xrange(n)]
def fingerprint(self, path, output, extensions, nprocesses):
# convert files, shuffle order
files = self.converter.find_files(path, extensions)
random.shuffle(files)
files_split = self.chunkify(files, nprocesses)
# split into processes here
processes = []
for i in range(nprocesses):
# need database instance since mysql connections shouldn't be shared across processes
sql_connection = SQLDatabase(
self.config.get(SQLDatabase.CONNECTION, SQLDatabase.KEY_HOSTNAME),
self.config.get(SQLDatabase.CONNECTION, SQLDatabase.KEY_USERNAME),
self.config.get(SQLDatabase.CONNECTION, SQLDatabase.KEY_PASSWORD),
self.config.get(SQLDatabase.CONNECTION, SQLDatabase.KEY_DATABASE))
# create process and start it
p = Process(target=self.fingerprint_worker, args=(files_split[i], sql_connection, output))
p.start()
processes.append(p)
# wait for all processes to complete
for p in processes:
p.join()
# delete orphans
print "Done fingerprinting. Deleting orphaned fingerprints..."
self.fingerprinter.db.delete_orphans()
def fingerprint_worker(self, files, sql_connection, output):
for filename, extension in files:
# if there are already fingerprints in database, don't re-fingerprint or convert
song_name = os.path.basename(filename).split(".")[0]
if song_name in self.songnames_set:
print "-> Already fingerprinted, continuing..."
continue
# convert to WAV
wavout_path = self.converter.convert(filename, extension, Converter.WAV, output, song_name)
# insert song name into database
song_id = sql_connection.insert_song(song_name)
# for each channel perform FFT analysis and fingerprinting
channels = self.extract_channels(wavout_path)
for c in range(len(channels)):
channel = channels[c]
print "-> Fingerprinting channel %d of song %s..." % (c+1, song_name)
self.fingerprinter.fingerprint(channel, wavout_path, song_id, c+1)
# only confirm the song once fingerprinting is complete
sql_connection.set_song_fingerprinted(song_id)
def extract_channels(self, path):
"""
Reads channels from disk.
"""
channels = []
Fs, frames = wavfile.read(path)
wave_object = wave.open(path)
nchannels, sampwidth, framerate, num_frames, comptype, compname = wave_object.getparams()
assert Fs == self.fingerprinter.Fs
for channel in range(nchannels):
channels.append(frames[:, channel])
return channels
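
The stride-based chunkify above splits the file list across worker processes without needing len(lst) to divide evenly by n. A quick sketch of what it produces for 10 files and 3 processes:

# stride-based split, as in Dejavu.chunkify (lst[i::n] for each i)
lst = range(10)
print [lst[i::3] for i in xrange(3)]   # [[0, 3, 6, 9], [1, 4, 7], [2, 5, 8]]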

54
dejavu/convert.py Normal file

@@ -0,0 +1,54 @@
import os, fnmatch
from pydub import AudioSegment
class Converter():
WAV = "wav"
MP3 = "mp3"
FORMATS = [
WAV,
MP3]
def __init__(self):
pass
def ensure_folder(self, extension):
if not os.path.exists(extension):
os.makedirs(extension)
def find_files(self, path, extensions):
filepaths = []
extensions = [e.replace(".", "") for e in extensions if e.replace(".", "") in Converter.FORMATS]
print "Supported formats: %s" % extensions
for dirpath, dirnames, files in os.walk(path) :
for extension in extensions:
for f in fnmatch.filter(files, "*.%s" % extension):
p = os.path.join(dirpath, f)
renamed = p.replace(" ", "_")
os.rename(p, renamed)
#print "Found file: %s with extension %s" % (renamed, extension)
filepaths.append((renamed, extension))
return filepaths
def convert(self, orig_path, from_format, to_format, output_folder, song_name):
# start conversion
self.ensure_folder(output_folder)
print "-> Now converting: %s from %s format to %s format..." % (song_name, from_format, to_format)
# MP3 --> WAV
if from_format == Converter.MP3 and to_format == Converter.WAV:
newpath = os.path.join(output_folder, "%s.%s" % (song_name, Converter.WAV))
if os.path.isfile(newpath):
print "-> Already converted, skipping..."
else:
mp3file = AudioSegment.from_mp3(orig_path)
mp3file.export(newpath, format=Converter.WAV)
# unsupported
else:
print "CONVERSION ERROR:\nThe conversion from %s to %s is not supported!" % (from_format, to_format)
print "-> Conversion complete."
return newpath

320
dejavu/database.py Normal file

@@ -0,0 +1,320 @@
import MySQLdb as mysql
import MySQLdb.cursors as cursors
import os
class SQLDatabase():
"""
Queries:
1) Find duplicates (shouldn't be any, though):
select `hash`, `song_id`, `offset`, count(*) cnt
from fingerprints
group by `hash`, `song_id`, `offset`
having cnt > 1
order by cnt asc;
2) Get number of hashes by song:
select song_id, song_name, count(song_id) as num
from fingerprints
natural join songs
group by song_id
order by count(song_id) desc;
3) Get hashes with the highest number of collisions:
select
hash,
count(distinct song_id) as n
from fingerprints
group by `hash`
order by n DESC;
=> 26 different songs with same fingerprint (392 times):
select songs.song_name, fingerprints.offset
from fingerprints natural join songs
where fingerprints.hash = "08d3c833b71c60a7b620322ac0c0aba7bf5a3e73";
"""
# config keys
CONNECTION = "connection"
KEY_USERNAME = "username"
KEY_DATABASE = "database"
KEY_PASSWORD = "password"
KEY_HOSTNAME = "hostname"
# tables
FINGERPRINTS_TABLENAME = "fingerprints"
SONGS_TABLENAME = "songs"
# fields
FIELD_HASH = "hash"
FIELD_SONG_ID = "song_id"
FIELD_OFFSET = "offset"
FIELD_SONGNAME = "song_name"
FIELD_FINGERPRINTED = "fingerprinted"
# creates
CREATE_FINGERPRINTS_TABLE = """
CREATE TABLE IF NOT EXISTS `%s` (
`%s` binary(10) not null,
`%s` mediumint unsigned not null,
`%s` int unsigned not null,
INDEX(%s),
UNIQUE(%s, %s, %s)
);""" % (FINGERPRINTS_TABLENAME, FIELD_HASH,
FIELD_SONG_ID, FIELD_OFFSET, FIELD_HASH,
FIELD_SONG_ID, FIELD_OFFSET, FIELD_HASH)
CREATE_SONGS_TABLE = """
CREATE TABLE IF NOT EXISTS `%s` (
`%s` mediumint unsigned not null auto_increment,
`%s` varchar(250) not null,
`%s` tinyint default 0,
PRIMARY KEY (`%s`),
UNIQUE KEY `%s` (`%s`)
);""" % (SONGS_TABLENAME, FIELD_SONG_ID, FIELD_SONGNAME, FIELD_FINGERPRINTED,
FIELD_SONG_ID, FIELD_SONG_ID, FIELD_SONG_ID)
# inserts
INSERT_FINGERPRINT = "INSERT IGNORE INTO %s (%s, %s, %s) VALUES (UNHEX(%%s), %%s, %%s)" % (
FINGERPRINTS_TABLENAME, FIELD_HASH, FIELD_SONG_ID, FIELD_OFFSET) # ignore duplicates and don't insert them
INSERT_SONG = "INSERT INTO %s (%s) VALUES (%%s);" % (
SONGS_TABLENAME, FIELD_SONGNAME)
# selects
SELECT = "SELECT %s, %s FROM %s WHERE %s = UNHEX(%%s);" % (FIELD_SONG_ID, FIELD_OFFSET, FINGERPRINTS_TABLENAME, FIELD_HASH)
SELECT_ALL = "SELECT %s, %s FROM %s;" % (FIELD_SONG_ID, FIELD_OFFSET, FINGERPRINTS_TABLENAME)
SELECT_SONG = "SELECT %s FROM %s WHERE %s = %%s" % (FIELD_SONGNAME, SONGS_TABLENAME, FIELD_SONG_ID)
SELECT_NUM_FINGERPRINTS = "SELECT COUNT(*) as n FROM %s" % (FINGERPRINTS_TABLENAME)
SELECT_UNIQUE_SONG_IDS = "SELECT COUNT(DISTINCT %s) as n FROM %s WHERE %s = 1;" % (FIELD_SONG_ID, SONGS_TABLENAME, FIELD_FINGERPRINTED)
SELECT_SONGS = "SELECT %s, %s FROM %s WHERE %s = 1;" % (FIELD_SONG_ID, FIELD_SONGNAME, SONGS_TABLENAME, FIELD_FINGERPRINTED)
# drops
DROP_FINGERPRINTS = "DROP TABLE IF EXISTS %s;" % FINGERPRINTS_TABLENAME
DROP_SONGS = "DROP TABLE IF EXISTS %s;" % SONGS_TABLENAME
# update
UPDATE_SONG_FINGERPRINTED = "UPDATE %s SET %s = 1 WHERE %s = %%s" % (SONGS_TABLENAME, FIELD_FINGERPRINTED, FIELD_SONG_ID)
# delete
DELETE_UNFINGERPRINTED = "DELETE FROM %s WHERE %s = 0;" % (SONGS_TABLENAME, FIELD_FINGERPRINTED)
DELETE_ORPHANS = ""
def __init__(self, hostname, username, password, database):
# connect
self.database = database
try:
# http://www.halfcooked.com/mt/archives/000969.html
self.connection = mysql.connect(
hostname, username, password,
database, cursorclass=cursors.DictCursor)
self.connection.autocommit(False) # for fast bulk inserts
self.cursor = self.connection.cursor()
except mysql.Error, e:
print "Connection error %d: %s" % (e.args[0], e.args[1])
def setup(self):
try:
# create fingerprints table
self.cursor.execute("USE %s;" % self.database)
self.cursor.execute(SQLDatabase.CREATE_FINGERPRINTS_TABLE)
self.cursor.execute(SQLDatabase.CREATE_SONGS_TABLE)
self.delete_unfingerprinted_songs()
self.connection.commit()
except mysql.Error, e:
print "Connection error %d: %s" % (e.args[0], e.args[1])
self.connection.rollback()
def empty(self):
"""
Drops all tables and re-adds them. Be careful with this!
"""
try:
self.cursor.execute("USE %s;" % self.database)
# drop tables
self.cursor.execute(SQLDatabase.DROP_FINGERPRINTS)
self.cursor.execute(SQLDatabase.DROP_SONGS)
# recreate
self.cursor.execute(SQLDatabase.CREATE_FINGERPRINTS_TABLE)
self.cursor.execute(SQLDatabase.CREATE_SONGS_TABLE)
self.connection.commit()
except mysql.Error, e:
print "Error in empty(), %d: %s" % (e.args[0], e.args[1])
self.connection.rollback()
def delete_orphans(self):
try:
self.cursor = self.connection.cursor()
self.cursor.execute(SQLDatabase.DELETE_ORPHANS)
self.connection.commit()
except mysql.Error, e:
print "Error in delete_orphans(), %d: %s" % (e.args[0], e.args[1])
self.connection.rollback()
def delete_unfingerprinted_songs(self):
try:
self.cursor = self.connection.cursor()
self.cursor.execute(SQLDatabase.DELETE_UNFINGERPRINTED)
self.connection.commit()
except mysql.Error, e:
print "Error in delete_unfingerprinted_songs(), %d: %s" % (e.args[0], e.args[1])
self.connection.rollback()
def get_num_songs(self):
"""
Returns the number of songs the database has fingerprinted.
"""
try:
self.cursor = self.connection.cursor()
self.cursor.execute(SQLDatabase.SELECT_UNIQUE_SONG_IDS)
record = self.cursor.fetchone()
return int(record['n'])
except mysql.Error, e:
print "Error in get_num_songs(), %d: %s" % (e.args[0], e.args[1])
def get_num_fingerprints(self):
"""
Returns the number of fingerprints stored in the database.
"""
try:
self.cursor = self.connection.cursor()
self.cursor.execute(SQLDatabase.SELECT_NUM_FINGERPRINTS)
record = self.cursor.fetchone()
return int(record['n'])
except mysql.Error, e:
print "Error in get_num_songs(), %d: %s" % (e.args[0], e.args[1])
def set_song_fingerprinted(self, song_id):
"""
Set the fingerprinted flag to TRUE (1) once a song has been completely
fingerprinted in the database.
"""
try:
self.cursor = self.connection.cursor()
self.cursor.execute(SQLDatabase.UPDATE_SONG_FINGERPRINTED, song_id)
self.connection.commit()
except mysql.Error, e:
print "Error in set_song_fingerprinted(), %d: %s" % (e.args[0], e.args[1])
self.connection.rollback()
def get_songs(self):
"""
Return songs that have the fingerprinted flag set TRUE (1).
"""
try:
self.cursor.execute(SQLDatabase.SELECT_SONGS)
return self.cursor.fetchall()
except mysql.Error, e:
print "Error in get_songs(), %d: %s" % (e.args[0], e.args[1])
return None
def get_song_by_id(self, sid):
"""
Returns song by its ID.
"""
try:
self.cursor.execute(SQLDatabase.SELECT_SONG, (sid,))
return self.cursor.fetchone()
except mysql.Error, e:
print "Error in get_songs(), %d: %s" % (e.args[0], e.args[1])
return None
def insert(self, key, value):
"""
Insert a (sha1, song_id, offset) row into database.
key is a sha1 hash, value = (song_id, offset)
"""
try:
args = (key, value[0], value[1])
self.cursor.execute(SQLDatabase.INSERT_FINGERPRINT, args)
except mysql.Error, e:
print "Error in insert(), %d: %s" % (e.args[0], e.args[1])
self.connection.rollback()
def insert_song(self, songname):
"""
Inserts song in the database and returns the ID of the inserted record.
"""
try:
self.cursor.execute(SQLDatabase.INSERT_SONG, (songname,))
self.connection.commit()
return int(self.cursor.lastrowid)
except mysql.Error, e:
print "Error in insert_song(), %d: %s" % (e.args[0], e.args[1])
self.connection.rollback()
return None
def query(self, key):
"""
Return all tuples associated with hash.
If hash is None, returns all entries in the
database (be careful with that one!).
"""
# select all if no key
if key is not None:
sql = SQLDatabase.SELECT
else:
sql = SQLDatabase.SELECT_ALL
matches = []
try:
self.cursor.execute(sql, (key,))
# collect all matches
records = self.cursor.fetchall()
for record in records:
matches.append((record[SQLDatabase.FIELD_SONG_ID], record[SQLDatabase.FIELD_OFFSET]))
except mysql.Error, e:
print "Error in query(), %d: %s" % (e.args[0], e.args[1])
return matches
def get_iterable_kv_pairs(self):
"""
Returns all tuples in database.
"""
return self.query(None)
def insert_hashes(self, hashes):
"""
Insert series of hash => song_id, offset
values into the database.
"""
for h in hashes:
sha1, val = h
self.insert(sha1, val)
self.connection.commit()
def return_matches(self, hashes):
"""
Return the (song_id, offset_diff) tuples associated with
a list of
sha1 => (None, sample_offset)
values.
"""
matches = []
for h in hashes:
sha1, val = h
list_of_tups = self.query(sha1)
if list_of_tups:
for t in list_of_tups:
# (song_id, db_offset, song_sampled_offset)
matches.append((t[0], t[1] - val[1]))
return matches
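
One detail worth spelling out: the `hash` column is binary(10) because only the first 20 hex characters of each SHA-1 digest are stored (see generate_hashes in fingerprint.py), and UNHEX() turns 20 hex characters into exactly 10 bytes. A small sketch, with an arbitrary "freq1|freq2|t_delta" input:

import hashlib

h = hashlib.sha1("225|2564|5").hexdigest()[0:20]  # 20 hex chars, as stored by generate_hashes()
print h, len(h)                                   # 20 hex characters
print len(h.decode("hex"))                        # 10 bytes -> fits the binary(10) `hash` column
# INSERT_FINGERPRINT above resolves to:
#   INSERT IGNORE INTO fingerprints (hash, song_id, offset) VALUES (UNHEX(%s), %s, %s)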

224
dejavu/fingerprint.py Normal file

@@ -0,0 +1,224 @@
import numpy as np
import matplotlib.mlab as mlab
import matplotlib.pyplot as plt
import matplotlib.image as mpimg
from scipy.io import wavfile
from scipy.ndimage.filters import maximum_filter
from scipy.ndimage.morphology import generate_binary_structure, iterate_structure, binary_erosion
from dejavu.database import SQLDatabase
import os
import wave
import sys
import time
import hashlib
import pickle
class Fingerprinter():
IDX_FREQ_I = 0
IDX_TIME_J = 1
DEFAULT_FS = 44100
DEFAULT_WINDOW_SIZE = 4096
DEFAULT_OVERLAP_RATIO = 0.5
DEFAULT_FAN_VALUE = 15
DEFAULT_AMP_MIN = 10
PEAK_NEIGHBORHOOD_SIZE = 20
MIN_HASH_TIME_DELTA = 0
def __init__(self, config,
Fs=DEFAULT_FS,
wsize=DEFAULT_WINDOW_SIZE,
wratio=DEFAULT_OVERLAP_RATIO,
fan_value=DEFAULT_FAN_VALUE,
amp_min=DEFAULT_AMP_MIN):
self.config = config
database = SQLDatabase(
self.config.get(SQLDatabase.CONNECTION, SQLDatabase.KEY_HOSTNAME),
self.config.get(SQLDatabase.CONNECTION, SQLDatabase.KEY_USERNAME),
self.config.get(SQLDatabase.CONNECTION, SQLDatabase.KEY_PASSWORD),
self.config.get(SQLDatabase.CONNECTION, SQLDatabase.KEY_DATABASE))
self.db = database
self.Fs = Fs
self.dt = 1.0 / self.Fs
self.window_size = wsize
self.window_overlap_ratio = wratio
self.fan_value = fan_value
self.noverlap = int(self.window_size * self.window_overlap_ratio)
self.amp_min = amp_min
def fingerprint(self, samples, path, sid, cid):
"""Used for learning known songs"""
hashes = self.process_channel(samples, song_id=sid)
print "Generated %d hashes" % len(hashes)
self.db.insert_hashes(hashes)
def match(self, samples):
"""Used for matching unknown songs"""
hashes = self.process_channel(samples)
matches = self.db.return_matches(hashes)
return matches
def process_channel(self, channel_samples, song_id=None):
"""
FFT the channel, log transform output, find local maxima, then return
locality-sensitive hashes.
"""
# FFT the signal and extract frequency components
arr2D = mlab.specgram(
channel_samples,
NFFT=self.window_size,
Fs=self.Fs,
window=mlab.window_hanning,
noverlap=self.noverlap)[0]
# apply log transform since specgram() returns linear array
arr2D = 10 * np.log10(arr2D)
arr2D[arr2D == -np.inf] = 0 # replace infs with zeros
# find local maxima
local_maxima = self.get_2D_peaks(arr2D, plot=False)
# return hashes
return self.generate_hashes(local_maxima, song_id=song_id)
def get_2D_peaks(self, arr2D, plot=False):
# http://docs.scipy.org/doc/scipy/reference/generated/scipy.ndimage.morphology.iterate_structure.html#scipy.ndimage.morphology.iterate_structure
struct = generate_binary_structure(2, 1)
neighborhood = iterate_structure(struct, Fingerprinter.PEAK_NEIGHBORHOOD_SIZE)
# find local maxima using our filter shape
local_max = maximum_filter(arr2D, footprint=neighborhood) == arr2D
background = (arr2D == 0)
eroded_background = binary_erosion(background, structure=neighborhood, border_value=1)
detected_peaks = local_max - eroded_background # this is a boolean mask of arr2D with True at peaks
# extract peaks
amps = arr2D[detected_peaks]
j, i = np.where(detected_peaks)
# filter peaks
amps = amps.flatten()
peaks = zip(i, j, amps)
peaks_filtered = [x for x in peaks if x[2] > self.amp_min] # time, freq, amp
# get indices for frequency and time
frequency_idx = [x[1] for x in peaks_filtered]
time_idx = [x[0] for x in peaks_filtered]
if plot:
# scatter of the peaks
fig, ax = plt.subplots()
ax.imshow(arr2D)
ax.scatter(time_idx, frequency_idx)
ax.set_xlabel('Time')
ax.set_ylabel('Frequency')
ax.set_title("Spectrogram of \"Blurred Lines\" by Robin Thicke");
plt.gca().invert_yaxis()
plt.show()
return zip(frequency_idx, time_idx)
def generate_hashes(self, peaks, song_id=None):
"""
Hash list structure:
sha1-hash[0:20] song_id, time_offset
[(e05b341a9b77a51fd26, (3, 32)), ... ]
"""
fingerprinted = set() # to avoid rehashing same pairs
hashes = []
for i in range(len(peaks)):
for j in range(self.fan_value):
if i+j < len(peaks) and not (i, i+j) in fingerprinted:
freq1 = peaks[i][Fingerprinter.IDX_FREQ_I]
freq2 = peaks[i+j][Fingerprinter.IDX_FREQ_I]
t1 = peaks[i][Fingerprinter.IDX_TIME_J]
t2 = peaks[i+j][Fingerprinter.IDX_TIME_J]
t_delta = t2 - t1
if t_delta >= Fingerprinter.MIN_HASH_TIME_DELTA:
h = hashlib.sha1("%s|%s|%s" % (str(freq1), str(freq2), str(t_delta)))
hashes.append((h.hexdigest()[0:20], (song_id, t1)))
# ensure we don't repeat hashing
fingerprinted.add((i, i+j))
return hashes
def insert_into_db(self, key, value):
self.db.insert(key, value)
def print_stats(self):
iterable = self.db.get_iterable_kv_pairs()
counter = {}
for t in iterable:
sid, toff = t
if not sid in counter:
counter[sid] = 1
else:
counter[sid] += 1
for song_id, count in counter.iteritems():
song_name = self.song_names[song_id]
print "%s has %d spectrogram peaks" % (song_name, count)
def set_song_names(self, wpaths):
self.song_names = wpaths
def align_matches(self, matches, starttime, record_seconds=0, verbose=False):
"""
Finds hash matches that align in time with other matches and finds
consensus about which hashes are "true" signal from the audio.
Returns a dictionary with match information.
"""
# align by diffs
diff_counter = {}
largest = 0
largest_count = 0
song_id = -1
for tup in matches:
sid, diff = tup
if not diff in diff_counter:
diff_counter[diff] = {}
if not sid in diff_counter[diff]:
diff_counter[diff][sid] = 0
diff_counter[diff][sid] += 1
if diff_counter[diff][sid] > largest_count:
largest = diff
largest_count = diff_counter[diff][sid]
song_id = sid
if verbose: print "Diff is %d with %d offset-aligned matches" % (largest, largest_count)
#from collections import OrderedDict
#print OrderedDict(diff_counter)
# extract identification
songname = self.db.get_song_by_id(song_id)[SQLDatabase.FIELD_SONGNAME]
songname = songname.replace("_", " ")
elapsed = time.time() - starttime
if verbose:
print "Song is %s (song ID = %d) identification took %f seconds" % (songname, song_id, elapsed)
# return match info
song = {
"song_id" : song_id,
"song_name" : songname,
"match_time" : elapsed,
"confidence" : largest_count
}
if record_seconds:
song['record_time'] = record_seconds
return song
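
To make the alignment step concrete: return_matches yields (song_id, db_offset - sample_offset) pairs, and align_matches picks the song whose offset difference repeats most often. A toy sketch of that counting, with made-up song IDs and offsets:

# made-up (song_id, offset_difference) pairs; the real ones come from return_matches()
matches = [(1, 57), (2, 13), (1, 57), (1, 57), (3, 92), (1, 58)]
diff_counter = {}
best_count, best_song, best_diff = 0, -1, 0
for sid, diff in matches:
    diff_counter.setdefault(diff, {}).setdefault(sid, 0)
    diff_counter[diff][sid] += 1
    if diff_counter[diff][sid] > best_count:
        best_count, best_song, best_diff = diff_counter[diff][sid], sid, diff
print "song %d wins with %d matches aligned at diff %d" % (best_song, best_count, best_diff)
# song 1 wins with 3 matches aligned at diff 57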

72
dejavu/recognize.py Normal file

@@ -0,0 +1,72 @@
from multiprocessing import Queue, Process
from dejavu.database import SQLDatabase
from scipy.io import wavfile
import wave
import numpy as np
import pyaudio
import sys
import time
import array
class Recognizer(object):
CHUNK = 8192 # 44100 is a multiple of 1225
FORMAT = pyaudio.paInt16
CHANNELS = 2
RATE = 44100
def __init__(self, fingerprinter, config):
self.fingerprinter = fingerprinter
self.config = config
self.audio = pyaudio.PyAudio()
def read(self, filename, verbose=False):
# read file into channels
channels = []
Fs, frames = wavfile.read(filename)
wave_object = wave.open(filename)
nchannels, sampwidth, framerate, num_frames, comptype, compname = wave_object.getparams()
for channel in range(nchannels):
channels.append(frames[:, channel])
# get matches
starttime = time.time()
matches = []
for channel in channels:
matches.extend(self.fingerprinter.match(channel))
return self.fingerprinter.align_matches(matches, starttime, verbose=verbose)
def listen(self, seconds=10, verbose=False):
# open stream
stream = self.audio.open(format=Recognizer.FORMAT,
channels=Recognizer.CHANNELS,
rate=Recognizer.RATE,
input=True,
frames_per_buffer=Recognizer.CHUNK)
# record
if verbose: print("* recording")
left, right = [], []
for i in range(0, int(Recognizer.RATE / Recognizer.CHUNK * seconds)):
data = stream.read(Recognizer.CHUNK)
nums = np.fromstring(data, np.int16)
left.extend(nums[1::2])
right.extend(nums[0::2])
if verbose: print("* done recording")
# close and stop the stream
stream.stop_stream()
stream.close()
# match both channels
starttime = time.time()
matches = []
matches.extend(self.fingerprinter.match(left))
matches.extend(self.fingerprinter.match(right))
# align and return
return self.fingerprinter.align_matches(matches, starttime, record_seconds=seconds, verbose=verbose)

20
go.py Normal file

@@ -0,0 +1,20 @@
from dejavu.control import Dejavu
from ConfigParser import ConfigParser
import warnings
warnings.filterwarnings("ignore")
# load config
config = ConfigParser()
config.read("dejavu.cnf")
# create Dejavu object
dejavu = Dejavu(config)
dejavu.fingerprint("va_us_top_40/mp3", "va_us_top_40/wav", [".mp3"], 5)
# recognize microphone audio
from dejavu.recognize import Recognizer
recognizer = Recognizer(dejavu.fingerprinter, config)
# recognize song playing over microphone for 1 second
song = recognizer.listen(seconds=1, verbose=True)
print song
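
go.py expects a dejavu.cnf next to it; from the SQLDatabase config keys, that file needs a [connection] section with hostname, username, password and database entries. A sketch that writes one (the credential values are placeholders, matching the ones hard-coded in performance.py):

# writes a minimal dejavu.cnf; hostname/username/password/database values are placeholders
from ConfigParser import ConfigParser

config = ConfigParser()
config.add_section("connection")
config.set("connection", "hostname", "localhost")
config.set("connection", "username", "root")
config.set("connection", "password", "root")
config.set("connection", "database", "dejavu")
with open("dejavu.cnf", "w") as f:
    config.write(f)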

159
performance.py Normal file

@@ -0,0 +1,159 @@
from dejavu.control import Dejavu
from dejavu.recognize import Recognizer
from dejavu.convert import Converter
from dejavu.database import SQLDatabase
from ConfigParser import ConfigParser
from scipy.io import wavfile
import matplotlib.pyplot as plt
import warnings
import pyaudio
import os, wave, sys
import random
import numpy as np
warnings.filterwarnings("ignore")
config = ConfigParser()
config.read("dejavu.cnf")
dejavu = Dejavu(config)
recognizer = Recognizer(dejavu.fingerprinter, config)
def test_recording_lengths(recognizer):
# settings for run
RATE = 44100
FORMAT = pyaudio.paInt16
padding_seconds = 10
SONG_PADDING = RATE * padding_seconds
OUTPUT_FILE = "output.wav"
p = pyaudio.PyAudio()
c = Converter()
files = c.find_files("va_us_top_40/wav/", [".wav"])[-25:]
total = len(files)
recording_lengths = [4]
correct = 0
count = 0
score = {}
for r in recording_lengths:
RECORD_LENGTH = RATE * r
for tup in files:
f, ext = tup
# read the file
#print "reading: %s" % f
Fs, frames = wavfile.read(f)
wave_object = wave.open(f)
nchannels, sampwidth, framerate, num_frames, comptype, compname = wave_object.getparams()
# choose a random segment of audio to play
possible_end = num_frames - SONG_PADDING - RECORD_LENGTH
possible_start = SONG_PADDING
if possible_end - possible_start < RECORD_LENGTH:
print "ERROR! Song is too short to sample based on padding and recording seconds preferences."
sys.exit()
start = random.randint(possible_start, possible_end)
end = start + RECORD_LENGTH + 1
# get that segment of samples
channels = []
frames = frames[start:end, :]
wav_string = frames.tostring()
# write to disk
wf = wave.open(OUTPUT_FILE, 'wb')
wf.setnchannels(nchannels)
wf.setsampwidth(p.get_sample_size(FORMAT))
wf.setframerate(RATE)
wf.writeframes(b''.join(wav_string))
wf.close()
# play and test
correctname = os.path.basename(f).replace(".wav", "").replace("_", " ")
inp = raw_input("Press ENTER when playing %s ..." % OUTPUT_FILE)
song = recognizer.listen(seconds=r+1, verbose=False)
print "PREDICTED: %s" % song['song_name']
print "ACTUAL: %s" % correctname
if song['song_name'] == correctname:
correct += 1
count += 1
print "Currently %d correct out of %d in total of %d" % (correct, count, total)
score[r] = (correct, total)
print "UPDATE AFTER %d TRIAL: %s" % (r, score)
return score
def plot_match_time_trials():
# I did this manually
t = np.array([1, 2, 3, 4, 5, 6, 7, 8, 10, 15, 25, 30, 45, 60])
m = np.array([.47, .79, 1.1, 1.5, 1.8, 2.18, 2.62, 2.8, 3.65, 5.29, 8.92, 10.63, 16.09, 22.29])
mplust = t + m
# linear regression
A = np.matrix([t, np.ones(len(t))])
print A
w = np.linalg.lstsq(A.T, mplust)[0]
line = w[0] * t + w[1]
print "Equation for line is %f * record_time + %f = time_to_match" % (w[0], w[1])
# and plot
plt.title("Recording vs Matching time for \"Get Lucky\" by Daft Punk")
plt.xlabel("Time recorded (s)")
plt.ylabel("Time recorded + time to match (s)")
#plt.scatter(t, mplust)
plt.plot(t, line, 'r-', t, mplust, 'o')
plt.show()
def plot_accuracy():
# also did this manually
secs = np.array([1, 2, 3, 4, 5, 6])
correct = np.array([27.0, 43.0, 44.0, 44.0, 45.0, 45.0])
total = 45.0
correct = correct / total
plt.title("Dejavu Recognition Accuracy as a Function of Time")
plt.xlabel("Time recorded (s)")
plt.ylabel("Accuracy")
plt.plot(secs, correct)
plt.ylim([0.0, 1.05])
plt.show()
def plot_hashes_per_song():
squery = """select song_name, count(song_id) as num
from fingerprints
natural join songs
group by song_name
order by count(song_id) asc;"""
sql = SQLDatabase(username="root", password="root", database="dejavu", hostname="localhost")
cursor = sql.connection.cursor()
cursor.execute(squery)
counts = cursor.fetchall()
songs = []
count = []
for item in counts:
songs.append(item['song_name'].replace("_", " ")[4:])
count.append(item['num'])
pos = np.arange(len(songs)) + 0.5
fig = plt.figure()
ax = fig.add_subplot(111)
ax.barh(pos, count, align='center')
ax.set_yticks(pos)
ax.set_yticklabels(tuple(songs))
ax.axvline(0, color='k', lw=3)
ax.set_xlabel('Number of Fingerprints')
ax.set_title('Number of Fingerprints by Song')
ax.grid(True)
plt.show()
#plot_accuracy()
#score = test_recording_lengths(recognizer)
#plot_match_time_trials()
#plot_hashes_per_song()

BIN
plots/accuracy.png Normal file

Binary file not shown. (26 KiB)

Binary file not shown. (491 KiB)

Binary file not shown. (296 KiB)

Binary file not shown. (474 KiB)

BIN
plots/matching_time.png Normal file

Binary file not shown. (40 KiB)