From 143bd4df59cc09cd8a33159b44b22bed4cf683f7 Mon Sep 17 00:00:00 2001
From: MatthewAKelly <matthew.alexander.kelly@gmail.com>
Date: Sun, 2 Mar 2014 14:47:43 -0500
Subject: [PATCH] bad changes

---
 ccm/lib/actr/hdm.py | 627 --------------------------------------------
 ccm/lib/hrr.py      |  95 ++-----
 2 files changed, 17 insertions(+), 705 deletions(-)
 delete mode 100755 ccm/lib/actr/hdm.py

diff --git a/ccm/lib/actr/hdm.py b/ccm/lib/actr/hdm.py
deleted file mode 100755
index f3b11df..0000000
--- a/ccm/lib/actr/hdm.py
+++ /dev/null
@@ -1,627 +0,0 @@
-from __future__ import generators
-import ccm
-import math
-import numpy
-
-##__all__=['Memory','MemorySubModule','DMNoise','DMBaseLevel','DMSalience','DMSpreading','DMFixed',
-##         'Partial','BlendingMemory','DMAssociate']
-__all__=['HDM']
-
-from ccm.lib.actr.buffer import Chunk,Buffer
-# add for hdm
-from ccm.lib.actr.dm import Memory
-from ccm.pattern import Pattern
-from ccm.lib.hrr import HRR
-##class Memory(ccm.Model):
-class HDM(Memory):
-  def __init__(self,buffer,latency=0.05,threshold=0,maximum_time=10.0,finst_size=4,finst_time=3.0):
-    Memory.__init__(self,buffer)
-    self._buffer=buffer
-    self.hdm=[]
-    self.N = 1024
-    self.environment={'?': HRR(N=self.N)}
-    self.placeholder = self.environment['?']
-    self.cLambda = 7
-    self.memory={}
-    self.memStr={}
-    self.slots={}
-    self.error=False
-    self.busy=False
-    self.adaptors=[]
-    self.latency=latency
-    self.threshold=threshold
-    self.maximum_time=maximum_time
-    self.partials=[]
-    self.finst=Finst(self,size=finst_size,time=finst_time)
-    self.record_all_chunks=False
-    self._request_count=0
-    
-  def clear(self):
-    del self.hdm[:]
-    
-  def add(self,chunk,record=None,**keys):
-    # if error flag is true, set to false for production system
-    if self.error: self.error=False
-     
-    # convert chunk to a list of (slot,value) pairs
-    chunkList = self.chunk2list(chunk)
-    # define random Gaussian vectors and random permutations for any undefined values and slots
-    self.defineVectors(chunkList)
-    # get all combinations ranging from pairs of slot-value pairs to sets of self.cLambda size
-    ngrams = self.getOpenNGrams(chunkList,range(1,self.cLambda+1))
-    
-    # update the memory vectors with the information from the chunk
-    for gram in ngrams:
-        for p in xrange(len(gram)):
-            for i in xrange(len(gram)):
-                (slot,value) = gram[i]
-                slotPerm = self.slots[slot]
-                if i == p:
-                    # replace with placeholder
-                    valVec = self.environment['?']
-                    slotvalStr = slot + '(?)'
-                else:
-                    if value.startswith('!'):
-                        valVec = -1 * self.environment[value[1:]]
-                    else:
-                        valVec = self.environment[value]     
-                    slotvalStr = slot + '('+value+')'
-                # permute the value's vector by the slot's permutation & store that
-                slotvalVec = valVec.permute(slotPerm)
-                
-                if i == 0:
-                    chunking = slotvalVec
-                    chunkStr = slotvalStr
-                else:
-                    chunking = chunking * slotvalVec
-                    chunkStr = chunkStr+'*'+slotvalStr   
-            # update memory
-            (slot,value) = gram[p]
-            if value.startswith('!'):
-                self.memory[value] = self.memory[value[1:]] - chunking
-            else: 
-                self.memory[value] = self.memory[value] + chunking
-                
-            try:
-                self.memStr[value] = self.memStr[value] +' + '+ chunkStr
-            except:
-                self.memStr[value] = chunkStr
-    print " HDM: a chunk is added to HDM"
-      
-
-  def request(self,chunk,partial=None,require_new=False):
-     if partial is None and len(self.partials)>0: partial=self.partials[0]
-     self.busy=True
-     if self.error: self.error=False
-     self._request_count+=1
-
-     
-     # convert chunk to a list of (slot,value) pairs
-     chunkList = self.chunk2list(chunk)
-     # define random Gaussian vectors and random permutations for any undefined values and slots
-     self.defineVectors(chunkList)
-     # get all combinations ranging from pairs of slot-value pairs to sets of self.cLambda size
-     ngrams = self.getOpenNGrams(chunkList,range(1,self.cLambda+1))
-
-     # filter out ngrams that don't contain a ?
-     queryGrams = []
-     for gram in ngrams:
-        there_is_one_placeholder  = False
-        for [slot,value] in gram:
-            if value is '?':
-                if there_is_one_placeholder:
-                    there_is_one_placeholder = False
-                    raise Exception('HDM requests must have no more than one ?')
-                else:
-                    there_is_one_placeholder = True
-                
-        if there_is_one_placeholder:
-            queryGrams.append(gram)
-            
-     if not queryGrams:
-        print 'No ? in query'
-        self.fail(self._request_count)
-     else:
-         # construct the query vector as a sum of queryGrams vectors
-         # where each queryGram vector is constructed by binding slotvalue vectors
-         # where each slotvalue vector is a slot permutation of a value vector
-         for j,gram in enumerate(queryGrams):
-            for i, slotvalue in enumerate(gram):
-                [slot,value] = slotvalue
-                slotPerm = self.slots[slot]
-                if value.startswith('!'):
-                    valVec = -1 * self.environment[value[1:]]
-                else:
-                    valVec = self.environment[value]     
-                # permute the value's vector by the slot's permutation
-                slotvalVec = valVec.permute(slotPerm)
-                if i == 0:
-                    # base case
-                    chunkStr = slot+'('+value+')'
-                    chunking = slotvalVec
-                else:
-                    chunkStr = chunkStr+'*'+slot+'('+value+')'
-                    chunking = chunking * slotvalVec
-            if j == 0:
-                queryStr = chunkStr
-                queryVec = chunking
-            else:
-                queryStr = queryStr+' + '+chunkStr
-                queryVec = queryVec + chunking
-         print 'The query is ' + queryStr
-         highestCosine = 0
-         bestMatch = 'none'
-         # find the best match to the query vector in memory
-         for mem,memVec in self.memory.items():
-            thisCosine = memVec.compare(queryVec)
-            print mem, thisCosine
-            if thisCosine > highestCosine:
-                highestCosine = thisCosine 
-                bestMatch = mem
-         print bestMatch
-     
-         if bestMatch == 'none':
-            self.fail(self._request_count)
-         else:
-             print 'Best match is ' + bestMatch + ' = ' + self.memStr[bestMatch]
-             # convert chunkList into a dictionary
-             chunkDict = {}
-             chunkDict.update(chunkList)
-             # replace the placeholder '?' with the retrieved memory 'mem'
-             for slot,value in chunkDict.items():
-                if value is '?':
-                    chunkDict[slot] = bestMatch
-
-             chunkObj = Chunk(chunkDict)
-             chunkObj.activation = highestCosine
-             self.recall(chunkObj,matches=[],request_number=self._request_count)
-
-
-  # chunk2list converts a chunk into a list of (slot,value) pairs
-  # chunk2list checks for unassigned values, i.e., '?stuff'
-  def chunk2list(self,chunk):
-    # if the chunk is a Buffer object, extract the Chunk object from inside it, then turn the Chunk into a string
-    if isinstance(chunk,Buffer):
-        chunk = Chunk(chunk.chunk)
-    # if the chunk is a Chunk object, turn the Chunk into a string
-    if isinstance(chunk,Chunk):
-        chunk = str(chunk)
-    # otherwise, assume it is already a string and modify the string, 
-    # replacing instances of ?stuff with corresponding stuff
-    bound=None
-    if hasattr(self,'sch'):
-        bound=getattr(self.sch,'bound',None)
-    # split the chunkStr where there are spaces to get slot:value pairs
-    slotvaluepairs = chunk.split()
-    # iterate on the slot,value pairs to find ?values that need to be substituted
-    # and undefined values (i.e., values for which there are no defined vectors)
-    # and undefined slots (i.e., slots for which there are no defined permutations)
-    # then add slots and values as pairs (lists of 2) to a list (chunkList)
-    chunkList = []
-    for slotvalue in slotvaluepairs:
-        # split on the colon to get the slot and value
-        slot,value = slotvalue.split(':')
-        if value.startswith('?') and value is not '?':
-            try:
-                # take "?value" without the "?"
-                key = value[1:]
-                # look it up in the "bound dictionary" and substitute
-                value = bound[key]
-            # if "value" in "?value" is undefined, replace with "?"
-            except:
-                value = '?'
-        # update the chunk list with the [slot,value] pair
-        chunkList.append([slot,value])
-            
-    return chunkList
-  
-  # generate Gaussian vectors and random permutations for values & slots without
-  def defineVectors(self,chunkList):
-    for [slot,value] in chunkList:
-        # if it's a new slot, create a new random permutation
-        if slot not in self.slots.keys():
-            self.slots[slot] = numpy.random.permutation(self.N)    
-        # if it starts with ! (i.e., not) just ignore for now
-        if value.startswith('!'):
-            value = value[1:]
-        # if it's a new value, create a new random vector
-        if value not in self.environment.keys():
-            self.environment[value] = HRR(N=self.N)
-            self.memory[value] = HRR(data=numpy.zeros(self.N))#self.environment[value]
-
-
-  def getOpenNGrams(self, seg, scale, spaces=None):
-    '''
-    Returns a list of the open n-grams of the string "seg", with sizes specified
-    by "scale", which should be a list of positive integers in ascending order.
-    "Spaces" indicates whether a space character should be used to mark gaps in
-    non-contiguous n-grams.
-    '''
-    ngrams = []
-    
-    for size in scale:
-        if size > len(seg): break
-    
-        for i in xrange(len(seg)):
-            if i+size > len(seg): break
-            ngrams.append(seg[i:i+size])
-            if i+size == len(seg): continue
-            for b in xrange(1, size):
-                for e in xrange(1, len(seg)-i-size+1):
-                    if spaces is None:
-                        ngrams.append(seg[i:i+b] + seg[i+b+e:i+e+size])
-                    else:
-                        ngrams.append(seg[i:i+b] + [spaces] + seg[i+b+e:i+e+size])
-    return ngrams
-     
-  def fail(self,request_number):
-     if self.threshold is None: 
-         time=self.maximum_time
-     else:
-         time=self.latency*math.exp(-self.threshold)
-         if time>self.maximum_time: time=self.maximum_time 
-     yield time
-     if request_number!=self._request_count: return
-     
-     self.error=True
-     self._buffer.clear()
-     self.busy=False
-  
-  def recall(self,chunk,matches,request_number):
-     self.finst.add(chunk)
-     time=self.latency*math.exp(-chunk.activation)
-     if time>self.maximum_time: time=self.maximum_time
-     yield time
-     if request_number!=self._request_count: return
-     self._buffer.set(chunk)
-     for a in self.adaptors: a.recalled(chunk)
-     self.busy=False
-     
-  
-  def get_activation(self,chunk):
-     if not isinstance(chunk,Chunk):
-         try:
-           chunk=Chunk(chunk,self.sch.bound)
-         except AttributeError:
-           chunk=Chunk(chunk,None)           
-         for c in self.hdm:
-             if chunk==c:
-                 chunk=c
-                 break
-         else:
-             raise Exception('No such chunk found')        
-     act=0
-     for a in self.adaptors:
-        act+=a.activation(chunk)
-     if self.record_all_chunks or chunk.record is True:
-         self.log[str(chunk)]=act 
-     return act   
-                
-  def add_adaptor(self,a):
-     self.adaptors.append(a)
-
-class Finst:
-  def __init__(self,parent,size=4,time=3.0):
-    self.parent=parent
-    self.size=size
-    self.time=time
-    self.obj=[]
-  def contains(self,o):
-    return o in self.obj
-  def add(self,o):
-    if self.size==0: return
-    self.obj.append(o)
-    if len(self.obj)>self.size:
-      self.remove(self.obj[0])
-    self.parent.sch.add(self.remove,args=[o],delay=self.time)
-  def remove(self,o):
-    if o in self.obj: self.obj.remove(o)          
-      
-    
-class MemorySubModule:
-  def __init__(self,parent):
-    self.parent=parent
-    if parent is not None:
-      parent.add_adaptor(self)
-  def create(self,chunk,**keys):
-    pass
-  def merge(self,chunk,**keys):
-    pass
-  def matched(self,chunks):
-    pass  
-  def activation(self,chunk):
-    return 0
-  def recalled(self,chunk):
-    pass
-  def now(self):
-    if self.parent is None or not self.parent._is_converted(): return 0
-    else: return self.parent.now()
-
-class DMNoise(MemorySubModule):
-  def __init__(self,memory,noise=0.3,baseNoise=0.0):
-    MemorySubModule.__init__(self,memory)
-    self.noise=noise
-    self.baseNoise=baseNoise  
-  def create(self,chunk,**keys):
-    chunk.baseNoise=self.logisticNoise(self.baseNoise)
-  def activation(self,chunk):
-    return chunk.baseNoise+self.logisticNoise(self.noise)
-  def logisticNoise(self,s):
-    try:
-      x=self.parent.random.random()
-    except AttributeError:
-      import random
-      x=random.random()
-    return s*math.log(1.0/x-1.0)
-      
-
-
-class DMBaseLevel(MemorySubModule):
-  def __init__(self,memory,decay=0.5,limit=None):
-    MemorySubModule.__init__(self,memory)
-    self.decay=decay
-    self.limit=limit
-  
-  def create(self,chunk,time=0.0,baselevel=None,**keys):
-    chunk.creation=self.now()
-    chunk.times=[chunk.creation-time]
-    chunk.count=1
-    if baselevel is not None and baselevel!='calculate':
-      chunk.baselevel=baselevel
-    
-  def merge(self,chunk,time=0.0,baselevel=None,**keys):
-    chunk.times.append(self.now()-time)
-    chunk.count+=1
-    if self.limit is not None and len(chunk.times)>self.limit:
-      if self.limit==0: del chunk.times[:]
-      else: chunk.times=chunk.times[-self.limit:]
-    if baselevel is not None:
-      if baselevel=='calculate': del chunk.baselevel
-      else: chunk.baselevel=baselevel
-    
-  def activation(self,chunk):
-    if hasattr(chunk,'baselevel'):
-      return chunk.baselevel
-    if self.decay==None: 
-      return 0
-    d=self.decay
-    now=self.now()
-    t=[now-time for time in chunk.times]
-    t=[max(L,0.005) for L in t]
-    
-    exact=0.0
-    approx=0.0
-    if len(t)>0:
-      exact=sum([math.pow(time,-d) for time in t])
-    if self.limit is not None:
-      n=chunk.count
-      k=len(chunk.times)
-      if n>k:
-        tn=now-chunk.creation
-        if k>0:
-          tk=now-chunk.times[0]
-        else:
-          tk=0.0
-        approx=(n-k)/(1-d)*(math.pow(tn,1-d)-math.pow(tk,1-d))/(tn-tk)
-    
-    B=math.log(exact+approx)
-    return B
-
-class DMSpacing(MemorySubModule):
-  def __init__(self,memory,decayScale=0.0,decayIntercept=0.5):
-    MemorySubModule.__init__(self,memory)
-    self.decayScale=decayScale
-    self.decayIntercept=decayIntercept  
-  
-  def create(self,chunk,time=0.0,**keys):
-    chunk.times=[(self.actr.time-time,self.decayIntercept)]
-        
-  def merge(self,chunk,time=0.0,**keys):
-    t=self.now()-time
-    m=self.activation(chunk)
-    d=self.decayScale*math.exp(m)+self.decayIntercept
-    chunk.times.append((t,d))
-    
-  def activation(self,chunk):
-    now=self.now()
-    total=0.0
-    for time,d in chunk.times:
-      total+=math.pow(now-time,-d)
-    B=math.log(total)
-    return B
-
-
-
-class DMSalience(MemorySubModule):
-  def __init__(self,memory):
-    MemorySubModule.__init__(self,memory)
-    self.histogram={}
-    self.weight={}
-    self.memory=memory
-  
-  def weights(self,**weights):
-    self.histogram={}
-    self.weight={}
-    for k,v in weights.items():
-      if k.startswith('_'): k=int(k[1:])
-      self.weight[k]=float(v)
-      self.histogram[k]={}
-    
-  def context(self,pattern):
-    pat=Pattern(pattern)
-    chunks=[x for x in self.memory.hdm if pat.match(x) is not None]
-    for k,hist in self.histogram.items():
-      hist.clear()
-    if len(chunks)==0: raise Exception('No chunks match salience pattern: "%s"'%pattern)
-    dw=1.0/len(chunks)
-    for c in chunks:
-      for k,hist in self.histogram.items():
-        val=c.get(k,None)
-        if val not in hist: hist[val]=dw
-        else: hist[val]+=dw
-        
-  def activation(self,chunk):
-    act=0.0
-    for k,hist in self.histogram.items():
-      val=chunk.get(k,None)
-      p=hist[val]
-      w=self.weight[k]
-      act+=math.log(1.0/p,2)*w
-#    if self.log: self.log.act[`chunk`]=act
-    return act  
-      
-      
-class DMSpreading(MemorySubModule):
-  def __init__(self,memory,*buffers):
-    MemorySubModule.__init__(self,memory)
-    self.strength=1
-    self.buffers=buffers
-    self.weight={}
-    for b in buffers: 
-      self.weight[b]=1
-    self.slots={}
-    
-  def create(self,chunk):
-    for slot in chunk.values():
-      if slot in self.slots:
-        self.slots[slot].append(chunk)
-      else:
-        self.slots[slot]=[chunk]
-  def activation(self,chunk):
-    values=chunk.values()
-  
-    total=0.0
-    for b in self.buffers:
-     ch=b.chunk 
-     if ch is not None:
-      w=self.weight[b]
-      for key,slot in ch.items():
-        if slot in values:
-          s=self.strength-math.log(len(self.slots[slot])+1)
-          total+=w*s
-    return total      
-        
-class DMFixed(MemorySubModule):
-  def __init__(self,memory,default=0):
-    MemorySubModule.__init__(self,memory)
-    self.default=default
-  def create(self,chunk,fixed=None,**keys):
-    if fixed is None: fixed=self.default
-    chunk.fixed=fixed
-  def merge(self,chunk,fixed=0,**keys):
-    chunk.fixed+=fixed
-  def activation(self,chunk):
-    return chunk.fixed
-
-
-class Associated:
-  def __init__(self,a,b):
-    self.a=a
-    self.b=b
-
-class DMAssociate(MemorySubModule):
-  def __init__(self,memory,buffer,weight=1,decay=0.5,limit=None):
-    MemorySubModule.__init__(self,memory)
-    self._buffer=buffer
-    self._mem={}
-    self._bl=DMBaseLevel(None,decay=decay,limit=limit)
-    self.weight=weight
-  def set_association(self,pre,post,baselevel):
-    c=self._mem.get((pre,post),None)
-    if c==None:
-      c=Associated(pre,post)
-      self._bl.create(c)
-      self._mem[(pre,post)]=c
-    c.baselevel=baselevel  
-    
-  def recalled(self,chunk):
-    prechunk=self._buffer.chunk
-    if prechunk is None: return
-    for pk,pv in prechunk.items():
-      for k,v in chunk.items():
-        c=self._mem.get((pv,v),None)
-        if c==None:
-          c=Associated(pv,v)
-          self._bl.create(c)
-          self._mem[(pv,v)]=c
-        else:
-          self._bl.merge(c)
-  def activation(self,chunk):
-    act=0
-    prechunk=self._buffer.chunk
-    if prechunk is None: return 0
-    for pk,pv in prechunk.items():
-      for k,v in chunk.items():
-        c=self._mem.get((pv,v),None)
-        if c is not None:         
-          act+=self._bl.activation(c)
-    return act*self.weight
-        
-        
-        
-        
-    
-          
-    
-class Partial:
-  def __init__(self,memory,strength=1.0,limit=-1.0):
-    self._memory=memory
-    self.limit=limit
-    self.strength=strength
-    self.sims={}
-    memory.partials.append(self)
-    
-  def similarity(self,a,b,value):
-    self.sims[a,b]=value
-    self.sims[b,a]=value
-  
-  def request(self,pattern):
-    self._memory.request(pattern,partial=self)
-    
-  def match(self,key,a,b):
-    m=self.sims.get((a,b),self.limit)
-    p=self.strength
-    return p*m
-    
-      
-class BlendingMemory(Memory):
-  def recall(self,chunk,matches,request_number):
-    keys=list(sorted(chunk.keys()))
-    if not hasattr(chunk,'_blend_keys'):
-      bk=[]
-      for k in keys:
-        try:
-          v=float(chunk[k])
-          bk.append(k)
-        except:
-          pass
-      chunk._blend_keys=tuple(bk)
-    bk=chunk._blend_keys
-    if len(bk)>0:
-      a=chunk.activation
-      chunk=Chunk(chunk)
-      chunk.activation=a
-      
-      for b in bk: chunk[b]=0
-      total_activation=0
-      for m in matches:
-        m.exp_activation=math.exp(m.activation)
-        k=list(sorted(m.keys()))
-        if k==keys:
-          blend={}
-          try:            
-            for b in bk:
-              blend[b]=float(m[b])
-          except ValueError:
-            continue
-          for b in bk:
-            chunk[b]+=blend[b]*m.exp_activation
-          total_activation+=m.exp_activation
-      for b in bk:
-        chunk[b]/=total_activation
-    for m in Memory.recall(self,chunk,matches,request_number):
-      yield m
-      
-    
-  
-  
diff --git a/ccm/lib/hrr.py b/ccm/lib/hrr.py
index cf5a2ac..10fd71d 100644
--- a/ccm/lib/hrr.py
+++ b/ccm/lib/hrr.py
@@ -12,9 +12,7 @@ def __init__(self,N=None,data=None):
         elif N is not None:
             self.randomize(N)
         else:
-            raise Exception('Must specify size or data for HRR')
-    def length(self):
-        return norm(self.v)        
+            raise Exception('Must specify size or data for HRR')
     def normalize(self):
         nrm=norm(self.v)
         if nrm>0: self.v/=nrm
@@ -29,9 +27,7 @@ def __add__(self,other):
         return HRR(data=self.v+other.v)
     def __iadd__(self,other):
         self.v+=other.v
-        return self
-    def __neg__(self):
-        return HRR(data=-self.v)    
+        return self
     def __sub__(self,other):
         return HRR(data=self.v-other.v)
     def __isub__(self,other):
@@ -44,6 +40,17 @@ def __mul__(self,other):
             return HRR(data=x)
         else:
             return HRR(data=self.v*other)
+            
+    def permute(self,permutation):
+        """Return a new HRR with element i of self.v moved to permutation[i].
+
+        permutation: integer index sequence of len(self.v); self.v is 1-D.
+        """
+        permutedVector = numpy.zeros(len(self.v))
+        # one indexed assignment replaces the per-element Python loop
+        permutedVector[permutation] = self.v
+        return HRR(data=permutedVector)
+        
     def convolve(self,other):
         x=ifft(fft(self.v)*fft(other.v)).real
         return HRR(data=x)
@@ -61,8 +68,6 @@ def compare(self,other):
         scale=norm(self.v)*norm(other.v)
         if scale==0: return 0
         return numpy.dot(self.v,other.v)/(scale)
-    def dot(self,other):
-        return numpy.dot(self.v,other.v)
     def distance(self,other):
         return 1-self.compare(other)
     def __invert__(self):
@@ -142,75 +147,9 @@ def all(self,input):
         
 
         
-                       
-                       
-from math import sin,pi,acos
-class Vocabulary:
-    def __init__(self,dimensions,randomize=True):
-        self.dimensions=dimensions
-        self.randomize=randomize
-        self.hrr={}
-        ident=[0]*dimensions
-        ident[0]=1.0
-        self.hrr['I']=HRR(data=ident)
-    def __getitem__(self,key):
-        if key not in self.hrr:
-            if self.randomize:    
-                self.hrr[key]=HRR(self.dimensions)
-            else:
-                v=[0]*self.dimensions
-                v[len(self.hrr)]=1.0
-                self.hrr[key]=HRR(data=v)    
-        return self.hrr[key]        
-    def parse(self,text):
-        return eval(text,{},self)
-        
-    def text(self,v):
-        matches=[]
-        
-        names=self.hrr.keys()
-        names.sort()
-        names.remove('I')
-
-        for i in range(len(names)):        
-            k=names[i]
-            val=self.hrr[k]
-            c=val.compare(v)
-            if c>0: matches.append((c,k))
-            for j in range(i+1,len(names)):
-                k2=names[j]
-                val2=self.hrr[k2]
-                c=(val*val2).compare(v)                
-                if c>0: matches.append((c,'%s*%s'%(k,k2)))
-        matches.sort()
-        matches.reverse()
-        r=[]
-        for m in matches:
-            if m[0]>0.3: r.append(m)
-            elif len(r)<2: r.append(m)
-            else: break
-        return '+'.join(['%s(%0.2f)'%(k,c) for (c,k) in r])
-         
-         
-        
-    def prob_cleanup(self,compare,vocab_size,steps=10000):
-        # see http://yamlb.wordpress.com/2008/05/20/why-2-random-vectors-are-orthogonal-in-high-dimention/ 
-        #  for argument that the probability af two random vectors being a given angle apart is
-        #  proportional to sin(angle)^(D-2)
-        def prob_func(angle): 
-            return sin(angle)**(self.dimensions-2)
-        angle=acos(compare)
-        num=0
-        dnum=angle/steps
-        denom=0
-        ddenom=pi/steps
-        for i in range(steps):
-            num+=prob_func(pi-angle+dnum*i)
-            denom+=prob_func(ddenom*i)
-        num*=dnum
-        denom*=ddenom    
-        perror1=num/denom    
-        pcorrect=(1-perror1)**vocab_size
-        return pcorrect
+                        
+    
+                                    
+