Added __eq__ to relation object

git-svn-id: http://galileo.dmi.unict.it/svn/relational/trunk@66 014f5005-505e-4b48-8d0a-63407b615a7c
2008-11-30 12:28:16 +00:00 · 2008-11-30 12:28:16 +00:00 · 51745e8218
commit 51745e8218
parent dda1dba1a4
2 changed files with 417 additions and 393 deletions
--- a/3
+++ b/3
@ -45,3 +45,6 @@
 - Outer join methods simplified
 - Form to send a survey
 - Makefile to create .deb package
 0.8
 - Added __eq__ to relation object, will compare ignoring order.
--- a/relation.py
+++ b/relation.py
@ -19,398 +19,419 @@
 from rtypes import *
 class relation (object):
-	'''This objects defines a relation (as a group of consistent tuples) and operations
+    '''This object defines a relation (as a group of consistent tuples) and operations
-	A relation can be represented using a table
+    A relation can be represented using a table
-	Calling an operation and providing a non relation parameter when it is expected will
+    Calling an operation and providing a non relation parameter when it is expected will
-	result in a None value'''	
+    result in a None value'''    
-	def __init__(self,filename=""):
+    def __init__(self,filename=""):
-		'''Creates a relation, accepts a filename and then it will load the relation from
+        '''Creates a relation, accepts a filename and then it will load the relation from
-		that file. If no parameter is supplied an empty relation is created. Empty
+        that file. If no parameter is supplied an empty relation is created. Empty
-		relations are used in internal operations'''
+        relations are used in internal operations'''
-		if len(filename)==0:#Empty relation
+        if len(filename)==0:#Empty relation
-			self.content=[]
+            self.content=[]
-			self.header=header([])
+            self.header=header([])
-			return
+            return
-		fp=file(filename)
+        fp=file(filename)
-		self.header=header(fp.readline().replace("\n","").strip().split(" "))
+        self.header=header(fp.readline().replace("\n","").strip().split(" "))
-		self.content=[]
+        self.content=[]
-		row=fp.readline()
+        row=fp.readline()
-		while len(row)!=0:#Reads the content of the relation
+        while len(row)!=0:#Reads the content of the relation
-			self.content.append(row.replace("\n","").strip().split(" "))
+            self.content.append(row.replace("\n","").strip().split(" "))
-			row=fp.readline()
+            row=fp.readline()
-		fp.close()
+        fp.close()
-	def save(self,filename):
+    def save(self,filename):
-		'''Saves the relation in a file'''
+        '''Saves the relation in a file'''
-		res=""
+        res=""
-		res+=" ".join(self.header.attributes)
+        res+=" ".join(self.header.attributes)
-		for r in self.content:
+        for r in self.content:
-			res+="\n"
+            res+="\n"
-			res+=" ".join(r)
+            res+=" ".join(r)
-		fp=file(filename,'w')
+        fp=file(filename,'w')
-		fp.write(res)
+        fp.write(res)
-		fp.close()
+        fp.close()
-	def rearrange(self,other):
+    def rearrange(self,other):
-		'''If two relations share the same attributes in a different order, this method
+        '''If two relations share the same attributes in a different order, this method
-		will use projection to make them have the same attributes' order.
+        will use projection to make them have the same attributes' order.
-		It is not exactely related to relational algebra. Just a method used 
+        It is not exactly related to relational algebra. Just a method used 
-		internally.
+        internally.
-		Will return None if they don't share the same attributes'''
+        Will return None if they don't share the same attributes'''
-		if (self.__class__!=other.__class__):
+        if (self.__class__!=other.__class__):
-			return None
+            return None
-		if self.header.sharedAttributes(other.header) == len(self.header.attributes) == len(other.header.attributes):
+        if self.header.sharedAttributes(other.header) == len(self.header.attributes) == len(other.header.attributes):
-			return other.projection(list(self.header.attributes))
+            return other.projection(list(self.header.attributes))
-		return None
+        return None
-	def selection(self,expr):
+    def selection(self,expr):
-		'''Selection, expr must be a valid boolean expression, can contain field names,
+        '''Selection, expr must be a valid boolean expression, can contain field names,
-		constant, math operations and boolean ones.'''
+        constant, math operations and boolean ones.'''
-		attributes={}
+        attributes={}
-		newt=relation()
+        newt=relation()
-		newt.header=header(list(self.header.attributes))
+        newt.header=header(list(self.header.attributes))
-		for i in self.content:
+        for i in self.content:
-			for j in range(len(self.header.attributes)):
+            for j in range(len(self.header.attributes)):
-				if i[j].isdigit():
+                if i[j].isdigit():
-					attributes[self.header.attributes[j]]=int(i[j])
+                    attributes[self.header.attributes[j]]=int(i[j])
-				elif rstring(i[j]).isFloat():
+                elif rstring(i[j]).isFloat():
-					attributes[self.header.attributes[j]]=float(i[j])
+                    attributes[self.header.attributes[j]]=float(i[j])
-				elif isDate(i[j]):
+                elif isDate(i[j]):
-					attributes[self.header.attributes[j]]=rdate(i[j])
+                    attributes[self.header.attributes[j]]=rdate(i[j])
-				else:
+                else:
-					attributes[self.header.attributes[j]]=i[j]
+                    attributes[self.header.attributes[j]]=i[j]
-			if eval(expr,attributes):
+            if eval(expr,attributes):
-				newt.content.append(i)
+                newt.content.append(i)
-		return newt
+        return newt
-	def product (self,other):
+    def product (self,other):
-		'''Cartesian product, attributes must be different to avoid collisions
+        '''Cartesian product, attributes must be different to avoid collisions
-		Doing this operation on relations with colliding attributes will 
+        Doing this operation on relations with colliding attributes will 
-		cause the return of a None value.
+        cause the return of a None value.
-		It is possible to use rename on attributes and then use the product'''
+        It is possible to use rename on attributes and then use the product'''
-		if (self.__class__!=other.__class__)or(self.header.sharedAttributes(other.header)!=0):
+        if (self.__class__!=other.__class__)or(self.header.sharedAttributes(other.header)!=0):
-			return None
+            return None
-		newt=relation()
+        newt=relation()
-		newt.header=header(self.header.attributes+other.header.attributes)
+        newt.header=header(self.header.attributes+other.header.attributes)
-		for i in self.content:
+        for i in self.content:
-			for j in other.content:
+            for j in other.content:
-				newt.content.append(i+j)
+                newt.content.append(i+j)
-		return newt
+        return newt
-	def projection(self,* attributes):
+    def projection(self,* attributes):
-		'''Projection operator, takes many parameters, for each field to use.
+        '''Projection operator, takes many parameters, for each field to use.
-		Can also use a single parameter with a list.
+        Can also use a single parameter with a list.
-		Will delete duplicate items
+        Will delete duplicate items
-		If an empty list or no parameters are provided, returns None'''	
+        If an empty list or no parameters are provided, returns None'''    
-		#Parameters are supplied in a list, instead with multiple parameters
+        #Parameters are supplied in a list, instead with multiple parameters
-		if attributes[0].__class__ == list().__class__:
+        if attributes[0].__class__ == list().__class__:
-			attributes=attributes[0]
+            attributes=attributes[0]
-		#Avoiding duplicated attributes
+        #Avoiding duplicated attributes
-		attributes1=[]
+        attributes1=[]
-		for i in attributes:
+        for i in attributes:
-			if i not in attributes1:
+            if i not in attributes1:
-				attributes1.append(i)
+                attributes1.append(i)
-		attributes=attributes1
+        attributes=attributes1
-		ids=self.header.getAttributesId(attributes)
+        ids=self.header.getAttributesId(attributes)
-		if len(ids)==0:
+        if len(ids)==0:
-			return None
+            return None
-		newt=relation()
+        newt=relation()
-		#Create the header
+        #Create the header
-		h=[]
+        h=[]
-		for i in ids:
+        for i in ids:
-			h.append(self.header.attributes[i])
+            h.append(self.header.attributes[i])
-		newt.header=header(h)
+        newt.header=header(h)
-		#Create the body
+        #Create the body
-		for i in self.content:
+        for i in self.content:
-			row=[]
+            row=[]
-			for j in ids:
+            for j in ids:
-				row.append(i[j])
+                row.append(i[j])
-			if row not in newt.content:#Avoids duplicated items
+            if row not in newt.content:#Avoids duplicated items
-				newt.content.append(row)
+                newt.content.append(row)
-		return newt
+        return newt
-	def rename(self,params):
+    def rename(self,params):
-		'''Operation rename. Takes a dictionary
+        '''Operation rename. Takes a dictionary
-		Will replace the itmem with its content.
+        Will replace the item with its content.
-		For example if you want to rename a to b, provide {"a":"b"}
+        For example if you want to rename a to b, provide {"a":"b"}
-		If an "old" field doesn't exist, None will be returned'''
+        If an "old" field doesn't exist, None will be returned'''
-		result=[]
+        result=[]
-		newt=relation()
+        newt=relation()
-		newt.header=header(list(self.header.attributes))
+        newt.header=header(list(self.header.attributes))
-		for old,new in params.iteritems():
+        for old,new in params.iteritems():
-			if (newt.header.rename(old,new)) == False:
+            if (newt.header.rename(old,new)) == False:
-				return None
+                return None
-		newt.content=list(self.content)
+        newt.content=list(self.content)
-		return newt
+        return newt
-	def intersection(self,other):
+    def intersection(self,other):
-		'''Intersection operation. The result will contain items present in both
+        '''Intersection operation. The result will contain items present in both
-		operands.
+        operands.
-		Will return an empty one if there are no common items.
+        Will return an empty one if there are no common items.
-		Will return None if headers are different.
+        Will return None if headers are different.
-		It is possible to use projection and rename to make headers match.'''
+        It is possible to use projection and rename to make headers match.'''
-		other=self.rearrange(other) #Rearranges attributes' order
+        other=self.rearrange(other) #Rearranges attributes' order
-		if (self.__class__!=other.__class__)or(self.header!=other.header):
+        if (self.__class__!=other.__class__)or(self.header!=other.header):
-			return None
+            return None
-		newt=relation()
+        newt=relation()
-		newt.header=header(list(self.header.attributes))
+        newt.header=header(list(self.header.attributes))
-		#Adds only element not in other, duplicating them
+        #Adds only elements also present in other, duplicating them
-		for e in self.content:
+        for e in self.content:
-			if e in other.content:
+            if e in other.content:
-				newt.content.append(list(e))
+                newt.content.append(list(e))
-		return newt
+        return newt
-	def difference(self,other):
+    def difference(self,other):
-		'''Difference operation. The result will contain items present in first
+        '''Difference operation. The result will contain items present in first
-		operand but not in second one.
+        operand but not in second one.
-		Will return an empty one if the second is a superset of first.
+        Will return an empty one if the second is a superset of first.
-		Will return None if headers are different.
+        Will return None if headers are different.
-		It is possible to use projection and rename to make headers match.'''
+        It is possible to use projection and rename to make headers match.'''
-		other=self.rearrange(other) #Rearranges attributes' order
+        other=self.rearrange(other) #Rearranges attributes' order
-		if (self.__class__!=other.__class__)or(self.header!=other.header):
+        if (self.__class__!=other.__class__)or(self.header!=other.header):
-			return None
+            return None
-		newt=relation()
+        newt=relation()
-		newt.header=header(list(self.header.attributes))
+        newt.header=header(list(self.header.attributes))
-		#Adds only element not in other, duplicating them
+        #Adds only element not in other, duplicating them
-		for e in self.content:
+        for e in self.content:
-			if e not in other.content:
+            if e not in other.content:
-				newt.content.append(list(e))
+                newt.content.append(list(e))
-		return newt
+        return newt
-	def union(self,other):
+    def union(self,other):
-		'''Union operation. The result will contain items present in first
+        '''Union operation. The result will contain items present in first
-		and second operands.
+        and second operands.
-		Will return an empty one if both are empty.
+        Will return an empty one if both are empty.
-		Will not insert tuplicated items.
+        Will not insert duplicated items.
-		Will return None if headers are different.
+        Will return None if headers are different.
-		It is possible to use projection and rename to make headers match.'''
+        It is possible to use projection and rename to make headers match.'''
-		other=self.rearrange(other) #Rearranges attributes' order
+        other=self.rearrange(other) #Rearranges attributes' order
-		if (self.__class__!=other.__class__)or(self.header!=other.header):
+        if (self.__class__!=other.__class__)or(self.header!=other.header):
-			return None
+            return None
-		newt=relation()
+        newt=relation()
-		newt.header=header(list(self.header.attributes))
+        newt.header=header(list(self.header.attributes))
-		#Adds element from self, duplicating them all
+        #Adds element from self, duplicating them all
-		for e in self.content:
+        for e in self.content:
-			newt.content.append(list(e))
+            newt.content.append(list(e))
-		for e in other.content:
+        for e in other.content:
-			if e not in newt.content:
+            if e not in newt.content:
-				newt.content.append(list(e))
+                newt.content.append(list(e))
-		return newt
+        return newt
-	def thetajoin(self,other,expr):
+    def thetajoin(self,other,expr):
-		'''Defined as product and then selection with the given expression.'''
+        '''Defined as product and then selection with the given expression.'''
-		return self.product(other).selection(expr)
+        return self.product(other).selection(expr)
-	def outer(self,other):
+    def outer(self,other):
-		'''Does a left and a right outer join and returns their union.'''
+        '''Does a left and a right outer join and returns their union.'''
-		a=self.outer_right(other)
+        a=self.outer_right(other)
-		b=self.outer_left(other)
+        b=self.outer_left(other)
-		print a
+        print a
-		print b
+        print b
-		return a.union(b)
+        return a.union(b)
-	def outer_right(self,other):
+    def outer_right(self,other):
-		'''Outer right join. Considers self as left and param as right. If the
+        '''Outer right join. Considers self as left and param as right. If the
-		tuple has no corrispondence, empy attributes are filled with a "---"
+        tuple has no correspondence, empty attributes are filled with a "---"
-		string. This is due to the fact that empty string or a space would cause
+        string. This is due to the fact that empty string or a space would cause
-		problems when saving the relation.
+        problems when saving the relation.
-		Just like natural join, it works considering shared attributes.'''
+        Just like natural join, it works considering shared attributes.'''
-		return other.outer_left(self)
+        return other.outer_left(self)
-	def outer_left(self,other,swap=False):
+    def outer_left(self,other,swap=False):
-		'''Outer left join. Considers self as left and param as right. If the 
+        '''Outer left join. Considers self as left and param as right. If the 
-		tuple has no corrispondence, empty attributes are filled with a "---" 
+        tuple has no correspondence, empty attributes are filled with a "---" 
-		string. This is due to the fact that empty string or a space would cause
+        string. This is due to the fact that empty string or a space would cause
-		problems when saving the relation.
+        problems when saving the relation.
-		Just like natural join, it works considering shared attributes.'''
+        Just like natural join, it works considering shared attributes.'''
-		shared=[]
+        shared=[]
-		for i in self.header.attributes:
+        for i in self.header.attributes:
-			if i in other.header.attributes:
+            if i in other.header.attributes:
-				shared.append(i)
+                shared.append(i)
-		newt=relation() #Creates the new relation
+        newt=relation() #Creates the new relation
-		#Adds all the attributes of the 1st relation
+        #Adds all the attributes of the 1st relation
-		newt.header=header(list(self.header.attributes))
+        newt.header=header(list(self.header.attributes))
-		#Adds all the attributes of the 2nd, when non shared
+        #Adds all the attributes of the 2nd, when non shared
-		for i in other.header.attributes:
+        for i in other.header.attributes:
-			if i not in shared:
+            if i not in shared:
-				newt.header.attributes.append(i)
+                newt.header.attributes.append(i)
-		#Shared ids of self
+        #Shared ids of self
-		sid=self.header.getAttributesId(shared)
+        sid=self.header.getAttributesId(shared)
-		#Shared ids of the other relation
+        #Shared ids of the other relation
-		oid=other.header.getAttributesId(shared)
+        oid=other.header.getAttributesId(shared)
-		#Non shared ids of the other relation
+        #Non shared ids of the other relation
-		noid=[]
+        noid=[]
-		for i in range(len(other.header.attributes)):
+        for i in range(len(other.header.attributes)):
-			if i not in oid:
+            if i not in oid:
-				noid.append(i)
+                noid.append(i)
-		for i in self.content:
+        for i in self.content:
-			#Tuple partecipated to the join?
+            #Did the tuple participate in the join?
-			added=False
+            added=False
-			for j in other.content:
+            for j in other.content:
-				match=True
+                match=True
-				for k in range(len(sid)):
+                for k in range(len(sid)):
-					match=match and ( i[sid[k]]== j[oid[k]])
+                    match=match and ( i[sid[k]]== j[oid[k]])
-				if match:
+                if match:
-					item=list(i)
+                    item=list(i)
-					for l in noid:
+                    for l in noid:
-						item.append(j[l])
+                        item.append(j[l])
-					newt.content.append(item)
+                    newt.content.append(item)
-					added=True
+                    added=True
-			#If it didn't partecipate, adds it
+            #If it didn't participate, adds it
-			if not added:
+            if not added:
-				item=list(i)
+                item=list(i)
-				for l in range(len(noid)):
+                for l in range(len(noid)):
-					item.append("---")
+                    item.append("---")
-				newt.content.append(item)
+                newt.content.append(item)
-		return newt
+        return newt
-	def join(self,other):
+    def join(self,other):
-		'''Natural join, joins on shared attributes (one or more). If there are no
+        '''Natural join, joins on shared attributes (one or more). If there are no
-		shared attributes, it will behave as cartesian product.'''
+        shared attributes, it will behave as cartesian product.'''
-		shared=[]
+        shared=[]
-		for i in self.header.attributes:
+        for i in self.header.attributes:
-			if i in other.header.attributes:
+            if i in other.header.attributes:
-				shared.append(i)
+                shared.append(i)
-		newt=relation() #Creates the new relation
+        newt=relation() #Creates the new relation
-		#Adds all the attributes of the 1st relation
+        #Adds all the attributes of the 1st relation
-		newt.header=header(list(self.header.attributes))
+        newt.header=header(list(self.header.attributes))
-		#Adds all the attributes of the 2nd, when non shared
+        #Adds all the attributes of the 2nd, when non shared
-		for i in other.header.attributes:
+        for i in other.header.attributes:
-			if i not in shared:
+            if i not in shared:
-				newt.header.attributes.append(i)
+                newt.header.attributes.append(i)
-		#Shared ids of self
+        #Shared ids of self
-		sid=self.header.getAttributesId(shared)
+        sid=self.header.getAttributesId(shared)
-		#Shared ids of the other relation
+        #Shared ids of the other relation
-		oid=other.header.getAttributesId(shared)
+        oid=other.header.getAttributesId(shared)
-		#Non shared ids of the other relation
+        #Non shared ids of the other relation
-		noid=[]
+        noid=[]
-		for i in range(len(other.header.attributes)):
+        for i in range(len(other.header.attributes)):
-			if i not in oid:
+            if i not in oid:
-				noid.append(i)
+                noid.append(i)
-		for i in self.content:
+        for i in self.content:
-			for j in other.content:
+            for j in other.content:
-				match=True
+                match=True
-				for k in range(len(sid)):
+                for k in range(len(sid)):
-					match=match and ( i[sid[k]]== j[oid[k]])
+                    match=match and ( i[sid[k]]== j[oid[k]])
-				if match:
+                if match:
-					item=list(i)
+                    item=list(i)
-					for l in noid:
+                    for l in noid:
-						item.append(j[l])
+                        item.append(j[l])
-					newt.content.append(item)
+                    newt.content.append(item)
-		return newt
+        return newt
    def __eq__(self,other):
        '''Returns true if the relations are the same, ignoring order of items.
        This operation is rather heavy, since every tuple is searched for in the other relation.'''
        other=self.rearrange(other) #Rearranges attributes' order so can compare tuples directly
        if (self.__class__!=other.__class__)or(self.header!=other.header):
            return False #Both parameters must be a relation
-	def __str__(self):
+        #Comparing header
-		'''Returns a string representation of the relation, can be printed with 
+        if len(self.header.attributes) != len(other.header.attributes):
-		monospaced fonts'''
+            return False #Not the same number of attributes -> not equals
-		m_len=[] #Maximum lenght string
+        for i in self.header.attributes:
-		for f in self.header.attributes:
+            if i not in other.header.attributes:
-			m_len.append(len(f))
+                return False #Non shared attribute
-		for f in self.content:
+        #comparing content
-			col=0
+        if len(self.content) != len(other.content):
-			for i in f:
+            return False #Not the same number of tuples
-				if len(i)>m_len[col]:
+        for i in self.content:
-					m_len[col]=len(i)
+            if i not in other.content:
-				col+=1
+                return False
        return True
    def __str__(self):
        '''Returns a string representation of the relation, can be printed with 
        monospaced fonts'''
        m_len=[] #Maximum string length of each column
        for f in self.header.attributes:
            m_len.append(len(f))
        for f in self.content:
            col=0
            for i in f:
                if len(i)>m_len[col]:
                    m_len[col]=len(i)
                col+=1
-		res=""
+        res=""
-		for f in range(len(self.header.attributes)):
+        for f in range(len(self.header.attributes)):
-			res+="%s"%(self.header.attributes[f].ljust(2+m_len[f]))
+            res+="%s"%(self.header.attributes[f].ljust(2+m_len[f]))
-		for r in self.content:
+        for r in self.content:
-			col=0
+            col=0
-			res+="\n"
+            res+="\n"
-			for i in r:
+            for i in r:
-				res+="%s"% (i.ljust(2+m_len[col]))
+                res+="%s"% (i.ljust(2+m_len[col]))
-				col+=1
+                col+=1
-		return res
+        return res
 class header (object):
-	'''This class defines the header of a relation.
+    '''This class defines the header of a relation.
-	It is used within relations to know if requested operations are accepted'''
+    It is used within relations to know if requested operations are accepted'''
-	def __init__(self,attributes):
+    def __init__(self,attributes):
-		'''Accepts a list with attributes' names. Names MUST be unique'''
+        '''Accepts a list with attributes' names. Names MUST be unique'''
-		self.attributes=attributes
+        self.attributes=attributes
-	def __repr__(self):
+    def __repr__(self):
-		return "header(%s)" % (self.attributes.__repr__())
+        return "header(%s)" % (self.attributes.__repr__())
-	def rename(self,old,new):
+    def rename(self,old,new):
-		'''Renames a field. Doesn't check if it is a duplicate.
+        '''Renames a field. Doesn't check if it is a duplicate.
-		Returns True if the field was renamed, False otherwise'''
+        Returns True if the field was renamed, False otherwise'''
-		for i in range(len(self.attributes)):
+        for i in range(len(self.attributes)):
-			if self.attributes[i]==old:
+            if self.attributes[i]==old:
-				self.attributes[i]=new
+                self.attributes[i]=new
-				return True
+                return True
-		return False #Requested field was not found	
+        return False #Requested field was not found    
-	def sharedAttributes(self,other):
+    def sharedAttributes(self,other):
-		'''Returns how many attributes this header has in common with a given one'''
+        '''Returns how many attributes this header has in common with a given one'''
-		res=0
+        res=0
-		for i in self.attributes:
+        for i in self.attributes:
-			if i in other.attributes:
+            if i in other.attributes:
-				res+=1
+                res+=1
-		return res
+        return res
-	def __str__(self):
+    def __str__(self):
-		'''Returns String representation of the field's list'''
+        '''Returns String representation of the field's list'''
-		return self.attributes.__str__()
+        return self.attributes.__str__()
-	def __eq__(self,other):
+    def __eq__(self,other):
-		return self.attributes==other.attributes
+        return self.attributes==other.attributes
-	def __ne__(self,other):
+    def __ne__(self,other):
-		return self.attributes!=other.attributes
+        return self.attributes!=other.attributes
-	def getAttributesId(self,param):
+    def getAttributesId(self,param):
-		'''Returns a list with numeric index corresponding to field's name'''	
+        '''Returns a list with numeric index corresponding to field's name'''    
-		res=[]
+        res=[]
-		for i in param:
+        for i in param:
-			for j in range(len(self.attributes)):
+            for j in range(len(self.attributes)):
-				if i==self.attributes[j]:
+                if i==self.attributes[j]:
-					res.append(j)
+                    res.append(j)
-		return res
+        return res
 if __name__=="__main__":