Improved docstring

This commit is contained in:
Salvo 'LtWorf' Tomaselli 2015-07-14 15:08:39 +02:00
parent c275c1caf3
commit af02b5a59b

View File

@ -28,19 +28,31 @@ from relational.rtypes import *
class relation (object): class relation (object):
'''This objects defines a relation (as a group of consistent tuples) and operations '''
A relation can be represented using a table This object defines a relation (as a group of consistent tuples) and operations.
Calling an operation and providing a non relation parameter when it is expected will
result in a None value''' A relation is a particular kind of set, which has a number of named attributes and
a number of tuples, which must express a value for every attribute.
Set operations like union, intersection and difference are restricted and can only be
performed on relations which share the same set of named attributes.
The constructor optionally accepts a filename and then it will load the relation from
that file.
If no parameter is supplied an empty relation is created.
Files need to be comma separated as described in RFC4180.
The first line need to contain the attributes of the relation while the
following lines contain the tuples of the relation.
An empty relation needs a header, and can be filled using the insert()
method.
'''
__hash__ = None __hash__ = None
def __init__(self, filename=""): def __init__(self, filename=""):
'''Creates a relation, accepts a filename and then it will load the relation from
that file. If no parameter is supplied an empty relation is created. Empty
relations are used in internal operations.
By default the file will be handled like a comma separated as described in
RFC4180.'''
self._readonly = False self._readonly = False
if len(filename) == 0: # Empty relation if len(filename) == 0: # Empty relation
@ -71,9 +83,9 @@ class relation (object):
return key in self.content return key in self.content
def save(self, filename): def save(self, filename):
'''Saves the relation in a file. By default will save using the csv '''
format as defined in RFC4180, but setting comma_separated to False, Saves the relation in a file. Will save using the csv
it will use the old format with space separated values. format as defined in RFC4180.
''' '''
fp = open(filename, 'w') # Opening file in write mode fp = open(filename, 'w') # Opening file in write mode
@ -105,8 +117,9 @@ class relation (object):
)) ))
def selection(self, expr): def selection(self, expr):
'''Selection, expr must be a valid boolean expression, can contain field names, '''
constant, math operations and boolean ones.''' Selection, expr must be a valid Python expression; can contain field names.
'''
newt = relation() newt = relation()
newt.header = header(self.header) newt.header = header(self.header)
for i in self.content: for i in self.content:
@ -124,10 +137,9 @@ class relation (object):
return newt return newt
def product(self, other): def product(self, other):
'''Cartesian product, attributes must be different to avoid collisions '''
Doing this operation on relations with colliding attributes will Cartesian product. Attributes of the relations must differ.
cause an exception. '''
It is possible to use rename on attributes and then use the product'''
if (not isinstance(other, relation)): if (not isinstance(other, relation)):
raise Exception('Operand must be a relation') raise Exception('Operand must be a relation')
@ -144,10 +156,17 @@ class relation (object):
return newt return newt
def projection(self, * attributes): def projection(self, * attributes):
'''Projection operator, takes many parameters, for each field to use. '''
Can also use a single parameter with a list. Can be called in two different ways:
Will delete duplicate items a.projection('field1','field2')
If an empty list or no parameters are provided, returns None'''
or
a.projection(['field1','field2'])
The cardinality of the result, might be less than the cardinality
of the original object.
'''
# Parameters are supplied in a list, instead with multiple parameters # Parameters are supplied in a list, instead with multiple parameters
if not isinstance(attributes[0], str): if not isinstance(attributes[0], str):
attributes = attributes[0] attributes = attributes[0]
@ -168,9 +187,13 @@ class relation (object):
return newt return newt
def rename(self, params): def rename(self, params):
'''Operation rename. Takes a dictionary '''
Will replace the itmem with its content. Takes a dictionary.
For example if you want to rename a to b, provide {"a":"b"}
Will replace the field name as the key with its value.
For example if you want to rename a to b, call
rel.rename({'a':'b'})
''' '''
result = [] result = []
@ -183,11 +206,11 @@ class relation (object):
return newt return newt
def intersection(self, other): def intersection(self, other):
'''Intersection operation. The result will contain items present in both '''
Intersection operation. The result will contain items present in both
operands. operands.
Will return an empty one if there are no common items. Will return an empty one if there are no common items.
Will return None if headers are different. '''
It is possible to use projection and rename to make headers match.'''
other = self._rearrange(other) # Rearranges attributes' order other = self._rearrange(other) # Rearranges attributes' order
newt = relation() newt = relation()
newt.header = header(self.header) newt.header = header(self.header)
@ -198,9 +221,7 @@ class relation (object):
def difference(self, other): def difference(self, other):
'''Difference operation. The result will contain items present in first '''Difference operation. The result will contain items present in first
operand but not in second one. operand but not in second one.
Will return an empty one if the second is a superset of first. '''
Will return None if headers are different.
It is possible to use projection and rename to make headers match.'''
other = self._rearrange(other) # Rearranges attributes' order other = self._rearrange(other) # Rearranges attributes' order
newt = relation() newt = relation()
newt.header = header(self.header) newt.header = header(self.header)
@ -220,18 +241,16 @@ class relation (object):
# d_headers are the headers from self that aren't also headers in other # d_headers are the headers from self that aren't also headers in other
d_headers = tuple(set(self.header) - set(other.header)) d_headers = tuple(set(self.header) - set(other.header))
''' # Wikipedia defines the division as follows:
Wikipedia defines the division as follows:
a1,....,an are the d_headers # a1,....,an are the d_headers
T := πa1,...,an(R) × S # T := πa1,...,an(R) × S
U := T - R # U := T - R
V := πa1,...,an(U) # V := πa1,...,an(U)
W := πa1,...,an(R) - V # W := πa1,...,an(R) - V
W is the result that we want # W is the result that we want
'''
t = self.projection(d_headers).product(other) t = self.projection(d_headers).product(other)
return self.projection(d_headers).difference(t.difference(self).projection(d_headers)) return self.projection(d_headers).difference(t.difference(self).projection(d_headers))
@ -239,10 +258,7 @@ class relation (object):
def union(self, other): def union(self, other):
'''Union operation. The result will contain items present in first '''Union operation. The result will contain items present in first
and second operands. and second operands.
Will return an empty one if both are empty. '''
Will not insert tuplicated items.
Will return None if headers are different.
It is possible to use projection and rename to make headers match.'''
other = self._rearrange(other) # Rearranges attributes' order other = self._rearrange(other) # Rearranges attributes' order
newt = relation() newt = relation()
newt.header = header(self.header) newt.header = header(self.header)
@ -262,19 +278,19 @@ class relation (object):
return a.union(b) return a.union(b)
def outer_right(self, other): def outer_right(self, other):
'''Outer right join. Considers self as left and param as right. If the '''
Outer right join. Considers self as left and param as right. If the
tuple has no corrispondence, empy attributes are filled with a "---" tuple has no corrispondence, empy attributes are filled with a "---"
string. This is due to the fact that empty string or a space would cause string. This is due to the fact that the None token would cause
problems when saving the relation. problems when saving and reloading the relation.
Just like natural join, it works considering shared attributes.''' Just like natural join, it works considering shared attributes.
'''
return other.outer_left(self) return other.outer_left(self)
def outer_left(self, other, swap=False): def outer_left(self, other, swap=False):
'''Outer left join. Considers self as left and param as right. If the '''
tuple has no corrispondence, empty attributes are filled with a "---" See documentation for outer_right
string. This is due to the fact that empty string or a space would cause '''
problems when saving the relation.
Just like natural join, it works considering shared attributes.'''
shared = self.header.intersection(other.header) shared = self.header.intersection(other.header)
@ -313,8 +329,10 @@ class relation (object):
return newt return newt
def join(self, other): def join(self, other):
'''Natural join, joins on shared attributes (one or more). If there are no '''
shared attributes, it will behave as cartesian product.''' Natural join, joins on shared attributes (one or more). If there are no
shared attributes, it will behave as the cartesian product.
'''
# List of attributes in common between the relations # List of attributes in common between the relations
shared = self.header.intersection(other.header) shared = self.header.intersection(other.header)
@ -347,8 +365,6 @@ class relation (object):
return newt return newt
def __eq__(self, other): def __eq__(self, other):
'''Returns true if the relations are the same, ignoring order of items.
This operation is rather heavy, since it requires sorting and comparing.'''
if not isinstance(other, relation): if not isinstance(other, relation):
return False return False
@ -368,8 +384,6 @@ class relation (object):
return len(self.content) return len(self.content)
def __str__(self): def __str__(self):
'''Returns a string representation of the relation, can be printed with
monospaced fonts'''
m_len = [] # Maximum lenght string m_len = [] # Maximum lenght string
for f in self.header: for f in self.header:
m_len.append(len(f)) m_len.append(len(f))
@ -395,13 +409,19 @@ class relation (object):
return res return res
def update(self, expr, dic): def update(self, expr, dic):
'''Update, expr must be a valid boolean expression, can contain field names, '''
constant, math operations and boolean ones. Updates certain values of a relation.
expr must be a valid Python expression that can contain field names.
This operation will change the relation itself instead of generating a new one, This operation will change the relation itself instead of generating a new one,
updating all the tuples that make expr true. updating all the tuples where expr evaluates as True.
Dic must be a dictionary that has the form field name:value. Every kind of value
Dic must be a dictionary that has the form "field name":"new value". Every kind of value
will be converted into a string. will be converted into a string.
Returns the number of affected rows.'''
Returns the number of affected rows.
'''
self._make_writable() self._make_writable()
affected = 0 affected = 0
attributes = {} attributes = {}
@ -409,7 +429,7 @@ class relation (object):
f_ids = self.header.getAttributesId(keys) f_ids = self.header.getAttributesId(keys)
# new_content=[] #New content of the relation # new_content=[] #New content of the relation
for i in self.content: for i in set(self.content):
for j, attr in enumerate(self.header): for j, attr in enumerate(self.header):
attributes[attr] = i[j].autocast() attributes[attr] = i[j].autocast()
@ -426,10 +446,14 @@ class relation (object):
return affected return affected
def insert(self, values): def insert(self, values):
'''Inserts a tuple in the relation. '''
Inserts a tuple in the relation.
This function will not insert duplicate tuples. This function will not insert duplicate tuples.
All the values will be converted in string. All the values will be converted in string.
Will return the number of inserted rows.''' Will return the number of inserted rows.
Will fail if the tuple has the wrong amount of items.
'''
if len(self.header) != len(values): if len(self.header) != len(values):
raise Exception( raise Exception(
@ -446,13 +470,13 @@ class relation (object):
return len(self.content) - prevlen return len(self.content) - prevlen
def delete(self, expr): def delete(self, expr):
'''Delete, expr must be a valid boolean expression, can contain field names, '''
constant, math operations and boolean ones. Delete, expr must be a valid Python expression; can contain field names.
This operation will change the relation itself instead of generating a new one,
deleting all the tuples that make expr true.
Returns the number of affected rows.'''
# Not necessary self._make_writable() This operation will change the relation itself instead of generating a new one,
deleting all the tuples where expr evaluates as True.
Returns the number of affected rows.'''
l = len(self.content) l = len(self.content)
self._readonly = False self._readonly = False