Improved docstring

2015-07-14 15:08:39 +07:00 · 2015-07-14 15:08:39 +07:00 · af02b5a59b
parent c275c1caf3
commit af02b5a59b
1 changed files with 98 additions and 74 deletions
--- a/relational/relation.py
+++ b/relational/relation.py
@ -28,19 +28,31 @@ from relational.rtypes import *

 class relation (object):

-    '''This objects defines a relation (as a group of consistent tuples) and operations
-    A relation can be represented using a table
-    Calling an operation and providing a non relation parameter when it is expected will
-    result in a None value'''
+    '''
+    This object defines a relation (as a group of consistent tuples) and operations.
+
+    A relation is a particular kind of set, which has a number of named attributes and
+    a number of tuples, which must express a value for every attribute.
+
+    Set operations like union, intersection and difference are restricted and can only be
+    performed on relations which share the same set of named attributes.
+
+    The constructor optionally accepts a filename and then it will load the relation from
+    that file.
+
+    If no parameter is supplied an empty relation is created.
+
+    Files need to be comma separated as described in RFC4180.
+
+    The first line need to contain the attributes of the relation while the
+    following lines contain the tuples of the relation.
+
+    An empty relation needs a header, and can be filled using the insert()
+    method.
+    '''
    __hash__ = None

    def __init__(self, filename=""):
-        '''Creates a relation, accepts a filename and then it will load the relation from
-        that file. If no parameter is supplied an empty relation is created. Empty
-        relations are used in internal operations.
-        By default the file will be handled like a comma separated as described in
-        RFC4180.'''
-
        self._readonly = False

        if len(filename) == 0:  # Empty relation
@ -71,9 +83,9 @@ class relation (object):
        return key in self.content

    def save(self, filename):
-        '''Saves the relation in a file. By default will save using the csv
-        format as defined in RFC4180, but setting comma_separated to False,
-        it will use the old format with space separated values.
+        '''
+        Saves the relation in a file. Will save using the csv
+        format as defined in RFC4180.
        '''

        fp = open(filename, 'w')  # Opening file in write mode
@ -105,8 +117,9 @@ class relation (object):
        ))

    def selection(self, expr):
-        '''Selection, expr must be a valid boolean expression, can contain field names,
-        constant, math operations and boolean ones.'''
+        '''
+        Selection, expr must be a valid Python expression; can contain field names.
+        '''
        newt = relation()
        newt.header = header(self.header)
        for i in self.content:
@ -124,10 +137,9 @@ class relation (object):
        return newt

    def product(self, other):
-        '''Cartesian product, attributes must be different to avoid collisions
-        Doing this operation on relations with colliding attributes will
-        cause an exception.
-        It is possible to use rename on attributes and then use the product'''
+        '''
+        Cartesian product. Attributes of the relations must differ.
+        '''

        if (not isinstance(other, relation)):
            raise Exception('Operand must be a relation')
@ -144,10 +156,17 @@ class relation (object):
        return newt

    def projection(self, * attributes):
-        '''Projection operator, takes many parameters, for each field to use.
-        Can also use a single parameter with a list.
-        Will delete duplicate items
-        If an empty list or no parameters are provided, returns None'''
+        '''
+        Can be called in two different ways:
+        a.projection('field1','field2')
+
+        or
+
+        a.projection(['field1','field2'])
+
+        The cardinality of the result, might be less than the cardinality
+        of the original object.
+        '''
        # Parameters are supplied in a list, instead with multiple parameters
        if not isinstance(attributes[0], str):
            attributes = attributes[0]
@ -168,9 +187,13 @@ class relation (object):
        return newt

    def rename(self, params):
-        '''Operation rename. Takes a dictionary
-        Will replace the itmem with its content.
-        For example if you want to rename a to b, provide {"a":"b"}
+        '''
+        Takes a dictionary.
+
+        Will replace the field name as the key with its value.
+
+        For example if you want to rename a to b, call
+        rel.rename({'a':'b'})
        '''
        result = []

@ -183,11 +206,11 @@ class relation (object):
        return newt

    def intersection(self, other):
-        '''Intersection operation. The result will contain items present in both
+        '''
+        Intersection operation. The result will contain items present in both
        operands.
        Will return an empty one if there are no common items.
-        Will return None if headers are different.
-        It is possible to use projection and rename to make headers match.'''
+        '''
        other = self._rearrange(other)  # Rearranges attributes' order
        newt = relation()
        newt.header = header(self.header)
@ -198,9 +221,7 @@ class relation (object):
    def difference(self, other):
        '''Difference operation. The result will contain items present in first
        operand but not in second one.
-        Will return an empty one if the second is a superset of first.
-        Will return None if headers are different.
-        It is possible to use projection and rename to make headers match.'''
+        '''
        other = self._rearrange(other)  # Rearranges attributes' order
        newt = relation()
        newt.header = header(self.header)
@ -220,18 +241,16 @@ class relation (object):
        # d_headers are the headers from self that aren't also headers in other
        d_headers = tuple(set(self.header) - set(other.header))

-        '''
-        Wikipedia defines the division as follows:
+        # Wikipedia defines the division as follows:

-        a1,....,an are the d_headers
+        # a1,....,an are the d_headers

-        T := πa1,...,an(R) × S
-        U := T - R
-        V := πa1,...,an(U)
-        W := πa1,...,an(R) - V
+        # T := πa1,...,an(R) × S
+        # U := T - R
+        # V := πa1,...,an(U)
+        # W := πa1,...,an(R) - V

-        W is the result that we want
-        '''
+        # W is the result that we want

        t = self.projection(d_headers).product(other)
        return self.projection(d_headers).difference(t.difference(self).projection(d_headers))
@ -239,10 +258,7 @@ class relation (object):
    def union(self, other):
        '''Union operation. The result will contain items present in first
        and second operands.
-        Will return an empty one if both are empty.
-        Will not insert tuplicated items.
-        Will return None if headers are different.
-        It is possible to use projection and rename to make headers match.'''
+        '''
        other = self._rearrange(other)  # Rearranges attributes' order
        newt = relation()
        newt.header = header(self.header)
@ -262,19 +278,19 @@ class relation (object):
        return a.union(b)

    def outer_right(self, other):
-        '''Outer right join. Considers self as left and param as right. If the
+        '''
+        Outer right join. Considers self as left and param as right. If the
        tuple has no corrispondence, empy attributes are filled with a "---"
-        string. This is due to the fact that empty string or a space would cause
-        problems when saving the relation.
-        Just like natural join, it works considering shared attributes.'''
+        string. This is due to the fact that the None token would cause
+        problems when saving and reloading the relation.
+        Just like natural join, it works considering shared attributes.
+        '''
        return other.outer_left(self)

    def outer_left(self, other, swap=False):
-        '''Outer left join. Considers self as left and param as right. If the
-        tuple has no corrispondence, empty attributes are filled with a "---"
-        string. This is due to the fact that empty string or a space would cause
-        problems when saving the relation.
-        Just like natural join, it works considering shared attributes.'''
+        '''
+        See documentation for outer_right
+        '''

        shared = self.header.intersection(other.header)

@ -313,8 +329,10 @@ class relation (object):
        return newt

    def join(self, other):
-        '''Natural join, joins on shared attributes (one or more). If there are no
-        shared attributes, it will behave as cartesian product.'''
+        '''
+        Natural join, joins on shared attributes (one or more). If there are no
+        shared attributes, it will behave as the cartesian product.
+        '''

        # List of attributes in common between the relations
        shared = self.header.intersection(other.header)
@ -347,8 +365,6 @@ class relation (object):
        return newt

    def __eq__(self, other):
-        '''Returns true if the relations are the same, ignoring order of items.
-        This operation is rather heavy, since it requires sorting and comparing.'''
        if not isinstance(other, relation):
            return False

@ -368,8 +384,6 @@ class relation (object):
        return len(self.content)

    def __str__(self):
-        '''Returns a string representation of the relation, can be printed with
-        monospaced fonts'''
        m_len = []  # Maximum lenght string
        for f in self.header:
            m_len.append(len(f))
@ -395,13 +409,19 @@ class relation (object):
        return res

    def update(self, expr, dic):
-        '''Update, expr must be a valid boolean expression, can contain field names,
-        constant, math operations and boolean ones.
+        '''
+        Updates certain values of a relation.
+
+        expr must be a valid Python expression that can contain field names.
+
        This operation will change the relation itself instead of generating a new one,
-        updating all the tuples that make expr true.
-        Dic must be a dictionary that has the form field name:value. Every kind of value
+        updating all the tuples where expr evaluates as True.
+
+        Dic must be a dictionary that has the form "field name":"new value". Every kind of value
        will be converted into a string.
-        Returns the number of affected rows.'''
+
+        Returns the number of affected rows.
+        '''
        self._make_writable()
        affected = 0
        attributes = {}
@ -409,7 +429,7 @@ class relation (object):
        f_ids = self.header.getAttributesId(keys)

        # new_content=[] #New content of the relation
-        for i in self.content:
+        for i in set(self.content):
            for j, attr in enumerate(self.header):
                attributes[attr] = i[j].autocast()

@ -426,10 +446,14 @@ class relation (object):
        return affected

    def insert(self, values):
-        '''Inserts a tuple in the relation.
+        '''
+        Inserts a tuple in the relation.
        This function will not insert duplicate tuples.
        All the values will be converted in string.
-        Will return the number of inserted rows.'''
+        Will return the number of inserted rows.
+
+        Will fail if the tuple has the wrong amount of items.
+        '''

        if len(self.header) != len(values):
            raise Exception(
@ -446,13 +470,13 @@ class relation (object):
        return len(self.content) - prevlen

    def delete(self, expr):
-        '''Delete, expr must be a valid boolean expression, can contain field names,
-        constant, math operations and boolean ones.
-        This operation will change the relation itself instead of generating a new one,
-        deleting all the tuples that make expr true.
-        Returns the number of affected rows.'''
+        '''
+        Delete, expr must be a valid Python expression; can contain field names.

-        # Not necessary self._make_writable()
+        This operation will change the relation itself instead of generating a new one,
+        deleting all the tuples where expr evaluates as True.
+
+        Returns the number of affected rows.'''

        l = len(self.content)
        self._readonly = False