# Copyright (c) 2011, 2012 Free Software Foundation
# This program is free software: you can redistribute it and/or modify
# it under the terms of the GNU Affero General Public License as
# published by the Free Software Foundation, either version 3 of the
# License, or (at your option) any later version.
# This program is distributed in the hope that it will be useful,
# but WITHOUT ANY WARRANTY; without even the implied warranty of
# MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
# GNU Affero General Public License for more details.
# You should have received a copy of the GNU Affero General Public License
# along with this program. If not, see .
# This project incorporates work covered by the following copyright and permission notice:
# Copyright (c) 2009, Julien Fache
# All rights reserved.
# Redistribution and use in source and binary forms, with or without
# modification, are permitted provided that the following conditions
# are met:
# * Redistributions of source code must retain the above copyright
# notice, this list of conditions and the following disclaimer.
# * Redistributions in binary form must reproduce the above copyright
# notice, this list of conditions and the following disclaimer in
# the documentation and/or other materials provided with the
# distribution.
# * Neither the name of the author nor the names of other
# contributors may be used to endorse or promote products derived
# from this software without specific prior written permission.
# THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND CONTRIBUTORS
# "AS IS" AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT
# LIMITED TO, THE IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS
# FOR A PARTICULAR PURPOSE ARE DISCLAIMED. IN NO EVENT SHALL THE
# COPYRIGHT OWNER OR CONTRIBUTORS BE LIABLE FOR ANY DIRECT, INDIRECT,
# INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL DAMAGES
# (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS OR
# SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION)
# HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT,
# STRICT LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE)
# ARISING IN ANY WAY OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED
# OF THE POSSIBILITY OF SUCH DAMAGE.
# Copyright (c) 2011, 2012 Free Software Foundation
# This program is free software: you can redistribute it and/or modify
# it under the terms of the GNU Affero General Public License as
# published by the Free Software Foundation, either version 3 of the
# License, or (at your option) any later version.
# This program is distributed in the hope that it will be useful,
# but WITHOUT ANY WARRANTY; without even the implied warranty of
# MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
# GNU Affero General Public License for more details.
# You should have received a copy of the GNU Affero General Public License
# along with this program. If not, see .
"""Test cases for Gstudio's comparison"""
from django.test import TestCase
from gstudio.models import Nodetype
from gstudio.comparison import pearson_score
from gstudio.comparison import VectorBuilder
from gstudio.comparison import ClusteredModel
class ComparisonTestCase(TestCase):
"""Test cases for comparison tools"""
def test_pearson_score(self):
self.assertEquals(pearson_score([42], [42]), 0.0)
self.assertEquals(pearson_score([0, 1, 2], [0, 1, 2]), 0.0)
self.assertEquals(pearson_score([0, 1, 3], [0, 1, 2]),
0.051316701949486232)
self.assertEquals(pearson_score([0, 1, 2], [0, 1, 3]),
0.051316701949486232)
def test_clustered_model(self):
params = {'title': 'My nodetype 1', 'content': 'My content 1',
'tags': 'gstudio, test', 'slug': 'my-nodetype-1'}
Nodetype.objects.create(**params)
params = {'title': 'My nodetype 2', 'content': 'My content 2',
'tags': 'gstudio, test', 'slug': 'my-nodetype-2'}
Nodetype.objects.create(**params)
cm = ClusteredModel(Nodetype.objects.all())
self.assertEquals(cm.dataset().values(), ['1', '2'])
cm = ClusteredModel(Nodetype.objects.all(),
['title', 'excerpt', 'content'])
self.assertEquals(cm.dataset().values(), ['My nodetype 1 My content 1',
'My nodetype 2 My content 2'])
def test_vector_builder(self):
vectors = VectorBuilder(Nodetype.objects.all(),
['title', 'excerpt', 'content'])
params = {'title': 'My nodetype 1', 'content':
'This is my first content',
'tags': 'gstudio, test', 'slug': 'my-nodetype-1'}
Nodetype.objects.create(**params)
params = {'title': 'My nodetype 2', 'content':
'My second nodetype',
'tags': 'gstudio, test', 'slug': 'my-nodetype-2'}
Nodetype.objects.create(**params)
columns, dataset = vectors()
self.assertEquals(columns, ['content', 'This', 'my', 'is', '1',
'second', '2', 'first'])
self.assertEquals(dataset.values(), [[1, 1, 1, 1, 1, 0, 0, 1],
[0, 0, 0, 0, 0, 1, 1, 0]])