cybertools/pyscript/rstat.py
helmutm 4321f24b38 more on rstat.getDataFrame()
git-svn-id: svn://svn.cy55.de/Zope3/src/cybertools/trunk@2099 fd906abe-77d9-0310-91a1-e0d9ade77398
2007-10-08 11:58:24 +00:00

116 lines
3.6 KiB
Python

#
# Copyright (c) 2007 Helmut Merz helmutm@cy55.de
#
# This program is free software; you can redistribute it and/or modify
# it under the terms of the GNU General Public License as published by
# the Free Software Foundation; either version 2 of the License, or
# (at your option) any later version.
#
# This program is distributed in the hope that it will be useful,
# but WITHOUT ANY WARRANTY; without even the implied warranty of
# MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
# GNU General Public License for more details.
#
# You should have received a copy of the GNU General Public License
# along with this program; if not, write to the Free Software
# Foundation, Inc., 59 Temple Place, Suite 330, Boston, MA 02111-1307 USA
#
"""
Working transparently with the R statistics package.
$Id$
"""
import os
import rpy
from rpy import r
from zope.proxy import removeAllProxies
from zope.traversing.browser import absoluteURL
from cybertools.pyscript.plot import registerImage
# not used (yet?):
class RWrapper(object):
    """Wrapper that strips Zope proxies from whatever an object hands out.

    Attribute reads are forwarded to the wrapped ``context`` and the value
    found there is passed through ``removeAllProxies`` before it is
    returned. Calling the wrapper calls ``context`` with the same
    arguments, strips proxies from the result and wraps that result in a
    new ``RWrapper``.
    """

    def __init__(self, context):
        self.context = context

    def __getattr__(self, attr):
        # ``__getattr__`` only runs when the normal lookup has failed. If
        # that happens for ``context`` itself (an instance created without
        # ``__init__``, as ``copy`` and ``pickle`` do), delegating to
        # ``self.context`` would re-enter this method without end, so fail
        # like any other missing attribute instead.
        if attr == 'context':
            raise AttributeError(attr)
        value = getattr(self.context, attr)
        return removeAllProxies(value)

    def __call__(self, *args, **kw):
        value = self.context.__call__(*args, **kw)
        value = removeAllProxies(value)
        # Wrap the result again so that further attribute access and calls
        # on it keep going through the proxy-stripping layer.
        return RWrapper(value)
# Module-level wrapper around rpy's ``r`` object: attribute values and call
# results obtained through ``rx`` are passed through ``removeAllProxies``.
rx = RWrapper(r)
# The same kind of wrapper around ``rpy.with_mode``.
with_mode = RWrapper(rpy.with_mode)
# A matching wrapper for ``rpy.as_py`` is currently disabled:
#as_py = RWrapper(rpy.as_py)
def gdd(**kw):
    """Open an R ``GDD`` graphics device that writes a JPEG image.

    Loads the R library ``GDD`` and calls ``r.GDD`` with a fresh temporary
    file name, ``type='jpg'`` and any keyword arguments given in ``kw``.

    Returns a tuple ``(path, robj)``: ``path`` is the temporary name with
    ``'.jpg'`` appended, ``robj`` is whatever ``r.GDD`` returned.
    """
    # Local import so this function does not depend on the module's import
    # block being changed.
    import tempfile

    r.library('GDD')
    # ``os.tempnam`` emits a RuntimeWarning on Python 2 and no longer exists
    # on Python 3; ``tempfile.mktemp`` yields the same kind of not-yet-
    # existing path in the temp directory. Only a *name* is wanted here: the
    # path returned below is ``filename + '.jpg'``, presumably because GDD
    # appends the extension itself (TODO confirm). NOTE(review): like the
    # call it replaces, this reserves nothing, so another process could
    # still create the file first.
    filename = tempfile.mktemp(prefix='rplot')
    robj = r.GDD(filename, type='jpg', **kw)
    return filename + '.jpg', robj
class RStat(object):
    """Gives code working on a context object and its request access to R.

    ``context`` and ``request`` are stored as given; ``graphics`` uses both
    to build the URL under which a plot image can be fetched.
    """

    def __init__(self, context, request):
        self.context = context
        self.request = request

    def graphics(self, **kw):
        """Open a GDD graphics device and return the URL of its image.

        Keyword arguments are handed on to ``gdd()``. The image file name
        returned by ``gdd()`` is registered via ``registerImage``; the
        resulting key is embedded in the returned URL, which has the form
        ``<absolute URL of context>/@@plot?image=<key>.jpg``.
        """
        fn = gdd(**kw)[0]
        key = registerImage(fn)
        baseUrl = absoluteURL(self.context, self.request)
        return '%s/@@plot?image=%s.jpg' % (baseUrl, key)

    def getDataFrame(self, data):
        """ Return an R data.frame built from ``data``.

            The ``data`` argument is a sequence of tuples
            (rowId, columnId, value). If the same (rowId, columnId)
            pair occurs more than once, the entry that sorts last wins.

            A row is only used if it has a value for every columnId
            that occurs anywhere in ``data``; all other rows are
            omitted. Each remaining rowId is passed to R's data.frame
            as a keyword argument whose value is the list of that
            row's values ordered by columnId, so rowIds have to be
            strings.

            The mapping passed to R is also stored on the instance as
            ``intermediateData``.
        """
        rowsByColumn = {}
        values = {}
        for rowId, columnId, value in sorted(data):
            rowsByColumn.setdefault(columnId, set()).add(rowId)
            values[(rowId, columnId)] = value

        # A row is complete when it shows up in every column. Once the
        # incomplete rows are dropped, each remaining row has exactly one
        # value per column, so all value lists have the same length and no
        # separate filtering of columns is needed.
        rowSets = list(rowsByColumn.values())
        if rowSets:
            completeRows = set.intersection(*rowSets)
        else:
            completeRows = set()

        result = {}
        for (rowId, columnId), value in sorted(values.items()):
            if rowId in completeRows:
                result.setdefault(rowId, []).append(value)
        # Stored before R is involved, so the data can be inspected even
        # when one of the R calls below fails.
        self.intermediateData = result

        r.library('ltm')
        # NO_CONVERSION: the frame is wanted as an R object; see the rpy
        # documentation on conversion modes.
        matrix = rpy.with_mode(rpy.NO_CONVERSION, r.data_frame)(**result)
        return matrix