mirror of
https://github.com/gristlabs/grist-core.git
synced 2024-10-27 20:44:07 +00:00
0e5c2bee59
Summary: get_cell_value wraps RaisedException with CellError to expand the error message for the user. This is still pretty conceptual, the comments explain some things to think about, but it works and is an improvement. Test Plan: Updated Python unit tests Reviewers: dsagal, paulfitz Reviewed By: dsagal Differential Revision: https://phab.getgrist.com/D2928
630 lines
18 KiB
Python
630 lines
18 KiB
Python
# -*- coding: UTF-8 -*-
|
||
# pylint: disable=unused-argument
|
||
|
||
from __future__ import absolute_import
|
||
import datetime
|
||
import math
|
||
import numbers
|
||
import re
|
||
|
||
import six
|
||
|
||
import column
|
||
from functions import date # pylint: disable=import-error
|
||
from functions.unimplemented import unimplemented
|
||
from objtypes import CellError
|
||
from usertypes import AltText # pylint: disable=import-error
|
||
from records import Record, RecordSet
|
||
|
||
@unimplemented
|
||
def ISBLANK(value):
|
||
"""
|
||
Returns whether a value refers to an empty cell. It isn't implemented in Grist. To check for an
|
||
empty string, use `value == ""`.
|
||
"""
|
||
raise NotImplementedError()
|
||
|
||
|
||
def ISERR(value):
|
||
"""
|
||
Checks whether a value is an error. In other words, it returns true
|
||
if using `value` directly would raise an exception.
|
||
|
||
NOTE: Grist implements this by automatically wrapping the argument to use lazy evaluation.
|
||
|
||
A more Pythonic approach to checking for errors is:
|
||
```
|
||
try:
|
||
... value ...
|
||
except Exception, err:
|
||
... do something about the error ...
|
||
```
|
||
|
||
For example:
|
||
|
||
>>> ISERR("Hello")
|
||
False
|
||
|
||
More tests:
|
||
>>> ISERR(lambda: (1/0.1))
|
||
False
|
||
>>> ISERR(lambda: (1/0.0))
|
||
True
|
||
>>> ISERR(lambda: "test".bar())
|
||
True
|
||
>>> ISERR(lambda: "test".upper())
|
||
False
|
||
>>> ISERR(lambda: AltText("A"))
|
||
False
|
||
>>> ISERR(lambda: float('nan'))
|
||
False
|
||
>>> ISERR(lambda: None)
|
||
False
|
||
"""
|
||
return lazy_value_or_error(value) is _error_sentinel
|
||
|
||
|
||
def ISERROR(value):
|
||
"""
|
||
Checks whether a value is an error or an invalid value. It is similar to `ISERR`, but also
|
||
returns true for an invalid value such as NaN or a text value in a Numeric column.
|
||
|
||
NOTE: Grist implements this by automatically wrapping the argument to use lazy evaluation.
|
||
|
||
>>> ISERROR("Hello")
|
||
False
|
||
>>> ISERROR(AltText("fail"))
|
||
True
|
||
>>> ISERROR(float('nan'))
|
||
True
|
||
|
||
More tests:
|
||
>>> ISERROR(AltText(""))
|
||
True
|
||
>>> [ISERROR(v) for v in [0, None, "", "Test", 17.0]]
|
||
[False, False, False, False, False]
|
||
>>> ISERROR(lambda: (1/0.1))
|
||
False
|
||
>>> ISERROR(lambda: (1/0.0))
|
||
True
|
||
>>> ISERROR(lambda: "test".bar())
|
||
True
|
||
>>> ISERROR(lambda: "test".upper())
|
||
False
|
||
>>> ISERROR(lambda: AltText("A"))
|
||
True
|
||
>>> ISERROR(lambda: float('nan'))
|
||
True
|
||
>>> ISERROR(lambda: None)
|
||
False
|
||
"""
|
||
return is_error(lazy_value_or_error(value))
|
||
|
||
|
||
def ISLOGICAL(value):
|
||
"""
|
||
Checks whether a value is `True` or `False`.
|
||
|
||
>>> ISLOGICAL(True)
|
||
True
|
||
>>> ISLOGICAL(False)
|
||
True
|
||
>>> ISLOGICAL(0)
|
||
False
|
||
>>> ISLOGICAL(None)
|
||
False
|
||
>>> ISLOGICAL("Test")
|
||
False
|
||
"""
|
||
return isinstance(value, bool)
|
||
|
||
|
||
def ISNA(value):
|
||
"""
|
||
Checks whether a value is the error `#N/A`.
|
||
|
||
>>> ISNA(float('nan'))
|
||
True
|
||
>>> ISNA(0.0)
|
||
False
|
||
>>> ISNA('text')
|
||
False
|
||
>>> ISNA(float('-inf'))
|
||
False
|
||
"""
|
||
return isinstance(value, float) and math.isnan(value)
|
||
|
||
|
||
def ISNONTEXT(value):
|
||
"""
|
||
Checks whether a value is non-textual.
|
||
|
||
>>> ISNONTEXT("asdf")
|
||
False
|
||
>>> ISNONTEXT("")
|
||
False
|
||
>>> ISNONTEXT(AltText("text"))
|
||
False
|
||
>>> ISNONTEXT(17.0)
|
||
True
|
||
>>> ISNONTEXT(None)
|
||
True
|
||
>>> ISNONTEXT(datetime.date(2011, 1, 1))
|
||
True
|
||
"""
|
||
return not ISTEXT(value)
|
||
|
||
|
||
def ISNUMBER(value):
|
||
"""
|
||
Checks whether a value is a number.
|
||
|
||
>>> ISNUMBER(17)
|
||
True
|
||
>>> ISNUMBER(-123.123423)
|
||
True
|
||
>>> ISNUMBER(False)
|
||
True
|
||
>>> ISNUMBER(float('nan'))
|
||
True
|
||
>>> ISNUMBER(float('inf'))
|
||
True
|
||
>>> ISNUMBER('17')
|
||
False
|
||
>>> ISNUMBER(None)
|
||
False
|
||
>>> ISNUMBER(datetime.date(2011, 1, 1))
|
||
False
|
||
|
||
More tests:
|
||
>>> ISNUMBER(AltText("text"))
|
||
False
|
||
>>> ISNUMBER('')
|
||
False
|
||
"""
|
||
return isinstance(value, numbers.Number)
|
||
|
||
|
||
def ISREF(value):
|
||
"""
|
||
Checks whether a value is a table record.
|
||
|
||
For example, if a column `person` is of type Reference to the `People` table,
|
||
then `ISREF($person)` is `True`.
|
||
Similarly, `ISREF(People.lookupOne(name=$name))` is `True`. For any other type of value,
|
||
`ISREF()` would evaluate to `False`.
|
||
|
||
>>> ISREF(17)
|
||
False
|
||
>>> ISREF("Roger")
|
||
False
|
||
|
||
"""
|
||
return isinstance(value, Record)
|
||
|
||
|
||
def ISREFLIST(value):
|
||
"""
|
||
Checks whether a value is a [`RecordSet`](#recordset),
|
||
the type of values in Reference List columns.
|
||
|
||
For example, if a column `people` is of type Reference List to the `People` table,
|
||
then `ISREFLIST($people)` is `True`.
|
||
Similarly, `ISREFLIST(People.lookupRecords(name=$name))` is `True`. For any other type of value,
|
||
`ISREFLIST()` would evaluate to `False`.
|
||
|
||
>>> ISREFLIST(17)
|
||
False
|
||
>>> ISREFLIST("Roger")
|
||
False
|
||
|
||
"""
|
||
return isinstance(value, RecordSet)
|
||
|
||
|
||
def ISTEXT(value):
|
||
"""
|
||
Checks whether a value is text.
|
||
|
||
>>> ISTEXT("asdf")
|
||
True
|
||
>>> ISTEXT("")
|
||
True
|
||
>>> ISTEXT(AltText("text"))
|
||
True
|
||
>>> ISTEXT(17.0)
|
||
False
|
||
>>> ISTEXT(None)
|
||
False
|
||
>>> ISTEXT(datetime.date(2011, 1, 1))
|
||
False
|
||
"""
|
||
return isinstance(value, (six.string_types, AltText))
|
||
|
||
|
||
# Regexp for matching email. See ISEMAIL for justification.
|
||
_email_regexp = re.compile(
|
||
r"""
|
||
^\w # Start with an alphanumeric character
|
||
[\w%+/='-]* (\.[\w%+/='-]+)* # Elsewhere allow also a few other special characters
|
||
# But no two consecutive periods
|
||
@
|
||
([A-Za-z0-9] # Each part of hostname must start with alphanumeric
|
||
([A-Za-z0-9-]*[A-Za-z0-9])?\. # May have dashes inside, but end in alphanumeric
|
||
)+
|
||
[A-Za-z]{2,6}$ # Restrict top-level domain to length {2,6}. Google seems
|
||
# to use a whitelist for TLDs longer than 2 characters.
|
||
""", re.UNICODE | re.VERBOSE)
|
||
|
||
|
||
# Regexp for matching hostname part of URLs (see also ISURL). Duplicates part of _email_regexp.
|
||
_hostname_regexp = re.compile(
|
||
r"""^
|
||
([A-Za-z0-9] # Each part of hostname must start with alphanumeric
|
||
([A-Za-z0-9-]*[A-Za-z0-9])?\. # May have dashes inside, but end in alphanumeric
|
||
)+
|
||
[A-Za-z]{2,6}$ # Restrict top-level domain to length {2,6}. Google seems
|
||
""", re.VERBOSE)
|
||
|
||
|
||
def ISEMAIL(value):
|
||
u"""
|
||
Returns whether a value is a valid email address.
|
||
|
||
Note that checking email validity is not an exact science. The technical standard considers many
|
||
email addresses valid that are not used in practice, and would not be considered valid by most
|
||
users. Instead, we follow Google Sheets implementation, with some differences, noted below.
|
||
|
||
>>> ISEMAIL("Abc.123@example.com")
|
||
True
|
||
>>> ISEMAIL("Bob_O-Reilly+tag@example.com")
|
||
True
|
||
>>> ISEMAIL("John Doe")
|
||
False
|
||
>>> ISEMAIL("john@aol...com")
|
||
False
|
||
|
||
More tests:
|
||
>>> ISEMAIL("Abc@example.com") # True, True
|
||
True
|
||
>>> ISEMAIL("Abc.123@example.com") # True, True
|
||
True
|
||
>>> ISEMAIL("foo@bar.com") # True, True
|
||
True
|
||
>>> ISEMAIL("asdf@com.zt") # True, True
|
||
True
|
||
>>> ISEMAIL("Bob_O-Reilly+tag@example.com") # True, True
|
||
True
|
||
>>> ISEMAIL("john@server.department.company.com") # True, True
|
||
True
|
||
>>> ISEMAIL("asdf@mail.ru") # True, True
|
||
True
|
||
>>> ISEMAIL("fabio@foo.qwer.COM") # True, True
|
||
True
|
||
>>> ISEMAIL("user+mailbox/department=shipping@example.com") # False, True
|
||
True
|
||
>>> ISEMAIL(u"user+mailbox/department=shipping@example.com") # False, True
|
||
True
|
||
>>> ISEMAIL("customer/department=shipping@example.com") # False, True
|
||
True
|
||
>>> ISEMAIL("Bob_O'Reilly+tag@example.com") # False, True
|
||
True
|
||
>>> ISEMAIL(u"фыва@mail.ru") # False, True
|
||
True
|
||
>>> ISEMAIL("my@baddash.-.com") # True, False
|
||
False
|
||
>>> ISEMAIL("my@baddash.-a.com") # True, False
|
||
False
|
||
>>> ISEMAIL("my@baddash.b-.com") # True, False
|
||
False
|
||
>>> ISEMAIL("john@-.com") # True, False
|
||
False
|
||
>>> ISEMAIL("fabio@disapproved.solutions") # False, False
|
||
False
|
||
>>> ISEMAIL("!def!xyz%abc@example.com") # False, False
|
||
False
|
||
>>> ISEMAIL("!#$%&'*+-/=?^_`.{|}~@example.com") # False, False
|
||
False
|
||
>>> ISEMAIL(u"伊昭傑@郵件.商務") # False, False
|
||
False
|
||
>>> ISEMAIL(u"राम@मोहन.ईन्फो") # False, Fale
|
||
False
|
||
>>> ISEMAIL(u"юзер@екзампл.ком") # False, False
|
||
False
|
||
>>> ISEMAIL(u"θσερ@εχαμπλε.ψομ") # False, False
|
||
False
|
||
>>> ISEMAIL(u"葉士豪@臺網中心.tw") # False, False
|
||
False
|
||
>>> ISEMAIL(u"jeff@臺網中心.tw") # False, False
|
||
False
|
||
>>> ISEMAIL(u"葉士豪@臺網中心.台灣") # False, False
|
||
False
|
||
>>> ISEMAIL(u"jeff葉@臺網中心.tw") # False, False
|
||
False
|
||
>>> ISEMAIL("my.name@domain.com") # False, False
|
||
False
|
||
>>> ISEMAIL("my.name@domain.com") # False, False
|
||
False
|
||
>>> ISEMAIL("my@.leadingdot.com") # False, False
|
||
False
|
||
>>> ISEMAIL("my@..leadingfwdot.com") # False, False
|
||
False
|
||
>>> ISEMAIL("my@..twodots.com") # False, False
|
||
False
|
||
>>> ISEMAIL("my@twodots..com") # False, False
|
||
False
|
||
>>> ISEMAIL(".leadingdot@domain.com") # False, False
|
||
False
|
||
>>> ISEMAIL("..twodots@domain.com") # False, False
|
||
False
|
||
>>> ISEMAIL("twodots..here@domain.com") # False, False
|
||
False
|
||
>>> ISEMAIL("me@⒈wouldbeinvalid.com") # False, False
|
||
False
|
||
>>> ISEMAIL("Foo Bar <a+2asdf@qwer.bar.com>") # False, False
|
||
False
|
||
>>> ISEMAIL("Abc\\@def@example.com") # False, False
|
||
False
|
||
>>> ISEMAIL("foo@bar@google.com") # False, False
|
||
False
|
||
>>> ISEMAIL("john@aol...com") # False, False
|
||
False
|
||
>>> ISEMAIL("x@ทีเอชนิค.ไทย") # False, False
|
||
False
|
||
>>> ISEMAIL("asdf@mail") # False, False
|
||
False
|
||
>>> ISEMAIL("example@良好Mail.中国") # False, False
|
||
False
|
||
"""
|
||
return bool(_email_regexp.match(value))
|
||
|
||
|
||
_url_regexp = re.compile(
|
||
r"""^
|
||
((ftp|http|https|gopher|mailto|news|telnet|aim)://)?
|
||
(\w+@)? # Allow 'user@' part, esp. useful for mailto: URLs.
|
||
([A-Za-z0-9] # Each part of hostname must start with alphanumeric
|
||
([A-Za-z0-9-]*[A-Za-z0-9])?\. # May have dashes inside, but end in alphanumeric
|
||
)+
|
||
[A-Za-z]{2,6} # Restrict top-level domain to length {2,6}. Google seems
|
||
# to use a whitelist for TLDs longer than 2 characters.
|
||
([/?][-\w!#$%&'()*+,./:;=?@~]*)?$ # Notably, this excludes <, >, and ".
|
||
""", re.VERBOSE)
|
||
|
||
|
||
def ISURL(value):
|
||
"""
|
||
Checks whether a value is a valid URL. It does not need to be fully qualified, or to include
|
||
"http://" and "www". It does not follow a standard, but attempts to work similarly to ISURL in
|
||
Google Sheets, and to return True for text that is likely a URL.
|
||
|
||
Valid protocols include ftp, http, https, gopher, mailto, news, telnet, and aim.
|
||
|
||
>>> ISURL("http://www.getgrist.com")
|
||
True
|
||
>>> ISURL("https://foo.com/test_(wikipedia)#cite-1")
|
||
True
|
||
>>> ISURL("mailto://user@example.com")
|
||
True
|
||
>>> ISURL("http:///a")
|
||
False
|
||
|
||
More tests:
|
||
>>> ISURL("http://www.google.com")
|
||
True
|
||
>>> ISURL("www.google.com/")
|
||
True
|
||
>>> ISURL("google.com")
|
||
True
|
||
>>> ISURL("http://a.b-c.de")
|
||
True
|
||
>>> ISURL("a.b-c.de")
|
||
True
|
||
>>> ISURL("http://j.mp/---")
|
||
True
|
||
>>> ISURL("ftp://foo.bar/baz")
|
||
True
|
||
>>> ISURL("https://foo.com/blah_(wikipedia)#cite-1")
|
||
True
|
||
>>> ISURL("mailto://user@google.com")
|
||
True
|
||
>>> ISURL("http://user@www.google.com")
|
||
True
|
||
>>> ISURL("http://foo.com/!#$%25&'()*+,-./=?@_~")
|
||
True
|
||
>>> ISURL("http://../")
|
||
False
|
||
>>> ISURL("http://??/")
|
||
False
|
||
>>> ISURL("a.-b.cd")
|
||
False
|
||
>>> ISURL("http://foo.bar?q=Spaces should be encoded ")
|
||
False
|
||
>>> ISURL("//")
|
||
False
|
||
>>> ISURL("///a")
|
||
False
|
||
>>> ISURL("http:///a")
|
||
False
|
||
>>> ISURL("bar://www.google.com")
|
||
False
|
||
>>> ISURL("http:// shouldfail.com")
|
||
False
|
||
>>> ISURL("ftps://foo.bar/")
|
||
False
|
||
>>> ISURL("http://-error-.invalid/")
|
||
False
|
||
>>> ISURL("http://0.0.0.0")
|
||
False
|
||
>>> ISURL("http://.www.foo.bar/")
|
||
False
|
||
>>> ISURL("http://.www.foo.bar./")
|
||
False
|
||
>>> ISURL("example.com/file[/].html")
|
||
False
|
||
>>> ISURL("http://example.com/file[/].html")
|
||
False
|
||
>>> ISURL("http://mw1.google.com/kml-samples/gp/seattle/gigapxl/$[level]/r$[y]_c$[x].jpg")
|
||
False
|
||
>>> ISURL("http://foo.com/>")
|
||
False
|
||
"""
|
||
value = value.strip()
|
||
if ' ' in value: # Disallow spaces inside value.
|
||
return False
|
||
return bool(_url_regexp.match(value))
|
||
|
||
|
||
def N(value):
|
||
"""
|
||
Returns the value converted to a number. True/False are converted to 1/0. A date is converted to
|
||
Excel-style serial number of the date. Anything else is converted to 0.
|
||
|
||
>>> N(7)
|
||
7
|
||
>>> N(7.1)
|
||
7.1
|
||
>>> N("Even")
|
||
0
|
||
>>> N("7")
|
||
0
|
||
>>> N(True)
|
||
1
|
||
>>> N(datetime.datetime(2011, 4, 17))
|
||
40650.0
|
||
"""
|
||
if ISNUMBER(value):
|
||
return value
|
||
if isinstance(value, datetime.date):
|
||
return date.DATE_TO_XL(value)
|
||
return 0
|
||
|
||
|
||
def NA():
|
||
"""
|
||
Returns the "value not available" error, `#N/A`.
|
||
|
||
>>> math.isnan(NA())
|
||
True
|
||
"""
|
||
return float('nan')
|
||
|
||
|
||
@unimplemented
|
||
def TYPE(value):
|
||
"""
|
||
Returns a number associated with the type of data passed into the function. This is not
|
||
implemented in Grist. Use `isinstance(value, type)` or `type(value)`.
|
||
"""
|
||
raise NotImplementedError()
|
||
|
||
@unimplemented
|
||
def CELL(info_type, reference):
|
||
"""
|
||
Returns the requested information about the specified cell. This is not implemented in Grist
|
||
"""
|
||
raise NotImplementedError()
|
||
|
||
|
||
def RECORD(record_or_list, dates_as_iso=False, expand_refs=0):
|
||
"""
|
||
Returns a Python dictionary with all fields in the given record. If a list of records is given,
|
||
returns a list of corresponding Python dictionaries.
|
||
|
||
If dates_as_iso is set, Date and DateTime values are converted to string using ISO 8601 format.
|
||
|
||
If expand_refs is set to 1 or higher, Reference values are replaced with a RECORD representation
|
||
of the referenced record, expanding the given number of levels.
|
||
|
||
Error values present in cells of the record are replaced with None value, and a special key of
|
||
"_error_" gets added containing the error messages for those cells. For example:
|
||
`{"Ratio": None, "_error_": {"Ratio": "ZeroDivisionError: integer division or modulo by zero"}}`
|
||
|
||
Note that care is needed to avoid circular references when using RECORD(), since it creates a
|
||
dependency on every cell in the record. In case of RECORD(rec), the cell containing this call
|
||
will be omitted from the resulting dictionary.
|
||
|
||
For example:
|
||
```
|
||
RECORD($Person)
|
||
RECORD(rec)
|
||
RECORD(People.lookupOne(First_Name="Alice"))
|
||
RECORD(People.lookupRecords(Department="HR"))
|
||
```
|
||
"""
|
||
if isinstance(record_or_list, Record):
|
||
return _prepare_record_dict(record_or_list, dates_as_iso=dates_as_iso, expand_refs=expand_refs)
|
||
|
||
try:
|
||
records = list(record_or_list)
|
||
assert all(isinstance(r, Record) for r in records)
|
||
except Exception:
|
||
raise ValueError('RECORD() requires a Record or an iterable of Records')
|
||
|
||
return [_prepare_record_dict(r, dates_as_iso=dates_as_iso, expand_refs=expand_refs)
|
||
for r in records]
|
||
|
||
|
||
def _prepare_record_dict(record, dates_as_iso=False, expand_refs=0):
|
||
table_id = record._table.table_id
|
||
docmodel = record._table._engine.docmodel
|
||
columns = docmodel.get_table_rec(table_id).columns
|
||
frame = record._table._engine.get_current_frame()
|
||
|
||
result = {'id': int(record)}
|
||
errors = {}
|
||
for col in columns:
|
||
col_id = col.colId
|
||
# Skip helper columns.
|
||
if not column.is_visible_column(col_id):
|
||
continue
|
||
|
||
# Avoid trying to access the cell being evaluated, since cycles get detected even if the
|
||
# CircularRef exception is caught. TODO This is hacky, and imperfect. If another column
|
||
# references a column containing the RECORD(rec) call, CircularRefError will still happen.
|
||
if frame and frame.node == (table_id, col_id):
|
||
continue
|
||
|
||
try:
|
||
val = getattr(record, col_id)
|
||
if dates_as_iso and isinstance(val, datetime.date):
|
||
val = val.isoformat()
|
||
elif expand_refs and isinstance(val, (Record, RecordSet)):
|
||
# Reduce expand_refs levels.
|
||
if val:
|
||
val = RECORD(val, dates_as_iso=dates_as_iso, expand_refs=expand_refs - 1)
|
||
else:
|
||
val = None
|
||
result[col_id] = val
|
||
except Exception as e:
|
||
result[col_id] = None
|
||
while isinstance(e, CellError):
|
||
# The extra information from CellError is redundant here
|
||
e = e.error # pylint: disable=no-member
|
||
errors[col_id] = "%s: %s" % (type(e).__name__, str(e))
|
||
|
||
if errors:
|
||
result["_error_"] = errors
|
||
return result
|
||
|
||
|
||
# Unique sentinel value to represent that a lazy value evaluates with an exception.
|
||
_error_sentinel = object()
|
||
|
||
def lazy_value_or_error(value):
|
||
"""
|
||
Evaluates a value like lazy_value(), but returns _error_sentinel on exception.
|
||
"""
|
||
try:
|
||
return value() if callable(value) else value
|
||
except Exception:
|
||
return _error_sentinel
|
||
|
||
def is_error(value):
|
||
"""
|
||
Checks whether a value is an invalid value or _error_sentinel.
|
||
"""
|
||
return ((value is _error_sentinel)
|
||
or isinstance(value, AltText)
|
||
or (isinstance(value, float) and math.isnan(value)))
|