2020-07-27 18:57:36 +00:00
|
|
|
"""
|
|
|
|
gencode.py is the module that generates a python module based on the schema in a grist document.
|
|
|
|
An example of the module it generates is available in usercode.py.
|
|
|
|
|
|
|
|
The schema for grist data is:
|
|
|
|
<schema> = [ <table_info> ]
|
|
|
|
<table_info> = {
|
|
|
|
"tableId": <string>,
|
|
|
|
"columns": [ <column_info> ],
|
|
|
|
}
|
|
|
|
<column_info> = {
|
|
|
|
"id": <string>,
|
|
|
|
"type": <string>
|
|
|
|
"isFormula": <boolean>,
|
|
|
|
"formula": <opt_string>,
|
|
|
|
}
|
|
|
|
"""
|
2021-07-12 20:14:23 +00:00
|
|
|
import linecache
|
2020-07-27 18:57:36 +00:00
|
|
|
import re
|
|
|
|
import imp
|
|
|
|
from collections import OrderedDict
|
|
|
|
|
2021-06-22 15:12:25 +00:00
|
|
|
import six
|
|
|
|
|
2020-07-27 18:57:36 +00:00
|
|
|
import codebuilder
|
2020-07-31 02:10:18 +00:00
|
|
|
from column import is_visible_column
|
2020-07-27 18:57:36 +00:00
|
|
|
import summary
|
|
|
|
import table
|
|
|
|
import textbuilder
|
|
|
|
from usertypes import get_type_default
|
|
|
|
import logger
|
|
|
|
log = logger.Logger(__name__, logger.INFO)
|
|
|
|
|
|
|
|
indent_str = " "
|
|
|
|
|
|
|
|
# Matches newlines that are followed by a non-empty line.
|
|
|
|
indent_line_re = re.compile(r'^(?=.*\S)', re.M)
|
|
|
|
|
|
|
|
def indent(body, levels=1):
|
|
|
|
"""Indents all lines in body (which should be a textbuilder.Builder), except empty ones."""
|
|
|
|
patches = textbuilder.make_regexp_patches(body.get_text(), indent_line_re, indent_str * levels)
|
|
|
|
return textbuilder.Replacer(body, patches)
|
|
|
|
|
|
|
|
#----------------------------------------------------------------------
|
|
|
|
|
|
|
|
def get_grist_type(col_type):
|
|
|
|
"""Returns code for a grist usertype object given a column type string."""
|
|
|
|
col_type_split = col_type.split(':', 1)
|
|
|
|
typename = col_type_split[0]
|
|
|
|
if typename == 'Ref':
|
|
|
|
typename = 'Reference'
|
|
|
|
elif typename == 'RefList':
|
|
|
|
typename = 'ReferenceList'
|
|
|
|
|
|
|
|
arg = col_type_split[1] if len(col_type_split) > 1 else ''
|
|
|
|
arg = arg.strip().replace("'", "\\'")
|
|
|
|
|
|
|
|
return "grist.%s(%s)" % (typename, ("'%s'" % arg) if arg else '')
|
|
|
|
|
|
|
|
|
|
|
|
class GenCode(object):
|
|
|
|
"""
|
|
|
|
GenCode generates the Python code for a Grist document, including converting formulas to Python
|
|
|
|
functions and producing a Python specification of all the tables with data and formula fields.
|
|
|
|
|
|
|
|
To save the costly work of generating formula code, it maintains a formula cache. It is a
|
|
|
|
dictionary mapping (table_id, col_id, formula) to a textbuilder.Builder. On each run of
|
|
|
|
make_module(), it will use the previously cached values for lookups, and replace the contents
|
|
|
|
of the cache with current values. If ever we need to generate code for unrelated schemas, to
|
|
|
|
benefit from the cache, a separate GenCode object should be used for each schema.
|
|
|
|
"""
|
|
|
|
def __init__(self):
|
|
|
|
self._formula_cache = {}
|
|
|
|
self._new_formula_cache = {}
|
|
|
|
self._full_builder = None
|
|
|
|
self._user_builder = None
|
|
|
|
self._usercode = None
|
|
|
|
|
(core) Implement trigger formulas (generalizing default formulas)
Summary:
Trigger formulas can be calculated for new records, or for new records and
updates to certain fields, or all fields. They do not recalculate on open,
and they MAY be set directly by the user, including for data-cleaning.
- Column metadata now includes recalcWhen and recalcDeps fields.
- Trigger formulas are NOT recalculated on open or on schema changes.
- When recalcWhen is "never", formula isn't calculated even for new records.
- When recalcWhen is "allupdates", formula is calculated for new records and
any manual (non-formula) updates to the record.
- When recalcWhen is "", formula is calculated for new records, and changes to
recalcDeps fields (which may be formula fields or column itself).
- A column whose recalcDeps includes itself is a "data-cleaning" column; a
value set by the user will still trigger the formula.
- All trigger-formulas receive a "value" argument (to support the case above).
Small changes
- Update RefLists (used for recalcDeps) when target rows are deleted.
- Add RecordList.__contains__ (for `rec in refList` or `id in refList` checks)
- Clarify that Calculate action has replaced load_done() in practice,
and use it in tests too, to better match reality.
Left for later:
- UI for setting recalcWhen / recalcDeps.
- Implementation of actions such as "Recalculate for all cells".
- Allowing trigger-formulas access to the current user's info.
Test Plan: Added a comprehensive python-side test for various trigger combinations
Reviewers: paulfitz, alexmojaki
Reviewed By: paulfitz
Differential Revision: https://phab.getgrist.com/D2872
2021-06-25 20:34:20 +00:00
|
|
|
def _make_formula_field(self, col_info, table_id, name=None, include_type=True,
|
2021-07-15 00:45:53 +00:00
|
|
|
additional_params=()):
|
2020-07-27 18:57:36 +00:00
|
|
|
"""Returns the code for a formula field."""
|
|
|
|
# If the caller didn't specify a special name, use the colId
|
|
|
|
name = name or col_info.colId
|
|
|
|
|
2021-07-15 00:45:53 +00:00
|
|
|
decl = "def %s(%s):\n" % (
|
|
|
|
name,
|
|
|
|
', '.join(['rec', 'table'] + list(additional_params))
|
|
|
|
)
|
2020-07-27 18:57:36 +00:00
|
|
|
|
|
|
|
# This is where we get to use the formula cache, and save the work of rebuilding formulas.
|
|
|
|
key = (table_id, col_info.colId, col_info.formula)
|
|
|
|
body = self._formula_cache.get(key)
|
|
|
|
if body is None:
|
|
|
|
default = get_type_default(col_info.type)
|
|
|
|
body = codebuilder.make_formula_body(col_info.formula, default, (table_id, col_info.colId))
|
|
|
|
self._new_formula_cache[key] = body
|
|
|
|
|
|
|
|
decorator = ''
|
|
|
|
if include_type and col_info.type != 'Any':
|
|
|
|
decorator = '@grist.formulaType(%s)\n' % get_grist_type(col_info.type)
|
|
|
|
return textbuilder.Combiner(['\n' + decorator + decl, indent(body), '\n'])
|
|
|
|
|
|
|
|
|
|
|
|
def _make_data_field(self, col_info, table_id):
|
|
|
|
"""Returns the code for a data field."""
|
|
|
|
parts = []
|
|
|
|
if col_info.formula:
|
|
|
|
parts.append(self._make_formula_field(col_info, table_id,
|
|
|
|
name=table.get_default_func_name(col_info.colId),
|
(core) Implement trigger formulas (generalizing default formulas)
Summary:
Trigger formulas can be calculated for new records, or for new records and
updates to certain fields, or all fields. They do not recalculate on open,
and they MAY be set directly by the user, including for data-cleaning.
- Column metadata now includes recalcWhen and recalcDeps fields.
- Trigger formulas are NOT recalculated on open or on schema changes.
- When recalcWhen is "never", formula isn't calculated even for new records.
- When recalcWhen is "allupdates", formula is calculated for new records and
any manual (non-formula) updates to the record.
- When recalcWhen is "", formula is calculated for new records, and changes to
recalcDeps fields (which may be formula fields or column itself).
- A column whose recalcDeps includes itself is a "data-cleaning" column; a
value set by the user will still trigger the formula.
- All trigger-formulas receive a "value" argument (to support the case above).
Small changes
- Update RefLists (used for recalcDeps) when target rows are deleted.
- Add RecordList.__contains__ (for `rec in refList` or `id in refList` checks)
- Clarify that Calculate action has replaced load_done() in practice,
and use it in tests too, to better match reality.
Left for later:
- UI for setting recalcWhen / recalcDeps.
- Implementation of actions such as "Recalculate for all cells".
- Allowing trigger-formulas access to the current user's info.
Test Plan: Added a comprehensive python-side test for various trigger combinations
Reviewers: paulfitz, alexmojaki
Reviewed By: paulfitz
Differential Revision: https://phab.getgrist.com/D2872
2021-06-25 20:34:20 +00:00
|
|
|
include_type=False,
|
2021-07-15 00:45:53 +00:00
|
|
|
additional_params=['value', 'user']))
|
2020-07-27 18:57:36 +00:00
|
|
|
parts.append("%s = %s\n" % (col_info.colId, get_grist_type(col_info.type)))
|
|
|
|
return textbuilder.Combiner(parts)
|
|
|
|
|
|
|
|
|
|
|
|
def _make_field(self, col_info, table_id):
|
|
|
|
"""Returns the code for a field."""
|
|
|
|
assert not col_info.colId.startswith("_")
|
|
|
|
if col_info.isFormula:
|
|
|
|
return self._make_formula_field(col_info, table_id)
|
|
|
|
else:
|
|
|
|
return self._make_data_field(col_info, table_id)
|
|
|
|
|
|
|
|
|
2020-07-31 02:10:18 +00:00
|
|
|
def _make_table_model(self, table_info, summary_tables, filter_for_user=False):
|
|
|
|
"""
|
|
|
|
Returns the code for a table model.
|
|
|
|
If filter_for_user is True, includes only user-visible columns.
|
|
|
|
"""
|
2020-07-27 18:57:36 +00:00
|
|
|
table_id = table_info.tableId
|
(core) Nice summary table IDs
Summary:
Changes auto-generated summary table IDs from e.g. `GristSummary_6_Table1` to `Table1_summary_A_B` (meaning `Table1` grouped by `A` and `B`). This makes it easier to write formulas involving summary tables, make API requests, understand logs, etc.
Because these don't encode the source table ID as reliably as before, `decode_summary_table_name` now uses the summary table schema info, not just the summary table ID. Specifically, it looks at the type of the `group` column, which is `RefList:<source table id>`.
Renaming a source table renames the summary table as before, and now renaming a groupby column renames the summary table as well.
Conflicting table names are resolved in the usual way by adding a number at the end, e.g. `Table1_summary_A_B2`. These summary tables are not automatically renamed when the disambiguation is no longer needed.
A new migration renames all summary tables to the new scheme, and updates formulas using summary tables with a simple regex.
Test Plan:
Updated many tests to use the new style of name.
Added new Python tests to for resolving conflicts when renaming source tables and groupby columns.
Added a test for the migration, including renames in formulas.
Reviewers: georgegevoian
Reviewed By: georgegevoian
Differential Revision: https://phab.getgrist.com/D3508
2022-07-11 18:00:25 +00:00
|
|
|
source_table_id = summary.decode_summary_table_name(table_info)
|
2020-07-27 18:57:36 +00:00
|
|
|
|
|
|
|
# Sort columns by "isFormula" to output all data columns before all formula columns.
|
2021-06-22 15:12:25 +00:00
|
|
|
columns = sorted(six.itervalues(table_info.columns), key=lambda c: c.isFormula)
|
2020-07-31 02:10:18 +00:00
|
|
|
if filter_for_user:
|
|
|
|
columns = [c for c in columns if is_visible_column(c.colId)]
|
2020-07-27 18:57:36 +00:00
|
|
|
parts = ["@grist.UserTable\nclass %s:\n" % table_id]
|
|
|
|
if source_table_id:
|
|
|
|
parts.append(indent(textbuilder.Text("_summarySourceTable = %r\n" % source_table_id)))
|
|
|
|
|
|
|
|
for col_info in columns:
|
|
|
|
parts.append(indent(self._make_field(col_info, table_id)))
|
|
|
|
|
|
|
|
if summary_tables:
|
|
|
|
# Include summary formulas, for the user's information.
|
|
|
|
formulas = OrderedDict((c.colId, c) for s in summary_tables
|
2021-06-22 15:12:25 +00:00
|
|
|
for c in six.itervalues(s.columns) if c.isFormula)
|
2020-07-27 18:57:36 +00:00
|
|
|
parts.append(indent(textbuilder.Text("\nclass _Summary:\n")))
|
2021-06-22 15:12:25 +00:00
|
|
|
for col_info in six.itervalues(formulas):
|
2020-07-27 18:57:36 +00:00
|
|
|
parts.append(indent(self._make_field(col_info, table_id), levels=2))
|
|
|
|
|
|
|
|
return textbuilder.Combiner(parts)
|
|
|
|
|
|
|
|
def make_module(self, schema):
|
2022-02-19 09:46:49 +00:00
|
|
|
"""Regenerates the code text and usercode module from updated document schema."""
|
2020-07-27 18:57:36 +00:00
|
|
|
# Collect summary tables to group them by source table.
|
|
|
|
summary_tables = {}
|
2021-06-22 15:12:25 +00:00
|
|
|
for table_info in six.itervalues(schema):
|
(core) Nice summary table IDs
Summary:
Changes auto-generated summary table IDs from e.g. `GristSummary_6_Table1` to `Table1_summary_A_B` (meaning `Table1` grouped by `A` and `B`). This makes it easier to write formulas involving summary tables, make API requests, understand logs, etc.
Because these don't encode the source table ID as reliably as before, `decode_summary_table_name` now uses the summary table schema info, not just the summary table ID. Specifically, it looks at the type of the `group` column, which is `RefList:<source table id>`.
Renaming a source table renames the summary table as before, and now renaming a groupby column renames the summary table as well.
Conflicting table names are resolved in the usual way by adding a number at the end, e.g. `Table1_summary_A_B2`. These summary tables are not automatically renamed when the disambiguation is no longer needed.
A new migration renames all summary tables to the new scheme, and updates formulas using summary tables with a simple regex.
Test Plan:
Updated many tests to use the new style of name.
Added new Python tests to for resolving conflicts when renaming source tables and groupby columns.
Added a test for the migration, including renames in formulas.
Reviewers: georgegevoian
Reviewed By: georgegevoian
Differential Revision: https://phab.getgrist.com/D3508
2022-07-11 18:00:25 +00:00
|
|
|
source_table_id = summary.decode_summary_table_name(table_info)
|
2020-07-27 18:57:36 +00:00
|
|
|
if source_table_id:
|
|
|
|
summary_tables.setdefault(source_table_id, []).append(table_info)
|
|
|
|
|
|
|
|
fullparts = ["import grist\n" +
|
|
|
|
"from functions import * # global uppercase functions\n" +
|
|
|
|
"import datetime, math, re # modules commonly needed in formulas\n"]
|
|
|
|
userparts = fullparts[:]
|
2021-06-22 15:12:25 +00:00
|
|
|
for table_info in six.itervalues(schema):
|
2020-07-27 18:57:36 +00:00
|
|
|
fullparts.append("\n\n")
|
2020-07-31 02:10:18 +00:00
|
|
|
fullparts.append(self._make_table_model(table_info, summary_tables.get(table_info.tableId)))
|
(core) Nice summary table IDs
Summary:
Changes auto-generated summary table IDs from e.g. `GristSummary_6_Table1` to `Table1_summary_A_B` (meaning `Table1` grouped by `A` and `B`). This makes it easier to write formulas involving summary tables, make API requests, understand logs, etc.
Because these don't encode the source table ID as reliably as before, `decode_summary_table_name` now uses the summary table schema info, not just the summary table ID. Specifically, it looks at the type of the `group` column, which is `RefList:<source table id>`.
Renaming a source table renames the summary table as before, and now renaming a groupby column renames the summary table as well.
Conflicting table names are resolved in the usual way by adding a number at the end, e.g. `Table1_summary_A_B2`. These summary tables are not automatically renamed when the disambiguation is no longer needed.
A new migration renames all summary tables to the new scheme, and updates formulas using summary tables with a simple regex.
Test Plan:
Updated many tests to use the new style of name.
Added new Python tests to for resolving conflicts when renaming source tables and groupby columns.
Added a test for the migration, including renames in formulas.
Reviewers: georgegevoian
Reviewed By: georgegevoian
Differential Revision: https://phab.getgrist.com/D3508
2022-07-11 18:00:25 +00:00
|
|
|
if not (
|
|
|
|
_is_special_table(table_info.tableId) or
|
|
|
|
summary.decode_summary_table_name(table_info)
|
|
|
|
):
|
2020-07-27 18:57:36 +00:00
|
|
|
userparts.append("\n\n")
|
2020-07-31 02:10:18 +00:00
|
|
|
userparts.append(self._make_table_model(table_info, summary_tables.get(table_info.tableId),
|
|
|
|
filter_for_user=True))
|
2020-07-27 18:57:36 +00:00
|
|
|
|
|
|
|
# Once all formulas are generated, replace the formula cache with the newly-populated version.
|
|
|
|
self._formula_cache = self._new_formula_cache
|
|
|
|
self._new_formula_cache = {}
|
|
|
|
self._full_builder = textbuilder.Combiner(fullparts)
|
|
|
|
self._user_builder = textbuilder.Combiner(userparts)
|
|
|
|
self._usercode = exec_module_text(self._full_builder.get_text())
|
|
|
|
|
|
|
|
def get_user_text(self):
|
|
|
|
"""Returns the text of the user-facing part of the generated code."""
|
|
|
|
return self._user_builder.get_text()
|
|
|
|
|
|
|
|
@property
|
|
|
|
def usercode(self):
|
|
|
|
"""Returns the generated usercode module."""
|
|
|
|
return self._usercode
|
|
|
|
|
|
|
|
def grist_names(self):
|
|
|
|
return codebuilder.parse_grist_names(self._full_builder)
|
|
|
|
|
|
|
|
|
|
|
|
def _is_special_table(table_id):
|
(core) Nice summary table IDs
Summary:
Changes auto-generated summary table IDs from e.g. `GristSummary_6_Table1` to `Table1_summary_A_B` (meaning `Table1` grouped by `A` and `B`). This makes it easier to write formulas involving summary tables, make API requests, understand logs, etc.
Because these don't encode the source table ID as reliably as before, `decode_summary_table_name` now uses the summary table schema info, not just the summary table ID. Specifically, it looks at the type of the `group` column, which is `RefList:<source table id>`.
Renaming a source table renames the summary table as before, and now renaming a groupby column renames the summary table as well.
Conflicting table names are resolved in the usual way by adding a number at the end, e.g. `Table1_summary_A_B2`. These summary tables are not automatically renamed when the disambiguation is no longer needed.
A new migration renames all summary tables to the new scheme, and updates formulas using summary tables with a simple regex.
Test Plan:
Updated many tests to use the new style of name.
Added new Python tests to for resolving conflicts when renaming source tables and groupby columns.
Added a test for the migration, including renames in formulas.
Reviewers: georgegevoian
Reviewed By: georgegevoian
Differential Revision: https://phab.getgrist.com/D3508
2022-07-11 18:00:25 +00:00
|
|
|
return table_id.startswith("_grist_")
|
2020-07-27 18:57:36 +00:00
|
|
|
|
|
|
|
|
|
|
|
def exec_module_text(module_text):
|
|
|
|
# pylint: disable=exec-used
|
2021-07-12 20:14:23 +00:00
|
|
|
filename = "usercode"
|
|
|
|
mod = imp.new_module(filename)
|
|
|
|
|
|
|
|
# Ensure that source lines show in tracebacks
|
|
|
|
linecache.cache[filename] = (
|
|
|
|
len(module_text),
|
|
|
|
None,
|
|
|
|
[line + '\n' for line in module_text.splitlines()],
|
|
|
|
filename,
|
|
|
|
)
|
|
|
|
|
|
|
|
code_obj = compile(module_text, filename, "exec")
|
|
|
|
exec(code_obj, mod.__dict__)
|
2020-07-27 18:57:36 +00:00
|
|
|
return mod
|