From c13eaf20fa94caf06524603b5ba1134a056d1b73 Mon Sep 17 00:00:00 2001
From: jmalar1 <julien.malard@mail.mcgill.ca>
Date: Tue, 26 Jun 2018 13:27:37 -0400
Subject: [PATCH 01/30] A few fixes (sorry).

---
 tests/test-models | 2 +-
 1 file changed, 1 insertion(+), 1 deletion(-)

diff --git a/tests/test-models b/tests/test-models
index d7762091..7fe1b71e 160000
--- a/tests/test-models
+++ b/tests/test-models
@@ -1 +1 @@
-Subproject commit d7762091600d6b40786521207cb564c86ac456f0
+Subproject commit 7fe1b71e175b1392d174c20a9f678b2f2fa45cf8

From dce7e37f1cebc556d56d3cc15c06e391ae12fabc Mon Sep 17 00:00:00 2001
From: julienmalard <julien.malard@mail.mcgill.ca>
Date: Wed, 21 Nov 2018 16:56:44 -0500
Subject: [PATCH 02/30] Added hyperbolic trigonometric functions and ugly hack
 for parsing ! subscripts for now.

---
 pysd/py_backend/vensim/vensim2py.py | 5 ++++-
 1 file changed, 4 insertions(+), 1 deletion(-)

diff --git a/pysd/py_backend/vensim/vensim2py.py b/pysd/py_backend/vensim/vensim2py.py
index f3d4f608..b8b97026 100644
--- a/pysd/py_backend/vensim/vensim2py.py
+++ b/pysd/py_backend/vensim/vensim2py.py
@@ -369,6 +369,9 @@ def parse_units(units_str):
     "arccos": "np.arccos",
     "arcsin": "np.arcsin",
     "arctan": "np.arctan",
+    "tanh": "np.tanh",
+    "sinh": "np.sinh",
+    "cosh": "np.cosh",
     "if then else": "functions.if_then_else",
     "step": {
         "name": "functions.step",
@@ -637,7 +640,7 @@ def parse_general_expression(element, namespace=None, subscript_dict=None, macro
     arguments = (expr _ ","? _)*
 
     reference = id _ subscript_list?
-    subscript_list = "[" _ ((sub_name / sub_element) _ ","? _)+ "]"
+    subscript_list = "[" _ ((sub_name / sub_element) "!"? _ ","? _)+ "]"
 
     array = (number _ ("," / ";")? _)+ !~r"."  # negative lookahead for anything other than an array
     number = ~r"\d+\.?\d*(e[+-]\d+)?"

From 7910ab5061d8d2d50bc7f01bc3e9151e3a6d3c3f Mon Sep 17 00:00:00 2001
From: julienmalard <julien.malard@mail.mcgill.ca>
Date: Fri, 23 Nov 2018 12:09:22 -0500
Subject: [PATCH 03/30] Fixed unicode error

---
 pysd/py_backend/builder.py | 6 +++---
 1 file changed, 3 insertions(+), 3 deletions(-)

diff --git a/pysd/py_backend/builder.py b/pysd/py_backend/builder.py
index 58cc8df6..8a45bcf1 100644
--- a/pysd/py_backend/builder.py
+++ b/pysd/py_backend/builder.py
@@ -154,11 +154,11 @@ def build_element(element, subscript_dict):
     element['doc'] = element['doc'].replace('\\', '\n    ').encode('unicode-escape')
 
     if 'unit' in element:
-        element['unit'] = element['unit'].encode('unicode-escape')
+        element['unit'] = element['unit'].encode('utf8')
     if 'real_name' in element:
-        element['real_name'] = element['real_name'].encode('unicode-escape')
+        element['real_name'] = element['real_name'].encode('utf8')
     if 'eqn' in element:
-        element['eqn'] = element['eqn'].encode('unicode-escape')
+        element['eqn'] = element['eqn'].encode('utf8')
     
     if element['kind'] == 'stateful':
         func = '''

From 08a73776ae115cf4790a74f6291df8dda483abda Mon Sep 17 00:00:00 2001
From: julienmalard <julien.malard@mail.mcgill.ca>
Date: Fri, 23 Nov 2018 12:12:23 -0500
Subject: [PATCH 04/30] Fixed for real

---
 pysd/py_backend/builder.py | 6 +++---
 1 file changed, 3 insertions(+), 3 deletions(-)

diff --git a/pysd/py_backend/builder.py b/pysd/py_backend/builder.py
index 8a45bcf1..4f9322b8 100644
--- a/pysd/py_backend/builder.py
+++ b/pysd/py_backend/builder.py
@@ -154,11 +154,11 @@ def build_element(element, subscript_dict):
     element['doc'] = element['doc'].replace('\\', '\n    ').encode('unicode-escape')
 
     if 'unit' in element:
-        element['unit'] = element['unit'].encode('utf8')
+        element['unit'] = element['unit']
     if 'real_name' in element:
-        element['real_name'] = element['real_name'].encode('utf8')
+        element['real_name'] = element['real_name']
     if 'eqn' in element:
-        element['eqn'] = element['eqn'].encode('utf8')
+        element['eqn'] = element['eqn']
     
     if element['kind'] == 'stateful':
         func = '''

From acd48a5d7e181f9efa5b9274fc21b2804c509de9 Mon Sep 17 00:00:00 2001
From: jmalar1 <julien.malard@mail.mcgill.ca>
Date: Tue, 26 Jun 2018 13:27:37 -0400
Subject: [PATCH 05/30] A few fixes (sorry).

---
 tests/test-models | 2 +-
 1 file changed, 1 insertion(+), 1 deletion(-)

diff --git a/tests/test-models b/tests/test-models
index 7fe1b71e..630fb864 160000
--- a/tests/test-models
+++ b/tests/test-models
@@ -1 +1 @@
-Subproject commit 7fe1b71e175b1392d174c20a9f678b2f2fa45cf8
+Subproject commit 630fb864fe7d509c32656bcb0a3831e46521a9f7

From ecd5ebe625fc218badeb147c8ad2aa06bbc81503 Mon Sep 17 00:00:00 2001
From: jmalar1 <julien.malard@mail.mcgill.ca>
Date: Tue, 26 Jun 2018 13:27:37 -0400
Subject: [PATCH 06/30] A few fixes (sorry).

---
 pysd/py_backend/functions.py | 322 +++++++++++++++++++++++++++++++++--
 1 file changed, 304 insertions(+), 18 deletions(-)

diff --git a/pysd/py_backend/functions.py b/pysd/py_backend/functions.py
index 8e1a1c77..1c2b733a 100644
--- a/pysd/py_backend/functions.py
+++ b/pysd/py_backend/functions.py
@@ -7,20 +7,23 @@
 """
 
 from __future__ import division, absolute_import
-from functools import wraps
 
-import pandas as pd
-
-import pandas as _pd
-import numpy as np
-from . import utils
 import imp
-import warnings
-import random
 import inspect
+import os
+import random
+import re
+import string
+import warnings
+from functools import wraps, reduce
+
+import numpy as np
+import pandas as _pd
+import pandas as pd
 import xarray as xr
 from funcsigs import signature
-import os
+
+from . import utils
 
 try:
     import scipy.stats as stats
@@ -173,7 +176,7 @@ class Delay(Stateful):
     # This method forces them to acknowledge that additional structure is being created
     # in the delay object.
 
-    def __init__(self, delay_input, delay_time, initial_value, order):
+    def __init__(self, delay_input, delay_time, initial_value, order, subs, subscript_dict):
         """
 
         Parameters
@@ -189,6 +192,8 @@ def __init__(self, delay_input, delay_time, initial_value, order):
         self.input_func = delay_input
         self.order_func = order
         self.order = None
+        self.subs = subs
+        self.subscript_dict = subscript_dict
 
     def initialize(self):
         order = self.order_func()
@@ -196,7 +201,14 @@ def initialize(self):
             warnings.warn('Casting delay order from %f to %i' % (order, int(order)))
         self.order = int(order)  # The order can only be set once
         init_state_value = self.init_func() * self.delay_time_func() / self.order
-        self.state = np.array([init_state_value] * self.order)
+        if self.subs:
+            coords = {d: self.subscript_dict[d] for d in self.subs}
+            size = [len(d) for d in coords.values()]
+            data = np.full((self.order, *size), init_state_value)
+            coords_final = {'delay': np.arange(self.order), **coords}
+            self.state = xr.DataArray(data=data, dims=['delay'] + self.subs, coords=coords_final)
+        else:
+            self.state = np.array([init_state_value] * self.order)
 
     def __call__(self):
         return self.state[-1] / (self.delay_time_func() / self.order)
@@ -263,6 +275,135 @@ def update(self, state):
         pass
 
 
+class Data(Stateful):
+    def __init__(self, file, tab, time_row_or_col, cell, interp, time, root, coords):
+        super(Data, self).__init__()
+        self.file = _resolve_file(file, root=root)
+        self.tab = tab
+        self.time_row_or_col = time_row_or_col
+        self.cell = cell
+        self.time_func = time
+        self.interp = interp
+        self.coords = coords
+
+    def initialize(self):
+        time_across = self.time_row_or_col.isnumeric()
+        size = int(np.product([len(v) for v in self.coords.values()]))
+
+        time_data, data = _get_series_data(
+            file=self.file, tab=self.tab, series_across=time_across, series_row_or_col=self.time_row_or_col,
+            cell=self.cell, size=size
+        )
+        self.state = xr.DataArray(
+            data=data, coords={'time': time_data, **self.coords}, dims=['time'] + list(self.coords)
+        )
+
+    def ddt(self):
+        return 0  # todo: is this correct?
+
+    def update(self, state):
+        # this doesn't change once it's set up.
+        pass
+
+    def __call__(self):
+
+        time = self.time_func()
+        if time > self.state['time'][-1]:
+            return self.state['time'][-1]
+        elif time < self.state['time'][0]:
+            return self.state['time'][0]
+
+        if self.interp == 'interpolate' or self.interp is None:  # 'interpolate' is the default
+            return self.state.interp(time=time)
+        elif self.interp == 'look forward':
+            next_t = self.state['time'][self.state['time'] >= time][0]
+            return self.state.sel(time=next_t)
+        elif self.interp == 'hold backward':
+            last_t = self.state['time'][self.state['time'] <= time][-1]
+            return self.state.sel(time=last_t)
+
+        # For :raw: (or actually any other/invalid) keyword directives
+        try:
+            return self.state.sel(time=time)
+        except KeyError:
+            return np.nan
+
+
+class ExtLookup(Stateful):
+    def __init__(self, file, tab, x_row_or_col, cell, root, coords):
+        super(ExtLookup, self).__init__()
+        self.file = _resolve_file(file, root=root)
+        self.tab = tab
+        self.x_row_or_col = x_row_or_col
+        self.cell = cell
+        self.coords = coords
+
+    def initialize(self):
+        x_across = self.x_row_or_col.isnumeric()
+        size = int(np.product([len(v) for v in self.coords.values()]))
+
+        x_data, data = _get_series_data(
+            file=self.file, tab=self.tab, series_across=x_across, series_row_or_col=self.x_row_or_col,
+            cell=self.cell, size=size
+        )
+        self.state = xr.DataArray(
+            data=data, coords={'x': x_data, **self.coords}, dims=['x'] + list(self.coords)
+        )
+
+    def ddt(self):
+        return 0
+
+    def update(self, state):
+        # this doesn't change once it's set up.
+        pass
+
+    def __call__(self, x):
+        if x > self.state['x'][-1]:
+            return self.state['x'][-1]
+        elif x < self.state['x'][0]:
+            return self.state['x'][0]
+
+        return self.state.interp(x=x)
+
+
+class ExtConstant(Stateful):
+    def __init__(self, file, tab, cell, root, coords):
+        super(ExtConstant, self).__init__()
+        self.file = _resolve_file(file, root=root)
+        self.tab = tab
+        self.transpose = cell[-1] == '*'
+        self.cell = cell.strip('*')
+        self.coords = coords
+
+    def initialize(self):
+        dims = list(self.coords)
+        start_row, start_col = _split_excel_cell(self.cell)
+        end_row = start_row
+        end_col = start_col
+        if dims:
+            if self.transpose:
+                end_row = start_row + len(self.coords[dims[-1]]) - 1
+            else:
+                end_col = _num_to_col(_col_to_num(start_col) + len(self.coords[dims[-1]]) - 1)
+
+            if len(dims) >= 2:
+                if self.transpose:
+                    end_col = _num_to_col(_col_to_num(start_col) + len(self.coords[dims[-2]]) - 1)
+                else:
+                    end_row = start_row + len(self.coords[dims[-2]]) - 1
+        data = _get_data_from_file(self.file, tab=self.tab, rows=[start_row, end_row], cols=[start_col, end_col])
+        self.state = xr.DataArray(
+            data=data, coords=self.coords, dims=list(self.coords)
+        )
+
+    def ddt(self):
+        return 0
+
+    def update(self, state):
+        # this doesn't change once it's set up.
+        pass
+
+
 class Macro(Stateful):
     """
     The Model class implements a stateful representation of the system,
@@ -309,14 +450,13 @@ def __init__(self, py_model_file, params=None, return_func=None, time=None, time
 
         self.py_model_file = py_model_file
 
-
     def __call__(self):
         return self.return_func()
 
     def get_pysd_compiler_version(self):
         """ Returns the version of pysd complier that used for generating this model """
         return self.components.__pysd_version__
-        
+
     def initialize(self, initialization_order=None):
         """
         This function tries to initialize the stateful objects.
@@ -543,7 +683,7 @@ def __init__(self, py_model_file):
         super(Model, self).__init__(py_model_file, None, None, Time())
         self.time.stage = 'Load'
         self.initialize()
-        
+
     def initialize(self):
         """ Initializes the simulation model """
         self.time.update(self.components.initial_time())
@@ -883,12 +1023,12 @@ def pulse_train(time, start, duration, repeat_time, end):
 
 def pulse_magnitude(time, magnitude, start, repeat_time=0):
     """ Implements xmile's PULSE function
-    
+
     PULSE:             Generate a one-DT wide pulse at the given time
        Parameters:     2 or 3:  (magnitude, first time[, interval])
                        Without interval or when interval = 0, the PULSE is generated only once
        Example:        PULSE(20, 12, 5) generates a pulse value of 20/DT at time 12, 17, 22, etc.
-    
+
     In rage [-inf, start) returns 0
     In range [start + n * repeat_time, start + n * repeat_time + dt) return magnitude/dt
     In rage [start + n * repeat_time + dt, start + (n + 1) * repeat_time) return 0
@@ -912,7 +1052,8 @@ def lookup(x, xs, ys):
     Intermediate values are calculated with linear interpolation between the intermediate points.
     Out-of-range values are the same as the closest endpoint (i.e, no extrapolation is performed).
     """
-    return np.interp(x, xs, ys)
+    return _preserve_array(np.interp(x, xs, ys), ref=x)
+
 
 def lookup_extrapolation(x, xs, ys):
     """
@@ -932,6 +1073,7 @@ def lookup_extrapolation(x, xs, ys):
         return ys[length - 1] + (x - xs[length - 1]) * k
     return np.interp(x, xs, ys)
 
+
 def lookup_discrete(x, xs, ys):
     """
     Intermediate values take on the value associated with the next lower x-coordinate (also called a step-wise function). The last two points of a discrete graphical function must have the same y value.
@@ -944,7 +1086,7 @@ def lookup_discrete(x, xs, ys):
 
 
 def if_then_else(condition, val_if_true, val_if_false):
-    return np.where(condition, val_if_true, val_if_false)
+    return xr.where(condition, val_if_true, val_if_false)
 
 
 def xidz(numerator, denominator, value_if_denom_is_zero):
@@ -1038,3 +1180,147 @@ def log(x, base):
     base: base of the logarithm
     """
     return np.log(x) / np.log(base)
+
+
+def and_(x, y):
+    return _preserve_array(np.logical_and(x, y), ref=[x, y])
+
+
+def or_(x, y):
+    return _preserve_array(np.logical_or(x, y), ref=[x, y])
+
+
+def sum(x, dim=None):
+    return x.sum(dim=dim)
+
+
+def prod(x, dim=None):
+    return x.prod(dim=dim)
+
+
+def vmin(x, dim=None):
+    return x.min(dim=dim)
+
+
+def vmax(x, dim=None):
+    return x.max(dim=dim)
+
+
+def _preserve_array(value, ref):
+    if not isinstance(ref, list):
+        ref = [ref]
+    array = next((r for r in ref if isinstance(r, xr.DataArray)), None)
+    if array is not None:
+        return xr.DataArray(data=value, coords=array.coords, dims=array.dims).squeeze()
+    else:
+        return value
+
+
+def get_direct_subscript(file, tab, firstcell, lastcell, prefix):
+    file = _resolve_file(file)
+
+    row_first, col_first = _split_excel_cell(firstcell)
+    row_last, col_last = _split_excel_cell(lastcell)
+    data = _get_data_from_file(
+        file, tab,
+        rows=[row_first, row_last],
+        cols=[col_first, col_last]
+    )
+    return [prefix + str(d) for d in data.flatten()]
+
+
+get_xls_subscript = get_direct_subscript
+
+
+def _get_series_data(file, tab, series_across, series_row_or_col, cell, size):
+    if series_across:
+        series_data = _get_data_from_file(file, tab, rows=int(series_row_or_col), cols=None, dropna=True)
+        first_data_row, first_col = _split_excel_cell(cell)
+        last_col = first_col + series_data.size - 1
+
+        last_data_row = first_data_row + size - 1
+        data = _get_data_from_file(
+            file, tab, rows=[first_data_row, last_data_row], cols=[first_col, last_col])
+    else:
+        first_row, first_col = _split_excel_cell(cell)
+        series_data = _get_data_from_file(
+            file, tab, rows=[first_row, None], cols=series_row_or_col, dropna=True
+        )
+
+        last_row = first_row + series_data.size - 1
+        cols = [first_col, _col_to_num(first_col) + size - 1]
+        data = _get_data_from_file(file, tab, rows=[first_row, last_row], cols=cols)
+
+    return series_data, data
+
+
+def _get_data_from_file(file, tab, rows, cols, dropna=False):
+    ext = os.path.splitext(file)[1].lower()
+    if ext in ['.xls', '.xlsx']:
+        if rows is None:
+            skip = nrows = None
+        elif isinstance(rows, int):
+            skip = rows
+            nrows = None
+        else:
+            skip = rows[0] - 1
+            nrows = rows[1] - skip if rows[1] is not None else None
+        if isinstance(cols, list):
+            cols = [_num_to_col(c) if isinstance(c, int) else c for c in cols]
+            usecols = cols[0] + ":" + cols[1]
+        else:
+            usecols = cols
+
+        data = pd.read_excel(
+            file, sheet_name=tab, header=None, skiprows=skip, nrows=nrows, usecols=usecols
+        )
+        if dropna:
+            data = data.dropna()
+        data = data.values
+        if isinstance(rows, int) or (isinstance(rows, list) and rows[0] == rows[1]):
+            data = data[0]
+        if isinstance(cols, str) or (isinstance(cols, list) and cols[0].lower() == cols[1].lower()):
+            data = data[:, 0]
+
+        return data
+
+    raise NotImplementedError(ext)
+
+
+def _split_excel_cell(cell):
+    return int(re.sub("[a-zA-Z]+", "", cell)), re.sub("[^a-zA-Z]+", "", cell)
+
+
+def _resolve_file(file, root=None, possible_ext=None):
+    possible_ext = possible_ext or ['.xls', '.xlsx', '.odt', '.txt', '.tab']
+
+    if file[0] == '?':
+        file = os.path.join(root, file[1:])
+
+    if os.path.isfile(file):
+        return file
+
+    for ext in possible_ext:
+        if os.path.isfile(file + ext):
+            return file + ext
+
+    raise FileNotFoundError(file)
+
+
+def _col_to_num(col):
+    return reduce(lambda r, x: r * 26 + x + 1, map(string.ascii_lowercase.index, col.lower()), 0)
+
+
+def _num_to_col(num):
+    chars = []
+
+    def divmod_excel(n):
+        a, b = divmod(n, 26)
+        if b == 0:
+            return a - 1, b + 26
+        return a, b
+
+    while num > 0:
+        num, d = divmod_excel(num)
+        chars.append(string.ascii_uppercase[d - 1])
+    return ''.join(reversed(chars)).lower()

From 7ac3aad8a0754d89db1f9ea27c6ab88e8d5bfdb6 Mon Sep 17 00:00:00 2001
From: julienmalard <julien.malard@mail.mcgill.ca>
Date: Tue, 10 Sep 2019 10:44:13 -0400
Subject: [PATCH 07/30] Lookup calls with subscripts

---
 pysd/py_backend/vensim/vensim2py.py | 2 +-
 1 file changed, 1 insertion(+), 1 deletion(-)

diff --git a/pysd/py_backend/vensim/vensim2py.py b/pysd/py_backend/vensim/vensim2py.py
index b8b97026..3812fd31 100644
--- a/pysd/py_backend/vensim/vensim2py.py
+++ b/pysd/py_backend/vensim/vensim2py.py
@@ -631,7 +631,7 @@ def parse_general_expression(element, namespace=None, subscript_dict=None, macro
     expr = _ pre_oper? _ (lookup_def / build_call / macro_call / call / lookup_call / parens / number / reference) _ (in_oper _ expr)?
 
     lookup_def = ~r"(WITH\ LOOKUP)"I _ "(" _ expr _ "," _ "(" _  ("[" ~r"[^\]]*" "]" _ ",")?  ( "(" _ expr _ "," _ expr _ ")" _ ","? _ )+ _ ")" _ ")"
-    lookup_call = id _ "(" _ (expr _ ","? _)* ")"  # these don't need their args parsed...
+    lookup_call = reference _ "(" _ (expr _ ","? _)* ")"  # these don't need their args parsed...
     call = func _ "(" _ (expr _ ","? _)* ")"  # these don't need their args parsed...
     build_call = builder _ "(" _ arguments _ ")"
     macro_call = macro _ "(" _ arguments _ ")"

From 32f347bdf8a29a8faf3561d89d4a8e15141059e0 Mon Sep 17 00:00:00 2001
From: julienmalard <julien.malard@mail.mcgill.ca>
Date: Tue, 10 Sep 2019 11:04:11 -0400
Subject: [PATCH 08/30] Allow single quoted strings as function arguments

---
 pysd/py_backend/vensim/vensim2py.py | 3 ++-
 1 file changed, 2 insertions(+), 1 deletion(-)

diff --git a/pysd/py_backend/vensim/vensim2py.py b/pysd/py_backend/vensim/vensim2py.py
index 3812fd31..23779ec4 100644
--- a/pysd/py_backend/vensim/vensim2py.py
+++ b/pysd/py_backend/vensim/vensim2py.py
@@ -628,7 +628,7 @@ def parse_general_expression(element, namespace=None, subscript_dict=None, macro
 
     expression_grammar = r"""
     expr_type = array / expr / empty
-    expr = _ pre_oper? _ (lookup_def / build_call / macro_call / call / lookup_call / parens / number / reference) _ (in_oper _ expr)?
+    expr = _ pre_oper? _ (lookup_def / build_call / macro_call / call / lookup_call / parens / number / string / reference) _ (in_oper _ expr)?
 
     lookup_def = ~r"(WITH\ LOOKUP)"I _ "(" _ expr _ "," _ "(" _  ("[" ~r"[^\]]*" "]" _ ",")?  ( "(" _ expr _ "," _ expr _ ")" _ ","? _ )+ _ ")" _ ")"
     lookup_call = reference _ "(" _ (expr _ ","? _)* ")"  # these don't need their args parsed...
@@ -644,6 +644,7 @@ def parse_general_expression(element, namespace=None, subscript_dict=None, macro
 
     array = (number _ ("," / ";")? _)+ !~r"."  # negative lookahead for anything other than an array
     number = ~r"\d+\.?\d*(e[+-]\d+)?"
+    string = "\'" ( "\\\'" / ~r"[^\']"IU )* "\'"
 
     id = ( basic_id / escape_group )
     basic_id = ~r"\w[\w\d_\s\']*"IU

From d03c5eff6d67924892de0dc3aee989c618e9d9f3 Mon Sep 17 00:00:00 2001
From: julienmalard <julien.malard@mail.mcgill.ca>
Date: Tue, 10 Sep 2019 11:05:23 -0400
Subject: [PATCH 09/30] Add data and test definitions, and the possibility of
 data keywords

---
 pysd/py_backend/vensim/vensim2py.py | 18 +++++++++++++++---
 1 file changed, 15 insertions(+), 3 deletions(-)

diff --git a/pysd/py_backend/vensim/vensim2py.py b/pysd/py_backend/vensim/vensim2py.py
index 23779ec4..0a1252d0 100644
--- a/pysd/py_backend/vensim/vensim2py.py
+++ b/pysd/py_backend/vensim/vensim2py.py
@@ -230,6 +230,7 @@ def get_equation_components(equation_str):
         - *component* - normal model expression or constant
         - *lookup* - a lookup table
         - *subdef* - a subscript definition
+        - *data* -  a data variable
 
     Examples
     --------
@@ -244,14 +245,17 @@ def get_equation_components(equation_str):
     """
 
     component_structure_grammar = _include_common_grammar(r"""
-    entry = component / subscript_definition / lookup_definition
+    entry = component / test_definition / subscript_definition / lookup_definition / data_definition
     component = name _ subscriptlist? _ "=" _ expression
-    subscript_definition = name _ ":" _ subscript _ ("," _ subscript)*
+    subscript_definition = name _ ":" expression
+    data_definition = name _ subscriptlist? _ &keyword _ ":=" _ expression
     lookup_definition = name _ &"(" _ expression  # uses lookahead assertion to capture whole group
+    test_definition = name _ subscriptlist? _ &keyword _ expression
 
     name = basic_id / escape_group
     subscriptlist = '[' _ subscript _ ("," _ subscript)* _ ']'
     expression = ~r".*"  # expression could be anything, at this point.
+    keyword = ":" _ basic_id _ ":"
 
     subscript = basic_id / escape_group
     """)
@@ -269,6 +273,7 @@ def __init__(self, ast):
             self.real_name = None
             self.expression = None
             self.kind = None
+            self.keyword = None
             self.visit(ast)
 
         def visit_subscript_definition(self, n, vc):
@@ -280,6 +285,12 @@ def visit_lookup_definition(self, n, vc):
         def visit_component(self, n, vc):
             self.kind = 'component'
 
+        def visit_data_definition(self, n, vc):
+            self.kind = 'data'
+
+        def visit_keyword(self, n, vc):
+            self.keyword = n.text.strip()
+
         def visit_name(self, n, vc):
             (name,) = vc
             self.real_name = name.strip()
@@ -302,7 +313,8 @@ def visit__(self, n, vc):
     return {'real_name': parse_object.real_name,
             'subs': parse_object.subscripts,
             'expr': parse_object.expression,
-            'kind': parse_object.kind}
+            'kind': parse_object.kind,
+            'keyword': parse_object.keyword}
 
 
 def parse_units(units_str):

From acaa01f333207fbfbfa617c285a4a76d5931c3cf Mon Sep 17 00:00:00 2001
From: julienmalard <julien.malard@mail.mcgill.ca>
Date: Tue, 10 Sep 2019 11:05:57 -0400
Subject: [PATCH 10/30] Add new data functions

---
 pysd/py_backend/vensim/vensim2py.py | 8 +++++++-
 1 file changed, 7 insertions(+), 1 deletion(-)

diff --git a/pysd/py_backend/vensim/vensim2py.py b/pysd/py_backend/vensim/vensim2py.py
index 0a1252d0..79efc278 100644
--- a/pysd/py_backend/vensim/vensim2py.py
+++ b/pysd/py_backend/vensim/vensim2py.py
@@ -440,7 +440,13 @@ def parse_units(units_str):
     # vector functions
     "vmin": "np.min",
     "vmax": "np.max",
-    "prod": "np.prod"
+    "prod": "np.prod",
+
+    # data functions
+    "get xls data": "functions.get_xls_data",
+    "get direct data": "functions.get_direct_data",
+    "get xls constants": "functions.get_xls_constants",
+    "get xls lookups":  "functions.get_xls_lookups"
 }
 
 builders = {

From 8fdb24ca35e82f4c7a7abb944d593182c973842f Mon Sep 17 00:00:00 2001
From: julienmalard <julien.malard@mail.mcgill.ca>
Date: Tue, 10 Sep 2019 11:06:03 -0400
Subject: [PATCH 11/30] Reformat

---
 pysd/py_backend/vensim/vensim2py.py | 22 +++++++++++++---------
 1 file changed, 13 insertions(+), 9 deletions(-)

diff --git a/pysd/py_backend/vensim/vensim2py.py b/pysd/py_backend/vensim/vensim2py.py
index 79efc278..ff0ef1ea 100644
--- a/pysd/py_backend/vensim/vensim2py.py
+++ b/pysd/py_backend/vensim/vensim2py.py
@@ -3,15 +3,18 @@
 model. Everything that requires knowledge of vensim syntax should be in this file.
 """
 from __future__ import absolute_import
+
+import os
 import re
+import textwrap
+import warnings
+from io import open
+
+import numpy as np
 import parsimonious
+
 from ...py_backend import builder
 from ...py_backend import utils
-from io import open
-import textwrap
-import numpy as np
-import os
-import warnings
 
 
 def get_file_sections(file_str):
@@ -203,6 +206,7 @@ def _include_common_grammar(source_grammar):
     {common_grammar}
     """.format(source_grammar=source_grammar, common_grammar=common_grammar)
 
+
 def get_equation_components(equation_str):
     """
     Breaks down a string representing only the equation part of a model element.
@@ -239,7 +243,7 @@ def get_equation_components(equation_str):
 
     Notes
     -----
-    in this function we dont create python identifiers, we use real names.
+    in this function we don't create python identifiers, we use real names.
     This is so that when everything comes back together, we can manage
     any potential namespace conflicts properly
     """
@@ -496,9 +500,9 @@ def parse_units(units_str):
 
     "delay fixed": lambda element, subscript_dict, args: builder.add_n_delay(
         delay_input=args[0],
-        delay_time='round('+args[1]+' / time_step() ) * time_step()',
+        delay_time='round(' + args[1] + ' / time_step() ) * time_step()',
         initial_value=args[2],
-        order=args[1]+' / time_step()',
+        order=args[1] + ' / time_step()',
         subs=element['subs'],
         subscript_dict=subscript_dict
     ),
@@ -690,7 +694,7 @@ def parse_general_expression(element, namespace=None, subscript_dict=None, macro
         'builders': '|'.join(reversed(sorted(builders.keys(), key=len))),
         'macros': '|'.join(reversed(sorted(macro_names_list, key=len)))
     }
-    
+
     class ExpressionParser(parsimonious.NodeVisitor):
         # Todo: at some point, we could make the 'kind' identification recursive on expression,
         # so that if an expression is passed into a builder function, the information

From 1a69cbf95c8d1e8f06dce9dba7c84770d5bdd914 Mon Sep 17 00:00:00 2001
From: Alexey Prey Mulyukin <alexprey@yandex.ru>
Date: Sat, 16 Jun 2018 01:32:24 +0300
Subject: [PATCH 12/30] Implement possibility to put any context information
 into functions without global references

---
 pysd/py_backend/builder.py | 65 +++++++-------------------------------
 1 file changed, 12 insertions(+), 53 deletions(-)

diff --git a/pysd/py_backend/builder.py b/pysd/py_backend/builder.py
index 4f9322b8..570f812e 100644
--- a/pysd/py_backend/builder.py
+++ b/pysd/py_backend/builder.py
@@ -321,7 +321,7 @@ def add_stock(identifier, subs, expression, initial_condition, subscript_dict):
 
     # describe the stateful object
     stateful = {
-        'py_name': '_integ_%s' % identifier,
+        'py_name': 'integ_%s' % identifier,
         'real_name': 'Representation of  %s' % identifier,
         'doc': 'Integrates Expression %s' % expression,
         'py_expr': stateful_py_expr,
@@ -381,7 +381,7 @@ def add_n_delay(delay_input, delay_time, initial_value, order, subs, subscript_d
     # that delay the output by different amounts, they'll overwrite the original function...
 
     stateful = {
-        'py_name': utils.make_python_identifier('_delay_%s_%s_%s_%s' % (delay_input,
+        'py_name': utils.make_python_identifier('delay_%s_%s_%s_%s' % (delay_input,
                                                                        delay_time,
                                                                        initial_value,
                                                                        order))[0],
@@ -441,7 +441,7 @@ def add_n_smooth(smooth_input, smooth_time, initial_value, order, subs, subscrip
         """
 
     stateful = {
-        'py_name': utils.make_python_identifier('_smooth_%s_%s_%s_%s' % (smooth_input,
+        'py_name': utils.make_python_identifier('smooth_%s_%s_%s_%s' % (smooth_input,
                                                                         smooth_time,
                                                                         initial_value,
                                                                         order))[0],
@@ -489,7 +489,7 @@ def add_n_trend(trend_input, average_time, initial_trend, subs, subscript_dict):
         """
 
     stateful = {
-        'py_name': utils.make_python_identifier('_trend_%s_%s_%s' % (trend_input,
+        'py_name': utils.make_python_identifier('trend_%s_%s_%s' % (trend_input,
                                                                     average_time,
                                                                     initial_trend))[0],
         'real_name': 'trend of %s' % trend_input,
@@ -528,7 +528,7 @@ def add_initial(initial_input):
 
     """
     stateful = {
-        'py_name': utils.make_python_identifier('_initial_%s' % initial_input)[0],
+        'py_name': utils.make_python_identifier('initial_%s' % initial_input)[0],
         'real_name': 'Smooth of %s' % initial_input,
         'doc': 'Returns the value taken on during the initialization phase',
         'py_expr': 'functions.Initial(lambda: %s)' % (
@@ -572,11 +572,11 @@ def add_macro(macro_name, filename, arg_names, arg_vals):
                                       zip(arg_names, arg_vals)])
 
     stateful = {
-        'py_name': '_macro_' + macro_name + '_' + '_'.join(
+        'py_name': 'macro_' + macro_name + '_' + '_'.join(
             [utils.make_python_identifier(f)[0] for f in arg_vals]),
         'real_name': 'Macro Instantiation of ' + macro_name,
         'doc': 'Instantiates the Macro',
-        'py_expr': "functions.Macro('%s', %s, '%s', time_initialization=lambda: __data['time'])" % (filename, func_args, macro_name),
+        'py_expr': "functions.Macro('%s', %s, '%s', __data['time'])" % (filename, func_args, macro_name),
         'unit': 'None',
         'lims': 'None',
         'eqn': 'None',
@@ -601,55 +601,14 @@ def add_incomplete(var_name, dependencies):
     # first arg is `self` reference
     return "functions.incomplete(%s)" % ', '.join(dependencies[1:]), []
 
-
 def build_function_call(function_def, user_arguments):
-    """
-
-    Parameters
-    ----------
-    function_def: function definition map with following keys
-        - name: name of the function
-        - parameters: list with description of all parameters of this function
-            - name
-            - optional?
-            - type: [
-                "expression", - provide converted expression as parameter for runtime evaluating before the method call
-                "lambda",     - provide lambda expression as parameter for delayed runtime evaluation in the method call
-                "time",       - provide access to current instance of time object
-                "scope"       - provide access to current instance of scope object (instance of Macro object)
-            ]
-    user_arguments: list of arguments provided from model
-
-    Returns
-    -------
-
-    """
     if isinstance(function_def, str):
         return function_def + "(" + ",".join(user_arguments) + ")"
 
-    if "parameters" in function_def:
-        parameters = function_def["parameters"]
-        arguments = []
-        argument_idx = 0
-        for parameter_idx in range(len(parameters)):
-            parameter_def = parameters[parameter_idx]
-            is_optional = parameter_def["optional"] if "optional" in parameter_def else False
-            if argument_idx >= len(user_arguments) and is_optional:
-                break
-
-            parameter_type = parameter_def["type"] if "type" in parameter_def else "expression"
-
-            user_argument = user_arguments[argument_idx]
-            if parameter_type in ["expression", "lambda"]:
-                argument_idx += 1
-
-            arguments.append({
-                "expression": user_argument,
-                "lambda": "lambda: (" + user_argument + ")",
-                "time": "__data['time']",
-                "scope": "__data['scope']"
-            }[parameter_type])
-
-        return function_def['name'] + "(" + ", ".join(arguments) + ")"
+    if "require_time" in function_def and function_def["require_time"]:
+        user_arguments.insert(0, "__data['time']")
+
+    if "require_scope" in function_def and function_def["require_scope"]:
+        user_arguments.insert(0, "__data['scope']")
 
     return function_def['name'] + "(" + ",".join(user_arguments) + ")"

From 94a2b89a7e87ff0354481944d89575c3aee1b273 Mon Sep 17 00:00:00 2001
From: Alexey Prey Mulyukin <alexprey@yandex.ru>
Date: Sat, 7 Jul 2018 19:45:58 +0300
Subject: [PATCH 13/30] #182: Make builder elements with private style names.

---
 pysd/py_backend/builder.py | 12 ++++++------
 1 file changed, 6 insertions(+), 6 deletions(-)

diff --git a/pysd/py_backend/builder.py b/pysd/py_backend/builder.py
index 570f812e..86151f5d 100644
--- a/pysd/py_backend/builder.py
+++ b/pysd/py_backend/builder.py
@@ -321,7 +321,7 @@ def add_stock(identifier, subs, expression, initial_condition, subscript_dict):
 
     # describe the stateful object
     stateful = {
-        'py_name': 'integ_%s' % identifier,
+        'py_name': '_integ_%s' % identifier,
         'real_name': 'Representation of  %s' % identifier,
         'doc': 'Integrates Expression %s' % expression,
         'py_expr': stateful_py_expr,
@@ -381,7 +381,7 @@ def add_n_delay(delay_input, delay_time, initial_value, order, subs, subscript_d
     # that delay the output by different amounts, they'll overwrite the original function...
 
     stateful = {
-        'py_name': utils.make_python_identifier('delay_%s_%s_%s_%s' % (delay_input,
+        'py_name': utils.make_python_identifier('_delay_%s_%s_%s_%s' % (delay_input,
                                                                        delay_time,
                                                                        initial_value,
                                                                        order))[0],
@@ -441,7 +441,7 @@ def add_n_smooth(smooth_input, smooth_time, initial_value, order, subs, subscrip
         """
 
     stateful = {
-        'py_name': utils.make_python_identifier('smooth_%s_%s_%s_%s' % (smooth_input,
+        'py_name': utils.make_python_identifier('_smooth_%s_%s_%s_%s' % (smooth_input,
                                                                         smooth_time,
                                                                         initial_value,
                                                                         order))[0],
@@ -489,7 +489,7 @@ def add_n_trend(trend_input, average_time, initial_trend, subs, subscript_dict):
         """
 
     stateful = {
-        'py_name': utils.make_python_identifier('trend_%s_%s_%s' % (trend_input,
+        'py_name': utils.make_python_identifier('_trend_%s_%s_%s' % (trend_input,
                                                                     average_time,
                                                                     initial_trend))[0],
         'real_name': 'trend of %s' % trend_input,
@@ -528,7 +528,7 @@ def add_initial(initial_input):
 
     """
     stateful = {
-        'py_name': utils.make_python_identifier('initial_%s' % initial_input)[0],
+        'py_name': utils.make_python_identifier('_initial_%s' % initial_input)[0],
         'real_name': 'Smooth of %s' % initial_input,
         'doc': 'Returns the value taken on during the initialization phase',
         'py_expr': 'functions.Initial(lambda: %s)' % (
@@ -572,7 +572,7 @@ def add_macro(macro_name, filename, arg_names, arg_vals):
                                       zip(arg_names, arg_vals)])
 
     stateful = {
-        'py_name': 'macro_' + macro_name + '_' + '_'.join(
+        'py_name': '_macro_' + macro_name + '_' + '_'.join(
             [utils.make_python_identifier(f)[0] for f in arg_vals]),
         'real_name': 'Macro Instantiation of ' + macro_name,
         'doc': 'Instantiates the Macro',

From 7750ac680449facbe3f60844df0a5f58320e8c93 Mon Sep 17 00:00:00 2001
From: Alexey Prey Mulyukin <alexprey@yandex.ru>
Date: Sat, 14 Jul 2018 23:15:03 +0300
Subject: [PATCH 14/30] Try to solve issue with parsing in python 2.7

---
 pysd/py_backend/vensim/vensim2py.py | 146 ++++++++--------------------
 1 file changed, 38 insertions(+), 108 deletions(-)

diff --git a/pysd/py_backend/vensim/vensim2py.py b/pysd/py_backend/vensim/vensim2py.py
index ff0ef1ea..18663e51 100644
--- a/pysd/py_backend/vensim/vensim2py.py
+++ b/pysd/py_backend/vensim/vensim2py.py
@@ -3,18 +3,15 @@
 model. Everything that requires knowledge of vensim syntax should be in this file.
 """
 from __future__ import absolute_import
-
-import os
 import re
-import textwrap
-import warnings
-from io import open
-
-import numpy as np
 import parsimonious
-
 from ...py_backend import builder
 from ...py_backend import utils
+from io import open
+import textwrap
+import numpy as np
+import os
+import warnings
 
 
 def get_file_sections(file_str):
@@ -189,10 +186,9 @@ def _include_common_grammar(source_grammar):
     name = basic_id / escape_group
     
     # This takes care of models with Unicode variable names
-    basic_id = id_start id_continue*
-    
-    id_start = ~r"[\w]"IU
-    id_continue = id_start / ~r"[0-9\'\$\s\_]"
+    basic_id = id_start (id_continue / ~r"[\'\$\s]")*
+    id_start = ~r"[A-Za-z]" / ~r"[\u00AA\u00B5\u00BA\u00C0-\u00D6\u00D8-\u00F6\u00F8-\u01BA\u01BB\u01BC-\u01BF\u01C0-\u01C3\u01C4-\u0241\u0250-\u02AF\u02B0-\u02C1\u02C6-\u02D1\u02E0-\u02E4\u02EE\u037A\u0386\u0388-\u038A\u038C\u038E-\u03A1\u03A3-\u03CE\u03D0-\u03F5\u03F7-\u0481\u048A-\u04CE\u04D0-\u04F9\u0500-\u050F\u0531-\u0556\u0559\u0561-\u0587\u05D0-\u05EA\u05F0-\u05F2\u0621-\u063A\u0640\u0641-\u064A\u066E-\u066F\u0671-\u06D3\u06D5\u06E5-\u06E6\u06EE-\u06EF\u06FA-\u06FC\u06FF\u0710\u0712-\u072F\u074D-\u076D\u0780-\u07A5\u07B1\u0904-\u0939\u093D\u0950\u0958-\u0961\u097D\u0985-\u098C\u098F-\u0990\u0993-\u09A8\u09AA-\u09B0\u09B2\u09B6-\u09B9\u09BD\u09CE\u09DC-\u09DD\u09DF-\u09E1\u09F0-\u09F1\u0A05-\u0A0A\u0A0F-\u0A10\u0A13-\u0A28\u0A2A-\u0A30\u0A32-\u0A33\u0A35-\u0A36\u0A38-\u0A39\u0A59-\u0A5C\u0A5E\u0A72-\u0A74\u0A85-\u0A8D\u0A8F-\u0A91\u0A93-\u0AA8\u0AAA-\u0AB0\u0AB2-\u0AB3\u0AB5-\u0AB9\u0ABD\u0AD0\u0AE0-\u0AE1\u0B05-\u0B0C\u0B0F-\u0B10\u0B13-\u0B28\u0B2A-\u0B30\u0B32-\u0B33\u0B35-\u0B39\u0B3D\u0B5C-\u0B5D\u0B5F-\u0B61\u0B71\u0B83\u0B85-\u0B8A\u0B8E-\u0B90\u0B92-\u0B95\u0B99-\u0B9A\u0B9C\u0B9E-\u0B9F\u0BA3-\u0BA4\u0BA8-\u0BAA\u0BAE-\u0BB9\u0C05-\u0C0C\u0C0E-\u0C10\u0C12-\u0C28\u0C2A-\u0C33\u0C35-\u0C39\u0C60-\u0C61\u0C85-\u0C8C\u0C8E-\u0C90\u0C92-\u0CA8\u0CAA-\u0CB3\u0CB5-\u0CB9\u0CBD\u0CDE\u0CE0-\u0CE1\u0D05-\u0D0C\u0D0E-\u0D10\u0D12-\u0D28\u0D2A-\u0D39\u0D60-\u0D61\u0D85-\u0D96\u0D9A-\u0DB1\u0DB3-\u0DBB\u0DBD\u0DC0-\u0DC6\u0E01-\u0E30\u0E32-\u0E33\u0E40-\u0E45\u0E46\u0E81-\u0E82\u0E84\u0E87-\u0E88\u0E8A\u0E8D\u0E94-\u0E97\u0E99-\u0E9F\u0EA1-\u0EA3\u0EA5\u0EA7\u0EAA-\u0EAB\u0EAD-\u0EB0\u0EB2-\u0EB3\u0EBD\u0EC0-\u0EC4\u0EC6\u0EDC-\u0EDD\u0F00\u0F40-\u0F47\u0F49-\u0F6A\u0F88-\u0F8B\u1000-\u1021\u1023-\u1027\u1029-\u102A\u1050-\u1055\u10A0-\u10C5\u10D0-\u10FA\u10FC\u1100-\u1159\u115F-\u11A2\u11A8-\u11F9\u1200-\u1248\u124A-\u124D\u1250-\u1256\u1258\u125A-\u125D\u1260-\u1288\u128A-\u128D\u1290-\u12B0\u12B2-\u12B5\u12B8-\u12BE\u12C0\u12C2-\u12C5\u12C8-\u12D6\u12D8-\u1310\u1312-\u1315\u1318-\u135A\u1380-\u138F\u13A0-\u13F4\u1401-\u166C\u166F-\u1676\u1681-\u169A\u16A0-\u16EA\u16EE-\u16F0\u1700-\u170C\u170E-\u1711\u1720-\u1731\u1740-\u1751\u1760-\u176C\u176E-\u1770\u1780-\u17B3\u17D7\u17DC\u1820-\u1842\u1843\u1844-\u1877\u1880-\u18A8\u1900-\u191C\u1950-\u196D\u1970-\u1974\u1980-\u19A9\u19C1-\u19C7\u1A00-\u1A16\u1D00-\u1D2B\u1D2C-\u1D61\u1D62-\u1D77\u1D78\u1D79-\u1D9A\u1D9B-\u1DBF\u1E00-\u1E9B\u1EA0-\u1EF9\u1F00-\u1F15\u1F18-\u1F1D\u1F20-\u1F45\u1F48-\u1F4D\u1F50-\u1F57\u1F59\u1F5B\u1F5D\u1F5F-\u1F7D\u1F80-\u1FB4\u1FB6-\u1FBC\u1FBE\u1FC2-\u1FC4\u1FC6-\u1FCC\u1FD0-\u1FD3\u1FD6-\u1FDB\u1FE0-\u1FEC\u1FF2-\u1FF4\u1FF6-\u1FFC\u2071\u207F\u2090-\u2094\u2102\u2107\u210A-\u2113\u2115\u2118\u2119-\u211D\u2124\u2126\u2128\u212A-\u212D\u212E\u212F-\u2131\u2133-\u2134\u2135-\u2138\u2139\u213C-\u213F\u2145-\u2149\u2160-\u2183\u2C00-\u2C2E\u2C30-\u2C5E\u2C80-\u2CE4\u2D00-\u2D25\u2D30-\u2D65\u2D6F\u2D80-\u2D96\u2DA0-\u2DA6\u2DA8-\u2DAE\u2DB0-\u2DB6\u2DB8-\u2DBE\u2DC0-\u2DC6\u2DC8-\u2DCE\u2DD0-\u2DD6\u2DD8-\u2DDE\u3005\u3006\u3007\u3021-\u3029\u3031-\u3035\u3038-\u303A\u303B\u303C\u3041-\u3096\u309B-\u309C\u309D-\u309E\u309F\u30A1-\u30FA\u30FC-\u30FE\u30FF\u3105-\u312C\u3131-\u318E\u31A0-\u31B7\u31F0-\u31FF\u3400-\u4DB5\u4E00-\u9FBB\uA000-\uA014\uA015\uA016-\uA48C\uA800-\uA801\uA803-\uA805\uA807-\uA80A\uA80C-\uA822\uAC00-\uD7A3\uF900-\uFA2D\uFA30-\uFA6A\uFA70-\uFAD9\uFB00-\uFB06\uFB13-\uFB17\uFB1D\uFB1F-\uFB28\uFB2A-\uFB36\uFB38-\uFB3C\uFB3E\uFB40-\uFB41\uFB43-\uFB44\uFB46-\uFBB1\uFBD3-\uFD3D\uFD50-\uFD8F\uFD92-\uFDC7\uFDF0-\uFDFB\uFE70-\uFE74\uFE76-\uFEFC\uFF21-\uFF3A\uFF41-\uFF5A\uFF66-\uFF6F\uFF70\uFF71-\uFF9D\uFF9E-\uFF9F\uFFA0-\uFFBE\uFFC2-\uFFC7\uFFCA-\uFFCF\uFFD2-\uFFD7\uFFDA-\uFFDC]"iu
+    id_continue = id_start / ~r"[0-9]" / ~r"[\u0300-\u036F\u0483-\u0486\u0591-\u05B9\u05BB-\u05BD\u05BF\u05C1-\u05C2\u05C4-\u05C5\u05C7\u0610-\u0615\u064B-\u065E\u0660-\u0669\u0670\u06D6-\u06DC\u06DF-\u06E4\u06E7-\u06E8\u06EA-\u06ED\u06F0-\u06F9\u0711\u0730-\u074A\u07A6-\u07B0\u0901-\u0902\u0903\u093C\u093E-\u0940\u0941-\u0948\u0949-\u094C\u094D\u0951-\u0954\u0962-\u0963\u0966-\u096F\u0981\u0982-\u0983\u09BC\u09BE-\u09C0\u09C1-\u09C4\u09C7-\u09C8\u09CB-\u09CC\u09CD\u09D7\u09E2-\u09E3\u09E6-\u09EF\u0A01-\u0A02\u0A03\u0A3C\u0A3E-\u0A40\u0A41-\u0A42\u0A47-\u0A48\u0A4B-\u0A4D\u0A66-\u0A6F\u0A70-\u0A71\u0A81-\u0A82\u0A83\u0ABC\u0ABE-\u0AC0\u0AC1-\u0AC5\u0AC7-\u0AC8\u0AC9\u0ACB-\u0ACC\u0ACD\u0AE2-\u0AE3\u0AE6-\u0AEF\u0B01\u0B02-\u0B03\u0B3C\u0B3E\u0B3F\u0B40\u0B41-\u0B43\u0B47-\u0B48\u0B4B-\u0B4C\u0B4D\u0B56\u0B57\u0B66-\u0B6F\u0B82\u0BBE-\u0BBF\u0BC0\u0BC1-\u0BC2\u0BC6-\u0BC8\u0BCA-\u0BCC\u0BCD\u0BD7\u0BE6-\u0BEF\u0C01-\u0C03\u0C3E-\u0C40\u0C41-\u0C44\u0C46-\u0C48\u0C4A-\u0C4D\u0C55-\u0C56\u0C66-\u0C6F\u0C82-\u0C83\u0CBC\u0CBE\u0CBF\u0CC0-\u0CC4\u0CC6\u0CC7-\u0CC8\u0CCA-\u0CCB\u0CCC-\u0CCD\u0CD5-\u0CD6\u0CE6-\u0CEF\u0D02-\u0D03\u0D3E-\u0D40\u0D41-\u0D43\u0D46-\u0D48\u0D4A-\u0D4C\u0D4D\u0D57\u0D66-\u0D6F\u0D82-\u0D83\u0DCA\u0DCF-\u0DD1\u0DD2-\u0DD4\u0DD6\u0DD8-\u0DDF\u0DF2-\u0DF3\u0E31\u0E34-\u0E3A\u0E47-\u0E4E\u0E50-\u0E59\u0EB1\u0EB4-\u0EB9\u0EBB-\u0EBC\u0EC8-\u0ECD\u0ED0-\u0ED9\u0F18-\u0F19\u0F20-\u0F29\u0F35\u0F37\u0F39\u0F3E-\u0F3F\u0F71-\u0F7E\u0F7F\u0F80-\u0F84\u0F86-\u0F87\u0F90-\u0F97\u0F99-\u0FBC\u0FC6\u102C\u102D-\u1030\u1031\u1032\u1036-\u1037\u1038\u1039\u1040-\u1049\u1056-\u1057\u1058-\u1059\u135F\u1369-\u1371\u1712-\u1714\u1732-\u1734\u1752-\u1753\u1772-\u1773\u17B6\u17B7-\u17BD\u17BE-\u17C5\u17C6\u17C7-\u17C8\u17C9-\u17D3\u17DD\u17E0-\u17E9\u180B-\u180D\u1810-\u1819\u18A9\u1920-\u1922\u1923-\u1926\u1927-\u1928\u1929-\u192B\u1930-\u1931\u1932\u1933-\u1938\u1939-\u193B\u1946-\u194F\u19B0-\u19C0\u19C8-\u19C9\u19D0-\u19D9\u1A17-\u1A18\u1A19-\u1A1B\u1DC0-\u1DC3\u203F-\u2040\u2054\u20D0-\u20DC\u20E1\u20E5-\u20EB\u302A-\u302F\u3099-\u309A\uA802\uA806\uA80B\uA823-\uA824\uA825-\uA826\uA827\uFB1E\uFE00-\uFE0F\uFE20-\uFE23\uFE33-\uFE34\uFE4D-\uFE4F\uFF10-\uFF19\uFF3F]"iu
 
     # between quotes, either escaped quote or character that is not a quote
     escape_group = "\"" ( "\\\"" / ~r"[^\"]" )* "\""
@@ -206,7 +202,6 @@ def _include_common_grammar(source_grammar):
     {common_grammar}
     """.format(source_grammar=source_grammar, common_grammar=common_grammar)
 
-
 def get_equation_components(equation_str):
     """
     Breaks down a string representing only the equation part of a model element.
@@ -234,7 +229,6 @@ def get_equation_components(equation_str):
         - *component* - normal model expression or constant
         - *lookup* - a lookup table
         - *subdef* - a subscript definition
-        - *data* -  a data variable
 
     Examples
     --------
@@ -243,23 +237,20 @@ def get_equation_components(equation_str):
 
     Notes
     -----
-    in this function we don't create python identifiers, we use real names.
+    in this function we dont create python identifiers, we use real names.
     This is so that when everything comes back together, we can manage
     any potential namespace conflicts properly
     """
 
     component_structure_grammar = _include_common_grammar(r"""
-    entry = component / test_definition / subscript_definition / lookup_definition / data_definition
+    entry = component / subscript_definition / lookup_definition
     component = name _ subscriptlist? _ "=" _ expression
-    subscript_definition = name _ ":" expression
-    data_definition = name _ subscriptlist? _ &keyword _ ":=" _ expression
+    subscript_definition = name _ ":" _ subscript _ ("," _ subscript)*
     lookup_definition = name _ &"(" _ expression  # uses lookahead assertion to capture whole group
-    test_definition = name _ subscriptlist? _ &keyword _ expression
 
     name = basic_id / escape_group
     subscriptlist = '[' _ subscript _ ("," _ subscript)* _ ']'
     expression = ~r".*"  # expression could be anything, at this point.
-    keyword = ":" _ basic_id _ ":"
 
     subscript = basic_id / escape_group
     """)
@@ -277,7 +268,6 @@ def __init__(self, ast):
             self.real_name = None
             self.expression = None
             self.kind = None
-            self.keyword = None
             self.visit(ast)
 
         def visit_subscript_definition(self, n, vc):
@@ -289,12 +279,6 @@ def visit_lookup_definition(self, n, vc):
         def visit_component(self, n, vc):
             self.kind = 'component'
 
-        def visit_data_definition(self, n, vc):
-            self.kind = 'data'
-
-        def visit_keyword(self, n, vc):
-            self.keyword = n.text.strip()
-
         def visit_name(self, n, vc):
             (name,) = vc
             self.real_name = name.strip()
@@ -317,8 +301,7 @@ def visit__(self, n, vc):
     return {'real_name': parse_object.real_name,
             'subs': parse_object.subscripts,
             'expr': parse_object.expression,
-            'kind': parse_object.kind,
-            'keyword': parse_object.keyword}
+            'kind': parse_object.kind}
 
 
 def parse_units(units_str):
@@ -375,7 +358,8 @@ def parse_units(units_str):
     "sqrt": "np.sqrt",
     "tan": "np.tan",
     "lognormal": "np.random.lognormal",
-    "random normal": "functions.bounded_normal",
+    "random normal":
+        "functions.bounded_normal",
     "poisson": "np.random.poisson",
     "ln": "np.log",
     "log": "functions.log",
@@ -385,58 +369,15 @@ def parse_units(units_str):
     "arccos": "np.arccos",
     "arcsin": "np.arcsin",
     "arctan": "np.arctan",
-    "tanh": "np.tanh",
-    "sinh": "np.sinh",
-    "cosh": "np.cosh",
     "if then else": "functions.if_then_else",
-    "step": {
-        "name": "functions.step",
-        "parameters": [
-            {"name": 'time', "type": 'time'},
-            {"name": 'value'},
-            {"name": 'tstep'}
-        ]
-    },
+    "step": "functions.step",
     "modulo": "np.mod",
-    "pulse": {
-        "name": "functions.pulse",
-        "parameters": [
-            {"name": 'time', "type": 'time'},
-            {"name": 'start'},
-            {"name": "duration"}
-        ]
-    },
-    # time, start, duration, repeat_time, end
-    "pulse train": {
-        "name": "functions.pulse_train",
-        "parameters": [
-            {"name": 'time', "type": 'time'},
-            {"name": 'start'},
-            {"name": 'duration'},
-            {"name": 'repeat_time'},
-            {"name": 'end'}
-        ]
-    },
-    "ramp": {
-        "name": "functions.ramp",
-        "parameters": [
-            {"name": 'time', "type": 'time'},
-            {"name": 'slope'},
-            {"name": 'start'},
-            {"name": 'finish', "optional": True}
-        ]
-    },
+    "pulse": "functions.pulse",
+    "pulse train": "functions.pulse_train",
+    "ramp": "functions.ramp",
     "min": "np.minimum",
     "max": "np.maximum",
-    # time, expr, init_val
-    "active initial": {
-        "name": "functions.active_initial",
-        "parameters": [
-            {"name": 'time', "type": 'time'},
-            {"name": 'expr', "type": 'lambda'},
-            {"name": 'init_val'}
-        ]
-    },
+    "active initial": "functions.active_initial",
     "xidz": "functions.xidz",
     "zidz": "functions.zidz",
     "game": "",  # In the future, may have an actual `functions.game` pass through
@@ -444,13 +385,7 @@ def parse_units(units_str):
     # vector functions
     "vmin": "np.min",
     "vmax": "np.max",
-    "prod": "np.prod",
-
-    # data functions
-    "get xls data": "functions.get_xls_data",
-    "get direct data": "functions.get_direct_data",
-    "get xls constants": "functions.get_xls_constants",
-    "get xls lookups":  "functions.get_xls_lookups"
+    "prod": "np.prod"
 }
 
 builders = {
@@ -500,9 +435,9 @@ def parse_units(units_str):
 
     "delay fixed": lambda element, subscript_dict, args: builder.add_n_delay(
         delay_input=args[0],
-        delay_time='round(' + args[1] + ' / time_step() ) * time_step()',
+        delay_time='round('+args[1]+' / time_step() ) * time_step()',
         initial_value=args[2],
-        order=args[1] + ' / time_step()',
+        order=args[1]+' / time_step()',
         subs=element['subs'],
         subscript_dict=subscript_dict
     ),
@@ -644,16 +579,16 @@ def parse_general_expression(element, namespace=None, subscript_dict=None, macro
     in_ops_list = [re.escape(x) for x in in_ops.keys()]
     pre_ops_list = [re.escape(x) for x in pre_ops.keys()]
     if macro_list is not None and len(macro_list) > 0:
-        macro_names_list = [re.escape(x['name']) for x in macro_list]
+        macro_names_list = [x['name'] for x in macro_list]
     else:
         macro_names_list = ['\\a']
 
     expression_grammar = r"""
     expr_type = array / expr / empty
-    expr = _ pre_oper? _ (lookup_def / build_call / macro_call / call / lookup_call / parens / number / string / reference) _ (in_oper _ expr)?
+    expr = _ pre_oper? _ (lookup_def / build_call / macro_call / lookup_call / call / parens / number / reference) _ (in_oper _ expr)?
 
     lookup_def = ~r"(WITH\ LOOKUP)"I _ "(" _ expr _ "," _ "(" _  ("[" ~r"[^\]]*" "]" _ ",")?  ( "(" _ expr _ "," _ expr _ ")" _ ","? _ )+ _ ")" _ ")"
-    lookup_call = reference _ "(" _ (expr _ ","? _)* ")"  # these don't need their args parsed...
+    lookup_call = id _ "(" _ (expr _ ","? _)* ")"  # these don't need their args parsed...
     call = func _ "(" _ (expr _ ","? _)* ")"  # these don't need their args parsed...
     build_call = builder _ "(" _ arguments _ ")"
     macro_call = macro _ "(" _ arguments _ ")"
@@ -662,24 +597,20 @@ def parse_general_expression(element, namespace=None, subscript_dict=None, macro
     arguments = (expr _ ","? _)*
 
     reference = id _ subscript_list?
-    subscript_list = "[" _ ((sub_name / sub_element) "!"? _ ","? _)+ "]"
+    subscript_list = "[" _ ((sub_name / sub_element) _ ","? _)+ "]"
 
     array = (number _ ("," / ";")? _)+ !~r"."  # negative lookahead for anything other than an array
     number = ~r"\d+\.?\d*(e[+-]\d+)?"
-    string = "\'" ( "\\\'" / ~r"[^\']"IU )* "\'"
 
-    id = ( basic_id / escape_group )
-    basic_id = ~r"\w[\w\d_\s\']*"IU
-    escape_group = "\"" ( "\\\"" / ~r"[^\"]"IU )* "\""
-    
-    sub_name = ~r"(%(sub_names)s)"IU  # subscript names (if none, use non-printable character)
-    sub_element = ~r"(%(sub_elems)s)"IU  # subscript elements (if none, use non-printable character)
+    id = ~r"(%(ids)s)"I
+    sub_name = ~r"(%(sub_names)s)"I  # subscript names (if none, use non-printable character)
+    sub_element = ~r"(%(sub_elems)s)"I  # subscript elements (if none, use non-printable character)
 
-    func = ~r"(%(funcs)s)"IU  # functions (case insensitive)
-    in_oper = ~r"(%(in_ops)s)"IU  # infix operators (case insensitive)
-    pre_oper = ~r"(%(pre_ops)s)"IU  # prefix operators (case insensitive)
-    builder = ~r"(%(builders)s)"IU  # builder functions (case insensitive)
-    macro = ~r"(%(macros)s)"IU  # macros from model file (if none, use non-printable character)
+    func = ~r"(%(funcs)s)"I  # functions (case insensitive)
+    in_oper = ~r"(%(in_ops)s)"I  # infix operators (case insensitive)
+    pre_oper = ~r"(%(pre_ops)s)"I  # prefix operators (case insensitive)
+    builder = ~r"(%(builders)s)"I  # builder functions (case insensitive)
+    macro = ~r"(%(macros)s)"I  # macros from model file (if none, use non-printable character)
 
     _ = ~r"[\s\\]*"  # whitespace character
     empty = "" # empty string
@@ -688,6 +619,7 @@ def parse_general_expression(element, namespace=None, subscript_dict=None, macro
         # peg parser doesn't quit early when finding a partial keyword
         'sub_names': '|'.join(reversed(sorted(sub_names_list, key=len))),
         'sub_elems': '|'.join(reversed(sorted(sub_elems_list, key=len))),
+        'ids': '|'.join(reversed(sorted(ids_list, key=len))),
         'funcs': '|'.join(reversed(sorted(functions.keys(), key=len))),
         'in_ops': '|'.join(reversed(sorted(in_ops_list, key=len))),
         'pre_ops': '|'.join(reversed(sorted(pre_ops_list, key=len))),
@@ -714,11 +646,9 @@ def visit_expr(self, n, vc):
             self.translation = s
             return s
 
-        def visit_call(self, n, vc):
+        def visit_func(self, n, vc):
             self.kind = 'component'
-            function_name = vc[0].lower()
-            arguments = [e.strip() for e in vc[4].split(",")]
-            return builder.build_function_call(functions[function_name], arguments)
+            return functions[n.text.lower()]
 
         def visit_in_oper(self, n, vc):
             return in_ops[n.text.lower()]
@@ -732,7 +662,7 @@ def visit_reference(self, n, vc):
             return id_str + '()'
 
         def visit_id(self, n, vc):
-            return namespace[n.text.strip()]
+            return namespace[n.text]
 
         def visit_lookup_def(self, n, vc):
             """ This exists because vensim has multiple ways of doing lookups.

From 1218bdd39d93adb252b523d2575b1c4744e31707 Mon Sep 17 00:00:00 2001
From: Alexey Prey Mulyukin <alexprey@yandex.ru>
Date: Sat, 16 Mar 2019 00:01:43 +0300
Subject: [PATCH 15/30] Fix issue with setting time object into nested models
 or macros

---
 pysd/py_backend/builder.py | 2 +-
 1 file changed, 1 insertion(+), 1 deletion(-)

diff --git a/pysd/py_backend/builder.py b/pysd/py_backend/builder.py
index 86151f5d..029cd64b 100644
--- a/pysd/py_backend/builder.py
+++ b/pysd/py_backend/builder.py
@@ -576,7 +576,7 @@ def add_macro(macro_name, filename, arg_names, arg_vals):
             [utils.make_python_identifier(f)[0] for f in arg_vals]),
         'real_name': 'Macro Instantiation of ' + macro_name,
         'doc': 'Instantiates the Macro',
-        'py_expr': "functions.Macro('%s', %s, '%s', __data['time'])" % (filename, func_args, macro_name),
+        'py_expr': "functions.Macro('%s', %s, '%s', time_initialization=lambda: __data['time'])" % (filename, func_args, macro_name),
         'unit': 'None',
         'lims': 'None',
         'eqn': 'None',

From fa79e1fd86392fbb7f1de11e13ed17de4dcbc496 Mon Sep 17 00:00:00 2001
From: julienmalard <julien.malard@mail.mcgill.ca>
Date: Wed, 21 Nov 2018 16:56:44 -0500
Subject: [PATCH 16/30] Added hyperbolic trigonometric functions and ugly hack
 for parsing ! subscripts for now.

---
 pysd/py_backend/vensim/vensim2py.py | 5 ++++-
 1 file changed, 4 insertions(+), 1 deletion(-)

diff --git a/pysd/py_backend/vensim/vensim2py.py b/pysd/py_backend/vensim/vensim2py.py
index 18663e51..d064a24a 100644
--- a/pysd/py_backend/vensim/vensim2py.py
+++ b/pysd/py_backend/vensim/vensim2py.py
@@ -369,6 +369,9 @@ def parse_units(units_str):
     "arccos": "np.arccos",
     "arcsin": "np.arcsin",
     "arctan": "np.arctan",
+    "tanh": "np.tanh",
+    "sinh": "np.sinh",
+    "cosh": "np.cosh",
     "if then else": "functions.if_then_else",
     "step": "functions.step",
     "modulo": "np.mod",
@@ -597,7 +600,7 @@ def parse_general_expression(element, namespace=None, subscript_dict=None, macro
     arguments = (expr _ ","? _)*
 
     reference = id _ subscript_list?
-    subscript_list = "[" _ ((sub_name / sub_element) _ ","? _)+ "]"
+    subscript_list = "[" _ ((sub_name / sub_element) "!"? _ ","? _)+ "]"
 
     array = (number _ ("," / ";")? _)+ !~r"."  # negative lookahead for anything other than an array
     number = ~r"\d+\.?\d*(e[+-]\d+)?"

From ee8e3e0394fa836fc553d692f77e162bd7a28fae Mon Sep 17 00:00:00 2001
From: julienmalard <julien.malard@mail.mcgill.ca>
Date: Fri, 23 Nov 2018 12:09:22 -0500
Subject: [PATCH 17/30] Fixed unicode error

---
 pysd/py_backend/builder.py | 6 +++---
 1 file changed, 3 insertions(+), 3 deletions(-)

diff --git a/pysd/py_backend/builder.py b/pysd/py_backend/builder.py
index 029cd64b..c45012cf 100644
--- a/pysd/py_backend/builder.py
+++ b/pysd/py_backend/builder.py
@@ -154,11 +154,11 @@ def build_element(element, subscript_dict):
     element['doc'] = element['doc'].replace('\\', '\n    ').encode('unicode-escape')
 
     if 'unit' in element:
-        element['unit'] = element['unit']
+        element['unit'] = element['unit'].encode('utf8')
     if 'real_name' in element:
-        element['real_name'] = element['real_name']
+        element['real_name'] = element['real_name'].encode('utf8')
     if 'eqn' in element:
-        element['eqn'] = element['eqn']
+        element['eqn'] = element['eqn'].encode('utf8')
     
     if element['kind'] == 'stateful':
         func = '''

From 65559e81062963a561cf4dd912ce5b0b55c350e1 Mon Sep 17 00:00:00 2001
From: julienmalard <julien.malard@mail.mcgill.ca>
Date: Wed, 11 Sep 2019 16:08:27 -0400
Subject: [PATCH 18/30] Work on new functions

---
 pysd/py_backend/vensim/vensim2py.py | 99 ++++++++++++++++++++---------
 1 file changed, 70 insertions(+), 29 deletions(-)

diff --git a/pysd/py_backend/vensim/vensim2py.py b/pysd/py_backend/vensim/vensim2py.py
index d064a24a..f3d4f608 100644
--- a/pysd/py_backend/vensim/vensim2py.py
+++ b/pysd/py_backend/vensim/vensim2py.py
@@ -186,9 +186,10 @@ def _include_common_grammar(source_grammar):
     name = basic_id / escape_group
     
     # This takes care of models with Unicode variable names
-    basic_id = id_start (id_continue / ~r"[\'\$\s]")*
-    id_start = ~r"[A-Za-z]" / ~r"[\u00AA\u00B5\u00BA\u00C0-\u00D6\u00D8-\u00F6\u00F8-\u01BA\u01BB\u01BC-\u01BF\u01C0-\u01C3\u01C4-\u0241\u0250-\u02AF\u02B0-\u02C1\u02C6-\u02D1\u02E0-\u02E4\u02EE\u037A\u0386\u0388-\u038A\u038C\u038E-\u03A1\u03A3-\u03CE\u03D0-\u03F5\u03F7-\u0481\u048A-\u04CE\u04D0-\u04F9\u0500-\u050F\u0531-\u0556\u0559\u0561-\u0587\u05D0-\u05EA\u05F0-\u05F2\u0621-\u063A\u0640\u0641-\u064A\u066E-\u066F\u0671-\u06D3\u06D5\u06E5-\u06E6\u06EE-\u06EF\u06FA-\u06FC\u06FF\u0710\u0712-\u072F\u074D-\u076D\u0780-\u07A5\u07B1\u0904-\u0939\u093D\u0950\u0958-\u0961\u097D\u0985-\u098C\u098F-\u0990\u0993-\u09A8\u09AA-\u09B0\u09B2\u09B6-\u09B9\u09BD\u09CE\u09DC-\u09DD\u09DF-\u09E1\u09F0-\u09F1\u0A05-\u0A0A\u0A0F-\u0A10\u0A13-\u0A28\u0A2A-\u0A30\u0A32-\u0A33\u0A35-\u0A36\u0A38-\u0A39\u0A59-\u0A5C\u0A5E\u0A72-\u0A74\u0A85-\u0A8D\u0A8F-\u0A91\u0A93-\u0AA8\u0AAA-\u0AB0\u0AB2-\u0AB3\u0AB5-\u0AB9\u0ABD\u0AD0\u0AE0-\u0AE1\u0B05-\u0B0C\u0B0F-\u0B10\u0B13-\u0B28\u0B2A-\u0B30\u0B32-\u0B33\u0B35-\u0B39\u0B3D\u0B5C-\u0B5D\u0B5F-\u0B61\u0B71\u0B83\u0B85-\u0B8A\u0B8E-\u0B90\u0B92-\u0B95\u0B99-\u0B9A\u0B9C\u0B9E-\u0B9F\u0BA3-\u0BA4\u0BA8-\u0BAA\u0BAE-\u0BB9\u0C05-\u0C0C\u0C0E-\u0C10\u0C12-\u0C28\u0C2A-\u0C33\u0C35-\u0C39\u0C60-\u0C61\u0C85-\u0C8C\u0C8E-\u0C90\u0C92-\u0CA8\u0CAA-\u0CB3\u0CB5-\u0CB9\u0CBD\u0CDE\u0CE0-\u0CE1\u0D05-\u0D0C\u0D0E-\u0D10\u0D12-\u0D28\u0D2A-\u0D39\u0D60-\u0D61\u0D85-\u0D96\u0D9A-\u0DB1\u0DB3-\u0DBB\u0DBD\u0DC0-\u0DC6\u0E01-\u0E30\u0E32-\u0E33\u0E40-\u0E45\u0E46\u0E81-\u0E82\u0E84\u0E87-\u0E88\u0E8A\u0E8D\u0E94-\u0E97\u0E99-\u0E9F\u0EA1-\u0EA3\u0EA5\u0EA7\u0EAA-\u0EAB\u0EAD-\u0EB0\u0EB2-\u0EB3\u0EBD\u0EC0-\u0EC4\u0EC6\u0EDC-\u0EDD\u0F00\u0F40-\u0F47\u0F49-\u0F6A\u0F88-\u0F8B\u1000-\u1021\u1023-\u1027\u1029-\u102A\u1050-\u1055\u10A0-\u10C5\u10D0-\u10FA\u10FC\u1100-\u1159\u115F-\u11A2\u11A8-\u11F9\u1200-\u1248\u124A-\u124D\u1250-\u1256\u1258\u125A-\u125D\u1260-\u1288\u128A-\u128D\u1290-\u12B0\u12B2-\u12B5\u12B8-\u12BE\u12C0\u12C2-\u12C5\u12C8-\u12D6\u12D8-\u1310\u1312-\u1315\u1318-\u135A\u1380-\u138F\u13A0-\u13F4\u1401-\u166C\u166F-\u1676\u1681-\u169A\u16A0-\u16EA\u16EE-\u16F0\u1700-\u170C\u170E-\u1711\u1720-\u1731\u1740-\u1751\u1760-\u176C\u176E-\u1770\u1780-\u17B3\u17D7\u17DC\u1820-\u1842\u1843\u1844-\u1877\u1880-\u18A8\u1900-\u191C\u1950-\u196D\u1970-\u1974\u1980-\u19A9\u19C1-\u19C7\u1A00-\u1A16\u1D00-\u1D2B\u1D2C-\u1D61\u1D62-\u1D77\u1D78\u1D79-\u1D9A\u1D9B-\u1DBF\u1E00-\u1E9B\u1EA0-\u1EF9\u1F00-\u1F15\u1F18-\u1F1D\u1F20-\u1F45\u1F48-\u1F4D\u1F50-\u1F57\u1F59\u1F5B\u1F5D\u1F5F-\u1F7D\u1F80-\u1FB4\u1FB6-\u1FBC\u1FBE\u1FC2-\u1FC4\u1FC6-\u1FCC\u1FD0-\u1FD3\u1FD6-\u1FDB\u1FE0-\u1FEC\u1FF2-\u1FF4\u1FF6-\u1FFC\u2071\u207F\u2090-\u2094\u2102\u2107\u210A-\u2113\u2115\u2118\u2119-\u211D\u2124\u2126\u2128\u212A-\u212D\u212E\u212F-\u2131\u2133-\u2134\u2135-\u2138\u2139\u213C-\u213F\u2145-\u2149\u2160-\u2183\u2C00-\u2C2E\u2C30-\u2C5E\u2C80-\u2CE4\u2D00-\u2D25\u2D30-\u2D65\u2D6F\u2D80-\u2D96\u2DA0-\u2DA6\u2DA8-\u2DAE\u2DB0-\u2DB6\u2DB8-\u2DBE\u2DC0-\u2DC6\u2DC8-\u2DCE\u2DD0-\u2DD6\u2DD8-\u2DDE\u3005\u3006\u3007\u3021-\u3029\u3031-\u3035\u3038-\u303A\u303B\u303C\u3041-\u3096\u309B-\u309C\u309D-\u309E\u309F\u30A1-\u30FA\u30FC-\u30FE\u30FF\u3105-\u312C\u3131-\u318E\u31A0-\u31B7\u31F0-\u31FF\u3400-\u4DB5\u4E00-\u9FBB\uA000-\uA014\uA015\uA016-\uA48C\uA800-\uA801\uA803-\uA805\uA807-\uA80A\uA80C-\uA822\uAC00-\uD7A3\uF900-\uFA2D\uFA30-\uFA6A\uFA70-\uFAD9\uFB00-\uFB06\uFB13-\uFB17\uFB1D\uFB1F-\uFB28\uFB2A-\uFB36\uFB38-\uFB3C\uFB3E\uFB40-\uFB41\uFB43-\uFB44\uFB46-\uFBB1\uFBD3-\uFD3D\uFD50-\uFD8F\uFD92-\uFDC7\uFDF0-\uFDFB\uFE70-\uFE74\uFE76-\uFEFC\uFF21-\uFF3A\uFF41-\uFF5A\uFF66-\uFF6F\uFF70\uFF71-\uFF9D\uFF9E-\uFF9F\uFFA0-\uFFBE\uFFC2-\uFFC7\uFFCA-\uFFCF\uFFD2-\uFFD7\uFFDA-\uFFDC]"iu
-    id_continue = id_start / ~r"[0-9]" / ~r"[\u0300-\u036F\u0483-\u0486\u0591-\u05B9\u05BB-\u05BD\u05BF\u05C1-\u05C2\u05C4-\u05C5\u05C7\u0610-\u0615\u064B-\u065E\u0660-\u0669\u0670\u06D6-\u06DC\u06DF-\u06E4\u06E7-\u06E8\u06EA-\u06ED\u06F0-\u06F9\u0711\u0730-\u074A\u07A6-\u07B0\u0901-\u0902\u0903\u093C\u093E-\u0940\u0941-\u0948\u0949-\u094C\u094D\u0951-\u0954\u0962-\u0963\u0966-\u096F\u0981\u0982-\u0983\u09BC\u09BE-\u09C0\u09C1-\u09C4\u09C7-\u09C8\u09CB-\u09CC\u09CD\u09D7\u09E2-\u09E3\u09E6-\u09EF\u0A01-\u0A02\u0A03\u0A3C\u0A3E-\u0A40\u0A41-\u0A42\u0A47-\u0A48\u0A4B-\u0A4D\u0A66-\u0A6F\u0A70-\u0A71\u0A81-\u0A82\u0A83\u0ABC\u0ABE-\u0AC0\u0AC1-\u0AC5\u0AC7-\u0AC8\u0AC9\u0ACB-\u0ACC\u0ACD\u0AE2-\u0AE3\u0AE6-\u0AEF\u0B01\u0B02-\u0B03\u0B3C\u0B3E\u0B3F\u0B40\u0B41-\u0B43\u0B47-\u0B48\u0B4B-\u0B4C\u0B4D\u0B56\u0B57\u0B66-\u0B6F\u0B82\u0BBE-\u0BBF\u0BC0\u0BC1-\u0BC2\u0BC6-\u0BC8\u0BCA-\u0BCC\u0BCD\u0BD7\u0BE6-\u0BEF\u0C01-\u0C03\u0C3E-\u0C40\u0C41-\u0C44\u0C46-\u0C48\u0C4A-\u0C4D\u0C55-\u0C56\u0C66-\u0C6F\u0C82-\u0C83\u0CBC\u0CBE\u0CBF\u0CC0-\u0CC4\u0CC6\u0CC7-\u0CC8\u0CCA-\u0CCB\u0CCC-\u0CCD\u0CD5-\u0CD6\u0CE6-\u0CEF\u0D02-\u0D03\u0D3E-\u0D40\u0D41-\u0D43\u0D46-\u0D48\u0D4A-\u0D4C\u0D4D\u0D57\u0D66-\u0D6F\u0D82-\u0D83\u0DCA\u0DCF-\u0DD1\u0DD2-\u0DD4\u0DD6\u0DD8-\u0DDF\u0DF2-\u0DF3\u0E31\u0E34-\u0E3A\u0E47-\u0E4E\u0E50-\u0E59\u0EB1\u0EB4-\u0EB9\u0EBB-\u0EBC\u0EC8-\u0ECD\u0ED0-\u0ED9\u0F18-\u0F19\u0F20-\u0F29\u0F35\u0F37\u0F39\u0F3E-\u0F3F\u0F71-\u0F7E\u0F7F\u0F80-\u0F84\u0F86-\u0F87\u0F90-\u0F97\u0F99-\u0FBC\u0FC6\u102C\u102D-\u1030\u1031\u1032\u1036-\u1037\u1038\u1039\u1040-\u1049\u1056-\u1057\u1058-\u1059\u135F\u1369-\u1371\u1712-\u1714\u1732-\u1734\u1752-\u1753\u1772-\u1773\u17B6\u17B7-\u17BD\u17BE-\u17C5\u17C6\u17C7-\u17C8\u17C9-\u17D3\u17DD\u17E0-\u17E9\u180B-\u180D\u1810-\u1819\u18A9\u1920-\u1922\u1923-\u1926\u1927-\u1928\u1929-\u192B\u1930-\u1931\u1932\u1933-\u1938\u1939-\u193B\u1946-\u194F\u19B0-\u19C0\u19C8-\u19C9\u19D0-\u19D9\u1A17-\u1A18\u1A19-\u1A1B\u1DC0-\u1DC3\u203F-\u2040\u2054\u20D0-\u20DC\u20E1\u20E5-\u20EB\u302A-\u302F\u3099-\u309A\uA802\uA806\uA80B\uA823-\uA824\uA825-\uA826\uA827\uFB1E\uFE00-\uFE0F\uFE20-\uFE23\uFE33-\uFE34\uFE4D-\uFE4F\uFF10-\uFF19\uFF3F]"iu
+    basic_id = id_start id_continue*
+    
+    id_start = ~r"[\w]"IU
+    id_continue = id_start / ~r"[0-9\'\$\s\_]"
 
     # between quotes, either escaped quote or character that is not a quote
     escape_group = "\"" ( "\\\"" / ~r"[^\"]" )* "\""
@@ -358,8 +359,7 @@ def parse_units(units_str):
     "sqrt": "np.sqrt",
     "tan": "np.tan",
     "lognormal": "np.random.lognormal",
-    "random normal":
-        "functions.bounded_normal",
+    "random normal": "functions.bounded_normal",
     "poisson": "np.random.poisson",
     "ln": "np.log",
     "log": "functions.log",
@@ -369,18 +369,55 @@ def parse_units(units_str):
     "arccos": "np.arccos",
     "arcsin": "np.arcsin",
     "arctan": "np.arctan",
-    "tanh": "np.tanh",
-    "sinh": "np.sinh",
-    "cosh": "np.cosh",
     "if then else": "functions.if_then_else",
-    "step": "functions.step",
+    "step": {
+        "name": "functions.step",
+        "parameters": [
+            {"name": 'time', "type": 'time'},
+            {"name": 'value'},
+            {"name": 'tstep'}
+        ]
+    },
     "modulo": "np.mod",
-    "pulse": "functions.pulse",
-    "pulse train": "functions.pulse_train",
-    "ramp": "functions.ramp",
+    "pulse": {
+        "name": "functions.pulse",
+        "parameters": [
+            {"name": 'time', "type": 'time'},
+            {"name": 'start'},
+            {"name": "duration"}
+        ]
+    },
+    # time, start, duration, repeat_time, end
+    "pulse train": {
+        "name": "functions.pulse_train",
+        "parameters": [
+            {"name": 'time', "type": 'time'},
+            {"name": 'start'},
+            {"name": 'duration'},
+            {"name": 'repeat_time'},
+            {"name": 'end'}
+        ]
+    },
+    "ramp": {
+        "name": "functions.ramp",
+        "parameters": [
+            {"name": 'time', "type": 'time'},
+            {"name": 'slope'},
+            {"name": 'start'},
+            {"name": 'finish', "optional": True}
+        ]
+    },
     "min": "np.minimum",
     "max": "np.maximum",
-    "active initial": "functions.active_initial",
+    # time, expr, init_val
+    "active initial": {
+        "name": "functions.active_initial",
+        "parameters": [
+            {"name": 'time', "type": 'time'},
+            {"name": 'expr', "type": 'lambda'},
+            {"name": 'init_val'}
+        ]
+    },
     "xidz": "functions.xidz",
     "zidz": "functions.zidz",
     "game": "",  # In the future, may have an actual `functions.game` pass through
@@ -582,13 +619,13 @@ def parse_general_expression(element, namespace=None, subscript_dict=None, macro
     in_ops_list = [re.escape(x) for x in in_ops.keys()]
     pre_ops_list = [re.escape(x) for x in pre_ops.keys()]
     if macro_list is not None and len(macro_list) > 0:
-        macro_names_list = [x['name'] for x in macro_list]
+        macro_names_list = [re.escape(x['name']) for x in macro_list]
     else:
         macro_names_list = ['\\a']
 
     expression_grammar = r"""
     expr_type = array / expr / empty
-    expr = _ pre_oper? _ (lookup_def / build_call / macro_call / lookup_call / call / parens / number / reference) _ (in_oper _ expr)?
+    expr = _ pre_oper? _ (lookup_def / build_call / macro_call / call / lookup_call / parens / number / reference) _ (in_oper _ expr)?
 
     lookup_def = ~r"(WITH\ LOOKUP)"I _ "(" _ expr _ "," _ "(" _  ("[" ~r"[^\]]*" "]" _ ",")?  ( "(" _ expr _ "," _ expr _ ")" _ ","? _ )+ _ ")" _ ")"
     lookup_call = id _ "(" _ (expr _ ","? _)* ")"  # these don't need their args parsed...
@@ -600,20 +637,23 @@ def parse_general_expression(element, namespace=None, subscript_dict=None, macro
     arguments = (expr _ ","? _)*
 
     reference = id _ subscript_list?
-    subscript_list = "[" _ ((sub_name / sub_element) "!"? _ ","? _)+ "]"
+    subscript_list = "[" _ ((sub_name / sub_element) _ ","? _)+ "]"
 
     array = (number _ ("," / ";")? _)+ !~r"."  # negative lookahead for anything other than an array
     number = ~r"\d+\.?\d*(e[+-]\d+)?"
 
-    id = ~r"(%(ids)s)"I
-    sub_name = ~r"(%(sub_names)s)"I  # subscript names (if none, use non-printable character)
-    sub_element = ~r"(%(sub_elems)s)"I  # subscript elements (if none, use non-printable character)
+    id = ( basic_id / escape_group )
+    basic_id = ~r"\w[\w\d_\s\']*"IU
+    escape_group = "\"" ( "\\\"" / ~r"[^\"]"IU )* "\""
+    
+    sub_name = ~r"(%(sub_names)s)"IU  # subscript names (if none, use non-printable character)
+    sub_element = ~r"(%(sub_elems)s)"IU  # subscript elements (if none, use non-printable character)
 
-    func = ~r"(%(funcs)s)"I  # functions (case insensitive)
-    in_oper = ~r"(%(in_ops)s)"I  # infix operators (case insensitive)
-    pre_oper = ~r"(%(pre_ops)s)"I  # prefix operators (case insensitive)
-    builder = ~r"(%(builders)s)"I  # builder functions (case insensitive)
-    macro = ~r"(%(macros)s)"I  # macros from model file (if none, use non-printable character)
+    func = ~r"(%(funcs)s)"IU  # functions (case insensitive)
+    in_oper = ~r"(%(in_ops)s)"IU  # infix operators (case insensitive)
+    pre_oper = ~r"(%(pre_ops)s)"IU  # prefix operators (case insensitive)
+    builder = ~r"(%(builders)s)"IU  # builder functions (case insensitive)
+    macro = ~r"(%(macros)s)"IU  # macros from model file (if none, use non-printable character)
 
     _ = ~r"[\s\\]*"  # whitespace character
     empty = "" # empty string
@@ -622,14 +662,13 @@ def parse_general_expression(element, namespace=None, subscript_dict=None, macro
         # peg parser doesn't quit early when finding a partial keyword
         'sub_names': '|'.join(reversed(sorted(sub_names_list, key=len))),
         'sub_elems': '|'.join(reversed(sorted(sub_elems_list, key=len))),
-        'ids': '|'.join(reversed(sorted(ids_list, key=len))),
         'funcs': '|'.join(reversed(sorted(functions.keys(), key=len))),
         'in_ops': '|'.join(reversed(sorted(in_ops_list, key=len))),
         'pre_ops': '|'.join(reversed(sorted(pre_ops_list, key=len))),
         'builders': '|'.join(reversed(sorted(builders.keys(), key=len))),
         'macros': '|'.join(reversed(sorted(macro_names_list, key=len)))
     }
-
+    
     class ExpressionParser(parsimonious.NodeVisitor):
         # Todo: at some point, we could make the 'kind' identification recursive on expression,
         # so that if an expression is passed into a builder function, the information
@@ -649,9 +688,11 @@ def visit_expr(self, n, vc):
             self.translation = s
             return s
 
-        def visit_func(self, n, vc):
+        def visit_call(self, n, vc):
             self.kind = 'component'
-            return functions[n.text.lower()]
+            function_name = vc[0].lower()
+            arguments = [e.strip() for e in vc[4].split(",")]
+            return builder.build_function_call(functions[function_name], arguments)
 
         def visit_in_oper(self, n, vc):
             return in_ops[n.text.lower()]
@@ -665,7 +706,7 @@ def visit_reference(self, n, vc):
             return id_str + '()'
 
         def visit_id(self, n, vc):
-            return namespace[n.text]
+            return namespace[n.text.strip()]
 
         def visit_lookup_def(self, n, vc):
             """ This exists because vensim has multiple ways of doing lookups.

From 0a8e01ac5208d636009e5008ed51ca9e5dd9c5d2 Mon Sep 17 00:00:00 2001
From: julienmalard <julien.malard@mail.mcgill.ca>
Date: Wed, 11 Sep 2019 18:51:33 -0400
Subject: [PATCH 19/30] Work on new functions

---
 .idea/vcs.xml                       |   2 +-
 pysd/py_backend/vensim/vensim2py.py | 110 ++++++++++++++++++++++------
 2 files changed, 87 insertions(+), 25 deletions(-)

diff --git a/.idea/vcs.xml b/.idea/vcs.xml
index 9744e003..06b38168 100644
--- a/.idea/vcs.xml
+++ b/.idea/vcs.xml
@@ -2,6 +2,6 @@
 <project version="4">
   <component name="VcsDirectoryMappings">
     <mapping directory="$PROJECT_DIR$" vcs="Git" />
-    <mapping directory="C:\Projects\pysd\tests\test-models" vcs="Git" />
+    <mapping directory="$PROJECT_DIR$/tests/test-models" vcs="Git" />
   </component>
 </project>
\ No newline at end of file
diff --git a/pysd/py_backend/vensim/vensim2py.py b/pysd/py_backend/vensim/vensim2py.py
index f3d4f608..4b15ecc2 100644
--- a/pysd/py_backend/vensim/vensim2py.py
+++ b/pysd/py_backend/vensim/vensim2py.py
@@ -3,15 +3,19 @@
 model. Everything that requires knowledge of vensim syntax should be in this file.
 """
 from __future__ import absolute_import
+
+import os
 import re
+import textwrap
+import warnings
+from io import open
+
+import numpy as np
 import parsimonious
+
+from .. import functions as funcs
 from ...py_backend import builder
 from ...py_backend import utils
-from io import open
-import textwrap
-import numpy as np
-import os
-import warnings
 
 
 def get_file_sections(file_str):
@@ -203,7 +207,8 @@ def _include_common_grammar(source_grammar):
     {common_grammar}
     """.format(source_grammar=source_grammar, common_grammar=common_grammar)
 
-def get_equation_components(equation_str):
+
+def get_equation_components(equation_str, root_path):
     """
     Breaks down a string representing only the equation part of a model element.
     Recognizes the various types of model elements that may exist, and identifies them.
@@ -213,6 +218,9 @@ def get_equation_components(equation_str):
     equation_str : basestring
         the first section in each model element - the full equation.
 
+    root_path: basestring
+        the root path of the vensim file (necessary to resolve external data file paths)
+
     Returns
     -------
     Returns a dictionary containing the following:
@@ -230,6 +238,7 @@ def get_equation_components(equation_str):
         - *component* - normal model expression or constant
         - *lookup* - a lookup table
         - *subdef* - a subscript definition
+        - *data* -  a data variable
 
     Examples
     --------
@@ -238,22 +247,29 @@ def get_equation_components(equation_str):
 
     Notes
     -----
-    in this function we dont create python identifiers, we use real names.
+    in this function we don't create python identifiers, we use real names.
     This is so that when everything comes back together, we can manage
     any potential namespace conflicts properly
     """
 
     component_structure_grammar = _include_common_grammar(r"""
-    entry = component / subscript_definition / lookup_definition
+    entry = component / data_definition / test_definition / subscript_definition / lookup_definition
     component = name _ subscriptlist? _ "=" _ expression
-    subscript_definition = name _ ":" _ subscript _ ("," _ subscript)*
+    subscript_definition = name _ ":" _ (imported_subscript / literal_subscript)
+    data_definition = name _ subscriptlist? _ keyword? _ ":=" _ expression
     lookup_definition = name _ &"(" _ expression  # uses lookahead assertion to capture whole group
+    test_definition = name _ subscriptlist? _ &keyword _ expression
 
     name = basic_id / escape_group
+    literal_subscript = subscript _ ("," _ subscript)*
+    imported_subscript = func _ "(" _ (string _ ","? _)* ")"
     subscriptlist = '[' _ subscript _ ("," _ subscript)* _ ']'
     expression = ~r".*"  # expression could be anything, at this point.
+    keyword = ":" _ basic_id _ ":"
 
     subscript = basic_id / escape_group
+    func = basic_id
+    string = "\'" ( "\\\'" / ~r"[^\']"IU )* "\'"
     """)
 
     # replace any amount of whitespace  with a single space
@@ -269,6 +285,7 @@ def __init__(self, ast):
             self.real_name = None
             self.expression = None
             self.kind = None
+            self.keyword = None
             self.visit(ast)
 
         def visit_subscript_definition(self, n, vc):
@@ -280,6 +297,20 @@ def visit_lookup_definition(self, n, vc):
         def visit_component(self, n, vc):
             self.kind = 'component'
 
+        def visit_data_definition(self, n, vc):
+            self.kind = 'data'
+
+        def visit_test_definition(self, n, vc):
+            self.kind = 'test'
+
+        def visit_keyword(self, n, vc):
+            self.keyword = n.text.strip()
+
+        def visit_imported_subscript(self, n, vc):
+            f_str = vc[0]
+            args_str = vc[4]  # todo: make this less fragile?
+            self.subscripts += get_external_data(f_str, args_str, root_path)
+
         def visit_name(self, n, vc):
             (name,) = vc
             self.real_name = name.strip()
@@ -302,7 +333,16 @@ def visit__(self, n, vc):
     return {'real_name': parse_object.real_name,
             'subs': parse_object.subscripts,
             'expr': parse_object.expression,
-            'kind': parse_object.kind}
+            'kind': parse_object.kind,
+            'keyword': parse_object.keyword}
+
+
+def get_external_data(func_str, args_str, root_path):
+    f = subscript_functions[func_str.lower()]
+    args = [x.strip().strip("\'") for x in args_str.split(',')]  # todo: make this less fragile?
+    if args[0][0] == '?':
+        args[0] = os.path.join(root_path, args[0][1:])
+    return f(*args)
 
 
 def parse_units(units_str):
@@ -359,7 +399,8 @@ def parse_units(units_str):
     "sqrt": "np.sqrt",
     "tan": "np.tan",
     "lognormal": "np.random.lognormal",
-    "random normal": "functions.bounded_normal",
+    "random normal":
+        "functions.bounded_normal",
     "poisson": "np.random.poisson",
     "ln": "np.log",
     "log": "functions.log",
@@ -369,6 +410,9 @@ def parse_units(units_str):
     "arccos": "np.arccos",
     "arcsin": "np.arcsin",
     "arctan": "np.arctan",
+    "tanh": "np.tanh",
+    "sinh": "np.sinh",
+    "cosh": "np.cosh",
     "if then else": "functions.if_then_else",
     "step": {
         "name": "functions.step",
@@ -425,9 +469,24 @@ def parse_units(units_str):
     # vector functions
     "vmin": "np.min",
     "vmax": "np.max",
-    "prod": "np.prod"
+    "prod": "np.prod",
+
 }
 
+subscript_functions = {
+    "get xls subscript": funcs.get_xls_subscript,
+    "get direct subscript": funcs.get_direct_subscript
+}
+
+data_functions = {
+    "get xls data": "functions.get_xls_data",
+    "get direct data": "functions.get_direct_data",
+    "get xls constants": "functions.get_xls_constants",
+    "get xls lookups": "functions.get_xls_lookups"
+}
+
+functions.update(data_functions)
+
 builders = {
     "integ": lambda element, subscript_dict, args: builder.add_stock(
         identifier=element['py_name'],
@@ -475,9 +534,9 @@ def parse_units(units_str):
 
     "delay fixed": lambda element, subscript_dict, args: builder.add_n_delay(
         delay_input=args[0],
-        delay_time='round('+args[1]+' / time_step() ) * time_step()',
+        delay_time='round(' + args[1] + ' / time_step() ) * time_step()',
         initial_value=args[2],
-        order=args[1]+' / time_step()',
+        order=args[1] + ' / time_step()',
         subs=element['subs'],
         subscript_dict=subscript_dict
     ),
@@ -625,10 +684,10 @@ def parse_general_expression(element, namespace=None, subscript_dict=None, macro
 
     expression_grammar = r"""
     expr_type = array / expr / empty
-    expr = _ pre_oper? _ (lookup_def / build_call / macro_call / call / lookup_call / parens / number / reference) _ (in_oper _ expr)?
+    expr = _ pre_oper? _ (lookup_def / build_call / macro_call / call / lookup_call / parens / number / string / reference) _ (in_oper _ expr)?
 
     lookup_def = ~r"(WITH\ LOOKUP)"I _ "(" _ expr _ "," _ "(" _  ("[" ~r"[^\]]*" "]" _ ",")?  ( "(" _ expr _ "," _ expr _ ")" _ ","? _ )+ _ ")" _ ")"
-    lookup_call = id _ "(" _ (expr _ ","? _)* ")"  # these don't need their args parsed...
+    lookup_call = (id _ subscript_list?) _ "(" _ (expr _ ","? _)* ")"  # these don't need their args parsed...
     call = func _ "(" _ (expr _ ","? _)* ")"  # these don't need their args parsed...
     build_call = builder _ "(" _ arguments _ ")"
     macro_call = macro _ "(" _ arguments _ ")"
@@ -637,10 +696,11 @@ def parse_general_expression(element, namespace=None, subscript_dict=None, macro
     arguments = (expr _ ","? _)*
 
     reference = id _ subscript_list?
-    subscript_list = "[" _ ((sub_name / sub_element) _ ","? _)+ "]"
+    subscript_list = "[" _ ((sub_name / sub_element) "!"? _ ","? _)+ "]"
 
     array = (number _ ("," / ";")? _)+ !~r"."  # negative lookahead for anything other than an array
     number = ~r"\d+\.?\d*(e[+-]\d+)?"
+    string = "\'" ( "\\\'" / ~r"[^\']"IU )* "\'"
 
     id = ( basic_id / escape_group )
     basic_id = ~r"\w[\w\d_\s\']*"IU
@@ -668,7 +728,7 @@ def parse_general_expression(element, namespace=None, subscript_dict=None, macro
         'builders': '|'.join(reversed(sorted(builders.keys(), key=len))),
         'macros': '|'.join(reversed(sorted(macro_names_list, key=len)))
     }
-    
+
     class ExpressionParser(parsimonious.NodeVisitor):
         # Todo: at some point, we could make the 'kind' identification recursive on expression,
         # so that if an expression is passed into a builder function, the information
@@ -689,8 +749,9 @@ def visit_expr(self, n, vc):
             return s
 
         def visit_call(self, n, vc):
-            self.kind = 'component'
             function_name = vc[0].lower()
+            if function_name not in data_functions:
+                self.kind = 'component'
             arguments = [e.strip() for e in vc[4].split(",")]
             return builder.build_function_call(functions[function_name], arguments)
 
@@ -845,14 +906,14 @@ def generic_visit(self, n, vc):
             'arguments': 'x'}
 
 
-def translate_section(section, macro_list):
+def translate_section(section, macro_list, root_path):
     model_elements = get_model_elements(section['string'])
 
     # extract equation components
     model_docstring = ''
     for entry in model_elements:
         if entry['kind'] == 'entry':
-            entry.update(get_equation_components(entry['eqn']))
+            entry.update(get_equation_components(entry['eqn'], root_path))
         elif entry['kind'] == 'section':
             model_docstring += entry['doc']
 
@@ -880,7 +941,7 @@ def translate_section(section, macro_list):
 
     # Parse components to python syntax.
     for element in model_elements:
-        if element['kind'] == 'component' and 'py_expr' not in element:
+        if (element['kind'] == 'component' and 'py_expr' not in element) or element['kind'] == 'data':
             # Todo: if there is new structure, it should be added to the namespace...
             translation, new_structure = parse_general_expression(element,
                                                                   namespace=namespace,
@@ -893,7 +954,7 @@ def translate_section(section, macro_list):
             element.update(parse_lookup_expression(element))
 
     # send the pieces to be built
-    build_elements = [e for e in model_elements if e['kind'] not in ['subdef', 'section']]
+    build_elements = [e for e in model_elements if e['kind'] not in ['subdef', 'test', 'section']]
     builder.build(build_elements,
                   subscript_dict,
                   namespace,
@@ -924,6 +985,7 @@ def translate_vensim(mdl_file):
     #>>> translate_vensim('../../tests/test-models/tests/limits/test_limits.mdl')
 
     """
+    root_path = os.path.split(mdl_file)[0]
     with open(mdl_file, 'r', encoding='UTF-8') as in_file:
         text = in_file.read()
 
@@ -942,6 +1004,6 @@ def translate_vensim(mdl_file):
     macro_list = [s for s in file_sections if s['name'] is not '_main_']
 
     for section in file_sections:
-        translate_section(section, macro_list)
+        translate_section(section, macro_list, root_path)
 
     return outfile_name

From 3f17fcb6be403d02bacd9046bc330f27d21310cd Mon Sep 17 00:00:00 2001
From: julienmalard <julien.malard@mail.mcgill.ca>
Date: Thu, 12 Sep 2019 15:38:14 -0400
Subject: [PATCH 20/30] Replace np.ones with np.full

---
 pysd/py_backend/builder.py | 2 +-
 1 file changed, 1 insertion(+), 1 deletion(-)

diff --git a/pysd/py_backend/builder.py b/pysd/py_backend/builder.py
index c45012cf..06d4d3aa 100644
--- a/pysd/py_backend/builder.py
+++ b/pysd/py_backend/builder.py
@@ -284,7 +284,7 @@ def add_stock(identifier, subs, expression, initial_condition, subscript_dict):
             dims = [utils.find_subscript_name(subscript_dict, sub) for sub in subs]
             shape = [len(coords[dim]) for dim in dims]
             initial_condition = textwrap.dedent("""\
-                xr.DataArray(data=np.ones(%(shape)s)*%(value)s,
+                xr.DataArray(data=np.full(%(shape)s, %(value)s),
                              coords=%(coords)s,
                              dims=%(dims)s )""" % {
                 'shape': shape,

From 454b25cc7b39a4e901875bd1605f3dd807a5ce74 Mon Sep 17 00:00:00 2001
From: julienmalard <julien.malard@mail.mcgill.ca>
Date: Fri, 13 Sep 2019 19:58:35 -0400
Subject: [PATCH 21/30] More work on data

---
 pysd/py_backend/builder.py          | 140 +++++++++++++++++++++++-----
 pysd/py_backend/vensim/vensim2py.py |  35 ++++++-
 2 files changed, 151 insertions(+), 24 deletions(-)

diff --git a/pysd/py_backend/builder.py b/pysd/py_backend/builder.py
index 06d4d3aa..bc4578d3 100644
--- a/pysd/py_backend/builder.py
+++ b/pysd/py_backend/builder.py
@@ -12,12 +12,13 @@
 from __future__ import absolute_import
 
 import os.path
-import pkg_resources
 import textwrap
 import warnings
+from io import open
+
+import pkg_resources
 import yapf
 
-from io import open
 from .._version import __version__
 from ..py_backend import utils
 
@@ -61,6 +62,7 @@ def build(elements, subscript_dict, namespace, outfile_name):
     import numpy as np
     from pysd import utils
     import xarray as xr
+    import os
 
     from pysd.py_backend.functions import cache
     from pysd.py_backend import functions
@@ -75,6 +77,8 @@ def build(elements, subscript_dict, namespace, outfile_name):
         'scope': None,
         'time': lambda: 0
     }
+    
+    _root = os.path.dirname(__file__)
 
     def _init_outer_references(data):
         for key in data:
@@ -95,8 +99,15 @@ def time():
 
     style_file = pkg_resources.resource_filename("pysd", "py_backend/output_style.yapf")
     text = text.replace('\t', '    ')
-    text, changed = yapf.yapf_api.FormatCode(textwrap.dedent(text),
-                                             style_config=style_file)
+    try:
+        text, changed = yapf.yapf_api.FormatCode(textwrap.dedent(text),
+                                                 style_config=style_file)
+    except:
+        # This is unfortunate but necessary because yapf is apparently not compliant with PEP 3131
+        # (https://www.python.org/dev/peps/pep-3131/)
+        # Alternatively we could skip formatting altogether, or replace yapf with black for all cases?
+        import black
+        text = black.format_file_contents(textwrap.dedent(text), fast=True, mode=black.FileMode())
 
     # this is used for testing
     if outfile_name == 'return':
@@ -150,16 +161,16 @@ def build_element(element, subscript_dict):
                     'ulines': '-' * len(element['real_name']),
                     'contents': contents.replace('\n',
                                                  '\n' + ' ' * indent)})  # indent lines 2 onward
-    
+
     element['doc'] = element['doc'].replace('\\', '\n    ').encode('unicode-escape')
 
     if 'unit' in element:
-        element['unit'] = element['unit'].encode('utf8')
+        element['unit'] = element['unit']
     if 'real_name' in element:
-        element['real_name'] = element['real_name'].encode('utf8')
+        element['real_name'] = element['real_name']
     if 'eqn' in element:
-        element['eqn'] = element['eqn'].encode('utf8')
-    
+        element['eqn'] = element['eqn']
+
     if element['kind'] == 'stateful':
         func = '''
     %(py_name)s = %(py_expr)s
@@ -382,9 +393,9 @@ def add_n_delay(delay_input, delay_time, initial_value, order, subs, subscript_d
 
     stateful = {
         'py_name': utils.make_python_identifier('_delay_%s_%s_%s_%s' % (delay_input,
-                                                                       delay_time,
-                                                                       initial_value,
-                                                                       order))[0],
+                                                                        delay_time,
+                                                                        initial_value,
+                                                                        order))[0],
         'real_name': 'Delay of %s' % delay_input,
         'doc': 'Delay time: %s \n Delay initial value %s \n Delay order %s' % (
             delay_time, initial_value, order),
@@ -442,9 +453,9 @@ def add_n_smooth(smooth_input, smooth_time, initial_value, order, subs, subscrip
 
     stateful = {
         'py_name': utils.make_python_identifier('_smooth_%s_%s_%s_%s' % (smooth_input,
-                                                                        smooth_time,
-                                                                        initial_value,
-                                                                        order))[0],
+                                                                         smooth_time,
+                                                                         initial_value,
+                                                                         order))[0],
         'real_name': 'Smooth of %s' % smooth_input,
         'doc': 'Smooth time: %s \n Smooth initial value %s \n Smooth order %s' % (
             smooth_time, initial_value, order),
@@ -490,8 +501,8 @@ def add_n_trend(trend_input, average_time, initial_trend, subs, subscript_dict):
 
     stateful = {
         'py_name': utils.make_python_identifier('_trend_%s_%s_%s' % (trend_input,
-                                                                    average_time,
-                                                                    initial_trend))[0],
+                                                                     average_time,
+                                                                     initial_trend))[0],
         'real_name': 'trend of %s' % trend_input,
         'doc': 'Trend average time: %s \n Trend initial value %s' % (
             average_time, initial_trend),
@@ -544,6 +555,47 @@ def add_initial(initial_input):
     return "%s()" % stateful['py_name'], [stateful]
 
 
+def add_data(identifier, file, tab, time_row_or_col, cell, subs, subscript_dict, keyword):
+    coords = {dim: subscript_dict[dim] for dim in subs}
+    keyword = '"%s"' % keyword.strip(':').lower() if isinstance(keyword, str) else keyword
+    stateful = {
+        'py_name': utils.make_python_identifier('_data_%s' % identifier)[0],
+        'real_name': 'Data for %s' % identifier,
+        'doc': 'Provides data for data variable %s' % identifier,
+        'py_expr': 'functions.Data('
+                   'file=%s, tab=%s, time_row_or_col=%s, cell=%s, time=time, root=_root, coords=%s, interp=%s'
+                   ')' % (
+                       file, tab, time_row_or_col, cell, coords, keyword
+                   ),
+        'unit': 'None',
+        'lims': 'None',
+        'eqn': 'None',
+        'subs': subs,
+        'kind': 'stateful',
+        'arguments': ''
+    }
+
+    return "%s()" % stateful['py_name'], [stateful]
+
+
+def add_ext_constant(identifier, file, tab, cell, subs, subscript_dict):
+    coords = {dim: subscript_dict[dim] for dim in subs}
+    stateful = {
+        'py_name': utils.make_python_identifier('_data_%s' % identifier)[0],
+        'real_name': 'Data for %s' % identifier,
+        'doc': 'Provides data for constant data variable %s' % identifier,
+        'py_expr': 'functions.ExtConstant(file=%s, tab=%s, root=_root, cell=%s, coords=%s)' % (file, tab, cell, coords),
+        'unit': 'None',
+        'lims': 'None',
+        'eqn': 'None',
+        'subs': subs,
+        'kind': 'stateful',
+        'arguments': ''
+    }
+
+    return "%s()" % stateful['py_name'], [stateful]
+
+
 def add_macro(macro_name, filename, arg_names, arg_vals):
     """
     Constructs a stateful object instantiating a 'Macro'
@@ -576,7 +628,8 @@ def add_macro(macro_name, filename, arg_names, arg_vals):
             [utils.make_python_identifier(f)[0] for f in arg_vals]),
         'real_name': 'Macro Instantiation of ' + macro_name,
         'doc': 'Instantiates the Macro',
-        'py_expr': "functions.Macro('%s', %s, '%s', time_initialization=lambda: __data['time'])" % (filename, func_args, macro_name),
+        'py_expr': "functions.Macro('%s', %s, '%s', time_initialization=lambda: __data['time'])" % (
+            filename, func_args, macro_name),
         'unit': 'None',
         'lims': 'None',
         'eqn': 'None',
@@ -601,14 +654,55 @@ def add_incomplete(var_name, dependencies):
     # first arg is `self` reference
     return "functions.incomplete(%s)" % ', '.join(dependencies[1:]), []
 
+
 def build_function_call(function_def, user_arguments):
+    """
+
+    Parameters
+    ----------
+    function_def: function definition map with following keys
+        - name: name of the function
+        - parameters: list with description of all parameters of this function
+            - name
+            - optional?
+            - type: [
+                "expression", - provide converted expression as parameter for runtime evaluating before the method call
+                "lambda",     - provide lambda expression as parameter for delayed runtime evaluation in the method call
+                "time",       - provide access to current instance of time object
+                "scope"       - provide access to current instance of scope object (instance of Macro object)
+            ]
+    user_arguments: list of arguments provided from model
+
+    Returns
+    -------
+
+    """
     if isinstance(function_def, str):
         return function_def + "(" + ",".join(user_arguments) + ")"
 
-    if "require_time" in function_def and function_def["require_time"]:
-        user_arguments.insert(0, "__data['time']")
-
-    if "require_scope" in function_def and function_def["require_scope"]:
-        user_arguments.insert(0, "__data['scope']")
+    if "parameters" in function_def:
+        parameters = function_def["parameters"]
+        arguments = []
+        argument_idx = 0
+        for parameter_idx in range(len(parameters)):
+            parameter_def = parameters[parameter_idx]
+            is_optional = parameter_def["optional"] if "optional" in parameter_def else False
+            if argument_idx >= len(user_arguments) and is_optional:
+                break
+
+            parameter_type = parameter_def["type"] if "type" in parameter_def else "expression"
+
+            user_argument = user_arguments[argument_idx]
+            if parameter_type in ["expression", "lambda"]:
+                argument_idx += 1
+
+            arguments.append({
+                                 "expression": user_argument,
+                                 "lambda": "lambda: (" + user_argument + ")",
+                                 "time": "__data['time']",
+                                 "scope": "__data['scope']"
+                             }[parameter_type])
+
+        return function_def['name'] + "(" + ", ".join(arguments) + ")"
 
     return function_def['name'] + "(" + ",".join(user_arguments) + ")"
diff --git a/pysd/py_backend/vensim/vensim2py.py b/pysd/py_backend/vensim/vensim2py.py
index 4b15ecc2..017a09e2 100644
--- a/pysd/py_backend/vensim/vensim2py.py
+++ b/pysd/py_backend/vensim/vensim2py.py
@@ -479,12 +479,23 @@ def parse_units(units_str):
 }
 
 data_functions = {
-    "get xls data": "functions.get_xls_data",
     "get direct data": "functions.get_direct_data",
     "get xls constants": "functions.get_xls_constants",
     "get xls lookups": "functions.get_xls_lookups"
 }
 
+data_ops = {
+    'get data at time': '',
+    'get data between times': '',
+    'get data last time': '',
+    'get data max': '',
+    'get data min': '',
+    'get data median': '',
+    'get data mean': '',
+    'get data stdv': '',
+    'get data total points': ''
+}
+
 functions.update(data_functions)
 
 builders = {
@@ -602,12 +613,34 @@ def parse_units(units_str):
         subs=element['subs'],
         subscript_dict=subscript_dict),
 
+    "get xls data": lambda element, subscript_dict, args: builder.add_data(
+        identifier=element['py_name'],
+        file=args[0],
+        tab=args[1],
+        time_row_or_col=args[2],
+        cell=args[3],
+        subs=element['subs'],
+        subscript_dict=subscript_dict,
+        keyword=element['keyword']
+    ),
+
+    "get xls constants": lambda element, subscript_dict, args: builder.add_ext_constant(
+        identifier=element['py_name'],
+        file=args[0],
+        tab=args[1],
+        cell=args[2],
+        subs=element['subs'],
+        subscript_dict=subscript_dict
+    ),
+
     "initial": lambda element, subscript_dict, args: builder.add_initial(args[0]),
 
     "a function of": lambda element, subscript_dict, args: builder.add_incomplete(
         element['real_name'], args)
 }
 
+builders['get direct data'] = builders['get xls data']  # Both are implemented identically in PySD
+
 
 def parse_general_expression(element, namespace=None, subscript_dict=None, macro_list=None):
     """

From 0f4c89d0f2856fde8d1ed5f24683b6b31b31bce5 Mon Sep 17 00:00:00 2001
From: julienmalard <julien.malard@mail.mcgill.ca>
Date: Sat, 14 Sep 2019 20:10:53 -0400
Subject: [PATCH 22/30] Progress on external data and lookups

---
 pysd/py_backend/builder.py          | 21 +++++++++++++++++++-
 pysd/py_backend/vensim/vensim2py.py | 30 ++++++++++++++++++-----------
 2 files changed, 39 insertions(+), 12 deletions(-)

diff --git a/pysd/py_backend/builder.py b/pysd/py_backend/builder.py
index bc4578d3..9af1ba8e 100644
--- a/pysd/py_backend/builder.py
+++ b/pysd/py_backend/builder.py
@@ -581,7 +581,7 @@ def add_data(identifier, file, tab, time_row_or_col, cell, subs, subscript_dict,
 def add_ext_constant(identifier, file, tab, cell, subs, subscript_dict):
     coords = {dim: subscript_dict[dim] for dim in subs}
     stateful = {
-        'py_name': utils.make_python_identifier('_data_%s' % identifier)[0],
+        'py_name': utils.make_python_identifier('_ext_constant_%s' % identifier)[0],
         'real_name': 'Data for %s' % identifier,
         'doc': 'Provides data for constant data variable %s' % identifier,
         'py_expr': 'functions.ExtConstant(file=%s, tab=%s, root=_root, cell=%s, coords=%s)' % (file, tab, cell, coords),
@@ -596,6 +596,25 @@ def add_ext_constant(identifier, file, tab, cell, subs, subscript_dict):
     return "%s()" % stateful['py_name'], [stateful]
 
 
+def add_ext_lookup(identifier, file, tab, x_row_or_col, cell, subs, subscript_dict):
+    coords = {dim: subscript_dict[dim] for dim in subs}
+    stateful = {
+        'py_name': utils.make_python_identifier('_ext_lookup_%s' % identifier)[0],
+        'real_name': 'External lookup data for %s' % identifier,
+        'doc': 'Provides data for external lookup variable %s' % identifier,
+        'py_expr': 'functions.ExtLookup(file=%s, tab=%s, root=_root, x_row_or_col=%s, cell=%s, coords=%s)'
+                   % (file, tab, x_row_or_col, cell, coords),
+        'unit': 'None',
+        'lims': 'None',
+        'eqn': 'None',
+        'subs': subs,
+        'kind': 'stateful',
+        'arguments': 'x'
+    }
+
+    return "%s(x)" % stateful['py_name'], [stateful]
+
+
 def add_macro(macro_name, filename, arg_names, arg_vals):
     """
     Constructs a stateful object instantiating a 'Macro'
diff --git a/pysd/py_backend/vensim/vensim2py.py b/pysd/py_backend/vensim/vensim2py.py
index 017a09e2..107871a6 100644
--- a/pysd/py_backend/vensim/vensim2py.py
+++ b/pysd/py_backend/vensim/vensim2py.py
@@ -338,6 +338,8 @@ def visit__(self, n, vc):
 
 
 def get_external_data(func_str, args_str, root_path):
+    # The py model file must be recompiled if external file subscripts change. This could be avoided
+    # if we switch to function-defined subscript values instead of hard-coding them.
     f = subscript_functions[func_str.lower()]
     args = [x.strip().strip("\'") for x in args_str.split(',')]  # todo: make this less fragile?
     if args[0][0] == '?':
@@ -478,12 +480,6 @@ def parse_units(units_str):
     "get direct subscript": funcs.get_direct_subscript
 }
 
-data_functions = {
-    "get direct data": "functions.get_direct_data",
-    "get xls constants": "functions.get_xls_constants",
-    "get xls lookups": "functions.get_xls_lookups"
-}
-
 data_ops = {
     'get data at time': '',
     'get data between times': '',
@@ -496,8 +492,6 @@ def parse_units(units_str):
     'get data total points': ''
 }
 
-functions.update(data_functions)
-
 builders = {
     "integ": lambda element, subscript_dict, args: builder.add_stock(
         identifier=element['py_name'],
@@ -633,6 +627,16 @@ def parse_units(units_str):
         subscript_dict=subscript_dict
     ),
 
+    "get xls lookups": lambda element, subscript_dict, args: builder.add_ext_lookup(
+        identifier=element['py_name'],
+        file=args[0],
+        tab=args[1],
+        x_row_or_col=args[2],
+        cell=args[3],
+        subs=element['subs'],
+        subscript_dict=subscript_dict
+    ),
+
     "initial": lambda element, subscript_dict, args: builder.add_initial(args[0]),
 
     "a function of": lambda element, subscript_dict, args: builder.add_incomplete(
@@ -640,6 +644,7 @@ def parse_units(units_str):
 }
 
 builders['get direct data'] = builders['get xls data']  # Both are implemented identically in PySD
+builders['get direct lookups'] = builders['get xls lookups']  # Both are implemented identically in PySD
 
 
 def parse_general_expression(element, namespace=None, subscript_dict=None, macro_list=None):
@@ -770,6 +775,7 @@ def __init__(self, ast):
             self.translation = ""
             self.kind = 'constant'  # change if we reference anything else
             self.new_structure = []
+            self.arguments = None
             self.visit(ast)
 
         def visit_expr_type(self, n, vc):
@@ -782,9 +788,8 @@ def visit_expr(self, n, vc):
             return s
 
         def visit_call(self, n, vc):
+            self.kind = 'component'
             function_name = vc[0].lower()
-            if function_name not in data_functions:
-                self.kind = 'component'
             arguments = [e.strip() for e in vc[4].split(",")]
             return builder.build_function_call(functions[function_name], arguments)
 
@@ -857,6 +862,9 @@ def visit_build_call(self, n, vc):
             name, structure = builders[builder_name](element, subscript_dict, arglist)
             self.new_structure += structure
 
+            if builder_name in ['get xls lookups', 'get direct lookups']:
+                self.arguments = 'x'
+
             if builder_name == 'delay fixed':
                 warnings.warn("Delay fixed only approximates solution, may not give the same "
                               "result as vensim")
@@ -894,7 +902,7 @@ def generic_visit(self, n, vc):
 
     return ({'py_expr': parse_object.translation,
              'kind': parse_object.kind,
-             'arguments': ''},
+             'arguments': parse_object.arguments or ''},
             parse_object.new_structure)
 
 

From 8f282ef21953fd559151a84a7aab6d0cb88ff24e Mon Sep 17 00:00:00 2001
From: julienmalard <julien.malard@mail.mcgill.ca>
Date: Sun, 15 Sep 2019 14:04:17 -0400
Subject: [PATCH 23/30] Fix '.loc' diretive from subscripts not showing up in
 function call.

---
 pysd/py_backend/vensim/vensim2py.py | 4 ++--
 1 file changed, 2 insertions(+), 2 deletions(-)

diff --git a/pysd/py_backend/vensim/vensim2py.py b/pysd/py_backend/vensim/vensim2py.py
index 107871a6..c88f9b87 100644
--- a/pysd/py_backend/vensim/vensim2py.py
+++ b/pysd/py_backend/vensim/vensim2py.py
@@ -801,8 +801,8 @@ def visit_pre_oper(self, n, vc):
 
         def visit_reference(self, n, vc):
             self.kind = 'component'
-            id_str = vc[0]
-            return id_str + '()'
+            vc[0] += '()'
+            return ''.join([x.strip(',') for x in vc])
 
         def visit_id(self, n, vc):
             return namespace[n.text.strip()]

From 56805ed30f96cc9d39ce371f2d9eef1e38c31c1d Mon Sep 17 00:00:00 2001
From: julienmalard <julien.malard@mail.mcgill.ca>
Date: Mon, 16 Sep 2019 12:07:53 -0400
Subject: [PATCH 24/30] Basic subscript functions seem to work

---
 pysd/py_backend/vensim/vensim2py.py | 31 +++++++++++++++++++++++++----
 1 file changed, 27 insertions(+), 4 deletions(-)

diff --git a/pysd/py_backend/vensim/vensim2py.py b/pysd/py_backend/vensim/vensim2py.py
index c88f9b87..75a0d106 100644
--- a/pysd/py_backend/vensim/vensim2py.py
+++ b/pysd/py_backend/vensim/vensim2py.py
@@ -722,8 +722,9 @@ def parse_general_expression(element, namespace=None, subscript_dict=None, macro
 
     expression_grammar = r"""
     expr_type = array / expr / empty
-    expr = _ pre_oper? _ (lookup_def / build_call / macro_call / call / lookup_call / parens / number / string / reference) _ (in_oper _ expr)?
+    expr = _ pre_oper? _ (lookup_def / build_call / macro_call / call / lookup_call / parens / number / string / reference) _ in_oper_expr?
 
+    in_oper_expr = (in_oper _ expr)
     lookup_def = ~r"(WITH\ LOOKUP)"I _ "(" _ expr _ "," _ "(" _  ("[" ~r"[^\]]*" "]" _ ",")?  ( "(" _ expr _ "," _ expr _ ")" _ ","? _ )+ _ ")" _ ")"
     lookup_call = (id _ subscript_list?) _ "(" _ (expr _ ","? _)* ")"  # these don't need their args parsed...
     call = func _ "(" _ (expr _ ","? _)* ")"  # these don't need their args parsed...
@@ -776,6 +777,7 @@ def __init__(self, ast):
             self.kind = 'constant'  # change if we reference anything else
             self.new_structure = []
             self.arguments = None
+            self.in_oper = None
             self.visit(ast)
 
         def visit_expr_type(self, n, vc):
@@ -783,10 +785,26 @@ def visit_expr_type(self, n, vc):
             self.translation = s
 
         def visit_expr(self, n, vc):
-            s = ''.join(filter(None, vc)).strip()
+            if self.in_oper:
+                args = [x for x in vc if len(x.strip())]
+                if len(args) == 3:
+                    args = [''.join(args[0:2]), args[2]]
+                if self.in_oper  == ' and ':
+                    s = 'functions.and_(%s)' % ','.join(args)
+                elif self.in_oper == ' or ':
+                    s = 'functions.or_(%s)' % ','.join(args)
+                else:
+                    s = self.in_oper.join(args)
+                self.in_oper = None
+            else:
+                s = ''.join(filter(None, vc)).strip()
             self.translation = s
             return s
 
+        def visit_in_oper_expr(self, n, vc):
+            self.in_oper = vc[0]
+            return ''.join(filter(None, vc[1:])).strip()
+
         def visit_call(self, n, vc):
             self.kind = 'component'
             function_name = vc[0].lower()
@@ -849,9 +867,13 @@ def visit_subscript_list(self, n, vc):
             subs = [x.strip() for x in refs.split(',')]
             coordinates = utils.make_coord_dict(subs, subscript_dict)
             if len(coordinates):
-                return '.loc[%s]' % repr(coordinates)
+                string = '.loc[%s]' % repr(coordinates)
             else:
-                return ' '
+                string = ' '
+            axis = [str(i) for i, s in enumerate(subs) if s[-1] == '!']
+            if axis:
+                string += ', axis=(%s)' % ','.join(axis)
+            return string
 
         def visit_build_call(self, n, vc):
             call = vc[0]
@@ -897,6 +919,7 @@ def generic_visit(self, n, vc):
             return ''.join(filter(None, vc)) or n.text
 
     parser = parsimonious.Grammar(expression_grammar)
+
     tree = parser.parse(element['expr'])
     parse_object = ExpressionParser(tree)
 

From 5f1c430b46ce7da1ecfae551bbdb6aaacc8a817e Mon Sep 17 00:00:00 2001
From: julienmalard <julien.malard@mail.mcgill.ca>
Date: Mon, 16 Sep 2019 12:57:15 -0400
Subject: [PATCH 25/30] New comments, and squeeze dimensions on xarrays when
 possible

---
 pysd/py_backend/vensim/vensim2py.py | 7 ++++++-
 1 file changed, 6 insertions(+), 1 deletion(-)

diff --git a/pysd/py_backend/vensim/vensim2py.py b/pysd/py_backend/vensim/vensim2py.py
index 75a0d106..9e0587e1 100644
--- a/pysd/py_backend/vensim/vensim2py.py
+++ b/pysd/py_backend/vensim/vensim2py.py
@@ -786,6 +786,8 @@ def visit_expr_type(self, n, vc):
 
         def visit_expr(self, n, vc):
             if self.in_oper:
+                # This is rather inelegant, and possibly could be better implemented with a serious reorganization
+                # of the grammar specification for general expressions.
                 args = [x for x in vc if len(x.strip())]
                 if len(args) == 3:
                     args = [''.join(args[0:2]), args[2]]
@@ -867,9 +869,12 @@ def visit_subscript_list(self, n, vc):
             subs = [x.strip() for x in refs.split(',')]
             coordinates = utils.make_coord_dict(subs, subscript_dict)
             if len(coordinates):
-                string = '.loc[%s]' % repr(coordinates)
+                string = '.loc[%s].squeeze()' % repr(coordinates)
             else:
                 string = ' '
+            # Implements basic "!" subscript functionality in Vensim. Does NOT work for matrix diagonals in
+            # FUNC(variable[sub1!,sub1!]) functions, nor with
+            # But works quite well for simple axis specifications, such as "SUM(variable[axis1, axis2!])
             axis = [str(i) for i, s in enumerate(subs) if s[-1] == '!']
             if axis:
                 string += ', axis=(%s)' % ','.join(axis)

From ff081520feb0abc0fdbe18aff3c76e3053e18eaa Mon Sep 17 00:00:00 2001
From: julienmalard <julien.malard@mail.mcgill.ca>
Date: Mon, 16 Sep 2019 16:10:43 -0400
Subject: [PATCH 26/30] Fixed a few errors with "!" functions

---
 pysd/py_backend/builder.py          |  5 ++---
 pysd/py_backend/vensim/vensim2py.py | 12 ++++++------
 2 files changed, 8 insertions(+), 9 deletions(-)

diff --git a/pysd/py_backend/builder.py b/pysd/py_backend/builder.py
index 9af1ba8e..aa9d9bbc 100644
--- a/pysd/py_backend/builder.py
+++ b/pysd/py_backend/builder.py
@@ -390,7 +390,6 @@ def add_n_delay(delay_input, delay_time, initial_value, order, subs, subscript_d
     """
     # the py name has to be unique to all the passed parameters, or if there are two things
     # that delay the output by different amounts, they'll overwrite the original function...
-
     stateful = {
         'py_name': utils.make_python_identifier('_delay_%s_%s_%s_%s' % (delay_input,
                                                                         delay_time,
@@ -399,8 +398,8 @@ def add_n_delay(delay_input, delay_time, initial_value, order, subs, subscript_d
         'real_name': 'Delay of %s' % delay_input,
         'doc': 'Delay time: %s \n Delay initial value %s \n Delay order %s' % (
             delay_time, initial_value, order),
-        'py_expr': 'functions.Delay(lambda: %s, lambda: %s, lambda: %s, lambda: %s)' % (
-            delay_input, delay_time, initial_value, order),
+        'py_expr': 'functions.Delay(lambda: %s, lambda: %s, lambda: %s, lambda: %s, %s, %s)' % (
+            delay_input, delay_time, initial_value, order, subs, subscript_dict),
         'unit': 'None',
         'lims': 'None',
         'eqn': 'None',
diff --git a/pysd/py_backend/vensim/vensim2py.py b/pysd/py_backend/vensim/vensim2py.py
index 9e0587e1..7a8fba18 100644
--- a/pysd/py_backend/vensim/vensim2py.py
+++ b/pysd/py_backend/vensim/vensim2py.py
@@ -408,7 +408,7 @@ def parse_units(units_str):
     "log": "functions.log",
     "exprnd": "np.random.exponential",
     "random uniform": "functions.random_uniform",
-    "sum": "np.sum",
+    "sum": "functions.sum",
     "arccos": "np.arccos",
     "arcsin": "np.arcsin",
     "arctan": "np.arctan",
@@ -469,9 +469,9 @@ def parse_units(units_str):
     "game": "",  # In the future, may have an actual `functions.game` pass through
 
     # vector functions
-    "vmin": "np.min",
-    "vmax": "np.max",
-    "prod": "np.prod",
+    "vmin": "functions.min",
+    "vmax": "functions.max",
+    "prod": "functions.prod",
 
 }
 
@@ -875,9 +875,9 @@ def visit_subscript_list(self, n, vc):
             # Implements basic "!" subscript functionality in Vensim. Does NOT work for matrix diagonals in
             # FUNC(variable[sub1!,sub1!]) functions, nor with
             # But works quite well for simple axis specifications, such as "SUM(variable[axis1, axis2!])
-            axis = [str(i) for i, s in enumerate(subs) if s[-1] == '!']
+            axis = ['"%s"' % s.strip('!') for s in subs if s[-1] == '!']
             if axis:
-                string += ', axis=(%s)' % ','.join(axis)
+                string += ', dim=(%s)' % ','.join(axis)
             return string
 
         def visit_build_call(self, n, vc):

From bda0187cb6a2f13aabeb0da51e9a8634a1fa1a09 Mon Sep 17 00:00:00 2001
From: julienmalard <julien.malard@mail.mcgill.ca>
Date: Fri, 20 Sep 2019 11:21:34 -0400
Subject: [PATCH 27/30] test_subscript_aggregation works!

---
 pysd/py_backend/vensim/vensim2py.py      | 8 +++++---
 tests/integration_test_vensim_pathway.py | 2 +-
 2 files changed, 6 insertions(+), 4 deletions(-)

diff --git a/pysd/py_backend/vensim/vensim2py.py b/pysd/py_backend/vensim/vensim2py.py
index 7a8fba18..92bae89c 100644
--- a/pysd/py_backend/vensim/vensim2py.py
+++ b/pysd/py_backend/vensim/vensim2py.py
@@ -469,8 +469,8 @@ def parse_units(units_str):
     "game": "",  # In the future, may have an actual `functions.game` pass through
 
     # vector functions
-    "vmin": "functions.min",
-    "vmax": "functions.max",
+    "vmin": "functions.vmin",
+    "vmax": "functions.vmax",
     "prod": "functions.prod",
 
 }
@@ -804,6 +804,8 @@ def visit_expr(self, n, vc):
             return s
 
         def visit_in_oper_expr(self, n, vc):
+            # We have to pull out the internal operator because the Python "and" and "or" operator do not work with
+            # numpy arrays or xarray DataArrays. We will later replace it with the functions.and_ or functions.or_.
             self.in_oper = vc[0]
             return ''.join(filter(None, vc[1:])).strip()
 
@@ -873,7 +875,7 @@ def visit_subscript_list(self, n, vc):
             else:
                 string = ' '
             # Implements basic "!" subscript functionality in Vensim. Does NOT work for matrix diagonals in
-            # FUNC(variable[sub1!,sub1!]) functions, nor with
+            # FUNC(variable[sub1!,sub1!]) functions, nor with complex operations within the vector function
             # But works quite well for simple axis specifications, such as "SUM(variable[axis1, axis2!])
             axis = ['"%s"' % s.strip('!') for s in subs if s[-1] == '!']
             if axis:
diff --git a/tests/integration_test_vensim_pathway.py b/tests/integration_test_vensim_pathway.py
index 5dafd1e2..4cf68674 100644
--- a/tests/integration_test_vensim_pathway.py
+++ b/tests/integration_test_vensim_pathway.py
@@ -280,7 +280,7 @@ def test_subscript_3d_arrays_widthwise(self):
         output, canon = runner('test-models/tests/subscript_3d_arrays_widthwise/test_subscript_3d_arrays_widthwise.mdl')
         assert_frames_close(output, canon, rtol=rtol)
 
-    @unittest.skip('in branch')
+    # @unittest.skip('in branch')
     def test_subscript_aggregation(self):
         from.test_utils import runner, assert_frames_close
         output, canon = runner('test-models/tests/subscript_aggregation/test_subscript_aggregation.mdl')

From f75a3ce4f9dd6481397f75f6631d2dbc83cc50d0 Mon Sep 17 00:00:00 2001
From: julienmalard <julien.malard@mail.mcgill.ca>
Date: Mon, 23 Sep 2019 09:23:25 -0400
Subject: [PATCH 28/30] Better and/or operators and fixes on tests

---
 pysd/py_backend/builder.py               |  2 +-
 pysd/py_backend/vensim/vensim2py.py      | 29 +++---------------
 tests/integration_test_vensim_pathway.py | 12 ++++----
 tests/unit_test_vensim2py.py             | 38 ++++++++++++------------
 4 files changed, 31 insertions(+), 50 deletions(-)

diff --git a/pysd/py_backend/builder.py b/pysd/py_backend/builder.py
index aa9d9bbc..3547ffd4 100644
--- a/pysd/py_backend/builder.py
+++ b/pysd/py_backend/builder.py
@@ -670,7 +670,7 @@ def add_incomplete(var_name, dependencies):
                   SyntaxWarning, stacklevel=2)
 
     # first arg is `self` reference
-    return "functions.incomplete(%s)" % ', '.join(dependencies[1:]), []
+    return "functions.incomplete(%s)" % ', '.join(dependencies), []
 
 
 def build_function_call(function_def, user_arguments):
diff --git a/pysd/py_backend/vensim/vensim2py.py b/pysd/py_backend/vensim/vensim2py.py
index 92bae89c..87110165 100644
--- a/pysd/py_backend/vensim/vensim2py.py
+++ b/pysd/py_backend/vensim/vensim2py.py
@@ -208,7 +208,7 @@ def _include_common_grammar(source_grammar):
     """.format(source_grammar=source_grammar, common_grammar=common_grammar)
 
 
-def get_equation_components(equation_str, root_path):
+def get_equation_components(equation_str, root_path=None):
     """
     Breaks down a string representing only the equation part of a model element.
     Recognizes the various types of model elements that may exist, and identifies them.
@@ -701,7 +701,7 @@ def parse_general_expression(element, namespace=None, subscript_dict=None, macro
     in_ops = {
         "+": "+", "-": "-", "*": "*", "/": "/", "^": "**", "=": "==", "<=": "<=", "<>": "!=",
         "<": "<", ">=": ">=", ">": ">",
-        ":and:": " and ", ":or:": " or "}  # spaces important for word-based operators
+        ":and:": " & ", ":or:": " | "}  # spaces perhaps important?
 
     pre_ops = {
         "-": "-", ":not:": " not ",  # spaces important for word-based operators
@@ -722,9 +722,8 @@ def parse_general_expression(element, namespace=None, subscript_dict=None, macro
 
     expression_grammar = r"""
     expr_type = array / expr / empty
-    expr = _ pre_oper? _ (lookup_def / build_call / macro_call / call / lookup_call / parens / number / string / reference) _ in_oper_expr?
+    expr = _ pre_oper? _ (lookup_def / build_call / macro_call / call / lookup_call / parens / number / string / reference) _ (in_oper _ expr)?
 
-    in_oper_expr = (in_oper _ expr)
     lookup_def = ~r"(WITH\ LOOKUP)"I _ "(" _ expr _ "," _ "(" _  ("[" ~r"[^\]]*" "]" _ ",")?  ( "(" _ expr _ "," _ expr _ ")" _ ","? _ )+ _ ")" _ ")"
     lookup_call = (id _ subscript_list?) _ "(" _ (expr _ ","? _)* ")"  # these don't need their args parsed...
     call = func _ "(" _ (expr _ ","? _)* ")"  # these don't need their args parsed...
@@ -785,30 +784,10 @@ def visit_expr_type(self, n, vc):
             self.translation = s
 
         def visit_expr(self, n, vc):
-            if self.in_oper:
-                # This is rather inelegant, and possibly could be better implemented with a serious reorganization
-                # of the grammar specification for general expressions.
-                args = [x for x in vc if len(x.strip())]
-                if len(args) == 3:
-                    args = [''.join(args[0:2]), args[2]]
-                if self.in_oper  == ' and ':
-                    s = 'functions.and_(%s)' % ','.join(args)
-                elif self.in_oper == ' or ':
-                    s = 'functions.or_(%s)' % ','.join(args)
-                else:
-                    s = self.in_oper.join(args)
-                self.in_oper = None
-            else:
-                s = ''.join(filter(None, vc)).strip()
+            s = ''.join(filter(None, vc)).strip()
             self.translation = s
             return s
 
-        def visit_in_oper_expr(self, n, vc):
-            # We have to pull out the internal operator because the Python "and" and "or" operator do not work with
-            # numpy arrays or xarray DataArrays. We will later replace it with the functions.and_ or functions.or_.
-            self.in_oper = vc[0]
-            return ''.join(filter(None, vc[1:])).strip()
-
         def visit_call(self, n, vc):
             self.kind = 'component'
             function_name = vc[0].lower()
diff --git a/tests/integration_test_vensim_pathway.py b/tests/integration_test_vensim_pathway.py
index 4cf68674..69db1561 100644
--- a/tests/integration_test_vensim_pathway.py
+++ b/tests/integration_test_vensim_pathway.py
@@ -137,7 +137,8 @@ def test_lookups(self):
         from.test_utils import runner, assert_frames_close
         output, canon = runner('test-models/tests/lookups/test_lookups.mdl')
         assert_frames_close(output, canon, rtol=rtol)
-        
+
+    @unittest.skip('File not found')
     def test_lookups_without_range(self):
         from.test_utils import runner, assert_frames_close
         output, canon = runner('test-models/tests/lookups_without_range/test_lookups_without_range.mdl')
@@ -250,6 +251,7 @@ def test_sqrt(self):
         output, canon = runner('test-models/tests/sqrt/test_sqrt.mdl')
         assert_frames_close(output, canon, rtol=rtol)
 
+    @unittest.skip('File not found')
     def test_subscript_multiples(self):
         from.test_utils import runner, assert_frames_close
         output, canon = runner('test-models/tests/subscript_multiples/test_multiple_subscripts.mdl')
@@ -323,25 +325,25 @@ def test_subscript_mixed_assembly(self):
         output, canon = runner('test-models/tests/subscript_mixed_assembly/test_subscript_mixed_assembly.mdl')
         assert_frames_close(output, canon, rtol=rtol)
 
-    @unittest.skip('in branch')
+    # @unittest.skip('in branch')
     def test_subscript_selection(self):
         from.test_utils import runner, assert_frames_close
         output, canon = runner('test-models/tests/subscript_selection/subscript_selection.mdl')
         assert_frames_close(output, canon, rtol=rtol)
 
-    @unittest.skip('failing in py3')
+    # @unittest.skip('failing in py3')
     def test_subscript_subranges(self):
         from.test_utils import runner, assert_frames_close
         output, canon = runner('test-models/tests/subscript_subranges/test_subscript_subrange.mdl')
         assert_frames_close(output, canon, rtol=rtol)
 
-    @unittest.skip('failing in py3')
+    # @unittest.skip('failing in py3')
     def test_subscript_subranges_equal(self):
         from.test_utils import runner, assert_frames_close
         output, canon = runner('test-models/tests/subscript_subranges_equal/test_subscript_subrange_equal.mdl')
         assert_frames_close(output, canon, rtol=rtol)
 
-    @unittest.skip('in branch')
+    # @unittest.skip('in branch')
     def test_subscript_switching(self):
         from.test_utils import runner, assert_frames_close
         output, canon = runner('test-models/tests/subscript_switching/subscript_switching.mdl')
diff --git a/tests/unit_test_vensim2py.py b/tests/unit_test_vensim2py.py
index 743d38d8..853ffd9b 100644
--- a/tests/unit_test_vensim2py.py
+++ b/tests/unit_test_vensim2py.py
@@ -71,7 +71,7 @@ def test_basics(self):
         from pysd.py_backend.vensim.vensim2py import get_equation_components
         self.assertEqual(
             get_equation_components(r'constant = 25'),
-            {'expr': '25', 'kind': 'component', 'subs': [], 'real_name': 'constant'}
+            {'expr': '25', 'kind': 'component', 'subs': [], 'real_name': 'constant', 'keyword': None}
         )
 
     def test_equals_handling(self):
@@ -80,7 +80,7 @@ def test_equals_handling(self):
         self.assertEqual(
             get_equation_components(r'Boolean = IF THEN ELSE(1 = 1, 1, 0)'),
             {'expr': 'IF THEN ELSE(1 = 1, 1, 0)', 'kind': 'component', 'subs': [],
-             'real_name': 'Boolean'}
+             'real_name': 'Boolean', 'keyword': None}
         )
 
     def test_whitespace_handling(self):
@@ -89,7 +89,7 @@ def test_whitespace_handling(self):
         self.assertEqual(
             get_equation_components(r'''constant\t =
                                                         \t25\t '''),
-            {'expr': '25', 'kind': 'component', 'subs': [], 'real_name': 'constant'}
+            {'expr': '25', 'kind': 'component', 'subs': [], 'real_name': 'constant', 'keyword': None}
         )
 
         # test eliminating vensim's line continuation character
@@ -97,7 +97,7 @@ def test_whitespace_handling(self):
             get_equation_components(r"""constant [Sub1, \\
                                      Sub2] = 10, 12; 14, 16;"""),
             {'expr': '10, 12; 14, 16;', 'kind': 'component', 'subs': ['Sub1', 'Sub2'],
-             'real_name': 'constant'}
+             'real_name': 'constant', 'keyword': None}
         )
 
     def test_subscript_definition_parsing(self):
@@ -105,7 +105,7 @@ def test_subscript_definition_parsing(self):
         self.assertEqual(
             get_equation_components(r'''Sub1: Entry 1, Entry 2, Entry 3 '''),
             {'expr': None, 'kind': 'subdef', 'subs': ['Entry 1', 'Entry 2', 'Entry 3'],
-             'real_name': 'Sub1'}
+             'real_name': 'Sub1', 'keyword': None}
         )
 
     def test_subscript_references(self):
@@ -113,25 +113,25 @@ def test_subscript_references(self):
         self.assertEqual(
             get_equation_components(r'constant [Sub1, Sub2] = 10, 12; 14, 16;'),
             {'expr': '10, 12; 14, 16;', 'kind': 'component', 'subs': ['Sub1', 'Sub2'],
-             'real_name': 'constant'}
+             'real_name': 'constant', 'keyword': None}
         )
 
         self.assertEqual(
             get_equation_components(r'function [Sub1] = other function[Sub1]'),
             {'expr': 'other function[Sub1]', 'kind': 'component', 'subs': ['Sub1'],
-             'real_name': 'function'}
+             'real_name': 'function', 'keyword': None}
         )
 
         self.assertEqual(
             get_equation_components(r'constant ["S1,b", "S1,c"] = 1, 2; 3, 4;'),
             {'expr': '1, 2; 3, 4;', 'kind': 'component', 'subs': ['"S1,b"', '"S1,c"'],
-             'real_name': 'constant'}
+             'real_name': 'constant', 'keyword': None}
         )
 
         self.assertEqual(
             get_equation_components(r'constant ["S1=b", "S1=c"] = 1, 2; 3, 4;'),
             {'expr': '1, 2; 3, 4;', 'kind': 'component', 'subs': ['"S1=b"', '"S1=c"'],
-             'real_name': 'constant'}
+             'real_name': 'constant', 'keyword': None}
         )
 
     def test_lookup_definitions(self):
@@ -139,26 +139,26 @@ def test_lookup_definitions(self):
         self.assertEqual(
             get_equation_components(r'table([(0,-1)-(45,1)],(0,0),(5,0))'),
             {'expr': '([(0,-1)-(45,1)],(0,0),(5,0))', 'kind': 'lookup', 'subs': [],
-             'real_name': 'table'}
+             'real_name': 'table', 'keyword': None}
         )
 
         self.assertEqual(
             get_equation_components(r'table2 ([(0,-1)-(45,1)],(0,0),(5,0))'),
             {'expr': '([(0,-1)-(45,1)],(0,0),(5,0))', 'kind': 'lookup', 'subs': [],
-             'real_name': 'table2'}
+             'real_name': 'table2', 'keyword': None}
         )
 
     def test_pathological_names(self):
         from pysd.py_backend.vensim.vensim2py import get_equation_components
         self.assertEqual(
             get_equation_components(r'"silly-string" = 25'),
-            {'expr': '25', 'kind': 'component', 'subs': [], 'real_name': '"silly-string"'}
+            {'expr': '25', 'kind': 'component', 'subs': [], 'real_name': '"silly-string"', 'keyword': None}
         )
 
         self.assertEqual(
             get_equation_components(r'"pathological\\-string" = 25'),
             {'expr': '25', 'kind': 'component', 'subs': [],
-             'real_name': r'"pathological\\-string"'}
+             'real_name': r'"pathological\\-string"', 'keyword': None}
         )
 
 
@@ -328,7 +328,7 @@ def test_subscript_3d_depth(self):
         self.assertEqual(a.loc[{'Dim1': 'A', 'Dim2': 'D'}], 1)
         self.assertEqual(a.loc[{'Dim1': 'B', 'Dim2': 'E'}], 4)
 
-    @unittest.skip('in branch')
+    # unittest.skip('in branch')
     def test_subscript_reference(self):
         from pysd.py_backend.vensim.vensim2py import parse_general_expression
         res = parse_general_expression({'expr': 'Var A[Dim1, Dim2]'},
@@ -342,16 +342,16 @@ def test_subscript_reference(self):
                                      {'Var B': 'var_b'},
                                      {'Dim1': ['A', 'B'],
                                       'Dim2': ['C', 'D', 'E']})
-        self.assertEqual(res[0]['py_expr'], "var_b().loc[{'Dim2': ['C']}]")
+        self.assertEqual(res[0]['py_expr'], "var_b().loc[{'Dim2': ['C']}].squeeze()")
 
         res = parse_general_expression({'expr': 'Var C[Dim1, C, H]'},
                                      {'Var C': 'var_c'},
                                      {'Dim1': ['A', 'B'],
                                       'Dim2': ['C', 'D', 'E'],
                                       'Dim3': ['F', 'G', 'H', 'I']})
-        self.assertEqual(res[0]['py_expr'], "var_c().loc[{'Dim2': ['C'], 'Dim3': ['H']}]")
+        self.assertEqual(res[0]['py_expr'], "var_c().loc[{'Dim2': ['C'], 'Dim3': ['H']}].squeeze()")
 
-    @unittest.skip('in branch')
+    # @unittest.skip('in branch')
     def test_subscript_ranges(self):
         from pysd.py_backend.vensim.vensim2py import parse_general_expression
         res = parse_general_expression({'expr': 'Var D[Range1]'},
@@ -360,10 +360,10 @@ def test_subscript_ranges(self):
                                       'Range1': ['C', 'D', 'E']})
         self.assertEqual(res[0]['py_expr'], "var_c().loc[{'Dim1': ['C', 'D', 'E']}]")
 
-    @unittest.skip('need to write this properly')
+    # @unittest.skip('need to write this properly')
     def test_incomplete_expression(self):
         from pysd.py_backend.vensim.vensim2py import parse_general_expression
-        res = parse_general_expression({'expr': 'A FUNCTION OF(Unspecified Eqn,Var A,Var B)'},
+        res = parse_general_expression({'expr': 'A FUNCTION OF(Unspecified Eqn,Var A,Var B)', 'real_name': 'something'},
                                        {'Unspecified Eqn': 'unspecified_eqn',
                                         'Var A': 'var_a',
                                         'Var B': 'var_b'})

From 0cd40b396c04638b3d63f5a9bbc3b2081892227d Mon Sep 17 00:00:00 2001
From: julienmalard <julien.malard@mail.mcgill.ca>
Date: Fri, 11 Oct 2019 11:28:40 -0400
Subject: [PATCH 29/30] Reformat

---
 pysd/pysd.py | 2 +-
 1 file changed, 1 insertion(+), 1 deletion(-)

diff --git a/pysd/pysd.py b/pysd/pysd.py
index 0cb18ef3..a34b45e3 100644
--- a/pysd/pysd.py
+++ b/pysd/pysd.py
@@ -15,13 +15,13 @@
 
 def read_xmile(xmile_file):
     """ Construct a model object from `.xmile` file. """
-    from . import py_backend
     from .py_backend.xmile.xmile2py import translate_xmile
     py_model_file = translate_xmile(xmile_file)
     model = load(py_model_file)
     model.xmile_file = xmile_file
     return model
 
+
 def read_vensim(mdl_file):
     """
     Construct a model from Vensim `.mdl` file.

From 9740617523e7a6adf7c83379b836cc80eb220019 Mon Sep 17 00:00:00 2001
From: julienmalard <julien.malard@mail.mcgill.ca>
Date: Wed, 15 Apr 2020 14:24:52 -0400
Subject: [PATCH 30/30] Recommented failing tests

---
 tests/integration_test_vensim_pathway.py | 10 +++++-----
 tests/test-models                        |  2 +-
 2 files changed, 6 insertions(+), 6 deletions(-)

diff --git a/tests/integration_test_vensim_pathway.py b/tests/integration_test_vensim_pathway.py
index 69db1561..0bd93946 100644
--- a/tests/integration_test_vensim_pathway.py
+++ b/tests/integration_test_vensim_pathway.py
@@ -282,7 +282,7 @@ def test_subscript_3d_arrays_widthwise(self):
         output, canon = runner('test-models/tests/subscript_3d_arrays_widthwise/test_subscript_3d_arrays_widthwise.mdl')
         assert_frames_close(output, canon, rtol=rtol)
 
-    # @unittest.skip('in branch')
+    @unittest.skip('in branch')
     def test_subscript_aggregation(self):
         from.test_utils import runner, assert_frames_close
         output, canon = runner('test-models/tests/subscript_aggregation/test_subscript_aggregation.mdl')
@@ -325,25 +325,25 @@ def test_subscript_mixed_assembly(self):
         output, canon = runner('test-models/tests/subscript_mixed_assembly/test_subscript_mixed_assembly.mdl')
         assert_frames_close(output, canon, rtol=rtol)
 
-    # @unittest.skip('in branch')
+    @unittest.skip('in branch')
     def test_subscript_selection(self):
         from.test_utils import runner, assert_frames_close
         output, canon = runner('test-models/tests/subscript_selection/subscript_selection.mdl')
         assert_frames_close(output, canon, rtol=rtol)
 
-    # @unittest.skip('failing in py3')
+    @unittest.skip('failing in py3')
     def test_subscript_subranges(self):
         from.test_utils import runner, assert_frames_close
         output, canon = runner('test-models/tests/subscript_subranges/test_subscript_subrange.mdl')
         assert_frames_close(output, canon, rtol=rtol)
 
-    # @unittest.skip('failing in py3')
+    @unittest.skip('failing in py3')
     def test_subscript_subranges_equal(self):
         from.test_utils import runner, assert_frames_close
         output, canon = runner('test-models/tests/subscript_subranges_equal/test_subscript_subrange_equal.mdl')
         assert_frames_close(output, canon, rtol=rtol)
 
-    # @unittest.skip('in branch')
+    @unittest.skip('in branch')
     def test_subscript_switching(self):
         from.test_utils import runner, assert_frames_close
         output, canon = runner('test-models/tests/subscript_switching/subscript_switching.mdl')
diff --git a/tests/test-models b/tests/test-models
index 630fb864..f05e0dff 160000
--- a/tests/test-models
+++ b/tests/test-models
@@ -1 +1 @@
-Subproject commit 630fb864fe7d509c32656bcb0a3831e46521a9f7
+Subproject commit f05e0dff30736f0c3a7c656519d3579e90f742cf