diff --git a/fastcore/_nbdev.py b/fastcore/_nbdev.py index f97c7ec8..915dec87 100644 --- a/fastcore/_nbdev.py +++ b/fastcore/_nbdev.py @@ -19,136 +19,103 @@ "test_fig_exists": "00_test.ipynb", "ExceptionExpected": "00_test.ipynb", "exception": "00_test.ipynb", - "defaults": "01_foundation.ipynb", - "copy_func": "01_foundation.ipynb", - "patch_to": "01_foundation.ipynb", - "patch": "01_foundation.ipynb", - "patch_property": "01_foundation.ipynb", - "add_docs": "01_foundation.ipynb", - "docs": "01_foundation.ipynb", - "custom_dir": "01_foundation.ipynb", - "arg0": "01_foundation.ipynb", - "arg1": "01_foundation.ipynb", - "arg2": "01_foundation.ipynb", - "arg3": "01_foundation.ipynb", - "arg4": "01_foundation.ipynb", - "coll_repr": "01_foundation.ipynb", - "is_bool": "01_foundation.ipynb", - "mask2idxs": "01_foundation.ipynb", - "cycle": "01_foundation.ipynb", - "zip_cycle": "01_foundation.ipynb", - "is_indexer": "01_foundation.ipynb", - "negate_func": "01_foundation.ipynb", - "GetAttr": "01_foundation.ipynb", - "delegate_attr": "01_foundation.ipynb", - "bind": "01_foundation.ipynb", - "argwhere": "01_foundation.ipynb", - "map_ex": "01_foundation.ipynb", - "filter_ex": "01_foundation.ipynb", - "range_of": "02_utils.ipynb", - "sorted_ex": "01_foundation.ipynb", - "listable_types": "01_foundation.ipynb", - "renumerate": "01_foundation.ipynb", - "first": "01_foundation.ipynb", - "nested_attr": "01_foundation.ipynb", - "stop": "01_foundation.ipynb", - "tst": "01_foundation.ipynb", - "tst2": "01_foundation.ipynb", - "CollBase": "01_foundation.ipynb", - "L": "01_foundation.ipynb", - "L.__signature__": "01_foundation.ipynb", - "save_config_file": "01_foundation.ipynb", - "read_config_file": "01_foundation.ipynb", - "Config": "01_foundation.ipynb", - "ifnone": "02_utils.ipynb", - "maybe_attr": "02_utils.ipynb", - "basic_repr": "02_utils.ipynb", - "get_class": "02_utils.ipynb", - "mk_class": "02_utils.ipynb", - "wrap_class": "02_utils.ipynb", - "ignore_exceptions": 
"02_utils.ipynb", - "exec_local": "02_utils.ipynb", - "risinstance": "02_utils.ipynb", - "Inf": "02_utils.ipynb", - "in_": "02_utils.ipynb", - "operator.in_": "02_utils.ipynb", - "true": "02_utils.ipynb", - "gen": "02_utils.ipynb", - "chunked": "02_utils.ipynb", - "otherwise": "02_utils.ipynb", - "AttrDict": "02_utils.ipynb", - "dict2obj": "02_utils.ipynb", - "with_cast": "02_utils.ipynb", - "store_attr": "02_utils.ipynb", - "attrdict": "02_utils.ipynb", - "properties": "02_utils.ipynb", - "camel2snake": "02_utils.ipynb", - "snake2camel": "02_utils.ipynb", - "class2attr": "02_utils.ipynb", - "hasattrs": "02_utils.ipynb", - "setattrs": "02_utils.ipynb", - "try_attrs": "02_utils.ipynb", - "ShowPrint": "02_utils.ipynb", - "Int": "02_utils.ipynb", - "Str": "02_utils.ipynb", - "Float": "02_utils.ipynb", - "tuplify": "02_utils.ipynb", - "detuplify": "02_utils.ipynb", - "replicate": "02_utils.ipynb", - "uniqueify": "02_utils.ipynb", - "setify": "02_utils.ipynb", - "merge": "02_utils.ipynb", - "is_listy": "02_utils.ipynb", - "groupby": "02_utils.ipynb", - "last_index": "02_utils.ipynb", - "shufflish": "02_utils.ipynb", - "filter_dict": "02_utils.ipynb", - "filter_keys": "02_utils.ipynb", - "filter_values": "02_utils.ipynb", - "IterLen": "02_utils.ipynb", - "ReindexCollection": "02_utils.ipynb", - "num_methods": "02_utils.ipynb", - "rnum_methods": "02_utils.ipynb", - "inum_methods": "02_utils.ipynb", - "fastuple": "02_utils.ipynb", - "trace": "02_utils.ipynb", - "compose": "02_utils.ipynb", - "maps": "02_utils.ipynb", - "partialler": "02_utils.ipynb", - "mapped": "02_utils.ipynb", - "instantiate": "02_utils.ipynb", - "using_attr": "02_utils.ipynb", - "Self": "02_utils.ipynb", - "Path.readlines": "02_utils.ipynb", - "Path.mk_write": "02_utils.ipynb", - "Path.ls": "02_utils.ipynb", - "open_file": "02_utils.ipynb", - "save_pickle": "02_utils.ipynb", - "load_pickle": "02_utils.ipynb", - "Path.__repr__": "02_utils.ipynb", - "bunzip": "02_utils.ipynb", - "join_path_file": 
"02_utils.ipynb", - "urlread": "02_utils.ipynb", - "urljson": "02_utils.ipynb", - "run": "02_utils.ipynb", - "do_request": "02_utils.ipynb", - "sort_by_run": "02_utils.ipynb", - "PrettyString": "02_utils.ipynb", - "round_multiple": "02_utils.ipynb", - "even_mults": "02_utils.ipynb", - "num_cpus": "02_utils.ipynb", - "defaults.cpus": "02_utils.ipynb", - "add_props": "02_utils.ipynb", - "ContextManagers": "02_utils.ipynb", - "typed": "02_utils.ipynb", - "str2bool": "02_utils.ipynb", - "set_num_threads": "02_utils.ipynb", - "ProcessPoolExecutor": "02_utils.ipynb", - "ThreadPoolExecutor": "02_utils.ipynb", - "parallel": "02_utils.ipynb", - "run_procs": "02_utils.ipynb", - "parallel_gen": "02_utils.ipynb", - "threaded": "02_utils.ipynb", + "defaults": "01_basics.ipynb", + "ifnone": "01_basics.ipynb", + "maybe_attr": "01_basics.ipynb", + "basic_repr": "01_basics.ipynb", + "is_array": "01_basics.ipynb", + "listify": "01_basics.ipynb", + "get_class": "01_basics.ipynb", + "mk_class": "01_basics.ipynb", + "wrap_class": "01_basics.ipynb", + "ignore_exceptions": "01_basics.ipynb", + "exec_local": "01_basics.ipynb", + "risinstance": "01_basics.ipynb", + "Inf": "01_basics.ipynb", + "in_": "01_basics.ipynb", + "operator.in_": "01_basics.ipynb", + "true": "01_basics.ipynb", + "stop": "01_basics.ipynb", + "gen": "01_basics.ipynb", + "chunked": "01_basics.ipynb", + "otherwise": "01_basics.ipynb", + "AttrDict": "01_basics.ipynb", + "with_cast": "01_basics.ipynb", + "store_attr": "01_basics.ipynb", + "attrdict": "01_basics.ipynb", + "properties": "01_basics.ipynb", + "camel2snake": "01_basics.ipynb", + "snake2camel": "01_basics.ipynb", + "class2attr": "01_basics.ipynb", + "hasattrs": "01_basics.ipynb", + "setattrs": "01_basics.ipynb", + "try_attrs": "01_basics.ipynb", + "ShowPrint": "01_basics.ipynb", + "Int": "01_basics.ipynb", + "Str": "01_basics.ipynb", + "Float": "01_basics.ipynb", + "detuplify": "01_basics.ipynb", + "replicate": "01_basics.ipynb", + "setify": "01_basics.ipynb", + 
"merge": "01_basics.ipynb", + "range_of": "02_foundation.ipynb", + "groupby": "01_basics.ipynb", + "last_index": "01_basics.ipynb", + "filter_dict": "01_basics.ipynb", + "filter_keys": "01_basics.ipynb", + "filter_values": "01_basics.ipynb", + "cycle": "02_foundation.ipynb", + "zip_cycle": "02_foundation.ipynb", + "sorted_ex": "01_basics.ipynb", + "num_methods": "01_basics.ipynb", + "rnum_methods": "01_basics.ipynb", + "inum_methods": "01_basics.ipynb", + "fastuple": "01_basics.ipynb", + "compose": "01_basics.ipynb", + "maps": "01_basics.ipynb", + "partialler": "01_basics.ipynb", + "instantiate": "01_basics.ipynb", + "using_attr": "01_basics.ipynb", + "Self": "01_basics.ipynb", + "PrettyString": "01_basics.ipynb", + "even_mults": "01_basics.ipynb", + "num_cpus": "01_basics.ipynb", + "defaults.cpus": "01_basics.ipynb", + "add_props": "01_basics.ipynb", + "typed": "01_basics.ipynb", + "copy_func": "02_foundation.ipynb", + "patch_to": "02_foundation.ipynb", + "patch": "02_foundation.ipynb", + "patch_property": "02_foundation.ipynb", + "add_docs": "02_foundation.ipynb", + "docs": "02_foundation.ipynb", + "custom_dir": "02_foundation.ipynb", + "arg0": "02_foundation.ipynb", + "arg1": "02_foundation.ipynb", + "arg2": "02_foundation.ipynb", + "arg3": "02_foundation.ipynb", + "arg4": "02_foundation.ipynb", + "coll_repr": "02_foundation.ipynb", + "is_bool": "02_foundation.ipynb", + "mask2idxs": "02_foundation.ipynb", + "is_indexer": "02_foundation.ipynb", + "negate_func": "02_foundation.ipynb", + "GetAttr": "02_foundation.ipynb", + "delegate_attr": "02_foundation.ipynb", + "bind": "02_foundation.ipynb", + "argwhere": "02_foundation.ipynb", + "map_ex": "02_foundation.ipynb", + "filter_ex": "02_foundation.ipynb", + "listable_types": "02_foundation.ipynb", + "renumerate": "02_foundation.ipynb", + "first": "02_foundation.ipynb", + "nested_attr": "02_foundation.ipynb", + "CollBase": "02_foundation.ipynb", + "L": "02_foundation.ipynb", + "L.__signature__": "02_foundation.ipynb", 
+ "save_config_file": "02_foundation.ipynb", + "read_config_file": "02_foundation.ipynb", + "Config": "02_foundation.ipynb", "type_hints": "03_dispatch.ipynb", "anno_ret": "03_dispatch.ipynb", "lenient_issubclass": "03_dispatch.ipynb", @@ -161,6 +128,40 @@ "retain_type": "03_dispatch.ipynb", "retain_types": "03_dispatch.ipynb", "explode_types": "03_dispatch.ipynb", + "dict2obj": "03_xtras.ipynb", + "tuplify": "03_xtras.ipynb", + "uniqueify": "03_xtras.ipynb", + "is_listy": "03_xtras.ipynb", + "shufflish": "03_xtras.ipynb", + "mapped": "03_xtras.ipynb", + "IterLen": "03_xtras.ipynb", + "ReindexCollection": "03_xtras.ipynb", + "Path.readlines": "03_xtras.ipynb", + "Path.mk_write": "03_xtras.ipynb", + "Path.ls": "03_xtras.ipynb", + "open_file": "03_xtras.ipynb", + "save_pickle": "03_xtras.ipynb", + "load_pickle": "03_xtras.ipynb", + "Path.__repr__": "03_xtras.ipynb", + "bunzip": "03_xtras.ipynb", + "join_path_file": "03_xtras.ipynb", + "urlread": "03_xtras.ipynb", + "urljson": "03_xtras.ipynb", + "run": "03_xtras.ipynb", + "do_request": "03_xtras.ipynb", + "sort_by_run": "03_xtras.ipynb", + "trace": "03_xtras.ipynb", + "round_multiple": "03_xtras.ipynb", + "modified_env": "03_xtras.ipynb", + "ContextManagers": "03_xtras.ipynb", + "str2bool": "03_xtras.ipynb", + "set_num_threads": "03_xtras.ipynb", + "ProcessPoolExecutor": "03_xtras.ipynb", + "ThreadPoolExecutor": "03_xtras.ipynb", + "parallel": "03_xtras.ipynb", + "run_procs": "03_xtras.ipynb", + "parallel_gen": "03_xtras.ipynb", + "threaded": "03_xtras.ipynb", "Transform": "04_transform.ipynb", "InplaceTransform": "04_transform.ipynb", "DisplayedTransform": "04_transform.ipynb", @@ -195,9 +196,10 @@ "call_parse": "07_script.ipynb"} modules = ["test.py", + "basics.py", "foundation.py", - "utils.py", "dispatch.py", + "xtras.py", "transform.py", "logargs.py", "meta.py", diff --git a/fastcore/basics.py b/fastcore/basics.py new file mode 100644 index 00000000..baf7215e --- /dev/null +++ b/fastcore/basics.py @@ -0,0 +1,541 
@@ +# AUTOGENERATED! DO NOT EDIT! File to edit: nbs/01_basics.ipynb (unless otherwise specified). + +__all__ = ['defaults', 'ifnone', 'maybe_attr', 'basic_repr', 'is_array', 'listify', 'get_class', 'mk_class', + 'wrap_class', 'ignore_exceptions', 'exec_local', 'risinstance', 'Inf', 'in_', 'lt', 'gt', 'le', 'ge', 'eq', + 'ne', 'add', 'sub', 'mul', 'truediv', 'is_', 'is_not', 'in_', 'true', 'stop', 'gen', 'chunked', 'otherwise', + 'AttrDict', 'with_cast', 'store_attr', 'attrdict', 'properties', 'camel2snake', 'snake2camel', 'class2attr', + 'hasattrs', 'setattrs', 'try_attrs', 'ShowPrint', 'Int', 'Str', 'Float', 'detuplify', 'replicate', 'setify', + 'merge', 'range_of', 'groupby', 'last_index', 'filter_dict', 'filter_keys', 'filter_values', 'cycle', + 'zip_cycle', 'sorted_ex', 'num_methods', 'rnum_methods', 'inum_methods', 'fastuple', 'compose', 'maps', + 'partialler', 'instantiate', 'using_attr', 'Self', 'Self', 'PrettyString', 'even_mults', 'num_cpus', + 'add_props', 'typed'] + +# Cell +from .imports import * + +# Cell +defaults = SimpleNamespace() + +# Cell +def ifnone(a, b): + "`b` if `a` is None else `a`" + return b if a is None else a + +# Cell +def maybe_attr(o, attr): + "`getattr(o,attr,o)`" + return getattr(o,attr,o) + +# Cell +def basic_repr(flds=None): + if isinstance(flds, str): flds = re.split(', *', flds) + flds = list(flds or []) + def _f(self): + sig = ', '.join(f'{o}={maybe_attr(getattr(self,o), "__name__")}' for o in flds) + return f'{self.__class__.__name__}({sig})' + return _f + +# Cell +def is_array(x): return hasattr(x,'__array__') or hasattr(x,'iloc') + +def listify(o): + if o is None: return [] + if isinstance(o, list): return o + if isinstance(o, str) or is_array(o): return [o] + if is_iter(o): return list(o) + return [o] + +# Cell +def get_class(nm, *fld_names, sup=None, doc=None, funcs=None, **flds): + "Dynamically create a class, optionally inheriting from `sup`, containing `fld_names`" + attrs = {} + for f in fld_names: attrs[f] = None + 
for f in listify(funcs): attrs[f.__name__] = f + for k,v in flds.items(): attrs[k] = v + sup = ifnone(sup, ()) + if not isinstance(sup, tuple): sup=(sup,) + + def _init(self, *args, **kwargs): + for i,v in enumerate(args): setattr(self, list(attrs.keys())[i], v) + for k,v in kwargs.items(): setattr(self,k,v) + + all_flds = [*fld_names,*flds.keys()] + def _eq(self,b): + return all([getattr(self,k)==getattr(b,k) for k in all_flds]) + + if not sup: attrs['__repr__'] = basic_repr(all_flds) + attrs['__init__'] = _init + attrs['__eq__'] = _eq + res = type(nm, sup, attrs) + if doc is not None: res.__doc__ = doc + return res + +# Cell +def mk_class(nm, *fld_names, sup=None, doc=None, funcs=None, mod=None, **flds): + "Create a class using `get_class` and add to the caller's module" + if mod is None: mod = sys._getframe(1).f_locals + res = get_class(nm, *fld_names, sup=sup, doc=doc, funcs=funcs, **flds) + mod[nm] = res + +# Cell +def wrap_class(nm, *fld_names, sup=None, doc=None, funcs=None, **flds): + "Decorator: makes function a method of a new class `nm` passing parameters to `mk_class`" + def _inner(f): + mk_class(nm, *fld_names, sup=sup, doc=doc, funcs=listify(funcs)+[f], mod=f.__globals__, **flds) + return f + return _inner + +# Cell +class ignore_exceptions: + "Context manager to ignore exceptions" + def __enter__(self): pass + def __exit__(self, *args): return True + +# Cell +def exec_local(code, var_name): + "Call `exec` on `code` and return the var `var_name" + loc = {} + exec(code, globals(), loc) + return loc[var_name] + +# Cell +def risinstance(types, obj=None): + "Curried `isinstance` but with args reversed" + if not obj: return partial(risinstance,types) + return isinstance(obj, types) + +# Cell +#hide +class _InfMeta(type): + @property + def count(self): return itertools.count() + @property + def zeros(self): return itertools.cycle([0]) + @property + def ones(self): return itertools.cycle([1]) + @property + def nones(self): return itertools.cycle([None]) + +# 
Cell +class Inf(metaclass=_InfMeta): + "Infinite lists" + pass + +# Cell +_dumobj = object() +def _oper(op,a,b=_dumobj): return (lambda o:op(o,a)) if b is _dumobj else op(a,b) + +def _mk_op(nm, mod): + "Create an operator using `oper` and add to the caller's module" + op = getattr(operator,nm) + def _inner(a, b=_dumobj): return _oper(op, a,b) + _inner.__name__ = _inner.__qualname__ = nm + _inner.__doc__ = f'Same as `operator.{nm}`, or returns partial if 1 arg' + mod[nm] = _inner + +# Cell +def in_(x, a): + "`True` if `x in a`" + return x in a + +operator.in_ = in_ + +# Cell +#nbdev_comment _all_ = ['lt','gt','le','ge','eq','ne','add','sub','mul','truediv','is_','is_not','in_'] + +# Cell +for op in ['lt','gt','le','ge','eq','ne','add','sub','mul','truediv','is_','is_not','in_']: _mk_op(op, globals()) + +# Cell +def true(*args, **kwargs): + "Predicate: always `True`" + return True + +# Cell +def stop(e=StopIteration): + "Raises exception `e` (by default `StopException`)" + raise e + +# Cell +def gen(func, seq, cond=true): + "Like `(func(o) for o in seq if cond(func(o)))` but handles `StopIteration`" + return itertools.takewhile(cond, map(func,seq)) + +# Cell +def chunked(it, chunk_sz=None, drop_last=False, n_chunks=None): + "Return batches from iterator `it` of size `chunk_sz` (or return `n_chunks` total)" + assert bool(chunk_sz) ^ bool(n_chunks) + if n_chunks: chunk_sz = math.ceil(len(it)/n_chunks) + if not isinstance(it, Iterator): it = iter(it) + while True: + res = list(itertools.islice(it, chunk_sz)) + if res and (len(res)==chunk_sz or not drop_last): yield res + if len(res) 0 else itertools.cycle([None]) + +# Cell +def zip_cycle(x, *args): + "Like `itertools.zip_longest` but `cycle`s through elements of all but first argument" + return zip(x, *map(cycle,args)) + +# Cell +def sorted_ex(iterable, key=None, reverse=False): + "Like `sorted`, but if key is str use `attrgetter`; if int use `itemgetter`" + if isinstance(key,str): k=lambda o:getattr(o,key,0) + elif 
isinstance(key,int): k=itemgetter(key) + else: k=key + return sorted(iterable, key=k, reverse=reverse) + +# Cell +num_methods = """ + __add__ __sub__ __mul__ __matmul__ __truediv__ __floordiv__ __mod__ __divmod__ __pow__ + __lshift__ __rshift__ __and__ __xor__ __or__ __neg__ __pos__ __abs__ +""".split() +rnum_methods = """ + __radd__ __rsub__ __rmul__ __rmatmul__ __rtruediv__ __rfloordiv__ __rmod__ __rdivmod__ + __rpow__ __rlshift__ __rrshift__ __rand__ __rxor__ __ror__ +""".split() +inum_methods = """ + __iadd__ __isub__ __imul__ __imatmul__ __itruediv__ + __ifloordiv__ __imod__ __ipow__ __ilshift__ __irshift__ __iand__ __ixor__ __ior__ +""".split() + +# Cell +class fastuple(tuple): + "A `tuple` with elementwise ops and more friendly __init__ behavior" + def __new__(cls, x=None, *rest): + if x is None: x = () + if not isinstance(x,tuple): + if len(rest): x = (x,) + else: + try: x = tuple(iter(x)) + except TypeError: x = (x,) + return super().__new__(cls, x+rest if rest else x) + + def _op(self,op,*args): + if not isinstance(self,fastuple): self = fastuple(self) + return type(self)(map(op,self,*map(cycle, args))) + + def mul(self,*args): + "`*` is already defined in `tuple` for replicating, so use `mul` instead" + return fastuple._op(self, operator.mul,*args) + + def add(self,*args): + "`+` is already defined in `tuple` for concat, so use `add` instead" + return fastuple._op(self, operator.add,*args) + +def _get_op(op): + if isinstance(op,str): op = getattr(operator,op) + def _f(self,*args): return self._op(op,*args) + return _f + +for n in num_methods: + if not hasattr(fastuple, n) and hasattr(operator,n): setattr(fastuple,n,_get_op(n)) + +for n in 'eq ne lt le gt ge'.split(): setattr(fastuple,n,_get_op(n)) +setattr(fastuple,'__invert__',_get_op('__not__')) +setattr(fastuple,'max',_get_op(max)) +setattr(fastuple,'min',_get_op(min)) + +# Cell +def compose(*funcs, order=None): + "Create a function that composes all functions in `funcs`, passing along remaining 
`*args` and `**kwargs` to all" + funcs = listify(funcs) + if len(funcs)==0: return noop + if len(funcs)==1: return funcs[0] + if order is not None: funcs = sorted_ex(funcs, key=order) + def _inner(x, *args, **kwargs): + for f in funcs: x = f(x, *args, **kwargs) + return x + return _inner + +# Cell +def maps(*args, retain=noop): + "Like `map`, except funcs are composed first" + f = compose(*args[:-1]) + def _f(b): return retain(f(b), b) + return map(_f, args[-1]) + +# Cell +def partialler(f, *args, order=None, **kwargs): + "Like `functools.partial` but also copies over docstring" + fnew = partial(f,*args,**kwargs) + fnew.__doc__ = f.__doc__ + if order is not None: fnew.order=order + elif hasattr(f,'order'): fnew.order=f.order + return fnew + +# Cell +def instantiate(t): + "Instantiate `t` if it's a type, otherwise do nothing" + return t() if isinstance(t, type) else t + +# Cell +def _using_attr(f, attr, x): return f(getattr(x,attr)) + +# Cell +def using_attr(f, attr): + "Change function `f` to operate on `attr`" + return partial(_using_attr, f, attr) + +# Cell +class _Self: + "An alternative to `lambda` for calling methods on passed object." 
+ def __init__(self): self.nms,self.args,self.kwargs,self.ready = [],[],[],True + def __repr__(self): return f'self: {self.nms}({self.args}, {self.kwargs})' + + def __call__(self, *args, **kwargs): + if self.ready: + x = args[0] + for n,a,k in zip(self.nms,self.args,self.kwargs): + x = getattr(x,n) + if callable(x) and a is not None: x = x(*a, **k) + return x + else: + self.args.append(args) + self.kwargs.append(kwargs) + self.ready = True + return self + + def __getattr__(self,k): + if not self.ready: + self.args.append(None) + self.kwargs.append(None) + self.nms.append(k) + self.ready = False + return self + +# Cell +class _SelfCls: + def __getattr__(self,k): return getattr(_Self(),k) + def __getitem__(self,i): return self.__getattr__('__getitem__')(i) + +Self = _SelfCls() + +# Cell +#nbdev_comment _all_ = ['Self'] + +# Cell +class PrettyString(str): + "Little hack to get strings to show properly in Jupyter." + def __repr__(self): return self + +# Cell +def even_mults(start, stop, n): + "Build log-stepped array from `start` to `stop` in `n` steps." 
+ if n==1: return stop + mult = stop/start + step = mult**(1/(n-1)) + return [start*(step**i) for i in range(n)] + +# Cell +def num_cpus(): + "Get number of cpus" + try: return len(os.sched_getaffinity(0)) + except AttributeError: return os.cpu_count() + +defaults.cpus = num_cpus() + +# Cell +def add_props(f, g=None, n=2): + "Create properties passing each of `range(n)` to f" + if g is None: return (property(partial(f,i)) for i in range(n)) + return (property(partial(f,i), partial(g,i)) for i in range(n)) + +# Cell +def _typeerr(arg, val, typ): return TypeError(f"{arg}=={val} not {typ}") + +# Cell +def typed(f): + "Decorator to check param and return types at runtime" + names = f.__code__.co_varnames + anno = f.__annotations__ + ret = anno.pop('return',None) + def _f(*args,**kwargs): + kw = {**kwargs} + if len(anno) > 0: + for i,arg in enumerate(args): kw[names[i]] = arg + for k,v in kw.items(): + if not isinstance(v,anno[k]): raise _typeerr(k, v, anno[k]) + res = f(*args,**kwargs) + if ret is not None and not isinstance(res,ret): raise _typeerr("return", res, ret) + return res + return functools.update_wrapper(_f, f) \ No newline at end of file diff --git a/fastcore/foundation.py b/fastcore/foundation.py index 0d83c5bc..b3c975cb 100644 --- a/fastcore/foundation.py +++ b/fastcore/foundation.py @@ -1,22 +1,19 @@ -# AUTOGENERATED! DO NOT EDIT! File to edit: nbs/01_foundation.ipynb (unless otherwise specified). +# AUTOGENERATED! DO NOT EDIT! File to edit: nbs/02_foundation.ipynb (unless otherwise specified). 
-__all__ = ['defaults', 'copy_func', 'patch_to', 'patch', 'patch_property', 'add_docs', 'docs', 'custom_dir', 'arg0', - 'arg1', 'arg2', 'arg3', 'arg4', 'coll_repr', 'is_bool', 'mask2idxs', 'cycle', 'zip_cycle', 'is_indexer', - 'negate_func', 'GetAttr', 'delegate_attr', 'bind', 'argwhere', 'map_ex', 'filter_ex', 'range_of', - 'sorted_ex', 'listable_types', 'renumerate', 'first', 'nested_attr', 'stop', 'tst', 'tst2', 'CollBase', 'L', - 'save_config_file', 'read_config_file', 'Config'] +__all__ = ['copy_func', 'patch_to', 'patch', 'patch_property', 'add_docs', 'docs', 'custom_dir', 'arg0', 'arg1', 'arg2', + 'arg3', 'arg4', 'coll_repr', 'is_bool', 'mask2idxs', 'cycle', 'zip_cycle', 'is_indexer', 'negate_func', + 'GetAttr', 'delegate_attr', 'bind', 'argwhere', 'map_ex', 'filter_ex', 'range_of', 'listable_types', + 'renumerate', 'first', 'nested_attr', 'CollBase', 'L', 'save_config_file', 'read_config_file', 'Config'] # Cell from .imports import * +from .basics import * from functools import lru_cache from contextlib import contextmanager from copy import copy from configparser import ConfigParser import random,pickle -# Cell -defaults = SimpleNamespace() - # Cell def copy_func(f): "Copy a non-builtin function (NB `copy.copy` does not work for this)" @@ -113,20 +110,10 @@ def mask2idxs(mask): if is_bool(it): return [i for i,m in enumerate(mask) if m] return [int(i) for i in mask] -# Cell -def _is_array(x): return hasattr(x,'__array__') or hasattr(x,'iloc') - -def _listify(o): - if o is None: return [] - if isinstance(o, list): return o - if isinstance(o, str) or _is_array(o): return [o] - if is_iter(o): return list(o) - return [o] - # Cell def cycle(o): "Like `itertools.cycle` except creates list of `None`s if `o` is empty" - o = _listify(o) + o = listify(o) return itertools.cycle(o) if o is not None and len(o) > 0 else itertools.cycle([None]) # Cell @@ -217,14 +204,6 @@ def range_of(a, b=None, step=None): if is_coll(a): a = len(a) return list(range(a,b,step) if step is 
not None else range(a,b) if b is not None else range(a)) -# Cell -def sorted_ex(iterable, key=None, reverse=False): - "Like `sorted`, but if key is str use `attrgetter`; if int use `itemgetter`" - if isinstance(key,str): k=lambda o:getattr(o,key,0) - elif isinstance(key,int): k=itemgetter(key) - else: k=key - return sorted(iterable, key=k, reverse=reverse) - # Cell listable_types = typing.Collection,Generator,map,filter,zip @@ -247,23 +226,6 @@ def nested_attr(o, attr, default=None): except AttributeError: return default return o -# Cell -def stop(e=StopIteration): - "Raises exception `e` (by default `StopException`)" - raise e - -def tst(): - try: - stop() - except StopIteration: - return True - -def tst2(): - try: - stop(e=ValueError) - except ValueError: - return True - # Cell class CollBase: "Base class for composing a list of `items`" @@ -288,8 +250,8 @@ class L(GetAttr, CollBase, metaclass=_L_Meta): def __init__(self, items=None, *rest, use_list=False, match=None): if rest: items = (items,)+rest if items is None: items = [] - if (use_list is not None) or not _is_array(items): - items = list(items) if use_list else _listify(items) + if (use_list is not None) or not is_array(items): + items = list(items) if use_list else listify(items) if match is not None: if is_coll(match): match = len(match) if len(items)==1: items = items*match @@ -313,7 +275,7 @@ def __setitem__(self, idx, o): "Set `idx` (can be list of indices, or mask, or int) items to `o` (which is broadcast if not iterable)" if isinstance(idx, int): self.items[idx] = o else: - idx = idx if isinstance(idx,L) else _listify(idx) + idx = idx if isinstance(idx,L) else listify(idx) if not is_iter(o): o = [o]*len(idx) for i,o_ in zip(idx,o): self.items[i] = o_ @@ -329,9 +291,9 @@ def __reversed__(self): return self._new(reversed(self.items)) def __invert__(self): return self._new(not i for i in self) def __repr__(self): return repr(self.items) def _repr_pretty_(self, p, cycle): - p.text('...' 
if cycle else repr(self.items) if _is_array(self.items) else coll_repr(self)) + p.text('...' if cycle else repr(self.items) if is_array(self.items) else coll_repr(self)) def __mul__ (a,b): return a._new(a.items*b) - def __add__ (a,b): return a._new(a.items+_listify(b)) + def __add__ (a,b): return a._new(a.items+listify(b)) def __radd__(a,b): return a._new(b)+a def __addi__(a,b): a.items += list(b) diff --git a/fastcore/test.py b/fastcore/test.py index 9515793d..16aac98f 100644 --- a/fastcore/test.py +++ b/fastcore/test.py @@ -6,7 +6,6 @@ # Cell from .imports import * -from .utils import * from collections import Counter from contextlib import redirect_stdout @@ -102,7 +101,7 @@ def test_fig_exists(ax): # Cell class ExceptionExpected: "Context manager that tests if an exception is raised" - def __init__(self, ex=Exception, regex=''): store_attr() + def __init__(self, ex=Exception, regex=''): self.ex,self.regex = ex,regex def __enter__(self): pass def __exit__(self, type, value, traceback): if not isinstance(value, self.ex) or (self.regex and not re.search(self.regex, f'{value.args}')): diff --git a/fastcore/utils.py b/fastcore/utils.py index 12154310..a98d8f02 100644 --- a/fastcore/utils.py +++ b/fastcore/utils.py @@ -1,865 +1,5 @@ -# AUTOGENERATED! DO NOT EDIT! File to edit: nbs/02_utils.ipynb (unless otherwise specified). 
- -__all__ = ['ifnone', 'maybe_attr', 'basic_repr', 'get_class', 'mk_class', 'wrap_class', 'ignore_exceptions', - 'exec_local', 'risinstance', 'Inf', 'in_', 'lt', 'gt', 'le', 'ge', 'eq', 'ne', 'add', 'sub', 'mul', - 'truediv', 'is_', 'is_not', 'in_', 'true', 'gen', 'chunked', 'otherwise', 'AttrDict', 'dict2obj', - 'with_cast', 'store_attr', 'attrdict', 'properties', 'camel2snake', 'snake2camel', 'class2attr', 'hasattrs', - 'setattrs', 'try_attrs', 'ShowPrint', 'Int', 'Str', 'Float', 'tuplify', 'detuplify', 'replicate', - 'uniqueify', 'setify', 'merge', 'is_listy', 'range_of', 'groupby', 'last_index', 'shufflish', 'filter_dict', - 'filter_keys', 'filter_values', 'IterLen', 'ReindexCollection', 'num_methods', 'rnum_methods', - 'inum_methods', 'fastuple', 'trace', 'compose', 'maps', 'partialler', 'mapped', 'instantiate', 'using_attr', - 'Self', 'Self', 'open_file', 'save_pickle', 'load_pickle', 'bunzip', 'join_path_file', 'urlread', 'urljson', - 'run', 'do_request', 'sort_by_run', 'PrettyString', 'round_multiple', 'even_mults', 'num_cpus', 'add_props', - 'ContextManagers', 'typed', 'str2bool', 'set_num_threads', 'ProcessPoolExecutor', 'ThreadPoolExecutor', - 'parallel', 'run_procs', 'parallel_gen', 'threaded'] - -# Cell from .imports import * -from .foundation import * -from functools import wraps - -import mimetypes,bz2,pickle,random,json,urllib,subprocess,shlex,bz2,gzip,distutils.util -from contextlib import contextmanager -from pdb import set_trace -from urllib.request import Request,urlopen -from urllib.error import HTTPError -from urllib.parse import urlencode -from threading import Thread - -# Cell -def ifnone(a, b): - "`b` if `a` is None else `a`" - return b if a is None else a - -# Cell -def maybe_attr(o, attr): - "`getattr(o,attr,o)`" - return getattr(o,attr,o) - -# Cell -def basic_repr(flds=None): - if isinstance(flds, str): flds = re.split(', *', flds) - flds = L(flds) - def _f(self): - sig = ', '.join(f'{o}={maybe_attr(getattr(self,o), "__name__")}' for o 
in flds) - return f'{self.__class__.__name__}({sig})' - return _f - -# Cell -def get_class(nm, *fld_names, sup=None, doc=None, funcs=None, **flds): - "Dynamically create a class, optionally inheriting from `sup`, containing `fld_names`" - attrs = {} - for f in fld_names: attrs[f] = None - for f in L(funcs): attrs[f.__name__] = f - for k,v in flds.items(): attrs[k] = v - sup = ifnone(sup, ()) - if not isinstance(sup, tuple): sup=(sup,) - - def _init(self, *args, **kwargs): - for i,v in enumerate(args): setattr(self, list(attrs.keys())[i], v) - for k,v in kwargs.items(): setattr(self,k,v) - - all_flds = [*fld_names,*flds.keys()] - def _eq(self,b): - return all([getattr(self,k)==getattr(b,k) for k in all_flds]) - - if not sup: attrs['__repr__'] = basic_repr(all_flds) - attrs['__init__'] = _init - attrs['__eq__'] = _eq - res = type(nm, sup, attrs) - if doc is not None: res.__doc__ = doc - return res - -# Cell -def mk_class(nm, *fld_names, sup=None, doc=None, funcs=None, mod=None, **flds): - "Create a class using `get_class` and add to the caller's module" - if mod is None: mod = sys._getframe(1).f_locals - res = get_class(nm, *fld_names, sup=sup, doc=doc, funcs=funcs, **flds) - mod[nm] = res - -# Cell -def wrap_class(nm, *fld_names, sup=None, doc=None, funcs=None, **flds): - "Decorator: makes function a method of a new class `nm` passing parameters to `mk_class`" - def _inner(f): - mk_class(nm, *fld_names, sup=sup, doc=doc, funcs=L(funcs)+f, mod=f.__globals__, **flds) - return f - return _inner - -# Cell -class ignore_exceptions: - "Context manager to ignore exceptions" - def __enter__(self): pass - def __exit__(self, *args): return True - -# Cell -def exec_local(code, var_name): - "Call `exec` on `code` and return the var `var_name" - loc = {} - exec(code, globals(), loc) - return loc[var_name] - -# Cell -def risinstance(types, obj=None): - "Curried `isinstance` but with args reversed" - if not obj: return partial(risinstance,types) - return isinstance(obj, types) - 
-# Cell -#hide -class _InfMeta(type): - @property - def count(self): return itertools.count() - @property - def zeros(self): return itertools.cycle([0]) - @property - def ones(self): return itertools.cycle([1]) - @property - def nones(self): return itertools.cycle([None]) - -# Cell -class Inf(metaclass=_InfMeta): - "Infinite lists" - pass - -# Cell -_dumobj = object() -def _oper(op,a,b=_dumobj): return (lambda o:op(o,a)) if b is _dumobj else op(a,b) - -def _mk_op(nm, mod): - "Create an operator using `oper` and add to the caller's module" - op = getattr(operator,nm) - def _inner(a, b=_dumobj): return _oper(op, a,b) - _inner.__name__ = _inner.__qualname__ = nm - _inner.__doc__ = f'Same as `operator.{nm}`, or returns partial if 1 arg' - mod[nm] = _inner - -# Cell -def in_(x, a): - "`True` if `x in a`" - return x in a - -operator.in_ = in_ - -# Cell -#nbdev_comment _all_ = ['lt','gt','le','ge','eq','ne','add','sub','mul','truediv','is_','is_not','in_'] - -# Cell -for op in ['lt','gt','le','ge','eq','ne','add','sub','mul','truediv','is_','is_not','in_']: _mk_op(op, globals()) - -# Cell -def true(*args, **kwargs): - "Predicate: always `True`" - return True - -# Cell -def gen(func, seq, cond=true): - "Like `(func(o) for o in seq if cond(func(o)))` but handles `StopIteration`" - return itertools.takewhile(cond, map(func,seq)) - -# Cell -def chunked(it, chunk_sz=None, drop_last=False, n_chunks=None): - "Return batches from iterator `it` of size `chunk_sz` (or return `n_chunks` total)" - assert bool(chunk_sz) ^ bool(n_chunks) - if n_chunks: chunk_sz = math.ceil(len(it)/n_chunks) - if not isinstance(it, Iterator): it = iter(it) - while True: - res = list(itertools.islice(it, chunk_sz)) - if res and (len(res)==chunk_sz or not drop_last): yield res - if len(res) 0: - for i,arg in enumerate(args): kw[names[i]] = arg - for k,v in kw.items(): - if not isinstance(v,anno[k]): raise _typeerr(k, v, anno[k]) - res = f(*args,**kwargs) - if ret is not None and not isinstance(res,ret): 
raise _typeerr("return", res, ret) - return res - return functools.update_wrapper(_f, f) - -# Cell -def str2bool(s): - "Case-insensitive convert string `s` too a bool (`y`,`yes`,`t`,`true`,`on`,`1`->`True`)" - if not isinstance(s,str): return bool(s) - return bool(distutils.util.strtobool(s)) if s else False - -# Cell -from multiprocessing import Process, Queue -import concurrent.futures -import time -from multiprocessing import Manager - -# Cell -def set_num_threads(nt): - "Get numpy (and others) to use `nt` threads" - try: import mkl; mkl.set_num_threads(nt) - except: pass - try: import torch; torch.set_num_threads(nt) - except: pass - os.environ['IPC_ENABLE']='1' - for o in ['OPENBLAS_NUM_THREADS','NUMEXPR_NUM_THREADS','OMP_NUM_THREADS','MKL_NUM_THREADS']: - os.environ[o] = str(nt) - -# Cell -def _call(lock, pause, n, g, item): - l = False - if pause: - try: - l = lock.acquire(timeout=pause*(n+2)) - time.sleep(pause) - finally: - if l: lock.release() - return g(item) - -# Cell -class ProcessPoolExecutor(concurrent.futures.ProcessPoolExecutor): - "Same as Python's ProcessPoolExecutor, except can pass `max_workers==0` for serial execution" - def __init__(self, max_workers=defaults.cpus, on_exc=print, pause=0, **kwargs): - if max_workers is None: max_workers=defaults.cpus - store_attr() - self.not_parallel = max_workers==0 - if self.not_parallel: max_workers=1 - super().__init__(max_workers, **kwargs) - - def map(self, f, items, timeout=None, chunksize=1, *args, **kwargs): - self.lock = Manager().Lock() - g = partial(f, *args, **kwargs) - if self.not_parallel: return map(g, items) - _g = partial(_call, self.lock, self.pause, self.max_workers, g) - try: return super().map(_g, items, timeout=timeout, chunksize=chunksize) - except Exception as e: self.on_exc(e) - -# Cell -class ThreadPoolExecutor(concurrent.futures.ThreadPoolExecutor): - "Same as Python's ThreadPoolExecutor, except can pass `max_workers==0` for serial execution" - def __init__(self, 
max_workers=defaults.cpus, on_exc=print, pause=0, **kwargs): - if max_workers is None: max_workers=defaults.cpus - store_attr() - self.not_parallel = max_workers==0 - if self.not_parallel: max_workers=1 - super().__init__(max_workers, **kwargs) - - def map(self, f, items, timeout=None, chunksize=1, *args, **kwargs): - self.lock = Manager().Lock() - g = partial(f, *args, **kwargs) - if self.not_parallel: return map(g, items) - _g = partial(_call, self.lock, self.pause, self.max_workers, g) - try: return super().map(_g, items, timeout=timeout, chunksize=chunksize) - except Exception as e: self.on_exc(e) - -# Cell -try: from fastprogress import progress_bar -except: progress_bar = None - -# Cell -def parallel(f, items, *args, n_workers=defaults.cpus, total=None, progress=None, pause=0, - threadpool=False, timeout=None, chunksize=1, **kwargs): - "Applies `func` in parallel to `items`, using `n_workers`" - if progress is None: progress = progress_bar is not None - pool = ThreadPoolExecutor if threadpool else ProcessPoolExecutor - with pool(n_workers, pause=pause) as ex: - r = ex.map(f,items, *args, timeout=timeout, chunksize=chunksize, **kwargs) - if progress: - if total is None: total = len(items) - r = progress_bar(r, total=total, leave=False) - return L(r) - -# Cell -def run_procs(f, f_done, args): - "Call `f` for each item in `args` in parallel, yielding `f_done`" - processes = L(args).map(Process, args=arg0, target=f) - for o in processes: o.start() - yield from f_done() - processes.map(Self.join()) - -# Cell -def _f_pg(obj, queue, batch, start_idx): - for i,b in enumerate(obj(batch)): queue.put((start_idx+i,b)) - -def _done_pg(queue, items): return (queue.get() for _ in items) - -# Cell -def parallel_gen(cls, items, n_workers=defaults.cpus, **kwargs): - "Instantiate `cls` in `n_workers` procs & call each on a subset of `items` in parallel." 
- if n_workers==0: - yield from enumerate(list(cls(**kwargs)(items))) - return - batches = L(chunked(items, n_chunks=n_workers)) - idx = L(itertools.accumulate(0 + batches.map(len))) - queue = Queue() - if progress_bar: items = progress_bar(items, leave=False) - f=partial(_f_pg, cls(**kwargs), queue) - done=partial(_done_pg, queue, items) - yield from run_procs(f, done, L(batches,idx).zip()) +from .test import * +from .basics import * +from .xtras import * -# Cell -def threaded(f): - "Run `f` in a thread, and returns the thread" - @wraps(f) - def _f(*args, **kwargs): - res = Thread(target=f, args=args, kwargs=kwargs) - res.start() - return res - return _f \ No newline at end of file diff --git a/fastcore/xtras.py b/fastcore/xtras.py new file mode 100644 index 00000000..84aecf72 --- /dev/null +++ b/fastcore/xtras.py @@ -0,0 +1,382 @@ +# AUTOGENERATED! DO NOT EDIT! File to edit: nbs/03_xtras.ipynb (unless otherwise specified). + +__all__ = ['dict2obj', 'tuplify', 'uniqueify', 'is_listy', 'shufflish', 'mapped', 'IterLen', 'ReindexCollection', + 'open_file', 'save_pickle', 'load_pickle', 'bunzip', 'join_path_file', 'urlread', 'urljson', 'run', + 'do_request', 'sort_by_run', 'trace', 'round_multiple', 'modified_env', 'ContextManagers', 'str2bool', + 'set_num_threads', 'ProcessPoolExecutor', 'ThreadPoolExecutor', 'parallel', 'run_procs', 'parallel_gen', + 'threaded'] + +# Cell +from .imports import * +from .foundation import * +from .basics import * +from functools import wraps + +import mimetypes,bz2,pickle,random,json,urllib,subprocess,shlex,bz2,gzip,distutils.util +from contextlib import contextmanager,ExitStack +from pdb import set_trace +from urllib.request import Request,urlopen +from urllib.error import HTTPError +from urllib.parse import urlencode +from threading import Thread + +# Cell +def dict2obj(d): + "Convert (possibly nested) dicts (or lists of dicts) to `AttrDict`" + if isinstance(d, (L,list)): return L(d).map(dict2obj) + if not isinstance(d, dict): 
return d + return AttrDict(**{k:dict2obj(v) for k,v in d.items()}) + +# Cell +def tuplify(o, use_list=False, match=None): + "Make `o` a tuple" + return tuple(L(o, use_list=use_list, match=match)) + +# Cell +def uniqueify(x, sort=False, bidir=False, start=None): + "Unique elements in `x`, optionally `sort`-ed, optionally return reverse correspondence, optionally prepend with elements." + res = L(x).unique() + if start is not None: res = start+res + if sort: res.sort() + if bidir: return res, res.val2idx() + return res + +# Cell +def is_listy(x): + "`isinstance(x, (tuple,list,L,slice,Generator))`" + return isinstance(x, (tuple,list,L,slice,Generator)) + +# Cell +def shufflish(x, pct=0.04): + "Randomly relocate items of `x` up to `pct` of `len(x)` from their starting location" + n = len(x) + return L(x[i] for i in sorted(range_of(x), key=lambda o: o+n*(1+random.random()*pct))) + +# Cell +def mapped(f, it): + "map `f` over `it`, unless it's not listy, in which case return `f(it)`" + return L(it).map(f) if is_listy(it) else f(it) + +# Cell +#hide +class IterLen: + "Base class to add iteration to anything supporting `__len__` and `__getitem__`" + def __iter__(self): return (self[i] for i in range_of(self)) + +# Cell +@docs +class ReindexCollection(GetAttr, IterLen): + "Reindexes collection `coll` with indices `idxs` and optional LRU cache of size `cache`" + _default='coll' + def __init__(self, coll, idxs=None, cache=None, tfm=noop): + if idxs is None: idxs = L.range(coll) + store_attr() + if cache is not None: self._get = functools.lru_cache(maxsize=cache)(self._get) + + def _get(self, i): return self.tfm(self.coll[i]) + def __getitem__(self, i): return self._get(self.idxs[i]) + def __len__(self): return len(self.coll) + def reindex(self, idxs): self.idxs = idxs + def shuffle(self): random.shuffle(self.idxs) + def cache_clear(self): self._get.cache_clear() + def __getstate__(self): return {'coll': self.coll, 'idxs': self.idxs, 'cache': self.cache, 'tfm': self.tfm} + def 
__setstate__(self, s): self.coll,self.idxs,self.cache,self.tfm = s['coll'],s['idxs'],s['cache'],s['tfm'] + + _docs = dict(reindex="Replace `self.idxs` with idxs", + shuffle="Randomly shuffle indices", + cache_clear="Clear LRU cache") + +# Cell +@patch +def readlines(self:Path, hint=-1, encoding='utf8'): + "Read the content of `self`" + with self.open(encoding=encoding) as f: return f.readlines(hint) + +# Cell +@patch +def mk_write(self:Path, data, encoding=None, errors=None, mode=511): + "Make all parent dirs of `self`" + self.parent.mkdir(exist_ok=True, parents=True, mode=mode) + self.write_text(data, encoding=encoding, errors=errors) + +# Cell +@patch +def ls(self:Path, n_max=None, file_type=None, file_exts=None): + "Contents of path as a list" + extns=L(file_exts) + if file_type: extns += L(k for k,v in mimetypes.types_map.items() if v.startswith(file_type+'/')) + has_extns = len(extns)==0 + res = (o for o in self.iterdir() if has_extns or o.suffix in extns) + if n_max is not None: res = itertools.islice(res, n_max) + return L(res) + +# Cell +def open_file(fn, mode='r'): + "Open a file, with optional compression if gz or bz2 suffix" + if isinstance(fn, io.IOBase): return fn + fn = Path(fn) + if fn.suffix=='.bz2': return bz2.BZ2File(fn, mode) + elif fn.suffix=='.gz' : return gzip.GzipFile(fn, mode) + else: return open(fn,mode) + +# Cell +def save_pickle(fn, o): + "Save a pickle file, to a file name or opened file" + with open_file(fn, 'wb') as f: pickle.dump(o, f) + +# Cell +def load_pickle(fn): + "Load a pickle file from a file name or opened file" + with open_file(fn, 'rb') as f: return pickle.load(f) + +# Cell +@patch +def __repr__(self:Path): + b = getattr(Path, 'BASE_PATH', None) + if b: + try: self = self.relative_to(b) + except: pass + return f"Path({self.as_posix()!r})" + +# Cell +def bunzip(fn): + "bunzip `fn`, raising exception if output already exists" + fn = Path(fn) + assert fn.exists(), f"{fn} doesn't exist" + out_fn = fn.with_suffix('') + assert 
not out_fn.exists(), f"{out_fn} already exists" + with bz2.BZ2File(fn, 'rb') as src, out_fn.open('wb') as dst: + for d in iter(lambda: src.read(1024*1024), b''): dst.write(d) + +# Cell +def join_path_file(file, path, ext=''): + "Return `path/file` if file is a string or a `Path`, file otherwise" + if not isinstance(file, (str, Path)): return file + path.mkdir(parents=True, exist_ok=True) + return path/f'{file}{ext}' + +# Cell +def urlread(url, data=None, **kwargs): + "Retrieve `url`, using `data` dict or `kwargs` to `POST` if present" + if kwargs and not data: data=kwargs + if data is not None: + if not isinstance(data, (str,bytes)): data = urlencode(data) + if not isinstance(data, bytes): data = data.encode('ascii') + cls = urllib.request.Request + if not isinstance(url,cls): url = cls(url) + url.headers['User-Agent'] = 'Mozilla/5.0' + with urlopen(url, data=data) as res: return res.read() + +# Cell +def urljson(url, data=None): + "Retrieve `url` and decode json" + return json.loads(urlread(url, data=data)) + +# Cell +def run(cmd, *rest, ignore_ex=False, as_bytes=False): + "Pass `cmd` (splitting with `shlex` if string) to `subprocess.run`; return `stdout`; raise `IOError` if fails" + if rest: cmd = (cmd,)+rest + elif isinstance(cmd,str): cmd = shlex.split(cmd) + res = subprocess.run(cmd, capture_output=True) + stdout = res.stdout + if not as_bytes: stdout = stdout.decode() + if ignore_ex: return (res.returncode, stdout) + if res.returncode: raise IOError("{} ;; {}".format(res.stdout, res.stderr)) + return stdout + +# Cell +def do_request(url, post=False, headers=None, **data): + "Call GET or json-encoded POST on `url`, depending on `post`" + if data: + if post: data = json.dumps(data).encode('ascii') + else: + url += "?" 
+ urlencode(data) + data = None + return urljson(Request(url, headers=headers, data=data or None)) + +# Cell +def _is_instance(f, gs): + tst = [g if type(g) in [type, 'function'] else g.__class__ for g in gs] + for g in tst: + if isinstance(f, g) or f==g: return True + return False + +def _is_first(f, gs): + for o in L(getattr(f, 'run_after', None)): + if _is_instance(o, gs): return False + for g in gs: + if _is_instance(f, L(getattr(g, 'run_before', None))): return False + return True + +def sort_by_run(fs): + end = L(fs).attrgot('toward_end') + inp,res = L(fs)[~end] + L(fs)[end], L() + while len(inp): + for i,o in enumerate(inp): + if _is_first(o, inp): + res.append(inp.pop(i)) + break + else: raise Exception("Impossible to sort") + return res + +# Cell +def trace(f): + "Add `set_trace` to an existing function `f`" + if getattr(f, '_traced', False): return f + def _inner(*args,**kwargs): + set_trace() + return f(*args,**kwargs) + _inner._traced = True + return _inner + +# Cell +def round_multiple(x, mult, round_down=False): + "Round `x` to nearest multiple of `mult`" + def _f(x_): return (int if round_down else round)(x_/mult)*mult + res = L(x).map(_f) + return res if is_listy(x) else res[0] + +# Cell +@contextmanager +def modified_env(*delete, **replace): + "Context manager temporarily modifying `os.environ` by deleting `delete` and replacing `replace`" + prev = dict(os.environ) + try: + os.environ.update(replace) + for k in delete: os.environ.pop(k, None) + yield + finally: + os.environ.clear() + os.environ.update(prev) + +# Cell +class ContextManagers(GetAttr): + "Wrapper for `contextlib.ExitStack` which enters a collection of context managers" + def __init__(self, mgrs): self.default,self.stack = L(mgrs),ExitStack() + def __enter__(self): self.default.map(self.stack.enter_context) + def __exit__(self, *args, **kwargs): self.stack.__exit__(*args, **kwargs) + +# Cell +def str2bool(s): + "Case-insensitive convert string `s` too a bool 
(`y`,`yes`,`t`,`true`,`on`,`1`->`True`)" + if not isinstance(s,str): return bool(s) + return bool(distutils.util.strtobool(s)) if s else False + +# Cell +from multiprocessing import Process, Queue +import concurrent.futures +import time +from multiprocessing import Manager + +# Cell +def set_num_threads(nt): + "Get numpy (and others) to use `nt` threads" + try: import mkl; mkl.set_num_threads(nt) + except: pass + try: import torch; torch.set_num_threads(nt) + except: pass + os.environ['IPC_ENABLE']='1' + for o in ['OPENBLAS_NUM_THREADS','NUMEXPR_NUM_THREADS','OMP_NUM_THREADS','MKL_NUM_THREADS']: + os.environ[o] = str(nt) + +# Cell +def _call(lock, pause, n, g, item): + l = False + if pause: + try: + l = lock.acquire(timeout=pause*(n+2)) + time.sleep(pause) + finally: + if l: lock.release() + return g(item) + +# Cell +class ProcessPoolExecutor(concurrent.futures.ProcessPoolExecutor): + "Same as Python's ProcessPoolExecutor, except can pass `max_workers==0` for serial execution" + def __init__(self, max_workers=defaults.cpus, on_exc=print, pause=0, **kwargs): + if max_workers is None: max_workers=defaults.cpus + store_attr() + self.not_parallel = max_workers==0 + if self.not_parallel: max_workers=1 + super().__init__(max_workers, **kwargs) + + def map(self, f, items, timeout=None, chunksize=1, *args, **kwargs): + self.lock = Manager().Lock() + g = partial(f, *args, **kwargs) + if self.not_parallel: return map(g, items) + _g = partial(_call, self.lock, self.pause, self.max_workers, g) + try: return super().map(_g, items, timeout=timeout, chunksize=chunksize) + except Exception as e: self.on_exc(e) + +# Cell +class ThreadPoolExecutor(concurrent.futures.ThreadPoolExecutor): + "Same as Python's ThreadPoolExecutor, except can pass `max_workers==0` for serial execution" + def __init__(self, max_workers=defaults.cpus, on_exc=print, pause=0, **kwargs): + if max_workers is None: max_workers=defaults.cpus + store_attr() + self.not_parallel = max_workers==0 + if 
self.not_parallel: max_workers=1 + super().__init__(max_workers, **kwargs) + + def map(self, f, items, timeout=None, chunksize=1, *args, **kwargs): + self.lock = Manager().Lock() + g = partial(f, *args, **kwargs) + if self.not_parallel: return map(g, items) + _g = partial(_call, self.lock, self.pause, self.max_workers, g) + try: return super().map(_g, items, timeout=timeout, chunksize=chunksize) + except Exception as e: self.on_exc(e) + +# Cell +try: from fastprogress import progress_bar +except: progress_bar = None + +# Cell +def parallel(f, items, *args, n_workers=defaults.cpus, total=None, progress=None, pause=0, + threadpool=False, timeout=None, chunksize=1, **kwargs): + "Applies `func` in parallel to `items`, using `n_workers`" + if progress is None: progress = progress_bar is not None + pool = ThreadPoolExecutor if threadpool else ProcessPoolExecutor + with pool(n_workers, pause=pause) as ex: + r = ex.map(f,items, *args, timeout=timeout, chunksize=chunksize, **kwargs) + if progress: + if total is None: total = len(items) + r = progress_bar(r, total=total, leave=False) + return L(r) + +# Cell +def run_procs(f, f_done, args): + "Call `f` for each item in `args` in parallel, yielding `f_done`" + processes = L(args).map(Process, args=arg0, target=f) + for o in processes: o.start() + yield from f_done() + processes.map(Self.join()) + +# Cell +def _f_pg(obj, queue, batch, start_idx): + for i,b in enumerate(obj(batch)): queue.put((start_idx+i,b)) + +def _done_pg(queue, items): return (queue.get() for _ in items) + +# Cell +def parallel_gen(cls, items, n_workers=defaults.cpus, **kwargs): + "Instantiate `cls` in `n_workers` procs & call each on a subset of `items` in parallel." 
+ if n_workers==0: + yield from enumerate(list(cls(**kwargs)(items))) + return + batches = L(chunked(items, n_chunks=n_workers)) + idx = L(itertools.accumulate(0 + batches.map(len))) + queue = Queue() + if progress_bar: items = progress_bar(items, leave=False) + f=partial(_f_pg, cls(**kwargs), queue) + done=partial(_done_pg, queue, items) + yield from run_procs(f, done, L(batches,idx).zip()) + +# Cell +def threaded(f): + "Run `f` in a thread, and returns the thread" + @wraps(f) + def _f(*args, **kwargs): + res = Thread(target=f, args=args, kwargs=kwargs) + res.start() + return res + return _f \ No newline at end of file diff --git a/nbs/00_test.ipynb b/nbs/00_test.ipynb index 08ba6b70..fd5d0190 100644 --- a/nbs/00_test.ipynb +++ b/nbs/00_test.ipynb @@ -17,7 +17,6 @@ "source": [ "#export\n", "from fastcore.imports import *\n", - "from fastcore.utils import *\n", "from collections import Counter\n", "from contextlib import redirect_stdout" ] @@ -530,7 +529,7 @@ "data": { "image/png": "\n", "text/plain": [ - "" + "" ] }, "execution_count": null, @@ -561,7 +560,7 @@ "data": { "image/png": 
"iVBORw0KGgoAAAANSUhEUgAAAIAAAACACAAAAADmVT4XAAAK3ElEQVR4nO2a2XIjubGGM7HUXlxKXKTunvEaYb//uzjixJnweNyj1kJRXGqvwpK+ILV1j20UWzo3R/8VCyQLH4BEApkAwLve9a53vetd7/r/LnT+ISJDxhgyxMOfjDGGAJDIEp0MINx/KT0vCALP8yRHADB1XlQaEK3qu5PrdwdgXhin4/E4SZLAZwCg1l+u1i0xZupSmbcHkOF4cjafz7LpJIkYALSX/+vLkgRXOXVvD+Al02y2OD9fzs6yUcwAoE2tooIE731Sp3eBCwDjXMTZcrFYLBbzbDoNAAAgWmxLqEiwLhEErdLmJEt0AEDhB+Hk4tPH5Ww6GaVpcCyP5l3UAmPdbSjEvqybU+p3ApDhaDL/3R9+vJiEoR/Ix79OWaaBYTMNuFitqddvBhBPFh9+/OPvz1POgXN79AMsDWaECG3MCAVasz9lDBwAuJ9MF+cXF+cL71BgDxVxcRiMlLpWMy6CsO6NtQSDOP47AJPRZPnx43KaHOsHJAB8cqIsyVoIR/PtZr8vqk4bO4TAAcCLs4tPnxYj77EIX7pwObb+9GNRblZXV6u8ARgyJ516YDw7X0xCdnj+tnk84vFC9f3my09cG0t2QP0OAMhlGCdxIMAygG9eTgAYBikhmF1qyn2rzaDZ4GCE1hpjDBEyAGAEQPDc0BA4AAcAOa9nZ9Oq7/vXBbC6LffbyPfDY32HUaCHhyfxMJ1kVdsM8kgOAF25XaVChsljERHRcSa8sEcWjLKyKvJXBujr7W3Ag2QUPpQYq60hYMgYZ+wRwIKXTst8477HcAIg3Rb3gRePUs8/NN4Y1Xa9QS6E9D2PAQEhAhAPknGehpINmAcOtNSXW8GD0DM+AiDnYOrtJlfohVE0GvHHVyD3ozSNQ19odwIXAFUxrbnAOmAIIgiE3v36+brFeDTNlhgGj7/kMkqSJPS9AZ7IZbx0Y5qeMSpCDsxLRoFZ/fK3nyuczJYXEE8B8DgrmQziJI4Cr7OEjv7YBcDYvlJcQBlyZMGkic3t55/+p+DZRQvjc/NsFhwAfI+7d4ELABFAEYSiDTiyoKgSe3VzsyKgIC0b9Wy4uQySNIkCj6Pzkug6ZXS1wcpjiP5ok9DqZk8A1pinlY8AgHlAzSSNfKm1K4HznO1zk3MGKJM0wv1dDQC+5PzBCxACAAfG+3ESeV5vXQfBGUBVHUcEEEEUsnbXA4ShL4V4JAAAFFymceRLwY3rRHQGMMcmoRf4XDcKuJSCM3y+HCAgCMHZy9JXAngQdbrjVpnDOvDVd2Rt1yttrPumaDAAgCEGBg7tfRICkNW62xdV2yv3bdkJAED2WxNHACCjmnKzLapOufviUwB+c4YhAJi+3m/2ed0p9yjppB54+vSyHtu3ZVHUbW+sc+KBnQDwULs1xr5oqunrMi/rrh+wGH0nwEt7N31TlmXdKvvbw/TKAN/Kqqaq6qZXAyKT7wBgQnpS8GeDbXXftm2v9P8JgEEvGY9j7+kNiAdfNCg0+x4bCKeL+TTiT+/iQkjBmbsf/j4Ans4/XGQRf4oQuBDiaXl6c4B4ujhfPPQAAQBYa4noNxaJ/6ATHBEiImcsujhfzLPUPw4BEeimKouyVa8cnH5TPeNemKRx+sOfP81GoWQAAEjWqHazurq8vq/U2wIw4cfZxYfldHZxfpYEAgkBwOquzVe//vzz7S7vXzdB8TUA98LxxZ//8odFFMeBlHjoAaua/P7m889/X3ftK0fHXwOIIM2Wv//LXxeCIT3am+2r/d3t9Zcv24GJ6+EAfpotzs+Xi+jwfKzPtvndzc1qkw9NmQ6ehjzMPvzuh8X4MSA75u6ru19/+bzKB3X/SQAsmn388UMWPHb04YMu15f//HI/PFs6HCAYzRazVGiAQ7B+KLZtfr/e1sNz1sM9IROeJ/kh9qRnFkcAyKUc5AbhlG25aop8NCIOcEhZHsTD6Xn
LBKPWDDvAGQxgm81NIOLsAHDIVyGQmHzCZBJzC+2gPOUJAPXaQz5ePmslAYCcisl86ulW255eN1P6NUCz4xjMP9YpPNsVk0jjs4nX7XetJufA9DQA1eT+/epmrIU4+mEAAIZcYjk7yypt9JDVaLgR2r4t7r/EdpOOx9GDyRMCQBCPslndd6+cqPxa1vT15ldbnC8/ifCxlBAAZJzN67Z65UTlVyKyut3banOXszhJnn9lWTRZNPV++6YAQFa31JV5Bck4ohDpyRBENKnaarutevdTk+E9YIxhPZOVklFgz2KPe76QB6/gRVNtmqJSVa9cc/anBKfGKIBKITP72TiJkzThh42hiCxD1XS0zcu3BAAAALVBatazsyybzsE7nOWJkAfSdAp8VK5T4WQAsAV2u2w+X9aWB+EhLvC9SKi2t0w1tePOwB0AERnnHI87ACKm96ppmq6zXPCQcQbIAdKsarVtm7Z0i9FcARAZl2GSRBLJEiDavqmbsmvqcl91XTeKwkAAAHjxmQJmDW3bziVMdgZg3Iumy+VZxK22jDNTra+vd01Z7tb7qqnnWcYPhuCP0ZNEGOxzcvDJ7hcYuBef/fCnTyNplOGS6/1n2dZN1+SbWlndWS8GAACSqR9woxSibh1S5u5DwGU4Wv74p0ya3nBP6K1stkXXK9WLeJREo8MlBiLBA6mKzaYsPf7f3joAABCZCNJsfnboAaG9ervrZdBqlAysedoGIfj+y8TFqwAAMi79KE2E1YZJZu38hz6Y3RW1TbNRFMhnNVqj+67tnKLUAQCAXEjPY5ZZxpHCTMlsfbvZq3A6n6ah9wTQtVVZlnXvki0c4IgQkAnBgTOLDNAbYTzbzO+2rZdk03F0HHEi0m1dFXlRO11tGeIJkXEuGRwOasFDESZJEKUtD0ej5BinAxAZ3TdVWbklCoZ4QoZcPMsISSYERxl3zIui6DFbRdaorinzsnNKGLvPAkBgiM8CGeQQIHojhcLz/MDnBAhIYI3u6mJftuo1XTEAPEVih/cSMO6zQFlEzrl46ByyRvdNmZdu93qcAYgs2eOG9yke4vJwVvPs9ICs0apr6sZtV+QOYI1WfdcpzoAdIV4GlofeQUREssY1XesanJI1qmubuuqOloX422EociE96eoHB0THVquuKYu8/ncr3NEXI+NSuHti5yEg0n1XF9tNiMx/LDxUSc8ejsYC6NqyATag+3q3vuGqi0OOCPRgdi8Gm7Tpq7xsnKMz92lIti/Xl1hm4zT2fd8XQiCDx/ssDxah6v3m5vKueu1dMQHYvriF/HqSpqN0PBnHIePwOAAP9VO/vbq8/Hy5e4NtOanS1ndJEqeTs8X5ckqMPyM4StXrf/70y9XtmwDous2lH0bJZFH0VluAiD26RQQAoL7c3X7++z9Wef0WgQkZoxr0g6jqLZim7XsdiOMtGjLWKKXb/Ob6+vp22zif2gyPDVttLFlV3G3y5WwcHxOmSHVZ1W21v/3Hl3VeK3ptP/BMpgNS1Wq03lddTw87T52v7/dFvl1fXe8b436p8KTgtNPNTob7RlvDg6NbqjZXN+vtbrvd3BdD8vUnAJAx0ABIwyUnzmEMAFCsri+v7jbbXV6WzgZ4IsBRancXsq7NVyMAgPL2y+XqfpcXVdO97YnJk9qd6Her6SgCAGh29+tdUdVNq4acmw64Xf+teBRHYRT6EgBAN3Xddr1SA6+Ufg8AcsYZe/AD1hpLZIkG3qp917ve9a53vetd7/oXsYyZrAWZvNgAAAAASUVORK5CYII=\n", "text/plain": [ - "" + "" ] }, "execution_count": null, @@ -626,7 +625,7 @@ "#export\n", "class ExceptionExpected:\n", " \"Context manager that tests if an exception is raised\"\n", - " def __init__(self, 
ex=Exception, regex=''): store_attr()\n", + " def __init__(self, ex=Exception, regex=''): self.ex,self.regex = ex,regex\n", " def __enter__(self): pass\n", " def __exit__(self, type, value, traceback): \n", " if not isinstance(value, self.ex) or (self.regex and not re.search(self.regex, f'{value.args}')):\n", @@ -711,7 +710,9 @@ "output_type": "stream", "text": [ "Converted 00_test.ipynb.\n", + "Converted 01_basics.ipynb.\n", "Converted 01_foundation.ipynb.\n", + "Converted 02_utils-Copy1.ipynb.\n", "Converted 02_utils.ipynb.\n", "Converted 03_dispatch.ipynb.\n", "Converted 04_transform.ipynb.\n", diff --git a/nbs/02_utils.ipynb b/nbs/01_basics.ipynb similarity index 61% rename from nbs/02_utils.ipynb rename to nbs/01_basics.ipynb index bfdb4986..058447fb 100644 --- a/nbs/02_utils.ipynb +++ b/nbs/01_basics.ipynb @@ -6,7 +6,7 @@ "metadata": {}, "outputs": [], "source": [ - "#default_exp utils" + "#default_exp basics" ] }, { @@ -16,17 +16,7 @@ "outputs": [], "source": [ "#export\n", - "from fastcore.imports import *\n", - "from fastcore.foundation import *\n", - "from functools import wraps\n", - "\n", - "import mimetypes,bz2,pickle,random,json,urllib,subprocess,shlex,bz2,gzip,distutils.util\n", - "from contextlib import contextmanager\n", - "from pdb import set_trace\n", - "from urllib.request import Request,urlopen\n", - "from urllib.error import HTTPError\n", - "from urllib.parse import urlencode\n", - "from threading import Thread" + "from fastcore.imports import *" ] }, { @@ -44,9 +34,9 @@ "cell_type": "markdown", "metadata": {}, "source": [ - "# Utility functions\n", + "# Basic functionality\n", "\n", - "> Utility functions used in the fastai library" + "> Basic functionality used in the fastai library" ] }, { @@ -56,6 +46,16 @@ "## Basics" ] }, + { + "cell_type": "code", + "execution_count": null, + "metadata": {}, + "outputs": [], + "source": [ + "# export\n", + "defaults = SimpleNamespace()" + ] + }, { "cell_type": "code", "execution_count": null, @@ -125,7 
+125,7 @@ "#export\n", "def basic_repr(flds=None):\n", " if isinstance(flds, str): flds = re.split(', *', flds)\n", - " flds = L(flds)\n", + " flds = list(flds or [])\n", " def _f(self):\n", " sig = ', '.join(f'{o}={maybe_attr(getattr(self,o), \"__name__\")}' for o in flds)\n", " return f'{self.__class__.__name__}({sig})'\n", @@ -163,6 +163,23 @@ "test_eq(repr(ac), 'AnotherClass(c=some-class, d=bar)')" ] }, + { + "cell_type": "code", + "execution_count": null, + "metadata": {}, + "outputs": [], + "source": [ + "#export\n", + "def is_array(x): return hasattr(x,'__array__') or hasattr(x,'iloc')\n", + "\n", + "def listify(o):\n", + " if o is None: return []\n", + " if isinstance(o, list): return o\n", + " if isinstance(o, str) or is_array(o): return [o]\n", + " if is_iter(o): return list(o)\n", + " return [o]" + ] + }, { "cell_type": "code", "execution_count": null, @@ -174,7 +191,7 @@ " \"Dynamically create a class, optionally inheriting from `sup`, containing `fld_names`\"\n", " attrs = {}\n", " for f in fld_names: attrs[f] = None\n", - " for f in L(funcs): attrs[f.__name__] = f\n", + " for f in listify(funcs): attrs[f.__name__] = f\n", " for k,v in flds.items(): attrs[k] = v\n", " sup = ifnone(sup, ())\n", " if not isinstance(sup, tuple): sup=(sup,)\n", @@ -275,10 +292,10 @@ "metadata": {}, "outputs": [], "source": [ - "mk_class('_t', a=1, sup=GetAttr)\n", + "mk_class('_t', a=1, sup=dict)\n", "t = _t()\n", "test_eq(t.a, 1)\n", - "assert(isinstance(t,GetAttr))" + "assert(isinstance(t,dict))" ] }, { @@ -296,7 +313,7 @@ { "data": { "text/plain": [ - "<__main__._t at 0x7f2feeb9ec10>" + "{}" ] }, "execution_count": null, @@ -306,7 +323,7 @@ ], "source": [ "def foo(self): return 1\n", - "mk_class('_t', 'a', sup=GetAttr, doc='test doc', funcs=foo)\n", + "mk_class('_t', 'a', sup=dict, doc='test doc', funcs=foo)\n", "\n", "t = _t(3, b=2)\n", "test_eq(t.a, 3)\n", @@ -326,7 +343,7 @@ "def wrap_class(nm, *fld_names, sup=None, doc=None, funcs=None, **flds):\n", " \"Decorator: 
makes function a method of a new class `nm` passing parameters to `mk_class`\"\n", " def _inner(f):\n", - " mk_class(nm, *fld_names, sup=sup, doc=doc, funcs=L(funcs)+f, mod=f.__globals__, **flds)\n", + " mk_class(nm, *fld_names, sup=sup, doc=doc, funcs=listify(funcs)+[f], mod=f.__globals__, **flds)\n", " return f\n", " return _inner" ] @@ -518,7 +535,7 @@ "metadata": {}, "outputs": [], "source": [ - "mk_class('_t', foo=noops)\n", + "class _t: foo=noops\n", "test_eq(_t().foo(1),1)" ] }, @@ -775,6 +792,18 @@ "assert true([])" ] }, + { + "cell_type": "code", + "execution_count": null, + "metadata": {}, + "outputs": [], + "source": [ + "#export\n", + "def stop(e=StopIteration):\n", + " \"Raises exception `e` (by default `StopException`)\"\n", + " raise e" + ] + }, { "cell_type": "code", "execution_count": null, @@ -832,7 +861,7 @@ "metadata": {}, "outputs": [], "source": [ - "t = L.range(10)\n", + "t = list(range(10))\n", "test_eq(chunked(t,3), [[0,1,2], [3,4,5], [6,7,8], [9]])\n", "test_eq(chunked(t,3,True), [[0,1,2], [3,4,5], [6,7,8], ])\n", "\n", @@ -842,8 +871,8 @@ "test_eq(chunked(t,3), [[0, 1, 2], [3, 4, 5], [6]])\n", "\n", "t = np.arange(10)\n", - "test_eq(chunked(t,3), L([0,1,2], [3,4,5], [6,7,8], [9]))\n", - "test_eq(chunked(t,3,True), L([0,1,2], [3,4,5], [6,7,8], ))" + "test_eq(chunked(t,3), [[0,1,2], [3,4,5], [6,7,8], [9]])\n", + "test_eq(chunked(t,3,True), [[0,1,2], [3,4,5], [6,7,8], ])" ] }, { @@ -940,68 +969,6 @@ "test_eq(d.b, 3)" ] }, - { - "cell_type": "code", - "execution_count": null, - "metadata": {}, - "outputs": [], - "source": [ - "#export\n", - "def dict2obj(d):\n", - " \"Convert (possibly nested) dicts (or lists of dicts) to `AttrDict`\"\n", - " if isinstance(d, (L,list)): return L(d).map(dict2obj)\n", - " if not isinstance(d, dict): return d\n", - " return AttrDict(**{k:dict2obj(v) for k,v in d.items()})" - ] - }, - { - "cell_type": "markdown", - "metadata": {}, - "source": [ - "This is a convenience to give you \"dotted\" access to (possibly 
nested) dictionaries, e.g:" - ] - }, - { - "cell_type": "code", - "execution_count": null, - "metadata": {}, - "outputs": [ - { - "data": { - "text/plain": [ - "{'a': 1, 'b': {'c': 2, 'd': 3}}" - ] - }, - "execution_count": null, - "metadata": {}, - "output_type": "execute_result" - } - ], - "source": [ - "d1 = dict(a=1, b=dict(c=2,d=3))\n", - "d2 = dict2obj(d1)\n", - "test_eq(d2.b.c, 2)\n", - "test_eq(d2.b['c'], 2)\n", - "d2" - ] - }, - { - "cell_type": "markdown", - "metadata": {}, - "source": [ - "It can also be used on lists of dicts." - ] - }, - { - "cell_type": "code", - "execution_count": null, - "metadata": {}, - "outputs": [], - "source": [ - "ds = L(d1, d1)\n", - "test_eq(dict2obj(ds)[0].b.c, 2)" - ] - }, { "cell_type": "code", "execution_count": null, @@ -1071,7 +1038,7 @@ " anno = self.__class__.__init__.__annotations__ if cast else {}\n", " if attrs: return _store_attr(self, anno, **attrs)\n", " ns = re.split(', *', names) if names else args[1:]\n", - " _store_attr(self, anno, **{n:fr.f_locals[n] for n in ns if n not in L(but)})" + " _store_attr(self, anno, **{n:fr.f_locals[n] for n in ns if n not in listify(but)})" ] }, { @@ -1191,7 +1158,7 @@ "outputs": [], "source": [ "class T:\n", - " def __init__(self, a:L, b, c:str): store_attr('a,b,c', cast=True)\n", + " def __init__(self, a:listify, b, c:str): store_attr('a,b,c', cast=True)\n", "\n", "t = T(1,c=2,b=3)\n", "assert t.a==[1] and t.b==3 and t.c=='2'" @@ -1610,7 +1577,9 @@ "source": [ "#export\n", "#hide\n", - "class Int(int,ShowPrint): pass" + "class Int(int,ShowPrint):\n", + " \"An extensible `int`\"\n", + " pass" ] }, { @@ -1621,11 +1590,12 @@ "source": [ "#export \n", "#hide\n", - "class Str(str,ShowPrint): pass\n", - "class Float(float,ShowPrint): pass\n", - "add_docs(Str, \"An extensible `str`\");\n", - "add_docs(Int, \"An extensible `int`\");\n", - "add_docs(Float, \"An extensible `float`\")" + "class Str(str,ShowPrint):\n", + " \"An extensible `str`\"\n", + " pass\n", + "class 
Float(float,ShowPrint):\n", + " \"An extensible `float`\"\n", + " pass" ] }, { @@ -1665,29 +1635,6 @@ "Functions that manipulate popular python collections." ] }, - { - "cell_type": "code", - "execution_count": null, - "metadata": {}, - "outputs": [], - "source": [ - "#export\n", - "def tuplify(o, use_list=False, match=None):\n", - " \"Make `o` a tuple\"\n", - " return tuple(L(o, use_list=use_list, match=match))" - ] - }, - { - "cell_type": "code", - "execution_count": null, - "metadata": {}, - "outputs": [], - "source": [ - "test_eq(tuplify(None),())\n", - "test_eq(tuplify([1,2,3]),(1,2,3))\n", - "test_eq(tuplify(1,match=[1,2,3]),(1,1,1))" - ] - }, { "cell_type": "code", "execution_count": null, @@ -1735,40 +1682,6 @@ "test_eq(replicate(1, t),(1,1))" ] }, - { - "cell_type": "code", - "execution_count": null, - "metadata": {}, - "outputs": [], - "source": [ - "#export\n", - "def uniqueify(x, sort=False, bidir=False, start=None):\n", - " \"Unique elements in `x`, optionally `sort`-ed, optionally return reverse correspondence, optionally prepend with elements.\"\n", - " res = L(x).unique()\n", - " if start is not None: res = start+res\n", - " if sort: res.sort()\n", - " if bidir: return res, res.val2idx()\n", - " return res" - ] - }, - { - "cell_type": "code", - "execution_count": null, - "metadata": {}, - "outputs": [], - "source": [ - "# test\n", - "test_eq(set(uniqueify([1,1,0,5,0,3])),{0,1,3,5})\n", - "test_eq(uniqueify([1,1,0,5,0,3], sort=True),[0,1,3,5])\n", - "test_eq(uniqueify([1,1,0,5,0,3], start=[7,8,6]), [7,8,6,1,0,5,3])\n", - "v,o = uniqueify([1,1,0,5,0,3], bidir=True)\n", - "test_eq(v,[1,0,5,3])\n", - "test_eq(o,{1:0, 0: 1, 5: 2, 3: 3})\n", - "v,o = uniqueify([1,1,0,5,0,3], sort=True, bidir=True)\n", - "test_eq(v,[0,1,3,5])\n", - "test_eq(o,{0:0, 1: 1, 3: 2, 5: 3})" - ] - }, { "cell_type": "code", "execution_count": null, @@ -1778,7 +1691,7 @@ "# export\n", "def setify(o): \n", " \"Turn any list like-object into a set.\"\n", - " return o if 
isinstance(o,set) else set(L(o))" + " return o if isinstance(o,set) else set(listify(o))" ] }, { @@ -1818,31 +1731,6 @@ "test_eq(merge(dict(a=1,b=2), dict(b=3,c=4), None), dict(a=1, b=3, c=4))" ] }, - { - "cell_type": "code", - "execution_count": null, - "metadata": {}, - "outputs": [], - "source": [ - "#export\n", - "def is_listy(x):\n", - " \"`isinstance(x, (tuple,list,L,slice,Generator))`\"\n", - " return isinstance(x, (tuple,list,L,slice,Generator))" - ] - }, - { - "cell_type": "code", - "execution_count": null, - "metadata": {}, - "outputs": [], - "source": [ - "assert is_listy((1,))\n", - "assert is_listy([1])\n", - "assert is_listy(L([1]))\n", - "assert is_listy(slice(2))\n", - "assert not is_listy(array([1]))" - ] - }, { "cell_type": "code", "execution_count": null, @@ -1910,32 +1798,6 @@ "test_eq(last_index(6, [1, 2, 9, 3, 4, 9, 10]), -1)" ] }, - { - "cell_type": "code", - "execution_count": null, - "metadata": {}, - "outputs": [], - "source": [ - "#export\n", - "def shufflish(x, pct=0.04):\n", - " \"Randomly relocate items of `x` up to `pct` of `len(x)` from their starting location\"\n", - " n = len(x)\n", - " return L(x[i] for i in sorted(range_of(x), key=lambda o: o+n*(1+random.random()*pct)))" - ] - }, - { - "cell_type": "code", - "execution_count": null, - "metadata": {}, - "outputs": [], - "source": [ - "l = list(range(100))\n", - "l2 = array(shufflish(l))\n", - "test_close(l2[:50 ].mean(), 25, eps=5)\n", - "test_close(l2[-50:].mean(), 75, eps=5)\n", - "test_ne(l,l2)" - ] - }, { "cell_type": "code", "execution_count": null, @@ -1965,7 +1827,7 @@ } ], "source": [ - "letters = L.range(65,73).map_dict(chr)\n", + "letters = {o:chr(o) for o in range(65,73)}\n", "letters" ] }, @@ -1977,7 +1839,7 @@ { "data": { "text/plain": [ - "{70: 'F', 71: 'G'}" + "{65: 'A', 66: 'B', 70: 'F', 71: 'G'}" ] }, "execution_count": null, @@ -1986,7 +1848,7 @@ } ], "source": [ - "filter_dict(letters, lambda k,v: k<3 or v in 'FG')" + "filter_dict(letters, lambda k,v: k<67 or v 
in 'FG')" ] }, { @@ -2009,7 +1871,7 @@ { "data": { "text/plain": [ - "{}" + "{65: 'A', 66: 'B'}" ] }, "execution_count": null, @@ -2018,7 +1880,7 @@ } ], "source": [ - "filter_keys(letters, lt(3))" + "filter_keys(letters, lt(67))" ] }, { @@ -2054,10 +1916,16 @@ ] }, { - "cell_type": "markdown", + "cell_type": "code", + "execution_count": null, "metadata": {}, + "outputs": [], "source": [ - "## Reindexing Collections" + "#export\n", + "def cycle(o):\n", + " \"Like `itertools.cycle` except creates list of `None`s if `o` is empty\"\n", + " o = listify(o)\n", + " return itertools.cycle(o) if o is not None and len(o) > 0 else itertools.cycle([None])" ] }, { @@ -2066,11 +1934,10 @@ "metadata": {}, "outputs": [], "source": [ - "#export\n", - "#hide\n", - "class IterLen:\n", - " \"Base class to add iteration to anything supporting `__len__` and `__getitem__`\"\n", - " def __iter__(self): return (self[i] for i in range_of(self))" + "test_eq(itertools.islice(cycle([1,2,3]),5), [1,2,3,1,2])\n", + "test_eq(itertools.islice(cycle([]),3), [None]*3)\n", + "test_eq(itertools.islice(cycle(None),3), [None]*3)\n", + "test_eq(itertools.islice(cycle(1),3), [1,1,1])" ] }, { @@ -2080,99 +1947,107 @@ "outputs": [], "source": [ "#export\n", - "@docs\n", - "class ReindexCollection(GetAttr, IterLen):\n", - " \"Reindexes collection `coll` with indices `idxs` and optional LRU cache of size `cache`\"\n", - " _default='coll'\n", - " def __init__(self, coll, idxs=None, cache=None, tfm=noop):\n", - " if idxs is None: idxs = L.range(coll) \n", - " store_attr()\n", - " if cache is not None: self._get = functools.lru_cache(maxsize=cache)(self._get)\n", - "\n", - " def _get(self, i): return self.tfm(self.coll[i])\n", - " def __getitem__(self, i): return self._get(self.idxs[i])\n", - " def __len__(self): return len(self.coll)\n", - " def reindex(self, idxs): self.idxs = idxs\n", - " def shuffle(self): random.shuffle(self.idxs)\n", - " def cache_clear(self): self._get.cache_clear()\n", - " def 
__getstate__(self): return {'coll': self.coll, 'idxs': self.idxs, 'cache': self.cache, 'tfm': self.tfm}\n", - " def __setstate__(self, s): self.coll,self.idxs,self.cache,self.tfm = s['coll'],s['idxs'],s['cache'],s['tfm']\n", - "\n", - " _docs = dict(reindex=\"Replace `self.idxs` with idxs\",\n", - " shuffle=\"Randomly shuffle indices\",\n", - " cache_clear=\"Clear LRU cache\")" + "def zip_cycle(x, *args):\n", + " \"Like `itertools.zip_longest` but `cycle`s through elements of all but first argument\"\n", + " return zip(x, *map(cycle,args))" ] }, { "cell_type": "code", "execution_count": null, "metadata": {}, - "outputs": [ - { - "data": { - "text/markdown": [ - "

class ReindexCollection[source]

\n", - "\n", - "> ReindexCollection(**`coll`**, **`idxs`**=*`None`*, **`cache`**=*`None`*, **`tfm`**=*`noop`*) :: [`GetAttr`](/foundation.html#GetAttr)\n", - "\n", - "Reindexes collection `coll` with indices `idxs` and optional LRU cache of size `cache`" - ], - "text/plain": [ - "" - ] - }, - "metadata": {}, - "output_type": "display_data" - } - ], + "outputs": [], "source": [ - "show_doc(ReindexCollection, title_level=4)" + "test_eq(zip_cycle([1,2,3,4],list('abc')), [(1, 'a'), (2, 'b'), (3, 'c'), (4, 'a')])" ] }, { - "cell_type": "markdown", + "cell_type": "code", + "execution_count": null, "metadata": {}, + "outputs": [], "source": [ - "This is useful when constructing batches or organizing data in a particular manner (i.e. for deep learning). This class is primarly used in organizing data for language models in fastai." + "#export\n", + "def sorted_ex(iterable, key=None, reverse=False):\n", + " \"Like `sorted`, but if key is str use `attrgetter`; if int use `itemgetter`\"\n", + " if isinstance(key,str): k=lambda o:getattr(o,key,0)\n", + " elif isinstance(key,int): k=itemgetter(key)\n", + " else: k=key\n", + " return sorted(iterable, key=k, reverse=reverse)" ] }, { "cell_type": "markdown", "metadata": {}, "source": [ - "#### Reindexing\n", - "\n", - "You can supply a custom index upon instantiation with the `idxs` argument, or you can call the `reindex` method to supply a new index for your collection.\n", + "## fastuple\n", "\n", - "Here is how you can reindex a list such that the elements are reversed:" + "A tuple with extended functionality." 
] }, { "cell_type": "code", "execution_count": null, "metadata": {}, - "outputs": [ - { - "data": { - "text/plain": [ - "['e', 'd', 'c', 'b', 'a']" - ] - }, - "execution_count": null, - "metadata": {}, - "output_type": "execute_result" - } - ], + "outputs": [], "source": [ - "rc=ReindexCollection(['a', 'b', 'c', 'd', 'e'], idxs=[4,3,2,1,0])\n", - "list(rc)" + "#export\n", + "num_methods = \"\"\"\n", + " __add__ __sub__ __mul__ __matmul__ __truediv__ __floordiv__ __mod__ __divmod__ __pow__\n", + " __lshift__ __rshift__ __and__ __xor__ __or__ __neg__ __pos__ __abs__\n", + "\"\"\".split()\n", + "rnum_methods = \"\"\"\n", + " __radd__ __rsub__ __rmul__ __rmatmul__ __rtruediv__ __rfloordiv__ __rmod__ __rdivmod__\n", + " __rpow__ __rlshift__ __rrshift__ __rand__ __rxor__ __ror__\n", + "\"\"\".split()\n", + "inum_methods = \"\"\"\n", + " __iadd__ __isub__ __imul__ __imatmul__ __itruediv__\n", + " __ifloordiv__ __imod__ __ipow__ __ilshift__ __irshift__ __iand__ __ixor__ __ior__\n", + "\"\"\".split()" ] }, { - "cell_type": "markdown", + "cell_type": "code", + "execution_count": null, "metadata": {}, + "outputs": [], "source": [ - "Alternatively, you can use the `reindex` method:" + "#export\n", + "class fastuple(tuple):\n", + " \"A `tuple` with elementwise ops and more friendly __init__ behavior\"\n", + " def __new__(cls, x=None, *rest):\n", + " if x is None: x = ()\n", + " if not isinstance(x,tuple):\n", + " if len(rest): x = (x,)\n", + " else:\n", + " try: x = tuple(iter(x))\n", + " except TypeError: x = (x,)\n", + " return super().__new__(cls, x+rest if rest else x)\n", + "\n", + " def _op(self,op,*args):\n", + " if not isinstance(self,fastuple): self = fastuple(self)\n", + " return type(self)(map(op,self,*map(cycle, args)))\n", + "\n", + " def mul(self,*args):\n", + " \"`*` is already defined in `tuple` for replicating, so use `mul` instead\"\n", + " return fastuple._op(self, operator.mul,*args)\n", + "\n", + " def add(self,*args):\n", + " \"`+` is already defined in 
`tuple` for concat, so use `add` instead\"\n", + " return fastuple._op(self, operator.add,*args)\n", + "\n", + "def _get_op(op):\n", + " if isinstance(op,str): op = getattr(operator,op)\n", + " def _f(self,*args): return self._op(op,*args)\n", + " return _f\n", + "\n", + "for n in num_methods:\n", + " if not hasattr(fastuple, n) and hasattr(operator,n): setattr(fastuple,n,_get_op(n))\n", + "\n", + "for n in 'eq ne lt le gt ge'.split(): setattr(fastuple,n,_get_op(n))\n", + "setattr(fastuple,'__invert__',_get_op('__not__'))\n", + "setattr(fastuple,'max',_get_op(max))\n", + "setattr(fastuple,'min',_get_op(min))" ] }, { @@ -2183,11 +2058,11 @@ { "data": { "text/markdown": [ - "
ReindexCollection.reindex[source]
\n", + "

class fastuple[source]

\n", "\n", - "> ReindexCollection.reindex(**`idxs`**)\n", + "> fastuple(**`x`**=*`None`*, **\\*`rest`**) :: `tuple`\n", "\n", - "Replace `self.idxs` with idxs" + "A `tuple` with elementwise ops and more friendly __init__ behavior" ], "text/plain": [ "" @@ -2198,127 +2073,53 @@ } ], "source": [ - "show_doc(ReindexCollection.reindex, title_level=6)" - ] - }, - { - "cell_type": "code", - "execution_count": null, - "metadata": {}, - "outputs": [ - { - "data": { - "text/plain": [ - "['e', 'd', 'c', 'b', 'a']" - ] - }, - "execution_count": null, - "metadata": {}, - "output_type": "execute_result" - } - ], - "source": [ - "rc=ReindexCollection(['a', 'b', 'c', 'd', 'e'])\n", - "rc.reindex([4,3,2,1,0])\n", - "list(rc)" + "show_doc(fastuple, title_level=4)" ] }, { "cell_type": "markdown", "metadata": {}, "source": [ - "#### LRU Cache" + "#### Friendly init behavior" ] }, { "cell_type": "markdown", "metadata": {}, "source": [ - "You can optionally specify a LRU cache, which uses [functools.lru_cache](https://docs.python.org/3/library/functools.html#functools.lru_cache) upon instantiation:" - ] - }, - { - "cell_type": "code", - "execution_count": null, - "metadata": {}, - "outputs": [ - { - "data": { - "text/plain": [ - "CacheInfo(hits=1, misses=1, maxsize=2, currsize=1)" - ] - }, - "execution_count": null, - "metadata": {}, - "output_type": "execute_result" - } - ], - "source": [ - "sz = 50\n", - "t = ReindexCollection(L.range(sz), cache=2)\n", + "Common failure modes when trying to initialize a tuple in python:\n", "\n", - "#trigger a cache hit by indexing into the same element multiple times\n", - "t[0], t[0]\n", - "t._get.cache_info()" - ] - }, - { - "cell_type": "markdown", - "metadata": {}, - "source": [ - "You can optionally clear the LRU cache by calling the `cache_clear` method:" + "```py\n", + "tuple(3)\n", + "> TypeError: 'int' object is not iterable\n", + "```\n", + "\n", + "or \n", + "\n", + "```py\n", + "tuple(3, 4)\n", + "> TypeError: tuple expected at most 1 
arguments, got 2\n", + "```\n", + "\n", + "However, `fastuple` allows you to define tuples like this and in the usual way:" ] }, { "cell_type": "code", "execution_count": null, "metadata": {}, - "outputs": [ - { - "data": { - "text/markdown": [ - "
ReindexCollection.cache_clear[source]
\n", - "\n", - "> ReindexCollection.cache_clear()\n", - "\n", - "Clear LRU cache" - ], - "text/plain": [ - "" - ] - }, - "metadata": {}, - "output_type": "display_data" - } - ], + "outputs": [], "source": [ - "show_doc(ReindexCollection.cache_clear, title_level=5)" + "test_eq(fastuple(3), (3,))\n", + "test_eq(fastuple(3,4), (3, 4))\n", + "test_eq(fastuple((3,4)), (3, 4))" ] }, { - "cell_type": "code", - "execution_count": null, + "cell_type": "markdown", "metadata": {}, - "outputs": [ - { - "data": { - "text/plain": [ - "CacheInfo(hits=0, misses=0, maxsize=2, currsize=0)" - ] - }, - "execution_count": null, - "metadata": {}, - "output_type": "execute_result" - } - ], "source": [ - "sz = 50\n", - "t = ReindexCollection(L.range(sz), cache=2)\n", - "\n", - "#trigger a cache hit by indexing into the same element multiple times\n", - "t[0], t[0]\n", - "t.cache_clear()\n", - "t._get.cache_info()" + "#### Elementwise operations" ] }, { @@ -2329,11 +2130,11 @@ { "data": { "text/markdown": [ - "
ReindexCollection.shuffle[source]
\n", + "
fastuple.add[source]
\n", "\n", - "> ReindexCollection.shuffle()\n", + "> fastuple.add(**\\*`args`**)\n", "\n", - "Randomly shuffle indices" + "`+` is already defined in `tuple` for concat, so use `add` instead" ], "text/plain": [ "" @@ -2344,105 +2145,7 @@ } ], "source": [ - "show_doc(ReindexCollection.shuffle, title_level=5)" - ] - }, - { - "cell_type": "markdown", - "metadata": {}, - "source": [ - "Note that an ordered index is automatically constructed for the data structure even if one is not supplied." - ] - }, - { - "cell_type": "code", - "execution_count": null, - "metadata": {}, - "outputs": [ - { - "data": { - "text/plain": [ - "['e', 'd', 'h', 'f', 'c', 'b', 'g', 'a']" - ] - }, - "execution_count": null, - "metadata": {}, - "output_type": "execute_result" - } - ], - "source": [ - "rc=ReindexCollection(['a', 'b', 'c', 'd', 'e', 'f', 'g', 'h'])\n", - "rc.shuffle()\n", - "list(rc)" - ] - }, - { - "cell_type": "markdown", - "metadata": {}, - "source": [ - "#### Tests" - ] - }, - { - "cell_type": "code", - "execution_count": null, - "metadata": {}, - "outputs": [], - "source": [ - "sz = 50\n", - "t = ReindexCollection(L.range(sz), cache=2)\n", - "test_eq(list(t), range(sz))\n", - "test_eq(t[sz-1], sz-1)\n", - "test_eq(t._get.cache_info().hits, 1)\n", - "t.shuffle()\n", - "test_eq(t._get.cache_info().hits, 1)\n", - "test_ne(list(t), range(sz))\n", - "test_eq(set(t), set(range(sz)))\n", - "t.cache_clear()\n", - "test_eq(t._get.cache_info().hits, 0)\n", - "test_eq(t.count(0), 1)" - ] - }, - { - "cell_type": "code", - "execution_count": null, - "metadata": {}, - "outputs": [], - "source": [ - "#hide\n", - "#Test ReindexCollection pickles\n", - "t1 = pickle.loads(pickle.dumps(t))\n", - "test_eq(list(t), list(t1))" - ] - }, - { - "cell_type": "code", - "execution_count": null, - "metadata": {}, - "outputs": [], - "source": [ - "#export\n", - "num_methods = \"\"\"\n", - " __add__ __sub__ __mul__ __matmul__ __truediv__ __floordiv__ __mod__ __divmod__ __pow__\n", - " __lshift__ __rshift__ 
__and__ __xor__ __or__ __neg__ __pos__ __abs__\n", - "\"\"\".split()\n", - "rnum_methods = \"\"\"\n", - " __radd__ __rsub__ __rmul__ __rmatmul__ __rtruediv__ __rfloordiv__ __rmod__ __rdivmod__\n", - " __rpow__ __rlshift__ __rrshift__ __rand__ __rxor__ __ror__\n", - "\"\"\".split()\n", - "inum_methods = \"\"\"\n", - " __iadd__ __isub__ __imul__ __imatmul__ __itruediv__\n", - " __ifloordiv__ __imod__ __ipow__ __ilshift__ __irshift__ __iand__ __ixor__ __ior__\n", - "\"\"\".split()" - ] - }, - { - "cell_type": "markdown", - "metadata": {}, - "source": [ - "## fastuple\n", - "\n", - "A tuple with extended functionality." + "show_doc(fastuple.add, title_level=5)" ] }, { @@ -2451,42 +2154,9 @@ "metadata": {}, "outputs": [], "source": [ - "#export\n", - "class fastuple(tuple):\n", - " \"A `tuple` with elementwise ops and more friendly __init__ behavior\"\n", - " def __new__(cls, x=None, *rest):\n", - " if x is None: x = ()\n", - " if not isinstance(x,tuple):\n", - " if len(rest): x = (x,)\n", - " else:\n", - " try: x = tuple(iter(x))\n", - " except TypeError: x = (x,)\n", - " return super().__new__(cls, x+rest if rest else x)\n", - "\n", - " def _op(self,op,*args):\n", - " if not isinstance(self,fastuple): self = fastuple(self)\n", - " return type(self)(map(op,self,*map(cycle, args)))\n", - "\n", - " def mul(self,*args):\n", - " \"`*` is already defined in `tuple` for replicating, so use `mul` instead\"\n", - " return fastuple._op(self, operator.mul,*args)\n", - "\n", - " def add(self,*args):\n", - " \"`+` is already defined in `tuple` for concat, so use `add` instead\"\n", - " return fastuple._op(self, operator.add,*args)\n", - "\n", - "def _get_op(op):\n", - " if isinstance(op,str): op = getattr(operator,op)\n", - " def _f(self,*args): return self._op(op,*args)\n", - " return _f\n", - "\n", - "for n in num_methods:\n", - " if not hasattr(fastuple, n) and hasattr(operator,n): setattr(fastuple,n,_get_op(n))\n", - "\n", - "for n in 'eq ne lt le gt ge'.split(): 
setattr(fastuple,n,_get_op(n))\n", - "setattr(fastuple,'__invert__',_get_op('__not__'))\n", - "setattr(fastuple,'max',_get_op(max))\n", - "setattr(fastuple,'min',_get_op(min))" + "test_eq(fastuple.add((1,1),(2,2)), (3,3))\n", + "test_eq_type(fastuple(1,1).add(2), fastuple(3,3))\n", + "test_eq(fastuple('1','2').add('2'), fastuple('12','22'))" ] }, { @@ -2497,120 +2167,11 @@ { "data": { "text/markdown": [ - "

class fastuple[source]

\n", + "
fastuple.mul[source]
\n", "\n", - "> fastuple(**`x`**=*`None`*, **\\*`rest`**) :: `tuple`\n", + "> fastuple.mul(**\\*`args`**)\n", "\n", - "A `tuple` with elementwise ops and more friendly __init__ behavior" - ], - "text/plain": [ - "" - ] - }, - "metadata": {}, - "output_type": "display_data" - } - ], - "source": [ - "show_doc(fastuple, title_level=4)" - ] - }, - { - "cell_type": "markdown", - "metadata": {}, - "source": [ - "#### Friendly init behavior" - ] - }, - { - "cell_type": "markdown", - "metadata": {}, - "source": [ - "Common failure modes when trying to initialize a tuple in python:\n", - "\n", - "```py\n", - "tuple(3)\n", - "> TypeError: 'int' object is not iterable\n", - "```\n", - "\n", - "or \n", - "\n", - "```py\n", - "tuple(3, 4)\n", - "> TypeError: tuple expected at most 1 arguments, got 2\n", - "```\n", - "\n", - "However, `fastuple` allows you to define tuples like this and in the usual way:" - ] - }, - { - "cell_type": "code", - "execution_count": null, - "metadata": {}, - "outputs": [], - "source": [ - "test_eq(fastuple(3), (3,))\n", - "test_eq(fastuple(3,4), (3, 4))\n", - "test_eq(fastuple((3,4)), (3, 4))" - ] - }, - { - "cell_type": "markdown", - "metadata": {}, - "source": [ - "#### Elementwise operations" - ] - }, - { - "cell_type": "code", - "execution_count": null, - "metadata": {}, - "outputs": [ - { - "data": { - "text/markdown": [ - "
fastuple.add[source]
\n", - "\n", - "> fastuple.add(**\\*`args`**)\n", - "\n", - "`+` is already defined in `tuple` for concat, so use `add` instead" - ], - "text/plain": [ - "" - ] - }, - "metadata": {}, - "output_type": "display_data" - } - ], - "source": [ - "show_doc(fastuple.add, title_level=5)" - ] - }, - { - "cell_type": "code", - "execution_count": null, - "metadata": {}, - "outputs": [], - "source": [ - "test_eq(fastuple.add((1,1),(2,2)), (3,3))\n", - "test_eq_type(fastuple(1,1).add(2), fastuple(3,3))\n", - "test_eq(fastuple('1','2').add('2'), fastuple('12','22'))" - ] - }, - { - "cell_type": "code", - "execution_count": null, - "metadata": {}, - "outputs": [ - { - "data": { - "text/markdown": [ - "
fastuple.mul[source]
\n", - "\n", - "> fastuple.mul(**\\*`args`**)\n", - "\n", - "`*` is already defined in `tuple` for replicating, so use `mul` instead" + "`*` is already defined in `tuple` for replicating, so use `mul` instead" ], "text/plain": [ "" @@ -2630,1044 +2191,20 @@ "metadata": {}, "outputs": [], "source": [ - "test_eq_type(fastuple(1,1).mul(2), fastuple(2,2))" - ] - }, - { - "cell_type": "markdown", - "metadata": {}, - "source": [ - "#### Other Elementwise Operations\n", - "\n", - "Additionally, the following elementwise operations are available:\n", - "- `le`: less than\n", - "- `eq`: equal\n", - "- `gt`: greater than\n", - "- `min`: minimum of" - ] - }, - { - "cell_type": "code", - "execution_count": null, - "metadata": {}, - "outputs": [], - "source": [ - "test_eq(fastuple(3,1).le(1), (False, True))\n", - "test_eq(fastuple(3,1).eq(1), (False, True))\n", - "test_eq(fastuple(3,1).gt(1), (True, False))\n", - "test_eq(fastuple(3,1).min(2), (2,1))" - ] - }, - { - "cell_type": "markdown", - "metadata": {}, - "source": [ - "You can also do other elemntwise operations like negate a `fastuple`, or subtract two `fastuple`s:" - ] - }, - { - "cell_type": "code", - "execution_count": null, - "metadata": {}, - "outputs": [], - "source": [ - "test_eq(-fastuple(1,2), (-1,-2))\n", - "test_eq(~fastuple(1,0,1), (False,True,False))\n", - "\n", - "test_eq(fastuple(1,1)-fastuple(2,2), (-1,-1))" - ] - }, - { - "cell_type": "markdown", - "metadata": {}, - "source": [ - "#### Other Tests" - ] - }, - { - "cell_type": "code", - "execution_count": null, - "metadata": {}, - "outputs": [], - "source": [ - "test_eq(type(fastuple(1)), fastuple)\n", - "test_eq_type(fastuple(1,2), fastuple(1,2))\n", - "test_ne(fastuple(1,2), fastuple(1,3))\n", - "test_eq(fastuple(), ())" - ] - }, - { - "cell_type": "markdown", - "metadata": {}, - "source": [ - "## Functions on Functions\n", - "\n", - "Utilities for functional programming or for defining, modifying, or debugging functions. 
" - ] - }, - { - "cell_type": "code", - "execution_count": null, - "metadata": {}, - "outputs": [], - "source": [ - "#export\n", - "def trace(f):\n", - " \"Add `set_trace` to an existing function `f`\"\n", - " if getattr(f, '_traced', False): return f\n", - " def _inner(*args,**kwargs):\n", - " set_trace()\n", - " return f(*args,**kwargs)\n", - " _inner._traced = True\n", - " return _inner" - ] - }, - { - "cell_type": "markdown", - "metadata": {}, - "source": [ - "You can add a breakpoint to an existing function, e.g:\n", - "\n", - "```python\n", - "Path.cwd = trace(Path.cwd)\n", - "Path.cwd()\n", - "```\n", - "\n", - "Now, when the function is called it will drop you into the debugger. Note, you must issue the `s` command when you begin to step into the function that is being traced." - ] - }, - { - "cell_type": "code", - "execution_count": null, - "metadata": {}, - "outputs": [], - "source": [ - "# export\n", - "def compose(*funcs, order=None):\n", - " \"Create a function that composes all functions in `funcs`, passing along remaining `*args` and `**kwargs` to all\"\n", - " funcs = L(funcs)\n", - " if len(funcs)==0: return noop\n", - " if len(funcs)==1: return funcs[0]\n", - " if order is not None: funcs = funcs.sorted(order)\n", - " def _inner(x, *args, **kwargs):\n", - " for f in L(funcs): x = f(x, *args, **kwargs)\n", - " return x\n", - " return _inner" - ] - }, - { - "cell_type": "code", - "execution_count": null, - "metadata": {}, - "outputs": [], - "source": [ - "f1 = lambda o,p=0: (o*2)+p\n", - "f2 = lambda o,p=1: (o+1)/p\n", - "test_eq(f2(f1(3)), compose(f1,f2)(3))\n", - "test_eq(f2(f1(3,p=3),p=3), compose(f1,f2)(3,p=3))\n", - "test_eq(f2(f1(3, 3), 3), compose(f1,f2)(3, 3))\n", - "\n", - "f1.order = 1\n", - "test_eq(f1(f2(3)), compose(f1,f2, order=\"order\")(3))" - ] - }, - { - "cell_type": "code", - "execution_count": null, - "metadata": {}, - "outputs": [], - "source": [ - "#export\n", - "def maps(*args, retain=noop):\n", - " \"Like `map`, except funcs 
are composed first\"\n", - " f = compose(*args[:-1])\n", - " def _f(b): return retain(f(b), b)\n", - " return map(_f, args[-1])" - ] - }, - { - "cell_type": "code", - "execution_count": null, - "metadata": {}, - "outputs": [], - "source": [ - "test_eq(maps([1]), [1])\n", - "test_eq(maps(operator.neg, [1,2]), [-1,-2])\n", - "test_eq(maps(operator.neg, operator.neg, [1,2]), [1,2])" - ] - }, - { - "cell_type": "code", - "execution_count": null, - "metadata": {}, - "outputs": [], - "source": [ - "#export\n", - "def partialler(f, *args, order=None, **kwargs):\n", - " \"Like `functools.partial` but also copies over docstring\"\n", - " fnew = partial(f,*args,**kwargs)\n", - " fnew.__doc__ = f.__doc__\n", - " if order is not None: fnew.order=order\n", - " elif hasattr(f,'order'): fnew.order=f.order\n", - " return fnew" - ] - }, - { - "cell_type": "code", - "execution_count": null, - "metadata": {}, - "outputs": [], - "source": [ - "def _f(x,a=1):\n", - " \"test func\"\n", - " return x-a\n", - "_f.order=1\n", - "\n", - "f = partialler(_f, 2)\n", - "test_eq(f.order, 1)\n", - "test_eq(f(3), -1)\n", - "f = partialler(_f, a=2, order=3)\n", - "test_eq(f.__doc__, \"test func\")\n", - "test_eq(f.order, 3)\n", - "test_eq(f(3), _f(3,2))" - ] - }, - { - "cell_type": "code", - "execution_count": null, - "metadata": {}, - "outputs": [], - "source": [ - "class partial0:\n", - " \"Like `partialler`, but args passed to callable are inserted at started, instead of at end\"\n", - " def __init__(self, f, *args, order=None, **kwargs):\n", - " self.f,self.args,self.kwargs = f,args,kwargs\n", - " self.order = ifnone(order, getattr(f,'order',None))\n", - " self.__doc__ = f.__doc__\n", - "\n", - " def __call__(self, *args, **kwargs): return self.f(*args, *self.args, **kwargs, **self.kwargs)" - ] - }, - { - "cell_type": "code", - "execution_count": null, - "metadata": {}, - "outputs": [], - "source": [ - "f = partial0(_f, 2)\n", - "test_eq(f.order, 1)\n", - "test_eq(f(3), 1) # NB: different to 
`partialler` example" - ] - }, - { - "cell_type": "code", - "execution_count": null, - "metadata": {}, - "outputs": [], - "source": [ - "#export\n", - "def mapped(f, it):\n", - " \"map `f` over `it`, unless it's not listy, in which case return `f(it)`\"\n", - " return L(it).map(f) if is_listy(it) else f(it)" - ] - }, - { - "cell_type": "code", - "execution_count": null, - "metadata": {}, - "outputs": [], - "source": [ - "test_eq(mapped(_f,1),0)\n", - "test_eq(mapped(_f,[1,2]),[0,1])\n", - "test_eq(mapped(_f,(1,)),(0,))" - ] - }, - { - "cell_type": "code", - "execution_count": null, - "metadata": {}, - "outputs": [], - "source": [ - "#export\n", - "def instantiate(t):\n", - " \"Instantiate `t` if it's a type, otherwise do nothing\"\n", - " return t() if isinstance(t, type) else t" - ] - }, - { - "cell_type": "code", - "execution_count": null, - "metadata": {}, - "outputs": [], - "source": [ - "test_eq_type(instantiate(int), 0)\n", - "test_eq_type(instantiate(1), 1)" - ] - }, - { - "cell_type": "code", - "execution_count": null, - "metadata": {}, - "outputs": [], - "source": [ - "#export\n", - "def _using_attr(f, attr, x): return f(getattr(x,attr))" - ] - }, - { - "cell_type": "code", - "execution_count": null, - "metadata": {}, - "outputs": [], - "source": [ - "#export\n", - "def using_attr(f, attr):\n", - " \"Change function `f` to operate on `attr`\"\n", - " return partial(_using_attr, f, attr)" - ] - }, - { - "cell_type": "code", - "execution_count": null, - "metadata": {}, - "outputs": [], - "source": [ - "t = Path('/a/b.txt')\n", - "f = using_attr(str.upper, 'name')\n", - "test_eq(f(t), 'B.TXT')" - ] - }, - { - "cell_type": "markdown", - "metadata": {}, - "source": [ - "### Self (with an _uppercase_ S)\n", - "\n", - "A Concise Way To Create Lambdas" - ] - }, - { - "cell_type": "code", - "execution_count": null, - "metadata": {}, - "outputs": [], - "source": [ - "#export\n", - "class _Self:\n", - " \"An alternative to `lambda` for calling methods on passed 
object.\"\n", - " def __init__(self): self.nms,self.args,self.kwargs,self.ready = [],[],[],True\n", - " def __repr__(self): return f'self: {self.nms}({self.args}, {self.kwargs})'\n", - "\n", - " def __call__(self, *args, **kwargs):\n", - " if self.ready:\n", - " x = args[0]\n", - " for n,a,k in zip(self.nms,self.args,self.kwargs):\n", - " x = getattr(x,n)\n", - " if callable(x) and a is not None: x = x(*a, **k)\n", - " return x\n", - " else:\n", - " self.args.append(args)\n", - " self.kwargs.append(kwargs)\n", - " self.ready = True\n", - " return self\n", - "\n", - " def __getattr__(self,k):\n", - " if not self.ready:\n", - " self.args.append(None)\n", - " self.kwargs.append(None)\n", - " self.nms.append(k)\n", - " self.ready = False\n", - " return self" - ] - }, - { - "cell_type": "code", - "execution_count": null, - "metadata": {}, - "outputs": [], - "source": [ - "#export\n", - "class _SelfCls:\n", - " def __getattr__(self,k): return getattr(_Self(),k)\n", - " def __getitem__(self,i): return self.__getattr__('__getitem__')(i)\n", - "\n", - "Self = _SelfCls()" - ] - }, - { - "cell_type": "code", - "execution_count": null, - "metadata": {}, - "outputs": [], - "source": [ - "#export\n", - "_all_ = ['Self']" - ] - }, - { - "cell_type": "markdown", - "metadata": {}, - "source": [ - "This is a concise way to create lambdas that are calling methods on an object (note the capitalization!)\n", - "\n", - "`Self.sum()`, for instance, is a shortcut for `lambda o: o.sum()`." 
- ] - }, - { - "cell_type": "code", - "execution_count": null, - "metadata": {}, - "outputs": [], - "source": [ - "f = Self.sum()\n", - "x = array([3.,1])\n", - "test_eq(f(x), 4.)\n", - "\n", - "# This is equivalent to above\n", - "f = lambda o: o.sum()\n", - "x = array([3.,1])\n", - "test_eq(f(x), 4.)\n", - "\n", - "f = Self.argmin()\n", - "arr = np.array([1,2,3,4,5])\n", - "test_eq(f(arr), arr.argmin())\n", - "\n", - "f = Self.sum().is_integer()\n", - "x = array([3.,1])\n", - "test_eq(f(x), True)\n", - "\n", - "f = Self.sum().real.is_integer()\n", - "x = array([3.,1])\n", - "test_eq(f(x), True)\n", - "\n", - "f = Self.imag()\n", - "test_eq(f(3), 0)\n", - "\n", - "f = Self[1]\n", - "test_eq(f(x), 1)" - ] - }, - { - "cell_type": "markdown", - "metadata": {}, - "source": [ - "## Extensions to Pathlib.Path" - ] - }, - { - "cell_type": "markdown", - "metadata": {}, - "source": [ - "An extension of the standard python libary [Pathlib.Path](https://docs.python.org/3/library/pathlib.html#basic-use). These extensions are accomplished by monkey patching additional methods onto `Pathlib.Path`." 
- ] - }, - { - "cell_type": "code", - "execution_count": null, - "metadata": {}, - "outputs": [], - "source": [ - "#export\n", - "@patch\n", - "def readlines(self:Path, hint=-1, encoding='utf8'):\n", - " \"Read the content of `self`\"\n", - " with self.open(encoding=encoding) as f: return f.readlines(hint)" - ] - }, - { - "cell_type": "code", - "execution_count": null, - "metadata": {}, - "outputs": [], - "source": [ - "#export\n", - "@patch\n", - "def mk_write(self:Path, data, encoding=None, errors=None, mode=511):\n", - " \"Make all parent dirs of `self`\"\n", - " self.parent.mkdir(exist_ok=True, parents=True, mode=mode)\n", - " self.write_text(data, encoding=encoding, errors=errors)" - ] - }, - { - "cell_type": "code", - "execution_count": null, - "metadata": {}, - "outputs": [], - "source": [ - "#export\n", - "@patch\n", - "def ls(self:Path, n_max=None, file_type=None, file_exts=None):\n", - " \"Contents of path as a list\"\n", - " extns=L(file_exts)\n", - " if file_type: extns += L(k for k,v in mimetypes.types_map.items() if v.startswith(file_type+'/'))\n", - " has_extns = len(extns)==0\n", - " res = (o for o in self.iterdir() if has_extns or o.suffix in extns)\n", - " if n_max is not None: res = itertools.islice(res, n_max)\n", - " return L(res)" - ] - }, - { - "cell_type": "markdown", - "metadata": {}, - "source": [ - "We add an `ls()` method to `pathlib.Path` which is simply defined as `list(Path.iterdir())`, mainly for convenience in REPL environments such as notebooks." 
- ] - }, - { - "cell_type": "code", - "execution_count": null, - "metadata": {}, - "outputs": [ - { - "data": { - "text/plain": [ - "Path('.ipynb_checkpoints')" - ] - }, - "execution_count": null, - "metadata": {}, - "output_type": "execute_result" - } - ], - "source": [ - "path = Path()\n", - "t = path.ls()\n", - "assert len(t)>0\n", - "t1 = path.ls(10)\n", - "test_eq(len(t1), 10)\n", - "t2 = path.ls(file_exts='.ipynb')\n", - "assert len(t)>len(t2)\n", - "t[0]" - ] - }, - { - "cell_type": "markdown", - "metadata": {}, - "source": [ - "You can also pass an optional `file_type` MIME prefix and/or a list of file extensions." - ] - }, - { - "cell_type": "code", - "execution_count": null, - "metadata": {}, - "outputs": [ - { - "data": { - "text/plain": [ - "(Path('../fastcore/logargs.py'), Path('04_transform.ipynb'))" - ] - }, - "execution_count": null, - "metadata": {}, - "output_type": "execute_result" - } - ], - "source": [ - "lib_path = (path/'../fastcore')\n", - "txt_files=lib_path.ls(file_type='text')\n", - "assert len(txt_files) > 0 and txt_files[0].suffix=='.py'\n", - "ipy_files=path.ls(file_exts=['.ipynb'])\n", - "assert len(ipy_files) > 0 and ipy_files[0].suffix=='.ipynb'\n", - "txt_files[0],ipy_files[0]" - ] - }, - { - "cell_type": "code", - "execution_count": null, - "metadata": {}, - "outputs": [], - "source": [ - "#hide\n", - "path = Path()\n", - "pkl = pickle.dumps(path)\n", - "p2 = pickle.loads(pkl)\n", - "test_eq(path.ls()[0], p2.ls()[0])" - ] - }, - { - "cell_type": "code", - "execution_count": null, - "metadata": {}, - "outputs": [], - "source": [ - "#export\n", - "def open_file(fn, mode='r'):\n", - " \"Open a file, with optional compression if gz or bz2 suffix\"\n", - " if isinstance(fn, io.IOBase): return fn\n", - " fn = Path(fn)\n", - " if fn.suffix=='.bz2': return bz2.BZ2File(fn, mode)\n", - " elif fn.suffix=='.gz' : return gzip.GzipFile(fn, mode)\n", - " else: return open(fn,mode)" - ] - }, - { - "cell_type": "code", - "execution_count": null, - 
"metadata": {}, - "outputs": [], - "source": [ - "#export\n", - "def save_pickle(fn, o):\n", - " \"Save a pickle file, to a file name or opened file\"\n", - " with open_file(fn, 'wb') as f: pickle.dump(o, f)" - ] - }, - { - "cell_type": "code", - "execution_count": null, - "metadata": {}, - "outputs": [], - "source": [ - "#export\n", - "def load_pickle(fn):\n", - " \"Load a pickle file from a file name or opened file\"\n", - " with open_file(fn, 'rb') as f: return pickle.load(f)" - ] - }, - { - "cell_type": "code", - "execution_count": null, - "metadata": {}, - "outputs": [], - "source": [ - "for suf in '.pkl','.bz2','.gz':\n", - " with tempfile.NamedTemporaryFile(suffix=suf) as f:\n", - " fn = Path(f.name)\n", - " save_pickle(fn, 't')\n", - " t = load_pickle(fn)\n", - " test_eq(t,'t')" - ] - }, - { - "cell_type": "code", - "execution_count": null, - "metadata": {}, - "outputs": [], - "source": [ - "#export\n", - "@patch\n", - "def __repr__(self:Path):\n", - " b = getattr(Path, 'BASE_PATH', None)\n", - " if b:\n", - " try: self = self.relative_to(b)\n", - " except: pass\n", - " return f\"Path({self.as_posix()!r})\"" - ] - }, - { - "cell_type": "markdown", - "metadata": {}, - "source": [ - "fastai also updates the `repr` of `Path` such that, if `Path.BASE_PATH` is defined, all paths are printed relative to that path (as long as they are contained in `Path.BASE_PATH`:" - ] - }, - { - "cell_type": "code", - "execution_count": null, - "metadata": {}, - "outputs": [], - "source": [ - "t = ipy_files[0].absolute()\n", - "try:\n", - " Path.BASE_PATH = t.parent.parent\n", - " test_eq(repr(t), f\"Path('nbs/{t.name}')\")\n", - "finally: Path.BASE_PATH = None" - ] - }, - { - "cell_type": "markdown", - "metadata": {}, - "source": [ - "## File Functions\n", - "\n", - "Utilities (other than extensions to Pathlib.Path) for dealing with IO." 
- ] - }, - { - "cell_type": "code", - "execution_count": null, - "metadata": {}, - "outputs": [], - "source": [ - "#export\n", - "def bunzip(fn):\n", - " \"bunzip `fn`, raising exception if output already exists\"\n", - " fn = Path(fn)\n", - " assert fn.exists(), f\"{fn} doesn't exist\"\n", - " out_fn = fn.with_suffix('')\n", - " assert not out_fn.exists(), f\"{out_fn} already exists\"\n", - " with bz2.BZ2File(fn, 'rb') as src, out_fn.open('wb') as dst:\n", - " for d in iter(lambda: src.read(1024*1024), b''): dst.write(d)" - ] - }, - { - "cell_type": "code", - "execution_count": null, - "metadata": {}, - "outputs": [], - "source": [ - "f = Path('files/test.txt')\n", - "if f.exists(): f.unlink()\n", - "bunzip('files/test.txt.bz2')\n", - "t = f.open().readlines()\n", - "test_eq(len(t),1)\n", - "test_eq(t[0], 'test\\n')\n", - "f.unlink()" - ] - }, - { - "cell_type": "code", - "execution_count": null, - "metadata": {}, - "outputs": [], - "source": [ - "#export\n", - "def join_path_file(file, path, ext=''):\n", - " \"Return `path/file` if file is a string or a `Path`, file otherwise\"\n", - " if not isinstance(file, (str, Path)): return file\n", - " path.mkdir(parents=True, exist_ok=True)\n", - " return path/f'{file}{ext}'" - ] - }, - { - "cell_type": "code", - "execution_count": null, - "metadata": {}, - "outputs": [], - "source": [ - "path = Path.cwd()/'_tmp'/'tst'\n", - "f = join_path_file('tst.txt', path)\n", - "assert path.exists()\n", - "test_eq(f, path/'tst.txt')\n", - "with open(f, 'w') as f_: assert join_path_file(f_, path) == f_\n", - "shutil.rmtree(Path.cwd()/'_tmp')" - ] - }, - { - "cell_type": "code", - "execution_count": null, - "metadata": {}, - "outputs": [], - "source": [ - "#export\n", - "def urlread(url, data=None, **kwargs):\n", - " \"Retrieve `url`, using `data` dict or `kwargs` to `POST` if present\"\n", - " if kwargs and not data: data=kwargs\n", - " if data is not None:\n", - " if not isinstance(data, (str,bytes)): data = urlencode(data)\n", - " 
if not isinstance(data, bytes): data = data.encode('ascii')\n", - " cls = urllib.request.Request\n", - " if not isinstance(url,cls): url = cls(url)\n", - " url.headers['User-Agent'] = 'Mozilla/5.0'\n", - " with urlopen(url, data=data) as res: return res.read()" - ] - }, - { - "cell_type": "code", - "execution_count": null, - "metadata": {}, - "outputs": [], - "source": [ - "#export\n", - "def urljson(url, data=None):\n", - " \"Retrieve `url` and decode json\"\n", - " return json.loads(urlread(url, data=data))" - ] - }, - { - "cell_type": "code", - "execution_count": null, - "metadata": {}, - "outputs": [], - "source": [ - "#export\n", - "def run(cmd, *rest, ignore_ex=False, as_bytes=False):\n", - " \"Pass `cmd` (splitting with `shlex` if string) to `subprocess.run`; return `stdout`; raise `IOError` if fails\"\n", - " if rest: cmd = (cmd,)+rest\n", - " elif isinstance(cmd,str): cmd = shlex.split(cmd)\n", - " res = subprocess.run(cmd, capture_output=True)\n", - " stdout = res.stdout\n", - " if not as_bytes: stdout = stdout.decode()\n", - " if ignore_ex: return (res.returncode, stdout)\n", - " if res.returncode: raise IOError(\"{} ;; {}\".format(res.stdout, res.stderr))\n", - " return stdout" - ] - }, - { - "cell_type": "markdown", - "metadata": {}, - "source": [ - "You can pass a string (which will be split based on standard shell rules), a list, or pass args directly:" - ] - }, - { - "cell_type": "code", - "execution_count": null, - "metadata": {}, - "outputs": [], - "source": [ - "assert 'ipynb' in run('ls -l')\n", - "assert 'ipynb' in run(['ls', '-l'])\n", - "assert 'ipynb' in run('ls', '-l')" - ] - }, - { - "cell_type": "markdown", - "metadata": {}, - "source": [ - "Some commands fail in non-error situations, like `grep`. 
Use `ignore_ex` in those cases, which will return a tuple of stdout and returncode:" - ] - }, - { - "cell_type": "code", - "execution_count": null, - "metadata": {}, - "outputs": [], - "source": [ - "test_eq(run('grep asdfds 00_test.ipynb', ignore_ex=True)[0], 1)" - ] - }, - { - "cell_type": "markdown", - "metadata": {}, - "source": [ - "`run` automatically decodes returned bytes to a `str`. Use `as_bytes` to skip that:" - ] - }, - { - "cell_type": "code", - "execution_count": null, - "metadata": {}, - "outputs": [], - "source": [ - "test_eq(run('echo hi', as_bytes=True), b'hi\\n')" - ] - }, - { - "cell_type": "code", - "execution_count": null, - "metadata": {}, - "outputs": [], - "source": [ - "#export\n", - "def do_request(url, post=False, headers=None, **data):\n", - " \"Call GET or json-encoded POST on `url`, depending on `post`\"\n", - " if data:\n", - " if post: data = json.dumps(data).encode('ascii')\n", - " else:\n", - " url += \"?\" + urlencode(data)\n", - " data = None\n", - " return urljson(Request(url, headers=headers, data=data or None))" - ] - }, - { - "cell_type": "markdown", - "metadata": {}, - "source": [ - "## Sorting Objects From Before/After" - ] - }, - { - "cell_type": "markdown", - "metadata": {}, - "source": [ - "Transforms and callbacks will have run_after/run_before attributes, this function will sort them to respect those requirements (if it's possible). Also, sometimes we want a tranform/callback to be run at the end, but still be able to use run_after/run_before behaviors. For those, the function checks for a toward_end attribute (that needs to be True)." 
- ] - }, - { - "cell_type": "code", - "execution_count": null, - "metadata": {}, - "outputs": [], - "source": [ - "#export\n", - "def _is_instance(f, gs):\n", - " tst = [g if type(g) in [type, 'function'] else g.__class__ for g in gs]\n", - " for g in tst:\n", - " if isinstance(f, g) or f==g: return True\n", - " return False\n", - "\n", - "def _is_first(f, gs):\n", - " for o in L(getattr(f, 'run_after', None)):\n", - " if _is_instance(o, gs): return False\n", - " for g in gs:\n", - " if _is_instance(f, L(getattr(g, 'run_before', None))): return False\n", - " return True\n", - "\n", - "def sort_by_run(fs):\n", - " end = L(fs).attrgot('toward_end')\n", - " inp,res = L(fs)[~end] + L(fs)[end], L()\n", - " while len(inp):\n", - " for i,o in enumerate(inp):\n", - " if _is_first(o, inp):\n", - " res.append(inp.pop(i))\n", - " break\n", - " else: raise Exception(\"Impossible to sort\")\n", - " return res" - ] - }, - { - "cell_type": "code", - "execution_count": null, - "metadata": {}, - "outputs": [], - "source": [ - "class Tst(): pass \n", - "class Tst1():\n", - " run_before=[Tst]\n", - "class Tst2():\n", - " run_before=Tst\n", - " run_after=Tst1\n", - " \n", - "tsts = [Tst(), Tst1(), Tst2()]\n", - "test_eq(sort_by_run(tsts), [tsts[1], tsts[2], tsts[0]])\n", - "\n", - "Tst2.run_before,Tst2.run_after = Tst1,Tst\n", - "test_fail(lambda: sort_by_run([Tst(), Tst1(), Tst2()]))\n", - "\n", - "def tst1(x): return x\n", - "tst1.run_before = Tst\n", - "test_eq(sort_by_run([tsts[0], tst1]), [tst1, tsts[0]])\n", - " \n", - "class Tst1():\n", - " toward_end=True\n", - "class Tst2():\n", - " toward_end=True\n", - " run_before=Tst1\n", - "tsts = [Tst(), Tst1(), Tst2()]\n", - "test_eq(sort_by_run(tsts), [tsts[0], tsts[2], tsts[1]])" - ] - }, - { - "cell_type": "markdown", - "metadata": {}, - "source": [ - "## Other Helpers" - ] - }, - { - "cell_type": "code", - "execution_count": null, - "metadata": {}, - "outputs": [], - "source": [ - "#export\n", - "class PrettyString(str):\n", - " 
\"Little hack to get strings to show properly in Jupyter.\"\n", - " def __repr__(self): return self" - ] - }, - { - "cell_type": "code", - "execution_count": null, - "metadata": {}, - "outputs": [ - { - "data": { - "text/markdown": [ - "

class PrettyString[source]

\n", - "\n", - "> PrettyString() :: `str`\n", - "\n", - "Little hack to get strings to show properly in Jupyter." - ], - "text/plain": [ - "" - ] - }, - "metadata": {}, - "output_type": "display_data" - } - ], - "source": [ - "show_doc(PrettyString, title_level=4)" - ] - }, - { - "cell_type": "markdown", - "metadata": {}, - "source": [ - "Allow strings with special characters to render properly in Jupyter. Without calling `print()` strings with special characters are displayed like so:" - ] - }, - { - "cell_type": "code", - "execution_count": null, - "metadata": {}, - "outputs": [ - { - "data": { - "text/plain": [ - "'a string\\nwith\\nnew\\nlines and\\ttabs'" - ] - }, - "execution_count": null, - "metadata": {}, - "output_type": "execute_result" - } - ], - "source": [ - "with_special_chars='a string\\nwith\\nnew\\nlines and\\ttabs'\n", - "with_special_chars" - ] - }, - { - "cell_type": "markdown", - "metadata": {}, - "source": [ - "We can correct this with `PrettyString`:" - ] - }, - { - "cell_type": "code", - "execution_count": null, - "metadata": {}, - "outputs": [ - { - "data": { - "text/plain": [ - "a string\n", - "with\n", - "new\n", - "lines and\ttabs" - ] - }, - "execution_count": null, - "metadata": {}, - "output_type": "execute_result" - } - ], - "source": [ - "PrettyString(with_special_chars)" - ] - }, - { - "cell_type": "code", - "execution_count": null, - "metadata": {}, - "outputs": [], - "source": [ - "#export\n", - "def round_multiple(x, mult, round_down=False):\n", - " \"Round `x` to nearest multiple of `mult`\"\n", - " def _f(x_): return (int if round_down else round)(x_/mult)*mult\n", - " res = L(x).map(_f)\n", - " return res if is_listy(x) else res[0]" + "test_eq_type(fastuple(1,1).mul(2), fastuple(2,2))" ] }, { - "cell_type": "code", - "execution_count": null, + "cell_type": "markdown", "metadata": {}, - "outputs": [], "source": [ - "test_eq(round_multiple(63,32), 64)\n", - "test_eq(round_multiple(50,32), 64)\n", - 
"test_eq(round_multiple(40,32), 32)\n", - "test_eq(round_multiple( 0,32), 0)\n", - "test_eq(round_multiple(63,32, round_down=True), 32)\n", - "test_eq(round_multiple((63,40),32), (64,32))" + "#### Other Elementwise Operations\n", + "\n", + "Additionally, the following elementwise operations are available:\n", + "- `le`: less than\n", + "- `eq`: equal\n", + "- `gt`: greater than\n", + "- `min`: minimum of" ] }, { @@ -3676,24 +2213,17 @@ "metadata": {}, "outputs": [], "source": [ - "#export\n", - "def even_mults(start, stop, n):\n", - " \"Build log-stepped array from `start` to `stop` in `n` steps.\"\n", - " if n==1: return stop\n", - " mult = stop/start\n", - " step = mult**(1/(n-1))\n", - " return [start*(step**i) for i in range(n)]" + "test_eq(fastuple(3,1).le(1), (False, True))\n", + "test_eq(fastuple(3,1).eq(1), (False, True))\n", + "test_eq(fastuple(3,1).gt(1), (True, False))\n", + "test_eq(fastuple(3,1).min(2), (2,1))" ] }, { - "cell_type": "code", - "execution_count": null, + "cell_type": "markdown", "metadata": {}, - "outputs": [], "source": [ - "test_eq(even_mults(2,8,3), [2,4,8])\n", - "test_eq(even_mults(2,32,5), [2,4,8,16,32])\n", - "test_eq(even_mults(2,8,1), 8)" + "You can also do other elemntwise operations like negate a `fastuple`, or subtract two `fastuple`s:" ] }, { @@ -3702,33 +2232,10 @@ "metadata": {}, "outputs": [], "source": [ - "#export\n", - "def num_cpus():\n", - " \"Get number of cpus\"\n", - " try: return len(os.sched_getaffinity(0))\n", - " except AttributeError: return os.cpu_count()\n", + "test_eq(-fastuple(1,2), (-1,-2))\n", + "test_eq(~fastuple(1,0,1), (False,True,False))\n", "\n", - "defaults.cpus = num_cpus()" - ] - }, - { - "cell_type": "code", - "execution_count": null, - "metadata": {}, - "outputs": [ - { - "data": { - "text/plain": [ - "64" - ] - }, - "execution_count": null, - "metadata": {}, - "output_type": "execute_result" - } - ], - "source": [ - "num_cpus()" + "test_eq(fastuple(1,1)-fastuple(2,2), (-1,-1))" ] }, { @@ 
-3737,24 +2244,19 @@ "metadata": {}, "outputs": [], "source": [ - "#export\n", - "def add_props(f, g=None, n=2):\n", - " \"Create properties passing each of `range(n)` to f\"\n", - " if g is None: return (property(partial(f,i)) for i in range(n))\n", - " return (property(partial(f,i), partial(g,i)) for i in range(n))" + "test_eq(type(fastuple(1)), fastuple)\n", + "test_eq_type(fastuple(1,2), fastuple(1,2))\n", + "test_ne(fastuple(1,2), fastuple(1,3))\n", + "test_eq(fastuple(), ())" ] }, { - "cell_type": "code", - "execution_count": null, + "cell_type": "markdown", "metadata": {}, - "outputs": [], "source": [ - "class _T(): a,b = add_props(lambda i,x:i*2)\n", + "## Functions on Functions\n", "\n", - "t = _T()\n", - "test_eq(t.a,0)\n", - "test_eq(t.b,2)" + "Utilities for functional programming or for defining, modifying, or debugging functions. " ] }, { @@ -3763,18 +2265,17 @@ "metadata": {}, "outputs": [], "source": [ - "class _T(): \n", - " def __init__(self, v): self.v=v\n", - " def _set(i, self, v): self.v[i] = v\n", - " a,b = add_props(lambda i,x: x.v[i], _set)\n", - "\n", - "t = _T([0,2])\n", - "test_eq(t.a,0)\n", - "test_eq(t.b,2)\n", - "t.a = t.a+1\n", - "t.b = 3\n", - "test_eq(t.a,1)\n", - "test_eq(t.b,3)" + "# export\n", + "def compose(*funcs, order=None):\n", + " \"Create a function that composes all functions in `funcs`, passing along remaining `*args` and `**kwargs` to all\"\n", + " funcs = listify(funcs)\n", + " if len(funcs)==0: return noop\n", + " if len(funcs)==1: return funcs[0]\n", + " if order is not None: funcs = sorted_ex(funcs, key=order)\n", + " def _inner(x, *args, **kwargs):\n", + " for f in funcs: x = f(x, *args, **kwargs)\n", + " return x\n", + " return _inner" ] }, { @@ -3783,8 +2284,14 @@ "metadata": {}, "outputs": [], "source": [ - "# export\n", - "from contextlib import ExitStack" + "f1 = lambda o,p=0: (o*2)+p\n", + "f2 = lambda o,p=1: (o+1)/p\n", + "test_eq(f2(f1(3)), compose(f1,f2)(3))\n", + "test_eq(f2(f1(3,p=3),p=3), 
compose(f1,f2)(3,p=3))\n", + "test_eq(f2(f1(3, 3), 3), compose(f1,f2)(3, 3))\n", + "\n", + "f1.order = 1\n", + "test_eq(f1(f2(3)), compose(f1,f2, order=\"order\")(3))" ] }, { @@ -3794,37 +2301,22 @@ "outputs": [], "source": [ "#export\n", - "class ContextManagers(GetAttr):\n", - " \"Wrapper for `contextlib.ExitStack` which enters a collection of context managers\"\n", - " def __init__(self, mgrs): self.default,self.stack = L(mgrs),ExitStack()\n", - " def __enter__(self): self.default.map(self.stack.enter_context)\n", - " def __exit__(self, *args, **kwargs): self.stack.__exit__(*args, **kwargs)" + "def maps(*args, retain=noop):\n", + " \"Like `map`, except funcs are composed first\"\n", + " f = compose(*args[:-1])\n", + " def _f(b): return retain(f(b), b)\n", + " return map(_f, args[-1])" ] }, { "cell_type": "code", "execution_count": null, "metadata": {}, - "outputs": [ - { - "data": { - "text/markdown": [ - "

class ContextManagers[source]

\n", - "\n", - "> ContextManagers(**`mgrs`**) :: [`GetAttr`](/foundation.html#GetAttr)\n", - "\n", - "Wrapper for `contextlib.ExitStack` which enters a collection of context managers" - ], - "text/plain": [ - "" - ] - }, - "metadata": {}, - "output_type": "display_data" - } - ], + "outputs": [], "source": [ - "show_doc(ContextManagers, title_level=4)" + "test_eq(maps([1]), [1])\n", + "test_eq(maps(operator.neg, [1,2]), [-1,-2])\n", + "test_eq(maps(operator.neg, operator.neg, [1,2]), [1,2])" ] }, { @@ -3834,7 +2326,13 @@ "outputs": [], "source": [ "#export\n", - "def _typeerr(arg, val, typ): return TypeError(f\"{arg}=={val} not {typ}\")" + "def partialler(f, *args, order=None, **kwargs):\n", + " \"Like `functools.partial` but also copies over docstring\"\n", + " fnew = partial(f,*args,**kwargs)\n", + " fnew.__doc__ = f.__doc__\n", + " if order is not None: fnew.order=order\n", + " elif hasattr(f,'order'): fnew.order=f.order\n", + " return fnew" ] }, { @@ -3843,31 +2341,34 @@ "metadata": {}, "outputs": [], "source": [ - "#export\n", - "def typed(f):\n", - " \"Decorator to check param and return types at runtime\"\n", - " names = f.__code__.co_varnames\n", - " anno = f.__annotations__\n", - " ret = anno.pop('return',None)\n", - " def _f(*args,**kwargs):\n", - " kw = {**kwargs}\n", - " if len(anno) > 0:\n", - " for i,arg in enumerate(args): kw[names[i]] = arg\n", - " for k,v in kw.items():\n", - " if not isinstance(v,anno[k]): raise _typeerr(k, v, anno[k])\n", - " res = f(*args,**kwargs)\n", - " if ret is not None and not isinstance(res,ret): raise _typeerr(\"return\", res, ret)\n", - " return res\n", - " return functools.update_wrapper(_f, f)" + "def _f(x,a=1):\n", + " \"test func\"\n", + " return x-a\n", + "_f.order=1\n", + "\n", + "f = partialler(_f, 2)\n", + "test_eq(f.order, 1)\n", + "test_eq(f(3), -1)\n", + "f = partialler(_f, a=2, order=3)\n", + "test_eq(f.__doc__, \"test func\")\n", + "test_eq(f.order, 3)\n", + "test_eq(f(3), _f(3,2))" ] }, { - "cell_type": 
"markdown", + "cell_type": "code", + "execution_count": null, "metadata": {}, + "outputs": [], "source": [ - "`typed` validates argument types at **runtime**. This is in contrast to [MyPy](http://mypy-lang.org/) which only offers static type checking.\n", + "class partial0:\n", + " \"Like `partialler`, but args passed to callable are inserted at started, instead of at end\"\n", + " def __init__(self, f, *args, order=None, **kwargs):\n", + " self.f,self.args,self.kwargs = f,args,kwargs\n", + " self.order = ifnone(order, getattr(f,'order',None))\n", + " self.__doc__ = f.__doc__\n", "\n", - "For example, a `TypeError` will be raised if we try to pass an integer into the first argument of the below function: " + " def __call__(self, *args, **kwargs): return self.f(*args, *self.args, **kwargs, **self.kwargs)" ] }, { @@ -3876,18 +2377,21 @@ "metadata": {}, "outputs": [], "source": [ - "@typed\n", - "def discount(price:int, pct:float): \n", - " return (1-pct) * price\n", - "\n", - "with ExceptionExpected(TypeError): discount(100.0, .1)" + "f = partial0(_f, 2)\n", + "test_eq(f.order, 1)\n", + "test_eq(f(3), 1) # NB: different to `partialler` example" ] }, { - "cell_type": "markdown", + "cell_type": "code", + "execution_count": null, "metadata": {}, + "outputs": [], "source": [ - "We can also optionally allow multiple types by enumarating the types in a tuple as illustrated below:" + "#export\n", + "def instantiate(t):\n", + " \"Instantiate `t` if it's a type, otherwise do nothing\"\n", + " return t() if isinstance(t, type) else t" ] }, { @@ -3896,10 +2400,8 @@ "metadata": {}, "outputs": [], "source": [ - "def discount(price:(int,float), pct:float): \n", - " return (1-pct) * price\n", - "\n", - "assert 90.0 == discount(100.0, .1)" + "test_eq_type(instantiate(int), 0)\n", + "test_eq_type(instantiate(1), 1)" ] }, { @@ -3908,19 +2410,8 @@ "metadata": {}, "outputs": [], "source": [ - "@typed\n", - "def foo(a:int, b:str='a'): return a\n", - "test_eq(foo(1, '2'), 1)\n", - "\n", - 
"with ExceptionExpected(TypeError): foo(1,2)\n", - "\n", - "@typed\n", - "def foo()->str: return 1\n", - "with ExceptionExpected(TypeError): foo()\n", - "\n", - "@typed\n", - "def foo()->str: return '1'\n", - "assert foo()" + "#export\n", + "def _using_attr(f, attr, x): return f(getattr(x,attr))" ] }, { @@ -3930,10 +2421,9 @@ "outputs": [], "source": [ "#export\n", - "def str2bool(s):\n", - " \"Case-insensitive convert string `s` too a bool (`y`,`yes`,`t`,`true`,`on`,`1`->`True`)\"\n", - " if not isinstance(s,str): return bool(s)\n", - " return bool(distutils.util.strtobool(s)) if s else False" + "def using_attr(f, attr):\n", + " \"Change function `f` to operate on `attr`\"\n", + " return partial(_using_attr, f, attr)" ] }, { @@ -3942,17 +2432,52 @@ "metadata": {}, "outputs": [], "source": [ - "for o in \"y YES t True on 1\".split(): assert str2bool(o)\n", - "for o in \"n no FALSE off 0\".split(): assert not str2bool(o)\n", - "for o in 0,None,'',False: assert not str2bool(o)\n", - "for o in 1,True: assert str2bool(o)" + "t = Path('/a/b.txt')\n", + "f = using_attr(str.upper, 'name')\n", + "test_eq(f(t), 'B.TXT')" ] }, { "cell_type": "markdown", "metadata": {}, "source": [ - "## Multiprocessing" + "### Self (with an _uppercase_ S)\n", + "\n", + "A Concise Way To Create Lambdas" + ] + }, + { + "cell_type": "code", + "execution_count": null, + "metadata": {}, + "outputs": [], + "source": [ + "#export\n", + "class _Self:\n", + " \"An alternative to `lambda` for calling methods on passed object.\"\n", + " def __init__(self): self.nms,self.args,self.kwargs,self.ready = [],[],[],True\n", + " def __repr__(self): return f'self: {self.nms}({self.args}, {self.kwargs})'\n", + "\n", + " def __call__(self, *args, **kwargs):\n", + " if self.ready:\n", + " x = args[0]\n", + " for n,a,k in zip(self.nms,self.args,self.kwargs):\n", + " x = getattr(x,n)\n", + " if callable(x) and a is not None: x = x(*a, **k)\n", + " return x\n", + " else:\n", + " self.args.append(args)\n", + " 
self.kwargs.append(kwargs)\n", + " self.ready = True\n", + " return self\n", + "\n", + " def __getattr__(self,k):\n", + " if not self.ready:\n", + " self.args.append(None)\n", + " self.kwargs.append(None)\n", + " self.nms.append(k)\n", + " self.ready = False\n", + " return self" ] }, { @@ -3962,10 +2487,11 @@ "outputs": [], "source": [ "#export\n", - "from multiprocessing import Process, Queue\n", - "import concurrent.futures\n", - "import time\n", - "from multiprocessing import Manager" + "class _SelfCls:\n", + " def __getattr__(self,k): return getattr(_Self(),k)\n", + " def __getitem__(self,i): return self.__getattr__('__getitem__')(i)\n", + "\n", + "Self = _SelfCls()" ] }, { @@ -3975,25 +2501,16 @@ "outputs": [], "source": [ "#export\n", - "def set_num_threads(nt):\n", - " \"Get numpy (and others) to use `nt` threads\"\n", - " try: import mkl; mkl.set_num_threads(nt)\n", - " except: pass\n", - " try: import torch; torch.set_num_threads(nt)\n", - " except: pass\n", - " os.environ['IPC_ENABLE']='1'\n", - " for o in ['OPENBLAS_NUM_THREADS','NUMEXPR_NUM_THREADS','OMP_NUM_THREADS','MKL_NUM_THREADS']:\n", - " os.environ[o] = str(nt)" + "_all_ = ['Self']" ] }, { "cell_type": "markdown", "metadata": {}, "source": [ - "This sets the number of threads consistently for many tools, by:\n", + "This is a concise way to create lambdas that are calling methods on an object (note the capitalization!)\n", "\n", - "1. Set the following environment variables equal to `nt`: `OPENBLAS_NUM_THREADS`,`NUMEXPR_NUM_THREADS`,`OMP_NUM_THREADS`,`MKL_NUM_THREADS`\n", - "2. Sets `nt` threads for numpy and pytorch." + "`Self.sum()`, for instance, is a shortcut for `lambda o: o.sum()`." 
] }, { @@ -4002,41 +2519,39 @@ "metadata": {}, "outputs": [], "source": [ - "#export\n", - "def _call(lock, pause, n, g, item):\n", - " l = False\n", - " if pause:\n", - " try:\n", - " l = lock.acquire(timeout=pause*(n+2))\n", - " time.sleep(pause)\n", - " finally:\n", - " if l: lock.release()\n", - " return g(item)" + "f = Self.sum()\n", + "x = np.array([3.,1])\n", + "test_eq(f(x), 4.)\n", + "\n", + "# This is equivalent to above\n", + "f = lambda o: o.sum()\n", + "x = np.array([3.,1])\n", + "test_eq(f(x), 4.)\n", + "\n", + "f = Self.argmin()\n", + "arr = np.array([1,2,3,4,5])\n", + "test_eq(f(arr), arr.argmin())\n", + "\n", + "f = Self.sum().is_integer()\n", + "x = np.array([3.,1])\n", + "test_eq(f(x), True)\n", + "\n", + "f = Self.sum().real.is_integer()\n", + "x = np.array([3.,1])\n", + "test_eq(f(x), True)\n", + "\n", + "f = Self.imag()\n", + "test_eq(f(3), 0)\n", + "\n", + "f = Self[1]\n", + "test_eq(f(x), 1)" ] }, { - "cell_type": "code", - "execution_count": null, + "cell_type": "markdown", "metadata": {}, - "outputs": [], "source": [ - "#export\n", - "class ProcessPoolExecutor(concurrent.futures.ProcessPoolExecutor):\n", - " \"Same as Python's ProcessPoolExecutor, except can pass `max_workers==0` for serial execution\"\n", - " def __init__(self, max_workers=defaults.cpus, on_exc=print, pause=0, **kwargs):\n", - " if max_workers is None: max_workers=defaults.cpus\n", - " store_attr()\n", - " self.not_parallel = max_workers==0\n", - " if self.not_parallel: max_workers=1\n", - " super().__init__(max_workers, **kwargs)\n", - "\n", - " def map(self, f, items, timeout=None, chunksize=1, *args, **kwargs):\n", - " self.lock = Manager().Lock()\n", - " g = partial(f, *args, **kwargs)\n", - " if self.not_parallel: return map(g, items)\n", - " _g = partial(_call, self.lock, self.pause, self.max_workers, g)\n", - " try: return super().map(_g, items, timeout=timeout, chunksize=chunksize)\n", - " except Exception as e: self.on_exc(e)" + "## Other Helpers" ] }, { @@ 
-4046,22 +2561,9 @@ "outputs": [], "source": [ "#export\n", - "class ThreadPoolExecutor(concurrent.futures.ThreadPoolExecutor):\n", - " \"Same as Python's ThreadPoolExecutor, except can pass `max_workers==0` for serial execution\"\n", - " def __init__(self, max_workers=defaults.cpus, on_exc=print, pause=0, **kwargs):\n", - " if max_workers is None: max_workers=defaults.cpus\n", - " store_attr()\n", - " self.not_parallel = max_workers==0\n", - " if self.not_parallel: max_workers=1\n", - " super().__init__(max_workers, **kwargs)\n", - "\n", - " def map(self, f, items, timeout=None, chunksize=1, *args, **kwargs):\n", - " self.lock = Manager().Lock()\n", - " g = partial(f, *args, **kwargs)\n", - " if self.not_parallel: return map(g, items)\n", - " _g = partial(_call, self.lock, self.pause, self.max_workers, g)\n", - " try: return super().map(_g, items, timeout=timeout, chunksize=chunksize)\n", - " except Exception as e: self.on_exc(e)" + "class PrettyString(str):\n", + " \"Little hack to get strings to show properly in Jupyter.\"\n", + " def __repr__(self): return self" ] }, { @@ -4072,11 +2574,11 @@ { "data": { "text/markdown": [ - "

class ProcessPoolExecutor[source]

\n", + "

class PrettyString[source]

\n", "\n", - "> ProcessPoolExecutor(**`max_workers`**=*`4`*, **`on_exc`**=*`print`*, **`pause`**=*`0`*, **\\*\\*`kwargs`**) :: [`ProcessPoolExecutor`](/utils.html#ProcessPoolExecutor)\n", + "> PrettyString() :: `str`\n", "\n", - "Same as Python's ProcessPoolExecutor, except can pass `max_workers==0` for serial execution" + "Little hack to get strings to show properly in Jupyter." ], "text/plain": [ "" @@ -4087,38 +2589,42 @@ } ], "source": [ - "show_doc(ProcessPoolExecutor, title_level=4)" + "show_doc(PrettyString, title_level=4)" ] }, { - "cell_type": "code", - "execution_count": null, + "cell_type": "markdown", "metadata": {}, - "outputs": [], "source": [ - "#export\n", - "try: from fastprogress import progress_bar\n", - "except: progress_bar = None" + "Allow strings with special characters to render properly in Jupyter. Without calling `print()` strings with special characters are displayed like so:" ] }, { "cell_type": "code", "execution_count": null, "metadata": {}, - "outputs": [], + "outputs": [ + { + "data": { + "text/plain": [ + "'a string\\nwith\\nnew\\nlines and\\ttabs'" + ] + }, + "execution_count": null, + "metadata": {}, + "output_type": "execute_result" + } + ], "source": [ - "#export \n", - "def parallel(f, items, *args, n_workers=defaults.cpus, total=None, progress=None, pause=0,\n", - " threadpool=False, timeout=None, chunksize=1, **kwargs):\n", - " \"Applies `func` in parallel to `items`, using `n_workers`\"\n", - " if progress is None: progress = progress_bar is not None\n", - " pool = ThreadPoolExecutor if threadpool else ProcessPoolExecutor\n", - " with pool(n_workers, pause=pause) as ex:\n", - " r = ex.map(f,items, *args, timeout=timeout, chunksize=chunksize, **kwargs)\n", - " if progress:\n", - " if total is None: total = len(items)\n", - " r = progress_bar(r, total=total, leave=False)\n", - " return L(r)" + "with_special_chars='a string\\nwith\\nnew\\nlines and\\ttabs'\n", + "with_special_chars" + ] + }, + { + "cell_type": "markdown", + 
"metadata": {}, + "source": [ + "We can correct this with `PrettyString`:" ] }, { @@ -4128,53 +2634,46 @@ "outputs": [ { "data": { - "text/html": [], - "text/plain": [ - "" - ] - }, - "metadata": {}, - "output_type": "display_data" - }, - { - "data": { - "text/html": [], - "text/plain": [ - "" - ] - }, - "metadata": {}, - "output_type": "display_data" - }, - { - "data": { - "text/html": [], "text/plain": [ - "" + "a string\n", + "with\n", + "new\n", + "lines and\ttabs" ] }, + "execution_count": null, "metadata": {}, - "output_type": "display_data" + "output_type": "execute_result" } ], "source": [ - "def add_one(x, a=1): \n", - " time.sleep(random.random()/80)\n", - " return x+a\n", - "\n", - "inp,exp = range(50),range(1,51)\n", - "test_eq(parallel(add_one, inp, n_workers=2, progress=False), exp)\n", - "test_eq(parallel(add_one, inp, threadpool=True, n_workers=2, progress=False), exp)\n", - "test_eq(parallel(add_one, inp, n_workers=0), exp)\n", - "test_eq(parallel(add_one, inp, n_workers=1, a=2), range(2,52))\n", - "test_eq(parallel(add_one, inp, n_workers=0, a=2), range(2,52))" + "PrettyString(with_special_chars)" ] }, { - "cell_type": "markdown", + "cell_type": "code", + "execution_count": null, + "metadata": {}, + "outputs": [], + "source": [ + "#export\n", + "def even_mults(start, stop, n):\n", + " \"Build log-stepped array from `start` to `stop` in `n` steps.\"\n", + " if n==1: return stop\n", + " mult = stop/start\n", + " step = mult**(1/(n-1))\n", + " return [start*(step**i) for i in range(n)]" + ] + }, + { + "cell_type": "code", + "execution_count": null, "metadata": {}, + "outputs": [], "source": [ - "Use the `pause` parameter to ensure a pause of `pause` seconds between processes starting. This is in case there are race conditions in starting some process, or to stagger the time each process starts, for example when making many requests to a webserver. Set `threadpool=True` to use `ThreadPoolExecutor` instead of `ProcessPoolExecutor`." 
+ "test_eq(even_mults(2,8,3), [2,4,8])\n", + "test_eq(even_mults(2,32,5), [2,4,8,16,32])\n", + "test_eq(even_mults(2,8,1), 8)" ] }, { @@ -4183,7 +2682,13 @@ "metadata": {}, "outputs": [], "source": [ - "from datetime import datetime" + "#export\n", + "def num_cpus():\n", + " \"Get number of cpus\"\n", + " try: return len(os.sched_getaffinity(0))\n", + " except AttributeError: return os.cpu_count()\n", + "\n", + "defaults.cpus = num_cpus()" ] }, { @@ -4193,39 +2698,30 @@ "outputs": [ { "data": { - "text/html": [], "text/plain": [ - "" + "64" ] }, + "execution_count": null, "metadata": {}, - "output_type": "display_data" - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "1 2020-10-12 21:48:54.012317\n", - "0 2020-10-12 21:48:54.265181\n", - "2 2020-10-12 21:48:54.519284\n", - "3 2020-10-12 21:48:54.773004\n", - "4 2020-10-12 21:48:55.026344\n" - ] + "output_type": "execute_result" } ], "source": [ - "def print_time(i): \n", - " time.sleep(random.random()/1000)\n", - " print(i, datetime.now())\n", - "\n", - "parallel(print_time, range(5), n_workers=2, pause=0.25);" + "num_cpus()" ] }, { - "cell_type": "markdown", + "cell_type": "code", + "execution_count": null, "metadata": {}, + "outputs": [], "source": [ - "Note that `f` should accept a collection of items." 
+ "#export\n", + "def add_props(f, g=None, n=2):\n", + " \"Create properties passing each of `range(n)` to f\"\n", + " if g is None: return (property(partial(f,i)) for i in range(n))\n", + " return (property(partial(f,i), partial(g,i)) for i in range(n))" ] }, { @@ -4234,13 +2730,11 @@ "metadata": {}, "outputs": [], "source": [ - "#export\n", - "def run_procs(f, f_done, args):\n", - " \"Call `f` for each item in `args` in parallel, yielding `f_done`\"\n", - " processes = L(args).map(Process, args=arg0, target=f)\n", - " for o in processes: o.start()\n", - " yield from f_done()\n", - " processes.map(Self.join())" + "class _T(): a,b = add_props(lambda i,x:i*2)\n", + "\n", + "t = _T()\n", + "test_eq(t.a,0)\n", + "test_eq(t.b,2)" ] }, { @@ -4249,11 +2743,18 @@ "metadata": {}, "outputs": [], "source": [ - "#export\n", - "def _f_pg(obj, queue, batch, start_idx):\n", - " for i,b in enumerate(obj(batch)): queue.put((start_idx+i,b))\n", + "class _T(): \n", + " def __init__(self, v): self.v=v\n", + " def _set(i, self, v): self.v[i] = v\n", + " a,b = add_props(lambda i,x: x.v[i], _set)\n", "\n", - "def _done_pg(queue, items): return (queue.get() for _ in items)" + "t = _T([0,2])\n", + "test_eq(t.a,0)\n", + "test_eq(t.b,2)\n", + "t.a = t.a+1\n", + "t.b = 3\n", + "test_eq(t.a,1)\n", + "test_eq(t.b,3)" ] }, { @@ -4262,87 +2763,73 @@ "metadata": {}, "outputs": [], "source": [ - "#export \n", - "def parallel_gen(cls, items, n_workers=defaults.cpus, **kwargs):\n", - " \"Instantiate `cls` in `n_workers` procs & call each on a subset of `items` in parallel.\"\n", - " if n_workers==0:\n", - " yield from enumerate(list(cls(**kwargs)(items)))\n", - " return\n", - " batches = L(chunked(items, n_chunks=n_workers))\n", - " idx = L(itertools.accumulate(0 + batches.map(len)))\n", - " queue = Queue()\n", - " if progress_bar: items = progress_bar(items, leave=False)\n", - " f=partial(_f_pg, cls(**kwargs), queue)\n", - " done=partial(_done_pg, queue, items)\n", - " yield from run_procs(f, done, 
L(batches,idx).zip())" + "#export\n", + "def _typeerr(arg, val, typ): return TypeError(f\"{arg}=={val} not {typ}\")" ] }, { "cell_type": "code", "execution_count": null, "metadata": {}, - "outputs": [ - { - "data": { - "text/html": [], - "text/plain": [ - "" - ] - }, - "metadata": {}, - "output_type": "display_data" - } - ], + "outputs": [], "source": [ - "class _C:\n", - " def __call__(self, o): return ((i+1) for i in o)\n", - "\n", - "items = range(5)\n", + "#export\n", + "def typed(f):\n", + " \"Decorator to check param and return types at runtime\"\n", + " names = f.__code__.co_varnames\n", + " anno = f.__annotations__\n", + " ret = anno.pop('return',None)\n", + " def _f(*args,**kwargs):\n", + " kw = {**kwargs}\n", + " if len(anno) > 0:\n", + " for i,arg in enumerate(args): kw[names[i]] = arg\n", + " for k,v in kw.items():\n", + " if not isinstance(v,anno[k]): raise _typeerr(k, v, anno[k])\n", + " res = f(*args,**kwargs)\n", + " if ret is not None and not isinstance(res,ret): raise _typeerr(\"return\", res, ret)\n", + " return res\n", + " return functools.update_wrapper(_f, f)" + ] + }, + { + "cell_type": "markdown", + "metadata": {}, + "source": [ + "`typed` validates argument types at **runtime**. 
This is in contrast to [MyPy](http://mypy-lang.org/) which only offers static type checking.\n", "\n", - "res = L(parallel_gen(_C, items, n_workers=3))\n", - "idxs,dat1 = zip(*res.sorted(itemgetter(0)))\n", - "test_eq(dat1, range(1,6))\n", + "For example, a `TypeError` will be raised if we try to pass a float (rather than an integer) into the first argument of the function below: " + ] + }, + { + "cell_type": "code", + "execution_count": null, + "metadata": {}, + "outputs": [], + "source": [ + "@typed\n", + "def discount(price:int, pct:float): \n", + " return (1-pct) * price\n", "\n", - "res = L(parallel_gen(_C, items, n_workers=0))\n", - "idxs,dat2 = zip(*res.sorted(itemgetter(0)))\n", - "test_eq(dat2, dat1)" + "with ExceptionExpected(TypeError): discount(100.0, .1)" ] }, { "cell_type": "markdown", "metadata": {}, "source": [ - "`cls` is any class with `__call__`. It will be passed `args` and `kwargs` when initialized. Note that `n_workers` instances of `cls` are created, one in each process. `items` are then split in `n_workers` batches and one is sent to each `cls`. The function then returns a generator of tuples of item indices and results."
+ "We can also optionally allow multiple types by enumerating the types in a tuple as illustrated below:" ] }, { "cell_type": "code", "execution_count": null, "metadata": {}, - "outputs": [ - { - "data": { - "text/html": [], - "text/plain": [ - "" - ] - }, - "metadata": {}, - "output_type": "display_data" - } - ], + "outputs": [], "source": [ - "class TestSleepyBatchFunc:\n", - " \"For testing parallel processes that run at different speeds\"\n", - " def __init__(self): self.a=1\n", - " def __call__(self, batch):\n", - " for k in batch:\n", - " time.sleep(random.random()/4)\n", - " yield k+self.a\n", + "def discount(price:(int,float), pct:float): \n", + " return (1-pct) * price\n", "\n", - "x = np.linspace(0,0.99,20)\n", - "res = L(parallel_gen(TestSleepyBatchFunc, x, n_workers=2))\n", - "test_eq(res.sorted().itemgot(1), x+1)" + "assert 90.0 == discount(100.0, .1)" ] }, { @@ -4351,15 +2838,19 @@ "metadata": {}, "outputs": [], "source": [ - "#export\n", - "def threaded(f):\n", - " \"Run `f` in a thread, and returns the thread\"\n", - " @wraps(f)\n", - " def _f(*args, **kwargs):\n", - " res = Thread(target=f, args=args, kwargs=kwargs)\n", - " res.start()\n", - " return res\n", - " return _f" + "@typed\n", + "def foo(a:int, b:str='a'): return a\n", + "test_eq(foo(1, '2'), 1)\n", + "\n", + "with ExceptionExpected(TypeError): foo(1,2)\n", + "\n", + "@typed\n", + "def foo()->str: return 1\n", + "with ExceptionExpected(TypeError): foo()\n", + "\n", + "@typed\n", + "def foo()->str: return '1'\n", + "assert foo()" ] }, { @@ -4503,7 +2994,7 @@ "cell_type": "markdown", "metadata": {}, "source": [ - "These variables are availabe as booleans in `fastcore.utils` as `IN_IPYTHON`, `IN_JUPYTER`, `IN_COLAB` and `IN_NOTEBOOK`." + "These variables are available as booleans in `fastcore.basics` as `IN_IPYTHON`, `IN_JUPYTER`, `IN_COLAB` and `IN_NOTEBOOK`."
] }, { @@ -4543,9 +3034,10 @@ "output_type": "stream", "text": [ "Converted 00_test.ipynb.\n", - "Converted 01_foundation.ipynb.\n", - "Converted 02_utils.ipynb.\n", + "Converted 01_basics.ipynb.\n", + "Converted 02_foundation.ipynb.\n", "Converted 03_dispatch.ipynb.\n", + "Converted 03_xtras.ipynb.\n", "Converted 04_transform.ipynb.\n", "Converted 05_logargs.ipynb.\n", "Converted 06_meta.ipynb.\n", diff --git a/nbs/01_foundation.ipynb b/nbs/02_foundation.ipynb similarity index 96% rename from nbs/01_foundation.ipynb rename to nbs/02_foundation.ipynb index c0fb8740..0efe0eb2 100644 --- a/nbs/01_foundation.ipynb +++ b/nbs/02_foundation.ipynb @@ -17,6 +17,7 @@ "source": [ "#export\n", "from fastcore.imports import *\n", + "from fastcore.basics import *\n", "from functools import lru_cache\n", "from contextlib import contextmanager\n", "from copy import copy\n", @@ -45,16 +46,6 @@ "> Basic functions used in the fastai library" ] }, - { - "cell_type": "code", - "execution_count": null, - "metadata": {}, - "outputs": [], - "source": [ - "# export\n", - "defaults = SimpleNamespace()" - ] - }, { "cell_type": "markdown", "metadata": {}, @@ -747,23 +738,6 @@ "test_eq(mask2idxs(array([1,2,3])), [1,2,3])" ] }, - { - "cell_type": "code", - "execution_count": null, - "metadata": {}, - "outputs": [], - "source": [ - "#export\n", - "def _is_array(x): return hasattr(x,'__array__') or hasattr(x,'iloc')\n", - "\n", - "def _listify(o):\n", - " if o is None: return []\n", - " if isinstance(o, list): return o\n", - " if isinstance(o, str) or _is_array(o): return [o]\n", - " if is_iter(o): return list(o)\n", - " return [o]" - ] - }, { "cell_type": "code", "execution_count": null, @@ -773,7 +747,7 @@ "#export\n", "def cycle(o):\n", " \"Like `itertools.cycle` except creates list of `None`s if `o` is empty\"\n", - " o = _listify(o)\n", + " o = listify(o)\n", " return itertools.cycle(o) if o is not None and len(o) > 0 else itertools.cycle([None])" ] }, @@ -1476,28 +1450,6 @@ 
"test_eq(range_of(4), [0,1,2,3])" ] }, - { - "cell_type": "code", - "execution_count": null, - "metadata": {}, - "outputs": [], - "source": [ - "#export\n", - "def sorted_ex(iterable, key=None, reverse=False):\n", - " \"Like `sorted`, but if key is str use `attrgetter`; if int use `itemgetter`\"\n", - " if isinstance(key,str): k=lambda o:getattr(o,key,0)\n", - " elif isinstance(key,int): k=itemgetter(key)\n", - " else: k=key\n", - " return sorted(iterable, key=k, reverse=reverse)" - ] - }, - { - "cell_type": "markdown", - "metadata": {}, - "source": [ - "See `L.sorted` for examples." - ] - }, { "cell_type": "code", "execution_count": null, @@ -1578,40 +1530,6 @@ "test_eq(nested_attr(a, 'b.d'), None)" ] }, - { - "cell_type": "code", - "execution_count": null, - "metadata": {}, - "outputs": [], - "source": [ - "#export\n", - "def stop(e=StopIteration):\n", - " \"Raises exception `e` (by default `StopException`)\"\n", - " raise e\n", - "\n", - "def tst():\n", - " try: \n", - " stop() \n", - " except StopIteration: \n", - " return True\n", - " \n", - "def tst2():\n", - " try: \n", - " stop(e=ValueError) \n", - " except ValueError: \n", - " return True" - ] - }, - { - "cell_type": "code", - "execution_count": null, - "metadata": {}, - "outputs": [], - "source": [ - "assert tst()\n", - "assert tst2()" - ] - }, { "cell_type": "code", "execution_count": null, @@ -1686,8 +1604,8 @@ " def __init__(self, items=None, *rest, use_list=False, match=None):\n", " if rest: items = (items,)+rest\n", " if items is None: items = []\n", - " if (use_list is not None) or not _is_array(items):\n", - " items = list(items) if use_list else _listify(items)\n", + " if (use_list is not None) or not is_array(items):\n", + " items = list(items) if use_list else listify(items)\n", " if match is not None:\n", " if is_coll(match): match = len(match)\n", " if len(items)==1: items = items*match\n", @@ -1711,7 +1629,7 @@ " \"Set `idx` (can be list of indices, or mask, or int) items to `o` (which is 
broadcast if not iterable)\"\n", " if isinstance(idx, int): self.items[idx] = o\n", " else:\n", - " idx = idx if isinstance(idx,L) else _listify(idx)\n", + " idx = idx if isinstance(idx,L) else listify(idx)\n", " if not is_iter(o): o = [o]*len(idx)\n", " for i,o_ in zip(idx,o): self.items[i] = o_\n", "\n", @@ -1727,9 +1645,9 @@ " def __invert__(self): return self._new(not i for i in self)\n", " def __repr__(self): return repr(self.items)\n", " def _repr_pretty_(self, p, cycle):\n", - " p.text('...' if cycle else repr(self.items) if _is_array(self.items) else coll_repr(self))\n", + " p.text('...' if cycle else repr(self.items) if is_array(self.items) else coll_repr(self))\n", " def __mul__ (a,b): return a._new(a.items*b)\n", - " def __add__ (a,b): return a._new(a.items+_listify(b))\n", + " def __add__ (a,b): return a._new(a.items+listify(b))\n", " def __radd__(a,b): return a._new(b)+a\n", " def __addi__(a,b):\n", " a.items += list(b)\n", @@ -1831,7 +1749,7 @@ { "data": { "text/plain": [ - "b'\\x80\\x04\\x95\\x01\\x01\\x00\\x00\\x00\\x00\\x00\\x00\\x8c\\x07inspect\\x94\\x8c\\tSignature\\x94\\x93\\x94(h\\x00\\x8c\\tParameter\\x94\\x93\\x94\\x8c\\x05items\\x94h\\x00\\x8c\\x0e_ParameterKind\\x94\\x93\\x94K\\x01\\x85\\x94R\\x94\\x86\\x94R\\x94}\\x94(\\x8c\\x08_default\\x94N\\x8c\\x0b_annotation\\x94h\\x00\\x8c\\x06_empty\\x94\\x93\\x94ubh\\x04\\x8c\\x04rest\\x94h\\x07K\\x02\\x85\\x94R\\x94\\x86\\x94R\\x94}\\x94(h\\rh\\x10h\\x0eh\\x10ubh\\x04\\x8c\\x08use_list\\x94h\\x07K\\x03\\x85\\x94R\\x94\\x86\\x94R\\x94}\\x94(h\\r\\x89h\\x0eh\\x10ubh\\x04\\x8c\\x05match\\x94h\\x19\\x86\\x94R\\x94}\\x94(h\\rNh\\x0eh\\x10ubt\\x94\\x85\\x94R\\x94}\\x94\\x8c\\x12_return_annotation\\x94h\\x10sb.'" + 
"b'\\x80\\x03cinspect\\nSignature\\nq\\x00(cinspect\\nParameter\\nq\\x01X\\x05\\x00\\x00\\x00itemsq\\x02cinspect\\n_ParameterKind\\nq\\x03K\\x01\\x85q\\x04Rq\\x05\\x86q\\x06Rq\\x07}q\\x08(X\\x08\\x00\\x00\\x00_defaultq\\tNX\\x0b\\x00\\x00\\x00_annotationq\\ncinspect\\n_empty\\nq\\x0bubh\\x01X\\x04\\x00\\x00\\x00restq\\x0ch\\x03K\\x02\\x85q\\rRq\\x0e\\x86q\\x0fRq\\x10}q\\x11(h\\th\\x0bh\\nh\\x0bubh\\x01X\\x08\\x00\\x00\\x00use_listq\\x12h\\x03K\\x03\\x85q\\x13Rq\\x14\\x86q\\x15Rq\\x16}q\\x17(h\\t\\x89h\\nh\\x0bubh\\x01X\\x05\\x00\\x00\\x00matchq\\x18h\\x14\\x86q\\x19Rq\\x1a}q\\x1b(h\\tNh\\nh\\x0bubtq\\x1c\\x85q\\x1dRq\\x1e}q\\x1fX\\x12\\x00\\x00\\x00_return_annotationq h\\x0bsb.'" ] }, "execution_count": null, @@ -1978,7 +1896,7 @@ { "data": { "text/plain": [ - "[10, 'j', 4]" + "[2, 'j', 1]" ] }, "execution_count": null, @@ -3176,9 +3094,10 @@ "output_type": "stream", "text": [ "Converted 00_test.ipynb.\n", - "Converted 01_foundation.ipynb.\n", - "Converted 02_utils.ipynb.\n", + "Converted 01_basics.ipynb.\n", + "Converted 02_foundation.ipynb.\n", "Converted 03_dispatch.ipynb.\n", + "Converted 03_xtras.ipynb.\n", "Converted 04_transform.ipynb.\n", "Converted 05_logargs.ipynb.\n", "Converted 06_meta.ipynb.\n", diff --git a/nbs/03_xtras.ipynb b/nbs/03_xtras.ipynb new file mode 100644 index 00000000..1464a487 --- /dev/null +++ b/nbs/03_xtras.ipynb @@ -0,0 +1,1708 @@ +{ + "cells": [ + { + "cell_type": "code", + "execution_count": null, + "metadata": {}, + "outputs": [], + "source": [ + "#default_exp xtras" + ] + }, + { + "cell_type": "code", + "execution_count": null, + "metadata": {}, + "outputs": [], + "source": [ + "#export\n", + "from fastcore.imports import *\n", + "from fastcore.foundation import *\n", + "from fastcore.basics import *\n", + "from functools import wraps\n", + "\n", + "import mimetypes,bz2,pickle,random,json,urllib,subprocess,shlex,bz2,gzip,distutils.util\n", + "from contextlib import contextmanager,ExitStack\n", + "from pdb import set_trace\n", + 
"from urllib.request import Request,urlopen\n", + "from urllib.error import HTTPError\n", + "from urllib.parse import urlencode\n", + "from threading import Thread" + ] + }, + { + "cell_type": "code", + "execution_count": null, + "metadata": {}, + "outputs": [], + "source": [ + "from fastcore.test import *\n", + "from nbdev.showdoc import *\n", + "from fastcore.nb_imports import *" + ] + }, + { + "cell_type": "markdown", + "metadata": {}, + "source": [ + "# Utility functions\n", + "\n", + "> Utility functions used in the fastai library" + ] + }, + { + "cell_type": "markdown", + "metadata": {}, + "source": [ + "## Collections" + ] + }, + { + "cell_type": "code", + "execution_count": null, + "metadata": {}, + "outputs": [], + "source": [ + "#export\n", + "def dict2obj(d):\n", + " \"Convert (possibly nested) dicts (or lists of dicts) to `AttrDict`\"\n", + " if isinstance(d, (L,list)): return L(d).map(dict2obj)\n", + " if not isinstance(d, dict): return d\n", + " return AttrDict(**{k:dict2obj(v) for k,v in d.items()})" + ] + }, + { + "cell_type": "markdown", + "metadata": {}, + "source": [ + "This is a convenience to give you \"dotted\" access to (possibly nested) dictionaries, e.g:" + ] + }, + { + "cell_type": "code", + "execution_count": null, + "metadata": {}, + "outputs": [ + { + "data": { + "text/plain": [ + "{'a': 1, 'b': {'c': 2, 'd': 3}}" + ] + }, + "execution_count": null, + "metadata": {}, + "output_type": "execute_result" + } + ], + "source": [ + "d1 = dict(a=1, b=dict(c=2,d=3))\n", + "d2 = dict2obj(d1)\n", + "test_eq(d2.b.c, 2)\n", + "test_eq(d2.b['c'], 2)\n", + "d2" + ] + }, + { + "cell_type": "markdown", + "metadata": {}, + "source": [ + "It can also be used on lists of dicts." 
+ ] + }, + { + "cell_type": "code", + "execution_count": null, + "metadata": {}, + "outputs": [], + "source": [ + "ds = L(d1, d1)\n", + "test_eq(dict2obj(ds)[0].b.c, 2)" + ] + }, + { + "cell_type": "code", + "execution_count": null, + "metadata": {}, + "outputs": [], + "source": [ + "#export\n", + "def tuplify(o, use_list=False, match=None):\n", + " \"Make `o` a tuple\"\n", + " return tuple(L(o, use_list=use_list, match=match))" + ] + }, + { + "cell_type": "code", + "execution_count": null, + "metadata": {}, + "outputs": [], + "source": [ + "test_eq(tuplify(None),())\n", + "test_eq(tuplify([1,2,3]),(1,2,3))\n", + "test_eq(tuplify(1,match=[1,2,3]),(1,1,1))" + ] + }, + { + "cell_type": "code", + "execution_count": null, + "metadata": {}, + "outputs": [], + "source": [ + "#export\n", + "def uniqueify(x, sort=False, bidir=False, start=None):\n", + " \"Unique elements in `x`, optionally `sort`-ed, optionally return reverse correspondence, optionally prepend with elements.\"\n", + " res = L(x).unique()\n", + " if start is not None: res = start+res\n", + " if sort: res.sort()\n", + " if bidir: return res, res.val2idx()\n", + " return res" + ] + }, + { + "cell_type": "code", + "execution_count": null, + "metadata": {}, + "outputs": [], + "source": [ + "# test\n", + "test_eq(set(uniqueify([1,1,0,5,0,3])),{0,1,3,5})\n", + "test_eq(uniqueify([1,1,0,5,0,3], sort=True),[0,1,3,5])\n", + "test_eq(uniqueify([1,1,0,5,0,3], start=[7,8,6]), [7,8,6,1,0,5,3])\n", + "v,o = uniqueify([1,1,0,5,0,3], bidir=True)\n", + "test_eq(v,[1,0,5,3])\n", + "test_eq(o,{1:0, 0: 1, 5: 2, 3: 3})\n", + "v,o = uniqueify([1,1,0,5,0,3], sort=True, bidir=True)\n", + "test_eq(v,[0,1,3,5])\n", + "test_eq(o,{0:0, 1: 1, 3: 2, 5: 3})" + ] + }, + { + "cell_type": "code", + "execution_count": null, + "metadata": {}, + "outputs": [], + "source": [ + "#export\n", + "def is_listy(x):\n", + " \"`isinstance(x, (tuple,list,L,slice,Generator))`\"\n", + " return isinstance(x, (tuple,list,L,slice,Generator))" + ] + }, + { + 
"cell_type": "code", + "execution_count": null, + "metadata": {}, + "outputs": [], + "source": [ + "assert is_listy((1,))\n", + "assert is_listy([1])\n", + "assert is_listy(L([1]))\n", + "assert is_listy(slice(2))\n", + "assert not is_listy(array([1]))" + ] + }, + { + "cell_type": "code", + "execution_count": null, + "metadata": {}, + "outputs": [], + "source": [ + "#export\n", + "def shufflish(x, pct=0.04):\n", + " \"Randomly relocate items of `x` up to `pct` of `len(x)` from their starting location\"\n", + " n = len(x)\n", + " return L(x[i] for i in sorted(range_of(x), key=lambda o: o+n*(1+random.random()*pct)))" + ] + }, + { + "cell_type": "code", + "execution_count": null, + "metadata": {}, + "outputs": [], + "source": [ + "#export\n", + "def mapped(f, it):\n", + " \"map `f` over `it`, unless it's not listy, in which case return `f(it)`\"\n", + " return L(it).map(f) if is_listy(it) else f(it)" + ] + }, + { + "cell_type": "code", + "execution_count": null, + "metadata": {}, + "outputs": [], + "source": [ + "def _f(x,a=1): return x-a\n", + "\n", + "test_eq(mapped(_f,1),0)\n", + "test_eq(mapped(_f,[1,2]),[0,1])\n", + "test_eq(mapped(_f,(1,)),(0,))" + ] + }, + { + "cell_type": "markdown", + "metadata": {}, + "source": [ + "## Reindexing Collections" + ] + }, + { + "cell_type": "code", + "execution_count": null, + "metadata": {}, + "outputs": [], + "source": [ + "#export\n", + "#hide\n", + "class IterLen:\n", + " \"Base class to add iteration to anything supporting `__len__` and `__getitem__`\"\n", + " def __iter__(self): return (self[i] for i in range_of(self))" + ] + }, + { + "cell_type": "code", + "execution_count": null, + "metadata": {}, + "outputs": [], + "source": [ + "#export\n", + "@docs\n", + "class ReindexCollection(GetAttr, IterLen):\n", + " \"Reindexes collection `coll` with indices `idxs` and optional LRU cache of size `cache`\"\n", + " _default='coll'\n", + " def __init__(self, coll, idxs=None, cache=None, tfm=noop):\n", + " if idxs is None: idxs = 
L.range(coll) \n", + " store_attr()\n", + " if cache is not None: self._get = functools.lru_cache(maxsize=cache)(self._get)\n", + "\n", + " def _get(self, i): return self.tfm(self.coll[i])\n", + " def __getitem__(self, i): return self._get(self.idxs[i])\n", + " def __len__(self): return len(self.coll)\n", + " def reindex(self, idxs): self.idxs = idxs\n", + " def shuffle(self): random.shuffle(self.idxs)\n", + " def cache_clear(self): self._get.cache_clear()\n", + " def __getstate__(self): return {'coll': self.coll, 'idxs': self.idxs, 'cache': self.cache, 'tfm': self.tfm}\n", + " def __setstate__(self, s): self.coll,self.idxs,self.cache,self.tfm = s['coll'],s['idxs'],s['cache'],s['tfm']\n", + "\n", + " _docs = dict(reindex=\"Replace `self.idxs` with idxs\",\n", + " shuffle=\"Randomly shuffle indices\",\n", + " cache_clear=\"Clear LRU cache\")" + ] + }, + { + "cell_type": "code", + "execution_count": null, + "metadata": {}, + "outputs": [ + { + "data": { + "text/markdown": [ + "

class ReindexCollection[source]

\n", + "\n", + "> ReindexCollection(**`coll`**, **`idxs`**=*`None`*, **`cache`**=*`None`*, **`tfm`**=*`noop`*) :: [`GetAttr`](/foundation.html#GetAttr)\n", + "\n", + "Reindexes collection `coll` with indices `idxs` and optional LRU cache of size `cache`" + ], + "text/plain": [ + "" + ] + }, + "metadata": {}, + "output_type": "display_data" + } + ], + "source": [ + "show_doc(ReindexCollection, title_level=4)" + ] + }, + { + "cell_type": "markdown", + "metadata": {}, + "source": [ + "This is useful when constructing batches or organizing data in a particular manner (e.g. for deep learning). This class is primarily used in organizing data for language models in fastai." + ] + }, + { + "cell_type": "markdown", + "metadata": {}, + "source": [ + "You can supply a custom index upon instantiation with the `idxs` argument, or you can call the `reindex` method to supply a new index for your collection.\n", + "\n", + "Here is how you can reindex a list such that the elements are reversed:" + ] + }, + { + "cell_type": "code", + "execution_count": null, + "metadata": {}, + "outputs": [ + { + "data": { + "text/plain": [ + "['e', 'd', 'c', 'b', 'a']" + ] + }, + "execution_count": null, + "metadata": {}, + "output_type": "execute_result" + } + ], + "source": [ + "rc=ReindexCollection(['a', 'b', 'c', 'd', 'e'], idxs=[4,3,2,1,0])\n", + "list(rc)" + ] + }, + { + "cell_type": "markdown", + "metadata": {}, + "source": [ + "Alternatively, you can use the `reindex` method:" + ] + }, + { + "cell_type": "code", + "execution_count": null, + "metadata": {}, + "outputs": [ + { + "data": { + "text/markdown": [ + "
ReindexCollection.reindex[source]
\n", + "\n", + "> ReindexCollection.reindex(**`idxs`**)\n", + "\n", + "Replace `self.idxs` with idxs" + ], + "text/plain": [ + "" + ] + }, + "metadata": {}, + "output_type": "display_data" + } + ], + "source": [ + "show_doc(ReindexCollection.reindex, title_level=6)" + ] + }, + { + "cell_type": "code", + "execution_count": null, + "metadata": {}, + "outputs": [ + { + "data": { + "text/plain": [ + "['e', 'd', 'c', 'b', 'a']" + ] + }, + "execution_count": null, + "metadata": {}, + "output_type": "execute_result" + } + ], + "source": [ + "rc=ReindexCollection(['a', 'b', 'c', 'd', 'e'])\n", + "rc.reindex([4,3,2,1,0])\n", + "list(rc)" + ] + }, + { + "cell_type": "markdown", + "metadata": {}, + "source": [ + "You can optionally specify a LRU cache, which uses [functools.lru_cache](https://docs.python.org/3/library/functools.html#functools.lru_cache) upon instantiation:" + ] + }, + { + "cell_type": "code", + "execution_count": null, + "metadata": {}, + "outputs": [ + { + "data": { + "text/plain": [ + "CacheInfo(hits=1, misses=1, maxsize=2, currsize=1)" + ] + }, + "execution_count": null, + "metadata": {}, + "output_type": "execute_result" + } + ], + "source": [ + "sz = 50\n", + "t = ReindexCollection(L.range(sz), cache=2)\n", + "\n", + "#trigger a cache hit by indexing into the same element multiple times\n", + "t[0], t[0]\n", + "t._get.cache_info()" + ] + }, + { + "cell_type": "markdown", + "metadata": {}, + "source": [ + "You can optionally clear the LRU cache by calling the `cache_clear` method:" + ] + }, + { + "cell_type": "code", + "execution_count": null, + "metadata": {}, + "outputs": [ + { + "data": { + "text/markdown": [ + "
ReindexCollection.cache_clear[source]
\n", + "\n", + "> ReindexCollection.cache_clear()\n", + "\n", + "Clear LRU cache" + ], + "text/plain": [ + "" + ] + }, + "metadata": {}, + "output_type": "display_data" + } + ], + "source": [ + "show_doc(ReindexCollection.cache_clear, title_level=5)" + ] + }, + { + "cell_type": "code", + "execution_count": null, + "metadata": {}, + "outputs": [ + { + "data": { + "text/plain": [ + "CacheInfo(hits=0, misses=0, maxsize=2, currsize=0)" + ] + }, + "execution_count": null, + "metadata": {}, + "output_type": "execute_result" + } + ], + "source": [ + "sz = 50\n", + "t = ReindexCollection(L.range(sz), cache=2)\n", + "\n", + "#trigger a cache hit by indexing into the same element multiple times\n", + "t[0], t[0]\n", + "t.cache_clear()\n", + "t._get.cache_info()" + ] + }, + { + "cell_type": "code", + "execution_count": null, + "metadata": {}, + "outputs": [ + { + "data": { + "text/markdown": [ + "
ReindexCollection.shuffle[source]
\n", + "\n", + "> ReindexCollection.shuffle()\n", + "\n", + "Randomly shuffle indices" + ], + "text/plain": [ + "" + ] + }, + "metadata": {}, + "output_type": "display_data" + } + ], + "source": [ + "show_doc(ReindexCollection.shuffle, title_level=5)" + ] + }, + { + "cell_type": "markdown", + "metadata": {}, + "source": [ + "Note that an ordered index is automatically constructed for the data structure even if one is not supplied." + ] + }, + { + "cell_type": "code", + "execution_count": null, + "metadata": {}, + "outputs": [ + { + "data": { + "text/plain": [ + "['e', 'h', 'a', 'd', 'f', 'g', 'b', 'c']" + ] + }, + "execution_count": null, + "metadata": {}, + "output_type": "execute_result" + } + ], + "source": [ + "rc=ReindexCollection(['a', 'b', 'c', 'd', 'e', 'f', 'g', 'h'])\n", + "rc.shuffle()\n", + "list(rc)" + ] + }, + { + "cell_type": "code", + "execution_count": null, + "metadata": {}, + "outputs": [], + "source": [ + "sz = 50\n", + "t = ReindexCollection(L.range(sz), cache=2)\n", + "test_eq(list(t), range(sz))\n", + "test_eq(t[sz-1], sz-1)\n", + "test_eq(t._get.cache_info().hits, 1)\n", + "t.shuffle()\n", + "test_eq(t._get.cache_info().hits, 1)\n", + "test_ne(list(t), range(sz))\n", + "test_eq(set(t), set(range(sz)))\n", + "t.cache_clear()\n", + "test_eq(t._get.cache_info().hits, 0)\n", + "test_eq(t.count(0), 1)" + ] + }, + { + "cell_type": "code", + "execution_count": null, + "metadata": {}, + "outputs": [], + "source": [ + "#hide\n", + "#Test ReindexCollection pickles\n", + "t1 = pickle.loads(pickle.dumps(t))\n", + "test_eq(list(t), list(t1))" + ] + }, + { + "cell_type": "markdown", + "metadata": {}, + "source": [ + "## Extensions to Pathlib.Path" + ] + }, + { + "cell_type": "markdown", + "metadata": {}, + "source": [ + "An extension of the standard Python library [Pathlib.Path](https://docs.python.org/3/library/pathlib.html#basic-use). These extensions are accomplished by monkey patching additional methods onto `Pathlib.Path`."
+ ] + }, + { + "cell_type": "code", + "execution_count": null, + "metadata": {}, + "outputs": [], + "source": [ + "#export\n", + "@patch\n", + "def readlines(self:Path, hint=-1, encoding='utf8'):\n", + " \"Read the content of `self`\"\n", + " with self.open(encoding=encoding) as f: return f.readlines(hint)" + ] + }, + { + "cell_type": "code", + "execution_count": null, + "metadata": {}, + "outputs": [], + "source": [ + "#export\n", + "@patch\n", + "def mk_write(self:Path, data, encoding=None, errors=None, mode=511):\n", + " \"Make all parent dirs of `self`\"\n", + " self.parent.mkdir(exist_ok=True, parents=True, mode=mode)\n", + " self.write_text(data, encoding=encoding, errors=errors)" + ] + }, + { + "cell_type": "code", + "execution_count": null, + "metadata": {}, + "outputs": [], + "source": [ + "#export\n", + "@patch\n", + "def ls(self:Path, n_max=None, file_type=None, file_exts=None):\n", + " \"Contents of path as a list\"\n", + " extns=L(file_exts)\n", + " if file_type: extns += L(k for k,v in mimetypes.types_map.items() if v.startswith(file_type+'/'))\n", + " has_extns = len(extns)==0\n", + " res = (o for o in self.iterdir() if has_extns or o.suffix in extns)\n", + " if n_max is not None: res = itertools.islice(res, n_max)\n", + " return L(res)" + ] + }, + { + "cell_type": "markdown", + "metadata": {}, + "source": [ + "We add an `ls()` method to `pathlib.Path` which is simply defined as `list(Path.iterdir())`, mainly for convenience in REPL environments such as notebooks." 
+ ] + }, + { + "cell_type": "code", + "execution_count": null, + "metadata": {}, + "outputs": [ + { + "data": { + "text/plain": [ + "Path('.ipynb_checkpoints')" + ] + }, + "execution_count": null, + "metadata": {}, + "output_type": "execute_result" + } + ], + "source": [ + "path = Path()\n", + "t = path.ls()\n", + "assert len(t)>0\n", + "t1 = path.ls(10)\n", + "test_eq(len(t1), 10)\n", + "t2 = path.ls(file_exts='.ipynb')\n", + "assert len(t)>len(t2)\n", + "t[0]" + ] + }, + { + "cell_type": "markdown", + "metadata": {}, + "source": [ + "You can also pass an optional `file_type` MIME prefix and/or a list of file extensions." + ] + }, + { + "cell_type": "code", + "execution_count": null, + "metadata": {}, + "outputs": [ + { + "data": { + "text/plain": [ + "(Path('../fastcore/logargs.py'), Path('04_transform.ipynb'))" + ] + }, + "execution_count": null, + "metadata": {}, + "output_type": "execute_result" + } + ], + "source": [ + "lib_path = (path/'../fastcore')\n", + "txt_files=lib_path.ls(file_type='text')\n", + "assert len(txt_files) > 0 and txt_files[0].suffix=='.py'\n", + "ipy_files=path.ls(file_exts=['.ipynb'])\n", + "assert len(ipy_files) > 0 and ipy_files[0].suffix=='.ipynb'\n", + "txt_files[0],ipy_files[0]" + ] + }, + { + "cell_type": "code", + "execution_count": null, + "metadata": {}, + "outputs": [], + "source": [ + "#hide\n", + "path = Path()\n", + "pkl = pickle.dumps(path)\n", + "p2 = pickle.loads(pkl)\n", + "test_eq(path.ls()[0], p2.ls()[0])" + ] + }, + { + "cell_type": "code", + "execution_count": null, + "metadata": {}, + "outputs": [], + "source": [ + "#export\n", + "def open_file(fn, mode='r'):\n", + " \"Open a file, with optional compression if gz or bz2 suffix\"\n", + " if isinstance(fn, io.IOBase): return fn\n", + " fn = Path(fn)\n", + " if fn.suffix=='.bz2': return bz2.BZ2File(fn, mode)\n", + " elif fn.suffix=='.gz' : return gzip.GzipFile(fn, mode)\n", + " else: return open(fn,mode)" + ] + }, + { + "cell_type": "code", + "execution_count": null, + 
"metadata": {}, + "outputs": [], + "source": [ + "#export\n", + "def save_pickle(fn, o):\n", + " \"Save a pickle file, to a file name or opened file\"\n", + " with open_file(fn, 'wb') as f: pickle.dump(o, f)" + ] + }, + { + "cell_type": "code", + "execution_count": null, + "metadata": {}, + "outputs": [], + "source": [ + "#export\n", + "def load_pickle(fn):\n", + " \"Load a pickle file from a file name or opened file\"\n", + " with open_file(fn, 'rb') as f: return pickle.load(f)" + ] + }, + { + "cell_type": "code", + "execution_count": null, + "metadata": {}, + "outputs": [], + "source": [ + "for suf in '.pkl','.bz2','.gz':\n", + " with tempfile.NamedTemporaryFile(suffix=suf) as f:\n", + " fn = Path(f.name)\n", + " save_pickle(fn, 't')\n", + " t = load_pickle(fn)\n", + " test_eq(t,'t')" + ] + }, + { + "cell_type": "code", + "execution_count": null, + "metadata": {}, + "outputs": [], + "source": [ + "#export\n", + "@patch\n", + "def __repr__(self:Path):\n", + " b = getattr(Path, 'BASE_PATH', None)\n", + " if b:\n", + " try: self = self.relative_to(b)\n", + " except: pass\n", + " return f\"Path({self.as_posix()!r})\"" + ] + }, + { + "cell_type": "markdown", + "metadata": {}, + "source": [ + "fastai also updates the `repr` of `Path` such that, if `Path.BASE_PATH` is defined, all paths are printed relative to that path (as long as they are contained in `Path.BASE_PATH`:" + ] + }, + { + "cell_type": "code", + "execution_count": null, + "metadata": {}, + "outputs": [], + "source": [ + "t = ipy_files[0].absolute()\n", + "try:\n", + " Path.BASE_PATH = t.parent.parent\n", + " test_eq(repr(t), f\"Path('nbs/{t.name}')\")\n", + "finally: Path.BASE_PATH = None" + ] + }, + { + "cell_type": "markdown", + "metadata": {}, + "source": [ + "## File Functions\n", + "\n", + "Utilities (other than extensions to Pathlib.Path) for dealing with IO." 
+ ] + }, + { + "cell_type": "code", + "execution_count": null, + "metadata": {}, + "outputs": [], + "source": [ + "#export\n", + "def bunzip(fn):\n", + " \"bunzip `fn`, raising exception if output already exists\"\n", + " fn = Path(fn)\n", + " assert fn.exists(), f\"{fn} doesn't exist\"\n", + " out_fn = fn.with_suffix('')\n", + " assert not out_fn.exists(), f\"{out_fn} already exists\"\n", + " with bz2.BZ2File(fn, 'rb') as src, out_fn.open('wb') as dst:\n", + " for d in iter(lambda: src.read(1024*1024), b''): dst.write(d)" + ] + }, + { + "cell_type": "code", + "execution_count": null, + "metadata": {}, + "outputs": [], + "source": [ + "f = Path('files/test.txt')\n", + "if f.exists(): f.unlink()\n", + "bunzip('files/test.txt.bz2')\n", + "t = f.open().readlines()\n", + "test_eq(len(t),1)\n", + "test_eq(t[0], 'test\\n')\n", + "f.unlink()" + ] + }, + { + "cell_type": "code", + "execution_count": null, + "metadata": {}, + "outputs": [], + "source": [ + "#export\n", + "def join_path_file(file, path, ext=''):\n", + " \"Return `path/file` if file is a string or a `Path`, file otherwise\"\n", + " if not isinstance(file, (str, Path)): return file\n", + " path.mkdir(parents=True, exist_ok=True)\n", + " return path/f'{file}{ext}'" + ] + }, + { + "cell_type": "code", + "execution_count": null, + "metadata": {}, + "outputs": [], + "source": [ + "path = Path.cwd()/'_tmp'/'tst'\n", + "f = join_path_file('tst.txt', path)\n", + "assert path.exists()\n", + "test_eq(f, path/'tst.txt')\n", + "with open(f, 'w') as f_: assert join_path_file(f_, path) == f_\n", + "shutil.rmtree(Path.cwd()/'_tmp')" + ] + }, + { + "cell_type": "code", + "execution_count": null, + "metadata": {}, + "outputs": [], + "source": [ + "#export\n", + "def urlread(url, data=None, **kwargs):\n", + " \"Retrieve `url`, using `data` dict or `kwargs` to `POST` if present\"\n", + " if kwargs and not data: data=kwargs\n", + " if data is not None:\n", + " if not isinstance(data, (str,bytes)): data = urlencode(data)\n", + " 
if not isinstance(data, bytes): data = data.encode('ascii')\n", + " cls = urllib.request.Request\n", + " if not isinstance(url,cls): url = cls(url)\n", + " url.headers['User-Agent'] = 'Mozilla/5.0'\n", + " with urlopen(url, data=data) as res: return res.read()" + ] + }, + { + "cell_type": "code", + "execution_count": null, + "metadata": {}, + "outputs": [], + "source": [ + "#export\n", + "def urljson(url, data=None):\n", + " \"Retrieve `url` and decode json\"\n", + " return json.loads(urlread(url, data=data))" + ] + }, + { + "cell_type": "code", + "execution_count": null, + "metadata": {}, + "outputs": [], + "source": [ + "#export\n", + "def run(cmd, *rest, ignore_ex=False, as_bytes=False):\n", + " \"Pass `cmd` (splitting with `shlex` if string) to `subprocess.run`; return `stdout`; raise `IOError` if fails\"\n", + " if rest: cmd = (cmd,)+rest\n", + " elif isinstance(cmd,str): cmd = shlex.split(cmd)\n", + " res = subprocess.run(cmd, capture_output=True)\n", + " stdout = res.stdout\n", + " if not as_bytes: stdout = stdout.decode()\n", + " if ignore_ex: return (res.returncode, stdout)\n", + " if res.returncode: raise IOError(\"{} ;; {}\".format(res.stdout, res.stderr))\n", + " return stdout" + ] + }, + { + "cell_type": "markdown", + "metadata": {}, + "source": [ + "You can pass a string (which will be split based on standard shell rules), a list, or pass args directly:" + ] + }, + { + "cell_type": "code", + "execution_count": null, + "metadata": {}, + "outputs": [], + "source": [ + "assert 'ipynb' in run('ls -l')\n", + "assert 'ipynb' in run(['ls', '-l'])\n", + "assert 'ipynb' in run('ls', '-l')" + ] + }, + { + "cell_type": "markdown", + "metadata": {}, + "source": [ + "Some commands fail in non-error situations, like `grep`. 
Use `ignore_ex` in those cases, which will return a tuple of returncode and stdout:" + ] + }, + { + "cell_type": "code", + "execution_count": null, + "metadata": {}, + "outputs": [], + "source": [ + "test_eq(run('grep asdfds 00_test.ipynb', ignore_ex=True)[0], 1)" + ] + }, + { + "cell_type": "markdown", + "metadata": {}, + "source": [ + "`run` automatically decodes returned bytes to a `str`. Use `as_bytes` to skip that:" + ] + }, + { + "cell_type": "code", + "execution_count": null, + "metadata": {}, + "outputs": [], + "source": [ + "test_eq(run('echo hi', as_bytes=True), b'hi\\n')" + ] + }, + { + "cell_type": "code", + "execution_count": null, + "metadata": {}, + "outputs": [], + "source": [ + "#export\n", + "def do_request(url, post=False, headers=None, **data):\n", + " \"Call GET or json-encoded POST on `url`, depending on `post`\"\n", + " if data:\n", + " if post: data = json.dumps(data).encode('ascii')\n", + " else:\n", + " url += \"?\" + urlencode(data)\n", + " data = None\n", + " return urljson(Request(url, headers=headers, data=data or None))" + ] + }, + { + "cell_type": "markdown", + "metadata": {}, + "source": [ + "## Other Helpers" + ] + }, + { + "cell_type": "code", + "execution_count": null, + "metadata": {}, + "outputs": [], + "source": [ + "#export\n", + "def _is_instance(f, gs):\n", + " tst = [g if type(g) in [type, 'function'] else g.__class__ for g in gs]\n", + " for g in tst:\n", + " if isinstance(f, g) or f==g: return True\n", + " return False\n", + "\n", + "def _is_first(f, gs):\n", + " for o in L(getattr(f, 'run_after', None)):\n", + " if _is_instance(o, gs): return False\n", + " for g in gs:\n", + " if _is_instance(f, L(getattr(g, 'run_before', None))): return False\n", + " return True\n", + "\n", + "def sort_by_run(fs):\n", + " end = L(fs).attrgot('toward_end')\n", + " inp,res = L(fs)[~end] + L(fs)[end], L()\n", + " while len(inp):\n", + " for i,o in enumerate(inp):\n", + " if _is_first(o, inp):\n", + " res.append(inp.pop(i))\n", + "
break\n", + " else: raise Exception(\"Impossible to sort\")\n", + " return res" + ] + }, + { + "cell_type": "markdown", + "metadata": {}, + "source": [ + "Transforms and callbacks will have run_after/run_before attributes, this function will sort them to respect those requirements (if it's possible). Also, sometimes we want a transform/callback to be run at the end, but still be able to use run_after/run_before behaviors. For those, the function checks for a toward_end attribute (that needs to be True)." + ] + }, + { + "cell_type": "code", + "execution_count": null, + "metadata": {}, + "outputs": [], + "source": [ + "class Tst(): pass \n", + "class Tst1(): run_before=[Tst]\n", + "class Tst2():\n", + " run_before=Tst\n", + " run_after=Tst1\n", + " \n", + "tsts = [Tst(), Tst1(), Tst2()]\n", + "test_eq(sort_by_run(tsts), [tsts[1], tsts[2], tsts[0]])\n", + "\n", + "Tst2.run_before,Tst2.run_after = Tst1,Tst\n", + "test_fail(lambda: sort_by_run([Tst(), Tst1(), Tst2()]))\n", + "\n", + "def tst1(x): return x\n", + "tst1.run_before = Tst\n", + "test_eq(sort_by_run([tsts[0], tst1]), [tst1, tsts[0]])\n", + " \n", + "class Tst1():\n", + " toward_end=True\n", + "class Tst2():\n", + " toward_end=True\n", + " run_before=Tst1\n", + "tsts = [Tst(), Tst1(), Tst2()]\n", + "test_eq(sort_by_run(tsts), [tsts[0], tsts[2], tsts[1]])" + ] + }, + { + "cell_type": "code", + "execution_count": null, + "metadata": {}, + "outputs": [], + "source": [ + "#export\n", + "def trace(f):\n", + " \"Add `set_trace` to an existing function `f`\"\n", + " if getattr(f, '_traced', False): return f\n", + " def _inner(*args,**kwargs):\n", + " set_trace()\n", + " return f(*args,**kwargs)\n", + " _inner._traced = True\n", + " return _inner" + ] + }, + { + "cell_type": "markdown", + "metadata": {}, + "source": [ + "You can add a breakpoint to an existing function, e.g:\n", + "\n", + "```python\n", + "Path.cwd = trace(Path.cwd)\n", + "Path.cwd()\n", + "```\n", + "\n", + "Now, when the function is called it will
drop you into the debugger. Note, you must issue the `s` command when you begin to step into the function that is being traced." + ] + }, + { + "cell_type": "code", + "execution_count": null, + "metadata": {}, + "outputs": [], + "source": [ + "#export\n", + "def round_multiple(x, mult, round_down=False):\n", + " \"Round `x` to nearest multiple of `mult`\"\n", + " def _f(x_): return (int if round_down else round)(x_/mult)*mult\n", + " res = L(x).map(_f)\n", + " return res if is_listy(x) else res[0]" + ] + }, + { + "cell_type": "code", + "execution_count": null, + "metadata": {}, + "outputs": [], + "source": [ + "test_eq(round_multiple(63,32), 64)\n", + "test_eq(round_multiple(50,32), 64)\n", + "test_eq(round_multiple(40,32), 32)\n", + "test_eq(round_multiple( 0,32), 0)\n", + "test_eq(round_multiple(63,32, round_down=True), 32)\n", + "test_eq(round_multiple((63,40),32), (64,32))" + ] + }, + { + "cell_type": "code", + "execution_count": null, + "metadata": {}, + "outputs": [], + "source": [ + "#export\n", + "@contextmanager\n", + "def modified_env(*delete, **replace):\n", + " \"Context manager temporarily modifying `os.environ` by deleting `delete` and replacing `replace`\"\n", + " prev = dict(os.environ)\n", + " try:\n", + " os.environ.update(replace)\n", + " for k in delete: os.environ.pop(k, None)\n", + " yield\n", + " finally:\n", + " os.environ.clear()\n", + " os.environ.update(prev)" + ] + }, + { + "cell_type": "code", + "execution_count": null, + "metadata": {}, + "outputs": [], + "source": [ + "oldsh = os.environ['SHELL']\n", + "\n", + "with modified_env('PATH', SHELL='a'):\n", + " test_eq(os.environ['SHELL'], 'a')\n", + " assert 'PATH' not in os.environ\n", + "\n", + "assert 'PATH' in os.environ\n", + "test_eq(os.environ['SHELL'], oldsh)" + ] + }, + { + "cell_type": "code", + "execution_count": null, + "metadata": {}, + "outputs": [], + "source": [ + "#export\n", + "class ContextManagers(GetAttr):\n", + " \"Wrapper for `contextlib.ExitStack` which enters a 
collection of context managers\"\n", + " def __init__(self, mgrs): self.default,self.stack = L(mgrs),ExitStack()\n", + " def __enter__(self): self.default.map(self.stack.enter_context)\n", + " def __exit__(self, *args, **kwargs): self.stack.__exit__(*args, **kwargs)" + ] + }, + { + "cell_type": "code", + "execution_count": null, + "metadata": {}, + "outputs": [ + { + "data": { + "text/markdown": [ + "

class ContextManagers[source]

\n", + "\n", + "> ContextManagers(**`mgrs`**) :: [`GetAttr`](/foundation.html#GetAttr)\n", + "\n", + "Wrapper for `contextlib.ExitStack` which enters a collection of context managers" + ], + "text/plain": [ + "" + ] + }, + "metadata": {}, + "output_type": "display_data" + } + ], + "source": [ + "show_doc(ContextManagers, title_level=4)" + ] + }, + { + "cell_type": "code", + "execution_count": null, + "metadata": {}, + "outputs": [], + "source": [ + "#export\n", + "def str2bool(s):\n", + " \"Case-insensitive convert string `s` too a bool (`y`,`yes`,`t`,`true`,`on`,`1`->`True`)\"\n", + " if not isinstance(s,str): return bool(s)\n", + " return bool(distutils.util.strtobool(s)) if s else False" + ] + }, + { + "cell_type": "code", + "execution_count": null, + "metadata": {}, + "outputs": [], + "source": [ + "for o in \"y YES t True on 1\".split(): assert str2bool(o)\n", + "for o in \"n no FALSE off 0\".split(): assert not str2bool(o)\n", + "for o in 0,None,'',False: assert not str2bool(o)\n", + "for o in 1,True: assert str2bool(o)" + ] + }, + { + "cell_type": "markdown", + "metadata": {}, + "source": [ + "## Multiprocessing" + ] + }, + { + "cell_type": "code", + "execution_count": null, + "metadata": {}, + "outputs": [], + "source": [ + "#export\n", + "from multiprocessing import Process, Queue\n", + "import concurrent.futures\n", + "import time\n", + "from multiprocessing import Manager" + ] + }, + { + "cell_type": "code", + "execution_count": null, + "metadata": {}, + "outputs": [], + "source": [ + "#export\n", + "def set_num_threads(nt):\n", + " \"Get numpy (and others) to use `nt` threads\"\n", + " try: import mkl; mkl.set_num_threads(nt)\n", + " except: pass\n", + " try: import torch; torch.set_num_threads(nt)\n", + " except: pass\n", + " os.environ['IPC_ENABLE']='1'\n", + " for o in ['OPENBLAS_NUM_THREADS','NUMEXPR_NUM_THREADS','OMP_NUM_THREADS','MKL_NUM_THREADS']:\n", + " os.environ[o] = str(nt)" + ] + }, + { + "cell_type": "markdown", + "metadata": {}, + 
"source": [ + "This sets the number of threads consistently for many tools, by:\n", + "\n", + "1. Set the following environment variables equal to `nt`: `OPENBLAS_NUM_THREADS`,`NUMEXPR_NUM_THREADS`,`OMP_NUM_THREADS`,`MKL_NUM_THREADS`\n", + "2. Sets `nt` threads for numpy and pytorch." + ] + }, + { + "cell_type": "code", + "execution_count": null, + "metadata": {}, + "outputs": [], + "source": [ + "#export\n", + "def _call(lock, pause, n, g, item):\n", + " l = False\n", + " if pause:\n", + " try:\n", + " l = lock.acquire(timeout=pause*(n+2))\n", + " time.sleep(pause)\n", + " finally:\n", + " if l: lock.release()\n", + " return g(item)" + ] + }, + { + "cell_type": "code", + "execution_count": null, + "metadata": {}, + "outputs": [], + "source": [ + "#export\n", + "class ProcessPoolExecutor(concurrent.futures.ProcessPoolExecutor):\n", + " \"Same as Python's ProcessPoolExecutor, except can pass `max_workers==0` for serial execution\"\n", + " def __init__(self, max_workers=defaults.cpus, on_exc=print, pause=0, **kwargs):\n", + " if max_workers is None: max_workers=defaults.cpus\n", + " store_attr()\n", + " self.not_parallel = max_workers==0\n", + " if self.not_parallel: max_workers=1\n", + " super().__init__(max_workers, **kwargs)\n", + "\n", + " def map(self, f, items, timeout=None, chunksize=1, *args, **kwargs):\n", + " self.lock = Manager().Lock()\n", + " g = partial(f, *args, **kwargs)\n", + " if self.not_parallel: return map(g, items)\n", + " _g = partial(_call, self.lock, self.pause, self.max_workers, g)\n", + " try: return super().map(_g, items, timeout=timeout, chunksize=chunksize)\n", + " except Exception as e: self.on_exc(e)" + ] + }, + { + "cell_type": "code", + "execution_count": null, + "metadata": {}, + "outputs": [], + "source": [ + "#export\n", + "class ThreadPoolExecutor(concurrent.futures.ThreadPoolExecutor):\n", + " \"Same as Python's ThreadPoolExecutor, except can pass `max_workers==0` for serial execution\"\n", + " def __init__(self, 
max_workers=defaults.cpus, on_exc=print, pause=0, **kwargs):\n", + " if max_workers is None: max_workers=defaults.cpus\n", + " store_attr()\n", + " self.not_parallel = max_workers==0\n", + " if self.not_parallel: max_workers=1\n", + " super().__init__(max_workers, **kwargs)\n", + "\n", + " def map(self, f, items, timeout=None, chunksize=1, *args, **kwargs):\n", + " self.lock = Manager().Lock()\n", + " g = partial(f, *args, **kwargs)\n", + " if self.not_parallel: return map(g, items)\n", + " _g = partial(_call, self.lock, self.pause, self.max_workers, g)\n", + " try: return super().map(_g, items, timeout=timeout, chunksize=chunksize)\n", + " except Exception as e: self.on_exc(e)" + ] + }, + { + "cell_type": "code", + "execution_count": null, + "metadata": {}, + "outputs": [ + { + "data": { + "text/markdown": [ + "

class ProcessPoolExecutor[source]

\n", + "\n", + "> ProcessPoolExecutor(**`max_workers`**=*`64`*, **`on_exc`**=*`print`*, **`pause`**=*`0`*, **\\*\\*`kwargs`**) :: [`ProcessPoolExecutor`](/xtras.html#ProcessPoolExecutor)\n", + "\n", + "Same as Python's ProcessPoolExecutor, except can pass `max_workers==0` for serial execution" + ], + "text/plain": [ + "" + ] + }, + "metadata": {}, + "output_type": "display_data" + } + ], + "source": [ + "show_doc(ProcessPoolExecutor, title_level=4)" + ] + }, + { + "cell_type": "code", + "execution_count": null, + "metadata": {}, + "outputs": [], + "source": [ + "#export\n", + "try: from fastprogress import progress_bar\n", + "except: progress_bar = None" + ] + }, + { + "cell_type": "code", + "execution_count": null, + "metadata": {}, + "outputs": [], + "source": [ + "#export \n", + "def parallel(f, items, *args, n_workers=defaults.cpus, total=None, progress=None, pause=0,\n", + " threadpool=False, timeout=None, chunksize=1, **kwargs):\n", + " \"Applies `func` in parallel to `items`, using `n_workers`\"\n", + " if progress is None: progress = progress_bar is not None\n", + " pool = ThreadPoolExecutor if threadpool else ProcessPoolExecutor\n", + " with pool(n_workers, pause=pause) as ex:\n", + " r = ex.map(f,items, *args, timeout=timeout, chunksize=chunksize, **kwargs)\n", + " if progress:\n", + " if total is None: total = len(items)\n", + " r = progress_bar(r, total=total, leave=False)\n", + " return L(r)" + ] + }, + { + "cell_type": "code", + "execution_count": null, + "metadata": {}, + "outputs": [ + { + "data": { + "text/html": [], + "text/plain": [ + "" + ] + }, + "metadata": {}, + "output_type": "display_data" + }, + { + "data": { + "text/html": [], + "text/plain": [ + "" + ] + }, + "metadata": {}, + "output_type": "display_data" + }, + { + "data": { + "text/html": [], + "text/plain": [ + "" + ] + }, + "metadata": {}, + "output_type": "display_data" + } + ], + "source": [ + "def add_one(x, a=1): \n", + " time.sleep(random.random()/80)\n", + " return x+a\n", + 
"\n", + "inp,exp = range(50),range(1,51)\n", + "test_eq(parallel(add_one, inp, n_workers=2, progress=False), exp)\n", + "test_eq(parallel(add_one, inp, threadpool=True, n_workers=2, progress=False), exp)\n", + "test_eq(parallel(add_one, inp, n_workers=0), exp)\n", + "test_eq(parallel(add_one, inp, n_workers=1, a=2), range(2,52))\n", + "test_eq(parallel(add_one, inp, n_workers=0, a=2), range(2,52))" + ] + }, + { + "cell_type": "markdown", + "metadata": {}, + "source": [ + "Use the `pause` parameter to ensure a pause of `pause` seconds between processes starting. This is in case there are race conditions in starting some process, or to stagger the time each process starts, for example when making many requests to a webserver. Set `threadpool=True` to use `ThreadPoolExecutor` instead of `ProcessPoolExecutor`." + ] + }, + { + "cell_type": "code", + "execution_count": null, + "metadata": {}, + "outputs": [], + "source": [ + "from datetime import datetime" + ] + }, + { + "cell_type": "code", + "execution_count": null, + "metadata": {}, + "outputs": [ + { + "data": { + "text/html": [], + "text/plain": [ + "" + ] + }, + "metadata": {}, + "output_type": "display_data" + }, + { + "name": "stdout", + "output_type": "stream", + "text": [ + "0 2020-10-24 14:12:11.014495\n", + "1 2020-10-24 14:12:11.265213\n", + "2 2020-10-24 14:12:11.515864\n", + "3 2020-10-24 14:12:11.767123\n", + "4 2020-10-24 14:12:12.017351\n" + ] + } + ], + "source": [ + "def print_time(i): \n", + " time.sleep(random.random()/1000)\n", + " print(i, datetime.now())\n", + "\n", + "parallel(print_time, range(5), n_workers=2, pause=0.25);" + ] + }, + { + "cell_type": "markdown", + "metadata": {}, + "source": [ + "Note that `f` should accept a collection of items." 
+ ] + }, + { + "cell_type": "code", + "execution_count": null, + "metadata": {}, + "outputs": [], + "source": [ + "#export\n", + "def run_procs(f, f_done, args):\n", + " \"Call `f` for each item in `args` in parallel, yielding `f_done`\"\n", + " processes = L(args).map(Process, args=arg0, target=f)\n", + " for o in processes: o.start()\n", + " yield from f_done()\n", + " processes.map(Self.join())" + ] + }, + { + "cell_type": "code", + "execution_count": null, + "metadata": {}, + "outputs": [], + "source": [ + "#export\n", + "def _f_pg(obj, queue, batch, start_idx):\n", + " for i,b in enumerate(obj(batch)): queue.put((start_idx+i,b))\n", + "\n", + "def _done_pg(queue, items): return (queue.get() for _ in items)" + ] + }, + { + "cell_type": "code", + "execution_count": null, + "metadata": {}, + "outputs": [], + "source": [ + "#export \n", + "def parallel_gen(cls, items, n_workers=defaults.cpus, **kwargs):\n", + " \"Instantiate `cls` in `n_workers` procs & call each on a subset of `items` in parallel.\"\n", + " if n_workers==0:\n", + " yield from enumerate(list(cls(**kwargs)(items)))\n", + " return\n", + " batches = L(chunked(items, n_chunks=n_workers))\n", + " idx = L(itertools.accumulate(0 + batches.map(len)))\n", + " queue = Queue()\n", + " if progress_bar: items = progress_bar(items, leave=False)\n", + " f=partial(_f_pg, cls(**kwargs), queue)\n", + " done=partial(_done_pg, queue, items)\n", + " yield from run_procs(f, done, L(batches,idx).zip())" + ] + }, + { + "cell_type": "code", + "execution_count": null, + "metadata": {}, + "outputs": [ + { + "data": { + "text/html": [], + "text/plain": [ + "" + ] + }, + "metadata": {}, + "output_type": "display_data" + } + ], + "source": [ + "class _C:\n", + " def __call__(self, o): return ((i+1) for i in o)\n", + "\n", + "items = range(5)\n", + "\n", + "res = L(parallel_gen(_C, items, n_workers=3))\n", + "idxs,dat1 = zip(*res.sorted(itemgetter(0)))\n", + "test_eq(dat1, range(1,6))\n", + "\n", + "res = L(parallel_gen(_C, 
items, n_workers=0))\n", + "idxs,dat2 = zip(*res.sorted(itemgetter(0)))\n", + "test_eq(dat2, dat1)" + ] + }, + { + "cell_type": "markdown", + "metadata": {}, + "source": [ + "`cls` is any class with `__call__`. It will be passed `args` and `kwargs` when initialized. Note that `n_workers` instances of `cls` are created, one in each process. `items` are then split in `n_workers` batches and one is sent to each `cls`. The function then returns a generator of tuples of item indices and results." + ] + }, + { + "cell_type": "code", + "execution_count": null, + "metadata": {}, + "outputs": [ + { + "data": { + "text/html": [], + "text/plain": [ + "" + ] + }, + "metadata": {}, + "output_type": "display_data" + } + ], + "source": [ + "class TestSleepyBatchFunc:\n", + " \"For testing parallel processes that run at different speeds\"\n", + " def __init__(self): self.a=1\n", + " def __call__(self, batch):\n", + " for k in batch:\n", + " time.sleep(random.random()/4)\n", + " yield k+self.a\n", + "\n", + "x = np.linspace(0,0.99,20)\n", + "res = L(parallel_gen(TestSleepyBatchFunc, x, n_workers=2))\n", + "test_eq(res.sorted().itemgot(1), x+1)" + ] + }, + { + "cell_type": "code", + "execution_count": null, + "metadata": {}, + "outputs": [], + "source": [ + "#export\n", + "def threaded(f):\n", + " \"Run `f` in a thread, and returns the thread\"\n", + " @wraps(f)\n", + " def _f(*args, **kwargs):\n", + " res = Thread(target=f, args=args, kwargs=kwargs)\n", + " res.start()\n", + " return res\n", + " return _f" + ] + }, + { + "cell_type": "markdown", + "metadata": {}, + "source": [ + "# Export -" + ] + }, + { + "cell_type": "code", + "execution_count": null, + "metadata": {}, + "outputs": [ + { + "name": "stdout", + "output_type": "stream", + "text": [ + "Converted 00_test.ipynb.\n", + "Converted 01_basics.ipynb.\n", + "Converted 02_foundation.ipynb.\n", + "Converted 03_dispatch.ipynb.\n", + "Converted 03_xtras.ipynb.\n", + "Converted 04_transform.ipynb.\n", + "Converted 
05_logargs.ipynb.\n", + "Converted 06_meta.ipynb.\n", + "Converted 07_script.ipynb.\n", + "Converted index.ipynb.\n" + ] + } + ], + "source": [ + "#hide\n", + "from nbdev.export import notebook2script\n", + "notebook2script()" + ] + }, + { + "cell_type": "code", + "execution_count": null, + "metadata": {}, + "outputs": [], + "source": [] + } + ], + "metadata": { + "jupytext": { + "split_at_heading": true + }, + "kernelspec": { + "display_name": "Python 3", + "language": "python", + "name": "python3" + } + }, + "nbformat": 4, + "nbformat_minor": 4 +} diff --git a/nbs/03_dispatch.ipynb b/nbs/04_dispatch.ipynb similarity index 100% rename from nbs/03_dispatch.ipynb rename to nbs/04_dispatch.ipynb diff --git a/nbs/04_transform.ipynb b/nbs/05_transform.ipynb similarity index 100% rename from nbs/04_transform.ipynb rename to nbs/05_transform.ipynb diff --git a/nbs/05_logargs.ipynb b/nbs/06_logargs.ipynb similarity index 100% rename from nbs/05_logargs.ipynb rename to nbs/06_logargs.ipynb diff --git a/nbs/06_meta.ipynb b/nbs/07_meta.ipynb similarity index 100% rename from nbs/06_meta.ipynb rename to nbs/07_meta.ipynb diff --git a/nbs/07_script.ipynb b/nbs/08_script.ipynb similarity index 100% rename from nbs/07_script.ipynb rename to nbs/08_script.ipynb