In [59]:
# https://github.com/laike9m/pdir2/wiki/User-Configuration
!export PDIR2_CONFIG_FILE="~/.pdir2config"
In [1]:
%%file ~/.pdir2config
[global]
category-color = magenta
attribute-color = bright blue
comma-color = bright blue
doc-color = bright black
#uniform-color = bright black
Overwriting /home/enrico/.pdir2config

Object Oriented Programming in Python¶

How to develop libraries and programs with a human-friendly API

code categorization¶

prompt¶

In a prompt one writes commands: they execute and are then forgotten. This is the most common use case for bash, but it can be done in Python as well, using smart shells like IPython, once one is sufficiently well versed in it

scripts¶

A script can be seen as a way of repeating a series of commands. It has a very well defined scope and does not need configuration, option management, and so on. Scripts are mostly run just once to perform a specific job, and that's it


libraries¶

A library is an organized collection of functions, routines and objects designed to be used by someone other than the original writer. This is where good programming practice starts to matter seriously. A library needs an API (Application Programming Interface) that defines what can be done with the library and how.

Library design is one of the main reasons for object oriented programming: it allows designing consistent and well structured interfaces that help users obtain what they want, guiding them down the right path and away from bad practices


programs¶

A program is a higher level interaction: the user does not need to write code, aside from some configuration files at most. It performs a specific goal, and might be run very often or even continuously by the user.

Programs are often classified based on their interface (even if this is often just a different way of interacting with the same underlying commands):

  • GUI - graphical user interface
  • CLI - command line interface
  • TUI - text-based user interface
  • WUI - web-based user interface (not a real term)

There are more exotic ones, such as the Voice User Interface (Siri) or the Tangible User Interface (joysticks and buttons), but they are outside the scope of this discussion.


frameworks¶

A framework is basically a program (or a set of libraries that can be compiled as such) that can be configured by writing code, typically in the form of classes.

Basically, frameworks are the opposite of libraries: your program calls the library, while a framework calls the code you wrote.

A very well known framework in Python is Django, a web framework where the user writes the code for database access and page display, and Django runs by calling that user code.

What is an Object Oriented Programming? and why do we care?¶

In Python, you've already been using objects without knowing what they are.

Literally everything is an object in python.

And I mean LITERALLY

Today we will talk about Object Oriented Programming (OOP), with particular focus on Python's approach to it.

The advantage of OOP is that it allows writing beautiful and robust libraries and programs.

If done well.

It requires a specific way of thinking about your program, and it needs some time to be internalized.

Using OOP¶

OOP is a great programming paradigm to implement libraries that are easy to explore and to program with. This (when done properly) allows writing simpler and better programs.

It allows us to write nice, readable code.

This is true both when creating a new library and when wrapping: taking another library and creating a nice interface to it

What is an object?¶

Starting from a very abstract perspective, an object is a black box with which we can communicate, giving it commands to perform and asking it questions (think of the routines and functions we talked about previously).

How the object works internally should not interest us (in an ideal world): we just care about how to communicate with it.

Take for example Python's list.

We know it stores things inside it, and we can ask it to retrieve them, add and remove them, put them in order and so forth.

How does a list work under the hood? I don't have to care.

We might choose to use a list or an array based on their properties, but I (almost) never need to know how they function in order to use them.

A good object should be self sufficient (have high cohesion) and not depend on specific other objects (have low coupling)

Classes and Interfaces: describing common properties¶

In OOP one of the most common concepts is the idea of a specific object being referred to as an instance of a class, which implements several interfaces.

Rather than trying to describe them in abstract terms, I'll give you an example.

Consider the ideas of:

  • animal (something that needs to be fed and cared for)
  • mechanical object (something non living that can be repaired)
  • vehicle (something that I can use to move around)
  • producer (something that I can use to make things)
              producer          vehicle
animal        cow               horse
mechanical    coffee machine    car
  • Coffee machine is a class that implements two interfaces (mechanical and producer) that describe how you can interact with it
  • My Coffee Machine is an instance of the Coffee machine class

  • the instance is the object with which I interact
  • the class describes the "kind" of object I'm interacting with, telling me how I can interact with it
  • the interfaces are the various ways I can interact with it
  • the interface should not specify how the class works internally, only how I can interact with it!
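As a minimal sketch in Python (the repair and produce method names are hypothetical, just to make the two interfaces concrete):

class CoffeeMachine:
    def repair(self):        # part of the "mechanical" interface
        print("repaired!")

    def produce(self):       # part of the "producer" interface
        print("coffee!")

my_coffee_machine = CoffeeMachine()  # an instance of the class
my_coffee_machine.produce()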

Example of Python Interfaces and Classes¶

              indexable    non-indexable
mutable       list         set
non-mutable   string       int
  • mutability: I can change the values inside the object once it has been created
  • indexable: I can extract items from inside the object with the [ ] syntax
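A quick demonstration of these two properties (just illustrative):

a = [1, 2, 3]
a[0] = 10         # a list is indexable and mutable
s = "abc"
s[0]              # a string is indexable...
# s[0] = "x"      # ...but not mutable: this would raise a TypeError
items = {1, 2, 3}
items.add(4)      # a set is mutable...
# items[0]        # ...but not indexable: this would raise a TypeError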

How to communicate with an object?¶

methods, we communicate with methods.

Methods have the same logic as normal functions, and they can behave like routines (change the state of the object and don't return anything) or like functions (return something without changing the state of the object).

the syntax of method calling is:

<instance>.<method>(<parameters>)

for example, for lists:

a = [1, 2, 3]
a.append(4) # add a new element to the list
a.index(3) # return the index of the element, without changing the object

Internal state¶

As users we are interested in the object only for its behavior, so ideally we only approach it through its methods; but to do something useful, objects need a way to store some internal state.

This internal state is represented by the object's attributes.

Attribute management is one point where Python tends to differ from most other programming languages (that I know of), but we'll talk about that later

Using objects: Polymorphism and Substitution Principle¶

When we pass objects around, what we care about is some idea of how we can interact with them.

the function:

def add(a, b):
    return a+b

assumes that a and b know how to be added together, but makes no assumptions about what they are. It can work with integers, floating point numbers, strings, numpy arrays, etc. As long as they implement the + interface, they are fine to work with.

def head(sequence):
    return sequence[0]

In this case we only care that our object can be indexed with numbers: lists, dictionaries, numpy arrays, strings, they are all fine.

the idea is that when I define a function, I'm defining the interface I expect from my objects.

In some languages I do that explicitly (C++, Java, etc.), in others implicitly (Python, R, etc.), but the idea is the same. Often this is done by fixing the class that the function accepts, but this is generally incorrect: we should be fixing the interface we want our objects to provide.

We should try to be as general as possible in the definition of the interface we require: if we only need to iterate over an object, we should just state that it should be an Iterable, not a list; requiring a list would limit us for no reason.

The substitution principle states that once I've defined the interface, any object that follows that interface should be accepted (the original formulation refers to inheritance, but don't worry about that for now).
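For instance, a minimal sketch of how to state such a requirement with type annotations (the total function here is just an illustration):

from typing import Iterable

def total(values: Iterable[float]) -> float:
    # any iterable is accepted: list, tuple, generator, numpy array...
    result = 0.0
    for value in values:
        result += value
    return result

total([1.0, 2.0])          # a list works
total(x for x in (1, 2))   # so does a generator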

How to use objects to make a library¶

rule number 1:

don't start writing the code to implement the features, write the code you want to be able to write!

  • write what the features should look like in real code
  • write tests that assert that behavior (and initially fail)
  • now you can implement them!

Let's say that we want to implement a class to represent and manage some kind of object.

to do this, the best starting point is to try and write the code that we would like to have with that class, and then proceed to implement it.

This has two advantages:

  • it guides us towards the most important features first
  • it paves the way for testing in a very easy way

When designing classes, think of the unix principles:

  • one class should have one goal (or job), and only one, and should do it well
  • the class should be as small as you can get away with to do the job
  • it should not make assumptions on who (which other object) is going to communicate with it

note¶

previous years' lectures used seaborn's distplot for this demonstration, but that function has been deprecated and is no longer suitable for use; don't use that code if you find it!

example - logging timer¶

For our simulations we might want to have a timer/logger of events, but without the overhead of printing to screen during execution, to avoid slowing down the computation!

>>> timer = Timer()
>>> timer.tick("event")
>>> timer.log()
'event' at time xx:xx
In [54]:
import time

class Timer:
    def __init__(self):
        self._ticks: dict[str, float] = {}
            
    def tick(self, event_name: str):
        self._ticks[event_name] = time.time()
            
    def log(self):
        for name, epoch in self._ticks.items():
            print(repr(name), "happened at", epoch)
                
timer = Timer()
timer.tick("hello, world!")
timer.log()
'hello, world!' happened at 1615649618.2291648

how do we deal with duplicated events?

>>> timer = Timer()
>>> timer.tick("event")
>>> timer.tick("event")
>>> timer.log()
'event' at time xx:xx and time xx:xx
In [55]:
import time
from collections import defaultdict

class Timer:
    def __init__(self):
        self._ticks: dict[str, list[float]] = defaultdict(list)
            
    def tick(self, event_name: str):
        self._ticks[event_name].append(time.time())
            
    def log(self):
        for name, epochs in self._ticks.items():
            joined_str = " and ".join(str(e) for e in epochs)
            print(repr(name), "happened at", joined_str)
            
                
timer = Timer()
timer.tick("hello, world!")
timer.tick("hello, world!")
timer.log()
'hello, world!' happened at 1615649833.8234465 and 1615649833.8235137

We could decide to filter the events we want to see:

>>> timer = Timer()
>>> timer.tick("fun1/event")
>>> timer.tick("fun2/event")
>>> timer.log("fun1/")
'fun1/event' at time xx:xx and time xx:xx
In [59]:
import time
from collections import defaultdict

class Timer:
    def __init__(self):
        self._ticks: dict[str, list[float]] = defaultdict(list)
            
    def tick(self, event_name: str):
        self._ticks[event_name].append(time.time())
            
    def log(self, filter=""):
        for name, epochs in self._ticks.items():
            if filter not in name:
                continue
            joined_str = " and ".join(str(e) for e in epochs)
            print(repr(name), "happened at", joined_str)
            
                
timer = Timer()
timer.tick("fun1/event")
timer.tick("fun2/event")
timer.log()
print("-"*60)
timer.log("fun1/")
'fun1/event' happened at 1615651954.5938675
'fun2/event' happened at 1615651954.5939393
------------------------------------------------------------
'fun1/event' happened at 1615651954.5938675

Scikit-learn (sklearn) use case¶

scikit-learn is the main machine learning library in Python. For our current discussion, we can say that sklearn is based on two pillars:

  • Classifiers, Regressors and Transformers
  • pipelines and unions

Sklearn employs a very simple API for the first group, and leverages the second group to hierarchically create the whole analysis pipeline

This allowed anyone to write classes compatible with all the other sklearn compatible classes, driving an explosion of methods and libraries that all work together nicely.

These good API choices almost singlehandedly brought Python to the attention of the machine learning community

The basic idea of Classifiers, Regressors and Transformers, is that all of them implement a compatible interface:

  • Transformers implement a method fit and a method transform
  • Regressors and Classifiers implement the methods fit and predict

the idea is that with the fit method these objects "learn" from the data; they are then applied to (ideally) new data to predict the expected values or to transform them.

  • fit(X, y) should take:
    • an array-like X (rows for the observations, columns for the features)
    • an array-like y (rows for the observations, potentially multiple column values)
    • returns: the predictor itself
  • predict(X) should take:
    • an array-like X (rows for the observations, columns for the features)
    • returns: an array-like (rows for the observations, potentially multiple column values)
  • transform(X) should take:
    • an array-like X (rows for the observations, columns for the features)
    • returns: an array-like (rows for the observations, potentially multiple column values)

The real magic bits are pipelines and unions.

  • unions take a series of transformers and combine all of their outputs into a single transformed dataset; a union behaves like a transformer itself
  • pipelines take a list of transformers (and optionally a classifier/regressor at the end) and pipe the data from one to the other; a pipeline behaves like a transformer or estimator itself

the fact that both unions and pipelines expose the same interface as the objects they wrap means that they can be used inside other unions and pipelines, creating a full data-flow structure that behaves correctly (for example with respect to data leakage).
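For example, a minimal sketch of such nesting might look like this (the specific transformers are just illustrative):

from sklearn.pipeline import make_pipeline, make_union
from sklearn.preprocessing import StandardScaler, PolynomialFeatures
from sklearn.linear_model import LinearRegression

model = make_pipeline(
    make_union(                       # the union of two transformers...
        StandardScaler(),
        PolynomialFeatures(degree=2),
    ),                                # ...behaves like a single transformer
    LinearRegression(),               # so it can be piped into a regressor
)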

In [15]:
from sklearn.preprocessing import StandardScaler
from sklearn.pipeline import make_pipeline
from sklearn.linear_model import LinearRegression

import numpy as np
import numpy.random as rn
In [42]:
rn.seed(42)               # fix the random seed to have replicability
data = rn.randn(200, 2)   # 200 bidimensional data points
y = (
    + 1.0 * data[:, 0]    # first component, weight 1
    + 0.5 * data[:, 1]    # second component, weight 0.5
    + rn.randn(len(data)) # noise component
)
In [ ]:
# this is the data that we want to do the prediction about
new_data = rn.randn(10, 2)
In [48]:
sc = StandardScaler()
sc.fit(data)  # estimate the parameters for the standardization
print(sc.transform(data)[:5, :]) # apply the standardization to the OLD data
# apply the standardization to the NEW data with the estimates of the old
print(sc.transform(new_data)[:5, :])
[[ 0.51326213 -0.18391283]
 [ 0.67128389  1.542076  ]
 [-0.25172177 -0.28351899]
 [ 1.64629106  0.75705623]
 [-0.4980274   0.5234244 ]]
[[ 0.78568602 -0.99834079]
 [ 0.90356022  1.36816536]
 [ 0.42609546  1.90961842]
 [-0.81654741 -1.33338866]
 [-1.86838793  1.51403957]]
In [44]:
lr = LinearRegression()
lr.fit(data, y)          # fit the regressor on the OLD data
lr.predict(new_data)[:5] # use the learned parameter to predict the NEW ones
Out[44]:
array([ 0.21489663,  1.58054749,  1.37919105, -1.59348275, -1.16617208])
In [45]:
lr.coef_
Out[45]:
array([1.06614468, 0.54683588])
In [46]:
pipe = make_pipeline(
    StandardScaler(),    # scale the data
    LinearRegression(),  # perform the linear regression
)

pipe.fit(data, y)        # fit the linear regressor 
pipe.predict(new_data)   # predict for the new values
Out[46]:
array([ 0.21489663,  1.58054749,  1.37919105, -1.59348275, -1.16617208,
        0.57936311, -0.4048604 ,  2.59029857,  0.42561625,  0.54736359])

Can we make a class that can blend in with the native sklearn ones?

Quite easily! (at least a basic version, we'll see a more advanced one later)

we just need to implement the same interface: fit and predict (for a predictor; transform otherwise)

In [40]:
class AvgPredictor:
    def fit(self, X, y):
        self.avg = np.mean(y)
        return self  # fluent interface (enables chaining), debatable
    
    def predict(self, X):
        return np.ones(len(X))*self.avg
    
pipe = make_pipeline(
    StandardScaler(), 
    AvgPredictor(),
)
pipe.fit(data, y)
pipe.predict(new_data)
Out[40]:
array([-0.05993531, -0.05993531, -0.05993531, -0.05993531, -0.05993531,
       -0.05993531, -0.05993531, -0.05993531, -0.05993531, -0.05993531])

Objects anatomy¶

To fully understand how to implement good quality OOP in python, we have to discuss what an object is and how it works internally.

This is contrary to how we usually approach topics, but the fact is that in Python one does not really need to write objects unless they are trying to write a nice library, and to use them effectively for that, one needs a basic understanding of what is possible with them.

Objects are usually used to represent two things:

Ontologies¶

Where the important information is given by the type of the object (for example, exceptions)

Interfaces¶

the object represents an interface for the user to interact with something; it doesn't really matter what the object is, only how it responds to messages

In Python, the concept of OOP follows some basic principles:

  • Inheritance: Creating a new class from an older one, reusing and extending its methods and attributes
  • Encapsulation: Hiding the internal machinery of a class from other objects: one does not need to know how a class does what it does, but only how to talk with it (its API, the methods that it exposes)
  • Polymorphism: using a common operation in different ways for different data inputs.

OOP in python is quite different from OOP in languages like C++ or Java.

On the surface they look similar, and all the traditional OOP patterns and constructs can be applied in Python.

Once you get confident with the Python approach to OOP, it will become clear that they differ radically in the relationship between classes and instances, and in how that affects the best approach to solving problems.

To make it more explicit:

  • traditional OOP is more concerned about ontologies, with interface management as a side effect.
  • Python's OOP is more concerned with interfaces, with ontologies as a side effect

sidenote: pdir2¶

For this lesson we will use a library called pdir, which replaces the traditional dir function with one that allows more control over what gets shown.

This will allow us to explore in more detail what is going on under the hood of an object. This library is not necessary in any way to develop objects, we'll just use it to explore them.

conda install pdir2 or pip install -U pdir2

In [92]:
import pdir as dir

sidenote: docstring¶

For space constraints, I will skip writing docstrings for the classes, methods and functions that we will discuss in this lesson.

This is of course completely against good practices, but it was necessary to keep the discussion short.

Always write docstrings in real code!

Creating a new class¶

When we want to do object oriented programming, we usually start by creating a new class.

This is done using the class reserved keyword, in a similar fashion to how we can define a function using def.

class MyClassName:
    <classbody>

Once we have our class, we can instantiate this class in a specific object.

In their simplest interpretation, classes represent the platonic idea of how an object should behave, while instances are the actual objects that we can interact with.

For example, a class could be the concept of Dog, describing how a dog would move, bark and so on.

Then we can instantiate this class in a specific dog, for example spotty, by calling the name of the class as if it was a function.

spotty = Dog()

the minimal class is one that does nothing and has nothing to show for it

In [335]:
class Empty:
    """this class does not do anything.
    
    it's just a stub for explanations, and this is its docstring"""
In [336]:
some_object = Empty()

Once we instantiate, we can determine that this object belongs to that class

In [337]:
type(some_object)
Out[337]:
__main__.Empty
In [338]:
isinstance(some_object, Empty)
Out[338]:
True
In [339]:
help(some_object)
Help on Empty in module __main__ object:

class Empty(builtins.object)
 |  this class does not do anything.
 |  
 |  it's just a stub for explainations, and this is its docstring
 |  
 |  Data descriptors defined here:
 |  
 |  __dict__
 |      dictionary for instance variables (if defined)
 |  
 |  __weakref__
 |      list of weak references to the object (if defined)

object attributes¶

That was a quite boring class and object, but it's our starting point.

Once we have an instance of a class, we can store and retrieve attributes on that object.

These represent the data stored inside the object. Having them inside the object allows us to keep them all together and give them some form of identity.

by default, an object does not have any attributes

In [97]:
dir(some_object).public
Out[97]:

or better, there are already a lot, but they are the underlying machinery that makes classes work, and we will see what (some) of these mean

In [98]:
dir(some_object)
Out[98]:
special attribute:
    __class__, __dict__, __doc__, __module__, __weakref__
abstract class:
    __subclasshook__
object customization:
    __format__, __hash__, __init__, __new__, __repr__, __sizeof__, __str__
rich comparison:
    __eq__, __ge__, __gt__, __le__, __lt__, __ne__
attribute access:
    __delattr__, __dir__, __getattribute__, __setattr__
class customization:
    __init_subclass__
pickle:
    __reduce__, __reduce_ex__

setting and retrieving attributes¶

In [132]:
class Empty:
    pass

namespace_0 = Empty()
namespace_1 = Empty()
In [133]:
namespace_0.a = 2
namespace_0.a
Out[133]:
2
In [134]:
namespace_1.a
---------------------------------------------------------------------------
AttributeError                            Traceback (most recent call last)
<ipython-input-134-e8dada81b736> in <module>
----> 1 namespace_1.a

AttributeError: 'Empty' object has no attribute 'a'
In [135]:
dir(namespace_0).public.properties
Out[135]:
property:
    a

the public attributes are stored internally in a dictionary, which we can poke and probe.

it is literally a normal dictionary

In [136]:
namespace_0.__dict__
Out[136]:
{'a': 2}
In [137]:
namespace_1.__dict__
Out[137]:
{}

hasattr, getattr, setattr, delattr¶

attribute management is normally done using the form object.attribute, but it can also be done programmatically using 4 different functions. They all treat the attribute name as a string

  • getattr: retrieve the chosen attribute (given as a string)
  • setattr: set the given attribute
  • delattr: delete an attribute
  • hasattr: check if the object has the given attribute (employs getattr under the hood)
In [138]:
hasattr(namespace_0, 'a')
Out[138]:
True
In [139]:
hasattr(namespace_1, 'a')
Out[139]:
False
In [140]:
setattr(namespace_1, 'a', 4)
getattr(namespace_1, 'a')
Out[140]:
4

getattr also supports a default parameter, which is returned if the object does not have the given attribute (instead of raising an AttributeError)

In [141]:
getattr(namespace_1, 'b', 'default_value')
Out[141]:
'default_value'

the __class__ attribute¶

one of the special attributes of an instance is the __class__ attribute: this stores a reference to the class that the instance belongs to

In [144]:
namespace_0.__class__
Out[144]:
__main__.Empty

class attributes and MRO¶

At this point the class has been pretty much useless: all the work has been done by the instances.

The advantage of a class is the ability to store attributes shared across all instances.

This ensures that all the instances have access to the same information, and this is basically what establishes their behavior

In [145]:
class Something:
    b = 3

namespace_0 = Something()
namespace_1 = Something()

if we check the object __dict__, it is empty, but we can access the attribute anyway!

In [146]:
namespace_0.__dict__
Out[146]:
{}
In [147]:
namespace_0.b
Out[147]:
3

How does the attribute b get shown to the instance?

This is done using the so-called Method Resolution Order (MRO).

When we ask an instance for an attribute, the following happens:

  1. if the instance has the attribute, it returns it
  2. if it does not, it asks its class whether it has it
  3. if the class has it (or can obtain it), that is what gets returned
  4. if the class does not have it, it tries dynamic generation (we'll see that later)
  5. if that fails, it raises AttributeError
In [151]:
Something.mro()
Out[151]:
[__main__.Something, object]

This means that we can set an attribute on an instance, and this will shadow the same attribute derived from the class.

We will see this behavior again when we will discuss class inheritance.

In [154]:
dir(Something).public
Out[154]:
property:
    b
In [110]:
namespace_0.b = 5
namespace_0.b
Out[110]:
5
In [111]:
namespace_1.b
Out[111]:
3
In [112]:
del namespace_0.b
namespace_0.b
Out[112]:
3

A useful piece of information that you can store in your class is its version.

A canonical way to represent changes in your code is to use semantic versioning.

One can use the same process to check for the class version of an item. For libraries that create and destroy objects inside a single process it might not be relevant, but if you want to store objects long term, keeping track of the version of the class might be useful!

the common approach is to use a __version__ attribute on the class, filled with a (major, minor, patch) tuple, where all of those numbers are stored as integers

class MyClass:
    __version__ = (0, 1, 0)
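A minimal sketch of how such a check might look when loading a long-term stored object (using the MyClass above; loaded_object is a hypothetical stand-in for e.g. an unpickled instance):

loaded_object = MyClass()   # stand-in for an object loaded from storage
stored_version = getattr(loaded_object, "__version__", (0, 0, 0))
if stored_version[0] != MyClass.__version__[0]:
    raise RuntimeError("stored object has an incompatible major version")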

methods¶

Methods are functions that are defined inside the class body.

They are (almost) the same as any other attribute.

the common trait of all methods is that the first argument, usually called self, refers to the instance calling the method, allowing access to its attributes from inside the function.

In [180]:
class Something:
    a = 2
    def multiply(self, b=2):
        return self.a*b
In [181]:
namespace_0 = Something()

namespace_0.multiply
Out[181]:
<bound method Something.multiply of <__main__.Something object at 0x7fbf46e70ba8>>

note that I don't need to specify the instance as the parameter self.

This is because there is a bit of magic when methods are accessed as attributes: they get bound to the instance.

This means that we do not need to specify the instance, but it will get automatically provided to the function

In [182]:
namespace_0.multiply(b=2)
Out[182]:
4

If we want, we can access the unbound method directly on the class: in this case we have to explicitly provide the instance to which the function is supposed to apply.

In [183]:
Something.multiply(namespace_0, b=3)
Out[183]:
6

Note: we are not limited to applying this function to instances of the same class; any instance that behaves similarly will do

In [184]:
class Empty:
    a = 3

weird = Empty()

Something.multiply(weird, b=3)
Out[184]:
9

Note that, due to the substitution principle, calling obj.method(*args) and Class.method(obj, *args) is not the same!

In a function that takes a certain class, we might receive a subclass that implements a variant of that method, and if we use Class.method(obj) we are forcing it to use the parent class' version.

if we want to retain the "functional" look while making sure we call the right method, we can use methodcaller from the operator module

In [14]:
from operator import methodcaller
In [24]:
obj_set = set([1, 2])
updater = methodcaller("update", [3])
updater(obj_set)
print(obj_set)
{1, 2, 3}
In [27]:
obj_dict = dict(a=1, b=2)
updater = methodcaller("update", [('c', 3)])
updater(obj_dict)
print(obj_dict)
{'a': 1, 'b': 2, 'c': 3}

If you don't like the two steps of creating it and executing it, you can define an apply function:

In [30]:
# wrapping
def apply(fname, obj, *args, **kwargs):
    return methodcaller(fname, *args, **kwargs)(obj)

obj_dict = dict(a=1, b=2)
apply("update", obj_dict, [('c', 3)])
print(obj_dict)
{'a': 1, 'b': 2, 'c': 3}

An even more advanced option is the following... yes, it looks weird, but by the end of the day you will be able to understand what is going on, don't worry!

In [32]:
from functools import partial
class DeferredMethodExecution:
    def __getattr__(self, fname):
        return partial(apply, fname)
do = DeferredMethodExecution()

# actual use
obj_dict = dict(a=1, b=2)
do.update(obj_dict, [('c', 3)])
print(obj_dict)
{'a': 1, 'b': 2, 'c': 3}

Monkey patching¶

Functions can be added as methods to a class at any moment.

This is often referred to as monkey patching, and it is a powerful yet dangerous technique.

One can do it in their own script (maybe to allow a library to act on a class it was not designed for), and that is perfectly ok as long as you know what you're doing.

There are libraries that work by patching other libraries to extend their capabilities: several do this on pandas objects, extending them with new functionality.

Doing that in libraries that will be used by other libraries is not a good practice, as it can lead to behavior that third-party users cannot anticipate.

In [185]:
def triple_function(self):
    return self.a*3

Something.triple = triple_function

namespace_0 = Something()
namespace_0.triple()
Out[185]:
6

One could technically patch a single instance with a method, but it's not usually a useful practice.

to do this we need to explicitly bind the method to the instance

In [186]:
from types import MethodType

def external_function(self):
    return self.a*2

namespace = Something()
namespace.func = MethodType(external_function, namespace)
namespace.func()
Out[186]:
4

init method¶

The next step that we might take is to allow the class to "personalize" the instantiation process.

this is done using the magic method __init__.

__init__ gets automatically called after the instance is created, and is typically used to assign values to some instance attributes, based on the arguments given at creation time.

aside from this automatic call, it is a completely normal method.

In [190]:
class Something:
    def __init__(self, a):
        self.a = a

namespace = Something(a=3)
namespace.a
Out[190]:
3

In recent versions of Python (3.7 natively, 3.6 with a backport), there is a simplified way to define instantiation methods, using the dataclass decorator.

It takes variable annotations and automatically generates the corresponding __init__ method, dramatically reducing boilerplate code

this is a simplified version of a more general library, called attrs.

In [191]:
from dataclasses import dataclass

@dataclass
class InventoryItem:
    name: str
    unit_price: float
    quantity_on_hand: int = 0

    def total_cost(self) -> float:
        return self.unit_price * self.quantity_on_hand

item = InventoryItem('hammers', 10.0, 12)
print(item.total_cost())
120.0

That code will generate the following constructor under the hood:

def __init__(self, name: str, unit_price: float, quantity_on_hand: int=0):
    self.name = name
    self.unit_price = unit_price
    self.quantity_on_hand = quantity_on_hand

we would have repeated each variable name 3 times without dataclasses!

that's a good reduction in boilerplate!
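The dataclass decorator also generates a __repr__ and an __eq__ method for free; a small illustration:

from dataclasses import dataclass

@dataclass
class Point:
    x: float
    y: float

p = Point(1.0, 2.0)
print(p)                     # Point(x=1.0, y=2.0), the generated __repr__
print(p == Point(1.0, 2.0))  # True, the generated __eq__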

magic methods¶

python relies heavily on magic methods, methods that get called when we try to perform some operation on an object. All these functions are characterized by the presence of dunder (double underscore) names: __magic_func__

the __init__ method is one of these magic methods.

Any kind of mathematical operator is linked to a special method, and so are several special functions such as len

these methods are the python equivalent of operator overloading and are what allows more advanced forms of polymorphism.

for example, the addition operator + is linked to the magic method __add__, so if we want our class to be able to perform additions, it needs to implement it.

my_object + something

becomes:

my_object.__add__(something)
In [192]:
@dataclass
class Something:
    a: int
        
    def __add__(self, other):
        return self.__class__(self.a+other)

namespace_0 = Something(a=3)
print(namespace_0.a)

namespace_1 = namespace_0 + 2
print(namespace_1.a)
3
5

Note that if we write the sum in the other order, and the other object does not know how to handle it, it will crash with a TypeError

In [193]:
namespace_2 = 2 + namespace_0
---------------------------------------------------------------------------
TypeError                                 Traceback (most recent call last)
<ipython-input-193-6ca245b48fe2> in <module>
----> 1 namespace_2 = 2 + namespace_0

TypeError: unsupported operand type(s) for +: 'int' and 'Something'

The solution is to add a second magic method, __radd__, that is called if the first term does not know how to handle the given class.

to signal that it does not know how to handle the sum, the first operand should return NotImplemented (a singleton) instead of an actual result

if the adding operation is symmetrical for the object (it doesn't have to be!) one can avoid reimplementing the __radd__ by simply saying:

__radd__ = __add__
In [239]:
@dataclass
class Something:
    a: int
        
    def __add__(self, other):
        if not isinstance(other, int):
            return NotImplemented
        return self.__class__(self.a+other)
    
    __radd__ = __add__

namespace_0 = Something(a=3)
namespace_2 = 2 + namespace_0
namespace_2.a
Out[239]:
5
In [240]:
namespace_2 + "a"
---------------------------------------------------------------------------
TypeError                                 Traceback (most recent call last)
<ipython-input-240-52e8ac33a07f> in <module>
----> 1 namespace_2 + "a"

TypeError: unsupported operand type(s) for +: 'Something' and 'str'

The dot operator¶

when we try to obtain something out of an object we (almost) always use the dot operator: <object>.<attribute>

this is a request to the object to try and give us the object with the name we asked for.

There is no actual need for that attribute to exist beforehand: it could even be generated on the fly.

Even when we try to obtain a method, we are asking for a function, and then we call it.

This is what makes it possible to create very clever APIs with Python, but it is also part of why it's so slow.

When we execute code such as:

a = [1, 2]
a.append(3)

python has to do the following:

  • ask a if it does have the append attribute (no)
  • ask the class of a (the list class) if it does have it
    • if it doesn't, ask the same to the superclasses

once the attribute has been obtained, we try to call the function. Calling a function is exactly the same as calling its __call__ method, so we have to start all over: does append have a __call__ method?
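A small illustration of this equivalence:

def greet():
    print("hello")

# the two calls below are exactly equivalent
greet()
greet.__call__()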

This is true for all operators as well, for example addition (+ operator).

when we run code such as:

a = np.array([1, 2])
b = 1 + a

python has to go and:

  • ask the object 1 if it does have a __add__ method (and its class and so on, you know the drill)
  • it does have it, but when it tries to apply it to an array it returns NotImplemented
  • python then goes to the object a and asks whether it has __radd__ (the right side add), and its class and so on
  • now the array knows how to perform the sum, so it executes it and returns a result

I can leverage this property using descriptors, or the syntactic sugar of the @property decorator.

A descriptor hides the following operations behind a normal attribute access:

  • how to obtain the attribute
  • how to set the attribute
  • how to delete the attribute
In [205]:
class Something:
    @property
    def myattr(self):
        return 1

namespace = Something()
namespace.myattr
Out[205]:
1

The basic definition of a property does not include information on how to set the attribute, so if one tries to modify it, it crashes

In [206]:
namespace.myattr = 2
---------------------------------------------------------------------------
AttributeError                            Traceback (most recent call last)
<ipython-input-206-41b7a728e224> in <module>
----> 1 namespace.myattr = 2

AttributeError: can't set attribute

To allow this behavior I have to explicitly define the setter function, using the decorator @<propertyname>.setter on a function with the same name as the initial property

this also allows us to check and modify the attribute on the fly when it is set

In [210]:
class Something:
    @property
    def name(self):
        return self._name
    
    @name.setter
    def name(self, value):
        self._name = value.title()
        

namespace = Something()
namespace.name = "eNRICO"
namespace.name
Out[210]:
'Enrico'
In [211]:
dir(namespace).own.public
Out[211]:
descriptor:
    name: @property with getter, setter

note - privates attributes part 1 of 3¶

In python there is no such thing as a private attribute. The sentence that is commonly used in the community is:

we're all consenting adults

But, on the other hand, for some attributes it is common to ask the user not to modify them directly (like the _name attribute in the previous code).

By convention, attributes and methods starting with a single underscore are ones that the users of the class should not use. They are not guaranteed to be a stable interface, and one risks breaking things by using them.

if you expose an attribute, expect the users to change it, plan accordingly!

note - privates attributes part 2 of 3¶

One way of creating a more explicit private attribute (not really private, but more explicitly saying "don't use me") is to use getattr and setattr with strings that are invalid identifiers and thus cannot be reached with the dot operator.

This is a bit exotic and I don't suggest using it, but if you're curious there is some indication of how to do it in the notebook that underpins these slides
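For the curious, a minimal sketch of the idea (the attribute name is just an example):

class Empty:
    pass

obj = Empty()
# the name contains spaces, so it is not a valid identifier
setattr(obj, "do not touch me", 42)
getattr(obj, "do not touch me")   # 42, but unreachable with the dot operator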

note - privates attributes part 3 of 3¶

A common mistake is to think that attributes with the name starting with double underscore (but not ending in them) are a way to make attributes private.

names that look like __my_attribute, to be clear.

That is a completely different feature, called name mangling, and is used to solve some nasty inheritance problems, not as private attributes.

One might actually make a mess in the inheritance chain by using them without understanding them, so refrain unless you know what you're doing!
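A quick illustration of what name mangling actually does (the class and attribute names are just examples):

class A:
    def __init__(self):
        self.__secret = 1   # the name gets mangled to _A__secret

a = A()
print(a.__dict__)           # {'_A__secret': 1}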

Properties can also be used to control the behavior of the attribute, such as the types and values it can accept

In [212]:
class Something:
    @property
    def name(self):
        if not hasattr(self, "_name"):
            raise ValueError("the `name` attribute has not been set")
        return self._name
    
    @name.setter
    def name(self, value):
        if not isinstance(value, str):
            s = ("name need to be a string, "
                 "a value of <{}> was provided")
            raise TypeError(s.format(repr(value)))
        self._name = value.title()
In [213]:
namespace = Something()
namespace.name
---------------------------------------------------------------------------
ValueError                                Traceback (most recent call last)
<ipython-input-213-36921b093d67> in <module>
      1 namespace = Something()
----> 2 namespace.name

<ipython-input-212-e3b8550f5f83> in name(self)
      3     def name(self):
      4         if not hasattr(self, "_name"):
----> 5             raise ValueError("the `name` attribute has not been set")
      6         return self._name
      7 

ValueError: the `name` attribute has not been set
In [215]:
namespace.name = [1, 2]
---------------------------------------------------------------------------
TypeError                                 Traceback (most recent call last)
<ipython-input-215-2fb97a563220> in <module>
----> 1 namespace.name = [1, 2]

<ipython-input-212-e3b8550f5f83> in name(self, value)
      9     def name(self, value):
     10         if not isinstance(value, str):
---> 11             raise TypeError("name need to be a string, a value of <{}> was provided".format(repr(value)))
     12         self._name = value.title()
     13 

TypeError: name need to be a string, a value of <[1, 2]> was provided
In [214]:
namespace.name = "eNRICO"
namespace.name
Out[214]:
'Enrico'

What happens when the dot operator fails to find the requested attribute in the instance and in the class?

it falls back to a magic method, of course: __getattr__.

If that is not defined, it gives up and fails, but if we implement it we can dynamically return attributes we never defined in the class or the instance!

In [204]:
class Something:
    def __getattr__(self, name):
        return "{} has been requested".format(repr(name))

namespace = Something()
namespace.b
Out[204]:
"'b' has been requested"

Inheritance¶

inheritance is a way of constructing classes on the basis of other classes.

This can be used for several goals of object oriented programming:

  • defining an ontology (type A is also type B)
  • interface extension
  • interface validation

the need for the last one has been reduced from Python 3.4+, with the introduction of the abstract base classes' subclass hook.

The syntax to inherit from other classes is the following:

class ClassName(SuperClass_0, SuperClass_1):
    <class_body>

Ontology definition - Exceptions¶

This is very common in exception management: when one is writing their own library, it is sometimes more convenient to define specialized exceptions that can be caught in a more focused way. These can be (and usually should be) specialized versions of the most common ones, such as ValueError, TypeError, IndexError, etc.

This allows the user to distinguish between exceptions that are expected (the ones raised by the library) and the ones that are not (other exceptions that might be caused by some other code).

It might also be a way to limit the things a user has to worry about in error management, by catching and reraising possible exceptions as different ones.

In [377]:
class ZeroError(ValueError): pass
class NegativeError(ValueError): pass

def myfunction(a):
    if a<0:
        raise NegativeError("the value should not be negative")
    if a==0:
        raise ZeroError("the value should not be zero")
        
    return a*2

If I use a ValueError I can catch both kinds of errors:

In [378]:
try:
    myfunction(0)
except ValueError:
    pass

try:
    myfunction(-1)
except ValueError:
    pass

And I can selectively catch only the kind of error I'm interested in

In [379]:
try:
    myfunction(0)
except ZeroError:
    pass
In [380]:
try:
    myfunction(-1)
except ZeroError:
    pass
---------------------------------------------------------------------------
NegativeError                             Traceback (most recent call last)
<ipython-input-380-07678d184437> in <module>
      1 try:
----> 2     myfunction(-1)
      3 except ZeroError:
      4     pass

<ipython-input-377-674f95bb9925> in myfunction(a)
      4 def myfunction(a):
      5     if a<0:
----> 6         raise NegativeError("the value should not be negative")
      7     if a==0:
      8         raise ZeroError("the value should not be zero")

NegativeError: the value should not be negative

the use of multiple inheritance in the ontology¶

A similar approach is to employ multiple inheritance to represent an error that can fit in various categories.

If you have a dynamical dictionary that generates results on the fly, one error might be at the same time an IndexError (because it is a nonsensical index) and a ValueError (because, if you look at the dictionary as a function, the user just passed a wrong value).

It makes sense for the user to be able to catch them in both ways, so one can use the principle of least surprise and raise an exception that can be caught both ways.

From a formal point of view this is not an ontology anymore, but practicality beats purity

In [399]:
class ValueOrIndexError(ValueError, IndexError): pass
import string

class MyDict(dict):
    def __getitem__(self, char):
        if char not in string.ascii_letters:
            raise ValueOrIndexError(f"'{char}' is not a valid character!")
        else:
            return ord(char)
In [400]:
temp = MyDict()
temp['a']
Out[400]:
97
In [407]:
temp['2']
---------------------------------------------------------------------------
ValueOrIndexError                         Traceback (most recent call last)
<ipython-input-407-c40d2261fa0f> in <module>
----> 1 temp['2']

<ipython-input-399-1cfb1db28486> in __getitem__(self, char)
      5     def __getitem__(self, char):
      6         if char not in string.ascii_letters:
----> 7             raise ValueOrIndexError(f"'{char}' is not a valid character!")
      8         else:
      9             return ord(char)

ValueOrIndexError: '2' is not a valid character!
In [406]:
try:
    temp['2']
except ValueError:
    pass
In [405]:
try:
    temp['2']
except IndexError:
    pass

Traditional inheritance - methods¶

Traditional inheritance is mostly about code reuse: we have a base class that performs some basic functionality, and we don't want to rewrite all that code!

a child class can:

  • add - add a new method that didn't exist before, with no interaction with the other methods of the superclass aside from leveraging them
  • override - replace the old method entirely
  • extend - add new behavior to the method while also calling the old one to keep the old behavior

an example, taken from Raymond Hettinger's lectures:

@dataclass
class Animal:
    name: str

    def walk(self):
        print(f"{self.name} is walking")

e.g.: Dog adds bark, Snake overrides walk with a slithering behavior, Cat extends walk with tail wiggles

adding¶

class Dog(Animal):
    def bark(self):
        print(f"{self.name} is barking!")

Dog adds a completely new method to the superclass Animal

overriding¶

class Snake(Animal):
    def walk(self):
        print(f"{self.name} is slithering!")

Snake completely overrides the superclass' original method, and the new one has no relationship with the old one aside from the intended use

extending¶

class Cat(Animal):
    def walk(self):
        super().walk()
        print(f"{self.name} is wagging is tail!")

Cat is extending the old function by adding new behavior on top of it.

the super function is a special function that allows referencing the method implemented by the superclass instead of the current one; it is commonly used during inheritance, especially while extending methods
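Putting the three subclasses together (using the Animal class defined above), usage might look like:

for pet in [Dog("Rex"), Snake("Ka"), Cat("Tom")]:
    pet.walk()

# Rex is walking
# Ka is slithering!
# Tom is walking
# Tom is wagging its tail!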

interface extension¶

A common use of inheritance is to use a class that derives more methods from some basic ones.

for example, the "collections" module provides a "MutableMapping" abstract base class to help create various methods from a base set of methods:

  • __getitem__
  • __setitem__
  • __delitem__
  • keys
In [69]:
import collections.abc

class Empty(collections.abc.MutableMapping):
    def __getitem__(self, key): pass
    def __setitem__(self, key, value): pass
    def __delitem__(self, key): pass
    def __iter__(self): pass
    def __len__(self): pass

dir(Empty).public
Out[69]:
function:
    clear: D.clear() -> None.  Remove all items from D.
    get: D.get(k[,d]) -> D[k] if k in D, else d.  d defaults to None.
    items: D.items() -> a set-like object providing a view on D's items
    keys: D.keys() -> a set-like object providing a view on D's keys
    pop: D.pop(k[,d]) -> v, remove specified key and return the corresponding value.
    popitem: D.popitem() -> (k, v), remove and return some (key, value) pair
    setdefault: D.setdefault(k[,d]) -> D.get(k,d), also set D[k]=d if k not in D
    update: D.update([E, ]**F) -> None.  Update D from mapping/iterable E and F.
    values: D.values() -> an object providing a view on D's values

The child class can also replace some of the methods of the parent class, for example with a more performant one when some assumptions are valid

Interface validation¶

in this case we can define a class that checks for an interface, making it so that all the classes following that interface will appear as subclasses when checked for subclassing or being an instance of that interface

It is a way of describing interfaces without changing the class definition or forcing inheritance.

static validation¶

the typing library (since Python 3.8, earlier via typing_extensions) provides us with a Protocol object, which allows us to declare interfaces that a class should respect, without actually having to inherit from them.

This is very useful both for run-time checks and for mypy typing

In [3]:
from typing import Protocol, runtime_checkable

# this protocol checks whether the object has an integer attribute called handles
@runtime_checkable
class Portable(Protocol):
    handles: int
        
# this protocol checks whether the class provides a method with the given signature
@runtime_checkable
class Ducky(Protocol):
    def quack(self) -> None:
        pass
In [4]:
class Empty:
    pass

obj = Empty()
assert not isinstance(obj, Portable)

obj.handles = 3
assert isinstance(obj, Portable)
In [8]:
class Duck:
    def quack(self):
        pass
    
assert issubclass(Duck, Ducky)
duck_instance = Duck()
assert isinstance(duck_instance, Ducky)

this allows me to write code such as:

def talk_with(pet: Ducky):
    pet.quack()

and have mypy accept my signature and verify calls against it. I can also use it for saner subclass and instance checks if I want to program defensively instead!

Beware that the runtime check only verifies the presence of the method, not its signature; that is a job for mypy!

In [18]:
%%file temp_mypy.py
from typing import Protocol, runtime_checkable

@runtime_checkable
class TalkativeDuck(Protocol):
    def quack(self) -> str:
        return "quack"
    
class MechanicalDuck:
    def quack(self) -> int:
        return 0
    
assert issubclass(MechanicalDuck, TalkativeDuck)

def talk(pet: TalkativeDuck):
    print(pet.quack())

talk(MechanicalDuck())
Overwriting temp_mypy.py

This code runs, even if it is technically incorrect, but mypy warns us that there is an issue with the definition!

In [20]:
!python temp_mypy.py
0
In [19]:
!mypy temp_mypy.py
temp_mypy.py:17: error: Argument 1 to "talk" has incompatible type "MechanicalDuck"; expected "TalkativeDuck"
temp_mypy.py:17: note: Following member(s) of "MechanicalDuck" have conflicts:
temp_mypy.py:17: note:     Expected:
temp_mypy.py:17: note:         def quack(self) -> str
temp_mypy.py:17: note:     Got:
temp_mypy.py:17: note:         def quack(self) -> int
Found 1 error in 1 file (checked 1 source file)

Composition Over Inheritance¶

Often inheritance is used to specialize some corner case of a class.

In many cases this can be replaced with composition.

Composition is a way to replace the framework approach: instead of subclassing a class to specialize its behavior, one can set an attribute to a completely different object to configure its behavior

Let's consider a very simple class that prints a message.

This class prints to the terminal, but we might implement a subclass that replaces the print with something else

In [376]:
class BasicPrinter:
    def printer(self, message):
        print(message)
        
    def say_hello(self, name):
        s = f"hello {name}!\n"
        self.printer(s)
        
class LoggingPrinter(BasicPrinter):
    def printer(self, message):
        import logging
        logging.warning(message)
        
BasicPrinter().say_hello("everybody")
LoggingPrinter().say_hello("everybody")
WARNING:root:hello everybody!

hello everybody!

this approach works, and it's quite common in more structured languages, but you can see that it still feels somewhat verbose.

If we have several behaviors, we would need a different subclass for each behavior.

If we have several kinds of behaviors, we might need to write a class for each combination in the cartesian product of the options!

composition presents a better option, allowing us to simply replace a component to change the behavior: no subclassing needed.

In [373]:
@dataclass
class Printer:
    printer: callable = print
        
    def say_hello(self, name):
        s = f"hello {name}!\n"
        self.printer(s)
        
myprinter = Printer()
myprinter.say_hello("everybody")
hello everybody!

In [374]:
from io import StringIO
s = StringIO()

myprinter.printer = s.write
myprinter.say_hello("everybody")
myprinter.say_hello("nobody")

print(s.getvalue())
hello everybody!
hello nobody!

framework logic¶

This is another very common pattern that can be replaced by composition.

The parent class controls the behavior, while the child class implements the methods needed to actually act (the basic idea behind abstract classes).

An animal could delegate how to sense food and how to move from one place to another, but control how the decision to move is made after the food is sensed.
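A minimal sketch of that idea using composition (all the names here are illustrative):

from dataclasses import dataclass
from typing import Callable

@dataclass
class Animal:
    sense_food: Callable[[], bool]
    move: Callable[[], None]

    def step(self):
        # the class controls the decision logic...
        if self.sense_food():
            self.move()   # ...and delegates the concrete actions

hound = Animal(sense_food=lambda: True, move=lambda: print("moving!"))
hound.step()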


On the other hand, it's a very common pattern in Python: all the magic methods are nothing more than framework logic to perform various operations

Create scikit.learn compatible classes¶

Any class that implements these features can inherit from BaseEstimator and then from sklearn.base.ClassifierMixin, sklearn.base.RegressorMixin or sklearn.base.TransformerMixin to have its interface completed.

due to the requirements for this extension, I strongly suggest creating these classes using the dataclass decorator.

It is also a good idea to just store the __init__ parameters without modifying them. If you have to perform some processing and transformations, it's usually better to do them inside the fit function.

In [320]:
from dataclasses import dataclass
from typing import List
from sklearn.base import BaseEstimator, TransformerMixin

@dataclass
class ColumnSelector(BaseEstimator, TransformerMixin):
    columns: List[str]

    def fit(self, X, y=None):
        return self

    def transform(self, X):
        return X[self.columns]
In [321]:
cs = ColumnSelector(columns=["a", "e"])
print(cs.get_params())
{'columns': ['a', 'e']}
In [324]:
import pandas as pd
df = pd.DataFrame(rn.randn(5, 5), columns=list("abcde"))
cs.fit_transform(df)
Out[324]:
          a         e
0 -1.606346 -0.300311
1  0.020452 -0.678270
2  1.406233  0.581932
3 -2.292684  0.420558
4  0.959172  1.054905

Polymorphism¶

Polymorphism is the ability of a function, routine or method to behave differently depending on the class of the objects it receives as parameters.

in general OOP each type signature can activate a different function

for example, a function defined as

def times(a, b):
    return a*b

could have different implementations specifying the behaviour in different cases:

  • both a and b are numbers
  • a is a string, b is a number
  • a is a list, b is a number
  • etc...

in Python's OOP, the standard library only supports dispatching on the type of the first argument; this is called single dispatch

libraries that allow multiple dispatch exist, but I wouldn't recommend them

one can always define multiple dispatch in terms of several levels of single dispatch

considering how easy it is to use

  • composition
  • protocols
  • operator overloading

in python, it is actually rarely a necessity to rely on polymorphism at all

single dispatch¶

Single dispatch is a way of writing functions that recognize the type of their first argument, allowing for a low-level form of object oriented code.

This allows writing generic functions that can easily be combined with iteration functions such as map, as they can receive iterables containing a mix of different objects and use the best implementation for each specific object received.

This could be managed with a combination of if-else and isinstance calls, but single dispatch is more readable

Let's say that I want to write a function that calculates the mean of an iterable, but uses more efficient functions when available, such as for numpy arrays

In [12]:
from functools import singledispatch
from statistics import mean
import numpy as np

def average(iterable):
    if isinstance(iterable, np.ndarray):
        print("using the specific (and fast) numpy mean")
        return iterable.mean()
    else:
        print("using the generic (and slow) python mean")
        return mean(iterable)
In [13]:
average([1, 2, 3])
using the generic (and slow) python mean
Out[13]:
2
In [14]:
data = np.array([1, 2, 3])
average(data)
using the specific (and fast) numpy mean
Out[14]:
2.0

Single dispatch allows us to avoid writing all those checks explicitly, doing the work under the hood for us.

In [15]:
@singledispatch
def average(iterable):
    print("using the generic (and slow) python mean")
    return mean(iterable)

@average.register
def _(np_array: np.ndarray):
    print("using the specific (and very fast) numpy mean")
    return np_array.mean()
In [16]:
average([1, 2, 3])
using the generic (and slow) python mean
Out[16]:
2
In [17]:
data = np.array([1, 2, 3])
average(data)
using the specific (and very fast) numpy mean
Out[17]:
2.0

It also adds the advantage that, if we want to write a specific version of the average function for a class of our own, we don't need to tamper with the original one, but can extend it in a (relatively) simple way

we have to register it after the class has been defined, outside the class body, as the class does not exist before the execution of its body

In [18]:
class AverageAware:
    def __init__(self, value):
        self.value = value
    
    def _my_avg(self):
        return self.value

# register the unbound method as the implementation for AverageAware instances
average.register(AverageAware)(AverageAware._my_avg)

a = AverageAware(5)
average(a)
Out[18]:
5

Function Hooks¶

A concept similar to single dispatch is function hooking:

  • the function will perform some default operation on the data
  • on objects that conform to a specific protocol, it will call their specialized method

we can implement this quite easily in python using the Protocol definition we discussed in the previous section on inheritance

this is the basic mechanism underneath several builtins:

  • len defers to the object's __len__ method
  • iter uses the object's __iter__ method when defined, and otherwise falls back to indexing with __getitem__
In [34]:
from typing import Protocol, runtime_checkable

@singledispatch
def average(iterable):
    "when not defined, try to use python"
    print("python mean used")
    return mean(iterable)

@runtime_checkable
class Provide_mean(Protocol):
    "this is the protocol to identify classes that have a `mean` function"
    def mean(self):
        pass

@average.register
def _(instance: Provide_mean):
    "if the class has a `mean` function, calls it"
    print("object's own mean function used")
    return instance.mean()
In [35]:
print(average([1, 2, 3]))
python mean used
2
In [36]:
data = np.array([1, 2, 3])
average(data)
object's own mean function used
Out[36]:
2.0
In [37]:
class MyClass:
    def mean(self):
        return 0.0
        
pippo = MyClass()
print(average(pippo))
object's own mean function used
0.0

in all fairness, in this simple case we could have defined the function hook without the need for single dispatch

it would still be useful if we needed to combine it with standard single dispatch

In [45]:
def average2(iterable):
    avg_fun = getattr(iterable, "mean", None)
    if callable(avg_fun):
        return avg_fun()
    return mean(iterable)

print(average2([1, 2, 3]))
print(average2(np.array([4, 5, 6])))
pippo = MyClass()
print(average2(pippo))
2
5.0
0.0

method dispatching¶

python 3.8 also introduced singledispatchmethod, which allows performing single dispatch on methods.

a dedicated decorator is required to avoid weird interactions with the binding process of method calls

In [27]:
from functools import singledispatchmethod
from dataclasses import dataclass
from numbers import Number

@dataclass
class Container:
    value: Number
    
    @singledispatchmethod
    def __add__(self, other):
        return NotImplemented
    
    @__add__.register
    def _(self, other: Number):
        return self.__class__(self.value+other)
In [28]:
cont = Container(3)
print(cont)
print(cont+"1")
Container(value=3)
---------------------------------------------------------------------------
TypeError                                 Traceback (most recent call last)
Input In [28], in <cell line: 3>()
      1 cont = Container(3)
      2 print(cont)
----> 3 print(cont+"1")

TypeError: unsupported operand type(s) for +: 'Container' and 'str'
In [29]:
cont = Container(3)
print(cont)
print(cont+1)
Container(value=3)
Container(value=4)

Note that by default we cannot reference the class itself in a type annotation, as the class name is bound only after the class body has been executed

In [3]:
class Broken:
    def test(self, a: Broken):
        pass
---------------------------------------------------------------------------
NameError                                 Traceback (most recent call last)
Cell In[3], line 1
----> 1 class Broken:
      2     def test(self, a: Broken):
      3         pass

Cell In[3], line 2, in Broken()
      1 class Broken:
----> 2     def test(self, a: Broken):
      3         pass

NameError: name 'Broken' is not defined
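for a plain annotation like this one, the standard fix is a string forward reference (or from __future__ import annotations, which makes every annotation lazy):

class Fixed:
    def test(self, a: "Fixed"):  # the string is only evaluated on demand
        pass

this is not enough for singledispatchmethod.register, though, since registration needs to resolve the annotation to the actual class object at registration time.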

a way to circumvent the problem in that case is to define the method that refers to the class itself outside of the class (all the other definitions can still live inside the class body)

In [5]:
from functools import singledispatchmethod

class SelfReferent:
    @singledispatchmethod
    def __add__(self, other):
        """generic version of the function"""
        return NotImplemented

@SelfReferent.__add__.register
def _(self, other: SelfReferent):
    return 2
In [6]:
p = SelfReferent()
q = SelfReferent()
In [7]:
p+q
Out[7]:
2
In [8]:
p+1
---------------------------------------------------------------------------
TypeError                                 Traceback (most recent call last)
Cell In[8], line 1
----> 1 p+1

TypeError: unsupported operand type(s) for +: 'SelfReferent' and 'int'

Exercise 1 - simpler¶

Our goal is to implement a predictor transformer: use the predictions of one or more Regressors/Classifiers as the input for another one.

I want to use it somewhat like this:

predictor_transformer = PT(LinearRegression)
predictor_transformer.fit(X_train, y_train)
predictor_transformer.transform(X_test) # should return a 2d array Nx1 with the predicted y_test

Exercise 2 - harder¶

Our goal might be to implement a groupby standardizer.

a standardizer subtracts the average of one or more columns, and divides the data by their standard deviation.

The standard standardizer uses the average over the whole data, but we might want to do this operation separately on different groups, for example by country.

Assuming that all the groupby categories are present in the training data, try to implement it

group_standardizer = GS(groupby_column='country')
group_standardizer.fit(X_train, y_train)
group_standardizer.transform(X_train)

end of the general programming module¶

Extra material¶

this is not part of the lesson material, but it is interesting to have here as a reference. You can explore these topics in the notebook corresponding to these slides.

topics:

  • metaprogramming
  • API design and evolution
  • constraining function parameters using the enum module
  • notes on subclassing
  • fluent interfaces

black magic topics

  • class registration with ABCMeta
  • class bodies are code blocks
  • Uniform Calling Syntax
  • secret attributes with improper names
  • transparent wrapper objects relaying attributes, exploiting improper names
  • dynamic class change of an instance
  • attributes with access logging
  • calling interfaces (such as pandas.Series.str)
  • dynamic attribute resolution
  • a sklearn class to perform column selection from a dataframe, including column operations
  • write-once attributes

metaprogramming: metaclasses¶

classes are objects too.

by default they are of type type (which is a class but also an object). type provides the initialization for the class in the same way as the class provides the initialization for its instances (using the __new__ method)

One can write a subclass of type that provides a different initialization process, and use it to generate new classes. To do this, the type subclass should be indicated as the metaclass of the new class, alongside its superclasses. This allows customizing the generation of classes. It is not commonly used in normal programming, but can be very useful for:

  • frameworks
  • attribute sharing without inheritance from other classes
In [357]:
# type is an object that has type type, which is an object that has type type, etc...
class Empty_base:
    pass

class Empty(Empty_base):
    pass

assert issubclass(Empty, Empty_base)
assert isinstance(Empty, object)

assert type(Empty()) is Empty
assert type(Empty) is type

assert type(type) is type
assert type(object) is type
assert isinstance(type, object)
In [355]:
# dynamic class generation: type(name, bases, namespace) creates a new class
Foo = type('SomeClass', (Empty, ), {'x':100})
assert Foo.__name__ == 'SomeClass'

someobject = Foo()
assert isinstance(someobject, Foo)
assert type(Foo) is type

someobject.x
Out[355]:
100
In [362]:
# we can subclass type and use it to generate classes, so the type of the new class is going to be that subclass of type
class Meta(type):
    def __new__(cls, name, bases, dct):
        x = super().__new__(cls, name, bases, dct)
        x.attr = 100
        
        def obscure(self):
            return self.attr
        x.obscure = obscure
        
        return x
    
Foo = Meta('SomeClass', (Empty, ), {})
assert Foo.__name__ == 'SomeClass'

someobject = Foo()
assert isinstance(someobject, Foo)
assert type(Foo) is Meta

assert someobject.obscure() == someobject.attr
In [363]:
class Foo(metaclass=Meta):
    pass

someobject = Foo()
assert isinstance(someobject, Foo)
assert type(Foo) is Meta

assert someobject.obscure() == someobject.attr

Improving your library API design and management¶

One of the problems when writing a library is that the requirements and structure of your functions' API will change over time.

Improving and changing your API is a non-trivial process, as there are probably users relying on your code!

The best thing is to get it right from the beginning. While this is clearly utopian, in general it is a good idea to follow the old advice of

measure twice, cut once

Luckily python provides us with a great number of tools (such as properties, dynamic attributes, magic methods, etc...) that make it easy to apply post-hoc patches that are transparent to the user but allow you to improve one step at a time.

Here I collect some suggestions that you might find helpful, both for good design and for improving the design over time.

a good discussion can be found in this article: API evolution the right way

deprecation warning¶

once you define a function that uses certain parameters, or certain defaults, and you realize that you need to change them, don't do it straight away! You will break your users' code, and they will not be thrilled.

the usual solution is to take an intermediate step (usually one or two releases of the library before the change actually happens) to warn your users about the upcoming change in the API. This is done by emitting a DeprecationWarning through the warnings module when the deprecated behavior is used, or by logging a warning when the function is called.
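a minimal sketch of the pattern (the function, parameter and message are illustrative):

import warnings

def evolve(initial_state, rule, boundary="fixed dead"):
    # hypothetical transition: string values for `boundary` are being phased out
    if isinstance(boundary, str):
        warnings.warn(
            "passing `boundary` as a string is deprecated and will be removed "
            "in a future release; pass an enum member instead",
            DeprecationWarning,
            stacklevel=2,  # attribute the warning to the caller's line
        )
    ...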

constraining function parameters using the enum module¶

a common issue with some APIs, especially old ones in python, is the use of modal parameters passed as strings.

A modal parameter is a parameter that switches the behavior of the function between a few selected modes. A common example is the histtype parameter of the hist function in matplotlib, which takes a string to define the kind of histogram one wants to draw.

I've been using this function for almost ten years, and I still can't remember if the names are hyphenated, which ones are available and which are not, and so on. And if one passes the wrong string, the error message is not helpful enough.

This is a limit of the API: it has low discoverability, meaning that a new user will have a hard time understanding how to use it, or even that it is possible at all. This is common with graphical functions, which might need to pass parameters to a few other functions along the way, so their signatures end up being an unsightly mess.

A better solution is to leverage the enum standard library module (introduced in python 3.4) together with dynamic attribute assignment

let's consider a function that evolves a dynamical system such as the one we implemented in the first few lessons for cellular automata.

This function has a modal argument, namely the behavior of the system at the boundaries. This could be:

  • reflective
  • circular
  • fixed alive
  • fixed dead

the first version would use a string as a parameter, such as:

def evolve(initial_state, rule, boundary='fixed dead'):
    # do something with that info

the problem is that a string is the wrong abstraction: we don't want arbitrary strings, only a limited set of them, yet we are still allowing the user to pass in any value. This means that we also have to worry about error management, and be very careful to keep the documentation in line with the values we accept.

a better solution would be to use an enum class

In [428]:
import enum

class BoundaryType(enum.Enum):
    REFLECTIVE = "reflective"
    CIRCULAR = "circular"
    FIXED_DEAD = 'fixed dead'
    FIXED_ALIVE = 'fixed alive'

and we would write the function as:

def evolve(initial_state, rule, boundary=BoundaryType.FIXED_DEAD):
    # function body

Having this enum gives us several advantages:

  • it is still compatible with the old definition (the value is identical to the old ones), allowing for a smoother transition
  • the user can see in their code what is available, and can leverage their editor's autocompletion capabilities
  • there is less risk of mistakes in the code by passing the wrong string

this is often worth the improvement in code correctness, but the approach does have two disadvantages:

  • the code is a little bit more verbose
  • the user is required to import more names from the module, littering the namespace and the import section

We can improve discoverability even further by leveraging function attributes.

Functions being just another kind of object, we can set any attribute on them. In our case we can attach the values that the arguments accept to the function itself, making sure that the function carries with it everything it needs.

In [430]:
def fun():
    pass

fun.x = 3
dir(fun).public  # dir here is pdir2's enhanced dir, which groups the attributes
Out[430]:
property:
    x

there are three approaches to this implementation:

  1. storing all the enums in a single namespace
  2. storing each enum in an attribute with the same name as the enum
  3. storing each enum in an attribute with the same name as the function parameter

storing all the enums in a single namespace¶

This option is useful if only one parameter uses the enum, or if several parameters do but share the same enum values.

for example, a graphic class for a square might take, for each side, whether the line should be absent, thin or bold. given that the four parameters share the same values and there are no other parameters (for now!), it might make sense to store all the enum values on the function directly

In [436]:
class LineStyle(enum.Enum):
    NO_LINE = 'noline'
    THIN = 'thin'
    BOLD = 'bold'
    
def draw_square(top=LineStyle.THIN, bottom=LineStyle.THIN, left=LineStyle.THIN, right=LineStyle.THIN):
    pass

for style in LineStyle:
    setattr(draw_square, style.name, style)

dir(draw_square).public
Out[436]:
property:
    BOLD, NO_LINE, THIN

And this function could then be called with:

draw_square(bottom=draw_square.BOLD)

this approach can be useful when one of the parameters (typically the first or second) has a predominant role in the behavior of the function, changing it drastically rather than fine-tuning it.

each enum in an attribute with the same name as the enum¶

This is a little more verbose, but helps the user understand what the enumerator refers to, and has the advantage of using the same expression that would appear in the function signature.

this means, on the other hand, that we increase the verbosity of our code further

In [437]:
class LineStyle(enum.Enum):
    NO_LINE = 'noline'
    THIN = 'thin'
    BOLD = 'bold'
    
def draw_square(top=LineStyle.THIN, bottom=LineStyle.THIN, left=LineStyle.THIN, right=LineStyle.THIN):
    pass

draw_square.LineStyle = LineStyle

dir(draw_square).public
Out[437]:
class:
    LineStyle: An enumeration.

And now the call would look like this (verbose but clear):

draw_square(bottom=draw_square.LineStyle.BOLD)

there is nothing stopping the user from using two lines instead of one, redefining the values locally

bold = draw_square.LineStyle.BOLD
draw_square(bottom=bold)

each enum in an attribute with the same name as the parameter¶

if the function has several parameters (or we want to be safe for future extensions), one solution is to name the attribute not after the enum class, but after the function parameter. This obscures the connection between the function signature and the value passed a little, but as you will see, it is still quite clear to read.

let's assume that we want to add some other parameter, for example the shape of the corners of our square...

In [440]:
class CornerStyle(enum.Enum):
    POINTY = 'pointy'
    SQUARED = 'squared'
    CURVED = 'curved'
    
def draw_square(corners=CornerStyle.SQUARED):
    pass

draw_square.corners = CornerStyle

dir(draw_square).public
Out[440]:
class:
    corners: An enumeration.

and the call to the function would be something like:

draw_square(corners=draw_square.corners.CURVED)

again, it is verbose, but can be shortened as shown before. It also has the advantage of showing explicitly the connection between the parameter and the values that it can take.

Of course there can be a mixture of all the approaches, depending on the function at hand.

notes on subclassing¶

  • when you write a class, try to make it easy to subclass! for example refer to self.__class__ and self.__class__.__name__ instead of hardcoding the class and its name (see the sketch after this list)
  • the instance behind self might not be the class you are writing right now, but one of its derived ones! keep things generic unless you need otherwise!
  • this is true also for super(): it does not refer to the ancestor of the class you're writing, but to the ancestor of the object you have as self, which might include some completely different classes.
  • subclassing is delegating work, so it's the instance that has complete control over what gets executed
  • try to concentrate all the violations of the Liskov substitution principle in one (or very few) methods, so that by overriding those one can obtain a fully functioning class that follows the principle as closely as it can
  • the open-closed principle: open to extension, closed to modification. when you subclass you should not break the underlying assumptions of the base class
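a minimal sketch of the first two points (the Interval classes are purely illustrative):

class Interval:
    def __init__(self, low, high):
        self.low, self.high = low, high

    def shifted(self, delta):
        # NOT `return Interval(...)`: with self.__class__ the method
        # keeps returning instances of whatever subclass self is
        return self.__class__(self.low + delta, self.high + delta)

    def __repr__(self):
        # same idea for the name: correct in every subclass, for free
        return f"{self.__class__.__name__}({self.low}, {self.high})"

class ClosedInterval(Interval):
    pass

ClosedInterval(0, 1).shifted(2)  # -> ClosedInterval(2, 3), not Interval(2, 3)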

Fluent Interface¶

Fluent interfaces are a variant of object oriented interfaces where methods that act on the object without creating a new one return the object itself rather than nothing.

This allows chaining the methods in a semi-pipeline form.

I'm not a big fan of them, but you might find them in the wild (for example sklearn exposes a fluent interface, with fit returning self, even if it is rarely used that way).

It makes the code (marginally) prettier, but it's simply hell to debug!

In [1]:
class FluentNumber:
    def __init__(self, value):
        self.value = value
        
    def add(self, value):
        self.value += value
        return self
    
    def multiply(self, value):
        self.value *= value
        return self
    
number2 = FluentNumber(2)
result = number2.add(3).multiply(2)
print(result.value)
10

Black Magic section¶

this is not lecture material, but some weird (and somewhat useful) tricks that you might want to check out

class registration with ABCMeta¶

In [81]:
import abc

class PippoInterface(metaclass=abc.ABCMeta):
    pass
        
@PippoInterface.register
class Myclass:
    def pippo(self):
        pass

obj = Myclass()
assert issubclass(Myclass, PippoInterface)
assert isinstance(obj, PippoInterface)

Class bodies are code blocks¶

Class bodies are code blocks that get executed when the class is defined.

This means that any construct one might want to employ is legitimate, including exotic ones such as conditional definitions.

Albeit not very useful for classes defined at module level, this is useful in some situations, such as second-order classes.

In [47]:
class Temp:
    a = 4
    print(f"I'm executing but not doing anything, with a value of {a}")
    del a
    
assert not hasattr(Temp, 'a')
I'm executing but not doing anything, with a value of 4
In [82]:
debug_mode = True
import logging

class Conditional:
    if not debug_mode:
        def __init__(self, a):
            self.a = a
    else:
        def __init__(self, a):
            self.a = a
            logging.warning("setting 'a' to {}".format(a))
            
myobj = Conditional(a=3)
WARNING:root:setting 'a' to 3

note that changing the value of debug_mode does not change the behavior of the class.

The definition itself was conditional; once executed, the behavior is fixed.

In [83]:
debug_mode = False
myobj = Conditional(a=3)
WARNING:root:setting 'a' to 3

note that there is a limitation: it is not possible to reference the class itself inside its definition.

This is because the class name is bound to the namespace only after the definition code has run, and it does not exist beforehand

Uniform Calling Syntax¶

Python does not normally support it, but nothing stops you from implementing it for some specific classes.

You probably shouldn't, but hey, who's going to stop you?

In [1]:
from functools import partial
class DarkMagic:
    def __getattr__(self, name):
        func = eval(name) # dynamic resolution of the function name
        if not callable(func):
            raise TypeError("the requested dynamic attribute with name <{}> is not a function".format(name))
        return partial(func, self)
    
def hideous_function(self, b):
    return self.a*b*2

dark_beast = DarkMagic()
dark_beast.a = 3
dark_beast.hideous_function(b=3)
Out[1]:
18

secret attributes with improper names¶

In [85]:
# if you know what you're doing, you can do some weird ass stuff
# like attributes with names that are not legitimate attribute names 
# and can't therefore be accessed with the dot operator
class HiddenMagic:
    def __init__(self, a):
        setattr(self, "_secret 'a'", a)
        
    @property
    def a(self):
        return getattr(self, "_secret 'a'")
        
crazy_obj = HiddenMagic(3)
print(crazy_obj.a)
dir(crazy_obj).own
3
Out[85]:
property:
    _secret 'a'
special attribute:
    __dict__, __doc__, __module__, __weakref__
object customization:
    __init__
descriptor:
    a: @property with getter

transparent wrapper objects relaying attributes, exploiting improper names¶

In [89]:
class Wrapper:
    @classmethod
    def unwrap(cls, obj):
        return getattr(obj, "_ other _ ")
    
    def __init__(self, other):
        self.__dict__["_ other _ "] = other
        
    def __getattr__(self, name):
        other = getattr(self, "_ other _ ")
        return getattr(other, name)
    
    def __setattr__(self, name, value):
        other = getattr(self, "_ other _ ")
        return setattr(other, name, value)
    
class Empty:
    pass

tipo = Empty()
wrapped = Wrapper(tipo)
wrapped.a = 2
print(wrapped.a, tipo.a)
print(Wrapper.unwrap(wrapped))
2 2
<__main__.Empty object at 0x7fbf54091860>

Dynamic class change of an instance¶

In [86]:
class Worm:
    def mutate(self):
        self.__class__ = Butterfly
        
class Butterfly:
    def describe(self):
        return "I'm fabulous"

beast = Worm()
beast.mutate()
beast.describe()
Out[86]:
"I'm fabulous"

Attributes with access logging¶

In [87]:
# implements an access counter for an attribute... this is terrible practice!
# it can be done like this, but one might be better off using a Descriptor
from collections import namedtuple
rw_counts = namedtuple("RWcounts", ["reads", "writes"])

class AnotherWeirdo:
    def __init__(self):
        self._a = 0
        self._a_readings = 0
        self._a_writings = 0
    
    @property
    def a(self):
        self._a_readings += 1
        return self._a
    
    @a.setter
    def a(self, value):
        self._a_writings += 1
        self._a = value
        
    def get_access_stats(self):
        return rw_counts(self._a_readings, self._a_writings)
        
weirdo = AnotherWeirdo()
weirdo.a = 3
print(weirdo.a)
print(weirdo.a)
print(weirdo.get_access_stats())
3
3
RWcounts(reads=2, writes=1)
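as a comparison, a minimal sketch of the descriptor-based version hinted at in the comment above (the LoggedAttribute name is illustrative):

class LoggedAttribute:
    """descriptor that counts reads and writes of the attribute it manages"""
    def __set_name__(self, owner, name):
        self.storage = "_" + name  # where the actual value lives

    def __get__(self, instance, owner=None):
        if instance is None:
            return self
        counts = instance.__dict__.setdefault("_counts", {"reads": 0, "writes": 0})
        counts["reads"] += 1
        return instance.__dict__[self.storage]

    def __set__(self, instance, value):
        counts = instance.__dict__.setdefault("_counts", {"reads": 0, "writes": 0})
        counts["writes"] += 1
        instance.__dict__[self.storage] = value

class Weirdo:
    a = LoggedAttribute()

weirdo = Weirdo()
weirdo.a = 3
weirdo.a
weirdo._counts  # -> {'reads': 1, 'writes': 1}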

Calling interfaces (such as pandas.Series.str)¶

In [88]:
# a map-calling interface similar to that of pandas' Series.str
class MapInterface:
    def __init__(self, target):
        setattr(self, "_ target _", target)
        
    def __getattr__(self, function):
        setattr(self, "_ target function_", function)
        return self
    
    def __call__(self, *args, **kwargs):
        target = getattr(self, "_ target _")
        funcname = getattr(self, "_ target function_")
        results = []
        for item in target:
            function = getattr(item, funcname)
            result = function(*args, **kwargs)
            results.append(result)
        return MyList(results)
            
class MyList(list):
    @property
    def str(self):
        return MapInterface(self)
        
mylist = MyList('abcde')
print(mylist)
print(mylist.str.replace('a', 'A'))
['a', 'b', 'c', 'd', 'e']
['A', 'b', 'c', 'd', 'e']

dynamic attribute resolution¶

In [250]:
class MyEvilList(list):
    def __getattr__(self, name):
        base, cls = name.split('_')
        assert base == 'getas'
        cls = eval(cls)
        return cls(iter(self))
    
a = MyEvilList([1, 2, 3])
print(a.getas_tuple)
print(a.getas_set)
(1, 2, 3)
{1, 2, 3}

A sklearn class to perform column selection from a dataframe, including column operations¶

In [315]:
# a class like the one used in the example, but that can parse generic formulas in the dataframe space using eval
from dataclasses import dataclass
from typing import List
import pandas as pd
import numpy.random as rn
from sklearn.base import BaseEstimator, TransformerMixin

@dataclass
class ColumnSelector(BaseEstimator, TransformerMixin):
    columns: List[str]

    def fit(self, X, y=None):
        return self

    def transform(self, X: pd.DataFrame):
        new_series = {col: X.eval(col) for col in self.columns}
        return pd.DataFrame(new_series)


df = pd.DataFrame(rn.randn(100, 5), columns=list("abcde"))
            
cs = ColumnSelector(columns=["a", "e", "abs(a)*exp(e)"])
print(cs.get_params())
cs.fit_transform(df).head()
{'columns': ['a', 'e', 'abs(a)*exp(e)']}
Out[315]:
          a         e  abs(a)*exp(e)
0  0.987063  0.307840       1.342883
1  0.817038 -1.034727       0.290312
2  0.143144  0.078301       0.154803
3  2.307495  1.301436       8.479050
4 -0.218387 -0.722837       0.105999

write-once attributes¶

this class behaves like a namespace where each variable can be bound to a value once and never rebound (the underlying object can still change internally, but the name cannot be reassigned).

In [413]:
class NameSpace:
    def __init__(self, **kwargs):
        for name, value in kwargs.items():
            self.__setattr__(name, value)
            
    def __setattr__(self, name, value):
        if hasattr(self, name):
            raise AttributeError("tried to rewrite an attribute!")
        super().__setattr__(name, value)
        
namespace = NameSpace(a=4)
namespace.b = 4
assert namespace.a == 4 == namespace.b
namespace.a = 2
---------------------------------------------------------------------------
AttributeError                            Traceback (most recent call last)
<ipython-input-413-c9ed41df8539> in <module>
     11 namespace.b = 4
     12 assert namespace.a == 4 == namespace.b
---> 13 namespace.a = 2

<ipython-input-413-c9ed41df8539> in __setattr__(self, name, value)
      5     def __setattr__(self, name, value):
      6         if hasattr(self, name):
----> 7             raise AttributeError("tried to rewrite an attribute!")
      8         super().__setattr__(name, value)
      9 

AttributeError: tried to rewrite an attribute!

dynamic validation¶

There is another approach, using the Abstract Base Class mechanics, that allows checking at runtime for any characteristic of a class.

it is less general than the Protocol approach, and in general it should only be used for some specific cases

In [48]:
# abc.ABC is only available in python 3.4+
import abc
class PippoInterface(abc.ABC):
    @classmethod
    def __subclasshook__(cls, subclass):
        # I define an instance or subclass as anything that has a method called "pippo"
        return hasattr(subclass, "pippo") and callable(getattr(subclass, "pippo"))
In [49]:
class Myclass_1:
    def pippo(self):
        pass
    
assert issubclass(Myclass_1, PippoInterface)
assert isinstance(Myclass_1(), PippoInterface)
In [50]:
class Myclass_2:
    def pluto(self):
        pass
    
assert not issubclass(Myclass_2, PippoInterface)
assert not isinstance(Myclass_2(), PippoInterface)
In [51]:
class Myclass_3:
    pippo = 1

assert not issubclass(Myclass_3, PippoInterface)
assert not isinstance(Myclass_3(), PippoInterface)
In [52]:
# can be used to distinguish classes based on the value of some attribute
# this would allow simulating composition,
# even if plain composition is just better

class PippoInterface(abc.ABC):
    @classmethod
    def __subclasshook__(cls, subclass):
        # here an instance or subclass is anything whose "pippo" attribute is True
        return hasattr(subclass, "pippo") and getattr(subclass, "pippo")==True
In [55]:
class Myclass_1:
    pippo = True
    
assert issubclass(Myclass_1, PippoInterface)
assert isinstance(Myclass_1(), PippoInterface)
In [57]:
class Myclass_1:
    pippo = False
    
assert not issubclass(Myclass_1, PippoInterface)
b = Myclass_1()
assert not isinstance(b, PippoInterface)
# the hook is evaluated on the class, so it doesn't see the instance value!
b.pippo = True
assert not isinstance(b, PippoInterface)