# 2 equivalent ways to define an empty list
l0 = []
l1 = list()
assert l0 == l1

# not empty lists
l2 = ['a', 2]
l3 = list(range(3))
print(l2, l3, l2 + l3)
print(3 * l2)

['a', 2] [0, 1, 2] ['a', 2, 0, 1, 2]
['a', 2, 'a', 2, 'a', 2]


print(dir(l3))

['__add__', '__class__', '__contains__', '__delattr__', '__delitem__', '__dir__', '__doc__', '__eq__', '__format__', '__ge__', '__getattribute__', '__getitem__', '__gt__', '__hash__', '__iadd__', '__imul__', '__init__', '__init_subclass__', '__iter__', '__le__', '__len__', '__lt__', '__mul__', '__ne__', '__new__', '__reduce__', '__reduce_ex__', '__repr__', '__reversed__', '__rmul__', '__setattr__', '__setitem__', '__sizeof__', '__str__', '__subclasshook__', 'append', 'clear', 'copy', 'count', 'extend', 'index', 'insert', 'pop', 'remove', 'reverse', 'sort']


l3.append(10)
print(l3)
l3.reverse()
print(l3)

[0, 1, 2, 10]
[10, 2, 1, 0]


# Built-in functions applied on lists
# return lower value
print(min(l3))
# return higher value
print(max(l3))
# return sorted list
print(sorted([5, 2, 10, 0]))

0
10
[0, 2, 5, 10]


# "pasting" two lists can be done using zip
l1 = [1, 2, 3]
s = 'abc'
print(list(zip(l1, s)))
print(list(zip('abc', 'defg')))

[(1, 'a'), (2, 'b'), (3, 'c')]
[('a', 'd'), ('b', 'e'), ('c', 'f')]


l0 = [1, 4, 10]
l1 = []
for number in l0:
    l1.append(number**2)
    
print(l1)

[1, 16, 100]


l1 = [number**2 for number in l0]
print(l1)

[1, 16, 100]


# list comprehension with a condition
[s for s in ['a', 'bbb', 'e'] if len(s) == 1]

['a', 'e']


# lists comprehensions can be cascaded
l1 = [(x,y) for x in [1,2] for y in ['a','b'] ]
print(l1)

# Equivalent without list comprehensions
l2 = []
for x in [1,2]:
    for y in ['a','b']:
        l2.append((x, y))

assert l1 == l2

[(1, 'a'), (1, 'b'), (2, 'a'), (2, 'b')]


text = "basically"

def extract_patterns(text, n=3):
    pat = [text[i:i+n] for i in range(len(text)-n+1)]
    return pat

print("patterns=", extract_patterns(text))
print("patterns=", extract_patterns(text, n=5))

patterns= ['bas', 'asi', 'sic', 'ica', 'cal', 'all', 'lly']
patterns= ['basic', 'asica', 'sical', 'icall', 'cally']


# 2 equivalent notations to define an empty tuple (not very useful...)
t0 = ()
t1 = tuple()
assert t0 == t1

# not empty tuple
t2 = (1, 2, 'a')  # with the parentheses
t2 = 1, 2, 'a'    # it also works without parentheses
t3 = tuple(l3)  # from a list


# tuples only have 2 public methods (with a list comprehension)
[name for name in dir(t3) if not name.startswith('__')]

['count', 'index']


# assigment of multiple variables in 1 line
a, b = 1, 2
print(a, b)
# exchange of values
b, a = a, b
print(a, b)

1 2
2 1


def myfunc():
    return 1, 2, 3

t = myfunc()
print(type(t), t)
# Directly unpacking the tuple
a, b, c = myfunc()
print(a, b, c)

<class 'tuple'> (1, 2, 3)
1 2 3


s0 = set()


{1, 1, 1, 3}

{1, 3}


set([1, 1, 1, 3])

{1, 3}


s1 = {1, 2}
s2 = {2, 3}
print(s1.intersection(s2))
print(s1.union(s2))

{2}
{1, 2, 3}


print(1 in s1, 1 in s2)

True False


from random import shuffle, randint

n = 20
i = randint(0, n-1)
print('integer remove from the list:', i)
l = list(range(n))
l.remove(i)
shuffle(l)
print('shuffled list: ', l)

integer remove from the list: 9
shuffled list:  [12, 16, 4, 13, 0, 5, 6, 11, 2, 10, 8, 3, 17, 19, 14, 15, 1, 18, 7]


full_set = set(range(n))
changed_set = set(l)
ns = full_set - changed_set
ns.pop()

9


d = {'a': 1, 'b': 2, 0: False, 1: True}
print(d)

{'a': 1, 'b': 2, 0: False, 1: True}


date = {}
date['Year'] = 2020
date['Month'] = 1
print(date)
date['Year'] = 2015
date

{'Year': 2020, 'Month': 1}

{'Year': 2015, 'Month': 1}


print(date['Year'])
try:
    current_day = date['Day']
except KeyError as e:
    print(f'{e} is not an existing key !')

2015
'Day' is not an existing key !


l = ["value0", "value1"]
l.append("value2")
print(l)

['value0', 'value1', 'value2']


l[1]

'value1'


d = {"key0": "value0", "key1": "value1"}
d["key2"] = "value2"
print(d)

{'key0': 'value0', 'key1': 'value1', 'key2': 'value2'}


d["key1"]

'value1'


# dict have 11 public methods (with a list comprehension)
[name for name in dir(d) if not name.startswith('__')]

['clear',
 'copy',
 'fromkeys',
 'get',
 'items',
 'keys',
 'pop',
 'popitem',
 'setdefault',
 'update',
 'values']


# loop on items
for key, value in d.items():
    print(key, value)

key0 value0
key1 value1
key2 value2


# loop on values
for value in d.values():
    print(value)

value0
value1
value2


# loop on keys
for key in d.keys():
    print(key)

key0
key1
key2


# dict comprehension (here to change the case of values)
print(d)
d1 = {k: v.upper() for k, v in d.items()}
print(d1)

{'key0': 'value0', 'key1': 'value1', 'key2': 'value2'}
{'key0': 'VALUE0', 'key1': 'VALUE1', 'key2': 'VALUE2'}


text = 'abbbcc'


def count_elem(sequence):
    d = {}

    for letter in sequence:
        if letter not in d:
            d[letter] = 1
        else:
            d[letter] += 1
    return d

print("text=", text, "counts=", count_elem(text))

text= abbbcc counts= {'a': 1, 'b': 3, 'c': 2}


def build_count_base(t):                 
    d = {}                   
    for s in t:
        if s in d:
            d[s] += 1
        else:  
            d[s] = 1
    return d

def build_count_set(t):                   
    d = {k:0 for k in set(t)}
    for s in t:
        d[s] += 1
    return d

def build_count_count(t):
    d = {k:t.count(k) for k in set(t)}
    return d

def build_count_except(t):             
    d = {}                   
    for s in t:
        try:     
            d[s] += 1
        except KeyError:
            d[s] = 1
    return d

import collections

def build_count_counter(t):
    return collections.Counter(t)

def build_count_defaultdict(t):
    d = collections.defaultdict(int)
    for k in s:
        d[k] += 1
    return d

s = "Lorem ipsum dolor sit amet, consectetur adipiscing elit. Nam tristique at velit in varius. Cras ut ultricies orci. Fusce vel consequat ante, vitae luctus tortor. Sed condimentum faucibus enim, sit amet pulvinar ligula feugiat ac. Sed interdum id risus id rhoncus. Nullam nisi justo, ultrices eu est nec, hendrerit maximus lorem. Nam urna eros, accumsan nec magna eu, elementum semper diam. Nulla tempus, nibh id elementum dapibus, ex diam lacinia est, sit amet suscipit nulla nibh eu sapien. Aliquam orci enim, malesuada in facilisis vitae, pharetra sit amet mi. Pellentesque mi tortor, sagittis quis odio quis, fermentum faucibus ex. Aenean sagittis nisl orci. Maecenas tristique velit sed leo facilisis porttitor. "
s = s*10000
print(f"len(s) = {len(s)}, nbkeys {len(set(s))} base, count, count_count, except, collections.Counter")
%timeit build_count_base(s)
%timeit build_count_set(s)
%timeit build_count_count(s)
%timeit build_count_except(s)
%timeit build_count_counter(s)
%timeit build_count_defaultdict(s)

print("with split")
s2 = s.split()
print(f"len(s) = {len(s2)}, nbkeys {len(set(s2))} base, count, count_count, except, collections.Counter")
%timeit build_count_base(s2)
%timeit build_count_set(s2)
%timeit build_count_count(s2)
%timeit build_count_except(s2)
%timeit build_count_counter(s2)
%timeit build_count_defaultdict(s2)

len(s) = 7160000, nbkeys 33 base, count, count_count, except, collections.Counter
738 ms ± 20.9 ms per loop (mean ± std. dev. of 7 runs, 1 loop each)
747 ms ± 22.8 ms per loop (mean ± std. dev. of 7 runs, 1 loop each)
187 ms ± 15.4 ms per loop (mean ± std. dev. of 7 runs, 10 loops each)
621 ms ± 52.4 ms per loop (mean ± std. dev. of 7 runs, 1 loop each)
333 ms ± 2.82 ms per loop (mean ± std. dev. of 7 runs, 1 loop each)
544 ms ± 2.8 ms per loop (mean ± std. dev. of 7 runs, 1 loop each)
with split
len(s) = 1100000, nbkeys 90 base, count, count_count, except, collections.Counter
141 ms ± 922 µs per loop (mean ± std. dev. of 7 runs, 10 loops each)
153 ms ± 28.6 ms per loop (mean ± std. dev. of 7 runs, 10 loops each)
1.84 s ± 201 ms per loop (mean ± std. dev. of 7 runs, 1 loop each)
122 ms ± 4.97 ms per loop (mean ± std. dev. of 7 runs, 10 loops each)
75.8 ms ± 552 µs per loop (mean ± std. dev. of 7 runs, 10 loops each)
591 ms ± 34.2 ms per loop (mean ± std. dev. of 7 runs, 1 loop each)


text="Las Vegas Overlook Loop is a 6.3 mile loop trail located near Las Vegas"

def extract_patterns(text, n=3):
    "extracts the patterns of size n from text and return it"
    pat = [text[i:i+n] for i in range(len(text)-n+1)]
    return pat

def guess(prefix, count):
    "complete the prefix with the most probable pattern (according to count)"
    # get all the pattern in keys of count that starts with prefix
    # compat_prefix = DIY
    
    # find among the compatible prefixes the one wich score best according to count
    best_prefix = "?"
    return best_prefix

patterns = extract_patterns(text)
print("patterns = ", patterns)
patterns_count = count_elem(patterns)
print("patterns_counts = ", patterns_count)

print("guess for oo = ", guess("oo", patterns_count))
print("guess for eg = ", guess("eg", patterns_count))

patterns =  ['Las', 'as ', 's V', ' Ve', 'Veg', 'ega', 'gas', 'as ', 's O', ' Ov', 'Ove', 'ver', 'erl', 'rlo', 'loo', 'ook', 'ok ', 'k L', ' Lo', 'Loo', 'oop', 'op ', 'p i', ' is', 'is ', 's a', ' a ', 'a 6', ' 6.', '6.3', '.3 ', '3 m', ' mi', 'mil', 'ile', 'le ', 'e l', ' lo', 'loo', 'oop', 'op ', 'p t', ' tr', 'tra', 'rai', 'ail', 'il ', 'l l', ' lo', 'loc', 'oca', 'cat', 'ate', 'ted', 'ed ', 'd n', ' ne', 'nea', 'ear', 'ar ', 'r L', ' La', 'Las', 'as ', 's V', ' Ve', 'Veg', 'ega', 'gas']
patterns_counts =  {'Las': 2, 'as ': 3, 's V': 2, ' Ve': 2, 'Veg': 2, 'ega': 2, 'gas': 2, 's O': 1, ' Ov': 1, 'Ove': 1, 'ver': 1, 'erl': 1, 'rlo': 1, 'loo': 2, 'ook': 1, 'ok ': 1, 'k L': 1, ' Lo': 1, 'Loo': 1, 'oop': 2, 'op ': 2, 'p i': 1, ' is': 1, 'is ': 1, 's a': 1, ' a ': 1, 'a 6': 1, ' 6.': 1, '6.3': 1, '.3 ': 1, '3 m': 1, ' mi': 1, 'mil': 1, 'ile': 1, 'le ': 1, 'e l': 1, ' lo': 2, 'p t': 1, ' tr': 1, 'tra': 1, 'rai': 1, 'ail': 1, 'il ': 1, 'l l': 1, 'loc': 1, 'oca': 1, 'cat': 1, 'ate': 1, 'ted': 1, 'ed ': 1, 'd n': 1, ' ne': 1, 'nea': 1, 'ear': 1, 'ar ': 1, 'r L': 1, ' La': 1}
guess for oo =  ?
guess for eg =  ?


text="Las Vegas Overlook Loop is a 6.3 mile loop trail located near Las Vegas"

def extract_patterns(text, n=3):
    pat = [text[i:i+n] for i in range(len(text)-n+1)]
    return pat

def guess(prefix, count):
    "complete the prefix with the most probable pattern (according to count)"
    # get all the pattern in keys of count that starts with prefix
    compatibles_prefixes = [x for x in count.keys() if x.startswith(prefix)]
    if len(compatibles_prefixes) == 0:
        return None
    best_prefix = compatibles_prefixes[0]
    best_score = count[best_prefix]
    for pref in compatibles_prefixes[1:]:
        if best_score < count[best_prefix]:
            best_score = count[pref]
            best_prefix = pref
    return best_prefix

patterns = extract_patterns(text)
print("patterns = ", patterns)
patterns_count = count_elem(patterns)
print("patterns_counts = ", patterns_count)

print("guess for oo = ", guess("oo", patterns_count))
print("guess for eg = ", guess("eg", patterns_count))

patterns =  ['Las', 'as ', 's V', ' Ve', 'Veg', 'ega', 'gas', 'as ', 's O', ' Ov', 'Ove', 'ver', 'erl', 'rlo', 'loo', 'ook', 'ok ', 'k L', ' Lo', 'Loo', 'oop', 'op ', 'p i', ' is', 'is ', 's a', ' a ', 'a 6', ' 6.', '6.3', '.3 ', '3 m', ' mi', 'mil', 'ile', 'le ', 'e l', ' lo', 'loo', 'oop', 'op ', 'p t', ' tr', 'tra', 'rai', 'ail', 'il ', 'l l', ' lo', 'loc', 'oca', 'cat', 'ate', 'ted', 'ed ', 'd n', ' ne', 'nea', 'ear', 'ar ', 'r L', ' La', 'Las', 'as ', 's V', ' Ve', 'Veg', 'ega', 'gas']
patterns_counts =  {'Las': 2, 'as ': 3, 's V': 2, ' Ve': 2, 'Veg': 2, 'ega': 2, 'gas': 2, 's O': 1, ' Ov': 1, 'Ove': 1, 'ver': 1, 'erl': 1, 'rlo': 1, 'loo': 2, 'ook': 1, 'ok ': 1, 'k L': 1, ' Lo': 1, 'Loo': 1, 'oop': 2, 'op ': 2, 'p i': 1, ' is': 1, 'is ': 1, 's a': 1, ' a ': 1, 'a 6': 1, ' 6.': 1, '6.3': 1, '.3 ': 1, '3 m': 1, ' mi': 1, 'mil': 1, 'ile': 1, 'le ': 1, 'e l': 1, ' lo': 2, 'p t': 1, ' tr': 1, 'tra': 1, 'rai': 1, 'ail': 1, 'il ': 1, 'l l': 1, 'loc': 1, 'oca': 1, 'cat': 1, 'ate': 1, 'ted': 1, 'ed ': 1, 'd n': 1, ' ne': 1, 'nea': 1, 'ear': 1, 'ar ': 1, 'r L': 1, ' La': 1}
guess for oo =  ook
guess for eg =  ega


text="Las Vegas Overlook Loop is a 6.3 mile loop trail located near Las Vegas"

def extract_patterns(text, n=3):
    pat = [text[i:i+n] for i in range(len(text)-n+1)]
    return pat

def guess(prefix, count):
    "complete the prefix with the most probable pattern (according to count)"
    # get all the pattern in keys of count that starts with prefix
    compat_prefix = [(x, count[x]) for x in count.keys() if x.startswith(prefix)]
    ordered_compat_pref = sorted(compat_prefix, key=lambda x: x[1], 
                                 reverse=True)
    return ordered_compat_pref

patterns = extract_patterns(text)
print("patterns = ", patterns)
patterns_count = count_elem(patterns)
print("patterns_counts = ", patterns_count)

print("guess for oo = ", guess("oo", patterns_count))
print("guess for eg = ", guess("eg", patterns_count))

patterns =  ['Las', 'as ', 's V', ' Ve', 'Veg', 'ega', 'gas', 'as ', 's O', ' Ov', 'Ove', 'ver', 'erl', 'rlo', 'loo', 'ook', 'ok ', 'k L', ' Lo', 'Loo', 'oop', 'op ', 'p i', ' is', 'is ', 's a', ' a ', 'a 6', ' 6.', '6.3', '.3 ', '3 m', ' mi', 'mil', 'ile', 'le ', 'e l', ' lo', 'loo', 'oop', 'op ', 'p t', ' tr', 'tra', 'rai', 'ail', 'il ', 'l l', ' lo', 'loc', 'oca', 'cat', 'ate', 'ted', 'ed ', 'd n', ' ne', 'nea', 'ear', 'ar ', 'r L', ' La', 'Las', 'as ', 's V', ' Ve', 'Veg', 'ega', 'gas']
patterns_counts =  {'Las': 2, 'as ': 3, 's V': 2, ' Ve': 2, 'Veg': 2, 'ega': 2, 'gas': 2, 's O': 1, ' Ov': 1, 'Ove': 1, 'ver': 1, 'erl': 1, 'rlo': 1, 'loo': 2, 'ook': 1, 'ok ': 1, 'k L': 1, ' Lo': 1, 'Loo': 1, 'oop': 2, 'op ': 2, 'p i': 1, ' is': 1, 'is ': 1, 's a': 1, ' a ': 1, 'a 6': 1, ' 6.': 1, '6.3': 1, '.3 ': 1, '3 m': 1, ' mi': 1, 'mil': 1, 'ile': 1, 'le ': 1, 'e l': 1, ' lo': 2, 'p t': 1, ' tr': 1, 'tra': 1, 'rai': 1, 'ail': 1, 'il ': 1, 'l l': 1, 'loc': 1, 'oca': 1, 'cat': 1, 'ate': 1, 'ted': 1, 'ed ': 1, 'd n': 1, ' ne': 1, 'nea': 1, 'ear': 1, 'ar ': 1, 'r L': 1, ' La': 1}
guess for oo =  [('oop', 2), ('ook', 1)]
guess for eg =  [('ega', 2)]

Python training UGA 2017¶

Data structures ¶

list: mutable sequence¶

list: mutable sequence¶

`list`: list comprehension¶

Do it yourself (advanced)¶

A possible solution¶

`tuple`: immutable sequence¶

`tuple`: immutable sequence¶

`set`: a hashtable¶

`set`: lookup¶

What is a hashtable?¶

DIY: back to the "find the removed element" problem¶

A possible solution :¶

Complexity :¶

Complexity of the "sum" solution :¶

`dict`: unordered set of key: value pairs¶

Dictionary creation¶

Adding/replacing an entry to an exisiting dict:¶

Get an existing entry¶

Tip: parallel between `dict` and `list`¶

`dict`: public methods¶

`dict`: different ways to loop over a dictionary¶

Do it yourself:¶

A possible solution:¶

Do it yourself : smart completion (advanced)¶

A possible solution¶

Python training UGA 2017¶

Data structures¶

list: mutable sequence¶

list: mutable sequence¶

list: list comprehension¶

Do it yourself (advanced)¶

A possible solution¶

tuple: immutable sequence¶

tuple: immutable sequence¶

set: a hashtable¶

set: lookup¶

What is a hashtable?¶

DIY: back to the "find the removed element" problem¶

A possible solution :¶

Complexity :¶

Complexity of the "sum" solution :¶

dict: unordered set of key: value pairs¶

Dictionary creation¶

Adding/replacing an entry to an exisiting dict:¶

Get an existing entry¶

Tip: parallel between dict and list¶

dict: public methods¶

dict: different ways to loop over a dictionary¶

Do it yourself:¶

A possible solution:¶

Do it yourself : smart completion (advanced)¶

A possible solution¶

Data structures ¶

`list`: list comprehension¶

`tuple`: immutable sequence¶

`tuple`: immutable sequence¶

`set`: a hashtable¶

`set`: lookup¶

`dict`: unordered set of key: value pairs¶

Tip: parallel between `dict` and `list`¶

`dict`: public methods¶

`dict`: different ways to loop over a dictionary¶