Python Training at VMWare Pune - Day 2¶

Dec 13-15, 2017 Vikrant Patil

These notes are available online at http://notes.pipal.in/2017/vmware-nov-python

problem:

Write a csvparser which parses data written in CSV format and loads it into memory as a 2-dimensional list.

def csvparser(filename):
    """Parse a comma-separated file into a list of rows.

    Each row is the list of fields of one line, split on ",". The line's
    trailing newline is not removed, so it stays attached to the last
    field of every row.
    """
    # The ``with`` block closes the file as soon as the rows are built
    # instead of leaving the open handle to the garbage collector.
    with open(filename) as fhandle:
        return [line.split(",") for line in fhandle]

csvparser("data1.csv")

[['A1', 'B1', 'C1\n'],
 ['A2', 'B2', 'C2\n'],
 ['A3', 'B3', 'C3\n'],
 ['A4', 'B4', 'C4\n']]

with statement¶

with open("numbers.txt", "a") as f:
    f.write("ten\n")
    f.write("nine\n")

import cat
cat.cat(["numbers.txt"])

one
two
three
four
five
six
ten
nine
ten
nine

Let's make our parsers and writers generic

def genericparser(file, delimiter=","):
    """Parse a delimited text file into a list of rows.

    file      -- path of the file to read
    delimiter -- string that separates the fields on each line

    Returns a list with one entry per line, each entry being the list of
    field strings of that line. Only the trailing newline is removed from
    a line, so empty fields at the start or end of a row are kept even
    when the delimiter is itself whitespace (for example a tab).
    """
    # The ``with`` block guarantees the file is closed once it is read.
    with open(file) as fhandle:
        return [line.rstrip("\n").split(delimiter) for line in fhandle]

def genericwriter(data, filename, delimiter=","):
    """Write rows of strings to *filename*, one delimited line per row.

    data      -- iterable of rows, each row an iterable of strings
    filename  -- path of the file to (over)write
    delimiter -- string placed between the fields of a row
    """
    with open(filename, "w") as out:
        out.writelines(delimiter.join(fields) + "\n" for fields in data)

data = [[str(i*j) for i in range(1,11)] for j in range(1,6)]

data

[['1', '2', '3', '4', '5', '6', '7', '8', '9', '10'],
 ['2', '4', '6', '8', '10', '12', '14', '16', '18', '20'],
 ['3', '6', '9', '12', '15', '18', '21', '24', '27', '30'],
 ['4', '8', '12', '16', '20', '24', '28', '32', '36', '40'],
 ['5', '10', '15', '20', '25', '30', '35', '40', '45', '50']]

genericwriter(data, "tables.tsv", delimiter="\t")

!python cat.py tables.tsv

1	2	3	4	5	6	7	8	9	10
2	4	6	8	10	12	14	16	18	20
3	6	9	12	15	18	21	24	27	30
4	8	12	16	20	24	28	32	36	40
5	10	15	20	25	30	35	40	45	50

how do you transpose data?

data[0] # 0th row

['1', '2', '3', '4', '5', '6', '7', '8', '9', '10']

data[0][0] # item from 0th row and 0th column

'1'

#data[rownumber][columnnumber]

[data[rownumber][0] for rownumber in range(len(data))]

['1', '2', '3', '4', '5']

[data[rownumber][1] for rownumber in range(len(data))]

['2', '4', '6', '8', '10']

rows = len(data)

cols = len(data[0])

data

[['1', '2', '3', '4', '5', '6', '7', '8', '9', '10'],
 ['2', '4', '6', '8', '10', '12', '14', '16', '18', '20'],
 ['3', '6', '9', '12', '15', '18', '21', '24', '27', '30'],
 ['4', '8', '12', '16', '20', '24', '28', '32', '36', '40'],
 ['5', '10', '15', '20', '25', '30', '35', '40', '45', '50']]

[data[rownum][0] for rownum in range(rows)]

['1', '2', '3', '4', '5']

[data[rownum][1] for rownum in range(rows)]

['2', '4', '6', '8', '10']

[[data[rownum][colnum] for rownum in range(rows)]  for colnum in range(cols) ]

[['1', '2', '3', '4', '5'],
 ['2', '4', '6', '8', '10'],
 ['3', '6', '9', '12', '15'],
 ['4', '8', '12', '16', '20'],
 ['5', '10', '15', '20', '25'],
 ['6', '12', '18', '24', '30'],
 ['7', '14', '21', '28', '35'],
 ['8', '16', '24', '32', '40'],
 ['9', '18', '27', '36', '45'],
 ['10', '20', '30', '40', '50']]

def transpose(data):
    """Return the transpose of a 2 dimensional list.

    Row ``i`` of the result holds item ``i`` of every row of ``data``.
    The number of columns is taken from the first row. An empty ``data``
    has no first row to measure, so it transposes to an empty list.
    """
    if not data:
        return []
    cols = len(data[0])
    return [[row[colnum] for row in data] for colnum in range(cols)]

genericwriter(transpose(data), "tables.tsv", delimiter="\t")

!python cat.py tables.tsv

1	2	3	4	5
2	4	6	8	10
3	6	9	12	15
4	8	12	16	20
5	10	15	20	25
6	12	18	24	30
7	14	21	28	35
8	16	24	32	40
9	18	27	36	45
10	20	30	40	50

genericparser("tables.tsv", delimiter="\t")

[['1', '2', '3', '4', '5'],
 ['2', '4', '6', '8', '10'],
 ['3', '6', '9', '12', '15'],
 ['4', '8', '12', '16', '20'],
 ['5', '10', '15', '20', '25'],
 ['6', '12', '18', '24', '30'],
 ['7', '14', '21', '28', '35'],
 ['8', '16', '24', '32', '40'],
 ['9', '18', '27', '36', '45'],
 ['10', '20', '30', '40', '50']]

csvparser = lambda filename: genericparser(filename, delimiter=",")

csvparser("data1.csv")

[['A1', 'B1', 'C1'],
 ['A2', 'B2', 'C2'],
 ['A3', 'B3', 'C3'],
 ['A4', 'B4', 'C4']]

def csvparser(filename):
    """Parse a comma-separated file by delegating to genericparser."""
    rows = genericparser(filename, delimiter=",")
    return rows

Writing to standard error and output¶

import sys

sys.stdout.write("Hello this is just output!")

Hello this is just output!

sys.stderr.write("Something went wrong !!")

Something went wrong !!

Dictionaries¶

person = {"name":"lewis carrol",
         "books":["ALice in wonderland", "Looking through the glass"],
         "language":"English"}

person['name']

'lewis carrol'

person['name'] = "lewis"

person

{'books': ['ALice in wonderland', 'Looking through the glass'],
 'language': 'English',
 'name': 'lewis'}

del person['language']

person

{'books': ['ALice in wonderland', 'Looking through the glass'],
 'name': 'lewis'}

person['language']

---------------------------------------------------------------------------
KeyError                                  Traceback (most recent call last)
<ipython-input-54-808e22d5936d> in <module>()
----> 1 person['language']

KeyError: 'language'

person.get("language", "english")

'english'

person.get("name", "unknown")

'lewis'

person['books'][0]

'ALice in wonderland'

person['books'][1]

'Looking through the glass'

grub conf on my laptop looks like this

!python cat.py /etc/default/grub

# If you change this file, run 'update-grub' afterwards to update
# /boot/grub/grub.cfg.
# For full documentation of the options in this file, see:
#   info -f grub -n 'Simple configuration'

GRUB_DEFAULT=0
GRUB_HIDDEN_TIMEOUT=0
GRUB_HIDDEN_TIMEOUT_QUIET=true
GRUB_TIMEOUT=10
GRUB_DISTRIBUTOR=`lsb_release -i -s 2> /dev/null || echo Debian`
GRUB_CMDLINE_LINUX_DEFAULT="quiet splash"
GRUB_CMDLINE_LINUX=""

# Uncomment to enable BadRAM filtering, modify to suit your needs
# This works with Linux (no patch required) and with any kernel that obtains
# the memory map information from GRUB (GNU Mach, kernel of FreeBSD ...)
#GRUB_BADRAM="0x01234567,0xfefefefe,0x89abcdef,0xefefefef"

# Uncomment to disable graphical terminal (grub-pc only)
#GRUB_TERMINAL=console

# The resolution used on graphical terminal
# note that you can use only modes which your graphic card supports via VBE
# you can see them in real GRUB with the command `vbeinfo'
#GRUB_GFXMODE=640x480

# Uncomment if you don't want GRUB to pass "root=UUID=xxx" parameter to Linux
#GRUB_DISABLE_LINUX_UUID=true

# Uncomment to disable generation of recovery mode menu entries
#GRUB_DISABLE_RECOVERY="true"

# Uncomment to get a beep at grub start
#GRUB_INIT_TUNE="480 440 1"

Example : parse conf file and load as dictionary¶

def confreader(file):
    """Load a ``KEY=VALUE`` style configuration file into a dictionary.

    Blank lines and comment lines (first non-blank character ``#``) are
    skipped. Every other line is split at its first ``=``: the text
    before it is the key and everything after it, further ``=``
    characters included, is the value. A line without ``=`` maps to an
    empty string.
    """
    data = {}
    # The ``with`` block closes the file once it has been read.
    with open(file) as fhandle:
        for line in fhandle:
            line = line.strip()
            # Test the stripped line so indented comments are skipped too.
            if not line or line.startswith("#"):
                continue
            # partition() cuts at the first "=" only, so a value such as
            # "root=UUID=xxx" keeps its own "=" characters.
            key, _, value = line.partition("=")
            data[key] = value
    return data

confreader("/etc/default/grub")

{'GRUB_CMDLINE_LINUX': '""',
 'GRUB_CMDLINE_LINUX_DEFAULT': '"quiet splash"',
 'GRUB_DEFAULT': '0',
 'GRUB_DISTRIBUTOR': '`lsb_release -i -s 2> /dev/null || echo Debian`',
 'GRUB_HIDDEN_TIMEOUT': '0',
 'GRUB_HIDDEN_TIMEOUT_QUIET': 'true',
 'GRUB_TIMEOUT': '10'}

confdata = confreader("/etc/default/grub")

confdata['GRUB_CMDLINE_LINUX_DEFAULT']

'"quiet splash"'

digits = [("one",1), ("two",2), ("three",3)]

dict(digits)

{'one': 1, 'three': 3, 'two': 2}

names = ["Anand", "Nouful", "David", "Lewis", "Ronbinson"]
place = ["India", "India", "USA", "UK", "USA"]

d = dict(zip(names, place))

Iterating over dictionaries¶

for item in d:
    print(item)

Anand
Nouful
David
Lewis
Ronbinson

for key in d.keys():
    print(key, d[key])

Anand India
Nouful India
David USA
Lewis UK
Ronbinson USA

for value in d.values():
    print(value)

India
India
USA
UK
USA

for key,value in d.items():
    print(key, value)

Anand India
Nouful India
David USA
Lewis UK
Ronbinson USA

items = ["Pencil", "Colorbox", "Pen", "Eraser"]
prices = [10, 25, 12, 5]

cart = dict(zip(items, prices))

cart

{'Colorbox': 25, 'Eraser': 5, 'Pen': 12, 'Pencil': 10}

for item, price in cart.items():
    print(item.rjust(10), price)
print("-"*20)
print("Total".rjust(10), sum(cart.values()))

    Pencil 10
  Colorbox 25
       Pen 12
    Eraser 5
--------------------
     Total 52

problem :

Write a program to count the frequency of words in a given file

%%file words.txt
one
one two
one two three
one two three four
one two three four five
one two three four five six
six seven eight nine ten
seven eight nine ten
eight nine ten
nine ten
ten

Overwriting words.txt

d

{'Anand': 'India',
 'David': 'USA',
 'Lewis': 'UK',
 'Nouful': 'India',
 'Ronbinson': 'USA'}

"alice" in ["alice", "alex"]

True

"Anand" in d

True

"Anand" in d.keys()

True

"India" in d.values()

True

def getwords(filename):
    """Return every whitespace-separated word of the file as a list."""
    # The ``with`` block closes the file right after it is read instead of
    # leaving the open handle to the garbage collector.
    with open(filename) as fhandle:
        return fhandle.read().split()

words = getwords("words.txt")

words

['one',
 'one',
 'two',
 'one',
 'two',
 'three',
 'one',
 'two',
 'three',
 'four',
 'one',
 'two',
 'three',
 'four',
 'five',
 'one',
 'two',
 'three',
 'four',
 'five',
 'six',
 'six',
 'seven',
 'eight',
 'nine',
 'ten',
 'seven',
 'eight',
 'nine',
 'ten',
 'eight',
 'nine',
 'ten',
 'nine',
 'ten',
 'ten']

def wordfreq(words):
    """Count how many times each word occurs in ``words``.

    Returns a dictionary mapping each distinct word to its count.
    """
    counts = {}
    for token in words:
        try:
            counts[token] += 1
        except KeyError:
            # First time this word is seen.
            counts[token] = 1
    return counts

wordfreq(words)

{'eight': 3,
 'five': 2,
 'four': 3,
 'nine': 4,
 'one': 6,
 'seven': 2,
 'six': 2,
 'ten': 5,
 'three': 4,
 'two': 5}

def wordfreq1(words):
    """Count word occurrences, using dict.get to supply the initial zero."""
    tally = {}
    for word in words:
        seen_so_far = tally.get(word, 0)
        tally[word] = seen_so_far + 1
    return tally

wordfreq1(words)

{'eight': 3,
 'five': 2,
 'four': 3,
 'nine': 4,
 'one': 6,
 'seven': 2,
 'six': 2,
 'ten': 5,
 'three': 4,
 'two': 5}

def wordfreq2(words):
    """Count word occurrences by calling ``words.count`` once per distinct word."""
    return {w: words.count(w) for w in set(words)}

def wordfreq3(words):
    """Count word occurrences by zero-initialising every key first.

    ``words`` may be any iterable of hashable items. It is materialised
    once so that it can be walked twice: once to create the keys and once
    to count.
    """
    words = list(words)
    # fromkeys shares the single 0 between keys; that is safe because
    # ``+=`` on an int rebinds the entry rather than mutating the object.
    freq = dict.fromkeys(words, 0)
    for w in words:
        freq[w] += 1
    return freq

wordfreq3(words)

{'eight': 3,
 'five': 2,
 'four': 3,
 'nine': 4,
 'one': 6,
 'seven': 2,
 'six': 2,
 'ten': 5,
 'three': 4,
 'two': 5}

freq = wordfreq3(words)

for key in freq:
    print(key, freq[key])

one 6
two 5
three 4
four 3
five 2
six 2
seven 2
eight 3
nine 4
ten 5

for key in sorted(freq):
    print(key, freq[key])

eight 3
five 2
four 3
nine 4
one 6
seven 2
six 2
ten 5
three 4
two 5

for key in sorted(freq, key=lambda k:freq[k]):
    print(key, freq[key])

five 2
six 2
seven 2
four 3
eight 3
three 4
nine 4
two 5
ten 5
one 6

for key in sorted(freq, key=lambda k:freq[k], reverse=True):
    print(key, freq[key])

one 6
two 5
ten 5
three 4
nine 4
four 3
eight 3
five 2
six 2
seven 2

for key in sorted(freq, key=lambda k:freq[k], reverse=True):
    print(key.rjust(6), "*"*freq[key])

   one ******
   two *****
   ten *****
 three ****
  nine ****
  four ***
 eight ***
  five **
   six **
 seven **

d

{'Anand': 'India',
 'David': 'USA',
 'Lewis': 'UK',
 'Nouful': 'India',
 'Ronbinson': 'USA'}

[ name for name,place in d.items() if place=="India"]

['Anand', 'Nouful']

[ name for name,place in d.items() if place=="USA"]

['David', 'Ronbinson']

Pitfalls¶

x = [1,2,3,4]
y = x
y.append(5)
print(x)

[1, 2, 3, 4, 5]

x = [1,2,3,4,5]
y = x
x = [1,2,3]
print(y)

[1, 2, 3, 4, 5]

d.keys()

dict_keys(['Anand', 'Nouful', 'David', 'Lewis', 'Ronbinson'])

d.values()

dict_values(['India', 'India', 'USA', 'UK', 'USA'])

def unzip(data):
    """Split a dictionary into two parallel lists.

    Returns ``(keys, values)`` where ``values[i]`` is ``data[keys[i]]``.
    """
    keys, values = [], []
    for k in data.keys():
        keys.append(k)
        values.append(data[k])
    return keys, values

unzip(d)

(['Anand', 'Nouful', 'David', 'Lewis', 'Ronbinson'],
 ['India', 'India', 'USA', 'UK', 'USA'])

Classes¶

class Complex:
    """Complex number kept as separate real and imaginary parts."""

    def __init__(self, real, imag):
        self.real, self.imag = real, imag

    def get_real(self):
        """Return the real part."""
        return self.real

    def get_imag(self):
        """Return the imaginary part."""
        return self.imag

    def display(self):
        """Print the number in the form ``<real> + <imag>j``."""
        imag_text = str(self.imag) + "j"
        print(self.real, "+", imag_text)

    def add(self, c):
        """Placeholder: does nothing yet and returns None."""
        return None

Complex

__main__.Complex

print(Complex)

<class '__main__.Complex'>

c1 = Complex(2,3)

c1

<__main__.Complex at 0x7f778005ec18>

c1.get_imag()

3

c1.get_real()

2

c1.display()

2 + 3j

isinstance(c1, Complex)

True

class Complex:
    """Complex number kept as separate real and imaginary parts."""

    def __init__(self, real, imag):
        self.real = real
        self.imag = imag

    def get_real(self):
        """Return the real part."""
        return self.real

    def get_imag(self):
        """Return the imaginary part."""
        return self.imag

    def display(self):
        """Print the number as ``<real> + <imag>j``, or ``-`` for a negative imag."""
        # Fold a negative imaginary part into the sign so that 1, -2 is
        # shown as "1 - 2j" rather than "1 + -2j".
        sign = "-" if self.imag < 0 else "+"
        print(self.real, sign, str(abs(self.imag)) + "j")

    def add(self, c):
        """Return a new Complex that is the sum of this number and ``c``."""
        return Complex(self.real + c.real, self.imag + c.imag)

    def double(self):
        """Return a new Complex with both parts doubled."""
        return Complex(2 * self.real, 2 * self.imag)

c = Complex(1,2)

c2 = c.double()

c2.display()

2 + 4j

c.display()

1 + 2j

c3 = c.add(c2)

c3.display()

3 + 6j

Why classes?¶

%%file module1.py
"""Tiny module whose functions read the module-level name ``x``."""
x = 10


def getx():
    """Return the current value of the module-level ``x``."""
    return x


def getdouble():
    """Return twice the current value of the module-level ``x``."""
    doubled = 2 * x
    return doubled

Overwriting module1.py

%%file module2.py
"""Same functions as module1, but each one announces itself when called."""
x = 10


def getx():
    """Print a marker line, then return the module-level ``x``."""
    print("from module2")
    return x


def getdouble():
    """Print a marker line, then return twice the module-level ``x``."""
    print("from module2")
    doubled = 2 * x
    return doubled

Writing module2.py

import module1

import module2

module1.x

10

module2.x

10

module2.x = 20

module2.getx()

from module2

20

%%file bank0.py
# Module-level balance: the one piece of account state shared by every caller.
balance = 0

def get_balance():
    # Only reads the module-level balance, so no ``global`` statement is needed.
    return balance

def withdraw(amount):
    # Rebinds the module-level balance, hence the ``global`` statement.
    global balance
    balance = balance - amount
    
def deposite(amount):
    # Rebinds the module-level balance as well, so ``global`` is needed again.
    global balance
    balance += amount
    
if __name__ == "__main__":
    # Demo run: print the balance after a deposit, then after a withdrawal.
    deposite(100)
    print(get_balance())
    withdraw(20)
    print(get_balance())

Writing bank0.py

!python bank0.py

100
80

%%file bank1.py

def create_account():
    """Return a new account: a dictionary holding a zero balance."""
    account = {"balance": 0}
    return account


def get_balance(account):
    """Return the balance stored in ``account``."""
    return account['balance']


def withdraw(account, amount):
    """Subtract ``amount`` from the balance stored in ``account``."""
    account['balance'] = account['balance'] - amount


def deposit(account, amount):
    """Add ``amount`` to the balance stored in ``account``."""
    account['balance'] = account['balance'] + amount


if __name__ == "__main__":
    # Two independent accounts: each dictionary carries its own state.
    a1, a2 = create_account(), create_account()
    labelled = (("a1", a1), ("a2", a2))

    deposit(a1, 100)
    deposit(a2, 200)
    for label, account in labelled:
        print(label + " : ", get_balance(account))

    withdraw(a1, 10)
    withdraw(a2, 20)
    for label, account in labelled:
        print(label + " : ", get_balance(account))

Writing bank1.py

!python bank1.py

a1 :  100
a2 :  200
a1 :  90
a2 :  180

%%file bank2.py

class BankAccount:
    """Bank account that keeps its own running balance."""

    def __init__(self):
        self.balance = 0

    def get_balance(self):
        """Return the current balance."""
        return self.balance

    def deposit(self, amount):
        """Add ``amount`` to the balance."""
        self.balance = self.balance + amount

    def withdraw(self, amount):
        """Subtract ``amount`` from the balance."""
        self.balance = self.balance - amount


if __name__ == "__main__":
    # Two instances, each carrying its own balance.
    a1, a2 = BankAccount(), BankAccount()
    labelled = (("a1", a1), ("a2", a2))

    a1.deposit(100)
    a2.deposit(200)
    for label, account in labelled:
        print(label + " : ", account.get_balance())

    a1.withdraw(10)
    a2.withdraw(20)
    for label, account in labelled:
        print(label + " : ", account.get_balance())

Overwriting bank2.py

!python bank2.py

a1 :  100
a2 :  200
a1 :  90
a2 :  180

class Point:
    """Point with ``x`` and ``y`` stored as ordinary instance attributes."""

    def __init__(self, x, y):
        self.x, self.y = x, y

p = Point(1, 2)

p.x

1

p.y

2

p.z = 3

p.z

3

p.x

1

p.y

2

p.__dict__

{'x': 1, 'y': 2, 'z': 3}

# Point subclass that adds a colour. It defines no __init__ of its own, so
# instances are created with Point's (x, y) arguments.
class ColoredPoint(Point):
    # Class attribute: it lives in the class's __dict__, not in each
    # instance's __dict__, and instances reach it through attribute lookup.
    color = (0,0,0) #rgb

cp = ColoredPoint(2, 3)

cp.color

(0, 0, 0)

cp.x

2

cp.y

3

cp.__dict__

{'x': 2, 'y': 3}

type(ColoredPoint)

type

type(cp)

__main__.ColoredPoint

ColoredPoint.__dict__

mappingproxy({'__doc__': None, '__module__': '__main__', 'color': (0, 0, 0)})

cp.__dict__

{'x': 2, 'y': 3}

problem:

Write a class Timer which can be used to time a task. It should work as shown below. **hint: use time.time() to get a timestamp**
```
t = Timer()
t.start()
do some stuff (maybe a loop with some calculations)
t.stop()
print(t.get_time_taken())
```

import time

time.time()

1513321010.1740944

import time

class Timer:
    """Stopwatch for timing a task, based on time.time().

    Call start() before the task and stop() after it; get_time_taken()
    then returns the seconds between the two calls. If it is called while
    the timer is still running it returns the seconds elapsed so far.
    """

    def __init__(self):
        self._start = 0
        self._end = 0
        # True between start() and the matching stop().
        self._running = False

    def start(self):
        """Record the starting timestamp and mark the timer as running."""
        self._running = True
        self._start = time.time()

    def stop(self):
        """Record the ending timestamp and mark the timer as stopped."""
        self._end = time.time()
        self._running = False

    def get_time_taken(self):
        """Return the measured time in seconds (0 if never started)."""
        if self._running:
            # No valid end timestamp yet: _end is either the initial 0 or
            # left over from an earlier run, which would give a negative
            # result. Measure against the current time instead.
            return time.time() - self._start
        return self._end - self._start

t = Timer()
t.start()
s = 0
for i in range(1000):
    for j in range(10000):
        s += i*j*1.0
t.stop()
print("{0:.3f}".format(t.get_time_taken()))

2.875

Exceptions¶

x + 2

---------------------------------------------------------------------------
TypeError                                 Traceback (most recent call last)
<ipython-input-194-d693fb1bd54c> in <module>()
----> 1 x + 2

TypeError: can only concatenate list (not "int") to list

2 + "3"

---------------------------------------------------------------------------
TypeError                                 Traceback (most recent call last)
<ipython-input-195-2068cae7beb7> in <module>()
----> 1 2 + "3"

TypeError: unsupported operand type(s) for +: 'int' and 'str'

doom

---------------------------------------------------------------------------
NameError                                 Traceback (most recent call last)
<ipython-input-196-301636d58674> in <module>()
----> 1 doom

NameError: name 'doom' is not defined

int("hello")

---------------------------------------------------------------------------
ValueError                                Traceback (most recent call last)
<ipython-input-197-045de671ab8a> in <module>()
----> 1 int("hello")

ValueError: invalid literal for int() with base 10: 'hello'

try:
    a = int("dfdf")
except ValueError as e:
    print("Handled ValueError", e)
    a = 0

Handled ValueError invalid literal for int() with base 10: 'dfdf'

a

0

%%file missing.csv
1,2,3,4,5,Nan
1,2,3,4,5,6
1,,3,2,4,5
Nan,1,1,1,1,1

Overwriting missing.csv

csvparser("missing.csv")

[['1', '2', '3', '4', '5', 'Nan'],
 ['1', '2', '3', '4', '5', '6'],
 ['1', '', '3', '2', '4', '5'],
 ['Nan', '1', '1', '1', '1', '1']]

def parsenumerccsv(filename):  # parse a comma-separated file of integers into a list of rows
    data = []
    for line in open(filename):
        items = line.strip().split(",")
        data.append([int(i) for i in items])  # int() raises ValueError on any field that is not an integer
    return data

parsenumerccsv("missing.csv")

---------------------------------------------------------------------------
ValueError                                Traceback (most recent call last)
<ipython-input-204-e7497688da74> in <module>()
----> 1 parsenumerccsv("missing.csv")

<ipython-input-203-6b54f33a74c4> in parsenumerccsv(filename)
      3     for line in open(filename):
      4         items = line.strip().split(",")
----> 5         data.append([int(i) for i in items])
      6     return data

<ipython-input-203-6b54f33a74c4> in <listcomp>(.0)
      3     for line in open(filename):
      4         items = line.strip().split(",")
----> 5         data.append([int(i) for i in items])
      6     return data

ValueError: invalid literal for int() with base 10: 'Nan'

def parsenumerccsv(filename):
    """Parse a comma-separated file of integers into a list of rows.

    Fields that cannot be converted with int() (for example ``Nan`` or an
    empty field) are replaced by 0 instead of aborting the whole parse.
    """
    def parseint(s):
        # Best-effort conversion: unparsable text counts as 0.
        try:
            return int(s)
        except ValueError:
            return 0

    # The ``with`` block closes the file once every line has been parsed.
    with open(filename) as fhandle:
        return [[parseint(item) for item in line.strip().split(",")]
                for line in fhandle]

parsenumerccsv("missing.csv")

[[1, 2, 3, 4, 5, 0],
 [1, 2, 3, 4, 5, 6],
 [1, 0, 3, 2, 4, 5],
 [0, 1, 1, 1, 1, 1]]

try:
    x = int(s)
except ValueError as v:
    pass
except NameError as n:
    pass
except TypeError as t:
    pass

Commandline applications¶

%%file grep.py
import argparse


def parse_args():
    """Parse the command line: two positional arguments, pattern and filename."""
    parser = argparse.ArgumentParser()
    positionals = (
        ("pattern", "pattern to be serched"),
        ("filename", "file in which pattern has to be searched"),
    )
    for name, description in positionals:
        parser.add_argument(name, type=str, help=description)
    return parser.parse_args()


if __name__ == "__main__":
    print(parse_args())

Writing grep.py

!python grep.py "def" bank2.py

Namespace(filename='bank2.py', pattern='def')

%%file grep.py
import argparse


def parse_args():
    """Parse the command line: two positional arguments, pattern and filename."""
    parser = argparse.ArgumentParser()
    parser.add_argument("pattern",
                        type=str,
                        help="pattern to be serched")
    parser.add_argument("filename",
                        type=str,
                        help="file in which pattern has to be searched")
    return parser.parse_args()


def grep(pattern, filename):
    """Print, stripped of surrounding whitespace, every line containing pattern."""
    # The ``with`` block closes the file even if printing fails part-way.
    with open(filename) as fhandle:
        for line in fhandle:
            if pattern in line:
                print(line.strip())


if __name__ == "__main__":
    args = parse_args()
    print(args)
    grep(args.pattern, args.filename)

Overwriting grep.py

!python grep.py def bank2.py

Namespace(filename='bank2.py', pattern='def')
def __init__(self):
def get_balance(self):
def deposit(self, amount):
def withdraw(self, amount):

!python grep.py --help

usage: grep.py [-h] pattern filename

positional arguments:
  pattern     pattern to be serched
  filename    file in which pattern has to be searched

optional arguments:
  -h, --help  show this help message and exit

%%file grep.py
import argparse


def parse_args():
    """Parse the command line: pattern, filename and the optional -v flag."""
    parser = argparse.ArgumentParser()
    parser.add_argument("pattern",
                        type=str,
                        help="pattern to be serched")
    parser.add_argument("filename",
                        type=str,
                        help="file in which pattern has to be searched")
    parser.add_argument("-v", "--invert_match",
                        action="store_true",
                        help="lines which do not have given pattern")

    return parser.parse_args()


def grep(pattern, filename):
    """Print, stripped of surrounding whitespace, every line containing pattern."""
    # The ``with`` block closes the file even if printing fails part-way.
    with open(filename) as fhandle:
        for line in fhandle:
            if pattern in line:
                print(line.strip())


def grep_invert(pattern, filename):
    """Print, stripped of surrounding whitespace, every line NOT containing pattern."""
    with open(filename) as fhandle:
        for line in fhandle:
            if pattern not in line:
                print(line.strip())


if __name__ == "__main__":
    args = parse_args()
    print(args)
    if args.invert_match:
        grep_invert(args.pattern, args.filename)
    else:
        grep(args.pattern, args.filename)

Overwriting grep.py

!python grep.py -h

usage: grep.py [-h] [-v] pattern filename

positional arguments:
  pattern             pattern to be serched
  filename            file in which pattern has to be searched

optional arguments:
  -h, --help          show this help message and exit
  -v, --invert_match  lines which do not have given pattern

!python grep.py -v balance bank0.py

Namespace(filename='bank0.py', invert_match=True, pattern='balance')


def withdraw(amount):

def deposite(amount):

if __name__ == "__main__":
deposite(100)
withdraw(20)

%%file grep.py
import argparse


def parse_args():
    """Parse the command line: pattern, filename, -v and -b options."""
    parser = argparse.ArgumentParser()
    parser.add_argument("pattern",
                        type=str,
                        help="pattern to be serched")
    parser.add_argument("filename",
                        type=str,
                        help="file in which pattern has to be searched")
    parser.add_argument("-v", "--invert_match",
                        action="store_true",
                        help="lines which do not have given pattern")
    # NOTE: --backcontext is only parsed at this stage; neither grep() nor
    # grep_invert() below uses its value yet.
    parser.add_argument("-b", "--backcontext",
                        type=int,
                        help="number of context lines to be printed")

    return parser.parse_args()


def grep(pattern, filename):
    """Print, stripped of surrounding whitespace, every line containing pattern."""
    # The ``with`` block closes the file even if printing fails part-way.
    with open(filename) as fhandle:
        for line in fhandle:
            if pattern in line:
                print(line.strip())


def grep_invert(pattern, filename):
    """Print, stripped of surrounding whitespace, every line NOT containing pattern."""
    with open(filename) as fhandle:
        for line in fhandle:
            if pattern not in line:
                print(line.strip())


if __name__ == "__main__":
    args = parse_args()
    print(args)
    if args.invert_match:
        grep_invert(args.pattern, args.filename)
    else:
        grep(args.pattern, args.filename)

Overwriting grep.py

!python grep.py -h

usage: grep.py [-h] [-v] [-b BACKCONTEXT] pattern filename

positional arguments:
  pattern               pattern to be serched
  filename              file in which pattern has to be searched

optional arguments:
  -h, --help            show this help message and exit
  -v, --invert_match    lines which do not have given pattern
  -b BACKCONTEXT, --backcontext BACKCONTEXT
                        number of context lines to be printed

!python grep.py -b 5 def bank0.py

Namespace(backcontext=5, filename='bank0.py', invert_match=False, pattern='def')
def get_balance():
def withdraw(amount):
def deposite(amount):

problem:

Write a command fib.py which takes two arguments. The first is the positional argument n; by default you should print the nth fibonacci number. The second is an optional boolean flag -s/--sequence; if the -s option is given, you should print the sequence of the first n fibonacci numbers instead.
```
python fib.py 3
2
python fib.py -s 6
1 1 2 3 5 8
```

Downloading stuff from internet¶

you can install requests library using

pip3 install requests

import requests

resp = requests.get("http://httpbin.org/get", params={"param1":1, "param2":"2"})

resp.status_code

200

resp.text[:50]

'{\n  "args": {\n    "param1": "1", \n    "param2": "2'

resp.text

'{\n  "args": {\n    "param1": "1", \n    "param2": "2"\n  }, \n  "headers": {\n    "Accept": "*/*", \n    "Accept-Encoding": "gzip, deflate", \n    "Connection": "close", \n    "Host": "httpbin.org", \n    "User-Agent": "python-requests/2.14.2"\n  }, \n  "origin": "42.107.68.185", \n  "url": "http://httpbin.org/get?param1=1&param2=2"\n}\n'

resp.json()

{'args': {'param1': '1', 'param2': '2'},
 'headers': {'Accept': '*/*',
  'Accept-Encoding': 'gzip, deflate',
  'Connection': 'close',
  'Host': 'httpbin.org',
  'User-Agent': 'python-requests/2.14.2'},
 'origin': '42.107.68.185',
 'url': 'http://httpbin.org/get?param1=1&param2=2'}

resp = requests.post("http://httpbin.org/post", data={"name":"python", "param":"hello"})

resp.json()

{'args': {},
 'data': '',
 'files': {},
 'form': {'name': 'python', 'param': 'hello'},
 'headers': {'Accept': '*/*',
  'Accept-Encoding': 'gzip, deflate',
  'Connection': 'close',
  'Content-Length': '23',
  'Content-Type': 'application/x-www-form-urlencoded',
  'Host': 'httpbin.org',
  'User-Agent': 'python-requests/2.14.2'},
 'json': None,
 'origin': '42.107.68.185',
 'url': 'http://httpbin.org/post'}

resp = requests.post("http://httpbin.org/post", data="Plain text data")

resp.json()

{'args': {},
 'data': 'Plain text data',
 'files': {},
 'form': {},
 'headers': {'Accept': '*/*',
  'Accept-Encoding': 'gzip, deflate',
  'Connection': 'close',
  'Content-Length': '15',
  'Host': 'httpbin.org',
  'User-Agent': 'python-requests/2.14.2'},
 'json': None,
 'origin': '42.107.68.185',
 'url': 'http://httpbin.org/post'}

resp = requests.post("http://httpbin.org/post", data=open("data1.csv"))

resp.json()

{'args': {},
 'data': 'A1,B1,C1\nA2,B2,C2\nA3,B3,C3\nA4,B4,C4\n',
 'files': {},
 'form': {},
 'headers': {'Accept': '*/*',
  'Accept-Encoding': 'gzip, deflate',
  'Connection': 'close',
  'Content-Length': '36',
  'Host': 'httpbin.org',
  'User-Agent': 'python-requests/2.14.2'},
 'json': None,
 'origin': '42.107.68.185',
 'url': 'http://httpbin.org/post'}

Example: Popular github repositories of vmware¶

url = "https://api.github.com/orgs/vmware/repos"

resp = requests.get(url)

repos = resp.json()

type(repos)

list

len(repos)

30

print(repos[0]['forks'])

4

for r in repos:
    print(r['name'], r['forks'])

pyvco 4
rvc 46
rbvmomi 153
vprobe-toolkit 9
CloudFS 16
vcd-nclient 2
lmock 5
FireBreath 2
weasel 1
vmware-vcenter 86
vmware-vshield 6
vcloud-rest 37
GemstoneWebTools 0
vmware-vcsa 17
vmware-vmware_lib 24
saml20serviceprovider 1
pg_rewind 18
vco-powershel-plugin 2
jenkins-reviewbot 12
dbeekeeper 0
thinapp_factory 16
vmware-cassandra 4
vmware-java 0
data-driven-framework 3
pyvmomi 450
pyvmomi-community-samples 387
open-vm-tools 146
pyvmomi-tools 18
upgrade-framework 11
webcommander 30

def get_forks(repo):
    """Return the value stored under ``'forks'`` in ``repo``; used as a sort key."""
    forks = repo['forks']
    return forks

for repo in sorted(repos, key=get_forks, reverse=True)[:5]:
    print(repo['name'], repo['forks'])

pyvmomi 450
pyvmomi-community-samples 387
rbvmomi 153
open-vm-tools 146
vmware-vcenter 86

problem:

Write a function to find the distance between two cities using the Google API.
```
distance("bangalore", "pune")
800km
```

def distance(source, dest):
    """Return the distance between two places as display text, e.g. '837 km'.

    source -- name of the starting place
    dest   -- name of the destination place

    Queries the Google Distance Matrix JSON endpoint in metric units and
    returns the ``distance.text`` field of the first result element.
    Raises requests.HTTPError if the server answers with an error status.
    """
    url = "https://maps.googleapis.com/maps/api/distancematrix/json"
    params = {"origins": source, "destinations": dest, "units": "metric"}
    # Without a timeout, requests waits indefinitely on an unresponsive server.
    resp = requests.get(url, params=params, timeout=10)
    # Surface HTTP-level failures here rather than as a confusing
    # KeyError/IndexError while digging through the JSON below.
    resp.raise_for_status()
    data = resp.json()
    return data['rows'][0]['elements'][0]['distance']['text']

distance("bangalore", "pune")

'837 km'

import json

s = json.dumps({"data":[1,2,3,{"x":"y"}]})

s

'{"data": [1, 2, 3, {"x": "y"}]}'

json.loads(s)

{'data': [1, 2, 3, {'x': 'y'}]}

Feedback ¶

References¶

https://docs.python.org/3/index.html
http://anandology.com/python-practice-book/index.html
bangpypers group in bangalore
for advanced and basic maths and programming problems try this https://projecteuler.net/archives
google for structure and interpretation of computer programs (SICP)

Python Training at VMWare Pune - Day 2¶

with statement¶

Writing to standard error and output¶

Dictionaries¶

Example : parse conf file and load as dictionary¶

Iterating over dictionaries¶

Pitfalls¶

Classes¶

Why classes?¶

Exceptions¶

Commandline applications¶

Downloading stuff from internet¶

Example: Popular github repositories of vmware¶

Feedback¶

References¶

Feedback ¶