# setup
import sqlite3
import comp521
import math

# comp521.start('A3') hands back the two callables used throughout this file:
# check(...) is called once per answer and report(...) once at the end.
check, report = comp521.start('A3')

# these are the variables you will use below. You must use the variables because
# they will have different values when I grade your assignment.
from A3vars import *


# Compute the two bounds from N and P (star-imported from A3vars) and leave
# them in Bl and Bu.
# NOTE(review): under Python 2, N/P truncates when both operands are ints, and
# math.ceil returns a float (which is why Bu prints as 10.0) -- confirm the
# truncation is intended before running this on another interpreter.
Bl = 1
Bu = math.ceil(math.log(N/P, 2))

print('lower bound = %s' % (Bl,))
print('upper bound = %s' % (Bu,))

check('Bl', Bl, points=5)
check('Bu', Bu, points=5)

lower bound = 1
upper bound = 10.0
Bl correct
Bu correct


# A2 is a fixed answer; it is echoed and then handed to check() for 5 points.
A2 = 2

print('A2 = %s' % (A2,))

check('A2', A2, points=5)

A2 = 2
A2 correct


# compute your answer into A3
# (a fixed value; passed to check() below, worth 5 points)
A3 = 1

check('A3', A3, points=5)

A3 correct


# A4: N divided by the product M*P, scaled to a percentage.
# float() forces true division under Python 2 even when N, M and P are ints.
A4 = N / float(M * P) * 100

print('A4 = %s' % (A4,))

check('A4', A4, points=5)

A4 = 51.2
A4 correct


# A5 is a fixed answer; it is echoed and then handed to check() for 5 points.
A5 = 3

print('A5 = %s' % (A5,))

check('A5', A5, points=5)

A5 = 3
A5 correct


# A6: the product Csect*St divided by 2**20.
# math.pow returns a float, so this is true division on any interpreter.
# NOTE(review): presumably a bytes -> MiB conversion; confirm the units of
# Csect and St against A3vars.
A6 = (Csect * St) / math.pow(2, 20)

print('A6 = %s' % (A6,))

check('A6', A6, points=5)

A6 = 16.0
A6 correct


# A7: Csurf*1024 divided by (Csect*St / 2**20).
# The denominator is the same quantity that A6 computes; it is recomputed here
# so this cell does not depend on A6 having been run.
A7 = Csurf * 1024 / ((Csect * St) / math.pow(2, 20))

print('A7 = %s' % (A7,))

check('A7', A7, points=5)

A7 = 8192.0
A7 correct


# A8: Cdisk*1024 divided by twice Csurf.
# NOTE(review): with int operands this is Python 2 integer division (the
# recorded output is the int 8); a non-exact quotient would be truncated.
A8 = Cdisk * 1024 / (2 * Csurf)

print('A8 = %s' % (A8,))

check('A8', A8, points=5)

A8 = 8
A8 correct


# A9: Csurf*1024 divided by (Csect*St / 2**20).
# NOTE(review): this is the same expression that is used for A7 -- confirm
# that both questions really ask for the same quantity.
A9 = Csurf * 1024 / ((Csect * St) / math.pow(2, 20))

print('A9 = %s' % (A9,))

check('A9', A9, points=5)

A9 = 8192.0
A9 correct


# A10: reciprocal of Trotation, multiplied by 60.
# NOTE(review): relies on Trotation being a float; under Python 2 an int
# Trotation greater than 1 would make 1/Trotation truncate to 0.
A10 = (1 / Trotation) * 60

print('A10 = %s' % (A10,))

check('A10', A10, points=5)

A10 = 6000.0
A10 correct


# A11: Nfile divided by ceil(Cblock/250); math.ceil returns a float under
# Python 2, so the outer division is a true division.
# NOTE(review): if Cblock is an int, Python 2 has already truncated Cblock/250
# before math.ceil sees it, so the ceil is a no-op and the value is effectively
# floored -- confirm which rounding is intended.
A11 = Nfile / math.ceil(Cblock / 250)

print('A11 = %s' % (A11,))
check('A11', A11, points=5)

A11 = 62500.0
A11 correct


# this is a helper function to clear indexes for timing without them
# no need to change it

def dropIndexes(dbname):
    '''Drop every explicitly created index in the SQLite database `dbname`.

    Only sqlite_master rows of type 'index' with a non-NULL `sql` column are
    selected; rows with NULL `sql` are the automatic indexes SQLite maintains
    for PRIMARY KEY / UNIQUE constraints and are left alone.

    Prints one "dropping <name>" line per index removed. The connection is
    closed even if a statement fails.
    '''
    db = sqlite3.connect(dbname)
    try:
        cursor = db.cursor()
        cursor.execute("""
            select name from sqlite_master
                where type = 'index' and sql not null
        """)
        # fetchall() first: the same cursor is reused for the DROP statements.
        for (name,) in cursor.fetchall():
            print('dropping %s' % name)
            # Identifiers cannot be bound as parameters, so quote the name
            # (doubling embedded quotes) to cope with spaces and keywords.
            quoted = '"%s"' % name.replace('"', '""')
            cursor.execute('drop index if exists %s' % quoted)
        db.commit()
    finally:
        db.close()


# this is a helper function to measure the time required for a query to run
# no need to change it.

import time
def timeQuery(cursor, query, repeat=1):
    '''Execute `query` on `cursor` `repeat` times and time each run.

    Each timed run covers both execute() and fetching all result rows.
    Returns a tuple (mean wall-clock seconds per run, number of rows
    returned by the last run).
    '''
    elapsed = []
    for _ in range(repeat):
        began = time.time()
        cursor.execute(query)
        fetched = cursor.fetchall()
        rowCounter = len(fetched)
        elapsed.append(time.time() - began)
    return (sum(elapsed) / repeat, rowCounter)


# a helper to time several queries
# no need to change it
def runQueries(dbName, queries):
    '''Time every query in `queries` against the SQLite database `dbName`.

    Each query is run 5 times through timeQuery; its text, row count and mean
    time are printed. Returns the list of mean times (seconds), in the same
    order as `queries`. The connection is closed even if a query raises.
    '''
    db = sqlite3.connect(dbName)
    try:
        cursor = db.cursor()
        times = []
        for q in queries:
            t, rows = timeQuery(cursor, q, 5)
            print(q)
            print('returned %d rows in %f seconds' % (rows, t))
            times.append(t)
    finally:
        db.close()
    return times


# Benchmark queries, in the order they are timed and reported:
#   0: equality lookup on Actors.LName
#   1: range filter on Movies.Year
#   2: Actors/Movies/Casts join filtered on last name, year range and role
# String literals use single quotes: SQLite resolves a double-quoted token as
# an identifier first and only falls back to a string when no such column
# exists, so "Smith" would silently change meaning if a Smith column appeared.
queries = [
    """
    SELECT LName, FName FROM Actors WHERE LName = 'Smith'
    """,
    """
    SELECT m.title FROM Movies m
        WHERE m.Year > 2000 AND m.Year < 2002
    """,
    """
    SELECT A.LName, A.FName, M.year, M.title
        FROM Actors A, Movies M, Casts C
        WHERE A.aid = C.aid and M.mid = C.mid and
              A.LName = 'Bishop' and
              M.year >= 2000 and M.year <= 2002 and
              C.role = 'Himself'
        ORDER BY A.LName, A.FName, M.year
    """
]


# get the base time for the queries without indexes
# you shouldn't need to change this code
# though you might find it useful as I did to move the db to another drive

dbName = 'actors.db'
# drop any leftover indexes first so the baseline really is index-free
dropIndexes(dbName)
# one mean time per query, in the same order as `queries`
TimeWithout = runQueries(dbName, queries)

dropping lastNameIndex
dropping movieYearIndex
dropping actorIDIndex
dropping movieIDIndex
dropping bro
dropping dude

    SELECT LName, FName FROM Actors WHERE LName = "Smith"
    
returned 5773 rows in 0.230371 seconds

    SELECT m.title FROM Movies m
        WHERE m.Year > 2000 AND m.Year < 2002
    
returned 11039 rows in 0.098444 seconds

    SELECT A.LName, A.FName, M.year, M.title
        FROM Actors A, Movies M, Casts C
        WHERE A.aid = C.aid and M.mid = C.mid and
              A.LName = 'Bishop' and
              M.year >= 2000 and M.year <= 2002 and
              C.role = 'Himself'
        ORDER BY A.LName, A.FName, M.year
    
returned 11 rows in 0.221059 seconds


# can you do better with an index?
# start from an index-free database, then open a connection for the DDL below
dropIndexes(dbName)
db = sqlite3.connect(dbName)
cursor = db.cursor()

# create your indexes here
# Actors(LName): targets the LName equality filters in queries 0 and 2
cursor.execute("CREATE INDEX lastNameIndex ON Actors(LName)")
# Movies(Year): targets the year range filters in queries 1 and 2
cursor.execute("CREATE INDEX movieYearIndex ON Movies(Year)")

# your work should go between this comment and the one above
# commit and close so runQueries sees the indexes on its own connection
db.commit()
db.close()


# now get the time for the queries with indexes
# (same queries, same order as TimeWithout, so the two lists line up by index)
TimeWith = runQueries(dbName, queries)

    SELECT LName, FName FROM Actors WHERE LName = "Smith"
    
returned 5773 rows in 0.009840 seconds

    SELECT m.title FROM Movies m
        WHERE m.Year > 2000 AND m.Year < 2002
    
returned 11039 rows in 0.033627 seconds

    SELECT A.LName, A.FName, M.year, M.title
        FROM Actors A, Movies M, Casts C
        WHERE A.aid = C.aid and M.mid = C.mid and
              A.LName = 'Bishop' and
              M.year >= 2000 and M.year <= 2002 and
              C.role = 'Himself'
        ORDER BY A.LName, A.FName, M.year
    
returned 11 rows in 0.001804 seconds


# Speedup per query: time without indexes divided by time with indexes,
# printed as "<query number> <ratio>".
for i in range(len(queries)):
    print('%s %s' % (i, TimeWithout[i] / TimeWith[i]))

0 23.4110221645
1 2.92755146029
2 122.549895583


# identify the submitter and collaborators, then print the summary of all
# check() calls made above
onyen = 'jpuccio'
collaborators = ['Patrick Lung', 'Zen Yang']
report(onyen, collaborators)

A10
A11
A2
A3
A4
A5
A6
A7
A8
A9
Bl
Bu
Report for jpuccio
  Collaborators: ['Patrick Lung', 'Zen Yang']
  12 of 12 correct, 60 of 60 points


# clean up: remove the indexes created above so the database is left index-free
dropIndexes(dbName)

dropping lastNameIndex
dropping movieYearIndex

Query	Speedup
0	24.6
1	3.1
2	783

Assignment 3

Part 1

Part 2

Part 3

Queries

Add indexes

Report your results