Advertisement
Not a member of Pastebin yet?
Sign Up,
it unlocks many cool features!
- from math import sqrt
- movie_reviews = {
- 'Lisa Rose': {'Catch Me If You Can': 3.0, 'Snakes on a Plane': 3.5, 'Superman Returns': 3.5,
- 'You, Me and Dupree': 2.5, 'The Night Listener': 3.0, 'Snitch': 3.0},
- 'Gene Seymour': {'Lady in the Water': 3.0, 'Snakes on a Plane': 3.5, 'Just My Luck': 1.5, 'The Night Listener': 3.0,
- 'You, Me and Dupree': 3.5},
- 'Michael Phillips': {'Catch Me If You Can': 2.5, 'Lady in the Water': 2.5, 'Superman Returns': 3.5,
- 'The Night Listener': 4.0, 'Snitch': 2.0},
- 'Claudia Puig': {'Snakes on a Plane': 3.5, 'Just My Luck': 3.0, 'The Night Listener': 4.5, 'Superman Returns': 4.0,
- 'You, Me and Dupree': 2.5},
- 'Mick LaSalle': {'Lady in the Water': 3.0, 'Snakes on a Plane': 4.0, 'Just My Luck': 2.0, 'Superman Returns': 3.0,
- 'You, Me and Dupree': 2.0},
- 'Jack Matthews': {'Catch Me If You Can': 4.5, 'Lady in the Water': 3.0, 'Snakes on a Plane': 4.0,
- 'The Night Listener': 3.0, 'Superman Returns': 5.0, 'You, Me and Dupree': 3.5, 'Snitch': 4.5},
- 'Toby': {'Snakes on a Plane': 4.5, 'Snitch': 5.0},
- 'Michelle Nichols': {'Just My Luck': 1.0, 'The Night Listener': 4.5, 'You, Me and Dupree': 3.5,
- 'Catch Me If You Can': 2.5, 'Snakes on a Plane': 3.0},
- 'Gary Coleman': {'Lady in the Water': 1.0, 'Catch Me If You Can': 1.5, 'Superman Returns': 1.5,
- 'You, Me and Dupree': 2.0},
- 'Larry': {'Lady in the Water': 3.0, 'Just My Luck': 3.5, 'Snitch': 1.5, 'The Night Listener': 3.5}
- }
- def sim_distance(reviews, person1, person2):
- # Se pravi lista na zaednicki predmeti (filmovi)
- filmovi1=set(reviews[person1].keys())
- filmovi2=set(reviews[person2].keys())
- zaednicki = filmovi1.intersection(filmovi2)
- # print(filmovi1)
- # print(filmovi2)
- # print(zaednicki)
- # for item in oceni[person1].keys():
- # if item in oceni[person2]:
- # zaednicki.add(item)
- # # ako nemaat zaednicki rejtinzi, vrati 0
- if len(zaednicki) == 0: return 0
- # # Soberi gi kvadratite na zaednickite razliki
- suma = 0.0
- for item in zaednicki:
- ocena1 = reviews[person1][item]
- ocena2 = reviews[person2][item]
- suma += (ocena1 - ocena2) ** 2
- # print(item, person1, ocena1, person2, ocena2)
- return round(1 / (1 + sqrt(suma)),3)
- # Go vrakja koeficientot na Pearsonova korelacija pomegu p1 i p2 (licnost 1 i licnost 2)
- # Vrednostite se pomegu -1 i 1
- def sim_pearson(reviews, p1, p2):
- # Se kreira recnik vo koj ke se cuvaat predmetite (filmovi) koi se oceneti od dvajcata
- # Vo recnikot ni se vazni samo klucevite za da gi cuvame iminjata na filmovite koi se zaednicki, a vrednostite ne ni se vazni
- zaednicki = set()
- for item in reviews[p1]:
- if item in reviews[p2]:
- zaednicki.add(item)
- # Se presmetuva brojot na predmeti oceneti od dvajcata
- n = len(zaednicki)
- # Ako nemaat zaednicki predmeti vrati korelacija 0
- if n == 0: return 0
- # Soberi gi zaednickite oceni (rejtinzi) za sekoja licnost posebno
- sum1 = 0
- sum2 = 0
- # Soberi gi kvadratite od zaednickite oceni (rejtinzi) za sekoja licnost posebno
- sum1Sq = 0
- sum2Sq = 0
- # Soberi gi proizvodite od ocenite na dvete licnosti
- pSum = 0
- for item in zaednicki:
- ocena1 = reviews[p1][item]
- ocena2 = reviews[p2][item]
- sum1 += ocena1
- sum1Sq += ocena1 ** 2
- sum2 += ocena2
- sum2Sq += ocena2 ** 2
- pSum += ocena1 * ocena2
- # Presmetaj go koeficientot na korelacija
- num = pSum - (sum1 * sum2 / n)
- den = sqrt((sum1Sq - pow(sum1, 2) / n) * (sum2Sq - pow(sum2, 2) / n))
- if den == 0: return 0
- r = num / den
- return round(r,3)
- def zaednicki (reviews, p1, p2):
- zaednicki = set()
- for item in reviews[p1]:
- if item in reviews[p2]:
- zaednicki.add(item)
- return len(zaednicki)
- def tabela_na_slichni_korisnici(reviews):
- slicnosti = {}
- for item in reviews:
- slicnosti[item] = {}
- for item2 in reviews:
- if (item != item2):
- sim1 = sim_distance(reviews,item,item2)
- sim2 = sim_pearson(reviews,item,item2)
- slicnosti[item][item2] = (sim1,sim2,zaednicki(reviews,item,item2))
- return slicnosti
- if __name__ == "__main__":
- korisnik1 = input()
- korisnik2 = input()
- tabela = tabela_na_slichni_korisnici(movie_reviews)
- print(tabela[korisnik1][korisnik2])
Advertisement
Add Comment
Please, Sign In to add comment
Advertisement