Update README.md

2023-04-06 18:10:40 +03:00 · 2023-04-06 18:10:40 +03:00 · 5e53e3e745
commit 5e53e3e745
--- a/README.md
+++ b/README.md
@ -95,3 +95,37 @@ Close the window without logging out (Otherwise the cookies are made invalid).
 # Example usages:
 ## Using SpotiFile to create a song recommendation module based on the semantic similarity of song lyrics:
 ```python
 from spotify_scraper import SpotifyScraper
 import nltk
 from nltk.corpus import stopwords
 from sklearn.feature_extraction.text import TfidfVectorizer
 from sklearn.metrics.pairwise import cosine_similarity
 import sys
 def semantic_similarity(paragraph1, paragraph2):
    """Return the TF-IDF cosine similarity between two pieces of text.

    Each paragraph is tokenized with NLTK, lowercased, and stripped of
    English stop words. The two cleaned texts are then vectorized together
    with TF-IDF and compared with cosine similarity, so the score reflects
    shared vocabulary rather than deeper meaning.

    Requires the NLTK stop-word corpus and tokenizer data to be installed
    (see ``nltk.download``).

    Args:
       paragraph1: First text to compare.
       paragraph2: Second text to compare.

    Returns:
       The cosine similarity of the two TF-IDF vectors, or ``0.0`` when
       the vectorizer finds no usable terms in either text.
    """
    # Preprocess text: lowercase every token once and drop English stop words
    stop_words = set(stopwords.words('english'))
    documents = []
    for paragraph in (paragraph1, paragraph2):
       tokens = (token.lower() for token in nltk.word_tokenize(paragraph))
       documents.append(' '.join(token for token in tokens if token not in stop_words))
    # Compute similarity score
    try:
       tfidf_matrix = TfidfVectorizer().fit_transform(documents)
    except ValueError:
       # The vectorizer rejects input with an empty vocabulary (e.g. both
       # texts are empty or contain only stop words/punctuation); there is
       # nothing to compare, so report no similarity instead of crashing.
       return 0.0
    return cosine_similarity(tfidf_matrix)[0][1]
 # Usage: compare the lyrics of the two tracks given as the first and second
 # command-line arguments.
 def _joined_lyrics(scraper, track):
    # Collapse the per-line 'words' entries of the lyrics response into one
    # newline-separated string.
    lines = scraper.get_lyrics(track)['lyrics']['lines']
    return '\n'.join(line['words'] for line in lines)
 scraper = SpotifyScraper()
 lyrics1 = _joined_lyrics(scraper, sys.argv[1])
 lyrics2 = _joined_lyrics(scraper, sys.argv[2])
 sim = semantic_similarity(lyrics1, lyrics2)
 print(f'The similarity between the two tracks is: {sim}')
 ```