songs-lyrics-generator/main.py

import os
import random
import pandas as pd
from scrapper import scrap_data
from markov_model import clean_data
from markov_model import create_markov_model
from markov_model import generate_lyrics

# Album whitelists handed to scrap_data() for azlyrics.com URLs. scraping() finds them by
# name through globals(), so each list must be called "<bandname>_selected_albums".
blacksabbath_selected_albums = [
    "Black Sabbath",
    "Paranoid",
    "Master Of Reality",
    "Vol 4",
    "Sabbath Bloody Sabbath",
    "Sabotage",
    "Technical Ecstasy",
    "Never Say Die!",
    "Heaven And Hell",
    "Mob Rules",
    "Born Again",
    "Seventh Star",
    "The Eternal Idol",
    "Headless Cross",
    "Tyr",
    "Dehumanizer",
    "Cross Purposes",
    "Forbidden",
    "13",
]

pinkfloyd_selected_albums = [
    "The Piper At The Gates Of Dawn",
    "A Saucerful Of Secrets",
    "Meddle",
    "More",
    "Ummagumma",
    "Atom Heart Mother",
    "Obscured By Clouds",
    "The Dark Side Of The Moon",
    "Wish You Were Here",
    "Animals",
    "The Wall",
    "The Final Cut",
    "A Momentary Lapse Of Reason",
    "The Division Bell",
]

# Third argument of scrap_data() for azlyrics.com URLs.
# NOTE(review): presumably a delay in seconds between requests - confirm in scrapper.scrap_data.
time_stamp = 3.5

# Absolute path of the "Data" directory located next to this script.
path = os.path.join(os.path.dirname(os.path.abspath(__file__)), "Data")


def generate_song(name):
    """Interactively generate and print lyrics from a data file.

    The path of the data file is passed to ``clean_data``; the user is then asked for the
    generation parameters, a model is built with ``create_markov_model`` and one verse per
    iteration is produced by ``generate_lyrics`` and printed.

    Args:
        name: File name of the data set, joined onto the module-level ``path`` directory.

    Raises:
        ValueError: If any of the numeric prompts receives a non-integer answer.
    """
    dataset = clean_data(os.path.join(path, name))
    n_gram = int(input("Select number of words in Markov state: "))
    if n_gram <= 0:
        # n_gram is the divisor below; zero would raise ZeroDivisionError and a negative
        # value would yield a meaningless verse length.
        print("Number of words in Markov state must be a positive integer!")
        return
    number_of_verses = int(input("Select number of verses: "))
    requested_words = int(input("Select number of words in verses: "))
    # Number of chain steps per verse: the starting state already contributes words,
    # hence the "- 1" before dividing by the state size.
    words_in_verses = int((requested_words - 1) / n_gram)
    degree_of_chain = int(input("Select degree of chain: "))
    model = create_markov_model(dataset, n_gram, degree_of_chain)
    print('\n')
    states = list(model.keys())
    if not states:
        # random.choice() raises IndexError on an empty sequence.
        print("Markov model is empty, nothing to generate!")
        return
    last_state = random.choice(states)
    for _ in range(number_of_verses):
        generated_lyrics, last_state = generate_lyrics(model, last_state, words_in_verses)
        print(generated_lyrics)
        # Pick the opening state of the next verse, weighted by the transition values.
        transitions = model.get(last_state)
        if transitions:
            last_state = random.choices(list(transitions.keys()),
                                        list(transitions.values()))[0]
        else:
            # Dead end: the verse finished on a state without outgoing transitions,
            # so restart from a random state instead of failing on the lookup.
            last_state = random.choice(states)


def scraping():
    """Let the user choose a URL from ``links.txt`` and scrape it with ``scrap_data``.

    ``links.txt`` is opened relative to the current working directory and is expected to
    hold one URL per line. The numbered list of URLs is printed and the user selects one
    by its number.

    * ``www.azlyrics.com`` URLs: the fifth ``/``-separated segment of the URL, without its
      last five characters (the ``.html`` extension), is taken as the band name; the global
      list ``<bandname>_selected_albums`` is passed to ``scrap_data`` together with
      ``time_stamp``. If no such global exists a hint is printed instead.
    * ``www.tekstowo.pl`` URLs: ``scrap_data`` is called with an empty album list and ``0.0``.

    Raises:
        FileNotFoundError: If ``links.txt`` does not exist in the working directory.
    """
    with open("links.txt", "r") as f:
        # strip() removes the line terminator whether or not the file ends with a newline;
        # blank lines are dropped so they do not show up as selectable entries.
        urls = [line.strip() for line in f if line.strip()]
    if not urls:
        print("No urls found in links.txt")
        return
    for index, listed_url in enumerate(urls):
        print(str(index) + ".", listed_url)
    try:
        line_index = int(input("Select url to scrap: "))
    except ValueError:
        line_index = -1  # treated as an invalid selection below
    if not 0 <= line_index < len(urls):
        print("No such url on the list!")
        return
    url = urls[line_index]
    # "https://host/a/b" splits into ["https:", "", "host", "a", "b"].
    parts = url.split('/')
    host = parts[2] if len(parts) > 2 else ""
    if host == 'www.azlyrics.com' and len(parts) > 4:
        selected_albums_name = parts[4][:-5] + "_selected_albums"
        if selected_albums_name in globals():
            selected_albums = globals()[selected_albums_name]
            scrap_data(url, selected_albums, time_stamp)
        else:
            print("Define selected albums in global list variable in format: bandname_selected_albums")
            return
    elif host == 'www.tekstowo.pl':
        scrap_data(url, [], 0.0)
    else:
        print("Unsupported url: " + url)


def merging():
    """Concatenate two CSV files from the ``Data`` directory into a new CSV file.

    The user is asked for two source file names and then for the name of the result file;
    all three are resolved against the module-level ``path``. If a source file does not
    exist a message is printed and the function returns without writing anything.
    The rows of the second file follow those of the first, with a fresh row index that is
    written out as the first column (``to_csv`` is called with its defaults).
    """
    frames = []
    for prompt in ("Select first band file: ", "Select second band file: "):
        source = os.path.join(path, input(prompt))
        if not os.path.exists(source):
            print("No such file in directory!")
            return
        frames.append(pd.read_csv(source))
    merged = pd.concat(frames, ignore_index=True)
    target = os.path.join(path, input("Select name of result file: "))
    merged.to_csv(target)


def main():
    print("Select data set to use in generation or other option:\n1. Generate text based on input filename\n2. Scrap "
          "data\n3. Merge CSV band's songs\n4. Exit")
    while True:
        selection = int(input())
        match selection:
            case 1:
                name = input("Select name of data file: ")
                generate_song(name)
            case 2:
                scraping()
            case 3:
                merging()
            case 4:
                break
        print("\nCommand executed")


# Start the interactive menu only when the file is executed as a script, not when imported.
if __name__ == '__main__':
    main()
Initial commit 2023-03-26 15:22:02 +02:00			`import os`
			`import random`
Interface improvements. 2023-03-28 15:08:23 +02:00			`import pandas as pd`
Initial commit 2023-03-26 15:22:02 +02:00			`from scrapper import scrap_data`
Interface change and minor improvement in data cleaning. 2023-03-28 00:21:13 +02:00			`from markov_model import clean_data`
Initial commit 2023-03-26 15:22:02 +02:00			`from markov_model import create_markov_model`
			`from markov_model import generate_lyrics`

Interface improvements. 2023-03-28 15:08:23 +02:00			`blacksabbath_selected_albums = ["Black Sabbath", "Paranoid", "Master Of Reality", "Vol 4", "Sabbath Bloody Sabbath",`
Minor bugs repair. 2023-03-28 15:30:52 +02:00			`"Sabotage", "Technical Ecstasy", "Never Say Die!", "Heaven And Hell", "Mob Rules",`
			`"Born Again", "Seventh Star", "The Eternal Idol", "Headless Cross", "Tyr",`
			`"Dehumanizer", "Cross Purposes", "Forbidden", "13"]`
Initial commit 2023-03-26 15:22:02 +02:00
Interface improvements. 2023-03-28 15:08:23 +02:00			`pinkfloyd_selected_albums = ["The Piper At The Gates Of Dawn", "A Saucerful Of Secrets", "Meddle", "More", "Ummagumma",`
Minor bugs repair. 2023-03-28 15:30:52 +02:00			`"Atom Heart Mother", "Obscured By Clouds", "The Dark Side Of The Moon",`
			`"Wish You Were Here", "Animals", "The Wall", "The Final Cut",`
			`"A Momentary Lapse Of Reason", "The Division Bell"]`
Initial commit 2023-03-26 15:22:02 +02:00
			`time_stamp = 3.5`
Interface change and minor improvement in data cleaning. 2023-03-28 00:21:13 +02:00			`path = os.path.dirname(os.path.abspath(__file__))`
			`path = os.path.join(path, "Data")`


			`def generate_song(name):`
			`dataset = clean_data(os.path.join(path, name))`
			`n_gram = int(input("Select number of words in Markov state: "))`
			`number_of_verses = int(input("Select number of verses: "))`
Interface improvements. 2023-03-28 15:08:23 +02:00			`words_in_verses = int((int(input("Select number of words in verses: ")) - 1) / n_gram)`
			`degree_of_chain = int(input("Select degree of chain: "))`
			`model = create_markov_model(dataset, n_gram, degree_of_chain)`
Interface change and minor improvement in data cleaning. 2023-03-28 00:21:13 +02:00			`print('\n')`
Interface improvements. 2023-03-28 15:08:23 +02:00			`last_state = random.choice(list(model.keys()))`
Interface change and minor improvement in data cleaning. 2023-03-28 00:21:13 +02:00			`for i in range(number_of_verses):`
Interface improvements. 2023-03-28 15:08:23 +02:00			`generated_lyrics, last_state = generate_lyrics(model, last_state, words_in_verses)`
Interface change and minor improvement in data cleaning. 2023-03-28 00:21:13 +02:00			`print(generated_lyrics)`
Interface improvements. 2023-03-28 15:08:23 +02:00			`last_state = random.choices(list(model[last_state].keys()),`
			`list(model[last_state].values()))[0]`


			`def scraping():`
			`with open("links.txt", "r") as f:`
			`lines = f.readlines()`
			`for i in range(len(lines)):`
			`if i != (len(lines) - 1):`
			`print(str(i) + ".", lines[i][:-1])`
			`else:`
			`print(str(i) + ".", lines[i])`
			`line_index = int(input("Select url to scrap: "))`
			`url = lines[line_index]`
			`if line_index != (len(lines) - 1):`
			`url = url[:-1]`
			`if url.split('/')[2] == 'www.azlyrics.com':`
			`selected_albums_name = url.split('/')[4][:-5] + "_selected_albums"`
			`if selected_albums_name in globals():`
			`selected_albums = globals()[selected_albums_name]`
			`scrap_data(url, selected_albums, time_stamp)`
			`else:`
			`print("Define selected albums in global list variable in format: bandname_selected_albums")`
			`return`
			`if url.split('/')[2] == 'www.tekstowo.pl':`
			`scrap_data(url, [], 0.0)`


			`def merging():`
			`name1 = input("Select first band file: ")`
Minor bugs repair. 2023-03-28 15:30:52 +02:00			`if os.path.exists(os.path.join(path, name1)):`
			`df1 = pd.read_csv(os.path.join(path, name1))`
Interface improvements. 2023-03-28 15:08:23 +02:00			`else:`
			`print("No such file in directory!")`
			`return`
			`name2 = input("Select second band file: ")`
Minor bugs repair. 2023-03-28 15:30:52 +02:00			`if os.path.exists(os.path.join(path, name2)):`
			`df2 = pd.read_csv(os.path.join(path, name2))`
Interface improvements. 2023-03-28 15:08:23 +02:00			`else:`
			`print("No such file in directory!")`
			`return`
			`dfResult = pd.concat([df1, df2], ignore_index=True)`
			`result_name = input("Select name of result file: ")`
Minor bugs repair. 2023-03-28 15:30:52 +02:00			`dfResult.to_csv(os.path.join(path, result_name))`
Initial commit 2023-03-26 15:22:02 +02:00

			`def main():`
Interface improvements. 2023-03-28 15:08:23 +02:00			`print("Select data set to use in generation or other option:\n1. Generate text based on input filename\n2. Scrap "`
			`"data\n3. Merge CSV band's songs\n4. Exit")`
Initial commit 2023-03-26 15:22:02 +02:00			`while True:`
			`selection = int(input())`
			`match selection:`
			`case 1:`
Interface improvements. 2023-03-28 15:08:23 +02:00			`name = input("Select name of data file: ")`
			`generate_song(name)`
Initial commit 2023-03-26 15:22:02 +02:00			`case 2:`
Interface improvements. 2023-03-28 15:08:23 +02:00			`scraping()`
Initial commit 2023-03-26 15:22:02 +02:00			`case 3:`
Interface improvements. 2023-03-28 15:08:23 +02:00			`merging()`
Initial commit 2023-03-26 15:22:02 +02:00			`case 4:`
			`break`
			`print("\nCommand executed")`


			`if __name__ == '__main__':`
			`main()`