Advertisement
Not a member of Pastebin yet?
Sign Up,
it unlocks many cool features!
- import random
- import sys
def check_for_duplicates(pair, key1, key2):
    """Tell whether an earlier entry of *pair* already holds (key1, key2).

    *pair* is indexed by the positions 0 .. len(pair) - 1, and every entry
    is a mapping with the keys ``'seg1'`` and ``'seg2'``.  The entry at the
    last position is never inspected, so a collection with zero or one
    entries always yields ``False``.

    Returns ``True`` when some entry before the last one has
    ``entry['seg1'] == key1`` and ``entry['seg2'] == key2``; otherwise
    ``False``.
    """
    # Positions of every entry except the last one.
    earlier_positions = range(len(pair) - 1)
    return any(
        pair[position]['seg1'] == key1 and pair[position]['seg2'] == key2
        for position in earlier_positions
    )
def _load_segment_lines(path):
    """Return every line of *path* with its newline characters removed."""
    with open(path, "r") as handle:
        lines = [line.replace("\n", "") for line in handle]
    if not lines:
        raise ValueError("segment file is empty: " + path)
    return lines


def _pick_unused_partner(left_index, right_count, used_pairs, max_rerolls):
    """Pick a random index below *right_count* not yet paired with *left_index*.

    One initial pick is made, followed by at most *max_rerolls* re-rolls
    while ``(left_index, candidate)`` is present in *used_pairs*.  Returns
    the chosen index, or ``None`` when every attempt collided.
    """
    candidate = random.randint(0, right_count - 1)
    rerolls = 0
    while (left_index, candidate) in used_pairs:
        if rerolls == max_rerolls:
            return None
        candidate = random.randint(0, right_count - 1)
        rerolls += 1
    return candidate


def _choose_segment_indices(segment_sizes, used_pairs, reroll_limits):
    """Choose one line index per segment file, avoiding used adjacent pairs.

    Returns the list of chosen indices, or ``None`` as soon as one stage
    cannot find an unused pair within its re-roll limit.
    """
    indices = [random.randint(0, segment_sizes[0] - 1)]
    for stage, limit in enumerate(reroll_limits):
        partner = _pick_unused_partner(
            indices[-1], segment_sizes[stage + 1], used_pairs[stage], limit
        )
        if partner is None:
            return None
        indices.append(partner)
    return indices


def generate():
    """Build random six-segment texts and write them to a file.

    Command-line arguments:
        sys.argv[1] -- number of generation cycles (converted with ``int``).
        sys.argv[2] -- path of the output file (opened in ``"w"`` mode).

    Each cycle picks one random line from each of ``segmentas1.txt`` ..
    ``segmentas6.txt`` (read from the current working directory) and joins
    them as ``"<cycle number>.<s1> <s2> <s3> <s4> <s5> <s6>\\n \\n \\n"``.
    A pair of line indices from two neighbouring segment files is used at
    most once across all written texts.  When a stage cannot find an unused
    pair within its re-roll limit, the cycle is discarded, a
    ``discarded #<cycle number>`` message is printed once, and the cycle
    number is skipped in the output.

    Differences from the previous implementation:
      * the segment-5/segment-6 pair is now actually checked against the
        index that was picked (the old code compared a ``-1`` placeholder);
      * a discarded cycle stops immediately and does not reserve any pairs;
      * segment files are read once instead of on every pick and re-roll;
      * the output file is closed deterministically.

    Raises:
        IndexError: if either command-line argument is missing.
        ValueError: if the cycle count is not an integer or a segment file
            is empty.
        OSError: if a segment file or the output file cannot be opened.
    """
    cycle_count = int(sys.argv[1])
    # Read the output path up front so a missing argument fails before any
    # work is done rather than after all texts have been generated.
    output_path = sys.argv[2]

    segment_paths = ["segmentas%d.txt" % number for number in range(1, 7)]
    # Re-roll limits per neighbouring pair (1-2, 2-3, ..., 5-6); the values
    # are the ones the original code used.
    reroll_limits = (100, 1000, 1000, 1000, 1000)

    # As before, the segment files are only touched when at least one cycle
    # actually runs.
    if cycle_count > 0:
        segments = [_load_segment_lines(path) for path in segment_paths]
    else:
        segments = []
    segment_sizes = [len(lines) for lines in segments]
    used_pairs = [set() for _ in reroll_limits]

    texts = []
    for cycle in range(cycle_count):
        label = str(cycle + 1)
        indices = _choose_segment_indices(segment_sizes, used_pairs, reroll_limits)
        if indices is None:
            print("discarded #" + label)
            continue
        # Reserve the pairs only now that the text is certain to be written.
        for stage, pair_set in enumerate(used_pairs):
            pair_set.add((indices[stage], indices[stage + 1]))
        chosen = [lines[index] for lines, index in zip(segments, indices)]
        texts.append(label + "." + " ".join(chosen) + "\n \n \n")

    print(str(len(texts)) + " texts created.")
    with open(output_path, "w") as output:
        output.write("".join(texts))
def file_lengthy(fname):
    """Return the number of lines in the text file *fname*.

    An empty file yields 0 (the previous implementation raised
    ``UnboundLocalError`` because its loop variable was never assigned).

    Raises:
        OSError: if the file cannot be opened.
    """
    with open(fname) as f:
        # Stream the file so it is never held in memory as a whole.
        return sum(1 for _ in f)
# Run the generator only when this file is executed as a script, not when
# it is imported as a module.
if __name__ == "__main__":
    generate()
Advertisement
Add Comment
Please, Sign In to add comment
Advertisement