Advertisement
Guest User

Untitled

a guest
Dec 14th, 2019
143
0
Never
Not a member of Pastebin yet? Sign Up, it unlocks many cool features!
Python 1.44 KB | None | 0 0
  1. import os
  2. import pandas as pd
  3. import sys
  4.  
  5.  
  6. def crawl(dir_path, idx):
  7.     for d in os.listdir(dir_path):
  8.         if os.path.isfile(dir_path + "\\" + d) == False:
  9.             crawl(dir_path + "\\" + d, idx)
  10.         else:
  11.             file_name = str(df['FileName'][idx][0:len(df['FileName'][idx]) - 9]) + ".java"
  12.             # print(df['FileName'][idx])
  13.             if d == file_name:
  14.                 actual_file_path = dir_path + "\\" + file_name
  15.                 df_out.append({'ProjectName': 'RxJava','TestFilePath': df['FilePath'][idx], 'FilePath': actual_file_path}, ignore_index=True)
  16.                 # print("Achei " + df['FileName'][i] + " e " + file_name + " at dir: " + actual_file_path)
  17.    
  18. csv_dir = r"C:\Users\guiga\EASY\TestSmells\csv"
  19. project_path = r"C:\Users\guiga\EASY\TestSmells\repositories\RxJava"
  20. files = []
  21. test_files_list = list()
  22. sys.setrecursionlimit(100000000)
  23. df_out = pd.DataFrame(columns = ['ProjectName', 'TestFilePath', 'FilePath'])
  24.  
  25. for csv_file in os.listdir(csv_dir):
  26.     # print(csv_file)
  27.     df = pd.read_csv(csv_dir + "\\" + csv_file)
  28.     df = df[['FileName', 'FilePath']]
  29.     df = df.drop_duplicates()
  30.     # print(df['FileName'][0])
  31.     # test_files_list = list(set(df['FileName'].values))
  32.     for i in df.index:
  33.         # print(df['FileName'][i])
  34.         if df['FileName'][i].endswith('Test.java'):
  35.             crawl(project_path, i)
  36. df_out.to_csv('out.csv', header=False)
  37. # print(test_files_list)
Advertisement
Add Comment
Please, Sign In to add comment
Advertisement