Advertisement
Guest User

Untitled

a guest
Dec 15th, 2018
71
0
Never
Not a member of Pastebin yet? Sign Up, it unlocks many cool features!
text 4.41 KB | None | 0 0
  1. import numpy as np
  2. import pandas as pd
  3. import os
  4.  
  5. def load_data(base_dir):
  6. print(f"base_dir = {base_dir}")
  7. print(os.listdir(f"{base_dir}"))
  8. x_train = None
  9. for i in range(1, 5):
  10. filename = f"{base_dir}/x_train_{i}.npz"
  11. with np.load(filename) as data:
  12. print(f"files in {filename}: {data.files}")
  13. temp_data = data[data.files[0]]
  14. if x_train is None:
  15. x_train = temp_data
  16. else:
  17. x_train = np.concatenate((x_train, temp_data))
  18.  
  19.  
  20. with np.load(f'{base_dir}/y_train.npz') as data:
  21. print(f"files in {base_dir}/y_train.npz: {data.files}")
  22. y_train = data[data.files[0]]
  23.  
  24. with np.load(f'{base_dir}/x_test.npz') as data:
  25. print(f"files in {base_dir}/x_test.npz: {data.files}")
  26. x_test = data[data.files[0]]
  27. return x_train, y_train, x_test
  28.  
  29. def save_submission(submission, name="prediction.csv"):
  30. result = pd.DataFrame(submission)
  31. result = result.rename({0: "Label", }, axis=1)
  32. result.index.name = "Id"
  33. result.index += 1
  34. result.to_csv(name)
  35.  
  36. x, y, t = load_data("../input")
  37.  
  38.  
  39. import catboost as cb
  40.  
  41. CBR = cb.CatBoostRegressor(iterations=10000,
  42. learning_rate=0.1,
  43. depth=8,
  44. l2_leaf_reg=0.1,
  45. model_size_reg=None,
  46. rsm=None,
  47. loss_function='RMSE',
  48. border_count=None,
  49. feature_border_type=None,
  50. fold_permutation_block_size=None,
  51. od_pval=None,
  52. od_wait=None,
  53. od_type=None,
  54. nan_mode=None,
  55. counter_calc_method=None,
  56. leaf_estimation_iterations=None,
  57. leaf_estimation_method=None,
  58. thread_count=2,
  59. random_seed=None,
  60. use_best_model=None,
  61. verbose=None,
  62. logging_level=None,
  63. metric_period=None,
  64. ctr_leaf_count_limit=None,
  65. store_all_simple_ctr=None,
  66. max_ctr_complexity=None,
  67. has_time=None,
  68. allow_const_label=None,
  69. one_hot_max_size=None,
  70. random_strength=None,
  71. name=None,
  72. ignored_features=None,
  73. train_dir=None,
  74. custom_metric=None,
  75. eval_metric=None,
  76. bagging_temperature=None,
  77. save_snapshot=None,
  78. snapshot_file=None,
  79. snapshot_interval=None,
  80. fold_len_multiplier=None,
  81. used_ram_limit=None,
  82. gpu_ram_part=None,
  83. allow_writing_files=None,
  84. final_ctr_computation_mode=None,
  85. approx_on_full_history=None,
  86. boosting_type=None,
  87. simple_ctr=None,
  88. combinations_ctr=None,
  89. per_feature_ctr=None,
  90. task_type="GPU",
  91. device_config=None,
  92. devices=None,
  93. bootstrap_type=None,
  94. subsample=None,
  95. max_depth=None,
  96. n_estimators=None,
  97. num_boost_round=None,
  98. num_trees=None,
  99. colsample_bylevel=None,
  100. random_state=42,
  101. reg_lambda=None,
  102. objective=None,
  103. eta=None,
  104. max_bin=None,
  105. gpu_cat_features_storage=None,
  106. data_partition=None,
  107. metadata=None,
  108. early_stopping_rounds=None,
  109. cat_features=None)
  110.  
  111. CBR.fit(x, y * 5)
  112. submission = CBR.predict(t).astype(int)
  113. submission[submission > 20] = 20
  114. submission[submission < 0] = 0
  115. save_submission(submission)
Advertisement
Add Comment
Please, Sign In to add comment
Advertisement